diff --git "a/trainer_state.json" "b/trainer_state.json" --- "a/trainer_state.json" +++ "b/trainer_state.json" @@ -1,9 +1,9 @@ { "best_metric": null, "best_model_checkpoint": null, - "epoch": 0.7689153167931105, + "epoch": 1.665983186385073, "eval_steps": 500, - "global_step": 30000, + "global_step": 65000, "is_hyper_param_search": false, "is_local_process_zero": true, "is_world_process_zero": true, @@ -180007,13 +180007,210013 @@ "learning_rate": 1.7432139447297147e-06, "loss": 0.6895, "step": 30000 + }, + { + "epoch": 0.77, + "learning_rate": 1.7431954314219354e-06, + "loss": 0.73, + "step": 30001 + }, + { + "epoch": 0.77, + "learning_rate": 1.7431769175451262e-06, + "loss": 0.8896, + "step": 30002 + }, + { + "epoch": 0.77, + "learning_rate": 1.7431584030992999e-06, + "loss": 0.8604, + "step": 30003 + }, + { + "epoch": 0.77, + "learning_rate": 1.7431398880844718e-06, + "loss": 0.9375, + "step": 30004 + }, + { + "epoch": 0.77, + "learning_rate": 1.7431213725006555e-06, + "loss": 1.0127, + "step": 30005 + }, + { + "epoch": 0.77, + "learning_rate": 1.7431028563478653e-06, + "loss": 0.9746, + "step": 30006 + }, + { + "epoch": 0.77, + "learning_rate": 1.7430843396261155e-06, + "loss": 1.0654, + "step": 30007 + }, + { + "epoch": 0.77, + "learning_rate": 1.7430658223354202e-06, + "loss": 0.8325, + "step": 30008 + }, + { + "epoch": 0.77, + "learning_rate": 1.7430473044757934e-06, + "loss": 0.8613, + "step": 30009 + }, + { + "epoch": 0.77, + "learning_rate": 1.7430287860472497e-06, + "loss": 0.7666, + "step": 30010 + }, + { + "epoch": 0.77, + "learning_rate": 1.7430102670498027e-06, + "loss": 0.9316, + "step": 30011 + }, + { + "epoch": 0.77, + "learning_rate": 1.742991747483467e-06, + "loss": 0.8403, + "step": 30012 + }, + { + "epoch": 0.77, + "learning_rate": 1.742973227348257e-06, + "loss": 0.8047, + "step": 30013 + }, + { + "epoch": 0.77, + "learning_rate": 1.7429547066441862e-06, + "loss": 0.8672, + "step": 30014 + }, + { + "epoch": 0.77, + "learning_rate": 1.742936185371269e-06, + "loss": 1.0479, + "step": 30015 + }, + { + "epoch": 0.77, + "learning_rate": 1.7429176635295204e-06, + "loss": 0.8672, + "step": 30016 + }, + { + "epoch": 0.77, + "learning_rate": 1.7428991411189535e-06, + "loss": 0.792, + "step": 30017 + }, + { + "epoch": 0.77, + "learning_rate": 1.742880618139583e-06, + "loss": 1.0469, + "step": 30018 + }, + { + "epoch": 0.77, + "learning_rate": 1.7428620945914228e-06, + "loss": 0.9912, + "step": 30019 + }, + { + "epoch": 0.77, + "learning_rate": 1.7428435704744873e-06, + "loss": 0.9141, + "step": 30020 + }, + { + "epoch": 0.77, + "learning_rate": 1.7428250457887907e-06, + "loss": 0.8887, + "step": 30021 + }, + { + "epoch": 0.77, + "learning_rate": 1.742806520534347e-06, + "loss": 0.9609, + "step": 30022 + }, + { + "epoch": 0.77, + "learning_rate": 1.7427879947111705e-06, + "loss": 0.7607, + "step": 30023 + }, + { + "epoch": 0.77, + "learning_rate": 1.7427694683192758e-06, + "loss": 0.9001, + "step": 30024 + }, + { + "epoch": 0.77, + "learning_rate": 1.742750941358676e-06, + "loss": 0.9395, + "step": 30025 + }, + { + "epoch": 0.77, + "learning_rate": 1.7427324138293865e-06, + "loss": 0.6309, + "step": 30026 + }, + { + "epoch": 0.77, + "learning_rate": 1.7427138857314207e-06, + "loss": 0.9854, + "step": 30027 + }, + { + "epoch": 0.77, + "learning_rate": 1.742695357064793e-06, + "loss": 0.7715, + "step": 30028 + }, + { + "epoch": 0.77, + "learning_rate": 1.7426768278295175e-06, + "loss": 0.5098, + "step": 30029 + }, + { + "epoch": 0.77, + "learning_rate": 1.742658298025609e-06, + "loss": 0.8594, + "step": 30030 + }, + { + "epoch": 0.77, + "learning_rate": 1.7426397676530806e-06, + "loss": 0.6719, + "step": 30031 + }, + { + "epoch": 0.77, + "learning_rate": 1.7426212367119475e-06, + "loss": 1.0283, + "step": 30032 + }, + { + "epoch": 0.77, + "learning_rate": 1.7426027052022234e-06, + "loss": 0.8555, + "step": 30033 + }, + { + "epoch": 0.77, + "learning_rate": 1.7425841731239223e-06, + "loss": 0.8174, + "step": 30034 + }, + { + "epoch": 0.77, + "learning_rate": 1.7425656404770588e-06, + "loss": 0.9258, + "step": 30035 + }, + { + "epoch": 0.77, + "learning_rate": 1.7425471072616471e-06, + "loss": 0.9824, + "step": 30036 + }, + { + "epoch": 0.77, + "learning_rate": 1.7425285734777008e-06, + "loss": 0.9385, + "step": 30037 + }, + { + "epoch": 0.77, + "learning_rate": 1.742510039125235e-06, + "loss": 1.1328, + "step": 30038 + }, + { + "epoch": 0.77, + "learning_rate": 1.7424915042042632e-06, + "loss": 0.9463, + "step": 30039 + }, + { + "epoch": 0.77, + "learning_rate": 1.7424729687147997e-06, + "loss": 1.1299, + "step": 30040 + }, + { + "epoch": 0.77, + "learning_rate": 1.742454432656859e-06, + "loss": 0.8906, + "step": 30041 + }, + { + "epoch": 0.77, + "learning_rate": 1.7424358960304549e-06, + "loss": 0.8525, + "step": 30042 + }, + { + "epoch": 0.77, + "learning_rate": 1.7424173588356017e-06, + "loss": 1.0215, + "step": 30043 + }, + { + "epoch": 0.77, + "learning_rate": 1.7423988210723136e-06, + "loss": 0.9785, + "step": 30044 + }, + { + "epoch": 0.77, + "learning_rate": 1.7423802827406052e-06, + "loss": 1.0156, + "step": 30045 + }, + { + "epoch": 0.77, + "learning_rate": 1.7423617438404903e-06, + "loss": 0.9365, + "step": 30046 + }, + { + "epoch": 0.77, + "learning_rate": 1.7423432043719833e-06, + "loss": 0.7378, + "step": 30047 + }, + { + "epoch": 0.77, + "learning_rate": 1.7423246643350978e-06, + "loss": 0.96, + "step": 30048 + }, + { + "epoch": 0.77, + "learning_rate": 1.7423061237298486e-06, + "loss": 0.7695, + "step": 30049 + }, + { + "epoch": 0.77, + "learning_rate": 1.7422875825562498e-06, + "loss": 0.7852, + "step": 30050 + }, + { + "epoch": 0.77, + "learning_rate": 1.7422690408143154e-06, + "loss": 1.0078, + "step": 30051 + }, + { + "epoch": 0.77, + "learning_rate": 1.74225049850406e-06, + "loss": 0.8975, + "step": 30052 + }, + { + "epoch": 0.77, + "learning_rate": 1.7422319556254972e-06, + "loss": 0.8242, + "step": 30053 + }, + { + "epoch": 0.77, + "learning_rate": 1.7422134121786415e-06, + "loss": 0.6711, + "step": 30054 + }, + { + "epoch": 0.77, + "learning_rate": 1.7421948681635075e-06, + "loss": 0.8564, + "step": 30055 + }, + { + "epoch": 0.77, + "learning_rate": 1.7421763235801085e-06, + "loss": 0.8779, + "step": 30056 + }, + { + "epoch": 0.77, + "learning_rate": 1.7421577784284595e-06, + "loss": 1.0498, + "step": 30057 + }, + { + "epoch": 0.77, + "learning_rate": 1.7421392327085746e-06, + "loss": 0.8994, + "step": 30058 + }, + { + "epoch": 0.77, + "learning_rate": 1.7421206864204679e-06, + "loss": 0.8682, + "step": 30059 + }, + { + "epoch": 0.77, + "learning_rate": 1.742102139564153e-06, + "loss": 0.6389, + "step": 30060 + }, + { + "epoch": 0.77, + "learning_rate": 1.7420835921396448e-06, + "loss": 0.9697, + "step": 30061 + }, + { + "epoch": 0.77, + "learning_rate": 1.7420650441469573e-06, + "loss": 0.6621, + "step": 30062 + }, + { + "epoch": 0.77, + "learning_rate": 1.7420464955861049e-06, + "loss": 0.9287, + "step": 30063 + }, + { + "epoch": 0.77, + "learning_rate": 1.7420279464571017e-06, + "loss": 0.8994, + "step": 30064 + }, + { + "epoch": 0.77, + "learning_rate": 1.7420093967599616e-06, + "loss": 0.9678, + "step": 30065 + }, + { + "epoch": 0.77, + "learning_rate": 1.741990846494699e-06, + "loss": 0.8489, + "step": 30066 + }, + { + "epoch": 0.77, + "learning_rate": 1.7419722956613284e-06, + "loss": 0.9453, + "step": 30067 + }, + { + "epoch": 0.77, + "learning_rate": 1.7419537442598633e-06, + "loss": 0.728, + "step": 30068 + }, + { + "epoch": 0.77, + "learning_rate": 1.7419351922903184e-06, + "loss": 0.8184, + "step": 30069 + }, + { + "epoch": 0.77, + "learning_rate": 1.7419166397527083e-06, + "loss": 0.8877, + "step": 30070 + }, + { + "epoch": 0.77, + "learning_rate": 1.7418980866470464e-06, + "loss": 0.6064, + "step": 30071 + }, + { + "epoch": 0.77, + "learning_rate": 1.741879532973347e-06, + "loss": 0.8477, + "step": 30072 + }, + { + "epoch": 0.77, + "learning_rate": 1.741860978731625e-06, + "loss": 0.7124, + "step": 30073 + }, + { + "epoch": 0.77, + "learning_rate": 1.741842423921894e-06, + "loss": 0.7188, + "step": 30074 + }, + { + "epoch": 0.77, + "learning_rate": 1.7418238685441684e-06, + "loss": 0.6265, + "step": 30075 + }, + { + "epoch": 0.77, + "learning_rate": 1.7418053125984624e-06, + "loss": 0.6475, + "step": 30076 + }, + { + "epoch": 0.77, + "learning_rate": 1.7417867560847901e-06, + "loss": 0.6787, + "step": 30077 + }, + { + "epoch": 0.77, + "learning_rate": 1.741768199003166e-06, + "loss": 0.9756, + "step": 30078 + }, + { + "epoch": 0.77, + "learning_rate": 1.7417496413536034e-06, + "loss": 1.0234, + "step": 30079 + }, + { + "epoch": 0.77, + "learning_rate": 1.741731083136118e-06, + "loss": 0.9351, + "step": 30080 + }, + { + "epoch": 0.77, + "learning_rate": 1.741712524350723e-06, + "loss": 0.9102, + "step": 30081 + }, + { + "epoch": 0.77, + "learning_rate": 1.7416939649974327e-06, + "loss": 1.0098, + "step": 30082 + }, + { + "epoch": 0.77, + "learning_rate": 1.7416754050762612e-06, + "loss": 0.8119, + "step": 30083 + }, + { + "epoch": 0.77, + "learning_rate": 1.7416568445872235e-06, + "loss": 0.8242, + "step": 30084 + }, + { + "epoch": 0.77, + "learning_rate": 1.7416382835303329e-06, + "loss": 0.917, + "step": 30085 + }, + { + "epoch": 0.77, + "learning_rate": 1.741619721905604e-06, + "loss": 1.0117, + "step": 30086 + }, + { + "epoch": 0.77, + "learning_rate": 1.741601159713051e-06, + "loss": 0.916, + "step": 30087 + }, + { + "epoch": 0.77, + "learning_rate": 1.7415825969526882e-06, + "loss": 0.6831, + "step": 30088 + }, + { + "epoch": 0.77, + "learning_rate": 1.7415640336245297e-06, + "loss": 0.9668, + "step": 30089 + }, + { + "epoch": 0.77, + "learning_rate": 1.7415454697285896e-06, + "loss": 0.8506, + "step": 30090 + }, + { + "epoch": 0.77, + "learning_rate": 1.7415269052648825e-06, + "loss": 0.9053, + "step": 30091 + }, + { + "epoch": 0.77, + "learning_rate": 1.7415083402334219e-06, + "loss": 0.7109, + "step": 30092 + }, + { + "epoch": 0.77, + "learning_rate": 1.7414897746342226e-06, + "loss": 1.0107, + "step": 30093 + }, + { + "epoch": 0.77, + "learning_rate": 1.741471208467299e-06, + "loss": 0.7842, + "step": 30094 + }, + { + "epoch": 0.77, + "learning_rate": 1.7414526417326645e-06, + "loss": 0.7759, + "step": 30095 + }, + { + "epoch": 0.77, + "learning_rate": 1.7414340744303341e-06, + "loss": 0.9102, + "step": 30096 + }, + { + "epoch": 0.77, + "learning_rate": 1.7414155065603217e-06, + "loss": 0.7686, + "step": 30097 + }, + { + "epoch": 0.77, + "learning_rate": 1.7413969381226416e-06, + "loss": 0.9473, + "step": 30098 + }, + { + "epoch": 0.77, + "learning_rate": 1.7413783691173079e-06, + "loss": 1.0576, + "step": 30099 + }, + { + "epoch": 0.77, + "learning_rate": 1.7413597995443349e-06, + "loss": 0.605, + "step": 30100 + }, + { + "epoch": 0.77, + "learning_rate": 1.7413412294037367e-06, + "loss": 1.0273, + "step": 30101 + }, + { + "epoch": 0.77, + "learning_rate": 1.7413226586955275e-06, + "loss": 0.8276, + "step": 30102 + }, + { + "epoch": 0.77, + "learning_rate": 1.7413040874197216e-06, + "loss": 0.8486, + "step": 30103 + }, + { + "epoch": 0.77, + "learning_rate": 1.7412855155763335e-06, + "loss": 0.9004, + "step": 30104 + }, + { + "epoch": 0.77, + "learning_rate": 1.7412669431653773e-06, + "loss": 0.6589, + "step": 30105 + }, + { + "epoch": 0.77, + "learning_rate": 1.7412483701868668e-06, + "loss": 1.0703, + "step": 30106 + }, + { + "epoch": 0.77, + "learning_rate": 1.7412297966408165e-06, + "loss": 0.9082, + "step": 30107 + }, + { + "epoch": 0.77, + "learning_rate": 1.7412112225272405e-06, + "loss": 0.9766, + "step": 30108 + }, + { + "epoch": 0.77, + "learning_rate": 1.7411926478461534e-06, + "loss": 0.9307, + "step": 30109 + }, + { + "epoch": 0.77, + "learning_rate": 1.7411740725975692e-06, + "loss": 0.8652, + "step": 30110 + }, + { + "epoch": 0.77, + "learning_rate": 1.7411554967815021e-06, + "loss": 0.8672, + "step": 30111 + }, + { + "epoch": 0.77, + "learning_rate": 1.7411369203979662e-06, + "loss": 0.9072, + "step": 30112 + }, + { + "epoch": 0.77, + "learning_rate": 1.7411183434469758e-06, + "loss": 1.04, + "step": 30113 + }, + { + "epoch": 0.77, + "learning_rate": 1.741099765928545e-06, + "loss": 0.8672, + "step": 30114 + }, + { + "epoch": 0.77, + "learning_rate": 1.7410811878426887e-06, + "loss": 0.7842, + "step": 30115 + }, + { + "epoch": 0.77, + "learning_rate": 1.7410626091894202e-06, + "loss": 0.8511, + "step": 30116 + }, + { + "epoch": 0.77, + "learning_rate": 1.7410440299687544e-06, + "loss": 0.9414, + "step": 30117 + }, + { + "epoch": 0.77, + "learning_rate": 1.741025450180705e-06, + "loss": 0.7871, + "step": 30118 + }, + { + "epoch": 0.77, + "learning_rate": 1.7410068698252866e-06, + "loss": 0.9775, + "step": 30119 + }, + { + "epoch": 0.77, + "learning_rate": 1.7409882889025134e-06, + "loss": 0.9014, + "step": 30120 + }, + { + "epoch": 0.77, + "learning_rate": 1.7409697074123994e-06, + "loss": 0.7017, + "step": 30121 + }, + { + "epoch": 0.77, + "learning_rate": 1.740951125354959e-06, + "loss": 1.0225, + "step": 30122 + }, + { + "epoch": 0.77, + "learning_rate": 1.7409325427302064e-06, + "loss": 0.7537, + "step": 30123 + }, + { + "epoch": 0.77, + "learning_rate": 1.7409139595381559e-06, + "loss": 0.853, + "step": 30124 + }, + { + "epoch": 0.77, + "learning_rate": 1.7408953757788214e-06, + "loss": 0.8369, + "step": 30125 + }, + { + "epoch": 0.77, + "learning_rate": 1.7408767914522177e-06, + "loss": 0.8428, + "step": 30126 + }, + { + "epoch": 0.77, + "learning_rate": 1.7408582065583585e-06, + "loss": 0.9619, + "step": 30127 + }, + { + "epoch": 0.77, + "learning_rate": 1.7408396210972582e-06, + "loss": 1.0498, + "step": 30128 + }, + { + "epoch": 0.77, + "learning_rate": 1.7408210350689314e-06, + "loss": 0.8613, + "step": 30129 + }, + { + "epoch": 0.77, + "learning_rate": 1.7408024484733916e-06, + "loss": 0.8013, + "step": 30130 + }, + { + "epoch": 0.77, + "learning_rate": 1.7407838613106537e-06, + "loss": 0.8193, + "step": 30131 + }, + { + "epoch": 0.77, + "learning_rate": 1.7407652735807313e-06, + "loss": 0.9072, + "step": 30132 + }, + { + "epoch": 0.77, + "learning_rate": 1.7407466852836395e-06, + "loss": 0.875, + "step": 30133 + }, + { + "epoch": 0.77, + "learning_rate": 1.7407280964193918e-06, + "loss": 1.0312, + "step": 30134 + }, + { + "epoch": 0.77, + "learning_rate": 1.7407095069880024e-06, + "loss": 0.9639, + "step": 30135 + }, + { + "epoch": 0.77, + "learning_rate": 1.7406909169894863e-06, + "loss": 0.7524, + "step": 30136 + }, + { + "epoch": 0.77, + "learning_rate": 1.7406723264238567e-06, + "loss": 0.6846, + "step": 30137 + }, + { + "epoch": 0.77, + "learning_rate": 1.7406537352911287e-06, + "loss": 0.8516, + "step": 30138 + }, + { + "epoch": 0.77, + "learning_rate": 1.7406351435913163e-06, + "loss": 0.6411, + "step": 30139 + }, + { + "epoch": 0.77, + "learning_rate": 1.7406165513244332e-06, + "loss": 0.8232, + "step": 30140 + }, + { + "epoch": 0.77, + "learning_rate": 1.7405979584904945e-06, + "loss": 0.8765, + "step": 30141 + }, + { + "epoch": 0.77, + "learning_rate": 1.7405793650895135e-06, + "loss": 1.0625, + "step": 30142 + }, + { + "epoch": 0.77, + "learning_rate": 1.7405607711215054e-06, + "loss": 1.0586, + "step": 30143 + }, + { + "epoch": 0.77, + "learning_rate": 1.7405421765864837e-06, + "loss": 0.6953, + "step": 30144 + }, + { + "epoch": 0.77, + "learning_rate": 1.740523581484463e-06, + "loss": 0.8872, + "step": 30145 + }, + { + "epoch": 0.77, + "learning_rate": 1.7405049858154573e-06, + "loss": 1.042, + "step": 30146 + }, + { + "epoch": 0.77, + "learning_rate": 1.7404863895794813e-06, + "loss": 0.7988, + "step": 30147 + }, + { + "epoch": 0.77, + "learning_rate": 1.7404677927765485e-06, + "loss": 0.9473, + "step": 30148 + }, + { + "epoch": 0.77, + "learning_rate": 1.7404491954066738e-06, + "loss": 0.7305, + "step": 30149 + }, + { + "epoch": 0.77, + "learning_rate": 1.7404305974698712e-06, + "loss": 0.8945, + "step": 30150 + }, + { + "epoch": 0.77, + "learning_rate": 1.740411998966155e-06, + "loss": 0.8506, + "step": 30151 + }, + { + "epoch": 0.77, + "learning_rate": 1.7403933998955393e-06, + "loss": 0.8779, + "step": 30152 + }, + { + "epoch": 0.77, + "learning_rate": 1.7403748002580386e-06, + "loss": 0.7495, + "step": 30153 + }, + { + "epoch": 0.77, + "learning_rate": 1.7403562000536668e-06, + "loss": 0.9785, + "step": 30154 + }, + { + "epoch": 0.77, + "learning_rate": 1.740337599282438e-06, + "loss": 0.9492, + "step": 30155 + }, + { + "epoch": 0.77, + "learning_rate": 1.740318997944367e-06, + "loss": 0.7407, + "step": 30156 + }, + { + "epoch": 0.77, + "learning_rate": 1.7403003960394678e-06, + "loss": 1.1143, + "step": 30157 + }, + { + "epoch": 0.77, + "learning_rate": 1.7402817935677545e-06, + "loss": 0.657, + "step": 30158 + }, + { + "epoch": 0.77, + "learning_rate": 1.7402631905292418e-06, + "loss": 0.9424, + "step": 30159 + }, + { + "epoch": 0.77, + "learning_rate": 1.7402445869239434e-06, + "loss": 0.6904, + "step": 30160 + }, + { + "epoch": 0.77, + "learning_rate": 1.7402259827518738e-06, + "loss": 0.6812, + "step": 30161 + }, + { + "epoch": 0.77, + "learning_rate": 1.740207378013047e-06, + "loss": 0.8228, + "step": 30162 + }, + { + "epoch": 0.77, + "learning_rate": 1.7401887727074777e-06, + "loss": 0.9106, + "step": 30163 + }, + { + "epoch": 0.77, + "learning_rate": 1.7401701668351799e-06, + "loss": 0.75, + "step": 30164 + }, + { + "epoch": 0.77, + "learning_rate": 1.7401515603961676e-06, + "loss": 0.7104, + "step": 30165 + }, + { + "epoch": 0.77, + "learning_rate": 1.7401329533904554e-06, + "loss": 1.0049, + "step": 30166 + }, + { + "epoch": 0.77, + "learning_rate": 1.7401143458180573e-06, + "loss": 0.9951, + "step": 30167 + }, + { + "epoch": 0.77, + "learning_rate": 1.7400957376789881e-06, + "loss": 0.6538, + "step": 30168 + }, + { + "epoch": 0.77, + "learning_rate": 1.7400771289732613e-06, + "loss": 0.873, + "step": 30169 + }, + { + "epoch": 0.77, + "learning_rate": 1.7400585197008914e-06, + "loss": 1.0586, + "step": 30170 + }, + { + "epoch": 0.77, + "learning_rate": 1.740039909861893e-06, + "loss": 0.7783, + "step": 30171 + }, + { + "epoch": 0.77, + "learning_rate": 1.7400212994562796e-06, + "loss": 0.999, + "step": 30172 + }, + { + "epoch": 0.77, + "learning_rate": 1.7400026884840667e-06, + "loss": 0.9355, + "step": 30173 + }, + { + "epoch": 0.77, + "learning_rate": 1.739984076945267e-06, + "loss": 0.8682, + "step": 30174 + }, + { + "epoch": 0.77, + "learning_rate": 1.739965464839896e-06, + "loss": 0.8291, + "step": 30175 + }, + { + "epoch": 0.77, + "learning_rate": 1.7399468521679672e-06, + "loss": 0.6477, + "step": 30176 + }, + { + "epoch": 0.77, + "learning_rate": 1.7399282389294952e-06, + "loss": 0.9854, + "step": 30177 + }, + { + "epoch": 0.77, + "learning_rate": 1.7399096251244943e-06, + "loss": 0.8579, + "step": 30178 + }, + { + "epoch": 0.77, + "learning_rate": 1.7398910107529785e-06, + "loss": 0.7935, + "step": 30179 + }, + { + "epoch": 0.77, + "learning_rate": 1.7398723958149621e-06, + "loss": 0.9609, + "step": 30180 + }, + { + "epoch": 0.77, + "learning_rate": 1.7398537803104593e-06, + "loss": 0.7815, + "step": 30181 + }, + { + "epoch": 0.77, + "learning_rate": 1.739835164239485e-06, + "loss": 0.8408, + "step": 30182 + }, + { + "epoch": 0.77, + "learning_rate": 1.7398165476020522e-06, + "loss": 0.6514, + "step": 30183 + }, + { + "epoch": 0.77, + "learning_rate": 1.7397979303981764e-06, + "loss": 0.9893, + "step": 30184 + }, + { + "epoch": 0.77, + "learning_rate": 1.7397793126278714e-06, + "loss": 0.8281, + "step": 30185 + }, + { + "epoch": 0.77, + "learning_rate": 1.7397606942911513e-06, + "loss": 0.7368, + "step": 30186 + }, + { + "epoch": 0.77, + "learning_rate": 1.7397420753880306e-06, + "loss": 0.8271, + "step": 30187 + }, + { + "epoch": 0.77, + "learning_rate": 1.739723455918523e-06, + "loss": 0.8574, + "step": 30188 + }, + { + "epoch": 0.77, + "learning_rate": 1.7397048358826432e-06, + "loss": 0.7236, + "step": 30189 + }, + { + "epoch": 0.77, + "learning_rate": 1.7396862152804057e-06, + "loss": 0.7354, + "step": 30190 + }, + { + "epoch": 0.77, + "learning_rate": 1.7396675941118245e-06, + "loss": 0.8447, + "step": 30191 + }, + { + "epoch": 0.77, + "learning_rate": 1.7396489723769134e-06, + "loss": 0.9609, + "step": 30192 + }, + { + "epoch": 0.77, + "learning_rate": 1.7396303500756875e-06, + "loss": 0.6792, + "step": 30193 + }, + { + "epoch": 0.77, + "learning_rate": 1.7396117272081606e-06, + "loss": 0.8379, + "step": 30194 + }, + { + "epoch": 0.77, + "learning_rate": 1.739593103774347e-06, + "loss": 0.8652, + "step": 30195 + }, + { + "epoch": 0.77, + "learning_rate": 1.7395744797742609e-06, + "loss": 0.7949, + "step": 30196 + }, + { + "epoch": 0.77, + "learning_rate": 1.7395558552079166e-06, + "loss": 0.6934, + "step": 30197 + }, + { + "epoch": 0.77, + "learning_rate": 1.7395372300753283e-06, + "loss": 0.8174, + "step": 30198 + }, + { + "epoch": 0.77, + "learning_rate": 1.7395186043765103e-06, + "loss": 0.9131, + "step": 30199 + }, + { + "epoch": 0.77, + "learning_rate": 1.7394999781114773e-06, + "loss": 0.8418, + "step": 30200 + }, + { + "epoch": 0.77, + "learning_rate": 1.739481351280243e-06, + "loss": 1.0859, + "step": 30201 + }, + { + "epoch": 0.77, + "learning_rate": 1.7394627238828216e-06, + "loss": 0.7998, + "step": 30202 + }, + { + "epoch": 0.77, + "learning_rate": 1.7394440959192279e-06, + "loss": 0.729, + "step": 30203 + }, + { + "epoch": 0.77, + "learning_rate": 1.7394254673894757e-06, + "loss": 0.7725, + "step": 30204 + }, + { + "epoch": 0.77, + "learning_rate": 1.7394068382935796e-06, + "loss": 0.875, + "step": 30205 + }, + { + "epoch": 0.77, + "learning_rate": 1.7393882086315535e-06, + "loss": 0.7285, + "step": 30206 + }, + { + "epoch": 0.77, + "learning_rate": 1.7393695784034117e-06, + "loss": 0.793, + "step": 30207 + }, + { + "epoch": 0.77, + "learning_rate": 1.739350947609169e-06, + "loss": 0.8779, + "step": 30208 + }, + { + "epoch": 0.77, + "learning_rate": 1.7393323162488392e-06, + "loss": 0.9805, + "step": 30209 + }, + { + "epoch": 0.77, + "learning_rate": 1.7393136843224363e-06, + "loss": 0.6309, + "step": 30210 + }, + { + "epoch": 0.77, + "learning_rate": 1.7392950518299751e-06, + "loss": 0.7703, + "step": 30211 + }, + { + "epoch": 0.77, + "learning_rate": 1.7392764187714696e-06, + "loss": 0.8018, + "step": 30212 + }, + { + "epoch": 0.77, + "learning_rate": 1.7392577851469343e-06, + "loss": 0.7725, + "step": 30213 + }, + { + "epoch": 0.77, + "learning_rate": 1.7392391509563834e-06, + "loss": 0.7744, + "step": 30214 + }, + { + "epoch": 0.77, + "learning_rate": 1.7392205161998308e-06, + "loss": 0.8311, + "step": 30215 + }, + { + "epoch": 0.77, + "learning_rate": 1.739201880877291e-06, + "loss": 0.8701, + "step": 30216 + }, + { + "epoch": 0.77, + "learning_rate": 1.7391832449887784e-06, + "loss": 0.7534, + "step": 30217 + }, + { + "epoch": 0.77, + "learning_rate": 1.7391646085343075e-06, + "loss": 0.6035, + "step": 30218 + }, + { + "epoch": 0.77, + "learning_rate": 1.739145971513892e-06, + "loss": 0.7715, + "step": 30219 + }, + { + "epoch": 0.77, + "learning_rate": 1.7391273339275463e-06, + "loss": 0.8525, + "step": 30220 + }, + { + "epoch": 0.77, + "learning_rate": 1.7391086957752847e-06, + "loss": 0.8438, + "step": 30221 + }, + { + "epoch": 0.77, + "learning_rate": 1.7390900570571218e-06, + "loss": 0.7949, + "step": 30222 + }, + { + "epoch": 0.77, + "learning_rate": 1.7390714177730717e-06, + "loss": 0.7783, + "step": 30223 + }, + { + "epoch": 0.77, + "learning_rate": 1.7390527779231485e-06, + "loss": 0.8828, + "step": 30224 + }, + { + "epoch": 0.77, + "learning_rate": 1.7390341375073664e-06, + "loss": 0.6558, + "step": 30225 + }, + { + "epoch": 0.77, + "learning_rate": 1.7390154965257399e-06, + "loss": 0.8223, + "step": 30226 + }, + { + "epoch": 0.77, + "learning_rate": 1.7389968549782835e-06, + "loss": 1.0234, + "step": 30227 + }, + { + "epoch": 0.77, + "learning_rate": 1.7389782128650107e-06, + "loss": 1.001, + "step": 30228 + }, + { + "epoch": 0.77, + "learning_rate": 1.7389595701859367e-06, + "loss": 0.8154, + "step": 30229 + }, + { + "epoch": 0.77, + "learning_rate": 1.7389409269410752e-06, + "loss": 1.0703, + "step": 30230 + }, + { + "epoch": 0.77, + "learning_rate": 1.7389222831304406e-06, + "loss": 1.1436, + "step": 30231 + }, + { + "epoch": 0.77, + "learning_rate": 1.7389036387540472e-06, + "loss": 0.8828, + "step": 30232 + }, + { + "epoch": 0.77, + "learning_rate": 1.7388849938119093e-06, + "loss": 0.4924, + "step": 30233 + }, + { + "epoch": 0.77, + "learning_rate": 1.7388663483040409e-06, + "loss": 0.792, + "step": 30234 + }, + { + "epoch": 0.77, + "learning_rate": 1.7388477022304567e-06, + "loss": 0.8311, + "step": 30235 + }, + { + "epoch": 0.77, + "learning_rate": 1.7388290555911706e-06, + "loss": 1.0156, + "step": 30236 + }, + { + "epoch": 0.77, + "learning_rate": 1.7388104083861975e-06, + "loss": 0.6714, + "step": 30237 + }, + { + "epoch": 0.78, + "learning_rate": 1.7387917606155509e-06, + "loss": 0.8828, + "step": 30238 + }, + { + "epoch": 0.78, + "learning_rate": 1.7387731122792454e-06, + "loss": 0.7871, + "step": 30239 + }, + { + "epoch": 0.78, + "learning_rate": 1.7387544633772952e-06, + "loss": 0.8174, + "step": 30240 + }, + { + "epoch": 0.78, + "learning_rate": 1.7387358139097153e-06, + "loss": 1.0166, + "step": 30241 + }, + { + "epoch": 0.78, + "learning_rate": 1.7387171638765189e-06, + "loss": 0.9453, + "step": 30242 + }, + { + "epoch": 0.78, + "learning_rate": 1.7386985132777205e-06, + "loss": 1.0244, + "step": 30243 + }, + { + "epoch": 0.78, + "learning_rate": 1.7386798621133349e-06, + "loss": 0.8242, + "step": 30244 + }, + { + "epoch": 0.78, + "learning_rate": 1.738661210383376e-06, + "loss": 0.8535, + "step": 30245 + }, + { + "epoch": 0.78, + "learning_rate": 1.7386425580878585e-06, + "loss": 1.0713, + "step": 30246 + }, + { + "epoch": 0.78, + "learning_rate": 1.738623905226796e-06, + "loss": 0.9316, + "step": 30247 + }, + { + "epoch": 0.78, + "learning_rate": 1.7386052518002033e-06, + "loss": 0.8516, + "step": 30248 + }, + { + "epoch": 0.78, + "learning_rate": 1.7385865978080942e-06, + "loss": 0.6208, + "step": 30249 + }, + { + "epoch": 0.78, + "learning_rate": 1.7385679432504836e-06, + "loss": 0.8916, + "step": 30250 + }, + { + "epoch": 0.78, + "learning_rate": 1.7385492881273855e-06, + "loss": 0.8545, + "step": 30251 + }, + { + "epoch": 0.78, + "learning_rate": 1.738530632438814e-06, + "loss": 0.9424, + "step": 30252 + }, + { + "epoch": 0.78, + "learning_rate": 1.738511976184784e-06, + "loss": 0.5132, + "step": 30253 + }, + { + "epoch": 0.78, + "learning_rate": 1.7384933193653088e-06, + "loss": 0.9106, + "step": 30254 + }, + { + "epoch": 0.78, + "learning_rate": 1.7384746619804034e-06, + "loss": 0.9678, + "step": 30255 + }, + { + "epoch": 0.78, + "learning_rate": 1.738456004030082e-06, + "loss": 0.9316, + "step": 30256 + }, + { + "epoch": 0.78, + "learning_rate": 1.7384373455143586e-06, + "loss": 0.7559, + "step": 30257 + }, + { + "epoch": 0.78, + "learning_rate": 1.738418686433248e-06, + "loss": 0.7959, + "step": 30258 + }, + { + "epoch": 0.78, + "learning_rate": 1.7384000267867638e-06, + "loss": 0.9883, + "step": 30259 + }, + { + "epoch": 0.78, + "learning_rate": 1.738381366574921e-06, + "loss": 0.835, + "step": 30260 + }, + { + "epoch": 0.78, + "learning_rate": 1.7383627057977332e-06, + "loss": 0.8623, + "step": 30261 + }, + { + "epoch": 0.78, + "learning_rate": 1.7383440444552152e-06, + "loss": 0.9297, + "step": 30262 + }, + { + "epoch": 0.78, + "learning_rate": 1.7383253825473814e-06, + "loss": 0.8213, + "step": 30263 + }, + { + "epoch": 0.78, + "learning_rate": 1.7383067200742452e-06, + "loss": 0.8599, + "step": 30264 + }, + { + "epoch": 0.78, + "learning_rate": 1.738288057035822e-06, + "loss": 0.8857, + "step": 30265 + }, + { + "epoch": 0.78, + "learning_rate": 1.7382693934321253e-06, + "loss": 0.832, + "step": 30266 + }, + { + "epoch": 0.78, + "learning_rate": 1.7382507292631696e-06, + "loss": 0.7212, + "step": 30267 + }, + { + "epoch": 0.78, + "learning_rate": 1.7382320645289697e-06, + "loss": 0.8838, + "step": 30268 + }, + { + "epoch": 0.78, + "learning_rate": 1.738213399229539e-06, + "loss": 0.8926, + "step": 30269 + }, + { + "epoch": 0.78, + "learning_rate": 1.7381947333648923e-06, + "loss": 1.0518, + "step": 30270 + }, + { + "epoch": 0.78, + "learning_rate": 1.7381760669350443e-06, + "loss": 0.9883, + "step": 30271 + }, + { + "epoch": 0.78, + "learning_rate": 1.7381573999400082e-06, + "loss": 0.458, + "step": 30272 + }, + { + "epoch": 0.78, + "learning_rate": 1.7381387323797994e-06, + "loss": 0.8584, + "step": 30273 + }, + { + "epoch": 0.78, + "learning_rate": 1.7381200642544314e-06, + "loss": 0.7959, + "step": 30274 + }, + { + "epoch": 0.78, + "learning_rate": 1.7381013955639188e-06, + "loss": 0.7988, + "step": 30275 + }, + { + "epoch": 0.78, + "learning_rate": 1.738082726308276e-06, + "loss": 0.6157, + "step": 30276 + }, + { + "epoch": 0.78, + "learning_rate": 1.7380640564875172e-06, + "loss": 0.5559, + "step": 30277 + }, + { + "epoch": 0.78, + "learning_rate": 1.7380453861016569e-06, + "loss": 0.9351, + "step": 30278 + }, + { + "epoch": 0.78, + "learning_rate": 1.738026715150709e-06, + "loss": 0.999, + "step": 30279 + }, + { + "epoch": 0.78, + "learning_rate": 1.738008043634688e-06, + "loss": 1.0986, + "step": 30280 + }, + { + "epoch": 0.78, + "learning_rate": 1.737989371553608e-06, + "loss": 0.7803, + "step": 30281 + }, + { + "epoch": 0.78, + "learning_rate": 1.7379706989074835e-06, + "loss": 0.874, + "step": 30282 + }, + { + "epoch": 0.78, + "learning_rate": 1.737952025696329e-06, + "loss": 1.1289, + "step": 30283 + }, + { + "epoch": 0.78, + "learning_rate": 1.7379333519201584e-06, + "loss": 1.0225, + "step": 30284 + }, + { + "epoch": 0.78, + "learning_rate": 1.737914677578986e-06, + "loss": 0.67, + "step": 30285 + }, + { + "epoch": 0.78, + "learning_rate": 1.7378960026728269e-06, + "loss": 0.9209, + "step": 30286 + }, + { + "epoch": 0.78, + "learning_rate": 1.7378773272016941e-06, + "loss": 1.0312, + "step": 30287 + }, + { + "epoch": 0.78, + "learning_rate": 1.7378586511656027e-06, + "loss": 0.7856, + "step": 30288 + }, + { + "epoch": 0.78, + "learning_rate": 1.737839974564567e-06, + "loss": 0.8936, + "step": 30289 + }, + { + "epoch": 0.78, + "learning_rate": 1.737821297398601e-06, + "loss": 0.9736, + "step": 30290 + }, + { + "epoch": 0.78, + "learning_rate": 1.7378026196677197e-06, + "loss": 1.0264, + "step": 30291 + }, + { + "epoch": 0.78, + "learning_rate": 1.7377839413719362e-06, + "loss": 0.6729, + "step": 30292 + }, + { + "epoch": 0.78, + "learning_rate": 1.7377652625112658e-06, + "loss": 0.8789, + "step": 30293 + }, + { + "epoch": 0.78, + "learning_rate": 1.7377465830857223e-06, + "loss": 0.8611, + "step": 30294 + }, + { + "epoch": 0.78, + "learning_rate": 1.7377279030953202e-06, + "loss": 0.8027, + "step": 30295 + }, + { + "epoch": 0.78, + "learning_rate": 1.7377092225400738e-06, + "loss": 0.7178, + "step": 30296 + }, + { + "epoch": 0.78, + "learning_rate": 1.7376905414199975e-06, + "loss": 0.7063, + "step": 30297 + }, + { + "epoch": 0.78, + "learning_rate": 1.7376718597351052e-06, + "loss": 0.9229, + "step": 30298 + }, + { + "epoch": 0.78, + "learning_rate": 1.7376531774854115e-06, + "loss": 0.4912, + "step": 30299 + }, + { + "epoch": 0.78, + "learning_rate": 1.7376344946709306e-06, + "loss": 1.0498, + "step": 30300 + }, + { + "epoch": 0.78, + "learning_rate": 1.7376158112916772e-06, + "loss": 0.957, + "step": 30301 + }, + { + "epoch": 0.78, + "learning_rate": 1.7375971273476653e-06, + "loss": 0.7397, + "step": 30302 + }, + { + "epoch": 0.78, + "learning_rate": 1.737578442838909e-06, + "loss": 0.9224, + "step": 30303 + }, + { + "epoch": 0.78, + "learning_rate": 1.737559757765423e-06, + "loss": 0.6968, + "step": 30304 + }, + { + "epoch": 0.78, + "learning_rate": 1.737541072127221e-06, + "loss": 0.8496, + "step": 30305 + }, + { + "epoch": 0.78, + "learning_rate": 1.737522385924318e-06, + "loss": 0.8818, + "step": 30306 + }, + { + "epoch": 0.78, + "learning_rate": 1.737503699156728e-06, + "loss": 0.834, + "step": 30307 + }, + { + "epoch": 0.78, + "learning_rate": 1.7374850118244653e-06, + "loss": 1.0293, + "step": 30308 + }, + { + "epoch": 0.78, + "learning_rate": 1.7374663239275443e-06, + "loss": 0.9229, + "step": 30309 + }, + { + "epoch": 0.78, + "learning_rate": 1.7374476354659793e-06, + "loss": 0.7646, + "step": 30310 + }, + { + "epoch": 0.78, + "learning_rate": 1.7374289464397842e-06, + "loss": 0.9375, + "step": 30311 + }, + { + "epoch": 0.78, + "learning_rate": 1.7374102568489742e-06, + "loss": 0.9668, + "step": 30312 + }, + { + "epoch": 0.78, + "learning_rate": 1.7373915666935628e-06, + "loss": 0.8223, + "step": 30313 + }, + { + "epoch": 0.78, + "learning_rate": 1.7373728759735645e-06, + "loss": 1.0098, + "step": 30314 + }, + { + "epoch": 0.78, + "learning_rate": 1.7373541846889937e-06, + "loss": 0.8125, + "step": 30315 + }, + { + "epoch": 0.78, + "learning_rate": 1.7373354928398648e-06, + "loss": 0.7646, + "step": 30316 + }, + { + "epoch": 0.78, + "learning_rate": 1.737316800426192e-06, + "loss": 0.8721, + "step": 30317 + }, + { + "epoch": 0.78, + "learning_rate": 1.7372981074479895e-06, + "loss": 0.8506, + "step": 30318 + }, + { + "epoch": 0.78, + "learning_rate": 1.737279413905272e-06, + "loss": 0.5801, + "step": 30319 + }, + { + "epoch": 0.78, + "learning_rate": 1.7372607197980533e-06, + "loss": 0.9014, + "step": 30320 + }, + { + "epoch": 0.78, + "learning_rate": 1.7372420251263482e-06, + "loss": 0.6562, + "step": 30321 + }, + { + "epoch": 0.78, + "learning_rate": 1.7372233298901705e-06, + "loss": 0.6641, + "step": 30322 + }, + { + "epoch": 0.78, + "learning_rate": 1.737204634089535e-06, + "loss": 0.8643, + "step": 30323 + }, + { + "epoch": 0.78, + "learning_rate": 1.7371859377244558e-06, + "loss": 0.9082, + "step": 30324 + }, + { + "epoch": 0.78, + "learning_rate": 1.7371672407949474e-06, + "loss": 0.8652, + "step": 30325 + }, + { + "epoch": 0.78, + "learning_rate": 1.7371485433010235e-06, + "loss": 0.9053, + "step": 30326 + }, + { + "epoch": 0.78, + "learning_rate": 1.7371298452426993e-06, + "loss": 0.8364, + "step": 30327 + }, + { + "epoch": 0.78, + "learning_rate": 1.7371111466199881e-06, + "loss": 0.8066, + "step": 30328 + }, + { + "epoch": 0.78, + "learning_rate": 1.7370924474329055e-06, + "loss": 0.6079, + "step": 30329 + }, + { + "epoch": 0.78, + "learning_rate": 1.7370737476814645e-06, + "loss": 0.8218, + "step": 30330 + }, + { + "epoch": 0.78, + "learning_rate": 1.7370550473656804e-06, + "loss": 0.811, + "step": 30331 + }, + { + "epoch": 0.78, + "learning_rate": 1.7370363464855671e-06, + "loss": 0.8223, + "step": 30332 + }, + { + "epoch": 0.78, + "learning_rate": 1.737017645041139e-06, + "loss": 0.6294, + "step": 30333 + }, + { + "epoch": 0.78, + "learning_rate": 1.7369989430324102e-06, + "loss": 0.9473, + "step": 30334 + }, + { + "epoch": 0.78, + "learning_rate": 1.736980240459395e-06, + "loss": 0.9619, + "step": 30335 + }, + { + "epoch": 0.78, + "learning_rate": 1.7369615373221082e-06, + "loss": 0.8083, + "step": 30336 + }, + { + "epoch": 0.78, + "learning_rate": 1.7369428336205638e-06, + "loss": 0.6841, + "step": 30337 + }, + { + "epoch": 0.78, + "learning_rate": 1.7369241293547764e-06, + "loss": 0.7646, + "step": 30338 + }, + { + "epoch": 0.78, + "learning_rate": 1.7369054245247596e-06, + "loss": 0.9561, + "step": 30339 + }, + { + "epoch": 0.78, + "learning_rate": 1.7368867191305285e-06, + "loss": 0.9238, + "step": 30340 + }, + { + "epoch": 0.78, + "learning_rate": 1.736868013172097e-06, + "loss": 0.9028, + "step": 30341 + }, + { + "epoch": 0.78, + "learning_rate": 1.7368493066494796e-06, + "loss": 0.6772, + "step": 30342 + }, + { + "epoch": 0.78, + "learning_rate": 1.7368305995626905e-06, + "loss": 0.8584, + "step": 30343 + }, + { + "epoch": 0.78, + "learning_rate": 1.7368118919117442e-06, + "loss": 0.8086, + "step": 30344 + }, + { + "epoch": 0.78, + "learning_rate": 1.736793183696655e-06, + "loss": 0.8525, + "step": 30345 + }, + { + "epoch": 0.78, + "learning_rate": 1.7367744749174368e-06, + "loss": 0.9971, + "step": 30346 + }, + { + "epoch": 0.78, + "learning_rate": 1.7367557655741045e-06, + "loss": 0.8477, + "step": 30347 + }, + { + "epoch": 0.78, + "learning_rate": 1.7367370556666722e-06, + "loss": 0.9004, + "step": 30348 + }, + { + "epoch": 0.78, + "learning_rate": 1.7367183451951545e-06, + "loss": 0.9785, + "step": 30349 + }, + { + "epoch": 0.78, + "learning_rate": 1.736699634159565e-06, + "loss": 0.6392, + "step": 30350 + }, + { + "epoch": 0.78, + "learning_rate": 1.7366809225599183e-06, + "loss": 0.9531, + "step": 30351 + }, + { + "epoch": 0.78, + "learning_rate": 1.7366622103962293e-06, + "loss": 0.8154, + "step": 30352 + }, + { + "epoch": 0.78, + "learning_rate": 1.7366434976685118e-06, + "loss": 0.7285, + "step": 30353 + }, + { + "epoch": 0.78, + "learning_rate": 1.7366247843767803e-06, + "loss": 0.8096, + "step": 30354 + }, + { + "epoch": 0.78, + "learning_rate": 1.736606070521049e-06, + "loss": 0.7668, + "step": 30355 + }, + { + "epoch": 0.78, + "learning_rate": 1.7365873561013324e-06, + "loss": 0.9199, + "step": 30356 + }, + { + "epoch": 0.78, + "learning_rate": 1.7365686411176445e-06, + "loss": 0.8145, + "step": 30357 + }, + { + "epoch": 0.78, + "learning_rate": 1.7365499255700002e-06, + "loss": 0.9717, + "step": 30358 + }, + { + "epoch": 0.78, + "learning_rate": 1.736531209458413e-06, + "loss": 0.7241, + "step": 30359 + }, + { + "epoch": 0.78, + "learning_rate": 1.7365124927828982e-06, + "loss": 0.8271, + "step": 30360 + }, + { + "epoch": 0.78, + "learning_rate": 1.7364937755434695e-06, + "loss": 0.7866, + "step": 30361 + }, + { + "epoch": 0.78, + "learning_rate": 1.7364750577401413e-06, + "loss": 1.0381, + "step": 30362 + }, + { + "epoch": 0.78, + "learning_rate": 1.736456339372928e-06, + "loss": 1.0342, + "step": 30363 + }, + { + "epoch": 0.78, + "learning_rate": 1.736437620441844e-06, + "loss": 0.856, + "step": 30364 + }, + { + "epoch": 0.78, + "learning_rate": 1.7364189009469036e-06, + "loss": 0.6858, + "step": 30365 + }, + { + "epoch": 0.78, + "learning_rate": 1.736400180888121e-06, + "loss": 0.7666, + "step": 30366 + }, + { + "epoch": 0.78, + "learning_rate": 1.7363814602655106e-06, + "loss": 0.9805, + "step": 30367 + }, + { + "epoch": 0.78, + "learning_rate": 1.7363627390790869e-06, + "loss": 0.7764, + "step": 30368 + }, + { + "epoch": 0.78, + "learning_rate": 1.7363440173288645e-06, + "loss": 0.7876, + "step": 30369 + }, + { + "epoch": 0.78, + "learning_rate": 1.7363252950148567e-06, + "loss": 0.8164, + "step": 30370 + }, + { + "epoch": 0.78, + "learning_rate": 1.7363065721370789e-06, + "loss": 1.0156, + "step": 30371 + }, + { + "epoch": 0.78, + "learning_rate": 1.7362878486955449e-06, + "loss": 0.8711, + "step": 30372 + }, + { + "epoch": 0.78, + "learning_rate": 1.736269124690269e-06, + "loss": 0.6108, + "step": 30373 + }, + { + "epoch": 0.78, + "learning_rate": 1.7362504001212658e-06, + "loss": 0.793, + "step": 30374 + }, + { + "epoch": 0.78, + "learning_rate": 1.7362316749885494e-06, + "loss": 0.8994, + "step": 30375 + }, + { + "epoch": 0.78, + "learning_rate": 1.7362129492921343e-06, + "loss": 0.8867, + "step": 30376 + }, + { + "epoch": 0.78, + "learning_rate": 1.7361942230320347e-06, + "loss": 0.7246, + "step": 30377 + }, + { + "epoch": 0.78, + "learning_rate": 1.7361754962082653e-06, + "loss": 1.0, + "step": 30378 + }, + { + "epoch": 0.78, + "learning_rate": 1.73615676882084e-06, + "loss": 0.7754, + "step": 30379 + }, + { + "epoch": 0.78, + "learning_rate": 1.7361380408697736e-06, + "loss": 0.7783, + "step": 30380 + }, + { + "epoch": 0.78, + "learning_rate": 1.73611931235508e-06, + "loss": 0.9141, + "step": 30381 + }, + { + "epoch": 0.78, + "learning_rate": 1.7361005832767734e-06, + "loss": 0.7754, + "step": 30382 + }, + { + "epoch": 0.78, + "learning_rate": 1.7360818536348689e-06, + "loss": 0.8477, + "step": 30383 + }, + { + "epoch": 0.78, + "learning_rate": 1.73606312342938e-06, + "loss": 1.002, + "step": 30384 + }, + { + "epoch": 0.78, + "learning_rate": 1.7360443926603216e-06, + "loss": 0.8555, + "step": 30385 + }, + { + "epoch": 0.78, + "learning_rate": 1.7360256613277077e-06, + "loss": 0.8359, + "step": 30386 + }, + { + "epoch": 0.78, + "learning_rate": 1.736006929431553e-06, + "loss": 0.4766, + "step": 30387 + }, + { + "epoch": 0.78, + "learning_rate": 1.7359881969718716e-06, + "loss": 0.8652, + "step": 30388 + }, + { + "epoch": 0.78, + "learning_rate": 1.7359694639486774e-06, + "loss": 0.8398, + "step": 30389 + }, + { + "epoch": 0.78, + "learning_rate": 1.7359507303619859e-06, + "loss": 0.9033, + "step": 30390 + }, + { + "epoch": 0.78, + "learning_rate": 1.7359319962118103e-06, + "loss": 0.793, + "step": 30391 + }, + { + "epoch": 0.78, + "learning_rate": 1.7359132614981658e-06, + "loss": 0.687, + "step": 30392 + }, + { + "epoch": 0.78, + "learning_rate": 1.735894526221066e-06, + "loss": 0.7871, + "step": 30393 + }, + { + "epoch": 0.78, + "learning_rate": 1.735875790380526e-06, + "loss": 0.834, + "step": 30394 + }, + { + "epoch": 0.78, + "learning_rate": 1.7358570539765593e-06, + "loss": 0.7656, + "step": 30395 + }, + { + "epoch": 0.78, + "learning_rate": 1.7358383170091807e-06, + "loss": 0.7188, + "step": 30396 + }, + { + "epoch": 0.78, + "learning_rate": 1.735819579478405e-06, + "loss": 0.9629, + "step": 30397 + }, + { + "epoch": 0.78, + "learning_rate": 1.7358008413842456e-06, + "loss": 0.9473, + "step": 30398 + }, + { + "epoch": 0.78, + "learning_rate": 1.7357821027267177e-06, + "loss": 0.7524, + "step": 30399 + }, + { + "epoch": 0.78, + "learning_rate": 1.735763363505835e-06, + "loss": 1.0625, + "step": 30400 + }, + { + "epoch": 0.78, + "learning_rate": 1.7357446237216123e-06, + "loss": 0.9697, + "step": 30401 + }, + { + "epoch": 0.78, + "learning_rate": 1.7357258833740637e-06, + "loss": 1.0645, + "step": 30402 + }, + { + "epoch": 0.78, + "learning_rate": 1.7357071424632034e-06, + "loss": 0.5676, + "step": 30403 + }, + { + "epoch": 0.78, + "learning_rate": 1.7356884009890465e-06, + "loss": 0.9717, + "step": 30404 + }, + { + "epoch": 0.78, + "learning_rate": 1.7356696589516064e-06, + "loss": 0.9316, + "step": 30405 + }, + { + "epoch": 0.78, + "learning_rate": 1.7356509163508978e-06, + "loss": 1.1523, + "step": 30406 + }, + { + "epoch": 0.78, + "learning_rate": 1.7356321731869354e-06, + "loss": 0.8955, + "step": 30407 + }, + { + "epoch": 0.78, + "learning_rate": 1.7356134294597333e-06, + "loss": 0.8975, + "step": 30408 + }, + { + "epoch": 0.78, + "learning_rate": 1.7355946851693054e-06, + "loss": 0.6885, + "step": 30409 + }, + { + "epoch": 0.78, + "learning_rate": 1.7355759403156669e-06, + "loss": 0.874, + "step": 30410 + }, + { + "epoch": 0.78, + "learning_rate": 1.7355571948988317e-06, + "loss": 0.9355, + "step": 30411 + }, + { + "epoch": 0.78, + "learning_rate": 1.735538448918814e-06, + "loss": 0.9609, + "step": 30412 + }, + { + "epoch": 0.78, + "learning_rate": 1.7355197023756282e-06, + "loss": 0.8965, + "step": 30413 + }, + { + "epoch": 0.78, + "learning_rate": 1.735500955269289e-06, + "loss": 0.9951, + "step": 30414 + }, + { + "epoch": 0.78, + "learning_rate": 1.7354822075998108e-06, + "loss": 0.8281, + "step": 30415 + }, + { + "epoch": 0.78, + "learning_rate": 1.7354634593672073e-06, + "loss": 0.9629, + "step": 30416 + }, + { + "epoch": 0.78, + "learning_rate": 1.7354447105714933e-06, + "loss": 0.7324, + "step": 30417 + }, + { + "epoch": 0.78, + "learning_rate": 1.7354259612126832e-06, + "loss": 0.7095, + "step": 30418 + }, + { + "epoch": 0.78, + "learning_rate": 1.7354072112907912e-06, + "loss": 0.7957, + "step": 30419 + }, + { + "epoch": 0.78, + "learning_rate": 1.7353884608058318e-06, + "loss": 0.9199, + "step": 30420 + }, + { + "epoch": 0.78, + "learning_rate": 1.735369709757819e-06, + "loss": 0.9746, + "step": 30421 + }, + { + "epoch": 0.78, + "learning_rate": 1.7353509581467676e-06, + "loss": 0.9316, + "step": 30422 + }, + { + "epoch": 0.78, + "learning_rate": 1.7353322059726917e-06, + "loss": 1.0078, + "step": 30423 + }, + { + "epoch": 0.78, + "learning_rate": 1.735313453235606e-06, + "loss": 0.6899, + "step": 30424 + }, + { + "epoch": 0.78, + "learning_rate": 1.7352946999355247e-06, + "loss": 0.7977, + "step": 30425 + }, + { + "epoch": 0.78, + "learning_rate": 1.7352759460724617e-06, + "loss": 0.7266, + "step": 30426 + }, + { + "epoch": 0.78, + "learning_rate": 1.7352571916464318e-06, + "loss": 0.8389, + "step": 30427 + }, + { + "epoch": 0.78, + "learning_rate": 1.7352384366574492e-06, + "loss": 0.9033, + "step": 30428 + }, + { + "epoch": 0.78, + "learning_rate": 1.7352196811055287e-06, + "loss": 0.7617, + "step": 30429 + }, + { + "epoch": 0.78, + "learning_rate": 1.735200924990684e-06, + "loss": 0.8818, + "step": 30430 + }, + { + "epoch": 0.78, + "learning_rate": 1.7351821683129298e-06, + "loss": 0.6753, + "step": 30431 + }, + { + "epoch": 0.78, + "learning_rate": 1.7351634110722801e-06, + "loss": 0.8887, + "step": 30432 + }, + { + "epoch": 0.78, + "learning_rate": 1.7351446532687502e-06, + "loss": 0.7773, + "step": 30433 + }, + { + "epoch": 0.78, + "learning_rate": 1.7351258949023536e-06, + "loss": 0.9092, + "step": 30434 + }, + { + "epoch": 0.78, + "learning_rate": 1.7351071359731043e-06, + "loss": 0.9736, + "step": 30435 + }, + { + "epoch": 0.78, + "learning_rate": 1.735088376481018e-06, + "loss": 0.7393, + "step": 30436 + }, + { + "epoch": 0.78, + "learning_rate": 1.735069616426108e-06, + "loss": 0.7231, + "step": 30437 + }, + { + "epoch": 0.78, + "learning_rate": 1.7350508558083892e-06, + "loss": 0.9727, + "step": 30438 + }, + { + "epoch": 0.78, + "learning_rate": 1.7350320946278757e-06, + "loss": 0.8271, + "step": 30439 + }, + { + "epoch": 0.78, + "learning_rate": 1.735013332884582e-06, + "loss": 0.7329, + "step": 30440 + }, + { + "epoch": 0.78, + "learning_rate": 1.7349945705785223e-06, + "loss": 0.7881, + "step": 30441 + }, + { + "epoch": 0.78, + "learning_rate": 1.734975807709711e-06, + "loss": 0.9746, + "step": 30442 + }, + { + "epoch": 0.78, + "learning_rate": 1.7349570442781624e-06, + "loss": 0.6055, + "step": 30443 + }, + { + "epoch": 0.78, + "learning_rate": 1.7349382802838912e-06, + "loss": 0.9287, + "step": 30444 + }, + { + "epoch": 0.78, + "learning_rate": 1.7349195157269117e-06, + "loss": 0.7637, + "step": 30445 + }, + { + "epoch": 0.78, + "learning_rate": 1.7349007506072378e-06, + "loss": 0.7705, + "step": 30446 + }, + { + "epoch": 0.78, + "learning_rate": 1.7348819849248844e-06, + "loss": 0.9512, + "step": 30447 + }, + { + "epoch": 0.78, + "learning_rate": 1.7348632186798656e-06, + "loss": 0.8486, + "step": 30448 + }, + { + "epoch": 0.78, + "learning_rate": 1.7348444518721958e-06, + "loss": 0.7852, + "step": 30449 + }, + { + "epoch": 0.78, + "learning_rate": 1.7348256845018894e-06, + "loss": 0.5398, + "step": 30450 + }, + { + "epoch": 0.78, + "learning_rate": 1.7348069165689607e-06, + "loss": 0.6875, + "step": 30451 + }, + { + "epoch": 0.78, + "learning_rate": 1.734788148073424e-06, + "loss": 1.1006, + "step": 30452 + }, + { + "epoch": 0.78, + "learning_rate": 1.7347693790152941e-06, + "loss": 0.9321, + "step": 30453 + }, + { + "epoch": 0.78, + "learning_rate": 1.734750609394585e-06, + "loss": 0.9775, + "step": 30454 + }, + { + "epoch": 0.78, + "learning_rate": 1.734731839211311e-06, + "loss": 0.9697, + "step": 30455 + }, + { + "epoch": 0.78, + "learning_rate": 1.7347130684654868e-06, + "loss": 0.9287, + "step": 30456 + }, + { + "epoch": 0.78, + "learning_rate": 1.7346942971571266e-06, + "loss": 0.6709, + "step": 30457 + }, + { + "epoch": 0.78, + "learning_rate": 1.7346755252862443e-06, + "loss": 0.5254, + "step": 30458 + }, + { + "epoch": 0.78, + "learning_rate": 1.7346567528528554e-06, + "loss": 0.5513, + "step": 30459 + }, + { + "epoch": 0.78, + "learning_rate": 1.734637979856973e-06, + "loss": 0.9453, + "step": 30460 + }, + { + "epoch": 0.78, + "learning_rate": 1.7346192062986124e-06, + "loss": 0.9609, + "step": 30461 + }, + { + "epoch": 0.78, + "learning_rate": 1.7346004321777875e-06, + "loss": 0.7346, + "step": 30462 + }, + { + "epoch": 0.78, + "learning_rate": 1.7345816574945132e-06, + "loss": 0.915, + "step": 30463 + }, + { + "epoch": 0.78, + "learning_rate": 1.7345628822488031e-06, + "loss": 0.9121, + "step": 30464 + }, + { + "epoch": 0.78, + "learning_rate": 1.7345441064406723e-06, + "loss": 0.8682, + "step": 30465 + }, + { + "epoch": 0.78, + "learning_rate": 1.7345253300701346e-06, + "loss": 0.9775, + "step": 30466 + }, + { + "epoch": 0.78, + "learning_rate": 1.7345065531372048e-06, + "loss": 0.9287, + "step": 30467 + }, + { + "epoch": 0.78, + "learning_rate": 1.734487775641897e-06, + "loss": 0.9219, + "step": 30468 + }, + { + "epoch": 0.78, + "learning_rate": 1.7344689975842255e-06, + "loss": 0.7517, + "step": 30469 + }, + { + "epoch": 0.78, + "learning_rate": 1.7344502189642053e-06, + "loss": 1.0527, + "step": 30470 + }, + { + "epoch": 0.78, + "learning_rate": 1.7344314397818498e-06, + "loss": 0.636, + "step": 30471 + }, + { + "epoch": 0.78, + "learning_rate": 1.7344126600371744e-06, + "loss": 0.8555, + "step": 30472 + }, + { + "epoch": 0.78, + "learning_rate": 1.734393879730193e-06, + "loss": 0.9053, + "step": 30473 + }, + { + "epoch": 0.78, + "learning_rate": 1.7343750988609196e-06, + "loss": 0.9199, + "step": 30474 + }, + { + "epoch": 0.78, + "learning_rate": 1.7343563174293692e-06, + "loss": 0.769, + "step": 30475 + }, + { + "epoch": 0.78, + "learning_rate": 1.7343375354355557e-06, + "loss": 0.8955, + "step": 30476 + }, + { + "epoch": 0.78, + "learning_rate": 1.734318752879494e-06, + "loss": 0.8574, + "step": 30477 + }, + { + "epoch": 0.78, + "learning_rate": 1.7342999697611979e-06, + "loss": 0.8267, + "step": 30478 + }, + { + "epoch": 0.78, + "learning_rate": 1.7342811860806824e-06, + "loss": 0.998, + "step": 30479 + }, + { + "epoch": 0.78, + "learning_rate": 1.7342624018379612e-06, + "loss": 0.7568, + "step": 30480 + }, + { + "epoch": 0.78, + "learning_rate": 1.7342436170330493e-06, + "loss": 0.6804, + "step": 30481 + }, + { + "epoch": 0.78, + "learning_rate": 1.7342248316659606e-06, + "loss": 0.8516, + "step": 30482 + }, + { + "epoch": 0.78, + "learning_rate": 1.7342060457367102e-06, + "loss": 0.9766, + "step": 30483 + }, + { + "epoch": 0.78, + "learning_rate": 1.7341872592453116e-06, + "loss": 1.1631, + "step": 30484 + }, + { + "epoch": 0.78, + "learning_rate": 1.7341684721917797e-06, + "loss": 0.8999, + "step": 30485 + }, + { + "epoch": 0.78, + "learning_rate": 1.7341496845761286e-06, + "loss": 0.8945, + "step": 30486 + }, + { + "epoch": 0.78, + "learning_rate": 1.7341308963983733e-06, + "loss": 0.9268, + "step": 30487 + }, + { + "epoch": 0.78, + "learning_rate": 1.734112107658527e-06, + "loss": 0.7632, + "step": 30488 + }, + { + "epoch": 0.78, + "learning_rate": 1.7340933183566053e-06, + "loss": 0.7451, + "step": 30489 + }, + { + "epoch": 0.78, + "learning_rate": 1.734074528492622e-06, + "loss": 0.791, + "step": 30490 + }, + { + "epoch": 0.78, + "learning_rate": 1.7340557380665916e-06, + "loss": 0.6831, + "step": 30491 + }, + { + "epoch": 0.78, + "learning_rate": 1.7340369470785286e-06, + "loss": 1.0508, + "step": 30492 + }, + { + "epoch": 0.78, + "learning_rate": 1.734018155528447e-06, + "loss": 0.9355, + "step": 30493 + }, + { + "epoch": 0.78, + "learning_rate": 1.7339993634163618e-06, + "loss": 0.8164, + "step": 30494 + }, + { + "epoch": 0.78, + "learning_rate": 1.7339805707422866e-06, + "loss": 0.7178, + "step": 30495 + }, + { + "epoch": 0.78, + "learning_rate": 1.7339617775062364e-06, + "loss": 0.9414, + "step": 30496 + }, + { + "epoch": 0.78, + "learning_rate": 1.7339429837082256e-06, + "loss": 0.8706, + "step": 30497 + }, + { + "epoch": 0.78, + "learning_rate": 1.7339241893482682e-06, + "loss": 0.8223, + "step": 30498 + }, + { + "epoch": 0.78, + "learning_rate": 1.7339053944263787e-06, + "loss": 0.9092, + "step": 30499 + }, + { + "epoch": 0.78, + "learning_rate": 1.7338865989425718e-06, + "loss": 0.8975, + "step": 30500 + }, + { + "epoch": 0.78, + "learning_rate": 1.7338678028968617e-06, + "loss": 0.8462, + "step": 30501 + }, + { + "epoch": 0.78, + "learning_rate": 1.7338490062892625e-06, + "loss": 0.8555, + "step": 30502 + }, + { + "epoch": 0.78, + "learning_rate": 1.7338302091197891e-06, + "loss": 0.7319, + "step": 30503 + }, + { + "epoch": 0.78, + "learning_rate": 1.7338114113884555e-06, + "loss": 0.8154, + "step": 30504 + }, + { + "epoch": 0.78, + "learning_rate": 1.7337926130952764e-06, + "loss": 0.8486, + "step": 30505 + }, + { + "epoch": 0.78, + "learning_rate": 1.733773814240266e-06, + "loss": 0.8848, + "step": 30506 + }, + { + "epoch": 0.78, + "learning_rate": 1.7337550148234387e-06, + "loss": 0.9111, + "step": 30507 + }, + { + "epoch": 0.78, + "learning_rate": 1.733736214844809e-06, + "loss": 0.6182, + "step": 30508 + }, + { + "epoch": 0.78, + "learning_rate": 1.7337174143043911e-06, + "loss": 0.8281, + "step": 30509 + }, + { + "epoch": 0.78, + "learning_rate": 1.7336986132021996e-06, + "loss": 0.9531, + "step": 30510 + }, + { + "epoch": 0.78, + "learning_rate": 1.7336798115382485e-06, + "loss": 0.8115, + "step": 30511 + }, + { + "epoch": 0.78, + "learning_rate": 1.733661009312553e-06, + "loss": 1.0127, + "step": 30512 + }, + { + "epoch": 0.78, + "learning_rate": 1.7336422065251268e-06, + "loss": 0.7402, + "step": 30513 + }, + { + "epoch": 0.78, + "learning_rate": 1.7336234031759841e-06, + "loss": 0.9121, + "step": 30514 + }, + { + "epoch": 0.78, + "learning_rate": 1.7336045992651402e-06, + "loss": 0.6697, + "step": 30515 + }, + { + "epoch": 0.78, + "learning_rate": 1.733585794792609e-06, + "loss": 0.9053, + "step": 30516 + }, + { + "epoch": 0.78, + "learning_rate": 1.7335669897584047e-06, + "loss": 0.9092, + "step": 30517 + }, + { + "epoch": 0.78, + "learning_rate": 1.733548184162542e-06, + "loss": 0.8135, + "step": 30518 + }, + { + "epoch": 0.78, + "learning_rate": 1.733529378005035e-06, + "loss": 0.8057, + "step": 30519 + }, + { + "epoch": 0.78, + "learning_rate": 1.7335105712858983e-06, + "loss": 0.9346, + "step": 30520 + }, + { + "epoch": 0.78, + "learning_rate": 1.7334917640051466e-06, + "loss": 0.8418, + "step": 30521 + }, + { + "epoch": 0.78, + "learning_rate": 1.7334729561627938e-06, + "loss": 0.8701, + "step": 30522 + }, + { + "epoch": 0.78, + "learning_rate": 1.7334541477588545e-06, + "loss": 1.0752, + "step": 30523 + }, + { + "epoch": 0.78, + "learning_rate": 1.7334353387933428e-06, + "loss": 0.7444, + "step": 30524 + }, + { + "epoch": 0.78, + "learning_rate": 1.7334165292662734e-06, + "loss": 0.7549, + "step": 30525 + }, + { + "epoch": 0.78, + "learning_rate": 1.733397719177661e-06, + "loss": 0.8662, + "step": 30526 + }, + { + "epoch": 0.78, + "learning_rate": 1.7333789085275198e-06, + "loss": 0.9736, + "step": 30527 + }, + { + "epoch": 0.78, + "learning_rate": 1.7333600973158637e-06, + "loss": 1.002, + "step": 30528 + }, + { + "epoch": 0.78, + "learning_rate": 1.7333412855427077e-06, + "loss": 0.8721, + "step": 30529 + }, + { + "epoch": 0.78, + "learning_rate": 1.7333224732080661e-06, + "loss": 0.7183, + "step": 30530 + }, + { + "epoch": 0.78, + "learning_rate": 1.7333036603119528e-06, + "loss": 1.3154, + "step": 30531 + }, + { + "epoch": 0.78, + "learning_rate": 1.733284846854383e-06, + "loss": 0.6633, + "step": 30532 + }, + { + "epoch": 0.78, + "learning_rate": 1.7332660328353708e-06, + "loss": 0.9033, + "step": 30533 + }, + { + "epoch": 0.78, + "learning_rate": 1.73324721825493e-06, + "loss": 0.7578, + "step": 30534 + }, + { + "epoch": 0.78, + "learning_rate": 1.733228403113076e-06, + "loss": 0.8159, + "step": 30535 + }, + { + "epoch": 0.78, + "learning_rate": 1.7332095874098224e-06, + "loss": 0.8262, + "step": 30536 + }, + { + "epoch": 0.78, + "learning_rate": 1.733190771145184e-06, + "loss": 0.7373, + "step": 30537 + }, + { + "epoch": 0.78, + "learning_rate": 1.7331719543191755e-06, + "loss": 0.875, + "step": 30538 + }, + { + "epoch": 0.78, + "learning_rate": 1.7331531369318104e-06, + "loss": 0.7832, + "step": 30539 + }, + { + "epoch": 0.78, + "learning_rate": 1.733134318983104e-06, + "loss": 1.0068, + "step": 30540 + }, + { + "epoch": 0.78, + "learning_rate": 1.73311550047307e-06, + "loss": 0.6387, + "step": 30541 + }, + { + "epoch": 0.78, + "learning_rate": 1.733096681401724e-06, + "loss": 0.4897, + "step": 30542 + }, + { + "epoch": 0.78, + "learning_rate": 1.7330778617690788e-06, + "loss": 0.9326, + "step": 30543 + }, + { + "epoch": 0.78, + "learning_rate": 1.7330590415751497e-06, + "loss": 0.7754, + "step": 30544 + }, + { + "epoch": 0.78, + "learning_rate": 1.7330402208199514e-06, + "loss": 0.7222, + "step": 30545 + }, + { + "epoch": 0.78, + "learning_rate": 1.7330213995034975e-06, + "loss": 0.5425, + "step": 30546 + }, + { + "epoch": 0.78, + "learning_rate": 1.733002577625803e-06, + "loss": 0.9404, + "step": 30547 + }, + { + "epoch": 0.78, + "learning_rate": 1.732983755186882e-06, + "loss": 0.8896, + "step": 30548 + }, + { + "epoch": 0.78, + "learning_rate": 1.732964932186749e-06, + "loss": 1.0615, + "step": 30549 + }, + { + "epoch": 0.78, + "learning_rate": 1.7329461086254188e-06, + "loss": 0.752, + "step": 30550 + }, + { + "epoch": 0.78, + "learning_rate": 1.7329272845029053e-06, + "loss": 0.9912, + "step": 30551 + }, + { + "epoch": 0.78, + "learning_rate": 1.7329084598192228e-06, + "loss": 0.915, + "step": 30552 + }, + { + "epoch": 0.78, + "learning_rate": 1.7328896345743864e-06, + "loss": 0.8042, + "step": 30553 + }, + { + "epoch": 0.78, + "learning_rate": 1.7328708087684096e-06, + "loss": 1.0801, + "step": 30554 + }, + { + "epoch": 0.78, + "learning_rate": 1.732851982401308e-06, + "loss": 0.9268, + "step": 30555 + }, + { + "epoch": 0.78, + "learning_rate": 1.7328331554730948e-06, + "loss": 0.7891, + "step": 30556 + }, + { + "epoch": 0.78, + "learning_rate": 1.7328143279837853e-06, + "loss": 0.958, + "step": 30557 + }, + { + "epoch": 0.78, + "learning_rate": 1.732795499933393e-06, + "loss": 0.8281, + "step": 30558 + }, + { + "epoch": 0.78, + "learning_rate": 1.7327766713219334e-06, + "loss": 0.9209, + "step": 30559 + }, + { + "epoch": 0.78, + "learning_rate": 1.7327578421494201e-06, + "loss": 0.8965, + "step": 30560 + }, + { + "epoch": 0.78, + "learning_rate": 1.7327390124158682e-06, + "loss": 0.8203, + "step": 30561 + }, + { + "epoch": 0.78, + "learning_rate": 1.7327201821212916e-06, + "loss": 0.8018, + "step": 30562 + }, + { + "epoch": 0.78, + "learning_rate": 1.7327013512657048e-06, + "loss": 1.082, + "step": 30563 + }, + { + "epoch": 0.78, + "learning_rate": 1.732682519849122e-06, + "loss": 0.6718, + "step": 30564 + }, + { + "epoch": 0.78, + "learning_rate": 1.7326636878715584e-06, + "loss": 0.5869, + "step": 30565 + }, + { + "epoch": 0.78, + "learning_rate": 1.7326448553330274e-06, + "loss": 0.8535, + "step": 30566 + }, + { + "epoch": 0.78, + "learning_rate": 1.732626022233544e-06, + "loss": 0.8374, + "step": 30567 + }, + { + "epoch": 0.78, + "learning_rate": 1.7326071885731228e-06, + "loss": 0.9932, + "step": 30568 + }, + { + "epoch": 0.78, + "learning_rate": 1.732588354351778e-06, + "loss": 0.7178, + "step": 30569 + }, + { + "epoch": 0.78, + "learning_rate": 1.7325695195695236e-06, + "loss": 0.6948, + "step": 30570 + }, + { + "epoch": 0.78, + "learning_rate": 1.7325506842263746e-06, + "loss": 0.8452, + "step": 30571 + }, + { + "epoch": 0.78, + "learning_rate": 1.7325318483223454e-06, + "loss": 0.8237, + "step": 30572 + }, + { + "epoch": 0.78, + "learning_rate": 1.73251301185745e-06, + "loss": 0.6733, + "step": 30573 + }, + { + "epoch": 0.78, + "learning_rate": 1.7324941748317033e-06, + "loss": 0.7646, + "step": 30574 + }, + { + "epoch": 0.78, + "learning_rate": 1.7324753372451192e-06, + "loss": 0.9355, + "step": 30575 + }, + { + "epoch": 0.78, + "learning_rate": 1.7324564990977127e-06, + "loss": 0.8018, + "step": 30576 + }, + { + "epoch": 0.78, + "learning_rate": 1.7324376603894977e-06, + "loss": 0.8105, + "step": 30577 + }, + { + "epoch": 0.78, + "learning_rate": 1.7324188211204889e-06, + "loss": 0.8164, + "step": 30578 + }, + { + "epoch": 0.78, + "learning_rate": 1.7323999812907006e-06, + "loss": 0.8276, + "step": 30579 + }, + { + "epoch": 0.78, + "learning_rate": 1.7323811409001475e-06, + "loss": 0.9834, + "step": 30580 + }, + { + "epoch": 0.78, + "learning_rate": 1.732362299948844e-06, + "loss": 0.9404, + "step": 30581 + }, + { + "epoch": 0.78, + "learning_rate": 1.732343458436804e-06, + "loss": 0.8856, + "step": 30582 + }, + { + "epoch": 0.78, + "learning_rate": 1.7323246163640425e-06, + "loss": 0.9883, + "step": 30583 + }, + { + "epoch": 0.78, + "learning_rate": 1.7323057737305737e-06, + "loss": 0.8076, + "step": 30584 + }, + { + "epoch": 0.78, + "learning_rate": 1.7322869305364121e-06, + "loss": 1.0283, + "step": 30585 + }, + { + "epoch": 0.78, + "learning_rate": 1.7322680867815719e-06, + "loss": 0.8428, + "step": 30586 + }, + { + "epoch": 0.78, + "learning_rate": 1.732249242466068e-06, + "loss": 0.7949, + "step": 30587 + }, + { + "epoch": 0.78, + "learning_rate": 1.7322303975899141e-06, + "loss": 0.7578, + "step": 30588 + }, + { + "epoch": 0.78, + "learning_rate": 1.7322115521531252e-06, + "loss": 0.958, + "step": 30589 + }, + { + "epoch": 0.78, + "learning_rate": 1.7321927061557155e-06, + "loss": 0.689, + "step": 30590 + }, + { + "epoch": 0.78, + "learning_rate": 1.7321738595977e-06, + "loss": 0.7959, + "step": 30591 + }, + { + "epoch": 0.78, + "learning_rate": 1.732155012479092e-06, + "loss": 0.686, + "step": 30592 + }, + { + "epoch": 0.78, + "learning_rate": 1.732136164799907e-06, + "loss": 0.8398, + "step": 30593 + }, + { + "epoch": 0.78, + "learning_rate": 1.7321173165601588e-06, + "loss": 1.126, + "step": 30594 + }, + { + "epoch": 0.78, + "learning_rate": 1.732098467759862e-06, + "loss": 0.5806, + "step": 30595 + }, + { + "epoch": 0.78, + "learning_rate": 1.7320796183990312e-06, + "loss": 0.9243, + "step": 30596 + }, + { + "epoch": 0.78, + "learning_rate": 1.7320607684776807e-06, + "loss": 0.7998, + "step": 30597 + }, + { + "epoch": 0.78, + "learning_rate": 1.7320419179958247e-06, + "loss": 0.7847, + "step": 30598 + }, + { + "epoch": 0.78, + "learning_rate": 1.732023066953478e-06, + "loss": 0.7148, + "step": 30599 + }, + { + "epoch": 0.78, + "learning_rate": 1.7320042153506554e-06, + "loss": 0.9365, + "step": 30600 + }, + { + "epoch": 0.78, + "learning_rate": 1.7319853631873703e-06, + "loss": 0.7783, + "step": 30601 + }, + { + "epoch": 0.78, + "learning_rate": 1.7319665104636378e-06, + "loss": 1.0088, + "step": 30602 + }, + { + "epoch": 0.78, + "learning_rate": 1.731947657179472e-06, + "loss": 0.8848, + "step": 30603 + }, + { + "epoch": 0.78, + "learning_rate": 1.7319288033348877e-06, + "loss": 0.8232, + "step": 30604 + }, + { + "epoch": 0.78, + "learning_rate": 1.7319099489298992e-06, + "loss": 0.7803, + "step": 30605 + }, + { + "epoch": 0.78, + "learning_rate": 1.7318910939645207e-06, + "loss": 0.8047, + "step": 30606 + }, + { + "epoch": 0.78, + "learning_rate": 1.7318722384387673e-06, + "loss": 0.8945, + "step": 30607 + }, + { + "epoch": 0.78, + "learning_rate": 1.7318533823526524e-06, + "loss": 0.7021, + "step": 30608 + }, + { + "epoch": 0.78, + "learning_rate": 1.7318345257061916e-06, + "loss": 0.7354, + "step": 30609 + }, + { + "epoch": 0.78, + "learning_rate": 1.7318156684993983e-06, + "loss": 1.1035, + "step": 30610 + }, + { + "epoch": 0.78, + "learning_rate": 1.7317968107322875e-06, + "loss": 0.9072, + "step": 30611 + }, + { + "epoch": 0.78, + "learning_rate": 1.7317779524048736e-06, + "loss": 1.0566, + "step": 30612 + }, + { + "epoch": 0.78, + "learning_rate": 1.7317590935171708e-06, + "loss": 0.707, + "step": 30613 + }, + { + "epoch": 0.78, + "learning_rate": 1.731740234069194e-06, + "loss": 0.9629, + "step": 30614 + }, + { + "epoch": 0.78, + "learning_rate": 1.731721374060957e-06, + "loss": 1.0205, + "step": 30615 + }, + { + "epoch": 0.78, + "learning_rate": 1.7317025134924749e-06, + "loss": 0.8296, + "step": 30616 + }, + { + "epoch": 0.78, + "learning_rate": 1.7316836523637618e-06, + "loss": 0.8252, + "step": 30617 + }, + { + "epoch": 0.78, + "learning_rate": 1.731664790674832e-06, + "loss": 0.9951, + "step": 30618 + }, + { + "epoch": 0.78, + "learning_rate": 1.7316459284257001e-06, + "loss": 0.874, + "step": 30619 + }, + { + "epoch": 0.78, + "learning_rate": 1.7316270656163807e-06, + "loss": 0.6406, + "step": 30620 + }, + { + "epoch": 0.78, + "learning_rate": 1.731608202246888e-06, + "loss": 0.8818, + "step": 30621 + }, + { + "epoch": 0.78, + "learning_rate": 1.7315893383172369e-06, + "loss": 0.9746, + "step": 30622 + }, + { + "epoch": 0.78, + "learning_rate": 1.731570473827441e-06, + "loss": 0.7412, + "step": 30623 + }, + { + "epoch": 0.78, + "learning_rate": 1.7315516087775156e-06, + "loss": 1.0381, + "step": 30624 + }, + { + "epoch": 0.78, + "learning_rate": 1.7315327431674744e-06, + "loss": 0.6729, + "step": 30625 + }, + { + "epoch": 0.78, + "learning_rate": 1.7315138769973326e-06, + "loss": 1.002, + "step": 30626 + }, + { + "epoch": 0.78, + "learning_rate": 1.7314950102671038e-06, + "loss": 1.1914, + "step": 30627 + }, + { + "epoch": 0.79, + "learning_rate": 1.7314761429768032e-06, + "loss": 0.8379, + "step": 30628 + }, + { + "epoch": 0.79, + "learning_rate": 1.7314572751264448e-06, + "loss": 0.8652, + "step": 30629 + }, + { + "epoch": 0.79, + "learning_rate": 1.7314384067160434e-06, + "loss": 0.8247, + "step": 30630 + }, + { + "epoch": 0.79, + "learning_rate": 1.7314195377456131e-06, + "loss": 0.6304, + "step": 30631 + }, + { + "epoch": 0.79, + "learning_rate": 1.7314006682151688e-06, + "loss": 0.8838, + "step": 30632 + }, + { + "epoch": 0.79, + "learning_rate": 1.7313817981247242e-06, + "loss": 0.7842, + "step": 30633 + }, + { + "epoch": 0.79, + "learning_rate": 1.7313629274742946e-06, + "loss": 0.8135, + "step": 30634 + }, + { + "epoch": 0.79, + "learning_rate": 1.7313440562638935e-06, + "loss": 0.8188, + "step": 30635 + }, + { + "epoch": 0.79, + "learning_rate": 1.7313251844935364e-06, + "loss": 0.6675, + "step": 30636 + }, + { + "epoch": 0.79, + "learning_rate": 1.7313063121632369e-06, + "loss": 0.7959, + "step": 30637 + }, + { + "epoch": 0.79, + "learning_rate": 1.7312874392730099e-06, + "loss": 0.6084, + "step": 30638 + }, + { + "epoch": 0.79, + "learning_rate": 1.7312685658228697e-06, + "loss": 0.7371, + "step": 30639 + }, + { + "epoch": 0.79, + "learning_rate": 1.7312496918128308e-06, + "loss": 0.8535, + "step": 30640 + }, + { + "epoch": 0.79, + "learning_rate": 1.7312308172429076e-06, + "loss": 0.7988, + "step": 30641 + }, + { + "epoch": 0.79, + "learning_rate": 1.7312119421131146e-06, + "loss": 0.7402, + "step": 30642 + }, + { + "epoch": 0.79, + "learning_rate": 1.7311930664234664e-06, + "loss": 0.9268, + "step": 30643 + }, + { + "epoch": 0.79, + "learning_rate": 1.7311741901739772e-06, + "loss": 0.8018, + "step": 30644 + }, + { + "epoch": 0.79, + "learning_rate": 1.7311553133646615e-06, + "loss": 0.8467, + "step": 30645 + }, + { + "epoch": 0.79, + "learning_rate": 1.7311364359955337e-06, + "loss": 0.7932, + "step": 30646 + }, + { + "epoch": 0.79, + "learning_rate": 1.7311175580666085e-06, + "loss": 0.8853, + "step": 30647 + }, + { + "epoch": 0.79, + "learning_rate": 1.7310986795779003e-06, + "loss": 0.8682, + "step": 30648 + }, + { + "epoch": 0.79, + "learning_rate": 1.7310798005294234e-06, + "loss": 0.7578, + "step": 30649 + }, + { + "epoch": 0.79, + "learning_rate": 1.7310609209211919e-06, + "loss": 0.9893, + "step": 30650 + }, + { + "epoch": 0.79, + "learning_rate": 1.7310420407532211e-06, + "loss": 1.0547, + "step": 30651 + }, + { + "epoch": 0.79, + "learning_rate": 1.731023160025525e-06, + "loss": 0.9307, + "step": 30652 + }, + { + "epoch": 0.79, + "learning_rate": 1.7310042787381182e-06, + "loss": 0.8369, + "step": 30653 + }, + { + "epoch": 0.79, + "learning_rate": 1.7309853968910147e-06, + "loss": 0.9434, + "step": 30654 + }, + { + "epoch": 0.79, + "learning_rate": 1.7309665144842294e-06, + "loss": 0.8984, + "step": 30655 + }, + { + "epoch": 0.79, + "learning_rate": 1.7309476315177767e-06, + "loss": 0.9951, + "step": 30656 + }, + { + "epoch": 0.79, + "learning_rate": 1.7309287479916708e-06, + "loss": 0.6865, + "step": 30657 + }, + { + "epoch": 0.79, + "learning_rate": 1.7309098639059268e-06, + "loss": 0.8862, + "step": 30658 + }, + { + "epoch": 0.79, + "learning_rate": 1.7308909792605584e-06, + "loss": 0.9023, + "step": 30659 + }, + { + "epoch": 0.79, + "learning_rate": 1.7308720940555804e-06, + "loss": 0.5674, + "step": 30660 + }, + { + "epoch": 0.79, + "learning_rate": 1.7308532082910072e-06, + "loss": 0.9004, + "step": 30661 + }, + { + "epoch": 0.79, + "learning_rate": 1.7308343219668535e-06, + "loss": 0.9258, + "step": 30662 + }, + { + "epoch": 0.79, + "learning_rate": 1.7308154350831337e-06, + "loss": 0.7988, + "step": 30663 + }, + { + "epoch": 0.79, + "learning_rate": 1.730796547639862e-06, + "loss": 0.9365, + "step": 30664 + }, + { + "epoch": 0.79, + "learning_rate": 1.7307776596370526e-06, + "loss": 0.9473, + "step": 30665 + }, + { + "epoch": 0.79, + "learning_rate": 1.7307587710747207e-06, + "loss": 1.0078, + "step": 30666 + }, + { + "epoch": 0.79, + "learning_rate": 1.7307398819528802e-06, + "loss": 0.9219, + "step": 30667 + }, + { + "epoch": 0.79, + "learning_rate": 1.730720992271546e-06, + "loss": 0.7881, + "step": 30668 + }, + { + "epoch": 0.79, + "learning_rate": 1.7307021020307325e-06, + "loss": 0.8232, + "step": 30669 + }, + { + "epoch": 0.79, + "learning_rate": 1.7306832112304535e-06, + "loss": 0.9795, + "step": 30670 + }, + { + "epoch": 0.79, + "learning_rate": 1.7306643198707243e-06, + "loss": 0.7393, + "step": 30671 + }, + { + "epoch": 0.79, + "learning_rate": 1.730645427951559e-06, + "loss": 0.9336, + "step": 30672 + }, + { + "epoch": 0.79, + "learning_rate": 1.7306265354729722e-06, + "loss": 0.5161, + "step": 30673 + }, + { + "epoch": 0.79, + "learning_rate": 1.730607642434978e-06, + "loss": 0.7217, + "step": 30674 + }, + { + "epoch": 0.79, + "learning_rate": 1.730588748837591e-06, + "loss": 0.998, + "step": 30675 + }, + { + "epoch": 0.79, + "learning_rate": 1.7305698546808261e-06, + "loss": 1.0957, + "step": 30676 + }, + { + "epoch": 0.79, + "learning_rate": 1.7305509599646976e-06, + "loss": 0.9785, + "step": 30677 + }, + { + "epoch": 0.79, + "learning_rate": 1.7305320646892193e-06, + "loss": 0.8037, + "step": 30678 + }, + { + "epoch": 0.79, + "learning_rate": 1.7305131688544065e-06, + "loss": 0.8936, + "step": 30679 + }, + { + "epoch": 0.79, + "learning_rate": 1.7304942724602734e-06, + "loss": 0.9551, + "step": 30680 + }, + { + "epoch": 0.79, + "learning_rate": 1.7304753755068342e-06, + "loss": 0.8755, + "step": 30681 + }, + { + "epoch": 0.79, + "learning_rate": 1.7304564779941039e-06, + "loss": 0.8535, + "step": 30682 + }, + { + "epoch": 0.79, + "learning_rate": 1.7304375799220962e-06, + "loss": 0.9248, + "step": 30683 + }, + { + "epoch": 0.79, + "learning_rate": 1.7304186812908265e-06, + "loss": 0.915, + "step": 30684 + }, + { + "epoch": 0.79, + "learning_rate": 1.7303997821003086e-06, + "loss": 0.9404, + "step": 30685 + }, + { + "epoch": 0.79, + "learning_rate": 1.7303808823505572e-06, + "loss": 0.8135, + "step": 30686 + }, + { + "epoch": 0.79, + "learning_rate": 1.730361982041587e-06, + "loss": 0.8438, + "step": 30687 + }, + { + "epoch": 0.79, + "learning_rate": 1.7303430811734119e-06, + "loss": 0.6401, + "step": 30688 + }, + { + "epoch": 0.79, + "learning_rate": 1.7303241797460468e-06, + "loss": 0.9736, + "step": 30689 + }, + { + "epoch": 0.79, + "learning_rate": 1.730305277759506e-06, + "loss": 0.7427, + "step": 30690 + }, + { + "epoch": 0.79, + "learning_rate": 1.730286375213804e-06, + "loss": 0.6758, + "step": 30691 + }, + { + "epoch": 0.79, + "learning_rate": 1.7302674721089555e-06, + "loss": 0.8867, + "step": 30692 + }, + { + "epoch": 0.79, + "learning_rate": 1.7302485684449745e-06, + "loss": 0.8105, + "step": 30693 + }, + { + "epoch": 0.79, + "learning_rate": 1.7302296642218758e-06, + "loss": 0.959, + "step": 30694 + }, + { + "epoch": 0.79, + "learning_rate": 1.7302107594396738e-06, + "loss": 1.0459, + "step": 30695 + }, + { + "epoch": 0.79, + "learning_rate": 1.7301918540983832e-06, + "loss": 0.7739, + "step": 30696 + }, + { + "epoch": 0.79, + "learning_rate": 1.7301729481980182e-06, + "loss": 0.8809, + "step": 30697 + }, + { + "epoch": 0.79, + "learning_rate": 1.730154041738593e-06, + "loss": 0.7354, + "step": 30698 + }, + { + "epoch": 0.79, + "learning_rate": 1.7301351347201232e-06, + "loss": 0.8906, + "step": 30699 + }, + { + "epoch": 0.79, + "learning_rate": 1.7301162271426218e-06, + "loss": 0.7607, + "step": 30700 + }, + { + "epoch": 0.79, + "learning_rate": 1.7300973190061044e-06, + "loss": 0.7153, + "step": 30701 + }, + { + "epoch": 0.79, + "learning_rate": 1.7300784103105847e-06, + "loss": 0.9541, + "step": 30702 + }, + { + "epoch": 0.79, + "learning_rate": 1.7300595010560777e-06, + "loss": 0.8428, + "step": 30703 + }, + { + "epoch": 0.79, + "learning_rate": 1.7300405912425978e-06, + "loss": 0.8223, + "step": 30704 + }, + { + "epoch": 0.79, + "learning_rate": 1.730021680870159e-06, + "loss": 0.9473, + "step": 30705 + }, + { + "epoch": 0.79, + "learning_rate": 1.7300027699387765e-06, + "loss": 0.8545, + "step": 30706 + }, + { + "epoch": 0.79, + "learning_rate": 1.7299838584484644e-06, + "loss": 0.7676, + "step": 30707 + }, + { + "epoch": 0.79, + "learning_rate": 1.7299649463992374e-06, + "loss": 1.1797, + "step": 30708 + }, + { + "epoch": 0.79, + "learning_rate": 1.7299460337911097e-06, + "loss": 0.7607, + "step": 30709 + }, + { + "epoch": 0.79, + "learning_rate": 1.7299271206240954e-06, + "loss": 0.7832, + "step": 30710 + }, + { + "epoch": 0.79, + "learning_rate": 1.7299082068982101e-06, + "loss": 0.8047, + "step": 30711 + }, + { + "epoch": 0.79, + "learning_rate": 1.7298892926134677e-06, + "loss": 0.7607, + "step": 30712 + }, + { + "epoch": 0.79, + "learning_rate": 1.729870377769882e-06, + "loss": 0.9463, + "step": 30713 + }, + { + "epoch": 0.79, + "learning_rate": 1.7298514623674688e-06, + "loss": 0.8525, + "step": 30714 + }, + { + "epoch": 0.79, + "learning_rate": 1.7298325464062415e-06, + "loss": 0.9541, + "step": 30715 + }, + { + "epoch": 0.79, + "learning_rate": 1.729813629886215e-06, + "loss": 0.8672, + "step": 30716 + }, + { + "epoch": 0.79, + "learning_rate": 1.7297947128074037e-06, + "loss": 1.0127, + "step": 30717 + }, + { + "epoch": 0.79, + "learning_rate": 1.7297757951698224e-06, + "loss": 0.8555, + "step": 30718 + }, + { + "epoch": 0.79, + "learning_rate": 1.729756876973485e-06, + "loss": 0.8232, + "step": 30719 + }, + { + "epoch": 0.79, + "learning_rate": 1.7297379582184066e-06, + "loss": 0.9443, + "step": 30720 + }, + { + "epoch": 0.79, + "learning_rate": 1.7297190389046013e-06, + "loss": 0.8086, + "step": 30721 + }, + { + "epoch": 0.79, + "learning_rate": 1.7297001190320837e-06, + "loss": 0.6499, + "step": 30722 + }, + { + "epoch": 0.79, + "learning_rate": 1.7296811986008681e-06, + "loss": 0.7642, + "step": 30723 + }, + { + "epoch": 0.79, + "learning_rate": 1.7296622776109695e-06, + "loss": 0.8613, + "step": 30724 + }, + { + "epoch": 0.79, + "learning_rate": 1.7296433560624018e-06, + "loss": 0.7678, + "step": 30725 + }, + { + "epoch": 0.79, + "learning_rate": 1.7296244339551797e-06, + "loss": 0.6841, + "step": 30726 + }, + { + "epoch": 0.79, + "learning_rate": 1.7296055112893178e-06, + "loss": 0.835, + "step": 30727 + }, + { + "epoch": 0.79, + "learning_rate": 1.7295865880648304e-06, + "loss": 0.9883, + "step": 30728 + }, + { + "epoch": 0.79, + "learning_rate": 1.7295676642817324e-06, + "loss": 0.917, + "step": 30729 + }, + { + "epoch": 0.79, + "learning_rate": 1.7295487399400376e-06, + "loss": 1.0215, + "step": 30730 + }, + { + "epoch": 0.79, + "learning_rate": 1.7295298150397612e-06, + "loss": 0.5799, + "step": 30731 + }, + { + "epoch": 0.79, + "learning_rate": 1.7295108895809171e-06, + "loss": 0.9072, + "step": 30732 + }, + { + "epoch": 0.79, + "learning_rate": 1.7294919635635203e-06, + "loss": 0.9473, + "step": 30733 + }, + { + "epoch": 0.79, + "learning_rate": 1.7294730369875849e-06, + "loss": 0.9014, + "step": 30734 + }, + { + "epoch": 0.79, + "learning_rate": 1.7294541098531256e-06, + "loss": 0.7461, + "step": 30735 + }, + { + "epoch": 0.79, + "learning_rate": 1.7294351821601566e-06, + "loss": 0.6836, + "step": 30736 + }, + { + "epoch": 0.79, + "learning_rate": 1.7294162539086932e-06, + "loss": 0.6914, + "step": 30737 + }, + { + "epoch": 0.79, + "learning_rate": 1.7293973250987488e-06, + "loss": 0.9395, + "step": 30738 + }, + { + "epoch": 0.79, + "learning_rate": 1.7293783957303387e-06, + "loss": 0.6709, + "step": 30739 + }, + { + "epoch": 0.79, + "learning_rate": 1.7293594658034768e-06, + "loss": 0.7412, + "step": 30740 + }, + { + "epoch": 0.79, + "learning_rate": 1.729340535318178e-06, + "loss": 1.0283, + "step": 30741 + }, + { + "epoch": 0.79, + "learning_rate": 1.7293216042744568e-06, + "loss": 1.0615, + "step": 30742 + }, + { + "epoch": 0.79, + "learning_rate": 1.7293026726723276e-06, + "loss": 1.0049, + "step": 30743 + }, + { + "epoch": 0.79, + "learning_rate": 1.7292837405118048e-06, + "loss": 0.8662, + "step": 30744 + }, + { + "epoch": 0.79, + "learning_rate": 1.729264807792903e-06, + "loss": 0.8394, + "step": 30745 + }, + { + "epoch": 0.79, + "learning_rate": 1.7292458745156365e-06, + "loss": 0.8701, + "step": 30746 + }, + { + "epoch": 0.79, + "learning_rate": 1.72922694068002e-06, + "loss": 0.8379, + "step": 30747 + }, + { + "epoch": 0.79, + "learning_rate": 1.7292080062860681e-06, + "loss": 0.8882, + "step": 30748 + }, + { + "epoch": 0.79, + "learning_rate": 1.729189071333795e-06, + "loss": 0.6709, + "step": 30749 + }, + { + "epoch": 0.79, + "learning_rate": 1.7291701358232155e-06, + "loss": 0.9414, + "step": 30750 + }, + { + "epoch": 0.79, + "learning_rate": 1.729151199754344e-06, + "loss": 0.9365, + "step": 30751 + }, + { + "epoch": 0.79, + "learning_rate": 1.729132263127195e-06, + "loss": 0.6064, + "step": 30752 + }, + { + "epoch": 0.79, + "learning_rate": 1.7291133259417827e-06, + "loss": 0.8164, + "step": 30753 + }, + { + "epoch": 0.79, + "learning_rate": 1.7290943881981221e-06, + "loss": 0.7495, + "step": 30754 + }, + { + "epoch": 0.79, + "learning_rate": 1.7290754498962272e-06, + "loss": 1.1338, + "step": 30755 + }, + { + "epoch": 0.79, + "learning_rate": 1.7290565110361128e-06, + "loss": 0.9697, + "step": 30756 + }, + { + "epoch": 0.79, + "learning_rate": 1.7290375716177938e-06, + "loss": 0.9658, + "step": 30757 + }, + { + "epoch": 0.79, + "learning_rate": 1.7290186316412838e-06, + "loss": 0.917, + "step": 30758 + }, + { + "epoch": 0.79, + "learning_rate": 1.7289996911065977e-06, + "loss": 0.7979, + "step": 30759 + }, + { + "epoch": 0.79, + "learning_rate": 1.7289807500137502e-06, + "loss": 1.0078, + "step": 30760 + }, + { + "epoch": 0.79, + "learning_rate": 1.7289618083627557e-06, + "loss": 0.7764, + "step": 30761 + }, + { + "epoch": 0.79, + "learning_rate": 1.7289428661536286e-06, + "loss": 0.7451, + "step": 30762 + }, + { + "epoch": 0.79, + "learning_rate": 1.7289239233863838e-06, + "loss": 0.7949, + "step": 30763 + }, + { + "epoch": 0.79, + "learning_rate": 1.728904980061035e-06, + "loss": 0.8408, + "step": 30764 + }, + { + "epoch": 0.79, + "learning_rate": 1.7288860361775974e-06, + "loss": 0.9346, + "step": 30765 + }, + { + "epoch": 0.79, + "learning_rate": 1.728867091736085e-06, + "loss": 0.7803, + "step": 30766 + }, + { + "epoch": 0.79, + "learning_rate": 1.728848146736513e-06, + "loss": 0.8271, + "step": 30767 + }, + { + "epoch": 0.79, + "learning_rate": 1.7288292011788955e-06, + "loss": 0.9258, + "step": 30768 + }, + { + "epoch": 0.79, + "learning_rate": 1.7288102550632466e-06, + "loss": 0.7881, + "step": 30769 + }, + { + "epoch": 0.79, + "learning_rate": 1.728791308389581e-06, + "loss": 0.8535, + "step": 30770 + }, + { + "epoch": 0.79, + "learning_rate": 1.7287723611579141e-06, + "loss": 0.9434, + "step": 30771 + }, + { + "epoch": 0.79, + "learning_rate": 1.7287534133682594e-06, + "loss": 1.1094, + "step": 30772 + }, + { + "epoch": 0.79, + "learning_rate": 1.7287344650206317e-06, + "loss": 0.8115, + "step": 30773 + }, + { + "epoch": 0.79, + "learning_rate": 1.7287155161150455e-06, + "loss": 0.9668, + "step": 30774 + }, + { + "epoch": 0.79, + "learning_rate": 1.7286965666515154e-06, + "loss": 0.7739, + "step": 30775 + }, + { + "epoch": 0.79, + "learning_rate": 1.7286776166300557e-06, + "loss": 0.7461, + "step": 30776 + }, + { + "epoch": 0.79, + "learning_rate": 1.7286586660506814e-06, + "loss": 0.8396, + "step": 30777 + }, + { + "epoch": 0.79, + "learning_rate": 1.7286397149134064e-06, + "loss": 1.3643, + "step": 30778 + }, + { + "epoch": 0.79, + "learning_rate": 1.7286207632182455e-06, + "loss": 0.3237, + "step": 30779 + }, + { + "epoch": 0.79, + "learning_rate": 1.7286018109652132e-06, + "loss": 0.8613, + "step": 30780 + }, + { + "epoch": 0.79, + "learning_rate": 1.7285828581543238e-06, + "loss": 0.9844, + "step": 30781 + }, + { + "epoch": 0.79, + "learning_rate": 1.7285639047855923e-06, + "loss": 0.9209, + "step": 30782 + }, + { + "epoch": 0.79, + "learning_rate": 1.7285449508590331e-06, + "loss": 0.6904, + "step": 30783 + }, + { + "epoch": 0.79, + "learning_rate": 1.7285259963746602e-06, + "loss": 0.7217, + "step": 30784 + }, + { + "epoch": 0.79, + "learning_rate": 1.7285070413324885e-06, + "loss": 0.8623, + "step": 30785 + }, + { + "epoch": 0.79, + "learning_rate": 1.7284880857325324e-06, + "loss": 0.7988, + "step": 30786 + }, + { + "epoch": 0.79, + "learning_rate": 1.7284691295748065e-06, + "loss": 0.7505, + "step": 30787 + }, + { + "epoch": 0.79, + "learning_rate": 1.7284501728593252e-06, + "loss": 0.9697, + "step": 30788 + }, + { + "epoch": 0.79, + "learning_rate": 1.7284312155861033e-06, + "loss": 0.5938, + "step": 30789 + }, + { + "epoch": 0.79, + "learning_rate": 1.728412257755155e-06, + "loss": 0.9629, + "step": 30790 + }, + { + "epoch": 0.79, + "learning_rate": 1.7283932993664948e-06, + "loss": 0.7476, + "step": 30791 + }, + { + "epoch": 0.79, + "learning_rate": 1.7283743404201374e-06, + "loss": 0.833, + "step": 30792 + }, + { + "epoch": 0.79, + "learning_rate": 1.7283553809160974e-06, + "loss": 0.7886, + "step": 30793 + }, + { + "epoch": 0.79, + "learning_rate": 1.7283364208543892e-06, + "loss": 0.7654, + "step": 30794 + }, + { + "epoch": 0.79, + "learning_rate": 1.7283174602350271e-06, + "loss": 0.8564, + "step": 30795 + }, + { + "epoch": 0.79, + "learning_rate": 1.728298499058026e-06, + "loss": 0.8252, + "step": 30796 + }, + { + "epoch": 0.79, + "learning_rate": 1.7282795373234002e-06, + "loss": 0.7617, + "step": 30797 + }, + { + "epoch": 0.79, + "learning_rate": 1.728260575031164e-06, + "loss": 1.0146, + "step": 30798 + }, + { + "epoch": 0.79, + "learning_rate": 1.7282416121813326e-06, + "loss": 0.7578, + "step": 30799 + }, + { + "epoch": 0.79, + "learning_rate": 1.72822264877392e-06, + "loss": 0.7676, + "step": 30800 + }, + { + "epoch": 0.79, + "learning_rate": 1.7282036848089404e-06, + "loss": 0.8965, + "step": 30801 + }, + { + "epoch": 0.79, + "learning_rate": 1.728184720286409e-06, + "loss": 0.9629, + "step": 30802 + }, + { + "epoch": 0.79, + "learning_rate": 1.72816575520634e-06, + "loss": 0.667, + "step": 30803 + }, + { + "epoch": 0.79, + "learning_rate": 1.7281467895687481e-06, + "loss": 0.9229, + "step": 30804 + }, + { + "epoch": 0.79, + "learning_rate": 1.7281278233736477e-06, + "loss": 0.9121, + "step": 30805 + }, + { + "epoch": 0.79, + "learning_rate": 1.7281088566210528e-06, + "loss": 0.7524, + "step": 30806 + }, + { + "epoch": 0.79, + "learning_rate": 1.728089889310979e-06, + "loss": 0.8926, + "step": 30807 + }, + { + "epoch": 0.79, + "learning_rate": 1.7280709214434398e-06, + "loss": 0.7563, + "step": 30808 + }, + { + "epoch": 0.79, + "learning_rate": 1.7280519530184506e-06, + "loss": 0.8652, + "step": 30809 + }, + { + "epoch": 0.79, + "learning_rate": 1.7280329840360252e-06, + "loss": 1.0264, + "step": 30810 + }, + { + "epoch": 0.79, + "learning_rate": 1.7280140144961788e-06, + "loss": 0.9258, + "step": 30811 + }, + { + "epoch": 0.79, + "learning_rate": 1.7279950443989252e-06, + "loss": 0.9375, + "step": 30812 + }, + { + "epoch": 0.79, + "learning_rate": 1.7279760737442795e-06, + "loss": 0.9346, + "step": 30813 + }, + { + "epoch": 0.79, + "learning_rate": 1.7279571025322554e-06, + "loss": 0.9365, + "step": 30814 + }, + { + "epoch": 0.79, + "learning_rate": 1.7279381307628686e-06, + "loss": 0.7412, + "step": 30815 + }, + { + "epoch": 0.79, + "learning_rate": 1.727919158436133e-06, + "loss": 0.8342, + "step": 30816 + }, + { + "epoch": 0.79, + "learning_rate": 1.727900185552063e-06, + "loss": 0.9189, + "step": 30817 + }, + { + "epoch": 0.79, + "learning_rate": 1.7278812121106734e-06, + "loss": 0.7227, + "step": 30818 + }, + { + "epoch": 0.79, + "learning_rate": 1.7278622381119784e-06, + "loss": 0.7285, + "step": 30819 + }, + { + "epoch": 0.79, + "learning_rate": 1.727843263555993e-06, + "loss": 1.1104, + "step": 30820 + }, + { + "epoch": 0.79, + "learning_rate": 1.7278242884427316e-06, + "loss": 0.8984, + "step": 30821 + }, + { + "epoch": 0.79, + "learning_rate": 1.7278053127722086e-06, + "loss": 0.8809, + "step": 30822 + }, + { + "epoch": 0.79, + "learning_rate": 1.727786336544438e-06, + "loss": 0.7734, + "step": 30823 + }, + { + "epoch": 0.79, + "learning_rate": 1.7277673597594356e-06, + "loss": 0.7505, + "step": 30824 + }, + { + "epoch": 0.79, + "learning_rate": 1.7277483824172147e-06, + "loss": 0.8125, + "step": 30825 + }, + { + "epoch": 0.79, + "learning_rate": 1.7277294045177903e-06, + "loss": 0.8115, + "step": 30826 + }, + { + "epoch": 0.79, + "learning_rate": 1.7277104260611773e-06, + "loss": 0.8604, + "step": 30827 + }, + { + "epoch": 0.79, + "learning_rate": 1.7276914470473898e-06, + "loss": 0.6641, + "step": 30828 + }, + { + "epoch": 0.79, + "learning_rate": 1.7276724674764422e-06, + "loss": 1.0703, + "step": 30829 + }, + { + "epoch": 0.79, + "learning_rate": 1.7276534873483492e-06, + "loss": 0.6675, + "step": 30830 + }, + { + "epoch": 0.79, + "learning_rate": 1.7276345066631258e-06, + "loss": 0.8984, + "step": 30831 + }, + { + "epoch": 0.79, + "learning_rate": 1.7276155254207857e-06, + "loss": 0.998, + "step": 30832 + }, + { + "epoch": 0.79, + "learning_rate": 1.727596543621344e-06, + "loss": 1.1318, + "step": 30833 + }, + { + "epoch": 0.79, + "learning_rate": 1.7275775612648151e-06, + "loss": 0.7549, + "step": 30834 + }, + { + "epoch": 0.79, + "learning_rate": 1.7275585783512136e-06, + "loss": 0.8301, + "step": 30835 + }, + { + "epoch": 0.79, + "learning_rate": 1.7275395948805539e-06, + "loss": 0.8984, + "step": 30836 + }, + { + "epoch": 0.79, + "learning_rate": 1.7275206108528506e-06, + "loss": 0.915, + "step": 30837 + }, + { + "epoch": 0.79, + "learning_rate": 1.727501626268118e-06, + "loss": 0.8535, + "step": 30838 + }, + { + "epoch": 0.79, + "learning_rate": 1.7274826411263712e-06, + "loss": 0.6948, + "step": 30839 + }, + { + "epoch": 0.79, + "learning_rate": 1.7274636554276243e-06, + "loss": 0.9629, + "step": 30840 + }, + { + "epoch": 0.79, + "learning_rate": 1.727444669171892e-06, + "loss": 0.8662, + "step": 30841 + }, + { + "epoch": 0.79, + "learning_rate": 1.7274256823591883e-06, + "loss": 0.5795, + "step": 30842 + }, + { + "epoch": 0.79, + "learning_rate": 1.7274066949895288e-06, + "loss": 0.7158, + "step": 30843 + }, + { + "epoch": 0.79, + "learning_rate": 1.727387707062927e-06, + "loss": 0.8926, + "step": 30844 + }, + { + "epoch": 0.79, + "learning_rate": 1.7273687185793978e-06, + "loss": 0.9131, + "step": 30845 + }, + { + "epoch": 0.79, + "learning_rate": 1.7273497295389563e-06, + "loss": 0.9062, + "step": 30846 + }, + { + "epoch": 0.79, + "learning_rate": 1.7273307399416162e-06, + "loss": 0.9111, + "step": 30847 + }, + { + "epoch": 0.79, + "learning_rate": 1.7273117497873926e-06, + "loss": 0.917, + "step": 30848 + }, + { + "epoch": 0.79, + "learning_rate": 1.7272927590762997e-06, + "loss": 0.8555, + "step": 30849 + }, + { + "epoch": 0.79, + "learning_rate": 1.7272737678083521e-06, + "loss": 0.6226, + "step": 30850 + }, + { + "epoch": 0.79, + "learning_rate": 1.7272547759835646e-06, + "loss": 0.8052, + "step": 30851 + }, + { + "epoch": 0.79, + "learning_rate": 1.7272357836019516e-06, + "loss": 0.8379, + "step": 30852 + }, + { + "epoch": 0.79, + "learning_rate": 1.7272167906635276e-06, + "loss": 0.8438, + "step": 30853 + }, + { + "epoch": 0.79, + "learning_rate": 1.7271977971683073e-06, + "loss": 1.0205, + "step": 30854 + }, + { + "epoch": 0.79, + "learning_rate": 1.7271788031163044e-06, + "loss": 0.9951, + "step": 30855 + }, + { + "epoch": 0.79, + "learning_rate": 1.7271598085075348e-06, + "loss": 0.6318, + "step": 30856 + }, + { + "epoch": 0.79, + "learning_rate": 1.727140813342012e-06, + "loss": 0.5947, + "step": 30857 + }, + { + "epoch": 0.79, + "learning_rate": 1.7271218176197511e-06, + "loss": 0.6785, + "step": 30858 + }, + { + "epoch": 0.79, + "learning_rate": 1.7271028213407663e-06, + "loss": 1.0205, + "step": 30859 + }, + { + "epoch": 0.79, + "learning_rate": 1.7270838245050725e-06, + "loss": 0.834, + "step": 30860 + }, + { + "epoch": 0.79, + "learning_rate": 1.727064827112684e-06, + "loss": 0.7422, + "step": 30861 + }, + { + "epoch": 0.79, + "learning_rate": 1.7270458291636153e-06, + "loss": 0.9854, + "step": 30862 + }, + { + "epoch": 0.79, + "learning_rate": 1.727026830657881e-06, + "loss": 0.7017, + "step": 30863 + }, + { + "epoch": 0.79, + "learning_rate": 1.727007831595496e-06, + "loss": 0.9648, + "step": 30864 + }, + { + "epoch": 0.79, + "learning_rate": 1.726988831976474e-06, + "loss": 0.9546, + "step": 30865 + }, + { + "epoch": 0.79, + "learning_rate": 1.7269698318008304e-06, + "loss": 0.8252, + "step": 30866 + }, + { + "epoch": 0.79, + "learning_rate": 1.7269508310685794e-06, + "loss": 0.7969, + "step": 30867 + }, + { + "epoch": 0.79, + "learning_rate": 1.7269318297797354e-06, + "loss": 0.7014, + "step": 30868 + }, + { + "epoch": 0.79, + "learning_rate": 1.7269128279343135e-06, + "loss": 0.9746, + "step": 30869 + }, + { + "epoch": 0.79, + "learning_rate": 1.7268938255323277e-06, + "loss": 0.9131, + "step": 30870 + }, + { + "epoch": 0.79, + "learning_rate": 1.7268748225737925e-06, + "loss": 0.5811, + "step": 30871 + }, + { + "epoch": 0.79, + "learning_rate": 1.726855819058723e-06, + "loss": 0.9307, + "step": 30872 + }, + { + "epoch": 0.79, + "learning_rate": 1.7268368149871333e-06, + "loss": 0.6079, + "step": 30873 + }, + { + "epoch": 0.79, + "learning_rate": 1.7268178103590382e-06, + "loss": 0.7808, + "step": 30874 + }, + { + "epoch": 0.79, + "learning_rate": 1.7267988051744519e-06, + "loss": 0.7905, + "step": 30875 + }, + { + "epoch": 0.79, + "learning_rate": 1.7267797994333893e-06, + "loss": 0.8799, + "step": 30876 + }, + { + "epoch": 0.79, + "learning_rate": 1.7267607931358648e-06, + "loss": 0.916, + "step": 30877 + }, + { + "epoch": 0.79, + "learning_rate": 1.7267417862818929e-06, + "loss": 0.8447, + "step": 30878 + }, + { + "epoch": 0.79, + "learning_rate": 1.7267227788714882e-06, + "loss": 0.6489, + "step": 30879 + }, + { + "epoch": 0.79, + "learning_rate": 1.7267037709046655e-06, + "loss": 0.8613, + "step": 30880 + }, + { + "epoch": 0.79, + "learning_rate": 1.726684762381439e-06, + "loss": 0.8574, + "step": 30881 + }, + { + "epoch": 0.79, + "learning_rate": 1.7266657533018231e-06, + "loss": 0.8115, + "step": 30882 + }, + { + "epoch": 0.79, + "learning_rate": 1.7266467436658329e-06, + "loss": 0.8203, + "step": 30883 + }, + { + "epoch": 0.79, + "learning_rate": 1.726627733473483e-06, + "loss": 0.9375, + "step": 30884 + }, + { + "epoch": 0.79, + "learning_rate": 1.7266087227247875e-06, + "loss": 0.8433, + "step": 30885 + }, + { + "epoch": 0.79, + "learning_rate": 1.726589711419761e-06, + "loss": 0.9668, + "step": 30886 + }, + { + "epoch": 0.79, + "learning_rate": 1.726570699558418e-06, + "loss": 0.8721, + "step": 30887 + }, + { + "epoch": 0.79, + "learning_rate": 1.7265516871407736e-06, + "loss": 0.7227, + "step": 30888 + }, + { + "epoch": 0.79, + "learning_rate": 1.7265326741668416e-06, + "loss": 0.8584, + "step": 30889 + }, + { + "epoch": 0.79, + "learning_rate": 1.726513660636637e-06, + "loss": 0.6096, + "step": 30890 + }, + { + "epoch": 0.79, + "learning_rate": 1.7264946465501745e-06, + "loss": 0.9502, + "step": 30891 + }, + { + "epoch": 0.79, + "learning_rate": 1.7264756319074684e-06, + "loss": 1.085, + "step": 30892 + }, + { + "epoch": 0.79, + "learning_rate": 1.7264566167085332e-06, + "loss": 0.668, + "step": 30893 + }, + { + "epoch": 0.79, + "learning_rate": 1.7264376009533838e-06, + "loss": 0.833, + "step": 30894 + }, + { + "epoch": 0.79, + "learning_rate": 1.7264185846420344e-06, + "loss": 0.9814, + "step": 30895 + }, + { + "epoch": 0.79, + "learning_rate": 1.7263995677744997e-06, + "loss": 0.7217, + "step": 30896 + }, + { + "epoch": 0.79, + "learning_rate": 1.7263805503507945e-06, + "loss": 0.6875, + "step": 30897 + }, + { + "epoch": 0.79, + "learning_rate": 1.7263615323709326e-06, + "loss": 0.7966, + "step": 30898 + }, + { + "epoch": 0.79, + "learning_rate": 1.7263425138349295e-06, + "loss": 0.7261, + "step": 30899 + }, + { + "epoch": 0.79, + "learning_rate": 1.726323494742799e-06, + "loss": 0.9727, + "step": 30900 + }, + { + "epoch": 0.79, + "learning_rate": 1.7263044750945563e-06, + "loss": 0.7759, + "step": 30901 + }, + { + "epoch": 0.79, + "learning_rate": 1.7262854548902154e-06, + "loss": 0.8057, + "step": 30902 + }, + { + "epoch": 0.79, + "learning_rate": 1.7262664341297912e-06, + "loss": 0.8311, + "step": 30903 + }, + { + "epoch": 0.79, + "learning_rate": 1.7262474128132983e-06, + "loss": 0.7666, + "step": 30904 + }, + { + "epoch": 0.79, + "learning_rate": 1.726228390940751e-06, + "loss": 0.8926, + "step": 30905 + }, + { + "epoch": 0.79, + "learning_rate": 1.7262093685121642e-06, + "loss": 0.999, + "step": 30906 + }, + { + "epoch": 0.79, + "learning_rate": 1.7261903455275521e-06, + "loss": 0.7432, + "step": 30907 + }, + { + "epoch": 0.79, + "learning_rate": 1.7261713219869295e-06, + "loss": 0.7808, + "step": 30908 + }, + { + "epoch": 0.79, + "learning_rate": 1.726152297890311e-06, + "loss": 1.0039, + "step": 30909 + }, + { + "epoch": 0.79, + "learning_rate": 1.7261332732377109e-06, + "loss": 0.8984, + "step": 30910 + }, + { + "epoch": 0.79, + "learning_rate": 1.726114248029144e-06, + "loss": 0.9717, + "step": 30911 + }, + { + "epoch": 0.79, + "learning_rate": 1.7260952222646249e-06, + "loss": 0.646, + "step": 30912 + }, + { + "epoch": 0.79, + "learning_rate": 1.726076195944168e-06, + "loss": 1.0166, + "step": 30913 + }, + { + "epoch": 0.79, + "learning_rate": 1.7260571690677879e-06, + "loss": 0.5547, + "step": 30914 + }, + { + "epoch": 0.79, + "learning_rate": 1.7260381416354992e-06, + "loss": 0.9209, + "step": 30915 + }, + { + "epoch": 0.79, + "learning_rate": 1.7260191136473168e-06, + "loss": 0.5781, + "step": 30916 + }, + { + "epoch": 0.79, + "learning_rate": 1.7260000851032547e-06, + "loss": 0.7217, + "step": 30917 + }, + { + "epoch": 0.79, + "learning_rate": 1.7259810560033277e-06, + "loss": 0.8848, + "step": 30918 + }, + { + "epoch": 0.79, + "learning_rate": 1.7259620263475503e-06, + "loss": 0.7539, + "step": 30919 + }, + { + "epoch": 0.79, + "learning_rate": 1.7259429961359371e-06, + "loss": 1.0293, + "step": 30920 + }, + { + "epoch": 0.79, + "learning_rate": 1.7259239653685032e-06, + "loss": 0.6611, + "step": 30921 + }, + { + "epoch": 0.79, + "learning_rate": 1.7259049340452622e-06, + "loss": 0.8193, + "step": 30922 + }, + { + "epoch": 0.79, + "learning_rate": 1.7258859021662293e-06, + "loss": 0.6641, + "step": 30923 + }, + { + "epoch": 0.79, + "learning_rate": 1.7258668697314192e-06, + "loss": 0.9102, + "step": 30924 + }, + { + "epoch": 0.79, + "learning_rate": 1.7258478367408459e-06, + "loss": 0.8252, + "step": 30925 + }, + { + "epoch": 0.79, + "learning_rate": 1.7258288031945243e-06, + "loss": 1.0122, + "step": 30926 + }, + { + "epoch": 0.79, + "learning_rate": 1.7258097690924691e-06, + "loss": 0.9561, + "step": 30927 + }, + { + "epoch": 0.79, + "learning_rate": 1.7257907344346947e-06, + "loss": 0.8613, + "step": 30928 + }, + { + "epoch": 0.79, + "learning_rate": 1.7257716992212154e-06, + "loss": 0.79, + "step": 30929 + }, + { + "epoch": 0.79, + "learning_rate": 1.7257526634520464e-06, + "loss": 0.7197, + "step": 30930 + }, + { + "epoch": 0.79, + "learning_rate": 1.725733627127202e-06, + "loss": 0.7122, + "step": 30931 + }, + { + "epoch": 0.79, + "learning_rate": 1.7257145902466967e-06, + "loss": 0.6953, + "step": 30932 + }, + { + "epoch": 0.79, + "learning_rate": 1.7256955528105453e-06, + "loss": 0.7808, + "step": 30933 + }, + { + "epoch": 0.79, + "learning_rate": 1.7256765148187617e-06, + "loss": 0.7471, + "step": 30934 + }, + { + "epoch": 0.79, + "learning_rate": 1.7256574762713614e-06, + "loss": 0.8066, + "step": 30935 + }, + { + "epoch": 0.79, + "learning_rate": 1.7256384371683584e-06, + "loss": 1.1328, + "step": 30936 + }, + { + "epoch": 0.79, + "learning_rate": 1.7256193975097673e-06, + "loss": 0.6895, + "step": 30937 + }, + { + "epoch": 0.79, + "learning_rate": 1.7256003572956028e-06, + "loss": 0.7656, + "step": 30938 + }, + { + "epoch": 0.79, + "learning_rate": 1.7255813165258796e-06, + "loss": 0.7168, + "step": 30939 + }, + { + "epoch": 0.79, + "learning_rate": 1.725562275200612e-06, + "loss": 0.9619, + "step": 30940 + }, + { + "epoch": 0.79, + "learning_rate": 1.725543233319815e-06, + "loss": 0.8496, + "step": 30941 + }, + { + "epoch": 0.79, + "learning_rate": 1.7255241908835027e-06, + "loss": 0.7505, + "step": 30942 + }, + { + "epoch": 0.79, + "learning_rate": 1.72550514789169e-06, + "loss": 0.7407, + "step": 30943 + }, + { + "epoch": 0.79, + "learning_rate": 1.7254861043443911e-06, + "loss": 0.9502, + "step": 30944 + }, + { + "epoch": 0.79, + "learning_rate": 1.725467060241621e-06, + "loss": 0.9121, + "step": 30945 + }, + { + "epoch": 0.79, + "learning_rate": 1.7254480155833942e-06, + "loss": 0.6084, + "step": 30946 + }, + { + "epoch": 0.79, + "learning_rate": 1.725428970369725e-06, + "loss": 0.8867, + "step": 30947 + }, + { + "epoch": 0.79, + "learning_rate": 1.7254099246006283e-06, + "loss": 0.9629, + "step": 30948 + }, + { + "epoch": 0.79, + "learning_rate": 1.7253908782761187e-06, + "loss": 0.9277, + "step": 30949 + }, + { + "epoch": 0.79, + "learning_rate": 1.7253718313962105e-06, + "loss": 0.8975, + "step": 30950 + }, + { + "epoch": 0.79, + "learning_rate": 1.7253527839609188e-06, + "loss": 1.0146, + "step": 30951 + }, + { + "epoch": 0.79, + "learning_rate": 1.7253337359702575e-06, + "loss": 0.9434, + "step": 30952 + }, + { + "epoch": 0.79, + "learning_rate": 1.7253146874242414e-06, + "loss": 0.8203, + "step": 30953 + }, + { + "epoch": 0.79, + "learning_rate": 1.7252956383228857e-06, + "loss": 0.8965, + "step": 30954 + }, + { + "epoch": 0.79, + "learning_rate": 1.7252765886662037e-06, + "loss": 0.915, + "step": 30955 + }, + { + "epoch": 0.79, + "learning_rate": 1.7252575384542114e-06, + "loss": 0.6187, + "step": 30956 + }, + { + "epoch": 0.79, + "learning_rate": 1.7252384876869225e-06, + "loss": 0.7583, + "step": 30957 + }, + { + "epoch": 0.79, + "learning_rate": 1.7252194363643523e-06, + "loss": 0.7102, + "step": 30958 + }, + { + "epoch": 0.79, + "learning_rate": 1.7252003844865143e-06, + "loss": 1.0117, + "step": 30959 + }, + { + "epoch": 0.79, + "learning_rate": 1.725181332053424e-06, + "loss": 0.8633, + "step": 30960 + }, + { + "epoch": 0.79, + "learning_rate": 1.7251622790650954e-06, + "loss": 0.5498, + "step": 30961 + }, + { + "epoch": 0.79, + "learning_rate": 1.7251432255215436e-06, + "loss": 0.9658, + "step": 30962 + }, + { + "epoch": 0.79, + "learning_rate": 1.725124171422783e-06, + "loss": 0.4546, + "step": 30963 + }, + { + "epoch": 0.79, + "learning_rate": 1.7251051167688284e-06, + "loss": 1.1436, + "step": 30964 + }, + { + "epoch": 0.79, + "learning_rate": 1.725086061559694e-06, + "loss": 0.873, + "step": 30965 + }, + { + "epoch": 0.79, + "learning_rate": 1.7250670057953943e-06, + "loss": 0.7964, + "step": 30966 + }, + { + "epoch": 0.79, + "learning_rate": 1.7250479494759442e-06, + "loss": 0.9375, + "step": 30967 + }, + { + "epoch": 0.79, + "learning_rate": 1.7250288926013582e-06, + "loss": 0.7354, + "step": 30968 + }, + { + "epoch": 0.79, + "learning_rate": 1.725009835171651e-06, + "loss": 1.002, + "step": 30969 + }, + { + "epoch": 0.79, + "learning_rate": 1.7249907771868374e-06, + "loss": 1.0029, + "step": 30970 + }, + { + "epoch": 0.79, + "learning_rate": 1.7249717186469313e-06, + "loss": 0.7441, + "step": 30971 + }, + { + "epoch": 0.79, + "learning_rate": 1.7249526595519477e-06, + "loss": 1.0234, + "step": 30972 + }, + { + "epoch": 0.79, + "learning_rate": 1.7249335999019014e-06, + "loss": 1.043, + "step": 30973 + }, + { + "epoch": 0.79, + "learning_rate": 1.7249145396968067e-06, + "loss": 0.7227, + "step": 30974 + }, + { + "epoch": 0.79, + "learning_rate": 1.7248954789366784e-06, + "loss": 0.855, + "step": 30975 + }, + { + "epoch": 0.79, + "learning_rate": 1.7248764176215306e-06, + "loss": 1.1406, + "step": 30976 + }, + { + "epoch": 0.79, + "learning_rate": 1.7248573557513786e-06, + "loss": 0.6768, + "step": 30977 + }, + { + "epoch": 0.79, + "learning_rate": 1.7248382933262365e-06, + "loss": 0.9111, + "step": 30978 + }, + { + "epoch": 0.79, + "learning_rate": 1.7248192303461191e-06, + "loss": 0.9805, + "step": 30979 + }, + { + "epoch": 0.79, + "learning_rate": 1.7248001668110408e-06, + "loss": 0.8467, + "step": 30980 + }, + { + "epoch": 0.79, + "learning_rate": 1.7247811027210163e-06, + "loss": 0.5366, + "step": 30981 + }, + { + "epoch": 0.79, + "learning_rate": 1.7247620380760605e-06, + "loss": 0.6313, + "step": 30982 + }, + { + "epoch": 0.79, + "learning_rate": 1.7247429728761876e-06, + "loss": 1.0205, + "step": 30983 + }, + { + "epoch": 0.79, + "learning_rate": 1.7247239071214124e-06, + "loss": 0.8154, + "step": 30984 + }, + { + "epoch": 0.79, + "learning_rate": 1.7247048408117495e-06, + "loss": 0.9131, + "step": 30985 + }, + { + "epoch": 0.79, + "learning_rate": 1.7246857739472132e-06, + "loss": 0.5234, + "step": 30986 + }, + { + "epoch": 0.79, + "learning_rate": 1.7246667065278183e-06, + "loss": 0.7632, + "step": 30987 + }, + { + "epoch": 0.79, + "learning_rate": 1.7246476385535798e-06, + "loss": 1.042, + "step": 30988 + }, + { + "epoch": 0.79, + "learning_rate": 1.7246285700245115e-06, + "loss": 0.8901, + "step": 30989 + }, + { + "epoch": 0.79, + "learning_rate": 1.7246095009406285e-06, + "loss": 0.9092, + "step": 30990 + }, + { + "epoch": 0.79, + "learning_rate": 1.7245904313019457e-06, + "loss": 0.8096, + "step": 30991 + }, + { + "epoch": 0.79, + "learning_rate": 1.724571361108477e-06, + "loss": 0.791, + "step": 30992 + }, + { + "epoch": 0.79, + "learning_rate": 1.724552290360237e-06, + "loss": 0.9658, + "step": 30993 + }, + { + "epoch": 0.79, + "learning_rate": 1.7245332190572413e-06, + "loss": 0.6792, + "step": 30994 + }, + { + "epoch": 0.79, + "learning_rate": 1.7245141471995033e-06, + "loss": 0.833, + "step": 30995 + }, + { + "epoch": 0.79, + "learning_rate": 1.7244950747870383e-06, + "loss": 0.8691, + "step": 30996 + }, + { + "epoch": 0.79, + "learning_rate": 1.724476001819861e-06, + "loss": 0.7969, + "step": 30997 + }, + { + "epoch": 0.79, + "learning_rate": 1.7244569282979856e-06, + "loss": 0.7949, + "step": 30998 + }, + { + "epoch": 0.79, + "learning_rate": 1.7244378542214267e-06, + "loss": 0.8877, + "step": 30999 + }, + { + "epoch": 0.79, + "learning_rate": 1.724418779590199e-06, + "loss": 0.8154, + "step": 31000 + }, + { + "epoch": 0.79, + "learning_rate": 1.7243997044043176e-06, + "loss": 0.8594, + "step": 31001 + }, + { + "epoch": 0.79, + "learning_rate": 1.724380628663796e-06, + "loss": 0.7969, + "step": 31002 + }, + { + "epoch": 0.79, + "learning_rate": 1.72436155236865e-06, + "loss": 0.9062, + "step": 31003 + }, + { + "epoch": 0.79, + "learning_rate": 1.7243424755188934e-06, + "loss": 1.0107, + "step": 31004 + }, + { + "epoch": 0.79, + "learning_rate": 1.724323398114541e-06, + "loss": 1.0371, + "step": 31005 + }, + { + "epoch": 0.79, + "learning_rate": 1.7243043201556077e-06, + "loss": 0.8467, + "step": 31006 + }, + { + "epoch": 0.79, + "learning_rate": 1.7242852416421076e-06, + "loss": 0.8774, + "step": 31007 + }, + { + "epoch": 0.79, + "learning_rate": 1.724266162574056e-06, + "loss": 0.8994, + "step": 31008 + }, + { + "epoch": 0.79, + "learning_rate": 1.724247082951467e-06, + "loss": 0.998, + "step": 31009 + }, + { + "epoch": 0.79, + "learning_rate": 1.724228002774355e-06, + "loss": 0.7471, + "step": 31010 + }, + { + "epoch": 0.79, + "learning_rate": 1.7242089220427353e-06, + "loss": 0.6445, + "step": 31011 + }, + { + "epoch": 0.79, + "learning_rate": 1.724189840756622e-06, + "loss": 0.8398, + "step": 31012 + }, + { + "epoch": 0.79, + "learning_rate": 1.7241707589160295e-06, + "loss": 0.8652, + "step": 31013 + }, + { + "epoch": 0.79, + "learning_rate": 1.724151676520973e-06, + "loss": 0.7451, + "step": 31014 + }, + { + "epoch": 0.79, + "learning_rate": 1.724132593571467e-06, + "loss": 0.7783, + "step": 31015 + }, + { + "epoch": 0.79, + "learning_rate": 1.724113510067526e-06, + "loss": 0.6699, + "step": 31016 + }, + { + "epoch": 0.79, + "learning_rate": 1.7240944260091643e-06, + "loss": 0.9883, + "step": 31017 + }, + { + "epoch": 0.8, + "learning_rate": 1.724075341396397e-06, + "loss": 0.8984, + "step": 31018 + }, + { + "epoch": 0.8, + "learning_rate": 1.7240562562292383e-06, + "loss": 0.8574, + "step": 31019 + }, + { + "epoch": 0.8, + "learning_rate": 1.724037170507703e-06, + "loss": 0.8887, + "step": 31020 + }, + { + "epoch": 0.8, + "learning_rate": 1.724018084231806e-06, + "loss": 0.6758, + "step": 31021 + }, + { + "epoch": 0.8, + "learning_rate": 1.7239989974015616e-06, + "loss": 0.8203, + "step": 31022 + }, + { + "epoch": 0.8, + "learning_rate": 1.7239799100169844e-06, + "loss": 0.9404, + "step": 31023 + }, + { + "epoch": 0.8, + "learning_rate": 1.723960822078089e-06, + "loss": 0.7275, + "step": 31024 + }, + { + "epoch": 0.8, + "learning_rate": 1.72394173358489e-06, + "loss": 0.8818, + "step": 31025 + }, + { + "epoch": 0.8, + "learning_rate": 1.7239226445374025e-06, + "loss": 0.7051, + "step": 31026 + }, + { + "epoch": 0.8, + "learning_rate": 1.7239035549356405e-06, + "loss": 0.8447, + "step": 31027 + }, + { + "epoch": 0.8, + "learning_rate": 1.7238844647796188e-06, + "loss": 1.0176, + "step": 31028 + }, + { + "epoch": 0.8, + "learning_rate": 1.7238653740693518e-06, + "loss": 0.9102, + "step": 31029 + }, + { + "epoch": 0.8, + "learning_rate": 1.7238462828048548e-06, + "loss": 0.9736, + "step": 31030 + }, + { + "epoch": 0.8, + "learning_rate": 1.7238271909861419e-06, + "loss": 0.8301, + "step": 31031 + }, + { + "epoch": 0.8, + "learning_rate": 1.7238080986132278e-06, + "loss": 0.595, + "step": 31032 + }, + { + "epoch": 0.8, + "learning_rate": 1.723789005686127e-06, + "loss": 0.6909, + "step": 31033 + }, + { + "epoch": 0.8, + "learning_rate": 1.723769912204854e-06, + "loss": 0.8662, + "step": 31034 + }, + { + "epoch": 0.8, + "learning_rate": 1.723750818169424e-06, + "loss": 0.9883, + "step": 31035 + }, + { + "epoch": 0.8, + "learning_rate": 1.7237317235798513e-06, + "loss": 1.0752, + "step": 31036 + }, + { + "epoch": 0.8, + "learning_rate": 1.7237126284361506e-06, + "loss": 0.6611, + "step": 31037 + }, + { + "epoch": 0.8, + "learning_rate": 1.723693532738336e-06, + "loss": 0.7383, + "step": 31038 + }, + { + "epoch": 0.8, + "learning_rate": 1.7236744364864226e-06, + "loss": 1.0088, + "step": 31039 + }, + { + "epoch": 0.8, + "learning_rate": 1.723655339680425e-06, + "loss": 0.8574, + "step": 31040 + }, + { + "epoch": 0.8, + "learning_rate": 1.723636242320358e-06, + "loss": 0.7446, + "step": 31041 + }, + { + "epoch": 0.8, + "learning_rate": 1.723617144406236e-06, + "loss": 0.7732, + "step": 31042 + }, + { + "epoch": 0.8, + "learning_rate": 1.7235980459380736e-06, + "loss": 0.9268, + "step": 31043 + }, + { + "epoch": 0.8, + "learning_rate": 1.7235789469158853e-06, + "loss": 1.0498, + "step": 31044 + }, + { + "epoch": 0.8, + "learning_rate": 1.7235598473396857e-06, + "loss": 0.9502, + "step": 31045 + }, + { + "epoch": 0.8, + "learning_rate": 1.72354074720949e-06, + "loss": 0.7266, + "step": 31046 + }, + { + "epoch": 0.8, + "learning_rate": 1.723521646525312e-06, + "loss": 0.7529, + "step": 31047 + }, + { + "epoch": 0.8, + "learning_rate": 1.7235025452871672e-06, + "loss": 0.5576, + "step": 31048 + }, + { + "epoch": 0.8, + "learning_rate": 1.7234834434950699e-06, + "loss": 0.834, + "step": 31049 + }, + { + "epoch": 0.8, + "learning_rate": 1.7234643411490342e-06, + "loss": 0.9219, + "step": 31050 + }, + { + "epoch": 0.8, + "learning_rate": 1.723445238249075e-06, + "loss": 0.9297, + "step": 31051 + }, + { + "epoch": 0.8, + "learning_rate": 1.7234261347952073e-06, + "loss": 0.9189, + "step": 31052 + }, + { + "epoch": 0.8, + "learning_rate": 1.7234070307874452e-06, + "loss": 0.7417, + "step": 31053 + }, + { + "epoch": 0.8, + "learning_rate": 1.723387926225804e-06, + "loss": 1.0361, + "step": 31054 + }, + { + "epoch": 0.8, + "learning_rate": 1.7233688211102976e-06, + "loss": 0.9922, + "step": 31055 + }, + { + "epoch": 0.8, + "learning_rate": 1.7233497154409413e-06, + "loss": 0.7852, + "step": 31056 + }, + { + "epoch": 0.8, + "learning_rate": 1.723330609217749e-06, + "loss": 0.5734, + "step": 31057 + }, + { + "epoch": 0.8, + "learning_rate": 1.723311502440736e-06, + "loss": 0.8608, + "step": 31058 + }, + { + "epoch": 0.8, + "learning_rate": 1.7232923951099166e-06, + "loss": 0.9209, + "step": 31059 + }, + { + "epoch": 0.8, + "learning_rate": 1.7232732872253051e-06, + "loss": 0.749, + "step": 31060 + }, + { + "epoch": 0.8, + "learning_rate": 1.723254178786917e-06, + "loss": 0.7578, + "step": 31061 + }, + { + "epoch": 0.8, + "learning_rate": 1.7232350697947663e-06, + "loss": 0.8037, + "step": 31062 + }, + { + "epoch": 0.8, + "learning_rate": 1.7232159602488675e-06, + "loss": 0.8643, + "step": 31063 + }, + { + "epoch": 0.8, + "learning_rate": 1.7231968501492356e-06, + "loss": 0.8574, + "step": 31064 + }, + { + "epoch": 0.8, + "learning_rate": 1.7231777394958852e-06, + "loss": 0.8877, + "step": 31065 + }, + { + "epoch": 0.8, + "learning_rate": 1.7231586282888307e-06, + "loss": 0.9082, + "step": 31066 + }, + { + "epoch": 0.8, + "learning_rate": 1.7231395165280874e-06, + "loss": 0.8633, + "step": 31067 + }, + { + "epoch": 0.8, + "learning_rate": 1.723120404213669e-06, + "loss": 0.6313, + "step": 31068 + }, + { + "epoch": 0.8, + "learning_rate": 1.7231012913455905e-06, + "loss": 0.7075, + "step": 31069 + }, + { + "epoch": 0.8, + "learning_rate": 1.723082177923867e-06, + "loss": 0.9971, + "step": 31070 + }, + { + "epoch": 0.8, + "learning_rate": 1.7230630639485124e-06, + "loss": 0.7485, + "step": 31071 + }, + { + "epoch": 0.8, + "learning_rate": 1.7230439494195417e-06, + "loss": 0.8975, + "step": 31072 + }, + { + "epoch": 0.8, + "learning_rate": 1.7230248343369693e-06, + "loss": 0.9707, + "step": 31073 + }, + { + "epoch": 0.8, + "learning_rate": 1.7230057187008103e-06, + "loss": 0.9619, + "step": 31074 + }, + { + "epoch": 0.8, + "learning_rate": 1.7229866025110789e-06, + "loss": 0.8413, + "step": 31075 + }, + { + "epoch": 0.8, + "learning_rate": 1.72296748576779e-06, + "loss": 0.7266, + "step": 31076 + }, + { + "epoch": 0.8, + "learning_rate": 1.7229483684709583e-06, + "loss": 0.5337, + "step": 31077 + }, + { + "epoch": 0.8, + "learning_rate": 1.722929250620598e-06, + "loss": 0.7969, + "step": 31078 + }, + { + "epoch": 0.8, + "learning_rate": 1.7229101322167244e-06, + "loss": 0.9092, + "step": 31079 + }, + { + "epoch": 0.8, + "learning_rate": 1.7228910132593513e-06, + "loss": 0.7441, + "step": 31080 + }, + { + "epoch": 0.8, + "learning_rate": 1.7228718937484939e-06, + "loss": 0.8936, + "step": 31081 + }, + { + "epoch": 0.8, + "learning_rate": 1.7228527736841669e-06, + "loss": 0.6597, + "step": 31082 + }, + { + "epoch": 0.8, + "learning_rate": 1.7228336530663846e-06, + "loss": 0.5833, + "step": 31083 + }, + { + "epoch": 0.8, + "learning_rate": 1.7228145318951617e-06, + "loss": 0.7783, + "step": 31084 + }, + { + "epoch": 0.8, + "learning_rate": 1.7227954101705132e-06, + "loss": 0.7192, + "step": 31085 + }, + { + "epoch": 0.8, + "learning_rate": 1.7227762878924535e-06, + "loss": 0.7881, + "step": 31086 + }, + { + "epoch": 0.8, + "learning_rate": 1.7227571650609972e-06, + "loss": 0.9092, + "step": 31087 + }, + { + "epoch": 0.8, + "learning_rate": 1.722738041676159e-06, + "loss": 0.8828, + "step": 31088 + }, + { + "epoch": 0.8, + "learning_rate": 1.722718917737953e-06, + "loss": 0.9404, + "step": 31089 + }, + { + "epoch": 0.8, + "learning_rate": 1.7226997932463951e-06, + "loss": 1.0361, + "step": 31090 + }, + { + "epoch": 0.8, + "learning_rate": 1.722680668201499e-06, + "loss": 0.5918, + "step": 31091 + }, + { + "epoch": 0.8, + "learning_rate": 1.7226615426032792e-06, + "loss": 0.4253, + "step": 31092 + }, + { + "epoch": 0.8, + "learning_rate": 1.722642416451751e-06, + "loss": 0.9307, + "step": 31093 + }, + { + "epoch": 0.8, + "learning_rate": 1.7226232897469286e-06, + "loss": 0.9893, + "step": 31094 + }, + { + "epoch": 0.8, + "learning_rate": 1.7226041624888268e-06, + "loss": 0.6304, + "step": 31095 + }, + { + "epoch": 0.8, + "learning_rate": 1.7225850346774605e-06, + "loss": 0.873, + "step": 31096 + }, + { + "epoch": 0.8, + "learning_rate": 1.7225659063128438e-06, + "loss": 1.0137, + "step": 31097 + }, + { + "epoch": 0.8, + "learning_rate": 1.7225467773949914e-06, + "loss": 0.8594, + "step": 31098 + }, + { + "epoch": 0.8, + "learning_rate": 1.7225276479239184e-06, + "loss": 0.8682, + "step": 31099 + }, + { + "epoch": 0.8, + "learning_rate": 1.722508517899639e-06, + "loss": 0.875, + "step": 31100 + }, + { + "epoch": 0.8, + "learning_rate": 1.7224893873221685e-06, + "loss": 0.793, + "step": 31101 + }, + { + "epoch": 0.8, + "learning_rate": 1.7224702561915208e-06, + "loss": 0.8086, + "step": 31102 + }, + { + "epoch": 0.8, + "learning_rate": 1.7224511245077107e-06, + "loss": 0.9395, + "step": 31103 + }, + { + "epoch": 0.8, + "learning_rate": 1.7224319922707533e-06, + "loss": 1.0508, + "step": 31104 + }, + { + "epoch": 0.8, + "learning_rate": 1.7224128594806626e-06, + "loss": 0.9375, + "step": 31105 + }, + { + "epoch": 0.8, + "learning_rate": 1.7223937261374539e-06, + "loss": 1.0645, + "step": 31106 + }, + { + "epoch": 0.8, + "learning_rate": 1.7223745922411411e-06, + "loss": 1.0029, + "step": 31107 + }, + { + "epoch": 0.8, + "learning_rate": 1.7223554577917398e-06, + "loss": 0.7744, + "step": 31108 + }, + { + "epoch": 0.8, + "learning_rate": 1.722336322789264e-06, + "loss": 0.7842, + "step": 31109 + }, + { + "epoch": 0.8, + "learning_rate": 1.7223171872337286e-06, + "loss": 0.7246, + "step": 31110 + }, + { + "epoch": 0.8, + "learning_rate": 1.7222980511251479e-06, + "loss": 0.8623, + "step": 31111 + }, + { + "epoch": 0.8, + "learning_rate": 1.7222789144635368e-06, + "loss": 0.8936, + "step": 31112 + }, + { + "epoch": 0.8, + "learning_rate": 1.7222597772489103e-06, + "loss": 0.8115, + "step": 31113 + }, + { + "epoch": 0.8, + "learning_rate": 1.7222406394812824e-06, + "loss": 0.8828, + "step": 31114 + }, + { + "epoch": 0.8, + "learning_rate": 1.7222215011606677e-06, + "loss": 0.7324, + "step": 31115 + }, + { + "epoch": 0.8, + "learning_rate": 1.7222023622870818e-06, + "loss": 1.0391, + "step": 31116 + }, + { + "epoch": 0.8, + "learning_rate": 1.7221832228605386e-06, + "loss": 0.7754, + "step": 31117 + }, + { + "epoch": 0.8, + "learning_rate": 1.722164082881053e-06, + "loss": 0.8711, + "step": 31118 + }, + { + "epoch": 0.8, + "learning_rate": 1.7221449423486392e-06, + "loss": 0.7515, + "step": 31119 + }, + { + "epoch": 0.8, + "learning_rate": 1.7221258012633126e-06, + "loss": 0.6846, + "step": 31120 + }, + { + "epoch": 0.8, + "learning_rate": 1.7221066596250873e-06, + "loss": 0.9746, + "step": 31121 + }, + { + "epoch": 0.8, + "learning_rate": 1.7220875174339779e-06, + "loss": 0.7969, + "step": 31122 + }, + { + "epoch": 0.8, + "learning_rate": 1.7220683746899999e-06, + "loss": 0.7227, + "step": 31123 + }, + { + "epoch": 0.8, + "learning_rate": 1.722049231393167e-06, + "loss": 0.9102, + "step": 31124 + }, + { + "epoch": 0.8, + "learning_rate": 1.7220300875434938e-06, + "loss": 1.0117, + "step": 31125 + }, + { + "epoch": 0.8, + "learning_rate": 1.722010943140996e-06, + "loss": 0.9062, + "step": 31126 + }, + { + "epoch": 0.8, + "learning_rate": 1.7219917981856873e-06, + "loss": 1.0361, + "step": 31127 + }, + { + "epoch": 0.8, + "learning_rate": 1.7219726526775828e-06, + "loss": 0.8508, + "step": 31128 + }, + { + "epoch": 0.8, + "learning_rate": 1.721953506616697e-06, + "loss": 0.8701, + "step": 31129 + }, + { + "epoch": 0.8, + "learning_rate": 1.7219343600030448e-06, + "loss": 0.9492, + "step": 31130 + }, + { + "epoch": 0.8, + "learning_rate": 1.7219152128366404e-06, + "loss": 0.8301, + "step": 31131 + }, + { + "epoch": 0.8, + "learning_rate": 1.7218960651174985e-06, + "loss": 0.9209, + "step": 31132 + }, + { + "epoch": 0.8, + "learning_rate": 1.7218769168456344e-06, + "loss": 0.9873, + "step": 31133 + }, + { + "epoch": 0.8, + "learning_rate": 1.7218577680210622e-06, + "loss": 0.9414, + "step": 31134 + }, + { + "epoch": 0.8, + "learning_rate": 1.7218386186437968e-06, + "loss": 0.9053, + "step": 31135 + }, + { + "epoch": 0.8, + "learning_rate": 1.7218194687138526e-06, + "loss": 0.7891, + "step": 31136 + }, + { + "epoch": 0.8, + "learning_rate": 1.7218003182312443e-06, + "loss": 1.0039, + "step": 31137 + }, + { + "epoch": 0.8, + "learning_rate": 1.721781167195987e-06, + "loss": 0.8545, + "step": 31138 + }, + { + "epoch": 0.8, + "learning_rate": 1.7217620156080948e-06, + "loss": 0.79, + "step": 31139 + }, + { + "epoch": 0.8, + "learning_rate": 1.7217428634675829e-06, + "loss": 0.7031, + "step": 31140 + }, + { + "epoch": 0.8, + "learning_rate": 1.7217237107744653e-06, + "loss": 0.7932, + "step": 31141 + }, + { + "epoch": 0.8, + "learning_rate": 1.7217045575287572e-06, + "loss": 0.6641, + "step": 31142 + }, + { + "epoch": 0.8, + "learning_rate": 1.7216854037304732e-06, + "loss": 0.7141, + "step": 31143 + }, + { + "epoch": 0.8, + "learning_rate": 1.721666249379628e-06, + "loss": 0.9189, + "step": 31144 + }, + { + "epoch": 0.8, + "learning_rate": 1.7216470944762357e-06, + "loss": 0.7861, + "step": 31145 + }, + { + "epoch": 0.8, + "learning_rate": 1.7216279390203118e-06, + "loss": 0.782, + "step": 31146 + }, + { + "epoch": 0.8, + "learning_rate": 1.7216087830118703e-06, + "loss": 0.8867, + "step": 31147 + }, + { + "epoch": 0.8, + "learning_rate": 1.7215896264509263e-06, + "loss": 0.875, + "step": 31148 + }, + { + "epoch": 0.8, + "learning_rate": 1.7215704693374944e-06, + "loss": 0.9834, + "step": 31149 + }, + { + "epoch": 0.8, + "learning_rate": 1.7215513116715888e-06, + "loss": 0.9785, + "step": 31150 + }, + { + "epoch": 0.8, + "learning_rate": 1.7215321534532247e-06, + "loss": 0.8503, + "step": 31151 + }, + { + "epoch": 0.8, + "learning_rate": 1.7215129946824168e-06, + "loss": 0.9756, + "step": 31152 + }, + { + "epoch": 0.8, + "learning_rate": 1.7214938353591792e-06, + "loss": 0.8828, + "step": 31153 + }, + { + "epoch": 0.8, + "learning_rate": 1.7214746754835274e-06, + "loss": 0.5942, + "step": 31154 + }, + { + "epoch": 0.8, + "learning_rate": 1.7214555150554752e-06, + "loss": 0.7822, + "step": 31155 + }, + { + "epoch": 0.8, + "learning_rate": 1.7214363540750381e-06, + "loss": 0.96, + "step": 31156 + }, + { + "epoch": 0.8, + "learning_rate": 1.72141719254223e-06, + "loss": 0.7568, + "step": 31157 + }, + { + "epoch": 0.8, + "learning_rate": 1.7213980304570664e-06, + "loss": 0.8789, + "step": 31158 + }, + { + "epoch": 0.8, + "learning_rate": 1.7213788678195612e-06, + "loss": 1.1016, + "step": 31159 + }, + { + "epoch": 0.8, + "learning_rate": 1.7213597046297293e-06, + "loss": 0.6943, + "step": 31160 + }, + { + "epoch": 0.8, + "learning_rate": 1.7213405408875853e-06, + "loss": 1.0293, + "step": 31161 + }, + { + "epoch": 0.8, + "learning_rate": 1.7213213765931443e-06, + "loss": 0.8545, + "step": 31162 + }, + { + "epoch": 0.8, + "learning_rate": 1.7213022117464205e-06, + "loss": 0.7324, + "step": 31163 + }, + { + "epoch": 0.8, + "learning_rate": 1.7212830463474288e-06, + "loss": 0.6758, + "step": 31164 + }, + { + "epoch": 0.8, + "learning_rate": 1.7212638803961838e-06, + "loss": 0.7542, + "step": 31165 + }, + { + "epoch": 0.8, + "learning_rate": 1.7212447138927003e-06, + "loss": 0.8457, + "step": 31166 + }, + { + "epoch": 0.8, + "learning_rate": 1.721225546836993e-06, + "loss": 0.6719, + "step": 31167 + }, + { + "epoch": 0.8, + "learning_rate": 1.7212063792290766e-06, + "loss": 0.9775, + "step": 31168 + }, + { + "epoch": 0.8, + "learning_rate": 1.7211872110689652e-06, + "loss": 0.9307, + "step": 31169 + }, + { + "epoch": 0.8, + "learning_rate": 1.7211680423566742e-06, + "loss": 0.7358, + "step": 31170 + }, + { + "epoch": 0.8, + "learning_rate": 1.7211488730922176e-06, + "loss": 1.0098, + "step": 31171 + }, + { + "epoch": 0.8, + "learning_rate": 1.721129703275611e-06, + "loss": 0.8804, + "step": 31172 + }, + { + "epoch": 0.8, + "learning_rate": 1.7211105329068682e-06, + "loss": 0.8076, + "step": 31173 + }, + { + "epoch": 0.8, + "learning_rate": 1.7210913619860042e-06, + "loss": 0.8008, + "step": 31174 + }, + { + "epoch": 0.8, + "learning_rate": 1.721072190513034e-06, + "loss": 0.8936, + "step": 31175 + }, + { + "epoch": 0.8, + "learning_rate": 1.7210530184879716e-06, + "loss": 0.7944, + "step": 31176 + }, + { + "epoch": 0.8, + "learning_rate": 1.7210338459108323e-06, + "loss": 0.5916, + "step": 31177 + }, + { + "epoch": 0.8, + "learning_rate": 1.7210146727816306e-06, + "loss": 0.8838, + "step": 31178 + }, + { + "epoch": 0.8, + "learning_rate": 1.720995499100381e-06, + "loss": 0.7119, + "step": 31179 + }, + { + "epoch": 0.8, + "learning_rate": 1.7209763248670983e-06, + "loss": 0.9199, + "step": 31180 + }, + { + "epoch": 0.8, + "learning_rate": 1.7209571500817972e-06, + "loss": 0.8545, + "step": 31181 + }, + { + "epoch": 0.8, + "learning_rate": 1.7209379747444922e-06, + "loss": 0.6396, + "step": 31182 + }, + { + "epoch": 0.8, + "learning_rate": 1.7209187988551985e-06, + "loss": 0.7695, + "step": 31183 + }, + { + "epoch": 0.8, + "learning_rate": 1.7208996224139302e-06, + "loss": 0.8018, + "step": 31184 + }, + { + "epoch": 0.8, + "learning_rate": 1.7208804454207022e-06, + "loss": 0.7725, + "step": 31185 + }, + { + "epoch": 0.8, + "learning_rate": 1.7208612678755292e-06, + "loss": 0.8145, + "step": 31186 + }, + { + "epoch": 0.8, + "learning_rate": 1.720842089778426e-06, + "loss": 0.9014, + "step": 31187 + }, + { + "epoch": 0.8, + "learning_rate": 1.720822911129407e-06, + "loss": 0.7939, + "step": 31188 + }, + { + "epoch": 0.8, + "learning_rate": 1.7208037319284872e-06, + "loss": 0.9883, + "step": 31189 + }, + { + "epoch": 0.8, + "learning_rate": 1.720784552175681e-06, + "loss": 0.8882, + "step": 31190 + }, + { + "epoch": 0.8, + "learning_rate": 1.720765371871003e-06, + "loss": 0.8223, + "step": 31191 + }, + { + "epoch": 0.8, + "learning_rate": 1.7207461910144684e-06, + "loss": 1.0029, + "step": 31192 + }, + { + "epoch": 0.8, + "learning_rate": 1.7207270096060916e-06, + "loss": 0.9209, + "step": 31193 + }, + { + "epoch": 0.8, + "learning_rate": 1.7207078276458872e-06, + "loss": 0.6989, + "step": 31194 + }, + { + "epoch": 0.8, + "learning_rate": 1.7206886451338698e-06, + "loss": 1.2227, + "step": 31195 + }, + { + "epoch": 0.8, + "learning_rate": 1.7206694620700544e-06, + "loss": 1.0215, + "step": 31196 + }, + { + "epoch": 0.8, + "learning_rate": 1.7206502784544554e-06, + "loss": 1.0566, + "step": 31197 + }, + { + "epoch": 0.8, + "learning_rate": 1.7206310942870879e-06, + "loss": 0.9023, + "step": 31198 + }, + { + "epoch": 0.8, + "learning_rate": 1.720611909567966e-06, + "loss": 0.5334, + "step": 31199 + }, + { + "epoch": 0.8, + "learning_rate": 1.7205927242971048e-06, + "loss": 0.9375, + "step": 31200 + }, + { + "epoch": 0.8, + "learning_rate": 1.7205735384745191e-06, + "loss": 0.5137, + "step": 31201 + }, + { + "epoch": 0.8, + "learning_rate": 1.720554352100223e-06, + "loss": 0.8799, + "step": 31202 + }, + { + "epoch": 0.8, + "learning_rate": 1.720535165174232e-06, + "loss": 0.8828, + "step": 31203 + }, + { + "epoch": 0.8, + "learning_rate": 1.7205159776965598e-06, + "loss": 0.7695, + "step": 31204 + }, + { + "epoch": 0.8, + "learning_rate": 1.720496789667222e-06, + "loss": 1.0098, + "step": 31205 + }, + { + "epoch": 0.8, + "learning_rate": 1.7204776010862329e-06, + "loss": 0.7773, + "step": 31206 + }, + { + "epoch": 0.8, + "learning_rate": 1.7204584119536074e-06, + "loss": 0.668, + "step": 31207 + }, + { + "epoch": 0.8, + "learning_rate": 1.7204392222693597e-06, + "loss": 0.7417, + "step": 31208 + }, + { + "epoch": 0.8, + "learning_rate": 1.720420032033505e-06, + "loss": 0.6729, + "step": 31209 + }, + { + "epoch": 0.8, + "learning_rate": 1.7204008412460578e-06, + "loss": 0.8438, + "step": 31210 + }, + { + "epoch": 0.8, + "learning_rate": 1.7203816499070326e-06, + "loss": 1.0723, + "step": 31211 + }, + { + "epoch": 0.8, + "learning_rate": 1.7203624580164444e-06, + "loss": 0.916, + "step": 31212 + }, + { + "epoch": 0.8, + "learning_rate": 1.720343265574308e-06, + "loss": 0.8916, + "step": 31213 + }, + { + "epoch": 0.8, + "learning_rate": 1.7203240725806376e-06, + "loss": 0.9678, + "step": 31214 + }, + { + "epoch": 0.8, + "learning_rate": 1.7203048790354484e-06, + "loss": 0.9229, + "step": 31215 + }, + { + "epoch": 0.8, + "learning_rate": 1.7202856849387548e-06, + "loss": 1.1953, + "step": 31216 + }, + { + "epoch": 0.8, + "learning_rate": 1.7202664902905718e-06, + "loss": 0.6743, + "step": 31217 + }, + { + "epoch": 0.8, + "learning_rate": 1.7202472950909135e-06, + "loss": 0.9336, + "step": 31218 + }, + { + "epoch": 0.8, + "learning_rate": 1.7202280993397951e-06, + "loss": 0.8076, + "step": 31219 + }, + { + "epoch": 0.8, + "learning_rate": 1.7202089030372312e-06, + "loss": 0.9023, + "step": 31220 + }, + { + "epoch": 0.8, + "learning_rate": 1.7201897061832363e-06, + "loss": 0.7285, + "step": 31221 + }, + { + "epoch": 0.8, + "learning_rate": 1.720170508777825e-06, + "loss": 0.6909, + "step": 31222 + }, + { + "epoch": 0.8, + "learning_rate": 1.7201513108210128e-06, + "loss": 0.7114, + "step": 31223 + }, + { + "epoch": 0.8, + "learning_rate": 1.7201321123128136e-06, + "loss": 1.0547, + "step": 31224 + }, + { + "epoch": 0.8, + "learning_rate": 1.7201129132532425e-06, + "loss": 0.606, + "step": 31225 + }, + { + "epoch": 0.8, + "learning_rate": 1.7200937136423142e-06, + "loss": 0.6963, + "step": 31226 + }, + { + "epoch": 0.8, + "learning_rate": 1.7200745134800428e-06, + "loss": 0.8701, + "step": 31227 + }, + { + "epoch": 0.8, + "learning_rate": 1.7200553127664438e-06, + "loss": 1.0273, + "step": 31228 + }, + { + "epoch": 0.8, + "learning_rate": 1.7200361115015315e-06, + "loss": 0.5615, + "step": 31229 + }, + { + "epoch": 0.8, + "learning_rate": 1.7200169096853205e-06, + "loss": 0.9971, + "step": 31230 + }, + { + "epoch": 0.8, + "learning_rate": 1.7199977073178257e-06, + "loss": 0.8672, + "step": 31231 + }, + { + "epoch": 0.8, + "learning_rate": 1.719978504399062e-06, + "loss": 0.4878, + "step": 31232 + }, + { + "epoch": 0.8, + "learning_rate": 1.7199593009290435e-06, + "loss": 0.8447, + "step": 31233 + }, + { + "epoch": 0.8, + "learning_rate": 1.7199400969077856e-06, + "loss": 0.8252, + "step": 31234 + }, + { + "epoch": 0.8, + "learning_rate": 1.7199208923353027e-06, + "loss": 0.917, + "step": 31235 + }, + { + "epoch": 0.8, + "learning_rate": 1.719901687211609e-06, + "loss": 0.8828, + "step": 31236 + }, + { + "epoch": 0.8, + "learning_rate": 1.71988248153672e-06, + "loss": 0.9287, + "step": 31237 + }, + { + "epoch": 0.8, + "learning_rate": 1.71986327531065e-06, + "loss": 0.6245, + "step": 31238 + }, + { + "epoch": 0.8, + "learning_rate": 1.7198440685334141e-06, + "loss": 0.6816, + "step": 31239 + }, + { + "epoch": 0.8, + "learning_rate": 1.7198248612050263e-06, + "loss": 0.7451, + "step": 31240 + }, + { + "epoch": 0.8, + "learning_rate": 1.719805653325502e-06, + "loss": 0.917, + "step": 31241 + }, + { + "epoch": 0.8, + "learning_rate": 1.7197864448948556e-06, + "loss": 0.6787, + "step": 31242 + }, + { + "epoch": 0.8, + "learning_rate": 1.7197672359131014e-06, + "loss": 0.7373, + "step": 31243 + }, + { + "epoch": 0.8, + "learning_rate": 1.7197480263802549e-06, + "loss": 0.8223, + "step": 31244 + }, + { + "epoch": 0.8, + "learning_rate": 1.7197288162963304e-06, + "loss": 0.8359, + "step": 31245 + }, + { + "epoch": 0.8, + "learning_rate": 1.7197096056613424e-06, + "loss": 0.9844, + "step": 31246 + }, + { + "epoch": 0.8, + "learning_rate": 1.719690394475306e-06, + "loss": 0.6466, + "step": 31247 + }, + { + "epoch": 0.8, + "learning_rate": 1.719671182738236e-06, + "loss": 1.0454, + "step": 31248 + }, + { + "epoch": 0.8, + "learning_rate": 1.7196519704501466e-06, + "loss": 0.6433, + "step": 31249 + }, + { + "epoch": 0.8, + "learning_rate": 1.7196327576110527e-06, + "loss": 0.8574, + "step": 31250 + }, + { + "epoch": 0.8, + "learning_rate": 1.7196135442209693e-06, + "loss": 0.7881, + "step": 31251 + }, + { + "epoch": 0.8, + "learning_rate": 1.7195943302799107e-06, + "loss": 0.9221, + "step": 31252 + }, + { + "epoch": 0.8, + "learning_rate": 1.719575115787892e-06, + "loss": 0.6362, + "step": 31253 + }, + { + "epoch": 0.8, + "learning_rate": 1.7195559007449277e-06, + "loss": 0.7678, + "step": 31254 + }, + { + "epoch": 0.8, + "learning_rate": 1.7195366851510325e-06, + "loss": 0.7871, + "step": 31255 + }, + { + "epoch": 0.8, + "learning_rate": 1.719517469006221e-06, + "loss": 0.9639, + "step": 31256 + }, + { + "epoch": 0.8, + "learning_rate": 1.7194982523105081e-06, + "loss": 0.8887, + "step": 31257 + }, + { + "epoch": 0.8, + "learning_rate": 1.7194790350639087e-06, + "loss": 0.9355, + "step": 31258 + }, + { + "epoch": 0.8, + "learning_rate": 1.7194598172664372e-06, + "loss": 1.0605, + "step": 31259 + }, + { + "epoch": 0.8, + "learning_rate": 1.7194405989181082e-06, + "loss": 1.0381, + "step": 31260 + }, + { + "epoch": 0.8, + "learning_rate": 1.7194213800189367e-06, + "loss": 0.9043, + "step": 31261 + }, + { + "epoch": 0.8, + "learning_rate": 1.7194021605689374e-06, + "loss": 0.998, + "step": 31262 + }, + { + "epoch": 0.8, + "learning_rate": 1.719382940568125e-06, + "loss": 0.5486, + "step": 31263 + }, + { + "epoch": 0.8, + "learning_rate": 1.7193637200165139e-06, + "loss": 0.9482, + "step": 31264 + }, + { + "epoch": 0.8, + "learning_rate": 1.7193444989141193e-06, + "loss": 0.791, + "step": 31265 + }, + { + "epoch": 0.8, + "learning_rate": 1.719325277260956e-06, + "loss": 0.7197, + "step": 31266 + }, + { + "epoch": 0.8, + "learning_rate": 1.719306055057038e-06, + "loss": 0.9258, + "step": 31267 + }, + { + "epoch": 0.8, + "learning_rate": 1.71928683230238e-06, + "loss": 0.9844, + "step": 31268 + }, + { + "epoch": 0.8, + "learning_rate": 1.719267608996998e-06, + "loss": 0.6836, + "step": 31269 + }, + { + "epoch": 0.8, + "learning_rate": 1.7192483851409055e-06, + "loss": 1.0176, + "step": 31270 + }, + { + "epoch": 0.8, + "learning_rate": 1.7192291607341174e-06, + "loss": 0.7939, + "step": 31271 + }, + { + "epoch": 0.8, + "learning_rate": 1.7192099357766489e-06, + "loss": 0.7307, + "step": 31272 + }, + { + "epoch": 0.8, + "learning_rate": 1.7191907102685143e-06, + "loss": 1.0488, + "step": 31273 + }, + { + "epoch": 0.8, + "learning_rate": 1.7191714842097284e-06, + "loss": 0.6807, + "step": 31274 + }, + { + "epoch": 0.8, + "learning_rate": 1.7191522576003061e-06, + "loss": 1.0723, + "step": 31275 + }, + { + "epoch": 0.8, + "learning_rate": 1.719133030440262e-06, + "loss": 0.9395, + "step": 31276 + }, + { + "epoch": 0.8, + "learning_rate": 1.7191138027296105e-06, + "loss": 0.8384, + "step": 31277 + }, + { + "epoch": 0.8, + "learning_rate": 1.7190945744683669e-06, + "loss": 1.0303, + "step": 31278 + }, + { + "epoch": 0.8, + "learning_rate": 1.7190753456565456e-06, + "loss": 0.835, + "step": 31279 + }, + { + "epoch": 0.8, + "learning_rate": 1.7190561162941614e-06, + "loss": 1.0078, + "step": 31280 + }, + { + "epoch": 0.8, + "learning_rate": 1.7190368863812287e-06, + "loss": 0.7979, + "step": 31281 + }, + { + "epoch": 0.8, + "learning_rate": 1.719017655917763e-06, + "loss": 0.8311, + "step": 31282 + }, + { + "epoch": 0.8, + "learning_rate": 1.7189984249037784e-06, + "loss": 0.9443, + "step": 31283 + }, + { + "epoch": 0.8, + "learning_rate": 1.7189791933392894e-06, + "loss": 0.8438, + "step": 31284 + }, + { + "epoch": 0.8, + "learning_rate": 1.7189599612243116e-06, + "loss": 0.4159, + "step": 31285 + }, + { + "epoch": 0.8, + "learning_rate": 1.718940728558859e-06, + "loss": 0.7905, + "step": 31286 + }, + { + "epoch": 0.8, + "learning_rate": 1.7189214953429466e-06, + "loss": 0.7554, + "step": 31287 + }, + { + "epoch": 0.8, + "learning_rate": 1.7189022615765887e-06, + "loss": 1.0059, + "step": 31288 + }, + { + "epoch": 0.8, + "learning_rate": 1.7188830272598008e-06, + "loss": 0.8462, + "step": 31289 + }, + { + "epoch": 0.8, + "learning_rate": 1.7188637923925971e-06, + "loss": 0.9072, + "step": 31290 + }, + { + "epoch": 0.8, + "learning_rate": 1.7188445569749925e-06, + "loss": 0.8223, + "step": 31291 + }, + { + "epoch": 0.8, + "learning_rate": 1.7188253210070016e-06, + "loss": 0.833, + "step": 31292 + }, + { + "epoch": 0.8, + "learning_rate": 1.7188060844886391e-06, + "loss": 0.7861, + "step": 31293 + }, + { + "epoch": 0.8, + "learning_rate": 1.7187868474199202e-06, + "loss": 0.9268, + "step": 31294 + }, + { + "epoch": 0.8, + "learning_rate": 1.7187676098008587e-06, + "loss": 0.8213, + "step": 31295 + }, + { + "epoch": 0.8, + "learning_rate": 1.7187483716314704e-06, + "loss": 0.8643, + "step": 31296 + }, + { + "epoch": 0.8, + "learning_rate": 1.7187291329117693e-06, + "loss": 0.8525, + "step": 31297 + }, + { + "epoch": 0.8, + "learning_rate": 1.7187098936417703e-06, + "loss": 0.9199, + "step": 31298 + }, + { + "epoch": 0.8, + "learning_rate": 1.7186906538214886e-06, + "loss": 1.0967, + "step": 31299 + }, + { + "epoch": 0.8, + "learning_rate": 1.718671413450938e-06, + "loss": 0.7021, + "step": 31300 + }, + { + "epoch": 0.8, + "learning_rate": 1.7186521725301339e-06, + "loss": 0.8369, + "step": 31301 + }, + { + "epoch": 0.8, + "learning_rate": 1.718632931059091e-06, + "loss": 0.8867, + "step": 31302 + }, + { + "epoch": 0.8, + "learning_rate": 1.7186136890378238e-06, + "loss": 0.7271, + "step": 31303 + }, + { + "epoch": 0.8, + "learning_rate": 1.718594446466347e-06, + "loss": 0.791, + "step": 31304 + }, + { + "epoch": 0.8, + "learning_rate": 1.7185752033446756e-06, + "loss": 0.8979, + "step": 31305 + }, + { + "epoch": 0.8, + "learning_rate": 1.7185559596728243e-06, + "loss": 0.8838, + "step": 31306 + }, + { + "epoch": 0.8, + "learning_rate": 1.7185367154508077e-06, + "loss": 0.6624, + "step": 31307 + }, + { + "epoch": 0.8, + "learning_rate": 1.7185174706786405e-06, + "loss": 0.6304, + "step": 31308 + }, + { + "epoch": 0.8, + "learning_rate": 1.7184982253563376e-06, + "loss": 1.1016, + "step": 31309 + }, + { + "epoch": 0.8, + "learning_rate": 1.7184789794839135e-06, + "loss": 0.9434, + "step": 31310 + }, + { + "epoch": 0.8, + "learning_rate": 1.7184597330613833e-06, + "loss": 0.8486, + "step": 31311 + }, + { + "epoch": 0.8, + "learning_rate": 1.7184404860887613e-06, + "loss": 0.9023, + "step": 31312 + }, + { + "epoch": 0.8, + "learning_rate": 1.7184212385660625e-06, + "loss": 0.5947, + "step": 31313 + }, + { + "epoch": 0.8, + "learning_rate": 1.7184019904933018e-06, + "loss": 0.9795, + "step": 31314 + }, + { + "epoch": 0.8, + "learning_rate": 1.7183827418704938e-06, + "loss": 1.0469, + "step": 31315 + }, + { + "epoch": 0.8, + "learning_rate": 1.7183634926976528e-06, + "loss": 0.9414, + "step": 31316 + }, + { + "epoch": 0.8, + "learning_rate": 1.718344242974794e-06, + "loss": 1.0869, + "step": 31317 + }, + { + "epoch": 0.8, + "learning_rate": 1.7183249927019321e-06, + "loss": 0.6885, + "step": 31318 + }, + { + "epoch": 0.8, + "learning_rate": 1.7183057418790818e-06, + "loss": 0.9902, + "step": 31319 + }, + { + "epoch": 0.8, + "learning_rate": 1.7182864905062577e-06, + "loss": 0.6494, + "step": 31320 + }, + { + "epoch": 0.8, + "learning_rate": 1.718267238583475e-06, + "loss": 0.832, + "step": 31321 + }, + { + "epoch": 0.8, + "learning_rate": 1.718247986110748e-06, + "loss": 0.8799, + "step": 31322 + }, + { + "epoch": 0.8, + "learning_rate": 1.7182287330880913e-06, + "loss": 0.7402, + "step": 31323 + }, + { + "epoch": 0.8, + "learning_rate": 1.71820947951552e-06, + "loss": 0.5845, + "step": 31324 + }, + { + "epoch": 0.8, + "learning_rate": 1.7181902253930486e-06, + "loss": 0.9385, + "step": 31325 + }, + { + "epoch": 0.8, + "learning_rate": 1.7181709707206921e-06, + "loss": 0.9287, + "step": 31326 + }, + { + "epoch": 0.8, + "learning_rate": 1.7181517154984651e-06, + "loss": 0.9131, + "step": 31327 + }, + { + "epoch": 0.8, + "learning_rate": 1.7181324597263824e-06, + "loss": 0.8965, + "step": 31328 + }, + { + "epoch": 0.8, + "learning_rate": 1.7181132034044587e-06, + "loss": 1.0986, + "step": 31329 + }, + { + "epoch": 0.8, + "learning_rate": 1.7180939465327087e-06, + "loss": 1.0684, + "step": 31330 + }, + { + "epoch": 0.8, + "learning_rate": 1.7180746891111471e-06, + "loss": 0.9248, + "step": 31331 + }, + { + "epoch": 0.8, + "learning_rate": 1.7180554311397887e-06, + "loss": 0.8271, + "step": 31332 + }, + { + "epoch": 0.8, + "learning_rate": 1.7180361726186483e-06, + "loss": 1.0674, + "step": 31333 + }, + { + "epoch": 0.8, + "learning_rate": 1.718016913547741e-06, + "loss": 0.7949, + "step": 31334 + }, + { + "epoch": 0.8, + "learning_rate": 1.717997653927081e-06, + "loss": 0.9697, + "step": 31335 + }, + { + "epoch": 0.8, + "learning_rate": 1.7179783937566827e-06, + "loss": 0.8926, + "step": 31336 + }, + { + "epoch": 0.8, + "learning_rate": 1.7179591330365617e-06, + "loss": 0.7891, + "step": 31337 + }, + { + "epoch": 0.8, + "learning_rate": 1.7179398717667323e-06, + "loss": 0.5605, + "step": 31338 + }, + { + "epoch": 0.8, + "learning_rate": 1.7179206099472096e-06, + "loss": 0.7568, + "step": 31339 + }, + { + "epoch": 0.8, + "learning_rate": 1.7179013475780079e-06, + "loss": 0.6387, + "step": 31340 + }, + { + "epoch": 0.8, + "learning_rate": 1.7178820846591423e-06, + "loss": 0.8613, + "step": 31341 + }, + { + "epoch": 0.8, + "learning_rate": 1.7178628211906275e-06, + "loss": 0.8379, + "step": 31342 + }, + { + "epoch": 0.8, + "learning_rate": 1.7178435571724782e-06, + "loss": 0.8652, + "step": 31343 + }, + { + "epoch": 0.8, + "learning_rate": 1.7178242926047086e-06, + "loss": 0.9834, + "step": 31344 + }, + { + "epoch": 0.8, + "learning_rate": 1.7178050274873343e-06, + "loss": 0.7803, + "step": 31345 + }, + { + "epoch": 0.8, + "learning_rate": 1.7177857618203694e-06, + "loss": 0.8984, + "step": 31346 + }, + { + "epoch": 0.8, + "learning_rate": 1.7177664956038295e-06, + "loss": 0.9199, + "step": 31347 + }, + { + "epoch": 0.8, + "learning_rate": 1.7177472288377284e-06, + "loss": 0.6509, + "step": 31348 + }, + { + "epoch": 0.8, + "learning_rate": 1.7177279615220812e-06, + "loss": 1.0049, + "step": 31349 + }, + { + "epoch": 0.8, + "learning_rate": 1.7177086936569028e-06, + "loss": 0.6841, + "step": 31350 + }, + { + "epoch": 0.8, + "learning_rate": 1.7176894252422078e-06, + "loss": 0.6843, + "step": 31351 + }, + { + "epoch": 0.8, + "learning_rate": 1.717670156278011e-06, + "loss": 0.6846, + "step": 31352 + }, + { + "epoch": 0.8, + "learning_rate": 1.7176508867643274e-06, + "loss": 0.9463, + "step": 31353 + }, + { + "epoch": 0.8, + "learning_rate": 1.7176316167011713e-06, + "loss": 0.7861, + "step": 31354 + }, + { + "epoch": 0.8, + "learning_rate": 1.7176123460885577e-06, + "loss": 1.0273, + "step": 31355 + }, + { + "epoch": 0.8, + "learning_rate": 1.7175930749265013e-06, + "loss": 0.875, + "step": 31356 + }, + { + "epoch": 0.8, + "learning_rate": 1.7175738032150168e-06, + "loss": 0.9062, + "step": 31357 + }, + { + "epoch": 0.8, + "learning_rate": 1.7175545309541192e-06, + "loss": 0.9521, + "step": 31358 + }, + { + "epoch": 0.8, + "learning_rate": 1.7175352581438229e-06, + "loss": 1.0322, + "step": 31359 + }, + { + "epoch": 0.8, + "learning_rate": 1.7175159847841431e-06, + "loss": 0.5898, + "step": 31360 + }, + { + "epoch": 0.8, + "learning_rate": 1.7174967108750943e-06, + "loss": 0.6841, + "step": 31361 + }, + { + "epoch": 0.8, + "learning_rate": 1.7174774364166913e-06, + "loss": 0.8152, + "step": 31362 + }, + { + "epoch": 0.8, + "learning_rate": 1.7174581614089486e-06, + "loss": 0.8486, + "step": 31363 + }, + { + "epoch": 0.8, + "learning_rate": 1.7174388858518811e-06, + "loss": 0.9727, + "step": 31364 + }, + { + "epoch": 0.8, + "learning_rate": 1.717419609745504e-06, + "loss": 0.6404, + "step": 31365 + }, + { + "epoch": 0.8, + "learning_rate": 1.7174003330898311e-06, + "loss": 0.9863, + "step": 31366 + }, + { + "epoch": 0.8, + "learning_rate": 1.7173810558848784e-06, + "loss": 0.8115, + "step": 31367 + }, + { + "epoch": 0.8, + "learning_rate": 1.7173617781306598e-06, + "loss": 0.5669, + "step": 31368 + }, + { + "epoch": 0.8, + "learning_rate": 1.71734249982719e-06, + "loss": 0.9082, + "step": 31369 + }, + { + "epoch": 0.8, + "learning_rate": 1.7173232209744843e-06, + "loss": 0.7622, + "step": 31370 + }, + { + "epoch": 0.8, + "learning_rate": 1.717303941572557e-06, + "loss": 0.896, + "step": 31371 + }, + { + "epoch": 0.8, + "learning_rate": 1.7172846616214232e-06, + "loss": 0.8916, + "step": 31372 + }, + { + "epoch": 0.8, + "learning_rate": 1.7172653811210975e-06, + "loss": 1.0059, + "step": 31373 + }, + { + "epoch": 0.8, + "learning_rate": 1.7172461000715948e-06, + "loss": 0.8335, + "step": 31374 + }, + { + "epoch": 0.8, + "learning_rate": 1.7172268184729295e-06, + "loss": 0.8818, + "step": 31375 + }, + { + "epoch": 0.8, + "learning_rate": 1.717207536325117e-06, + "loss": 0.8125, + "step": 31376 + }, + { + "epoch": 0.8, + "learning_rate": 1.7171882536281712e-06, + "loss": 0.8652, + "step": 31377 + }, + { + "epoch": 0.8, + "learning_rate": 1.7171689703821075e-06, + "loss": 0.8574, + "step": 31378 + }, + { + "epoch": 0.8, + "learning_rate": 1.7171496865869405e-06, + "loss": 0.6934, + "step": 31379 + }, + { + "epoch": 0.8, + "learning_rate": 1.7171304022426849e-06, + "loss": 0.9141, + "step": 31380 + }, + { + "epoch": 0.8, + "learning_rate": 1.7171111173493556e-06, + "loss": 0.5537, + "step": 31381 + }, + { + "epoch": 0.8, + "learning_rate": 1.7170918319069675e-06, + "loss": 1.0625, + "step": 31382 + }, + { + "epoch": 0.8, + "learning_rate": 1.717072545915535e-06, + "loss": 0.9648, + "step": 31383 + }, + { + "epoch": 0.8, + "learning_rate": 1.7170532593750728e-06, + "loss": 0.6079, + "step": 31384 + }, + { + "epoch": 0.8, + "learning_rate": 1.7170339722855962e-06, + "loss": 0.9717, + "step": 31385 + }, + { + "epoch": 0.8, + "learning_rate": 1.7170146846471193e-06, + "loss": 0.793, + "step": 31386 + }, + { + "epoch": 0.8, + "learning_rate": 1.7169953964596575e-06, + "loss": 1.0088, + "step": 31387 + }, + { + "epoch": 0.8, + "learning_rate": 1.7169761077232252e-06, + "loss": 0.7544, + "step": 31388 + }, + { + "epoch": 0.8, + "learning_rate": 1.7169568184378376e-06, + "loss": 1.0225, + "step": 31389 + }, + { + "epoch": 0.8, + "learning_rate": 1.7169375286035086e-06, + "loss": 0.9512, + "step": 31390 + }, + { + "epoch": 0.8, + "learning_rate": 1.7169182382202539e-06, + "loss": 1.1172, + "step": 31391 + }, + { + "epoch": 0.8, + "learning_rate": 1.7168989472880875e-06, + "loss": 0.7344, + "step": 31392 + }, + { + "epoch": 0.8, + "learning_rate": 1.7168796558070246e-06, + "loss": 0.686, + "step": 31393 + }, + { + "epoch": 0.8, + "learning_rate": 1.7168603637770802e-06, + "loss": 1.0449, + "step": 31394 + }, + { + "epoch": 0.8, + "learning_rate": 1.7168410711982686e-06, + "loss": 0.6147, + "step": 31395 + }, + { + "epoch": 0.8, + "learning_rate": 1.7168217780706047e-06, + "loss": 0.8525, + "step": 31396 + }, + { + "epoch": 0.8, + "learning_rate": 1.7168024843941036e-06, + "loss": 0.644, + "step": 31397 + }, + { + "epoch": 0.8, + "learning_rate": 1.7167831901687794e-06, + "loss": 0.792, + "step": 31398 + }, + { + "epoch": 0.8, + "learning_rate": 1.7167638953946477e-06, + "loss": 0.8818, + "step": 31399 + }, + { + "epoch": 0.8, + "learning_rate": 1.7167446000717225e-06, + "loss": 0.8506, + "step": 31400 + }, + { + "epoch": 0.8, + "learning_rate": 1.7167253042000191e-06, + "loss": 0.7822, + "step": 31401 + }, + { + "epoch": 0.8, + "learning_rate": 1.716706007779552e-06, + "loss": 0.7534, + "step": 31402 + }, + { + "epoch": 0.8, + "learning_rate": 1.716686710810336e-06, + "loss": 0.9375, + "step": 31403 + }, + { + "epoch": 0.8, + "learning_rate": 1.716667413292386e-06, + "loss": 0.6499, + "step": 31404 + }, + { + "epoch": 0.8, + "learning_rate": 1.716648115225717e-06, + "loss": 0.939, + "step": 31405 + }, + { + "epoch": 0.8, + "learning_rate": 1.716628816610343e-06, + "loss": 1.0137, + "step": 31406 + }, + { + "epoch": 0.8, + "learning_rate": 1.7166095174462795e-06, + "loss": 0.625, + "step": 31407 + }, + { + "epoch": 0.81, + "learning_rate": 1.7165902177335411e-06, + "loss": 0.7832, + "step": 31408 + }, + { + "epoch": 0.81, + "learning_rate": 1.7165709174721426e-06, + "loss": 0.5706, + "step": 31409 + }, + { + "epoch": 0.81, + "learning_rate": 1.7165516166620986e-06, + "loss": 0.7651, + "step": 31410 + }, + { + "epoch": 0.81, + "learning_rate": 1.716532315303424e-06, + "loss": 0.7783, + "step": 31411 + }, + { + "epoch": 0.81, + "learning_rate": 1.7165130133961335e-06, + "loss": 0.7578, + "step": 31412 + }, + { + "epoch": 0.81, + "learning_rate": 1.7164937109402418e-06, + "loss": 0.8438, + "step": 31413 + }, + { + "epoch": 0.81, + "learning_rate": 1.7164744079357641e-06, + "loss": 0.8545, + "step": 31414 + }, + { + "epoch": 0.81, + "learning_rate": 1.7164551043827147e-06, + "loss": 0.876, + "step": 31415 + }, + { + "epoch": 0.81, + "learning_rate": 1.7164358002811085e-06, + "loss": 0.7622, + "step": 31416 + }, + { + "epoch": 0.81, + "learning_rate": 1.7164164956309604e-06, + "loss": 0.9072, + "step": 31417 + }, + { + "epoch": 0.81, + "learning_rate": 1.7163971904322851e-06, + "loss": 0.8838, + "step": 31418 + }, + { + "epoch": 0.81, + "learning_rate": 1.7163778846850976e-06, + "loss": 0.9639, + "step": 31419 + }, + { + "epoch": 0.81, + "learning_rate": 1.7163585783894123e-06, + "loss": 0.8054, + "step": 31420 + }, + { + "epoch": 0.81, + "learning_rate": 1.7163392715452442e-06, + "loss": 0.769, + "step": 31421 + }, + { + "epoch": 0.81, + "learning_rate": 1.7163199641526082e-06, + "loss": 0.9873, + "step": 31422 + }, + { + "epoch": 0.81, + "learning_rate": 1.7163006562115188e-06, + "loss": 0.9043, + "step": 31423 + }, + { + "epoch": 0.81, + "learning_rate": 1.7162813477219912e-06, + "loss": 0.8301, + "step": 31424 + }, + { + "epoch": 0.81, + "learning_rate": 1.7162620386840394e-06, + "loss": 0.9434, + "step": 31425 + }, + { + "epoch": 0.81, + "learning_rate": 1.716242729097679e-06, + "loss": 0.8174, + "step": 31426 + }, + { + "epoch": 0.81, + "learning_rate": 1.7162234189629246e-06, + "loss": 0.9355, + "step": 31427 + }, + { + "epoch": 0.81, + "learning_rate": 1.7162041082797907e-06, + "loss": 1.0742, + "step": 31428 + }, + { + "epoch": 0.81, + "learning_rate": 1.7161847970482923e-06, + "loss": 0.8662, + "step": 31429 + }, + { + "epoch": 0.81, + "learning_rate": 1.7161654852684443e-06, + "loss": 0.6682, + "step": 31430 + }, + { + "epoch": 0.81, + "learning_rate": 1.716146172940261e-06, + "loss": 0.6797, + "step": 31431 + }, + { + "epoch": 0.81, + "learning_rate": 1.7161268600637574e-06, + "loss": 1.1807, + "step": 31432 + }, + { + "epoch": 0.81, + "learning_rate": 1.7161075466389487e-06, + "loss": 0.8252, + "step": 31433 + }, + { + "epoch": 0.81, + "learning_rate": 1.7160882326658493e-06, + "loss": 0.8311, + "step": 31434 + }, + { + "epoch": 0.81, + "learning_rate": 1.716068918144474e-06, + "loss": 1.0381, + "step": 31435 + }, + { + "epoch": 0.81, + "learning_rate": 1.7160496030748377e-06, + "loss": 0.8467, + "step": 31436 + }, + { + "epoch": 0.81, + "learning_rate": 1.7160302874569552e-06, + "loss": 0.7129, + "step": 31437 + }, + { + "epoch": 0.81, + "learning_rate": 1.7160109712908413e-06, + "loss": 0.8691, + "step": 31438 + }, + { + "epoch": 0.81, + "learning_rate": 1.7159916545765105e-06, + "loss": 0.9678, + "step": 31439 + }, + { + "epoch": 0.81, + "learning_rate": 1.7159723373139778e-06, + "loss": 0.9707, + "step": 31440 + }, + { + "epoch": 0.81, + "learning_rate": 1.7159530195032584e-06, + "loss": 0.873, + "step": 31441 + }, + { + "epoch": 0.81, + "learning_rate": 1.7159337011443663e-06, + "loss": 0.7612, + "step": 31442 + }, + { + "epoch": 0.81, + "learning_rate": 1.7159143822373169e-06, + "loss": 0.8369, + "step": 31443 + }, + { + "epoch": 0.81, + "learning_rate": 1.7158950627821244e-06, + "loss": 0.5562, + "step": 31444 + }, + { + "epoch": 0.81, + "learning_rate": 1.7158757427788045e-06, + "loss": 0.8149, + "step": 31445 + }, + { + "epoch": 0.81, + "learning_rate": 1.715856422227371e-06, + "loss": 0.707, + "step": 31446 + }, + { + "epoch": 0.81, + "learning_rate": 1.7158371011278395e-06, + "loss": 0.915, + "step": 31447 + }, + { + "epoch": 0.81, + "learning_rate": 1.7158177794802242e-06, + "loss": 0.752, + "step": 31448 + }, + { + "epoch": 0.81, + "learning_rate": 1.7157984572845403e-06, + "loss": 1.043, + "step": 31449 + }, + { + "epoch": 0.81, + "learning_rate": 1.7157791345408024e-06, + "loss": 0.7559, + "step": 31450 + }, + { + "epoch": 0.81, + "learning_rate": 1.7157598112490253e-06, + "loss": 0.8271, + "step": 31451 + }, + { + "epoch": 0.81, + "learning_rate": 1.7157404874092238e-06, + "loss": 0.9463, + "step": 31452 + }, + { + "epoch": 0.81, + "learning_rate": 1.7157211630214127e-06, + "loss": 0.7998, + "step": 31453 + }, + { + "epoch": 0.81, + "learning_rate": 1.715701838085607e-06, + "loss": 0.918, + "step": 31454 + }, + { + "epoch": 0.81, + "learning_rate": 1.715682512601821e-06, + "loss": 0.7314, + "step": 31455 + }, + { + "epoch": 0.81, + "learning_rate": 1.7156631865700701e-06, + "loss": 0.8164, + "step": 31456 + }, + { + "epoch": 0.81, + "learning_rate": 1.7156438599903686e-06, + "loss": 0.9609, + "step": 31457 + }, + { + "epoch": 0.81, + "learning_rate": 1.7156245328627316e-06, + "loss": 0.8311, + "step": 31458 + }, + { + "epoch": 0.81, + "learning_rate": 1.7156052051871738e-06, + "loss": 1.0059, + "step": 31459 + }, + { + "epoch": 0.81, + "learning_rate": 1.7155858769637102e-06, + "loss": 0.8428, + "step": 31460 + }, + { + "epoch": 0.81, + "learning_rate": 1.7155665481923552e-06, + "loss": 1.0049, + "step": 31461 + }, + { + "epoch": 0.81, + "learning_rate": 1.7155472188731238e-06, + "loss": 0.8916, + "step": 31462 + }, + { + "epoch": 0.81, + "learning_rate": 1.7155278890060306e-06, + "loss": 0.8086, + "step": 31463 + }, + { + "epoch": 0.81, + "learning_rate": 1.715508558591091e-06, + "loss": 1.0088, + "step": 31464 + }, + { + "epoch": 0.81, + "learning_rate": 1.715489227628319e-06, + "loss": 0.8467, + "step": 31465 + }, + { + "epoch": 0.81, + "learning_rate": 1.71546989611773e-06, + "loss": 0.77, + "step": 31466 + }, + { + "epoch": 0.81, + "learning_rate": 1.7154505640593386e-06, + "loss": 0.7305, + "step": 31467 + }, + { + "epoch": 0.81, + "learning_rate": 1.7154312314531597e-06, + "loss": 0.9707, + "step": 31468 + }, + { + "epoch": 0.81, + "learning_rate": 1.715411898299208e-06, + "loss": 0.9453, + "step": 31469 + }, + { + "epoch": 0.81, + "learning_rate": 1.715392564597498e-06, + "loss": 0.6025, + "step": 31470 + }, + { + "epoch": 0.81, + "learning_rate": 1.715373230348045e-06, + "loss": 0.8965, + "step": 31471 + }, + { + "epoch": 0.81, + "learning_rate": 1.7153538955508635e-06, + "loss": 0.8428, + "step": 31472 + }, + { + "epoch": 0.81, + "learning_rate": 1.7153345602059685e-06, + "loss": 0.6797, + "step": 31473 + }, + { + "epoch": 0.81, + "learning_rate": 1.7153152243133747e-06, + "loss": 0.8174, + "step": 31474 + }, + { + "epoch": 0.81, + "learning_rate": 1.715295887873097e-06, + "loss": 1.0596, + "step": 31475 + }, + { + "epoch": 0.81, + "learning_rate": 1.71527655088515e-06, + "loss": 1.0186, + "step": 31476 + }, + { + "epoch": 0.81, + "learning_rate": 1.715257213349549e-06, + "loss": 0.874, + "step": 31477 + }, + { + "epoch": 0.81, + "learning_rate": 1.715237875266308e-06, + "loss": 0.5916, + "step": 31478 + }, + { + "epoch": 0.81, + "learning_rate": 1.7152185366354424e-06, + "loss": 0.957, + "step": 31479 + }, + { + "epoch": 0.81, + "learning_rate": 1.715199197456967e-06, + "loss": 0.8955, + "step": 31480 + }, + { + "epoch": 0.81, + "learning_rate": 1.7151798577308963e-06, + "loss": 0.958, + "step": 31481 + }, + { + "epoch": 0.81, + "learning_rate": 1.7151605174572455e-06, + "loss": 0.9121, + "step": 31482 + }, + { + "epoch": 0.81, + "learning_rate": 1.715141176636029e-06, + "loss": 0.7686, + "step": 31483 + }, + { + "epoch": 0.81, + "learning_rate": 1.7151218352672613e-06, + "loss": 0.8145, + "step": 31484 + }, + { + "epoch": 0.81, + "learning_rate": 1.715102493350958e-06, + "loss": 0.8984, + "step": 31485 + }, + { + "epoch": 0.81, + "learning_rate": 1.715083150887134e-06, + "loss": 0.7236, + "step": 31486 + }, + { + "epoch": 0.81, + "learning_rate": 1.7150638078758035e-06, + "loss": 0.6587, + "step": 31487 + }, + { + "epoch": 0.81, + "learning_rate": 1.7150444643169816e-06, + "loss": 0.8298, + "step": 31488 + }, + { + "epoch": 0.81, + "learning_rate": 1.7150251202106829e-06, + "loss": 1.0342, + "step": 31489 + }, + { + "epoch": 0.81, + "learning_rate": 1.7150057755569222e-06, + "loss": 0.8936, + "step": 31490 + }, + { + "epoch": 0.81, + "learning_rate": 1.7149864303557147e-06, + "loss": 0.8921, + "step": 31491 + }, + { + "epoch": 0.81, + "learning_rate": 1.7149670846070748e-06, + "loss": 0.8418, + "step": 31492 + }, + { + "epoch": 0.81, + "learning_rate": 1.7149477383110176e-06, + "loss": 0.8203, + "step": 31493 + }, + { + "epoch": 0.81, + "learning_rate": 1.7149283914675578e-06, + "loss": 0.688, + "step": 31494 + }, + { + "epoch": 0.81, + "learning_rate": 1.7149090440767101e-06, + "loss": 1.0928, + "step": 31495 + }, + { + "epoch": 0.81, + "learning_rate": 1.7148896961384892e-06, + "loss": 0.9258, + "step": 31496 + }, + { + "epoch": 0.81, + "learning_rate": 1.7148703476529108e-06, + "loss": 0.8613, + "step": 31497 + }, + { + "epoch": 0.81, + "learning_rate": 1.7148509986199885e-06, + "loss": 0.7852, + "step": 31498 + }, + { + "epoch": 0.81, + "learning_rate": 1.714831649039738e-06, + "loss": 0.9863, + "step": 31499 + }, + { + "epoch": 0.81, + "learning_rate": 1.7148122989121734e-06, + "loss": 1.0596, + "step": 31500 + }, + { + "epoch": 0.81, + "learning_rate": 1.71479294823731e-06, + "loss": 0.7012, + "step": 31501 + }, + { + "epoch": 0.81, + "learning_rate": 1.7147735970151627e-06, + "loss": 0.5493, + "step": 31502 + }, + { + "epoch": 0.81, + "learning_rate": 1.7147542452457459e-06, + "loss": 0.6846, + "step": 31503 + }, + { + "epoch": 0.81, + "learning_rate": 1.7147348929290747e-06, + "loss": 0.8936, + "step": 31504 + }, + { + "epoch": 0.81, + "learning_rate": 1.714715540065164e-06, + "loss": 0.9014, + "step": 31505 + }, + { + "epoch": 0.81, + "learning_rate": 1.7146961866540284e-06, + "loss": 0.7236, + "step": 31506 + }, + { + "epoch": 0.81, + "learning_rate": 1.7146768326956827e-06, + "loss": 0.7188, + "step": 31507 + }, + { + "epoch": 0.81, + "learning_rate": 1.714657478190142e-06, + "loss": 0.8379, + "step": 31508 + }, + { + "epoch": 0.81, + "learning_rate": 1.7146381231374205e-06, + "loss": 0.7852, + "step": 31509 + }, + { + "epoch": 0.81, + "learning_rate": 1.714618767537534e-06, + "loss": 0.8682, + "step": 31510 + }, + { + "epoch": 0.81, + "learning_rate": 1.7145994113904965e-06, + "loss": 0.708, + "step": 31511 + }, + { + "epoch": 0.81, + "learning_rate": 1.7145800546963233e-06, + "loss": 0.7598, + "step": 31512 + }, + { + "epoch": 0.81, + "learning_rate": 1.7145606974550283e-06, + "loss": 0.9678, + "step": 31513 + }, + { + "epoch": 0.81, + "learning_rate": 1.7145413396666278e-06, + "loss": 1.0557, + "step": 31514 + }, + { + "epoch": 0.81, + "learning_rate": 1.7145219813311355e-06, + "loss": 1.0029, + "step": 31515 + }, + { + "epoch": 0.81, + "learning_rate": 1.7145026224485669e-06, + "loss": 0.8096, + "step": 31516 + }, + { + "epoch": 0.81, + "learning_rate": 1.7144832630189363e-06, + "loss": 0.6533, + "step": 31517 + }, + { + "epoch": 0.81, + "learning_rate": 1.7144639030422586e-06, + "loss": 0.8975, + "step": 31518 + }, + { + "epoch": 0.81, + "learning_rate": 1.7144445425185488e-06, + "loss": 0.7808, + "step": 31519 + }, + { + "epoch": 0.81, + "learning_rate": 1.7144251814478217e-06, + "loss": 0.8252, + "step": 31520 + }, + { + "epoch": 0.81, + "learning_rate": 1.714405819830092e-06, + "loss": 0.8594, + "step": 31521 + }, + { + "epoch": 0.81, + "learning_rate": 1.7143864576653748e-06, + "loss": 0.75, + "step": 31522 + }, + { + "epoch": 0.81, + "learning_rate": 1.7143670949536847e-06, + "loss": 0.7554, + "step": 31523 + }, + { + "epoch": 0.81, + "learning_rate": 1.7143477316950366e-06, + "loss": 0.7363, + "step": 31524 + }, + { + "epoch": 0.81, + "learning_rate": 1.714328367889445e-06, + "loss": 1.0303, + "step": 31525 + }, + { + "epoch": 0.81, + "learning_rate": 1.7143090035369253e-06, + "loss": 0.8701, + "step": 31526 + }, + { + "epoch": 0.81, + "learning_rate": 1.714289638637492e-06, + "loss": 0.957, + "step": 31527 + }, + { + "epoch": 0.81, + "learning_rate": 1.7142702731911598e-06, + "loss": 1.167, + "step": 31528 + }, + { + "epoch": 0.81, + "learning_rate": 1.7142509071979437e-06, + "loss": 0.8418, + "step": 31529 + }, + { + "epoch": 0.81, + "learning_rate": 1.7142315406578586e-06, + "loss": 0.8667, + "step": 31530 + }, + { + "epoch": 0.81, + "learning_rate": 1.714212173570919e-06, + "loss": 0.8818, + "step": 31531 + }, + { + "epoch": 0.81, + "learning_rate": 1.7141928059371406e-06, + "loss": 0.7852, + "step": 31532 + }, + { + "epoch": 0.81, + "learning_rate": 1.7141734377565374e-06, + "loss": 0.5671, + "step": 31533 + }, + { + "epoch": 0.81, + "learning_rate": 1.7141540690291244e-06, + "loss": 0.6848, + "step": 31534 + }, + { + "epoch": 0.81, + "learning_rate": 1.7141346997549162e-06, + "loss": 0.7695, + "step": 31535 + }, + { + "epoch": 0.81, + "learning_rate": 1.7141153299339282e-06, + "loss": 0.5859, + "step": 31536 + }, + { + "epoch": 0.81, + "learning_rate": 1.7140959595661745e-06, + "loss": 1.0, + "step": 31537 + }, + { + "epoch": 0.81, + "learning_rate": 1.7140765886516707e-06, + "loss": 0.9492, + "step": 31538 + }, + { + "epoch": 0.81, + "learning_rate": 1.7140572171904314e-06, + "loss": 0.7988, + "step": 31539 + }, + { + "epoch": 0.81, + "learning_rate": 1.7140378451824708e-06, + "loss": 0.8359, + "step": 31540 + }, + { + "epoch": 0.81, + "learning_rate": 1.7140184726278048e-06, + "loss": 1.0283, + "step": 31541 + }, + { + "epoch": 0.81, + "learning_rate": 1.7139990995264475e-06, + "loss": 0.7466, + "step": 31542 + }, + { + "epoch": 0.81, + "learning_rate": 1.7139797258784139e-06, + "loss": 0.791, + "step": 31543 + }, + { + "epoch": 0.81, + "learning_rate": 1.7139603516837192e-06, + "loss": 0.791, + "step": 31544 + }, + { + "epoch": 0.81, + "learning_rate": 1.713940976942377e-06, + "loss": 0.7896, + "step": 31545 + }, + { + "epoch": 0.81, + "learning_rate": 1.713921601654404e-06, + "loss": 0.8594, + "step": 31546 + }, + { + "epoch": 0.81, + "learning_rate": 1.7139022258198135e-06, + "loss": 0.625, + "step": 31547 + }, + { + "epoch": 0.81, + "learning_rate": 1.7138828494386211e-06, + "loss": 0.9971, + "step": 31548 + }, + { + "epoch": 0.81, + "learning_rate": 1.7138634725108414e-06, + "loss": 0.8975, + "step": 31549 + }, + { + "epoch": 0.81, + "learning_rate": 1.713844095036489e-06, + "loss": 0.96, + "step": 31550 + }, + { + "epoch": 0.81, + "learning_rate": 1.7138247170155795e-06, + "loss": 1.043, + "step": 31551 + }, + { + "epoch": 0.81, + "learning_rate": 1.713805338448127e-06, + "loss": 0.7788, + "step": 31552 + }, + { + "epoch": 0.81, + "learning_rate": 1.7137859593341465e-06, + "loss": 0.7385, + "step": 31553 + }, + { + "epoch": 0.81, + "learning_rate": 1.7137665796736527e-06, + "loss": 0.8936, + "step": 31554 + }, + { + "epoch": 0.81, + "learning_rate": 1.713747199466661e-06, + "loss": 0.7202, + "step": 31555 + }, + { + "epoch": 0.81, + "learning_rate": 1.7137278187131858e-06, + "loss": 0.7266, + "step": 31556 + }, + { + "epoch": 0.81, + "learning_rate": 1.713708437413242e-06, + "loss": 0.9395, + "step": 31557 + }, + { + "epoch": 0.81, + "learning_rate": 1.7136890555668444e-06, + "loss": 0.748, + "step": 31558 + }, + { + "epoch": 0.81, + "learning_rate": 1.713669673174008e-06, + "loss": 0.9648, + "step": 31559 + }, + { + "epoch": 0.81, + "learning_rate": 1.7136502902347477e-06, + "loss": 1.0635, + "step": 31560 + }, + { + "epoch": 0.81, + "learning_rate": 1.713630906749078e-06, + "loss": 0.7246, + "step": 31561 + }, + { + "epoch": 0.81, + "learning_rate": 1.7136115227170139e-06, + "loss": 0.9805, + "step": 31562 + }, + { + "epoch": 0.81, + "learning_rate": 1.7135921381385702e-06, + "loss": 0.9756, + "step": 31563 + }, + { + "epoch": 0.81, + "learning_rate": 1.7135727530137621e-06, + "loss": 0.9541, + "step": 31564 + }, + { + "epoch": 0.81, + "learning_rate": 1.713553367342604e-06, + "loss": 0.8057, + "step": 31565 + }, + { + "epoch": 0.81, + "learning_rate": 1.713533981125111e-06, + "loss": 0.666, + "step": 31566 + }, + { + "epoch": 0.81, + "learning_rate": 1.7135145943612974e-06, + "loss": 0.8662, + "step": 31567 + }, + { + "epoch": 0.81, + "learning_rate": 1.7134952070511789e-06, + "loss": 0.8604, + "step": 31568 + }, + { + "epoch": 0.81, + "learning_rate": 1.71347581919477e-06, + "loss": 0.875, + "step": 31569 + }, + { + "epoch": 0.81, + "learning_rate": 1.7134564307920854e-06, + "loss": 0.9893, + "step": 31570 + }, + { + "epoch": 0.81, + "learning_rate": 1.7134370418431395e-06, + "loss": 0.6816, + "step": 31571 + }, + { + "epoch": 0.81, + "learning_rate": 1.7134176523479483e-06, + "loss": 0.8257, + "step": 31572 + }, + { + "epoch": 0.81, + "learning_rate": 1.7133982623065258e-06, + "loss": 0.8652, + "step": 31573 + }, + { + "epoch": 0.81, + "learning_rate": 1.713378871718887e-06, + "loss": 0.8896, + "step": 31574 + }, + { + "epoch": 0.81, + "learning_rate": 1.7133594805850469e-06, + "loss": 0.5898, + "step": 31575 + }, + { + "epoch": 0.81, + "learning_rate": 1.7133400889050203e-06, + "loss": 0.9551, + "step": 31576 + }, + { + "epoch": 0.81, + "learning_rate": 1.7133206966788216e-06, + "loss": 0.6616, + "step": 31577 + }, + { + "epoch": 0.81, + "learning_rate": 1.7133013039064666e-06, + "loss": 0.7788, + "step": 31578 + }, + { + "epoch": 0.81, + "learning_rate": 1.7132819105879692e-06, + "loss": 0.917, + "step": 31579 + }, + { + "epoch": 0.81, + "learning_rate": 1.7132625167233447e-06, + "loss": 0.7202, + "step": 31580 + }, + { + "epoch": 0.81, + "learning_rate": 1.713243122312608e-06, + "loss": 0.877, + "step": 31581 + }, + { + "epoch": 0.81, + "learning_rate": 1.7132237273557737e-06, + "loss": 0.6106, + "step": 31582 + }, + { + "epoch": 0.81, + "learning_rate": 1.7132043318528568e-06, + "loss": 1.0264, + "step": 31583 + }, + { + "epoch": 0.81, + "learning_rate": 1.7131849358038724e-06, + "loss": 0.7744, + "step": 31584 + }, + { + "epoch": 0.81, + "learning_rate": 1.713165539208835e-06, + "loss": 0.8926, + "step": 31585 + }, + { + "epoch": 0.81, + "learning_rate": 1.7131461420677593e-06, + "loss": 0.9385, + "step": 31586 + }, + { + "epoch": 0.81, + "learning_rate": 1.7131267443806606e-06, + "loss": 0.8154, + "step": 31587 + }, + { + "epoch": 0.81, + "learning_rate": 1.713107346147553e-06, + "loss": 0.7803, + "step": 31588 + }, + { + "epoch": 0.81, + "learning_rate": 1.7130879473684527e-06, + "loss": 0.8662, + "step": 31589 + }, + { + "epoch": 0.81, + "learning_rate": 1.7130685480433736e-06, + "loss": 0.8252, + "step": 31590 + }, + { + "epoch": 0.81, + "learning_rate": 1.7130491481723303e-06, + "loss": 0.9609, + "step": 31591 + }, + { + "epoch": 0.81, + "learning_rate": 1.7130297477553382e-06, + "loss": 0.9189, + "step": 31592 + }, + { + "epoch": 0.81, + "learning_rate": 1.7130103467924122e-06, + "loss": 1.002, + "step": 31593 + }, + { + "epoch": 0.81, + "learning_rate": 1.7129909452835668e-06, + "loss": 0.8164, + "step": 31594 + }, + { + "epoch": 0.81, + "learning_rate": 1.712971543228817e-06, + "loss": 0.8394, + "step": 31595 + }, + { + "epoch": 0.81, + "learning_rate": 1.7129521406281778e-06, + "loss": 0.8735, + "step": 31596 + }, + { + "epoch": 0.81, + "learning_rate": 1.7129327374816636e-06, + "loss": 0.6709, + "step": 31597 + }, + { + "epoch": 0.81, + "learning_rate": 1.7129133337892898e-06, + "loss": 0.9795, + "step": 31598 + }, + { + "epoch": 0.81, + "learning_rate": 1.7128939295510714e-06, + "loss": 0.6934, + "step": 31599 + }, + { + "epoch": 0.81, + "learning_rate": 1.7128745247670225e-06, + "loss": 0.6772, + "step": 31600 + }, + { + "epoch": 0.81, + "learning_rate": 1.7128551194371582e-06, + "loss": 0.6548, + "step": 31601 + }, + { + "epoch": 0.81, + "learning_rate": 1.712835713561494e-06, + "loss": 1.0391, + "step": 31602 + }, + { + "epoch": 0.81, + "learning_rate": 1.7128163071400439e-06, + "loss": 0.73, + "step": 31603 + }, + { + "epoch": 0.81, + "learning_rate": 1.7127969001728232e-06, + "loss": 0.9814, + "step": 31604 + }, + { + "epoch": 0.81, + "learning_rate": 1.7127774926598465e-06, + "loss": 0.8389, + "step": 31605 + }, + { + "epoch": 0.81, + "learning_rate": 1.7127580846011295e-06, + "loss": 0.9756, + "step": 31606 + }, + { + "epoch": 0.81, + "learning_rate": 1.712738675996686e-06, + "loss": 0.8025, + "step": 31607 + }, + { + "epoch": 0.81, + "learning_rate": 1.7127192668465312e-06, + "loss": 0.9297, + "step": 31608 + }, + { + "epoch": 0.81, + "learning_rate": 1.71269985715068e-06, + "loss": 0.9409, + "step": 31609 + }, + { + "epoch": 0.81, + "learning_rate": 1.7126804469091473e-06, + "loss": 0.7236, + "step": 31610 + }, + { + "epoch": 0.81, + "learning_rate": 1.7126610361219482e-06, + "loss": 0.7905, + "step": 31611 + }, + { + "epoch": 0.81, + "learning_rate": 1.7126416247890969e-06, + "loss": 0.8906, + "step": 31612 + }, + { + "epoch": 0.81, + "learning_rate": 1.7126222129106091e-06, + "loss": 0.6943, + "step": 31613 + }, + { + "epoch": 0.81, + "learning_rate": 1.712602800486499e-06, + "loss": 0.8184, + "step": 31614 + }, + { + "epoch": 0.81, + "learning_rate": 1.7125833875167817e-06, + "loss": 0.665, + "step": 31615 + }, + { + "epoch": 0.81, + "learning_rate": 1.712563974001472e-06, + "loss": 1.0322, + "step": 31616 + }, + { + "epoch": 0.81, + "learning_rate": 1.7125445599405853e-06, + "loss": 0.7979, + "step": 31617 + }, + { + "epoch": 0.81, + "learning_rate": 1.7125251453341356e-06, + "loss": 0.957, + "step": 31618 + }, + { + "epoch": 0.81, + "learning_rate": 1.7125057301821379e-06, + "loss": 0.5947, + "step": 31619 + }, + { + "epoch": 0.81, + "learning_rate": 1.7124863144846077e-06, + "loss": 0.5942, + "step": 31620 + }, + { + "epoch": 0.81, + "learning_rate": 1.7124668982415595e-06, + "loss": 0.8525, + "step": 31621 + }, + { + "epoch": 0.81, + "learning_rate": 1.7124474814530081e-06, + "loss": 0.804, + "step": 31622 + }, + { + "epoch": 0.81, + "learning_rate": 1.7124280641189684e-06, + "loss": 0.793, + "step": 31623 + }, + { + "epoch": 0.81, + "learning_rate": 1.712408646239455e-06, + "loss": 0.7119, + "step": 31624 + }, + { + "epoch": 0.81, + "learning_rate": 1.7123892278144835e-06, + "loss": 0.9463, + "step": 31625 + }, + { + "epoch": 0.81, + "learning_rate": 1.7123698088440684e-06, + "loss": 0.9053, + "step": 31626 + }, + { + "epoch": 0.81, + "learning_rate": 1.712350389328224e-06, + "loss": 0.8975, + "step": 31627 + }, + { + "epoch": 0.81, + "learning_rate": 1.7123309692669658e-06, + "loss": 0.7656, + "step": 31628 + }, + { + "epoch": 0.81, + "learning_rate": 1.7123115486603088e-06, + "loss": 0.9834, + "step": 31629 + }, + { + "epoch": 0.81, + "learning_rate": 1.7122921275082677e-06, + "loss": 0.9111, + "step": 31630 + }, + { + "epoch": 0.81, + "learning_rate": 1.712272705810857e-06, + "loss": 0.7271, + "step": 31631 + }, + { + "epoch": 0.81, + "learning_rate": 1.7122532835680916e-06, + "loss": 1.124, + "step": 31632 + }, + { + "epoch": 0.81, + "learning_rate": 1.712233860779987e-06, + "loss": 1.2744, + "step": 31633 + }, + { + "epoch": 0.81, + "learning_rate": 1.7122144374465575e-06, + "loss": 0.854, + "step": 31634 + }, + { + "epoch": 0.81, + "learning_rate": 1.7121950135678182e-06, + "loss": 0.8848, + "step": 31635 + }, + { + "epoch": 0.81, + "learning_rate": 1.7121755891437842e-06, + "loss": 0.9111, + "step": 31636 + }, + { + "epoch": 0.81, + "learning_rate": 1.7121561641744696e-06, + "loss": 0.7334, + "step": 31637 + }, + { + "epoch": 0.81, + "learning_rate": 1.71213673865989e-06, + "loss": 0.8086, + "step": 31638 + }, + { + "epoch": 0.81, + "learning_rate": 1.7121173126000602e-06, + "loss": 0.999, + "step": 31639 + }, + { + "epoch": 0.81, + "learning_rate": 1.7120978859949945e-06, + "loss": 1.042, + "step": 31640 + }, + { + "epoch": 0.81, + "learning_rate": 1.7120784588447086e-06, + "loss": 0.5464, + "step": 31641 + }, + { + "epoch": 0.81, + "learning_rate": 1.712059031149217e-06, + "loss": 0.8887, + "step": 31642 + }, + { + "epoch": 0.81, + "learning_rate": 1.712039602908534e-06, + "loss": 0.9321, + "step": 31643 + }, + { + "epoch": 0.81, + "learning_rate": 1.7120201741226756e-06, + "loss": 0.8315, + "step": 31644 + }, + { + "epoch": 0.81, + "learning_rate": 1.7120007447916559e-06, + "loss": 1.0566, + "step": 31645 + }, + { + "epoch": 0.81, + "learning_rate": 1.7119813149154898e-06, + "loss": 0.9346, + "step": 31646 + }, + { + "epoch": 0.81, + "learning_rate": 1.7119618844941926e-06, + "loss": 0.7676, + "step": 31647 + }, + { + "epoch": 0.81, + "learning_rate": 1.7119424535277788e-06, + "loss": 0.8623, + "step": 31648 + }, + { + "epoch": 0.81, + "learning_rate": 1.7119230220162634e-06, + "loss": 0.6523, + "step": 31649 + }, + { + "epoch": 0.81, + "learning_rate": 1.7119035899596615e-06, + "loss": 0.5405, + "step": 31650 + }, + { + "epoch": 0.81, + "learning_rate": 1.7118841573579873e-06, + "loss": 0.9131, + "step": 31651 + }, + { + "epoch": 0.81, + "learning_rate": 1.7118647242112566e-06, + "loss": 0.7017, + "step": 31652 + }, + { + "epoch": 0.81, + "learning_rate": 1.7118452905194834e-06, + "loss": 0.815, + "step": 31653 + }, + { + "epoch": 0.81, + "learning_rate": 1.7118258562826833e-06, + "loss": 0.8887, + "step": 31654 + }, + { + "epoch": 0.81, + "learning_rate": 1.7118064215008707e-06, + "loss": 0.9854, + "step": 31655 + }, + { + "epoch": 0.81, + "learning_rate": 1.7117869861740605e-06, + "loss": 0.5005, + "step": 31656 + }, + { + "epoch": 0.81, + "learning_rate": 1.7117675503022682e-06, + "loss": 0.8979, + "step": 31657 + }, + { + "epoch": 0.81, + "learning_rate": 1.711748113885508e-06, + "loss": 0.7466, + "step": 31658 + }, + { + "epoch": 0.81, + "learning_rate": 1.7117286769237948e-06, + "loss": 1.1523, + "step": 31659 + }, + { + "epoch": 0.81, + "learning_rate": 1.7117092394171438e-06, + "loss": 0.8848, + "step": 31660 + }, + { + "epoch": 0.81, + "learning_rate": 1.71168980136557e-06, + "loss": 0.875, + "step": 31661 + }, + { + "epoch": 0.81, + "learning_rate": 1.7116703627690878e-06, + "loss": 0.4827, + "step": 31662 + }, + { + "epoch": 0.81, + "learning_rate": 1.7116509236277122e-06, + "loss": 0.6553, + "step": 31663 + }, + { + "epoch": 0.81, + "learning_rate": 1.7116314839414585e-06, + "loss": 0.8198, + "step": 31664 + }, + { + "epoch": 0.81, + "learning_rate": 1.7116120437103411e-06, + "loss": 0.7329, + "step": 31665 + }, + { + "epoch": 0.81, + "learning_rate": 1.7115926029343753e-06, + "loss": 0.8428, + "step": 31666 + }, + { + "epoch": 0.81, + "learning_rate": 1.7115731616135754e-06, + "loss": 0.9219, + "step": 31667 + }, + { + "epoch": 0.81, + "learning_rate": 1.7115537197479568e-06, + "loss": 0.9346, + "step": 31668 + }, + { + "epoch": 0.81, + "learning_rate": 1.7115342773375346e-06, + "loss": 0.9229, + "step": 31669 + }, + { + "epoch": 0.81, + "learning_rate": 1.711514834382323e-06, + "loss": 0.8242, + "step": 31670 + }, + { + "epoch": 0.81, + "learning_rate": 1.7114953908823371e-06, + "loss": 0.8301, + "step": 31671 + }, + { + "epoch": 0.81, + "learning_rate": 1.711475946837592e-06, + "loss": 0.9365, + "step": 31672 + }, + { + "epoch": 0.81, + "learning_rate": 1.7114565022481023e-06, + "loss": 0.79, + "step": 31673 + }, + { + "epoch": 0.81, + "learning_rate": 1.7114370571138835e-06, + "loss": 0.6304, + "step": 31674 + }, + { + "epoch": 0.81, + "learning_rate": 1.7114176114349496e-06, + "loss": 0.9043, + "step": 31675 + }, + { + "epoch": 0.81, + "learning_rate": 1.7113981652113163e-06, + "loss": 0.9678, + "step": 31676 + }, + { + "epoch": 0.81, + "learning_rate": 1.711378718442998e-06, + "loss": 0.9453, + "step": 31677 + }, + { + "epoch": 0.81, + "learning_rate": 1.7113592711300098e-06, + "loss": 1.0166, + "step": 31678 + }, + { + "epoch": 0.81, + "learning_rate": 1.7113398232723664e-06, + "loss": 1.0088, + "step": 31679 + }, + { + "epoch": 0.81, + "learning_rate": 1.7113203748700829e-06, + "loss": 0.5432, + "step": 31680 + }, + { + "epoch": 0.81, + "learning_rate": 1.7113009259231741e-06, + "loss": 0.7109, + "step": 31681 + }, + { + "epoch": 0.81, + "learning_rate": 1.7112814764316547e-06, + "loss": 0.7793, + "step": 31682 + }, + { + "epoch": 0.81, + "learning_rate": 1.71126202639554e-06, + "loss": 0.9785, + "step": 31683 + }, + { + "epoch": 0.81, + "learning_rate": 1.7112425758148446e-06, + "loss": 0.7539, + "step": 31684 + }, + { + "epoch": 0.81, + "learning_rate": 1.7112231246895833e-06, + "loss": 0.9238, + "step": 31685 + }, + { + "epoch": 0.81, + "learning_rate": 1.7112036730197713e-06, + "loss": 0.9775, + "step": 31686 + }, + { + "epoch": 0.81, + "learning_rate": 1.7111842208054235e-06, + "loss": 0.918, + "step": 31687 + }, + { + "epoch": 0.81, + "learning_rate": 1.7111647680465543e-06, + "loss": 0.8564, + "step": 31688 + }, + { + "epoch": 0.81, + "learning_rate": 1.7111453147431792e-06, + "loss": 0.8496, + "step": 31689 + }, + { + "epoch": 0.81, + "learning_rate": 1.7111258608953128e-06, + "loss": 1.0068, + "step": 31690 + }, + { + "epoch": 0.81, + "learning_rate": 1.7111064065029698e-06, + "loss": 0.9365, + "step": 31691 + }, + { + "epoch": 0.81, + "learning_rate": 1.7110869515661657e-06, + "loss": 0.8584, + "step": 31692 + }, + { + "epoch": 0.81, + "learning_rate": 1.711067496084915e-06, + "loss": 0.876, + "step": 31693 + }, + { + "epoch": 0.81, + "learning_rate": 1.7110480400592322e-06, + "loss": 0.8271, + "step": 31694 + }, + { + "epoch": 0.81, + "learning_rate": 1.7110285834891332e-06, + "loss": 0.6111, + "step": 31695 + }, + { + "epoch": 0.81, + "learning_rate": 1.7110091263746317e-06, + "loss": 1.0117, + "step": 31696 + }, + { + "epoch": 0.81, + "learning_rate": 1.7109896687157437e-06, + "loss": 0.7432, + "step": 31697 + }, + { + "epoch": 0.81, + "learning_rate": 1.7109702105124833e-06, + "loss": 0.8574, + "step": 31698 + }, + { + "epoch": 0.81, + "learning_rate": 1.7109507517648659e-06, + "loss": 0.4272, + "step": 31699 + }, + { + "epoch": 0.81, + "learning_rate": 1.7109312924729057e-06, + "loss": 0.7622, + "step": 31700 + }, + { + "epoch": 0.81, + "learning_rate": 1.7109118326366187e-06, + "loss": 0.9658, + "step": 31701 + }, + { + "epoch": 0.81, + "learning_rate": 1.710892372256019e-06, + "loss": 1.0967, + "step": 31702 + }, + { + "epoch": 0.81, + "learning_rate": 1.7108729113311218e-06, + "loss": 0.6372, + "step": 31703 + }, + { + "epoch": 0.81, + "learning_rate": 1.7108534498619416e-06, + "loss": 0.707, + "step": 31704 + }, + { + "epoch": 0.81, + "learning_rate": 1.7108339878484936e-06, + "loss": 0.998, + "step": 31705 + }, + { + "epoch": 0.81, + "learning_rate": 1.710814525290793e-06, + "loss": 0.7935, + "step": 31706 + }, + { + "epoch": 0.81, + "learning_rate": 1.7107950621888543e-06, + "loss": 0.8154, + "step": 31707 + }, + { + "epoch": 0.81, + "learning_rate": 1.7107755985426925e-06, + "loss": 0.791, + "step": 31708 + }, + { + "epoch": 0.81, + "learning_rate": 1.7107561343523224e-06, + "loss": 0.9219, + "step": 31709 + }, + { + "epoch": 0.81, + "learning_rate": 1.7107366696177593e-06, + "loss": 1.0156, + "step": 31710 + }, + { + "epoch": 0.81, + "learning_rate": 1.7107172043390175e-06, + "loss": 1.1221, + "step": 31711 + }, + { + "epoch": 0.81, + "learning_rate": 1.7106977385161122e-06, + "loss": 0.875, + "step": 31712 + }, + { + "epoch": 0.81, + "learning_rate": 1.7106782721490585e-06, + "loss": 0.8882, + "step": 31713 + }, + { + "epoch": 0.81, + "learning_rate": 1.710658805237871e-06, + "loss": 0.6064, + "step": 31714 + }, + { + "epoch": 0.81, + "learning_rate": 1.710639337782565e-06, + "loss": 0.707, + "step": 31715 + }, + { + "epoch": 0.81, + "learning_rate": 1.710619869783155e-06, + "loss": 0.7026, + "step": 31716 + }, + { + "epoch": 0.81, + "learning_rate": 1.7106004012396557e-06, + "loss": 1.0264, + "step": 31717 + }, + { + "epoch": 0.81, + "learning_rate": 1.7105809321520827e-06, + "loss": 0.6914, + "step": 31718 + }, + { + "epoch": 0.81, + "learning_rate": 1.7105614625204504e-06, + "loss": 0.9033, + "step": 31719 + }, + { + "epoch": 0.81, + "learning_rate": 1.710541992344774e-06, + "loss": 0.7705, + "step": 31720 + }, + { + "epoch": 0.81, + "learning_rate": 1.7105225216250682e-06, + "loss": 0.605, + "step": 31721 + }, + { + "epoch": 0.81, + "learning_rate": 1.710503050361348e-06, + "loss": 0.7803, + "step": 31722 + }, + { + "epoch": 0.81, + "learning_rate": 1.7104835785536285e-06, + "loss": 0.8516, + "step": 31723 + }, + { + "epoch": 0.81, + "learning_rate": 1.710464106201924e-06, + "loss": 0.6602, + "step": 31724 + }, + { + "epoch": 0.81, + "learning_rate": 1.7104446333062498e-06, + "loss": 1.082, + "step": 31725 + }, + { + "epoch": 0.81, + "learning_rate": 1.710425159866621e-06, + "loss": 0.8154, + "step": 31726 + }, + { + "epoch": 0.81, + "learning_rate": 1.7104056858830523e-06, + "loss": 0.7158, + "step": 31727 + }, + { + "epoch": 0.81, + "learning_rate": 1.7103862113555584e-06, + "loss": 0.8613, + "step": 31728 + }, + { + "epoch": 0.81, + "learning_rate": 1.710366736284155e-06, + "loss": 1.0176, + "step": 31729 + }, + { + "epoch": 0.81, + "learning_rate": 1.710347260668856e-06, + "loss": 0.8447, + "step": 31730 + }, + { + "epoch": 0.81, + "learning_rate": 1.710327784509677e-06, + "loss": 0.8076, + "step": 31731 + }, + { + "epoch": 0.81, + "learning_rate": 1.7103083078066326e-06, + "loss": 0.7773, + "step": 31732 + }, + { + "epoch": 0.81, + "learning_rate": 1.7102888305597377e-06, + "loss": 0.9443, + "step": 31733 + }, + { + "epoch": 0.81, + "learning_rate": 1.7102693527690074e-06, + "loss": 1.0068, + "step": 31734 + }, + { + "epoch": 0.81, + "learning_rate": 1.7102498744344564e-06, + "loss": 0.7344, + "step": 31735 + }, + { + "epoch": 0.81, + "learning_rate": 1.7102303955560998e-06, + "loss": 0.8555, + "step": 31736 + }, + { + "epoch": 0.81, + "learning_rate": 1.7102109161339525e-06, + "loss": 0.8672, + "step": 31737 + }, + { + "epoch": 0.81, + "learning_rate": 1.7101914361680291e-06, + "loss": 0.6929, + "step": 31738 + }, + { + "epoch": 0.81, + "learning_rate": 1.710171955658345e-06, + "loss": 0.9395, + "step": 31739 + }, + { + "epoch": 0.81, + "learning_rate": 1.7101524746049146e-06, + "loss": 0.769, + "step": 31740 + }, + { + "epoch": 0.81, + "learning_rate": 1.7101329930077536e-06, + "loss": 0.6631, + "step": 31741 + }, + { + "epoch": 0.81, + "learning_rate": 1.7101135108668762e-06, + "loss": 0.7695, + "step": 31742 + }, + { + "epoch": 0.81, + "learning_rate": 1.7100940281822975e-06, + "loss": 0.8462, + "step": 31743 + }, + { + "epoch": 0.81, + "learning_rate": 1.7100745449540326e-06, + "loss": 0.7246, + "step": 31744 + }, + { + "epoch": 0.81, + "learning_rate": 1.710055061182096e-06, + "loss": 0.8887, + "step": 31745 + }, + { + "epoch": 0.81, + "learning_rate": 1.710035576866503e-06, + "loss": 0.8125, + "step": 31746 + }, + { + "epoch": 0.81, + "learning_rate": 1.7100160920072687e-06, + "loss": 0.7285, + "step": 31747 + }, + { + "epoch": 0.81, + "learning_rate": 1.7099966066044075e-06, + "loss": 0.7334, + "step": 31748 + }, + { + "epoch": 0.81, + "learning_rate": 1.7099771206579345e-06, + "loss": 0.873, + "step": 31749 + }, + { + "epoch": 0.81, + "learning_rate": 1.7099576341678646e-06, + "loss": 0.9033, + "step": 31750 + }, + { + "epoch": 0.81, + "learning_rate": 1.709938147134213e-06, + "loss": 0.8818, + "step": 31751 + }, + { + "epoch": 0.81, + "learning_rate": 1.7099186595569938e-06, + "loss": 0.6418, + "step": 31752 + }, + { + "epoch": 0.81, + "learning_rate": 1.7098991714362232e-06, + "loss": 1.0029, + "step": 31753 + }, + { + "epoch": 0.81, + "learning_rate": 1.7098796827719152e-06, + "loss": 0.647, + "step": 31754 + }, + { + "epoch": 0.81, + "learning_rate": 1.709860193564085e-06, + "loss": 0.8394, + "step": 31755 + }, + { + "epoch": 0.81, + "learning_rate": 1.7098407038127477e-06, + "loss": 0.6973, + "step": 31756 + }, + { + "epoch": 0.81, + "learning_rate": 1.7098212135179178e-06, + "loss": 0.6797, + "step": 31757 + }, + { + "epoch": 0.81, + "learning_rate": 1.7098017226796103e-06, + "loss": 0.7441, + "step": 31758 + }, + { + "epoch": 0.81, + "learning_rate": 1.7097822312978404e-06, + "loss": 0.8467, + "step": 31759 + }, + { + "epoch": 0.81, + "learning_rate": 1.7097627393726229e-06, + "loss": 0.8086, + "step": 31760 + }, + { + "epoch": 0.81, + "learning_rate": 1.7097432469039727e-06, + "loss": 0.8438, + "step": 31761 + }, + { + "epoch": 0.81, + "learning_rate": 1.7097237538919047e-06, + "loss": 0.6538, + "step": 31762 + }, + { + "epoch": 0.81, + "learning_rate": 1.709704260336434e-06, + "loss": 0.9258, + "step": 31763 + }, + { + "epoch": 0.81, + "learning_rate": 1.7096847662375753e-06, + "loss": 0.9365, + "step": 31764 + }, + { + "epoch": 0.81, + "learning_rate": 1.7096652715953433e-06, + "loss": 1.0283, + "step": 31765 + }, + { + "epoch": 0.81, + "learning_rate": 1.7096457764097536e-06, + "loss": 0.8613, + "step": 31766 + }, + { + "epoch": 0.81, + "learning_rate": 1.7096262806808207e-06, + "loss": 0.8589, + "step": 31767 + }, + { + "epoch": 0.81, + "learning_rate": 1.7096067844085595e-06, + "loss": 0.9688, + "step": 31768 + }, + { + "epoch": 0.81, + "learning_rate": 1.7095872875929852e-06, + "loss": 0.8066, + "step": 31769 + }, + { + "epoch": 0.81, + "learning_rate": 1.709567790234112e-06, + "loss": 0.7622, + "step": 31770 + }, + { + "epoch": 0.81, + "learning_rate": 1.7095482923319562e-06, + "loss": 0.7832, + "step": 31771 + }, + { + "epoch": 0.81, + "learning_rate": 1.7095287938865312e-06, + "loss": 0.8369, + "step": 31772 + }, + { + "epoch": 0.81, + "learning_rate": 1.709509294897853e-06, + "loss": 0.9766, + "step": 31773 + }, + { + "epoch": 0.81, + "learning_rate": 1.709489795365936e-06, + "loss": 0.9248, + "step": 31774 + }, + { + "epoch": 0.81, + "learning_rate": 1.7094702952907953e-06, + "loss": 1.0195, + "step": 31775 + }, + { + "epoch": 0.81, + "learning_rate": 1.7094507946724458e-06, + "loss": 0.8271, + "step": 31776 + }, + { + "epoch": 0.81, + "learning_rate": 1.7094312935109025e-06, + "loss": 0.8057, + "step": 31777 + }, + { + "epoch": 0.81, + "learning_rate": 1.7094117918061803e-06, + "loss": 0.8154, + "step": 31778 + }, + { + "epoch": 0.81, + "learning_rate": 1.7093922895582942e-06, + "loss": 0.8447, + "step": 31779 + }, + { + "epoch": 0.81, + "learning_rate": 1.709372786767259e-06, + "loss": 0.7207, + "step": 31780 + }, + { + "epoch": 0.81, + "learning_rate": 1.7093532834330896e-06, + "loss": 0.7373, + "step": 31781 + }, + { + "epoch": 0.81, + "learning_rate": 1.709333779555801e-06, + "loss": 0.7747, + "step": 31782 + }, + { + "epoch": 0.81, + "learning_rate": 1.709314275135408e-06, + "loss": 0.8599, + "step": 31783 + }, + { + "epoch": 0.81, + "learning_rate": 1.709294770171926e-06, + "loss": 0.958, + "step": 31784 + }, + { + "epoch": 0.81, + "learning_rate": 1.7092752646653695e-06, + "loss": 0.7944, + "step": 31785 + }, + { + "epoch": 0.81, + "learning_rate": 1.7092557586157535e-06, + "loss": 0.8145, + "step": 31786 + }, + { + "epoch": 0.81, + "learning_rate": 1.7092362520230927e-06, + "loss": 0.7646, + "step": 31787 + }, + { + "epoch": 0.81, + "learning_rate": 1.7092167448874028e-06, + "loss": 0.6885, + "step": 31788 + }, + { + "epoch": 0.81, + "learning_rate": 1.709197237208698e-06, + "loss": 0.8525, + "step": 31789 + }, + { + "epoch": 0.81, + "learning_rate": 1.7091777289869933e-06, + "loss": 0.7922, + "step": 31790 + }, + { + "epoch": 0.81, + "learning_rate": 1.7091582202223044e-06, + "loss": 0.8105, + "step": 31791 + }, + { + "epoch": 0.81, + "learning_rate": 1.7091387109146451e-06, + "loss": 0.7158, + "step": 31792 + }, + { + "epoch": 0.81, + "learning_rate": 1.709119201064031e-06, + "loss": 0.916, + "step": 31793 + }, + { + "epoch": 0.81, + "learning_rate": 1.7090996906704768e-06, + "loss": 0.7483, + "step": 31794 + }, + { + "epoch": 0.81, + "learning_rate": 1.709080179733998e-06, + "loss": 0.9883, + "step": 31795 + }, + { + "epoch": 0.81, + "learning_rate": 1.709060668254609e-06, + "loss": 0.9824, + "step": 31796 + }, + { + "epoch": 0.81, + "learning_rate": 1.7090411562323247e-06, + "loss": 0.9082, + "step": 31797 + }, + { + "epoch": 0.81, + "learning_rate": 1.7090216436671603e-06, + "loss": 0.7998, + "step": 31798 + }, + { + "epoch": 0.82, + "learning_rate": 1.7090021305591304e-06, + "loss": 0.9033, + "step": 31799 + }, + { + "epoch": 0.82, + "learning_rate": 1.7089826169082505e-06, + "loss": 0.8164, + "step": 31800 + }, + { + "epoch": 0.82, + "learning_rate": 1.7089631027145348e-06, + "loss": 0.8779, + "step": 31801 + }, + { + "epoch": 0.82, + "learning_rate": 1.708943587977999e-06, + "loss": 0.875, + "step": 31802 + }, + { + "epoch": 0.82, + "learning_rate": 1.7089240726986577e-06, + "loss": 1.1104, + "step": 31803 + }, + { + "epoch": 0.82, + "learning_rate": 1.7089045568765256e-06, + "loss": 0.7979, + "step": 31804 + }, + { + "epoch": 0.82, + "learning_rate": 1.708885040511618e-06, + "loss": 0.8838, + "step": 31805 + }, + { + "epoch": 0.82, + "learning_rate": 1.7088655236039498e-06, + "loss": 0.8828, + "step": 31806 + }, + { + "epoch": 0.82, + "learning_rate": 1.7088460061535356e-06, + "loss": 0.8467, + "step": 31807 + }, + { + "epoch": 0.82, + "learning_rate": 1.7088264881603908e-06, + "loss": 0.9307, + "step": 31808 + }, + { + "epoch": 0.82, + "learning_rate": 1.7088069696245303e-06, + "loss": 0.8203, + "step": 31809 + }, + { + "epoch": 0.82, + "learning_rate": 1.7087874505459687e-06, + "loss": 0.832, + "step": 31810 + }, + { + "epoch": 0.82, + "learning_rate": 1.708767930924721e-06, + "loss": 0.6553, + "step": 31811 + }, + { + "epoch": 0.82, + "learning_rate": 1.7087484107608028e-06, + "loss": 0.8926, + "step": 31812 + }, + { + "epoch": 0.82, + "learning_rate": 1.7087288900542283e-06, + "loss": 0.9512, + "step": 31813 + }, + { + "epoch": 0.82, + "learning_rate": 1.7087093688050124e-06, + "loss": 0.9033, + "step": 31814 + }, + { + "epoch": 0.82, + "learning_rate": 1.7086898470131705e-06, + "loss": 0.8896, + "step": 31815 + }, + { + "epoch": 0.82, + "learning_rate": 1.7086703246787173e-06, + "loss": 0.8843, + "step": 31816 + }, + { + "epoch": 0.82, + "learning_rate": 1.7086508018016682e-06, + "loss": 0.8408, + "step": 31817 + }, + { + "epoch": 0.82, + "learning_rate": 1.7086312783820373e-06, + "loss": 0.6875, + "step": 31818 + }, + { + "epoch": 0.82, + "learning_rate": 1.7086117544198403e-06, + "loss": 0.6951, + "step": 31819 + }, + { + "epoch": 0.82, + "learning_rate": 1.7085922299150917e-06, + "loss": 0.7422, + "step": 31820 + }, + { + "epoch": 0.82, + "learning_rate": 1.7085727048678066e-06, + "loss": 0.8838, + "step": 31821 + }, + { + "epoch": 0.82, + "learning_rate": 1.7085531792779997e-06, + "loss": 0.8037, + "step": 31822 + }, + { + "epoch": 0.82, + "learning_rate": 1.7085336531456867e-06, + "loss": 0.79, + "step": 31823 + }, + { + "epoch": 0.82, + "learning_rate": 1.7085141264708817e-06, + "loss": 0.751, + "step": 31824 + }, + { + "epoch": 0.82, + "learning_rate": 1.7084945992536004e-06, + "loss": 0.8711, + "step": 31825 + }, + { + "epoch": 0.82, + "learning_rate": 1.708475071493857e-06, + "loss": 0.7178, + "step": 31826 + }, + { + "epoch": 0.82, + "learning_rate": 1.708455543191667e-06, + "loss": 0.8516, + "step": 31827 + }, + { + "epoch": 0.82, + "learning_rate": 1.708436014347045e-06, + "loss": 1.0156, + "step": 31828 + }, + { + "epoch": 0.82, + "learning_rate": 1.7084164849600065e-06, + "loss": 0.9229, + "step": 31829 + }, + { + "epoch": 0.82, + "learning_rate": 1.7083969550305657e-06, + "loss": 0.6924, + "step": 31830 + }, + { + "epoch": 0.82, + "learning_rate": 1.7083774245587382e-06, + "loss": 0.8613, + "step": 31831 + }, + { + "epoch": 0.82, + "learning_rate": 1.7083578935445385e-06, + "loss": 0.9736, + "step": 31832 + }, + { + "epoch": 0.82, + "learning_rate": 1.7083383619879817e-06, + "loss": 0.6699, + "step": 31833 + }, + { + "epoch": 0.82, + "learning_rate": 1.7083188298890829e-06, + "loss": 0.9639, + "step": 31834 + }, + { + "epoch": 0.82, + "learning_rate": 1.7082992972478568e-06, + "loss": 0.5278, + "step": 31835 + }, + { + "epoch": 0.82, + "learning_rate": 1.7082797640643185e-06, + "loss": 0.9189, + "step": 31836 + }, + { + "epoch": 0.82, + "learning_rate": 1.708260230338483e-06, + "loss": 0.7744, + "step": 31837 + }, + { + "epoch": 0.82, + "learning_rate": 1.7082406960703652e-06, + "loss": 0.7646, + "step": 31838 + }, + { + "epoch": 0.82, + "learning_rate": 1.7082211612599805e-06, + "loss": 0.7246, + "step": 31839 + }, + { + "epoch": 0.82, + "learning_rate": 1.7082016259073426e-06, + "loss": 0.7881, + "step": 31840 + }, + { + "epoch": 0.82, + "learning_rate": 1.708182090012468e-06, + "loss": 0.7441, + "step": 31841 + }, + { + "epoch": 0.82, + "learning_rate": 1.7081625535753704e-06, + "loss": 0.7156, + "step": 31842 + }, + { + "epoch": 0.82, + "learning_rate": 1.7081430165960655e-06, + "loss": 1.0742, + "step": 31843 + }, + { + "epoch": 0.82, + "learning_rate": 1.708123479074568e-06, + "loss": 1.0654, + "step": 31844 + }, + { + "epoch": 0.82, + "learning_rate": 1.708103941010893e-06, + "loss": 0.7002, + "step": 31845 + }, + { + "epoch": 0.82, + "learning_rate": 1.7080844024050556e-06, + "loss": 0.5337, + "step": 31846 + }, + { + "epoch": 0.82, + "learning_rate": 1.7080648632570702e-06, + "loss": 0.7986, + "step": 31847 + }, + { + "epoch": 0.82, + "learning_rate": 1.7080453235669524e-06, + "loss": 0.6611, + "step": 31848 + }, + { + "epoch": 0.82, + "learning_rate": 1.7080257833347165e-06, + "loss": 1.0635, + "step": 31849 + }, + { + "epoch": 0.82, + "learning_rate": 1.7080062425603781e-06, + "loss": 0.8574, + "step": 31850 + }, + { + "epoch": 0.82, + "learning_rate": 1.7079867012439518e-06, + "loss": 0.877, + "step": 31851 + }, + { + "epoch": 0.82, + "learning_rate": 1.7079671593854523e-06, + "loss": 0.9199, + "step": 31852 + }, + { + "epoch": 0.82, + "learning_rate": 1.7079476169848955e-06, + "loss": 1.0596, + "step": 31853 + }, + { + "epoch": 0.82, + "learning_rate": 1.7079280740422953e-06, + "loss": 0.9561, + "step": 31854 + }, + { + "epoch": 0.82, + "learning_rate": 1.7079085305576672e-06, + "loss": 0.9824, + "step": 31855 + }, + { + "epoch": 0.82, + "learning_rate": 1.7078889865310262e-06, + "loss": 0.6748, + "step": 31856 + }, + { + "epoch": 0.82, + "learning_rate": 1.7078694419623872e-06, + "loss": 0.7803, + "step": 31857 + }, + { + "epoch": 0.82, + "learning_rate": 1.7078498968517648e-06, + "loss": 0.8804, + "step": 31858 + }, + { + "epoch": 0.82, + "learning_rate": 1.7078303511991746e-06, + "loss": 1.0449, + "step": 31859 + }, + { + "epoch": 0.82, + "learning_rate": 1.707810805004631e-06, + "loss": 0.3906, + "step": 31860 + }, + { + "epoch": 0.82, + "learning_rate": 1.7077912582681495e-06, + "loss": 0.8066, + "step": 31861 + }, + { + "epoch": 0.82, + "learning_rate": 1.7077717109897445e-06, + "loss": 0.8311, + "step": 31862 + }, + { + "epoch": 0.82, + "learning_rate": 1.7077521631694314e-06, + "loss": 0.9639, + "step": 31863 + }, + { + "epoch": 0.82, + "learning_rate": 1.707732614807225e-06, + "loss": 1.001, + "step": 31864 + }, + { + "epoch": 0.82, + "learning_rate": 1.7077130659031402e-06, + "loss": 0.8379, + "step": 31865 + }, + { + "epoch": 0.82, + "learning_rate": 1.7076935164571921e-06, + "loss": 0.9541, + "step": 31866 + }, + { + "epoch": 0.82, + "learning_rate": 1.7076739664693958e-06, + "loss": 0.9453, + "step": 31867 + }, + { + "epoch": 0.82, + "learning_rate": 1.7076544159397658e-06, + "loss": 0.8975, + "step": 31868 + }, + { + "epoch": 0.82, + "learning_rate": 1.7076348648683174e-06, + "loss": 0.7393, + "step": 31869 + }, + { + "epoch": 0.82, + "learning_rate": 1.707615313255066e-06, + "loss": 1.041, + "step": 31870 + }, + { + "epoch": 0.82, + "learning_rate": 1.7075957611000256e-06, + "loss": 0.8027, + "step": 31871 + }, + { + "epoch": 0.82, + "learning_rate": 1.7075762084032115e-06, + "loss": 0.9009, + "step": 31872 + }, + { + "epoch": 0.82, + "learning_rate": 1.7075566551646392e-06, + "loss": 0.8486, + "step": 31873 + }, + { + "epoch": 0.82, + "learning_rate": 1.7075371013843232e-06, + "loss": 0.8457, + "step": 31874 + }, + { + "epoch": 0.82, + "learning_rate": 1.7075175470622787e-06, + "loss": 0.813, + "step": 31875 + }, + { + "epoch": 0.82, + "learning_rate": 1.7074979921985203e-06, + "loss": 1.0288, + "step": 31876 + }, + { + "epoch": 0.82, + "learning_rate": 1.7074784367930633e-06, + "loss": 0.7559, + "step": 31877 + }, + { + "epoch": 0.82, + "learning_rate": 1.7074588808459228e-06, + "loss": 0.8662, + "step": 31878 + }, + { + "epoch": 0.82, + "learning_rate": 1.707439324357113e-06, + "loss": 0.7549, + "step": 31879 + }, + { + "epoch": 0.82, + "learning_rate": 1.70741976732665e-06, + "loss": 0.6968, + "step": 31880 + }, + { + "epoch": 0.82, + "learning_rate": 1.7074002097545481e-06, + "loss": 0.9131, + "step": 31881 + }, + { + "epoch": 0.82, + "learning_rate": 1.7073806516408223e-06, + "loss": 0.9131, + "step": 31882 + }, + { + "epoch": 0.82, + "learning_rate": 1.7073610929854877e-06, + "loss": 0.7212, + "step": 31883 + }, + { + "epoch": 0.82, + "learning_rate": 1.707341533788559e-06, + "loss": 1.084, + "step": 31884 + }, + { + "epoch": 0.82, + "learning_rate": 1.7073219740500518e-06, + "loss": 1.0547, + "step": 31885 + }, + { + "epoch": 0.82, + "learning_rate": 1.7073024137699804e-06, + "loss": 0.8545, + "step": 31886 + }, + { + "epoch": 0.82, + "learning_rate": 1.70728285294836e-06, + "loss": 0.8828, + "step": 31887 + }, + { + "epoch": 0.82, + "learning_rate": 1.707263291585206e-06, + "loss": 0.5757, + "step": 31888 + }, + { + "epoch": 0.82, + "learning_rate": 1.7072437296805328e-06, + "loss": 0.877, + "step": 31889 + }, + { + "epoch": 0.82, + "learning_rate": 1.7072241672343556e-06, + "loss": 0.9346, + "step": 31890 + }, + { + "epoch": 0.82, + "learning_rate": 1.7072046042466894e-06, + "loss": 0.9805, + "step": 31891 + }, + { + "epoch": 0.82, + "learning_rate": 1.7071850407175492e-06, + "loss": 0.9268, + "step": 31892 + }, + { + "epoch": 0.82, + "learning_rate": 1.70716547664695e-06, + "loss": 0.6416, + "step": 31893 + }, + { + "epoch": 0.82, + "learning_rate": 1.7071459120349065e-06, + "loss": 0.8438, + "step": 31894 + }, + { + "epoch": 0.82, + "learning_rate": 1.7071263468814341e-06, + "loss": 1.0215, + "step": 31895 + }, + { + "epoch": 0.82, + "learning_rate": 1.7071067811865474e-06, + "loss": 1.0059, + "step": 31896 + }, + { + "epoch": 0.82, + "learning_rate": 1.7070872149502616e-06, + "loss": 0.7842, + "step": 31897 + }, + { + "epoch": 0.82, + "learning_rate": 1.7070676481725915e-06, + "loss": 0.7197, + "step": 31898 + }, + { + "epoch": 0.82, + "learning_rate": 1.7070480808535526e-06, + "loss": 0.9395, + "step": 31899 + }, + { + "epoch": 0.82, + "learning_rate": 1.7070285129931593e-06, + "loss": 0.7822, + "step": 31900 + }, + { + "epoch": 0.82, + "learning_rate": 1.707008944591427e-06, + "loss": 1.2422, + "step": 31901 + }, + { + "epoch": 0.82, + "learning_rate": 1.7069893756483697e-06, + "loss": 1.1035, + "step": 31902 + }, + { + "epoch": 0.82, + "learning_rate": 1.7069698061640039e-06, + "loss": 0.9023, + "step": 31903 + }, + { + "epoch": 0.82, + "learning_rate": 1.7069502361383434e-06, + "loss": 0.6616, + "step": 31904 + }, + { + "epoch": 0.82, + "learning_rate": 1.706930665571404e-06, + "loss": 1.0166, + "step": 31905 + }, + { + "epoch": 0.82, + "learning_rate": 1.7069110944632e-06, + "loss": 0.6484, + "step": 31906 + }, + { + "epoch": 0.82, + "learning_rate": 1.7068915228137465e-06, + "loss": 0.9043, + "step": 31907 + }, + { + "epoch": 0.82, + "learning_rate": 1.706871950623059e-06, + "loss": 0.8369, + "step": 31908 + }, + { + "epoch": 0.82, + "learning_rate": 1.7068523778911522e-06, + "loss": 0.8584, + "step": 31909 + }, + { + "epoch": 0.82, + "learning_rate": 1.7068328046180409e-06, + "loss": 0.5923, + "step": 31910 + }, + { + "epoch": 0.82, + "learning_rate": 1.70681323080374e-06, + "loss": 0.8301, + "step": 31911 + }, + { + "epoch": 0.82, + "learning_rate": 1.7067936564482653e-06, + "loss": 0.9619, + "step": 31912 + }, + { + "epoch": 0.82, + "learning_rate": 1.7067740815516304e-06, + "loss": 0.6206, + "step": 31913 + }, + { + "epoch": 0.82, + "learning_rate": 1.7067545061138517e-06, + "loss": 0.8037, + "step": 31914 + }, + { + "epoch": 0.82, + "learning_rate": 1.7067349301349435e-06, + "loss": 0.8223, + "step": 31915 + }, + { + "epoch": 0.82, + "learning_rate": 1.7067153536149207e-06, + "loss": 0.7354, + "step": 31916 + }, + { + "epoch": 0.82, + "learning_rate": 1.7066957765537984e-06, + "loss": 0.8066, + "step": 31917 + }, + { + "epoch": 0.82, + "learning_rate": 1.706676198951592e-06, + "loss": 0.835, + "step": 31918 + }, + { + "epoch": 0.82, + "learning_rate": 1.7066566208083158e-06, + "loss": 0.7285, + "step": 31919 + }, + { + "epoch": 0.82, + "learning_rate": 1.7066370421239853e-06, + "loss": 0.8311, + "step": 31920 + }, + { + "epoch": 0.82, + "learning_rate": 1.706617462898615e-06, + "loss": 0.6943, + "step": 31921 + }, + { + "epoch": 0.82, + "learning_rate": 1.7065978831322205e-06, + "loss": 0.6741, + "step": 31922 + }, + { + "epoch": 0.82, + "learning_rate": 1.7065783028248163e-06, + "loss": 0.6816, + "step": 31923 + }, + { + "epoch": 0.82, + "learning_rate": 1.7065587219764176e-06, + "loss": 0.8574, + "step": 31924 + }, + { + "epoch": 0.82, + "learning_rate": 1.7065391405870396e-06, + "loss": 0.8809, + "step": 31925 + }, + { + "epoch": 0.82, + "learning_rate": 1.706519558656697e-06, + "loss": 0.9375, + "step": 31926 + }, + { + "epoch": 0.82, + "learning_rate": 1.7064999761854045e-06, + "loss": 0.7651, + "step": 31927 + }, + { + "epoch": 0.82, + "learning_rate": 1.7064803931731778e-06, + "loss": 0.5275, + "step": 31928 + }, + { + "epoch": 0.82, + "learning_rate": 1.7064608096200314e-06, + "loss": 0.9512, + "step": 31929 + }, + { + "epoch": 0.82, + "learning_rate": 1.7064412255259806e-06, + "loss": 0.9268, + "step": 31930 + }, + { + "epoch": 0.82, + "learning_rate": 1.7064216408910401e-06, + "loss": 0.7144, + "step": 31931 + }, + { + "epoch": 0.82, + "learning_rate": 1.706402055715225e-06, + "loss": 0.9492, + "step": 31932 + }, + { + "epoch": 0.82, + "learning_rate": 1.7063824699985505e-06, + "loss": 0.7993, + "step": 31933 + }, + { + "epoch": 0.82, + "learning_rate": 1.7063628837410312e-06, + "loss": 0.9697, + "step": 31934 + }, + { + "epoch": 0.82, + "learning_rate": 1.7063432969426827e-06, + "loss": 0.573, + "step": 31935 + }, + { + "epoch": 0.82, + "learning_rate": 1.7063237096035192e-06, + "loss": 0.8057, + "step": 31936 + }, + { + "epoch": 0.82, + "learning_rate": 1.7063041217235564e-06, + "loss": 0.8486, + "step": 31937 + }, + { + "epoch": 0.82, + "learning_rate": 1.7062845333028085e-06, + "loss": 1.0703, + "step": 31938 + }, + { + "epoch": 0.82, + "learning_rate": 1.7062649443412918e-06, + "loss": 0.686, + "step": 31939 + }, + { + "epoch": 0.82, + "learning_rate": 1.70624535483902e-06, + "loss": 0.9316, + "step": 31940 + }, + { + "epoch": 0.82, + "learning_rate": 1.7062257647960087e-06, + "loss": 0.8564, + "step": 31941 + }, + { + "epoch": 0.82, + "learning_rate": 1.7062061742122728e-06, + "loss": 0.6753, + "step": 31942 + }, + { + "epoch": 0.82, + "learning_rate": 1.7061865830878276e-06, + "loss": 1.0469, + "step": 31943 + }, + { + "epoch": 0.82, + "learning_rate": 1.7061669914226875e-06, + "loss": 0.6016, + "step": 31944 + }, + { + "epoch": 0.82, + "learning_rate": 1.7061473992168675e-06, + "loss": 0.7007, + "step": 31945 + }, + { + "epoch": 0.82, + "learning_rate": 1.7061278064703832e-06, + "loss": 0.887, + "step": 31946 + }, + { + "epoch": 0.82, + "learning_rate": 1.7061082131832495e-06, + "loss": 1.042, + "step": 31947 + }, + { + "epoch": 0.82, + "learning_rate": 1.7060886193554808e-06, + "loss": 0.7671, + "step": 31948 + }, + { + "epoch": 0.82, + "learning_rate": 1.706069024987093e-06, + "loss": 0.8135, + "step": 31949 + }, + { + "epoch": 0.82, + "learning_rate": 1.7060494300781003e-06, + "loss": 0.834, + "step": 31950 + }, + { + "epoch": 0.82, + "learning_rate": 1.7060298346285182e-06, + "loss": 0.6138, + "step": 31951 + }, + { + "epoch": 0.82, + "learning_rate": 1.7060102386383614e-06, + "loss": 0.8486, + "step": 31952 + }, + { + "epoch": 0.82, + "learning_rate": 1.7059906421076452e-06, + "loss": 0.8848, + "step": 31953 + }, + { + "epoch": 0.82, + "learning_rate": 1.7059710450363842e-06, + "loss": 0.6306, + "step": 31954 + }, + { + "epoch": 0.82, + "learning_rate": 1.7059514474245935e-06, + "loss": 0.6919, + "step": 31955 + }, + { + "epoch": 0.82, + "learning_rate": 1.7059318492722885e-06, + "loss": 0.9854, + "step": 31956 + }, + { + "epoch": 0.82, + "learning_rate": 1.7059122505794838e-06, + "loss": 0.5931, + "step": 31957 + }, + { + "epoch": 0.82, + "learning_rate": 1.7058926513461946e-06, + "loss": 0.9678, + "step": 31958 + }, + { + "epoch": 0.82, + "learning_rate": 1.705873051572436e-06, + "loss": 0.7949, + "step": 31959 + }, + { + "epoch": 0.82, + "learning_rate": 1.7058534512582227e-06, + "loss": 0.6143, + "step": 31960 + }, + { + "epoch": 0.82, + "learning_rate": 1.70583385040357e-06, + "loss": 0.7241, + "step": 31961 + }, + { + "epoch": 0.82, + "learning_rate": 1.7058142490084925e-06, + "loss": 0.9766, + "step": 31962 + }, + { + "epoch": 0.82, + "learning_rate": 1.7057946470730058e-06, + "loss": 0.7627, + "step": 31963 + }, + { + "epoch": 0.82, + "learning_rate": 1.7057750445971247e-06, + "loss": 0.7812, + "step": 31964 + }, + { + "epoch": 0.82, + "learning_rate": 1.7057554415808637e-06, + "loss": 0.8066, + "step": 31965 + }, + { + "epoch": 0.82, + "learning_rate": 1.7057358380242383e-06, + "loss": 0.7988, + "step": 31966 + }, + { + "epoch": 0.82, + "learning_rate": 1.7057162339272634e-06, + "loss": 0.8359, + "step": 31967 + }, + { + "epoch": 0.82, + "learning_rate": 1.7056966292899542e-06, + "loss": 0.9619, + "step": 31968 + }, + { + "epoch": 0.82, + "learning_rate": 1.7056770241123256e-06, + "loss": 0.8359, + "step": 31969 + }, + { + "epoch": 0.82, + "learning_rate": 1.7056574183943925e-06, + "loss": 0.9531, + "step": 31970 + }, + { + "epoch": 0.82, + "learning_rate": 1.7056378121361696e-06, + "loss": 1.0078, + "step": 31971 + }, + { + "epoch": 0.82, + "learning_rate": 1.7056182053376725e-06, + "loss": 0.8242, + "step": 31972 + }, + { + "epoch": 0.82, + "learning_rate": 1.7055985979989162e-06, + "loss": 0.8359, + "step": 31973 + }, + { + "epoch": 0.82, + "learning_rate": 1.7055789901199153e-06, + "loss": 1.0156, + "step": 31974 + }, + { + "epoch": 0.82, + "learning_rate": 1.705559381700685e-06, + "loss": 0.5875, + "step": 31975 + }, + { + "epoch": 0.82, + "learning_rate": 1.7055397727412403e-06, + "loss": 0.793, + "step": 31976 + }, + { + "epoch": 0.82, + "learning_rate": 1.7055201632415962e-06, + "loss": 0.7822, + "step": 31977 + }, + { + "epoch": 0.82, + "learning_rate": 1.7055005532017681e-06, + "loss": 0.8364, + "step": 31978 + }, + { + "epoch": 0.82, + "learning_rate": 1.7054809426217704e-06, + "loss": 0.6084, + "step": 31979 + }, + { + "epoch": 0.82, + "learning_rate": 1.7054613315016185e-06, + "loss": 0.874, + "step": 31980 + }, + { + "epoch": 0.82, + "learning_rate": 1.705441719841327e-06, + "loss": 1.1133, + "step": 31981 + }, + { + "epoch": 0.82, + "learning_rate": 1.7054221076409113e-06, + "loss": 0.791, + "step": 31982 + }, + { + "epoch": 0.82, + "learning_rate": 1.7054024949003867e-06, + "loss": 0.9355, + "step": 31983 + }, + { + "epoch": 0.82, + "learning_rate": 1.7053828816197675e-06, + "loss": 1.0479, + "step": 31984 + }, + { + "epoch": 0.82, + "learning_rate": 1.7053632677990693e-06, + "loss": 0.9531, + "step": 31985 + }, + { + "epoch": 0.82, + "learning_rate": 1.7053436534383066e-06, + "loss": 0.8037, + "step": 31986 + }, + { + "epoch": 0.82, + "learning_rate": 1.7053240385374947e-06, + "loss": 0.9531, + "step": 31987 + }, + { + "epoch": 0.82, + "learning_rate": 1.7053044230966486e-06, + "loss": 0.7842, + "step": 31988 + }, + { + "epoch": 0.82, + "learning_rate": 1.7052848071157837e-06, + "loss": 1.1133, + "step": 31989 + }, + { + "epoch": 0.82, + "learning_rate": 1.7052651905949144e-06, + "loss": 0.6694, + "step": 31990 + }, + { + "epoch": 0.82, + "learning_rate": 1.7052455735340558e-06, + "loss": 0.7563, + "step": 31991 + }, + { + "epoch": 0.82, + "learning_rate": 1.7052259559332237e-06, + "loss": 0.6404, + "step": 31992 + }, + { + "epoch": 0.82, + "learning_rate": 1.7052063377924317e-06, + "loss": 0.9736, + "step": 31993 + }, + { + "epoch": 0.82, + "learning_rate": 1.7051867191116961e-06, + "loss": 0.7715, + "step": 31994 + }, + { + "epoch": 0.82, + "learning_rate": 1.7051670998910316e-06, + "loss": 0.8408, + "step": 31995 + }, + { + "epoch": 0.82, + "learning_rate": 1.7051474801304529e-06, + "loss": 0.8926, + "step": 31996 + }, + { + "epoch": 0.82, + "learning_rate": 1.7051278598299751e-06, + "loss": 0.7891, + "step": 31997 + }, + { + "epoch": 0.82, + "learning_rate": 1.7051082389896134e-06, + "loss": 1.1318, + "step": 31998 + }, + { + "epoch": 0.82, + "learning_rate": 1.7050886176093827e-06, + "loss": 0.9248, + "step": 31999 + }, + { + "epoch": 0.82, + "learning_rate": 1.7050689956892981e-06, + "loss": 0.8721, + "step": 32000 + }, + { + "epoch": 0.82, + "learning_rate": 1.7050493732293744e-06, + "loss": 0.6841, + "step": 32001 + }, + { + "epoch": 0.82, + "learning_rate": 1.705029750229627e-06, + "loss": 0.79, + "step": 32002 + }, + { + "epoch": 0.82, + "learning_rate": 1.7050101266900706e-06, + "loss": 0.7979, + "step": 32003 + }, + { + "epoch": 0.82, + "learning_rate": 1.7049905026107208e-06, + "loss": 0.9229, + "step": 32004 + }, + { + "epoch": 0.82, + "learning_rate": 1.704970877991592e-06, + "loss": 0.688, + "step": 32005 + }, + { + "epoch": 0.82, + "learning_rate": 1.704951252832699e-06, + "loss": 0.8115, + "step": 32006 + }, + { + "epoch": 0.82, + "learning_rate": 1.7049316271340576e-06, + "loss": 1.0566, + "step": 32007 + }, + { + "epoch": 0.82, + "learning_rate": 1.7049120008956824e-06, + "loss": 1.0635, + "step": 32008 + }, + { + "epoch": 0.82, + "learning_rate": 1.7048923741175888e-06, + "loss": 0.6826, + "step": 32009 + }, + { + "epoch": 0.82, + "learning_rate": 1.704872746799791e-06, + "loss": 0.7827, + "step": 32010 + }, + { + "epoch": 0.82, + "learning_rate": 1.7048531189423048e-06, + "loss": 0.6406, + "step": 32011 + }, + { + "epoch": 0.82, + "learning_rate": 1.704833490545145e-06, + "loss": 0.7168, + "step": 32012 + }, + { + "epoch": 0.82, + "learning_rate": 1.7048138616083265e-06, + "loss": 0.8682, + "step": 32013 + }, + { + "epoch": 0.82, + "learning_rate": 1.7047942321318644e-06, + "loss": 0.728, + "step": 32014 + }, + { + "epoch": 0.82, + "learning_rate": 1.7047746021157741e-06, + "loss": 0.8643, + "step": 32015 + }, + { + "epoch": 0.82, + "learning_rate": 1.70475497156007e-06, + "loss": 0.8672, + "step": 32016 + }, + { + "epoch": 0.82, + "learning_rate": 1.7047353404647672e-06, + "loss": 0.8008, + "step": 32017 + }, + { + "epoch": 0.82, + "learning_rate": 1.7047157088298814e-06, + "loss": 0.8696, + "step": 32018 + }, + { + "epoch": 0.82, + "learning_rate": 1.704696076655427e-06, + "loss": 0.7451, + "step": 32019 + }, + { + "epoch": 0.82, + "learning_rate": 1.7046764439414193e-06, + "loss": 0.834, + "step": 32020 + }, + { + "epoch": 0.82, + "learning_rate": 1.7046568106878731e-06, + "loss": 0.7339, + "step": 32021 + }, + { + "epoch": 0.82, + "learning_rate": 1.7046371768948036e-06, + "loss": 0.7729, + "step": 32022 + }, + { + "epoch": 0.82, + "learning_rate": 1.704617542562226e-06, + "loss": 0.8945, + "step": 32023 + }, + { + "epoch": 0.82, + "learning_rate": 1.704597907690155e-06, + "loss": 0.9033, + "step": 32024 + }, + { + "epoch": 0.82, + "learning_rate": 1.7045782722786058e-06, + "loss": 0.8525, + "step": 32025 + }, + { + "epoch": 0.82, + "learning_rate": 1.7045586363275932e-06, + "loss": 0.7744, + "step": 32026 + }, + { + "epoch": 0.82, + "learning_rate": 1.7045389998371327e-06, + "loss": 0.8545, + "step": 32027 + }, + { + "epoch": 0.82, + "learning_rate": 1.704519362807239e-06, + "loss": 1.0, + "step": 32028 + }, + { + "epoch": 0.82, + "learning_rate": 1.7044997252379274e-06, + "loss": 0.9346, + "step": 32029 + }, + { + "epoch": 0.82, + "learning_rate": 1.7044800871292124e-06, + "loss": 0.77, + "step": 32030 + }, + { + "epoch": 0.82, + "learning_rate": 1.7044604484811099e-06, + "loss": 0.6118, + "step": 32031 + }, + { + "epoch": 0.82, + "learning_rate": 1.704440809293634e-06, + "loss": 0.874, + "step": 32032 + }, + { + "epoch": 0.82, + "learning_rate": 1.7044211695668003e-06, + "loss": 0.9951, + "step": 32033 + }, + { + "epoch": 0.82, + "learning_rate": 1.7044015293006237e-06, + "loss": 0.7725, + "step": 32034 + }, + { + "epoch": 0.82, + "learning_rate": 1.7043818884951192e-06, + "loss": 0.7949, + "step": 32035 + }, + { + "epoch": 0.82, + "learning_rate": 1.704362247150302e-06, + "loss": 0.9785, + "step": 32036 + }, + { + "epoch": 0.82, + "learning_rate": 1.7043426052661869e-06, + "loss": 0.7197, + "step": 32037 + }, + { + "epoch": 0.82, + "learning_rate": 1.7043229628427889e-06, + "loss": 0.9346, + "step": 32038 + }, + { + "epoch": 0.82, + "learning_rate": 1.7043033198801236e-06, + "loss": 0.7637, + "step": 32039 + }, + { + "epoch": 0.82, + "learning_rate": 1.7042836763782053e-06, + "loss": 0.8779, + "step": 32040 + }, + { + "epoch": 0.82, + "learning_rate": 1.7042640323370496e-06, + "loss": 0.71, + "step": 32041 + }, + { + "epoch": 0.82, + "learning_rate": 1.7042443877566712e-06, + "loss": 0.55, + "step": 32042 + }, + { + "epoch": 0.82, + "learning_rate": 1.7042247426370851e-06, + "loss": 0.8516, + "step": 32043 + }, + { + "epoch": 0.82, + "learning_rate": 1.7042050969783065e-06, + "loss": 0.8301, + "step": 32044 + }, + { + "epoch": 0.82, + "learning_rate": 1.7041854507803506e-06, + "loss": 0.9688, + "step": 32045 + }, + { + "epoch": 0.82, + "learning_rate": 1.7041658040432325e-06, + "loss": 0.8345, + "step": 32046 + }, + { + "epoch": 0.82, + "learning_rate": 1.7041461567669666e-06, + "loss": 0.9609, + "step": 32047 + }, + { + "epoch": 0.82, + "learning_rate": 1.7041265089515688e-06, + "loss": 0.835, + "step": 32048 + }, + { + "epoch": 0.82, + "learning_rate": 1.7041068605970534e-06, + "loss": 0.6689, + "step": 32049 + }, + { + "epoch": 0.82, + "learning_rate": 1.7040872117034357e-06, + "loss": 0.835, + "step": 32050 + }, + { + "epoch": 0.82, + "learning_rate": 1.704067562270731e-06, + "loss": 0.7905, + "step": 32051 + }, + { + "epoch": 0.82, + "learning_rate": 1.7040479122989538e-06, + "loss": 0.8447, + "step": 32052 + }, + { + "epoch": 0.82, + "learning_rate": 1.7040282617881201e-06, + "loss": 0.8638, + "step": 32053 + }, + { + "epoch": 0.82, + "learning_rate": 1.7040086107382439e-06, + "loss": 0.7334, + "step": 32054 + }, + { + "epoch": 0.82, + "learning_rate": 1.7039889591493406e-06, + "loss": 0.9648, + "step": 32055 + }, + { + "epoch": 0.82, + "learning_rate": 1.7039693070214253e-06, + "loss": 0.835, + "step": 32056 + }, + { + "epoch": 0.82, + "learning_rate": 1.7039496543545134e-06, + "loss": 0.8936, + "step": 32057 + }, + { + "epoch": 0.82, + "learning_rate": 1.7039300011486195e-06, + "loss": 0.6211, + "step": 32058 + }, + { + "epoch": 0.82, + "learning_rate": 1.7039103474037586e-06, + "loss": 0.8838, + "step": 32059 + }, + { + "epoch": 0.82, + "learning_rate": 1.7038906931199461e-06, + "loss": 0.7476, + "step": 32060 + }, + { + "epoch": 0.82, + "learning_rate": 1.7038710382971968e-06, + "loss": 0.8726, + "step": 32061 + }, + { + "epoch": 0.82, + "learning_rate": 1.7038513829355256e-06, + "loss": 0.8408, + "step": 32062 + }, + { + "epoch": 0.82, + "learning_rate": 1.7038317270349483e-06, + "loss": 0.9023, + "step": 32063 + }, + { + "epoch": 0.82, + "learning_rate": 1.7038120705954788e-06, + "loss": 0.7056, + "step": 32064 + }, + { + "epoch": 0.82, + "learning_rate": 1.7037924136171332e-06, + "loss": 0.791, + "step": 32065 + }, + { + "epoch": 0.82, + "learning_rate": 1.703772756099926e-06, + "loss": 1.0332, + "step": 32066 + }, + { + "epoch": 0.82, + "learning_rate": 1.703753098043872e-06, + "loss": 1.1289, + "step": 32067 + }, + { + "epoch": 0.82, + "learning_rate": 1.7037334394489871e-06, + "loss": 0.54, + "step": 32068 + }, + { + "epoch": 0.82, + "learning_rate": 1.7037137803152857e-06, + "loss": 0.6609, + "step": 32069 + }, + { + "epoch": 0.82, + "learning_rate": 1.7036941206427828e-06, + "loss": 0.7283, + "step": 32070 + }, + { + "epoch": 0.82, + "learning_rate": 1.703674460431494e-06, + "loss": 0.8408, + "step": 32071 + }, + { + "epoch": 0.82, + "learning_rate": 1.703654799681434e-06, + "loss": 0.8613, + "step": 32072 + }, + { + "epoch": 0.82, + "learning_rate": 1.7036351383926178e-06, + "loss": 0.9185, + "step": 32073 + }, + { + "epoch": 0.82, + "learning_rate": 1.7036154765650602e-06, + "loss": 0.9775, + "step": 32074 + }, + { + "epoch": 0.82, + "learning_rate": 1.7035958141987772e-06, + "loss": 0.6895, + "step": 32075 + }, + { + "epoch": 0.82, + "learning_rate": 1.7035761512937827e-06, + "loss": 0.8779, + "step": 32076 + }, + { + "epoch": 0.82, + "learning_rate": 1.7035564878500925e-06, + "loss": 0.6382, + "step": 32077 + }, + { + "epoch": 0.82, + "learning_rate": 1.7035368238677217e-06, + "loss": 0.8633, + "step": 32078 + }, + { + "epoch": 0.82, + "learning_rate": 1.7035171593466848e-06, + "loss": 0.9658, + "step": 32079 + }, + { + "epoch": 0.82, + "learning_rate": 1.703497494286997e-06, + "loss": 0.9922, + "step": 32080 + }, + { + "epoch": 0.82, + "learning_rate": 1.703477828688674e-06, + "loss": 0.8525, + "step": 32081 + }, + { + "epoch": 0.82, + "learning_rate": 1.7034581625517299e-06, + "loss": 1.0098, + "step": 32082 + }, + { + "epoch": 0.82, + "learning_rate": 1.7034384958761805e-06, + "loss": 0.7983, + "step": 32083 + }, + { + "epoch": 0.82, + "learning_rate": 1.7034188286620403e-06, + "loss": 0.9951, + "step": 32084 + }, + { + "epoch": 0.82, + "learning_rate": 1.703399160909325e-06, + "loss": 1.0908, + "step": 32085 + }, + { + "epoch": 0.82, + "learning_rate": 1.7033794926180495e-06, + "loss": 0.79, + "step": 32086 + }, + { + "epoch": 0.82, + "learning_rate": 1.703359823788228e-06, + "loss": 0.7207, + "step": 32087 + }, + { + "epoch": 0.82, + "learning_rate": 1.7033401544198766e-06, + "loss": 0.9092, + "step": 32088 + }, + { + "epoch": 0.82, + "learning_rate": 1.70332048451301e-06, + "loss": 0.8906, + "step": 32089 + }, + { + "epoch": 0.82, + "learning_rate": 1.703300814067643e-06, + "loss": 0.668, + "step": 32090 + }, + { + "epoch": 0.82, + "learning_rate": 1.7032811430837912e-06, + "loss": 0.8081, + "step": 32091 + }, + { + "epoch": 0.82, + "learning_rate": 1.7032614715614693e-06, + "loss": 0.9651, + "step": 32092 + }, + { + "epoch": 0.82, + "learning_rate": 1.7032417995006926e-06, + "loss": 0.6914, + "step": 32093 + }, + { + "epoch": 0.82, + "learning_rate": 1.7032221269014756e-06, + "loss": 1.0498, + "step": 32094 + }, + { + "epoch": 0.82, + "learning_rate": 1.7032024537638342e-06, + "loss": 0.9326, + "step": 32095 + }, + { + "epoch": 0.82, + "learning_rate": 1.7031827800877825e-06, + "loss": 0.7827, + "step": 32096 + }, + { + "epoch": 0.82, + "learning_rate": 1.7031631058733362e-06, + "loss": 1.2617, + "step": 32097 + }, + { + "epoch": 0.82, + "learning_rate": 1.7031434311205107e-06, + "loss": 0.9619, + "step": 32098 + }, + { + "epoch": 0.82, + "learning_rate": 1.7031237558293201e-06, + "loss": 0.7256, + "step": 32099 + }, + { + "epoch": 0.82, + "learning_rate": 1.7031040799997802e-06, + "loss": 0.8428, + "step": 32100 + }, + { + "epoch": 0.82, + "learning_rate": 1.7030844036319055e-06, + "loss": 0.9209, + "step": 32101 + }, + { + "epoch": 0.82, + "learning_rate": 1.703064726725712e-06, + "loss": 0.8125, + "step": 32102 + }, + { + "epoch": 0.82, + "learning_rate": 1.7030450492812138e-06, + "loss": 0.6917, + "step": 32103 + }, + { + "epoch": 0.82, + "learning_rate": 1.7030253712984263e-06, + "loss": 0.5117, + "step": 32104 + }, + { + "epoch": 0.82, + "learning_rate": 1.7030056927773648e-06, + "loss": 0.8125, + "step": 32105 + }, + { + "epoch": 0.82, + "learning_rate": 1.702986013718044e-06, + "loss": 0.623, + "step": 32106 + }, + { + "epoch": 0.82, + "learning_rate": 1.702966334120479e-06, + "loss": 0.9131, + "step": 32107 + }, + { + "epoch": 0.82, + "learning_rate": 1.7029466539846853e-06, + "loss": 0.8147, + "step": 32108 + }, + { + "epoch": 0.82, + "learning_rate": 1.7029269733106774e-06, + "loss": 0.958, + "step": 32109 + }, + { + "epoch": 0.82, + "learning_rate": 1.7029072920984708e-06, + "loss": 0.9932, + "step": 32110 + }, + { + "epoch": 0.82, + "learning_rate": 1.7028876103480805e-06, + "loss": 0.7432, + "step": 32111 + }, + { + "epoch": 0.82, + "learning_rate": 1.7028679280595216e-06, + "loss": 0.8115, + "step": 32112 + }, + { + "epoch": 0.82, + "learning_rate": 1.7028482452328087e-06, + "loss": 0.8496, + "step": 32113 + }, + { + "epoch": 0.82, + "learning_rate": 1.7028285618679574e-06, + "loss": 0.9688, + "step": 32114 + }, + { + "epoch": 0.82, + "learning_rate": 1.7028088779649824e-06, + "loss": 0.8296, + "step": 32115 + }, + { + "epoch": 0.82, + "learning_rate": 1.702789193523899e-06, + "loss": 0.5969, + "step": 32116 + }, + { + "epoch": 0.82, + "learning_rate": 1.7027695085447224e-06, + "loss": 1.0039, + "step": 32117 + }, + { + "epoch": 0.82, + "learning_rate": 1.7027498230274676e-06, + "loss": 0.7275, + "step": 32118 + }, + { + "epoch": 0.82, + "learning_rate": 1.7027301369721493e-06, + "loss": 0.8086, + "step": 32119 + }, + { + "epoch": 0.82, + "learning_rate": 1.7027104503787828e-06, + "loss": 0.9043, + "step": 32120 + }, + { + "epoch": 0.82, + "learning_rate": 1.7026907632473835e-06, + "loss": 0.8262, + "step": 32121 + }, + { + "epoch": 0.82, + "learning_rate": 1.7026710755779662e-06, + "loss": 0.7026, + "step": 32122 + }, + { + "epoch": 0.82, + "learning_rate": 1.7026513873705458e-06, + "loss": 0.8662, + "step": 32123 + }, + { + "epoch": 0.82, + "learning_rate": 1.7026316986251374e-06, + "loss": 0.9648, + "step": 32124 + }, + { + "epoch": 0.82, + "learning_rate": 1.7026120093417565e-06, + "loss": 0.8867, + "step": 32125 + }, + { + "epoch": 0.82, + "learning_rate": 1.7025923195204177e-06, + "loss": 0.6958, + "step": 32126 + }, + { + "epoch": 0.82, + "learning_rate": 1.702572629161136e-06, + "loss": 0.959, + "step": 32127 + }, + { + "epoch": 0.82, + "learning_rate": 1.7025529382639272e-06, + "loss": 0.8506, + "step": 32128 + }, + { + "epoch": 0.82, + "learning_rate": 1.702533246828806e-06, + "loss": 0.8955, + "step": 32129 + }, + { + "epoch": 0.82, + "learning_rate": 1.702513554855787e-06, + "loss": 0.6958, + "step": 32130 + }, + { + "epoch": 0.82, + "learning_rate": 1.7024938623448862e-06, + "loss": 0.9521, + "step": 32131 + }, + { + "epoch": 0.82, + "learning_rate": 1.7024741692961174e-06, + "loss": 0.918, + "step": 32132 + }, + { + "epoch": 0.82, + "learning_rate": 1.702454475709497e-06, + "loss": 0.7754, + "step": 32133 + }, + { + "epoch": 0.82, + "learning_rate": 1.7024347815850396e-06, + "loss": 0.6245, + "step": 32134 + }, + { + "epoch": 0.82, + "learning_rate": 1.70241508692276e-06, + "loss": 0.7939, + "step": 32135 + }, + { + "epoch": 0.82, + "learning_rate": 1.702395391722673e-06, + "loss": 0.6794, + "step": 32136 + }, + { + "epoch": 0.82, + "learning_rate": 1.7023756959847946e-06, + "loss": 0.7188, + "step": 32137 + }, + { + "epoch": 0.82, + "learning_rate": 1.7023559997091395e-06, + "loss": 0.7832, + "step": 32138 + }, + { + "epoch": 0.82, + "learning_rate": 1.7023363028957225e-06, + "loss": 0.8584, + "step": 32139 + }, + { + "epoch": 0.82, + "learning_rate": 1.702316605544559e-06, + "loss": 0.957, + "step": 32140 + }, + { + "epoch": 0.82, + "learning_rate": 1.702296907655664e-06, + "loss": 0.7002, + "step": 32141 + }, + { + "epoch": 0.82, + "learning_rate": 1.7022772092290523e-06, + "loss": 0.9004, + "step": 32142 + }, + { + "epoch": 0.82, + "learning_rate": 1.7022575102647395e-06, + "loss": 0.6733, + "step": 32143 + }, + { + "epoch": 0.82, + "learning_rate": 1.7022378107627404e-06, + "loss": 0.7734, + "step": 32144 + }, + { + "epoch": 0.82, + "learning_rate": 1.70221811072307e-06, + "loss": 0.8252, + "step": 32145 + }, + { + "epoch": 0.82, + "learning_rate": 1.7021984101457436e-06, + "loss": 0.801, + "step": 32146 + }, + { + "epoch": 0.82, + "learning_rate": 1.702178709030776e-06, + "loss": 0.627, + "step": 32147 + }, + { + "epoch": 0.82, + "learning_rate": 1.7021590073781827e-06, + "loss": 0.9365, + "step": 32148 + }, + { + "epoch": 0.82, + "learning_rate": 1.7021393051879781e-06, + "loss": 0.96, + "step": 32149 + }, + { + "epoch": 0.82, + "learning_rate": 1.7021196024601781e-06, + "loss": 0.8516, + "step": 32150 + }, + { + "epoch": 0.82, + "learning_rate": 1.7020998991947972e-06, + "loss": 0.8809, + "step": 32151 + }, + { + "epoch": 0.82, + "learning_rate": 1.7020801953918506e-06, + "loss": 0.6533, + "step": 32152 + }, + { + "epoch": 0.82, + "learning_rate": 1.7020604910513538e-06, + "loss": 0.8193, + "step": 32153 + }, + { + "epoch": 0.82, + "learning_rate": 1.7020407861733215e-06, + "loss": 0.7256, + "step": 32154 + }, + { + "epoch": 0.82, + "learning_rate": 1.7020210807577686e-06, + "loss": 0.96, + "step": 32155 + }, + { + "epoch": 0.82, + "learning_rate": 1.7020013748047108e-06, + "loss": 0.5815, + "step": 32156 + }, + { + "epoch": 0.82, + "learning_rate": 1.7019816683141626e-06, + "loss": 0.8076, + "step": 32157 + }, + { + "epoch": 0.82, + "learning_rate": 1.7019619612861393e-06, + "loss": 0.8535, + "step": 32158 + }, + { + "epoch": 0.82, + "learning_rate": 1.7019422537206563e-06, + "loss": 0.9414, + "step": 32159 + }, + { + "epoch": 0.82, + "learning_rate": 1.701922545617728e-06, + "loss": 0.8701, + "step": 32160 + }, + { + "epoch": 0.82, + "learning_rate": 1.70190283697737e-06, + "loss": 0.7041, + "step": 32161 + }, + { + "epoch": 0.82, + "learning_rate": 1.701883127799597e-06, + "loss": 0.9775, + "step": 32162 + }, + { + "epoch": 0.82, + "learning_rate": 1.701863418084425e-06, + "loss": 0.7129, + "step": 32163 + }, + { + "epoch": 0.82, + "learning_rate": 1.7018437078318679e-06, + "loss": 0.9688, + "step": 32164 + }, + { + "epoch": 0.82, + "learning_rate": 1.7018239970419418e-06, + "loss": 1.0107, + "step": 32165 + }, + { + "epoch": 0.82, + "learning_rate": 1.701804285714661e-06, + "loss": 0.8535, + "step": 32166 + }, + { + "epoch": 0.82, + "learning_rate": 1.701784573850041e-06, + "loss": 0.7676, + "step": 32167 + }, + { + "epoch": 0.82, + "learning_rate": 1.701764861448097e-06, + "loss": 0.7134, + "step": 32168 + }, + { + "epoch": 0.82, + "learning_rate": 1.7017451485088436e-06, + "loss": 0.7998, + "step": 32169 + }, + { + "epoch": 0.82, + "learning_rate": 1.7017254350322965e-06, + "loss": 0.7646, + "step": 32170 + }, + { + "epoch": 0.82, + "learning_rate": 1.7017057210184702e-06, + "loss": 0.8037, + "step": 32171 + }, + { + "epoch": 0.82, + "learning_rate": 1.7016860064673803e-06, + "loss": 0.9111, + "step": 32172 + }, + { + "epoch": 0.82, + "learning_rate": 1.7016662913790417e-06, + "loss": 0.7803, + "step": 32173 + }, + { + "epoch": 0.82, + "learning_rate": 1.7016465757534695e-06, + "loss": 0.8398, + "step": 32174 + }, + { + "epoch": 0.82, + "learning_rate": 1.7016268595906787e-06, + "loss": 1.1387, + "step": 32175 + }, + { + "epoch": 0.82, + "learning_rate": 1.7016071428906844e-06, + "loss": 0.9141, + "step": 32176 + }, + { + "epoch": 0.82, + "learning_rate": 1.7015874256535018e-06, + "loss": 0.9922, + "step": 32177 + }, + { + "epoch": 0.82, + "learning_rate": 1.701567707879146e-06, + "loss": 0.9766, + "step": 32178 + }, + { + "epoch": 0.82, + "learning_rate": 1.7015479895676322e-06, + "loss": 0.6973, + "step": 32179 + }, + { + "epoch": 0.82, + "learning_rate": 1.7015282707189753e-06, + "loss": 0.8599, + "step": 32180 + }, + { + "epoch": 0.82, + "learning_rate": 1.70150855133319e-06, + "loss": 0.7964, + "step": 32181 + }, + { + "epoch": 0.82, + "learning_rate": 1.7014888314102923e-06, + "loss": 0.9727, + "step": 32182 + }, + { + "epoch": 0.82, + "learning_rate": 1.7014691109502972e-06, + "loss": 0.8164, + "step": 32183 + }, + { + "epoch": 0.82, + "learning_rate": 1.701449389953219e-06, + "loss": 0.6577, + "step": 32184 + }, + { + "epoch": 0.82, + "learning_rate": 1.7014296684190733e-06, + "loss": 0.9092, + "step": 32185 + }, + { + "epoch": 0.82, + "learning_rate": 1.701409946347875e-06, + "loss": 0.7754, + "step": 32186 + }, + { + "epoch": 0.82, + "learning_rate": 1.7013902237396397e-06, + "loss": 0.9316, + "step": 32187 + }, + { + "epoch": 0.82, + "learning_rate": 1.7013705005943821e-06, + "loss": 0.6982, + "step": 32188 + }, + { + "epoch": 0.83, + "learning_rate": 1.7013507769121174e-06, + "loss": 0.7837, + "step": 32189 + }, + { + "epoch": 0.83, + "learning_rate": 1.7013310526928604e-06, + "loss": 1.1074, + "step": 32190 + }, + { + "epoch": 0.83, + "learning_rate": 1.7013113279366266e-06, + "loss": 0.8149, + "step": 32191 + }, + { + "epoch": 0.83, + "learning_rate": 1.701291602643431e-06, + "loss": 1.1914, + "step": 32192 + }, + { + "epoch": 0.83, + "learning_rate": 1.7012718768132886e-06, + "loss": 0.627, + "step": 32193 + }, + { + "epoch": 0.83, + "learning_rate": 1.7012521504462146e-06, + "loss": 0.8379, + "step": 32194 + }, + { + "epoch": 0.83, + "learning_rate": 1.701232423542224e-06, + "loss": 0.8428, + "step": 32195 + }, + { + "epoch": 0.83, + "learning_rate": 1.701212696101332e-06, + "loss": 1.0283, + "step": 32196 + }, + { + "epoch": 0.83, + "learning_rate": 1.7011929681235538e-06, + "loss": 0.6528, + "step": 32197 + }, + { + "epoch": 0.83, + "learning_rate": 1.7011732396089042e-06, + "loss": 0.8926, + "step": 32198 + }, + { + "epoch": 0.83, + "learning_rate": 1.7011535105573985e-06, + "loss": 0.9136, + "step": 32199 + }, + { + "epoch": 0.83, + "learning_rate": 1.7011337809690521e-06, + "loss": 0.9688, + "step": 32200 + }, + { + "epoch": 0.83, + "learning_rate": 1.7011140508438793e-06, + "loss": 0.8379, + "step": 32201 + }, + { + "epoch": 0.83, + "learning_rate": 1.7010943201818961e-06, + "loss": 0.7153, + "step": 32202 + }, + { + "epoch": 0.83, + "learning_rate": 1.7010745889831173e-06, + "loss": 0.998, + "step": 32203 + }, + { + "epoch": 0.83, + "learning_rate": 1.7010548572475578e-06, + "loss": 0.9932, + "step": 32204 + }, + { + "epoch": 0.83, + "learning_rate": 1.7010351249752327e-06, + "loss": 0.9551, + "step": 32205 + }, + { + "epoch": 0.83, + "learning_rate": 1.7010153921661572e-06, + "loss": 0.8633, + "step": 32206 + }, + { + "epoch": 0.83, + "learning_rate": 1.7009956588203466e-06, + "loss": 1.1104, + "step": 32207 + }, + { + "epoch": 0.83, + "learning_rate": 1.7009759249378156e-06, + "loss": 0.875, + "step": 32208 + }, + { + "epoch": 0.83, + "learning_rate": 1.70095619051858e-06, + "loss": 0.6794, + "step": 32209 + }, + { + "epoch": 0.83, + "learning_rate": 1.7009364555626542e-06, + "loss": 0.7539, + "step": 32210 + }, + { + "epoch": 0.83, + "learning_rate": 1.7009167200700536e-06, + "loss": 0.9209, + "step": 32211 + }, + { + "epoch": 0.83, + "learning_rate": 1.7008969840407935e-06, + "loss": 0.7036, + "step": 32212 + }, + { + "epoch": 0.83, + "learning_rate": 1.7008772474748886e-06, + "loss": 0.6338, + "step": 32213 + }, + { + "epoch": 0.83, + "learning_rate": 1.7008575103723541e-06, + "loss": 0.7097, + "step": 32214 + }, + { + "epoch": 0.83, + "learning_rate": 1.7008377727332056e-06, + "loss": 0.5322, + "step": 32215 + }, + { + "epoch": 0.83, + "learning_rate": 1.7008180345574577e-06, + "loss": 0.8844, + "step": 32216 + }, + { + "epoch": 0.83, + "learning_rate": 1.7007982958451254e-06, + "loss": 1.0, + "step": 32217 + }, + { + "epoch": 0.83, + "learning_rate": 1.7007785565962242e-06, + "loss": 0.8975, + "step": 32218 + }, + { + "epoch": 0.83, + "learning_rate": 1.7007588168107691e-06, + "loss": 0.75, + "step": 32219 + }, + { + "epoch": 0.83, + "learning_rate": 1.7007390764887752e-06, + "loss": 0.7549, + "step": 32220 + }, + { + "epoch": 0.83, + "learning_rate": 1.7007193356302578e-06, + "loss": 0.7114, + "step": 32221 + }, + { + "epoch": 0.83, + "learning_rate": 1.7006995942352317e-06, + "loss": 0.6616, + "step": 32222 + }, + { + "epoch": 0.83, + "learning_rate": 1.700679852303712e-06, + "loss": 0.8447, + "step": 32223 + }, + { + "epoch": 0.83, + "learning_rate": 1.7006601098357144e-06, + "loss": 1.1289, + "step": 32224 + }, + { + "epoch": 0.83, + "learning_rate": 1.700640366831253e-06, + "loss": 0.7959, + "step": 32225 + }, + { + "epoch": 0.83, + "learning_rate": 1.7006206232903437e-06, + "loss": 0.7192, + "step": 32226 + }, + { + "epoch": 0.83, + "learning_rate": 1.7006008792130014e-06, + "loss": 0.917, + "step": 32227 + }, + { + "epoch": 0.83, + "learning_rate": 1.7005811345992415e-06, + "loss": 1.0361, + "step": 32228 + }, + { + "epoch": 0.83, + "learning_rate": 1.7005613894490785e-06, + "loss": 0.6829, + "step": 32229 + }, + { + "epoch": 0.83, + "learning_rate": 1.700541643762528e-06, + "loss": 0.7236, + "step": 32230 + }, + { + "epoch": 0.83, + "learning_rate": 1.7005218975396049e-06, + "loss": 0.7773, + "step": 32231 + }, + { + "epoch": 0.83, + "learning_rate": 1.7005021507803243e-06, + "loss": 0.8599, + "step": 32232 + }, + { + "epoch": 0.83, + "learning_rate": 1.7004824034847016e-06, + "loss": 1.0938, + "step": 32233 + }, + { + "epoch": 0.83, + "learning_rate": 1.7004626556527518e-06, + "loss": 0.7676, + "step": 32234 + }, + { + "epoch": 0.83, + "learning_rate": 1.7004429072844897e-06, + "loss": 0.6851, + "step": 32235 + }, + { + "epoch": 0.83, + "learning_rate": 1.7004231583799307e-06, + "loss": 0.7417, + "step": 32236 + }, + { + "epoch": 0.83, + "learning_rate": 1.7004034089390901e-06, + "loss": 0.835, + "step": 32237 + }, + { + "epoch": 0.83, + "learning_rate": 1.7003836589619826e-06, + "loss": 0.7705, + "step": 32238 + }, + { + "epoch": 0.83, + "learning_rate": 1.7003639084486236e-06, + "loss": 0.8604, + "step": 32239 + }, + { + "epoch": 0.83, + "learning_rate": 1.7003441573990282e-06, + "loss": 1.0645, + "step": 32240 + }, + { + "epoch": 0.83, + "learning_rate": 1.7003244058132115e-06, + "loss": 0.8701, + "step": 32241 + }, + { + "epoch": 0.83, + "learning_rate": 1.7003046536911887e-06, + "loss": 0.6855, + "step": 32242 + }, + { + "epoch": 0.83, + "learning_rate": 1.7002849010329748e-06, + "loss": 0.7651, + "step": 32243 + }, + { + "epoch": 0.83, + "learning_rate": 1.7002651478385848e-06, + "loss": 0.7793, + "step": 32244 + }, + { + "epoch": 0.83, + "learning_rate": 1.700245394108034e-06, + "loss": 0.7725, + "step": 32245 + }, + { + "epoch": 0.83, + "learning_rate": 1.7002256398413375e-06, + "loss": 0.8887, + "step": 32246 + }, + { + "epoch": 0.83, + "learning_rate": 1.7002058850385105e-06, + "loss": 0.9199, + "step": 32247 + }, + { + "epoch": 0.83, + "learning_rate": 1.700186129699568e-06, + "loss": 0.8467, + "step": 32248 + }, + { + "epoch": 0.83, + "learning_rate": 1.7001663738245253e-06, + "loss": 0.9678, + "step": 32249 + }, + { + "epoch": 0.83, + "learning_rate": 1.7001466174133972e-06, + "loss": 0.9092, + "step": 32250 + }, + { + "epoch": 0.83, + "learning_rate": 1.7001268604661992e-06, + "loss": 0.7993, + "step": 32251 + }, + { + "epoch": 0.83, + "learning_rate": 1.700107102982946e-06, + "loss": 0.7163, + "step": 32252 + }, + { + "epoch": 0.83, + "learning_rate": 1.7000873449636532e-06, + "loss": 0.9531, + "step": 32253 + }, + { + "epoch": 0.83, + "learning_rate": 1.7000675864083357e-06, + "loss": 0.8521, + "step": 32254 + }, + { + "epoch": 0.83, + "learning_rate": 1.7000478273170086e-06, + "loss": 1.0391, + "step": 32255 + }, + { + "epoch": 0.83, + "learning_rate": 1.700028067689687e-06, + "loss": 0.7715, + "step": 32256 + }, + { + "epoch": 0.83, + "learning_rate": 1.700008307526386e-06, + "loss": 0.688, + "step": 32257 + }, + { + "epoch": 0.83, + "learning_rate": 1.699988546827121e-06, + "loss": 0.8975, + "step": 32258 + }, + { + "epoch": 0.83, + "learning_rate": 1.6999687855919072e-06, + "loss": 0.541, + "step": 32259 + }, + { + "epoch": 0.83, + "learning_rate": 1.6999490238207591e-06, + "loss": 0.9619, + "step": 32260 + }, + { + "epoch": 0.83, + "learning_rate": 1.6999292615136924e-06, + "loss": 0.8457, + "step": 32261 + }, + { + "epoch": 0.83, + "learning_rate": 1.699909498670722e-06, + "loss": 0.593, + "step": 32262 + }, + { + "epoch": 0.83, + "learning_rate": 1.6998897352918632e-06, + "loss": 0.8691, + "step": 32263 + }, + { + "epoch": 0.83, + "learning_rate": 1.6998699713771307e-06, + "loss": 0.7422, + "step": 32264 + }, + { + "epoch": 0.83, + "learning_rate": 1.6998502069265404e-06, + "loss": 0.9219, + "step": 32265 + }, + { + "epoch": 0.83, + "learning_rate": 1.6998304419401066e-06, + "loss": 0.6094, + "step": 32266 + }, + { + "epoch": 0.83, + "learning_rate": 1.699810676417845e-06, + "loss": 0.8804, + "step": 32267 + }, + { + "epoch": 0.83, + "learning_rate": 1.6997909103597703e-06, + "loss": 0.9307, + "step": 32268 + }, + { + "epoch": 0.83, + "learning_rate": 1.699771143765898e-06, + "loss": 0.9756, + "step": 32269 + }, + { + "epoch": 0.83, + "learning_rate": 1.6997513766362433e-06, + "loss": 0.8477, + "step": 32270 + }, + { + "epoch": 0.83, + "learning_rate": 1.699731608970821e-06, + "loss": 0.7915, + "step": 32271 + }, + { + "epoch": 0.83, + "learning_rate": 1.6997118407696463e-06, + "loss": 1.0957, + "step": 32272 + }, + { + "epoch": 0.83, + "learning_rate": 1.6996920720327345e-06, + "loss": 0.7051, + "step": 32273 + }, + { + "epoch": 0.83, + "learning_rate": 1.6996723027601008e-06, + "loss": 0.8506, + "step": 32274 + }, + { + "epoch": 0.83, + "learning_rate": 1.6996525329517599e-06, + "loss": 0.7861, + "step": 32275 + }, + { + "epoch": 0.83, + "learning_rate": 1.6996327626077273e-06, + "loss": 0.6855, + "step": 32276 + }, + { + "epoch": 0.83, + "learning_rate": 1.6996129917280183e-06, + "loss": 0.8545, + "step": 32277 + }, + { + "epoch": 0.83, + "learning_rate": 1.6995932203126477e-06, + "loss": 1.0879, + "step": 32278 + }, + { + "epoch": 0.83, + "learning_rate": 1.6995734483616306e-06, + "loss": 0.6411, + "step": 32279 + }, + { + "epoch": 0.83, + "learning_rate": 1.6995536758749825e-06, + "loss": 0.6772, + "step": 32280 + }, + { + "epoch": 0.83, + "learning_rate": 1.699533902852718e-06, + "loss": 0.7695, + "step": 32281 + }, + { + "epoch": 0.83, + "learning_rate": 1.6995141292948527e-06, + "loss": 0.9795, + "step": 32282 + }, + { + "epoch": 0.83, + "learning_rate": 1.6994943552014015e-06, + "loss": 0.791, + "step": 32283 + }, + { + "epoch": 0.83, + "learning_rate": 1.6994745805723799e-06, + "loss": 0.8457, + "step": 32284 + }, + { + "epoch": 0.83, + "learning_rate": 1.6994548054078026e-06, + "loss": 0.835, + "step": 32285 + }, + { + "epoch": 0.83, + "learning_rate": 1.699435029707685e-06, + "loss": 0.9463, + "step": 32286 + }, + { + "epoch": 0.83, + "learning_rate": 1.699415253472042e-06, + "loss": 0.9951, + "step": 32287 + }, + { + "epoch": 0.83, + "learning_rate": 1.6993954767008891e-06, + "loss": 0.7285, + "step": 32288 + }, + { + "epoch": 0.83, + "learning_rate": 1.699375699394241e-06, + "loss": 0.7822, + "step": 32289 + }, + { + "epoch": 0.83, + "learning_rate": 1.6993559215521133e-06, + "loss": 0.8252, + "step": 32290 + }, + { + "epoch": 0.83, + "learning_rate": 1.6993361431745209e-06, + "loss": 0.542, + "step": 32291 + }, + { + "epoch": 0.83, + "learning_rate": 1.6993163642614787e-06, + "loss": 0.8301, + "step": 32292 + }, + { + "epoch": 0.83, + "learning_rate": 1.6992965848130028e-06, + "loss": 0.6802, + "step": 32293 + }, + { + "epoch": 0.83, + "learning_rate": 1.699276804829107e-06, + "loss": 0.875, + "step": 32294 + }, + { + "epoch": 0.83, + "learning_rate": 1.6992570243098073e-06, + "loss": 0.9189, + "step": 32295 + }, + { + "epoch": 0.83, + "learning_rate": 1.6992372432551188e-06, + "loss": 0.7192, + "step": 32296 + }, + { + "epoch": 0.83, + "learning_rate": 1.6992174616650563e-06, + "loss": 0.8135, + "step": 32297 + }, + { + "epoch": 0.83, + "learning_rate": 1.6991976795396353e-06, + "loss": 0.8828, + "step": 32298 + }, + { + "epoch": 0.83, + "learning_rate": 1.6991778968788706e-06, + "loss": 0.9512, + "step": 32299 + }, + { + "epoch": 0.83, + "learning_rate": 1.6991581136827775e-06, + "loss": 0.8672, + "step": 32300 + }, + { + "epoch": 0.83, + "learning_rate": 1.6991383299513713e-06, + "loss": 1.1553, + "step": 32301 + }, + { + "epoch": 0.83, + "learning_rate": 1.6991185456846671e-06, + "loss": 0.9697, + "step": 32302 + }, + { + "epoch": 0.83, + "learning_rate": 1.69909876088268e-06, + "loss": 0.8926, + "step": 32303 + }, + { + "epoch": 0.83, + "learning_rate": 1.6990789755454249e-06, + "loss": 0.8096, + "step": 32304 + }, + { + "epoch": 0.83, + "learning_rate": 1.6990591896729173e-06, + "loss": 0.8994, + "step": 32305 + }, + { + "epoch": 0.83, + "learning_rate": 1.6990394032651722e-06, + "loss": 0.9053, + "step": 32306 + }, + { + "epoch": 0.83, + "learning_rate": 1.6990196163222047e-06, + "loss": 0.689, + "step": 32307 + }, + { + "epoch": 0.83, + "learning_rate": 1.6989998288440304e-06, + "loss": 0.8389, + "step": 32308 + }, + { + "epoch": 0.83, + "learning_rate": 1.6989800408306636e-06, + "loss": 0.96, + "step": 32309 + }, + { + "epoch": 0.83, + "learning_rate": 1.69896025228212e-06, + "loss": 0.97, + "step": 32310 + }, + { + "epoch": 0.83, + "learning_rate": 1.698940463198415e-06, + "loss": 0.6951, + "step": 32311 + }, + { + "epoch": 0.83, + "learning_rate": 1.698920673579563e-06, + "loss": 1.0059, + "step": 32312 + }, + { + "epoch": 0.83, + "learning_rate": 1.69890088342558e-06, + "loss": 0.8887, + "step": 32313 + }, + { + "epoch": 0.83, + "learning_rate": 1.6988810927364805e-06, + "loss": 0.8247, + "step": 32314 + }, + { + "epoch": 0.83, + "learning_rate": 1.6988613015122799e-06, + "loss": 0.9268, + "step": 32315 + }, + { + "epoch": 0.83, + "learning_rate": 1.6988415097529933e-06, + "loss": 0.9053, + "step": 32316 + }, + { + "epoch": 0.83, + "learning_rate": 1.698821717458636e-06, + "loss": 0.6719, + "step": 32317 + }, + { + "epoch": 0.83, + "learning_rate": 1.6988019246292228e-06, + "loss": 0.7959, + "step": 32318 + }, + { + "epoch": 0.83, + "learning_rate": 1.6987821312647694e-06, + "loss": 0.6631, + "step": 32319 + }, + { + "epoch": 0.83, + "learning_rate": 1.6987623373652906e-06, + "loss": 0.8965, + "step": 32320 + }, + { + "epoch": 0.83, + "learning_rate": 1.6987425429308014e-06, + "loss": 0.8711, + "step": 32321 + }, + { + "epoch": 0.83, + "learning_rate": 1.6987227479613174e-06, + "loss": 0.8438, + "step": 32322 + }, + { + "epoch": 0.83, + "learning_rate": 1.6987029524568532e-06, + "loss": 0.873, + "step": 32323 + }, + { + "epoch": 0.83, + "learning_rate": 1.6986831564174246e-06, + "loss": 0.7769, + "step": 32324 + }, + { + "epoch": 0.83, + "learning_rate": 1.6986633598430463e-06, + "loss": 0.9033, + "step": 32325 + }, + { + "epoch": 0.83, + "learning_rate": 1.6986435627337336e-06, + "loss": 0.9961, + "step": 32326 + }, + { + "epoch": 0.83, + "learning_rate": 1.6986237650895016e-06, + "loss": 0.9014, + "step": 32327 + }, + { + "epoch": 0.83, + "learning_rate": 1.6986039669103657e-06, + "loss": 0.8301, + "step": 32328 + }, + { + "epoch": 0.83, + "learning_rate": 1.6985841681963406e-06, + "loss": 0.9033, + "step": 32329 + }, + { + "epoch": 0.83, + "learning_rate": 1.698564368947442e-06, + "loss": 0.8965, + "step": 32330 + }, + { + "epoch": 0.83, + "learning_rate": 1.6985445691636846e-06, + "loss": 0.9766, + "step": 32331 + }, + { + "epoch": 0.83, + "learning_rate": 1.698524768845084e-06, + "loss": 0.7666, + "step": 32332 + }, + { + "epoch": 0.83, + "learning_rate": 1.6985049679916545e-06, + "loss": 0.7681, + "step": 32333 + }, + { + "epoch": 0.83, + "learning_rate": 1.6984851666034126e-06, + "loss": 0.7793, + "step": 32334 + }, + { + "epoch": 0.83, + "learning_rate": 1.698465364680372e-06, + "loss": 0.834, + "step": 32335 + }, + { + "epoch": 0.83, + "learning_rate": 1.698445562222549e-06, + "loss": 0.8232, + "step": 32336 + }, + { + "epoch": 0.83, + "learning_rate": 1.6984257592299583e-06, + "loss": 0.8447, + "step": 32337 + }, + { + "epoch": 0.83, + "learning_rate": 1.6984059557026153e-06, + "loss": 0.6357, + "step": 32338 + }, + { + "epoch": 0.83, + "learning_rate": 1.698386151640535e-06, + "loss": 0.7979, + "step": 32339 + }, + { + "epoch": 0.83, + "learning_rate": 1.6983663470437322e-06, + "loss": 0.8574, + "step": 32340 + }, + { + "epoch": 0.83, + "learning_rate": 1.6983465419122226e-06, + "loss": 0.7104, + "step": 32341 + }, + { + "epoch": 0.83, + "learning_rate": 1.6983267362460213e-06, + "loss": 0.9609, + "step": 32342 + }, + { + "epoch": 0.83, + "learning_rate": 1.6983069300451427e-06, + "loss": 1.0723, + "step": 32343 + }, + { + "epoch": 0.83, + "learning_rate": 1.698287123309603e-06, + "loss": 0.8525, + "step": 32344 + }, + { + "epoch": 0.83, + "learning_rate": 1.6982673160394172e-06, + "loss": 0.6587, + "step": 32345 + }, + { + "epoch": 0.83, + "learning_rate": 1.6982475082346e-06, + "loss": 1.0449, + "step": 32346 + }, + { + "epoch": 0.83, + "learning_rate": 1.6982276998951668e-06, + "loss": 0.9092, + "step": 32347 + }, + { + "epoch": 0.83, + "learning_rate": 1.6982078910211329e-06, + "loss": 0.8237, + "step": 32348 + }, + { + "epoch": 0.83, + "learning_rate": 1.698188081612513e-06, + "loss": 0.6575, + "step": 32349 + }, + { + "epoch": 0.83, + "learning_rate": 1.6981682716693226e-06, + "loss": 0.4856, + "step": 32350 + }, + { + "epoch": 0.83, + "learning_rate": 1.698148461191577e-06, + "loss": 0.7871, + "step": 32351 + }, + { + "epoch": 0.83, + "learning_rate": 1.6981286501792913e-06, + "loss": 0.9355, + "step": 32352 + }, + { + "epoch": 0.83, + "learning_rate": 1.6981088386324807e-06, + "loss": 0.9824, + "step": 32353 + }, + { + "epoch": 0.83, + "learning_rate": 1.6980890265511598e-06, + "loss": 0.8032, + "step": 32354 + }, + { + "epoch": 0.83, + "learning_rate": 1.6980692139353445e-06, + "loss": 0.9258, + "step": 32355 + }, + { + "epoch": 0.83, + "learning_rate": 1.69804940078505e-06, + "loss": 1.0498, + "step": 32356 + }, + { + "epoch": 0.83, + "learning_rate": 1.6980295871002908e-06, + "loss": 0.9043, + "step": 32357 + }, + { + "epoch": 0.83, + "learning_rate": 1.6980097728810826e-06, + "loss": 0.9121, + "step": 32358 + }, + { + "epoch": 0.83, + "learning_rate": 1.6979899581274402e-06, + "loss": 0.6704, + "step": 32359 + }, + { + "epoch": 0.83, + "learning_rate": 1.6979701428393791e-06, + "loss": 0.792, + "step": 32360 + }, + { + "epoch": 0.83, + "learning_rate": 1.6979503270169144e-06, + "loss": 1.0654, + "step": 32361 + }, + { + "epoch": 0.83, + "learning_rate": 1.6979305106600612e-06, + "loss": 0.8213, + "step": 32362 + }, + { + "epoch": 0.83, + "learning_rate": 1.6979106937688349e-06, + "loss": 0.8652, + "step": 32363 + }, + { + "epoch": 0.83, + "learning_rate": 1.69789087634325e-06, + "loss": 0.6978, + "step": 32364 + }, + { + "epoch": 0.83, + "learning_rate": 1.6978710583833228e-06, + "loss": 1.0186, + "step": 32365 + }, + { + "epoch": 0.83, + "learning_rate": 1.6978512398890673e-06, + "loss": 0.7866, + "step": 32366 + }, + { + "epoch": 0.83, + "learning_rate": 1.6978314208604994e-06, + "loss": 0.7007, + "step": 32367 + }, + { + "epoch": 0.83, + "learning_rate": 1.697811601297634e-06, + "loss": 0.7207, + "step": 32368 + }, + { + "epoch": 0.83, + "learning_rate": 1.6977917812004864e-06, + "loss": 0.7422, + "step": 32369 + }, + { + "epoch": 0.83, + "learning_rate": 1.6977719605690717e-06, + "loss": 0.8359, + "step": 32370 + }, + { + "epoch": 0.83, + "learning_rate": 1.697752139403405e-06, + "loss": 0.9795, + "step": 32371 + }, + { + "epoch": 0.83, + "learning_rate": 1.6977323177035014e-06, + "loss": 0.9033, + "step": 32372 + }, + { + "epoch": 0.83, + "learning_rate": 1.6977124954693767e-06, + "loss": 0.8008, + "step": 32373 + }, + { + "epoch": 0.83, + "learning_rate": 1.6976926727010455e-06, + "loss": 0.814, + "step": 32374 + }, + { + "epoch": 0.83, + "learning_rate": 1.6976728493985228e-06, + "loss": 0.835, + "step": 32375 + }, + { + "epoch": 0.83, + "learning_rate": 1.6976530255618245e-06, + "loss": 1.0059, + "step": 32376 + }, + { + "epoch": 0.83, + "learning_rate": 1.697633201190965e-06, + "loss": 0.9214, + "step": 32377 + }, + { + "epoch": 0.83, + "learning_rate": 1.6976133762859601e-06, + "loss": 0.6667, + "step": 32378 + }, + { + "epoch": 0.83, + "learning_rate": 1.6975935508468245e-06, + "loss": 0.9092, + "step": 32379 + }, + { + "epoch": 0.83, + "learning_rate": 1.6975737248735737e-06, + "loss": 0.8506, + "step": 32380 + }, + { + "epoch": 0.83, + "learning_rate": 1.6975538983662229e-06, + "loss": 1.0098, + "step": 32381 + }, + { + "epoch": 0.83, + "learning_rate": 1.697534071324787e-06, + "loss": 0.7852, + "step": 32382 + }, + { + "epoch": 0.83, + "learning_rate": 1.697514243749281e-06, + "loss": 0.8506, + "step": 32383 + }, + { + "epoch": 0.83, + "learning_rate": 1.697494415639721e-06, + "loss": 0.439, + "step": 32384 + }, + { + "epoch": 0.83, + "learning_rate": 1.6974745869961213e-06, + "loss": 0.7764, + "step": 32385 + }, + { + "epoch": 0.83, + "learning_rate": 1.6974547578184974e-06, + "loss": 0.7871, + "step": 32386 + }, + { + "epoch": 0.83, + "learning_rate": 1.6974349281068648e-06, + "loss": 0.5645, + "step": 32387 + }, + { + "epoch": 0.83, + "learning_rate": 1.697415097861238e-06, + "loss": 0.7637, + "step": 32388 + }, + { + "epoch": 0.83, + "learning_rate": 1.6973952670816325e-06, + "loss": 0.8301, + "step": 32389 + }, + { + "epoch": 0.83, + "learning_rate": 1.6973754357680634e-06, + "loss": 0.9873, + "step": 32390 + }, + { + "epoch": 0.83, + "learning_rate": 1.6973556039205463e-06, + "loss": 0.8613, + "step": 32391 + }, + { + "epoch": 0.83, + "learning_rate": 1.6973357715390961e-06, + "loss": 0.7593, + "step": 32392 + }, + { + "epoch": 0.83, + "learning_rate": 1.6973159386237278e-06, + "loss": 1.0947, + "step": 32393 + }, + { + "epoch": 0.83, + "learning_rate": 1.6972961051744568e-06, + "loss": 0.5903, + "step": 32394 + }, + { + "epoch": 0.83, + "learning_rate": 1.6972762711912982e-06, + "loss": 0.9502, + "step": 32395 + }, + { + "epoch": 0.83, + "learning_rate": 1.6972564366742672e-06, + "loss": 0.9482, + "step": 32396 + }, + { + "epoch": 0.83, + "learning_rate": 1.6972366016233793e-06, + "loss": 0.8867, + "step": 32397 + }, + { + "epoch": 0.83, + "learning_rate": 1.697216766038649e-06, + "loss": 0.9453, + "step": 32398 + }, + { + "epoch": 0.83, + "learning_rate": 1.6971969299200919e-06, + "loss": 1.041, + "step": 32399 + }, + { + "epoch": 0.83, + "learning_rate": 1.6971770932677232e-06, + "loss": 0.8066, + "step": 32400 + }, + { + "epoch": 0.83, + "learning_rate": 1.6971572560815585e-06, + "loss": 0.958, + "step": 32401 + }, + { + "epoch": 0.83, + "learning_rate": 1.6971374183616121e-06, + "loss": 0.7461, + "step": 32402 + }, + { + "epoch": 0.83, + "learning_rate": 1.6971175801078993e-06, + "loss": 1.0215, + "step": 32403 + }, + { + "epoch": 0.83, + "learning_rate": 1.6970977413204364e-06, + "loss": 0.9463, + "step": 32404 + }, + { + "epoch": 0.83, + "learning_rate": 1.6970779019992372e-06, + "loss": 0.8574, + "step": 32405 + }, + { + "epoch": 0.83, + "learning_rate": 1.6970580621443178e-06, + "loss": 0.9648, + "step": 32406 + }, + { + "epoch": 0.83, + "learning_rate": 1.6970382217556934e-06, + "loss": 0.917, + "step": 32407 + }, + { + "epoch": 0.83, + "learning_rate": 1.6970183808333785e-06, + "loss": 0.8574, + "step": 32408 + }, + { + "epoch": 0.83, + "learning_rate": 1.6969985393773887e-06, + "loss": 0.7856, + "step": 32409 + }, + { + "epoch": 0.83, + "learning_rate": 1.6969786973877392e-06, + "loss": 0.9355, + "step": 32410 + }, + { + "epoch": 0.83, + "learning_rate": 1.6969588548644448e-06, + "loss": 0.8506, + "step": 32411 + }, + { + "epoch": 0.83, + "learning_rate": 1.6969390118075216e-06, + "loss": 0.834, + "step": 32412 + }, + { + "epoch": 0.83, + "learning_rate": 1.696919168216984e-06, + "loss": 0.833, + "step": 32413 + }, + { + "epoch": 0.83, + "learning_rate": 1.6968993240928476e-06, + "loss": 0.9414, + "step": 32414 + }, + { + "epoch": 0.83, + "learning_rate": 1.6968794794351272e-06, + "loss": 0.6855, + "step": 32415 + }, + { + "epoch": 0.83, + "learning_rate": 1.6968596342438382e-06, + "loss": 0.8672, + "step": 32416 + }, + { + "epoch": 0.83, + "learning_rate": 1.696839788518996e-06, + "loss": 1.1602, + "step": 32417 + }, + { + "epoch": 0.83, + "learning_rate": 1.6968199422606157e-06, + "loss": 0.7227, + "step": 32418 + }, + { + "epoch": 0.83, + "learning_rate": 1.6968000954687123e-06, + "loss": 0.7236, + "step": 32419 + }, + { + "epoch": 0.83, + "learning_rate": 1.696780248143301e-06, + "loss": 0.7363, + "step": 32420 + }, + { + "epoch": 0.83, + "learning_rate": 1.6967604002843972e-06, + "loss": 0.8301, + "step": 32421 + }, + { + "epoch": 0.83, + "learning_rate": 1.6967405518920161e-06, + "loss": 0.6475, + "step": 32422 + }, + { + "epoch": 0.83, + "learning_rate": 1.6967207029661727e-06, + "loss": 0.9497, + "step": 32423 + }, + { + "epoch": 0.83, + "learning_rate": 1.6967008535068823e-06, + "loss": 0.8315, + "step": 32424 + }, + { + "epoch": 0.83, + "learning_rate": 1.6966810035141598e-06, + "loss": 0.9717, + "step": 32425 + }, + { + "epoch": 0.83, + "learning_rate": 1.696661152988021e-06, + "loss": 0.8223, + "step": 32426 + }, + { + "epoch": 0.83, + "learning_rate": 1.6966413019284809e-06, + "loss": 0.625, + "step": 32427 + }, + { + "epoch": 0.83, + "learning_rate": 1.6966214503355545e-06, + "loss": 0.7445, + "step": 32428 + }, + { + "epoch": 0.83, + "learning_rate": 1.696601598209257e-06, + "loss": 0.9512, + "step": 32429 + }, + { + "epoch": 0.83, + "learning_rate": 1.6965817455496036e-06, + "loss": 0.8232, + "step": 32430 + }, + { + "epoch": 0.83, + "learning_rate": 1.6965618923566098e-06, + "loss": 0.7329, + "step": 32431 + }, + { + "epoch": 0.83, + "learning_rate": 1.6965420386302903e-06, + "loss": 0.7134, + "step": 32432 + }, + { + "epoch": 0.83, + "learning_rate": 1.696522184370661e-06, + "loss": 0.6416, + "step": 32433 + }, + { + "epoch": 0.83, + "learning_rate": 1.6965023295777362e-06, + "loss": 0.8672, + "step": 32434 + }, + { + "epoch": 0.83, + "learning_rate": 1.696482474251532e-06, + "loss": 0.8955, + "step": 32435 + }, + { + "epoch": 0.83, + "learning_rate": 1.696462618392063e-06, + "loss": 0.7227, + "step": 32436 + }, + { + "epoch": 0.83, + "learning_rate": 1.6964427619993447e-06, + "loss": 0.9277, + "step": 32437 + }, + { + "epoch": 0.83, + "learning_rate": 1.6964229050733922e-06, + "loss": 0.6787, + "step": 32438 + }, + { + "epoch": 0.83, + "learning_rate": 1.6964030476142206e-06, + "loss": 1.041, + "step": 32439 + }, + { + "epoch": 0.83, + "learning_rate": 1.6963831896218453e-06, + "loss": 0.6553, + "step": 32440 + }, + { + "epoch": 0.83, + "learning_rate": 1.6963633310962812e-06, + "loss": 0.7954, + "step": 32441 + }, + { + "epoch": 0.83, + "learning_rate": 1.6963434720375442e-06, + "loss": 0.7744, + "step": 32442 + }, + { + "epoch": 0.83, + "learning_rate": 1.6963236124456487e-06, + "loss": 0.833, + "step": 32443 + }, + { + "epoch": 0.83, + "learning_rate": 1.69630375232061e-06, + "loss": 0.8818, + "step": 32444 + }, + { + "epoch": 0.83, + "learning_rate": 1.696283891662444e-06, + "loss": 0.783, + "step": 32445 + }, + { + "epoch": 0.83, + "learning_rate": 1.6962640304711654e-06, + "loss": 0.9336, + "step": 32446 + }, + { + "epoch": 0.83, + "learning_rate": 1.696244168746789e-06, + "loss": 0.9375, + "step": 32447 + }, + { + "epoch": 0.83, + "learning_rate": 1.6962243064893308e-06, + "loss": 1.0742, + "step": 32448 + }, + { + "epoch": 0.83, + "learning_rate": 1.6962044436988054e-06, + "loss": 0.7729, + "step": 32449 + }, + { + "epoch": 0.83, + "learning_rate": 1.6961845803752283e-06, + "loss": 0.8115, + "step": 32450 + }, + { + "epoch": 0.83, + "learning_rate": 1.696164716518615e-06, + "loss": 0.9619, + "step": 32451 + }, + { + "epoch": 0.83, + "learning_rate": 1.6961448521289805e-06, + "loss": 1.0195, + "step": 32452 + }, + { + "epoch": 0.83, + "learning_rate": 1.6961249872063394e-06, + "loss": 0.8789, + "step": 32453 + }, + { + "epoch": 0.83, + "learning_rate": 1.6961051217507077e-06, + "loss": 0.7451, + "step": 32454 + }, + { + "epoch": 0.83, + "learning_rate": 1.6960852557621002e-06, + "loss": 0.644, + "step": 32455 + }, + { + "epoch": 0.83, + "learning_rate": 1.696065389240532e-06, + "loss": 0.8047, + "step": 32456 + }, + { + "epoch": 0.83, + "learning_rate": 1.6960455221860191e-06, + "loss": 0.9346, + "step": 32457 + }, + { + "epoch": 0.83, + "learning_rate": 1.6960256545985758e-06, + "loss": 0.7788, + "step": 32458 + }, + { + "epoch": 0.83, + "learning_rate": 1.6960057864782176e-06, + "loss": 0.9326, + "step": 32459 + }, + { + "epoch": 0.83, + "learning_rate": 1.69598591782496e-06, + "loss": 0.5102, + "step": 32460 + }, + { + "epoch": 0.83, + "learning_rate": 1.6959660486388177e-06, + "loss": 0.8799, + "step": 32461 + }, + { + "epoch": 0.83, + "learning_rate": 1.6959461789198066e-06, + "loss": 0.5645, + "step": 32462 + }, + { + "epoch": 0.83, + "learning_rate": 1.695926308667941e-06, + "loss": 0.8301, + "step": 32463 + }, + { + "epoch": 0.83, + "learning_rate": 1.6959064378832371e-06, + "loss": 0.8379, + "step": 32464 + }, + { + "epoch": 0.83, + "learning_rate": 1.6958865665657093e-06, + "loss": 0.6826, + "step": 32465 + }, + { + "epoch": 0.83, + "learning_rate": 1.6958666947153734e-06, + "loss": 0.8096, + "step": 32466 + }, + { + "epoch": 0.83, + "learning_rate": 1.6958468223322444e-06, + "loss": 0.6465, + "step": 32467 + }, + { + "epoch": 0.83, + "learning_rate": 1.6958269494163374e-06, + "loss": 0.8398, + "step": 32468 + }, + { + "epoch": 0.83, + "learning_rate": 1.6958070759676675e-06, + "loss": 1.0303, + "step": 32469 + }, + { + "epoch": 0.83, + "learning_rate": 1.69578720198625e-06, + "loss": 0.9414, + "step": 32470 + }, + { + "epoch": 0.83, + "learning_rate": 1.6957673274721005e-06, + "loss": 0.9902, + "step": 32471 + }, + { + "epoch": 0.83, + "learning_rate": 1.695747452425234e-06, + "loss": 0.9766, + "step": 32472 + }, + { + "epoch": 0.83, + "learning_rate": 1.6957275768456656e-06, + "loss": 1.0557, + "step": 32473 + }, + { + "epoch": 0.83, + "learning_rate": 1.6957077007334108e-06, + "loss": 0.8438, + "step": 32474 + }, + { + "epoch": 0.83, + "learning_rate": 1.6956878240884842e-06, + "loss": 0.9668, + "step": 32475 + }, + { + "epoch": 0.83, + "learning_rate": 1.6956679469109017e-06, + "loss": 0.9092, + "step": 32476 + }, + { + "epoch": 0.83, + "learning_rate": 1.6956480692006783e-06, + "loss": 0.8086, + "step": 32477 + }, + { + "epoch": 0.83, + "learning_rate": 1.695628190957829e-06, + "loss": 0.5361, + "step": 32478 + }, + { + "epoch": 0.83, + "learning_rate": 1.6956083121823692e-06, + "loss": 0.6602, + "step": 32479 + }, + { + "epoch": 0.83, + "learning_rate": 1.695588432874314e-06, + "loss": 0.8027, + "step": 32480 + }, + { + "epoch": 0.83, + "learning_rate": 1.6955685530336787e-06, + "loss": 0.9365, + "step": 32481 + }, + { + "epoch": 0.83, + "learning_rate": 1.6955486726604789e-06, + "loss": 0.8486, + "step": 32482 + }, + { + "epoch": 0.83, + "learning_rate": 1.6955287917547293e-06, + "loss": 0.8398, + "step": 32483 + }, + { + "epoch": 0.83, + "learning_rate": 1.695508910316445e-06, + "loss": 0.73, + "step": 32484 + }, + { + "epoch": 0.83, + "learning_rate": 1.6954890283456417e-06, + "loss": 0.6985, + "step": 32485 + }, + { + "epoch": 0.83, + "learning_rate": 1.6954691458423346e-06, + "loss": 0.8955, + "step": 32486 + }, + { + "epoch": 0.83, + "learning_rate": 1.6954492628065385e-06, + "loss": 0.7969, + "step": 32487 + }, + { + "epoch": 0.83, + "learning_rate": 1.695429379238269e-06, + "loss": 0.7515, + "step": 32488 + }, + { + "epoch": 0.83, + "learning_rate": 1.6954094951375411e-06, + "loss": 0.8447, + "step": 32489 + }, + { + "epoch": 0.83, + "learning_rate": 1.6953896105043701e-06, + "loss": 1.0205, + "step": 32490 + }, + { + "epoch": 0.83, + "learning_rate": 1.6953697253387715e-06, + "loss": 0.8423, + "step": 32491 + }, + { + "epoch": 0.83, + "learning_rate": 1.6953498396407603e-06, + "loss": 0.8643, + "step": 32492 + }, + { + "epoch": 0.83, + "learning_rate": 1.6953299534103513e-06, + "loss": 0.7881, + "step": 32493 + }, + { + "epoch": 0.83, + "learning_rate": 1.6953100666475605e-06, + "loss": 0.8828, + "step": 32494 + }, + { + "epoch": 0.83, + "learning_rate": 1.6952901793524025e-06, + "loss": 0.8262, + "step": 32495 + }, + { + "epoch": 0.83, + "learning_rate": 1.6952702915248928e-06, + "loss": 0.8726, + "step": 32496 + }, + { + "epoch": 0.83, + "learning_rate": 1.6952504031650468e-06, + "loss": 0.6685, + "step": 32497 + }, + { + "epoch": 0.83, + "learning_rate": 1.6952305142728793e-06, + "loss": 0.9209, + "step": 32498 + }, + { + "epoch": 0.83, + "learning_rate": 1.695210624848406e-06, + "loss": 0.8359, + "step": 32499 + }, + { + "epoch": 0.83, + "learning_rate": 1.6951907348916419e-06, + "loss": 0.8029, + "step": 32500 + }, + { + "epoch": 0.83, + "learning_rate": 1.695170844402602e-06, + "loss": 0.877, + "step": 32501 + }, + { + "epoch": 0.83, + "learning_rate": 1.695150953381302e-06, + "loss": 0.5042, + "step": 32502 + }, + { + "epoch": 0.83, + "learning_rate": 1.6951310618277566e-06, + "loss": 0.9033, + "step": 32503 + }, + { + "epoch": 0.83, + "learning_rate": 1.6951111697419816e-06, + "loss": 0.6904, + "step": 32504 + }, + { + "epoch": 0.83, + "learning_rate": 1.6950912771239917e-06, + "loss": 0.6943, + "step": 32505 + }, + { + "epoch": 0.83, + "learning_rate": 1.6950713839738024e-06, + "loss": 0.7197, + "step": 32506 + }, + { + "epoch": 0.83, + "learning_rate": 1.695051490291429e-06, + "loss": 0.6885, + "step": 32507 + }, + { + "epoch": 0.83, + "learning_rate": 1.6950315960768866e-06, + "loss": 0.7842, + "step": 32508 + }, + { + "epoch": 0.83, + "learning_rate": 1.6950117013301902e-06, + "loss": 0.9268, + "step": 32509 + }, + { + "epoch": 0.83, + "learning_rate": 1.6949918060513558e-06, + "loss": 0.7417, + "step": 32510 + }, + { + "epoch": 0.83, + "learning_rate": 1.694971910240398e-06, + "loss": 0.9336, + "step": 32511 + }, + { + "epoch": 0.83, + "learning_rate": 1.6949520138973318e-06, + "loss": 0.9326, + "step": 32512 + }, + { + "epoch": 0.83, + "learning_rate": 1.694932117022173e-06, + "loss": 0.5508, + "step": 32513 + }, + { + "epoch": 0.83, + "learning_rate": 1.6949122196149368e-06, + "loss": 0.5701, + "step": 32514 + }, + { + "epoch": 0.83, + "learning_rate": 1.6948923216756382e-06, + "loss": 1.0352, + "step": 32515 + }, + { + "epoch": 0.83, + "learning_rate": 1.6948724232042924e-06, + "loss": 1.0107, + "step": 32516 + }, + { + "epoch": 0.83, + "learning_rate": 1.6948525242009147e-06, + "loss": 0.8193, + "step": 32517 + }, + { + "epoch": 0.83, + "learning_rate": 1.6948326246655204e-06, + "loss": 0.7593, + "step": 32518 + }, + { + "epoch": 0.83, + "learning_rate": 1.6948127245981247e-06, + "loss": 0.96, + "step": 32519 + }, + { + "epoch": 0.83, + "learning_rate": 1.694792823998743e-06, + "loss": 0.9023, + "step": 32520 + }, + { + "epoch": 0.83, + "learning_rate": 1.6947729228673904e-06, + "loss": 0.5811, + "step": 32521 + }, + { + "epoch": 0.83, + "learning_rate": 1.694753021204082e-06, + "loss": 0.7451, + "step": 32522 + }, + { + "epoch": 0.83, + "learning_rate": 1.6947331190088333e-06, + "loss": 0.751, + "step": 32523 + }, + { + "epoch": 0.83, + "learning_rate": 1.6947132162816591e-06, + "loss": 0.8633, + "step": 32524 + }, + { + "epoch": 0.83, + "learning_rate": 1.6946933130225752e-06, + "loss": 1.0264, + "step": 32525 + }, + { + "epoch": 0.83, + "learning_rate": 1.6946734092315964e-06, + "loss": 0.7637, + "step": 32526 + }, + { + "epoch": 0.83, + "learning_rate": 1.6946535049087382e-06, + "loss": 1.0039, + "step": 32527 + }, + { + "epoch": 0.83, + "learning_rate": 1.6946336000540159e-06, + "loss": 0.7178, + "step": 32528 + }, + { + "epoch": 0.83, + "learning_rate": 1.6946136946674443e-06, + "loss": 0.8848, + "step": 32529 + }, + { + "epoch": 0.83, + "learning_rate": 1.694593788749039e-06, + "loss": 0.8594, + "step": 32530 + }, + { + "epoch": 0.83, + "learning_rate": 1.6945738822988152e-06, + "loss": 0.6758, + "step": 32531 + }, + { + "epoch": 0.83, + "learning_rate": 1.694553975316788e-06, + "loss": 0.8647, + "step": 32532 + }, + { + "epoch": 0.83, + "learning_rate": 1.6945340678029729e-06, + "loss": 1.0186, + "step": 32533 + }, + { + "epoch": 0.83, + "learning_rate": 1.6945141597573851e-06, + "loss": 0.8086, + "step": 32534 + }, + { + "epoch": 0.83, + "learning_rate": 1.6944942511800394e-06, + "loss": 0.9277, + "step": 32535 + }, + { + "epoch": 0.83, + "learning_rate": 1.694474342070952e-06, + "loss": 0.7588, + "step": 32536 + }, + { + "epoch": 0.83, + "learning_rate": 1.6944544324301372e-06, + "loss": 1.0303, + "step": 32537 + }, + { + "epoch": 0.83, + "learning_rate": 1.6944345222576104e-06, + "loss": 0.915, + "step": 32538 + }, + { + "epoch": 0.83, + "learning_rate": 1.6944146115533872e-06, + "loss": 0.6445, + "step": 32539 + }, + { + "epoch": 0.83, + "learning_rate": 1.6943947003174826e-06, + "loss": 0.6758, + "step": 32540 + }, + { + "epoch": 0.83, + "learning_rate": 1.6943747885499118e-06, + "loss": 0.749, + "step": 32541 + }, + { + "epoch": 0.83, + "learning_rate": 1.6943548762506904e-06, + "loss": 0.7026, + "step": 32542 + }, + { + "epoch": 0.83, + "learning_rate": 1.6943349634198333e-06, + "loss": 0.8047, + "step": 32543 + }, + { + "epoch": 0.83, + "learning_rate": 1.6943150500573558e-06, + "loss": 0.7705, + "step": 32544 + }, + { + "epoch": 0.83, + "learning_rate": 1.6942951361632732e-06, + "loss": 0.8511, + "step": 32545 + }, + { + "epoch": 0.83, + "learning_rate": 1.6942752217376008e-06, + "loss": 0.8447, + "step": 32546 + }, + { + "epoch": 0.83, + "learning_rate": 1.6942553067803538e-06, + "loss": 0.6807, + "step": 32547 + }, + { + "epoch": 0.83, + "learning_rate": 1.6942353912915474e-06, + "loss": 0.8936, + "step": 32548 + }, + { + "epoch": 0.83, + "learning_rate": 1.6942154752711968e-06, + "loss": 0.874, + "step": 32549 + }, + { + "epoch": 0.83, + "learning_rate": 1.6941955587193173e-06, + "loss": 0.8142, + "step": 32550 + }, + { + "epoch": 0.83, + "learning_rate": 1.6941756416359242e-06, + "loss": 0.8174, + "step": 32551 + }, + { + "epoch": 0.83, + "learning_rate": 1.6941557240210328e-06, + "loss": 0.8535, + "step": 32552 + }, + { + "epoch": 0.83, + "learning_rate": 1.6941358058746583e-06, + "loss": 0.9795, + "step": 32553 + }, + { + "epoch": 0.83, + "learning_rate": 1.6941158871968159e-06, + "loss": 0.8047, + "step": 32554 + }, + { + "epoch": 0.83, + "learning_rate": 1.694095967987521e-06, + "loss": 0.8359, + "step": 32555 + }, + { + "epoch": 0.83, + "learning_rate": 1.6940760482467887e-06, + "loss": 0.9775, + "step": 32556 + }, + { + "epoch": 0.83, + "learning_rate": 1.6940561279746342e-06, + "loss": 0.8145, + "step": 32557 + }, + { + "epoch": 0.83, + "learning_rate": 1.6940362071710729e-06, + "loss": 0.8857, + "step": 32558 + }, + { + "epoch": 0.83, + "learning_rate": 1.6940162858361195e-06, + "loss": 0.8945, + "step": 32559 + }, + { + "epoch": 0.83, + "learning_rate": 1.6939963639697903e-06, + "loss": 0.793, + "step": 32560 + }, + { + "epoch": 0.83, + "learning_rate": 1.6939764415720998e-06, + "loss": 0.8169, + "step": 32561 + }, + { + "epoch": 0.83, + "learning_rate": 1.6939565186430636e-06, + "loss": 0.9189, + "step": 32562 + }, + { + "epoch": 0.83, + "learning_rate": 1.6939365951826966e-06, + "loss": 0.752, + "step": 32563 + }, + { + "epoch": 0.83, + "learning_rate": 1.6939166711910144e-06, + "loss": 0.8604, + "step": 32564 + }, + { + "epoch": 0.83, + "learning_rate": 1.6938967466680323e-06, + "loss": 0.959, + "step": 32565 + }, + { + "epoch": 0.83, + "learning_rate": 1.6938768216137648e-06, + "loss": 0.8018, + "step": 32566 + }, + { + "epoch": 0.83, + "learning_rate": 1.6938568960282286e-06, + "loss": 0.7383, + "step": 32567 + }, + { + "epoch": 0.83, + "learning_rate": 1.6938369699114375e-06, + "loss": 0.8379, + "step": 32568 + }, + { + "epoch": 0.83, + "learning_rate": 1.6938170432634072e-06, + "loss": 0.7842, + "step": 32569 + }, + { + "epoch": 0.83, + "learning_rate": 1.6937971160841533e-06, + "loss": 0.9688, + "step": 32570 + }, + { + "epoch": 0.83, + "learning_rate": 1.6937771883736906e-06, + "loss": 0.9102, + "step": 32571 + }, + { + "epoch": 0.83, + "learning_rate": 1.693757260132035e-06, + "loss": 0.8286, + "step": 32572 + }, + { + "epoch": 0.83, + "learning_rate": 1.6937373313592015e-06, + "loss": 0.7295, + "step": 32573 + }, + { + "epoch": 0.83, + "learning_rate": 1.6937174020552047e-06, + "loss": 0.8594, + "step": 32574 + }, + { + "epoch": 0.83, + "learning_rate": 1.6936974722200606e-06, + "loss": 1.043, + "step": 32575 + }, + { + "epoch": 0.83, + "learning_rate": 1.6936775418537842e-06, + "loss": 0.874, + "step": 32576 + }, + { + "epoch": 0.83, + "learning_rate": 1.693657610956391e-06, + "loss": 0.7769, + "step": 32577 + }, + { + "epoch": 0.83, + "learning_rate": 1.6936376795278959e-06, + "loss": 0.7236, + "step": 32578 + }, + { + "epoch": 0.84, + "learning_rate": 1.6936177475683143e-06, + "loss": 0.8418, + "step": 32579 + }, + { + "epoch": 0.84, + "learning_rate": 1.6935978150776613e-06, + "loss": 0.876, + "step": 32580 + }, + { + "epoch": 0.84, + "learning_rate": 1.6935778820559527e-06, + "loss": 0.8398, + "step": 32581 + }, + { + "epoch": 0.84, + "learning_rate": 1.6935579485032035e-06, + "loss": 0.8818, + "step": 32582 + }, + { + "epoch": 0.84, + "learning_rate": 1.6935380144194285e-06, + "loss": 0.8472, + "step": 32583 + }, + { + "epoch": 0.84, + "learning_rate": 1.6935180798046434e-06, + "loss": 0.9492, + "step": 32584 + }, + { + "epoch": 0.84, + "learning_rate": 1.6934981446588635e-06, + "loss": 0.9355, + "step": 32585 + }, + { + "epoch": 0.84, + "learning_rate": 1.693478208982104e-06, + "loss": 0.9341, + "step": 32586 + }, + { + "epoch": 0.84, + "learning_rate": 1.69345827277438e-06, + "loss": 0.6836, + "step": 32587 + }, + { + "epoch": 0.84, + "learning_rate": 1.6934383360357072e-06, + "loss": 0.9756, + "step": 32588 + }, + { + "epoch": 0.84, + "learning_rate": 1.6934183987661002e-06, + "loss": 0.8457, + "step": 32589 + }, + { + "epoch": 0.84, + "learning_rate": 1.6933984609655747e-06, + "loss": 0.793, + "step": 32590 + }, + { + "epoch": 0.84, + "learning_rate": 1.6933785226341458e-06, + "loss": 0.7036, + "step": 32591 + }, + { + "epoch": 0.84, + "learning_rate": 1.6933585837718289e-06, + "loss": 0.7363, + "step": 32592 + }, + { + "epoch": 0.84, + "learning_rate": 1.6933386443786396e-06, + "loss": 0.8477, + "step": 32593 + }, + { + "epoch": 0.84, + "learning_rate": 1.693318704454592e-06, + "loss": 1.0586, + "step": 32594 + }, + { + "epoch": 0.84, + "learning_rate": 1.6932987639997028e-06, + "loss": 0.5798, + "step": 32595 + }, + { + "epoch": 0.84, + "learning_rate": 1.6932788230139863e-06, + "loss": 0.9023, + "step": 32596 + }, + { + "epoch": 0.84, + "learning_rate": 1.6932588814974582e-06, + "loss": 1.0205, + "step": 32597 + }, + { + "epoch": 0.84, + "learning_rate": 1.6932389394501337e-06, + "loss": 0.6011, + "step": 32598 + }, + { + "epoch": 0.84, + "learning_rate": 1.6932189968720279e-06, + "loss": 0.6641, + "step": 32599 + }, + { + "epoch": 0.84, + "learning_rate": 1.6931990537631564e-06, + "loss": 0.8779, + "step": 32600 + }, + { + "epoch": 0.84, + "learning_rate": 1.693179110123534e-06, + "loss": 0.8223, + "step": 32601 + }, + { + "epoch": 0.84, + "learning_rate": 1.6931591659531763e-06, + "loss": 0.7847, + "step": 32602 + }, + { + "epoch": 0.84, + "learning_rate": 1.6931392212520986e-06, + "loss": 0.8242, + "step": 32603 + }, + { + "epoch": 0.84, + "learning_rate": 1.6931192760203159e-06, + "loss": 0.6538, + "step": 32604 + }, + { + "epoch": 0.84, + "learning_rate": 1.6930993302578439e-06, + "loss": 1.0166, + "step": 32605 + }, + { + "epoch": 0.84, + "learning_rate": 1.6930793839646973e-06, + "loss": 0.7764, + "step": 32606 + }, + { + "epoch": 0.84, + "learning_rate": 1.6930594371408917e-06, + "loss": 0.8213, + "step": 32607 + }, + { + "epoch": 0.84, + "learning_rate": 1.6930394897864427e-06, + "loss": 1.0322, + "step": 32608 + }, + { + "epoch": 0.84, + "learning_rate": 1.693019541901365e-06, + "loss": 1.2217, + "step": 32609 + }, + { + "epoch": 0.84, + "learning_rate": 1.692999593485674e-06, + "loss": 0.7891, + "step": 32610 + }, + { + "epoch": 0.84, + "learning_rate": 1.692979644539385e-06, + "loss": 0.8867, + "step": 32611 + }, + { + "epoch": 0.84, + "learning_rate": 1.6929596950625137e-06, + "loss": 1.1074, + "step": 32612 + }, + { + "epoch": 0.84, + "learning_rate": 1.692939745055075e-06, + "loss": 0.8477, + "step": 32613 + }, + { + "epoch": 0.84, + "learning_rate": 1.6929197945170841e-06, + "loss": 0.8271, + "step": 32614 + }, + { + "epoch": 0.84, + "learning_rate": 1.6928998434485563e-06, + "loss": 0.9463, + "step": 32615 + }, + { + "epoch": 0.84, + "learning_rate": 1.692879891849507e-06, + "loss": 0.7681, + "step": 32616 + }, + { + "epoch": 0.84, + "learning_rate": 1.6928599397199515e-06, + "loss": 0.6245, + "step": 32617 + }, + { + "epoch": 0.84, + "learning_rate": 1.6928399870599052e-06, + "loss": 0.8633, + "step": 32618 + }, + { + "epoch": 0.84, + "learning_rate": 1.6928200338693826e-06, + "loss": 0.9141, + "step": 32619 + }, + { + "epoch": 0.84, + "learning_rate": 1.6928000801484e-06, + "loss": 0.7495, + "step": 32620 + }, + { + "epoch": 0.84, + "learning_rate": 1.6927801258969718e-06, + "loss": 0.6797, + "step": 32621 + }, + { + "epoch": 0.84, + "learning_rate": 1.6927601711151143e-06, + "loss": 0.9307, + "step": 32622 + }, + { + "epoch": 0.84, + "learning_rate": 1.692740215802842e-06, + "loss": 0.5938, + "step": 32623 + }, + { + "epoch": 0.84, + "learning_rate": 1.6927202599601699e-06, + "loss": 0.7573, + "step": 32624 + }, + { + "epoch": 0.84, + "learning_rate": 1.6927003035871144e-06, + "loss": 0.6396, + "step": 32625 + }, + { + "epoch": 0.84, + "learning_rate": 1.6926803466836896e-06, + "loss": 0.9355, + "step": 32626 + }, + { + "epoch": 0.84, + "learning_rate": 1.6926603892499119e-06, + "loss": 1.0977, + "step": 32627 + }, + { + "epoch": 0.84, + "learning_rate": 1.6926404312857954e-06, + "loss": 0.5513, + "step": 32628 + }, + { + "epoch": 0.84, + "learning_rate": 1.6926204727913562e-06, + "loss": 0.7222, + "step": 32629 + }, + { + "epoch": 0.84, + "learning_rate": 1.6926005137666092e-06, + "loss": 1.1328, + "step": 32630 + }, + { + "epoch": 0.84, + "learning_rate": 1.69258055421157e-06, + "loss": 0.6992, + "step": 32631 + }, + { + "epoch": 0.84, + "learning_rate": 1.692560594126254e-06, + "loss": 1.0674, + "step": 32632 + }, + { + "epoch": 0.84, + "learning_rate": 1.692540633510676e-06, + "loss": 0.7119, + "step": 32633 + }, + { + "epoch": 0.84, + "learning_rate": 1.6925206723648513e-06, + "loss": 0.9014, + "step": 32634 + }, + { + "epoch": 0.84, + "learning_rate": 1.6925007106887955e-06, + "loss": 0.8447, + "step": 32635 + }, + { + "epoch": 0.84, + "learning_rate": 1.6924807484825237e-06, + "loss": 1.0742, + "step": 32636 + }, + { + "epoch": 0.84, + "learning_rate": 1.6924607857460514e-06, + "loss": 0.811, + "step": 32637 + }, + { + "epoch": 0.84, + "learning_rate": 1.6924408224793933e-06, + "loss": 0.8398, + "step": 32638 + }, + { + "epoch": 0.84, + "learning_rate": 1.6924208586825651e-06, + "loss": 0.8789, + "step": 32639 + }, + { + "epoch": 0.84, + "learning_rate": 1.6924008943555825e-06, + "loss": 0.7852, + "step": 32640 + }, + { + "epoch": 0.84, + "learning_rate": 1.6923809294984603e-06, + "loss": 0.6685, + "step": 32641 + }, + { + "epoch": 0.84, + "learning_rate": 1.6923609641112137e-06, + "loss": 0.7725, + "step": 32642 + }, + { + "epoch": 0.84, + "learning_rate": 1.6923409981938583e-06, + "loss": 0.8467, + "step": 32643 + }, + { + "epoch": 0.84, + "learning_rate": 1.692321031746409e-06, + "loss": 0.8252, + "step": 32644 + }, + { + "epoch": 0.84, + "learning_rate": 1.6923010647688818e-06, + "loss": 0.8311, + "step": 32645 + }, + { + "epoch": 0.84, + "learning_rate": 1.692281097261291e-06, + "loss": 1.1221, + "step": 32646 + }, + { + "epoch": 0.84, + "learning_rate": 1.6922611292236527e-06, + "loss": 0.8213, + "step": 32647 + }, + { + "epoch": 0.84, + "learning_rate": 1.6922411606559816e-06, + "loss": 0.9199, + "step": 32648 + }, + { + "epoch": 0.84, + "learning_rate": 1.6922211915582936e-06, + "loss": 0.6226, + "step": 32649 + }, + { + "epoch": 0.84, + "learning_rate": 1.6922012219306035e-06, + "loss": 1.0371, + "step": 32650 + }, + { + "epoch": 0.84, + "learning_rate": 1.6921812517729266e-06, + "loss": 0.8081, + "step": 32651 + }, + { + "epoch": 0.84, + "learning_rate": 1.6921612810852786e-06, + "loss": 0.7993, + "step": 32652 + }, + { + "epoch": 0.84, + "learning_rate": 1.6921413098676744e-06, + "loss": 0.7378, + "step": 32653 + }, + { + "epoch": 0.84, + "learning_rate": 1.6921213381201294e-06, + "loss": 1.001, + "step": 32654 + }, + { + "epoch": 0.84, + "learning_rate": 1.692101365842659e-06, + "loss": 0.835, + "step": 32655 + }, + { + "epoch": 0.84, + "learning_rate": 1.6920813930352785e-06, + "loss": 0.791, + "step": 32656 + }, + { + "epoch": 0.84, + "learning_rate": 1.692061419698003e-06, + "loss": 0.8696, + "step": 32657 + }, + { + "epoch": 0.84, + "learning_rate": 1.6920414458308478e-06, + "loss": 0.7393, + "step": 32658 + }, + { + "epoch": 0.84, + "learning_rate": 1.6920214714338284e-06, + "loss": 1.0811, + "step": 32659 + }, + { + "epoch": 0.84, + "learning_rate": 1.6920014965069598e-06, + "loss": 0.9404, + "step": 32660 + }, + { + "epoch": 0.84, + "learning_rate": 1.6919815210502577e-06, + "loss": 0.4829, + "step": 32661 + }, + { + "epoch": 0.84, + "learning_rate": 1.6919615450637371e-06, + "loss": 0.9502, + "step": 32662 + }, + { + "epoch": 0.84, + "learning_rate": 1.6919415685474135e-06, + "loss": 0.9092, + "step": 32663 + }, + { + "epoch": 0.84, + "learning_rate": 1.6919215915013015e-06, + "loss": 0.8848, + "step": 32664 + }, + { + "epoch": 0.84, + "learning_rate": 1.6919016139254177e-06, + "loss": 0.677, + "step": 32665 + }, + { + "epoch": 0.84, + "learning_rate": 1.6918816358197763e-06, + "loss": 0.8066, + "step": 32666 + }, + { + "epoch": 0.84, + "learning_rate": 1.691861657184393e-06, + "loss": 0.9316, + "step": 32667 + }, + { + "epoch": 0.84, + "learning_rate": 1.6918416780192825e-06, + "loss": 0.7729, + "step": 32668 + }, + { + "epoch": 0.84, + "learning_rate": 1.6918216983244612e-06, + "loss": 0.7424, + "step": 32669 + }, + { + "epoch": 0.84, + "learning_rate": 1.6918017180999437e-06, + "loss": 0.9834, + "step": 32670 + }, + { + "epoch": 0.84, + "learning_rate": 1.6917817373457457e-06, + "loss": 0.8486, + "step": 32671 + }, + { + "epoch": 0.84, + "learning_rate": 1.691761756061882e-06, + "loss": 0.7158, + "step": 32672 + }, + { + "epoch": 0.84, + "learning_rate": 1.6917417742483682e-06, + "loss": 1.0215, + "step": 32673 + }, + { + "epoch": 0.84, + "learning_rate": 1.6917217919052194e-06, + "loss": 0.9209, + "step": 32674 + }, + { + "epoch": 0.84, + "learning_rate": 1.691701809032451e-06, + "loss": 0.8516, + "step": 32675 + }, + { + "epoch": 0.84, + "learning_rate": 1.6916818256300787e-06, + "loss": 0.6421, + "step": 32676 + }, + { + "epoch": 0.84, + "learning_rate": 1.6916618416981171e-06, + "loss": 0.7856, + "step": 32677 + }, + { + "epoch": 0.84, + "learning_rate": 1.6916418572365817e-06, + "loss": 0.833, + "step": 32678 + }, + { + "epoch": 0.84, + "learning_rate": 1.6916218722454883e-06, + "loss": 0.6514, + "step": 32679 + }, + { + "epoch": 0.84, + "learning_rate": 1.6916018867248515e-06, + "loss": 1.0576, + "step": 32680 + }, + { + "epoch": 0.84, + "learning_rate": 1.6915819006746874e-06, + "loss": 1.0625, + "step": 32681 + }, + { + "epoch": 0.84, + "learning_rate": 1.6915619140950106e-06, + "loss": 0.6445, + "step": 32682 + }, + { + "epoch": 0.84, + "learning_rate": 1.6915419269858365e-06, + "loss": 0.7544, + "step": 32683 + }, + { + "epoch": 0.84, + "learning_rate": 1.6915219393471807e-06, + "loss": 0.8557, + "step": 32684 + }, + { + "epoch": 0.84, + "learning_rate": 1.6915019511790583e-06, + "loss": 0.5503, + "step": 32685 + }, + { + "epoch": 0.84, + "learning_rate": 1.6914819624814847e-06, + "loss": 0.7061, + "step": 32686 + }, + { + "epoch": 0.84, + "learning_rate": 1.691461973254475e-06, + "loss": 0.7959, + "step": 32687 + }, + { + "epoch": 0.84, + "learning_rate": 1.6914419834980447e-06, + "loss": 0.8188, + "step": 32688 + }, + { + "epoch": 0.84, + "learning_rate": 1.6914219932122091e-06, + "loss": 0.7051, + "step": 32689 + }, + { + "epoch": 0.84, + "learning_rate": 1.6914020023969835e-06, + "loss": 0.7407, + "step": 32690 + }, + { + "epoch": 0.84, + "learning_rate": 1.6913820110523834e-06, + "loss": 0.9854, + "step": 32691 + }, + { + "epoch": 0.84, + "learning_rate": 1.6913620191784235e-06, + "loss": 0.8574, + "step": 32692 + }, + { + "epoch": 0.84, + "learning_rate": 1.6913420267751194e-06, + "loss": 0.8633, + "step": 32693 + }, + { + "epoch": 0.84, + "learning_rate": 1.691322033842487e-06, + "loss": 0.9883, + "step": 32694 + }, + { + "epoch": 0.84, + "learning_rate": 1.6913020403805408e-06, + "loss": 0.668, + "step": 32695 + }, + { + "epoch": 0.84, + "learning_rate": 1.6912820463892964e-06, + "loss": 0.6665, + "step": 32696 + }, + { + "epoch": 0.84, + "learning_rate": 1.6912620518687692e-06, + "loss": 0.8506, + "step": 32697 + }, + { + "epoch": 0.84, + "learning_rate": 1.6912420568189744e-06, + "loss": 0.8237, + "step": 32698 + }, + { + "epoch": 0.84, + "learning_rate": 1.6912220612399275e-06, + "loss": 0.9629, + "step": 32699 + }, + { + "epoch": 0.84, + "learning_rate": 1.6912020651316435e-06, + "loss": 0.8994, + "step": 32700 + }, + { + "epoch": 0.84, + "learning_rate": 1.6911820684941378e-06, + "loss": 0.6746, + "step": 32701 + }, + { + "epoch": 0.84, + "learning_rate": 1.691162071327426e-06, + "loss": 1.001, + "step": 32702 + }, + { + "epoch": 0.84, + "learning_rate": 1.691142073631523e-06, + "loss": 0.8535, + "step": 32703 + }, + { + "epoch": 0.84, + "learning_rate": 1.6911220754064442e-06, + "loss": 0.7261, + "step": 32704 + }, + { + "epoch": 0.84, + "learning_rate": 1.6911020766522051e-06, + "loss": 0.8379, + "step": 32705 + }, + { + "epoch": 0.84, + "learning_rate": 1.6910820773688211e-06, + "loss": 0.9697, + "step": 32706 + }, + { + "epoch": 0.84, + "learning_rate": 1.691062077556307e-06, + "loss": 0.8252, + "step": 32707 + }, + { + "epoch": 0.84, + "learning_rate": 1.6910420772146786e-06, + "loss": 0.7197, + "step": 32708 + }, + { + "epoch": 0.84, + "learning_rate": 1.691022076343951e-06, + "loss": 0.7344, + "step": 32709 + }, + { + "epoch": 0.84, + "learning_rate": 1.6910020749441399e-06, + "loss": 0.7603, + "step": 32710 + }, + { + "epoch": 0.84, + "learning_rate": 1.69098207301526e-06, + "loss": 0.9014, + "step": 32711 + }, + { + "epoch": 0.84, + "learning_rate": 1.690962070557327e-06, + "loss": 0.8418, + "step": 32712 + }, + { + "epoch": 0.84, + "learning_rate": 1.6909420675703558e-06, + "loss": 0.8428, + "step": 32713 + }, + { + "epoch": 0.84, + "learning_rate": 1.6909220640543621e-06, + "loss": 0.8369, + "step": 32714 + }, + { + "epoch": 0.84, + "learning_rate": 1.6909020600093614e-06, + "loss": 0.8701, + "step": 32715 + }, + { + "epoch": 0.84, + "learning_rate": 1.6908820554353688e-06, + "loss": 1.0547, + "step": 32716 + }, + { + "epoch": 0.84, + "learning_rate": 1.6908620503323996e-06, + "loss": 0.6548, + "step": 32717 + }, + { + "epoch": 0.84, + "learning_rate": 1.690842044700469e-06, + "loss": 0.7949, + "step": 32718 + }, + { + "epoch": 0.84, + "learning_rate": 1.6908220385395923e-06, + "loss": 0.8369, + "step": 32719 + }, + { + "epoch": 0.84, + "learning_rate": 1.6908020318497848e-06, + "loss": 0.9326, + "step": 32720 + }, + { + "epoch": 0.84, + "learning_rate": 1.6907820246310624e-06, + "loss": 0.6157, + "step": 32721 + }, + { + "epoch": 0.84, + "learning_rate": 1.6907620168834397e-06, + "loss": 0.8066, + "step": 32722 + }, + { + "epoch": 0.84, + "learning_rate": 1.6907420086069322e-06, + "loss": 0.8926, + "step": 32723 + }, + { + "epoch": 0.84, + "learning_rate": 1.6907219998015554e-06, + "loss": 0.9893, + "step": 32724 + }, + { + "epoch": 0.84, + "learning_rate": 1.6907019904673244e-06, + "loss": 0.7612, + "step": 32725 + }, + { + "epoch": 0.84, + "learning_rate": 1.690681980604255e-06, + "loss": 0.9502, + "step": 32726 + }, + { + "epoch": 0.84, + "learning_rate": 1.6906619702123618e-06, + "loss": 0.8428, + "step": 32727 + }, + { + "epoch": 0.84, + "learning_rate": 1.6906419592916606e-06, + "loss": 0.8506, + "step": 32728 + }, + { + "epoch": 0.84, + "learning_rate": 1.6906219478421666e-06, + "loss": 1.0342, + "step": 32729 + }, + { + "epoch": 0.84, + "learning_rate": 1.6906019358638951e-06, + "loss": 0.9082, + "step": 32730 + }, + { + "epoch": 0.84, + "learning_rate": 1.6905819233568617e-06, + "loss": 0.6787, + "step": 32731 + }, + { + "epoch": 0.84, + "learning_rate": 1.6905619103210812e-06, + "loss": 0.9209, + "step": 32732 + }, + { + "epoch": 0.84, + "learning_rate": 1.6905418967565693e-06, + "loss": 0.9453, + "step": 32733 + }, + { + "epoch": 0.84, + "learning_rate": 1.690521882663341e-06, + "loss": 0.9717, + "step": 32734 + }, + { + "epoch": 0.84, + "learning_rate": 1.6905018680414122e-06, + "loss": 0.959, + "step": 32735 + }, + { + "epoch": 0.84, + "learning_rate": 1.6904818528907978e-06, + "loss": 0.5698, + "step": 32736 + }, + { + "epoch": 0.84, + "learning_rate": 1.6904618372115131e-06, + "loss": 0.832, + "step": 32737 + }, + { + "epoch": 0.84, + "learning_rate": 1.6904418210035733e-06, + "loss": 0.541, + "step": 32738 + }, + { + "epoch": 0.84, + "learning_rate": 1.6904218042669944e-06, + "loss": 0.79, + "step": 32739 + }, + { + "epoch": 0.84, + "learning_rate": 1.690401787001791e-06, + "loss": 0.9102, + "step": 32740 + }, + { + "epoch": 0.84, + "learning_rate": 1.690381769207979e-06, + "loss": 0.9531, + "step": 32741 + }, + { + "epoch": 0.84, + "learning_rate": 1.690361750885573e-06, + "loss": 0.8096, + "step": 32742 + }, + { + "epoch": 0.84, + "learning_rate": 1.690341732034589e-06, + "loss": 0.9004, + "step": 32743 + }, + { + "epoch": 0.84, + "learning_rate": 1.690321712655042e-06, + "loss": 1.1875, + "step": 32744 + }, + { + "epoch": 0.84, + "learning_rate": 1.690301692746947e-06, + "loss": 0.9346, + "step": 32745 + }, + { + "epoch": 0.84, + "learning_rate": 1.6902816723103206e-06, + "loss": 0.6777, + "step": 32746 + }, + { + "epoch": 0.84, + "learning_rate": 1.6902616513451768e-06, + "loss": 0.6724, + "step": 32747 + }, + { + "epoch": 0.84, + "learning_rate": 1.6902416298515312e-06, + "loss": 0.832, + "step": 32748 + }, + { + "epoch": 0.84, + "learning_rate": 1.6902216078293997e-06, + "loss": 0.9062, + "step": 32749 + }, + { + "epoch": 0.84, + "learning_rate": 1.690201585278797e-06, + "loss": 0.9248, + "step": 32750 + }, + { + "epoch": 0.84, + "learning_rate": 1.6901815621997388e-06, + "loss": 0.9785, + "step": 32751 + }, + { + "epoch": 0.84, + "learning_rate": 1.6901615385922403e-06, + "loss": 0.6389, + "step": 32752 + }, + { + "epoch": 0.84, + "learning_rate": 1.6901415144563167e-06, + "loss": 0.6914, + "step": 32753 + }, + { + "epoch": 0.84, + "learning_rate": 1.6901214897919837e-06, + "loss": 0.5713, + "step": 32754 + }, + { + "epoch": 0.84, + "learning_rate": 1.6901014645992563e-06, + "loss": 0.7368, + "step": 32755 + }, + { + "epoch": 0.84, + "learning_rate": 1.69008143887815e-06, + "loss": 0.813, + "step": 32756 + }, + { + "epoch": 0.84, + "learning_rate": 1.6900614126286798e-06, + "loss": 0.8262, + "step": 32757 + }, + { + "epoch": 0.84, + "learning_rate": 1.6900413858508615e-06, + "loss": 0.7095, + "step": 32758 + }, + { + "epoch": 0.84, + "learning_rate": 1.6900213585447103e-06, + "loss": 1.1133, + "step": 32759 + }, + { + "epoch": 0.84, + "learning_rate": 1.6900013307102414e-06, + "loss": 0.9297, + "step": 32760 + }, + { + "epoch": 0.84, + "learning_rate": 1.6899813023474706e-06, + "loss": 0.8818, + "step": 32761 + }, + { + "epoch": 0.84, + "learning_rate": 1.6899612734564122e-06, + "loss": 0.7549, + "step": 32762 + }, + { + "epoch": 0.84, + "learning_rate": 1.6899412440370825e-06, + "loss": 0.8662, + "step": 32763 + }, + { + "epoch": 0.84, + "learning_rate": 1.6899212140894962e-06, + "loss": 0.6445, + "step": 32764 + }, + { + "epoch": 0.84, + "learning_rate": 1.6899011836136693e-06, + "loss": 0.8975, + "step": 32765 + }, + { + "epoch": 0.84, + "learning_rate": 1.689881152609617e-06, + "loss": 0.8535, + "step": 32766 + }, + { + "epoch": 0.84, + "learning_rate": 1.6898611210773538e-06, + "loss": 0.9395, + "step": 32767 + }, + { + "epoch": 0.84, + "learning_rate": 1.6898410890168962e-06, + "loss": 0.7998, + "step": 32768 + }, + { + "epoch": 0.84, + "learning_rate": 1.6898210564282586e-06, + "loss": 0.6821, + "step": 32769 + }, + { + "epoch": 0.84, + "learning_rate": 1.689801023311457e-06, + "loss": 0.5591, + "step": 32770 + }, + { + "epoch": 0.84, + "learning_rate": 1.6897809896665068e-06, + "loss": 0.876, + "step": 32771 + }, + { + "epoch": 0.84, + "learning_rate": 1.6897609554934221e-06, + "loss": 0.7334, + "step": 32772 + }, + { + "epoch": 0.84, + "learning_rate": 1.6897409207922198e-06, + "loss": 0.9072, + "step": 32773 + }, + { + "epoch": 0.84, + "learning_rate": 1.6897208855629145e-06, + "loss": 0.8491, + "step": 32774 + }, + { + "epoch": 0.84, + "learning_rate": 1.6897008498055217e-06, + "loss": 0.9688, + "step": 32775 + }, + { + "epoch": 0.84, + "learning_rate": 1.6896808135200567e-06, + "loss": 0.7336, + "step": 32776 + }, + { + "epoch": 0.84, + "learning_rate": 1.6896607767065344e-06, + "loss": 0.7573, + "step": 32777 + }, + { + "epoch": 0.84, + "learning_rate": 1.6896407393649708e-06, + "loss": 1.1504, + "step": 32778 + }, + { + "epoch": 0.84, + "learning_rate": 1.6896207014953812e-06, + "loss": 0.8164, + "step": 32779 + }, + { + "epoch": 0.84, + "learning_rate": 1.6896006630977807e-06, + "loss": 0.8149, + "step": 32780 + }, + { + "epoch": 0.84, + "learning_rate": 1.6895806241721843e-06, + "loss": 0.877, + "step": 32781 + }, + { + "epoch": 0.84, + "learning_rate": 1.689560584718608e-06, + "loss": 0.6904, + "step": 32782 + }, + { + "epoch": 0.84, + "learning_rate": 1.6895405447370669e-06, + "loss": 0.8906, + "step": 32783 + }, + { + "epoch": 0.84, + "learning_rate": 1.6895205042275763e-06, + "loss": 0.7686, + "step": 32784 + }, + { + "epoch": 0.84, + "learning_rate": 1.6895004631901512e-06, + "loss": 0.8672, + "step": 32785 + }, + { + "epoch": 0.84, + "learning_rate": 1.689480421624808e-06, + "loss": 0.6331, + "step": 32786 + }, + { + "epoch": 0.84, + "learning_rate": 1.6894603795315606e-06, + "loss": 0.8574, + "step": 32787 + }, + { + "epoch": 0.84, + "learning_rate": 1.6894403369104256e-06, + "loss": 0.6338, + "step": 32788 + }, + { + "epoch": 0.84, + "learning_rate": 1.6894202937614177e-06, + "loss": 0.667, + "step": 32789 + }, + { + "epoch": 0.84, + "learning_rate": 1.6894002500845522e-06, + "loss": 0.8154, + "step": 32790 + }, + { + "epoch": 0.84, + "learning_rate": 1.689380205879845e-06, + "loss": 0.8027, + "step": 32791 + }, + { + "epoch": 0.84, + "learning_rate": 1.6893601611473108e-06, + "loss": 0.7673, + "step": 32792 + }, + { + "epoch": 0.84, + "learning_rate": 1.6893401158869653e-06, + "loss": 0.8066, + "step": 32793 + }, + { + "epoch": 0.84, + "learning_rate": 1.6893200700988238e-06, + "loss": 0.6328, + "step": 32794 + }, + { + "epoch": 0.84, + "learning_rate": 1.6893000237829016e-06, + "loss": 0.749, + "step": 32795 + }, + { + "epoch": 0.84, + "learning_rate": 1.689279976939214e-06, + "loss": 0.8584, + "step": 32796 + }, + { + "epoch": 0.84, + "learning_rate": 1.6892599295677762e-06, + "loss": 1.0449, + "step": 32797 + }, + { + "epoch": 0.84, + "learning_rate": 1.6892398816686042e-06, + "loss": 1.1133, + "step": 32798 + }, + { + "epoch": 0.84, + "learning_rate": 1.6892198332417126e-06, + "loss": 0.8936, + "step": 32799 + }, + { + "epoch": 0.84, + "learning_rate": 1.6891997842871172e-06, + "loss": 0.856, + "step": 32800 + }, + { + "epoch": 0.84, + "learning_rate": 1.6891797348048334e-06, + "loss": 0.7666, + "step": 32801 + }, + { + "epoch": 0.84, + "learning_rate": 1.6891596847948762e-06, + "loss": 0.9814, + "step": 32802 + }, + { + "epoch": 0.84, + "learning_rate": 1.6891396342572609e-06, + "loss": 0.8652, + "step": 32803 + }, + { + "epoch": 0.84, + "learning_rate": 1.6891195831920034e-06, + "loss": 0.8926, + "step": 32804 + }, + { + "epoch": 0.84, + "learning_rate": 1.6890995315991186e-06, + "loss": 0.856, + "step": 32805 + }, + { + "epoch": 0.84, + "learning_rate": 1.6890794794786222e-06, + "loss": 0.8374, + "step": 32806 + }, + { + "epoch": 0.84, + "learning_rate": 1.689059426830529e-06, + "loss": 0.9067, + "step": 32807 + }, + { + "epoch": 0.84, + "learning_rate": 1.6890393736548546e-06, + "loss": 0.6797, + "step": 32808 + }, + { + "epoch": 0.84, + "learning_rate": 1.6890193199516146e-06, + "loss": 0.9697, + "step": 32809 + }, + { + "epoch": 0.84, + "learning_rate": 1.688999265720824e-06, + "loss": 0.6309, + "step": 32810 + }, + { + "epoch": 0.84, + "learning_rate": 1.6889792109624988e-06, + "loss": 1.1328, + "step": 32811 + }, + { + "epoch": 0.84, + "learning_rate": 1.6889591556766535e-06, + "loss": 0.6685, + "step": 32812 + }, + { + "epoch": 0.84, + "learning_rate": 1.688939099863304e-06, + "loss": 0.96, + "step": 32813 + }, + { + "epoch": 0.84, + "learning_rate": 1.6889190435224654e-06, + "loss": 0.6001, + "step": 32814 + }, + { + "epoch": 0.84, + "learning_rate": 1.6888989866541533e-06, + "loss": 1.0146, + "step": 32815 + }, + { + "epoch": 0.84, + "learning_rate": 1.688878929258383e-06, + "loss": 1.0586, + "step": 32816 + }, + { + "epoch": 0.84, + "learning_rate": 1.6888588713351697e-06, + "loss": 0.8428, + "step": 32817 + }, + { + "epoch": 0.84, + "learning_rate": 1.6888388128845288e-06, + "loss": 0.9707, + "step": 32818 + }, + { + "epoch": 0.84, + "learning_rate": 1.6888187539064756e-06, + "loss": 0.8301, + "step": 32819 + }, + { + "epoch": 0.84, + "learning_rate": 1.6887986944010258e-06, + "loss": 0.7666, + "step": 32820 + }, + { + "epoch": 0.84, + "learning_rate": 1.6887786343681942e-06, + "loss": 0.9443, + "step": 32821 + }, + { + "epoch": 0.84, + "learning_rate": 1.6887585738079966e-06, + "loss": 0.8281, + "step": 32822 + }, + { + "epoch": 0.84, + "learning_rate": 1.688738512720448e-06, + "loss": 1.0312, + "step": 32823 + }, + { + "epoch": 0.84, + "learning_rate": 1.6887184511055646e-06, + "loss": 0.8008, + "step": 32824 + }, + { + "epoch": 0.84, + "learning_rate": 1.6886983889633605e-06, + "loss": 0.6516, + "step": 32825 + }, + { + "epoch": 0.84, + "learning_rate": 1.6886783262938522e-06, + "loss": 1.0273, + "step": 32826 + }, + { + "epoch": 0.84, + "learning_rate": 1.6886582630970544e-06, + "loss": 0.7251, + "step": 32827 + }, + { + "epoch": 0.84, + "learning_rate": 1.6886381993729825e-06, + "loss": 0.8887, + "step": 32828 + }, + { + "epoch": 0.84, + "learning_rate": 1.6886181351216522e-06, + "loss": 0.6699, + "step": 32829 + }, + { + "epoch": 0.84, + "learning_rate": 1.6885980703430786e-06, + "loss": 0.7305, + "step": 32830 + }, + { + "epoch": 0.84, + "learning_rate": 1.6885780050372772e-06, + "loss": 0.6895, + "step": 32831 + }, + { + "epoch": 0.84, + "learning_rate": 1.688557939204263e-06, + "loss": 1.1113, + "step": 32832 + }, + { + "epoch": 0.84, + "learning_rate": 1.6885378728440518e-06, + "loss": 0.8867, + "step": 32833 + }, + { + "epoch": 0.84, + "learning_rate": 1.688517805956659e-06, + "loss": 0.7852, + "step": 32834 + }, + { + "epoch": 0.84, + "learning_rate": 1.6884977385420992e-06, + "loss": 1.0957, + "step": 32835 + }, + { + "epoch": 0.84, + "learning_rate": 1.6884776706003891e-06, + "loss": 0.793, + "step": 32836 + }, + { + "epoch": 0.84, + "learning_rate": 1.688457602131543e-06, + "loss": 0.96, + "step": 32837 + }, + { + "epoch": 0.84, + "learning_rate": 1.6884375331355764e-06, + "loss": 0.7458, + "step": 32838 + }, + { + "epoch": 0.84, + "learning_rate": 1.6884174636125051e-06, + "loss": 0.4956, + "step": 32839 + }, + { + "epoch": 0.84, + "learning_rate": 1.6883973935623439e-06, + "loss": 0.7754, + "step": 32840 + }, + { + "epoch": 0.84, + "learning_rate": 1.6883773229851087e-06, + "loss": 0.7852, + "step": 32841 + }, + { + "epoch": 0.84, + "learning_rate": 1.6883572518808148e-06, + "loss": 0.7513, + "step": 32842 + }, + { + "epoch": 0.84, + "learning_rate": 1.6883371802494768e-06, + "loss": 0.6484, + "step": 32843 + }, + { + "epoch": 0.84, + "learning_rate": 1.6883171080911111e-06, + "loss": 0.8135, + "step": 32844 + }, + { + "epoch": 0.84, + "learning_rate": 1.6882970354057327e-06, + "loss": 1.0049, + "step": 32845 + }, + { + "epoch": 0.84, + "learning_rate": 1.6882769621933565e-06, + "loss": 0.8623, + "step": 32846 + }, + { + "epoch": 0.84, + "learning_rate": 1.6882568884539987e-06, + "loss": 1.1406, + "step": 32847 + }, + { + "epoch": 0.84, + "learning_rate": 1.6882368141876742e-06, + "loss": 0.8477, + "step": 32848 + }, + { + "epoch": 0.84, + "learning_rate": 1.6882167393943983e-06, + "loss": 0.9629, + "step": 32849 + }, + { + "epoch": 0.84, + "learning_rate": 1.6881966640741865e-06, + "loss": 0.8477, + "step": 32850 + }, + { + "epoch": 0.84, + "learning_rate": 1.6881765882270541e-06, + "loss": 0.8225, + "step": 32851 + }, + { + "epoch": 0.84, + "learning_rate": 1.6881565118530167e-06, + "loss": 0.8418, + "step": 32852 + }, + { + "epoch": 0.84, + "learning_rate": 1.6881364349520894e-06, + "loss": 0.9404, + "step": 32853 + }, + { + "epoch": 0.84, + "learning_rate": 1.6881163575242877e-06, + "loss": 1.1133, + "step": 32854 + }, + { + "epoch": 0.84, + "learning_rate": 1.6880962795696268e-06, + "loss": 0.8408, + "step": 32855 + }, + { + "epoch": 0.84, + "learning_rate": 1.6880762010881227e-06, + "loss": 0.6523, + "step": 32856 + }, + { + "epoch": 0.84, + "learning_rate": 1.6880561220797897e-06, + "loss": 0.8691, + "step": 32857 + }, + { + "epoch": 0.84, + "learning_rate": 1.688036042544644e-06, + "loss": 0.9619, + "step": 32858 + }, + { + "epoch": 0.84, + "learning_rate": 1.6880159624827006e-06, + "loss": 0.854, + "step": 32859 + }, + { + "epoch": 0.84, + "learning_rate": 1.6879958818939753e-06, + "loss": 0.8608, + "step": 32860 + }, + { + "epoch": 0.84, + "learning_rate": 1.6879758007784833e-06, + "loss": 0.8159, + "step": 32861 + }, + { + "epoch": 0.84, + "learning_rate": 1.6879557191362395e-06, + "loss": 0.689, + "step": 32862 + }, + { + "epoch": 0.84, + "learning_rate": 1.6879356369672598e-06, + "loss": 0.9434, + "step": 32863 + }, + { + "epoch": 0.84, + "learning_rate": 1.687915554271559e-06, + "loss": 0.9492, + "step": 32864 + }, + { + "epoch": 0.84, + "learning_rate": 1.6878954710491533e-06, + "loss": 0.7939, + "step": 32865 + }, + { + "epoch": 0.84, + "learning_rate": 1.6878753873000578e-06, + "loss": 0.627, + "step": 32866 + }, + { + "epoch": 0.84, + "learning_rate": 1.6878553030242875e-06, + "loss": 0.8281, + "step": 32867 + }, + { + "epoch": 0.84, + "learning_rate": 1.687835218221858e-06, + "loss": 0.8682, + "step": 32868 + }, + { + "epoch": 0.84, + "learning_rate": 1.6878151328927848e-06, + "loss": 0.8232, + "step": 32869 + }, + { + "epoch": 0.84, + "learning_rate": 1.6877950470370832e-06, + "loss": 0.8723, + "step": 32870 + }, + { + "epoch": 0.84, + "learning_rate": 1.6877749606547687e-06, + "loss": 0.8711, + "step": 32871 + }, + { + "epoch": 0.84, + "learning_rate": 1.687754873745856e-06, + "loss": 0.7817, + "step": 32872 + }, + { + "epoch": 0.84, + "learning_rate": 1.6877347863103615e-06, + "loss": 0.958, + "step": 32873 + }, + { + "epoch": 0.84, + "learning_rate": 1.6877146983482999e-06, + "loss": 0.8174, + "step": 32874 + }, + { + "epoch": 0.84, + "learning_rate": 1.6876946098596868e-06, + "loss": 0.7344, + "step": 32875 + }, + { + "epoch": 0.84, + "learning_rate": 1.6876745208445379e-06, + "loss": 0.8105, + "step": 32876 + }, + { + "epoch": 0.84, + "learning_rate": 1.6876544313028678e-06, + "loss": 0.79, + "step": 32877 + }, + { + "epoch": 0.84, + "learning_rate": 1.6876343412346926e-06, + "loss": 1.0615, + "step": 32878 + }, + { + "epoch": 0.84, + "learning_rate": 1.6876142506400272e-06, + "loss": 0.9375, + "step": 32879 + }, + { + "epoch": 0.84, + "learning_rate": 1.6875941595188871e-06, + "loss": 1.0381, + "step": 32880 + }, + { + "epoch": 0.84, + "learning_rate": 1.6875740678712882e-06, + "loss": 0.7832, + "step": 32881 + }, + { + "epoch": 0.84, + "learning_rate": 1.687553975697245e-06, + "loss": 0.791, + "step": 32882 + }, + { + "epoch": 0.84, + "learning_rate": 1.6875338829967736e-06, + "loss": 0.8457, + "step": 32883 + }, + { + "epoch": 0.84, + "learning_rate": 1.687513789769889e-06, + "loss": 0.6855, + "step": 32884 + }, + { + "epoch": 0.84, + "learning_rate": 1.6874936960166067e-06, + "loss": 0.8247, + "step": 32885 + }, + { + "epoch": 0.84, + "learning_rate": 1.6874736017369422e-06, + "loss": 0.9189, + "step": 32886 + }, + { + "epoch": 0.84, + "learning_rate": 1.6874535069309106e-06, + "loss": 0.7178, + "step": 32887 + }, + { + "epoch": 0.84, + "learning_rate": 1.6874334115985276e-06, + "loss": 0.8477, + "step": 32888 + }, + { + "epoch": 0.84, + "learning_rate": 1.6874133157398084e-06, + "loss": 0.8438, + "step": 32889 + }, + { + "epoch": 0.84, + "learning_rate": 1.6873932193547683e-06, + "loss": 0.8223, + "step": 32890 + }, + { + "epoch": 0.84, + "learning_rate": 1.687373122443423e-06, + "loss": 0.9658, + "step": 32891 + }, + { + "epoch": 0.84, + "learning_rate": 1.6873530250057877e-06, + "loss": 0.8418, + "step": 32892 + }, + { + "epoch": 0.84, + "learning_rate": 1.687332927041878e-06, + "loss": 1.0166, + "step": 32893 + }, + { + "epoch": 0.84, + "learning_rate": 1.6873128285517084e-06, + "loss": 0.8496, + "step": 32894 + }, + { + "epoch": 0.84, + "learning_rate": 1.6872927295352955e-06, + "loss": 0.8174, + "step": 32895 + }, + { + "epoch": 0.84, + "learning_rate": 1.6872726299926543e-06, + "loss": 0.6748, + "step": 32896 + }, + { + "epoch": 0.84, + "learning_rate": 1.6872525299238e-06, + "loss": 0.8047, + "step": 32897 + }, + { + "epoch": 0.84, + "learning_rate": 1.6872324293287474e-06, + "loss": 0.7783, + "step": 32898 + }, + { + "epoch": 0.84, + "learning_rate": 1.6872123282075133e-06, + "loss": 0.7334, + "step": 32899 + }, + { + "epoch": 0.84, + "learning_rate": 1.6871922265601118e-06, + "loss": 0.7119, + "step": 32900 + }, + { + "epoch": 0.84, + "learning_rate": 1.6871721243865592e-06, + "loss": 0.6597, + "step": 32901 + }, + { + "epoch": 0.84, + "learning_rate": 1.6871520216868703e-06, + "loss": 0.8379, + "step": 32902 + }, + { + "epoch": 0.84, + "learning_rate": 1.6871319184610606e-06, + "loss": 0.6753, + "step": 32903 + }, + { + "epoch": 0.84, + "learning_rate": 1.6871118147091457e-06, + "loss": 1.0, + "step": 32904 + }, + { + "epoch": 0.84, + "learning_rate": 1.687091710431141e-06, + "loss": 0.9551, + "step": 32905 + }, + { + "epoch": 0.84, + "learning_rate": 1.6870716056270618e-06, + "loss": 1.1973, + "step": 32906 + }, + { + "epoch": 0.84, + "learning_rate": 1.6870515002969233e-06, + "loss": 0.7393, + "step": 32907 + }, + { + "epoch": 0.84, + "learning_rate": 1.6870313944407407e-06, + "loss": 0.8398, + "step": 32908 + }, + { + "epoch": 0.84, + "learning_rate": 1.6870112880585304e-06, + "loss": 0.6387, + "step": 32909 + }, + { + "epoch": 0.84, + "learning_rate": 1.6869911811503066e-06, + "loss": 0.8613, + "step": 32910 + }, + { + "epoch": 0.84, + "learning_rate": 1.6869710737160856e-06, + "loss": 0.8574, + "step": 32911 + }, + { + "epoch": 0.84, + "learning_rate": 1.6869509657558823e-06, + "loss": 0.9893, + "step": 32912 + }, + { + "epoch": 0.84, + "learning_rate": 1.6869308572697124e-06, + "loss": 0.8926, + "step": 32913 + }, + { + "epoch": 0.84, + "learning_rate": 1.6869107482575911e-06, + "loss": 0.7959, + "step": 32914 + }, + { + "epoch": 0.84, + "learning_rate": 1.6868906387195335e-06, + "loss": 0.9473, + "step": 32915 + }, + { + "epoch": 0.84, + "learning_rate": 1.6868705286555556e-06, + "loss": 0.8304, + "step": 32916 + }, + { + "epoch": 0.84, + "learning_rate": 1.6868504180656724e-06, + "loss": 0.8965, + "step": 32917 + }, + { + "epoch": 0.84, + "learning_rate": 1.6868303069498995e-06, + "loss": 0.9424, + "step": 32918 + }, + { + "epoch": 0.84, + "learning_rate": 1.6868101953082521e-06, + "loss": 1.0, + "step": 32919 + }, + { + "epoch": 0.84, + "learning_rate": 1.686790083140746e-06, + "loss": 0.833, + "step": 32920 + }, + { + "epoch": 0.84, + "learning_rate": 1.686769970447396e-06, + "loss": 0.9629, + "step": 32921 + }, + { + "epoch": 0.84, + "learning_rate": 1.686749857228218e-06, + "loss": 0.6719, + "step": 32922 + }, + { + "epoch": 0.84, + "learning_rate": 1.686729743483227e-06, + "loss": 0.5156, + "step": 32923 + }, + { + "epoch": 0.84, + "learning_rate": 1.686709629212439e-06, + "loss": 0.8965, + "step": 32924 + }, + { + "epoch": 0.84, + "learning_rate": 1.6866895144158686e-06, + "loss": 0.917, + "step": 32925 + }, + { + "epoch": 0.84, + "learning_rate": 1.6866693990935319e-06, + "loss": 0.8877, + "step": 32926 + }, + { + "epoch": 0.84, + "learning_rate": 1.686649283245444e-06, + "loss": 0.8633, + "step": 32927 + }, + { + "epoch": 0.84, + "learning_rate": 1.6866291668716202e-06, + "loss": 0.9434, + "step": 32928 + }, + { + "epoch": 0.84, + "learning_rate": 1.686609049972076e-06, + "loss": 0.8276, + "step": 32929 + }, + { + "epoch": 0.84, + "learning_rate": 1.6865889325468268e-06, + "loss": 0.6685, + "step": 32930 + }, + { + "epoch": 0.84, + "learning_rate": 1.6865688145958881e-06, + "loss": 0.6406, + "step": 32931 + }, + { + "epoch": 0.84, + "learning_rate": 1.6865486961192753e-06, + "loss": 0.6655, + "step": 32932 + }, + { + "epoch": 0.84, + "learning_rate": 1.6865285771170035e-06, + "loss": 0.7617, + "step": 32933 + }, + { + "epoch": 0.84, + "learning_rate": 1.6865084575890887e-06, + "loss": 0.9463, + "step": 32934 + }, + { + "epoch": 0.84, + "learning_rate": 1.6864883375355457e-06, + "loss": 0.8516, + "step": 32935 + }, + { + "epoch": 0.84, + "learning_rate": 1.6864682169563902e-06, + "loss": 0.8828, + "step": 32936 + }, + { + "epoch": 0.84, + "learning_rate": 1.6864480958516371e-06, + "loss": 0.8049, + "step": 32937 + }, + { + "epoch": 0.84, + "learning_rate": 1.6864279742213027e-06, + "loss": 0.8262, + "step": 32938 + }, + { + "epoch": 0.84, + "learning_rate": 1.6864078520654021e-06, + "loss": 0.8213, + "step": 32939 + }, + { + "epoch": 0.84, + "learning_rate": 1.6863877293839504e-06, + "loss": 0.7539, + "step": 32940 + }, + { + "epoch": 0.84, + "learning_rate": 1.6863676061769635e-06, + "loss": 0.7534, + "step": 32941 + }, + { + "epoch": 0.84, + "learning_rate": 1.686347482444456e-06, + "loss": 0.9746, + "step": 32942 + }, + { + "epoch": 0.84, + "learning_rate": 1.6863273581864438e-06, + "loss": 0.8174, + "step": 32943 + }, + { + "epoch": 0.84, + "learning_rate": 1.6863072334029424e-06, + "loss": 0.8125, + "step": 32944 + }, + { + "epoch": 0.84, + "learning_rate": 1.6862871080939674e-06, + "loss": 0.4692, + "step": 32945 + }, + { + "epoch": 0.84, + "learning_rate": 1.6862669822595336e-06, + "loss": 0.9492, + "step": 32946 + }, + { + "epoch": 0.84, + "learning_rate": 1.6862468558996569e-06, + "loss": 0.9443, + "step": 32947 + }, + { + "epoch": 0.84, + "learning_rate": 1.6862267290143525e-06, + "loss": 0.8301, + "step": 32948 + }, + { + "epoch": 0.84, + "learning_rate": 1.6862066016036357e-06, + "loss": 0.9546, + "step": 32949 + }, + { + "epoch": 0.84, + "learning_rate": 1.686186473667522e-06, + "loss": 0.6885, + "step": 32950 + }, + { + "epoch": 0.84, + "learning_rate": 1.6861663452060273e-06, + "loss": 0.8369, + "step": 32951 + }, + { + "epoch": 0.84, + "learning_rate": 1.6861462162191662e-06, + "loss": 0.7227, + "step": 32952 + }, + { + "epoch": 0.84, + "learning_rate": 1.6861260867069547e-06, + "loss": 0.6719, + "step": 32953 + }, + { + "epoch": 0.84, + "learning_rate": 1.6861059566694076e-06, + "loss": 0.7261, + "step": 32954 + }, + { + "epoch": 0.84, + "learning_rate": 1.6860858261065412e-06, + "loss": 0.9727, + "step": 32955 + }, + { + "epoch": 0.84, + "learning_rate": 1.68606569501837e-06, + "loss": 1.0176, + "step": 32956 + }, + { + "epoch": 0.84, + "learning_rate": 1.6860455634049102e-06, + "loss": 0.8096, + "step": 32957 + }, + { + "epoch": 0.84, + "learning_rate": 1.6860254312661768e-06, + "loss": 0.9648, + "step": 32958 + }, + { + "epoch": 0.84, + "learning_rate": 1.6860052986021854e-06, + "loss": 0.9102, + "step": 32959 + }, + { + "epoch": 0.84, + "learning_rate": 1.685985165412951e-06, + "loss": 0.6504, + "step": 32960 + }, + { + "epoch": 0.84, + "learning_rate": 1.6859650316984895e-06, + "loss": 0.8618, + "step": 32961 + }, + { + "epoch": 0.84, + "learning_rate": 1.6859448974588157e-06, + "loss": 0.9023, + "step": 32962 + }, + { + "epoch": 0.84, + "learning_rate": 1.685924762693946e-06, + "loss": 0.7427, + "step": 32963 + }, + { + "epoch": 0.84, + "learning_rate": 1.685904627403895e-06, + "loss": 0.8936, + "step": 32964 + }, + { + "epoch": 0.84, + "learning_rate": 1.6858844915886784e-06, + "loss": 0.7671, + "step": 32965 + }, + { + "epoch": 0.84, + "learning_rate": 1.6858643552483115e-06, + "loss": 0.7935, + "step": 32966 + }, + { + "epoch": 0.84, + "learning_rate": 1.6858442183828099e-06, + "loss": 1.0396, + "step": 32967 + }, + { + "epoch": 0.84, + "learning_rate": 1.6858240809921887e-06, + "loss": 0.5015, + "step": 32968 + }, + { + "epoch": 0.85, + "learning_rate": 1.6858039430764638e-06, + "loss": 0.9209, + "step": 32969 + }, + { + "epoch": 0.85, + "learning_rate": 1.6857838046356503e-06, + "loss": 1.127, + "step": 32970 + }, + { + "epoch": 0.85, + "learning_rate": 1.6857636656697638e-06, + "loss": 0.7959, + "step": 32971 + }, + { + "epoch": 0.85, + "learning_rate": 1.6857435261788192e-06, + "loss": 0.8398, + "step": 32972 + }, + { + "epoch": 0.85, + "learning_rate": 1.6857233861628327e-06, + "loss": 0.9268, + "step": 32973 + }, + { + "epoch": 0.85, + "learning_rate": 1.685703245621819e-06, + "loss": 0.7295, + "step": 32974 + }, + { + "epoch": 0.85, + "learning_rate": 1.6856831045557941e-06, + "loss": 0.8877, + "step": 32975 + }, + { + "epoch": 0.85, + "learning_rate": 1.685662962964773e-06, + "loss": 0.9961, + "step": 32976 + }, + { + "epoch": 0.85, + "learning_rate": 1.6856428208487716e-06, + "loss": 1.0312, + "step": 32977 + }, + { + "epoch": 0.85, + "learning_rate": 1.6856226782078046e-06, + "loss": 0.8877, + "step": 32978 + }, + { + "epoch": 0.85, + "learning_rate": 1.6856025350418883e-06, + "loss": 0.7644, + "step": 32979 + }, + { + "epoch": 0.85, + "learning_rate": 1.6855823913510373e-06, + "loss": 0.7227, + "step": 32980 + }, + { + "epoch": 0.85, + "learning_rate": 1.6855622471352675e-06, + "loss": 0.8848, + "step": 32981 + }, + { + "epoch": 0.85, + "learning_rate": 1.6855421023945944e-06, + "loss": 1.0703, + "step": 32982 + }, + { + "epoch": 0.85, + "learning_rate": 1.685521957129033e-06, + "loss": 0.9648, + "step": 32983 + }, + { + "epoch": 0.85, + "learning_rate": 1.6855018113385988e-06, + "loss": 0.6128, + "step": 32984 + }, + { + "epoch": 0.85, + "learning_rate": 1.6854816650233077e-06, + "loss": 0.9639, + "step": 32985 + }, + { + "epoch": 0.85, + "learning_rate": 1.6854615181831746e-06, + "loss": 1.0244, + "step": 32986 + }, + { + "epoch": 0.85, + "learning_rate": 1.6854413708182153e-06, + "loss": 1.1152, + "step": 32987 + }, + { + "epoch": 0.85, + "learning_rate": 1.685421222928445e-06, + "loss": 0.8672, + "step": 32988 + }, + { + "epoch": 0.85, + "learning_rate": 1.685401074513879e-06, + "loss": 0.7832, + "step": 32989 + }, + { + "epoch": 0.85, + "learning_rate": 1.6853809255745335e-06, + "loss": 0.6543, + "step": 32990 + }, + { + "epoch": 0.85, + "learning_rate": 1.6853607761104226e-06, + "loss": 0.7881, + "step": 32991 + }, + { + "epoch": 0.85, + "learning_rate": 1.685340626121563e-06, + "loss": 0.8008, + "step": 32992 + }, + { + "epoch": 0.85, + "learning_rate": 1.6853204756079694e-06, + "loss": 0.7383, + "step": 32993 + }, + { + "epoch": 0.85, + "learning_rate": 1.6853003245696575e-06, + "loss": 0.9893, + "step": 32994 + }, + { + "epoch": 0.85, + "learning_rate": 1.6852801730066426e-06, + "loss": 0.7168, + "step": 32995 + }, + { + "epoch": 0.85, + "learning_rate": 1.6852600209189403e-06, + "loss": 0.8623, + "step": 32996 + }, + { + "epoch": 0.85, + "learning_rate": 1.6852398683065655e-06, + "loss": 0.9941, + "step": 32997 + }, + { + "epoch": 0.85, + "learning_rate": 1.6852197151695343e-06, + "loss": 0.6924, + "step": 32998 + }, + { + "epoch": 0.85, + "learning_rate": 1.6851995615078619e-06, + "loss": 0.8154, + "step": 32999 + }, + { + "epoch": 0.85, + "learning_rate": 1.6851794073215637e-06, + "loss": 0.7725, + "step": 33000 + }, + { + "epoch": 0.85, + "learning_rate": 1.685159252610655e-06, + "loss": 0.791, + "step": 33001 + }, + { + "epoch": 0.85, + "learning_rate": 1.6851390973751515e-06, + "loss": 0.6465, + "step": 33002 + }, + { + "epoch": 0.85, + "learning_rate": 1.6851189416150687e-06, + "loss": 0.7275, + "step": 33003 + }, + { + "epoch": 0.85, + "learning_rate": 1.6850987853304215e-06, + "loss": 0.7603, + "step": 33004 + }, + { + "epoch": 0.85, + "learning_rate": 1.685078628521226e-06, + "loss": 0.8052, + "step": 33005 + }, + { + "epoch": 0.85, + "learning_rate": 1.6850584711874969e-06, + "loss": 1.1309, + "step": 33006 + }, + { + "epoch": 0.85, + "learning_rate": 1.68503831332925e-06, + "loss": 0.9556, + "step": 33007 + }, + { + "epoch": 0.85, + "learning_rate": 1.6850181549465013e-06, + "loss": 1.0557, + "step": 33008 + }, + { + "epoch": 0.85, + "learning_rate": 1.6849979960392652e-06, + "loss": 0.9238, + "step": 33009 + }, + { + "epoch": 0.85, + "learning_rate": 1.6849778366075577e-06, + "loss": 0.8906, + "step": 33010 + }, + { + "epoch": 0.85, + "learning_rate": 1.6849576766513941e-06, + "loss": 0.8467, + "step": 33011 + }, + { + "epoch": 0.85, + "learning_rate": 1.68493751617079e-06, + "loss": 0.646, + "step": 33012 + }, + { + "epoch": 0.85, + "learning_rate": 1.684917355165761e-06, + "loss": 0.9404, + "step": 33013 + }, + { + "epoch": 0.85, + "learning_rate": 1.6848971936363221e-06, + "loss": 0.8027, + "step": 33014 + }, + { + "epoch": 0.85, + "learning_rate": 1.6848770315824888e-06, + "loss": 0.7627, + "step": 33015 + }, + { + "epoch": 0.85, + "learning_rate": 1.6848568690042768e-06, + "loss": 0.9258, + "step": 33016 + }, + { + "epoch": 0.85, + "learning_rate": 1.6848367059017013e-06, + "loss": 0.8154, + "step": 33017 + }, + { + "epoch": 0.85, + "learning_rate": 1.684816542274778e-06, + "loss": 0.9072, + "step": 33018 + }, + { + "epoch": 0.85, + "learning_rate": 1.6847963781235217e-06, + "loss": 0.9854, + "step": 33019 + }, + { + "epoch": 0.85, + "learning_rate": 1.6847762134479489e-06, + "loss": 0.5991, + "step": 33020 + }, + { + "epoch": 0.85, + "learning_rate": 1.684756048248074e-06, + "loss": 0.7129, + "step": 33021 + }, + { + "epoch": 0.85, + "learning_rate": 1.684735882523913e-06, + "loss": 0.9492, + "step": 33022 + }, + { + "epoch": 0.85, + "learning_rate": 1.6847157162754814e-06, + "loss": 0.6731, + "step": 33023 + }, + { + "epoch": 0.85, + "learning_rate": 1.684695549502794e-06, + "loss": 1.0938, + "step": 33024 + }, + { + "epoch": 0.85, + "learning_rate": 1.6846753822058673e-06, + "loss": 0.7378, + "step": 33025 + }, + { + "epoch": 0.85, + "learning_rate": 1.6846552143847157e-06, + "loss": 0.8301, + "step": 33026 + }, + { + "epoch": 0.85, + "learning_rate": 1.6846350460393553e-06, + "loss": 0.9346, + "step": 33027 + }, + { + "epoch": 0.85, + "learning_rate": 1.6846148771698013e-06, + "loss": 0.9893, + "step": 33028 + }, + { + "epoch": 0.85, + "learning_rate": 1.6845947077760688e-06, + "loss": 0.8042, + "step": 33029 + }, + { + "epoch": 0.85, + "learning_rate": 1.6845745378581744e-06, + "loss": 0.7773, + "step": 33030 + }, + { + "epoch": 0.85, + "learning_rate": 1.684554367416132e-06, + "loss": 0.9111, + "step": 33031 + }, + { + "epoch": 0.85, + "learning_rate": 1.6845341964499582e-06, + "loss": 0.7764, + "step": 33032 + }, + { + "epoch": 0.85, + "learning_rate": 1.684514024959668e-06, + "loss": 0.8506, + "step": 33033 + }, + { + "epoch": 0.85, + "learning_rate": 1.6844938529452766e-06, + "loss": 0.8271, + "step": 33034 + }, + { + "epoch": 0.85, + "learning_rate": 1.6844736804068e-06, + "loss": 0.8682, + "step": 33035 + }, + { + "epoch": 0.85, + "learning_rate": 1.6844535073442534e-06, + "loss": 0.853, + "step": 33036 + }, + { + "epoch": 0.85, + "learning_rate": 1.684433333757652e-06, + "loss": 0.7705, + "step": 33037 + }, + { + "epoch": 0.85, + "learning_rate": 1.6844131596470117e-06, + "loss": 0.9111, + "step": 33038 + }, + { + "epoch": 0.85, + "learning_rate": 1.6843929850123474e-06, + "loss": 1.0742, + "step": 33039 + }, + { + "epoch": 0.85, + "learning_rate": 1.6843728098536754e-06, + "loss": 0.7861, + "step": 33040 + }, + { + "epoch": 0.85, + "learning_rate": 1.6843526341710103e-06, + "loss": 1.1553, + "step": 33041 + }, + { + "epoch": 0.85, + "learning_rate": 1.6843324579643676e-06, + "loss": 0.8789, + "step": 33042 + }, + { + "epoch": 0.85, + "learning_rate": 1.6843122812337634e-06, + "loss": 0.75, + "step": 33043 + }, + { + "epoch": 0.85, + "learning_rate": 1.6842921039792124e-06, + "loss": 0.8799, + "step": 33044 + }, + { + "epoch": 0.85, + "learning_rate": 1.6842719262007309e-06, + "loss": 1.165, + "step": 33045 + }, + { + "epoch": 0.85, + "learning_rate": 1.6842517478983334e-06, + "loss": 0.9961, + "step": 33046 + }, + { + "epoch": 0.85, + "learning_rate": 1.6842315690720359e-06, + "loss": 0.585, + "step": 33047 + }, + { + "epoch": 0.85, + "learning_rate": 1.6842113897218538e-06, + "loss": 0.8301, + "step": 33048 + }, + { + "epoch": 0.85, + "learning_rate": 1.6841912098478024e-06, + "loss": 0.7686, + "step": 33049 + }, + { + "epoch": 0.85, + "learning_rate": 1.6841710294498977e-06, + "loss": 0.9238, + "step": 33050 + }, + { + "epoch": 0.85, + "learning_rate": 1.6841508485281542e-06, + "loss": 0.6978, + "step": 33051 + }, + { + "epoch": 0.85, + "learning_rate": 1.684130667082588e-06, + "loss": 0.9678, + "step": 33052 + }, + { + "epoch": 0.85, + "learning_rate": 1.6841104851132143e-06, + "loss": 0.9258, + "step": 33053 + }, + { + "epoch": 0.85, + "learning_rate": 1.6840903026200487e-06, + "loss": 0.8008, + "step": 33054 + }, + { + "epoch": 0.85, + "learning_rate": 1.6840701196031068e-06, + "loss": 0.8726, + "step": 33055 + }, + { + "epoch": 0.85, + "learning_rate": 1.6840499360624039e-06, + "loss": 0.7959, + "step": 33056 + }, + { + "epoch": 0.85, + "learning_rate": 1.684029751997955e-06, + "loss": 0.8506, + "step": 33057 + }, + { + "epoch": 0.85, + "learning_rate": 1.6840095674097763e-06, + "loss": 0.7681, + "step": 33058 + }, + { + "epoch": 0.85, + "learning_rate": 1.6839893822978828e-06, + "loss": 0.7649, + "step": 33059 + }, + { + "epoch": 0.85, + "learning_rate": 1.6839691966622901e-06, + "loss": 0.8281, + "step": 33060 + }, + { + "epoch": 0.85, + "learning_rate": 1.683949010503014e-06, + "loss": 0.9473, + "step": 33061 + }, + { + "epoch": 0.85, + "learning_rate": 1.683928823820069e-06, + "loss": 0.9902, + "step": 33062 + }, + { + "epoch": 0.85, + "learning_rate": 1.6839086366134713e-06, + "loss": 0.7407, + "step": 33063 + }, + { + "epoch": 0.85, + "learning_rate": 1.6838884488832363e-06, + "loss": 0.8203, + "step": 33064 + }, + { + "epoch": 0.85, + "learning_rate": 1.6838682606293797e-06, + "loss": 0.9014, + "step": 33065 + }, + { + "epoch": 0.85, + "learning_rate": 1.6838480718519162e-06, + "loss": 0.793, + "step": 33066 + }, + { + "epoch": 0.85, + "learning_rate": 1.6838278825508615e-06, + "loss": 0.7197, + "step": 33067 + }, + { + "epoch": 0.85, + "learning_rate": 1.6838076927262317e-06, + "loss": 0.6079, + "step": 33068 + }, + { + "epoch": 0.85, + "learning_rate": 1.6837875023780415e-06, + "loss": 0.7148, + "step": 33069 + }, + { + "epoch": 0.85, + "learning_rate": 1.683767311506307e-06, + "loss": 0.8965, + "step": 33070 + }, + { + "epoch": 0.85, + "learning_rate": 1.683747120111043e-06, + "loss": 0.9375, + "step": 33071 + }, + { + "epoch": 0.85, + "learning_rate": 1.6837269281922652e-06, + "loss": 0.9648, + "step": 33072 + }, + { + "epoch": 0.85, + "learning_rate": 1.6837067357499893e-06, + "loss": 0.7793, + "step": 33073 + }, + { + "epoch": 0.85, + "learning_rate": 1.6836865427842303e-06, + "loss": 0.7131, + "step": 33074 + }, + { + "epoch": 0.85, + "learning_rate": 1.6836663492950045e-06, + "loss": 0.9531, + "step": 33075 + }, + { + "epoch": 0.85, + "learning_rate": 1.6836461552823266e-06, + "loss": 0.8735, + "step": 33076 + }, + { + "epoch": 0.85, + "learning_rate": 1.6836259607462119e-06, + "loss": 0.8232, + "step": 33077 + }, + { + "epoch": 0.85, + "learning_rate": 1.6836057656866766e-06, + "loss": 0.731, + "step": 33078 + }, + { + "epoch": 0.85, + "learning_rate": 1.6835855701037355e-06, + "loss": 1.0254, + "step": 33079 + }, + { + "epoch": 0.85, + "learning_rate": 1.6835653739974047e-06, + "loss": 0.686, + "step": 33080 + }, + { + "epoch": 0.85, + "learning_rate": 1.6835451773676993e-06, + "loss": 0.7408, + "step": 33081 + }, + { + "epoch": 0.85, + "learning_rate": 1.6835249802146348e-06, + "loss": 0.6836, + "step": 33082 + }, + { + "epoch": 0.85, + "learning_rate": 1.6835047825382262e-06, + "loss": 0.6543, + "step": 33083 + }, + { + "epoch": 0.85, + "learning_rate": 1.6834845843384899e-06, + "loss": 0.8091, + "step": 33084 + }, + { + "epoch": 0.85, + "learning_rate": 1.683464385615441e-06, + "loss": 0.9424, + "step": 33085 + }, + { + "epoch": 0.85, + "learning_rate": 1.6834441863690944e-06, + "loss": 0.8721, + "step": 33086 + }, + { + "epoch": 0.85, + "learning_rate": 1.6834239865994664e-06, + "loss": 0.8496, + "step": 33087 + }, + { + "epoch": 0.85, + "learning_rate": 1.6834037863065715e-06, + "loss": 0.9551, + "step": 33088 + }, + { + "epoch": 0.85, + "learning_rate": 1.6833835854904263e-06, + "loss": 0.7783, + "step": 33089 + }, + { + "epoch": 0.85, + "learning_rate": 1.6833633841510455e-06, + "loss": 0.8135, + "step": 33090 + }, + { + "epoch": 0.85, + "learning_rate": 1.683343182288445e-06, + "loss": 0.6313, + "step": 33091 + }, + { + "epoch": 0.85, + "learning_rate": 1.6833229799026397e-06, + "loss": 0.8213, + "step": 33092 + }, + { + "epoch": 0.85, + "learning_rate": 1.6833027769936456e-06, + "loss": 0.7988, + "step": 33093 + }, + { + "epoch": 0.85, + "learning_rate": 1.683282573561478e-06, + "loss": 0.9873, + "step": 33094 + }, + { + "epoch": 0.85, + "learning_rate": 1.6832623696061523e-06, + "loss": 0.7393, + "step": 33095 + }, + { + "epoch": 0.85, + "learning_rate": 1.6832421651276839e-06, + "loss": 0.6987, + "step": 33096 + }, + { + "epoch": 0.85, + "learning_rate": 1.6832219601260883e-06, + "loss": 0.9785, + "step": 33097 + }, + { + "epoch": 0.85, + "learning_rate": 1.6832017546013814e-06, + "loss": 0.8916, + "step": 33098 + }, + { + "epoch": 0.85, + "learning_rate": 1.6831815485535784e-06, + "loss": 0.7324, + "step": 33099 + }, + { + "epoch": 0.85, + "learning_rate": 1.6831613419826947e-06, + "loss": 0.729, + "step": 33100 + }, + { + "epoch": 0.85, + "learning_rate": 1.6831411348887455e-06, + "loss": 0.8213, + "step": 33101 + }, + { + "epoch": 0.85, + "learning_rate": 1.6831209272717466e-06, + "loss": 0.9209, + "step": 33102 + }, + { + "epoch": 0.85, + "learning_rate": 1.6831007191317132e-06, + "loss": 0.9404, + "step": 33103 + }, + { + "epoch": 0.85, + "learning_rate": 1.6830805104686615e-06, + "loss": 0.8926, + "step": 33104 + }, + { + "epoch": 0.85, + "learning_rate": 1.683060301282606e-06, + "loss": 0.9678, + "step": 33105 + }, + { + "epoch": 0.85, + "learning_rate": 1.683040091573563e-06, + "loss": 0.8755, + "step": 33106 + }, + { + "epoch": 0.85, + "learning_rate": 1.6830198813415472e-06, + "loss": 0.7759, + "step": 33107 + }, + { + "epoch": 0.85, + "learning_rate": 1.6829996705865749e-06, + "loss": 0.7783, + "step": 33108 + }, + { + "epoch": 0.85, + "learning_rate": 1.6829794593086609e-06, + "loss": 0.6855, + "step": 33109 + }, + { + "epoch": 0.85, + "learning_rate": 1.6829592475078211e-06, + "loss": 0.73, + "step": 33110 + }, + { + "epoch": 0.85, + "learning_rate": 1.6829390351840707e-06, + "loss": 0.9014, + "step": 33111 + }, + { + "epoch": 0.85, + "learning_rate": 1.6829188223374252e-06, + "loss": 0.7861, + "step": 33112 + }, + { + "epoch": 0.85, + "learning_rate": 1.6828986089679004e-06, + "loss": 0.7031, + "step": 33113 + }, + { + "epoch": 0.85, + "learning_rate": 1.6828783950755112e-06, + "loss": 0.7275, + "step": 33114 + }, + { + "epoch": 0.85, + "learning_rate": 1.6828581806602738e-06, + "loss": 0.9932, + "step": 33115 + }, + { + "epoch": 0.85, + "learning_rate": 1.682837965722203e-06, + "loss": 0.7563, + "step": 33116 + }, + { + "epoch": 0.85, + "learning_rate": 1.6828177502613148e-06, + "loss": 0.9473, + "step": 33117 + }, + { + "epoch": 0.85, + "learning_rate": 1.6827975342776241e-06, + "loss": 0.833, + "step": 33118 + }, + { + "epoch": 0.85, + "learning_rate": 1.6827773177711468e-06, + "loss": 0.9365, + "step": 33119 + }, + { + "epoch": 0.85, + "learning_rate": 1.6827571007418988e-06, + "loss": 0.6934, + "step": 33120 + }, + { + "epoch": 0.85, + "learning_rate": 1.6827368831898947e-06, + "loss": 0.874, + "step": 33121 + }, + { + "epoch": 0.85, + "learning_rate": 1.68271666511515e-06, + "loss": 0.9941, + "step": 33122 + }, + { + "epoch": 0.85, + "learning_rate": 1.6826964465176812e-06, + "loss": 0.8525, + "step": 33123 + }, + { + "epoch": 0.85, + "learning_rate": 1.6826762273975029e-06, + "loss": 0.9023, + "step": 33124 + }, + { + "epoch": 0.85, + "learning_rate": 1.6826560077546307e-06, + "loss": 0.9131, + "step": 33125 + }, + { + "epoch": 0.85, + "learning_rate": 1.6826357875890802e-06, + "loss": 0.7744, + "step": 33126 + }, + { + "epoch": 0.85, + "learning_rate": 1.6826155669008669e-06, + "loss": 0.7793, + "step": 33127 + }, + { + "epoch": 0.85, + "learning_rate": 1.6825953456900061e-06, + "loss": 0.793, + "step": 33128 + }, + { + "epoch": 0.85, + "learning_rate": 1.6825751239565137e-06, + "loss": 0.7681, + "step": 33129 + }, + { + "epoch": 0.85, + "learning_rate": 1.6825549017004047e-06, + "loss": 0.8477, + "step": 33130 + }, + { + "epoch": 0.85, + "learning_rate": 1.682534678921695e-06, + "loss": 0.9199, + "step": 33131 + }, + { + "epoch": 0.85, + "learning_rate": 1.6825144556203998e-06, + "loss": 0.7627, + "step": 33132 + }, + { + "epoch": 0.85, + "learning_rate": 1.6824942317965345e-06, + "loss": 0.7891, + "step": 33133 + }, + { + "epoch": 0.85, + "learning_rate": 1.6824740074501148e-06, + "loss": 0.9326, + "step": 33134 + }, + { + "epoch": 0.85, + "learning_rate": 1.6824537825811565e-06, + "loss": 0.9678, + "step": 33135 + }, + { + "epoch": 0.85, + "learning_rate": 1.6824335571896744e-06, + "loss": 0.9785, + "step": 33136 + }, + { + "epoch": 0.85, + "learning_rate": 1.682413331275684e-06, + "loss": 0.8301, + "step": 33137 + }, + { + "epoch": 0.85, + "learning_rate": 1.6823931048392014e-06, + "loss": 0.8281, + "step": 33138 + }, + { + "epoch": 0.85, + "learning_rate": 1.6823728778802419e-06, + "loss": 0.8213, + "step": 33139 + }, + { + "epoch": 0.85, + "learning_rate": 1.6823526503988208e-06, + "loss": 0.9023, + "step": 33140 + }, + { + "epoch": 0.85, + "learning_rate": 1.6823324223949537e-06, + "loss": 0.915, + "step": 33141 + }, + { + "epoch": 0.85, + "learning_rate": 1.682312193868656e-06, + "loss": 1.0244, + "step": 33142 + }, + { + "epoch": 0.85, + "learning_rate": 1.6822919648199432e-06, + "loss": 1.0049, + "step": 33143 + }, + { + "epoch": 0.85, + "learning_rate": 1.6822717352488308e-06, + "loss": 1.0215, + "step": 33144 + }, + { + "epoch": 0.85, + "learning_rate": 1.6822515051553343e-06, + "loss": 0.8232, + "step": 33145 + }, + { + "epoch": 0.85, + "learning_rate": 1.682231274539469e-06, + "loss": 0.918, + "step": 33146 + }, + { + "epoch": 0.85, + "learning_rate": 1.682211043401251e-06, + "loss": 0.7617, + "step": 33147 + }, + { + "epoch": 0.85, + "learning_rate": 1.6821908117406951e-06, + "loss": 0.6885, + "step": 33148 + }, + { + "epoch": 0.85, + "learning_rate": 1.682170579557817e-06, + "loss": 0.8613, + "step": 33149 + }, + { + "epoch": 0.85, + "learning_rate": 1.6821503468526325e-06, + "loss": 0.6475, + "step": 33150 + }, + { + "epoch": 0.85, + "learning_rate": 1.6821301136251567e-06, + "loss": 0.6631, + "step": 33151 + }, + { + "epoch": 0.85, + "learning_rate": 1.6821098798754055e-06, + "loss": 0.8555, + "step": 33152 + }, + { + "epoch": 0.85, + "learning_rate": 1.6820896456033936e-06, + "loss": 0.7539, + "step": 33153 + }, + { + "epoch": 0.85, + "learning_rate": 1.6820694108091373e-06, + "loss": 0.7744, + "step": 33154 + }, + { + "epoch": 0.85, + "learning_rate": 1.682049175492652e-06, + "loss": 0.7549, + "step": 33155 + }, + { + "epoch": 0.85, + "learning_rate": 1.6820289396539526e-06, + "loss": 1.0459, + "step": 33156 + }, + { + "epoch": 0.85, + "learning_rate": 1.6820087032930555e-06, + "loss": 0.7656, + "step": 33157 + }, + { + "epoch": 0.85, + "learning_rate": 1.6819884664099752e-06, + "loss": 1.0586, + "step": 33158 + }, + { + "epoch": 0.85, + "learning_rate": 1.681968229004728e-06, + "loss": 0.915, + "step": 33159 + }, + { + "epoch": 0.85, + "learning_rate": 1.681947991077329e-06, + "loss": 0.9492, + "step": 33160 + }, + { + "epoch": 0.85, + "learning_rate": 1.6819277526277937e-06, + "loss": 0.9062, + "step": 33161 + }, + { + "epoch": 0.85, + "learning_rate": 1.6819075136561377e-06, + "loss": 1.0029, + "step": 33162 + }, + { + "epoch": 0.85, + "learning_rate": 1.6818872741623764e-06, + "loss": 0.8159, + "step": 33163 + }, + { + "epoch": 0.85, + "learning_rate": 1.6818670341465255e-06, + "loss": 0.7871, + "step": 33164 + }, + { + "epoch": 0.85, + "learning_rate": 1.6818467936086007e-06, + "loss": 0.8281, + "step": 33165 + }, + { + "epoch": 0.85, + "learning_rate": 1.6818265525486166e-06, + "loss": 0.8115, + "step": 33166 + }, + { + "epoch": 0.85, + "learning_rate": 1.6818063109665897e-06, + "loss": 0.6548, + "step": 33167 + }, + { + "epoch": 0.85, + "learning_rate": 1.6817860688625345e-06, + "loss": 0.8984, + "step": 33168 + }, + { + "epoch": 0.85, + "learning_rate": 1.6817658262364675e-06, + "loss": 0.707, + "step": 33169 + }, + { + "epoch": 0.85, + "learning_rate": 1.6817455830884038e-06, + "loss": 0.917, + "step": 33170 + }, + { + "epoch": 0.85, + "learning_rate": 1.6817253394183587e-06, + "loss": 0.874, + "step": 33171 + }, + { + "epoch": 0.85, + "learning_rate": 1.6817050952263476e-06, + "loss": 0.9023, + "step": 33172 + }, + { + "epoch": 0.85, + "learning_rate": 1.6816848505123866e-06, + "loss": 0.8389, + "step": 33173 + }, + { + "epoch": 0.85, + "learning_rate": 1.6816646052764906e-06, + "loss": 0.9404, + "step": 33174 + }, + { + "epoch": 0.85, + "learning_rate": 1.681644359518676e-06, + "loss": 0.9727, + "step": 33175 + }, + { + "epoch": 0.85, + "learning_rate": 1.6816241132389571e-06, + "loss": 0.6934, + "step": 33176 + }, + { + "epoch": 0.85, + "learning_rate": 1.6816038664373498e-06, + "loss": 0.7507, + "step": 33177 + }, + { + "epoch": 0.85, + "learning_rate": 1.6815836191138701e-06, + "loss": 0.7729, + "step": 33178 + }, + { + "epoch": 0.85, + "learning_rate": 1.6815633712685329e-06, + "loss": 0.8086, + "step": 33179 + }, + { + "epoch": 0.85, + "learning_rate": 1.6815431229013543e-06, + "loss": 0.71, + "step": 33180 + }, + { + "epoch": 0.85, + "learning_rate": 1.6815228740123492e-06, + "loss": 0.8608, + "step": 33181 + }, + { + "epoch": 0.85, + "learning_rate": 1.6815026246015335e-06, + "loss": 0.7344, + "step": 33182 + }, + { + "epoch": 0.85, + "learning_rate": 1.6814823746689224e-06, + "loss": 0.7432, + "step": 33183 + }, + { + "epoch": 0.85, + "learning_rate": 1.6814621242145318e-06, + "loss": 0.8691, + "step": 33184 + }, + { + "epoch": 0.85, + "learning_rate": 1.681441873238377e-06, + "loss": 0.5488, + "step": 33185 + }, + { + "epoch": 0.85, + "learning_rate": 1.6814216217404735e-06, + "loss": 0.8955, + "step": 33186 + }, + { + "epoch": 0.85, + "learning_rate": 1.6814013697208366e-06, + "loss": 0.7581, + "step": 33187 + }, + { + "epoch": 0.85, + "learning_rate": 1.681381117179482e-06, + "loss": 0.9512, + "step": 33188 + }, + { + "epoch": 0.85, + "learning_rate": 1.6813608641164251e-06, + "loss": 0.9043, + "step": 33189 + }, + { + "epoch": 0.85, + "learning_rate": 1.681340610531682e-06, + "loss": 0.8809, + "step": 33190 + }, + { + "epoch": 0.85, + "learning_rate": 1.6813203564252673e-06, + "loss": 1.0215, + "step": 33191 + }, + { + "epoch": 0.85, + "learning_rate": 1.6813001017971973e-06, + "loss": 0.7627, + "step": 33192 + }, + { + "epoch": 0.85, + "learning_rate": 1.6812798466474869e-06, + "loss": 0.8882, + "step": 33193 + }, + { + "epoch": 0.85, + "learning_rate": 1.6812595909761517e-06, + "loss": 0.7344, + "step": 33194 + }, + { + "epoch": 0.85, + "learning_rate": 1.6812393347832078e-06, + "loss": 0.7754, + "step": 33195 + }, + { + "epoch": 0.85, + "learning_rate": 1.6812190780686699e-06, + "loss": 0.8457, + "step": 33196 + }, + { + "epoch": 0.85, + "learning_rate": 1.681198820832554e-06, + "loss": 1.0049, + "step": 33197 + }, + { + "epoch": 0.85, + "learning_rate": 1.6811785630748753e-06, + "loss": 0.6338, + "step": 33198 + }, + { + "epoch": 0.85, + "learning_rate": 1.6811583047956496e-06, + "loss": 0.6562, + "step": 33199 + }, + { + "epoch": 0.85, + "learning_rate": 1.6811380459948924e-06, + "loss": 0.7144, + "step": 33200 + }, + { + "epoch": 0.85, + "learning_rate": 1.6811177866726191e-06, + "loss": 0.7598, + "step": 33201 + }, + { + "epoch": 0.85, + "learning_rate": 1.6810975268288453e-06, + "loss": 1.0488, + "step": 33202 + }, + { + "epoch": 0.85, + "learning_rate": 1.6810772664635864e-06, + "loss": 0.9961, + "step": 33203 + }, + { + "epoch": 0.85, + "learning_rate": 1.681057005576858e-06, + "loss": 0.8359, + "step": 33204 + }, + { + "epoch": 0.85, + "learning_rate": 1.6810367441686751e-06, + "loss": 0.8447, + "step": 33205 + }, + { + "epoch": 0.85, + "learning_rate": 1.6810164822390542e-06, + "loss": 0.582, + "step": 33206 + }, + { + "epoch": 0.85, + "learning_rate": 1.68099621978801e-06, + "loss": 0.8047, + "step": 33207 + }, + { + "epoch": 0.85, + "learning_rate": 1.6809759568155586e-06, + "loss": 0.9658, + "step": 33208 + }, + { + "epoch": 0.85, + "learning_rate": 1.680955693321715e-06, + "loss": 0.9199, + "step": 33209 + }, + { + "epoch": 0.85, + "learning_rate": 1.680935429306495e-06, + "loss": 0.6914, + "step": 33210 + }, + { + "epoch": 0.85, + "learning_rate": 1.6809151647699142e-06, + "loss": 0.7314, + "step": 33211 + }, + { + "epoch": 0.85, + "learning_rate": 1.6808948997119878e-06, + "loss": 0.8447, + "step": 33212 + }, + { + "epoch": 0.85, + "learning_rate": 1.6808746341327313e-06, + "loss": 0.6143, + "step": 33213 + }, + { + "epoch": 0.85, + "learning_rate": 1.6808543680321607e-06, + "loss": 0.9023, + "step": 33214 + }, + { + "epoch": 0.85, + "learning_rate": 1.6808341014102911e-06, + "loss": 1.0264, + "step": 33215 + }, + { + "epoch": 0.85, + "learning_rate": 1.6808138342671384e-06, + "loss": 0.7598, + "step": 33216 + }, + { + "epoch": 0.85, + "learning_rate": 1.6807935666027175e-06, + "loss": 0.9209, + "step": 33217 + }, + { + "epoch": 0.85, + "learning_rate": 1.6807732984170443e-06, + "loss": 1.0049, + "step": 33218 + }, + { + "epoch": 0.85, + "learning_rate": 1.6807530297101345e-06, + "loss": 0.7026, + "step": 33219 + }, + { + "epoch": 0.85, + "learning_rate": 1.6807327604820031e-06, + "loss": 0.792, + "step": 33220 + }, + { + "epoch": 0.85, + "learning_rate": 1.6807124907326662e-06, + "loss": 1.0156, + "step": 33221 + }, + { + "epoch": 0.85, + "learning_rate": 1.6806922204621388e-06, + "loss": 0.8369, + "step": 33222 + }, + { + "epoch": 0.85, + "learning_rate": 1.680671949670437e-06, + "loss": 0.8574, + "step": 33223 + }, + { + "epoch": 0.85, + "learning_rate": 1.6806516783575757e-06, + "loss": 0.9097, + "step": 33224 + }, + { + "epoch": 0.85, + "learning_rate": 1.6806314065235708e-06, + "loss": 1.0117, + "step": 33225 + }, + { + "epoch": 0.85, + "learning_rate": 1.6806111341684378e-06, + "loss": 1.0801, + "step": 33226 + }, + { + "epoch": 0.85, + "learning_rate": 1.6805908612921919e-06, + "loss": 0.9609, + "step": 33227 + }, + { + "epoch": 0.85, + "learning_rate": 1.680570587894849e-06, + "loss": 0.8115, + "step": 33228 + }, + { + "epoch": 0.85, + "learning_rate": 1.6805503139764248e-06, + "loss": 0.8906, + "step": 33229 + }, + { + "epoch": 0.85, + "learning_rate": 1.6805300395369342e-06, + "loss": 0.7266, + "step": 33230 + }, + { + "epoch": 0.85, + "learning_rate": 1.680509764576393e-06, + "loss": 0.9287, + "step": 33231 + }, + { + "epoch": 0.85, + "learning_rate": 1.680489489094817e-06, + "loss": 0.7158, + "step": 33232 + }, + { + "epoch": 0.85, + "learning_rate": 1.6804692130922212e-06, + "loss": 0.7407, + "step": 33233 + }, + { + "epoch": 0.85, + "learning_rate": 1.6804489365686218e-06, + "loss": 0.9541, + "step": 33234 + }, + { + "epoch": 0.85, + "learning_rate": 1.6804286595240336e-06, + "loss": 0.751, + "step": 33235 + }, + { + "epoch": 0.85, + "learning_rate": 1.6804083819584727e-06, + "loss": 0.9629, + "step": 33236 + }, + { + "epoch": 0.85, + "learning_rate": 1.6803881038719543e-06, + "loss": 0.8926, + "step": 33237 + }, + { + "epoch": 0.85, + "learning_rate": 1.6803678252644938e-06, + "loss": 0.8525, + "step": 33238 + }, + { + "epoch": 0.85, + "learning_rate": 1.680347546136107e-06, + "loss": 0.6763, + "step": 33239 + }, + { + "epoch": 0.85, + "learning_rate": 1.6803272664868096e-06, + "loss": 0.751, + "step": 33240 + }, + { + "epoch": 0.85, + "learning_rate": 1.6803069863166169e-06, + "loss": 0.7988, + "step": 33241 + }, + { + "epoch": 0.85, + "learning_rate": 1.6802867056255444e-06, + "loss": 0.9204, + "step": 33242 + }, + { + "epoch": 0.85, + "learning_rate": 1.6802664244136072e-06, + "loss": 0.8428, + "step": 33243 + }, + { + "epoch": 0.85, + "learning_rate": 1.6802461426808217e-06, + "loss": 0.8276, + "step": 33244 + }, + { + "epoch": 0.85, + "learning_rate": 1.6802258604272028e-06, + "loss": 0.9004, + "step": 33245 + }, + { + "epoch": 0.85, + "learning_rate": 1.6802055776527664e-06, + "loss": 0.583, + "step": 33246 + }, + { + "epoch": 0.85, + "learning_rate": 1.6801852943575278e-06, + "loss": 0.9385, + "step": 33247 + }, + { + "epoch": 0.85, + "learning_rate": 1.6801650105415028e-06, + "loss": 0.9316, + "step": 33248 + }, + { + "epoch": 0.85, + "learning_rate": 1.6801447262047065e-06, + "loss": 0.7104, + "step": 33249 + }, + { + "epoch": 0.85, + "learning_rate": 1.6801244413471548e-06, + "loss": 0.8486, + "step": 33250 + }, + { + "epoch": 0.85, + "learning_rate": 1.680104155968863e-06, + "loss": 0.8867, + "step": 33251 + }, + { + "epoch": 0.85, + "learning_rate": 1.6800838700698465e-06, + "loss": 0.9092, + "step": 33252 + }, + { + "epoch": 0.85, + "learning_rate": 1.6800635836501214e-06, + "loss": 0.8369, + "step": 33253 + }, + { + "epoch": 0.85, + "learning_rate": 1.680043296709703e-06, + "loss": 0.9355, + "step": 33254 + }, + { + "epoch": 0.85, + "learning_rate": 1.6800230092486062e-06, + "loss": 0.833, + "step": 33255 + }, + { + "epoch": 0.85, + "learning_rate": 1.6800027212668476e-06, + "loss": 0.7441, + "step": 33256 + }, + { + "epoch": 0.85, + "learning_rate": 1.6799824327644417e-06, + "loss": 0.8389, + "step": 33257 + }, + { + "epoch": 0.85, + "learning_rate": 1.6799621437414046e-06, + "loss": 0.9277, + "step": 33258 + }, + { + "epoch": 0.85, + "learning_rate": 1.6799418541977521e-06, + "loss": 0.8242, + "step": 33259 + }, + { + "epoch": 0.85, + "learning_rate": 1.6799215641334993e-06, + "loss": 0.8945, + "step": 33260 + }, + { + "epoch": 0.85, + "learning_rate": 1.6799012735486614e-06, + "loss": 0.9219, + "step": 33261 + }, + { + "epoch": 0.85, + "learning_rate": 1.6798809824432547e-06, + "loss": 0.9707, + "step": 33262 + }, + { + "epoch": 0.85, + "learning_rate": 1.6798606908172944e-06, + "loss": 0.8154, + "step": 33263 + }, + { + "epoch": 0.85, + "learning_rate": 1.6798403986707959e-06, + "loss": 0.709, + "step": 33264 + }, + { + "epoch": 0.85, + "learning_rate": 1.6798201060037749e-06, + "loss": 0.8877, + "step": 33265 + }, + { + "epoch": 0.85, + "learning_rate": 1.679799812816247e-06, + "loss": 0.3755, + "step": 33266 + }, + { + "epoch": 0.85, + "learning_rate": 1.6797795191082276e-06, + "loss": 0.8027, + "step": 33267 + }, + { + "epoch": 0.85, + "learning_rate": 1.6797592248797323e-06, + "loss": 0.8984, + "step": 33268 + }, + { + "epoch": 0.85, + "learning_rate": 1.6797389301307766e-06, + "loss": 1.0361, + "step": 33269 + }, + { + "epoch": 0.85, + "learning_rate": 1.6797186348613758e-06, + "loss": 0.8281, + "step": 33270 + }, + { + "epoch": 0.85, + "learning_rate": 1.6796983390715461e-06, + "loss": 0.8125, + "step": 33271 + }, + { + "epoch": 0.85, + "learning_rate": 1.6796780427613024e-06, + "loss": 0.9863, + "step": 33272 + }, + { + "epoch": 0.85, + "learning_rate": 1.6796577459306604e-06, + "loss": 0.8379, + "step": 33273 + }, + { + "epoch": 0.85, + "learning_rate": 1.6796374485796362e-06, + "loss": 0.853, + "step": 33274 + }, + { + "epoch": 0.85, + "learning_rate": 1.6796171507082444e-06, + "loss": 0.8848, + "step": 33275 + }, + { + "epoch": 0.85, + "learning_rate": 1.6795968523165008e-06, + "loss": 0.8428, + "step": 33276 + }, + { + "epoch": 0.85, + "learning_rate": 1.6795765534044218e-06, + "loss": 0.9375, + "step": 33277 + }, + { + "epoch": 0.85, + "learning_rate": 1.6795562539720218e-06, + "loss": 0.7969, + "step": 33278 + }, + { + "epoch": 0.85, + "learning_rate": 1.679535954019317e-06, + "loss": 0.917, + "step": 33279 + }, + { + "epoch": 0.85, + "learning_rate": 1.6795156535463226e-06, + "loss": 0.9771, + "step": 33280 + }, + { + "epoch": 0.85, + "learning_rate": 1.6794953525530543e-06, + "loss": 0.876, + "step": 33281 + }, + { + "epoch": 0.85, + "learning_rate": 1.6794750510395278e-06, + "loss": 0.6279, + "step": 33282 + }, + { + "epoch": 0.85, + "learning_rate": 1.6794547490057584e-06, + "loss": 0.5913, + "step": 33283 + }, + { + "epoch": 0.85, + "learning_rate": 1.6794344464517622e-06, + "loss": 0.6807, + "step": 33284 + }, + { + "epoch": 0.85, + "learning_rate": 1.6794141433775536e-06, + "loss": 0.8994, + "step": 33285 + }, + { + "epoch": 0.85, + "learning_rate": 1.6793938397831493e-06, + "loss": 1.0391, + "step": 33286 + }, + { + "epoch": 0.85, + "learning_rate": 1.6793735356685642e-06, + "loss": 0.7295, + "step": 33287 + }, + { + "epoch": 0.85, + "learning_rate": 1.679353231033814e-06, + "loss": 0.8076, + "step": 33288 + }, + { + "epoch": 0.85, + "learning_rate": 1.6793329258789145e-06, + "loss": 0.8486, + "step": 33289 + }, + { + "epoch": 0.85, + "learning_rate": 1.6793126202038806e-06, + "loss": 0.8132, + "step": 33290 + }, + { + "epoch": 0.85, + "learning_rate": 1.6792923140087285e-06, + "loss": 0.8467, + "step": 33291 + }, + { + "epoch": 0.85, + "learning_rate": 1.6792720072934734e-06, + "loss": 0.918, + "step": 33292 + }, + { + "epoch": 0.85, + "learning_rate": 1.6792517000581313e-06, + "loss": 0.9561, + "step": 33293 + }, + { + "epoch": 0.85, + "learning_rate": 1.679231392302717e-06, + "loss": 0.8306, + "step": 33294 + }, + { + "epoch": 0.85, + "learning_rate": 1.6792110840272464e-06, + "loss": 0.7542, + "step": 33295 + }, + { + "epoch": 0.85, + "learning_rate": 1.6791907752317353e-06, + "loss": 0.6335, + "step": 33296 + }, + { + "epoch": 0.85, + "learning_rate": 1.6791704659161992e-06, + "loss": 0.7988, + "step": 33297 + }, + { + "epoch": 0.85, + "learning_rate": 1.6791501560806532e-06, + "loss": 0.7451, + "step": 33298 + }, + { + "epoch": 0.85, + "learning_rate": 1.6791298457251135e-06, + "loss": 0.9902, + "step": 33299 + }, + { + "epoch": 0.85, + "learning_rate": 1.6791095348495952e-06, + "loss": 0.9248, + "step": 33300 + }, + { + "epoch": 0.85, + "learning_rate": 1.6790892234541135e-06, + "loss": 0.9844, + "step": 33301 + }, + { + "epoch": 0.85, + "learning_rate": 1.679068911538685e-06, + "loss": 0.8154, + "step": 33302 + }, + { + "epoch": 0.85, + "learning_rate": 1.6790485991033246e-06, + "loss": 0.6509, + "step": 33303 + }, + { + "epoch": 0.85, + "learning_rate": 1.6790282861480476e-06, + "loss": 0.8652, + "step": 33304 + }, + { + "epoch": 0.85, + "learning_rate": 1.6790079726728701e-06, + "loss": 0.8857, + "step": 33305 + }, + { + "epoch": 0.85, + "learning_rate": 1.6789876586778073e-06, + "loss": 0.7856, + "step": 33306 + }, + { + "epoch": 0.85, + "learning_rate": 1.678967344162875e-06, + "loss": 0.9023, + "step": 33307 + }, + { + "epoch": 0.85, + "learning_rate": 1.6789470291280883e-06, + "loss": 1.0332, + "step": 33308 + }, + { + "epoch": 0.85, + "learning_rate": 1.6789267135734635e-06, + "loss": 0.9043, + "step": 33309 + }, + { + "epoch": 0.85, + "learning_rate": 1.6789063974990154e-06, + "loss": 0.585, + "step": 33310 + }, + { + "epoch": 0.85, + "learning_rate": 1.67888608090476e-06, + "loss": 0.8901, + "step": 33311 + }, + { + "epoch": 0.85, + "learning_rate": 1.6788657637907128e-06, + "loss": 0.8667, + "step": 33312 + }, + { + "epoch": 0.85, + "learning_rate": 1.6788454461568896e-06, + "loss": 0.8633, + "step": 33313 + }, + { + "epoch": 0.85, + "learning_rate": 1.678825128003305e-06, + "loss": 0.9668, + "step": 33314 + }, + { + "epoch": 0.85, + "learning_rate": 1.6788048093299756e-06, + "loss": 0.5161, + "step": 33315 + }, + { + "epoch": 0.85, + "learning_rate": 1.6787844901369165e-06, + "loss": 1.0068, + "step": 33316 + }, + { + "epoch": 0.85, + "learning_rate": 1.6787641704241432e-06, + "loss": 0.707, + "step": 33317 + }, + { + "epoch": 0.85, + "learning_rate": 1.6787438501916714e-06, + "loss": 0.8232, + "step": 33318 + }, + { + "epoch": 0.85, + "learning_rate": 1.6787235294395172e-06, + "loss": 0.71, + "step": 33319 + }, + { + "epoch": 0.85, + "learning_rate": 1.678703208167695e-06, + "loss": 0.7375, + "step": 33320 + }, + { + "epoch": 0.85, + "learning_rate": 1.678682886376221e-06, + "loss": 0.5332, + "step": 33321 + }, + { + "epoch": 0.85, + "learning_rate": 1.678662564065111e-06, + "loss": 0.5955, + "step": 33322 + }, + { + "epoch": 0.85, + "learning_rate": 1.67864224123438e-06, + "loss": 0.8965, + "step": 33323 + }, + { + "epoch": 0.85, + "learning_rate": 1.6786219178840442e-06, + "loss": 0.8994, + "step": 33324 + }, + { + "epoch": 0.85, + "learning_rate": 1.6786015940141185e-06, + "loss": 0.71, + "step": 33325 + }, + { + "epoch": 0.85, + "learning_rate": 1.6785812696246189e-06, + "loss": 0.8076, + "step": 33326 + }, + { + "epoch": 0.85, + "learning_rate": 1.6785609447155606e-06, + "loss": 0.7991, + "step": 33327 + }, + { + "epoch": 0.85, + "learning_rate": 1.6785406192869595e-06, + "loss": 0.7686, + "step": 33328 + }, + { + "epoch": 0.85, + "learning_rate": 1.678520293338831e-06, + "loss": 0.7979, + "step": 33329 + }, + { + "epoch": 0.85, + "learning_rate": 1.678499966871191e-06, + "loss": 0.5913, + "step": 33330 + }, + { + "epoch": 0.85, + "learning_rate": 1.6784796398840547e-06, + "loss": 0.9912, + "step": 33331 + }, + { + "epoch": 0.85, + "learning_rate": 1.6784593123774376e-06, + "loss": 0.7812, + "step": 33332 + }, + { + "epoch": 0.85, + "learning_rate": 1.6784389843513553e-06, + "loss": 0.8271, + "step": 33333 + }, + { + "epoch": 0.85, + "learning_rate": 1.6784186558058236e-06, + "loss": 0.6426, + "step": 33334 + }, + { + "epoch": 0.85, + "learning_rate": 1.678398326740858e-06, + "loss": 0.8594, + "step": 33335 + }, + { + "epoch": 0.85, + "learning_rate": 1.6783779971564737e-06, + "loss": 0.8105, + "step": 33336 + }, + { + "epoch": 0.85, + "learning_rate": 1.6783576670526869e-06, + "loss": 0.8984, + "step": 33337 + }, + { + "epoch": 0.85, + "learning_rate": 1.6783373364295126e-06, + "loss": 0.8584, + "step": 33338 + }, + { + "epoch": 0.85, + "learning_rate": 1.6783170052869668e-06, + "loss": 0.6719, + "step": 33339 + }, + { + "epoch": 0.85, + "learning_rate": 1.6782966736250648e-06, + "loss": 0.8203, + "step": 33340 + }, + { + "epoch": 0.85, + "learning_rate": 1.678276341443822e-06, + "loss": 0.7598, + "step": 33341 + }, + { + "epoch": 0.85, + "learning_rate": 1.6782560087432544e-06, + "loss": 0.9834, + "step": 33342 + }, + { + "epoch": 0.85, + "learning_rate": 1.6782356755233772e-06, + "loss": 0.8525, + "step": 33343 + }, + { + "epoch": 0.85, + "learning_rate": 1.6782153417842063e-06, + "loss": 0.728, + "step": 33344 + }, + { + "epoch": 0.85, + "learning_rate": 1.6781950075257572e-06, + "loss": 0.8896, + "step": 33345 + }, + { + "epoch": 0.85, + "learning_rate": 1.678174672748045e-06, + "loss": 1.0469, + "step": 33346 + }, + { + "epoch": 0.85, + "learning_rate": 1.678154337451086e-06, + "loss": 0.6934, + "step": 33347 + }, + { + "epoch": 0.85, + "learning_rate": 1.6781340016348953e-06, + "loss": 0.9082, + "step": 33348 + }, + { + "epoch": 0.85, + "learning_rate": 1.6781136652994886e-06, + "loss": 0.7231, + "step": 33349 + }, + { + "epoch": 0.85, + "learning_rate": 1.6780933284448814e-06, + "loss": 0.8418, + "step": 33350 + }, + { + "epoch": 0.85, + "learning_rate": 1.6780729910710894e-06, + "loss": 0.5332, + "step": 33351 + }, + { + "epoch": 0.85, + "learning_rate": 1.6780526531781278e-06, + "loss": 0.9795, + "step": 33352 + }, + { + "epoch": 0.85, + "learning_rate": 1.6780323147660127e-06, + "loss": 0.999, + "step": 33353 + }, + { + "epoch": 0.85, + "learning_rate": 1.6780119758347592e-06, + "loss": 0.8115, + "step": 33354 + }, + { + "epoch": 0.85, + "learning_rate": 1.6779916363843834e-06, + "loss": 0.8037, + "step": 33355 + }, + { + "epoch": 0.85, + "learning_rate": 1.6779712964149004e-06, + "loss": 0.8867, + "step": 33356 + }, + { + "epoch": 0.85, + "learning_rate": 1.6779509559263262e-06, + "loss": 0.9023, + "step": 33357 + }, + { + "epoch": 0.85, + "learning_rate": 1.6779306149186758e-06, + "loss": 0.791, + "step": 33358 + }, + { + "epoch": 0.86, + "learning_rate": 1.6779102733919653e-06, + "loss": 0.9678, + "step": 33359 + }, + { + "epoch": 0.86, + "learning_rate": 1.67788993134621e-06, + "loss": 0.6895, + "step": 33360 + }, + { + "epoch": 0.86, + "learning_rate": 1.6778695887814257e-06, + "loss": 0.875, + "step": 33361 + }, + { + "epoch": 0.86, + "learning_rate": 1.6778492456976276e-06, + "loss": 0.999, + "step": 33362 + }, + { + "epoch": 0.86, + "learning_rate": 1.6778289020948316e-06, + "loss": 1.0293, + "step": 33363 + }, + { + "epoch": 0.86, + "learning_rate": 1.6778085579730533e-06, + "loss": 0.9482, + "step": 33364 + }, + { + "epoch": 0.86, + "learning_rate": 1.6777882133323077e-06, + "loss": 0.8486, + "step": 33365 + }, + { + "epoch": 0.86, + "learning_rate": 1.6777678681726113e-06, + "loss": 0.6895, + "step": 33366 + }, + { + "epoch": 0.86, + "learning_rate": 1.6777475224939793e-06, + "loss": 0.77, + "step": 33367 + }, + { + "epoch": 0.86, + "learning_rate": 1.6777271762964268e-06, + "loss": 0.832, + "step": 33368 + }, + { + "epoch": 0.86, + "learning_rate": 1.6777068295799702e-06, + "loss": 0.915, + "step": 33369 + }, + { + "epoch": 0.86, + "learning_rate": 1.6776864823446242e-06, + "loss": 0.811, + "step": 33370 + }, + { + "epoch": 0.86, + "learning_rate": 1.6776661345904049e-06, + "loss": 0.7017, + "step": 33371 + }, + { + "epoch": 0.86, + "learning_rate": 1.6776457863173277e-06, + "loss": 0.6433, + "step": 33372 + }, + { + "epoch": 0.86, + "learning_rate": 1.6776254375254087e-06, + "loss": 0.9736, + "step": 33373 + }, + { + "epoch": 0.86, + "learning_rate": 1.6776050882146628e-06, + "loss": 0.8145, + "step": 33374 + }, + { + "epoch": 0.86, + "learning_rate": 1.6775847383851058e-06, + "loss": 0.6987, + "step": 33375 + }, + { + "epoch": 0.86, + "learning_rate": 1.6775643880367534e-06, + "loss": 0.835, + "step": 33376 + }, + { + "epoch": 0.86, + "learning_rate": 1.677544037169621e-06, + "loss": 0.6592, + "step": 33377 + }, + { + "epoch": 0.86, + "learning_rate": 1.6775236857837243e-06, + "loss": 0.6748, + "step": 33378 + }, + { + "epoch": 0.86, + "learning_rate": 1.6775033338790791e-06, + "loss": 0.8242, + "step": 33379 + }, + { + "epoch": 0.86, + "learning_rate": 1.6774829814557006e-06, + "loss": 0.6904, + "step": 33380 + }, + { + "epoch": 0.86, + "learning_rate": 1.6774626285136043e-06, + "loss": 0.7246, + "step": 33381 + }, + { + "epoch": 0.86, + "learning_rate": 1.6774422750528063e-06, + "loss": 0.793, + "step": 33382 + }, + { + "epoch": 0.86, + "learning_rate": 1.6774219210733217e-06, + "loss": 0.834, + "step": 33383 + }, + { + "epoch": 0.86, + "learning_rate": 1.677401566575167e-06, + "loss": 0.8174, + "step": 33384 + }, + { + "epoch": 0.86, + "learning_rate": 1.677381211558356e-06, + "loss": 0.8281, + "step": 33385 + }, + { + "epoch": 0.86, + "learning_rate": 1.677360856022906e-06, + "loss": 0.833, + "step": 33386 + }, + { + "epoch": 0.86, + "learning_rate": 1.6773404999688317e-06, + "loss": 0.7412, + "step": 33387 + }, + { + "epoch": 0.86, + "learning_rate": 1.677320143396149e-06, + "loss": 0.792, + "step": 33388 + }, + { + "epoch": 0.86, + "learning_rate": 1.6772997863048737e-06, + "loss": 0.7031, + "step": 33389 + }, + { + "epoch": 0.86, + "learning_rate": 1.6772794286950207e-06, + "loss": 0.9229, + "step": 33390 + }, + { + "epoch": 0.86, + "learning_rate": 1.6772590705666062e-06, + "loss": 0.8154, + "step": 33391 + }, + { + "epoch": 0.86, + "learning_rate": 1.6772387119196454e-06, + "loss": 0.6592, + "step": 33392 + }, + { + "epoch": 0.86, + "learning_rate": 1.6772183527541542e-06, + "loss": 0.7715, + "step": 33393 + }, + { + "epoch": 0.86, + "learning_rate": 1.677197993070148e-06, + "loss": 1.335, + "step": 33394 + }, + { + "epoch": 0.86, + "learning_rate": 1.677177632867642e-06, + "loss": 0.6533, + "step": 33395 + }, + { + "epoch": 0.86, + "learning_rate": 1.677157272146653e-06, + "loss": 0.9365, + "step": 33396 + }, + { + "epoch": 0.86, + "learning_rate": 1.6771369109071954e-06, + "loss": 0.7124, + "step": 33397 + }, + { + "epoch": 0.86, + "learning_rate": 1.6771165491492851e-06, + "loss": 0.8945, + "step": 33398 + }, + { + "epoch": 0.86, + "learning_rate": 1.6770961868729381e-06, + "loss": 0.8779, + "step": 33399 + }, + { + "epoch": 0.86, + "learning_rate": 1.6770758240781695e-06, + "loss": 0.7217, + "step": 33400 + }, + { + "epoch": 0.86, + "learning_rate": 1.677055460764995e-06, + "loss": 0.8096, + "step": 33401 + }, + { + "epoch": 0.86, + "learning_rate": 1.6770350969334303e-06, + "loss": 0.8164, + "step": 33402 + }, + { + "epoch": 0.86, + "learning_rate": 1.677014732583491e-06, + "loss": 0.8203, + "step": 33403 + }, + { + "epoch": 0.86, + "learning_rate": 1.6769943677151927e-06, + "loss": 0.9692, + "step": 33404 + }, + { + "epoch": 0.86, + "learning_rate": 1.676974002328551e-06, + "loss": 0.7939, + "step": 33405 + }, + { + "epoch": 0.86, + "learning_rate": 1.6769536364235814e-06, + "loss": 0.9336, + "step": 33406 + }, + { + "epoch": 0.86, + "learning_rate": 1.6769332700002994e-06, + "loss": 0.7109, + "step": 33407 + }, + { + "epoch": 0.86, + "learning_rate": 1.6769129030587209e-06, + "loss": 0.728, + "step": 33408 + }, + { + "epoch": 0.86, + "learning_rate": 1.6768925355988613e-06, + "loss": 0.8345, + "step": 33409 + }, + { + "epoch": 0.86, + "learning_rate": 1.6768721676207357e-06, + "loss": 0.8555, + "step": 33410 + }, + { + "epoch": 0.86, + "learning_rate": 1.676851799124361e-06, + "loss": 0.9521, + "step": 33411 + }, + { + "epoch": 0.86, + "learning_rate": 1.6768314301097514e-06, + "loss": 1.0361, + "step": 33412 + }, + { + "epoch": 0.86, + "learning_rate": 1.6768110605769233e-06, + "loss": 0.795, + "step": 33413 + }, + { + "epoch": 0.86, + "learning_rate": 1.6767906905258924e-06, + "loss": 0.6631, + "step": 33414 + }, + { + "epoch": 0.86, + "learning_rate": 1.6767703199566733e-06, + "loss": 0.7822, + "step": 33415 + }, + { + "epoch": 0.86, + "learning_rate": 1.676749948869283e-06, + "loss": 0.6885, + "step": 33416 + }, + { + "epoch": 0.86, + "learning_rate": 1.676729577263736e-06, + "loss": 0.9277, + "step": 33417 + }, + { + "epoch": 0.86, + "learning_rate": 1.6767092051400482e-06, + "loss": 0.7983, + "step": 33418 + }, + { + "epoch": 0.86, + "learning_rate": 1.6766888324982355e-06, + "loss": 0.8223, + "step": 33419 + }, + { + "epoch": 0.86, + "learning_rate": 1.6766684593383134e-06, + "loss": 0.8799, + "step": 33420 + }, + { + "epoch": 0.86, + "learning_rate": 1.6766480856602971e-06, + "loss": 1.0107, + "step": 33421 + }, + { + "epoch": 0.86, + "learning_rate": 1.6766277114642024e-06, + "loss": 0.918, + "step": 33422 + }, + { + "epoch": 0.86, + "learning_rate": 1.6766073367500452e-06, + "loss": 0.8672, + "step": 33423 + }, + { + "epoch": 0.86, + "learning_rate": 1.6765869615178408e-06, + "loss": 0.6785, + "step": 33424 + }, + { + "epoch": 0.86, + "learning_rate": 1.6765665857676047e-06, + "loss": 0.8867, + "step": 33425 + }, + { + "epoch": 0.86, + "learning_rate": 1.676546209499353e-06, + "loss": 0.9707, + "step": 33426 + }, + { + "epoch": 0.86, + "learning_rate": 1.6765258327131008e-06, + "loss": 0.9033, + "step": 33427 + }, + { + "epoch": 0.86, + "learning_rate": 1.676505455408864e-06, + "loss": 0.8447, + "step": 33428 + }, + { + "epoch": 0.86, + "learning_rate": 1.676485077586658e-06, + "loss": 0.6846, + "step": 33429 + }, + { + "epoch": 0.86, + "learning_rate": 1.6764646992464984e-06, + "loss": 0.8213, + "step": 33430 + }, + { + "epoch": 0.86, + "learning_rate": 1.6764443203884008e-06, + "loss": 0.7783, + "step": 33431 + }, + { + "epoch": 0.86, + "learning_rate": 1.676423941012381e-06, + "loss": 0.7092, + "step": 33432 + }, + { + "epoch": 0.86, + "learning_rate": 1.6764035611184546e-06, + "loss": 0.5874, + "step": 33433 + }, + { + "epoch": 0.86, + "learning_rate": 1.6763831807066372e-06, + "loss": 0.8203, + "step": 33434 + }, + { + "epoch": 0.86, + "learning_rate": 1.676362799776944e-06, + "loss": 1.0713, + "step": 33435 + }, + { + "epoch": 0.86, + "learning_rate": 1.676342418329391e-06, + "loss": 0.7881, + "step": 33436 + }, + { + "epoch": 0.86, + "learning_rate": 1.6763220363639938e-06, + "loss": 0.6855, + "step": 33437 + }, + { + "epoch": 0.86, + "learning_rate": 1.6763016538807676e-06, + "loss": 0.6611, + "step": 33438 + }, + { + "epoch": 0.86, + "learning_rate": 1.6762812708797286e-06, + "loss": 0.9248, + "step": 33439 + }, + { + "epoch": 0.86, + "learning_rate": 1.6762608873608924e-06, + "loss": 0.7915, + "step": 33440 + }, + { + "epoch": 0.86, + "learning_rate": 1.6762405033242739e-06, + "loss": 0.8135, + "step": 33441 + }, + { + "epoch": 0.86, + "learning_rate": 1.6762201187698893e-06, + "loss": 0.9414, + "step": 33442 + }, + { + "epoch": 0.86, + "learning_rate": 1.6761997336977541e-06, + "loss": 0.7559, + "step": 33443 + }, + { + "epoch": 0.86, + "learning_rate": 1.6761793481078836e-06, + "loss": 0.7629, + "step": 33444 + }, + { + "epoch": 0.86, + "learning_rate": 1.676158962000294e-06, + "loss": 0.9014, + "step": 33445 + }, + { + "epoch": 0.86, + "learning_rate": 1.6761385753750003e-06, + "loss": 0.8838, + "step": 33446 + }, + { + "epoch": 0.86, + "learning_rate": 1.6761181882320185e-06, + "loss": 0.8252, + "step": 33447 + }, + { + "epoch": 0.86, + "learning_rate": 1.676097800571364e-06, + "loss": 1.0391, + "step": 33448 + }, + { + "epoch": 0.86, + "learning_rate": 1.6760774123930529e-06, + "loss": 1.0986, + "step": 33449 + }, + { + "epoch": 0.86, + "learning_rate": 1.6760570236970998e-06, + "loss": 0.7783, + "step": 33450 + }, + { + "epoch": 0.86, + "learning_rate": 1.676036634483521e-06, + "loss": 0.8389, + "step": 33451 + }, + { + "epoch": 0.86, + "learning_rate": 1.6760162447523323e-06, + "loss": 0.8154, + "step": 33452 + }, + { + "epoch": 0.86, + "learning_rate": 1.6759958545035491e-06, + "loss": 0.793, + "step": 33453 + }, + { + "epoch": 0.86, + "learning_rate": 1.675975463737187e-06, + "loss": 0.6865, + "step": 33454 + }, + { + "epoch": 0.86, + "learning_rate": 1.6759550724532613e-06, + "loss": 0.9346, + "step": 33455 + }, + { + "epoch": 0.86, + "learning_rate": 1.675934680651788e-06, + "loss": 0.7568, + "step": 33456 + }, + { + "epoch": 0.86, + "learning_rate": 1.6759142883327826e-06, + "loss": 0.7637, + "step": 33457 + }, + { + "epoch": 0.86, + "learning_rate": 1.6758938954962606e-06, + "loss": 0.9258, + "step": 33458 + }, + { + "epoch": 0.86, + "learning_rate": 1.6758735021422381e-06, + "loss": 0.7695, + "step": 33459 + }, + { + "epoch": 0.86, + "learning_rate": 1.6758531082707302e-06, + "loss": 0.9668, + "step": 33460 + }, + { + "epoch": 0.86, + "learning_rate": 1.6758327138817525e-06, + "loss": 0.9355, + "step": 33461 + }, + { + "epoch": 0.86, + "learning_rate": 1.6758123189753207e-06, + "loss": 0.8779, + "step": 33462 + }, + { + "epoch": 0.86, + "learning_rate": 1.6757919235514506e-06, + "loss": 0.9541, + "step": 33463 + }, + { + "epoch": 0.86, + "learning_rate": 1.6757715276101577e-06, + "loss": 0.8623, + "step": 33464 + }, + { + "epoch": 0.86, + "learning_rate": 1.6757511311514575e-06, + "loss": 0.8184, + "step": 33465 + }, + { + "epoch": 0.86, + "learning_rate": 1.6757307341753659e-06, + "loss": 0.7969, + "step": 33466 + }, + { + "epoch": 0.86, + "learning_rate": 1.675710336681898e-06, + "loss": 0.9785, + "step": 33467 + }, + { + "epoch": 0.86, + "learning_rate": 1.6756899386710701e-06, + "loss": 0.8037, + "step": 33468 + }, + { + "epoch": 0.86, + "learning_rate": 1.6756695401428976e-06, + "loss": 0.8193, + "step": 33469 + }, + { + "epoch": 0.86, + "learning_rate": 1.6756491410973958e-06, + "loss": 0.8623, + "step": 33470 + }, + { + "epoch": 0.86, + "learning_rate": 1.6756287415345803e-06, + "loss": 0.6733, + "step": 33471 + }, + { + "epoch": 0.86, + "learning_rate": 1.6756083414544672e-06, + "loss": 0.9189, + "step": 33472 + }, + { + "epoch": 0.86, + "learning_rate": 1.675587940857072e-06, + "loss": 0.6123, + "step": 33473 + }, + { + "epoch": 0.86, + "learning_rate": 1.6755675397424097e-06, + "loss": 0.9268, + "step": 33474 + }, + { + "epoch": 0.86, + "learning_rate": 1.6755471381104971e-06, + "loss": 0.8398, + "step": 33475 + }, + { + "epoch": 0.86, + "learning_rate": 1.6755267359613485e-06, + "loss": 0.6865, + "step": 33476 + }, + { + "epoch": 0.86, + "learning_rate": 1.6755063332949804e-06, + "loss": 1.0703, + "step": 33477 + }, + { + "epoch": 0.86, + "learning_rate": 1.675485930111408e-06, + "loss": 0.7715, + "step": 33478 + }, + { + "epoch": 0.86, + "learning_rate": 1.6754655264106475e-06, + "loss": 0.7202, + "step": 33479 + }, + { + "epoch": 0.86, + "learning_rate": 1.6754451221927136e-06, + "loss": 0.7148, + "step": 33480 + }, + { + "epoch": 0.86, + "learning_rate": 1.6754247174576225e-06, + "loss": 0.8857, + "step": 33481 + }, + { + "epoch": 0.86, + "learning_rate": 1.6754043122053903e-06, + "loss": 0.8428, + "step": 33482 + }, + { + "epoch": 0.86, + "learning_rate": 1.6753839064360315e-06, + "loss": 0.8291, + "step": 33483 + }, + { + "epoch": 0.86, + "learning_rate": 1.6753635001495625e-06, + "loss": 0.9326, + "step": 33484 + }, + { + "epoch": 0.86, + "learning_rate": 1.6753430933459986e-06, + "loss": 1.1074, + "step": 33485 + }, + { + "epoch": 0.86, + "learning_rate": 1.6753226860253557e-06, + "loss": 0.8115, + "step": 33486 + }, + { + "epoch": 0.86, + "learning_rate": 1.6753022781876492e-06, + "loss": 0.793, + "step": 33487 + }, + { + "epoch": 0.86, + "learning_rate": 1.6752818698328948e-06, + "loss": 0.8457, + "step": 33488 + }, + { + "epoch": 0.86, + "learning_rate": 1.6752614609611082e-06, + "loss": 0.8154, + "step": 33489 + }, + { + "epoch": 0.86, + "learning_rate": 1.6752410515723048e-06, + "loss": 0.7715, + "step": 33490 + }, + { + "epoch": 0.86, + "learning_rate": 1.6752206416665005e-06, + "loss": 0.5874, + "step": 33491 + }, + { + "epoch": 0.86, + "learning_rate": 1.6752002312437106e-06, + "loss": 0.5474, + "step": 33492 + }, + { + "epoch": 0.86, + "learning_rate": 1.6751798203039511e-06, + "loss": 0.4722, + "step": 33493 + }, + { + "epoch": 0.86, + "learning_rate": 1.6751594088472377e-06, + "loss": 0.8633, + "step": 33494 + }, + { + "epoch": 0.86, + "learning_rate": 1.6751389968735854e-06, + "loss": 0.7891, + "step": 33495 + }, + { + "epoch": 0.86, + "learning_rate": 1.6751185843830102e-06, + "loss": 0.8311, + "step": 33496 + }, + { + "epoch": 0.86, + "learning_rate": 1.675098171375528e-06, + "loss": 0.8374, + "step": 33497 + }, + { + "epoch": 0.86, + "learning_rate": 1.675077757851154e-06, + "loss": 0.8574, + "step": 33498 + }, + { + "epoch": 0.86, + "learning_rate": 1.6750573438099043e-06, + "loss": 0.8999, + "step": 33499 + }, + { + "epoch": 0.86, + "learning_rate": 1.6750369292517935e-06, + "loss": 0.8418, + "step": 33500 + }, + { + "epoch": 0.86, + "learning_rate": 1.6750165141768387e-06, + "loss": 0.9521, + "step": 33501 + }, + { + "epoch": 0.86, + "learning_rate": 1.6749960985850544e-06, + "loss": 0.6766, + "step": 33502 + }, + { + "epoch": 0.86, + "learning_rate": 1.674975682476457e-06, + "loss": 0.8789, + "step": 33503 + }, + { + "epoch": 0.86, + "learning_rate": 1.6749552658510615e-06, + "loss": 0.9287, + "step": 33504 + }, + { + "epoch": 0.86, + "learning_rate": 1.6749348487088838e-06, + "loss": 0.9141, + "step": 33505 + }, + { + "epoch": 0.86, + "learning_rate": 1.6749144310499394e-06, + "loss": 1.0781, + "step": 33506 + }, + { + "epoch": 0.86, + "learning_rate": 1.6748940128742444e-06, + "loss": 0.7676, + "step": 33507 + }, + { + "epoch": 0.86, + "learning_rate": 1.6748735941818137e-06, + "loss": 0.9209, + "step": 33508 + }, + { + "epoch": 0.86, + "learning_rate": 1.6748531749726636e-06, + "loss": 0.7344, + "step": 33509 + }, + { + "epoch": 0.86, + "learning_rate": 1.6748327552468093e-06, + "loss": 0.7588, + "step": 33510 + }, + { + "epoch": 0.86, + "learning_rate": 1.6748123350042667e-06, + "loss": 0.7998, + "step": 33511 + }, + { + "epoch": 0.86, + "learning_rate": 1.674791914245051e-06, + "loss": 0.8125, + "step": 33512 + }, + { + "epoch": 0.86, + "learning_rate": 1.6747714929691785e-06, + "loss": 0.6616, + "step": 33513 + }, + { + "epoch": 0.86, + "learning_rate": 1.6747510711766645e-06, + "loss": 0.9229, + "step": 33514 + }, + { + "epoch": 0.86, + "learning_rate": 1.6747306488675244e-06, + "loss": 0.8521, + "step": 33515 + }, + { + "epoch": 0.86, + "learning_rate": 1.6747102260417743e-06, + "loss": 0.918, + "step": 33516 + }, + { + "epoch": 0.86, + "learning_rate": 1.6746898026994293e-06, + "loss": 0.7686, + "step": 33517 + }, + { + "epoch": 0.86, + "learning_rate": 1.6746693788405058e-06, + "loss": 0.7197, + "step": 33518 + }, + { + "epoch": 0.86, + "learning_rate": 1.674648954465019e-06, + "loss": 0.7744, + "step": 33519 + }, + { + "epoch": 0.86, + "learning_rate": 1.6746285295729838e-06, + "loss": 0.9414, + "step": 33520 + }, + { + "epoch": 0.86, + "learning_rate": 1.6746081041644171e-06, + "loss": 0.9219, + "step": 33521 + }, + { + "epoch": 0.86, + "learning_rate": 1.6745876782393338e-06, + "loss": 1.0752, + "step": 33522 + }, + { + "epoch": 0.86, + "learning_rate": 1.67456725179775e-06, + "loss": 0.9727, + "step": 33523 + }, + { + "epoch": 0.86, + "learning_rate": 1.6745468248396807e-06, + "loss": 0.8662, + "step": 33524 + }, + { + "epoch": 0.86, + "learning_rate": 1.6745263973651423e-06, + "loss": 0.7534, + "step": 33525 + }, + { + "epoch": 0.86, + "learning_rate": 1.6745059693741499e-06, + "loss": 0.834, + "step": 33526 + }, + { + "epoch": 0.86, + "learning_rate": 1.6744855408667191e-06, + "loss": 0.8604, + "step": 33527 + }, + { + "epoch": 0.86, + "learning_rate": 1.6744651118428662e-06, + "loss": 0.7637, + "step": 33528 + }, + { + "epoch": 0.86, + "learning_rate": 1.6744446823026062e-06, + "loss": 0.8975, + "step": 33529 + }, + { + "epoch": 0.86, + "learning_rate": 1.6744242522459543e-06, + "loss": 0.8613, + "step": 33530 + }, + { + "epoch": 0.86, + "learning_rate": 1.6744038216729274e-06, + "loss": 1.0049, + "step": 33531 + }, + { + "epoch": 0.86, + "learning_rate": 1.6743833905835404e-06, + "loss": 1.042, + "step": 33532 + }, + { + "epoch": 0.86, + "learning_rate": 1.674362958977809e-06, + "loss": 0.7812, + "step": 33533 + }, + { + "epoch": 0.86, + "learning_rate": 1.674342526855749e-06, + "loss": 0.8555, + "step": 33534 + }, + { + "epoch": 0.86, + "learning_rate": 1.6743220942173757e-06, + "loss": 0.8042, + "step": 33535 + }, + { + "epoch": 0.86, + "learning_rate": 1.6743016610627052e-06, + "loss": 0.915, + "step": 33536 + }, + { + "epoch": 0.86, + "learning_rate": 1.6742812273917527e-06, + "loss": 0.6133, + "step": 33537 + }, + { + "epoch": 0.86, + "learning_rate": 1.6742607932045343e-06, + "loss": 0.6862, + "step": 33538 + }, + { + "epoch": 0.86, + "learning_rate": 1.6742403585010654e-06, + "loss": 0.7766, + "step": 33539 + }, + { + "epoch": 0.86, + "learning_rate": 1.6742199232813614e-06, + "loss": 0.9561, + "step": 33540 + }, + { + "epoch": 0.86, + "learning_rate": 1.6741994875454383e-06, + "loss": 0.8325, + "step": 33541 + }, + { + "epoch": 0.86, + "learning_rate": 1.6741790512933118e-06, + "loss": 0.6388, + "step": 33542 + }, + { + "epoch": 0.86, + "learning_rate": 1.6741586145249976e-06, + "loss": 0.916, + "step": 33543 + }, + { + "epoch": 0.86, + "learning_rate": 1.6741381772405109e-06, + "loss": 0.8252, + "step": 33544 + }, + { + "epoch": 0.86, + "learning_rate": 1.6741177394398672e-06, + "loss": 0.8047, + "step": 33545 + }, + { + "epoch": 0.86, + "learning_rate": 1.674097301123083e-06, + "loss": 0.8193, + "step": 33546 + }, + { + "epoch": 0.86, + "learning_rate": 1.6740768622901735e-06, + "loss": 0.8535, + "step": 33547 + }, + { + "epoch": 0.86, + "learning_rate": 1.6740564229411543e-06, + "loss": 0.6626, + "step": 33548 + }, + { + "epoch": 0.86, + "learning_rate": 1.674035983076041e-06, + "loss": 1.2129, + "step": 33549 + }, + { + "epoch": 0.86, + "learning_rate": 1.6740155426948495e-06, + "loss": 0.7812, + "step": 33550 + }, + { + "epoch": 0.86, + "learning_rate": 1.6739951017975951e-06, + "loss": 0.9883, + "step": 33551 + }, + { + "epoch": 0.86, + "learning_rate": 1.6739746603842937e-06, + "loss": 0.9941, + "step": 33552 + }, + { + "epoch": 0.86, + "learning_rate": 1.6739542184549608e-06, + "loss": 0.8604, + "step": 33553 + }, + { + "epoch": 0.86, + "learning_rate": 1.6739337760096124e-06, + "loss": 0.8682, + "step": 33554 + }, + { + "epoch": 0.86, + "learning_rate": 1.6739133330482637e-06, + "loss": 0.8311, + "step": 33555 + }, + { + "epoch": 0.86, + "learning_rate": 1.6738928895709306e-06, + "loss": 0.8877, + "step": 33556 + }, + { + "epoch": 0.86, + "learning_rate": 1.6738724455776287e-06, + "loss": 0.835, + "step": 33557 + }, + { + "epoch": 0.86, + "learning_rate": 1.6738520010683738e-06, + "loss": 0.9238, + "step": 33558 + }, + { + "epoch": 0.86, + "learning_rate": 1.673831556043181e-06, + "loss": 0.8105, + "step": 33559 + }, + { + "epoch": 0.86, + "learning_rate": 1.6738111105020667e-06, + "loss": 0.7007, + "step": 33560 + }, + { + "epoch": 0.86, + "learning_rate": 1.6737906644450461e-06, + "loss": 0.8174, + "step": 33561 + }, + { + "epoch": 0.86, + "learning_rate": 1.6737702178721352e-06, + "loss": 1.0771, + "step": 33562 + }, + { + "epoch": 0.86, + "learning_rate": 1.6737497707833493e-06, + "loss": 0.8594, + "step": 33563 + }, + { + "epoch": 0.86, + "learning_rate": 1.673729323178704e-06, + "loss": 1.1504, + "step": 33564 + }, + { + "epoch": 0.86, + "learning_rate": 1.6737088750582152e-06, + "loss": 0.8813, + "step": 33565 + }, + { + "epoch": 0.86, + "learning_rate": 1.6736884264218985e-06, + "loss": 0.7053, + "step": 33566 + }, + { + "epoch": 0.86, + "learning_rate": 1.6736679772697696e-06, + "loss": 0.751, + "step": 33567 + }, + { + "epoch": 0.86, + "learning_rate": 1.6736475276018443e-06, + "loss": 0.918, + "step": 33568 + }, + { + "epoch": 0.86, + "learning_rate": 1.6736270774181378e-06, + "loss": 1.0, + "step": 33569 + }, + { + "epoch": 0.86, + "learning_rate": 1.6736066267186662e-06, + "loss": 0.6814, + "step": 33570 + }, + { + "epoch": 0.86, + "learning_rate": 1.6735861755034447e-06, + "loss": 0.8506, + "step": 33571 + }, + { + "epoch": 0.86, + "learning_rate": 1.6735657237724894e-06, + "loss": 0.8311, + "step": 33572 + }, + { + "epoch": 0.86, + "learning_rate": 1.6735452715258158e-06, + "loss": 0.565, + "step": 33573 + }, + { + "epoch": 0.86, + "learning_rate": 1.6735248187634397e-06, + "loss": 0.9463, + "step": 33574 + }, + { + "epoch": 0.86, + "learning_rate": 1.6735043654853764e-06, + "loss": 0.6903, + "step": 33575 + }, + { + "epoch": 0.86, + "learning_rate": 1.6734839116916417e-06, + "loss": 0.8809, + "step": 33576 + }, + { + "epoch": 0.86, + "learning_rate": 1.6734634573822514e-06, + "loss": 0.8496, + "step": 33577 + }, + { + "epoch": 0.86, + "learning_rate": 1.6734430025572213e-06, + "loss": 0.959, + "step": 33578 + }, + { + "epoch": 0.86, + "learning_rate": 1.6734225472165665e-06, + "loss": 0.8945, + "step": 33579 + }, + { + "epoch": 0.86, + "learning_rate": 1.6734020913603035e-06, + "loss": 0.8125, + "step": 33580 + }, + { + "epoch": 0.86, + "learning_rate": 1.673381634988447e-06, + "loss": 0.7466, + "step": 33581 + }, + { + "epoch": 0.86, + "learning_rate": 1.6733611781010135e-06, + "loss": 0.8711, + "step": 33582 + }, + { + "epoch": 0.86, + "learning_rate": 1.673340720698018e-06, + "loss": 0.8936, + "step": 33583 + }, + { + "epoch": 0.86, + "learning_rate": 1.673320262779477e-06, + "loss": 0.8008, + "step": 33584 + }, + { + "epoch": 0.86, + "learning_rate": 1.6732998043454053e-06, + "loss": 0.6743, + "step": 33585 + }, + { + "epoch": 0.86, + "learning_rate": 1.6732793453958188e-06, + "loss": 1.0273, + "step": 33586 + }, + { + "epoch": 0.86, + "learning_rate": 1.6732588859307333e-06, + "loss": 0.8896, + "step": 33587 + }, + { + "epoch": 0.86, + "learning_rate": 1.6732384259501646e-06, + "loss": 0.7021, + "step": 33588 + }, + { + "epoch": 0.86, + "learning_rate": 1.673217965454128e-06, + "loss": 0.8955, + "step": 33589 + }, + { + "epoch": 0.86, + "learning_rate": 1.6731975044426395e-06, + "loss": 0.6929, + "step": 33590 + }, + { + "epoch": 0.86, + "learning_rate": 1.6731770429157145e-06, + "loss": 0.9639, + "step": 33591 + }, + { + "epoch": 0.86, + "learning_rate": 1.673156580873369e-06, + "loss": 0.9541, + "step": 33592 + }, + { + "epoch": 0.86, + "learning_rate": 1.6731361183156183e-06, + "loss": 0.8286, + "step": 33593 + }, + { + "epoch": 0.86, + "learning_rate": 1.673115655242478e-06, + "loss": 0.7393, + "step": 33594 + }, + { + "epoch": 0.86, + "learning_rate": 1.6730951916539644e-06, + "loss": 0.8115, + "step": 33595 + }, + { + "epoch": 0.86, + "learning_rate": 1.6730747275500927e-06, + "loss": 0.6504, + "step": 33596 + }, + { + "epoch": 0.86, + "learning_rate": 1.6730542629308784e-06, + "loss": 0.8945, + "step": 33597 + }, + { + "epoch": 0.86, + "learning_rate": 1.6730337977963376e-06, + "loss": 0.9736, + "step": 33598 + }, + { + "epoch": 0.86, + "learning_rate": 1.6730133321464857e-06, + "loss": 1.0479, + "step": 33599 + }, + { + "epoch": 0.86, + "learning_rate": 1.6729928659813385e-06, + "loss": 0.8643, + "step": 33600 + }, + { + "epoch": 0.86, + "learning_rate": 1.6729723993009115e-06, + "loss": 0.835, + "step": 33601 + }, + { + "epoch": 0.86, + "learning_rate": 1.6729519321052204e-06, + "loss": 0.5422, + "step": 33602 + }, + { + "epoch": 0.86, + "learning_rate": 1.672931464394281e-06, + "loss": 0.7734, + "step": 33603 + }, + { + "epoch": 0.86, + "learning_rate": 1.6729109961681091e-06, + "loss": 1.1172, + "step": 33604 + }, + { + "epoch": 0.86, + "learning_rate": 1.67289052742672e-06, + "loss": 0.9463, + "step": 33605 + }, + { + "epoch": 0.86, + "learning_rate": 1.6728700581701297e-06, + "loss": 0.6938, + "step": 33606 + }, + { + "epoch": 0.86, + "learning_rate": 1.6728495883983537e-06, + "loss": 0.9014, + "step": 33607 + }, + { + "epoch": 0.86, + "learning_rate": 1.6728291181114078e-06, + "loss": 0.8936, + "step": 33608 + }, + { + "epoch": 0.86, + "learning_rate": 1.6728086473093072e-06, + "loss": 0.8818, + "step": 33609 + }, + { + "epoch": 0.86, + "learning_rate": 1.6727881759920684e-06, + "loss": 0.8359, + "step": 33610 + }, + { + "epoch": 0.86, + "learning_rate": 1.6727677041597064e-06, + "loss": 0.636, + "step": 33611 + }, + { + "epoch": 0.86, + "learning_rate": 1.672747231812237e-06, + "loss": 0.79, + "step": 33612 + }, + { + "epoch": 0.86, + "learning_rate": 1.6727267589496764e-06, + "loss": 0.8604, + "step": 33613 + }, + { + "epoch": 0.86, + "learning_rate": 1.6727062855720396e-06, + "loss": 0.7842, + "step": 33614 + }, + { + "epoch": 0.86, + "learning_rate": 1.6726858116793422e-06, + "loss": 0.6167, + "step": 33615 + }, + { + "epoch": 0.86, + "learning_rate": 1.6726653372716007e-06, + "loss": 0.9092, + "step": 33616 + }, + { + "epoch": 0.86, + "learning_rate": 1.67264486234883e-06, + "loss": 0.9707, + "step": 33617 + }, + { + "epoch": 0.86, + "learning_rate": 1.6726243869110464e-06, + "loss": 0.8604, + "step": 33618 + }, + { + "epoch": 0.86, + "learning_rate": 1.6726039109582648e-06, + "loss": 0.7773, + "step": 33619 + }, + { + "epoch": 0.86, + "learning_rate": 1.6725834344905017e-06, + "loss": 0.9111, + "step": 33620 + }, + { + "epoch": 0.86, + "learning_rate": 1.672562957507772e-06, + "loss": 0.9482, + "step": 33621 + }, + { + "epoch": 0.86, + "learning_rate": 1.672542480010092e-06, + "loss": 0.8105, + "step": 33622 + }, + { + "epoch": 0.86, + "learning_rate": 1.672522001997477e-06, + "loss": 0.7139, + "step": 33623 + }, + { + "epoch": 0.86, + "learning_rate": 1.672501523469943e-06, + "loss": 0.8584, + "step": 33624 + }, + { + "epoch": 0.86, + "learning_rate": 1.6724810444275055e-06, + "loss": 0.6855, + "step": 33625 + }, + { + "epoch": 0.86, + "learning_rate": 1.6724605648701802e-06, + "loss": 0.7969, + "step": 33626 + }, + { + "epoch": 0.86, + "learning_rate": 1.6724400847979828e-06, + "loss": 0.9199, + "step": 33627 + }, + { + "epoch": 0.86, + "learning_rate": 1.6724196042109286e-06, + "loss": 0.7871, + "step": 33628 + }, + { + "epoch": 0.86, + "learning_rate": 1.672399123109034e-06, + "loss": 0.5742, + "step": 33629 + }, + { + "epoch": 0.86, + "learning_rate": 1.672378641492314e-06, + "loss": 0.8262, + "step": 33630 + }, + { + "epoch": 0.86, + "learning_rate": 1.672358159360785e-06, + "loss": 0.7588, + "step": 33631 + }, + { + "epoch": 0.86, + "learning_rate": 1.6723376767144619e-06, + "loss": 0.8447, + "step": 33632 + }, + { + "epoch": 0.86, + "learning_rate": 1.672317193553361e-06, + "loss": 0.6621, + "step": 33633 + }, + { + "epoch": 0.86, + "learning_rate": 1.6722967098774976e-06, + "loss": 0.9209, + "step": 33634 + }, + { + "epoch": 0.86, + "learning_rate": 1.6722762256868875e-06, + "loss": 0.791, + "step": 33635 + }, + { + "epoch": 0.86, + "learning_rate": 1.6722557409815465e-06, + "loss": 0.9678, + "step": 33636 + }, + { + "epoch": 0.86, + "learning_rate": 1.67223525576149e-06, + "loss": 0.918, + "step": 33637 + }, + { + "epoch": 0.86, + "learning_rate": 1.6722147700267341e-06, + "loss": 0.7017, + "step": 33638 + }, + { + "epoch": 0.86, + "learning_rate": 1.6721942837772941e-06, + "loss": 0.7935, + "step": 33639 + }, + { + "epoch": 0.86, + "learning_rate": 1.672173797013186e-06, + "loss": 0.8774, + "step": 33640 + }, + { + "epoch": 0.86, + "learning_rate": 1.6721533097344254e-06, + "loss": 0.8369, + "step": 33641 + }, + { + "epoch": 0.86, + "learning_rate": 1.6721328219410276e-06, + "loss": 0.6992, + "step": 33642 + }, + { + "epoch": 0.86, + "learning_rate": 1.672112333633009e-06, + "loss": 0.875, + "step": 33643 + }, + { + "epoch": 0.86, + "learning_rate": 1.6720918448103847e-06, + "loss": 0.8213, + "step": 33644 + }, + { + "epoch": 0.86, + "learning_rate": 1.6720713554731704e-06, + "loss": 0.8818, + "step": 33645 + }, + { + "epoch": 0.86, + "learning_rate": 1.6720508656213821e-06, + "loss": 0.8574, + "step": 33646 + }, + { + "epoch": 0.86, + "learning_rate": 1.6720303752550353e-06, + "loss": 1.0352, + "step": 33647 + }, + { + "epoch": 0.86, + "learning_rate": 1.672009884374146e-06, + "loss": 1.0029, + "step": 33648 + }, + { + "epoch": 0.86, + "learning_rate": 1.6719893929787295e-06, + "loss": 0.6704, + "step": 33649 + }, + { + "epoch": 0.86, + "learning_rate": 1.6719689010688013e-06, + "loss": 0.7422, + "step": 33650 + }, + { + "epoch": 0.86, + "learning_rate": 1.6719484086443779e-06, + "loss": 0.9766, + "step": 33651 + }, + { + "epoch": 0.86, + "learning_rate": 1.6719279157054742e-06, + "loss": 1.1641, + "step": 33652 + }, + { + "epoch": 0.86, + "learning_rate": 1.6719074222521065e-06, + "loss": 0.7783, + "step": 33653 + }, + { + "epoch": 0.86, + "learning_rate": 1.6718869282842897e-06, + "loss": 0.958, + "step": 33654 + }, + { + "epoch": 0.86, + "learning_rate": 1.6718664338020404e-06, + "loss": 0.9287, + "step": 33655 + }, + { + "epoch": 0.86, + "learning_rate": 1.6718459388053736e-06, + "loss": 0.9893, + "step": 33656 + }, + { + "epoch": 0.86, + "learning_rate": 1.6718254432943053e-06, + "loss": 0.8291, + "step": 33657 + }, + { + "epoch": 0.86, + "learning_rate": 1.6718049472688513e-06, + "loss": 0.6533, + "step": 33658 + }, + { + "epoch": 0.86, + "learning_rate": 1.671784450729027e-06, + "loss": 0.6348, + "step": 33659 + }, + { + "epoch": 0.86, + "learning_rate": 1.6717639536748483e-06, + "loss": 0.9531, + "step": 33660 + }, + { + "epoch": 0.86, + "learning_rate": 1.671743456106331e-06, + "loss": 0.832, + "step": 33661 + }, + { + "epoch": 0.86, + "learning_rate": 1.6717229580234902e-06, + "loss": 0.7559, + "step": 33662 + }, + { + "epoch": 0.86, + "learning_rate": 1.6717024594263425e-06, + "loss": 0.8789, + "step": 33663 + }, + { + "epoch": 0.86, + "learning_rate": 1.6716819603149025e-06, + "loss": 0.9424, + "step": 33664 + }, + { + "epoch": 0.86, + "learning_rate": 1.671661460689187e-06, + "loss": 1.0264, + "step": 33665 + }, + { + "epoch": 0.86, + "learning_rate": 1.6716409605492112e-06, + "loss": 0.9893, + "step": 33666 + }, + { + "epoch": 0.86, + "learning_rate": 1.6716204598949905e-06, + "loss": 0.876, + "step": 33667 + }, + { + "epoch": 0.86, + "learning_rate": 1.6715999587265413e-06, + "loss": 0.5815, + "step": 33668 + }, + { + "epoch": 0.86, + "learning_rate": 1.6715794570438786e-06, + "loss": 0.8643, + "step": 33669 + }, + { + "epoch": 0.86, + "learning_rate": 1.6715589548470183e-06, + "loss": 0.8779, + "step": 33670 + }, + { + "epoch": 0.86, + "learning_rate": 1.6715384521359765e-06, + "loss": 0.9541, + "step": 33671 + }, + { + "epoch": 0.86, + "learning_rate": 1.6715179489107683e-06, + "loss": 1.0352, + "step": 33672 + }, + { + "epoch": 0.86, + "learning_rate": 1.67149744517141e-06, + "loss": 0.7578, + "step": 33673 + }, + { + "epoch": 0.86, + "learning_rate": 1.6714769409179165e-06, + "loss": 0.7666, + "step": 33674 + }, + { + "epoch": 0.86, + "learning_rate": 1.6714564361503043e-06, + "loss": 0.7949, + "step": 33675 + }, + { + "epoch": 0.86, + "learning_rate": 1.6714359308685888e-06, + "loss": 0.9482, + "step": 33676 + }, + { + "epoch": 0.86, + "learning_rate": 1.6714154250727855e-06, + "loss": 0.689, + "step": 33677 + }, + { + "epoch": 0.86, + "learning_rate": 1.6713949187629107e-06, + "loss": 0.8604, + "step": 33678 + }, + { + "epoch": 0.86, + "learning_rate": 1.6713744119389795e-06, + "loss": 0.9092, + "step": 33679 + }, + { + "epoch": 0.86, + "learning_rate": 1.6713539046010074e-06, + "loss": 0.9805, + "step": 33680 + }, + { + "epoch": 0.86, + "learning_rate": 1.6713333967490107e-06, + "loss": 0.8511, + "step": 33681 + }, + { + "epoch": 0.86, + "learning_rate": 1.671312888383005e-06, + "loss": 0.8398, + "step": 33682 + }, + { + "epoch": 0.86, + "learning_rate": 1.671292379503006e-06, + "loss": 0.8828, + "step": 33683 + }, + { + "epoch": 0.86, + "learning_rate": 1.6712718701090293e-06, + "loss": 0.79, + "step": 33684 + }, + { + "epoch": 0.86, + "learning_rate": 1.67125136020109e-06, + "loss": 0.8867, + "step": 33685 + }, + { + "epoch": 0.86, + "learning_rate": 1.6712308497792049e-06, + "loss": 1.0195, + "step": 33686 + }, + { + "epoch": 0.86, + "learning_rate": 1.6712103388433892e-06, + "loss": 0.8438, + "step": 33687 + }, + { + "epoch": 0.86, + "learning_rate": 1.6711898273936586e-06, + "loss": 0.835, + "step": 33688 + }, + { + "epoch": 0.86, + "learning_rate": 1.6711693154300286e-06, + "loss": 0.9277, + "step": 33689 + }, + { + "epoch": 0.86, + "learning_rate": 1.6711488029525154e-06, + "loss": 0.5605, + "step": 33690 + }, + { + "epoch": 0.86, + "learning_rate": 1.671128289961134e-06, + "loss": 0.9229, + "step": 33691 + }, + { + "epoch": 0.86, + "learning_rate": 1.6711077764559009e-06, + "loss": 0.8369, + "step": 33692 + }, + { + "epoch": 0.86, + "learning_rate": 1.6710872624368316e-06, + "loss": 0.8701, + "step": 33693 + }, + { + "epoch": 0.86, + "learning_rate": 1.6710667479039412e-06, + "loss": 1.0156, + "step": 33694 + }, + { + "epoch": 0.86, + "learning_rate": 1.671046232857246e-06, + "loss": 0.9004, + "step": 33695 + }, + { + "epoch": 0.86, + "learning_rate": 1.6710257172967616e-06, + "loss": 0.8213, + "step": 33696 + }, + { + "epoch": 0.86, + "learning_rate": 1.6710052012225036e-06, + "loss": 0.9277, + "step": 33697 + }, + { + "epoch": 0.86, + "learning_rate": 1.670984684634488e-06, + "loss": 0.8857, + "step": 33698 + }, + { + "epoch": 0.86, + "learning_rate": 1.67096416753273e-06, + "loss": 0.7559, + "step": 33699 + }, + { + "epoch": 0.86, + "learning_rate": 1.6709436499172458e-06, + "loss": 0.8164, + "step": 33700 + }, + { + "epoch": 0.86, + "learning_rate": 1.6709231317880508e-06, + "loss": 0.9531, + "step": 33701 + }, + { + "epoch": 0.86, + "learning_rate": 1.6709026131451607e-06, + "loss": 0.8804, + "step": 33702 + }, + { + "epoch": 0.86, + "learning_rate": 1.6708820939885918e-06, + "loss": 1.0303, + "step": 33703 + }, + { + "epoch": 0.86, + "learning_rate": 1.6708615743183585e-06, + "loss": 0.8232, + "step": 33704 + }, + { + "epoch": 0.86, + "learning_rate": 1.670841054134478e-06, + "loss": 0.9111, + "step": 33705 + }, + { + "epoch": 0.86, + "learning_rate": 1.6708205334369652e-06, + "loss": 1.1113, + "step": 33706 + }, + { + "epoch": 0.86, + "learning_rate": 1.6708000122258357e-06, + "loss": 0.6646, + "step": 33707 + }, + { + "epoch": 0.86, + "learning_rate": 1.6707794905011058e-06, + "loss": 0.812, + "step": 33708 + }, + { + "epoch": 0.86, + "learning_rate": 1.6707589682627907e-06, + "loss": 0.3755, + "step": 33709 + }, + { + "epoch": 0.86, + "learning_rate": 1.6707384455109063e-06, + "loss": 0.8438, + "step": 33710 + }, + { + "epoch": 0.86, + "learning_rate": 1.6707179222454684e-06, + "loss": 1.0342, + "step": 33711 + }, + { + "epoch": 0.86, + "learning_rate": 1.6706973984664926e-06, + "loss": 1.0049, + "step": 33712 + }, + { + "epoch": 0.86, + "learning_rate": 1.6706768741739947e-06, + "loss": 0.8315, + "step": 33713 + }, + { + "epoch": 0.86, + "learning_rate": 1.6706563493679902e-06, + "loss": 0.8945, + "step": 33714 + }, + { + "epoch": 0.86, + "learning_rate": 1.670635824048495e-06, + "loss": 0.9961, + "step": 33715 + }, + { + "epoch": 0.86, + "learning_rate": 1.6706152982155247e-06, + "loss": 0.9971, + "step": 33716 + }, + { + "epoch": 0.86, + "learning_rate": 1.6705947718690955e-06, + "loss": 0.9697, + "step": 33717 + }, + { + "epoch": 0.86, + "learning_rate": 1.6705742450092225e-06, + "loss": 0.9092, + "step": 33718 + }, + { + "epoch": 0.86, + "learning_rate": 1.6705537176359217e-06, + "loss": 0.7539, + "step": 33719 + }, + { + "epoch": 0.86, + "learning_rate": 1.6705331897492086e-06, + "loss": 0.6257, + "step": 33720 + }, + { + "epoch": 0.86, + "learning_rate": 1.670512661349099e-06, + "loss": 0.9531, + "step": 33721 + }, + { + "epoch": 0.86, + "learning_rate": 1.670492132435609e-06, + "loss": 0.7207, + "step": 33722 + }, + { + "epoch": 0.86, + "learning_rate": 1.6704716030087538e-06, + "loss": 0.6108, + "step": 33723 + }, + { + "epoch": 0.86, + "learning_rate": 1.6704510730685493e-06, + "loss": 0.6836, + "step": 33724 + }, + { + "epoch": 0.86, + "learning_rate": 1.670430542615011e-06, + "loss": 0.8818, + "step": 33725 + }, + { + "epoch": 0.86, + "learning_rate": 1.6704100116481552e-06, + "loss": 0.6943, + "step": 33726 + }, + { + "epoch": 0.86, + "learning_rate": 1.6703894801679974e-06, + "loss": 1.0615, + "step": 33727 + }, + { + "epoch": 0.86, + "learning_rate": 1.670368948174553e-06, + "loss": 0.8408, + "step": 33728 + }, + { + "epoch": 0.86, + "learning_rate": 1.670348415667838e-06, + "loss": 0.9209, + "step": 33729 + }, + { + "epoch": 0.86, + "learning_rate": 1.670327882647868e-06, + "loss": 0.7065, + "step": 33730 + }, + { + "epoch": 0.86, + "learning_rate": 1.6703073491146586e-06, + "loss": 0.9385, + "step": 33731 + }, + { + "epoch": 0.86, + "learning_rate": 1.6702868150682258e-06, + "loss": 0.7939, + "step": 33732 + }, + { + "epoch": 0.86, + "learning_rate": 1.6702662805085855e-06, + "loss": 0.9219, + "step": 33733 + }, + { + "epoch": 0.86, + "learning_rate": 1.6702457454357529e-06, + "loss": 0.8975, + "step": 33734 + }, + { + "epoch": 0.86, + "learning_rate": 1.6702252098497439e-06, + "loss": 0.9326, + "step": 33735 + }, + { + "epoch": 0.86, + "learning_rate": 1.6702046737505741e-06, + "loss": 0.9453, + "step": 33736 + }, + { + "epoch": 0.86, + "learning_rate": 1.6701841371382598e-06, + "loss": 0.7603, + "step": 33737 + }, + { + "epoch": 0.86, + "learning_rate": 1.6701636000128158e-06, + "loss": 0.6826, + "step": 33738 + }, + { + "epoch": 0.86, + "learning_rate": 1.670143062374259e-06, + "loss": 0.6948, + "step": 33739 + }, + { + "epoch": 0.86, + "learning_rate": 1.670122524222604e-06, + "loss": 0.5615, + "step": 33740 + }, + { + "epoch": 0.86, + "learning_rate": 1.6701019855578671e-06, + "loss": 0.7852, + "step": 33741 + }, + { + "epoch": 0.86, + "learning_rate": 1.6700814463800638e-06, + "loss": 0.8604, + "step": 33742 + }, + { + "epoch": 0.86, + "learning_rate": 1.6700609066892101e-06, + "loss": 0.9092, + "step": 33743 + }, + { + "epoch": 0.86, + "learning_rate": 1.6700403664853217e-06, + "loss": 0.7285, + "step": 33744 + }, + { + "epoch": 0.86, + "learning_rate": 1.6700198257684142e-06, + "loss": 0.8071, + "step": 33745 + }, + { + "epoch": 0.86, + "learning_rate": 1.6699992845385032e-06, + "loss": 0.7227, + "step": 33746 + }, + { + "epoch": 0.86, + "learning_rate": 1.6699787427956046e-06, + "loss": 0.6128, + "step": 33747 + }, + { + "epoch": 0.86, + "learning_rate": 1.669958200539734e-06, + "loss": 0.8262, + "step": 33748 + }, + { + "epoch": 0.87, + "learning_rate": 1.6699376577709071e-06, + "loss": 0.9014, + "step": 33749 + }, + { + "epoch": 0.87, + "learning_rate": 1.66991711448914e-06, + "loss": 0.8105, + "step": 33750 + }, + { + "epoch": 0.87, + "learning_rate": 1.6698965706944482e-06, + "loss": 0.8096, + "step": 33751 + }, + { + "epoch": 0.87, + "learning_rate": 1.6698760263868469e-06, + "loss": 1.0361, + "step": 33752 + }, + { + "epoch": 0.87, + "learning_rate": 1.669855481566353e-06, + "loss": 0.999, + "step": 33753 + }, + { + "epoch": 0.87, + "learning_rate": 1.669834936232981e-06, + "loss": 0.8389, + "step": 33754 + }, + { + "epoch": 0.87, + "learning_rate": 1.6698143903867474e-06, + "loss": 1.0508, + "step": 33755 + }, + { + "epoch": 0.87, + "learning_rate": 1.669793844027668e-06, + "loss": 0.9609, + "step": 33756 + }, + { + "epoch": 0.87, + "learning_rate": 1.6697732971557578e-06, + "loss": 0.8242, + "step": 33757 + }, + { + "epoch": 0.87, + "learning_rate": 1.6697527497710332e-06, + "loss": 0.6426, + "step": 33758 + }, + { + "epoch": 0.87, + "learning_rate": 1.6697322018735098e-06, + "loss": 0.9434, + "step": 33759 + }, + { + "epoch": 0.87, + "learning_rate": 1.669711653463203e-06, + "loss": 0.6416, + "step": 33760 + }, + { + "epoch": 0.87, + "learning_rate": 1.6696911045401292e-06, + "loss": 0.8926, + "step": 33761 + }, + { + "epoch": 0.87, + "learning_rate": 1.6696705551043033e-06, + "loss": 0.728, + "step": 33762 + }, + { + "epoch": 0.87, + "learning_rate": 1.6696500051557417e-06, + "loss": 0.8154, + "step": 33763 + }, + { + "epoch": 0.87, + "learning_rate": 1.6696294546944598e-06, + "loss": 0.9795, + "step": 33764 + }, + { + "epoch": 0.87, + "learning_rate": 1.6696089037204732e-06, + "loss": 0.7734, + "step": 33765 + }, + { + "epoch": 0.87, + "learning_rate": 1.6695883522337982e-06, + "loss": 0.7241, + "step": 33766 + }, + { + "epoch": 0.87, + "learning_rate": 1.66956780023445e-06, + "loss": 0.6963, + "step": 33767 + }, + { + "epoch": 0.87, + "learning_rate": 1.6695472477224446e-06, + "loss": 0.9775, + "step": 33768 + }, + { + "epoch": 0.87, + "learning_rate": 1.6695266946977977e-06, + "loss": 0.8975, + "step": 33769 + }, + { + "epoch": 0.87, + "learning_rate": 1.6695061411605246e-06, + "loss": 0.8633, + "step": 33770 + }, + { + "epoch": 0.87, + "learning_rate": 1.669485587110642e-06, + "loss": 0.6726, + "step": 33771 + }, + { + "epoch": 0.87, + "learning_rate": 1.6694650325481646e-06, + "loss": 0.791, + "step": 33772 + }, + { + "epoch": 0.87, + "learning_rate": 1.669444477473109e-06, + "loss": 0.7256, + "step": 33773 + }, + { + "epoch": 0.87, + "learning_rate": 1.6694239218854905e-06, + "loss": 0.8159, + "step": 33774 + }, + { + "epoch": 0.87, + "learning_rate": 1.6694033657853246e-06, + "loss": 0.7339, + "step": 33775 + }, + { + "epoch": 0.87, + "learning_rate": 1.6693828091726275e-06, + "loss": 0.7124, + "step": 33776 + }, + { + "epoch": 0.87, + "learning_rate": 1.6693622520474147e-06, + "loss": 0.8174, + "step": 33777 + }, + { + "epoch": 0.87, + "learning_rate": 1.669341694409702e-06, + "loss": 0.7354, + "step": 33778 + }, + { + "epoch": 0.87, + "learning_rate": 1.6693211362595051e-06, + "loss": 0.9102, + "step": 33779 + }, + { + "epoch": 0.87, + "learning_rate": 1.6693005775968399e-06, + "loss": 0.8027, + "step": 33780 + }, + { + "epoch": 0.87, + "learning_rate": 1.669280018421722e-06, + "loss": 0.8379, + "step": 33781 + }, + { + "epoch": 0.87, + "learning_rate": 1.6692594587341672e-06, + "loss": 0.6938, + "step": 33782 + }, + { + "epoch": 0.87, + "learning_rate": 1.6692388985341912e-06, + "loss": 0.9902, + "step": 33783 + }, + { + "epoch": 0.87, + "learning_rate": 1.6692183378218098e-06, + "loss": 0.7773, + "step": 33784 + }, + { + "epoch": 0.87, + "learning_rate": 1.6691977765970384e-06, + "loss": 0.5803, + "step": 33785 + }, + { + "epoch": 0.87, + "learning_rate": 1.6691772148598932e-06, + "loss": 0.7715, + "step": 33786 + }, + { + "epoch": 0.87, + "learning_rate": 1.6691566526103897e-06, + "loss": 0.5513, + "step": 33787 + }, + { + "epoch": 0.87, + "learning_rate": 1.669136089848544e-06, + "loss": 0.8086, + "step": 33788 + }, + { + "epoch": 0.87, + "learning_rate": 1.6691155265743712e-06, + "loss": 0.7832, + "step": 33789 + }, + { + "epoch": 0.87, + "learning_rate": 1.6690949627878878e-06, + "loss": 0.9395, + "step": 33790 + }, + { + "epoch": 0.87, + "learning_rate": 1.669074398489109e-06, + "loss": 0.7339, + "step": 33791 + }, + { + "epoch": 0.87, + "learning_rate": 1.6690538336780505e-06, + "loss": 0.9902, + "step": 33792 + }, + { + "epoch": 0.87, + "learning_rate": 1.6690332683547283e-06, + "loss": 0.9082, + "step": 33793 + }, + { + "epoch": 0.87, + "learning_rate": 1.6690127025191583e-06, + "loss": 0.7734, + "step": 33794 + }, + { + "epoch": 0.87, + "learning_rate": 1.668992136171356e-06, + "loss": 1.0244, + "step": 33795 + }, + { + "epoch": 0.87, + "learning_rate": 1.668971569311337e-06, + "loss": 0.8408, + "step": 33796 + }, + { + "epoch": 0.87, + "learning_rate": 1.6689510019391173e-06, + "loss": 0.7803, + "step": 33797 + }, + { + "epoch": 0.87, + "learning_rate": 1.6689304340547127e-06, + "loss": 0.7944, + "step": 33798 + }, + { + "epoch": 0.87, + "learning_rate": 1.6689098656581386e-06, + "loss": 0.7148, + "step": 33799 + }, + { + "epoch": 0.87, + "learning_rate": 1.6688892967494113e-06, + "loss": 0.8359, + "step": 33800 + }, + { + "epoch": 0.87, + "learning_rate": 1.668868727328546e-06, + "loss": 0.9785, + "step": 33801 + }, + { + "epoch": 0.87, + "learning_rate": 1.6688481573955586e-06, + "loss": 0.959, + "step": 33802 + }, + { + "epoch": 0.87, + "learning_rate": 1.668827586950465e-06, + "loss": 0.6887, + "step": 33803 + }, + { + "epoch": 0.87, + "learning_rate": 1.668807015993281e-06, + "loss": 0.7109, + "step": 33804 + }, + { + "epoch": 0.87, + "learning_rate": 1.6687864445240218e-06, + "loss": 0.8252, + "step": 33805 + }, + { + "epoch": 0.87, + "learning_rate": 1.668765872542704e-06, + "loss": 0.626, + "step": 33806 + }, + { + "epoch": 0.87, + "learning_rate": 1.668745300049343e-06, + "loss": 0.5913, + "step": 33807 + }, + { + "epoch": 0.87, + "learning_rate": 1.6687247270439543e-06, + "loss": 0.9365, + "step": 33808 + }, + { + "epoch": 0.87, + "learning_rate": 1.6687041535265535e-06, + "loss": 0.7861, + "step": 33809 + }, + { + "epoch": 0.87, + "learning_rate": 1.668683579497157e-06, + "loss": 0.8877, + "step": 33810 + }, + { + "epoch": 0.87, + "learning_rate": 1.6686630049557802e-06, + "loss": 0.8291, + "step": 33811 + }, + { + "epoch": 0.87, + "learning_rate": 1.668642429902439e-06, + "loss": 0.9229, + "step": 33812 + }, + { + "epoch": 0.87, + "learning_rate": 1.6686218543371488e-06, + "loss": 0.8857, + "step": 33813 + }, + { + "epoch": 0.87, + "learning_rate": 1.668601278259926e-06, + "loss": 0.752, + "step": 33814 + }, + { + "epoch": 0.87, + "learning_rate": 1.6685807016707853e-06, + "loss": 0.6377, + "step": 33815 + }, + { + "epoch": 0.87, + "learning_rate": 1.6685601245697436e-06, + "loss": 0.8555, + "step": 33816 + }, + { + "epoch": 0.87, + "learning_rate": 1.668539546956816e-06, + "loss": 0.6631, + "step": 33817 + }, + { + "epoch": 0.87, + "learning_rate": 1.6685189688320186e-06, + "loss": 0.7354, + "step": 33818 + }, + { + "epoch": 0.87, + "learning_rate": 1.6684983901953667e-06, + "loss": 0.7764, + "step": 33819 + }, + { + "epoch": 0.87, + "learning_rate": 1.6684778110468764e-06, + "loss": 0.7715, + "step": 33820 + }, + { + "epoch": 0.87, + "learning_rate": 1.6684572313865634e-06, + "loss": 0.9219, + "step": 33821 + }, + { + "epoch": 0.87, + "learning_rate": 1.6684366512144434e-06, + "loss": 1.0596, + "step": 33822 + }, + { + "epoch": 0.87, + "learning_rate": 1.6684160705305321e-06, + "loss": 1.0381, + "step": 33823 + }, + { + "epoch": 0.87, + "learning_rate": 1.6683954893348457e-06, + "loss": 0.8975, + "step": 33824 + }, + { + "epoch": 0.87, + "learning_rate": 1.6683749076273991e-06, + "loss": 0.8574, + "step": 33825 + }, + { + "epoch": 0.87, + "learning_rate": 1.668354325408209e-06, + "loss": 0.8066, + "step": 33826 + }, + { + "epoch": 0.87, + "learning_rate": 1.6683337426772905e-06, + "loss": 0.7275, + "step": 33827 + }, + { + "epoch": 0.87, + "learning_rate": 1.6683131594346596e-06, + "loss": 0.7725, + "step": 33828 + }, + { + "epoch": 0.87, + "learning_rate": 1.668292575680332e-06, + "loss": 0.9004, + "step": 33829 + }, + { + "epoch": 0.87, + "learning_rate": 1.6682719914143237e-06, + "loss": 0.7031, + "step": 33830 + }, + { + "epoch": 0.87, + "learning_rate": 1.6682514066366502e-06, + "loss": 0.833, + "step": 33831 + }, + { + "epoch": 0.87, + "learning_rate": 1.6682308213473272e-06, + "loss": 0.9648, + "step": 33832 + }, + { + "epoch": 0.87, + "learning_rate": 1.6682102355463707e-06, + "loss": 0.9648, + "step": 33833 + }, + { + "epoch": 0.87, + "learning_rate": 1.6681896492337963e-06, + "loss": 0.8506, + "step": 33834 + }, + { + "epoch": 0.87, + "learning_rate": 1.6681690624096198e-06, + "loss": 0.8779, + "step": 33835 + }, + { + "epoch": 0.87, + "learning_rate": 1.668148475073857e-06, + "loss": 0.8389, + "step": 33836 + }, + { + "epoch": 0.87, + "learning_rate": 1.668127887226524e-06, + "loss": 0.623, + "step": 33837 + }, + { + "epoch": 0.87, + "learning_rate": 1.6681072988676355e-06, + "loss": 0.7891, + "step": 33838 + }, + { + "epoch": 0.87, + "learning_rate": 1.6680867099972082e-06, + "loss": 0.8828, + "step": 33839 + }, + { + "epoch": 0.87, + "learning_rate": 1.6680661206152577e-06, + "loss": 0.7158, + "step": 33840 + }, + { + "epoch": 0.87, + "learning_rate": 1.6680455307217997e-06, + "loss": 0.7144, + "step": 33841 + }, + { + "epoch": 0.87, + "learning_rate": 1.66802494031685e-06, + "loss": 0.96, + "step": 33842 + }, + { + "epoch": 0.87, + "learning_rate": 1.6680043494004244e-06, + "loss": 0.5376, + "step": 33843 + }, + { + "epoch": 0.87, + "learning_rate": 1.6679837579725385e-06, + "loss": 1.0137, + "step": 33844 + }, + { + "epoch": 0.87, + "learning_rate": 1.6679631660332079e-06, + "loss": 0.6233, + "step": 33845 + }, + { + "epoch": 0.87, + "learning_rate": 1.6679425735824488e-06, + "loss": 0.8779, + "step": 33846 + }, + { + "epoch": 0.87, + "learning_rate": 1.667921980620277e-06, + "loss": 0.8184, + "step": 33847 + }, + { + "epoch": 0.87, + "learning_rate": 1.6679013871467078e-06, + "loss": 0.915, + "step": 33848 + }, + { + "epoch": 0.87, + "learning_rate": 1.6678807931617573e-06, + "loss": 0.7607, + "step": 33849 + }, + { + "epoch": 0.87, + "learning_rate": 1.667860198665441e-06, + "loss": 0.8438, + "step": 33850 + }, + { + "epoch": 0.87, + "learning_rate": 1.667839603657775e-06, + "loss": 0.9355, + "step": 33851 + }, + { + "epoch": 0.87, + "learning_rate": 1.667819008138775e-06, + "loss": 0.8867, + "step": 33852 + }, + { + "epoch": 0.87, + "learning_rate": 1.6677984121084567e-06, + "loss": 0.8115, + "step": 33853 + }, + { + "epoch": 0.87, + "learning_rate": 1.6677778155668358e-06, + "loss": 0.6685, + "step": 33854 + }, + { + "epoch": 0.87, + "learning_rate": 1.667757218513928e-06, + "loss": 0.7603, + "step": 33855 + }, + { + "epoch": 0.87, + "learning_rate": 1.6677366209497495e-06, + "loss": 0.8027, + "step": 33856 + }, + { + "epoch": 0.87, + "learning_rate": 1.6677160228743157e-06, + "loss": 1.0596, + "step": 33857 + }, + { + "epoch": 0.87, + "learning_rate": 1.6676954242876425e-06, + "loss": 0.5299, + "step": 33858 + }, + { + "epoch": 0.87, + "learning_rate": 1.6676748251897453e-06, + "loss": 1.0693, + "step": 33859 + }, + { + "epoch": 0.87, + "learning_rate": 1.6676542255806402e-06, + "loss": 0.9697, + "step": 33860 + }, + { + "epoch": 0.87, + "learning_rate": 1.6676336254603432e-06, + "loss": 0.8474, + "step": 33861 + }, + { + "epoch": 0.87, + "learning_rate": 1.6676130248288698e-06, + "loss": 0.8271, + "step": 33862 + }, + { + "epoch": 0.87, + "learning_rate": 1.6675924236862357e-06, + "loss": 0.9268, + "step": 33863 + }, + { + "epoch": 0.87, + "learning_rate": 1.6675718220324568e-06, + "loss": 0.8008, + "step": 33864 + }, + { + "epoch": 0.87, + "learning_rate": 1.667551219867549e-06, + "loss": 0.9443, + "step": 33865 + }, + { + "epoch": 0.87, + "learning_rate": 1.6675306171915278e-06, + "loss": 0.9111, + "step": 33866 + }, + { + "epoch": 0.87, + "learning_rate": 1.6675100140044093e-06, + "loss": 0.9336, + "step": 33867 + }, + { + "epoch": 0.87, + "learning_rate": 1.6674894103062088e-06, + "loss": 1.0215, + "step": 33868 + }, + { + "epoch": 0.87, + "learning_rate": 1.6674688060969423e-06, + "loss": 0.8169, + "step": 33869 + }, + { + "epoch": 0.87, + "learning_rate": 1.6674482013766257e-06, + "loss": 0.9297, + "step": 33870 + }, + { + "epoch": 0.87, + "learning_rate": 1.667427596145275e-06, + "loss": 0.8677, + "step": 33871 + }, + { + "epoch": 0.87, + "learning_rate": 1.6674069904029053e-06, + "loss": 0.9277, + "step": 33872 + }, + { + "epoch": 0.87, + "learning_rate": 1.6673863841495327e-06, + "loss": 1.0693, + "step": 33873 + }, + { + "epoch": 0.87, + "learning_rate": 1.6673657773851732e-06, + "loss": 0.9473, + "step": 33874 + }, + { + "epoch": 0.87, + "learning_rate": 1.6673451701098427e-06, + "loss": 0.7285, + "step": 33875 + }, + { + "epoch": 0.87, + "learning_rate": 1.6673245623235563e-06, + "loss": 0.916, + "step": 33876 + }, + { + "epoch": 0.87, + "learning_rate": 1.6673039540263303e-06, + "loss": 0.6084, + "step": 33877 + }, + { + "epoch": 0.87, + "learning_rate": 1.6672833452181804e-06, + "loss": 1.0, + "step": 33878 + }, + { + "epoch": 0.87, + "learning_rate": 1.6672627358991222e-06, + "loss": 0.8564, + "step": 33879 + }, + { + "epoch": 0.87, + "learning_rate": 1.6672421260691717e-06, + "loss": 1.0342, + "step": 33880 + }, + { + "epoch": 0.87, + "learning_rate": 1.6672215157283445e-06, + "loss": 0.5425, + "step": 33881 + }, + { + "epoch": 0.87, + "learning_rate": 1.6672009048766567e-06, + "loss": 0.7812, + "step": 33882 + }, + { + "epoch": 0.87, + "learning_rate": 1.6671802935141237e-06, + "loss": 1.0332, + "step": 33883 + }, + { + "epoch": 0.87, + "learning_rate": 1.6671596816407614e-06, + "loss": 0.832, + "step": 33884 + }, + { + "epoch": 0.87, + "learning_rate": 1.6671390692565854e-06, + "loss": 0.6567, + "step": 33885 + }, + { + "epoch": 0.87, + "learning_rate": 1.6671184563616118e-06, + "loss": 1.0215, + "step": 33886 + }, + { + "epoch": 0.87, + "learning_rate": 1.6670978429558567e-06, + "loss": 0.916, + "step": 33887 + }, + { + "epoch": 0.87, + "learning_rate": 1.667077229039335e-06, + "loss": 0.9121, + "step": 33888 + }, + { + "epoch": 0.87, + "learning_rate": 1.667056614612063e-06, + "loss": 1.0938, + "step": 33889 + }, + { + "epoch": 0.87, + "learning_rate": 1.6670359996740567e-06, + "loss": 0.9668, + "step": 33890 + }, + { + "epoch": 0.87, + "learning_rate": 1.667015384225331e-06, + "loss": 0.7017, + "step": 33891 + }, + { + "epoch": 0.87, + "learning_rate": 1.6669947682659029e-06, + "loss": 0.959, + "step": 33892 + }, + { + "epoch": 0.87, + "learning_rate": 1.666974151795787e-06, + "loss": 0.7295, + "step": 33893 + }, + { + "epoch": 0.87, + "learning_rate": 1.6669535348150002e-06, + "loss": 0.7363, + "step": 33894 + }, + { + "epoch": 0.87, + "learning_rate": 1.6669329173235576e-06, + "loss": 0.8828, + "step": 33895 + }, + { + "epoch": 0.87, + "learning_rate": 1.666912299321475e-06, + "loss": 0.6953, + "step": 33896 + }, + { + "epoch": 0.87, + "learning_rate": 1.6668916808087684e-06, + "loss": 0.9268, + "step": 33897 + }, + { + "epoch": 0.87, + "learning_rate": 1.6668710617854535e-06, + "loss": 0.8457, + "step": 33898 + }, + { + "epoch": 0.87, + "learning_rate": 1.6668504422515462e-06, + "loss": 0.7227, + "step": 33899 + }, + { + "epoch": 0.87, + "learning_rate": 1.6668298222070623e-06, + "loss": 0.7246, + "step": 33900 + }, + { + "epoch": 0.87, + "learning_rate": 1.666809201652017e-06, + "loss": 0.6772, + "step": 33901 + }, + { + "epoch": 0.87, + "learning_rate": 1.6667885805864271e-06, + "loss": 0.96, + "step": 33902 + }, + { + "epoch": 0.87, + "learning_rate": 1.6667679590103073e-06, + "loss": 0.7852, + "step": 33903 + }, + { + "epoch": 0.87, + "learning_rate": 1.6667473369236742e-06, + "loss": 0.7329, + "step": 33904 + }, + { + "epoch": 0.87, + "learning_rate": 1.6667267143265433e-06, + "loss": 0.9072, + "step": 33905 + }, + { + "epoch": 0.87, + "learning_rate": 1.6667060912189305e-06, + "loss": 0.7114, + "step": 33906 + }, + { + "epoch": 0.87, + "learning_rate": 1.6666854676008515e-06, + "loss": 0.8096, + "step": 33907 + }, + { + "epoch": 0.87, + "learning_rate": 1.666664843472322e-06, + "loss": 0.8438, + "step": 33908 + }, + { + "epoch": 0.87, + "learning_rate": 1.6666442188333578e-06, + "loss": 0.5942, + "step": 33909 + }, + { + "epoch": 0.87, + "learning_rate": 1.6666235936839749e-06, + "loss": 0.8311, + "step": 33910 + }, + { + "epoch": 0.87, + "learning_rate": 1.666602968024189e-06, + "loss": 0.8318, + "step": 33911 + }, + { + "epoch": 0.87, + "learning_rate": 1.6665823418540157e-06, + "loss": 0.6421, + "step": 33912 + }, + { + "epoch": 0.87, + "learning_rate": 1.6665617151734713e-06, + "loss": 0.7598, + "step": 33913 + }, + { + "epoch": 0.87, + "learning_rate": 1.6665410879825708e-06, + "loss": 0.9072, + "step": 33914 + }, + { + "epoch": 0.87, + "learning_rate": 1.6665204602813305e-06, + "loss": 0.999, + "step": 33915 + }, + { + "epoch": 0.87, + "learning_rate": 1.6664998320697664e-06, + "loss": 0.9678, + "step": 33916 + }, + { + "epoch": 0.87, + "learning_rate": 1.666479203347894e-06, + "loss": 0.6821, + "step": 33917 + }, + { + "epoch": 0.87, + "learning_rate": 1.6664585741157288e-06, + "loss": 0.8281, + "step": 33918 + }, + { + "epoch": 0.87, + "learning_rate": 1.6664379443732873e-06, + "loss": 0.7358, + "step": 33919 + }, + { + "epoch": 0.87, + "learning_rate": 1.6664173141205846e-06, + "loss": 0.7783, + "step": 33920 + }, + { + "epoch": 0.87, + "learning_rate": 1.6663966833576368e-06, + "loss": 1.0078, + "step": 33921 + }, + { + "epoch": 0.87, + "learning_rate": 1.6663760520844598e-06, + "loss": 0.8311, + "step": 33922 + }, + { + "epoch": 0.87, + "learning_rate": 1.6663554203010695e-06, + "loss": 0.9355, + "step": 33923 + }, + { + "epoch": 0.87, + "learning_rate": 1.6663347880074814e-06, + "loss": 0.5664, + "step": 33924 + }, + { + "epoch": 0.87, + "learning_rate": 1.666314155203711e-06, + "loss": 0.999, + "step": 33925 + }, + { + "epoch": 0.87, + "learning_rate": 1.6662935218897748e-06, + "loss": 0.9346, + "step": 33926 + }, + { + "epoch": 0.87, + "learning_rate": 1.6662728880656886e-06, + "loss": 0.916, + "step": 33927 + }, + { + "epoch": 0.87, + "learning_rate": 1.6662522537314673e-06, + "loss": 1.0859, + "step": 33928 + }, + { + "epoch": 0.87, + "learning_rate": 1.6662316188871276e-06, + "loss": 0.6875, + "step": 33929 + }, + { + "epoch": 0.87, + "learning_rate": 1.666210983532685e-06, + "loss": 0.8066, + "step": 33930 + }, + { + "epoch": 0.87, + "learning_rate": 1.6661903476681553e-06, + "loss": 0.7222, + "step": 33931 + }, + { + "epoch": 0.87, + "learning_rate": 1.6661697112935543e-06, + "loss": 0.8008, + "step": 33932 + }, + { + "epoch": 0.87, + "learning_rate": 1.6661490744088975e-06, + "loss": 0.8169, + "step": 33933 + }, + { + "epoch": 0.87, + "learning_rate": 1.6661284370142013e-06, + "loss": 0.8252, + "step": 33934 + }, + { + "epoch": 0.87, + "learning_rate": 1.666107799109481e-06, + "loss": 0.7686, + "step": 33935 + }, + { + "epoch": 0.87, + "learning_rate": 1.6660871606947525e-06, + "loss": 0.7463, + "step": 33936 + }, + { + "epoch": 0.87, + "learning_rate": 1.666066521770032e-06, + "loss": 0.7617, + "step": 33937 + }, + { + "epoch": 0.87, + "learning_rate": 1.6660458823353348e-06, + "loss": 0.833, + "step": 33938 + }, + { + "epoch": 0.87, + "learning_rate": 1.666025242390677e-06, + "loss": 0.791, + "step": 33939 + }, + { + "epoch": 0.87, + "learning_rate": 1.6660046019360742e-06, + "loss": 0.7217, + "step": 33940 + }, + { + "epoch": 0.87, + "learning_rate": 1.6659839609715422e-06, + "loss": 0.9678, + "step": 33941 + }, + { + "epoch": 0.87, + "learning_rate": 1.6659633194970972e-06, + "loss": 0.8535, + "step": 33942 + }, + { + "epoch": 0.87, + "learning_rate": 1.6659426775127545e-06, + "loss": 0.8418, + "step": 33943 + }, + { + "epoch": 0.87, + "learning_rate": 1.6659220350185301e-06, + "loss": 0.832, + "step": 33944 + }, + { + "epoch": 0.87, + "learning_rate": 1.6659013920144398e-06, + "loss": 0.8916, + "step": 33945 + }, + { + "epoch": 0.87, + "learning_rate": 1.6658807485004995e-06, + "loss": 0.8408, + "step": 33946 + }, + { + "epoch": 0.87, + "learning_rate": 1.6658601044767249e-06, + "loss": 1.0762, + "step": 33947 + }, + { + "epoch": 0.87, + "learning_rate": 1.6658394599431321e-06, + "loss": 0.9434, + "step": 33948 + }, + { + "epoch": 0.87, + "learning_rate": 1.6658188148997362e-06, + "loss": 0.7783, + "step": 33949 + }, + { + "epoch": 0.87, + "learning_rate": 1.6657981693465536e-06, + "loss": 0.8252, + "step": 33950 + }, + { + "epoch": 0.87, + "learning_rate": 1.6657775232836e-06, + "loss": 0.7393, + "step": 33951 + }, + { + "epoch": 0.87, + "learning_rate": 1.6657568767108913e-06, + "loss": 1.0625, + "step": 33952 + }, + { + "epoch": 0.87, + "learning_rate": 1.665736229628443e-06, + "loss": 0.9893, + "step": 33953 + }, + { + "epoch": 0.87, + "learning_rate": 1.6657155820362712e-06, + "loss": 0.959, + "step": 33954 + }, + { + "epoch": 0.87, + "learning_rate": 1.6656949339343914e-06, + "loss": 0.7354, + "step": 33955 + }, + { + "epoch": 0.87, + "learning_rate": 1.6656742853228197e-06, + "loss": 0.7998, + "step": 33956 + }, + { + "epoch": 0.87, + "learning_rate": 1.6656536362015716e-06, + "loss": 0.6416, + "step": 33957 + }, + { + "epoch": 0.87, + "learning_rate": 1.6656329865706635e-06, + "loss": 0.8125, + "step": 33958 + }, + { + "epoch": 0.87, + "learning_rate": 1.6656123364301107e-06, + "loss": 0.7529, + "step": 33959 + }, + { + "epoch": 0.87, + "learning_rate": 1.665591685779929e-06, + "loss": 0.9512, + "step": 33960 + }, + { + "epoch": 0.87, + "learning_rate": 1.6655710346201346e-06, + "loss": 0.8252, + "step": 33961 + }, + { + "epoch": 0.87, + "learning_rate": 1.6655503829507426e-06, + "loss": 0.7881, + "step": 33962 + }, + { + "epoch": 0.87, + "learning_rate": 1.6655297307717697e-06, + "loss": 0.8213, + "step": 33963 + }, + { + "epoch": 0.87, + "learning_rate": 1.6655090780832312e-06, + "loss": 0.686, + "step": 33964 + }, + { + "epoch": 0.87, + "learning_rate": 1.6654884248851428e-06, + "loss": 0.9434, + "step": 33965 + }, + { + "epoch": 0.87, + "learning_rate": 1.6654677711775208e-06, + "loss": 0.6631, + "step": 33966 + }, + { + "epoch": 0.87, + "learning_rate": 1.6654471169603808e-06, + "loss": 0.9507, + "step": 33967 + }, + { + "epoch": 0.87, + "learning_rate": 1.6654264622337384e-06, + "loss": 0.9062, + "step": 33968 + }, + { + "epoch": 0.87, + "learning_rate": 1.6654058069976094e-06, + "loss": 0.9453, + "step": 33969 + }, + { + "epoch": 0.87, + "learning_rate": 1.6653851512520099e-06, + "loss": 0.6138, + "step": 33970 + }, + { + "epoch": 0.87, + "learning_rate": 1.6653644949969554e-06, + "loss": 0.7046, + "step": 33971 + }, + { + "epoch": 0.87, + "learning_rate": 1.6653438382324622e-06, + "loss": 0.9141, + "step": 33972 + }, + { + "epoch": 0.87, + "learning_rate": 1.6653231809585457e-06, + "loss": 0.6384, + "step": 33973 + }, + { + "epoch": 0.87, + "learning_rate": 1.6653025231752218e-06, + "loss": 0.9229, + "step": 33974 + }, + { + "epoch": 0.87, + "learning_rate": 1.6652818648825063e-06, + "loss": 0.8887, + "step": 33975 + }, + { + "epoch": 0.87, + "learning_rate": 1.665261206080415e-06, + "loss": 0.8008, + "step": 33976 + }, + { + "epoch": 0.87, + "learning_rate": 1.6652405467689641e-06, + "loss": 0.96, + "step": 33977 + }, + { + "epoch": 0.87, + "learning_rate": 1.665219886948169e-06, + "loss": 0.668, + "step": 33978 + }, + { + "epoch": 0.87, + "learning_rate": 1.6651992266180455e-06, + "loss": 1.0566, + "step": 33979 + }, + { + "epoch": 0.87, + "learning_rate": 1.6651785657786094e-06, + "loss": 1.0625, + "step": 33980 + }, + { + "epoch": 0.87, + "learning_rate": 1.665157904429877e-06, + "loss": 1.0889, + "step": 33981 + }, + { + "epoch": 0.87, + "learning_rate": 1.6651372425718634e-06, + "loss": 0.751, + "step": 33982 + }, + { + "epoch": 0.87, + "learning_rate": 1.665116580204585e-06, + "loss": 0.7549, + "step": 33983 + }, + { + "epoch": 0.87, + "learning_rate": 1.6650959173280574e-06, + "loss": 0.6484, + "step": 33984 + }, + { + "epoch": 0.87, + "learning_rate": 1.6650752539422965e-06, + "loss": 0.7437, + "step": 33985 + }, + { + "epoch": 0.87, + "learning_rate": 1.665054590047318e-06, + "loss": 0.917, + "step": 33986 + }, + { + "epoch": 0.87, + "learning_rate": 1.6650339256431378e-06, + "loss": 0.9414, + "step": 33987 + }, + { + "epoch": 0.87, + "learning_rate": 1.6650132607297718e-06, + "loss": 0.6943, + "step": 33988 + }, + { + "epoch": 0.87, + "learning_rate": 1.6649925953072357e-06, + "loss": 0.9365, + "step": 33989 + }, + { + "epoch": 0.87, + "learning_rate": 1.664971929375545e-06, + "loss": 0.8594, + "step": 33990 + }, + { + "epoch": 0.87, + "learning_rate": 1.6649512629347163e-06, + "loss": 0.9658, + "step": 33991 + }, + { + "epoch": 0.87, + "learning_rate": 1.664930595984765e-06, + "loss": 0.9561, + "step": 33992 + }, + { + "epoch": 0.87, + "learning_rate": 1.6649099285257067e-06, + "loss": 1.0322, + "step": 33993 + }, + { + "epoch": 0.87, + "learning_rate": 1.6648892605575573e-06, + "loss": 0.8853, + "step": 33994 + }, + { + "epoch": 0.87, + "learning_rate": 1.664868592080333e-06, + "loss": 0.8916, + "step": 33995 + }, + { + "epoch": 0.87, + "learning_rate": 1.6648479230940493e-06, + "loss": 0.9141, + "step": 33996 + }, + { + "epoch": 0.87, + "learning_rate": 1.6648272535987223e-06, + "loss": 0.6904, + "step": 33997 + }, + { + "epoch": 0.87, + "learning_rate": 1.6648065835943674e-06, + "loss": 0.9785, + "step": 33998 + }, + { + "epoch": 0.87, + "learning_rate": 1.6647859130810007e-06, + "loss": 0.8418, + "step": 33999 + }, + { + "epoch": 0.87, + "learning_rate": 1.6647652420586382e-06, + "loss": 0.7588, + "step": 34000 + }, + { + "epoch": 0.87, + "learning_rate": 1.6647445705272954e-06, + "loss": 0.8711, + "step": 34001 + }, + { + "epoch": 0.87, + "learning_rate": 1.6647238984869883e-06, + "loss": 0.7607, + "step": 34002 + }, + { + "epoch": 0.87, + "learning_rate": 1.6647032259377327e-06, + "loss": 0.6333, + "step": 34003 + }, + { + "epoch": 0.87, + "learning_rate": 1.6646825528795443e-06, + "loss": 0.9658, + "step": 34004 + }, + { + "epoch": 0.87, + "learning_rate": 1.664661879312439e-06, + "loss": 0.7729, + "step": 34005 + }, + { + "epoch": 0.87, + "learning_rate": 1.6646412052364327e-06, + "loss": 1.0166, + "step": 34006 + }, + { + "epoch": 0.87, + "learning_rate": 1.664620530651541e-06, + "loss": 0.7549, + "step": 34007 + }, + { + "epoch": 0.87, + "learning_rate": 1.6645998555577802e-06, + "loss": 1.0312, + "step": 34008 + }, + { + "epoch": 0.87, + "learning_rate": 1.6645791799551657e-06, + "loss": 0.9775, + "step": 34009 + }, + { + "epoch": 0.87, + "learning_rate": 1.6645585038437135e-06, + "loss": 0.7969, + "step": 34010 + }, + { + "epoch": 0.87, + "learning_rate": 1.6645378272234397e-06, + "loss": 0.9482, + "step": 34011 + }, + { + "epoch": 0.87, + "learning_rate": 1.6645171500943595e-06, + "loss": 0.8633, + "step": 34012 + }, + { + "epoch": 0.87, + "learning_rate": 1.6644964724564892e-06, + "loss": 0.8887, + "step": 34013 + }, + { + "epoch": 0.87, + "learning_rate": 1.6644757943098444e-06, + "loss": 0.917, + "step": 34014 + }, + { + "epoch": 0.87, + "learning_rate": 1.664455115654441e-06, + "loss": 0.5789, + "step": 34015 + }, + { + "epoch": 0.87, + "learning_rate": 1.6644344364902952e-06, + "loss": 0.8613, + "step": 34016 + }, + { + "epoch": 0.87, + "learning_rate": 1.6644137568174224e-06, + "loss": 0.8752, + "step": 34017 + }, + { + "epoch": 0.87, + "learning_rate": 1.6643930766358382e-06, + "loss": 0.9766, + "step": 34018 + }, + { + "epoch": 0.87, + "learning_rate": 1.6643723959455592e-06, + "loss": 1.0459, + "step": 34019 + }, + { + "epoch": 0.87, + "learning_rate": 1.6643517147466003e-06, + "loss": 0.8613, + "step": 34020 + }, + { + "epoch": 0.87, + "learning_rate": 1.6643310330389785e-06, + "loss": 0.7397, + "step": 34021 + }, + { + "epoch": 0.87, + "learning_rate": 1.6643103508227084e-06, + "loss": 0.7778, + "step": 34022 + }, + { + "epoch": 0.87, + "learning_rate": 1.6642896680978068e-06, + "loss": 0.9375, + "step": 34023 + }, + { + "epoch": 0.87, + "learning_rate": 1.664268984864289e-06, + "loss": 0.6675, + "step": 34024 + }, + { + "epoch": 0.87, + "learning_rate": 1.6642483011221708e-06, + "loss": 0.7339, + "step": 34025 + }, + { + "epoch": 0.87, + "learning_rate": 1.6642276168714685e-06, + "loss": 0.96, + "step": 34026 + }, + { + "epoch": 0.87, + "learning_rate": 1.6642069321121974e-06, + "loss": 1.0088, + "step": 34027 + }, + { + "epoch": 0.87, + "learning_rate": 1.6641862468443737e-06, + "loss": 0.8916, + "step": 34028 + }, + { + "epoch": 0.87, + "learning_rate": 1.6641655610680131e-06, + "loss": 0.8584, + "step": 34029 + }, + { + "epoch": 0.87, + "learning_rate": 1.6641448747831315e-06, + "loss": 1.0181, + "step": 34030 + }, + { + "epoch": 0.87, + "learning_rate": 1.6641241879897447e-06, + "loss": 0.9648, + "step": 34031 + }, + { + "epoch": 0.87, + "learning_rate": 1.6641035006878688e-06, + "loss": 0.79, + "step": 34032 + }, + { + "epoch": 0.87, + "learning_rate": 1.6640828128775191e-06, + "loss": 0.6348, + "step": 34033 + }, + { + "epoch": 0.87, + "learning_rate": 1.6640621245587117e-06, + "loss": 0.9678, + "step": 34034 + }, + { + "epoch": 0.87, + "learning_rate": 1.6640414357314624e-06, + "loss": 0.8047, + "step": 34035 + }, + { + "epoch": 0.87, + "learning_rate": 1.6640207463957873e-06, + "loss": 0.8896, + "step": 34036 + }, + { + "epoch": 0.87, + "learning_rate": 1.6640000565517023e-06, + "loss": 0.9243, + "step": 34037 + }, + { + "epoch": 0.87, + "learning_rate": 1.6639793661992228e-06, + "loss": 0.8525, + "step": 34038 + }, + { + "epoch": 0.87, + "learning_rate": 1.6639586753383645e-06, + "loss": 0.6357, + "step": 34039 + }, + { + "epoch": 0.87, + "learning_rate": 1.6639379839691437e-06, + "loss": 0.9033, + "step": 34040 + }, + { + "epoch": 0.87, + "learning_rate": 1.6639172920915762e-06, + "loss": 0.833, + "step": 34041 + }, + { + "epoch": 0.87, + "learning_rate": 1.6638965997056779e-06, + "loss": 0.8906, + "step": 34042 + }, + { + "epoch": 0.87, + "learning_rate": 1.6638759068114645e-06, + "loss": 0.752, + "step": 34043 + }, + { + "epoch": 0.87, + "learning_rate": 1.6638552134089517e-06, + "loss": 0.707, + "step": 34044 + }, + { + "epoch": 0.87, + "learning_rate": 1.6638345194981553e-06, + "loss": 0.6777, + "step": 34045 + }, + { + "epoch": 0.87, + "learning_rate": 1.6638138250790916e-06, + "loss": 0.9043, + "step": 34046 + }, + { + "epoch": 0.87, + "learning_rate": 1.663793130151776e-06, + "loss": 0.9619, + "step": 34047 + }, + { + "epoch": 0.87, + "learning_rate": 1.6637724347162248e-06, + "loss": 0.7744, + "step": 34048 + }, + { + "epoch": 0.87, + "learning_rate": 1.6637517387724533e-06, + "loss": 0.9014, + "step": 34049 + }, + { + "epoch": 0.87, + "learning_rate": 1.6637310423204779e-06, + "loss": 0.8701, + "step": 34050 + }, + { + "epoch": 0.87, + "learning_rate": 1.6637103453603138e-06, + "loss": 0.7043, + "step": 34051 + }, + { + "epoch": 0.87, + "learning_rate": 1.6636896478919774e-06, + "loss": 0.7773, + "step": 34052 + }, + { + "epoch": 0.87, + "learning_rate": 1.6636689499154844e-06, + "loss": 0.8462, + "step": 34053 + }, + { + "epoch": 0.87, + "learning_rate": 1.6636482514308506e-06, + "loss": 1.0635, + "step": 34054 + }, + { + "epoch": 0.87, + "learning_rate": 1.6636275524380916e-06, + "loss": 0.8379, + "step": 34055 + }, + { + "epoch": 0.87, + "learning_rate": 1.6636068529372237e-06, + "loss": 0.7974, + "step": 34056 + }, + { + "epoch": 0.87, + "learning_rate": 1.6635861529282626e-06, + "loss": 0.8867, + "step": 34057 + }, + { + "epoch": 0.87, + "learning_rate": 1.6635654524112242e-06, + "loss": 0.8604, + "step": 34058 + }, + { + "epoch": 0.87, + "learning_rate": 1.6635447513861238e-06, + "loss": 0.8193, + "step": 34059 + }, + { + "epoch": 0.87, + "learning_rate": 1.663524049852978e-06, + "loss": 0.7178, + "step": 34060 + }, + { + "epoch": 0.87, + "learning_rate": 1.6635033478118023e-06, + "loss": 0.7812, + "step": 34061 + }, + { + "epoch": 0.87, + "learning_rate": 1.6634826452626127e-06, + "loss": 0.8994, + "step": 34062 + }, + { + "epoch": 0.87, + "learning_rate": 1.663461942205425e-06, + "loss": 0.6953, + "step": 34063 + }, + { + "epoch": 0.87, + "learning_rate": 1.6634412386402548e-06, + "loss": 0.9189, + "step": 34064 + }, + { + "epoch": 0.87, + "learning_rate": 1.663420534567118e-06, + "loss": 0.7246, + "step": 34065 + }, + { + "epoch": 0.87, + "learning_rate": 1.663399829986031e-06, + "loss": 0.9111, + "step": 34066 + }, + { + "epoch": 0.87, + "learning_rate": 1.663379124897009e-06, + "loss": 0.874, + "step": 34067 + }, + { + "epoch": 0.87, + "learning_rate": 1.663358419300068e-06, + "loss": 1.0352, + "step": 34068 + }, + { + "epoch": 0.87, + "learning_rate": 1.6633377131952245e-06, + "loss": 0.6226, + "step": 34069 + }, + { + "epoch": 0.87, + "learning_rate": 1.6633170065824932e-06, + "loss": 1.1113, + "step": 34070 + }, + { + "epoch": 0.87, + "learning_rate": 1.6632962994618907e-06, + "loss": 0.9434, + "step": 34071 + }, + { + "epoch": 0.87, + "learning_rate": 1.6632755918334329e-06, + "loss": 1.0732, + "step": 34072 + }, + { + "epoch": 0.87, + "learning_rate": 1.6632548836971354e-06, + "loss": 0.9053, + "step": 34073 + }, + { + "epoch": 0.87, + "learning_rate": 1.663234175053014e-06, + "loss": 1.0576, + "step": 34074 + }, + { + "epoch": 0.87, + "learning_rate": 1.663213465901085e-06, + "loss": 1.0049, + "step": 34075 + }, + { + "epoch": 0.87, + "learning_rate": 1.6631927562413637e-06, + "loss": 0.7427, + "step": 34076 + }, + { + "epoch": 0.87, + "learning_rate": 1.6631720460738664e-06, + "loss": 0.7285, + "step": 34077 + }, + { + "epoch": 0.87, + "learning_rate": 1.6631513353986084e-06, + "loss": 0.8486, + "step": 34078 + }, + { + "epoch": 0.87, + "learning_rate": 1.6631306242156062e-06, + "loss": 0.8682, + "step": 34079 + }, + { + "epoch": 0.87, + "learning_rate": 1.6631099125248754e-06, + "loss": 0.7439, + "step": 34080 + }, + { + "epoch": 0.87, + "learning_rate": 1.6630892003264317e-06, + "loss": 0.8428, + "step": 34081 + }, + { + "epoch": 0.87, + "learning_rate": 1.6630684876202913e-06, + "loss": 0.9795, + "step": 34082 + }, + { + "epoch": 0.87, + "learning_rate": 1.6630477744064698e-06, + "loss": 0.8501, + "step": 34083 + }, + { + "epoch": 0.87, + "learning_rate": 1.6630270606849827e-06, + "loss": 0.835, + "step": 34084 + }, + { + "epoch": 0.87, + "learning_rate": 1.6630063464558466e-06, + "loss": 0.8242, + "step": 34085 + }, + { + "epoch": 0.87, + "learning_rate": 1.6629856317190768e-06, + "loss": 0.6221, + "step": 34086 + }, + { + "epoch": 0.87, + "learning_rate": 1.66296491647469e-06, + "loss": 0.9678, + "step": 34087 + }, + { + "epoch": 0.87, + "learning_rate": 1.6629442007227008e-06, + "loss": 0.8555, + "step": 34088 + }, + { + "epoch": 0.87, + "learning_rate": 1.662923484463126e-06, + "loss": 0.8154, + "step": 34089 + }, + { + "epoch": 0.87, + "learning_rate": 1.6629027676959811e-06, + "loss": 0.8643, + "step": 34090 + }, + { + "epoch": 0.87, + "learning_rate": 1.6628820504212819e-06, + "loss": 0.7344, + "step": 34091 + }, + { + "epoch": 0.87, + "learning_rate": 1.6628613326390446e-06, + "loss": 0.647, + "step": 34092 + }, + { + "epoch": 0.87, + "learning_rate": 1.6628406143492848e-06, + "loss": 0.8379, + "step": 34093 + }, + { + "epoch": 0.87, + "learning_rate": 1.6628198955520184e-06, + "loss": 0.9717, + "step": 34094 + }, + { + "epoch": 0.87, + "learning_rate": 1.6627991762472614e-06, + "loss": 0.8154, + "step": 34095 + }, + { + "epoch": 0.87, + "learning_rate": 1.6627784564350291e-06, + "loss": 1.0293, + "step": 34096 + }, + { + "epoch": 0.87, + "learning_rate": 1.6627577361153383e-06, + "loss": 0.6709, + "step": 34097 + }, + { + "epoch": 0.87, + "learning_rate": 1.6627370152882043e-06, + "loss": 0.9238, + "step": 34098 + }, + { + "epoch": 0.87, + "learning_rate": 1.6627162939536427e-06, + "loss": 0.6348, + "step": 34099 + }, + { + "epoch": 0.87, + "learning_rate": 1.66269557211167e-06, + "loss": 0.7671, + "step": 34100 + }, + { + "epoch": 0.87, + "learning_rate": 1.6626748497623018e-06, + "loss": 0.8916, + "step": 34101 + }, + { + "epoch": 0.87, + "learning_rate": 1.6626541269055538e-06, + "loss": 0.8242, + "step": 34102 + }, + { + "epoch": 0.87, + "learning_rate": 1.6626334035414422e-06, + "loss": 1.0605, + "step": 34103 + }, + { + "epoch": 0.87, + "learning_rate": 1.6626126796699826e-06, + "loss": 0.7861, + "step": 34104 + }, + { + "epoch": 0.87, + "learning_rate": 1.662591955291191e-06, + "loss": 0.5156, + "step": 34105 + }, + { + "epoch": 0.87, + "learning_rate": 1.6625712304050827e-06, + "loss": 0.957, + "step": 34106 + }, + { + "epoch": 0.87, + "learning_rate": 1.6625505050116745e-06, + "loss": 0.5942, + "step": 34107 + }, + { + "epoch": 0.87, + "learning_rate": 1.662529779110982e-06, + "loss": 1.0264, + "step": 34108 + }, + { + "epoch": 0.87, + "learning_rate": 1.6625090527030208e-06, + "loss": 0.7505, + "step": 34109 + }, + { + "epoch": 0.87, + "learning_rate": 1.6624883257878066e-06, + "loss": 0.9502, + "step": 34110 + }, + { + "epoch": 0.87, + "learning_rate": 1.6624675983653558e-06, + "loss": 0.9355, + "step": 34111 + }, + { + "epoch": 0.87, + "learning_rate": 1.662446870435684e-06, + "loss": 1.0059, + "step": 34112 + }, + { + "epoch": 0.87, + "learning_rate": 1.6624261419988073e-06, + "loss": 0.8018, + "step": 34113 + }, + { + "epoch": 0.87, + "learning_rate": 1.6624054130547412e-06, + "loss": 0.9443, + "step": 34114 + }, + { + "epoch": 0.87, + "learning_rate": 1.6623846836035014e-06, + "loss": 0.8203, + "step": 34115 + }, + { + "epoch": 0.87, + "learning_rate": 1.6623639536451045e-06, + "loss": 0.8438, + "step": 34116 + }, + { + "epoch": 0.87, + "learning_rate": 1.6623432231795658e-06, + "loss": 0.6953, + "step": 34117 + }, + { + "epoch": 0.87, + "learning_rate": 1.6623224922069014e-06, + "loss": 0.8013, + "step": 34118 + }, + { + "epoch": 0.87, + "learning_rate": 1.662301760727127e-06, + "loss": 0.9941, + "step": 34119 + }, + { + "epoch": 0.87, + "learning_rate": 1.6622810287402587e-06, + "loss": 1.0205, + "step": 34120 + }, + { + "epoch": 0.87, + "learning_rate": 1.6622602962463124e-06, + "loss": 0.8984, + "step": 34121 + }, + { + "epoch": 0.87, + "learning_rate": 1.6622395632453037e-06, + "loss": 0.8223, + "step": 34122 + }, + { + "epoch": 0.87, + "learning_rate": 1.6622188297372485e-06, + "loss": 0.7815, + "step": 34123 + }, + { + "epoch": 0.87, + "learning_rate": 1.662198095722163e-06, + "loss": 0.7271, + "step": 34124 + }, + { + "epoch": 0.87, + "learning_rate": 1.662177361200063e-06, + "loss": 0.7939, + "step": 34125 + }, + { + "epoch": 0.87, + "learning_rate": 1.6621566261709638e-06, + "loss": 0.9912, + "step": 34126 + }, + { + "epoch": 0.87, + "learning_rate": 1.6621358906348822e-06, + "loss": 0.8447, + "step": 34127 + }, + { + "epoch": 0.87, + "learning_rate": 1.6621151545918332e-06, + "loss": 0.7881, + "step": 34128 + }, + { + "epoch": 0.87, + "learning_rate": 1.6620944180418333e-06, + "loss": 0.8186, + "step": 34129 + }, + { + "epoch": 0.87, + "learning_rate": 1.6620736809848981e-06, + "loss": 0.7485, + "step": 34130 + }, + { + "epoch": 0.87, + "learning_rate": 1.6620529434210436e-06, + "loss": 0.6404, + "step": 34131 + }, + { + "epoch": 0.87, + "learning_rate": 1.6620322053502854e-06, + "loss": 0.6953, + "step": 34132 + }, + { + "epoch": 0.87, + "learning_rate": 1.6620114667726398e-06, + "loss": 0.9365, + "step": 34133 + }, + { + "epoch": 0.87, + "learning_rate": 1.661990727688122e-06, + "loss": 0.7266, + "step": 34134 + }, + { + "epoch": 0.87, + "learning_rate": 1.6619699880967489e-06, + "loss": 0.6877, + "step": 34135 + }, + { + "epoch": 0.87, + "learning_rate": 1.6619492479985355e-06, + "loss": 0.7134, + "step": 34136 + }, + { + "epoch": 0.87, + "learning_rate": 1.6619285073934981e-06, + "loss": 0.8276, + "step": 34137 + }, + { + "epoch": 0.87, + "learning_rate": 1.6619077662816526e-06, + "loss": 0.8906, + "step": 34138 + }, + { + "epoch": 0.88, + "learning_rate": 1.6618870246630145e-06, + "loss": 0.79, + "step": 34139 + }, + { + "epoch": 0.88, + "learning_rate": 1.6618662825376002e-06, + "loss": 0.6687, + "step": 34140 + }, + { + "epoch": 0.88, + "learning_rate": 1.6618455399054251e-06, + "loss": 1.0576, + "step": 34141 + }, + { + "epoch": 0.88, + "learning_rate": 1.6618247967665054e-06, + "loss": 1.1064, + "step": 34142 + }, + { + "epoch": 0.88, + "learning_rate": 1.661804053120857e-06, + "loss": 0.9277, + "step": 34143 + }, + { + "epoch": 0.88, + "learning_rate": 1.6617833089684955e-06, + "loss": 0.7563, + "step": 34144 + }, + { + "epoch": 0.88, + "learning_rate": 1.6617625643094369e-06, + "loss": 0.8604, + "step": 34145 + }, + { + "epoch": 0.88, + "learning_rate": 1.6617418191436973e-06, + "loss": 0.6997, + "step": 34146 + }, + { + "epoch": 0.88, + "learning_rate": 1.6617210734712923e-06, + "loss": 0.5957, + "step": 34147 + }, + { + "epoch": 0.88, + "learning_rate": 1.661700327292238e-06, + "loss": 0.9844, + "step": 34148 + }, + { + "epoch": 0.88, + "learning_rate": 1.6616795806065503e-06, + "loss": 0.6543, + "step": 34149 + }, + { + "epoch": 0.88, + "learning_rate": 1.6616588334142448e-06, + "loss": 0.6042, + "step": 34150 + }, + { + "epoch": 0.88, + "learning_rate": 1.6616380857153374e-06, + "loss": 0.9121, + "step": 34151 + }, + { + "epoch": 0.88, + "learning_rate": 1.6616173375098444e-06, + "loss": 1.043, + "step": 34152 + }, + { + "epoch": 0.88, + "learning_rate": 1.6615965887977812e-06, + "loss": 0.731, + "step": 34153 + }, + { + "epoch": 0.88, + "learning_rate": 1.6615758395791639e-06, + "loss": 0.8926, + "step": 34154 + }, + { + "epoch": 0.88, + "learning_rate": 1.6615550898540084e-06, + "loss": 0.8369, + "step": 34155 + }, + { + "epoch": 0.88, + "learning_rate": 1.661534339622331e-06, + "loss": 1.0859, + "step": 34156 + }, + { + "epoch": 0.88, + "learning_rate": 1.661513588884147e-06, + "loss": 0.8408, + "step": 34157 + }, + { + "epoch": 0.88, + "learning_rate": 1.6614928376394722e-06, + "loss": 0.8857, + "step": 34158 + }, + { + "epoch": 0.88, + "learning_rate": 1.6614720858883228e-06, + "loss": 0.8896, + "step": 34159 + }, + { + "epoch": 0.88, + "learning_rate": 1.661451333630715e-06, + "loss": 0.9717, + "step": 34160 + }, + { + "epoch": 0.88, + "learning_rate": 1.6614305808666643e-06, + "loss": 0.7896, + "step": 34161 + }, + { + "epoch": 0.88, + "learning_rate": 1.661409827596186e-06, + "loss": 0.7031, + "step": 34162 + }, + { + "epoch": 0.88, + "learning_rate": 1.661389073819297e-06, + "loss": 0.7808, + "step": 34163 + }, + { + "epoch": 0.88, + "learning_rate": 1.6613683195360129e-06, + "loss": 0.771, + "step": 34164 + }, + { + "epoch": 0.88, + "learning_rate": 1.6613475647463494e-06, + "loss": 0.6191, + "step": 34165 + }, + { + "epoch": 0.88, + "learning_rate": 1.6613268094503226e-06, + "loss": 0.8545, + "step": 34166 + }, + { + "epoch": 0.88, + "learning_rate": 1.661306053647948e-06, + "loss": 0.9385, + "step": 34167 + }, + { + "epoch": 0.88, + "learning_rate": 1.661285297339242e-06, + "loss": 0.999, + "step": 34168 + }, + { + "epoch": 0.88, + "learning_rate": 1.66126454052422e-06, + "loss": 1.0996, + "step": 34169 + }, + { + "epoch": 0.88, + "learning_rate": 1.6612437832028982e-06, + "loss": 0.7837, + "step": 34170 + }, + { + "epoch": 0.88, + "learning_rate": 1.661223025375293e-06, + "loss": 0.8516, + "step": 34171 + }, + { + "epoch": 0.88, + "learning_rate": 1.661202267041419e-06, + "loss": 0.73, + "step": 34172 + }, + { + "epoch": 0.88, + "learning_rate": 1.6611815082012933e-06, + "loss": 0.9048, + "step": 34173 + }, + { + "epoch": 0.88, + "learning_rate": 1.661160748854931e-06, + "loss": 0.8672, + "step": 34174 + }, + { + "epoch": 0.88, + "learning_rate": 1.6611399890023484e-06, + "loss": 0.8096, + "step": 34175 + }, + { + "epoch": 0.88, + "learning_rate": 1.6611192286435616e-06, + "loss": 0.8022, + "step": 34176 + }, + { + "epoch": 0.88, + "learning_rate": 1.661098467778586e-06, + "loss": 0.9033, + "step": 34177 + }, + { + "epoch": 0.88, + "learning_rate": 1.6610777064074376e-06, + "loss": 0.8154, + "step": 34178 + }, + { + "epoch": 0.88, + "learning_rate": 1.661056944530132e-06, + "loss": 0.7136, + "step": 34179 + }, + { + "epoch": 0.88, + "learning_rate": 1.6610361821466862e-06, + "loss": 1.0117, + "step": 34180 + }, + { + "epoch": 0.88, + "learning_rate": 1.6610154192571151e-06, + "loss": 0.8477, + "step": 34181 + }, + { + "epoch": 0.88, + "learning_rate": 1.6609946558614349e-06, + "loss": 0.9355, + "step": 34182 + }, + { + "epoch": 0.88, + "learning_rate": 1.6609738919596616e-06, + "loss": 1.0488, + "step": 34183 + }, + { + "epoch": 0.88, + "learning_rate": 1.660953127551811e-06, + "loss": 0.7666, + "step": 34184 + }, + { + "epoch": 0.88, + "learning_rate": 1.6609323626378987e-06, + "loss": 0.729, + "step": 34185 + }, + { + "epoch": 0.88, + "learning_rate": 1.6609115972179412e-06, + "loss": 0.791, + "step": 34186 + }, + { + "epoch": 0.88, + "learning_rate": 1.660890831291954e-06, + "loss": 1.0225, + "step": 34187 + }, + { + "epoch": 0.88, + "learning_rate": 1.660870064859953e-06, + "loss": 0.731, + "step": 34188 + }, + { + "epoch": 0.88, + "learning_rate": 1.660849297921954e-06, + "loss": 0.9365, + "step": 34189 + }, + { + "epoch": 0.88, + "learning_rate": 1.6608285304779735e-06, + "loss": 0.8525, + "step": 34190 + }, + { + "epoch": 0.88, + "learning_rate": 1.6608077625280266e-06, + "loss": 0.7441, + "step": 34191 + }, + { + "epoch": 0.88, + "learning_rate": 1.6607869940721298e-06, + "loss": 0.7393, + "step": 34192 + }, + { + "epoch": 0.88, + "learning_rate": 1.6607662251102988e-06, + "loss": 0.8564, + "step": 34193 + }, + { + "epoch": 0.88, + "learning_rate": 1.6607454556425493e-06, + "loss": 0.9609, + "step": 34194 + }, + { + "epoch": 0.88, + "learning_rate": 1.6607246856688974e-06, + "loss": 1.0518, + "step": 34195 + }, + { + "epoch": 0.88, + "learning_rate": 1.6607039151893592e-06, + "loss": 1.1182, + "step": 34196 + }, + { + "epoch": 0.88, + "learning_rate": 1.6606831442039504e-06, + "loss": 0.8984, + "step": 34197 + }, + { + "epoch": 0.88, + "learning_rate": 1.6606623727126867e-06, + "loss": 0.8828, + "step": 34198 + }, + { + "epoch": 0.88, + "learning_rate": 1.6606416007155844e-06, + "loss": 0.748, + "step": 34199 + }, + { + "epoch": 0.88, + "learning_rate": 1.6606208282126588e-06, + "loss": 1.0342, + "step": 34200 + }, + { + "epoch": 0.88, + "learning_rate": 1.6606000552039267e-06, + "loss": 0.6328, + "step": 34201 + }, + { + "epoch": 0.88, + "learning_rate": 1.660579281689403e-06, + "loss": 0.6836, + "step": 34202 + }, + { + "epoch": 0.88, + "learning_rate": 1.6605585076691048e-06, + "loss": 0.8516, + "step": 34203 + }, + { + "epoch": 0.88, + "learning_rate": 1.6605377331430467e-06, + "loss": 0.79, + "step": 34204 + }, + { + "epoch": 0.88, + "learning_rate": 1.6605169581112454e-06, + "loss": 1.0596, + "step": 34205 + }, + { + "epoch": 0.88, + "learning_rate": 1.6604961825737167e-06, + "loss": 0.9004, + "step": 34206 + }, + { + "epoch": 0.88, + "learning_rate": 1.6604754065304768e-06, + "loss": 0.8594, + "step": 34207 + }, + { + "epoch": 0.88, + "learning_rate": 1.6604546299815408e-06, + "loss": 0.8311, + "step": 34208 + }, + { + "epoch": 0.88, + "learning_rate": 1.6604338529269249e-06, + "loss": 0.8252, + "step": 34209 + }, + { + "epoch": 0.88, + "learning_rate": 1.6604130753666455e-06, + "loss": 0.8525, + "step": 34210 + }, + { + "epoch": 0.88, + "learning_rate": 1.660392297300718e-06, + "loss": 0.9473, + "step": 34211 + }, + { + "epoch": 0.88, + "learning_rate": 1.6603715187291586e-06, + "loss": 0.8445, + "step": 34212 + }, + { + "epoch": 0.88, + "learning_rate": 1.6603507396519832e-06, + "loss": 0.8271, + "step": 34213 + }, + { + "epoch": 0.88, + "learning_rate": 1.6603299600692073e-06, + "loss": 1.0713, + "step": 34214 + }, + { + "epoch": 0.88, + "learning_rate": 1.6603091799808474e-06, + "loss": 0.812, + "step": 34215 + }, + { + "epoch": 0.88, + "learning_rate": 1.6602883993869191e-06, + "loss": 0.9717, + "step": 34216 + }, + { + "epoch": 0.88, + "learning_rate": 1.6602676182874382e-06, + "loss": 0.6768, + "step": 34217 + }, + { + "epoch": 0.88, + "learning_rate": 1.6602468366824206e-06, + "loss": 0.8789, + "step": 34218 + }, + { + "epoch": 0.88, + "learning_rate": 1.6602260545718826e-06, + "loss": 0.7695, + "step": 34219 + }, + { + "epoch": 0.88, + "learning_rate": 1.66020527195584e-06, + "loss": 0.8662, + "step": 34220 + }, + { + "epoch": 0.88, + "learning_rate": 1.6601844888343085e-06, + "loss": 1.041, + "step": 34221 + }, + { + "epoch": 0.88, + "learning_rate": 1.6601637052073039e-06, + "loss": 0.6768, + "step": 34222 + }, + { + "epoch": 0.88, + "learning_rate": 1.6601429210748423e-06, + "loss": 0.8164, + "step": 34223 + }, + { + "epoch": 0.88, + "learning_rate": 1.6601221364369399e-06, + "loss": 1.0566, + "step": 34224 + }, + { + "epoch": 0.88, + "learning_rate": 1.660101351293612e-06, + "loss": 0.8799, + "step": 34225 + }, + { + "epoch": 0.88, + "learning_rate": 1.660080565644875e-06, + "loss": 0.6855, + "step": 34226 + }, + { + "epoch": 0.88, + "learning_rate": 1.6600597794907447e-06, + "loss": 0.6545, + "step": 34227 + }, + { + "epoch": 0.88, + "learning_rate": 1.6600389928312368e-06, + "loss": 0.8516, + "step": 34228 + }, + { + "epoch": 0.88, + "learning_rate": 1.6600182056663674e-06, + "loss": 0.8984, + "step": 34229 + }, + { + "epoch": 0.88, + "learning_rate": 1.6599974179961527e-06, + "loss": 0.7134, + "step": 34230 + }, + { + "epoch": 0.88, + "learning_rate": 1.659976629820608e-06, + "loss": 0.8896, + "step": 34231 + }, + { + "epoch": 0.88, + "learning_rate": 1.6599558411397498e-06, + "loss": 0.9707, + "step": 34232 + }, + { + "epoch": 0.88, + "learning_rate": 1.6599350519535937e-06, + "loss": 0.999, + "step": 34233 + }, + { + "epoch": 0.88, + "learning_rate": 1.6599142622621557e-06, + "loss": 0.9072, + "step": 34234 + }, + { + "epoch": 0.88, + "learning_rate": 1.6598934720654513e-06, + "loss": 0.6304, + "step": 34235 + }, + { + "epoch": 0.88, + "learning_rate": 1.6598726813634975e-06, + "loss": 0.7256, + "step": 34236 + }, + { + "epoch": 0.88, + "learning_rate": 1.659851890156309e-06, + "loss": 0.644, + "step": 34237 + }, + { + "epoch": 0.88, + "learning_rate": 1.6598310984439024e-06, + "loss": 0.8848, + "step": 34238 + }, + { + "epoch": 0.88, + "learning_rate": 1.6598103062262934e-06, + "loss": 0.7117, + "step": 34239 + }, + { + "epoch": 0.88, + "learning_rate": 1.6597895135034983e-06, + "loss": 0.8223, + "step": 34240 + }, + { + "epoch": 0.88, + "learning_rate": 1.6597687202755324e-06, + "loss": 1.0859, + "step": 34241 + }, + { + "epoch": 0.88, + "learning_rate": 1.659747926542412e-06, + "loss": 0.7168, + "step": 34242 + }, + { + "epoch": 0.88, + "learning_rate": 1.6597271323041531e-06, + "loss": 0.8896, + "step": 34243 + }, + { + "epoch": 0.88, + "learning_rate": 1.6597063375607712e-06, + "loss": 0.6392, + "step": 34244 + }, + { + "epoch": 0.88, + "learning_rate": 1.6596855423122827e-06, + "loss": 0.8359, + "step": 34245 + }, + { + "epoch": 0.88, + "learning_rate": 1.6596647465587031e-06, + "loss": 0.8867, + "step": 34246 + }, + { + "epoch": 0.88, + "learning_rate": 1.6596439503000489e-06, + "loss": 0.7271, + "step": 34247 + }, + { + "epoch": 0.88, + "learning_rate": 1.659623153536335e-06, + "loss": 0.8613, + "step": 34248 + }, + { + "epoch": 0.88, + "learning_rate": 1.6596023562675786e-06, + "loss": 0.8936, + "step": 34249 + }, + { + "epoch": 0.88, + "learning_rate": 1.659581558493795e-06, + "loss": 0.5469, + "step": 34250 + }, + { + "epoch": 0.88, + "learning_rate": 1.6595607602149997e-06, + "loss": 0.9058, + "step": 34251 + }, + { + "epoch": 0.88, + "learning_rate": 1.6595399614312094e-06, + "loss": 0.9668, + "step": 34252 + }, + { + "epoch": 0.88, + "learning_rate": 1.6595191621424394e-06, + "loss": 0.8662, + "step": 34253 + }, + { + "epoch": 0.88, + "learning_rate": 1.6594983623487063e-06, + "loss": 0.9834, + "step": 34254 + }, + { + "epoch": 0.88, + "learning_rate": 1.659477562050025e-06, + "loss": 0.9697, + "step": 34255 + }, + { + "epoch": 0.88, + "learning_rate": 1.6594567612464128e-06, + "loss": 0.7827, + "step": 34256 + }, + { + "epoch": 0.88, + "learning_rate": 1.6594359599378845e-06, + "loss": 0.8025, + "step": 34257 + }, + { + "epoch": 0.88, + "learning_rate": 1.6594151581244561e-06, + "loss": 0.7976, + "step": 34258 + }, + { + "epoch": 0.88, + "learning_rate": 1.6593943558061442e-06, + "loss": 0.6943, + "step": 34259 + }, + { + "epoch": 0.88, + "learning_rate": 1.6593735529829645e-06, + "loss": 0.8633, + "step": 34260 + }, + { + "epoch": 0.88, + "learning_rate": 1.6593527496549328e-06, + "loss": 0.9775, + "step": 34261 + }, + { + "epoch": 0.88, + "learning_rate": 1.6593319458220648e-06, + "loss": 0.9199, + "step": 34262 + }, + { + "epoch": 0.88, + "learning_rate": 1.6593111414843769e-06, + "loss": 1.0557, + "step": 34263 + }, + { + "epoch": 0.88, + "learning_rate": 1.6592903366418841e-06, + "loss": 0.9131, + "step": 34264 + }, + { + "epoch": 0.88, + "learning_rate": 1.6592695312946034e-06, + "loss": 1.0869, + "step": 34265 + }, + { + "epoch": 0.88, + "learning_rate": 1.6592487254425508e-06, + "loss": 1.0879, + "step": 34266 + }, + { + "epoch": 0.88, + "learning_rate": 1.6592279190857412e-06, + "loss": 0.563, + "step": 34267 + }, + { + "epoch": 0.88, + "learning_rate": 1.6592071122241913e-06, + "loss": 0.6777, + "step": 34268 + }, + { + "epoch": 0.88, + "learning_rate": 1.6591863048579167e-06, + "loss": 0.8291, + "step": 34269 + }, + { + "epoch": 0.88, + "learning_rate": 1.6591654969869335e-06, + "loss": 0.8408, + "step": 34270 + }, + { + "epoch": 0.88, + "learning_rate": 1.6591446886112578e-06, + "loss": 0.9014, + "step": 34271 + }, + { + "epoch": 0.88, + "learning_rate": 1.659123879730905e-06, + "loss": 0.9023, + "step": 34272 + }, + { + "epoch": 0.88, + "learning_rate": 1.6591030703458917e-06, + "loss": 0.7671, + "step": 34273 + }, + { + "epoch": 0.88, + "learning_rate": 1.659082260456233e-06, + "loss": 0.7471, + "step": 34274 + }, + { + "epoch": 0.88, + "learning_rate": 1.6590614500619457e-06, + "loss": 0.9492, + "step": 34275 + }, + { + "epoch": 0.88, + "learning_rate": 1.6590406391630454e-06, + "loss": 0.916, + "step": 34276 + }, + { + "epoch": 0.88, + "learning_rate": 1.6590198277595477e-06, + "loss": 0.6265, + "step": 34277 + }, + { + "epoch": 0.88, + "learning_rate": 1.6589990158514691e-06, + "loss": 0.9111, + "step": 34278 + }, + { + "epoch": 0.88, + "learning_rate": 1.658978203438825e-06, + "loss": 0.834, + "step": 34279 + }, + { + "epoch": 0.88, + "learning_rate": 1.6589573905216318e-06, + "loss": 0.7124, + "step": 34280 + }, + { + "epoch": 0.88, + "learning_rate": 1.6589365770999053e-06, + "loss": 0.8428, + "step": 34281 + }, + { + "epoch": 0.88, + "learning_rate": 1.658915763173661e-06, + "loss": 1.0938, + "step": 34282 + }, + { + "epoch": 0.88, + "learning_rate": 1.6588949487429154e-06, + "loss": 0.7793, + "step": 34283 + }, + { + "epoch": 0.88, + "learning_rate": 1.6588741338076844e-06, + "loss": 0.9062, + "step": 34284 + }, + { + "epoch": 0.88, + "learning_rate": 1.6588533183679833e-06, + "loss": 0.6089, + "step": 34285 + }, + { + "epoch": 0.88, + "learning_rate": 1.658832502423829e-06, + "loss": 0.8838, + "step": 34286 + }, + { + "epoch": 0.88, + "learning_rate": 1.6588116859752367e-06, + "loss": 0.9971, + "step": 34287 + }, + { + "epoch": 0.88, + "learning_rate": 1.6587908690222227e-06, + "loss": 0.8369, + "step": 34288 + }, + { + "epoch": 0.88, + "learning_rate": 1.6587700515648026e-06, + "loss": 0.9004, + "step": 34289 + }, + { + "epoch": 0.88, + "learning_rate": 1.6587492336029927e-06, + "loss": 0.8691, + "step": 34290 + }, + { + "epoch": 0.88, + "learning_rate": 1.6587284151368093e-06, + "loss": 0.7393, + "step": 34291 + }, + { + "epoch": 0.88, + "learning_rate": 1.6587075961662672e-06, + "loss": 0.7861, + "step": 34292 + }, + { + "epoch": 0.88, + "learning_rate": 1.658686776691383e-06, + "loss": 0.6919, + "step": 34293 + }, + { + "epoch": 0.88, + "learning_rate": 1.6586659567121729e-06, + "loss": 0.5806, + "step": 34294 + }, + { + "epoch": 0.88, + "learning_rate": 1.6586451362286522e-06, + "loss": 0.7402, + "step": 34295 + }, + { + "epoch": 0.88, + "learning_rate": 1.6586243152408376e-06, + "loss": 0.7285, + "step": 34296 + }, + { + "epoch": 0.88, + "learning_rate": 1.6586034937487445e-06, + "loss": 0.6689, + "step": 34297 + }, + { + "epoch": 0.88, + "learning_rate": 1.658582671752389e-06, + "loss": 0.8877, + "step": 34298 + }, + { + "epoch": 0.88, + "learning_rate": 1.6585618492517868e-06, + "loss": 0.7812, + "step": 34299 + }, + { + "epoch": 0.88, + "learning_rate": 1.6585410262469544e-06, + "loss": 0.9775, + "step": 34300 + }, + { + "epoch": 0.88, + "learning_rate": 1.6585202027379075e-06, + "loss": 0.7954, + "step": 34301 + }, + { + "epoch": 0.88, + "learning_rate": 1.6584993787246616e-06, + "loss": 0.876, + "step": 34302 + }, + { + "epoch": 0.88, + "learning_rate": 1.658478554207233e-06, + "loss": 0.8027, + "step": 34303 + }, + { + "epoch": 0.88, + "learning_rate": 1.6584577291856378e-06, + "loss": 0.6594, + "step": 34304 + }, + { + "epoch": 0.88, + "learning_rate": 1.658436903659892e-06, + "loss": 0.8154, + "step": 34305 + }, + { + "epoch": 0.88, + "learning_rate": 1.658416077630011e-06, + "loss": 0.7168, + "step": 34306 + }, + { + "epoch": 0.88, + "learning_rate": 1.6583952510960115e-06, + "loss": 0.959, + "step": 34307 + }, + { + "epoch": 0.88, + "learning_rate": 1.6583744240579085e-06, + "loss": 1.1162, + "step": 34308 + }, + { + "epoch": 0.88, + "learning_rate": 1.6583535965157189e-06, + "loss": 0.7617, + "step": 34309 + }, + { + "epoch": 0.88, + "learning_rate": 1.658332768469458e-06, + "loss": 1.0615, + "step": 34310 + }, + { + "epoch": 0.88, + "learning_rate": 1.6583119399191422e-06, + "loss": 0.8247, + "step": 34311 + }, + { + "epoch": 0.88, + "learning_rate": 1.658291110864787e-06, + "loss": 0.7583, + "step": 34312 + }, + { + "epoch": 0.88, + "learning_rate": 1.6582702813064086e-06, + "loss": 0.7163, + "step": 34313 + }, + { + "epoch": 0.88, + "learning_rate": 1.6582494512440228e-06, + "loss": 0.9092, + "step": 34314 + }, + { + "epoch": 0.88, + "learning_rate": 1.658228620677646e-06, + "loss": 0.6323, + "step": 34315 + }, + { + "epoch": 0.88, + "learning_rate": 1.6582077896072935e-06, + "loss": 1.04, + "step": 34316 + }, + { + "epoch": 0.88, + "learning_rate": 1.6581869580329815e-06, + "loss": 0.7715, + "step": 34317 + }, + { + "epoch": 0.88, + "learning_rate": 1.658166125954726e-06, + "loss": 0.9639, + "step": 34318 + }, + { + "epoch": 0.88, + "learning_rate": 1.6581452933725434e-06, + "loss": 0.7559, + "step": 34319 + }, + { + "epoch": 0.88, + "learning_rate": 1.6581244602864488e-06, + "loss": 0.897, + "step": 34320 + }, + { + "epoch": 0.88, + "learning_rate": 1.6581036266964587e-06, + "loss": 0.9775, + "step": 34321 + }, + { + "epoch": 0.88, + "learning_rate": 1.658082792602589e-06, + "loss": 1.0732, + "step": 34322 + }, + { + "epoch": 0.88, + "learning_rate": 1.6580619580048555e-06, + "loss": 0.8604, + "step": 34323 + }, + { + "epoch": 0.88, + "learning_rate": 1.6580411229032742e-06, + "loss": 0.9775, + "step": 34324 + }, + { + "epoch": 0.88, + "learning_rate": 1.658020287297861e-06, + "loss": 0.6465, + "step": 34325 + }, + { + "epoch": 0.88, + "learning_rate": 1.6579994511886322e-06, + "loss": 0.6143, + "step": 34326 + }, + { + "epoch": 0.88, + "learning_rate": 1.6579786145756031e-06, + "loss": 0.9512, + "step": 34327 + }, + { + "epoch": 0.88, + "learning_rate": 1.6579577774587902e-06, + "loss": 0.874, + "step": 34328 + }, + { + "epoch": 0.88, + "learning_rate": 1.6579369398382093e-06, + "loss": 0.8149, + "step": 34329 + }, + { + "epoch": 0.88, + "learning_rate": 1.6579161017138763e-06, + "loss": 0.875, + "step": 34330 + }, + { + "epoch": 0.88, + "learning_rate": 1.6578952630858073e-06, + "loss": 0.8691, + "step": 34331 + }, + { + "epoch": 0.88, + "learning_rate": 1.6578744239540182e-06, + "loss": 0.873, + "step": 34332 + }, + { + "epoch": 0.88, + "learning_rate": 1.6578535843185246e-06, + "loss": 0.8457, + "step": 34333 + }, + { + "epoch": 0.88, + "learning_rate": 1.657832744179343e-06, + "loss": 0.8789, + "step": 34334 + }, + { + "epoch": 0.88, + "learning_rate": 1.6578119035364888e-06, + "loss": 0.7139, + "step": 34335 + }, + { + "epoch": 0.88, + "learning_rate": 1.6577910623899789e-06, + "loss": 0.7905, + "step": 34336 + }, + { + "epoch": 0.88, + "learning_rate": 1.657770220739828e-06, + "loss": 0.7285, + "step": 34337 + }, + { + "epoch": 0.88, + "learning_rate": 1.657749378586053e-06, + "loss": 0.6013, + "step": 34338 + }, + { + "epoch": 0.88, + "learning_rate": 1.6577285359286694e-06, + "loss": 0.7295, + "step": 34339 + }, + { + "epoch": 0.88, + "learning_rate": 1.6577076927676935e-06, + "loss": 0.75, + "step": 34340 + }, + { + "epoch": 0.88, + "learning_rate": 1.657686849103141e-06, + "loss": 0.9336, + "step": 34341 + }, + { + "epoch": 0.88, + "learning_rate": 1.6576660049350278e-06, + "loss": 0.6709, + "step": 34342 + }, + { + "epoch": 0.88, + "learning_rate": 1.65764516026337e-06, + "loss": 0.7434, + "step": 34343 + }, + { + "epoch": 0.88, + "learning_rate": 1.6576243150881834e-06, + "loss": 0.7891, + "step": 34344 + }, + { + "epoch": 0.88, + "learning_rate": 1.6576034694094845e-06, + "loss": 0.7178, + "step": 34345 + }, + { + "epoch": 0.88, + "learning_rate": 1.6575826232272886e-06, + "loss": 0.603, + "step": 34346 + }, + { + "epoch": 0.88, + "learning_rate": 1.6575617765416122e-06, + "loss": 0.8242, + "step": 34347 + }, + { + "epoch": 0.88, + "learning_rate": 1.6575409293524705e-06, + "loss": 0.9355, + "step": 34348 + }, + { + "epoch": 0.88, + "learning_rate": 1.65752008165988e-06, + "loss": 0.8457, + "step": 34349 + }, + { + "epoch": 0.88, + "learning_rate": 1.657499233463857e-06, + "loss": 0.8154, + "step": 34350 + }, + { + "epoch": 0.88, + "learning_rate": 1.657478384764417e-06, + "loss": 0.7456, + "step": 34351 + }, + { + "epoch": 0.88, + "learning_rate": 1.6574575355615759e-06, + "loss": 0.9551, + "step": 34352 + }, + { + "epoch": 0.88, + "learning_rate": 1.6574366858553497e-06, + "loss": 0.7524, + "step": 34353 + }, + { + "epoch": 0.88, + "learning_rate": 1.6574158356457546e-06, + "loss": 0.9453, + "step": 34354 + }, + { + "epoch": 0.88, + "learning_rate": 1.6573949849328065e-06, + "loss": 0.6885, + "step": 34355 + }, + { + "epoch": 0.88, + "learning_rate": 1.657374133716521e-06, + "loss": 0.9727, + "step": 34356 + }, + { + "epoch": 0.88, + "learning_rate": 1.6573532819969144e-06, + "loss": 0.8408, + "step": 34357 + }, + { + "epoch": 0.88, + "learning_rate": 1.6573324297740028e-06, + "loss": 0.9492, + "step": 34358 + }, + { + "epoch": 0.88, + "learning_rate": 1.6573115770478018e-06, + "loss": 0.8604, + "step": 34359 + }, + { + "epoch": 0.88, + "learning_rate": 1.6572907238183278e-06, + "loss": 0.7578, + "step": 34360 + }, + { + "epoch": 0.88, + "learning_rate": 1.6572698700855962e-06, + "loss": 0.7783, + "step": 34361 + }, + { + "epoch": 0.88, + "learning_rate": 1.6572490158496234e-06, + "loss": 0.6738, + "step": 34362 + }, + { + "epoch": 0.88, + "learning_rate": 1.6572281611104255e-06, + "loss": 0.9385, + "step": 34363 + }, + { + "epoch": 0.88, + "learning_rate": 1.657207305868018e-06, + "loss": 0.8252, + "step": 34364 + }, + { + "epoch": 0.88, + "learning_rate": 1.6571864501224174e-06, + "loss": 0.8149, + "step": 34365 + }, + { + "epoch": 0.88, + "learning_rate": 1.6571655938736391e-06, + "loss": 0.8506, + "step": 34366 + }, + { + "epoch": 0.88, + "learning_rate": 1.657144737121699e-06, + "loss": 1.0176, + "step": 34367 + }, + { + "epoch": 0.88, + "learning_rate": 1.6571238798666137e-06, + "loss": 0.7217, + "step": 34368 + }, + { + "epoch": 0.88, + "learning_rate": 1.6571030221083988e-06, + "loss": 0.7095, + "step": 34369 + }, + { + "epoch": 0.88, + "learning_rate": 1.6570821638470704e-06, + "loss": 0.9229, + "step": 34370 + }, + { + "epoch": 0.88, + "learning_rate": 1.6570613050826445e-06, + "loss": 0.8945, + "step": 34371 + }, + { + "epoch": 0.88, + "learning_rate": 1.6570404458151367e-06, + "loss": 0.7842, + "step": 34372 + }, + { + "epoch": 0.88, + "learning_rate": 1.6570195860445635e-06, + "loss": 0.5664, + "step": 34373 + }, + { + "epoch": 0.88, + "learning_rate": 1.6569987257709403e-06, + "loss": 0.873, + "step": 34374 + }, + { + "epoch": 0.88, + "learning_rate": 1.6569778649942836e-06, + "loss": 0.8633, + "step": 34375 + }, + { + "epoch": 0.88, + "learning_rate": 1.6569570037146095e-06, + "loss": 0.7402, + "step": 34376 + }, + { + "epoch": 0.88, + "learning_rate": 1.6569361419319333e-06, + "loss": 0.5537, + "step": 34377 + }, + { + "epoch": 0.88, + "learning_rate": 1.6569152796462711e-06, + "loss": 0.9297, + "step": 34378 + }, + { + "epoch": 0.88, + "learning_rate": 1.6568944168576393e-06, + "loss": 0.8613, + "step": 34379 + }, + { + "epoch": 0.88, + "learning_rate": 1.6568735535660533e-06, + "loss": 0.9268, + "step": 34380 + }, + { + "epoch": 0.88, + "learning_rate": 1.6568526897715303e-06, + "loss": 0.6685, + "step": 34381 + }, + { + "epoch": 0.88, + "learning_rate": 1.6568318254740844e-06, + "loss": 0.7773, + "step": 34382 + }, + { + "epoch": 0.88, + "learning_rate": 1.656810960673733e-06, + "loss": 0.9326, + "step": 34383 + }, + { + "epoch": 0.88, + "learning_rate": 1.656790095370492e-06, + "loss": 0.8633, + "step": 34384 + }, + { + "epoch": 0.88, + "learning_rate": 1.6567692295643764e-06, + "loss": 0.79, + "step": 34385 + }, + { + "epoch": 0.88, + "learning_rate": 1.656748363255403e-06, + "loss": 0.7639, + "step": 34386 + }, + { + "epoch": 0.88, + "learning_rate": 1.6567274964435877e-06, + "loss": 0.9062, + "step": 34387 + }, + { + "epoch": 0.88, + "learning_rate": 1.6567066291289463e-06, + "loss": 0.8545, + "step": 34388 + }, + { + "epoch": 0.88, + "learning_rate": 1.6566857613114947e-06, + "loss": 0.7612, + "step": 34389 + }, + { + "epoch": 0.88, + "learning_rate": 1.6566648929912493e-06, + "loss": 0.7451, + "step": 34390 + }, + { + "epoch": 0.88, + "learning_rate": 1.6566440241682256e-06, + "loss": 0.8779, + "step": 34391 + }, + { + "epoch": 0.88, + "learning_rate": 1.6566231548424398e-06, + "loss": 0.8506, + "step": 34392 + }, + { + "epoch": 0.88, + "learning_rate": 1.656602285013908e-06, + "loss": 0.9434, + "step": 34393 + }, + { + "epoch": 0.88, + "learning_rate": 1.6565814146826455e-06, + "loss": 0.709, + "step": 34394 + }, + { + "epoch": 0.88, + "learning_rate": 1.6565605438486695e-06, + "loss": 0.7773, + "step": 34395 + }, + { + "epoch": 0.88, + "learning_rate": 1.6565396725119948e-06, + "loss": 0.8291, + "step": 34396 + }, + { + "epoch": 0.88, + "learning_rate": 1.6565188006726381e-06, + "loss": 1.0176, + "step": 34397 + }, + { + "epoch": 0.88, + "learning_rate": 1.6564979283306148e-06, + "loss": 0.8633, + "step": 34398 + }, + { + "epoch": 0.88, + "learning_rate": 1.6564770554859418e-06, + "loss": 0.7114, + "step": 34399 + }, + { + "epoch": 0.88, + "learning_rate": 1.656456182138634e-06, + "loss": 0.8037, + "step": 34400 + }, + { + "epoch": 0.88, + "learning_rate": 1.6564353082887081e-06, + "loss": 0.8174, + "step": 34401 + }, + { + "epoch": 0.88, + "learning_rate": 1.6564144339361799e-06, + "loss": 0.874, + "step": 34402 + }, + { + "epoch": 0.88, + "learning_rate": 1.6563935590810653e-06, + "loss": 0.8428, + "step": 34403 + }, + { + "epoch": 0.88, + "learning_rate": 1.6563726837233802e-06, + "loss": 0.9717, + "step": 34404 + }, + { + "epoch": 0.88, + "learning_rate": 1.6563518078631407e-06, + "loss": 1.0225, + "step": 34405 + }, + { + "epoch": 0.88, + "learning_rate": 1.6563309315003631e-06, + "loss": 0.876, + "step": 34406 + }, + { + "epoch": 0.88, + "learning_rate": 1.6563100546350627e-06, + "loss": 0.6743, + "step": 34407 + }, + { + "epoch": 0.88, + "learning_rate": 1.656289177267256e-06, + "loss": 0.8691, + "step": 34408 + }, + { + "epoch": 0.88, + "learning_rate": 1.656268299396959e-06, + "loss": 0.8047, + "step": 34409 + }, + { + "epoch": 0.88, + "learning_rate": 1.6562474210241878e-06, + "loss": 0.8496, + "step": 34410 + }, + { + "epoch": 0.88, + "learning_rate": 1.6562265421489576e-06, + "loss": 0.7964, + "step": 34411 + }, + { + "epoch": 0.88, + "learning_rate": 1.6562056627712852e-06, + "loss": 0.875, + "step": 34412 + }, + { + "epoch": 0.88, + "learning_rate": 1.6561847828911862e-06, + "loss": 0.8311, + "step": 34413 + }, + { + "epoch": 0.88, + "learning_rate": 1.6561639025086764e-06, + "loss": 0.7568, + "step": 34414 + }, + { + "epoch": 0.88, + "learning_rate": 1.6561430216237726e-06, + "loss": 0.6426, + "step": 34415 + }, + { + "epoch": 0.88, + "learning_rate": 1.65612214023649e-06, + "loss": 0.9707, + "step": 34416 + }, + { + "epoch": 0.88, + "learning_rate": 1.6561012583468448e-06, + "loss": 0.6792, + "step": 34417 + }, + { + "epoch": 0.88, + "learning_rate": 1.6560803759548532e-06, + "loss": 0.9678, + "step": 34418 + }, + { + "epoch": 0.88, + "learning_rate": 1.656059493060531e-06, + "loss": 0.8555, + "step": 34419 + }, + { + "epoch": 0.88, + "learning_rate": 1.6560386096638941e-06, + "loss": 0.7686, + "step": 34420 + }, + { + "epoch": 0.88, + "learning_rate": 1.6560177257649586e-06, + "loss": 0.6611, + "step": 34421 + }, + { + "epoch": 0.88, + "learning_rate": 1.6559968413637405e-06, + "loss": 0.7783, + "step": 34422 + }, + { + "epoch": 0.88, + "learning_rate": 1.6559759564602558e-06, + "loss": 0.8052, + "step": 34423 + }, + { + "epoch": 0.88, + "learning_rate": 1.6559550710545204e-06, + "loss": 0.9814, + "step": 34424 + }, + { + "epoch": 0.88, + "learning_rate": 1.6559341851465504e-06, + "loss": 0.8789, + "step": 34425 + }, + { + "epoch": 0.88, + "learning_rate": 1.6559132987363618e-06, + "loss": 0.9385, + "step": 34426 + }, + { + "epoch": 0.88, + "learning_rate": 1.6558924118239706e-06, + "loss": 0.9199, + "step": 34427 + }, + { + "epoch": 0.88, + "learning_rate": 1.6558715244093928e-06, + "loss": 0.7402, + "step": 34428 + }, + { + "epoch": 0.88, + "learning_rate": 1.655850636492644e-06, + "loss": 0.9121, + "step": 34429 + }, + { + "epoch": 0.88, + "learning_rate": 1.6558297480737408e-06, + "loss": 0.7715, + "step": 34430 + }, + { + "epoch": 0.88, + "learning_rate": 1.655808859152699e-06, + "loss": 1.0635, + "step": 34431 + }, + { + "epoch": 0.88, + "learning_rate": 1.6557879697295342e-06, + "loss": 0.8486, + "step": 34432 + }, + { + "epoch": 0.88, + "learning_rate": 1.655767079804263e-06, + "loss": 0.7126, + "step": 34433 + }, + { + "epoch": 0.88, + "learning_rate": 1.655746189376901e-06, + "loss": 0.6156, + "step": 34434 + }, + { + "epoch": 0.88, + "learning_rate": 1.6557252984474644e-06, + "loss": 0.8584, + "step": 34435 + }, + { + "epoch": 0.88, + "learning_rate": 1.655704407015969e-06, + "loss": 0.7073, + "step": 34436 + }, + { + "epoch": 0.88, + "learning_rate": 1.6556835150824306e-06, + "loss": 0.9824, + "step": 34437 + }, + { + "epoch": 0.88, + "learning_rate": 1.6556626226468657e-06, + "loss": 0.583, + "step": 34438 + }, + { + "epoch": 0.88, + "learning_rate": 1.65564172970929e-06, + "loss": 0.7046, + "step": 34439 + }, + { + "epoch": 0.88, + "learning_rate": 1.65562083626972e-06, + "loss": 0.8652, + "step": 34440 + }, + { + "epoch": 0.88, + "learning_rate": 1.655599942328171e-06, + "loss": 0.9053, + "step": 34441 + }, + { + "epoch": 0.88, + "learning_rate": 1.6555790478846592e-06, + "loss": 0.8408, + "step": 34442 + }, + { + "epoch": 0.88, + "learning_rate": 1.6555581529392004e-06, + "loss": 0.9033, + "step": 34443 + }, + { + "epoch": 0.88, + "learning_rate": 1.6555372574918113e-06, + "loss": 0.833, + "step": 34444 + }, + { + "epoch": 0.88, + "learning_rate": 1.6555163615425075e-06, + "loss": 0.9697, + "step": 34445 + }, + { + "epoch": 0.88, + "learning_rate": 1.6554954650913047e-06, + "loss": 0.8857, + "step": 34446 + }, + { + "epoch": 0.88, + "learning_rate": 1.6554745681382192e-06, + "loss": 0.8018, + "step": 34447 + }, + { + "epoch": 0.88, + "learning_rate": 1.6554536706832671e-06, + "loss": 0.6953, + "step": 34448 + }, + { + "epoch": 0.88, + "learning_rate": 1.655432772726464e-06, + "loss": 0.8008, + "step": 34449 + }, + { + "epoch": 0.88, + "learning_rate": 1.6554118742678265e-06, + "loss": 0.8838, + "step": 34450 + }, + { + "epoch": 0.88, + "learning_rate": 1.65539097530737e-06, + "loss": 0.8467, + "step": 34451 + }, + { + "epoch": 0.88, + "learning_rate": 1.6553700758451109e-06, + "loss": 0.5132, + "step": 34452 + }, + { + "epoch": 0.88, + "learning_rate": 1.6553491758810649e-06, + "loss": 0.7666, + "step": 34453 + }, + { + "epoch": 0.88, + "learning_rate": 1.6553282754152484e-06, + "loss": 0.6992, + "step": 34454 + }, + { + "epoch": 0.88, + "learning_rate": 1.6553073744476772e-06, + "loss": 0.7471, + "step": 34455 + }, + { + "epoch": 0.88, + "learning_rate": 1.655286472978367e-06, + "loss": 0.8159, + "step": 34456 + }, + { + "epoch": 0.88, + "learning_rate": 1.6552655710073342e-06, + "loss": 0.7451, + "step": 34457 + }, + { + "epoch": 0.88, + "learning_rate": 1.655244668534595e-06, + "loss": 0.7764, + "step": 34458 + }, + { + "epoch": 0.88, + "learning_rate": 1.6552237655601645e-06, + "loss": 0.8525, + "step": 34459 + }, + { + "epoch": 0.88, + "learning_rate": 1.6552028620840596e-06, + "loss": 0.4675, + "step": 34460 + }, + { + "epoch": 0.88, + "learning_rate": 1.6551819581062963e-06, + "loss": 0.8809, + "step": 34461 + }, + { + "epoch": 0.88, + "learning_rate": 1.6551610536268896e-06, + "loss": 0.8555, + "step": 34462 + }, + { + "epoch": 0.88, + "learning_rate": 1.6551401486458567e-06, + "loss": 0.8701, + "step": 34463 + }, + { + "epoch": 0.88, + "learning_rate": 1.6551192431632132e-06, + "loss": 0.7832, + "step": 34464 + }, + { + "epoch": 0.88, + "learning_rate": 1.6550983371789747e-06, + "loss": 0.8281, + "step": 34465 + }, + { + "epoch": 0.88, + "learning_rate": 1.6550774306931577e-06, + "loss": 0.8525, + "step": 34466 + }, + { + "epoch": 0.88, + "learning_rate": 1.655056523705778e-06, + "loss": 0.7852, + "step": 34467 + }, + { + "epoch": 0.88, + "learning_rate": 1.6550356162168515e-06, + "loss": 1.082, + "step": 34468 + }, + { + "epoch": 0.88, + "learning_rate": 1.6550147082263944e-06, + "loss": 0.9902, + "step": 34469 + }, + { + "epoch": 0.88, + "learning_rate": 1.6549937997344228e-06, + "loss": 0.7646, + "step": 34470 + }, + { + "epoch": 0.88, + "learning_rate": 1.6549728907409524e-06, + "loss": 0.7188, + "step": 34471 + }, + { + "epoch": 0.88, + "learning_rate": 1.6549519812459996e-06, + "loss": 0.8945, + "step": 34472 + }, + { + "epoch": 0.88, + "learning_rate": 1.65493107124958e-06, + "loss": 0.4934, + "step": 34473 + }, + { + "epoch": 0.88, + "learning_rate": 1.6549101607517098e-06, + "loss": 0.772, + "step": 34474 + }, + { + "epoch": 0.88, + "learning_rate": 1.6548892497524053e-06, + "loss": 0.9111, + "step": 34475 + }, + { + "epoch": 0.88, + "learning_rate": 1.6548683382516816e-06, + "loss": 0.71, + "step": 34476 + }, + { + "epoch": 0.88, + "learning_rate": 1.6548474262495557e-06, + "loss": 0.7188, + "step": 34477 + }, + { + "epoch": 0.88, + "learning_rate": 1.6548265137460433e-06, + "loss": 0.7783, + "step": 34478 + }, + { + "epoch": 0.88, + "learning_rate": 1.6548056007411604e-06, + "loss": 0.7468, + "step": 34479 + }, + { + "epoch": 0.88, + "learning_rate": 1.654784687234923e-06, + "loss": 0.958, + "step": 34480 + }, + { + "epoch": 0.88, + "learning_rate": 1.6547637732273468e-06, + "loss": 0.918, + "step": 34481 + }, + { + "epoch": 0.88, + "learning_rate": 1.6547428587184479e-06, + "loss": 0.6821, + "step": 34482 + }, + { + "epoch": 0.88, + "learning_rate": 1.6547219437082429e-06, + "loss": 0.8057, + "step": 34483 + }, + { + "epoch": 0.88, + "learning_rate": 1.6547010281967473e-06, + "loss": 0.5962, + "step": 34484 + }, + { + "epoch": 0.88, + "learning_rate": 1.6546801121839773e-06, + "loss": 0.875, + "step": 34485 + }, + { + "epoch": 0.88, + "learning_rate": 1.6546591956699488e-06, + "loss": 0.7244, + "step": 34486 + }, + { + "epoch": 0.88, + "learning_rate": 1.6546382786546779e-06, + "loss": 0.8926, + "step": 34487 + }, + { + "epoch": 0.88, + "learning_rate": 1.6546173611381803e-06, + "loss": 1.0742, + "step": 34488 + }, + { + "epoch": 0.88, + "learning_rate": 1.6545964431204724e-06, + "loss": 0.7451, + "step": 34489 + }, + { + "epoch": 0.88, + "learning_rate": 1.6545755246015704e-06, + "loss": 1.0068, + "step": 34490 + }, + { + "epoch": 0.88, + "learning_rate": 1.6545546055814898e-06, + "loss": 1.1768, + "step": 34491 + }, + { + "epoch": 0.88, + "learning_rate": 1.6545336860602467e-06, + "loss": 0.729, + "step": 34492 + }, + { + "epoch": 0.88, + "learning_rate": 1.6545127660378574e-06, + "loss": 0.7874, + "step": 34493 + }, + { + "epoch": 0.88, + "learning_rate": 1.6544918455143376e-06, + "loss": 0.7021, + "step": 34494 + }, + { + "epoch": 0.88, + "learning_rate": 1.6544709244897036e-06, + "loss": 0.8896, + "step": 34495 + }, + { + "epoch": 0.88, + "learning_rate": 1.6544500029639717e-06, + "loss": 0.7539, + "step": 34496 + }, + { + "epoch": 0.88, + "learning_rate": 1.654429080937157e-06, + "loss": 0.8643, + "step": 34497 + }, + { + "epoch": 0.88, + "learning_rate": 1.6544081584092763e-06, + "loss": 1.0723, + "step": 34498 + }, + { + "epoch": 0.88, + "learning_rate": 1.6543872353803453e-06, + "loss": 0.666, + "step": 34499 + }, + { + "epoch": 0.88, + "learning_rate": 1.65436631185038e-06, + "loss": 0.7461, + "step": 34500 + }, + { + "epoch": 0.88, + "learning_rate": 1.6543453878193968e-06, + "loss": 0.9912, + "step": 34501 + }, + { + "epoch": 0.88, + "learning_rate": 1.6543244632874109e-06, + "loss": 0.9854, + "step": 34502 + }, + { + "epoch": 0.88, + "learning_rate": 1.6543035382544393e-06, + "loss": 1.123, + "step": 34503 + }, + { + "epoch": 0.88, + "learning_rate": 1.6542826127204972e-06, + "loss": 0.9912, + "step": 34504 + }, + { + "epoch": 0.88, + "learning_rate": 1.6542616866856017e-06, + "loss": 1.0908, + "step": 34505 + }, + { + "epoch": 0.88, + "learning_rate": 1.6542407601497673e-06, + "loss": 0.8252, + "step": 34506 + }, + { + "epoch": 0.88, + "learning_rate": 1.6542198331130114e-06, + "loss": 0.8906, + "step": 34507 + }, + { + "epoch": 0.88, + "learning_rate": 1.654198905575349e-06, + "loss": 0.6123, + "step": 34508 + }, + { + "epoch": 0.88, + "learning_rate": 1.6541779775367966e-06, + "loss": 0.6273, + "step": 34509 + }, + { + "epoch": 0.88, + "learning_rate": 1.6541570489973707e-06, + "loss": 0.6318, + "step": 34510 + }, + { + "epoch": 0.88, + "learning_rate": 1.6541361199570863e-06, + "loss": 0.9326, + "step": 34511 + }, + { + "epoch": 0.88, + "learning_rate": 1.6541151904159603e-06, + "loss": 0.7979, + "step": 34512 + }, + { + "epoch": 0.88, + "learning_rate": 1.6540942603740081e-06, + "loss": 0.9043, + "step": 34513 + }, + { + "epoch": 0.88, + "learning_rate": 1.654073329831246e-06, + "loss": 0.6992, + "step": 34514 + }, + { + "epoch": 0.88, + "learning_rate": 1.6540523987876903e-06, + "loss": 0.8389, + "step": 34515 + }, + { + "epoch": 0.88, + "learning_rate": 1.6540314672433567e-06, + "loss": 0.7461, + "step": 34516 + }, + { + "epoch": 0.88, + "learning_rate": 1.6540105351982611e-06, + "loss": 0.8623, + "step": 34517 + }, + { + "epoch": 0.88, + "learning_rate": 1.6539896026524199e-06, + "loss": 0.6924, + "step": 34518 + }, + { + "epoch": 0.88, + "learning_rate": 1.6539686696058487e-06, + "loss": 0.5852, + "step": 34519 + }, + { + "epoch": 0.88, + "learning_rate": 1.6539477360585638e-06, + "loss": 0.666, + "step": 34520 + }, + { + "epoch": 0.88, + "learning_rate": 1.6539268020105815e-06, + "loss": 0.448, + "step": 34521 + }, + { + "epoch": 0.88, + "learning_rate": 1.6539058674619173e-06, + "loss": 0.8574, + "step": 34522 + }, + { + "epoch": 0.88, + "learning_rate": 1.6538849324125871e-06, + "loss": 0.8755, + "step": 34523 + }, + { + "epoch": 0.88, + "learning_rate": 1.6538639968626078e-06, + "loss": 0.5488, + "step": 34524 + }, + { + "epoch": 0.88, + "learning_rate": 1.6538430608119947e-06, + "loss": 0.6567, + "step": 34525 + }, + { + "epoch": 0.88, + "learning_rate": 1.6538221242607641e-06, + "loss": 0.7383, + "step": 34526 + }, + { + "epoch": 0.88, + "learning_rate": 1.6538011872089318e-06, + "loss": 0.9766, + "step": 34527 + }, + { + "epoch": 0.88, + "learning_rate": 1.6537802496565143e-06, + "loss": 0.772, + "step": 34528 + }, + { + "epoch": 0.88, + "learning_rate": 1.653759311603527e-06, + "loss": 0.9727, + "step": 34529 + }, + { + "epoch": 0.89, + "learning_rate": 1.6537383730499865e-06, + "loss": 0.7969, + "step": 34530 + }, + { + "epoch": 0.89, + "learning_rate": 1.6537174339959083e-06, + "loss": 0.668, + "step": 34531 + }, + { + "epoch": 0.89, + "learning_rate": 1.653696494441309e-06, + "loss": 0.9717, + "step": 34532 + }, + { + "epoch": 0.89, + "learning_rate": 1.6536755543862042e-06, + "loss": 1.0986, + "step": 34533 + }, + { + "epoch": 0.89, + "learning_rate": 1.6536546138306102e-06, + "loss": 0.8623, + "step": 34534 + }, + { + "epoch": 0.89, + "learning_rate": 1.6536336727745427e-06, + "loss": 1.0361, + "step": 34535 + }, + { + "epoch": 0.89, + "learning_rate": 1.6536127312180183e-06, + "loss": 1.0195, + "step": 34536 + }, + { + "epoch": 0.89, + "learning_rate": 1.6535917891610524e-06, + "loss": 0.915, + "step": 34537 + }, + { + "epoch": 0.89, + "learning_rate": 1.6535708466036616e-06, + "loss": 0.5605, + "step": 34538 + }, + { + "epoch": 0.89, + "learning_rate": 1.653549903545861e-06, + "loss": 0.873, + "step": 34539 + }, + { + "epoch": 0.89, + "learning_rate": 1.653528959987668e-06, + "loss": 1.001, + "step": 34540 + }, + { + "epoch": 0.89, + "learning_rate": 1.6535080159290974e-06, + "loss": 0.96, + "step": 34541 + }, + { + "epoch": 0.89, + "learning_rate": 1.6534870713701662e-06, + "loss": 0.7395, + "step": 34542 + }, + { + "epoch": 0.89, + "learning_rate": 1.65346612631089e-06, + "loss": 0.8906, + "step": 34543 + }, + { + "epoch": 0.89, + "learning_rate": 1.6534451807512847e-06, + "loss": 0.9404, + "step": 34544 + }, + { + "epoch": 0.89, + "learning_rate": 1.6534242346913664e-06, + "loss": 0.9316, + "step": 34545 + }, + { + "epoch": 0.89, + "learning_rate": 1.6534032881311512e-06, + "loss": 0.8945, + "step": 34546 + }, + { + "epoch": 0.89, + "learning_rate": 1.6533823410706552e-06, + "loss": 0.792, + "step": 34547 + }, + { + "epoch": 0.89, + "learning_rate": 1.6533613935098943e-06, + "loss": 0.9717, + "step": 34548 + }, + { + "epoch": 0.89, + "learning_rate": 1.6533404454488847e-06, + "loss": 1.1738, + "step": 34549 + }, + { + "epoch": 0.89, + "learning_rate": 1.6533194968876426e-06, + "loss": 0.627, + "step": 34550 + }, + { + "epoch": 0.89, + "learning_rate": 1.6532985478261835e-06, + "loss": 0.877, + "step": 34551 + }, + { + "epoch": 0.89, + "learning_rate": 1.6532775982645237e-06, + "loss": 0.7944, + "step": 34552 + }, + { + "epoch": 0.89, + "learning_rate": 1.6532566482026793e-06, + "loss": 0.8188, + "step": 34553 + }, + { + "epoch": 0.89, + "learning_rate": 1.6532356976406664e-06, + "loss": 0.8193, + "step": 34554 + }, + { + "epoch": 0.89, + "learning_rate": 1.653214746578501e-06, + "loss": 0.8057, + "step": 34555 + }, + { + "epoch": 0.89, + "learning_rate": 1.6531937950161992e-06, + "loss": 0.7202, + "step": 34556 + }, + { + "epoch": 0.89, + "learning_rate": 1.6531728429537765e-06, + "loss": 0.8789, + "step": 34557 + }, + { + "epoch": 0.89, + "learning_rate": 1.65315189039125e-06, + "loss": 0.8184, + "step": 34558 + }, + { + "epoch": 0.89, + "learning_rate": 1.6531309373286346e-06, + "loss": 0.8301, + "step": 34559 + }, + { + "epoch": 0.89, + "learning_rate": 1.6531099837659475e-06, + "loss": 0.6694, + "step": 34560 + }, + { + "epoch": 0.89, + "learning_rate": 1.6530890297032034e-06, + "loss": 0.9346, + "step": 34561 + }, + { + "epoch": 0.89, + "learning_rate": 1.6530680751404197e-06, + "loss": 0.8008, + "step": 34562 + }, + { + "epoch": 0.89, + "learning_rate": 1.6530471200776112e-06, + "loss": 0.7192, + "step": 34563 + }, + { + "epoch": 0.89, + "learning_rate": 1.653026164514795e-06, + "loss": 0.7217, + "step": 34564 + }, + { + "epoch": 0.89, + "learning_rate": 1.6530052084519865e-06, + "loss": 0.9604, + "step": 34565 + }, + { + "epoch": 0.89, + "learning_rate": 1.6529842518892019e-06, + "loss": 0.8594, + "step": 34566 + }, + { + "epoch": 0.89, + "learning_rate": 1.6529632948264574e-06, + "loss": 0.9287, + "step": 34567 + }, + { + "epoch": 0.89, + "learning_rate": 1.6529423372637688e-06, + "loss": 0.8828, + "step": 34568 + }, + { + "epoch": 0.89, + "learning_rate": 1.6529213792011524e-06, + "loss": 0.7759, + "step": 34569 + }, + { + "epoch": 0.89, + "learning_rate": 1.652900420638624e-06, + "loss": 0.9307, + "step": 34570 + }, + { + "epoch": 0.89, + "learning_rate": 1.6528794615762e-06, + "loss": 0.6533, + "step": 34571 + }, + { + "epoch": 0.89, + "learning_rate": 1.652858502013896e-06, + "loss": 0.7222, + "step": 34572 + }, + { + "epoch": 0.89, + "learning_rate": 1.6528375419517281e-06, + "loss": 0.7236, + "step": 34573 + }, + { + "epoch": 0.89, + "learning_rate": 1.6528165813897129e-06, + "loss": 0.7783, + "step": 34574 + }, + { + "epoch": 0.89, + "learning_rate": 1.6527956203278662e-06, + "loss": 0.8555, + "step": 34575 + }, + { + "epoch": 0.89, + "learning_rate": 1.6527746587662034e-06, + "loss": 0.7231, + "step": 34576 + }, + { + "epoch": 0.89, + "learning_rate": 1.6527536967047412e-06, + "loss": 0.8577, + "step": 34577 + }, + { + "epoch": 0.89, + "learning_rate": 1.6527327341434957e-06, + "loss": 0.9287, + "step": 34578 + }, + { + "epoch": 0.89, + "learning_rate": 1.6527117710824827e-06, + "loss": 0.8848, + "step": 34579 + }, + { + "epoch": 0.89, + "learning_rate": 1.6526908075217184e-06, + "loss": 1.0254, + "step": 34580 + }, + { + "epoch": 0.89, + "learning_rate": 1.6526698434612186e-06, + "loss": 0.8174, + "step": 34581 + }, + { + "epoch": 0.89, + "learning_rate": 1.6526488789009995e-06, + "loss": 0.8506, + "step": 34582 + }, + { + "epoch": 0.89, + "learning_rate": 1.652627913841077e-06, + "loss": 0.8311, + "step": 34583 + }, + { + "epoch": 0.89, + "learning_rate": 1.6526069482814674e-06, + "loss": 0.6572, + "step": 34584 + }, + { + "epoch": 0.89, + "learning_rate": 1.6525859822221867e-06, + "loss": 0.7617, + "step": 34585 + }, + { + "epoch": 0.89, + "learning_rate": 1.652565015663251e-06, + "loss": 0.6914, + "step": 34586 + }, + { + "epoch": 0.89, + "learning_rate": 1.6525440486046765e-06, + "loss": 0.8213, + "step": 34587 + }, + { + "epoch": 0.89, + "learning_rate": 1.6525230810464789e-06, + "loss": 0.8081, + "step": 34588 + }, + { + "epoch": 0.89, + "learning_rate": 1.6525021129886741e-06, + "loss": 0.9814, + "step": 34589 + }, + { + "epoch": 0.89, + "learning_rate": 1.6524811444312787e-06, + "loss": 0.8535, + "step": 34590 + }, + { + "epoch": 0.89, + "learning_rate": 1.6524601753743084e-06, + "loss": 0.9873, + "step": 34591 + }, + { + "epoch": 0.89, + "learning_rate": 1.6524392058177793e-06, + "loss": 0.5947, + "step": 34592 + }, + { + "epoch": 0.89, + "learning_rate": 1.6524182357617073e-06, + "loss": 0.8271, + "step": 34593 + }, + { + "epoch": 0.89, + "learning_rate": 1.652397265206109e-06, + "loss": 0.8145, + "step": 34594 + }, + { + "epoch": 0.89, + "learning_rate": 1.6523762941510002e-06, + "loss": 0.9336, + "step": 34595 + }, + { + "epoch": 0.89, + "learning_rate": 1.6523553225963967e-06, + "loss": 0.7881, + "step": 34596 + }, + { + "epoch": 0.89, + "learning_rate": 1.6523343505423145e-06, + "loss": 0.7051, + "step": 34597 + }, + { + "epoch": 0.89, + "learning_rate": 1.65231337798877e-06, + "loss": 0.8213, + "step": 34598 + }, + { + "epoch": 0.89, + "learning_rate": 1.6522924049357791e-06, + "loss": 0.9521, + "step": 34599 + }, + { + "epoch": 0.89, + "learning_rate": 1.6522714313833583e-06, + "loss": 0.7861, + "step": 34600 + }, + { + "epoch": 0.89, + "learning_rate": 1.6522504573315228e-06, + "loss": 0.8279, + "step": 34601 + }, + { + "epoch": 0.89, + "learning_rate": 1.6522294827802893e-06, + "loss": 0.9619, + "step": 34602 + }, + { + "epoch": 0.89, + "learning_rate": 1.6522085077296737e-06, + "loss": 0.8848, + "step": 34603 + }, + { + "epoch": 0.89, + "learning_rate": 1.6521875321796918e-06, + "loss": 0.9023, + "step": 34604 + }, + { + "epoch": 0.89, + "learning_rate": 1.6521665561303603e-06, + "loss": 0.4976, + "step": 34605 + }, + { + "epoch": 0.89, + "learning_rate": 1.6521455795816947e-06, + "loss": 0.8848, + "step": 34606 + }, + { + "epoch": 0.89, + "learning_rate": 1.6521246025337111e-06, + "loss": 0.9702, + "step": 34607 + }, + { + "epoch": 0.89, + "learning_rate": 1.652103624986426e-06, + "loss": 0.6973, + "step": 34608 + }, + { + "epoch": 0.89, + "learning_rate": 1.6520826469398546e-06, + "loss": 0.8701, + "step": 34609 + }, + { + "epoch": 0.89, + "learning_rate": 1.652061668394014e-06, + "loss": 1.0889, + "step": 34610 + }, + { + "epoch": 0.89, + "learning_rate": 1.6520406893489197e-06, + "loss": 0.7271, + "step": 34611 + }, + { + "epoch": 0.89, + "learning_rate": 1.6520197098045873e-06, + "loss": 0.6699, + "step": 34612 + }, + { + "epoch": 0.89, + "learning_rate": 1.6519987297610339e-06, + "loss": 0.8867, + "step": 34613 + }, + { + "epoch": 0.89, + "learning_rate": 1.651977749218275e-06, + "loss": 0.8252, + "step": 34614 + }, + { + "epoch": 0.89, + "learning_rate": 1.6519567681763267e-06, + "loss": 0.9131, + "step": 34615 + }, + { + "epoch": 0.89, + "learning_rate": 1.6519357866352049e-06, + "loss": 0.9053, + "step": 34616 + }, + { + "epoch": 0.89, + "learning_rate": 1.6519148045949258e-06, + "loss": 0.6357, + "step": 34617 + }, + { + "epoch": 0.89, + "learning_rate": 1.6518938220555057e-06, + "loss": 0.7817, + "step": 34618 + }, + { + "epoch": 0.89, + "learning_rate": 1.6518728390169604e-06, + "loss": 0.8496, + "step": 34619 + }, + { + "epoch": 0.89, + "learning_rate": 1.6518518554793063e-06, + "loss": 0.5593, + "step": 34620 + }, + { + "epoch": 0.89, + "learning_rate": 1.651830871442559e-06, + "loss": 0.5693, + "step": 34621 + }, + { + "epoch": 0.89, + "learning_rate": 1.6518098869067347e-06, + "loss": 1.043, + "step": 34622 + }, + { + "epoch": 0.89, + "learning_rate": 1.6517889018718496e-06, + "loss": 0.5894, + "step": 34623 + }, + { + "epoch": 0.89, + "learning_rate": 1.6517679163379196e-06, + "loss": 0.9209, + "step": 34624 + }, + { + "epoch": 0.89, + "learning_rate": 1.651746930304961e-06, + "loss": 0.8613, + "step": 34625 + }, + { + "epoch": 0.89, + "learning_rate": 1.6517259437729898e-06, + "loss": 1.0381, + "step": 34626 + }, + { + "epoch": 0.89, + "learning_rate": 1.651704956742022e-06, + "loss": 0.9502, + "step": 34627 + }, + { + "epoch": 0.89, + "learning_rate": 1.6516839692120737e-06, + "loss": 0.874, + "step": 34628 + }, + { + "epoch": 0.89, + "learning_rate": 1.6516629811831608e-06, + "loss": 0.7983, + "step": 34629 + }, + { + "epoch": 0.89, + "learning_rate": 1.6516419926553e-06, + "loss": 0.9883, + "step": 34630 + }, + { + "epoch": 0.89, + "learning_rate": 1.6516210036285061e-06, + "loss": 0.8604, + "step": 34631 + }, + { + "epoch": 0.89, + "learning_rate": 1.6516000141027964e-06, + "loss": 0.8813, + "step": 34632 + }, + { + "epoch": 0.89, + "learning_rate": 1.6515790240781864e-06, + "loss": 0.4575, + "step": 34633 + }, + { + "epoch": 0.89, + "learning_rate": 1.6515580335546923e-06, + "loss": 0.8174, + "step": 34634 + }, + { + "epoch": 0.89, + "learning_rate": 1.6515370425323302e-06, + "loss": 0.9043, + "step": 34635 + }, + { + "epoch": 0.89, + "learning_rate": 1.6515160510111163e-06, + "loss": 0.8936, + "step": 34636 + }, + { + "epoch": 0.89, + "learning_rate": 1.6514950589910663e-06, + "loss": 0.7988, + "step": 34637 + }, + { + "epoch": 0.89, + "learning_rate": 1.6514740664721969e-06, + "loss": 0.6274, + "step": 34638 + }, + { + "epoch": 0.89, + "learning_rate": 1.6514530734545233e-06, + "loss": 0.9121, + "step": 34639 + }, + { + "epoch": 0.89, + "learning_rate": 1.6514320799380623e-06, + "loss": 0.8999, + "step": 34640 + }, + { + "epoch": 0.89, + "learning_rate": 1.6514110859228295e-06, + "loss": 0.9233, + "step": 34641 + }, + { + "epoch": 0.89, + "learning_rate": 1.6513900914088413e-06, + "loss": 0.8975, + "step": 34642 + }, + { + "epoch": 0.89, + "learning_rate": 1.6513690963961136e-06, + "loss": 0.8281, + "step": 34643 + }, + { + "epoch": 0.89, + "learning_rate": 1.6513481008846628e-06, + "loss": 0.8379, + "step": 34644 + }, + { + "epoch": 0.89, + "learning_rate": 1.6513271048745044e-06, + "loss": 0.5896, + "step": 34645 + }, + { + "epoch": 0.89, + "learning_rate": 1.651306108365655e-06, + "loss": 0.6904, + "step": 34646 + }, + { + "epoch": 0.89, + "learning_rate": 1.6512851113581303e-06, + "loss": 0.6885, + "step": 34647 + }, + { + "epoch": 0.89, + "learning_rate": 1.6512641138519465e-06, + "loss": 0.8975, + "step": 34648 + }, + { + "epoch": 0.89, + "learning_rate": 1.6512431158471197e-06, + "loss": 0.7646, + "step": 34649 + }, + { + "epoch": 0.89, + "learning_rate": 1.6512221173436663e-06, + "loss": 0.8926, + "step": 34650 + }, + { + "epoch": 0.89, + "learning_rate": 1.6512011183416016e-06, + "loss": 0.8447, + "step": 34651 + }, + { + "epoch": 0.89, + "learning_rate": 1.6511801188409424e-06, + "loss": 0.6069, + "step": 34652 + }, + { + "epoch": 0.89, + "learning_rate": 1.6511591188417046e-06, + "loss": 0.6877, + "step": 34653 + }, + { + "epoch": 0.89, + "learning_rate": 1.6511381183439042e-06, + "loss": 0.5923, + "step": 34654 + }, + { + "epoch": 0.89, + "learning_rate": 1.651117117347557e-06, + "loss": 0.9023, + "step": 34655 + }, + { + "epoch": 0.89, + "learning_rate": 1.6510961158526796e-06, + "loss": 1.0361, + "step": 34656 + }, + { + "epoch": 0.89, + "learning_rate": 1.651075113859288e-06, + "loss": 0.9102, + "step": 34657 + }, + { + "epoch": 0.89, + "learning_rate": 1.6510541113673978e-06, + "loss": 0.8613, + "step": 34658 + }, + { + "epoch": 0.89, + "learning_rate": 1.6510331083770256e-06, + "loss": 0.8516, + "step": 34659 + }, + { + "epoch": 0.89, + "learning_rate": 1.6510121048881875e-06, + "loss": 0.8555, + "step": 34660 + }, + { + "epoch": 0.89, + "learning_rate": 1.650991100900899e-06, + "loss": 0.9463, + "step": 34661 + }, + { + "epoch": 0.89, + "learning_rate": 1.6509700964151767e-06, + "loss": 0.6099, + "step": 34662 + }, + { + "epoch": 0.89, + "learning_rate": 1.6509490914310363e-06, + "loss": 0.8418, + "step": 34663 + }, + { + "epoch": 0.89, + "learning_rate": 1.6509280859484942e-06, + "loss": 0.9824, + "step": 34664 + }, + { + "epoch": 0.89, + "learning_rate": 1.6509070799675667e-06, + "loss": 0.8472, + "step": 34665 + }, + { + "epoch": 0.89, + "learning_rate": 1.6508860734882693e-06, + "loss": 0.7036, + "step": 34666 + }, + { + "epoch": 0.89, + "learning_rate": 1.6508650665106182e-06, + "loss": 0.9365, + "step": 34667 + }, + { + "epoch": 0.89, + "learning_rate": 1.65084405903463e-06, + "loss": 0.7002, + "step": 34668 + }, + { + "epoch": 0.89, + "learning_rate": 1.6508230510603202e-06, + "loss": 0.9199, + "step": 34669 + }, + { + "epoch": 0.89, + "learning_rate": 1.6508020425877055e-06, + "loss": 1.0693, + "step": 34670 + }, + { + "epoch": 0.89, + "learning_rate": 1.6507810336168012e-06, + "loss": 0.8438, + "step": 34671 + }, + { + "epoch": 0.89, + "learning_rate": 1.6507600241476238e-06, + "loss": 0.9746, + "step": 34672 + }, + { + "epoch": 0.89, + "learning_rate": 1.6507390141801895e-06, + "loss": 0.9414, + "step": 34673 + }, + { + "epoch": 0.89, + "learning_rate": 1.6507180037145143e-06, + "loss": 0.8115, + "step": 34674 + }, + { + "epoch": 0.89, + "learning_rate": 1.650696992750614e-06, + "loss": 0.8467, + "step": 34675 + }, + { + "epoch": 0.89, + "learning_rate": 1.650675981288505e-06, + "loss": 0.8223, + "step": 34676 + }, + { + "epoch": 0.89, + "learning_rate": 1.6506549693282036e-06, + "loss": 0.7141, + "step": 34677 + }, + { + "epoch": 0.89, + "learning_rate": 1.6506339568697254e-06, + "loss": 0.9424, + "step": 34678 + }, + { + "epoch": 0.89, + "learning_rate": 1.6506129439130867e-06, + "loss": 0.8506, + "step": 34679 + }, + { + "epoch": 0.89, + "learning_rate": 1.6505919304583038e-06, + "loss": 1.0049, + "step": 34680 + }, + { + "epoch": 0.89, + "learning_rate": 1.6505709165053925e-06, + "loss": 0.8984, + "step": 34681 + }, + { + "epoch": 0.89, + "learning_rate": 1.6505499020543688e-06, + "loss": 0.688, + "step": 34682 + }, + { + "epoch": 0.89, + "learning_rate": 1.6505288871052487e-06, + "loss": 0.6343, + "step": 34683 + }, + { + "epoch": 0.89, + "learning_rate": 1.6505078716580489e-06, + "loss": 0.7324, + "step": 34684 + }, + { + "epoch": 0.89, + "learning_rate": 1.6504868557127854e-06, + "loss": 0.8613, + "step": 34685 + }, + { + "epoch": 0.89, + "learning_rate": 1.6504658392694736e-06, + "loss": 0.7383, + "step": 34686 + }, + { + "epoch": 0.89, + "learning_rate": 1.6504448223281303e-06, + "loss": 0.8701, + "step": 34687 + }, + { + "epoch": 0.89, + "learning_rate": 1.6504238048887708e-06, + "loss": 0.917, + "step": 34688 + }, + { + "epoch": 0.89, + "learning_rate": 1.650402786951412e-06, + "loss": 0.9561, + "step": 34689 + }, + { + "epoch": 0.89, + "learning_rate": 1.65038176851607e-06, + "loss": 0.6553, + "step": 34690 + }, + { + "epoch": 0.89, + "learning_rate": 1.6503607495827603e-06, + "loss": 0.9502, + "step": 34691 + }, + { + "epoch": 0.89, + "learning_rate": 1.6503397301514993e-06, + "loss": 0.7744, + "step": 34692 + }, + { + "epoch": 0.89, + "learning_rate": 1.6503187102223027e-06, + "loss": 1.0029, + "step": 34693 + }, + { + "epoch": 0.89, + "learning_rate": 1.6502976897951874e-06, + "loss": 1.0654, + "step": 34694 + }, + { + "epoch": 0.89, + "learning_rate": 1.6502766688701692e-06, + "loss": 0.9375, + "step": 34695 + }, + { + "epoch": 0.89, + "learning_rate": 1.6502556474472637e-06, + "loss": 0.8018, + "step": 34696 + }, + { + "epoch": 0.89, + "learning_rate": 1.6502346255264875e-06, + "loss": 0.957, + "step": 34697 + }, + { + "epoch": 0.89, + "learning_rate": 1.6502136031078563e-06, + "loss": 0.8652, + "step": 34698 + }, + { + "epoch": 0.89, + "learning_rate": 1.650192580191387e-06, + "loss": 0.9883, + "step": 34699 + }, + { + "epoch": 0.89, + "learning_rate": 1.6501715567770948e-06, + "loss": 0.9268, + "step": 34700 + }, + { + "epoch": 0.89, + "learning_rate": 1.650150532864996e-06, + "loss": 0.7949, + "step": 34701 + }, + { + "epoch": 0.89, + "learning_rate": 1.650129508455107e-06, + "loss": 0.7441, + "step": 34702 + }, + { + "epoch": 0.89, + "learning_rate": 1.6501084835474438e-06, + "loss": 0.7852, + "step": 34703 + }, + { + "epoch": 0.89, + "learning_rate": 1.6500874581420221e-06, + "loss": 1.0254, + "step": 34704 + }, + { + "epoch": 0.89, + "learning_rate": 1.650066432238859e-06, + "loss": 1.0869, + "step": 34705 + }, + { + "epoch": 0.89, + "learning_rate": 1.6500454058379694e-06, + "loss": 1.0352, + "step": 34706 + }, + { + "epoch": 0.89, + "learning_rate": 1.6500243789393697e-06, + "loss": 0.7793, + "step": 34707 + }, + { + "epoch": 0.89, + "learning_rate": 1.6500033515430767e-06, + "loss": 0.8423, + "step": 34708 + }, + { + "epoch": 0.89, + "learning_rate": 1.649982323649106e-06, + "loss": 0.749, + "step": 34709 + }, + { + "epoch": 0.89, + "learning_rate": 1.6499612952574734e-06, + "loss": 0.7607, + "step": 34710 + }, + { + "epoch": 0.89, + "learning_rate": 1.6499402663681955e-06, + "loss": 0.8281, + "step": 34711 + }, + { + "epoch": 0.89, + "learning_rate": 1.6499192369812885e-06, + "loss": 0.8555, + "step": 34712 + }, + { + "epoch": 0.89, + "learning_rate": 1.6498982070967678e-06, + "loss": 0.8159, + "step": 34713 + }, + { + "epoch": 0.89, + "learning_rate": 1.64987717671465e-06, + "loss": 0.592, + "step": 34714 + }, + { + "epoch": 0.89, + "learning_rate": 1.6498561458349514e-06, + "loss": 0.8042, + "step": 34715 + }, + { + "epoch": 0.89, + "learning_rate": 1.6498351144576877e-06, + "loss": 0.6831, + "step": 34716 + }, + { + "epoch": 0.89, + "learning_rate": 1.6498140825828748e-06, + "loss": 0.7793, + "step": 34717 + }, + { + "epoch": 0.89, + "learning_rate": 1.6497930502105292e-06, + "loss": 1.0684, + "step": 34718 + }, + { + "epoch": 0.89, + "learning_rate": 1.6497720173406674e-06, + "loss": 0.8389, + "step": 34719 + }, + { + "epoch": 0.89, + "learning_rate": 1.6497509839733046e-06, + "loss": 0.6382, + "step": 34720 + }, + { + "epoch": 0.89, + "learning_rate": 1.6497299501084576e-06, + "loss": 0.9746, + "step": 34721 + }, + { + "epoch": 0.89, + "learning_rate": 1.6497089157461421e-06, + "loss": 0.8457, + "step": 34722 + }, + { + "epoch": 0.89, + "learning_rate": 1.6496878808863746e-06, + "loss": 0.7871, + "step": 34723 + }, + { + "epoch": 0.89, + "learning_rate": 1.6496668455291709e-06, + "loss": 0.998, + "step": 34724 + }, + { + "epoch": 0.89, + "learning_rate": 1.6496458096745469e-06, + "loss": 1.0186, + "step": 34725 + }, + { + "epoch": 0.89, + "learning_rate": 1.649624773322519e-06, + "loss": 0.9023, + "step": 34726 + }, + { + "epoch": 0.89, + "learning_rate": 1.6496037364731037e-06, + "loss": 0.8682, + "step": 34727 + }, + { + "epoch": 0.89, + "learning_rate": 1.6495826991263164e-06, + "loss": 0.8564, + "step": 34728 + }, + { + "epoch": 0.89, + "learning_rate": 1.6495616612821736e-06, + "loss": 0.8535, + "step": 34729 + }, + { + "epoch": 0.89, + "learning_rate": 1.6495406229406909e-06, + "loss": 0.7988, + "step": 34730 + }, + { + "epoch": 0.89, + "learning_rate": 1.649519584101885e-06, + "loss": 0.9102, + "step": 34731 + }, + { + "epoch": 0.89, + "learning_rate": 1.6494985447657723e-06, + "loss": 0.7368, + "step": 34732 + }, + { + "epoch": 0.89, + "learning_rate": 1.6494775049323679e-06, + "loss": 0.7627, + "step": 34733 + }, + { + "epoch": 0.89, + "learning_rate": 1.6494564646016889e-06, + "loss": 0.5718, + "step": 34734 + }, + { + "epoch": 0.89, + "learning_rate": 1.6494354237737507e-06, + "loss": 0.8506, + "step": 34735 + }, + { + "epoch": 0.89, + "learning_rate": 1.6494143824485693e-06, + "loss": 0.9062, + "step": 34736 + }, + { + "epoch": 0.89, + "learning_rate": 1.6493933406261617e-06, + "loss": 0.7056, + "step": 34737 + }, + { + "epoch": 0.89, + "learning_rate": 1.649372298306543e-06, + "loss": 0.8652, + "step": 34738 + }, + { + "epoch": 0.89, + "learning_rate": 1.6493512554897305e-06, + "loss": 0.9463, + "step": 34739 + }, + { + "epoch": 0.89, + "learning_rate": 1.649330212175739e-06, + "loss": 0.7344, + "step": 34740 + }, + { + "epoch": 0.89, + "learning_rate": 1.6493091683645853e-06, + "loss": 0.5061, + "step": 34741 + }, + { + "epoch": 0.89, + "learning_rate": 1.6492881240562855e-06, + "loss": 0.6191, + "step": 34742 + }, + { + "epoch": 0.89, + "learning_rate": 1.6492670792508555e-06, + "loss": 0.8574, + "step": 34743 + }, + { + "epoch": 0.89, + "learning_rate": 1.6492460339483119e-06, + "loss": 0.7061, + "step": 34744 + }, + { + "epoch": 0.89, + "learning_rate": 1.6492249881486702e-06, + "loss": 0.8154, + "step": 34745 + }, + { + "epoch": 0.89, + "learning_rate": 1.6492039418519468e-06, + "loss": 0.73, + "step": 34746 + }, + { + "epoch": 0.89, + "learning_rate": 1.6491828950581578e-06, + "loss": 1.0762, + "step": 34747 + }, + { + "epoch": 0.89, + "learning_rate": 1.6491618477673193e-06, + "loss": 0.9688, + "step": 34748 + }, + { + "epoch": 0.89, + "learning_rate": 1.6491407999794476e-06, + "loss": 0.9199, + "step": 34749 + }, + { + "epoch": 0.89, + "learning_rate": 1.6491197516945583e-06, + "loss": 0.6592, + "step": 34750 + }, + { + "epoch": 0.89, + "learning_rate": 1.6490987029126682e-06, + "loss": 0.6309, + "step": 34751 + }, + { + "epoch": 0.89, + "learning_rate": 1.649077653633793e-06, + "loss": 0.8359, + "step": 34752 + }, + { + "epoch": 0.89, + "learning_rate": 1.6490566038579487e-06, + "loss": 0.833, + "step": 34753 + }, + { + "epoch": 0.89, + "learning_rate": 1.6490355535851519e-06, + "loss": 1.0088, + "step": 34754 + }, + { + "epoch": 0.89, + "learning_rate": 1.6490145028154182e-06, + "loss": 0.7104, + "step": 34755 + }, + { + "epoch": 0.89, + "learning_rate": 1.6489934515487637e-06, + "loss": 0.9814, + "step": 34756 + }, + { + "epoch": 0.89, + "learning_rate": 1.648972399785205e-06, + "loss": 0.9072, + "step": 34757 + }, + { + "epoch": 0.89, + "learning_rate": 1.6489513475247581e-06, + "loss": 0.8135, + "step": 34758 + }, + { + "epoch": 0.89, + "learning_rate": 1.6489302947674387e-06, + "loss": 0.7178, + "step": 34759 + }, + { + "epoch": 0.89, + "learning_rate": 1.6489092415132638e-06, + "loss": 0.9824, + "step": 34760 + }, + { + "epoch": 0.89, + "learning_rate": 1.6488881877622482e-06, + "loss": 0.6331, + "step": 34761 + }, + { + "epoch": 0.89, + "learning_rate": 1.6488671335144094e-06, + "loss": 0.9092, + "step": 34762 + }, + { + "epoch": 0.89, + "learning_rate": 1.6488460787697624e-06, + "loss": 0.7021, + "step": 34763 + }, + { + "epoch": 0.89, + "learning_rate": 1.648825023528324e-06, + "loss": 0.8076, + "step": 34764 + }, + { + "epoch": 0.89, + "learning_rate": 1.6488039677901097e-06, + "loss": 0.6738, + "step": 34765 + }, + { + "epoch": 0.89, + "learning_rate": 1.6487829115551367e-06, + "loss": 0.8799, + "step": 34766 + }, + { + "epoch": 0.89, + "learning_rate": 1.64876185482342e-06, + "loss": 0.614, + "step": 34767 + }, + { + "epoch": 0.89, + "learning_rate": 1.6487407975949763e-06, + "loss": 0.9126, + "step": 34768 + }, + { + "epoch": 0.89, + "learning_rate": 1.6487197398698216e-06, + "loss": 0.8047, + "step": 34769 + }, + { + "epoch": 0.89, + "learning_rate": 1.6486986816479721e-06, + "loss": 0.7576, + "step": 34770 + }, + { + "epoch": 0.89, + "learning_rate": 1.6486776229294439e-06, + "loss": 0.9404, + "step": 34771 + }, + { + "epoch": 0.89, + "learning_rate": 1.648656563714253e-06, + "loss": 0.6182, + "step": 34772 + }, + { + "epoch": 0.89, + "learning_rate": 1.6486355040024153e-06, + "loss": 0.8237, + "step": 34773 + }, + { + "epoch": 0.89, + "learning_rate": 1.6486144437939477e-06, + "loss": 0.8867, + "step": 34774 + }, + { + "epoch": 0.89, + "learning_rate": 1.6485933830888656e-06, + "loss": 0.8896, + "step": 34775 + }, + { + "epoch": 0.89, + "learning_rate": 1.6485723218871853e-06, + "loss": 0.915, + "step": 34776 + }, + { + "epoch": 0.89, + "learning_rate": 1.648551260188923e-06, + "loss": 0.8555, + "step": 34777 + }, + { + "epoch": 0.89, + "learning_rate": 1.6485301979940952e-06, + "loss": 0.8359, + "step": 34778 + }, + { + "epoch": 0.89, + "learning_rate": 1.6485091353027175e-06, + "loss": 0.6987, + "step": 34779 + }, + { + "epoch": 0.89, + "learning_rate": 1.648488072114806e-06, + "loss": 0.8662, + "step": 34780 + }, + { + "epoch": 0.89, + "learning_rate": 1.648467008430377e-06, + "loss": 0.7627, + "step": 34781 + }, + { + "epoch": 0.89, + "learning_rate": 1.6484459442494465e-06, + "loss": 0.9756, + "step": 34782 + }, + { + "epoch": 0.89, + "learning_rate": 1.648424879572031e-06, + "loss": 0.8418, + "step": 34783 + }, + { + "epoch": 0.89, + "learning_rate": 1.6484038143981462e-06, + "loss": 0.9004, + "step": 34784 + }, + { + "epoch": 0.89, + "learning_rate": 1.6483827487278087e-06, + "loss": 1.042, + "step": 34785 + }, + { + "epoch": 0.89, + "learning_rate": 1.648361682561034e-06, + "loss": 0.7832, + "step": 34786 + }, + { + "epoch": 0.89, + "learning_rate": 1.6483406158978388e-06, + "loss": 0.7886, + "step": 34787 + }, + { + "epoch": 0.89, + "learning_rate": 1.6483195487382391e-06, + "loss": 0.7334, + "step": 34788 + }, + { + "epoch": 0.89, + "learning_rate": 1.6482984810822508e-06, + "loss": 0.8242, + "step": 34789 + }, + { + "epoch": 0.89, + "learning_rate": 1.6482774129298899e-06, + "loss": 0.7471, + "step": 34790 + }, + { + "epoch": 0.89, + "learning_rate": 1.6482563442811732e-06, + "loss": 0.8174, + "step": 34791 + }, + { + "epoch": 0.89, + "learning_rate": 1.6482352751361162e-06, + "loss": 0.8887, + "step": 34792 + }, + { + "epoch": 0.89, + "learning_rate": 1.6482142054947351e-06, + "loss": 0.9229, + "step": 34793 + }, + { + "epoch": 0.89, + "learning_rate": 1.6481931353570465e-06, + "loss": 0.7617, + "step": 34794 + }, + { + "epoch": 0.89, + "learning_rate": 1.6481720647230661e-06, + "loss": 1.0039, + "step": 34795 + }, + { + "epoch": 0.89, + "learning_rate": 1.6481509935928101e-06, + "loss": 0.9365, + "step": 34796 + }, + { + "epoch": 0.89, + "learning_rate": 1.6481299219662947e-06, + "loss": 0.6914, + "step": 34797 + }, + { + "epoch": 0.89, + "learning_rate": 1.6481088498435364e-06, + "loss": 0.7734, + "step": 34798 + }, + { + "epoch": 0.89, + "learning_rate": 1.6480877772245507e-06, + "loss": 0.8271, + "step": 34799 + }, + { + "epoch": 0.89, + "learning_rate": 1.648066704109354e-06, + "loss": 0.957, + "step": 34800 + }, + { + "epoch": 0.89, + "learning_rate": 1.648045630497962e-06, + "loss": 0.8672, + "step": 34801 + }, + { + "epoch": 0.89, + "learning_rate": 1.6480245563903918e-06, + "loss": 0.8193, + "step": 34802 + }, + { + "epoch": 0.89, + "learning_rate": 1.6480034817866585e-06, + "loss": 0.7061, + "step": 34803 + }, + { + "epoch": 0.89, + "learning_rate": 1.647982406686779e-06, + "loss": 0.6987, + "step": 34804 + }, + { + "epoch": 0.89, + "learning_rate": 1.6479613310907695e-06, + "loss": 0.8496, + "step": 34805 + }, + { + "epoch": 0.89, + "learning_rate": 1.6479402549986453e-06, + "loss": 0.9043, + "step": 34806 + }, + { + "epoch": 0.89, + "learning_rate": 1.6479191784104233e-06, + "loss": 0.8608, + "step": 34807 + }, + { + "epoch": 0.89, + "learning_rate": 1.6478981013261195e-06, + "loss": 0.9199, + "step": 34808 + }, + { + "epoch": 0.89, + "learning_rate": 1.6478770237457495e-06, + "loss": 0.8682, + "step": 34809 + }, + { + "epoch": 0.89, + "learning_rate": 1.6478559456693302e-06, + "loss": 0.998, + "step": 34810 + }, + { + "epoch": 0.89, + "learning_rate": 1.6478348670968774e-06, + "loss": 0.8945, + "step": 34811 + }, + { + "epoch": 0.89, + "learning_rate": 1.647813788028407e-06, + "loss": 0.8154, + "step": 34812 + }, + { + "epoch": 0.89, + "learning_rate": 1.6477927084639353e-06, + "loss": 0.6431, + "step": 34813 + }, + { + "epoch": 0.89, + "learning_rate": 1.6477716284034788e-06, + "loss": 0.8174, + "step": 34814 + }, + { + "epoch": 0.89, + "learning_rate": 1.6477505478470533e-06, + "loss": 0.7891, + "step": 34815 + }, + { + "epoch": 0.89, + "learning_rate": 1.6477294667946747e-06, + "loss": 0.9541, + "step": 34816 + }, + { + "epoch": 0.89, + "learning_rate": 1.64770838524636e-06, + "loss": 0.8135, + "step": 34817 + }, + { + "epoch": 0.89, + "learning_rate": 1.6476873032021242e-06, + "loss": 1.0195, + "step": 34818 + }, + { + "epoch": 0.89, + "learning_rate": 1.6476662206619842e-06, + "loss": 0.8926, + "step": 34819 + }, + { + "epoch": 0.89, + "learning_rate": 1.6476451376259561e-06, + "loss": 0.8203, + "step": 34820 + }, + { + "epoch": 0.89, + "learning_rate": 1.6476240540940557e-06, + "loss": 0.8623, + "step": 34821 + }, + { + "epoch": 0.89, + "learning_rate": 1.6476029700662997e-06, + "loss": 0.917, + "step": 34822 + }, + { + "epoch": 0.89, + "learning_rate": 1.6475818855427033e-06, + "loss": 0.8574, + "step": 34823 + }, + { + "epoch": 0.89, + "learning_rate": 1.647560800523284e-06, + "loss": 0.6821, + "step": 34824 + }, + { + "epoch": 0.89, + "learning_rate": 1.6475397150080564e-06, + "loss": 0.8154, + "step": 34825 + }, + { + "epoch": 0.89, + "learning_rate": 1.6475186289970377e-06, + "loss": 0.8633, + "step": 34826 + }, + { + "epoch": 0.89, + "learning_rate": 1.6474975424902437e-06, + "loss": 0.9238, + "step": 34827 + }, + { + "epoch": 0.89, + "learning_rate": 1.6474764554876908e-06, + "loss": 0.9209, + "step": 34828 + }, + { + "epoch": 0.89, + "learning_rate": 1.6474553679893947e-06, + "loss": 0.8428, + "step": 34829 + }, + { + "epoch": 0.89, + "learning_rate": 1.6474342799953722e-06, + "loss": 0.877, + "step": 34830 + }, + { + "epoch": 0.89, + "learning_rate": 1.6474131915056386e-06, + "loss": 0.562, + "step": 34831 + }, + { + "epoch": 0.89, + "learning_rate": 1.6473921025202108e-06, + "loss": 0.8271, + "step": 34832 + }, + { + "epoch": 0.89, + "learning_rate": 1.6473710130391044e-06, + "loss": 1.0723, + "step": 34833 + }, + { + "epoch": 0.89, + "learning_rate": 1.647349923062336e-06, + "loss": 0.6689, + "step": 34834 + }, + { + "epoch": 0.89, + "learning_rate": 1.6473288325899213e-06, + "loss": 1.0234, + "step": 34835 + }, + { + "epoch": 0.89, + "learning_rate": 1.6473077416218769e-06, + "loss": 0.9141, + "step": 34836 + }, + { + "epoch": 0.89, + "learning_rate": 1.6472866501582185e-06, + "loss": 0.999, + "step": 34837 + }, + { + "epoch": 0.89, + "learning_rate": 1.6472655581989624e-06, + "loss": 1.0176, + "step": 34838 + }, + { + "epoch": 0.89, + "learning_rate": 1.6472444657441253e-06, + "loss": 1.0469, + "step": 34839 + }, + { + "epoch": 0.89, + "learning_rate": 1.6472233727937226e-06, + "loss": 1.0645, + "step": 34840 + }, + { + "epoch": 0.89, + "learning_rate": 1.6472022793477708e-06, + "loss": 0.9512, + "step": 34841 + }, + { + "epoch": 0.89, + "learning_rate": 1.6471811854062858e-06, + "loss": 0.8711, + "step": 34842 + }, + { + "epoch": 0.89, + "learning_rate": 1.6471600909692839e-06, + "loss": 0.5391, + "step": 34843 + }, + { + "epoch": 0.89, + "learning_rate": 1.6471389960367816e-06, + "loss": 0.8926, + "step": 34844 + }, + { + "epoch": 0.89, + "learning_rate": 1.6471179006087946e-06, + "loss": 0.8701, + "step": 34845 + }, + { + "epoch": 0.89, + "learning_rate": 1.6470968046853391e-06, + "loss": 0.8862, + "step": 34846 + }, + { + "epoch": 0.89, + "learning_rate": 1.6470757082664313e-06, + "loss": 1.0098, + "step": 34847 + }, + { + "epoch": 0.89, + "learning_rate": 1.6470546113520873e-06, + "loss": 0.7783, + "step": 34848 + }, + { + "epoch": 0.89, + "learning_rate": 1.6470335139423233e-06, + "loss": 0.8477, + "step": 34849 + }, + { + "epoch": 0.89, + "learning_rate": 1.647012416037156e-06, + "loss": 0.7446, + "step": 34850 + }, + { + "epoch": 0.89, + "learning_rate": 1.6469913176366003e-06, + "loss": 0.7861, + "step": 34851 + }, + { + "epoch": 0.89, + "learning_rate": 1.6469702187406736e-06, + "loss": 0.7227, + "step": 34852 + }, + { + "epoch": 0.89, + "learning_rate": 1.6469491193493914e-06, + "loss": 0.9395, + "step": 34853 + }, + { + "epoch": 0.89, + "learning_rate": 1.6469280194627703e-06, + "loss": 0.7993, + "step": 34854 + }, + { + "epoch": 0.89, + "learning_rate": 1.6469069190808256e-06, + "loss": 0.8521, + "step": 34855 + }, + { + "epoch": 0.89, + "learning_rate": 1.6468858182035743e-06, + "loss": 0.6147, + "step": 34856 + }, + { + "epoch": 0.89, + "learning_rate": 1.6468647168310323e-06, + "loss": 0.8613, + "step": 34857 + }, + { + "epoch": 0.89, + "learning_rate": 1.6468436149632157e-06, + "loss": 0.7812, + "step": 34858 + }, + { + "epoch": 0.89, + "learning_rate": 1.6468225126001406e-06, + "loss": 0.752, + "step": 34859 + }, + { + "epoch": 0.89, + "learning_rate": 1.6468014097418234e-06, + "loss": 0.6709, + "step": 34860 + }, + { + "epoch": 0.89, + "learning_rate": 1.64678030638828e-06, + "loss": 0.8633, + "step": 34861 + }, + { + "epoch": 0.89, + "learning_rate": 1.646759202539527e-06, + "loss": 0.8545, + "step": 34862 + }, + { + "epoch": 0.89, + "learning_rate": 1.6467380981955797e-06, + "loss": 0.8218, + "step": 34863 + }, + { + "epoch": 0.89, + "learning_rate": 1.6467169933564554e-06, + "loss": 0.8145, + "step": 34864 + }, + { + "epoch": 0.89, + "learning_rate": 1.6466958880221691e-06, + "loss": 0.6699, + "step": 34865 + }, + { + "epoch": 0.89, + "learning_rate": 1.6466747821927375e-06, + "loss": 0.6982, + "step": 34866 + }, + { + "epoch": 0.89, + "learning_rate": 1.646653675868177e-06, + "loss": 0.8467, + "step": 34867 + }, + { + "epoch": 0.89, + "learning_rate": 1.6466325690485031e-06, + "loss": 0.876, + "step": 34868 + }, + { + "epoch": 0.89, + "learning_rate": 1.646611461733733e-06, + "loss": 0.6685, + "step": 34869 + }, + { + "epoch": 0.89, + "learning_rate": 1.6465903539238818e-06, + "loss": 0.6924, + "step": 34870 + }, + { + "epoch": 0.89, + "learning_rate": 1.6465692456189663e-06, + "loss": 1.0742, + "step": 34871 + }, + { + "epoch": 0.89, + "learning_rate": 1.6465481368190025e-06, + "loss": 1.043, + "step": 34872 + }, + { + "epoch": 0.89, + "learning_rate": 1.6465270275240063e-06, + "loss": 0.8066, + "step": 34873 + }, + { + "epoch": 0.89, + "learning_rate": 1.6465059177339939e-06, + "loss": 0.7104, + "step": 34874 + }, + { + "epoch": 0.89, + "learning_rate": 1.6464848074489822e-06, + "loss": 0.833, + "step": 34875 + }, + { + "epoch": 0.89, + "learning_rate": 1.6464636966689863e-06, + "loss": 0.6382, + "step": 34876 + }, + { + "epoch": 0.89, + "learning_rate": 1.6464425853940234e-06, + "loss": 0.9375, + "step": 34877 + }, + { + "epoch": 0.89, + "learning_rate": 1.6464214736241086e-06, + "loss": 1.1475, + "step": 34878 + }, + { + "epoch": 0.89, + "learning_rate": 1.6464003613592588e-06, + "loss": 0.9736, + "step": 34879 + }, + { + "epoch": 0.89, + "learning_rate": 1.64637924859949e-06, + "loss": 0.8408, + "step": 34880 + }, + { + "epoch": 0.89, + "learning_rate": 1.6463581353448183e-06, + "loss": 0.6826, + "step": 34881 + }, + { + "epoch": 0.89, + "learning_rate": 1.6463370215952602e-06, + "loss": 0.8416, + "step": 34882 + }, + { + "epoch": 0.89, + "learning_rate": 1.6463159073508311e-06, + "loss": 0.7344, + "step": 34883 + }, + { + "epoch": 0.89, + "learning_rate": 1.646294792611548e-06, + "loss": 0.8408, + "step": 34884 + }, + { + "epoch": 0.89, + "learning_rate": 1.6462736773774264e-06, + "loss": 0.606, + "step": 34885 + }, + { + "epoch": 0.89, + "learning_rate": 1.646252561648483e-06, + "loss": 0.6787, + "step": 34886 + }, + { + "epoch": 0.89, + "learning_rate": 1.6462314454247333e-06, + "loss": 0.7695, + "step": 34887 + }, + { + "epoch": 0.89, + "learning_rate": 1.6462103287061942e-06, + "loss": 0.7312, + "step": 34888 + }, + { + "epoch": 0.89, + "learning_rate": 1.6461892114928819e-06, + "loss": 0.7891, + "step": 34889 + }, + { + "epoch": 0.89, + "learning_rate": 1.6461680937848116e-06, + "loss": 0.7979, + "step": 34890 + }, + { + "epoch": 0.89, + "learning_rate": 1.6461469755820006e-06, + "loss": 0.7354, + "step": 34891 + }, + { + "epoch": 0.89, + "learning_rate": 1.6461258568844642e-06, + "loss": 0.9004, + "step": 34892 + }, + { + "epoch": 0.89, + "learning_rate": 1.646104737692219e-06, + "loss": 1.0283, + "step": 34893 + }, + { + "epoch": 0.89, + "learning_rate": 1.6460836180052815e-06, + "loss": 0.8711, + "step": 34894 + }, + { + "epoch": 0.89, + "learning_rate": 1.6460624978236671e-06, + "loss": 1.0186, + "step": 34895 + }, + { + "epoch": 0.89, + "learning_rate": 1.6460413771473927e-06, + "loss": 1.04, + "step": 34896 + }, + { + "epoch": 0.89, + "learning_rate": 1.6460202559764737e-06, + "loss": 0.9912, + "step": 34897 + }, + { + "epoch": 0.89, + "learning_rate": 1.645999134310927e-06, + "loss": 0.8896, + "step": 34898 + }, + { + "epoch": 0.89, + "learning_rate": 1.6459780121507683e-06, + "loss": 0.8164, + "step": 34899 + }, + { + "epoch": 0.89, + "learning_rate": 1.6459568894960138e-06, + "loss": 0.8887, + "step": 34900 + }, + { + "epoch": 0.89, + "learning_rate": 1.64593576634668e-06, + "loss": 0.7109, + "step": 34901 + }, + { + "epoch": 0.89, + "learning_rate": 1.6459146427027828e-06, + "loss": 0.9346, + "step": 34902 + }, + { + "epoch": 0.89, + "learning_rate": 1.6458935185643386e-06, + "loss": 0.7253, + "step": 34903 + }, + { + "epoch": 0.89, + "learning_rate": 1.6458723939313634e-06, + "loss": 0.8721, + "step": 34904 + }, + { + "epoch": 0.89, + "learning_rate": 1.6458512688038735e-06, + "loss": 0.6919, + "step": 34905 + }, + { + "epoch": 0.89, + "learning_rate": 1.6458301431818846e-06, + "loss": 0.7217, + "step": 34906 + }, + { + "epoch": 0.89, + "learning_rate": 1.6458090170654138e-06, + "loss": 0.7236, + "step": 34907 + }, + { + "epoch": 0.89, + "learning_rate": 1.6457878904544763e-06, + "loss": 0.7695, + "step": 34908 + }, + { + "epoch": 0.89, + "learning_rate": 1.6457667633490888e-06, + "loss": 0.8394, + "step": 34909 + }, + { + "epoch": 0.89, + "learning_rate": 1.6457456357492676e-06, + "loss": 0.8887, + "step": 34910 + }, + { + "epoch": 0.89, + "learning_rate": 1.6457245076550286e-06, + "loss": 0.8555, + "step": 34911 + }, + { + "epoch": 0.89, + "learning_rate": 1.6457033790663877e-06, + "loss": 0.7651, + "step": 34912 + }, + { + "epoch": 0.89, + "learning_rate": 1.6456822499833615e-06, + "loss": 0.9336, + "step": 34913 + }, + { + "epoch": 0.89, + "learning_rate": 1.6456611204059666e-06, + "loss": 0.5151, + "step": 34914 + }, + { + "epoch": 0.89, + "learning_rate": 1.6456399903342182e-06, + "loss": 0.9258, + "step": 34915 + }, + { + "epoch": 0.89, + "learning_rate": 1.6456188597681328e-06, + "loss": 0.6289, + "step": 34916 + }, + { + "epoch": 0.89, + "learning_rate": 1.645597728707727e-06, + "loss": 0.6133, + "step": 34917 + }, + { + "epoch": 0.89, + "learning_rate": 1.6455765971530168e-06, + "loss": 0.8037, + "step": 34918 + }, + { + "epoch": 0.89, + "learning_rate": 1.6455554651040183e-06, + "loss": 1.0088, + "step": 34919 + }, + { + "epoch": 0.9, + "learning_rate": 1.6455343325607474e-06, + "loss": 0.8232, + "step": 34920 + }, + { + "epoch": 0.9, + "learning_rate": 1.6455131995232206e-06, + "loss": 0.9209, + "step": 34921 + }, + { + "epoch": 0.9, + "learning_rate": 1.645492065991454e-06, + "loss": 0.6553, + "step": 34922 + }, + { + "epoch": 0.9, + "learning_rate": 1.6454709319654641e-06, + "loss": 0.9639, + "step": 34923 + }, + { + "epoch": 0.9, + "learning_rate": 1.6454497974452667e-06, + "loss": 0.9736, + "step": 34924 + }, + { + "epoch": 0.9, + "learning_rate": 1.6454286624308778e-06, + "loss": 0.9287, + "step": 34925 + }, + { + "epoch": 0.9, + "learning_rate": 1.6454075269223138e-06, + "loss": 0.9844, + "step": 34926 + }, + { + "epoch": 0.9, + "learning_rate": 1.645386390919591e-06, + "loss": 0.875, + "step": 34927 + }, + { + "epoch": 0.9, + "learning_rate": 1.6453652544227259e-06, + "loss": 0.917, + "step": 34928 + }, + { + "epoch": 0.9, + "learning_rate": 1.6453441174317342e-06, + "loss": 0.8345, + "step": 34929 + }, + { + "epoch": 0.9, + "learning_rate": 1.645322979946632e-06, + "loss": 0.7578, + "step": 34930 + }, + { + "epoch": 0.9, + "learning_rate": 1.6453018419674357e-06, + "loss": 0.877, + "step": 34931 + }, + { + "epoch": 0.9, + "learning_rate": 1.6452807034941613e-06, + "loss": 0.8271, + "step": 34932 + }, + { + "epoch": 0.9, + "learning_rate": 1.6452595645268255e-06, + "loss": 0.7957, + "step": 34933 + }, + { + "epoch": 0.9, + "learning_rate": 1.6452384250654438e-06, + "loss": 0.8311, + "step": 34934 + }, + { + "epoch": 0.9, + "learning_rate": 1.645217285110033e-06, + "loss": 0.7666, + "step": 34935 + }, + { + "epoch": 0.9, + "learning_rate": 1.6451961446606085e-06, + "loss": 0.9668, + "step": 34936 + }, + { + "epoch": 0.9, + "learning_rate": 1.6451750037171875e-06, + "loss": 0.73, + "step": 34937 + }, + { + "epoch": 0.9, + "learning_rate": 1.6451538622797854e-06, + "loss": 0.8271, + "step": 34938 + }, + { + "epoch": 0.9, + "learning_rate": 1.6451327203484186e-06, + "loss": 0.811, + "step": 34939 + }, + { + "epoch": 0.9, + "learning_rate": 1.6451115779231036e-06, + "loss": 0.9697, + "step": 34940 + }, + { + "epoch": 0.9, + "learning_rate": 1.6450904350038562e-06, + "loss": 0.9014, + "step": 34941 + }, + { + "epoch": 0.9, + "learning_rate": 1.6450692915906924e-06, + "loss": 0.6943, + "step": 34942 + }, + { + "epoch": 0.9, + "learning_rate": 1.645048147683629e-06, + "loss": 0.9424, + "step": 34943 + }, + { + "epoch": 0.9, + "learning_rate": 1.6450270032826821e-06, + "loss": 0.7573, + "step": 34944 + }, + { + "epoch": 0.9, + "learning_rate": 1.6450058583878674e-06, + "loss": 0.8887, + "step": 34945 + }, + { + "epoch": 0.9, + "learning_rate": 1.6449847129992013e-06, + "loss": 0.8252, + "step": 34946 + }, + { + "epoch": 0.9, + "learning_rate": 1.6449635671167004e-06, + "loss": 0.7979, + "step": 34947 + }, + { + "epoch": 0.9, + "learning_rate": 1.6449424207403801e-06, + "loss": 0.8125, + "step": 34948 + }, + { + "epoch": 0.9, + "learning_rate": 1.6449212738702576e-06, + "loss": 0.7891, + "step": 34949 + }, + { + "epoch": 0.9, + "learning_rate": 1.6449001265063482e-06, + "loss": 0.8945, + "step": 34950 + }, + { + "epoch": 0.9, + "learning_rate": 1.6448789786486685e-06, + "loss": 0.9248, + "step": 34951 + }, + { + "epoch": 0.9, + "learning_rate": 1.6448578302972345e-06, + "loss": 0.8105, + "step": 34952 + }, + { + "epoch": 0.9, + "learning_rate": 1.6448366814520624e-06, + "loss": 0.9453, + "step": 34953 + }, + { + "epoch": 0.9, + "learning_rate": 1.644815532113169e-06, + "loss": 0.9961, + "step": 34954 + }, + { + "epoch": 0.9, + "learning_rate": 1.6447943822805694e-06, + "loss": 0.7529, + "step": 34955 + }, + { + "epoch": 0.9, + "learning_rate": 1.6447732319542808e-06, + "loss": 0.7104, + "step": 34956 + }, + { + "epoch": 0.9, + "learning_rate": 1.6447520811343187e-06, + "loss": 0.8809, + "step": 34957 + }, + { + "epoch": 0.9, + "learning_rate": 1.6447309298207e-06, + "loss": 0.7803, + "step": 34958 + }, + { + "epoch": 0.9, + "learning_rate": 1.6447097780134403e-06, + "loss": 1.1113, + "step": 34959 + }, + { + "epoch": 0.9, + "learning_rate": 1.644688625712556e-06, + "loss": 1.0791, + "step": 34960 + }, + { + "epoch": 0.9, + "learning_rate": 1.6446674729180629e-06, + "loss": 0.7656, + "step": 34961 + }, + { + "epoch": 0.9, + "learning_rate": 1.6446463196299779e-06, + "loss": 0.9141, + "step": 34962 + }, + { + "epoch": 0.9, + "learning_rate": 1.6446251658483169e-06, + "loss": 1.0156, + "step": 34963 + }, + { + "epoch": 0.9, + "learning_rate": 1.6446040115730957e-06, + "loss": 0.9404, + "step": 34964 + }, + { + "epoch": 0.9, + "learning_rate": 1.6445828568043312e-06, + "loss": 0.7363, + "step": 34965 + }, + { + "epoch": 0.9, + "learning_rate": 1.644561701542039e-06, + "loss": 0.8369, + "step": 34966 + }, + { + "epoch": 0.9, + "learning_rate": 1.6445405457862354e-06, + "loss": 0.7876, + "step": 34967 + }, + { + "epoch": 0.9, + "learning_rate": 1.6445193895369372e-06, + "loss": 0.8857, + "step": 34968 + }, + { + "epoch": 0.9, + "learning_rate": 1.64449823279416e-06, + "loss": 0.7725, + "step": 34969 + }, + { + "epoch": 0.9, + "learning_rate": 1.6444770755579201e-06, + "loss": 0.5283, + "step": 34970 + }, + { + "epoch": 0.9, + "learning_rate": 1.6444559178282336e-06, + "loss": 0.7793, + "step": 34971 + }, + { + "epoch": 0.9, + "learning_rate": 1.6444347596051168e-06, + "loss": 1.0898, + "step": 34972 + }, + { + "epoch": 0.9, + "learning_rate": 1.6444136008885861e-06, + "loss": 0.9209, + "step": 34973 + }, + { + "epoch": 0.9, + "learning_rate": 1.6443924416786577e-06, + "loss": 0.9746, + "step": 34974 + }, + { + "epoch": 0.9, + "learning_rate": 1.6443712819753474e-06, + "loss": 0.6064, + "step": 34975 + }, + { + "epoch": 0.9, + "learning_rate": 1.6443501217786718e-06, + "loss": 0.8652, + "step": 34976 + }, + { + "epoch": 0.9, + "learning_rate": 1.6443289610886467e-06, + "loss": 0.8184, + "step": 34977 + }, + { + "epoch": 0.9, + "learning_rate": 1.6443077999052886e-06, + "loss": 0.7471, + "step": 34978 + }, + { + "epoch": 0.9, + "learning_rate": 1.6442866382286139e-06, + "loss": 1.0234, + "step": 34979 + }, + { + "epoch": 0.9, + "learning_rate": 1.6442654760586382e-06, + "loss": 0.876, + "step": 34980 + }, + { + "epoch": 0.9, + "learning_rate": 1.644244313395378e-06, + "loss": 0.916, + "step": 34981 + }, + { + "epoch": 0.9, + "learning_rate": 1.64422315023885e-06, + "loss": 0.8325, + "step": 34982 + }, + { + "epoch": 0.9, + "learning_rate": 1.6442019865890698e-06, + "loss": 0.7144, + "step": 34983 + }, + { + "epoch": 0.9, + "learning_rate": 1.6441808224460537e-06, + "loss": 1.0293, + "step": 34984 + }, + { + "epoch": 0.9, + "learning_rate": 1.6441596578098179e-06, + "loss": 0.8545, + "step": 34985 + }, + { + "epoch": 0.9, + "learning_rate": 1.6441384926803785e-06, + "loss": 0.7983, + "step": 34986 + }, + { + "epoch": 0.9, + "learning_rate": 1.6441173270577521e-06, + "loss": 0.8203, + "step": 34987 + }, + { + "epoch": 0.9, + "learning_rate": 1.6440961609419545e-06, + "loss": 0.7812, + "step": 34988 + }, + { + "epoch": 0.9, + "learning_rate": 1.6440749943330025e-06, + "loss": 0.9209, + "step": 34989 + }, + { + "epoch": 0.9, + "learning_rate": 1.6440538272309117e-06, + "loss": 1.1465, + "step": 34990 + }, + { + "epoch": 0.9, + "learning_rate": 1.6440326596356983e-06, + "loss": 0.8779, + "step": 34991 + }, + { + "epoch": 0.9, + "learning_rate": 1.6440114915473789e-06, + "loss": 0.9116, + "step": 34992 + }, + { + "epoch": 0.9, + "learning_rate": 1.6439903229659696e-06, + "loss": 0.8906, + "step": 34993 + }, + { + "epoch": 0.9, + "learning_rate": 1.6439691538914864e-06, + "loss": 0.9287, + "step": 34994 + }, + { + "epoch": 0.9, + "learning_rate": 1.6439479843239457e-06, + "loss": 0.7588, + "step": 34995 + }, + { + "epoch": 0.9, + "learning_rate": 1.6439268142633634e-06, + "loss": 0.7314, + "step": 34996 + }, + { + "epoch": 0.9, + "learning_rate": 1.6439056437097559e-06, + "loss": 0.8369, + "step": 34997 + }, + { + "epoch": 0.9, + "learning_rate": 1.6438844726631396e-06, + "loss": 0.9453, + "step": 34998 + }, + { + "epoch": 0.9, + "learning_rate": 1.643863301123531e-06, + "loss": 0.7656, + "step": 34999 + }, + { + "epoch": 0.9, + "learning_rate": 1.6438421290909452e-06, + "loss": 0.9951, + "step": 35000 + }, + { + "epoch": 0.9, + "learning_rate": 1.6438209565653996e-06, + "loss": 0.8135, + "step": 35001 + }, + { + "epoch": 0.9, + "learning_rate": 1.6437997835469095e-06, + "loss": 0.7607, + "step": 35002 + }, + { + "epoch": 0.9, + "learning_rate": 1.643778610035492e-06, + "loss": 0.8057, + "step": 35003 + }, + { + "epoch": 0.9, + "learning_rate": 1.6437574360311624e-06, + "loss": 1.0967, + "step": 35004 + }, + { + "epoch": 0.9, + "learning_rate": 1.6437362615339371e-06, + "loss": 0.8838, + "step": 35005 + }, + { + "epoch": 0.9, + "learning_rate": 1.6437150865438332e-06, + "loss": 0.8555, + "step": 35006 + }, + { + "epoch": 0.9, + "learning_rate": 1.6436939110608655e-06, + "loss": 0.957, + "step": 35007 + }, + { + "epoch": 0.9, + "learning_rate": 1.643672735085052e-06, + "loss": 0.8291, + "step": 35008 + }, + { + "epoch": 0.9, + "learning_rate": 1.6436515586164071e-06, + "loss": 0.6753, + "step": 35009 + }, + { + "epoch": 0.9, + "learning_rate": 1.643630381654948e-06, + "loss": 0.7783, + "step": 35010 + }, + { + "epoch": 0.9, + "learning_rate": 1.6436092042006906e-06, + "loss": 0.8076, + "step": 35011 + }, + { + "epoch": 0.9, + "learning_rate": 1.6435880262536512e-06, + "loss": 0.7256, + "step": 35012 + }, + { + "epoch": 0.9, + "learning_rate": 1.6435668478138466e-06, + "loss": 0.7852, + "step": 35013 + }, + { + "epoch": 0.9, + "learning_rate": 1.6435456688812917e-06, + "loss": 0.8643, + "step": 35014 + }, + { + "epoch": 0.9, + "learning_rate": 1.6435244894560038e-06, + "loss": 0.8613, + "step": 35015 + }, + { + "epoch": 0.9, + "learning_rate": 1.6435033095379988e-06, + "loss": 0.7842, + "step": 35016 + }, + { + "epoch": 0.9, + "learning_rate": 1.6434821291272928e-06, + "loss": 0.6729, + "step": 35017 + }, + { + "epoch": 0.9, + "learning_rate": 1.6434609482239024e-06, + "loss": 0.8096, + "step": 35018 + }, + { + "epoch": 0.9, + "learning_rate": 1.6434397668278433e-06, + "loss": 0.9668, + "step": 35019 + }, + { + "epoch": 0.9, + "learning_rate": 1.643418584939132e-06, + "loss": 0.9766, + "step": 35020 + }, + { + "epoch": 0.9, + "learning_rate": 1.6433974025577847e-06, + "loss": 0.6406, + "step": 35021 + }, + { + "epoch": 0.9, + "learning_rate": 1.6433762196838174e-06, + "loss": 0.6526, + "step": 35022 + }, + { + "epoch": 0.9, + "learning_rate": 1.643355036317247e-06, + "loss": 0.8003, + "step": 35023 + }, + { + "epoch": 0.9, + "learning_rate": 1.643333852458089e-06, + "loss": 0.8828, + "step": 35024 + }, + { + "epoch": 0.9, + "learning_rate": 1.6433126681063596e-06, + "loss": 0.998, + "step": 35025 + }, + { + "epoch": 0.9, + "learning_rate": 1.6432914832620753e-06, + "loss": 0.7227, + "step": 35026 + }, + { + "epoch": 0.9, + "learning_rate": 1.6432702979252526e-06, + "loss": 0.8828, + "step": 35027 + }, + { + "epoch": 0.9, + "learning_rate": 1.643249112095907e-06, + "loss": 0.8691, + "step": 35028 + }, + { + "epoch": 0.9, + "learning_rate": 1.6432279257740555e-06, + "loss": 0.8994, + "step": 35029 + }, + { + "epoch": 0.9, + "learning_rate": 1.643206738959714e-06, + "loss": 0.9229, + "step": 35030 + }, + { + "epoch": 0.9, + "learning_rate": 1.6431855516528983e-06, + "loss": 0.9502, + "step": 35031 + }, + { + "epoch": 0.9, + "learning_rate": 1.6431643638536252e-06, + "loss": 1.0684, + "step": 35032 + }, + { + "epoch": 0.9, + "learning_rate": 1.6431431755619109e-06, + "loss": 0.7749, + "step": 35033 + }, + { + "epoch": 0.9, + "learning_rate": 1.6431219867777712e-06, + "loss": 0.6562, + "step": 35034 + }, + { + "epoch": 0.9, + "learning_rate": 1.6431007975012225e-06, + "loss": 0.873, + "step": 35035 + }, + { + "epoch": 0.9, + "learning_rate": 1.6430796077322812e-06, + "loss": 0.6775, + "step": 35036 + }, + { + "epoch": 0.9, + "learning_rate": 1.6430584174709635e-06, + "loss": 0.8301, + "step": 35037 + }, + { + "epoch": 0.9, + "learning_rate": 1.6430372267172854e-06, + "loss": 0.6914, + "step": 35038 + }, + { + "epoch": 0.9, + "learning_rate": 1.6430160354712635e-06, + "loss": 0.5869, + "step": 35039 + }, + { + "epoch": 0.9, + "learning_rate": 1.6429948437329135e-06, + "loss": 0.6592, + "step": 35040 + }, + { + "epoch": 0.9, + "learning_rate": 1.642973651502252e-06, + "loss": 0.7432, + "step": 35041 + }, + { + "epoch": 0.9, + "learning_rate": 1.6429524587792952e-06, + "loss": 0.6467, + "step": 35042 + }, + { + "epoch": 0.9, + "learning_rate": 1.6429312655640596e-06, + "loss": 0.958, + "step": 35043 + }, + { + "epoch": 0.9, + "learning_rate": 1.6429100718565606e-06, + "loss": 0.3379, + "step": 35044 + }, + { + "epoch": 0.9, + "learning_rate": 1.642888877656815e-06, + "loss": 0.646, + "step": 35045 + }, + { + "epoch": 0.9, + "learning_rate": 1.642867682964839e-06, + "loss": 0.8315, + "step": 35046 + }, + { + "epoch": 0.9, + "learning_rate": 1.6428464877806488e-06, + "loss": 0.6299, + "step": 35047 + }, + { + "epoch": 0.9, + "learning_rate": 1.6428252921042605e-06, + "loss": 0.9131, + "step": 35048 + }, + { + "epoch": 0.9, + "learning_rate": 1.6428040959356905e-06, + "loss": 0.7612, + "step": 35049 + }, + { + "epoch": 0.9, + "learning_rate": 1.6427828992749548e-06, + "loss": 0.5732, + "step": 35050 + }, + { + "epoch": 0.9, + "learning_rate": 1.6427617021220701e-06, + "loss": 0.8301, + "step": 35051 + }, + { + "epoch": 0.9, + "learning_rate": 1.642740504477052e-06, + "loss": 1.0225, + "step": 35052 + }, + { + "epoch": 0.9, + "learning_rate": 1.6427193063399174e-06, + "loss": 0.8838, + "step": 35053 + }, + { + "epoch": 0.9, + "learning_rate": 1.642698107710682e-06, + "loss": 0.8428, + "step": 35054 + }, + { + "epoch": 0.9, + "learning_rate": 1.6426769085893622e-06, + "loss": 0.9756, + "step": 35055 + }, + { + "epoch": 0.9, + "learning_rate": 1.6426557089759742e-06, + "loss": 0.7627, + "step": 35056 + }, + { + "epoch": 0.9, + "learning_rate": 1.6426345088705343e-06, + "loss": 0.9775, + "step": 35057 + }, + { + "epoch": 0.9, + "learning_rate": 1.6426133082730588e-06, + "loss": 0.5925, + "step": 35058 + }, + { + "epoch": 0.9, + "learning_rate": 1.6425921071835637e-06, + "loss": 0.9707, + "step": 35059 + }, + { + "epoch": 0.9, + "learning_rate": 1.6425709056020657e-06, + "loss": 0.8047, + "step": 35060 + }, + { + "epoch": 0.9, + "learning_rate": 1.6425497035285805e-06, + "loss": 0.9521, + "step": 35061 + }, + { + "epoch": 0.9, + "learning_rate": 1.6425285009631243e-06, + "loss": 0.71, + "step": 35062 + }, + { + "epoch": 0.9, + "learning_rate": 1.642507297905714e-06, + "loss": 0.835, + "step": 35063 + }, + { + "epoch": 0.9, + "learning_rate": 1.6424860943563653e-06, + "loss": 0.6899, + "step": 35064 + }, + { + "epoch": 0.9, + "learning_rate": 1.6424648903150942e-06, + "loss": 0.875, + "step": 35065 + }, + { + "epoch": 0.9, + "learning_rate": 1.6424436857819174e-06, + "loss": 0.8311, + "step": 35066 + }, + { + "epoch": 0.9, + "learning_rate": 1.642422480756851e-06, + "loss": 0.9268, + "step": 35067 + }, + { + "epoch": 0.9, + "learning_rate": 1.6424012752399117e-06, + "loss": 0.7451, + "step": 35068 + }, + { + "epoch": 0.9, + "learning_rate": 1.6423800692311148e-06, + "loss": 0.6836, + "step": 35069 + }, + { + "epoch": 0.9, + "learning_rate": 1.642358862730477e-06, + "loss": 0.8379, + "step": 35070 + }, + { + "epoch": 0.9, + "learning_rate": 1.6423376557380148e-06, + "loss": 0.7139, + "step": 35071 + }, + { + "epoch": 0.9, + "learning_rate": 1.6423164482537438e-06, + "loss": 0.9766, + "step": 35072 + }, + { + "epoch": 0.9, + "learning_rate": 1.6422952402776811e-06, + "loss": 0.9619, + "step": 35073 + }, + { + "epoch": 0.9, + "learning_rate": 1.6422740318098423e-06, + "loss": 0.7158, + "step": 35074 + }, + { + "epoch": 0.9, + "learning_rate": 1.642252822850244e-06, + "loss": 0.875, + "step": 35075 + }, + { + "epoch": 0.9, + "learning_rate": 1.642231613398902e-06, + "loss": 0.7471, + "step": 35076 + }, + { + "epoch": 0.9, + "learning_rate": 1.6422104034558325e-06, + "loss": 0.9561, + "step": 35077 + }, + { + "epoch": 0.9, + "learning_rate": 1.6421891930210526e-06, + "loss": 0.834, + "step": 35078 + }, + { + "epoch": 0.9, + "learning_rate": 1.6421679820945778e-06, + "loss": 0.958, + "step": 35079 + }, + { + "epoch": 0.9, + "learning_rate": 1.6421467706764242e-06, + "loss": 0.9248, + "step": 35080 + }, + { + "epoch": 0.9, + "learning_rate": 1.6421255587666085e-06, + "loss": 0.8599, + "step": 35081 + }, + { + "epoch": 0.9, + "learning_rate": 1.642104346365147e-06, + "loss": 0.8594, + "step": 35082 + }, + { + "epoch": 0.9, + "learning_rate": 1.6420831334720555e-06, + "loss": 0.8574, + "step": 35083 + }, + { + "epoch": 0.9, + "learning_rate": 1.6420619200873508e-06, + "loss": 1.0703, + "step": 35084 + }, + { + "epoch": 0.9, + "learning_rate": 1.6420407062110484e-06, + "loss": 0.5884, + "step": 35085 + }, + { + "epoch": 0.9, + "learning_rate": 1.6420194918431652e-06, + "loss": 0.7832, + "step": 35086 + }, + { + "epoch": 0.9, + "learning_rate": 1.6419982769837168e-06, + "loss": 0.877, + "step": 35087 + }, + { + "epoch": 0.9, + "learning_rate": 1.6419770616327205e-06, + "loss": 0.4651, + "step": 35088 + }, + { + "epoch": 0.9, + "learning_rate": 1.6419558457901915e-06, + "loss": 0.7671, + "step": 35089 + }, + { + "epoch": 0.9, + "learning_rate": 1.6419346294561463e-06, + "loss": 0.5342, + "step": 35090 + }, + { + "epoch": 0.9, + "learning_rate": 1.6419134126306013e-06, + "loss": 0.7769, + "step": 35091 + }, + { + "epoch": 0.9, + "learning_rate": 1.641892195313573e-06, + "loss": 0.48, + "step": 35092 + }, + { + "epoch": 0.9, + "learning_rate": 1.6418709775050772e-06, + "loss": 0.8687, + "step": 35093 + }, + { + "epoch": 0.9, + "learning_rate": 1.6418497592051303e-06, + "loss": 0.8564, + "step": 35094 + }, + { + "epoch": 0.9, + "learning_rate": 1.6418285404137486e-06, + "loss": 0.9385, + "step": 35095 + }, + { + "epoch": 0.9, + "learning_rate": 1.641807321130948e-06, + "loss": 1.0312, + "step": 35096 + }, + { + "epoch": 0.9, + "learning_rate": 1.6417861013567453e-06, + "loss": 0.7178, + "step": 35097 + }, + { + "epoch": 0.9, + "learning_rate": 1.6417648810911567e-06, + "loss": 0.8867, + "step": 35098 + }, + { + "epoch": 0.9, + "learning_rate": 1.6417436603341978e-06, + "loss": 0.7117, + "step": 35099 + }, + { + "epoch": 0.9, + "learning_rate": 1.6417224390858854e-06, + "loss": 0.626, + "step": 35100 + }, + { + "epoch": 0.9, + "learning_rate": 1.641701217346236e-06, + "loss": 0.7852, + "step": 35101 + }, + { + "epoch": 0.9, + "learning_rate": 1.6416799951152651e-06, + "loss": 0.6909, + "step": 35102 + }, + { + "epoch": 0.9, + "learning_rate": 1.6416587723929894e-06, + "loss": 0.8916, + "step": 35103 + }, + { + "epoch": 0.9, + "learning_rate": 1.6416375491794253e-06, + "loss": 0.8369, + "step": 35104 + }, + { + "epoch": 0.9, + "learning_rate": 1.6416163254745887e-06, + "loss": 0.7222, + "step": 35105 + }, + { + "epoch": 0.9, + "learning_rate": 1.641595101278496e-06, + "loss": 1.0264, + "step": 35106 + }, + { + "epoch": 0.9, + "learning_rate": 1.6415738765911633e-06, + "loss": 0.8701, + "step": 35107 + }, + { + "epoch": 0.9, + "learning_rate": 1.6415526514126073e-06, + "loss": 0.9453, + "step": 35108 + }, + { + "epoch": 0.9, + "learning_rate": 1.6415314257428437e-06, + "loss": 1.0361, + "step": 35109 + }, + { + "epoch": 0.9, + "learning_rate": 1.6415101995818889e-06, + "loss": 0.8223, + "step": 35110 + }, + { + "epoch": 0.9, + "learning_rate": 1.6414889729297594e-06, + "loss": 0.8555, + "step": 35111 + }, + { + "epoch": 0.9, + "learning_rate": 1.6414677457864712e-06, + "loss": 1.0156, + "step": 35112 + }, + { + "epoch": 0.9, + "learning_rate": 1.641446518152041e-06, + "loss": 1.0029, + "step": 35113 + }, + { + "epoch": 0.9, + "learning_rate": 1.641425290026484e-06, + "loss": 0.8262, + "step": 35114 + }, + { + "epoch": 0.9, + "learning_rate": 1.6414040614098177e-06, + "loss": 0.8252, + "step": 35115 + }, + { + "epoch": 0.9, + "learning_rate": 1.6413828323020575e-06, + "loss": 0.7471, + "step": 35116 + }, + { + "epoch": 0.9, + "learning_rate": 1.64136160270322e-06, + "loss": 0.8896, + "step": 35117 + }, + { + "epoch": 0.9, + "learning_rate": 1.6413403726133215e-06, + "loss": 1.083, + "step": 35118 + }, + { + "epoch": 0.9, + "learning_rate": 1.6413191420323783e-06, + "loss": 0.8398, + "step": 35119 + }, + { + "epoch": 0.9, + "learning_rate": 1.6412979109604063e-06, + "loss": 0.7324, + "step": 35120 + }, + { + "epoch": 0.9, + "learning_rate": 1.6412766793974222e-06, + "loss": 0.958, + "step": 35121 + }, + { + "epoch": 0.9, + "learning_rate": 1.6412554473434417e-06, + "loss": 0.9941, + "step": 35122 + }, + { + "epoch": 0.9, + "learning_rate": 1.6412342147984817e-06, + "loss": 0.9204, + "step": 35123 + }, + { + "epoch": 0.9, + "learning_rate": 1.641212981762558e-06, + "loss": 0.8154, + "step": 35124 + }, + { + "epoch": 0.9, + "learning_rate": 1.641191748235687e-06, + "loss": 0.6792, + "step": 35125 + }, + { + "epoch": 0.9, + "learning_rate": 1.6411705142178849e-06, + "loss": 1.0547, + "step": 35126 + }, + { + "epoch": 0.9, + "learning_rate": 1.6411492797091682e-06, + "loss": 0.7646, + "step": 35127 + }, + { + "epoch": 0.9, + "learning_rate": 1.641128044709553e-06, + "loss": 0.8301, + "step": 35128 + }, + { + "epoch": 0.9, + "learning_rate": 1.6411068092190555e-06, + "loss": 1.1201, + "step": 35129 + }, + { + "epoch": 0.9, + "learning_rate": 1.6410855732376918e-06, + "loss": 1.1445, + "step": 35130 + }, + { + "epoch": 0.9, + "learning_rate": 1.6410643367654781e-06, + "loss": 0.8301, + "step": 35131 + }, + { + "epoch": 0.9, + "learning_rate": 1.6410430998024314e-06, + "loss": 0.8975, + "step": 35132 + }, + { + "epoch": 0.9, + "learning_rate": 1.6410218623485673e-06, + "loss": 0.7217, + "step": 35133 + }, + { + "epoch": 0.9, + "learning_rate": 1.6410006244039026e-06, + "loss": 0.7178, + "step": 35134 + }, + { + "epoch": 0.9, + "learning_rate": 1.640979385968453e-06, + "loss": 0.9736, + "step": 35135 + }, + { + "epoch": 0.9, + "learning_rate": 1.6409581470422347e-06, + "loss": 0.9141, + "step": 35136 + }, + { + "epoch": 0.9, + "learning_rate": 1.6409369076252642e-06, + "loss": 0.9121, + "step": 35137 + }, + { + "epoch": 0.9, + "learning_rate": 1.6409156677175583e-06, + "loss": 0.7339, + "step": 35138 + }, + { + "epoch": 0.9, + "learning_rate": 1.6408944273191322e-06, + "loss": 0.875, + "step": 35139 + }, + { + "epoch": 0.9, + "learning_rate": 1.640873186430003e-06, + "loss": 0.9023, + "step": 35140 + }, + { + "epoch": 0.9, + "learning_rate": 1.6408519450501866e-06, + "loss": 0.7695, + "step": 35141 + }, + { + "epoch": 0.9, + "learning_rate": 1.640830703179699e-06, + "loss": 1.082, + "step": 35142 + }, + { + "epoch": 0.9, + "learning_rate": 1.6408094608185572e-06, + "loss": 0.5334, + "step": 35143 + }, + { + "epoch": 0.9, + "learning_rate": 1.6407882179667769e-06, + "loss": 0.8467, + "step": 35144 + }, + { + "epoch": 0.9, + "learning_rate": 1.6407669746243745e-06, + "loss": 0.8125, + "step": 35145 + }, + { + "epoch": 0.9, + "learning_rate": 1.6407457307913663e-06, + "loss": 0.9092, + "step": 35146 + }, + { + "epoch": 0.9, + "learning_rate": 1.6407244864677688e-06, + "loss": 0.8594, + "step": 35147 + }, + { + "epoch": 0.9, + "learning_rate": 1.6407032416535978e-06, + "loss": 0.9941, + "step": 35148 + }, + { + "epoch": 0.9, + "learning_rate": 1.64068199634887e-06, + "loss": 0.877, + "step": 35149 + }, + { + "epoch": 0.9, + "learning_rate": 1.6406607505536012e-06, + "loss": 0.7666, + "step": 35150 + }, + { + "epoch": 0.9, + "learning_rate": 1.640639504267808e-06, + "loss": 0.9551, + "step": 35151 + }, + { + "epoch": 0.9, + "learning_rate": 1.6406182574915066e-06, + "loss": 0.8115, + "step": 35152 + }, + { + "epoch": 0.9, + "learning_rate": 1.6405970102247134e-06, + "loss": 0.8945, + "step": 35153 + }, + { + "epoch": 0.9, + "learning_rate": 1.6405757624674444e-06, + "loss": 0.9175, + "step": 35154 + }, + { + "epoch": 0.9, + "learning_rate": 1.6405545142197159e-06, + "loss": 0.9521, + "step": 35155 + }, + { + "epoch": 0.9, + "learning_rate": 1.6405332654815442e-06, + "loss": 0.7378, + "step": 35156 + }, + { + "epoch": 0.9, + "learning_rate": 1.6405120162529458e-06, + "loss": 0.9805, + "step": 35157 + }, + { + "epoch": 0.9, + "learning_rate": 1.640490766533937e-06, + "loss": 0.8486, + "step": 35158 + }, + { + "epoch": 0.9, + "learning_rate": 1.6404695163245334e-06, + "loss": 0.9004, + "step": 35159 + }, + { + "epoch": 0.9, + "learning_rate": 1.640448265624752e-06, + "loss": 0.874, + "step": 35160 + }, + { + "epoch": 0.9, + "learning_rate": 1.640427014434609e-06, + "loss": 0.9014, + "step": 35161 + }, + { + "epoch": 0.9, + "learning_rate": 1.6404057627541201e-06, + "loss": 1.0771, + "step": 35162 + }, + { + "epoch": 0.9, + "learning_rate": 1.6403845105833024e-06, + "loss": 0.8486, + "step": 35163 + }, + { + "epoch": 0.9, + "learning_rate": 1.6403632579221713e-06, + "loss": 0.9482, + "step": 35164 + }, + { + "epoch": 0.9, + "learning_rate": 1.6403420047707438e-06, + "loss": 0.8516, + "step": 35165 + }, + { + "epoch": 0.9, + "learning_rate": 1.6403207511290353e-06, + "loss": 0.835, + "step": 35166 + }, + { + "epoch": 0.9, + "learning_rate": 1.640299496997063e-06, + "loss": 0.6279, + "step": 35167 + }, + { + "epoch": 0.9, + "learning_rate": 1.640278242374843e-06, + "loss": 0.9033, + "step": 35168 + }, + { + "epoch": 0.9, + "learning_rate": 1.6402569872623912e-06, + "loss": 0.9727, + "step": 35169 + }, + { + "epoch": 0.9, + "learning_rate": 1.6402357316597244e-06, + "loss": 0.7549, + "step": 35170 + }, + { + "epoch": 0.9, + "learning_rate": 1.640214475566858e-06, + "loss": 0.7939, + "step": 35171 + }, + { + "epoch": 0.9, + "learning_rate": 1.6401932189838092e-06, + "loss": 0.6001, + "step": 35172 + }, + { + "epoch": 0.9, + "learning_rate": 1.640171961910594e-06, + "loss": 0.8008, + "step": 35173 + }, + { + "epoch": 0.9, + "learning_rate": 1.6401507043472283e-06, + "loss": 1.0166, + "step": 35174 + }, + { + "epoch": 0.9, + "learning_rate": 1.6401294462937284e-06, + "loss": 0.9346, + "step": 35175 + }, + { + "epoch": 0.9, + "learning_rate": 1.6401081877501113e-06, + "loss": 0.8838, + "step": 35176 + }, + { + "epoch": 0.9, + "learning_rate": 1.6400869287163925e-06, + "loss": 0.9092, + "step": 35177 + }, + { + "epoch": 0.9, + "learning_rate": 1.6400656691925889e-06, + "loss": 0.7393, + "step": 35178 + }, + { + "epoch": 0.9, + "learning_rate": 1.6400444091787161e-06, + "loss": 1.2139, + "step": 35179 + }, + { + "epoch": 0.9, + "learning_rate": 1.6400231486747908e-06, + "loss": 0.7891, + "step": 35180 + }, + { + "epoch": 0.9, + "learning_rate": 1.6400018876808296e-06, + "loss": 0.7551, + "step": 35181 + }, + { + "epoch": 0.9, + "learning_rate": 1.6399806261968477e-06, + "loss": 1.0254, + "step": 35182 + }, + { + "epoch": 0.9, + "learning_rate": 1.6399593642228626e-06, + "loss": 0.958, + "step": 35183 + }, + { + "epoch": 0.9, + "learning_rate": 1.6399381017588896e-06, + "loss": 0.8828, + "step": 35184 + }, + { + "epoch": 0.9, + "learning_rate": 1.6399168388049458e-06, + "loss": 0.9053, + "step": 35185 + }, + { + "epoch": 0.9, + "learning_rate": 1.6398955753610468e-06, + "loss": 0.7695, + "step": 35186 + }, + { + "epoch": 0.9, + "learning_rate": 1.6398743114272096e-06, + "loss": 0.6487, + "step": 35187 + }, + { + "epoch": 0.9, + "learning_rate": 1.6398530470034495e-06, + "loss": 0.8638, + "step": 35188 + }, + { + "epoch": 0.9, + "learning_rate": 1.6398317820897838e-06, + "loss": 0.7881, + "step": 35189 + }, + { + "epoch": 0.9, + "learning_rate": 1.6398105166862282e-06, + "loss": 0.6929, + "step": 35190 + }, + { + "epoch": 0.9, + "learning_rate": 1.6397892507927988e-06, + "loss": 0.9883, + "step": 35191 + }, + { + "epoch": 0.9, + "learning_rate": 1.6397679844095125e-06, + "loss": 0.8896, + "step": 35192 + }, + { + "epoch": 0.9, + "learning_rate": 1.6397467175363854e-06, + "loss": 0.7725, + "step": 35193 + }, + { + "epoch": 0.9, + "learning_rate": 1.6397254501734335e-06, + "loss": 0.7021, + "step": 35194 + }, + { + "epoch": 0.9, + "learning_rate": 1.6397041823206732e-06, + "loss": 0.8457, + "step": 35195 + }, + { + "epoch": 0.9, + "learning_rate": 1.6396829139781207e-06, + "loss": 0.958, + "step": 35196 + }, + { + "epoch": 0.9, + "learning_rate": 1.6396616451457926e-06, + "loss": 0.6938, + "step": 35197 + }, + { + "epoch": 0.9, + "learning_rate": 1.639640375823705e-06, + "loss": 0.9014, + "step": 35198 + }, + { + "epoch": 0.9, + "learning_rate": 1.6396191060118743e-06, + "loss": 0.9434, + "step": 35199 + }, + { + "epoch": 0.9, + "learning_rate": 1.6395978357103163e-06, + "loss": 0.8936, + "step": 35200 + }, + { + "epoch": 0.9, + "learning_rate": 1.6395765649190477e-06, + "loss": 0.6826, + "step": 35201 + }, + { + "epoch": 0.9, + "learning_rate": 1.639555293638085e-06, + "loss": 0.8564, + "step": 35202 + }, + { + "epoch": 0.9, + "learning_rate": 1.639534021867444e-06, + "loss": 0.6855, + "step": 35203 + }, + { + "epoch": 0.9, + "learning_rate": 1.6395127496071415e-06, + "loss": 0.8877, + "step": 35204 + }, + { + "epoch": 0.9, + "learning_rate": 1.6394914768571932e-06, + "loss": 0.7603, + "step": 35205 + }, + { + "epoch": 0.9, + "learning_rate": 1.6394702036176157e-06, + "loss": 1.0459, + "step": 35206 + }, + { + "epoch": 0.9, + "learning_rate": 1.6394489298884254e-06, + "loss": 0.7656, + "step": 35207 + }, + { + "epoch": 0.9, + "learning_rate": 1.6394276556696384e-06, + "loss": 0.8232, + "step": 35208 + }, + { + "epoch": 0.9, + "learning_rate": 1.639406380961271e-06, + "loss": 0.8125, + "step": 35209 + }, + { + "epoch": 0.9, + "learning_rate": 1.6393851057633397e-06, + "loss": 0.9463, + "step": 35210 + }, + { + "epoch": 0.9, + "learning_rate": 1.6393638300758603e-06, + "loss": 0.7568, + "step": 35211 + }, + { + "epoch": 0.9, + "learning_rate": 1.6393425538988498e-06, + "loss": 0.6707, + "step": 35212 + }, + { + "epoch": 0.9, + "learning_rate": 1.639321277232324e-06, + "loss": 0.8809, + "step": 35213 + }, + { + "epoch": 0.9, + "learning_rate": 1.639300000076299e-06, + "loss": 0.6279, + "step": 35214 + }, + { + "epoch": 0.9, + "learning_rate": 1.6392787224307917e-06, + "loss": 0.9902, + "step": 35215 + }, + { + "epoch": 0.9, + "learning_rate": 1.6392574442958177e-06, + "loss": 0.814, + "step": 35216 + }, + { + "epoch": 0.9, + "learning_rate": 1.639236165671394e-06, + "loss": 1.0566, + "step": 35217 + }, + { + "epoch": 0.9, + "learning_rate": 1.6392148865575367e-06, + "loss": 0.9414, + "step": 35218 + }, + { + "epoch": 0.9, + "learning_rate": 1.6391936069542616e-06, + "loss": 0.8169, + "step": 35219 + }, + { + "epoch": 0.9, + "learning_rate": 1.6391723268615855e-06, + "loss": 0.8765, + "step": 35220 + }, + { + "epoch": 0.9, + "learning_rate": 1.6391510462795247e-06, + "loss": 0.8145, + "step": 35221 + }, + { + "epoch": 0.9, + "learning_rate": 1.639129765208095e-06, + "loss": 0.9492, + "step": 35222 + }, + { + "epoch": 0.9, + "learning_rate": 1.6391084836473132e-06, + "loss": 0.917, + "step": 35223 + }, + { + "epoch": 0.9, + "learning_rate": 1.6390872015971955e-06, + "loss": 0.9219, + "step": 35224 + }, + { + "epoch": 0.9, + "learning_rate": 1.6390659190577577e-06, + "loss": 0.6758, + "step": 35225 + }, + { + "epoch": 0.9, + "learning_rate": 1.639044636029017e-06, + "loss": 0.8525, + "step": 35226 + }, + { + "epoch": 0.9, + "learning_rate": 1.639023352510989e-06, + "loss": 0.6753, + "step": 35227 + }, + { + "epoch": 0.9, + "learning_rate": 1.6390020685036905e-06, + "loss": 0.834, + "step": 35228 + }, + { + "epoch": 0.9, + "learning_rate": 1.6389807840071372e-06, + "loss": 0.8604, + "step": 35229 + }, + { + "epoch": 0.9, + "learning_rate": 1.6389594990213457e-06, + "loss": 0.8936, + "step": 35230 + }, + { + "epoch": 0.9, + "learning_rate": 1.6389382135463323e-06, + "loss": 0.8555, + "step": 35231 + }, + { + "epoch": 0.9, + "learning_rate": 1.6389169275821132e-06, + "loss": 0.9258, + "step": 35232 + }, + { + "epoch": 0.9, + "learning_rate": 1.638895641128705e-06, + "loss": 0.667, + "step": 35233 + }, + { + "epoch": 0.9, + "learning_rate": 1.6388743541861239e-06, + "loss": 0.8975, + "step": 35234 + }, + { + "epoch": 0.9, + "learning_rate": 1.6388530667543856e-06, + "loss": 0.9277, + "step": 35235 + }, + { + "epoch": 0.9, + "learning_rate": 1.638831778833507e-06, + "loss": 0.9922, + "step": 35236 + }, + { + "epoch": 0.9, + "learning_rate": 1.6388104904235046e-06, + "loss": 0.7549, + "step": 35237 + }, + { + "epoch": 0.9, + "learning_rate": 1.6387892015243945e-06, + "loss": 0.7266, + "step": 35238 + }, + { + "epoch": 0.9, + "learning_rate": 1.6387679121361925e-06, + "loss": 0.8374, + "step": 35239 + }, + { + "epoch": 0.9, + "learning_rate": 1.6387466222589153e-06, + "loss": 0.8779, + "step": 35240 + }, + { + "epoch": 0.9, + "learning_rate": 1.6387253318925791e-06, + "loss": 0.793, + "step": 35241 + }, + { + "epoch": 0.9, + "learning_rate": 1.6387040410372007e-06, + "loss": 1.0479, + "step": 35242 + }, + { + "epoch": 0.9, + "learning_rate": 1.6386827496927957e-06, + "loss": 1.1123, + "step": 35243 + }, + { + "epoch": 0.9, + "learning_rate": 1.6386614578593807e-06, + "loss": 0.8643, + "step": 35244 + }, + { + "epoch": 0.9, + "learning_rate": 1.638640165536972e-06, + "loss": 0.6284, + "step": 35245 + }, + { + "epoch": 0.9, + "learning_rate": 1.638618872725586e-06, + "loss": 0.9121, + "step": 35246 + }, + { + "epoch": 0.9, + "learning_rate": 1.6385975794252388e-06, + "loss": 1.0576, + "step": 35247 + }, + { + "epoch": 0.9, + "learning_rate": 1.6385762856359467e-06, + "loss": 0.6167, + "step": 35248 + }, + { + "epoch": 0.9, + "learning_rate": 1.6385549913577261e-06, + "loss": 0.7773, + "step": 35249 + }, + { + "epoch": 0.9, + "learning_rate": 1.6385336965905934e-06, + "loss": 0.7881, + "step": 35250 + }, + { + "epoch": 0.9, + "learning_rate": 1.6385124013345647e-06, + "loss": 0.8721, + "step": 35251 + }, + { + "epoch": 0.9, + "learning_rate": 1.6384911055896566e-06, + "loss": 0.958, + "step": 35252 + }, + { + "epoch": 0.9, + "learning_rate": 1.638469809355885e-06, + "loss": 0.8545, + "step": 35253 + }, + { + "epoch": 0.9, + "learning_rate": 1.6384485126332667e-06, + "loss": 0.9082, + "step": 35254 + }, + { + "epoch": 0.9, + "learning_rate": 1.6384272154218177e-06, + "loss": 0.5962, + "step": 35255 + }, + { + "epoch": 0.9, + "learning_rate": 1.6384059177215544e-06, + "loss": 0.7417, + "step": 35256 + }, + { + "epoch": 0.9, + "learning_rate": 1.6383846195324926e-06, + "loss": 0.7163, + "step": 35257 + }, + { + "epoch": 0.9, + "learning_rate": 1.6383633208546495e-06, + "loss": 0.783, + "step": 35258 + }, + { + "epoch": 0.9, + "learning_rate": 1.6383420216880408e-06, + "loss": 0.8193, + "step": 35259 + }, + { + "epoch": 0.9, + "learning_rate": 1.6383207220326826e-06, + "loss": 0.7417, + "step": 35260 + }, + { + "epoch": 0.9, + "learning_rate": 1.638299421888592e-06, + "loss": 1.0186, + "step": 35261 + }, + { + "epoch": 0.9, + "learning_rate": 1.6382781212557849e-06, + "loss": 0.4438, + "step": 35262 + }, + { + "epoch": 0.9, + "learning_rate": 1.6382568201342775e-06, + "loss": 0.916, + "step": 35263 + }, + { + "epoch": 0.9, + "learning_rate": 1.638235518524086e-06, + "loss": 1.0137, + "step": 35264 + }, + { + "epoch": 0.9, + "learning_rate": 1.6382142164252272e-06, + "loss": 0.9717, + "step": 35265 + }, + { + "epoch": 0.9, + "learning_rate": 1.6381929138377171e-06, + "loss": 0.915, + "step": 35266 + }, + { + "epoch": 0.9, + "learning_rate": 1.638171610761572e-06, + "loss": 0.8047, + "step": 35267 + }, + { + "epoch": 0.9, + "learning_rate": 1.6381503071968084e-06, + "loss": 0.6865, + "step": 35268 + }, + { + "epoch": 0.9, + "learning_rate": 1.638129003143442e-06, + "loss": 0.8506, + "step": 35269 + }, + { + "epoch": 0.9, + "learning_rate": 1.63810769860149e-06, + "loss": 0.8213, + "step": 35270 + }, + { + "epoch": 0.9, + "learning_rate": 1.6380863935709679e-06, + "loss": 0.7297, + "step": 35271 + }, + { + "epoch": 0.9, + "learning_rate": 1.6380650880518924e-06, + "loss": 0.9199, + "step": 35272 + }, + { + "epoch": 0.9, + "learning_rate": 1.6380437820442804e-06, + "loss": 0.8174, + "step": 35273 + }, + { + "epoch": 0.9, + "learning_rate": 1.638022475548147e-06, + "loss": 0.6479, + "step": 35274 + }, + { + "epoch": 0.9, + "learning_rate": 1.6380011685635092e-06, + "loss": 0.8662, + "step": 35275 + }, + { + "epoch": 0.9, + "learning_rate": 1.6379798610903834e-06, + "loss": 0.6294, + "step": 35276 + }, + { + "epoch": 0.9, + "learning_rate": 1.6379585531287856e-06, + "loss": 0.8584, + "step": 35277 + }, + { + "epoch": 0.9, + "learning_rate": 1.6379372446787328e-06, + "loss": 0.9453, + "step": 35278 + }, + { + "epoch": 0.9, + "learning_rate": 1.6379159357402402e-06, + "loss": 0.6133, + "step": 35279 + }, + { + "epoch": 0.9, + "learning_rate": 1.637894626313325e-06, + "loss": 0.5513, + "step": 35280 + }, + { + "epoch": 0.9, + "learning_rate": 1.6378733163980028e-06, + "loss": 0.8242, + "step": 35281 + }, + { + "epoch": 0.9, + "learning_rate": 1.6378520059942906e-06, + "loss": 1.0186, + "step": 35282 + }, + { + "epoch": 0.9, + "learning_rate": 1.6378306951022048e-06, + "loss": 0.8779, + "step": 35283 + }, + { + "epoch": 0.9, + "learning_rate": 1.6378093837217609e-06, + "loss": 0.7441, + "step": 35284 + }, + { + "epoch": 0.9, + "learning_rate": 1.6377880718529758e-06, + "loss": 0.8027, + "step": 35285 + }, + { + "epoch": 0.9, + "learning_rate": 1.6377667594958658e-06, + "loss": 0.9824, + "step": 35286 + }, + { + "epoch": 0.9, + "learning_rate": 1.6377454466504469e-06, + "loss": 0.793, + "step": 35287 + }, + { + "epoch": 0.9, + "learning_rate": 1.6377241333167357e-06, + "loss": 0.7422, + "step": 35288 + }, + { + "epoch": 0.9, + "learning_rate": 1.6377028194947487e-06, + "loss": 0.9531, + "step": 35289 + }, + { + "epoch": 0.9, + "learning_rate": 1.6376815051845017e-06, + "loss": 0.8882, + "step": 35290 + }, + { + "epoch": 0.9, + "learning_rate": 1.6376601903860111e-06, + "loss": 0.8818, + "step": 35291 + }, + { + "epoch": 0.9, + "learning_rate": 1.6376388750992937e-06, + "loss": 0.8701, + "step": 35292 + }, + { + "epoch": 0.9, + "learning_rate": 1.637617559324366e-06, + "loss": 0.7676, + "step": 35293 + }, + { + "epoch": 0.9, + "learning_rate": 1.6375962430612433e-06, + "loss": 0.8018, + "step": 35294 + }, + { + "epoch": 0.9, + "learning_rate": 1.6375749263099424e-06, + "loss": 0.9248, + "step": 35295 + }, + { + "epoch": 0.9, + "learning_rate": 1.6375536090704799e-06, + "loss": 0.718, + "step": 35296 + }, + { + "epoch": 0.9, + "learning_rate": 1.6375322913428719e-06, + "loss": 0.9902, + "step": 35297 + }, + { + "epoch": 0.9, + "learning_rate": 1.6375109731271347e-06, + "loss": 0.8145, + "step": 35298 + }, + { + "epoch": 0.9, + "learning_rate": 1.6374896544232848e-06, + "loss": 1.0283, + "step": 35299 + }, + { + "epoch": 0.9, + "learning_rate": 1.637468335231338e-06, + "loss": 0.832, + "step": 35300 + }, + { + "epoch": 0.9, + "learning_rate": 1.6374470155513115e-06, + "loss": 0.9473, + "step": 35301 + }, + { + "epoch": 0.9, + "learning_rate": 1.637425695383221e-06, + "loss": 0.8516, + "step": 35302 + }, + { + "epoch": 0.9, + "learning_rate": 1.6374043747270827e-06, + "loss": 0.6699, + "step": 35303 + }, + { + "epoch": 0.9, + "learning_rate": 1.6373830535829135e-06, + "loss": 0.9316, + "step": 35304 + }, + { + "epoch": 0.9, + "learning_rate": 1.6373617319507288e-06, + "loss": 0.7463, + "step": 35305 + }, + { + "epoch": 0.9, + "learning_rate": 1.637340409830546e-06, + "loss": 0.6592, + "step": 35306 + }, + { + "epoch": 0.9, + "learning_rate": 1.637319087222381e-06, + "loss": 0.6699, + "step": 35307 + }, + { + "epoch": 0.9, + "learning_rate": 1.63729776412625e-06, + "loss": 0.8047, + "step": 35308 + }, + { + "epoch": 0.9, + "learning_rate": 1.6372764405421695e-06, + "loss": 0.5991, + "step": 35309 + }, + { + "epoch": 0.91, + "learning_rate": 1.6372551164701556e-06, + "loss": 0.8096, + "step": 35310 + }, + { + "epoch": 0.91, + "learning_rate": 1.6372337919102246e-06, + "loss": 0.6616, + "step": 35311 + }, + { + "epoch": 0.91, + "learning_rate": 1.6372124668623936e-06, + "loss": 0.7334, + "step": 35312 + }, + { + "epoch": 0.91, + "learning_rate": 1.6371911413266777e-06, + "loss": 1.0059, + "step": 35313 + }, + { + "epoch": 0.91, + "learning_rate": 1.6371698153030939e-06, + "loss": 1.0371, + "step": 35314 + }, + { + "epoch": 0.91, + "learning_rate": 1.6371484887916587e-06, + "loss": 0.8262, + "step": 35315 + }, + { + "epoch": 0.91, + "learning_rate": 1.637127161792388e-06, + "loss": 0.7812, + "step": 35316 + }, + { + "epoch": 0.91, + "learning_rate": 1.6371058343052986e-06, + "loss": 0.5088, + "step": 35317 + }, + { + "epoch": 0.91, + "learning_rate": 1.6370845063304065e-06, + "loss": 0.7944, + "step": 35318 + }, + { + "epoch": 0.91, + "learning_rate": 1.637063177867728e-06, + "loss": 0.7275, + "step": 35319 + }, + { + "epoch": 0.91, + "learning_rate": 1.6370418489172794e-06, + "loss": 0.6138, + "step": 35320 + }, + { + "epoch": 0.91, + "learning_rate": 1.6370205194790771e-06, + "loss": 0.9619, + "step": 35321 + }, + { + "epoch": 0.91, + "learning_rate": 1.6369991895531378e-06, + "loss": 0.9199, + "step": 35322 + }, + { + "epoch": 0.91, + "learning_rate": 1.636977859139477e-06, + "loss": 0.6738, + "step": 35323 + }, + { + "epoch": 0.91, + "learning_rate": 1.636956528238112e-06, + "loss": 1.0508, + "step": 35324 + }, + { + "epoch": 0.91, + "learning_rate": 1.6369351968490586e-06, + "loss": 0.8779, + "step": 35325 + }, + { + "epoch": 0.91, + "learning_rate": 1.636913864972333e-06, + "loss": 0.7002, + "step": 35326 + }, + { + "epoch": 0.91, + "learning_rate": 1.6368925326079521e-06, + "loss": 0.8887, + "step": 35327 + }, + { + "epoch": 0.91, + "learning_rate": 1.6368711997559318e-06, + "loss": 0.9912, + "step": 35328 + }, + { + "epoch": 0.91, + "learning_rate": 1.636849866416288e-06, + "loss": 0.8052, + "step": 35329 + }, + { + "epoch": 0.91, + "learning_rate": 1.636828532589038e-06, + "loss": 0.7588, + "step": 35330 + }, + { + "epoch": 0.91, + "learning_rate": 1.6368071982741975e-06, + "loss": 1.1348, + "step": 35331 + }, + { + "epoch": 0.91, + "learning_rate": 1.6367858634717834e-06, + "loss": 0.9883, + "step": 35332 + }, + { + "epoch": 0.91, + "learning_rate": 1.6367645281818114e-06, + "loss": 0.9189, + "step": 35333 + }, + { + "epoch": 0.91, + "learning_rate": 1.6367431924042978e-06, + "loss": 0.8887, + "step": 35334 + }, + { + "epoch": 0.91, + "learning_rate": 1.6367218561392594e-06, + "loss": 1.041, + "step": 35335 + }, + { + "epoch": 0.91, + "learning_rate": 1.6367005193867125e-06, + "loss": 0.75, + "step": 35336 + }, + { + "epoch": 0.91, + "learning_rate": 1.6366791821466733e-06, + "loss": 0.5796, + "step": 35337 + }, + { + "epoch": 0.91, + "learning_rate": 1.6366578444191582e-06, + "loss": 0.9961, + "step": 35338 + }, + { + "epoch": 0.91, + "learning_rate": 1.6366365062041832e-06, + "loss": 0.7666, + "step": 35339 + }, + { + "epoch": 0.91, + "learning_rate": 1.6366151675017647e-06, + "loss": 0.832, + "step": 35340 + }, + { + "epoch": 0.91, + "learning_rate": 1.6365938283119194e-06, + "loss": 0.9805, + "step": 35341 + }, + { + "epoch": 0.91, + "learning_rate": 1.6365724886346639e-06, + "loss": 0.6187, + "step": 35342 + }, + { + "epoch": 0.91, + "learning_rate": 1.6365511484700137e-06, + "loss": 0.7124, + "step": 35343 + }, + { + "epoch": 0.91, + "learning_rate": 1.6365298078179856e-06, + "loss": 0.7773, + "step": 35344 + }, + { + "epoch": 0.91, + "learning_rate": 1.6365084666785957e-06, + "loss": 0.9512, + "step": 35345 + }, + { + "epoch": 0.91, + "learning_rate": 1.636487125051861e-06, + "loss": 1.0723, + "step": 35346 + }, + { + "epoch": 0.91, + "learning_rate": 1.6364657829377973e-06, + "loss": 0.752, + "step": 35347 + }, + { + "epoch": 0.91, + "learning_rate": 1.636444440336421e-06, + "loss": 0.8281, + "step": 35348 + }, + { + "epoch": 0.91, + "learning_rate": 1.6364230972477482e-06, + "loss": 1.0254, + "step": 35349 + }, + { + "epoch": 0.91, + "learning_rate": 1.6364017536717954e-06, + "loss": 0.6978, + "step": 35350 + }, + { + "epoch": 0.91, + "learning_rate": 1.6363804096085793e-06, + "loss": 0.9697, + "step": 35351 + }, + { + "epoch": 0.91, + "learning_rate": 1.6363590650581162e-06, + "loss": 0.8291, + "step": 35352 + }, + { + "epoch": 0.91, + "learning_rate": 1.6363377200204221e-06, + "loss": 0.8062, + "step": 35353 + }, + { + "epoch": 0.91, + "learning_rate": 1.636316374495513e-06, + "loss": 0.9414, + "step": 35354 + }, + { + "epoch": 0.91, + "learning_rate": 1.636295028483406e-06, + "loss": 0.9502, + "step": 35355 + }, + { + "epoch": 0.91, + "learning_rate": 1.6362736819841172e-06, + "loss": 1.2451, + "step": 35356 + }, + { + "epoch": 0.91, + "learning_rate": 1.6362523349976631e-06, + "loss": 0.8867, + "step": 35357 + }, + { + "epoch": 0.91, + "learning_rate": 1.6362309875240597e-06, + "loss": 0.7905, + "step": 35358 + }, + { + "epoch": 0.91, + "learning_rate": 1.6362096395633233e-06, + "loss": 0.7852, + "step": 35359 + }, + { + "epoch": 0.91, + "learning_rate": 1.6361882911154706e-06, + "loss": 0.8164, + "step": 35360 + }, + { + "epoch": 0.91, + "learning_rate": 1.6361669421805178e-06, + "loss": 0.8916, + "step": 35361 + }, + { + "epoch": 0.91, + "learning_rate": 1.6361455927584813e-06, + "loss": 0.9141, + "step": 35362 + }, + { + "epoch": 0.91, + "learning_rate": 1.636124242849377e-06, + "loss": 0.832, + "step": 35363 + }, + { + "epoch": 0.91, + "learning_rate": 1.6361028924532221e-06, + "loss": 0.6985, + "step": 35364 + }, + { + "epoch": 0.91, + "learning_rate": 1.6360815415700322e-06, + "loss": 0.9185, + "step": 35365 + }, + { + "epoch": 0.91, + "learning_rate": 1.6360601901998239e-06, + "loss": 0.9404, + "step": 35366 + }, + { + "epoch": 0.91, + "learning_rate": 1.6360388383426135e-06, + "loss": 0.874, + "step": 35367 + }, + { + "epoch": 0.91, + "learning_rate": 1.6360174859984175e-06, + "loss": 1.0293, + "step": 35368 + }, + { + "epoch": 0.91, + "learning_rate": 1.6359961331672523e-06, + "loss": 0.709, + "step": 35369 + }, + { + "epoch": 0.91, + "learning_rate": 1.6359747798491338e-06, + "loss": 0.9492, + "step": 35370 + }, + { + "epoch": 0.91, + "learning_rate": 1.6359534260440789e-06, + "loss": 0.627, + "step": 35371 + }, + { + "epoch": 0.91, + "learning_rate": 1.6359320717521037e-06, + "loss": 0.8008, + "step": 35372 + }, + { + "epoch": 0.91, + "learning_rate": 1.6359107169732243e-06, + "loss": 0.9736, + "step": 35373 + }, + { + "epoch": 0.91, + "learning_rate": 1.6358893617074573e-06, + "loss": 0.9424, + "step": 35374 + }, + { + "epoch": 0.91, + "learning_rate": 1.6358680059548193e-06, + "loss": 0.7349, + "step": 35375 + }, + { + "epoch": 0.91, + "learning_rate": 1.6358466497153263e-06, + "loss": 0.6035, + "step": 35376 + }, + { + "epoch": 0.91, + "learning_rate": 1.635825292988995e-06, + "loss": 0.5889, + "step": 35377 + }, + { + "epoch": 0.91, + "learning_rate": 1.6358039357758414e-06, + "loss": 0.8428, + "step": 35378 + }, + { + "epoch": 0.91, + "learning_rate": 1.6357825780758816e-06, + "loss": 0.8252, + "step": 35379 + }, + { + "epoch": 0.91, + "learning_rate": 1.6357612198891327e-06, + "loss": 0.604, + "step": 35380 + }, + { + "epoch": 0.91, + "learning_rate": 1.6357398612156103e-06, + "loss": 0.8652, + "step": 35381 + }, + { + "epoch": 0.91, + "learning_rate": 1.6357185020553316e-06, + "loss": 0.7461, + "step": 35382 + }, + { + "epoch": 0.91, + "learning_rate": 1.6356971424083123e-06, + "loss": 0.6738, + "step": 35383 + }, + { + "epoch": 0.91, + "learning_rate": 1.6356757822745688e-06, + "loss": 0.9043, + "step": 35384 + }, + { + "epoch": 0.91, + "learning_rate": 1.6356544216541178e-06, + "loss": 0.5308, + "step": 35385 + }, + { + "epoch": 0.91, + "learning_rate": 1.6356330605469753e-06, + "loss": 1.0449, + "step": 35386 + }, + { + "epoch": 0.91, + "learning_rate": 1.6356116989531576e-06, + "loss": 0.8789, + "step": 35387 + }, + { + "epoch": 0.91, + "learning_rate": 1.6355903368726813e-06, + "loss": 0.9165, + "step": 35388 + }, + { + "epoch": 0.91, + "learning_rate": 1.6355689743055629e-06, + "loss": 0.8867, + "step": 35389 + }, + { + "epoch": 0.91, + "learning_rate": 1.6355476112518185e-06, + "loss": 0.7925, + "step": 35390 + }, + { + "epoch": 0.91, + "learning_rate": 1.6355262477114646e-06, + "loss": 0.8994, + "step": 35391 + }, + { + "epoch": 0.91, + "learning_rate": 1.6355048836845175e-06, + "loss": 0.7217, + "step": 35392 + }, + { + "epoch": 0.91, + "learning_rate": 1.6354835191709934e-06, + "loss": 0.918, + "step": 35393 + }, + { + "epoch": 0.91, + "learning_rate": 1.6354621541709088e-06, + "loss": 1.0449, + "step": 35394 + }, + { + "epoch": 0.91, + "learning_rate": 1.63544078868428e-06, + "loss": 0.9258, + "step": 35395 + }, + { + "epoch": 0.91, + "learning_rate": 1.6354194227111233e-06, + "loss": 0.8145, + "step": 35396 + }, + { + "epoch": 0.91, + "learning_rate": 1.6353980562514555e-06, + "loss": 0.7151, + "step": 35397 + }, + { + "epoch": 0.91, + "learning_rate": 1.6353766893052926e-06, + "loss": 0.8994, + "step": 35398 + }, + { + "epoch": 0.91, + "learning_rate": 1.635355321872651e-06, + "loss": 0.8379, + "step": 35399 + }, + { + "epoch": 0.91, + "learning_rate": 1.6353339539535463e-06, + "loss": 0.9141, + "step": 35400 + }, + { + "epoch": 0.91, + "learning_rate": 1.6353125855479963e-06, + "loss": 0.7471, + "step": 35401 + }, + { + "epoch": 0.91, + "learning_rate": 1.6352912166560166e-06, + "loss": 0.6362, + "step": 35402 + }, + { + "epoch": 0.91, + "learning_rate": 1.6352698472776236e-06, + "loss": 1.0439, + "step": 35403 + }, + { + "epoch": 0.91, + "learning_rate": 1.635248477412834e-06, + "loss": 0.9736, + "step": 35404 + }, + { + "epoch": 0.91, + "learning_rate": 1.6352271070616632e-06, + "loss": 0.8311, + "step": 35405 + }, + { + "epoch": 0.91, + "learning_rate": 1.6352057362241284e-06, + "loss": 0.8755, + "step": 35406 + }, + { + "epoch": 0.91, + "learning_rate": 1.6351843649002462e-06, + "loss": 0.8789, + "step": 35407 + }, + { + "epoch": 0.91, + "learning_rate": 1.6351629930900321e-06, + "loss": 0.7747, + "step": 35408 + }, + { + "epoch": 0.91, + "learning_rate": 1.6351416207935032e-06, + "loss": 0.7666, + "step": 35409 + }, + { + "epoch": 0.91, + "learning_rate": 1.6351202480106751e-06, + "loss": 0.75, + "step": 35410 + }, + { + "epoch": 0.91, + "learning_rate": 1.635098874741565e-06, + "loss": 0.7888, + "step": 35411 + }, + { + "epoch": 0.91, + "learning_rate": 1.635077500986189e-06, + "loss": 0.8242, + "step": 35412 + }, + { + "epoch": 0.91, + "learning_rate": 1.6350561267445632e-06, + "loss": 0.8098, + "step": 35413 + }, + { + "epoch": 0.91, + "learning_rate": 1.635034752016704e-06, + "loss": 0.876, + "step": 35414 + }, + { + "epoch": 0.91, + "learning_rate": 1.635013376802628e-06, + "loss": 0.9395, + "step": 35415 + }, + { + "epoch": 0.91, + "learning_rate": 1.6349920011023516e-06, + "loss": 0.8877, + "step": 35416 + }, + { + "epoch": 0.91, + "learning_rate": 1.634970624915891e-06, + "loss": 0.9424, + "step": 35417 + }, + { + "epoch": 0.91, + "learning_rate": 1.6349492482432623e-06, + "loss": 1.0205, + "step": 35418 + }, + { + "epoch": 0.91, + "learning_rate": 1.6349278710844822e-06, + "loss": 0.7061, + "step": 35419 + }, + { + "epoch": 0.91, + "learning_rate": 1.6349064934395673e-06, + "loss": 1.0098, + "step": 35420 + }, + { + "epoch": 0.91, + "learning_rate": 1.6348851153085336e-06, + "loss": 0.9414, + "step": 35421 + }, + { + "epoch": 0.91, + "learning_rate": 1.6348637366913976e-06, + "loss": 0.7305, + "step": 35422 + }, + { + "epoch": 0.91, + "learning_rate": 1.6348423575881753e-06, + "loss": 0.9062, + "step": 35423 + }, + { + "epoch": 0.91, + "learning_rate": 1.6348209779988837e-06, + "loss": 0.9131, + "step": 35424 + }, + { + "epoch": 0.91, + "learning_rate": 1.6347995979235388e-06, + "loss": 0.8496, + "step": 35425 + }, + { + "epoch": 0.91, + "learning_rate": 1.6347782173621568e-06, + "loss": 0.8398, + "step": 35426 + }, + { + "epoch": 0.91, + "learning_rate": 1.634756836314755e-06, + "loss": 0.8252, + "step": 35427 + }, + { + "epoch": 0.91, + "learning_rate": 1.6347354547813486e-06, + "loss": 0.7559, + "step": 35428 + }, + { + "epoch": 0.91, + "learning_rate": 1.6347140727619544e-06, + "loss": 0.8623, + "step": 35429 + }, + { + "epoch": 0.91, + "learning_rate": 1.6346926902565887e-06, + "loss": 0.8779, + "step": 35430 + }, + { + "epoch": 0.91, + "learning_rate": 1.6346713072652683e-06, + "loss": 0.5322, + "step": 35431 + }, + { + "epoch": 0.91, + "learning_rate": 1.634649923788009e-06, + "loss": 0.7314, + "step": 35432 + }, + { + "epoch": 0.91, + "learning_rate": 1.6346285398248276e-06, + "loss": 0.6641, + "step": 35433 + }, + { + "epoch": 0.91, + "learning_rate": 1.6346071553757404e-06, + "loss": 1.1748, + "step": 35434 + }, + { + "epoch": 0.91, + "learning_rate": 1.6345857704407636e-06, + "loss": 0.7227, + "step": 35435 + }, + { + "epoch": 0.91, + "learning_rate": 1.6345643850199136e-06, + "loss": 0.6941, + "step": 35436 + }, + { + "epoch": 0.91, + "learning_rate": 1.634542999113207e-06, + "loss": 1.0498, + "step": 35437 + }, + { + "epoch": 0.91, + "learning_rate": 1.6345216127206599e-06, + "loss": 0.8047, + "step": 35438 + }, + { + "epoch": 0.91, + "learning_rate": 1.6345002258422883e-06, + "loss": 0.8081, + "step": 35439 + }, + { + "epoch": 0.91, + "learning_rate": 1.6344788384781097e-06, + "loss": 0.7373, + "step": 35440 + }, + { + "epoch": 0.91, + "learning_rate": 1.6344574506281395e-06, + "loss": 0.8721, + "step": 35441 + }, + { + "epoch": 0.91, + "learning_rate": 1.6344360622923946e-06, + "loss": 0.9629, + "step": 35442 + }, + { + "epoch": 0.91, + "learning_rate": 1.634414673470891e-06, + "loss": 0.7539, + "step": 35443 + }, + { + "epoch": 0.91, + "learning_rate": 1.6343932841636455e-06, + "loss": 0.9111, + "step": 35444 + }, + { + "epoch": 0.91, + "learning_rate": 1.6343718943706742e-06, + "loss": 1.0186, + "step": 35445 + }, + { + "epoch": 0.91, + "learning_rate": 1.634350504091993e-06, + "loss": 0.9023, + "step": 35446 + }, + { + "epoch": 0.91, + "learning_rate": 1.6343291133276194e-06, + "loss": 0.8555, + "step": 35447 + }, + { + "epoch": 0.91, + "learning_rate": 1.634307722077569e-06, + "loss": 0.8428, + "step": 35448 + }, + { + "epoch": 0.91, + "learning_rate": 1.6342863303418582e-06, + "loss": 0.8301, + "step": 35449 + }, + { + "epoch": 0.91, + "learning_rate": 1.6342649381205036e-06, + "loss": 0.7861, + "step": 35450 + }, + { + "epoch": 0.91, + "learning_rate": 1.6342435454135215e-06, + "loss": 0.7803, + "step": 35451 + }, + { + "epoch": 0.91, + "learning_rate": 1.6342221522209285e-06, + "loss": 0.8311, + "step": 35452 + }, + { + "epoch": 0.91, + "learning_rate": 1.6342007585427403e-06, + "loss": 0.563, + "step": 35453 + }, + { + "epoch": 0.91, + "learning_rate": 1.634179364378974e-06, + "loss": 1.1055, + "step": 35454 + }, + { + "epoch": 0.91, + "learning_rate": 1.6341579697296459e-06, + "loss": 0.8311, + "step": 35455 + }, + { + "epoch": 0.91, + "learning_rate": 1.634136574594772e-06, + "loss": 1.0605, + "step": 35456 + }, + { + "epoch": 0.91, + "learning_rate": 1.6341151789743688e-06, + "loss": 0.9707, + "step": 35457 + }, + { + "epoch": 0.91, + "learning_rate": 1.634093782868453e-06, + "loss": 0.6287, + "step": 35458 + }, + { + "epoch": 0.91, + "learning_rate": 1.6340723862770405e-06, + "loss": 0.4653, + "step": 35459 + }, + { + "epoch": 0.91, + "learning_rate": 1.6340509892001479e-06, + "loss": 1.0098, + "step": 35460 + }, + { + "epoch": 0.91, + "learning_rate": 1.6340295916377917e-06, + "loss": 0.7383, + "step": 35461 + }, + { + "epoch": 0.91, + "learning_rate": 1.6340081935899886e-06, + "loss": 0.9365, + "step": 35462 + }, + { + "epoch": 0.91, + "learning_rate": 1.6339867950567542e-06, + "loss": 0.8193, + "step": 35463 + }, + { + "epoch": 0.91, + "learning_rate": 1.6339653960381052e-06, + "loss": 0.7471, + "step": 35464 + }, + { + "epoch": 0.91, + "learning_rate": 1.633943996534058e-06, + "loss": 0.8652, + "step": 35465 + }, + { + "epoch": 0.91, + "learning_rate": 1.6339225965446292e-06, + "loss": 0.7676, + "step": 35466 + }, + { + "epoch": 0.91, + "learning_rate": 1.6339011960698352e-06, + "loss": 0.8428, + "step": 35467 + }, + { + "epoch": 0.91, + "learning_rate": 1.6338797951096918e-06, + "loss": 1.0049, + "step": 35468 + }, + { + "epoch": 0.91, + "learning_rate": 1.6338583936642158e-06, + "loss": 0.9482, + "step": 35469 + }, + { + "epoch": 0.91, + "learning_rate": 1.6338369917334238e-06, + "loss": 0.7578, + "step": 35470 + }, + { + "epoch": 0.91, + "learning_rate": 1.633815589317332e-06, + "loss": 0.7822, + "step": 35471 + }, + { + "epoch": 0.91, + "learning_rate": 1.6337941864159567e-06, + "loss": 0.8022, + "step": 35472 + }, + { + "epoch": 0.91, + "learning_rate": 1.6337727830293143e-06, + "loss": 0.8906, + "step": 35473 + }, + { + "epoch": 0.91, + "learning_rate": 1.6337513791574211e-06, + "loss": 0.9551, + "step": 35474 + }, + { + "epoch": 0.91, + "learning_rate": 1.6337299748002937e-06, + "loss": 0.9546, + "step": 35475 + }, + { + "epoch": 0.91, + "learning_rate": 1.6337085699579485e-06, + "loss": 0.8076, + "step": 35476 + }, + { + "epoch": 0.91, + "learning_rate": 1.6336871646304019e-06, + "loss": 0.7793, + "step": 35477 + }, + { + "epoch": 0.91, + "learning_rate": 1.6336657588176697e-06, + "loss": 0.9414, + "step": 35478 + }, + { + "epoch": 0.91, + "learning_rate": 1.6336443525197691e-06, + "loss": 1.0723, + "step": 35479 + }, + { + "epoch": 0.91, + "learning_rate": 1.6336229457367158e-06, + "loss": 0.8447, + "step": 35480 + }, + { + "epoch": 0.91, + "learning_rate": 1.6336015384685272e-06, + "loss": 1.0527, + "step": 35481 + }, + { + "epoch": 0.91, + "learning_rate": 1.6335801307152188e-06, + "loss": 0.8271, + "step": 35482 + }, + { + "epoch": 0.91, + "learning_rate": 1.633558722476807e-06, + "loss": 0.8096, + "step": 35483 + }, + { + "epoch": 0.91, + "learning_rate": 1.6335373137533084e-06, + "loss": 0.9756, + "step": 35484 + }, + { + "epoch": 0.91, + "learning_rate": 1.6335159045447396e-06, + "loss": 0.8379, + "step": 35485 + }, + { + "epoch": 0.91, + "learning_rate": 1.6334944948511168e-06, + "loss": 0.7627, + "step": 35486 + }, + { + "epoch": 0.91, + "learning_rate": 1.6334730846724562e-06, + "loss": 0.835, + "step": 35487 + }, + { + "epoch": 0.91, + "learning_rate": 1.6334516740087746e-06, + "loss": 0.915, + "step": 35488 + }, + { + "epoch": 0.91, + "learning_rate": 1.633430262860088e-06, + "loss": 0.5811, + "step": 35489 + }, + { + "epoch": 0.91, + "learning_rate": 1.633408851226413e-06, + "loss": 0.8105, + "step": 35490 + }, + { + "epoch": 0.91, + "learning_rate": 1.633387439107766e-06, + "loss": 0.8496, + "step": 35491 + }, + { + "epoch": 0.91, + "learning_rate": 1.6333660265041639e-06, + "loss": 0.8721, + "step": 35492 + }, + { + "epoch": 0.91, + "learning_rate": 1.633344613415622e-06, + "loss": 0.9053, + "step": 35493 + }, + { + "epoch": 0.91, + "learning_rate": 1.633323199842157e-06, + "loss": 0.8701, + "step": 35494 + }, + { + "epoch": 0.91, + "learning_rate": 1.633301785783786e-06, + "loss": 0.8125, + "step": 35495 + }, + { + "epoch": 0.91, + "learning_rate": 1.6332803712405245e-06, + "loss": 0.5515, + "step": 35496 + }, + { + "epoch": 0.91, + "learning_rate": 1.6332589562123898e-06, + "loss": 0.8789, + "step": 35497 + }, + { + "epoch": 0.91, + "learning_rate": 1.633237540699398e-06, + "loss": 0.9326, + "step": 35498 + }, + { + "epoch": 0.91, + "learning_rate": 1.6332161247015645e-06, + "loss": 0.6948, + "step": 35499 + }, + { + "epoch": 0.91, + "learning_rate": 1.6331947082189074e-06, + "loss": 0.7959, + "step": 35500 + }, + { + "epoch": 0.91, + "learning_rate": 1.6331732912514418e-06, + "loss": 0.8047, + "step": 35501 + }, + { + "epoch": 0.91, + "learning_rate": 1.6331518737991846e-06, + "loss": 0.8091, + "step": 35502 + }, + { + "epoch": 0.91, + "learning_rate": 1.633130455862152e-06, + "loss": 0.6245, + "step": 35503 + }, + { + "epoch": 0.91, + "learning_rate": 1.6331090374403607e-06, + "loss": 1.0791, + "step": 35504 + }, + { + "epoch": 0.91, + "learning_rate": 1.6330876185338267e-06, + "loss": 0.8408, + "step": 35505 + }, + { + "epoch": 0.91, + "learning_rate": 1.6330661991425666e-06, + "loss": 0.8438, + "step": 35506 + }, + { + "epoch": 0.91, + "learning_rate": 1.6330447792665973e-06, + "loss": 0.8545, + "step": 35507 + }, + { + "epoch": 0.91, + "learning_rate": 1.6330233589059342e-06, + "loss": 0.8579, + "step": 35508 + }, + { + "epoch": 0.91, + "learning_rate": 1.6330019380605945e-06, + "loss": 0.7583, + "step": 35509 + }, + { + "epoch": 0.91, + "learning_rate": 1.6329805167305942e-06, + "loss": 0.7129, + "step": 35510 + }, + { + "epoch": 0.91, + "learning_rate": 1.6329590949159498e-06, + "loss": 1.1748, + "step": 35511 + }, + { + "epoch": 0.91, + "learning_rate": 1.6329376726166778e-06, + "loss": 0.7666, + "step": 35512 + }, + { + "epoch": 0.91, + "learning_rate": 1.6329162498327946e-06, + "loss": 0.874, + "step": 35513 + }, + { + "epoch": 0.91, + "learning_rate": 1.6328948265643166e-06, + "loss": 0.9346, + "step": 35514 + }, + { + "epoch": 0.91, + "learning_rate": 1.63287340281126e-06, + "loss": 0.7285, + "step": 35515 + }, + { + "epoch": 0.91, + "learning_rate": 1.6328519785736411e-06, + "loss": 0.7949, + "step": 35516 + }, + { + "epoch": 0.91, + "learning_rate": 1.6328305538514772e-06, + "loss": 0.7803, + "step": 35517 + }, + { + "epoch": 0.91, + "learning_rate": 1.6328091286447834e-06, + "loss": 0.8076, + "step": 35518 + }, + { + "epoch": 0.91, + "learning_rate": 1.6327877029535771e-06, + "loss": 0.9277, + "step": 35519 + }, + { + "epoch": 0.91, + "learning_rate": 1.632766276777874e-06, + "loss": 0.7212, + "step": 35520 + }, + { + "epoch": 0.91, + "learning_rate": 1.6327448501176911e-06, + "loss": 0.6763, + "step": 35521 + }, + { + "epoch": 0.91, + "learning_rate": 1.6327234229730444e-06, + "loss": 0.9785, + "step": 35522 + }, + { + "epoch": 0.91, + "learning_rate": 1.6327019953439506e-06, + "loss": 0.9385, + "step": 35523 + }, + { + "epoch": 0.91, + "learning_rate": 1.632680567230426e-06, + "loss": 0.8486, + "step": 35524 + }, + { + "epoch": 0.91, + "learning_rate": 1.632659138632487e-06, + "loss": 0.7944, + "step": 35525 + }, + { + "epoch": 0.91, + "learning_rate": 1.63263770955015e-06, + "loss": 0.8145, + "step": 35526 + }, + { + "epoch": 0.91, + "learning_rate": 1.6326162799834316e-06, + "loss": 0.6875, + "step": 35527 + }, + { + "epoch": 0.91, + "learning_rate": 1.6325948499323477e-06, + "loss": 0.8726, + "step": 35528 + }, + { + "epoch": 0.91, + "learning_rate": 1.6325734193969146e-06, + "loss": 0.6401, + "step": 35529 + }, + { + "epoch": 0.91, + "learning_rate": 1.6325519883771496e-06, + "loss": 0.8115, + "step": 35530 + }, + { + "epoch": 0.91, + "learning_rate": 1.6325305568730688e-06, + "loss": 0.9521, + "step": 35531 + }, + { + "epoch": 0.91, + "learning_rate": 1.6325091248846883e-06, + "loss": 0.8506, + "step": 35532 + }, + { + "epoch": 0.91, + "learning_rate": 1.6324876924120246e-06, + "loss": 0.7568, + "step": 35533 + }, + { + "epoch": 0.91, + "learning_rate": 1.6324662594550942e-06, + "loss": 0.8066, + "step": 35534 + }, + { + "epoch": 0.91, + "learning_rate": 1.6324448260139132e-06, + "loss": 0.7871, + "step": 35535 + }, + { + "epoch": 0.91, + "learning_rate": 1.6324233920884986e-06, + "loss": 1.0068, + "step": 35536 + }, + { + "epoch": 0.91, + "learning_rate": 1.6324019576788667e-06, + "loss": 0.8906, + "step": 35537 + }, + { + "epoch": 0.91, + "learning_rate": 1.632380522785033e-06, + "loss": 0.8379, + "step": 35538 + }, + { + "epoch": 0.91, + "learning_rate": 1.632359087407015e-06, + "loss": 0.8438, + "step": 35539 + }, + { + "epoch": 0.91, + "learning_rate": 1.6323376515448289e-06, + "loss": 0.6968, + "step": 35540 + }, + { + "epoch": 0.91, + "learning_rate": 1.6323162151984904e-06, + "loss": 0.8506, + "step": 35541 + }, + { + "epoch": 0.91, + "learning_rate": 1.632294778368017e-06, + "loss": 0.6729, + "step": 35542 + }, + { + "epoch": 0.91, + "learning_rate": 1.6322733410534245e-06, + "loss": 0.9268, + "step": 35543 + }, + { + "epoch": 0.91, + "learning_rate": 1.632251903254729e-06, + "loss": 0.7568, + "step": 35544 + }, + { + "epoch": 0.91, + "learning_rate": 1.6322304649719474e-06, + "loss": 0.9443, + "step": 35545 + }, + { + "epoch": 0.91, + "learning_rate": 1.6322090262050963e-06, + "loss": 1.0039, + "step": 35546 + }, + { + "epoch": 0.91, + "learning_rate": 1.6321875869541914e-06, + "loss": 0.8135, + "step": 35547 + }, + { + "epoch": 0.91, + "learning_rate": 1.6321661472192497e-06, + "loss": 0.8271, + "step": 35548 + }, + { + "epoch": 0.91, + "learning_rate": 1.6321447070002879e-06, + "loss": 0.8008, + "step": 35549 + }, + { + "epoch": 0.91, + "learning_rate": 1.6321232662973214e-06, + "loss": 0.8389, + "step": 35550 + }, + { + "epoch": 0.91, + "learning_rate": 1.6321018251103673e-06, + "loss": 0.7705, + "step": 35551 + }, + { + "epoch": 0.91, + "learning_rate": 1.632080383439442e-06, + "loss": 0.5488, + "step": 35552 + }, + { + "epoch": 0.91, + "learning_rate": 1.632058941284562e-06, + "loss": 0.9629, + "step": 35553 + }, + { + "epoch": 0.91, + "learning_rate": 1.6320374986457433e-06, + "loss": 0.8018, + "step": 35554 + }, + { + "epoch": 0.91, + "learning_rate": 1.6320160555230023e-06, + "loss": 0.917, + "step": 35555 + }, + { + "epoch": 0.91, + "learning_rate": 1.6319946119163559e-06, + "loss": 0.9116, + "step": 35556 + }, + { + "epoch": 0.91, + "learning_rate": 1.6319731678258207e-06, + "loss": 0.8687, + "step": 35557 + }, + { + "epoch": 0.91, + "learning_rate": 1.6319517232514122e-06, + "loss": 0.8975, + "step": 35558 + }, + { + "epoch": 0.91, + "learning_rate": 1.6319302781931472e-06, + "loss": 0.9082, + "step": 35559 + }, + { + "epoch": 0.91, + "learning_rate": 1.6319088326510427e-06, + "loss": 0.8062, + "step": 35560 + }, + { + "epoch": 0.91, + "learning_rate": 1.6318873866251143e-06, + "loss": 0.873, + "step": 35561 + }, + { + "epoch": 0.91, + "learning_rate": 1.6318659401153791e-06, + "loss": 0.9229, + "step": 35562 + }, + { + "epoch": 0.91, + "learning_rate": 1.6318444931218532e-06, + "loss": 0.8652, + "step": 35563 + }, + { + "epoch": 0.91, + "learning_rate": 1.6318230456445527e-06, + "loss": 0.8145, + "step": 35564 + }, + { + "epoch": 0.91, + "learning_rate": 1.6318015976834946e-06, + "loss": 0.8291, + "step": 35565 + }, + { + "epoch": 0.91, + "learning_rate": 1.6317801492386946e-06, + "loss": 0.7578, + "step": 35566 + }, + { + "epoch": 0.91, + "learning_rate": 1.6317587003101702e-06, + "loss": 0.8726, + "step": 35567 + }, + { + "epoch": 0.91, + "learning_rate": 1.6317372508979369e-06, + "loss": 0.696, + "step": 35568 + }, + { + "epoch": 0.91, + "learning_rate": 1.6317158010020115e-06, + "loss": 0.7939, + "step": 35569 + }, + { + "epoch": 0.91, + "learning_rate": 1.6316943506224104e-06, + "loss": 1.0225, + "step": 35570 + }, + { + "epoch": 0.91, + "learning_rate": 1.6316728997591497e-06, + "loss": 0.9287, + "step": 35571 + }, + { + "epoch": 0.91, + "learning_rate": 1.6316514484122465e-06, + "loss": 0.8486, + "step": 35572 + }, + { + "epoch": 0.91, + "learning_rate": 1.6316299965817168e-06, + "loss": 0.8721, + "step": 35573 + }, + { + "epoch": 0.91, + "learning_rate": 1.631608544267577e-06, + "loss": 0.8708, + "step": 35574 + }, + { + "epoch": 0.91, + "learning_rate": 1.6315870914698433e-06, + "loss": 0.6333, + "step": 35575 + }, + { + "epoch": 0.91, + "learning_rate": 1.6315656381885329e-06, + "loss": 0.6001, + "step": 35576 + }, + { + "epoch": 0.91, + "learning_rate": 1.6315441844236615e-06, + "loss": 0.8193, + "step": 35577 + }, + { + "epoch": 0.91, + "learning_rate": 1.6315227301752454e-06, + "loss": 0.584, + "step": 35578 + }, + { + "epoch": 0.91, + "learning_rate": 1.6315012754433017e-06, + "loss": 0.9424, + "step": 35579 + }, + { + "epoch": 0.91, + "learning_rate": 1.6314798202278466e-06, + "loss": 0.8613, + "step": 35580 + }, + { + "epoch": 0.91, + "learning_rate": 1.6314583645288962e-06, + "loss": 0.8975, + "step": 35581 + }, + { + "epoch": 0.91, + "learning_rate": 1.6314369083464676e-06, + "loss": 0.6929, + "step": 35582 + }, + { + "epoch": 0.91, + "learning_rate": 1.6314154516805766e-06, + "loss": 0.6714, + "step": 35583 + }, + { + "epoch": 0.91, + "learning_rate": 1.6313939945312396e-06, + "loss": 0.9443, + "step": 35584 + }, + { + "epoch": 0.91, + "learning_rate": 1.6313725368984731e-06, + "loss": 0.8579, + "step": 35585 + }, + { + "epoch": 0.91, + "learning_rate": 1.631351078782294e-06, + "loss": 0.9424, + "step": 35586 + }, + { + "epoch": 0.91, + "learning_rate": 1.6313296201827184e-06, + "loss": 0.8906, + "step": 35587 + }, + { + "epoch": 0.91, + "learning_rate": 1.631308161099763e-06, + "loss": 0.7988, + "step": 35588 + }, + { + "epoch": 0.91, + "learning_rate": 1.6312867015334434e-06, + "loss": 0.7666, + "step": 35589 + }, + { + "epoch": 0.91, + "learning_rate": 1.631265241483777e-06, + "loss": 0.8975, + "step": 35590 + }, + { + "epoch": 0.91, + "learning_rate": 1.6312437809507796e-06, + "loss": 1.0293, + "step": 35591 + }, + { + "epoch": 0.91, + "learning_rate": 1.6312223199344678e-06, + "loss": 0.8281, + "step": 35592 + }, + { + "epoch": 0.91, + "learning_rate": 1.6312008584348583e-06, + "loss": 0.8574, + "step": 35593 + }, + { + "epoch": 0.91, + "learning_rate": 1.6311793964519676e-06, + "loss": 0.6997, + "step": 35594 + }, + { + "epoch": 0.91, + "learning_rate": 1.6311579339858112e-06, + "loss": 0.7441, + "step": 35595 + }, + { + "epoch": 0.91, + "learning_rate": 1.6311364710364067e-06, + "loss": 0.9102, + "step": 35596 + }, + { + "epoch": 0.91, + "learning_rate": 1.6311150076037698e-06, + "loss": 0.7148, + "step": 35597 + }, + { + "epoch": 0.91, + "learning_rate": 1.631093543687917e-06, + "loss": 0.5958, + "step": 35598 + }, + { + "epoch": 0.91, + "learning_rate": 1.6310720792888653e-06, + "loss": 0.7622, + "step": 35599 + }, + { + "epoch": 0.91, + "learning_rate": 1.6310506144066306e-06, + "loss": 0.7656, + "step": 35600 + }, + { + "epoch": 0.91, + "learning_rate": 1.6310291490412296e-06, + "loss": 0.8262, + "step": 35601 + }, + { + "epoch": 0.91, + "learning_rate": 1.6310076831926781e-06, + "loss": 0.8037, + "step": 35602 + }, + { + "epoch": 0.91, + "learning_rate": 1.6309862168609936e-06, + "loss": 0.7012, + "step": 35603 + }, + { + "epoch": 0.91, + "learning_rate": 1.6309647500461914e-06, + "loss": 0.8545, + "step": 35604 + }, + { + "epoch": 0.91, + "learning_rate": 1.630943282748289e-06, + "loss": 0.6826, + "step": 35605 + }, + { + "epoch": 0.91, + "learning_rate": 1.6309218149673024e-06, + "loss": 0.75, + "step": 35606 + }, + { + "epoch": 0.91, + "learning_rate": 1.6309003467032473e-06, + "loss": 0.5825, + "step": 35607 + }, + { + "epoch": 0.91, + "learning_rate": 1.6308788779561412e-06, + "loss": 0.9102, + "step": 35608 + }, + { + "epoch": 0.91, + "learning_rate": 1.6308574087260004e-06, + "loss": 0.5508, + "step": 35609 + }, + { + "epoch": 0.91, + "learning_rate": 1.6308359390128408e-06, + "loss": 0.8662, + "step": 35610 + }, + { + "epoch": 0.91, + "learning_rate": 1.6308144688166792e-06, + "loss": 0.6008, + "step": 35611 + }, + { + "epoch": 0.91, + "learning_rate": 1.6307929981375318e-06, + "loss": 0.5984, + "step": 35612 + }, + { + "epoch": 0.91, + "learning_rate": 1.6307715269754154e-06, + "loss": 0.8604, + "step": 35613 + }, + { + "epoch": 0.91, + "learning_rate": 1.6307500553303463e-06, + "loss": 0.6636, + "step": 35614 + }, + { + "epoch": 0.91, + "learning_rate": 1.6307285832023406e-06, + "loss": 0.8506, + "step": 35615 + }, + { + "epoch": 0.91, + "learning_rate": 1.6307071105914156e-06, + "loss": 0.9365, + "step": 35616 + }, + { + "epoch": 0.91, + "learning_rate": 1.6306856374975868e-06, + "loss": 0.7803, + "step": 35617 + }, + { + "epoch": 0.91, + "learning_rate": 1.630664163920871e-06, + "loss": 0.7148, + "step": 35618 + }, + { + "epoch": 0.91, + "learning_rate": 1.6306426898612843e-06, + "loss": 0.8467, + "step": 35619 + }, + { + "epoch": 0.91, + "learning_rate": 1.6306212153188438e-06, + "loss": 0.9707, + "step": 35620 + }, + { + "epoch": 0.91, + "learning_rate": 1.630599740293566e-06, + "loss": 0.9668, + "step": 35621 + }, + { + "epoch": 0.91, + "learning_rate": 1.6305782647854666e-06, + "loss": 0.5068, + "step": 35622 + }, + { + "epoch": 0.91, + "learning_rate": 1.6305567887945623e-06, + "loss": 0.4688, + "step": 35623 + }, + { + "epoch": 0.91, + "learning_rate": 1.6305353123208701e-06, + "loss": 0.791, + "step": 35624 + }, + { + "epoch": 0.91, + "learning_rate": 1.6305138353644054e-06, + "loss": 0.916, + "step": 35625 + }, + { + "epoch": 0.91, + "learning_rate": 1.6304923579251857e-06, + "loss": 0.9521, + "step": 35626 + }, + { + "epoch": 0.91, + "learning_rate": 1.630470880003227e-06, + "loss": 0.7314, + "step": 35627 + }, + { + "epoch": 0.91, + "learning_rate": 1.6304494015985455e-06, + "loss": 0.832, + "step": 35628 + }, + { + "epoch": 0.91, + "learning_rate": 1.630427922711158e-06, + "loss": 1.0269, + "step": 35629 + }, + { + "epoch": 0.91, + "learning_rate": 1.630406443341081e-06, + "loss": 0.9424, + "step": 35630 + }, + { + "epoch": 0.91, + "learning_rate": 1.6303849634883305e-06, + "loss": 0.8984, + "step": 35631 + }, + { + "epoch": 0.91, + "learning_rate": 1.6303634831529232e-06, + "loss": 0.998, + "step": 35632 + }, + { + "epoch": 0.91, + "learning_rate": 1.6303420023348755e-06, + "loss": 0.8291, + "step": 35633 + }, + { + "epoch": 0.91, + "learning_rate": 1.6303205210342043e-06, + "loss": 0.8613, + "step": 35634 + }, + { + "epoch": 0.91, + "learning_rate": 1.6302990392509256e-06, + "loss": 0.752, + "step": 35635 + }, + { + "epoch": 0.91, + "learning_rate": 1.6302775569850555e-06, + "loss": 0.6558, + "step": 35636 + }, + { + "epoch": 0.91, + "learning_rate": 1.6302560742366112e-06, + "loss": 0.8335, + "step": 35637 + }, + { + "epoch": 0.91, + "learning_rate": 1.6302345910056085e-06, + "loss": 1.1309, + "step": 35638 + }, + { + "epoch": 0.91, + "learning_rate": 1.6302131072920645e-06, + "loss": 0.835, + "step": 35639 + }, + { + "epoch": 0.91, + "learning_rate": 1.6301916230959952e-06, + "loss": 0.6473, + "step": 35640 + }, + { + "epoch": 0.91, + "learning_rate": 1.6301701384174172e-06, + "loss": 0.8955, + "step": 35641 + }, + { + "epoch": 0.91, + "learning_rate": 1.630148653256347e-06, + "loss": 0.6694, + "step": 35642 + }, + { + "epoch": 0.91, + "learning_rate": 1.6301271676128004e-06, + "loss": 0.7979, + "step": 35643 + }, + { + "epoch": 0.91, + "learning_rate": 1.6301056814867947e-06, + "loss": 0.9648, + "step": 35644 + }, + { + "epoch": 0.91, + "learning_rate": 1.6300841948783462e-06, + "loss": 0.8062, + "step": 35645 + }, + { + "epoch": 0.91, + "learning_rate": 1.6300627077874713e-06, + "loss": 0.8516, + "step": 35646 + }, + { + "epoch": 0.91, + "learning_rate": 1.6300412202141861e-06, + "loss": 0.9443, + "step": 35647 + }, + { + "epoch": 0.91, + "learning_rate": 1.6300197321585075e-06, + "loss": 0.6758, + "step": 35648 + }, + { + "epoch": 0.91, + "learning_rate": 1.6299982436204514e-06, + "loss": 0.8359, + "step": 35649 + }, + { + "epoch": 0.91, + "learning_rate": 1.629976754600035e-06, + "loss": 0.7021, + "step": 35650 + }, + { + "epoch": 0.91, + "learning_rate": 1.6299552650972744e-06, + "loss": 1.0361, + "step": 35651 + }, + { + "epoch": 0.91, + "learning_rate": 1.6299337751121858e-06, + "loss": 0.8066, + "step": 35652 + }, + { + "epoch": 0.91, + "learning_rate": 1.629912284644786e-06, + "loss": 0.8516, + "step": 35653 + }, + { + "epoch": 0.91, + "learning_rate": 1.629890793695091e-06, + "loss": 0.8799, + "step": 35654 + }, + { + "epoch": 0.91, + "learning_rate": 1.6298693022631177e-06, + "loss": 0.8408, + "step": 35655 + }, + { + "epoch": 0.91, + "learning_rate": 1.6298478103488828e-06, + "loss": 0.6284, + "step": 35656 + }, + { + "epoch": 0.91, + "learning_rate": 1.629826317952402e-06, + "loss": 0.8643, + "step": 35657 + }, + { + "epoch": 0.91, + "learning_rate": 1.6298048250736924e-06, + "loss": 0.7539, + "step": 35658 + }, + { + "epoch": 0.91, + "learning_rate": 1.62978333171277e-06, + "loss": 0.7998, + "step": 35659 + }, + { + "epoch": 0.91, + "learning_rate": 1.6297618378696517e-06, + "loss": 0.7715, + "step": 35660 + }, + { + "epoch": 0.91, + "learning_rate": 1.6297403435443537e-06, + "loss": 0.7168, + "step": 35661 + }, + { + "epoch": 0.91, + "learning_rate": 1.6297188487368922e-06, + "loss": 0.7183, + "step": 35662 + }, + { + "epoch": 0.91, + "learning_rate": 1.629697353447284e-06, + "loss": 0.9443, + "step": 35663 + }, + { + "epoch": 0.91, + "learning_rate": 1.6296758576755459e-06, + "loss": 0.835, + "step": 35664 + }, + { + "epoch": 0.91, + "learning_rate": 1.6296543614216934e-06, + "loss": 0.8584, + "step": 35665 + }, + { + "epoch": 0.91, + "learning_rate": 1.6296328646857437e-06, + "loss": 0.6082, + "step": 35666 + }, + { + "epoch": 0.91, + "learning_rate": 1.6296113674677133e-06, + "loss": 1.0366, + "step": 35667 + }, + { + "epoch": 0.91, + "learning_rate": 1.6295898697676183e-06, + "loss": 0.8364, + "step": 35668 + }, + { + "epoch": 0.91, + "learning_rate": 1.629568371585475e-06, + "loss": 0.9385, + "step": 35669 + }, + { + "epoch": 0.91, + "learning_rate": 1.6295468729213004e-06, + "loss": 0.8662, + "step": 35670 + }, + { + "epoch": 0.91, + "learning_rate": 1.6295253737751108e-06, + "loss": 1.082, + "step": 35671 + }, + { + "epoch": 0.91, + "learning_rate": 1.6295038741469224e-06, + "loss": 0.6631, + "step": 35672 + }, + { + "epoch": 0.91, + "learning_rate": 1.629482374036752e-06, + "loss": 0.8848, + "step": 35673 + }, + { + "epoch": 0.91, + "learning_rate": 1.6294608734446155e-06, + "loss": 0.9609, + "step": 35674 + }, + { + "epoch": 0.91, + "learning_rate": 1.6294393723705302e-06, + "loss": 0.8232, + "step": 35675 + }, + { + "epoch": 0.91, + "learning_rate": 1.629417870814512e-06, + "loss": 0.9258, + "step": 35676 + }, + { + "epoch": 0.91, + "learning_rate": 1.6293963687765776e-06, + "loss": 1.0273, + "step": 35677 + }, + { + "epoch": 0.91, + "learning_rate": 1.629374866256743e-06, + "loss": 0.7314, + "step": 35678 + }, + { + "epoch": 0.91, + "learning_rate": 1.6293533632550252e-06, + "loss": 0.9473, + "step": 35679 + }, + { + "epoch": 0.91, + "learning_rate": 1.6293318597714402e-06, + "loss": 0.75, + "step": 35680 + }, + { + "epoch": 0.91, + "learning_rate": 1.629310355806005e-06, + "loss": 0.8159, + "step": 35681 + }, + { + "epoch": 0.91, + "learning_rate": 1.6292888513587357e-06, + "loss": 0.9355, + "step": 35682 + }, + { + "epoch": 0.91, + "learning_rate": 1.629267346429649e-06, + "loss": 0.875, + "step": 35683 + }, + { + "epoch": 0.91, + "learning_rate": 1.6292458410187613e-06, + "loss": 0.6841, + "step": 35684 + }, + { + "epoch": 0.91, + "learning_rate": 1.6292243351260888e-06, + "loss": 0.8672, + "step": 35685 + }, + { + "epoch": 0.91, + "learning_rate": 1.6292028287516482e-06, + "loss": 0.9131, + "step": 35686 + }, + { + "epoch": 0.91, + "learning_rate": 1.629181321895456e-06, + "loss": 0.8613, + "step": 35687 + }, + { + "epoch": 0.91, + "learning_rate": 1.6291598145575284e-06, + "loss": 0.9111, + "step": 35688 + }, + { + "epoch": 0.91, + "learning_rate": 1.6291383067378822e-06, + "loss": 1.0215, + "step": 35689 + }, + { + "epoch": 0.91, + "learning_rate": 1.6291167984365334e-06, + "loss": 0.7783, + "step": 35690 + }, + { + "epoch": 0.91, + "learning_rate": 1.6290952896534992e-06, + "loss": 0.9512, + "step": 35691 + }, + { + "epoch": 0.91, + "learning_rate": 1.6290737803887957e-06, + "loss": 0.9014, + "step": 35692 + }, + { + "epoch": 0.91, + "learning_rate": 1.6290522706424392e-06, + "loss": 0.8057, + "step": 35693 + }, + { + "epoch": 0.91, + "learning_rate": 1.6290307604144462e-06, + "loss": 0.4137, + "step": 35694 + }, + { + "epoch": 0.91, + "learning_rate": 1.6290092497048335e-06, + "loss": 0.7373, + "step": 35695 + }, + { + "epoch": 0.91, + "learning_rate": 1.6289877385136173e-06, + "loss": 0.8828, + "step": 35696 + }, + { + "epoch": 0.91, + "learning_rate": 1.628966226840814e-06, + "loss": 0.9238, + "step": 35697 + }, + { + "epoch": 0.91, + "learning_rate": 1.6289447146864401e-06, + "loss": 0.7656, + "step": 35698 + }, + { + "epoch": 0.91, + "learning_rate": 1.628923202050512e-06, + "loss": 0.7148, + "step": 35699 + }, + { + "epoch": 0.92, + "learning_rate": 1.628901688933047e-06, + "loss": 0.7354, + "step": 35700 + }, + { + "epoch": 0.92, + "learning_rate": 1.6288801753340602e-06, + "loss": 1.0088, + "step": 35701 + }, + { + "epoch": 0.92, + "learning_rate": 1.6288586612535691e-06, + "loss": 0.7734, + "step": 35702 + }, + { + "epoch": 0.92, + "learning_rate": 1.6288371466915897e-06, + "loss": 0.8252, + "step": 35703 + }, + { + "epoch": 0.92, + "learning_rate": 1.6288156316481386e-06, + "loss": 0.8594, + "step": 35704 + }, + { + "epoch": 0.92, + "learning_rate": 1.6287941161232323e-06, + "loss": 0.7485, + "step": 35705 + }, + { + "epoch": 0.92, + "learning_rate": 1.6287726001168875e-06, + "loss": 0.9912, + "step": 35706 + }, + { + "epoch": 0.92, + "learning_rate": 1.6287510836291203e-06, + "loss": 0.8037, + "step": 35707 + }, + { + "epoch": 0.92, + "learning_rate": 1.6287295666599472e-06, + "loss": 0.9121, + "step": 35708 + }, + { + "epoch": 0.92, + "learning_rate": 1.628708049209385e-06, + "loss": 0.748, + "step": 35709 + }, + { + "epoch": 0.92, + "learning_rate": 1.6286865312774496e-06, + "loss": 0.8809, + "step": 35710 + }, + { + "epoch": 0.92, + "learning_rate": 1.6286650128641582e-06, + "loss": 1.0234, + "step": 35711 + }, + { + "epoch": 0.92, + "learning_rate": 1.628643493969527e-06, + "loss": 0.7886, + "step": 35712 + }, + { + "epoch": 0.92, + "learning_rate": 1.628621974593572e-06, + "loss": 0.8291, + "step": 35713 + }, + { + "epoch": 0.92, + "learning_rate": 1.62860045473631e-06, + "loss": 0.71, + "step": 35714 + }, + { + "epoch": 0.92, + "learning_rate": 1.6285789343977576e-06, + "loss": 0.6509, + "step": 35715 + }, + { + "epoch": 0.92, + "learning_rate": 1.6285574135779316e-06, + "loss": 0.5269, + "step": 35716 + }, + { + "epoch": 0.92, + "learning_rate": 1.6285358922768478e-06, + "loss": 0.8633, + "step": 35717 + }, + { + "epoch": 0.92, + "learning_rate": 1.6285143704945228e-06, + "loss": 0.874, + "step": 35718 + }, + { + "epoch": 0.92, + "learning_rate": 1.6284928482309734e-06, + "loss": 0.8408, + "step": 35719 + }, + { + "epoch": 0.92, + "learning_rate": 1.628471325486216e-06, + "loss": 0.9482, + "step": 35720 + }, + { + "epoch": 0.92, + "learning_rate": 1.628449802260267e-06, + "loss": 0.8398, + "step": 35721 + }, + { + "epoch": 0.92, + "learning_rate": 1.6284282785531426e-06, + "loss": 0.7729, + "step": 35722 + }, + { + "epoch": 0.92, + "learning_rate": 1.62840675436486e-06, + "loss": 0.873, + "step": 35723 + }, + { + "epoch": 0.92, + "learning_rate": 1.628385229695435e-06, + "loss": 0.8311, + "step": 35724 + }, + { + "epoch": 0.92, + "learning_rate": 1.6283637045448844e-06, + "loss": 0.5376, + "step": 35725 + }, + { + "epoch": 0.92, + "learning_rate": 1.6283421789132246e-06, + "loss": 0.9277, + "step": 35726 + }, + { + "epoch": 0.92, + "learning_rate": 1.628320652800472e-06, + "loss": 0.8418, + "step": 35727 + }, + { + "epoch": 0.92, + "learning_rate": 1.6282991262066432e-06, + "loss": 0.7832, + "step": 35728 + }, + { + "epoch": 0.92, + "learning_rate": 1.6282775991317546e-06, + "loss": 0.7725, + "step": 35729 + }, + { + "epoch": 0.92, + "learning_rate": 1.6282560715758229e-06, + "loss": 0.9238, + "step": 35730 + }, + { + "epoch": 0.92, + "learning_rate": 1.6282345435388646e-06, + "loss": 1.0127, + "step": 35731 + }, + { + "epoch": 0.92, + "learning_rate": 1.6282130150208955e-06, + "loss": 0.8965, + "step": 35732 + }, + { + "epoch": 0.92, + "learning_rate": 1.6281914860219328e-06, + "loss": 0.7793, + "step": 35733 + }, + { + "epoch": 0.92, + "learning_rate": 1.6281699565419929e-06, + "loss": 0.8662, + "step": 35734 + }, + { + "epoch": 0.92, + "learning_rate": 1.6281484265810915e-06, + "loss": 0.5859, + "step": 35735 + }, + { + "epoch": 0.92, + "learning_rate": 1.6281268961392468e-06, + "loss": 0.9287, + "step": 35736 + }, + { + "epoch": 0.92, + "learning_rate": 1.6281053652164735e-06, + "loss": 1.1426, + "step": 35737 + }, + { + "epoch": 0.92, + "learning_rate": 1.628083833812789e-06, + "loss": 0.6318, + "step": 35738 + }, + { + "epoch": 0.92, + "learning_rate": 1.6280623019282093e-06, + "loss": 1.04, + "step": 35739 + }, + { + "epoch": 0.92, + "learning_rate": 1.6280407695627516e-06, + "loss": 1.0332, + "step": 35740 + }, + { + "epoch": 0.92, + "learning_rate": 1.628019236716432e-06, + "loss": 0.7007, + "step": 35741 + }, + { + "epoch": 0.92, + "learning_rate": 1.6279977033892664e-06, + "loss": 1.0459, + "step": 35742 + }, + { + "epoch": 0.92, + "learning_rate": 1.6279761695812723e-06, + "loss": 0.9111, + "step": 35743 + }, + { + "epoch": 0.92, + "learning_rate": 1.6279546352924656e-06, + "loss": 0.8086, + "step": 35744 + }, + { + "epoch": 0.92, + "learning_rate": 1.627933100522863e-06, + "loss": 0.7588, + "step": 35745 + }, + { + "epoch": 0.92, + "learning_rate": 1.6279115652724808e-06, + "loss": 0.9238, + "step": 35746 + }, + { + "epoch": 0.92, + "learning_rate": 1.6278900295413354e-06, + "loss": 0.9106, + "step": 35747 + }, + { + "epoch": 0.92, + "learning_rate": 1.6278684933294438e-06, + "loss": 0.7422, + "step": 35748 + }, + { + "epoch": 0.92, + "learning_rate": 1.627846956636822e-06, + "loss": 0.8623, + "step": 35749 + }, + { + "epoch": 0.92, + "learning_rate": 1.6278254194634866e-06, + "loss": 0.7607, + "step": 35750 + }, + { + "epoch": 0.92, + "learning_rate": 1.6278038818094544e-06, + "loss": 0.7417, + "step": 35751 + }, + { + "epoch": 0.92, + "learning_rate": 1.6277823436747413e-06, + "loss": 0.7363, + "step": 35752 + }, + { + "epoch": 0.92, + "learning_rate": 1.6277608050593642e-06, + "loss": 0.7383, + "step": 35753 + }, + { + "epoch": 0.92, + "learning_rate": 1.6277392659633398e-06, + "loss": 0.9395, + "step": 35754 + }, + { + "epoch": 0.92, + "learning_rate": 1.6277177263866841e-06, + "loss": 0.8916, + "step": 35755 + }, + { + "epoch": 0.92, + "learning_rate": 1.627696186329414e-06, + "loss": 0.7601, + "step": 35756 + }, + { + "epoch": 0.92, + "learning_rate": 1.6276746457915454e-06, + "loss": 1.0112, + "step": 35757 + }, + { + "epoch": 0.92, + "learning_rate": 1.6276531047730955e-06, + "loss": 0.9287, + "step": 35758 + }, + { + "epoch": 0.92, + "learning_rate": 1.6276315632740803e-06, + "loss": 0.8357, + "step": 35759 + }, + { + "epoch": 0.92, + "learning_rate": 1.6276100212945165e-06, + "loss": 0.7979, + "step": 35760 + }, + { + "epoch": 0.92, + "learning_rate": 1.6275884788344206e-06, + "loss": 0.9102, + "step": 35761 + }, + { + "epoch": 0.92, + "learning_rate": 1.6275669358938092e-06, + "loss": 0.6953, + "step": 35762 + }, + { + "epoch": 0.92, + "learning_rate": 1.6275453924726984e-06, + "loss": 0.8936, + "step": 35763 + }, + { + "epoch": 0.92, + "learning_rate": 1.627523848571105e-06, + "loss": 0.771, + "step": 35764 + }, + { + "epoch": 0.92, + "learning_rate": 1.6275023041890457e-06, + "loss": 1.001, + "step": 35765 + }, + { + "epoch": 0.92, + "learning_rate": 1.6274807593265366e-06, + "loss": 0.7688, + "step": 35766 + }, + { + "epoch": 0.92, + "learning_rate": 1.6274592139835942e-06, + "loss": 0.9922, + "step": 35767 + }, + { + "epoch": 0.92, + "learning_rate": 1.627437668160235e-06, + "loss": 0.9082, + "step": 35768 + }, + { + "epoch": 0.92, + "learning_rate": 1.6274161218564759e-06, + "loss": 0.9238, + "step": 35769 + }, + { + "epoch": 0.92, + "learning_rate": 1.627394575072333e-06, + "loss": 0.7021, + "step": 35770 + }, + { + "epoch": 0.92, + "learning_rate": 1.6273730278078231e-06, + "loss": 0.7725, + "step": 35771 + }, + { + "epoch": 0.92, + "learning_rate": 1.6273514800629623e-06, + "loss": 0.8491, + "step": 35772 + }, + { + "epoch": 0.92, + "learning_rate": 1.6273299318377676e-06, + "loss": 0.7261, + "step": 35773 + }, + { + "epoch": 0.92, + "learning_rate": 1.627308383132255e-06, + "loss": 0.8232, + "step": 35774 + }, + { + "epoch": 0.92, + "learning_rate": 1.6272868339464412e-06, + "loss": 0.897, + "step": 35775 + }, + { + "epoch": 0.92, + "learning_rate": 1.6272652842803426e-06, + "loss": 0.9209, + "step": 35776 + }, + { + "epoch": 0.92, + "learning_rate": 1.6272437341339762e-06, + "loss": 0.6318, + "step": 35777 + }, + { + "epoch": 0.92, + "learning_rate": 1.6272221835073579e-06, + "loss": 0.8735, + "step": 35778 + }, + { + "epoch": 0.92, + "learning_rate": 1.6272006324005045e-06, + "loss": 0.9678, + "step": 35779 + }, + { + "epoch": 0.92, + "learning_rate": 1.6271790808134322e-06, + "loss": 0.9912, + "step": 35780 + }, + { + "epoch": 0.92, + "learning_rate": 1.6271575287461578e-06, + "loss": 0.752, + "step": 35781 + }, + { + "epoch": 0.92, + "learning_rate": 1.6271359761986977e-06, + "loss": 0.9053, + "step": 35782 + }, + { + "epoch": 0.92, + "learning_rate": 1.6271144231710684e-06, + "loss": 0.6409, + "step": 35783 + }, + { + "epoch": 0.92, + "learning_rate": 1.6270928696632869e-06, + "loss": 0.835, + "step": 35784 + }, + { + "epoch": 0.92, + "learning_rate": 1.6270713156753687e-06, + "loss": 0.7461, + "step": 35785 + }, + { + "epoch": 0.92, + "learning_rate": 1.627049761207331e-06, + "loss": 1.0889, + "step": 35786 + }, + { + "epoch": 0.92, + "learning_rate": 1.6270282062591903e-06, + "loss": 0.6846, + "step": 35787 + }, + { + "epoch": 0.92, + "learning_rate": 1.6270066508309626e-06, + "loss": 0.6914, + "step": 35788 + }, + { + "epoch": 0.92, + "learning_rate": 1.6269850949226647e-06, + "loss": 0.7573, + "step": 35789 + }, + { + "epoch": 0.92, + "learning_rate": 1.6269635385343134e-06, + "loss": 0.9658, + "step": 35790 + }, + { + "epoch": 0.92, + "learning_rate": 1.626941981665925e-06, + "loss": 1.0049, + "step": 35791 + }, + { + "epoch": 0.92, + "learning_rate": 1.6269204243175154e-06, + "loss": 0.7939, + "step": 35792 + }, + { + "epoch": 0.92, + "learning_rate": 1.6268988664891024e-06, + "loss": 0.9277, + "step": 35793 + }, + { + "epoch": 0.92, + "learning_rate": 1.6268773081807012e-06, + "loss": 0.8057, + "step": 35794 + }, + { + "epoch": 0.92, + "learning_rate": 1.6268557493923289e-06, + "loss": 0.5688, + "step": 35795 + }, + { + "epoch": 0.92, + "learning_rate": 1.6268341901240024e-06, + "loss": 0.7695, + "step": 35796 + }, + { + "epoch": 0.92, + "learning_rate": 1.6268126303757374e-06, + "loss": 0.9619, + "step": 35797 + }, + { + "epoch": 0.92, + "learning_rate": 1.626791070147551e-06, + "loss": 0.9141, + "step": 35798 + }, + { + "epoch": 0.92, + "learning_rate": 1.6267695094394596e-06, + "loss": 0.9961, + "step": 35799 + }, + { + "epoch": 0.92, + "learning_rate": 1.6267479482514795e-06, + "loss": 0.5913, + "step": 35800 + }, + { + "epoch": 0.92, + "learning_rate": 1.6267263865836273e-06, + "loss": 0.8213, + "step": 35801 + }, + { + "epoch": 0.92, + "learning_rate": 1.6267048244359193e-06, + "loss": 0.8896, + "step": 35802 + }, + { + "epoch": 0.92, + "learning_rate": 1.6266832618083726e-06, + "loss": 0.8867, + "step": 35803 + }, + { + "epoch": 0.92, + "learning_rate": 1.6266616987010032e-06, + "loss": 0.7466, + "step": 35804 + }, + { + "epoch": 0.92, + "learning_rate": 1.6266401351138275e-06, + "loss": 0.697, + "step": 35805 + }, + { + "epoch": 0.92, + "learning_rate": 1.6266185710468627e-06, + "loss": 0.8066, + "step": 35806 + }, + { + "epoch": 0.92, + "learning_rate": 1.6265970065001246e-06, + "loss": 0.9961, + "step": 35807 + }, + { + "epoch": 0.92, + "learning_rate": 1.6265754414736299e-06, + "loss": 0.7246, + "step": 35808 + }, + { + "epoch": 0.92, + "learning_rate": 1.6265538759673954e-06, + "loss": 0.8994, + "step": 35809 + }, + { + "epoch": 0.92, + "learning_rate": 1.6265323099814372e-06, + "loss": 0.8887, + "step": 35810 + }, + { + "epoch": 0.92, + "learning_rate": 1.626510743515772e-06, + "loss": 0.6855, + "step": 35811 + }, + { + "epoch": 0.92, + "learning_rate": 1.6264891765704167e-06, + "loss": 0.9805, + "step": 35812 + }, + { + "epoch": 0.92, + "learning_rate": 1.6264676091453872e-06, + "loss": 0.9199, + "step": 35813 + }, + { + "epoch": 0.92, + "learning_rate": 1.6264460412407001e-06, + "loss": 0.8965, + "step": 35814 + }, + { + "epoch": 0.92, + "learning_rate": 1.6264244728563724e-06, + "loss": 0.7905, + "step": 35815 + }, + { + "epoch": 0.92, + "learning_rate": 1.6264029039924203e-06, + "loss": 0.7461, + "step": 35816 + }, + { + "epoch": 0.92, + "learning_rate": 1.62638133464886e-06, + "loss": 0.9014, + "step": 35817 + }, + { + "epoch": 0.92, + "learning_rate": 1.6263597648257084e-06, + "loss": 0.5918, + "step": 35818 + }, + { + "epoch": 0.92, + "learning_rate": 1.6263381945229821e-06, + "loss": 0.877, + "step": 35819 + }, + { + "epoch": 0.92, + "learning_rate": 1.6263166237406973e-06, + "loss": 0.8018, + "step": 35820 + }, + { + "epoch": 0.92, + "learning_rate": 1.6262950524788708e-06, + "loss": 0.7278, + "step": 35821 + }, + { + "epoch": 0.92, + "learning_rate": 1.626273480737519e-06, + "loss": 0.9316, + "step": 35822 + }, + { + "epoch": 0.92, + "learning_rate": 1.6262519085166582e-06, + "loss": 0.7974, + "step": 35823 + }, + { + "epoch": 0.92, + "learning_rate": 1.626230335816305e-06, + "loss": 0.71, + "step": 35824 + }, + { + "epoch": 0.92, + "learning_rate": 1.6262087626364762e-06, + "loss": 0.6541, + "step": 35825 + }, + { + "epoch": 0.92, + "learning_rate": 1.6261871889771883e-06, + "loss": 0.792, + "step": 35826 + }, + { + "epoch": 0.92, + "learning_rate": 1.6261656148384574e-06, + "loss": 0.6631, + "step": 35827 + }, + { + "epoch": 0.92, + "learning_rate": 1.6261440402203004e-06, + "loss": 0.7686, + "step": 35828 + }, + { + "epoch": 0.92, + "learning_rate": 1.6261224651227336e-06, + "loss": 0.915, + "step": 35829 + }, + { + "epoch": 0.92, + "learning_rate": 1.6261008895457735e-06, + "loss": 0.7896, + "step": 35830 + }, + { + "epoch": 0.92, + "learning_rate": 1.6260793134894372e-06, + "loss": 0.7163, + "step": 35831 + }, + { + "epoch": 0.92, + "learning_rate": 1.6260577369537404e-06, + "loss": 0.833, + "step": 35832 + }, + { + "epoch": 0.92, + "learning_rate": 1.6260361599387e-06, + "loss": 0.791, + "step": 35833 + }, + { + "epoch": 0.92, + "learning_rate": 1.6260145824443327e-06, + "loss": 0.9277, + "step": 35834 + }, + { + "epoch": 0.92, + "learning_rate": 1.6259930044706547e-06, + "loss": 0.75, + "step": 35835 + }, + { + "epoch": 0.92, + "learning_rate": 1.6259714260176827e-06, + "loss": 0.8379, + "step": 35836 + }, + { + "epoch": 0.92, + "learning_rate": 1.6259498470854329e-06, + "loss": 0.8179, + "step": 35837 + }, + { + "epoch": 0.92, + "learning_rate": 1.6259282676739224e-06, + "loss": 0.6426, + "step": 35838 + }, + { + "epoch": 0.92, + "learning_rate": 1.625906687783167e-06, + "loss": 0.6636, + "step": 35839 + }, + { + "epoch": 0.92, + "learning_rate": 1.6258851074131838e-06, + "loss": 0.96, + "step": 35840 + }, + { + "epoch": 0.92, + "learning_rate": 1.6258635265639895e-06, + "loss": 0.96, + "step": 35841 + }, + { + "epoch": 0.92, + "learning_rate": 1.6258419452356003e-06, + "loss": 0.8145, + "step": 35842 + }, + { + "epoch": 0.92, + "learning_rate": 1.625820363428032e-06, + "loss": 0.8174, + "step": 35843 + }, + { + "epoch": 0.92, + "learning_rate": 1.6257987811413023e-06, + "loss": 0.3842, + "step": 35844 + }, + { + "epoch": 0.92, + "learning_rate": 1.6257771983754273e-06, + "loss": 0.7256, + "step": 35845 + }, + { + "epoch": 0.92, + "learning_rate": 1.6257556151304238e-06, + "loss": 0.7969, + "step": 35846 + }, + { + "epoch": 0.92, + "learning_rate": 1.6257340314063074e-06, + "loss": 0.7661, + "step": 35847 + }, + { + "epoch": 0.92, + "learning_rate": 1.6257124472030953e-06, + "loss": 0.9023, + "step": 35848 + }, + { + "epoch": 0.92, + "learning_rate": 1.6256908625208042e-06, + "loss": 0.5884, + "step": 35849 + }, + { + "epoch": 0.92, + "learning_rate": 1.62566927735945e-06, + "loss": 0.959, + "step": 35850 + }, + { + "epoch": 0.92, + "learning_rate": 1.6256476917190501e-06, + "loss": 0.7642, + "step": 35851 + }, + { + "epoch": 0.92, + "learning_rate": 1.62562610559962e-06, + "loss": 0.8213, + "step": 35852 + }, + { + "epoch": 0.92, + "learning_rate": 1.625604519001177e-06, + "loss": 0.6338, + "step": 35853 + }, + { + "epoch": 0.92, + "learning_rate": 1.6255829319237375e-06, + "loss": 0.8193, + "step": 35854 + }, + { + "epoch": 0.92, + "learning_rate": 1.6255613443673176e-06, + "loss": 0.6411, + "step": 35855 + }, + { + "epoch": 0.92, + "learning_rate": 1.6255397563319346e-06, + "loss": 0.792, + "step": 35856 + }, + { + "epoch": 0.92, + "learning_rate": 1.6255181678176041e-06, + "loss": 0.8252, + "step": 35857 + }, + { + "epoch": 0.92, + "learning_rate": 1.6254965788243435e-06, + "loss": 0.8223, + "step": 35858 + }, + { + "epoch": 0.92, + "learning_rate": 1.625474989352169e-06, + "loss": 0.8672, + "step": 35859 + }, + { + "epoch": 0.92, + "learning_rate": 1.6254533994010966e-06, + "loss": 0.7061, + "step": 35860 + }, + { + "epoch": 0.92, + "learning_rate": 1.6254318089711437e-06, + "loss": 0.9258, + "step": 35861 + }, + { + "epoch": 0.92, + "learning_rate": 1.625410218062326e-06, + "loss": 0.793, + "step": 35862 + }, + { + "epoch": 0.92, + "learning_rate": 1.6253886266746609e-06, + "loss": 0.8623, + "step": 35863 + }, + { + "epoch": 0.92, + "learning_rate": 1.625367034808164e-06, + "loss": 0.8662, + "step": 35864 + }, + { + "epoch": 0.92, + "learning_rate": 1.6253454424628527e-06, + "loss": 0.7969, + "step": 35865 + }, + { + "epoch": 0.92, + "learning_rate": 1.6253238496387432e-06, + "loss": 0.7803, + "step": 35866 + }, + { + "epoch": 0.92, + "learning_rate": 1.6253022563358518e-06, + "loss": 0.8638, + "step": 35867 + }, + { + "epoch": 0.92, + "learning_rate": 1.625280662554195e-06, + "loss": 0.875, + "step": 35868 + }, + { + "epoch": 0.92, + "learning_rate": 1.6252590682937899e-06, + "loss": 0.5085, + "step": 35869 + }, + { + "epoch": 0.92, + "learning_rate": 1.6252374735546526e-06, + "loss": 0.877, + "step": 35870 + }, + { + "epoch": 0.92, + "learning_rate": 1.6252158783368e-06, + "loss": 0.7744, + "step": 35871 + }, + { + "epoch": 0.92, + "learning_rate": 1.6251942826402478e-06, + "loss": 0.6128, + "step": 35872 + }, + { + "epoch": 0.92, + "learning_rate": 1.6251726864650132e-06, + "loss": 0.8467, + "step": 35873 + }, + { + "epoch": 0.92, + "learning_rate": 1.6251510898111129e-06, + "loss": 0.6753, + "step": 35874 + }, + { + "epoch": 0.92, + "learning_rate": 1.6251294926785631e-06, + "loss": 0.6992, + "step": 35875 + }, + { + "epoch": 0.92, + "learning_rate": 1.6251078950673803e-06, + "loss": 0.9277, + "step": 35876 + }, + { + "epoch": 0.92, + "learning_rate": 1.6250862969775812e-06, + "loss": 0.9111, + "step": 35877 + }, + { + "epoch": 0.92, + "learning_rate": 1.625064698409182e-06, + "loss": 0.793, + "step": 35878 + }, + { + "epoch": 0.92, + "learning_rate": 1.6250430993621996e-06, + "loss": 0.8574, + "step": 35879 + }, + { + "epoch": 0.92, + "learning_rate": 1.6250214998366505e-06, + "loss": 0.8545, + "step": 35880 + }, + { + "epoch": 0.92, + "learning_rate": 1.6249998998325513e-06, + "loss": 0.8252, + "step": 35881 + }, + { + "epoch": 0.92, + "learning_rate": 1.624978299349918e-06, + "loss": 0.7783, + "step": 35882 + }, + { + "epoch": 0.92, + "learning_rate": 1.6249566983887682e-06, + "loss": 0.7827, + "step": 35883 + }, + { + "epoch": 0.92, + "learning_rate": 1.6249350969491173e-06, + "loss": 0.9238, + "step": 35884 + }, + { + "epoch": 0.92, + "learning_rate": 1.6249134950309826e-06, + "loss": 0.8159, + "step": 35885 + }, + { + "epoch": 0.92, + "learning_rate": 1.6248918926343804e-06, + "loss": 0.9229, + "step": 35886 + }, + { + "epoch": 0.92, + "learning_rate": 1.624870289759327e-06, + "loss": 0.8447, + "step": 35887 + }, + { + "epoch": 0.92, + "learning_rate": 1.6248486864058392e-06, + "loss": 0.7998, + "step": 35888 + }, + { + "epoch": 0.92, + "learning_rate": 1.6248270825739335e-06, + "loss": 0.958, + "step": 35889 + }, + { + "epoch": 0.92, + "learning_rate": 1.6248054782636268e-06, + "loss": 0.8037, + "step": 35890 + }, + { + "epoch": 0.92, + "learning_rate": 1.6247838734749347e-06, + "loss": 0.8477, + "step": 35891 + }, + { + "epoch": 0.92, + "learning_rate": 1.6247622682078746e-06, + "loss": 0.8887, + "step": 35892 + }, + { + "epoch": 0.92, + "learning_rate": 1.6247406624624626e-06, + "loss": 0.8867, + "step": 35893 + }, + { + "epoch": 0.92, + "learning_rate": 1.6247190562387155e-06, + "loss": 0.8047, + "step": 35894 + }, + { + "epoch": 0.92, + "learning_rate": 1.6246974495366498e-06, + "loss": 0.7056, + "step": 35895 + }, + { + "epoch": 0.92, + "learning_rate": 1.6246758423562819e-06, + "loss": 0.6155, + "step": 35896 + }, + { + "epoch": 0.92, + "learning_rate": 1.6246542346976285e-06, + "loss": 0.8682, + "step": 35897 + }, + { + "epoch": 0.92, + "learning_rate": 1.624632626560706e-06, + "loss": 1.0293, + "step": 35898 + }, + { + "epoch": 0.92, + "learning_rate": 1.624611017945531e-06, + "loss": 0.7607, + "step": 35899 + }, + { + "epoch": 0.92, + "learning_rate": 1.6245894088521202e-06, + "loss": 0.8545, + "step": 35900 + }, + { + "epoch": 0.92, + "learning_rate": 1.6245677992804897e-06, + "loss": 0.8984, + "step": 35901 + }, + { + "epoch": 0.92, + "learning_rate": 1.6245461892306566e-06, + "loss": 0.8438, + "step": 35902 + }, + { + "epoch": 0.92, + "learning_rate": 1.6245245787026374e-06, + "loss": 0.7959, + "step": 35903 + }, + { + "epoch": 0.92, + "learning_rate": 1.6245029676964482e-06, + "loss": 0.9766, + "step": 35904 + }, + { + "epoch": 0.92, + "learning_rate": 1.6244813562121057e-06, + "loss": 0.876, + "step": 35905 + }, + { + "epoch": 0.92, + "learning_rate": 1.6244597442496267e-06, + "loss": 0.9307, + "step": 35906 + }, + { + "epoch": 0.92, + "learning_rate": 1.6244381318090276e-06, + "loss": 0.5574, + "step": 35907 + }, + { + "epoch": 0.92, + "learning_rate": 1.6244165188903249e-06, + "loss": 0.916, + "step": 35908 + }, + { + "epoch": 0.92, + "learning_rate": 1.624394905493535e-06, + "loss": 0.7061, + "step": 35909 + }, + { + "epoch": 0.92, + "learning_rate": 1.624373291618675e-06, + "loss": 0.98, + "step": 35910 + }, + { + "epoch": 0.92, + "learning_rate": 1.6243516772657608e-06, + "loss": 0.9551, + "step": 35911 + }, + { + "epoch": 0.92, + "learning_rate": 1.6243300624348094e-06, + "loss": 0.7532, + "step": 35912 + }, + { + "epoch": 0.92, + "learning_rate": 1.6243084471258368e-06, + "loss": 0.6694, + "step": 35913 + }, + { + "epoch": 0.92, + "learning_rate": 1.6242868313388604e-06, + "loss": 0.9258, + "step": 35914 + }, + { + "epoch": 0.92, + "learning_rate": 1.6242652150738962e-06, + "loss": 0.3662, + "step": 35915 + }, + { + "epoch": 0.92, + "learning_rate": 1.6242435983309606e-06, + "loss": 0.7405, + "step": 35916 + }, + { + "epoch": 0.92, + "learning_rate": 1.6242219811100705e-06, + "loss": 0.751, + "step": 35917 + }, + { + "epoch": 0.92, + "learning_rate": 1.6242003634112425e-06, + "loss": 0.8496, + "step": 35918 + }, + { + "epoch": 0.92, + "learning_rate": 1.6241787452344927e-06, + "loss": 0.6826, + "step": 35919 + }, + { + "epoch": 0.92, + "learning_rate": 1.6241571265798378e-06, + "loss": 0.7412, + "step": 35920 + }, + { + "epoch": 0.92, + "learning_rate": 1.624135507447295e-06, + "loss": 0.4719, + "step": 35921 + }, + { + "epoch": 0.92, + "learning_rate": 1.6241138878368801e-06, + "loss": 0.7598, + "step": 35922 + }, + { + "epoch": 0.92, + "learning_rate": 1.6240922677486099e-06, + "loss": 0.8438, + "step": 35923 + }, + { + "epoch": 0.92, + "learning_rate": 1.624070647182501e-06, + "loss": 0.7114, + "step": 35924 + }, + { + "epoch": 0.92, + "learning_rate": 1.6240490261385697e-06, + "loss": 0.876, + "step": 35925 + }, + { + "epoch": 0.92, + "learning_rate": 1.624027404616833e-06, + "loss": 0.9785, + "step": 35926 + }, + { + "epoch": 0.92, + "learning_rate": 1.6240057826173069e-06, + "loss": 0.6162, + "step": 35927 + }, + { + "epoch": 0.92, + "learning_rate": 1.6239841601400084e-06, + "loss": 0.7671, + "step": 35928 + }, + { + "epoch": 0.92, + "learning_rate": 1.6239625371849539e-06, + "loss": 0.9648, + "step": 35929 + }, + { + "epoch": 0.92, + "learning_rate": 1.6239409137521603e-06, + "loss": 0.7871, + "step": 35930 + }, + { + "epoch": 0.92, + "learning_rate": 1.6239192898416437e-06, + "loss": 0.8477, + "step": 35931 + }, + { + "epoch": 0.92, + "learning_rate": 1.6238976654534207e-06, + "loss": 0.9424, + "step": 35932 + }, + { + "epoch": 0.92, + "learning_rate": 1.6238760405875077e-06, + "loss": 0.8916, + "step": 35933 + }, + { + "epoch": 0.92, + "learning_rate": 1.6238544152439217e-06, + "loss": 0.8999, + "step": 35934 + }, + { + "epoch": 0.92, + "learning_rate": 1.6238327894226792e-06, + "loss": 0.7153, + "step": 35935 + }, + { + "epoch": 0.92, + "learning_rate": 1.6238111631237966e-06, + "loss": 1.0645, + "step": 35936 + }, + { + "epoch": 0.92, + "learning_rate": 1.6237895363472903e-06, + "loss": 0.6816, + "step": 35937 + }, + { + "epoch": 0.92, + "learning_rate": 1.623767909093177e-06, + "loss": 0.9619, + "step": 35938 + }, + { + "epoch": 0.92, + "learning_rate": 1.6237462813614733e-06, + "loss": 0.834, + "step": 35939 + }, + { + "epoch": 0.92, + "learning_rate": 1.623724653152196e-06, + "loss": 0.7617, + "step": 35940 + }, + { + "epoch": 0.92, + "learning_rate": 1.6237030244653614e-06, + "loss": 0.8438, + "step": 35941 + }, + { + "epoch": 0.92, + "learning_rate": 1.6236813953009857e-06, + "loss": 0.79, + "step": 35942 + }, + { + "epoch": 0.92, + "learning_rate": 1.6236597656590861e-06, + "loss": 0.9453, + "step": 35943 + }, + { + "epoch": 0.92, + "learning_rate": 1.623638135539679e-06, + "loss": 0.709, + "step": 35944 + }, + { + "epoch": 0.92, + "learning_rate": 1.6236165049427807e-06, + "loss": 0.8281, + "step": 35945 + }, + { + "epoch": 0.92, + "learning_rate": 1.623594873868408e-06, + "loss": 0.8489, + "step": 35946 + }, + { + "epoch": 0.92, + "learning_rate": 1.6235732423165774e-06, + "loss": 1.0283, + "step": 35947 + }, + { + "epoch": 0.92, + "learning_rate": 1.6235516102873051e-06, + "loss": 0.96, + "step": 35948 + }, + { + "epoch": 0.92, + "learning_rate": 1.6235299777806084e-06, + "loss": 0.5596, + "step": 35949 + }, + { + "epoch": 0.92, + "learning_rate": 1.6235083447965034e-06, + "loss": 0.917, + "step": 35950 + }, + { + "epoch": 0.92, + "learning_rate": 1.6234867113350066e-06, + "loss": 0.6865, + "step": 35951 + }, + { + "epoch": 0.92, + "learning_rate": 1.6234650773961347e-06, + "loss": 0.7715, + "step": 35952 + }, + { + "epoch": 0.92, + "learning_rate": 1.6234434429799043e-06, + "loss": 0.562, + "step": 35953 + }, + { + "epoch": 0.92, + "learning_rate": 1.623421808086332e-06, + "loss": 0.8574, + "step": 35954 + }, + { + "epoch": 0.92, + "learning_rate": 1.623400172715434e-06, + "loss": 0.772, + "step": 35955 + }, + { + "epoch": 0.92, + "learning_rate": 1.6233785368672278e-06, + "loss": 0.8516, + "step": 35956 + }, + { + "epoch": 0.92, + "learning_rate": 1.6233569005417285e-06, + "loss": 0.8516, + "step": 35957 + }, + { + "epoch": 0.92, + "learning_rate": 1.623335263738954e-06, + "loss": 0.9561, + "step": 35958 + }, + { + "epoch": 0.92, + "learning_rate": 1.6233136264589202e-06, + "loss": 0.8008, + "step": 35959 + }, + { + "epoch": 0.92, + "learning_rate": 1.6232919887016441e-06, + "loss": 0.8179, + "step": 35960 + }, + { + "epoch": 0.92, + "learning_rate": 1.6232703504671416e-06, + "loss": 0.8203, + "step": 35961 + }, + { + "epoch": 0.92, + "learning_rate": 1.6232487117554297e-06, + "loss": 0.8037, + "step": 35962 + }, + { + "epoch": 0.92, + "learning_rate": 1.623227072566525e-06, + "loss": 0.8389, + "step": 35963 + }, + { + "epoch": 0.92, + "learning_rate": 1.6232054329004439e-06, + "loss": 0.8779, + "step": 35964 + }, + { + "epoch": 0.92, + "learning_rate": 1.6231837927572032e-06, + "loss": 0.8076, + "step": 35965 + }, + { + "epoch": 0.92, + "learning_rate": 1.6231621521368192e-06, + "loss": 0.6655, + "step": 35966 + }, + { + "epoch": 0.92, + "learning_rate": 1.6231405110393087e-06, + "loss": 0.8594, + "step": 35967 + }, + { + "epoch": 0.92, + "learning_rate": 1.6231188694646881e-06, + "loss": 0.8457, + "step": 35968 + }, + { + "epoch": 0.92, + "learning_rate": 1.6230972274129743e-06, + "loss": 0.8066, + "step": 35969 + }, + { + "epoch": 0.92, + "learning_rate": 1.6230755848841833e-06, + "loss": 0.7324, + "step": 35970 + }, + { + "epoch": 0.92, + "learning_rate": 1.6230539418783317e-06, + "loss": 0.686, + "step": 35971 + }, + { + "epoch": 0.92, + "learning_rate": 1.6230322983954367e-06, + "loss": 0.7676, + "step": 35972 + }, + { + "epoch": 0.92, + "learning_rate": 1.6230106544355143e-06, + "loss": 0.8076, + "step": 35973 + }, + { + "epoch": 0.92, + "learning_rate": 1.6229890099985818e-06, + "loss": 0.7295, + "step": 35974 + }, + { + "epoch": 0.92, + "learning_rate": 1.6229673650846549e-06, + "loss": 0.957, + "step": 35975 + }, + { + "epoch": 0.92, + "learning_rate": 1.6229457196937508e-06, + "loss": 1.0547, + "step": 35976 + }, + { + "epoch": 0.92, + "learning_rate": 1.6229240738258856e-06, + "loss": 0.6523, + "step": 35977 + }, + { + "epoch": 0.92, + "learning_rate": 1.622902427481076e-06, + "loss": 0.874, + "step": 35978 + }, + { + "epoch": 0.92, + "learning_rate": 1.6228807806593386e-06, + "loss": 0.9336, + "step": 35979 + }, + { + "epoch": 0.92, + "learning_rate": 1.6228591333606902e-06, + "loss": 0.7549, + "step": 35980 + }, + { + "epoch": 0.92, + "learning_rate": 1.6228374855851472e-06, + "loss": 0.9668, + "step": 35981 + }, + { + "epoch": 0.92, + "learning_rate": 1.622815837332726e-06, + "loss": 0.9678, + "step": 35982 + }, + { + "epoch": 0.92, + "learning_rate": 1.6227941886034435e-06, + "loss": 0.9287, + "step": 35983 + }, + { + "epoch": 0.92, + "learning_rate": 1.622772539397316e-06, + "loss": 0.875, + "step": 35984 + }, + { + "epoch": 0.92, + "learning_rate": 1.6227508897143605e-06, + "loss": 0.4636, + "step": 35985 + }, + { + "epoch": 0.92, + "learning_rate": 1.6227292395545931e-06, + "loss": 0.5842, + "step": 35986 + }, + { + "epoch": 0.92, + "learning_rate": 1.6227075889180303e-06, + "loss": 0.6948, + "step": 35987 + }, + { + "epoch": 0.92, + "learning_rate": 1.6226859378046894e-06, + "loss": 0.7881, + "step": 35988 + }, + { + "epoch": 0.92, + "learning_rate": 1.622664286214586e-06, + "loss": 0.9004, + "step": 35989 + }, + { + "epoch": 0.92, + "learning_rate": 1.6226426341477378e-06, + "loss": 0.9707, + "step": 35990 + }, + { + "epoch": 0.92, + "learning_rate": 1.6226209816041604e-06, + "loss": 0.8809, + "step": 35991 + }, + { + "epoch": 0.92, + "learning_rate": 1.6225993285838706e-06, + "loss": 0.6445, + "step": 35992 + }, + { + "epoch": 0.92, + "learning_rate": 1.6225776750868852e-06, + "loss": 0.6782, + "step": 35993 + }, + { + "epoch": 0.92, + "learning_rate": 1.6225560211132207e-06, + "loss": 0.8838, + "step": 35994 + }, + { + "epoch": 0.92, + "learning_rate": 1.6225343666628942e-06, + "loss": 0.7773, + "step": 35995 + }, + { + "epoch": 0.92, + "learning_rate": 1.6225127117359213e-06, + "loss": 1.0215, + "step": 35996 + }, + { + "epoch": 0.92, + "learning_rate": 1.6224910563323189e-06, + "loss": 1.0391, + "step": 35997 + }, + { + "epoch": 0.92, + "learning_rate": 1.622469400452104e-06, + "loss": 0.8142, + "step": 35998 + }, + { + "epoch": 0.92, + "learning_rate": 1.6224477440952926e-06, + "loss": 0.8682, + "step": 35999 + }, + { + "epoch": 0.92, + "learning_rate": 1.622426087261902e-06, + "loss": 1.1377, + "step": 36000 + }, + { + "epoch": 0.92, + "learning_rate": 1.6224044299519481e-06, + "loss": 0.9082, + "step": 36001 + }, + { + "epoch": 0.92, + "learning_rate": 1.6223827721654477e-06, + "loss": 0.7227, + "step": 36002 + }, + { + "epoch": 0.92, + "learning_rate": 1.6223611139024175e-06, + "loss": 0.834, + "step": 36003 + }, + { + "epoch": 0.92, + "learning_rate": 1.6223394551628743e-06, + "loss": 0.9082, + "step": 36004 + }, + { + "epoch": 0.92, + "learning_rate": 1.622317795946834e-06, + "loss": 0.8115, + "step": 36005 + }, + { + "epoch": 0.92, + "learning_rate": 1.6222961362543137e-06, + "loss": 0.6672, + "step": 36006 + }, + { + "epoch": 0.92, + "learning_rate": 1.6222744760853297e-06, + "loss": 0.8789, + "step": 36007 + }, + { + "epoch": 0.92, + "learning_rate": 1.622252815439899e-06, + "loss": 0.7617, + "step": 36008 + }, + { + "epoch": 0.92, + "learning_rate": 1.6222311543180378e-06, + "loss": 0.9961, + "step": 36009 + }, + { + "epoch": 0.92, + "learning_rate": 1.6222094927197629e-06, + "loss": 0.9805, + "step": 36010 + }, + { + "epoch": 0.92, + "learning_rate": 1.6221878306450908e-06, + "loss": 0.876, + "step": 36011 + }, + { + "epoch": 0.92, + "learning_rate": 1.6221661680940382e-06, + "loss": 0.6919, + "step": 36012 + }, + { + "epoch": 0.92, + "learning_rate": 1.6221445050666213e-06, + "loss": 0.8901, + "step": 36013 + }, + { + "epoch": 0.92, + "learning_rate": 1.6221228415628573e-06, + "loss": 0.7651, + "step": 36014 + }, + { + "epoch": 0.92, + "learning_rate": 1.622101177582762e-06, + "loss": 0.8262, + "step": 36015 + }, + { + "epoch": 0.92, + "learning_rate": 1.6220795131263528e-06, + "loss": 0.6797, + "step": 36016 + }, + { + "epoch": 0.92, + "learning_rate": 1.6220578481936458e-06, + "loss": 0.6616, + "step": 36017 + }, + { + "epoch": 0.92, + "learning_rate": 1.6220361827846575e-06, + "loss": 0.7373, + "step": 36018 + }, + { + "epoch": 0.92, + "learning_rate": 1.6220145168994048e-06, + "loss": 0.6484, + "step": 36019 + }, + { + "epoch": 0.92, + "learning_rate": 1.6219928505379047e-06, + "loss": 0.7229, + "step": 36020 + }, + { + "epoch": 0.92, + "learning_rate": 1.6219711837001725e-06, + "loss": 0.7456, + "step": 36021 + }, + { + "epoch": 0.92, + "learning_rate": 1.621949516386226e-06, + "loss": 0.9297, + "step": 36022 + }, + { + "epoch": 0.92, + "learning_rate": 1.6219278485960813e-06, + "loss": 0.8027, + "step": 36023 + }, + { + "epoch": 0.92, + "learning_rate": 1.6219061803297549e-06, + "loss": 0.522, + "step": 36024 + }, + { + "epoch": 0.92, + "learning_rate": 1.6218845115872637e-06, + "loss": 0.7083, + "step": 36025 + }, + { + "epoch": 0.92, + "learning_rate": 1.6218628423686243e-06, + "loss": 0.6572, + "step": 36026 + }, + { + "epoch": 0.92, + "learning_rate": 1.6218411726738528e-06, + "loss": 0.8218, + "step": 36027 + }, + { + "epoch": 0.92, + "learning_rate": 1.6218195025029661e-06, + "loss": 0.7678, + "step": 36028 + }, + { + "epoch": 0.92, + "learning_rate": 1.621797831855981e-06, + "loss": 0.8447, + "step": 36029 + }, + { + "epoch": 0.92, + "learning_rate": 1.6217761607329137e-06, + "loss": 1.0107, + "step": 36030 + }, + { + "epoch": 0.92, + "learning_rate": 1.621754489133781e-06, + "loss": 0.8271, + "step": 36031 + }, + { + "epoch": 0.92, + "learning_rate": 1.6217328170585997e-06, + "loss": 0.5933, + "step": 36032 + }, + { + "epoch": 0.92, + "learning_rate": 1.621711144507386e-06, + "loss": 0.9287, + "step": 36033 + }, + { + "epoch": 0.92, + "learning_rate": 1.6216894714801566e-06, + "loss": 1.0537, + "step": 36034 + }, + { + "epoch": 0.92, + "learning_rate": 1.6216677979769282e-06, + "loss": 0.8784, + "step": 36035 + }, + { + "epoch": 0.92, + "learning_rate": 1.6216461239977176e-06, + "loss": 1.0469, + "step": 36036 + }, + { + "epoch": 0.92, + "learning_rate": 1.6216244495425406e-06, + "loss": 0.6504, + "step": 36037 + }, + { + "epoch": 0.92, + "learning_rate": 1.6216027746114146e-06, + "loss": 0.9912, + "step": 36038 + }, + { + "epoch": 0.92, + "learning_rate": 1.6215810992043562e-06, + "loss": 0.9688, + "step": 36039 + }, + { + "epoch": 0.92, + "learning_rate": 1.6215594233213816e-06, + "loss": 0.7178, + "step": 36040 + }, + { + "epoch": 0.92, + "learning_rate": 1.6215377469625072e-06, + "loss": 0.7861, + "step": 36041 + }, + { + "epoch": 0.92, + "learning_rate": 1.6215160701277505e-06, + "loss": 0.7578, + "step": 36042 + }, + { + "epoch": 0.92, + "learning_rate": 1.621494392817127e-06, + "loss": 0.9668, + "step": 36043 + }, + { + "epoch": 0.92, + "learning_rate": 1.621472715030654e-06, + "loss": 1.001, + "step": 36044 + }, + { + "epoch": 0.92, + "learning_rate": 1.6214510367683484e-06, + "loss": 1.0264, + "step": 36045 + }, + { + "epoch": 0.92, + "learning_rate": 1.6214293580302256e-06, + "loss": 0.8076, + "step": 36046 + }, + { + "epoch": 0.92, + "learning_rate": 1.6214076788163032e-06, + "loss": 0.7764, + "step": 36047 + }, + { + "epoch": 0.92, + "learning_rate": 1.6213859991265975e-06, + "loss": 0.7451, + "step": 36048 + }, + { + "epoch": 0.92, + "learning_rate": 1.6213643189611253e-06, + "loss": 0.9678, + "step": 36049 + }, + { + "epoch": 0.92, + "learning_rate": 1.6213426383199029e-06, + "loss": 0.8135, + "step": 36050 + }, + { + "epoch": 0.92, + "learning_rate": 1.621320957202947e-06, + "loss": 0.8906, + "step": 36051 + }, + { + "epoch": 0.92, + "learning_rate": 1.621299275610274e-06, + "loss": 0.9111, + "step": 36052 + }, + { + "epoch": 0.92, + "learning_rate": 1.6212775935419007e-06, + "loss": 1.0537, + "step": 36053 + }, + { + "epoch": 0.92, + "learning_rate": 1.6212559109978438e-06, + "loss": 0.8271, + "step": 36054 + }, + { + "epoch": 0.92, + "learning_rate": 1.6212342279781202e-06, + "loss": 0.646, + "step": 36055 + }, + { + "epoch": 0.92, + "learning_rate": 1.621212544482746e-06, + "loss": 0.8789, + "step": 36056 + }, + { + "epoch": 0.92, + "learning_rate": 1.6211908605117374e-06, + "loss": 0.8965, + "step": 36057 + }, + { + "epoch": 0.92, + "learning_rate": 1.6211691760651119e-06, + "loss": 0.9619, + "step": 36058 + }, + { + "epoch": 0.92, + "learning_rate": 1.6211474911428856e-06, + "loss": 1.1113, + "step": 36059 + }, + { + "epoch": 0.92, + "learning_rate": 1.6211258057450753e-06, + "loss": 0.6841, + "step": 36060 + }, + { + "epoch": 0.92, + "learning_rate": 1.6211041198716977e-06, + "loss": 0.9062, + "step": 36061 + }, + { + "epoch": 0.92, + "learning_rate": 1.621082433522769e-06, + "loss": 0.7319, + "step": 36062 + }, + { + "epoch": 0.92, + "learning_rate": 1.6210607466983062e-06, + "loss": 0.7466, + "step": 36063 + }, + { + "epoch": 0.92, + "learning_rate": 1.6210390593983254e-06, + "loss": 1.0303, + "step": 36064 + }, + { + "epoch": 0.92, + "learning_rate": 1.6210173716228441e-06, + "loss": 0.8867, + "step": 36065 + }, + { + "epoch": 0.92, + "learning_rate": 1.6209956833718779e-06, + "loss": 0.959, + "step": 36066 + }, + { + "epoch": 0.92, + "learning_rate": 1.620973994645444e-06, + "loss": 0.6753, + "step": 36067 + }, + { + "epoch": 0.92, + "learning_rate": 1.6209523054435587e-06, + "loss": 0.8828, + "step": 36068 + }, + { + "epoch": 0.92, + "learning_rate": 1.620930615766239e-06, + "loss": 0.584, + "step": 36069 + }, + { + "epoch": 0.92, + "learning_rate": 1.6209089256135014e-06, + "loss": 0.8887, + "step": 36070 + }, + { + "epoch": 0.92, + "learning_rate": 1.6208872349853622e-06, + "loss": 0.7344, + "step": 36071 + }, + { + "epoch": 0.92, + "learning_rate": 1.6208655438818382e-06, + "loss": 0.6177, + "step": 36072 + }, + { + "epoch": 0.92, + "learning_rate": 1.620843852302946e-06, + "loss": 0.7388, + "step": 36073 + }, + { + "epoch": 0.92, + "learning_rate": 1.6208221602487021e-06, + "loss": 0.9121, + "step": 36074 + }, + { + "epoch": 0.92, + "learning_rate": 1.6208004677191237e-06, + "loss": 0.7397, + "step": 36075 + }, + { + "epoch": 0.92, + "learning_rate": 1.6207787747142265e-06, + "loss": 0.8193, + "step": 36076 + }, + { + "epoch": 0.92, + "learning_rate": 1.6207570812340274e-06, + "loss": 0.7666, + "step": 36077 + }, + { + "epoch": 0.92, + "learning_rate": 1.6207353872785433e-06, + "loss": 0.5269, + "step": 36078 + }, + { + "epoch": 0.92, + "learning_rate": 1.620713692847791e-06, + "loss": 0.853, + "step": 36079 + }, + { + "epoch": 0.92, + "learning_rate": 1.6206919979417864e-06, + "loss": 0.7305, + "step": 36080 + }, + { + "epoch": 0.92, + "learning_rate": 1.6206703025605463e-06, + "loss": 0.9004, + "step": 36081 + }, + { + "epoch": 0.92, + "learning_rate": 1.6206486067040878e-06, + "loss": 0.9316, + "step": 36082 + }, + { + "epoch": 0.92, + "learning_rate": 1.6206269103724272e-06, + "loss": 0.8975, + "step": 36083 + }, + { + "epoch": 0.92, + "learning_rate": 1.620605213565581e-06, + "loss": 0.71, + "step": 36084 + }, + { + "epoch": 0.92, + "learning_rate": 1.620583516283566e-06, + "loss": 0.9717, + "step": 36085 + }, + { + "epoch": 0.92, + "learning_rate": 1.6205618185263988e-06, + "loss": 0.7188, + "step": 36086 + }, + { + "epoch": 0.92, + "learning_rate": 1.6205401202940958e-06, + "loss": 0.6924, + "step": 36087 + }, + { + "epoch": 0.92, + "learning_rate": 1.6205184215866737e-06, + "loss": 0.8896, + "step": 36088 + }, + { + "epoch": 0.92, + "learning_rate": 1.6204967224041494e-06, + "loss": 0.8145, + "step": 36089 + }, + { + "epoch": 0.93, + "learning_rate": 1.620475022746539e-06, + "loss": 0.8896, + "step": 36090 + }, + { + "epoch": 0.93, + "learning_rate": 1.6204533226138599e-06, + "loss": 0.7554, + "step": 36091 + }, + { + "epoch": 0.93, + "learning_rate": 1.6204316220061278e-06, + "loss": 1.0381, + "step": 36092 + }, + { + "epoch": 0.93, + "learning_rate": 1.6204099209233597e-06, + "loss": 0.7832, + "step": 36093 + }, + { + "epoch": 0.93, + "learning_rate": 1.6203882193655726e-06, + "loss": 1.0586, + "step": 36094 + }, + { + "epoch": 0.93, + "learning_rate": 1.6203665173327825e-06, + "loss": 0.8105, + "step": 36095 + }, + { + "epoch": 0.93, + "learning_rate": 1.6203448148250064e-06, + "loss": 0.7578, + "step": 36096 + }, + { + "epoch": 0.93, + "learning_rate": 1.6203231118422606e-06, + "loss": 0.6323, + "step": 36097 + }, + { + "epoch": 0.93, + "learning_rate": 1.620301408384562e-06, + "loss": 0.8896, + "step": 36098 + }, + { + "epoch": 0.93, + "learning_rate": 1.6202797044519275e-06, + "loss": 0.9102, + "step": 36099 + }, + { + "epoch": 0.93, + "learning_rate": 1.6202580000443732e-06, + "loss": 0.8057, + "step": 36100 + }, + { + "epoch": 0.93, + "learning_rate": 1.6202362951619154e-06, + "loss": 0.9707, + "step": 36101 + }, + { + "epoch": 0.93, + "learning_rate": 1.6202145898045717e-06, + "loss": 0.8594, + "step": 36102 + }, + { + "epoch": 0.93, + "learning_rate": 1.6201928839723577e-06, + "loss": 0.6189, + "step": 36103 + }, + { + "epoch": 0.93, + "learning_rate": 1.620171177665291e-06, + "loss": 0.8379, + "step": 36104 + }, + { + "epoch": 0.93, + "learning_rate": 1.6201494708833879e-06, + "loss": 1.0322, + "step": 36105 + }, + { + "epoch": 0.93, + "learning_rate": 1.6201277636266642e-06, + "loss": 0.8457, + "step": 36106 + }, + { + "epoch": 0.93, + "learning_rate": 1.6201060558951376e-06, + "loss": 0.9512, + "step": 36107 + }, + { + "epoch": 0.93, + "learning_rate": 1.6200843476888242e-06, + "loss": 1.0449, + "step": 36108 + }, + { + "epoch": 0.93, + "learning_rate": 1.6200626390077407e-06, + "loss": 1.0049, + "step": 36109 + }, + { + "epoch": 0.93, + "learning_rate": 1.6200409298519039e-06, + "loss": 0.8711, + "step": 36110 + }, + { + "epoch": 0.93, + "learning_rate": 1.6200192202213303e-06, + "loss": 0.752, + "step": 36111 + }, + { + "epoch": 0.93, + "learning_rate": 1.6199975101160363e-06, + "loss": 0.8657, + "step": 36112 + }, + { + "epoch": 0.93, + "learning_rate": 1.6199757995360388e-06, + "loss": 0.9092, + "step": 36113 + }, + { + "epoch": 0.93, + "learning_rate": 1.6199540884813543e-06, + "loss": 0.8457, + "step": 36114 + }, + { + "epoch": 0.93, + "learning_rate": 1.6199323769519997e-06, + "loss": 0.9141, + "step": 36115 + }, + { + "epoch": 0.93, + "learning_rate": 1.6199106649479913e-06, + "loss": 0.9844, + "step": 36116 + }, + { + "epoch": 0.93, + "learning_rate": 1.6198889524693455e-06, + "loss": 0.999, + "step": 36117 + }, + { + "epoch": 0.93, + "learning_rate": 1.6198672395160796e-06, + "loss": 0.8652, + "step": 36118 + }, + { + "epoch": 0.93, + "learning_rate": 1.6198455260882095e-06, + "loss": 0.7026, + "step": 36119 + }, + { + "epoch": 0.93, + "learning_rate": 1.6198238121857523e-06, + "loss": 0.8306, + "step": 36120 + }, + { + "epoch": 0.93, + "learning_rate": 1.6198020978087246e-06, + "loss": 0.7119, + "step": 36121 + }, + { + "epoch": 0.93, + "learning_rate": 1.619780382957143e-06, + "loss": 0.8887, + "step": 36122 + }, + { + "epoch": 0.93, + "learning_rate": 1.6197586676310237e-06, + "loss": 1.1035, + "step": 36123 + }, + { + "epoch": 0.93, + "learning_rate": 1.6197369518303841e-06, + "loss": 0.7285, + "step": 36124 + }, + { + "epoch": 0.93, + "learning_rate": 1.6197152355552403e-06, + "loss": 1.1201, + "step": 36125 + }, + { + "epoch": 0.93, + "learning_rate": 1.619693518805609e-06, + "loss": 0.8301, + "step": 36126 + }, + { + "epoch": 0.93, + "learning_rate": 1.6196718015815068e-06, + "loss": 0.8311, + "step": 36127 + }, + { + "epoch": 0.93, + "learning_rate": 1.6196500838829503e-06, + "loss": 0.6008, + "step": 36128 + }, + { + "epoch": 0.93, + "learning_rate": 1.6196283657099565e-06, + "loss": 0.8721, + "step": 36129 + }, + { + "epoch": 0.93, + "learning_rate": 1.6196066470625417e-06, + "loss": 0.7427, + "step": 36130 + }, + { + "epoch": 0.93, + "learning_rate": 1.6195849279407226e-06, + "loss": 0.7266, + "step": 36131 + }, + { + "epoch": 0.93, + "learning_rate": 1.6195632083445157e-06, + "loss": 0.8701, + "step": 36132 + }, + { + "epoch": 0.93, + "learning_rate": 1.6195414882739375e-06, + "loss": 0.8906, + "step": 36133 + }, + { + "epoch": 0.93, + "learning_rate": 1.6195197677290052e-06, + "loss": 0.9629, + "step": 36134 + }, + { + "epoch": 0.93, + "learning_rate": 1.6194980467097353e-06, + "loss": 0.8213, + "step": 36135 + }, + { + "epoch": 0.93, + "learning_rate": 1.6194763252161439e-06, + "loss": 0.8774, + "step": 36136 + }, + { + "epoch": 0.93, + "learning_rate": 1.6194546032482479e-06, + "loss": 0.8672, + "step": 36137 + }, + { + "epoch": 0.93, + "learning_rate": 1.6194328808060642e-06, + "loss": 0.9336, + "step": 36138 + }, + { + "epoch": 0.93, + "learning_rate": 1.619411157889609e-06, + "loss": 0.9375, + "step": 36139 + }, + { + "epoch": 0.93, + "learning_rate": 1.6193894344988993e-06, + "loss": 0.752, + "step": 36140 + }, + { + "epoch": 0.93, + "learning_rate": 1.6193677106339515e-06, + "loss": 0.7871, + "step": 36141 + }, + { + "epoch": 0.93, + "learning_rate": 1.6193459862947828e-06, + "loss": 0.8672, + "step": 36142 + }, + { + "epoch": 0.93, + "learning_rate": 1.6193242614814088e-06, + "loss": 0.7891, + "step": 36143 + }, + { + "epoch": 0.93, + "learning_rate": 1.6193025361938469e-06, + "loss": 0.8398, + "step": 36144 + }, + { + "epoch": 0.93, + "learning_rate": 1.6192808104321136e-06, + "loss": 0.6797, + "step": 36145 + }, + { + "epoch": 0.93, + "learning_rate": 1.619259084196225e-06, + "loss": 0.8818, + "step": 36146 + }, + { + "epoch": 0.93, + "learning_rate": 1.6192373574861988e-06, + "loss": 0.7966, + "step": 36147 + }, + { + "epoch": 0.93, + "learning_rate": 1.6192156303020507e-06, + "loss": 0.918, + "step": 36148 + }, + { + "epoch": 0.93, + "learning_rate": 1.6191939026437978e-06, + "loss": 0.7119, + "step": 36149 + }, + { + "epoch": 0.93, + "learning_rate": 1.6191721745114567e-06, + "loss": 0.6406, + "step": 36150 + }, + { + "epoch": 0.93, + "learning_rate": 1.6191504459050435e-06, + "loss": 0.793, + "step": 36151 + }, + { + "epoch": 0.93, + "learning_rate": 1.6191287168245754e-06, + "loss": 0.8604, + "step": 36152 + }, + { + "epoch": 0.93, + "learning_rate": 1.6191069872700692e-06, + "loss": 0.9697, + "step": 36153 + }, + { + "epoch": 0.93, + "learning_rate": 1.619085257241541e-06, + "loss": 0.6533, + "step": 36154 + }, + { + "epoch": 0.93, + "learning_rate": 1.619063526739008e-06, + "loss": 0.8359, + "step": 36155 + }, + { + "epoch": 0.93, + "learning_rate": 1.6190417957624863e-06, + "loss": 0.686, + "step": 36156 + }, + { + "epoch": 0.93, + "learning_rate": 1.6190200643119927e-06, + "loss": 0.7314, + "step": 36157 + }, + { + "epoch": 0.93, + "learning_rate": 1.618998332387544e-06, + "loss": 0.8359, + "step": 36158 + }, + { + "epoch": 0.93, + "learning_rate": 1.6189765999891564e-06, + "loss": 0.9033, + "step": 36159 + }, + { + "epoch": 0.93, + "learning_rate": 1.6189548671168475e-06, + "loss": 0.8413, + "step": 36160 + }, + { + "epoch": 0.93, + "learning_rate": 1.618933133770633e-06, + "loss": 0.8223, + "step": 36161 + }, + { + "epoch": 0.93, + "learning_rate": 1.6189113999505298e-06, + "loss": 0.7627, + "step": 36162 + }, + { + "epoch": 0.93, + "learning_rate": 1.6188896656565547e-06, + "loss": 0.7324, + "step": 36163 + }, + { + "epoch": 0.93, + "learning_rate": 1.6188679308887241e-06, + "loss": 0.9434, + "step": 36164 + }, + { + "epoch": 0.93, + "learning_rate": 1.6188461956470549e-06, + "loss": 0.7422, + "step": 36165 + }, + { + "epoch": 0.93, + "learning_rate": 1.6188244599315638e-06, + "loss": 0.7627, + "step": 36166 + }, + { + "epoch": 0.93, + "learning_rate": 1.618802723742267e-06, + "loss": 0.9932, + "step": 36167 + }, + { + "epoch": 0.93, + "learning_rate": 1.6187809870791815e-06, + "loss": 0.8086, + "step": 36168 + }, + { + "epoch": 0.93, + "learning_rate": 1.6187592499423237e-06, + "loss": 0.7295, + "step": 36169 + }, + { + "epoch": 0.93, + "learning_rate": 1.6187375123317106e-06, + "loss": 0.7559, + "step": 36170 + }, + { + "epoch": 0.93, + "learning_rate": 1.6187157742473585e-06, + "loss": 0.8584, + "step": 36171 + }, + { + "epoch": 0.93, + "learning_rate": 1.6186940356892844e-06, + "loss": 1.0635, + "step": 36172 + }, + { + "epoch": 0.93, + "learning_rate": 1.6186722966575044e-06, + "loss": 0.7949, + "step": 36173 + }, + { + "epoch": 0.93, + "learning_rate": 1.6186505571520356e-06, + "loss": 0.9141, + "step": 36174 + }, + { + "epoch": 0.93, + "learning_rate": 1.6186288171728948e-06, + "loss": 0.96, + "step": 36175 + }, + { + "epoch": 0.93, + "learning_rate": 1.6186070767200982e-06, + "loss": 0.546, + "step": 36176 + }, + { + "epoch": 0.93, + "learning_rate": 1.6185853357936624e-06, + "loss": 0.6758, + "step": 36177 + }, + { + "epoch": 0.93, + "learning_rate": 1.6185635943936043e-06, + "loss": 0.9443, + "step": 36178 + }, + { + "epoch": 0.93, + "learning_rate": 1.6185418525199404e-06, + "loss": 0.7969, + "step": 36179 + }, + { + "epoch": 0.93, + "learning_rate": 1.618520110172688e-06, + "loss": 0.7375, + "step": 36180 + }, + { + "epoch": 0.93, + "learning_rate": 1.6184983673518627e-06, + "loss": 0.9453, + "step": 36181 + }, + { + "epoch": 0.93, + "learning_rate": 1.6184766240574817e-06, + "loss": 0.9492, + "step": 36182 + }, + { + "epoch": 0.93, + "learning_rate": 1.6184548802895615e-06, + "loss": 0.8105, + "step": 36183 + }, + { + "epoch": 0.93, + "learning_rate": 1.618433136048119e-06, + "loss": 0.9932, + "step": 36184 + }, + { + "epoch": 0.93, + "learning_rate": 1.6184113913331706e-06, + "loss": 0.5708, + "step": 36185 + }, + { + "epoch": 0.93, + "learning_rate": 1.6183896461447333e-06, + "loss": 0.8906, + "step": 36186 + }, + { + "epoch": 0.93, + "learning_rate": 1.618367900482823e-06, + "loss": 0.9902, + "step": 36187 + }, + { + "epoch": 0.93, + "learning_rate": 1.6183461543474573e-06, + "loss": 0.8096, + "step": 36188 + }, + { + "epoch": 0.93, + "learning_rate": 1.618324407738652e-06, + "loss": 0.6846, + "step": 36189 + }, + { + "epoch": 0.93, + "learning_rate": 1.6183026606564244e-06, + "loss": 0.8359, + "step": 36190 + }, + { + "epoch": 0.93, + "learning_rate": 1.618280913100791e-06, + "loss": 0.9072, + "step": 36191 + }, + { + "epoch": 0.93, + "learning_rate": 1.6182591650717679e-06, + "loss": 0.5708, + "step": 36192 + }, + { + "epoch": 0.93, + "learning_rate": 1.6182374165693724e-06, + "loss": 0.6807, + "step": 36193 + }, + { + "epoch": 0.93, + "learning_rate": 1.618215667593621e-06, + "loss": 0.6753, + "step": 36194 + }, + { + "epoch": 0.93, + "learning_rate": 1.6181939181445303e-06, + "loss": 0.8779, + "step": 36195 + }, + { + "epoch": 0.93, + "learning_rate": 1.6181721682221167e-06, + "loss": 0.7441, + "step": 36196 + }, + { + "epoch": 0.93, + "learning_rate": 1.6181504178263974e-06, + "loss": 0.833, + "step": 36197 + }, + { + "epoch": 0.93, + "learning_rate": 1.6181286669573887e-06, + "loss": 0.8027, + "step": 36198 + }, + { + "epoch": 0.93, + "learning_rate": 1.6181069156151073e-06, + "loss": 0.9863, + "step": 36199 + }, + { + "epoch": 0.93, + "learning_rate": 1.6180851637995695e-06, + "loss": 0.8296, + "step": 36200 + }, + { + "epoch": 0.93, + "learning_rate": 1.6180634115107928e-06, + "loss": 1.0049, + "step": 36201 + }, + { + "epoch": 0.93, + "learning_rate": 1.6180416587487931e-06, + "loss": 0.8345, + "step": 36202 + }, + { + "epoch": 0.93, + "learning_rate": 1.6180199055135875e-06, + "loss": 0.7656, + "step": 36203 + }, + { + "epoch": 0.93, + "learning_rate": 1.6179981518051925e-06, + "loss": 0.876, + "step": 36204 + }, + { + "epoch": 0.93, + "learning_rate": 1.6179763976236242e-06, + "loss": 0.7173, + "step": 36205 + }, + { + "epoch": 0.93, + "learning_rate": 1.6179546429689005e-06, + "loss": 0.7598, + "step": 36206 + }, + { + "epoch": 0.93, + "learning_rate": 1.6179328878410368e-06, + "loss": 0.7495, + "step": 36207 + }, + { + "epoch": 0.93, + "learning_rate": 1.6179111322400506e-06, + "loss": 0.5125, + "step": 36208 + }, + { + "epoch": 0.93, + "learning_rate": 1.6178893761659583e-06, + "loss": 0.8428, + "step": 36209 + }, + { + "epoch": 0.93, + "learning_rate": 1.6178676196187762e-06, + "loss": 0.9209, + "step": 36210 + }, + { + "epoch": 0.93, + "learning_rate": 1.6178458625985214e-06, + "loss": 0.8291, + "step": 36211 + }, + { + "epoch": 0.93, + "learning_rate": 1.6178241051052107e-06, + "loss": 0.6836, + "step": 36212 + }, + { + "epoch": 0.93, + "learning_rate": 1.6178023471388602e-06, + "loss": 0.7969, + "step": 36213 + }, + { + "epoch": 0.93, + "learning_rate": 1.617780588699487e-06, + "loss": 0.7129, + "step": 36214 + }, + { + "epoch": 0.93, + "learning_rate": 1.6177588297871077e-06, + "loss": 0.8076, + "step": 36215 + }, + { + "epoch": 0.93, + "learning_rate": 1.6177370704017386e-06, + "loss": 0.915, + "step": 36216 + }, + { + "epoch": 0.93, + "learning_rate": 1.6177153105433967e-06, + "loss": 0.8594, + "step": 36217 + }, + { + "epoch": 0.93, + "learning_rate": 1.6176935502120986e-06, + "loss": 0.7969, + "step": 36218 + }, + { + "epoch": 0.93, + "learning_rate": 1.617671789407861e-06, + "loss": 0.9248, + "step": 36219 + }, + { + "epoch": 0.93, + "learning_rate": 1.6176500281307006e-06, + "loss": 0.9297, + "step": 36220 + }, + { + "epoch": 0.93, + "learning_rate": 1.6176282663806338e-06, + "loss": 0.79, + "step": 36221 + }, + { + "epoch": 0.93, + "learning_rate": 1.6176065041576776e-06, + "loss": 0.8525, + "step": 36222 + }, + { + "epoch": 0.93, + "learning_rate": 1.617584741461848e-06, + "loss": 0.792, + "step": 36223 + }, + { + "epoch": 0.93, + "learning_rate": 1.6175629782931631e-06, + "loss": 0.9316, + "step": 36224 + }, + { + "epoch": 0.93, + "learning_rate": 1.6175412146516379e-06, + "loss": 0.8457, + "step": 36225 + }, + { + "epoch": 0.93, + "learning_rate": 1.61751945053729e-06, + "loss": 0.9746, + "step": 36226 + }, + { + "epoch": 0.93, + "learning_rate": 1.6174976859501359e-06, + "loss": 0.916, + "step": 36227 + }, + { + "epoch": 0.93, + "learning_rate": 1.6174759208901921e-06, + "loss": 0.9238, + "step": 36228 + }, + { + "epoch": 0.93, + "learning_rate": 1.6174541553574756e-06, + "loss": 0.8262, + "step": 36229 + }, + { + "epoch": 0.93, + "learning_rate": 1.6174323893520026e-06, + "loss": 0.8428, + "step": 36230 + }, + { + "epoch": 0.93, + "learning_rate": 1.6174106228737898e-06, + "loss": 0.7373, + "step": 36231 + }, + { + "epoch": 0.93, + "learning_rate": 1.6173888559228543e-06, + "loss": 0.8418, + "step": 36232 + }, + { + "epoch": 0.93, + "learning_rate": 1.6173670884992129e-06, + "loss": 1.0127, + "step": 36233 + }, + { + "epoch": 0.93, + "learning_rate": 1.6173453206028814e-06, + "loss": 0.6846, + "step": 36234 + }, + { + "epoch": 0.93, + "learning_rate": 1.6173235522338773e-06, + "loss": 0.6431, + "step": 36235 + }, + { + "epoch": 0.93, + "learning_rate": 1.6173017833922167e-06, + "loss": 1.1553, + "step": 36236 + }, + { + "epoch": 0.93, + "learning_rate": 1.6172800140779167e-06, + "loss": 0.9248, + "step": 36237 + }, + { + "epoch": 0.93, + "learning_rate": 1.6172582442909936e-06, + "loss": 0.6699, + "step": 36238 + }, + { + "epoch": 0.93, + "learning_rate": 1.6172364740314646e-06, + "loss": 0.594, + "step": 36239 + }, + { + "epoch": 0.93, + "learning_rate": 1.6172147032993457e-06, + "loss": 0.6385, + "step": 36240 + }, + { + "epoch": 0.93, + "learning_rate": 1.617192932094654e-06, + "loss": 0.9443, + "step": 36241 + }, + { + "epoch": 0.93, + "learning_rate": 1.617171160417406e-06, + "loss": 0.7417, + "step": 36242 + }, + { + "epoch": 0.93, + "learning_rate": 1.6171493882676183e-06, + "loss": 0.8955, + "step": 36243 + }, + { + "epoch": 0.93, + "learning_rate": 1.6171276156453079e-06, + "loss": 0.9307, + "step": 36244 + }, + { + "epoch": 0.93, + "learning_rate": 1.6171058425504911e-06, + "loss": 0.9473, + "step": 36245 + }, + { + "epoch": 0.93, + "learning_rate": 1.6170840689831848e-06, + "loss": 0.8701, + "step": 36246 + }, + { + "epoch": 0.93, + "learning_rate": 1.6170622949434056e-06, + "loss": 0.9277, + "step": 36247 + }, + { + "epoch": 0.93, + "learning_rate": 1.6170405204311704e-06, + "loss": 0.7627, + "step": 36248 + }, + { + "epoch": 0.93, + "learning_rate": 1.6170187454464955e-06, + "loss": 0.8633, + "step": 36249 + }, + { + "epoch": 0.93, + "learning_rate": 1.6169969699893974e-06, + "loss": 0.7759, + "step": 36250 + }, + { + "epoch": 0.93, + "learning_rate": 1.6169751940598934e-06, + "loss": 0.7354, + "step": 36251 + }, + { + "epoch": 0.93, + "learning_rate": 1.6169534176579998e-06, + "loss": 0.9258, + "step": 36252 + }, + { + "epoch": 0.93, + "learning_rate": 1.6169316407837333e-06, + "loss": 0.7549, + "step": 36253 + }, + { + "epoch": 0.93, + "learning_rate": 1.6169098634371107e-06, + "loss": 0.9185, + "step": 36254 + }, + { + "epoch": 0.93, + "learning_rate": 1.6168880856181483e-06, + "loss": 0.9111, + "step": 36255 + }, + { + "epoch": 0.93, + "learning_rate": 1.6168663073268634e-06, + "loss": 0.7178, + "step": 36256 + }, + { + "epoch": 0.93, + "learning_rate": 1.6168445285632721e-06, + "loss": 0.7793, + "step": 36257 + }, + { + "epoch": 0.93, + "learning_rate": 1.6168227493273915e-06, + "loss": 1.0547, + "step": 36258 + }, + { + "epoch": 0.93, + "learning_rate": 1.6168009696192382e-06, + "loss": 0.9746, + "step": 36259 + }, + { + "epoch": 0.93, + "learning_rate": 1.6167791894388284e-06, + "loss": 0.7627, + "step": 36260 + }, + { + "epoch": 0.93, + "learning_rate": 1.6167574087861793e-06, + "loss": 0.752, + "step": 36261 + }, + { + "epoch": 0.93, + "learning_rate": 1.6167356276613075e-06, + "loss": 0.6592, + "step": 36262 + }, + { + "epoch": 0.93, + "learning_rate": 1.6167138460642296e-06, + "loss": 0.6948, + "step": 36263 + }, + { + "epoch": 0.93, + "learning_rate": 1.6166920639949622e-06, + "loss": 0.6924, + "step": 36264 + }, + { + "epoch": 0.93, + "learning_rate": 1.6166702814535218e-06, + "loss": 0.8076, + "step": 36265 + }, + { + "epoch": 0.93, + "learning_rate": 1.6166484984399255e-06, + "loss": 0.8877, + "step": 36266 + }, + { + "epoch": 0.93, + "learning_rate": 1.6166267149541899e-06, + "loss": 0.8555, + "step": 36267 + }, + { + "epoch": 0.93, + "learning_rate": 1.6166049309963314e-06, + "loss": 0.5864, + "step": 36268 + }, + { + "epoch": 0.93, + "learning_rate": 1.6165831465663673e-06, + "loss": 0.6846, + "step": 36269 + }, + { + "epoch": 0.93, + "learning_rate": 1.6165613616643134e-06, + "loss": 0.5808, + "step": 36270 + }, + { + "epoch": 0.93, + "learning_rate": 1.616539576290187e-06, + "loss": 1.0488, + "step": 36271 + }, + { + "epoch": 0.93, + "learning_rate": 1.6165177904440044e-06, + "loss": 0.9189, + "step": 36272 + }, + { + "epoch": 0.93, + "learning_rate": 1.6164960041257825e-06, + "loss": 1.0635, + "step": 36273 + }, + { + "epoch": 0.93, + "learning_rate": 1.6164742173355382e-06, + "loss": 0.8135, + "step": 36274 + }, + { + "epoch": 0.93, + "learning_rate": 1.6164524300732878e-06, + "loss": 0.8975, + "step": 36275 + }, + { + "epoch": 0.93, + "learning_rate": 1.6164306423390479e-06, + "loss": 0.835, + "step": 36276 + }, + { + "epoch": 0.93, + "learning_rate": 1.6164088541328358e-06, + "loss": 0.9072, + "step": 36277 + }, + { + "epoch": 0.93, + "learning_rate": 1.6163870654546675e-06, + "loss": 0.834, + "step": 36278 + }, + { + "epoch": 0.93, + "learning_rate": 1.6163652763045601e-06, + "loss": 0.7007, + "step": 36279 + }, + { + "epoch": 0.93, + "learning_rate": 1.61634348668253e-06, + "loss": 0.9268, + "step": 36280 + }, + { + "epoch": 0.93, + "learning_rate": 1.616321696588594e-06, + "loss": 0.8174, + "step": 36281 + }, + { + "epoch": 0.93, + "learning_rate": 1.616299906022769e-06, + "loss": 0.6924, + "step": 36282 + }, + { + "epoch": 0.93, + "learning_rate": 1.6162781149850715e-06, + "loss": 0.9102, + "step": 36283 + }, + { + "epoch": 0.93, + "learning_rate": 1.6162563234755183e-06, + "loss": 0.9375, + "step": 36284 + }, + { + "epoch": 0.93, + "learning_rate": 1.6162345314941257e-06, + "loss": 0.877, + "step": 36285 + }, + { + "epoch": 0.93, + "learning_rate": 1.6162127390409107e-06, + "loss": 0.8164, + "step": 36286 + }, + { + "epoch": 0.93, + "learning_rate": 1.61619094611589e-06, + "loss": 0.8022, + "step": 36287 + }, + { + "epoch": 0.93, + "learning_rate": 1.6161691527190801e-06, + "loss": 0.7148, + "step": 36288 + }, + { + "epoch": 0.93, + "learning_rate": 1.616147358850498e-06, + "loss": 0.9189, + "step": 36289 + }, + { + "epoch": 0.93, + "learning_rate": 1.6161255645101602e-06, + "loss": 0.9512, + "step": 36290 + }, + { + "epoch": 0.93, + "learning_rate": 1.6161037696980834e-06, + "loss": 0.791, + "step": 36291 + }, + { + "epoch": 0.93, + "learning_rate": 1.6160819744142841e-06, + "loss": 0.5991, + "step": 36292 + }, + { + "epoch": 0.93, + "learning_rate": 1.6160601786587793e-06, + "loss": 0.6641, + "step": 36293 + }, + { + "epoch": 0.93, + "learning_rate": 1.6160383824315855e-06, + "loss": 0.5469, + "step": 36294 + }, + { + "epoch": 0.93, + "learning_rate": 1.6160165857327195e-06, + "loss": 0.5046, + "step": 36295 + }, + { + "epoch": 0.93, + "learning_rate": 1.6159947885621978e-06, + "loss": 0.7725, + "step": 36296 + }, + { + "epoch": 0.93, + "learning_rate": 1.6159729909200372e-06, + "loss": 0.8599, + "step": 36297 + }, + { + "epoch": 0.93, + "learning_rate": 1.6159511928062545e-06, + "loss": 0.8242, + "step": 36298 + }, + { + "epoch": 0.93, + "learning_rate": 1.6159293942208666e-06, + "loss": 0.918, + "step": 36299 + }, + { + "epoch": 0.93, + "learning_rate": 1.6159075951638894e-06, + "loss": 0.9131, + "step": 36300 + }, + { + "epoch": 0.93, + "learning_rate": 1.6158857956353402e-06, + "loss": 1.0127, + "step": 36301 + }, + { + "epoch": 0.93, + "learning_rate": 1.6158639956352355e-06, + "loss": 0.917, + "step": 36302 + }, + { + "epoch": 0.93, + "learning_rate": 1.615842195163592e-06, + "loss": 0.5266, + "step": 36303 + }, + { + "epoch": 0.93, + "learning_rate": 1.615820394220427e-06, + "loss": 0.6777, + "step": 36304 + }, + { + "epoch": 0.93, + "learning_rate": 1.6157985928057562e-06, + "loss": 0.8418, + "step": 36305 + }, + { + "epoch": 0.93, + "learning_rate": 1.6157767909195967e-06, + "loss": 0.751, + "step": 36306 + }, + { + "epoch": 0.93, + "learning_rate": 1.6157549885619653e-06, + "loss": 0.793, + "step": 36307 + }, + { + "epoch": 0.93, + "learning_rate": 1.6157331857328784e-06, + "loss": 0.8154, + "step": 36308 + }, + { + "epoch": 0.93, + "learning_rate": 1.6157113824323534e-06, + "loss": 0.9004, + "step": 36309 + }, + { + "epoch": 0.93, + "learning_rate": 1.6156895786604063e-06, + "loss": 0.9111, + "step": 36310 + }, + { + "epoch": 0.93, + "learning_rate": 1.6156677744170537e-06, + "loss": 0.6958, + "step": 36311 + }, + { + "epoch": 0.93, + "learning_rate": 1.6156459697023127e-06, + "loss": 0.9229, + "step": 36312 + }, + { + "epoch": 0.93, + "learning_rate": 1.6156241645162001e-06, + "loss": 0.9014, + "step": 36313 + }, + { + "epoch": 0.93, + "learning_rate": 1.6156023588587325e-06, + "loss": 0.8311, + "step": 36314 + }, + { + "epoch": 0.93, + "learning_rate": 1.6155805527299262e-06, + "loss": 0.8672, + "step": 36315 + }, + { + "epoch": 0.93, + "learning_rate": 1.6155587461297984e-06, + "loss": 0.6958, + "step": 36316 + }, + { + "epoch": 0.93, + "learning_rate": 1.6155369390583653e-06, + "loss": 0.897, + "step": 36317 + }, + { + "epoch": 0.93, + "learning_rate": 1.615515131515644e-06, + "loss": 0.7812, + "step": 36318 + }, + { + "epoch": 0.93, + "learning_rate": 1.6154933235016513e-06, + "loss": 0.999, + "step": 36319 + }, + { + "epoch": 0.93, + "learning_rate": 1.6154715150164034e-06, + "loss": 0.7578, + "step": 36320 + }, + { + "epoch": 0.93, + "learning_rate": 1.6154497060599173e-06, + "loss": 0.8975, + "step": 36321 + }, + { + "epoch": 0.93, + "learning_rate": 1.6154278966322097e-06, + "loss": 0.8721, + "step": 36322 + }, + { + "epoch": 0.93, + "learning_rate": 1.615406086733297e-06, + "loss": 0.7627, + "step": 36323 + }, + { + "epoch": 0.93, + "learning_rate": 1.6153842763631965e-06, + "loss": 0.9248, + "step": 36324 + }, + { + "epoch": 0.93, + "learning_rate": 1.6153624655219243e-06, + "loss": 0.603, + "step": 36325 + }, + { + "epoch": 0.93, + "learning_rate": 1.6153406542094974e-06, + "loss": 0.873, + "step": 36326 + }, + { + "epoch": 0.93, + "learning_rate": 1.6153188424259328e-06, + "loss": 0.7842, + "step": 36327 + }, + { + "epoch": 0.93, + "learning_rate": 1.6152970301712466e-06, + "loss": 0.9043, + "step": 36328 + }, + { + "epoch": 0.93, + "learning_rate": 1.615275217445456e-06, + "loss": 0.6538, + "step": 36329 + }, + { + "epoch": 0.93, + "learning_rate": 1.6152534042485768e-06, + "loss": 0.7334, + "step": 36330 + }, + { + "epoch": 0.93, + "learning_rate": 1.6152315905806267e-06, + "loss": 0.8984, + "step": 36331 + }, + { + "epoch": 0.93, + "learning_rate": 1.6152097764416221e-06, + "loss": 0.9082, + "step": 36332 + }, + { + "epoch": 0.93, + "learning_rate": 1.6151879618315797e-06, + "loss": 0.9785, + "step": 36333 + }, + { + "epoch": 0.93, + "learning_rate": 1.6151661467505165e-06, + "loss": 0.8398, + "step": 36334 + }, + { + "epoch": 0.93, + "learning_rate": 1.6151443311984484e-06, + "loss": 0.8379, + "step": 36335 + }, + { + "epoch": 0.93, + "learning_rate": 1.6151225151753924e-06, + "loss": 0.7671, + "step": 36336 + }, + { + "epoch": 0.93, + "learning_rate": 1.6151006986813658e-06, + "loss": 0.8584, + "step": 36337 + }, + { + "epoch": 0.93, + "learning_rate": 1.6150788817163848e-06, + "loss": 1.0107, + "step": 36338 + }, + { + "epoch": 0.93, + "learning_rate": 1.6150570642804663e-06, + "loss": 0.9824, + "step": 36339 + }, + { + "epoch": 0.93, + "learning_rate": 1.6150352463736266e-06, + "loss": 0.9424, + "step": 36340 + }, + { + "epoch": 0.93, + "learning_rate": 1.6150134279958828e-06, + "loss": 0.9238, + "step": 36341 + }, + { + "epoch": 0.93, + "learning_rate": 1.6149916091472515e-06, + "loss": 0.8735, + "step": 36342 + }, + { + "epoch": 0.93, + "learning_rate": 1.6149697898277492e-06, + "loss": 0.9297, + "step": 36343 + }, + { + "epoch": 0.93, + "learning_rate": 1.614947970037393e-06, + "loss": 0.8779, + "step": 36344 + }, + { + "epoch": 0.93, + "learning_rate": 1.6149261497761995e-06, + "loss": 0.7388, + "step": 36345 + }, + { + "epoch": 0.93, + "learning_rate": 1.6149043290441852e-06, + "loss": 0.7749, + "step": 36346 + }, + { + "epoch": 0.93, + "learning_rate": 1.614882507841367e-06, + "loss": 0.8848, + "step": 36347 + }, + { + "epoch": 0.93, + "learning_rate": 1.6148606861677615e-06, + "loss": 0.71, + "step": 36348 + }, + { + "epoch": 0.93, + "learning_rate": 1.6148388640233854e-06, + "loss": 0.9463, + "step": 36349 + }, + { + "epoch": 0.93, + "learning_rate": 1.6148170414082558e-06, + "loss": 0.9326, + "step": 36350 + }, + { + "epoch": 0.93, + "learning_rate": 1.6147952183223886e-06, + "loss": 0.9531, + "step": 36351 + }, + { + "epoch": 0.93, + "learning_rate": 1.614773394765801e-06, + "loss": 0.8398, + "step": 36352 + }, + { + "epoch": 0.93, + "learning_rate": 1.6147515707385097e-06, + "loss": 0.8193, + "step": 36353 + }, + { + "epoch": 0.93, + "learning_rate": 1.6147297462405318e-06, + "loss": 0.6724, + "step": 36354 + }, + { + "epoch": 0.93, + "learning_rate": 1.6147079212718832e-06, + "loss": 0.7988, + "step": 36355 + }, + { + "epoch": 0.93, + "learning_rate": 1.6146860958325811e-06, + "loss": 0.999, + "step": 36356 + }, + { + "epoch": 0.93, + "learning_rate": 1.6146642699226423e-06, + "loss": 0.6785, + "step": 36357 + }, + { + "epoch": 0.93, + "learning_rate": 1.6146424435420832e-06, + "loss": 0.5757, + "step": 36358 + }, + { + "epoch": 0.93, + "learning_rate": 1.6146206166909205e-06, + "loss": 0.8086, + "step": 36359 + }, + { + "epoch": 0.93, + "learning_rate": 1.6145987893691712e-06, + "loss": 0.8994, + "step": 36360 + }, + { + "epoch": 0.93, + "learning_rate": 1.6145769615768518e-06, + "loss": 0.7529, + "step": 36361 + }, + { + "epoch": 0.93, + "learning_rate": 1.6145551333139792e-06, + "loss": 0.7925, + "step": 36362 + }, + { + "epoch": 0.93, + "learning_rate": 1.6145333045805698e-06, + "loss": 0.7197, + "step": 36363 + }, + { + "epoch": 0.93, + "learning_rate": 1.6145114753766408e-06, + "loss": 1.1016, + "step": 36364 + }, + { + "epoch": 0.93, + "learning_rate": 1.6144896457022083e-06, + "loss": 0.8711, + "step": 36365 + }, + { + "epoch": 0.93, + "learning_rate": 1.6144678155572894e-06, + "loss": 0.9971, + "step": 36366 + }, + { + "epoch": 0.93, + "learning_rate": 1.614445984941901e-06, + "loss": 0.6147, + "step": 36367 + }, + { + "epoch": 0.93, + "learning_rate": 1.6144241538560594e-06, + "loss": 0.708, + "step": 36368 + }, + { + "epoch": 0.93, + "learning_rate": 1.6144023222997816e-06, + "loss": 0.7153, + "step": 36369 + }, + { + "epoch": 0.93, + "learning_rate": 1.614380490273084e-06, + "loss": 1.166, + "step": 36370 + }, + { + "epoch": 0.93, + "learning_rate": 1.6143586577759834e-06, + "loss": 0.8955, + "step": 36371 + }, + { + "epoch": 0.93, + "learning_rate": 1.6143368248084967e-06, + "loss": 0.8682, + "step": 36372 + }, + { + "epoch": 0.93, + "learning_rate": 1.6143149913706409e-06, + "loss": 0.7754, + "step": 36373 + }, + { + "epoch": 0.93, + "learning_rate": 1.614293157462432e-06, + "loss": 1.0127, + "step": 36374 + }, + { + "epoch": 0.93, + "learning_rate": 1.6142713230838872e-06, + "loss": 0.8086, + "step": 36375 + }, + { + "epoch": 0.93, + "learning_rate": 1.6142494882350231e-06, + "loss": 0.7422, + "step": 36376 + }, + { + "epoch": 0.93, + "learning_rate": 1.6142276529158561e-06, + "loss": 0.7734, + "step": 36377 + }, + { + "epoch": 0.93, + "learning_rate": 1.6142058171264035e-06, + "loss": 0.8174, + "step": 36378 + }, + { + "epoch": 0.93, + "learning_rate": 1.6141839808666816e-06, + "loss": 0.9482, + "step": 36379 + }, + { + "epoch": 0.93, + "learning_rate": 1.6141621441367078e-06, + "loss": 0.6279, + "step": 36380 + }, + { + "epoch": 0.93, + "learning_rate": 1.6141403069364979e-06, + "loss": 0.8018, + "step": 36381 + }, + { + "epoch": 0.93, + "learning_rate": 1.6141184692660688e-06, + "loss": 0.9307, + "step": 36382 + }, + { + "epoch": 0.93, + "learning_rate": 1.6140966311254376e-06, + "loss": 0.6909, + "step": 36383 + }, + { + "epoch": 0.93, + "learning_rate": 1.614074792514621e-06, + "loss": 0.8711, + "step": 36384 + }, + { + "epoch": 0.93, + "learning_rate": 1.6140529534336354e-06, + "loss": 0.7896, + "step": 36385 + }, + { + "epoch": 0.93, + "learning_rate": 1.6140311138824978e-06, + "loss": 0.8745, + "step": 36386 + }, + { + "epoch": 0.93, + "learning_rate": 1.6140092738612246e-06, + "loss": 0.9854, + "step": 36387 + }, + { + "epoch": 0.93, + "learning_rate": 1.6139874333698328e-06, + "loss": 0.9551, + "step": 36388 + }, + { + "epoch": 0.93, + "learning_rate": 1.6139655924083392e-06, + "loss": 0.6592, + "step": 36389 + }, + { + "epoch": 0.93, + "learning_rate": 1.61394375097676e-06, + "loss": 0.8872, + "step": 36390 + }, + { + "epoch": 0.93, + "learning_rate": 1.6139219090751128e-06, + "loss": 0.8662, + "step": 36391 + }, + { + "epoch": 0.93, + "learning_rate": 1.6139000667034138e-06, + "loss": 0.7686, + "step": 36392 + }, + { + "epoch": 0.93, + "learning_rate": 1.6138782238616794e-06, + "loss": 0.8496, + "step": 36393 + }, + { + "epoch": 0.93, + "learning_rate": 1.6138563805499267e-06, + "loss": 0.9512, + "step": 36394 + }, + { + "epoch": 0.93, + "learning_rate": 1.6138345367681727e-06, + "loss": 0.6885, + "step": 36395 + }, + { + "epoch": 0.93, + "learning_rate": 1.6138126925164337e-06, + "loss": 0.8662, + "step": 36396 + }, + { + "epoch": 0.93, + "learning_rate": 1.6137908477947264e-06, + "loss": 0.5215, + "step": 36397 + }, + { + "epoch": 0.93, + "learning_rate": 1.6137690026030677e-06, + "loss": 0.792, + "step": 36398 + }, + { + "epoch": 0.93, + "learning_rate": 1.6137471569414744e-06, + "loss": 0.9824, + "step": 36399 + }, + { + "epoch": 0.93, + "learning_rate": 1.6137253108099632e-06, + "loss": 0.8799, + "step": 36400 + }, + { + "epoch": 0.93, + "learning_rate": 1.6137034642085507e-06, + "loss": 0.8506, + "step": 36401 + }, + { + "epoch": 0.93, + "learning_rate": 1.6136816171372535e-06, + "loss": 0.9365, + "step": 36402 + }, + { + "epoch": 0.93, + "learning_rate": 1.6136597695960888e-06, + "loss": 0.8418, + "step": 36403 + }, + { + "epoch": 0.93, + "learning_rate": 1.6136379215850729e-06, + "loss": 0.8848, + "step": 36404 + }, + { + "epoch": 0.93, + "learning_rate": 1.6136160731042226e-06, + "loss": 1.0, + "step": 36405 + }, + { + "epoch": 0.93, + "learning_rate": 1.6135942241535545e-06, + "loss": 0.7598, + "step": 36406 + }, + { + "epoch": 0.93, + "learning_rate": 1.6135723747330859e-06, + "loss": 0.8457, + "step": 36407 + }, + { + "epoch": 0.93, + "learning_rate": 1.6135505248428327e-06, + "loss": 0.8857, + "step": 36408 + }, + { + "epoch": 0.93, + "learning_rate": 1.6135286744828125e-06, + "loss": 0.6611, + "step": 36409 + }, + { + "epoch": 0.93, + "learning_rate": 1.6135068236530414e-06, + "loss": 0.957, + "step": 36410 + }, + { + "epoch": 0.93, + "learning_rate": 1.6134849723535365e-06, + "loss": 0.614, + "step": 36411 + }, + { + "epoch": 0.93, + "learning_rate": 1.6134631205843142e-06, + "loss": 0.9082, + "step": 36412 + }, + { + "epoch": 0.93, + "learning_rate": 1.6134412683453913e-06, + "loss": 0.7598, + "step": 36413 + }, + { + "epoch": 0.93, + "learning_rate": 1.6134194156367849e-06, + "loss": 0.6328, + "step": 36414 + }, + { + "epoch": 0.93, + "learning_rate": 1.6133975624585111e-06, + "loss": 0.6685, + "step": 36415 + }, + { + "epoch": 0.93, + "learning_rate": 1.6133757088105873e-06, + "loss": 0.707, + "step": 36416 + }, + { + "epoch": 0.93, + "learning_rate": 1.6133538546930298e-06, + "loss": 0.7603, + "step": 36417 + }, + { + "epoch": 0.93, + "learning_rate": 1.6133320001058555e-06, + "loss": 0.874, + "step": 36418 + }, + { + "epoch": 0.93, + "learning_rate": 1.613310145049081e-06, + "loss": 0.9385, + "step": 36419 + }, + { + "epoch": 0.93, + "learning_rate": 1.6132882895227234e-06, + "loss": 0.8369, + "step": 36420 + }, + { + "epoch": 0.93, + "learning_rate": 1.6132664335267988e-06, + "loss": 0.8145, + "step": 36421 + }, + { + "epoch": 0.93, + "learning_rate": 1.6132445770613242e-06, + "loss": 1.0977, + "step": 36422 + }, + { + "epoch": 0.93, + "learning_rate": 1.6132227201263169e-06, + "loss": 0.8232, + "step": 36423 + }, + { + "epoch": 0.93, + "learning_rate": 1.613200862721793e-06, + "loss": 0.9912, + "step": 36424 + }, + { + "epoch": 0.93, + "learning_rate": 1.6131790048477694e-06, + "loss": 0.6582, + "step": 36425 + }, + { + "epoch": 0.93, + "learning_rate": 1.6131571465042627e-06, + "loss": 0.9053, + "step": 36426 + }, + { + "epoch": 0.93, + "learning_rate": 1.61313528769129e-06, + "loss": 0.7568, + "step": 36427 + }, + { + "epoch": 0.93, + "learning_rate": 1.6131134284088675e-06, + "loss": 0.959, + "step": 36428 + }, + { + "epoch": 0.93, + "learning_rate": 1.6130915686570123e-06, + "loss": 0.6694, + "step": 36429 + }, + { + "epoch": 0.93, + "learning_rate": 1.6130697084357411e-06, + "loss": 0.9551, + "step": 36430 + }, + { + "epoch": 0.93, + "learning_rate": 1.6130478477450708e-06, + "loss": 0.8779, + "step": 36431 + }, + { + "epoch": 0.93, + "learning_rate": 1.6130259865850178e-06, + "loss": 0.8945, + "step": 36432 + }, + { + "epoch": 0.93, + "learning_rate": 1.6130041249555988e-06, + "loss": 0.8174, + "step": 36433 + }, + { + "epoch": 0.93, + "learning_rate": 1.612982262856831e-06, + "loss": 0.7461, + "step": 36434 + }, + { + "epoch": 0.93, + "learning_rate": 1.6129604002887309e-06, + "loss": 0.8203, + "step": 36435 + }, + { + "epoch": 0.93, + "learning_rate": 1.612938537251315e-06, + "loss": 0.8223, + "step": 36436 + }, + { + "epoch": 0.93, + "learning_rate": 1.6129166737446005e-06, + "loss": 0.8872, + "step": 36437 + }, + { + "epoch": 0.93, + "learning_rate": 1.6128948097686038e-06, + "loss": 0.7358, + "step": 36438 + }, + { + "epoch": 0.93, + "learning_rate": 1.6128729453233415e-06, + "loss": 0.8672, + "step": 36439 + }, + { + "epoch": 0.93, + "learning_rate": 1.6128510804088307e-06, + "loss": 0.812, + "step": 36440 + }, + { + "epoch": 0.93, + "learning_rate": 1.6128292150250879e-06, + "loss": 0.8135, + "step": 36441 + }, + { + "epoch": 0.93, + "learning_rate": 1.6128073491721303e-06, + "loss": 1.0586, + "step": 36442 + }, + { + "epoch": 0.93, + "learning_rate": 1.6127854828499737e-06, + "loss": 0.9297, + "step": 36443 + }, + { + "epoch": 0.93, + "learning_rate": 1.6127636160586363e-06, + "loss": 0.8623, + "step": 36444 + }, + { + "epoch": 0.93, + "learning_rate": 1.6127417487981334e-06, + "loss": 0.793, + "step": 36445 + }, + { + "epoch": 0.93, + "learning_rate": 1.6127198810684822e-06, + "loss": 0.8301, + "step": 36446 + }, + { + "epoch": 0.93, + "learning_rate": 1.6126980128696998e-06, + "loss": 0.792, + "step": 36447 + }, + { + "epoch": 0.93, + "learning_rate": 1.6126761442018027e-06, + "loss": 0.917, + "step": 36448 + }, + { + "epoch": 0.93, + "learning_rate": 1.6126542750648078e-06, + "loss": 0.8066, + "step": 36449 + }, + { + "epoch": 0.93, + "learning_rate": 1.6126324054587314e-06, + "loss": 0.8169, + "step": 36450 + }, + { + "epoch": 0.93, + "learning_rate": 1.6126105353835905e-06, + "loss": 1.0352, + "step": 36451 + }, + { + "epoch": 0.93, + "learning_rate": 1.6125886648394022e-06, + "loss": 0.8613, + "step": 36452 + }, + { + "epoch": 0.93, + "learning_rate": 1.6125667938261828e-06, + "loss": 0.8398, + "step": 36453 + }, + { + "epoch": 0.93, + "learning_rate": 1.612544922343949e-06, + "loss": 0.9414, + "step": 36454 + }, + { + "epoch": 0.93, + "learning_rate": 1.612523050392718e-06, + "loss": 0.7998, + "step": 36455 + }, + { + "epoch": 0.93, + "learning_rate": 1.612501177972506e-06, + "loss": 0.7534, + "step": 36456 + }, + { + "epoch": 0.93, + "learning_rate": 1.61247930508333e-06, + "loss": 1.0186, + "step": 36457 + }, + { + "epoch": 0.93, + "learning_rate": 1.6124574317252068e-06, + "loss": 0.8975, + "step": 36458 + }, + { + "epoch": 0.93, + "learning_rate": 1.6124355578981534e-06, + "loss": 0.5931, + "step": 36459 + }, + { + "epoch": 0.93, + "learning_rate": 1.612413683602186e-06, + "loss": 1.0215, + "step": 36460 + }, + { + "epoch": 0.93, + "learning_rate": 1.6123918088373217e-06, + "loss": 0.8096, + "step": 36461 + }, + { + "epoch": 0.93, + "learning_rate": 1.612369933603577e-06, + "loss": 0.8633, + "step": 36462 + }, + { + "epoch": 0.93, + "learning_rate": 1.6123480579009688e-06, + "loss": 0.8025, + "step": 36463 + }, + { + "epoch": 0.93, + "learning_rate": 1.612326181729514e-06, + "loss": 0.8633, + "step": 36464 + }, + { + "epoch": 0.93, + "learning_rate": 1.6123043050892293e-06, + "loss": 0.8115, + "step": 36465 + }, + { + "epoch": 0.93, + "learning_rate": 1.612282427980131e-06, + "loss": 1.0059, + "step": 36466 + }, + { + "epoch": 0.93, + "learning_rate": 1.6122605504022365e-06, + "loss": 0.792, + "step": 36467 + }, + { + "epoch": 0.93, + "learning_rate": 1.6122386723555619e-06, + "loss": 0.8232, + "step": 36468 + }, + { + "epoch": 0.93, + "learning_rate": 1.6122167938401248e-06, + "loss": 0.9033, + "step": 36469 + }, + { + "epoch": 0.93, + "learning_rate": 1.612194914855941e-06, + "loss": 0.8867, + "step": 36470 + }, + { + "epoch": 0.93, + "learning_rate": 1.612173035403028e-06, + "loss": 0.9072, + "step": 36471 + }, + { + "epoch": 0.93, + "learning_rate": 1.612151155481402e-06, + "loss": 0.7412, + "step": 36472 + }, + { + "epoch": 0.93, + "learning_rate": 1.6121292750910802e-06, + "loss": 0.8389, + "step": 36473 + }, + { + "epoch": 0.93, + "learning_rate": 1.6121073942320793e-06, + "loss": 0.8525, + "step": 36474 + }, + { + "epoch": 0.93, + "learning_rate": 1.6120855129044158e-06, + "loss": 0.7393, + "step": 36475 + }, + { + "epoch": 0.93, + "learning_rate": 1.6120636311081063e-06, + "loss": 1.0225, + "step": 36476 + }, + { + "epoch": 0.93, + "learning_rate": 1.612041748843168e-06, + "loss": 0.7546, + "step": 36477 + }, + { + "epoch": 0.93, + "learning_rate": 1.6120198661096173e-06, + "loss": 0.7568, + "step": 36478 + }, + { + "epoch": 0.93, + "learning_rate": 1.6119979829074714e-06, + "loss": 0.8965, + "step": 36479 + }, + { + "epoch": 0.94, + "learning_rate": 1.6119760992367468e-06, + "loss": 0.8564, + "step": 36480 + }, + { + "epoch": 0.94, + "learning_rate": 1.61195421509746e-06, + "loss": 0.9961, + "step": 36481 + }, + { + "epoch": 0.94, + "learning_rate": 1.6119323304896282e-06, + "loss": 0.7666, + "step": 36482 + }, + { + "epoch": 0.94, + "learning_rate": 1.6119104454132679e-06, + "loss": 1.0234, + "step": 36483 + }, + { + "epoch": 0.94, + "learning_rate": 1.611888559868396e-06, + "loss": 0.8223, + "step": 36484 + }, + { + "epoch": 0.94, + "learning_rate": 1.611866673855029e-06, + "loss": 0.6924, + "step": 36485 + }, + { + "epoch": 0.94, + "learning_rate": 1.611844787373184e-06, + "loss": 0.8252, + "step": 36486 + }, + { + "epoch": 0.94, + "learning_rate": 1.6118229004228772e-06, + "loss": 0.7607, + "step": 36487 + }, + { + "epoch": 0.94, + "learning_rate": 1.6118010130041263e-06, + "loss": 1.1455, + "step": 36488 + }, + { + "epoch": 0.94, + "learning_rate": 1.611779125116947e-06, + "loss": 0.8955, + "step": 36489 + }, + { + "epoch": 0.94, + "learning_rate": 1.6117572367613567e-06, + "loss": 0.8438, + "step": 36490 + }, + { + "epoch": 0.94, + "learning_rate": 1.6117353479373721e-06, + "loss": 0.832, + "step": 36491 + }, + { + "epoch": 0.94, + "learning_rate": 1.61171345864501e-06, + "loss": 0.8848, + "step": 36492 + }, + { + "epoch": 0.94, + "learning_rate": 1.6116915688842868e-06, + "loss": 0.8066, + "step": 36493 + }, + { + "epoch": 0.94, + "learning_rate": 1.6116696786552195e-06, + "loss": 0.6528, + "step": 36494 + }, + { + "epoch": 0.94, + "learning_rate": 1.611647787957825e-06, + "loss": 0.8599, + "step": 36495 + }, + { + "epoch": 0.94, + "learning_rate": 1.6116258967921197e-06, + "loss": 1.0117, + "step": 36496 + }, + { + "epoch": 0.94, + "learning_rate": 1.6116040051581207e-06, + "loss": 0.7578, + "step": 36497 + }, + { + "epoch": 0.94, + "learning_rate": 1.6115821130558449e-06, + "loss": 0.7754, + "step": 36498 + }, + { + "epoch": 0.94, + "learning_rate": 1.6115602204853084e-06, + "loss": 0.7686, + "step": 36499 + }, + { + "epoch": 0.94, + "learning_rate": 1.6115383274465284e-06, + "loss": 0.8447, + "step": 36500 + }, + { + "epoch": 0.94, + "learning_rate": 1.6115164339395217e-06, + "loss": 0.9902, + "step": 36501 + }, + { + "epoch": 0.94, + "learning_rate": 1.611494539964305e-06, + "loss": 0.7695, + "step": 36502 + }, + { + "epoch": 0.94, + "learning_rate": 1.6114726455208951e-06, + "loss": 1.0117, + "step": 36503 + }, + { + "epoch": 0.94, + "learning_rate": 1.6114507506093085e-06, + "loss": 0.8887, + "step": 36504 + }, + { + "epoch": 0.94, + "learning_rate": 1.6114288552295623e-06, + "loss": 0.9053, + "step": 36505 + }, + { + "epoch": 0.94, + "learning_rate": 1.6114069593816733e-06, + "loss": 0.7656, + "step": 36506 + }, + { + "epoch": 0.94, + "learning_rate": 1.6113850630656578e-06, + "loss": 0.8359, + "step": 36507 + }, + { + "epoch": 0.94, + "learning_rate": 1.6113631662815332e-06, + "loss": 0.7705, + "step": 36508 + }, + { + "epoch": 0.94, + "learning_rate": 1.611341269029316e-06, + "loss": 0.7153, + "step": 36509 + }, + { + "epoch": 0.94, + "learning_rate": 1.6113193713090226e-06, + "loss": 0.9111, + "step": 36510 + }, + { + "epoch": 0.94, + "learning_rate": 1.6112974731206702e-06, + "loss": 0.7969, + "step": 36511 + }, + { + "epoch": 0.94, + "learning_rate": 1.6112755744642751e-06, + "loss": 0.6035, + "step": 36512 + }, + { + "epoch": 0.94, + "learning_rate": 1.611253675339855e-06, + "loss": 1.0859, + "step": 36513 + }, + { + "epoch": 0.94, + "learning_rate": 1.6112317757474256e-06, + "loss": 0.7871, + "step": 36514 + }, + { + "epoch": 0.94, + "learning_rate": 1.6112098756870043e-06, + "loss": 0.6855, + "step": 36515 + }, + { + "epoch": 0.94, + "learning_rate": 1.6111879751586078e-06, + "loss": 0.9609, + "step": 36516 + }, + { + "epoch": 0.94, + "learning_rate": 1.6111660741622526e-06, + "loss": 0.7441, + "step": 36517 + }, + { + "epoch": 0.94, + "learning_rate": 1.6111441726979558e-06, + "loss": 0.8223, + "step": 36518 + }, + { + "epoch": 0.94, + "learning_rate": 1.6111222707657337e-06, + "loss": 0.8047, + "step": 36519 + }, + { + "epoch": 0.94, + "learning_rate": 1.6111003683656038e-06, + "loss": 0.8955, + "step": 36520 + }, + { + "epoch": 0.94, + "learning_rate": 1.611078465497582e-06, + "loss": 0.9355, + "step": 36521 + }, + { + "epoch": 0.94, + "learning_rate": 1.6110565621616856e-06, + "loss": 0.9248, + "step": 36522 + }, + { + "epoch": 0.94, + "learning_rate": 1.6110346583579318e-06, + "loss": 0.7515, + "step": 36523 + }, + { + "epoch": 0.94, + "learning_rate": 1.6110127540863364e-06, + "loss": 0.8643, + "step": 36524 + }, + { + "epoch": 0.94, + "learning_rate": 1.6109908493469166e-06, + "loss": 0.8965, + "step": 36525 + }, + { + "epoch": 0.94, + "learning_rate": 1.6109689441396892e-06, + "loss": 0.9834, + "step": 36526 + }, + { + "epoch": 0.94, + "learning_rate": 1.6109470384646713e-06, + "loss": 0.8516, + "step": 36527 + }, + { + "epoch": 0.94, + "learning_rate": 1.610925132321879e-06, + "loss": 0.6544, + "step": 36528 + }, + { + "epoch": 0.94, + "learning_rate": 1.6109032257113294e-06, + "loss": 0.9062, + "step": 36529 + }, + { + "epoch": 0.94, + "learning_rate": 1.6108813186330397e-06, + "loss": 0.7104, + "step": 36530 + }, + { + "epoch": 0.94, + "learning_rate": 1.610859411087026e-06, + "loss": 0.6309, + "step": 36531 + }, + { + "epoch": 0.94, + "learning_rate": 1.6108375030733053e-06, + "loss": 0.8071, + "step": 36532 + }, + { + "epoch": 0.94, + "learning_rate": 1.6108155945918945e-06, + "loss": 0.7695, + "step": 36533 + }, + { + "epoch": 0.94, + "learning_rate": 1.61079368564281e-06, + "loss": 0.6934, + "step": 36534 + }, + { + "epoch": 0.94, + "learning_rate": 1.6107717762260693e-06, + "loss": 0.8555, + "step": 36535 + }, + { + "epoch": 0.94, + "learning_rate": 1.6107498663416886e-06, + "loss": 0.6992, + "step": 36536 + }, + { + "epoch": 0.94, + "learning_rate": 1.6107279559896845e-06, + "loss": 0.9014, + "step": 36537 + }, + { + "epoch": 0.94, + "learning_rate": 1.6107060451700748e-06, + "loss": 1.0371, + "step": 36538 + }, + { + "epoch": 0.94, + "learning_rate": 1.610684133882875e-06, + "loss": 0.8467, + "step": 36539 + }, + { + "epoch": 0.94, + "learning_rate": 1.6106622221281024e-06, + "loss": 0.7715, + "step": 36540 + }, + { + "epoch": 0.94, + "learning_rate": 1.610640309905774e-06, + "loss": 1.0537, + "step": 36541 + }, + { + "epoch": 0.94, + "learning_rate": 1.6106183972159062e-06, + "loss": 0.7109, + "step": 36542 + }, + { + "epoch": 0.94, + "learning_rate": 1.6105964840585163e-06, + "loss": 0.8887, + "step": 36543 + }, + { + "epoch": 0.94, + "learning_rate": 1.6105745704336205e-06, + "loss": 0.8457, + "step": 36544 + }, + { + "epoch": 0.94, + "learning_rate": 1.6105526563412358e-06, + "loss": 0.7256, + "step": 36545 + }, + { + "epoch": 0.94, + "learning_rate": 1.610530741781379e-06, + "loss": 1.0742, + "step": 36546 + }, + { + "epoch": 0.94, + "learning_rate": 1.6105088267540672e-06, + "loss": 0.6411, + "step": 36547 + }, + { + "epoch": 0.94, + "learning_rate": 1.6104869112593167e-06, + "loss": 0.8853, + "step": 36548 + }, + { + "epoch": 0.94, + "learning_rate": 1.610464995297144e-06, + "loss": 0.7915, + "step": 36549 + }, + { + "epoch": 0.94, + "learning_rate": 1.6104430788675668e-06, + "loss": 0.5938, + "step": 36550 + }, + { + "epoch": 0.94, + "learning_rate": 1.6104211619706014e-06, + "loss": 1.0566, + "step": 36551 + }, + { + "epoch": 0.94, + "learning_rate": 1.6103992446062643e-06, + "loss": 1.2383, + "step": 36552 + }, + { + "epoch": 0.94, + "learning_rate": 1.6103773267745729e-06, + "loss": 0.8545, + "step": 36553 + }, + { + "epoch": 0.94, + "learning_rate": 1.6103554084755435e-06, + "loss": 0.6982, + "step": 36554 + }, + { + "epoch": 0.94, + "learning_rate": 1.6103334897091928e-06, + "loss": 0.6545, + "step": 36555 + }, + { + "epoch": 0.94, + "learning_rate": 1.6103115704755384e-06, + "loss": 0.8867, + "step": 36556 + }, + { + "epoch": 0.94, + "learning_rate": 1.610289650774596e-06, + "loss": 0.8193, + "step": 36557 + }, + { + "epoch": 0.94, + "learning_rate": 1.6102677306063832e-06, + "loss": 0.7656, + "step": 36558 + }, + { + "epoch": 0.94, + "learning_rate": 1.6102458099709163e-06, + "loss": 0.8994, + "step": 36559 + }, + { + "epoch": 0.94, + "learning_rate": 1.610223888868212e-06, + "loss": 0.7017, + "step": 36560 + }, + { + "epoch": 0.94, + "learning_rate": 1.6102019672982876e-06, + "loss": 1.0264, + "step": 36561 + }, + { + "epoch": 0.94, + "learning_rate": 1.6101800452611593e-06, + "loss": 0.8643, + "step": 36562 + }, + { + "epoch": 0.94, + "learning_rate": 1.6101581227568449e-06, + "loss": 0.7559, + "step": 36563 + }, + { + "epoch": 0.94, + "learning_rate": 1.61013619978536e-06, + "loss": 0.7031, + "step": 36564 + }, + { + "epoch": 0.94, + "learning_rate": 1.6101142763467217e-06, + "loss": 0.9399, + "step": 36565 + }, + { + "epoch": 0.94, + "learning_rate": 1.6100923524409474e-06, + "loss": 0.7574, + "step": 36566 + }, + { + "epoch": 0.94, + "learning_rate": 1.6100704280680529e-06, + "loss": 0.7783, + "step": 36567 + }, + { + "epoch": 0.94, + "learning_rate": 1.610048503228056e-06, + "loss": 0.8164, + "step": 36568 + }, + { + "epoch": 0.94, + "learning_rate": 1.6100265779209728e-06, + "loss": 0.96, + "step": 36569 + }, + { + "epoch": 0.94, + "learning_rate": 1.6100046521468204e-06, + "loss": 0.9277, + "step": 36570 + }, + { + "epoch": 0.94, + "learning_rate": 1.6099827259056154e-06, + "loss": 0.7808, + "step": 36571 + }, + { + "epoch": 0.94, + "learning_rate": 1.6099607991973744e-06, + "loss": 0.7339, + "step": 36572 + }, + { + "epoch": 0.94, + "learning_rate": 1.609938872022115e-06, + "loss": 0.803, + "step": 36573 + }, + { + "epoch": 0.94, + "learning_rate": 1.609916944379853e-06, + "loss": 0.8701, + "step": 36574 + }, + { + "epoch": 0.94, + "learning_rate": 1.609895016270606e-06, + "loss": 0.833, + "step": 36575 + }, + { + "epoch": 0.94, + "learning_rate": 1.6098730876943903e-06, + "loss": 0.9854, + "step": 36576 + }, + { + "epoch": 0.94, + "learning_rate": 1.6098511586512228e-06, + "loss": 0.8145, + "step": 36577 + }, + { + "epoch": 0.94, + "learning_rate": 1.6098292291411202e-06, + "loss": 0.9766, + "step": 36578 + }, + { + "epoch": 0.94, + "learning_rate": 1.6098072991640996e-06, + "loss": 0.8779, + "step": 36579 + }, + { + "epoch": 0.94, + "learning_rate": 1.6097853687201774e-06, + "loss": 0.9072, + "step": 36580 + }, + { + "epoch": 0.94, + "learning_rate": 1.6097634378093705e-06, + "loss": 0.9937, + "step": 36581 + }, + { + "epoch": 0.94, + "learning_rate": 1.609741506431696e-06, + "loss": 0.8452, + "step": 36582 + }, + { + "epoch": 0.94, + "learning_rate": 1.6097195745871707e-06, + "loss": 0.8408, + "step": 36583 + }, + { + "epoch": 0.94, + "learning_rate": 1.6096976422758108e-06, + "loss": 0.6943, + "step": 36584 + }, + { + "epoch": 0.94, + "learning_rate": 1.6096757094976334e-06, + "loss": 0.8311, + "step": 36585 + }, + { + "epoch": 0.94, + "learning_rate": 1.6096537762526556e-06, + "loss": 0.8184, + "step": 36586 + }, + { + "epoch": 0.94, + "learning_rate": 1.6096318425408938e-06, + "loss": 0.71, + "step": 36587 + }, + { + "epoch": 0.94, + "learning_rate": 1.6096099083623649e-06, + "loss": 0.7852, + "step": 36588 + }, + { + "epoch": 0.94, + "learning_rate": 1.609587973717086e-06, + "loss": 0.8721, + "step": 36589 + }, + { + "epoch": 0.94, + "learning_rate": 1.6095660386050732e-06, + "loss": 0.6183, + "step": 36590 + }, + { + "epoch": 0.94, + "learning_rate": 1.6095441030263438e-06, + "loss": 0.6328, + "step": 36591 + }, + { + "epoch": 0.94, + "learning_rate": 1.6095221669809145e-06, + "loss": 0.9648, + "step": 36592 + }, + { + "epoch": 0.94, + "learning_rate": 1.6095002304688024e-06, + "loss": 0.9092, + "step": 36593 + }, + { + "epoch": 0.94, + "learning_rate": 1.6094782934900235e-06, + "loss": 0.7471, + "step": 36594 + }, + { + "epoch": 0.94, + "learning_rate": 1.6094563560445955e-06, + "loss": 0.9199, + "step": 36595 + }, + { + "epoch": 0.94, + "learning_rate": 1.6094344181325345e-06, + "loss": 0.8066, + "step": 36596 + }, + { + "epoch": 0.94, + "learning_rate": 1.6094124797538577e-06, + "loss": 0.9619, + "step": 36597 + }, + { + "epoch": 0.94, + "learning_rate": 1.6093905409085822e-06, + "loss": 0.7197, + "step": 36598 + }, + { + "epoch": 0.94, + "learning_rate": 1.6093686015967238e-06, + "loss": 0.8809, + "step": 36599 + }, + { + "epoch": 0.94, + "learning_rate": 1.6093466618183003e-06, + "loss": 0.8491, + "step": 36600 + }, + { + "epoch": 0.94, + "learning_rate": 1.6093247215733276e-06, + "loss": 0.7925, + "step": 36601 + }, + { + "epoch": 0.94, + "learning_rate": 1.6093027808618235e-06, + "loss": 0.9189, + "step": 36602 + }, + { + "epoch": 0.94, + "learning_rate": 1.6092808396838042e-06, + "loss": 0.6055, + "step": 36603 + }, + { + "epoch": 0.94, + "learning_rate": 1.6092588980392864e-06, + "loss": 1.0059, + "step": 36604 + }, + { + "epoch": 0.94, + "learning_rate": 1.609236955928287e-06, + "loss": 0.6143, + "step": 36605 + }, + { + "epoch": 0.94, + "learning_rate": 1.609215013350823e-06, + "loss": 0.7993, + "step": 36606 + }, + { + "epoch": 0.94, + "learning_rate": 1.609193070306911e-06, + "loss": 0.79, + "step": 36607 + }, + { + "epoch": 0.94, + "learning_rate": 1.6091711267965683e-06, + "loss": 0.769, + "step": 36608 + }, + { + "epoch": 0.94, + "learning_rate": 1.6091491828198107e-06, + "loss": 0.814, + "step": 36609 + }, + { + "epoch": 0.94, + "learning_rate": 1.6091272383766557e-06, + "loss": 0.4893, + "step": 36610 + }, + { + "epoch": 0.94, + "learning_rate": 1.60910529346712e-06, + "loss": 0.7451, + "step": 36611 + }, + { + "epoch": 0.94, + "learning_rate": 1.6090833480912205e-06, + "loss": 0.3989, + "step": 36612 + }, + { + "epoch": 0.94, + "learning_rate": 1.6090614022489738e-06, + "loss": 0.7778, + "step": 36613 + }, + { + "epoch": 0.94, + "learning_rate": 1.609039455940397e-06, + "loss": 0.7949, + "step": 36614 + }, + { + "epoch": 0.94, + "learning_rate": 1.6090175091655065e-06, + "loss": 0.7178, + "step": 36615 + }, + { + "epoch": 0.94, + "learning_rate": 1.6089955619243193e-06, + "loss": 0.916, + "step": 36616 + }, + { + "epoch": 0.94, + "learning_rate": 1.6089736142168523e-06, + "loss": 0.8428, + "step": 36617 + }, + { + "epoch": 0.94, + "learning_rate": 1.6089516660431222e-06, + "loss": 0.7793, + "step": 36618 + }, + { + "epoch": 0.94, + "learning_rate": 1.6089297174031456e-06, + "loss": 1.0469, + "step": 36619 + }, + { + "epoch": 0.94, + "learning_rate": 1.6089077682969397e-06, + "loss": 1.0537, + "step": 36620 + }, + { + "epoch": 0.94, + "learning_rate": 1.6088858187245208e-06, + "loss": 0.8252, + "step": 36621 + }, + { + "epoch": 0.94, + "learning_rate": 1.6088638686859065e-06, + "loss": 0.958, + "step": 36622 + }, + { + "epoch": 0.94, + "learning_rate": 1.608841918181113e-06, + "loss": 0.8555, + "step": 36623 + }, + { + "epoch": 0.94, + "learning_rate": 1.6088199672101572e-06, + "loss": 0.71, + "step": 36624 + }, + { + "epoch": 0.94, + "learning_rate": 1.608798015773056e-06, + "loss": 0.7476, + "step": 36625 + }, + { + "epoch": 0.94, + "learning_rate": 1.608776063869826e-06, + "loss": 0.9004, + "step": 36626 + }, + { + "epoch": 0.94, + "learning_rate": 1.608754111500484e-06, + "loss": 0.7598, + "step": 36627 + }, + { + "epoch": 0.94, + "learning_rate": 1.6087321586650476e-06, + "loss": 0.8975, + "step": 36628 + }, + { + "epoch": 0.94, + "learning_rate": 1.6087102053635324e-06, + "loss": 0.6021, + "step": 36629 + }, + { + "epoch": 0.94, + "learning_rate": 1.6086882515959559e-06, + "loss": 0.8247, + "step": 36630 + }, + { + "epoch": 0.94, + "learning_rate": 1.6086662973623348e-06, + "loss": 0.8789, + "step": 36631 + }, + { + "epoch": 0.94, + "learning_rate": 1.608644342662686e-06, + "loss": 0.7148, + "step": 36632 + }, + { + "epoch": 0.94, + "learning_rate": 1.6086223874970264e-06, + "loss": 0.8369, + "step": 36633 + }, + { + "epoch": 0.94, + "learning_rate": 1.6086004318653724e-06, + "loss": 0.8047, + "step": 36634 + }, + { + "epoch": 0.94, + "learning_rate": 1.6085784757677408e-06, + "loss": 0.6885, + "step": 36635 + }, + { + "epoch": 0.94, + "learning_rate": 1.608556519204149e-06, + "loss": 0.8848, + "step": 36636 + }, + { + "epoch": 0.94, + "learning_rate": 1.6085345621746132e-06, + "loss": 0.8364, + "step": 36637 + }, + { + "epoch": 0.94, + "learning_rate": 1.6085126046791507e-06, + "loss": 0.7988, + "step": 36638 + }, + { + "epoch": 0.94, + "learning_rate": 1.608490646717778e-06, + "loss": 0.8408, + "step": 36639 + }, + { + "epoch": 0.94, + "learning_rate": 1.6084686882905118e-06, + "loss": 0.9219, + "step": 36640 + }, + { + "epoch": 0.94, + "learning_rate": 1.6084467293973693e-06, + "loss": 0.7549, + "step": 36641 + }, + { + "epoch": 0.94, + "learning_rate": 1.608424770038367e-06, + "loss": 0.7939, + "step": 36642 + }, + { + "epoch": 0.94, + "learning_rate": 1.6084028102135221e-06, + "loss": 0.7041, + "step": 36643 + }, + { + "epoch": 0.94, + "learning_rate": 1.608380849922851e-06, + "loss": 0.6001, + "step": 36644 + }, + { + "epoch": 0.94, + "learning_rate": 1.6083588891663706e-06, + "loss": 0.9277, + "step": 36645 + }, + { + "epoch": 0.94, + "learning_rate": 1.6083369279440976e-06, + "loss": 0.7925, + "step": 36646 + }, + { + "epoch": 0.94, + "learning_rate": 1.6083149662560494e-06, + "loss": 0.7212, + "step": 36647 + }, + { + "epoch": 0.94, + "learning_rate": 1.6082930041022421e-06, + "loss": 0.8271, + "step": 36648 + }, + { + "epoch": 0.94, + "learning_rate": 1.608271041482693e-06, + "loss": 0.9668, + "step": 36649 + }, + { + "epoch": 0.94, + "learning_rate": 1.6082490783974186e-06, + "loss": 0.6892, + "step": 36650 + }, + { + "epoch": 0.94, + "learning_rate": 1.6082271148464358e-06, + "loss": 0.9375, + "step": 36651 + }, + { + "epoch": 0.94, + "learning_rate": 1.6082051508297615e-06, + "loss": 0.8096, + "step": 36652 + }, + { + "epoch": 0.94, + "learning_rate": 1.6081831863474124e-06, + "loss": 0.7368, + "step": 36653 + }, + { + "epoch": 0.94, + "learning_rate": 1.6081612213994058e-06, + "loss": 0.7031, + "step": 36654 + }, + { + "epoch": 0.94, + "learning_rate": 1.6081392559857576e-06, + "loss": 0.876, + "step": 36655 + }, + { + "epoch": 0.94, + "learning_rate": 1.6081172901064855e-06, + "loss": 0.6968, + "step": 36656 + }, + { + "epoch": 0.94, + "learning_rate": 1.6080953237616056e-06, + "loss": 0.9873, + "step": 36657 + }, + { + "epoch": 0.94, + "learning_rate": 1.6080733569511352e-06, + "loss": 0.7666, + "step": 36658 + }, + { + "epoch": 0.94, + "learning_rate": 1.6080513896750913e-06, + "loss": 1.0215, + "step": 36659 + }, + { + "epoch": 0.94, + "learning_rate": 1.6080294219334902e-06, + "loss": 0.7705, + "step": 36660 + }, + { + "epoch": 0.94, + "learning_rate": 1.608007453726349e-06, + "loss": 0.9844, + "step": 36661 + }, + { + "epoch": 0.94, + "learning_rate": 1.6079854850536842e-06, + "loss": 0.771, + "step": 36662 + }, + { + "epoch": 0.94, + "learning_rate": 1.6079635159155132e-06, + "loss": 0.8599, + "step": 36663 + }, + { + "epoch": 0.94, + "learning_rate": 1.6079415463118524e-06, + "loss": 0.8887, + "step": 36664 + }, + { + "epoch": 0.94, + "learning_rate": 1.6079195762427185e-06, + "loss": 0.9824, + "step": 36665 + }, + { + "epoch": 0.94, + "learning_rate": 1.6078976057081288e-06, + "loss": 0.8301, + "step": 36666 + }, + { + "epoch": 0.94, + "learning_rate": 1.6078756347080997e-06, + "loss": 0.6367, + "step": 36667 + }, + { + "epoch": 0.94, + "learning_rate": 1.6078536632426483e-06, + "loss": 1.0039, + "step": 36668 + }, + { + "epoch": 0.94, + "learning_rate": 1.607831691311791e-06, + "loss": 0.8564, + "step": 36669 + }, + { + "epoch": 0.94, + "learning_rate": 1.6078097189155452e-06, + "loss": 0.6245, + "step": 36670 + }, + { + "epoch": 0.94, + "learning_rate": 1.6077877460539273e-06, + "loss": 1.0015, + "step": 36671 + }, + { + "epoch": 0.94, + "learning_rate": 1.6077657727269544e-06, + "loss": 0.8506, + "step": 36672 + }, + { + "epoch": 0.94, + "learning_rate": 1.6077437989346434e-06, + "loss": 0.7358, + "step": 36673 + }, + { + "epoch": 0.94, + "learning_rate": 1.6077218246770104e-06, + "loss": 0.8584, + "step": 36674 + }, + { + "epoch": 0.94, + "learning_rate": 1.607699849954073e-06, + "loss": 0.9551, + "step": 36675 + }, + { + "epoch": 0.94, + "learning_rate": 1.6076778747658479e-06, + "loss": 0.9688, + "step": 36676 + }, + { + "epoch": 0.94, + "learning_rate": 1.6076558991123514e-06, + "loss": 0.8584, + "step": 36677 + }, + { + "epoch": 0.94, + "learning_rate": 1.6076339229936013e-06, + "loss": 0.8662, + "step": 36678 + }, + { + "epoch": 0.94, + "learning_rate": 1.6076119464096137e-06, + "loss": 0.9351, + "step": 36679 + }, + { + "epoch": 0.94, + "learning_rate": 1.6075899693604051e-06, + "loss": 0.9873, + "step": 36680 + }, + { + "epoch": 0.94, + "learning_rate": 1.6075679918459933e-06, + "loss": 0.7842, + "step": 36681 + }, + { + "epoch": 0.94, + "learning_rate": 1.6075460138663942e-06, + "loss": 0.6494, + "step": 36682 + }, + { + "epoch": 0.94, + "learning_rate": 1.6075240354216254e-06, + "loss": 0.9121, + "step": 36683 + }, + { + "epoch": 0.94, + "learning_rate": 1.6075020565117033e-06, + "loss": 0.7881, + "step": 36684 + }, + { + "epoch": 0.94, + "learning_rate": 1.6074800771366445e-06, + "loss": 0.7578, + "step": 36685 + }, + { + "epoch": 0.94, + "learning_rate": 1.6074580972964666e-06, + "loss": 0.8975, + "step": 36686 + }, + { + "epoch": 0.94, + "learning_rate": 1.6074361169911857e-06, + "loss": 0.7451, + "step": 36687 + }, + { + "epoch": 0.94, + "learning_rate": 1.6074141362208188e-06, + "loss": 0.771, + "step": 36688 + }, + { + "epoch": 0.94, + "learning_rate": 1.607392154985383e-06, + "loss": 0.6157, + "step": 36689 + }, + { + "epoch": 0.94, + "learning_rate": 1.6073701732848953e-06, + "loss": 0.8564, + "step": 36690 + }, + { + "epoch": 0.94, + "learning_rate": 1.6073481911193716e-06, + "loss": 0.9326, + "step": 36691 + }, + { + "epoch": 0.94, + "learning_rate": 1.6073262084888295e-06, + "loss": 1.1191, + "step": 36692 + }, + { + "epoch": 0.94, + "learning_rate": 1.6073042253932859e-06, + "loss": 0.9004, + "step": 36693 + }, + { + "epoch": 0.94, + "learning_rate": 1.6072822418327572e-06, + "loss": 0.8833, + "step": 36694 + }, + { + "epoch": 0.94, + "learning_rate": 1.6072602578072603e-06, + "loss": 0.8877, + "step": 36695 + }, + { + "epoch": 0.94, + "learning_rate": 1.6072382733168122e-06, + "loss": 0.7676, + "step": 36696 + }, + { + "epoch": 0.94, + "learning_rate": 1.6072162883614294e-06, + "loss": 0.6724, + "step": 36697 + }, + { + "epoch": 0.94, + "learning_rate": 1.6071943029411298e-06, + "loss": 0.8506, + "step": 36698 + }, + { + "epoch": 0.94, + "learning_rate": 1.6071723170559288e-06, + "loss": 0.7041, + "step": 36699 + }, + { + "epoch": 0.94, + "learning_rate": 1.607150330705844e-06, + "loss": 0.8057, + "step": 36700 + }, + { + "epoch": 0.94, + "learning_rate": 1.607128343890892e-06, + "loss": 0.749, + "step": 36701 + }, + { + "epoch": 0.94, + "learning_rate": 1.60710635661109e-06, + "loss": 0.9736, + "step": 36702 + }, + { + "epoch": 0.94, + "learning_rate": 1.6070843688664546e-06, + "loss": 0.8691, + "step": 36703 + }, + { + "epoch": 0.94, + "learning_rate": 1.6070623806570023e-06, + "loss": 1.082, + "step": 36704 + }, + { + "epoch": 0.94, + "learning_rate": 1.6070403919827506e-06, + "loss": 1.0273, + "step": 36705 + }, + { + "epoch": 0.94, + "learning_rate": 1.6070184028437156e-06, + "loss": 0.8838, + "step": 36706 + }, + { + "epoch": 0.94, + "learning_rate": 1.6069964132399147e-06, + "loss": 0.7666, + "step": 36707 + }, + { + "epoch": 0.94, + "learning_rate": 1.6069744231713646e-06, + "loss": 0.8135, + "step": 36708 + }, + { + "epoch": 0.94, + "learning_rate": 1.6069524326380823e-06, + "loss": 0.7568, + "step": 36709 + }, + { + "epoch": 0.94, + "learning_rate": 1.6069304416400842e-06, + "loss": 0.7734, + "step": 36710 + }, + { + "epoch": 0.94, + "learning_rate": 1.6069084501773873e-06, + "loss": 0.9238, + "step": 36711 + }, + { + "epoch": 0.94, + "learning_rate": 1.6068864582500086e-06, + "loss": 0.5776, + "step": 36712 + }, + { + "epoch": 0.94, + "learning_rate": 1.606864465857965e-06, + "loss": 0.876, + "step": 36713 + }, + { + "epoch": 0.94, + "learning_rate": 1.6068424730012731e-06, + "loss": 0.9404, + "step": 36714 + }, + { + "epoch": 0.94, + "learning_rate": 1.6068204796799494e-06, + "loss": 1.002, + "step": 36715 + }, + { + "epoch": 0.94, + "learning_rate": 1.6067984858940116e-06, + "loss": 0.6699, + "step": 36716 + }, + { + "epoch": 0.94, + "learning_rate": 1.606776491643476e-06, + "loss": 0.7275, + "step": 36717 + }, + { + "epoch": 0.94, + "learning_rate": 1.6067544969283597e-06, + "loss": 0.9316, + "step": 36718 + }, + { + "epoch": 0.94, + "learning_rate": 1.606732501748679e-06, + "loss": 1.0498, + "step": 36719 + }, + { + "epoch": 0.94, + "learning_rate": 1.6067105061044514e-06, + "loss": 0.709, + "step": 36720 + }, + { + "epoch": 0.94, + "learning_rate": 1.6066885099956933e-06, + "loss": 0.9033, + "step": 36721 + }, + { + "epoch": 0.94, + "learning_rate": 1.606666513422422e-06, + "loss": 0.6382, + "step": 36722 + }, + { + "epoch": 0.94, + "learning_rate": 1.6066445163846539e-06, + "loss": 0.7324, + "step": 36723 + }, + { + "epoch": 0.94, + "learning_rate": 1.6066225188824058e-06, + "loss": 0.958, + "step": 36724 + }, + { + "epoch": 0.94, + "learning_rate": 1.606600520915695e-06, + "loss": 0.8828, + "step": 36725 + }, + { + "epoch": 0.94, + "learning_rate": 1.6065785224845378e-06, + "loss": 0.8789, + "step": 36726 + }, + { + "epoch": 0.94, + "learning_rate": 1.6065565235889515e-06, + "loss": 0.7031, + "step": 36727 + }, + { + "epoch": 0.94, + "learning_rate": 1.6065345242289527e-06, + "loss": 0.835, + "step": 36728 + }, + { + "epoch": 0.94, + "learning_rate": 1.6065125244045583e-06, + "loss": 0.6587, + "step": 36729 + }, + { + "epoch": 0.94, + "learning_rate": 1.6064905241157853e-06, + "loss": 0.5886, + "step": 36730 + }, + { + "epoch": 0.94, + "learning_rate": 1.60646852336265e-06, + "loss": 0.9912, + "step": 36731 + }, + { + "epoch": 0.94, + "learning_rate": 1.60644652214517e-06, + "loss": 0.9395, + "step": 36732 + }, + { + "epoch": 0.94, + "learning_rate": 1.6064245204633617e-06, + "loss": 0.8467, + "step": 36733 + }, + { + "epoch": 0.94, + "learning_rate": 1.606402518317242e-06, + "loss": 0.7959, + "step": 36734 + }, + { + "epoch": 0.94, + "learning_rate": 1.606380515706828e-06, + "loss": 0.9189, + "step": 36735 + }, + { + "epoch": 0.94, + "learning_rate": 1.6063585126321359e-06, + "loss": 0.7979, + "step": 36736 + }, + { + "epoch": 0.94, + "learning_rate": 1.6063365090931833e-06, + "loss": 0.8721, + "step": 36737 + }, + { + "epoch": 0.94, + "learning_rate": 1.6063145050899866e-06, + "loss": 0.6851, + "step": 36738 + }, + { + "epoch": 0.94, + "learning_rate": 1.6062925006225627e-06, + "loss": 0.7402, + "step": 36739 + }, + { + "epoch": 0.94, + "learning_rate": 1.6062704956909286e-06, + "loss": 0.8086, + "step": 36740 + }, + { + "epoch": 0.94, + "learning_rate": 1.606248490295101e-06, + "loss": 0.7065, + "step": 36741 + }, + { + "epoch": 0.94, + "learning_rate": 1.6062264844350968e-06, + "loss": 0.8516, + "step": 36742 + }, + { + "epoch": 0.94, + "learning_rate": 1.606204478110933e-06, + "loss": 0.8457, + "step": 36743 + }, + { + "epoch": 0.94, + "learning_rate": 1.6061824713226262e-06, + "loss": 0.9531, + "step": 36744 + }, + { + "epoch": 0.94, + "learning_rate": 1.6061604640701933e-06, + "loss": 0.8525, + "step": 36745 + }, + { + "epoch": 0.94, + "learning_rate": 1.6061384563536512e-06, + "loss": 0.6855, + "step": 36746 + }, + { + "epoch": 0.94, + "learning_rate": 1.606116448173017e-06, + "loss": 0.5852, + "step": 36747 + }, + { + "epoch": 0.94, + "learning_rate": 1.6060944395283072e-06, + "loss": 0.8467, + "step": 36748 + }, + { + "epoch": 0.94, + "learning_rate": 1.6060724304195383e-06, + "loss": 1.0449, + "step": 36749 + }, + { + "epoch": 0.94, + "learning_rate": 1.6060504208467283e-06, + "loss": 0.8496, + "step": 36750 + }, + { + "epoch": 0.94, + "learning_rate": 1.606028410809893e-06, + "loss": 0.5876, + "step": 36751 + }, + { + "epoch": 0.94, + "learning_rate": 1.6060064003090496e-06, + "loss": 0.9053, + "step": 36752 + }, + { + "epoch": 0.94, + "learning_rate": 1.6059843893442149e-06, + "loss": 0.8291, + "step": 36753 + }, + { + "epoch": 0.94, + "learning_rate": 1.6059623779154058e-06, + "loss": 0.9688, + "step": 36754 + }, + { + "epoch": 0.94, + "learning_rate": 1.6059403660226395e-06, + "loss": 0.8379, + "step": 36755 + }, + { + "epoch": 0.94, + "learning_rate": 1.6059183536659324e-06, + "loss": 0.8281, + "step": 36756 + }, + { + "epoch": 0.94, + "learning_rate": 1.6058963408453012e-06, + "loss": 0.7578, + "step": 36757 + }, + { + "epoch": 0.94, + "learning_rate": 1.6058743275607634e-06, + "loss": 0.8101, + "step": 36758 + }, + { + "epoch": 0.94, + "learning_rate": 1.6058523138123352e-06, + "loss": 0.9409, + "step": 36759 + }, + { + "epoch": 0.94, + "learning_rate": 1.605830299600034e-06, + "loss": 0.8242, + "step": 36760 + }, + { + "epoch": 0.94, + "learning_rate": 1.6058082849238761e-06, + "loss": 0.9248, + "step": 36761 + }, + { + "epoch": 0.94, + "learning_rate": 1.6057862697838788e-06, + "loss": 1.0156, + "step": 36762 + }, + { + "epoch": 0.94, + "learning_rate": 1.605764254180059e-06, + "loss": 0.9922, + "step": 36763 + }, + { + "epoch": 0.94, + "learning_rate": 1.605742238112433e-06, + "loss": 0.6904, + "step": 36764 + }, + { + "epoch": 0.94, + "learning_rate": 1.6057202215810183e-06, + "loss": 0.9961, + "step": 36765 + }, + { + "epoch": 0.94, + "learning_rate": 1.6056982045858315e-06, + "loss": 0.7861, + "step": 36766 + }, + { + "epoch": 0.94, + "learning_rate": 1.6056761871268894e-06, + "loss": 0.8516, + "step": 36767 + }, + { + "epoch": 0.94, + "learning_rate": 1.6056541692042086e-06, + "loss": 0.7261, + "step": 36768 + }, + { + "epoch": 0.94, + "learning_rate": 1.6056321508178066e-06, + "loss": 0.7871, + "step": 36769 + }, + { + "epoch": 0.94, + "learning_rate": 1.6056101319676997e-06, + "loss": 0.8682, + "step": 36770 + }, + { + "epoch": 0.94, + "learning_rate": 1.605588112653905e-06, + "loss": 0.9756, + "step": 36771 + }, + { + "epoch": 0.94, + "learning_rate": 1.6055660928764393e-06, + "loss": 0.9844, + "step": 36772 + }, + { + "epoch": 0.94, + "learning_rate": 1.6055440726353195e-06, + "loss": 0.873, + "step": 36773 + }, + { + "epoch": 0.94, + "learning_rate": 1.6055220519305626e-06, + "loss": 0.835, + "step": 36774 + }, + { + "epoch": 0.94, + "learning_rate": 1.6055000307621853e-06, + "loss": 1.001, + "step": 36775 + }, + { + "epoch": 0.94, + "learning_rate": 1.6054780091302043e-06, + "loss": 0.8506, + "step": 36776 + }, + { + "epoch": 0.94, + "learning_rate": 1.6054559870346367e-06, + "loss": 0.8115, + "step": 36777 + }, + { + "epoch": 0.94, + "learning_rate": 1.6054339644754996e-06, + "loss": 0.7075, + "step": 36778 + }, + { + "epoch": 0.94, + "learning_rate": 1.6054119414528091e-06, + "loss": 0.7642, + "step": 36779 + }, + { + "epoch": 0.94, + "learning_rate": 1.6053899179665824e-06, + "loss": 0.9297, + "step": 36780 + }, + { + "epoch": 0.94, + "learning_rate": 1.6053678940168366e-06, + "loss": 0.9375, + "step": 36781 + }, + { + "epoch": 0.94, + "learning_rate": 1.6053458696035889e-06, + "loss": 0.833, + "step": 36782 + }, + { + "epoch": 0.94, + "learning_rate": 1.6053238447268553e-06, + "loss": 0.8701, + "step": 36783 + }, + { + "epoch": 0.94, + "learning_rate": 1.6053018193866532e-06, + "loss": 0.9707, + "step": 36784 + }, + { + "epoch": 0.94, + "learning_rate": 1.6052797935829992e-06, + "loss": 0.7939, + "step": 36785 + }, + { + "epoch": 0.94, + "learning_rate": 1.6052577673159104e-06, + "loss": 0.8198, + "step": 36786 + }, + { + "epoch": 0.94, + "learning_rate": 1.6052357405854035e-06, + "loss": 0.7764, + "step": 36787 + }, + { + "epoch": 0.94, + "learning_rate": 1.6052137133914956e-06, + "loss": 0.9912, + "step": 36788 + }, + { + "epoch": 0.94, + "learning_rate": 1.6051916857342032e-06, + "loss": 0.75, + "step": 36789 + }, + { + "epoch": 0.94, + "learning_rate": 1.6051696576135435e-06, + "loss": 1.0244, + "step": 36790 + }, + { + "epoch": 0.94, + "learning_rate": 1.6051476290295328e-06, + "loss": 0.7441, + "step": 36791 + }, + { + "epoch": 0.94, + "learning_rate": 1.6051255999821888e-06, + "loss": 0.8013, + "step": 36792 + }, + { + "epoch": 0.94, + "learning_rate": 1.605103570471528e-06, + "loss": 0.7422, + "step": 36793 + }, + { + "epoch": 0.94, + "learning_rate": 1.6050815404975671e-06, + "loss": 1.0225, + "step": 36794 + }, + { + "epoch": 0.94, + "learning_rate": 1.6050595100603231e-06, + "loss": 0.6857, + "step": 36795 + }, + { + "epoch": 0.94, + "learning_rate": 1.6050374791598127e-06, + "loss": 0.792, + "step": 36796 + }, + { + "epoch": 0.94, + "learning_rate": 1.6050154477960531e-06, + "loss": 0.8867, + "step": 36797 + }, + { + "epoch": 0.94, + "learning_rate": 1.6049934159690608e-06, + "loss": 0.7871, + "step": 36798 + }, + { + "epoch": 0.94, + "learning_rate": 1.604971383678853e-06, + "loss": 0.6265, + "step": 36799 + }, + { + "epoch": 0.94, + "learning_rate": 1.6049493509254463e-06, + "loss": 0.8262, + "step": 36800 + }, + { + "epoch": 0.94, + "learning_rate": 1.604927317708858e-06, + "loss": 0.9629, + "step": 36801 + }, + { + "epoch": 0.94, + "learning_rate": 1.6049052840291047e-06, + "loss": 0.9238, + "step": 36802 + }, + { + "epoch": 0.94, + "learning_rate": 1.604883249886203e-06, + "loss": 0.8799, + "step": 36803 + }, + { + "epoch": 0.94, + "learning_rate": 1.6048612152801698e-06, + "loss": 0.8721, + "step": 36804 + }, + { + "epoch": 0.94, + "learning_rate": 1.6048391802110223e-06, + "loss": 0.8535, + "step": 36805 + }, + { + "epoch": 0.94, + "learning_rate": 1.6048171446787775e-06, + "loss": 0.7969, + "step": 36806 + }, + { + "epoch": 0.94, + "learning_rate": 1.604795108683452e-06, + "loss": 0.6964, + "step": 36807 + }, + { + "epoch": 0.94, + "learning_rate": 1.6047730722250626e-06, + "loss": 0.7656, + "step": 36808 + }, + { + "epoch": 0.94, + "learning_rate": 1.604751035303626e-06, + "loss": 0.8096, + "step": 36809 + }, + { + "epoch": 0.94, + "learning_rate": 1.6047289979191598e-06, + "loss": 0.6191, + "step": 36810 + }, + { + "epoch": 0.94, + "learning_rate": 1.60470696007168e-06, + "loss": 0.6587, + "step": 36811 + }, + { + "epoch": 0.94, + "learning_rate": 1.6046849217612043e-06, + "loss": 0.9971, + "step": 36812 + }, + { + "epoch": 0.94, + "learning_rate": 1.604662882987749e-06, + "loss": 1.0283, + "step": 36813 + }, + { + "epoch": 0.94, + "learning_rate": 1.6046408437513308e-06, + "loss": 0.7471, + "step": 36814 + }, + { + "epoch": 0.94, + "learning_rate": 1.6046188040519673e-06, + "loss": 0.9785, + "step": 36815 + }, + { + "epoch": 0.94, + "learning_rate": 1.604596763889675e-06, + "loss": 0.7725, + "step": 36816 + }, + { + "epoch": 0.94, + "learning_rate": 1.6045747232644703e-06, + "loss": 0.8447, + "step": 36817 + }, + { + "epoch": 0.94, + "learning_rate": 1.6045526821763708e-06, + "loss": 0.8359, + "step": 36818 + }, + { + "epoch": 0.94, + "learning_rate": 1.6045306406253933e-06, + "loss": 0.8906, + "step": 36819 + }, + { + "epoch": 0.94, + "learning_rate": 1.6045085986115543e-06, + "loss": 1.0557, + "step": 36820 + }, + { + "epoch": 0.94, + "learning_rate": 1.6044865561348711e-06, + "loss": 0.7002, + "step": 36821 + }, + { + "epoch": 0.94, + "learning_rate": 1.60446451319536e-06, + "loss": 0.9922, + "step": 36822 + }, + { + "epoch": 0.94, + "learning_rate": 1.6044424697930382e-06, + "loss": 0.9639, + "step": 36823 + }, + { + "epoch": 0.94, + "learning_rate": 1.604420425927923e-06, + "loss": 0.5459, + "step": 36824 + }, + { + "epoch": 0.94, + "learning_rate": 1.6043983816000305e-06, + "loss": 0.6255, + "step": 36825 + }, + { + "epoch": 0.94, + "learning_rate": 1.604376336809378e-06, + "loss": 0.96, + "step": 36826 + }, + { + "epoch": 0.94, + "learning_rate": 1.6043542915559826e-06, + "loss": 0.8955, + "step": 36827 + }, + { + "epoch": 0.94, + "learning_rate": 1.6043322458398607e-06, + "loss": 0.7725, + "step": 36828 + }, + { + "epoch": 0.94, + "learning_rate": 1.6043101996610293e-06, + "loss": 0.8262, + "step": 36829 + }, + { + "epoch": 0.94, + "learning_rate": 1.6042881530195056e-06, + "loss": 0.9531, + "step": 36830 + }, + { + "epoch": 0.94, + "learning_rate": 1.6042661059153061e-06, + "loss": 0.7095, + "step": 36831 + }, + { + "epoch": 0.94, + "learning_rate": 1.604244058348448e-06, + "loss": 0.9463, + "step": 36832 + }, + { + "epoch": 0.94, + "learning_rate": 1.604222010318948e-06, + "loss": 1.0156, + "step": 36833 + }, + { + "epoch": 0.94, + "learning_rate": 1.6041999618268225e-06, + "loss": 0.8057, + "step": 36834 + }, + { + "epoch": 0.94, + "learning_rate": 1.6041779128720894e-06, + "loss": 0.7979, + "step": 36835 + }, + { + "epoch": 0.94, + "learning_rate": 1.604155863454765e-06, + "loss": 0.8701, + "step": 36836 + }, + { + "epoch": 0.94, + "learning_rate": 1.6041338135748662e-06, + "loss": 0.834, + "step": 36837 + }, + { + "epoch": 0.94, + "learning_rate": 1.6041117632324096e-06, + "loss": 0.9258, + "step": 36838 + }, + { + "epoch": 0.94, + "learning_rate": 1.6040897124274126e-06, + "loss": 0.9775, + "step": 36839 + }, + { + "epoch": 0.94, + "learning_rate": 1.6040676611598918e-06, + "loss": 0.6758, + "step": 36840 + }, + { + "epoch": 0.94, + "learning_rate": 1.6040456094298645e-06, + "loss": 0.9102, + "step": 36841 + }, + { + "epoch": 0.94, + "learning_rate": 1.6040235572373471e-06, + "loss": 0.8223, + "step": 36842 + }, + { + "epoch": 0.94, + "learning_rate": 1.6040015045823565e-06, + "loss": 0.8047, + "step": 36843 + }, + { + "epoch": 0.94, + "learning_rate": 1.6039794514649096e-06, + "loss": 0.6562, + "step": 36844 + }, + { + "epoch": 0.94, + "learning_rate": 1.6039573978850236e-06, + "loss": 0.9961, + "step": 36845 + }, + { + "epoch": 0.94, + "learning_rate": 1.603935343842715e-06, + "loss": 0.8184, + "step": 36846 + }, + { + "epoch": 0.94, + "learning_rate": 1.6039132893380013e-06, + "loss": 0.752, + "step": 36847 + }, + { + "epoch": 0.94, + "learning_rate": 1.6038912343708985e-06, + "loss": 0.9023, + "step": 36848 + }, + { + "epoch": 0.94, + "learning_rate": 1.6038691789414242e-06, + "loss": 0.9316, + "step": 36849 + }, + { + "epoch": 0.94, + "learning_rate": 1.6038471230495952e-06, + "loss": 1.0342, + "step": 36850 + }, + { + "epoch": 0.94, + "learning_rate": 1.603825066695428e-06, + "loss": 0.9771, + "step": 36851 + }, + { + "epoch": 0.94, + "learning_rate": 1.6038030098789398e-06, + "loss": 0.7437, + "step": 36852 + }, + { + "epoch": 0.94, + "learning_rate": 1.6037809526001473e-06, + "loss": 0.6604, + "step": 36853 + }, + { + "epoch": 0.94, + "learning_rate": 1.6037588948590678e-06, + "loss": 0.7939, + "step": 36854 + }, + { + "epoch": 0.94, + "learning_rate": 1.6037368366557174e-06, + "loss": 0.792, + "step": 36855 + }, + { + "epoch": 0.94, + "learning_rate": 1.6037147779901137e-06, + "loss": 0.8369, + "step": 36856 + }, + { + "epoch": 0.94, + "learning_rate": 1.6036927188622732e-06, + "loss": 0.8408, + "step": 36857 + }, + { + "epoch": 0.94, + "learning_rate": 1.603670659272213e-06, + "loss": 0.8857, + "step": 36858 + }, + { + "epoch": 0.94, + "learning_rate": 1.6036485992199503e-06, + "loss": 0.8906, + "step": 36859 + }, + { + "epoch": 0.94, + "learning_rate": 1.6036265387055013e-06, + "loss": 0.835, + "step": 36860 + }, + { + "epoch": 0.94, + "learning_rate": 1.603604477728883e-06, + "loss": 0.7085, + "step": 36861 + }, + { + "epoch": 0.94, + "learning_rate": 1.6035824162901127e-06, + "loss": 0.73, + "step": 36862 + }, + { + "epoch": 0.94, + "learning_rate": 1.6035603543892071e-06, + "loss": 0.9736, + "step": 36863 + }, + { + "epoch": 0.94, + "learning_rate": 1.6035382920261832e-06, + "loss": 0.5967, + "step": 36864 + }, + { + "epoch": 0.94, + "learning_rate": 1.6035162292010578e-06, + "loss": 0.729, + "step": 36865 + }, + { + "epoch": 0.94, + "learning_rate": 1.6034941659138474e-06, + "loss": 0.647, + "step": 36866 + }, + { + "epoch": 0.94, + "learning_rate": 1.6034721021645698e-06, + "loss": 0.8613, + "step": 36867 + }, + { + "epoch": 0.94, + "learning_rate": 1.6034500379532412e-06, + "loss": 0.8281, + "step": 36868 + }, + { + "epoch": 0.94, + "learning_rate": 1.6034279732798784e-06, + "loss": 0.7393, + "step": 36869 + }, + { + "epoch": 0.94, + "learning_rate": 1.6034059081444988e-06, + "loss": 0.8281, + "step": 36870 + }, + { + "epoch": 0.95, + "learning_rate": 1.603383842547119e-06, + "loss": 0.5913, + "step": 36871 + }, + { + "epoch": 0.95, + "learning_rate": 1.6033617764877559e-06, + "loss": 0.7466, + "step": 36872 + }, + { + "epoch": 0.95, + "learning_rate": 1.6033397099664266e-06, + "loss": 0.8008, + "step": 36873 + }, + { + "epoch": 0.95, + "learning_rate": 1.6033176429831473e-06, + "loss": 0.6978, + "step": 36874 + }, + { + "epoch": 0.95, + "learning_rate": 1.6032955755379361e-06, + "loss": 0.7944, + "step": 36875 + }, + { + "epoch": 0.95, + "learning_rate": 1.6032735076308086e-06, + "loss": 0.8018, + "step": 36876 + }, + { + "epoch": 0.95, + "learning_rate": 1.6032514392617826e-06, + "loss": 0.9102, + "step": 36877 + }, + { + "epoch": 0.95, + "learning_rate": 1.603229370430875e-06, + "loss": 0.9385, + "step": 36878 + }, + { + "epoch": 0.95, + "learning_rate": 1.603207301138102e-06, + "loss": 0.9297, + "step": 36879 + }, + { + "epoch": 0.95, + "learning_rate": 1.603185231383481e-06, + "loss": 0.8027, + "step": 36880 + }, + { + "epoch": 0.95, + "learning_rate": 1.6031631611670288e-06, + "loss": 0.8359, + "step": 36881 + }, + { + "epoch": 0.95, + "learning_rate": 1.6031410904887623e-06, + "loss": 0.855, + "step": 36882 + }, + { + "epoch": 0.95, + "learning_rate": 1.6031190193486985e-06, + "loss": 0.8154, + "step": 36883 + }, + { + "epoch": 0.95, + "learning_rate": 1.6030969477468541e-06, + "loss": 0.644, + "step": 36884 + }, + { + "epoch": 0.95, + "learning_rate": 1.6030748756832462e-06, + "loss": 0.4723, + "step": 36885 + }, + { + "epoch": 0.95, + "learning_rate": 1.6030528031578915e-06, + "loss": 0.7651, + "step": 36886 + }, + { + "epoch": 0.95, + "learning_rate": 1.603030730170807e-06, + "loss": 0.9414, + "step": 36887 + }, + { + "epoch": 0.95, + "learning_rate": 1.6030086567220096e-06, + "loss": 0.8838, + "step": 36888 + }, + { + "epoch": 0.95, + "learning_rate": 1.6029865828115164e-06, + "loss": 0.7988, + "step": 36889 + }, + { + "epoch": 0.95, + "learning_rate": 1.6029645084393437e-06, + "loss": 0.9004, + "step": 36890 + }, + { + "epoch": 0.95, + "learning_rate": 1.602942433605509e-06, + "loss": 0.9619, + "step": 36891 + }, + { + "epoch": 0.95, + "learning_rate": 1.6029203583100292e-06, + "loss": 0.8252, + "step": 36892 + }, + { + "epoch": 0.95, + "learning_rate": 1.6028982825529207e-06, + "loss": 1.0684, + "step": 36893 + }, + { + "epoch": 0.95, + "learning_rate": 1.6028762063342009e-06, + "loss": 0.709, + "step": 36894 + }, + { + "epoch": 0.95, + "learning_rate": 1.6028541296538864e-06, + "loss": 0.7715, + "step": 36895 + }, + { + "epoch": 0.95, + "learning_rate": 1.6028320525119943e-06, + "loss": 0.8818, + "step": 36896 + }, + { + "epoch": 0.95, + "learning_rate": 1.6028099749085416e-06, + "loss": 0.6101, + "step": 36897 + }, + { + "epoch": 0.95, + "learning_rate": 1.6027878968435447e-06, + "loss": 0.9248, + "step": 36898 + }, + { + "epoch": 0.95, + "learning_rate": 1.602765818317021e-06, + "loss": 1.082, + "step": 36899 + }, + { + "epoch": 0.95, + "learning_rate": 1.6027437393289868e-06, + "loss": 1.0117, + "step": 36900 + }, + { + "epoch": 0.95, + "learning_rate": 1.6027216598794597e-06, + "loss": 0.9033, + "step": 36901 + }, + { + "epoch": 0.95, + "learning_rate": 1.6026995799684566e-06, + "loss": 0.8828, + "step": 36902 + }, + { + "epoch": 0.95, + "learning_rate": 1.6026774995959941e-06, + "loss": 0.8711, + "step": 36903 + }, + { + "epoch": 0.95, + "learning_rate": 1.6026554187620889e-06, + "loss": 0.8574, + "step": 36904 + }, + { + "epoch": 0.95, + "learning_rate": 1.6026333374667584e-06, + "loss": 0.9961, + "step": 36905 + }, + { + "epoch": 0.95, + "learning_rate": 1.6026112557100188e-06, + "loss": 0.749, + "step": 36906 + }, + { + "epoch": 0.95, + "learning_rate": 1.6025891734918878e-06, + "loss": 0.7681, + "step": 36907 + }, + { + "epoch": 0.95, + "learning_rate": 1.602567090812382e-06, + "loss": 0.9629, + "step": 36908 + }, + { + "epoch": 0.95, + "learning_rate": 1.6025450076715186e-06, + "loss": 0.6606, + "step": 36909 + }, + { + "epoch": 0.95, + "learning_rate": 1.6025229240693136e-06, + "loss": 1.082, + "step": 36910 + }, + { + "epoch": 0.95, + "learning_rate": 1.6025008400057848e-06, + "loss": 0.7183, + "step": 36911 + }, + { + "epoch": 0.95, + "learning_rate": 1.602478755480949e-06, + "loss": 0.7002, + "step": 36912 + }, + { + "epoch": 0.95, + "learning_rate": 1.6024566704948225e-06, + "loss": 0.7344, + "step": 36913 + }, + { + "epoch": 0.95, + "learning_rate": 1.602434585047423e-06, + "loss": 0.7388, + "step": 36914 + }, + { + "epoch": 0.95, + "learning_rate": 1.6024124991387669e-06, + "loss": 0.8162, + "step": 36915 + }, + { + "epoch": 0.95, + "learning_rate": 1.602390412768871e-06, + "loss": 0.6685, + "step": 36916 + }, + { + "epoch": 0.95, + "learning_rate": 1.602368325937753e-06, + "loss": 0.873, + "step": 36917 + }, + { + "epoch": 0.95, + "learning_rate": 1.6023462386454286e-06, + "loss": 1.0195, + "step": 36918 + }, + { + "epoch": 0.95, + "learning_rate": 1.6023241508919158e-06, + "loss": 0.8916, + "step": 36919 + }, + { + "epoch": 0.95, + "learning_rate": 1.602302062677231e-06, + "loss": 0.7959, + "step": 36920 + }, + { + "epoch": 0.95, + "learning_rate": 1.6022799740013913e-06, + "loss": 0.5293, + "step": 36921 + }, + { + "epoch": 0.95, + "learning_rate": 1.6022578848644134e-06, + "loss": 0.832, + "step": 36922 + }, + { + "epoch": 0.95, + "learning_rate": 1.6022357952663144e-06, + "loss": 0.6704, + "step": 36923 + }, + { + "epoch": 0.95, + "learning_rate": 1.6022137052071111e-06, + "loss": 0.9746, + "step": 36924 + }, + { + "epoch": 0.95, + "learning_rate": 1.6021916146868204e-06, + "loss": 0.958, + "step": 36925 + }, + { + "epoch": 0.95, + "learning_rate": 1.6021695237054594e-06, + "loss": 0.709, + "step": 36926 + }, + { + "epoch": 0.95, + "learning_rate": 1.6021474322630448e-06, + "loss": 0.8838, + "step": 36927 + }, + { + "epoch": 0.95, + "learning_rate": 1.6021253403595938e-06, + "loss": 0.7129, + "step": 36928 + }, + { + "epoch": 0.95, + "learning_rate": 1.6021032479951226e-06, + "loss": 0.9561, + "step": 36929 + }, + { + "epoch": 0.95, + "learning_rate": 1.602081155169649e-06, + "loss": 0.8027, + "step": 36930 + }, + { + "epoch": 0.95, + "learning_rate": 1.6020590618831897e-06, + "loss": 0.7109, + "step": 36931 + }, + { + "epoch": 0.95, + "learning_rate": 1.6020369681357613e-06, + "loss": 0.8711, + "step": 36932 + }, + { + "epoch": 0.95, + "learning_rate": 1.6020148739273807e-06, + "loss": 0.4648, + "step": 36933 + }, + { + "epoch": 0.95, + "learning_rate": 1.6019927792580651e-06, + "loss": 0.5925, + "step": 36934 + }, + { + "epoch": 0.95, + "learning_rate": 1.6019706841278313e-06, + "loss": 0.8691, + "step": 36935 + }, + { + "epoch": 0.95, + "learning_rate": 1.6019485885366963e-06, + "loss": 0.8359, + "step": 36936 + }, + { + "epoch": 0.95, + "learning_rate": 1.6019264924846772e-06, + "loss": 0.915, + "step": 36937 + }, + { + "epoch": 0.95, + "learning_rate": 1.6019043959717901e-06, + "loss": 0.5112, + "step": 36938 + }, + { + "epoch": 0.95, + "learning_rate": 1.601882298998053e-06, + "loss": 0.6816, + "step": 36939 + }, + { + "epoch": 0.95, + "learning_rate": 1.601860201563482e-06, + "loss": 0.7905, + "step": 36940 + }, + { + "epoch": 0.95, + "learning_rate": 1.6018381036680944e-06, + "loss": 0.8301, + "step": 36941 + }, + { + "epoch": 0.95, + "learning_rate": 1.6018160053119072e-06, + "loss": 0.7598, + "step": 36942 + }, + { + "epoch": 0.95, + "learning_rate": 1.6017939064949366e-06, + "loss": 0.7134, + "step": 36943 + }, + { + "epoch": 0.95, + "learning_rate": 1.6017718072172006e-06, + "loss": 0.8945, + "step": 36944 + }, + { + "epoch": 0.95, + "learning_rate": 1.6017497074787153e-06, + "loss": 0.9561, + "step": 36945 + }, + { + "epoch": 0.95, + "learning_rate": 1.6017276072794981e-06, + "loss": 1.001, + "step": 36946 + }, + { + "epoch": 0.95, + "learning_rate": 1.6017055066195658e-06, + "loss": 0.6128, + "step": 36947 + }, + { + "epoch": 0.95, + "learning_rate": 1.6016834054989351e-06, + "loss": 0.8828, + "step": 36948 + }, + { + "epoch": 0.95, + "learning_rate": 1.6016613039176232e-06, + "loss": 0.9219, + "step": 36949 + }, + { + "epoch": 0.95, + "learning_rate": 1.6016392018756468e-06, + "loss": 0.9316, + "step": 36950 + }, + { + "epoch": 0.95, + "learning_rate": 1.601617099373023e-06, + "loss": 0.8945, + "step": 36951 + }, + { + "epoch": 0.95, + "learning_rate": 1.6015949964097688e-06, + "loss": 0.8838, + "step": 36952 + }, + { + "epoch": 0.95, + "learning_rate": 1.6015728929859008e-06, + "loss": 0.6816, + "step": 36953 + }, + { + "epoch": 0.95, + "learning_rate": 1.601550789101436e-06, + "loss": 0.9443, + "step": 36954 + }, + { + "epoch": 0.95, + "learning_rate": 1.6015286847563914e-06, + "loss": 0.5864, + "step": 36955 + }, + { + "epoch": 0.95, + "learning_rate": 1.6015065799507842e-06, + "loss": 0.7354, + "step": 36956 + }, + { + "epoch": 0.95, + "learning_rate": 1.6014844746846307e-06, + "loss": 0.5762, + "step": 36957 + }, + { + "epoch": 0.95, + "learning_rate": 1.6014623689579486e-06, + "loss": 1.0107, + "step": 36958 + }, + { + "epoch": 0.95, + "learning_rate": 1.6014402627707542e-06, + "loss": 1.0137, + "step": 36959 + }, + { + "epoch": 0.95, + "learning_rate": 1.6014181561230648e-06, + "loss": 0.8457, + "step": 36960 + }, + { + "epoch": 0.95, + "learning_rate": 1.6013960490148968e-06, + "loss": 0.874, + "step": 36961 + }, + { + "epoch": 0.95, + "learning_rate": 1.601373941446268e-06, + "loss": 0.6431, + "step": 36962 + }, + { + "epoch": 0.95, + "learning_rate": 1.6013518334171945e-06, + "loss": 0.8721, + "step": 36963 + }, + { + "epoch": 0.95, + "learning_rate": 1.6013297249276936e-06, + "loss": 1.04, + "step": 36964 + }, + { + "epoch": 0.95, + "learning_rate": 1.6013076159777822e-06, + "loss": 0.8447, + "step": 36965 + }, + { + "epoch": 0.95, + "learning_rate": 1.6012855065674773e-06, + "loss": 0.8105, + "step": 36966 + }, + { + "epoch": 0.95, + "learning_rate": 1.6012633966967956e-06, + "loss": 0.8721, + "step": 36967 + }, + { + "epoch": 0.95, + "learning_rate": 1.6012412863657544e-06, + "loss": 0.7739, + "step": 36968 + }, + { + "epoch": 0.95, + "learning_rate": 1.60121917557437e-06, + "loss": 0.8516, + "step": 36969 + }, + { + "epoch": 0.95, + "learning_rate": 1.60119706432266e-06, + "loss": 0.7993, + "step": 36970 + }, + { + "epoch": 0.95, + "learning_rate": 1.601174952610641e-06, + "loss": 0.7471, + "step": 36971 + }, + { + "epoch": 0.95, + "learning_rate": 1.60115284043833e-06, + "loss": 0.7302, + "step": 36972 + }, + { + "epoch": 0.95, + "learning_rate": 1.6011307278057439e-06, + "loss": 0.8721, + "step": 36973 + }, + { + "epoch": 0.95, + "learning_rate": 1.6011086147128997e-06, + "loss": 0.7686, + "step": 36974 + }, + { + "epoch": 0.95, + "learning_rate": 1.601086501159814e-06, + "loss": 0.873, + "step": 36975 + }, + { + "epoch": 0.95, + "learning_rate": 1.6010643871465044e-06, + "loss": 0.8516, + "step": 36976 + }, + { + "epoch": 0.95, + "learning_rate": 1.6010422726729874e-06, + "loss": 0.9727, + "step": 36977 + }, + { + "epoch": 0.95, + "learning_rate": 1.6010201577392797e-06, + "loss": 0.7666, + "step": 36978 + }, + { + "epoch": 0.95, + "learning_rate": 1.6009980423453985e-06, + "loss": 0.8423, + "step": 36979 + }, + { + "epoch": 0.95, + "learning_rate": 1.600975926491361e-06, + "loss": 0.8867, + "step": 36980 + }, + { + "epoch": 0.95, + "learning_rate": 1.6009538101771836e-06, + "loss": 0.9297, + "step": 36981 + }, + { + "epoch": 0.95, + "learning_rate": 1.6009316934028837e-06, + "loss": 0.9395, + "step": 36982 + }, + { + "epoch": 0.95, + "learning_rate": 1.6009095761684778e-06, + "loss": 0.8469, + "step": 36983 + }, + { + "epoch": 0.95, + "learning_rate": 1.6008874584739834e-06, + "loss": 0.771, + "step": 36984 + }, + { + "epoch": 0.95, + "learning_rate": 1.6008653403194168e-06, + "loss": 0.9502, + "step": 36985 + }, + { + "epoch": 0.95, + "learning_rate": 1.6008432217047953e-06, + "loss": 0.8203, + "step": 36986 + }, + { + "epoch": 0.95, + "learning_rate": 1.600821102630136e-06, + "loss": 1.0371, + "step": 36987 + }, + { + "epoch": 0.95, + "learning_rate": 1.6007989830954553e-06, + "loss": 0.8936, + "step": 36988 + }, + { + "epoch": 0.95, + "learning_rate": 1.6007768631007705e-06, + "loss": 0.9678, + "step": 36989 + }, + { + "epoch": 0.95, + "learning_rate": 1.6007547426460987e-06, + "loss": 0.7598, + "step": 36990 + }, + { + "epoch": 0.95, + "learning_rate": 1.6007326217314562e-06, + "loss": 0.7393, + "step": 36991 + }, + { + "epoch": 0.95, + "learning_rate": 1.600710500356861e-06, + "loss": 0.8271, + "step": 36992 + }, + { + "epoch": 0.95, + "learning_rate": 1.6006883785223288e-06, + "loss": 0.9668, + "step": 36993 + }, + { + "epoch": 0.95, + "learning_rate": 1.6006662562278775e-06, + "loss": 0.6816, + "step": 36994 + }, + { + "epoch": 0.95, + "learning_rate": 1.6006441334735235e-06, + "loss": 0.8276, + "step": 36995 + }, + { + "epoch": 0.95, + "learning_rate": 1.600622010259284e-06, + "loss": 1.0215, + "step": 36996 + }, + { + "epoch": 0.95, + "learning_rate": 1.6005998865851757e-06, + "loss": 0.7607, + "step": 36997 + }, + { + "epoch": 0.95, + "learning_rate": 1.6005777624512157e-06, + "loss": 0.6421, + "step": 36998 + }, + { + "epoch": 0.95, + "learning_rate": 1.600555637857421e-06, + "loss": 0.7539, + "step": 36999 + }, + { + "epoch": 0.95, + "learning_rate": 1.6005335128038082e-06, + "loss": 0.8047, + "step": 37000 + }, + { + "epoch": 0.95, + "learning_rate": 1.6005113872903947e-06, + "loss": 0.7422, + "step": 37001 + }, + { + "epoch": 0.95, + "learning_rate": 1.6004892613171976e-06, + "loss": 0.7754, + "step": 37002 + }, + { + "epoch": 0.95, + "learning_rate": 1.6004671348842331e-06, + "loss": 0.8169, + "step": 37003 + }, + { + "epoch": 0.95, + "learning_rate": 1.6004450079915186e-06, + "loss": 0.7969, + "step": 37004 + }, + { + "epoch": 0.95, + "learning_rate": 1.6004228806390708e-06, + "loss": 0.7515, + "step": 37005 + }, + { + "epoch": 0.95, + "learning_rate": 1.600400752826907e-06, + "loss": 0.9072, + "step": 37006 + }, + { + "epoch": 0.95, + "learning_rate": 1.600378624555044e-06, + "loss": 0.8022, + "step": 37007 + }, + { + "epoch": 0.95, + "learning_rate": 1.6003564958234988e-06, + "loss": 0.7007, + "step": 37008 + }, + { + "epoch": 0.95, + "learning_rate": 1.600334366632288e-06, + "loss": 0.877, + "step": 37009 + }, + { + "epoch": 0.95, + "learning_rate": 1.6003122369814288e-06, + "loss": 0.9131, + "step": 37010 + }, + { + "epoch": 0.95, + "learning_rate": 1.600290106870938e-06, + "loss": 0.7988, + "step": 37011 + }, + { + "epoch": 0.95, + "learning_rate": 1.6002679763008331e-06, + "loss": 0.8706, + "step": 37012 + }, + { + "epoch": 0.95, + "learning_rate": 1.60024584527113e-06, + "loss": 0.9385, + "step": 37013 + }, + { + "epoch": 0.95, + "learning_rate": 1.6002237137818467e-06, + "loss": 0.959, + "step": 37014 + }, + { + "epoch": 0.95, + "learning_rate": 1.6002015818329998e-06, + "loss": 0.9014, + "step": 37015 + }, + { + "epoch": 0.95, + "learning_rate": 1.6001794494246058e-06, + "loss": 1.0156, + "step": 37016 + }, + { + "epoch": 0.95, + "learning_rate": 1.600157316556682e-06, + "loss": 0.9766, + "step": 37017 + }, + { + "epoch": 0.95, + "learning_rate": 1.6001351832292456e-06, + "loss": 0.7002, + "step": 37018 + }, + { + "epoch": 0.95, + "learning_rate": 1.6001130494423131e-06, + "loss": 0.8052, + "step": 37019 + }, + { + "epoch": 0.95, + "learning_rate": 1.6000909151959015e-06, + "loss": 0.9062, + "step": 37020 + }, + { + "epoch": 0.95, + "learning_rate": 1.6000687804900284e-06, + "loss": 0.6924, + "step": 37021 + }, + { + "epoch": 0.95, + "learning_rate": 1.60004664532471e-06, + "loss": 0.7876, + "step": 37022 + }, + { + "epoch": 0.95, + "learning_rate": 1.600024509699963e-06, + "loss": 0.6509, + "step": 37023 + }, + { + "epoch": 0.95, + "learning_rate": 1.6000023736158052e-06, + "loss": 1.0332, + "step": 37024 + }, + { + "epoch": 0.95, + "learning_rate": 1.5999802370722533e-06, + "loss": 0.9082, + "step": 37025 + }, + { + "epoch": 0.95, + "learning_rate": 1.599958100069324e-06, + "loss": 0.8169, + "step": 37026 + }, + { + "epoch": 0.95, + "learning_rate": 1.5999359626070343e-06, + "loss": 0.874, + "step": 37027 + }, + { + "epoch": 0.95, + "learning_rate": 1.5999138246854012e-06, + "loss": 0.8486, + "step": 37028 + }, + { + "epoch": 0.95, + "learning_rate": 1.5998916863044417e-06, + "loss": 0.6304, + "step": 37029 + }, + { + "epoch": 0.95, + "learning_rate": 1.5998695474641729e-06, + "loss": 0.7261, + "step": 37030 + }, + { + "epoch": 0.95, + "learning_rate": 1.5998474081646115e-06, + "loss": 0.8047, + "step": 37031 + }, + { + "epoch": 0.95, + "learning_rate": 1.5998252684057744e-06, + "loss": 1.1895, + "step": 37032 + }, + { + "epoch": 0.95, + "learning_rate": 1.5998031281876786e-06, + "loss": 0.6655, + "step": 37033 + }, + { + "epoch": 0.95, + "learning_rate": 1.5997809875103412e-06, + "loss": 1.0215, + "step": 37034 + }, + { + "epoch": 0.95, + "learning_rate": 1.599758846373779e-06, + "loss": 0.8398, + "step": 37035 + }, + { + "epoch": 0.95, + "learning_rate": 1.5997367047780094e-06, + "loss": 0.8027, + "step": 37036 + }, + { + "epoch": 0.95, + "learning_rate": 1.5997145627230487e-06, + "loss": 0.689, + "step": 37037 + }, + { + "epoch": 0.95, + "learning_rate": 1.599692420208914e-06, + "loss": 0.6787, + "step": 37038 + }, + { + "epoch": 0.95, + "learning_rate": 1.5996702772356225e-06, + "loss": 0.7278, + "step": 37039 + }, + { + "epoch": 0.95, + "learning_rate": 1.5996481338031913e-06, + "loss": 0.9404, + "step": 37040 + }, + { + "epoch": 0.95, + "learning_rate": 1.5996259899116366e-06, + "loss": 0.8789, + "step": 37041 + }, + { + "epoch": 0.95, + "learning_rate": 1.5996038455609763e-06, + "loss": 0.7661, + "step": 37042 + }, + { + "epoch": 0.95, + "learning_rate": 1.599581700751227e-06, + "loss": 1.2041, + "step": 37043 + }, + { + "epoch": 0.95, + "learning_rate": 1.599559555482405e-06, + "loss": 0.6016, + "step": 37044 + }, + { + "epoch": 0.95, + "learning_rate": 1.5995374097545282e-06, + "loss": 0.873, + "step": 37045 + }, + { + "epoch": 0.95, + "learning_rate": 1.599515263567613e-06, + "loss": 0.6299, + "step": 37046 + }, + { + "epoch": 0.95, + "learning_rate": 1.5994931169216768e-06, + "loss": 0.8477, + "step": 37047 + }, + { + "epoch": 0.95, + "learning_rate": 1.5994709698167362e-06, + "loss": 0.8955, + "step": 37048 + }, + { + "epoch": 0.95, + "learning_rate": 1.599448822252808e-06, + "loss": 0.7988, + "step": 37049 + }, + { + "epoch": 0.95, + "learning_rate": 1.5994266742299094e-06, + "loss": 0.769, + "step": 37050 + }, + { + "epoch": 0.95, + "learning_rate": 1.5994045257480577e-06, + "loss": 0.8877, + "step": 37051 + }, + { + "epoch": 0.95, + "learning_rate": 1.5993823768072693e-06, + "loss": 1.0166, + "step": 37052 + }, + { + "epoch": 0.95, + "learning_rate": 1.5993602274075615e-06, + "loss": 0.8066, + "step": 37053 + }, + { + "epoch": 0.95, + "learning_rate": 1.599338077548951e-06, + "loss": 1.042, + "step": 37054 + }, + { + "epoch": 0.95, + "learning_rate": 1.5993159272314549e-06, + "loss": 0.9238, + "step": 37055 + }, + { + "epoch": 0.95, + "learning_rate": 1.5992937764550902e-06, + "loss": 0.834, + "step": 37056 + }, + { + "epoch": 0.95, + "learning_rate": 1.5992716252198738e-06, + "loss": 0.6201, + "step": 37057 + }, + { + "epoch": 0.95, + "learning_rate": 1.5992494735258229e-06, + "loss": 1.1162, + "step": 37058 + }, + { + "epoch": 0.95, + "learning_rate": 1.5992273213729539e-06, + "loss": 1.1816, + "step": 37059 + }, + { + "epoch": 0.95, + "learning_rate": 1.599205168761284e-06, + "loss": 0.7622, + "step": 37060 + }, + { + "epoch": 0.95, + "learning_rate": 1.5991830156908303e-06, + "loss": 0.7979, + "step": 37061 + }, + { + "epoch": 0.95, + "learning_rate": 1.5991608621616098e-06, + "loss": 1.042, + "step": 37062 + }, + { + "epoch": 0.95, + "learning_rate": 1.5991387081736395e-06, + "loss": 1.0508, + "step": 37063 + }, + { + "epoch": 0.95, + "learning_rate": 1.5991165537269363e-06, + "loss": 0.75, + "step": 37064 + }, + { + "epoch": 0.95, + "learning_rate": 1.599094398821517e-06, + "loss": 0.8047, + "step": 37065 + }, + { + "epoch": 0.95, + "learning_rate": 1.5990722434573987e-06, + "loss": 0.9678, + "step": 37066 + }, + { + "epoch": 0.95, + "learning_rate": 1.5990500876345983e-06, + "loss": 0.8599, + "step": 37067 + }, + { + "epoch": 0.95, + "learning_rate": 1.5990279313531328e-06, + "loss": 0.8462, + "step": 37068 + }, + { + "epoch": 0.95, + "learning_rate": 1.599005774613019e-06, + "loss": 0.8213, + "step": 37069 + }, + { + "epoch": 0.95, + "learning_rate": 1.5989836174142743e-06, + "loss": 0.8555, + "step": 37070 + }, + { + "epoch": 0.95, + "learning_rate": 1.5989614597569151e-06, + "loss": 0.8359, + "step": 37071 + }, + { + "epoch": 0.95, + "learning_rate": 1.598939301640959e-06, + "loss": 0.7104, + "step": 37072 + }, + { + "epoch": 0.95, + "learning_rate": 1.5989171430664223e-06, + "loss": 1.0137, + "step": 37073 + }, + { + "epoch": 0.95, + "learning_rate": 1.5988949840333223e-06, + "loss": 0.9834, + "step": 37074 + }, + { + "epoch": 0.95, + "learning_rate": 1.598872824541676e-06, + "loss": 0.7461, + "step": 37075 + }, + { + "epoch": 0.95, + "learning_rate": 1.5988506645915005e-06, + "loss": 0.7051, + "step": 37076 + }, + { + "epoch": 0.95, + "learning_rate": 1.5988285041828125e-06, + "loss": 0.9482, + "step": 37077 + }, + { + "epoch": 0.95, + "learning_rate": 1.598806343315629e-06, + "loss": 0.832, + "step": 37078 + }, + { + "epoch": 0.95, + "learning_rate": 1.5987841819899667e-06, + "loss": 0.5952, + "step": 37079 + }, + { + "epoch": 0.95, + "learning_rate": 1.5987620202058433e-06, + "loss": 0.8564, + "step": 37080 + }, + { + "epoch": 0.95, + "learning_rate": 1.5987398579632752e-06, + "loss": 0.7583, + "step": 37081 + }, + { + "epoch": 0.95, + "learning_rate": 1.5987176952622797e-06, + "loss": 0.9424, + "step": 37082 + }, + { + "epoch": 0.95, + "learning_rate": 1.5986955321028733e-06, + "loss": 0.7251, + "step": 37083 + }, + { + "epoch": 0.95, + "learning_rate": 1.5986733684850735e-06, + "loss": 0.6357, + "step": 37084 + }, + { + "epoch": 0.95, + "learning_rate": 1.598651204408897e-06, + "loss": 0.9199, + "step": 37085 + }, + { + "epoch": 0.95, + "learning_rate": 1.5986290398743608e-06, + "loss": 0.9297, + "step": 37086 + }, + { + "epoch": 0.95, + "learning_rate": 1.5986068748814815e-06, + "loss": 0.9219, + "step": 37087 + }, + { + "epoch": 0.95, + "learning_rate": 1.5985847094302768e-06, + "loss": 0.7383, + "step": 37088 + }, + { + "epoch": 0.95, + "learning_rate": 1.5985625435207633e-06, + "loss": 0.9443, + "step": 37089 + }, + { + "epoch": 0.95, + "learning_rate": 1.598540377152958e-06, + "loss": 0.6147, + "step": 37090 + }, + { + "epoch": 0.95, + "learning_rate": 1.5985182103268779e-06, + "loss": 0.9521, + "step": 37091 + }, + { + "epoch": 0.95, + "learning_rate": 1.5984960430425399e-06, + "loss": 0.8701, + "step": 37092 + }, + { + "epoch": 0.95, + "learning_rate": 1.5984738752999606e-06, + "loss": 0.833, + "step": 37093 + }, + { + "epoch": 0.95, + "learning_rate": 1.5984517070991576e-06, + "loss": 0.8535, + "step": 37094 + }, + { + "epoch": 0.95, + "learning_rate": 1.5984295384401478e-06, + "loss": 0.918, + "step": 37095 + }, + { + "epoch": 0.95, + "learning_rate": 1.5984073693229482e-06, + "loss": 0.6934, + "step": 37096 + }, + { + "epoch": 0.95, + "learning_rate": 1.5983851997475752e-06, + "loss": 0.7241, + "step": 37097 + }, + { + "epoch": 0.95, + "learning_rate": 1.5983630297140465e-06, + "loss": 0.9395, + "step": 37098 + }, + { + "epoch": 0.95, + "learning_rate": 1.5983408592223784e-06, + "loss": 0.7456, + "step": 37099 + }, + { + "epoch": 0.95, + "learning_rate": 1.5983186882725886e-06, + "loss": 0.835, + "step": 37100 + }, + { + "epoch": 0.95, + "learning_rate": 1.5982965168646937e-06, + "loss": 0.8369, + "step": 37101 + }, + { + "epoch": 0.95, + "learning_rate": 1.5982743449987102e-06, + "loss": 0.7739, + "step": 37102 + }, + { + "epoch": 0.95, + "learning_rate": 1.5982521726746558e-06, + "loss": 0.9814, + "step": 37103 + }, + { + "epoch": 0.95, + "learning_rate": 1.598229999892547e-06, + "loss": 0.9023, + "step": 37104 + }, + { + "epoch": 0.95, + "learning_rate": 1.5982078266524013e-06, + "loss": 0.873, + "step": 37105 + }, + { + "epoch": 0.95, + "learning_rate": 1.5981856529542352e-06, + "loss": 0.8838, + "step": 37106 + }, + { + "epoch": 0.95, + "learning_rate": 1.598163478798066e-06, + "loss": 0.7344, + "step": 37107 + }, + { + "epoch": 0.95, + "learning_rate": 1.5981413041839104e-06, + "loss": 0.7852, + "step": 37108 + }, + { + "epoch": 0.95, + "learning_rate": 1.5981191291117855e-06, + "loss": 0.8066, + "step": 37109 + }, + { + "epoch": 0.95, + "learning_rate": 1.5980969535817082e-06, + "loss": 0.8682, + "step": 37110 + }, + { + "epoch": 0.95, + "learning_rate": 1.598074777593696e-06, + "loss": 0.9473, + "step": 37111 + }, + { + "epoch": 0.95, + "learning_rate": 1.598052601147765e-06, + "loss": 0.8481, + "step": 37112 + }, + { + "epoch": 0.95, + "learning_rate": 1.5980304242439328e-06, + "loss": 0.75, + "step": 37113 + }, + { + "epoch": 0.95, + "learning_rate": 1.598008246882216e-06, + "loss": 0.8418, + "step": 37114 + }, + { + "epoch": 0.95, + "learning_rate": 1.5979860690626321e-06, + "loss": 0.9307, + "step": 37115 + }, + { + "epoch": 0.95, + "learning_rate": 1.5979638907851977e-06, + "loss": 0.9287, + "step": 37116 + }, + { + "epoch": 0.95, + "learning_rate": 1.5979417120499297e-06, + "loss": 0.916, + "step": 37117 + }, + { + "epoch": 0.95, + "learning_rate": 1.5979195328568453e-06, + "loss": 0.8252, + "step": 37118 + }, + { + "epoch": 0.95, + "learning_rate": 1.5978973532059614e-06, + "loss": 1.0967, + "step": 37119 + }, + { + "epoch": 0.95, + "learning_rate": 1.5978751730972949e-06, + "loss": 0.8525, + "step": 37120 + }, + { + "epoch": 0.95, + "learning_rate": 1.5978529925308632e-06, + "loss": 0.7773, + "step": 37121 + }, + { + "epoch": 0.95, + "learning_rate": 1.5978308115066827e-06, + "loss": 0.9463, + "step": 37122 + }, + { + "epoch": 0.95, + "learning_rate": 1.5978086300247706e-06, + "loss": 0.9834, + "step": 37123 + }, + { + "epoch": 0.95, + "learning_rate": 1.5977864480851437e-06, + "loss": 0.6812, + "step": 37124 + }, + { + "epoch": 0.95, + "learning_rate": 1.5977642656878196e-06, + "loss": 0.7002, + "step": 37125 + }, + { + "epoch": 0.95, + "learning_rate": 1.5977420828328148e-06, + "loss": 0.9062, + "step": 37126 + }, + { + "epoch": 0.95, + "learning_rate": 1.5977198995201465e-06, + "loss": 0.9482, + "step": 37127 + }, + { + "epoch": 0.95, + "learning_rate": 1.5976977157498313e-06, + "loss": 0.718, + "step": 37128 + }, + { + "epoch": 0.95, + "learning_rate": 1.5976755315218865e-06, + "loss": 1.0684, + "step": 37129 + }, + { + "epoch": 0.95, + "learning_rate": 1.597653346836329e-06, + "loss": 0.8184, + "step": 37130 + }, + { + "epoch": 0.95, + "learning_rate": 1.597631161693176e-06, + "loss": 0.7246, + "step": 37131 + }, + { + "epoch": 0.95, + "learning_rate": 1.597608976092444e-06, + "loss": 0.7656, + "step": 37132 + }, + { + "epoch": 0.95, + "learning_rate": 1.5975867900341504e-06, + "loss": 0.8105, + "step": 37133 + }, + { + "epoch": 0.95, + "learning_rate": 1.5975646035183122e-06, + "loss": 0.8145, + "step": 37134 + }, + { + "epoch": 0.95, + "learning_rate": 1.5975424165449461e-06, + "loss": 0.5356, + "step": 37135 + }, + { + "epoch": 0.95, + "learning_rate": 1.5975202291140695e-06, + "loss": 0.6787, + "step": 37136 + }, + { + "epoch": 0.95, + "learning_rate": 1.5974980412256989e-06, + "loss": 0.6382, + "step": 37137 + }, + { + "epoch": 0.95, + "learning_rate": 1.5974758528798515e-06, + "loss": 0.7588, + "step": 37138 + }, + { + "epoch": 0.95, + "learning_rate": 1.5974536640765445e-06, + "loss": 0.9482, + "step": 37139 + }, + { + "epoch": 0.95, + "learning_rate": 1.5974314748157944e-06, + "loss": 0.7539, + "step": 37140 + }, + { + "epoch": 0.95, + "learning_rate": 1.5974092850976191e-06, + "loss": 0.8418, + "step": 37141 + }, + { + "epoch": 0.95, + "learning_rate": 1.5973870949220345e-06, + "loss": 1.082, + "step": 37142 + }, + { + "epoch": 0.95, + "learning_rate": 1.597364904289058e-06, + "loss": 0.8203, + "step": 37143 + }, + { + "epoch": 0.95, + "learning_rate": 1.5973427131987067e-06, + "loss": 0.8438, + "step": 37144 + }, + { + "epoch": 0.95, + "learning_rate": 1.5973205216509977e-06, + "loss": 1.0293, + "step": 37145 + }, + { + "epoch": 0.95, + "learning_rate": 1.5972983296459479e-06, + "loss": 0.5304, + "step": 37146 + }, + { + "epoch": 0.95, + "learning_rate": 1.5972761371835742e-06, + "loss": 0.9385, + "step": 37147 + }, + { + "epoch": 0.95, + "learning_rate": 1.5972539442638935e-06, + "loss": 0.9756, + "step": 37148 + }, + { + "epoch": 0.95, + "learning_rate": 1.5972317508869228e-06, + "loss": 0.8184, + "step": 37149 + }, + { + "epoch": 0.95, + "learning_rate": 1.5972095570526793e-06, + "loss": 0.6255, + "step": 37150 + }, + { + "epoch": 0.95, + "learning_rate": 1.59718736276118e-06, + "loss": 0.9795, + "step": 37151 + }, + { + "epoch": 0.95, + "learning_rate": 1.597165168012442e-06, + "loss": 0.5879, + "step": 37152 + }, + { + "epoch": 0.95, + "learning_rate": 1.5971429728064818e-06, + "loss": 0.8945, + "step": 37153 + }, + { + "epoch": 0.95, + "learning_rate": 1.5971207771433167e-06, + "loss": 0.9209, + "step": 37154 + }, + { + "epoch": 0.95, + "learning_rate": 1.5970985810229639e-06, + "loss": 0.8955, + "step": 37155 + }, + { + "epoch": 0.95, + "learning_rate": 1.5970763844454398e-06, + "loss": 0.9131, + "step": 37156 + }, + { + "epoch": 0.95, + "learning_rate": 1.597054187410762e-06, + "loss": 0.9009, + "step": 37157 + }, + { + "epoch": 0.95, + "learning_rate": 1.5970319899189473e-06, + "loss": 0.7939, + "step": 37158 + }, + { + "epoch": 0.95, + "learning_rate": 1.5970097919700126e-06, + "loss": 0.7383, + "step": 37159 + }, + { + "epoch": 0.95, + "learning_rate": 1.5969875935639748e-06, + "loss": 0.8682, + "step": 37160 + }, + { + "epoch": 0.95, + "learning_rate": 1.5969653947008515e-06, + "loss": 0.7432, + "step": 37161 + }, + { + "epoch": 0.95, + "learning_rate": 1.5969431953806587e-06, + "loss": 0.9229, + "step": 37162 + }, + { + "epoch": 0.95, + "learning_rate": 1.5969209956034141e-06, + "loss": 0.8525, + "step": 37163 + }, + { + "epoch": 0.95, + "learning_rate": 1.596898795369135e-06, + "loss": 1.0098, + "step": 37164 + }, + { + "epoch": 0.95, + "learning_rate": 1.5968765946778374e-06, + "loss": 1.001, + "step": 37165 + }, + { + "epoch": 0.95, + "learning_rate": 1.5968543935295391e-06, + "loss": 0.9043, + "step": 37166 + }, + { + "epoch": 0.95, + "learning_rate": 1.5968321919242564e-06, + "loss": 0.8594, + "step": 37167 + }, + { + "epoch": 0.95, + "learning_rate": 1.5968099898620072e-06, + "loss": 0.8125, + "step": 37168 + }, + { + "epoch": 0.95, + "learning_rate": 1.596787787342808e-06, + "loss": 0.5669, + "step": 37169 + }, + { + "epoch": 0.95, + "learning_rate": 1.5967655843666757e-06, + "loss": 1.0059, + "step": 37170 + }, + { + "epoch": 0.95, + "learning_rate": 1.5967433809336276e-06, + "loss": 0.9248, + "step": 37171 + }, + { + "epoch": 0.95, + "learning_rate": 1.5967211770436802e-06, + "loss": 0.647, + "step": 37172 + }, + { + "epoch": 0.95, + "learning_rate": 1.596698972696851e-06, + "loss": 1.083, + "step": 37173 + }, + { + "epoch": 0.95, + "learning_rate": 1.596676767893157e-06, + "loss": 0.833, + "step": 37174 + }, + { + "epoch": 0.95, + "learning_rate": 1.5966545626326146e-06, + "loss": 0.876, + "step": 37175 + }, + { + "epoch": 0.95, + "learning_rate": 1.5966323569152417e-06, + "loss": 0.8779, + "step": 37176 + }, + { + "epoch": 0.95, + "learning_rate": 1.5966101507410548e-06, + "loss": 0.8057, + "step": 37177 + }, + { + "epoch": 0.95, + "learning_rate": 1.5965879441100706e-06, + "loss": 0.8691, + "step": 37178 + }, + { + "epoch": 0.95, + "learning_rate": 1.5965657370223066e-06, + "loss": 0.75, + "step": 37179 + }, + { + "epoch": 0.95, + "learning_rate": 1.5965435294777799e-06, + "loss": 0.6716, + "step": 37180 + }, + { + "epoch": 0.95, + "learning_rate": 1.596521321476507e-06, + "loss": 0.6445, + "step": 37181 + }, + { + "epoch": 0.95, + "learning_rate": 1.5964991130185053e-06, + "loss": 0.9414, + "step": 37182 + }, + { + "epoch": 0.95, + "learning_rate": 1.5964769041037913e-06, + "loss": 1.168, + "step": 37183 + }, + { + "epoch": 0.95, + "learning_rate": 1.5964546947323827e-06, + "loss": 0.9268, + "step": 37184 + }, + { + "epoch": 0.95, + "learning_rate": 1.5964324849042964e-06, + "loss": 0.7979, + "step": 37185 + }, + { + "epoch": 0.95, + "learning_rate": 1.5964102746195488e-06, + "loss": 0.7788, + "step": 37186 + }, + { + "epoch": 0.95, + "learning_rate": 1.5963880638781573e-06, + "loss": 0.8701, + "step": 37187 + }, + { + "epoch": 0.95, + "learning_rate": 1.596365852680139e-06, + "loss": 1.1035, + "step": 37188 + }, + { + "epoch": 0.95, + "learning_rate": 1.5963436410255104e-06, + "loss": 0.5938, + "step": 37189 + }, + { + "epoch": 0.95, + "learning_rate": 1.5963214289142891e-06, + "loss": 0.9238, + "step": 37190 + }, + { + "epoch": 0.95, + "learning_rate": 1.5962992163464924e-06, + "loss": 0.9229, + "step": 37191 + }, + { + "epoch": 0.95, + "learning_rate": 1.5962770033221363e-06, + "loss": 0.9536, + "step": 37192 + }, + { + "epoch": 0.95, + "learning_rate": 1.5962547898412385e-06, + "loss": 0.9111, + "step": 37193 + }, + { + "epoch": 0.95, + "learning_rate": 1.5962325759038155e-06, + "loss": 1.0059, + "step": 37194 + }, + { + "epoch": 0.95, + "learning_rate": 1.5962103615098849e-06, + "loss": 0.8496, + "step": 37195 + }, + { + "epoch": 0.95, + "learning_rate": 1.5961881466594635e-06, + "loss": 0.7549, + "step": 37196 + }, + { + "epoch": 0.95, + "learning_rate": 1.5961659313525682e-06, + "loss": 0.8086, + "step": 37197 + }, + { + "epoch": 0.95, + "learning_rate": 1.596143715589216e-06, + "loss": 1.0557, + "step": 37198 + }, + { + "epoch": 0.95, + "learning_rate": 1.5961214993694241e-06, + "loss": 0.8398, + "step": 37199 + }, + { + "epoch": 0.95, + "learning_rate": 1.596099282693209e-06, + "loss": 0.9375, + "step": 37200 + }, + { + "epoch": 0.95, + "learning_rate": 1.5960770655605886e-06, + "loss": 0.8926, + "step": 37201 + }, + { + "epoch": 0.95, + "learning_rate": 1.5960548479715793e-06, + "loss": 0.8994, + "step": 37202 + }, + { + "epoch": 0.95, + "learning_rate": 1.5960326299261979e-06, + "loss": 0.8057, + "step": 37203 + }, + { + "epoch": 0.95, + "learning_rate": 1.5960104114244618e-06, + "loss": 0.8926, + "step": 37204 + }, + { + "epoch": 0.95, + "learning_rate": 1.595988192466388e-06, + "loss": 0.8496, + "step": 37205 + }, + { + "epoch": 0.95, + "learning_rate": 1.5959659730519936e-06, + "loss": 0.6543, + "step": 37206 + }, + { + "epoch": 0.95, + "learning_rate": 1.5959437531812954e-06, + "loss": 0.564, + "step": 37207 + }, + { + "epoch": 0.95, + "learning_rate": 1.5959215328543102e-06, + "loss": 0.999, + "step": 37208 + }, + { + "epoch": 0.95, + "learning_rate": 1.5958993120710556e-06, + "loss": 0.4927, + "step": 37209 + }, + { + "epoch": 0.95, + "learning_rate": 1.5958770908315483e-06, + "loss": 0.835, + "step": 37210 + }, + { + "epoch": 0.95, + "learning_rate": 1.5958548691358051e-06, + "loss": 0.6656, + "step": 37211 + }, + { + "epoch": 0.95, + "learning_rate": 1.5958326469838435e-06, + "loss": 0.6572, + "step": 37212 + }, + { + "epoch": 0.95, + "learning_rate": 1.59581042437568e-06, + "loss": 0.7925, + "step": 37213 + }, + { + "epoch": 0.95, + "learning_rate": 1.5957882013113317e-06, + "loss": 0.7107, + "step": 37214 + }, + { + "epoch": 0.95, + "learning_rate": 1.595765977790816e-06, + "loss": 0.7688, + "step": 37215 + }, + { + "epoch": 0.95, + "learning_rate": 1.5957437538141499e-06, + "loss": 0.9424, + "step": 37216 + }, + { + "epoch": 0.95, + "learning_rate": 1.59572152938135e-06, + "loss": 0.6423, + "step": 37217 + }, + { + "epoch": 0.95, + "learning_rate": 1.5956993044924334e-06, + "loss": 0.8887, + "step": 37218 + }, + { + "epoch": 0.95, + "learning_rate": 1.5956770791474172e-06, + "loss": 0.8086, + "step": 37219 + }, + { + "epoch": 0.95, + "learning_rate": 1.5956548533463186e-06, + "loss": 0.8682, + "step": 37220 + }, + { + "epoch": 0.95, + "learning_rate": 1.5956326270891546e-06, + "loss": 0.6792, + "step": 37221 + }, + { + "epoch": 0.95, + "learning_rate": 1.5956104003759419e-06, + "loss": 0.7715, + "step": 37222 + }, + { + "epoch": 0.95, + "learning_rate": 1.5955881732066976e-06, + "loss": 0.9561, + "step": 37223 + }, + { + "epoch": 0.95, + "learning_rate": 1.595565945581439e-06, + "loss": 0.8311, + "step": 37224 + }, + { + "epoch": 0.95, + "learning_rate": 1.5955437175001826e-06, + "loss": 0.7793, + "step": 37225 + }, + { + "epoch": 0.95, + "learning_rate": 1.5955214889629463e-06, + "loss": 0.9053, + "step": 37226 + }, + { + "epoch": 0.95, + "learning_rate": 1.5954992599697464e-06, + "loss": 0.918, + "step": 37227 + }, + { + "epoch": 0.95, + "learning_rate": 1.5954770305206e-06, + "loss": 0.8301, + "step": 37228 + }, + { + "epoch": 0.95, + "learning_rate": 1.5954548006155242e-06, + "loss": 0.917, + "step": 37229 + }, + { + "epoch": 0.95, + "learning_rate": 1.595432570254536e-06, + "loss": 0.8105, + "step": 37230 + }, + { + "epoch": 0.95, + "learning_rate": 1.5954103394376527e-06, + "loss": 0.9473, + "step": 37231 + }, + { + "epoch": 0.95, + "learning_rate": 1.595388108164891e-06, + "loss": 0.918, + "step": 37232 + }, + { + "epoch": 0.95, + "learning_rate": 1.5953658764362676e-06, + "loss": 0.7539, + "step": 37233 + }, + { + "epoch": 0.95, + "learning_rate": 1.5953436442518004e-06, + "loss": 0.9297, + "step": 37234 + }, + { + "epoch": 0.95, + "learning_rate": 1.5953214116115058e-06, + "loss": 0.8174, + "step": 37235 + }, + { + "epoch": 0.95, + "learning_rate": 1.595299178515401e-06, + "loss": 0.7363, + "step": 37236 + }, + { + "epoch": 0.95, + "learning_rate": 1.5952769449635032e-06, + "loss": 0.8145, + "step": 37237 + }, + { + "epoch": 0.95, + "learning_rate": 1.5952547109558284e-06, + "loss": 0.6501, + "step": 37238 + }, + { + "epoch": 0.95, + "learning_rate": 1.5952324764923951e-06, + "loss": 0.9141, + "step": 37239 + }, + { + "epoch": 0.95, + "learning_rate": 1.5952102415732198e-06, + "loss": 0.9619, + "step": 37240 + }, + { + "epoch": 0.95, + "learning_rate": 1.5951880061983189e-06, + "loss": 0.915, + "step": 37241 + }, + { + "epoch": 0.95, + "learning_rate": 1.5951657703677105e-06, + "loss": 0.5903, + "step": 37242 + }, + { + "epoch": 0.95, + "learning_rate": 1.5951435340814106e-06, + "loss": 0.917, + "step": 37243 + }, + { + "epoch": 0.95, + "learning_rate": 1.5951212973394369e-06, + "loss": 0.9287, + "step": 37244 + }, + { + "epoch": 0.95, + "learning_rate": 1.5950990601418058e-06, + "loss": 0.7393, + "step": 37245 + }, + { + "epoch": 0.95, + "learning_rate": 1.5950768224885351e-06, + "loss": 0.9551, + "step": 37246 + }, + { + "epoch": 0.95, + "learning_rate": 1.5950545843796412e-06, + "loss": 0.8105, + "step": 37247 + }, + { + "epoch": 0.95, + "learning_rate": 1.5950323458151416e-06, + "loss": 0.7256, + "step": 37248 + }, + { + "epoch": 0.95, + "learning_rate": 1.595010106795053e-06, + "loss": 0.8789, + "step": 37249 + }, + { + "epoch": 0.95, + "learning_rate": 1.5949878673193923e-06, + "loss": 0.8296, + "step": 37250 + }, + { + "epoch": 0.95, + "learning_rate": 1.5949656273881771e-06, + "loss": 0.7139, + "step": 37251 + }, + { + "epoch": 0.95, + "learning_rate": 1.594943387001424e-06, + "loss": 0.917, + "step": 37252 + }, + { + "epoch": 0.95, + "learning_rate": 1.5949211461591499e-06, + "loss": 0.576, + "step": 37253 + }, + { + "epoch": 0.95, + "learning_rate": 1.5948989048613722e-06, + "loss": 0.7783, + "step": 37254 + }, + { + "epoch": 0.95, + "learning_rate": 1.5948766631081076e-06, + "loss": 0.5884, + "step": 37255 + }, + { + "epoch": 0.95, + "learning_rate": 1.5948544208993735e-06, + "loss": 0.8838, + "step": 37256 + }, + { + "epoch": 0.95, + "learning_rate": 1.5948321782351865e-06, + "loss": 0.9141, + "step": 37257 + }, + { + "epoch": 0.95, + "learning_rate": 1.5948099351155642e-06, + "loss": 0.8711, + "step": 37258 + }, + { + "epoch": 0.95, + "learning_rate": 1.5947876915405227e-06, + "loss": 0.8408, + "step": 37259 + }, + { + "epoch": 0.95, + "learning_rate": 1.59476544751008e-06, + "loss": 0.6919, + "step": 37260 + }, + { + "epoch": 0.96, + "learning_rate": 1.5947432030242527e-06, + "loss": 0.9492, + "step": 37261 + }, + { + "epoch": 0.96, + "learning_rate": 1.594720958083058e-06, + "loss": 0.9912, + "step": 37262 + }, + { + "epoch": 0.96, + "learning_rate": 1.5946987126865125e-06, + "loss": 0.8164, + "step": 37263 + }, + { + "epoch": 0.96, + "learning_rate": 1.594676466834634e-06, + "loss": 0.812, + "step": 37264 + }, + { + "epoch": 0.96, + "learning_rate": 1.5946542205274386e-06, + "loss": 0.8447, + "step": 37265 + }, + { + "epoch": 0.96, + "learning_rate": 1.5946319737649442e-06, + "loss": 0.9053, + "step": 37266 + }, + { + "epoch": 0.96, + "learning_rate": 1.5946097265471675e-06, + "loss": 0.8218, + "step": 37267 + }, + { + "epoch": 0.96, + "learning_rate": 1.594587478874125e-06, + "loss": 0.9287, + "step": 37268 + }, + { + "epoch": 0.96, + "learning_rate": 1.5945652307458343e-06, + "loss": 1.0342, + "step": 37269 + }, + { + "epoch": 0.96, + "learning_rate": 1.5945429821623125e-06, + "loss": 1.0381, + "step": 37270 + }, + { + "epoch": 0.96, + "learning_rate": 1.5945207331235767e-06, + "loss": 0.7769, + "step": 37271 + }, + { + "epoch": 0.96, + "learning_rate": 1.5944984836296433e-06, + "loss": 0.6562, + "step": 37272 + }, + { + "epoch": 0.96, + "learning_rate": 1.59447623368053e-06, + "loss": 1.0039, + "step": 37273 + }, + { + "epoch": 0.96, + "learning_rate": 1.5944539832762534e-06, + "loss": 0.8252, + "step": 37274 + }, + { + "epoch": 0.96, + "learning_rate": 1.594431732416831e-06, + "loss": 0.8516, + "step": 37275 + }, + { + "epoch": 0.96, + "learning_rate": 1.5944094811022796e-06, + "loss": 0.4946, + "step": 37276 + }, + { + "epoch": 0.96, + "learning_rate": 1.5943872293326157e-06, + "loss": 1.1133, + "step": 37277 + }, + { + "epoch": 0.96, + "learning_rate": 1.5943649771078572e-06, + "loss": 0.8682, + "step": 37278 + }, + { + "epoch": 0.96, + "learning_rate": 1.5943427244280205e-06, + "loss": 0.9902, + "step": 37279 + }, + { + "epoch": 0.96, + "learning_rate": 1.5943204712931231e-06, + "loss": 0.7974, + "step": 37280 + }, + { + "epoch": 0.96, + "learning_rate": 1.5942982177031819e-06, + "loss": 0.8027, + "step": 37281 + }, + { + "epoch": 0.96, + "learning_rate": 1.5942759636582137e-06, + "loss": 0.7178, + "step": 37282 + }, + { + "epoch": 0.96, + "learning_rate": 1.5942537091582357e-06, + "loss": 0.9399, + "step": 37283 + }, + { + "epoch": 0.96, + "learning_rate": 1.5942314542032653e-06, + "loss": 1.0176, + "step": 37284 + }, + { + "epoch": 0.96, + "learning_rate": 1.5942091987933188e-06, + "loss": 0.9492, + "step": 37285 + }, + { + "epoch": 0.96, + "learning_rate": 1.5941869429284137e-06, + "loss": 0.8086, + "step": 37286 + }, + { + "epoch": 0.96, + "learning_rate": 1.5941646866085675e-06, + "loss": 0.9375, + "step": 37287 + }, + { + "epoch": 0.96, + "learning_rate": 1.594142429833796e-06, + "loss": 0.79, + "step": 37288 + }, + { + "epoch": 0.96, + "learning_rate": 1.5941201726041173e-06, + "loss": 0.7012, + "step": 37289 + }, + { + "epoch": 0.96, + "learning_rate": 1.5940979149195482e-06, + "loss": 1.0664, + "step": 37290 + }, + { + "epoch": 0.96, + "learning_rate": 1.5940756567801054e-06, + "loss": 0.9443, + "step": 37291 + }, + { + "epoch": 0.96, + "learning_rate": 1.5940533981858063e-06, + "loss": 0.9932, + "step": 37292 + }, + { + "epoch": 0.96, + "learning_rate": 1.5940311391366678e-06, + "loss": 0.8779, + "step": 37293 + }, + { + "epoch": 0.96, + "learning_rate": 1.5940088796327072e-06, + "loss": 0.8008, + "step": 37294 + }, + { + "epoch": 0.96, + "learning_rate": 1.5939866196739409e-06, + "loss": 0.8369, + "step": 37295 + }, + { + "epoch": 0.96, + "learning_rate": 1.593964359260387e-06, + "loss": 0.6633, + "step": 37296 + }, + { + "epoch": 0.96, + "learning_rate": 1.5939420983920612e-06, + "loss": 0.4458, + "step": 37297 + }, + { + "epoch": 0.96, + "learning_rate": 1.5939198370689815e-06, + "loss": 0.8174, + "step": 37298 + }, + { + "epoch": 0.96, + "learning_rate": 1.5938975752911645e-06, + "loss": 0.8379, + "step": 37299 + }, + { + "epoch": 0.96, + "learning_rate": 1.5938753130586278e-06, + "loss": 0.5981, + "step": 37300 + }, + { + "epoch": 0.96, + "learning_rate": 1.593853050371388e-06, + "loss": 0.9062, + "step": 37301 + }, + { + "epoch": 0.96, + "learning_rate": 1.5938307872294621e-06, + "loss": 0.957, + "step": 37302 + }, + { + "epoch": 0.96, + "learning_rate": 1.5938085236328674e-06, + "loss": 0.8857, + "step": 37303 + }, + { + "epoch": 0.96, + "learning_rate": 1.5937862595816208e-06, + "loss": 0.917, + "step": 37304 + }, + { + "epoch": 0.96, + "learning_rate": 1.5937639950757392e-06, + "loss": 0.6182, + "step": 37305 + }, + { + "epoch": 0.96, + "learning_rate": 1.5937417301152397e-06, + "loss": 0.9746, + "step": 37306 + }, + { + "epoch": 0.96, + "learning_rate": 1.5937194647001398e-06, + "loss": 0.7461, + "step": 37307 + }, + { + "epoch": 0.96, + "learning_rate": 1.5936971988304562e-06, + "loss": 0.9453, + "step": 37308 + }, + { + "epoch": 0.96, + "learning_rate": 1.5936749325062055e-06, + "loss": 0.7861, + "step": 37309 + }, + { + "epoch": 0.96, + "learning_rate": 1.5936526657274056e-06, + "loss": 0.9629, + "step": 37310 + }, + { + "epoch": 0.96, + "learning_rate": 1.5936303984940733e-06, + "loss": 0.7183, + "step": 37311 + }, + { + "epoch": 0.96, + "learning_rate": 1.5936081308062252e-06, + "loss": 0.8442, + "step": 37312 + }, + { + "epoch": 0.96, + "learning_rate": 1.5935858626638786e-06, + "loss": 0.9385, + "step": 37313 + }, + { + "epoch": 0.96, + "learning_rate": 1.5935635940670506e-06, + "loss": 1.0225, + "step": 37314 + }, + { + "epoch": 0.96, + "learning_rate": 1.5935413250157586e-06, + "loss": 1.042, + "step": 37315 + }, + { + "epoch": 0.96, + "learning_rate": 1.5935190555100193e-06, + "loss": 0.7207, + "step": 37316 + }, + { + "epoch": 0.96, + "learning_rate": 1.5934967855498493e-06, + "loss": 0.9736, + "step": 37317 + }, + { + "epoch": 0.96, + "learning_rate": 1.5934745151352664e-06, + "loss": 0.9844, + "step": 37318 + }, + { + "epoch": 0.96, + "learning_rate": 1.5934522442662873e-06, + "loss": 0.9561, + "step": 37319 + }, + { + "epoch": 0.96, + "learning_rate": 1.593429972942929e-06, + "loss": 0.7617, + "step": 37320 + }, + { + "epoch": 0.96, + "learning_rate": 1.5934077011652089e-06, + "loss": 0.7676, + "step": 37321 + }, + { + "epoch": 0.96, + "learning_rate": 1.5933854289331437e-06, + "loss": 0.6304, + "step": 37322 + }, + { + "epoch": 0.96, + "learning_rate": 1.5933631562467503e-06, + "loss": 0.7363, + "step": 37323 + }, + { + "epoch": 0.96, + "learning_rate": 1.5933408831060464e-06, + "loss": 0.7871, + "step": 37324 + }, + { + "epoch": 0.96, + "learning_rate": 1.5933186095110483e-06, + "loss": 0.793, + "step": 37325 + }, + { + "epoch": 0.96, + "learning_rate": 1.593296335461774e-06, + "loss": 0.5431, + "step": 37326 + }, + { + "epoch": 0.96, + "learning_rate": 1.5932740609582393e-06, + "loss": 0.9307, + "step": 37327 + }, + { + "epoch": 0.96, + "learning_rate": 1.5932517860004623e-06, + "loss": 0.5278, + "step": 37328 + }, + { + "epoch": 0.96, + "learning_rate": 1.5932295105884594e-06, + "loss": 0.7773, + "step": 37329 + }, + { + "epoch": 0.96, + "learning_rate": 1.5932072347222483e-06, + "loss": 0.5449, + "step": 37330 + }, + { + "epoch": 0.96, + "learning_rate": 1.5931849584018455e-06, + "loss": 0.9941, + "step": 37331 + }, + { + "epoch": 0.96, + "learning_rate": 1.5931626816272682e-06, + "loss": 0.6484, + "step": 37332 + }, + { + "epoch": 0.96, + "learning_rate": 1.5931404043985337e-06, + "loss": 0.6228, + "step": 37333 + }, + { + "epoch": 0.96, + "learning_rate": 1.5931181267156587e-06, + "loss": 0.9082, + "step": 37334 + }, + { + "epoch": 0.96, + "learning_rate": 1.5930958485786605e-06, + "loss": 0.8457, + "step": 37335 + }, + { + "epoch": 0.96, + "learning_rate": 1.5930735699875561e-06, + "loss": 0.9775, + "step": 37336 + }, + { + "epoch": 0.96, + "learning_rate": 1.5930512909423626e-06, + "loss": 0.8398, + "step": 37337 + }, + { + "epoch": 0.96, + "learning_rate": 1.593029011443097e-06, + "loss": 0.9014, + "step": 37338 + }, + { + "epoch": 0.96, + "learning_rate": 1.5930067314897763e-06, + "loss": 0.7773, + "step": 37339 + }, + { + "epoch": 0.96, + "learning_rate": 1.5929844510824174e-06, + "loss": 0.7656, + "step": 37340 + }, + { + "epoch": 0.96, + "learning_rate": 1.5929621702210381e-06, + "loss": 0.875, + "step": 37341 + }, + { + "epoch": 0.96, + "learning_rate": 1.5929398889056543e-06, + "loss": 0.8115, + "step": 37342 + }, + { + "epoch": 0.96, + "learning_rate": 1.592917607136284e-06, + "loss": 0.7126, + "step": 37343 + }, + { + "epoch": 0.96, + "learning_rate": 1.592895324912944e-06, + "loss": 0.8389, + "step": 37344 + }, + { + "epoch": 0.96, + "learning_rate": 1.5928730422356512e-06, + "loss": 1.0068, + "step": 37345 + }, + { + "epoch": 0.96, + "learning_rate": 1.5928507591044229e-06, + "loss": 0.8906, + "step": 37346 + }, + { + "epoch": 0.96, + "learning_rate": 1.5928284755192757e-06, + "loss": 0.7285, + "step": 37347 + }, + { + "epoch": 0.96, + "learning_rate": 1.5928061914802276e-06, + "loss": 0.6089, + "step": 37348 + }, + { + "epoch": 0.96, + "learning_rate": 1.5927839069872943e-06, + "loss": 0.8047, + "step": 37349 + }, + { + "epoch": 0.96, + "learning_rate": 1.592761622040494e-06, + "loss": 0.6064, + "step": 37350 + }, + { + "epoch": 0.96, + "learning_rate": 1.5927393366398436e-06, + "loss": 1.0625, + "step": 37351 + }, + { + "epoch": 0.96, + "learning_rate": 1.5927170507853599e-06, + "loss": 0.7812, + "step": 37352 + }, + { + "epoch": 0.96, + "learning_rate": 1.5926947644770596e-06, + "loss": 0.8623, + "step": 37353 + }, + { + "epoch": 0.96, + "learning_rate": 1.5926724777149604e-06, + "loss": 0.9648, + "step": 37354 + }, + { + "epoch": 0.96, + "learning_rate": 1.5926501904990792e-06, + "loss": 0.6694, + "step": 37355 + }, + { + "epoch": 0.96, + "learning_rate": 1.592627902829433e-06, + "loss": 1.0342, + "step": 37356 + }, + { + "epoch": 0.96, + "learning_rate": 1.5926056147060386e-06, + "loss": 0.8418, + "step": 37357 + }, + { + "epoch": 0.96, + "learning_rate": 1.5925833261289138e-06, + "loss": 0.9463, + "step": 37358 + }, + { + "epoch": 0.96, + "learning_rate": 1.5925610370980748e-06, + "loss": 1.0205, + "step": 37359 + }, + { + "epoch": 0.96, + "learning_rate": 1.5925387476135393e-06, + "loss": 0.9375, + "step": 37360 + }, + { + "epoch": 0.96, + "learning_rate": 1.592516457675324e-06, + "loss": 0.6074, + "step": 37361 + }, + { + "epoch": 0.96, + "learning_rate": 1.5924941672834461e-06, + "loss": 0.7803, + "step": 37362 + }, + { + "epoch": 0.96, + "learning_rate": 1.5924718764379229e-06, + "loss": 0.7725, + "step": 37363 + }, + { + "epoch": 0.96, + "learning_rate": 1.5924495851387709e-06, + "loss": 0.9229, + "step": 37364 + }, + { + "epoch": 0.96, + "learning_rate": 1.5924272933860077e-06, + "loss": 0.8838, + "step": 37365 + }, + { + "epoch": 0.96, + "learning_rate": 1.59240500117965e-06, + "loss": 0.7842, + "step": 37366 + }, + { + "epoch": 0.96, + "learning_rate": 1.592382708519715e-06, + "loss": 0.7183, + "step": 37367 + }, + { + "epoch": 0.96, + "learning_rate": 1.59236041540622e-06, + "loss": 0.7979, + "step": 37368 + }, + { + "epoch": 0.96, + "learning_rate": 1.5923381218391817e-06, + "loss": 0.8271, + "step": 37369 + }, + { + "epoch": 0.96, + "learning_rate": 1.5923158278186174e-06, + "loss": 0.8652, + "step": 37370 + }, + { + "epoch": 0.96, + "learning_rate": 1.5922935333445441e-06, + "loss": 0.6436, + "step": 37371 + }, + { + "epoch": 0.96, + "learning_rate": 1.592271238416979e-06, + "loss": 0.8447, + "step": 37372 + }, + { + "epoch": 0.96, + "learning_rate": 1.592248943035939e-06, + "loss": 0.8691, + "step": 37373 + }, + { + "epoch": 0.96, + "learning_rate": 1.592226647201441e-06, + "loss": 0.7832, + "step": 37374 + }, + { + "epoch": 0.96, + "learning_rate": 1.5922043509135025e-06, + "loss": 0.7915, + "step": 37375 + }, + { + "epoch": 0.96, + "learning_rate": 1.5921820541721403e-06, + "loss": 1.0547, + "step": 37376 + }, + { + "epoch": 0.96, + "learning_rate": 1.5921597569773715e-06, + "loss": 0.7063, + "step": 37377 + }, + { + "epoch": 0.96, + "learning_rate": 1.5921374593292131e-06, + "loss": 0.8809, + "step": 37378 + }, + { + "epoch": 0.96, + "learning_rate": 1.5921151612276825e-06, + "loss": 0.833, + "step": 37379 + }, + { + "epoch": 0.96, + "learning_rate": 1.5920928626727965e-06, + "loss": 0.7227, + "step": 37380 + }, + { + "epoch": 0.96, + "learning_rate": 1.5920705636645721e-06, + "loss": 0.8716, + "step": 37381 + }, + { + "epoch": 0.96, + "learning_rate": 1.5920482642030267e-06, + "loss": 0.6411, + "step": 37382 + }, + { + "epoch": 0.96, + "learning_rate": 1.5920259642881768e-06, + "loss": 0.8105, + "step": 37383 + }, + { + "epoch": 0.96, + "learning_rate": 1.5920036639200402e-06, + "loss": 0.6135, + "step": 37384 + }, + { + "epoch": 0.96, + "learning_rate": 1.5919813630986336e-06, + "loss": 0.916, + "step": 37385 + }, + { + "epoch": 0.96, + "learning_rate": 1.591959061823974e-06, + "loss": 0.645, + "step": 37386 + }, + { + "epoch": 0.96, + "learning_rate": 1.5919367600960784e-06, + "loss": 0.8789, + "step": 37387 + }, + { + "epoch": 0.96, + "learning_rate": 1.5919144579149641e-06, + "loss": 0.7617, + "step": 37388 + }, + { + "epoch": 0.96, + "learning_rate": 1.5918921552806483e-06, + "loss": 0.7744, + "step": 37389 + }, + { + "epoch": 0.96, + "learning_rate": 1.591869852193148e-06, + "loss": 0.8271, + "step": 37390 + }, + { + "epoch": 0.96, + "learning_rate": 1.59184754865248e-06, + "loss": 1.3281, + "step": 37391 + }, + { + "epoch": 0.96, + "learning_rate": 1.5918252446586613e-06, + "loss": 1.0967, + "step": 37392 + }, + { + "epoch": 0.96, + "learning_rate": 1.5918029402117093e-06, + "loss": 0.9043, + "step": 37393 + }, + { + "epoch": 0.96, + "learning_rate": 1.5917806353116411e-06, + "loss": 0.8926, + "step": 37394 + }, + { + "epoch": 0.96, + "learning_rate": 1.5917583299584738e-06, + "loss": 0.9009, + "step": 37395 + }, + { + "epoch": 0.96, + "learning_rate": 1.5917360241522243e-06, + "loss": 0.7725, + "step": 37396 + }, + { + "epoch": 0.96, + "learning_rate": 1.5917137178929096e-06, + "loss": 0.7559, + "step": 37397 + }, + { + "epoch": 0.96, + "learning_rate": 1.591691411180547e-06, + "loss": 0.8049, + "step": 37398 + }, + { + "epoch": 0.96, + "learning_rate": 1.5916691040151537e-06, + "loss": 0.7969, + "step": 37399 + }, + { + "epoch": 0.96, + "learning_rate": 1.5916467963967463e-06, + "loss": 0.8643, + "step": 37400 + }, + { + "epoch": 0.96, + "learning_rate": 1.5916244883253422e-06, + "loss": 0.7192, + "step": 37401 + }, + { + "epoch": 0.96, + "learning_rate": 1.5916021798009585e-06, + "loss": 0.6528, + "step": 37402 + }, + { + "epoch": 0.96, + "learning_rate": 1.591579870823612e-06, + "loss": 0.8115, + "step": 37403 + }, + { + "epoch": 0.96, + "learning_rate": 1.59155756139332e-06, + "loss": 0.7617, + "step": 37404 + }, + { + "epoch": 0.96, + "learning_rate": 1.5915352515101002e-06, + "loss": 0.9023, + "step": 37405 + }, + { + "epoch": 0.96, + "learning_rate": 1.5915129411739685e-06, + "loss": 0.8506, + "step": 37406 + }, + { + "epoch": 0.96, + "learning_rate": 1.5914906303849426e-06, + "loss": 0.6753, + "step": 37407 + }, + { + "epoch": 0.96, + "learning_rate": 1.5914683191430396e-06, + "loss": 0.8369, + "step": 37408 + }, + { + "epoch": 0.96, + "learning_rate": 1.5914460074482766e-06, + "loss": 1.0078, + "step": 37409 + }, + { + "epoch": 0.96, + "learning_rate": 1.5914236953006707e-06, + "loss": 0.7319, + "step": 37410 + }, + { + "epoch": 0.96, + "learning_rate": 1.5914013827002384e-06, + "loss": 0.7466, + "step": 37411 + }, + { + "epoch": 0.96, + "learning_rate": 1.5913790696469973e-06, + "loss": 0.9346, + "step": 37412 + }, + { + "epoch": 0.96, + "learning_rate": 1.5913567561409647e-06, + "loss": 0.7881, + "step": 37413 + }, + { + "epoch": 0.96, + "learning_rate": 1.5913344421821573e-06, + "loss": 0.7627, + "step": 37414 + }, + { + "epoch": 0.96, + "learning_rate": 1.5913121277705926e-06, + "loss": 0.9756, + "step": 37415 + }, + { + "epoch": 0.96, + "learning_rate": 1.591289812906287e-06, + "loss": 1.0859, + "step": 37416 + }, + { + "epoch": 0.96, + "learning_rate": 1.591267497589258e-06, + "loss": 0.9473, + "step": 37417 + }, + { + "epoch": 0.96, + "learning_rate": 1.5912451818195228e-06, + "loss": 0.834, + "step": 37418 + }, + { + "epoch": 0.96, + "learning_rate": 1.5912228655970985e-06, + "loss": 0.9121, + "step": 37419 + }, + { + "epoch": 0.96, + "learning_rate": 1.5912005489220017e-06, + "loss": 0.7969, + "step": 37420 + }, + { + "epoch": 0.96, + "learning_rate": 1.5911782317942501e-06, + "loss": 0.8232, + "step": 37421 + }, + { + "epoch": 0.96, + "learning_rate": 1.5911559142138602e-06, + "loss": 0.708, + "step": 37422 + }, + { + "epoch": 0.96, + "learning_rate": 1.5911335961808496e-06, + "loss": 0.8213, + "step": 37423 + }, + { + "epoch": 0.96, + "learning_rate": 1.5911112776952354e-06, + "loss": 0.8574, + "step": 37424 + }, + { + "epoch": 0.96, + "learning_rate": 1.5910889587570343e-06, + "loss": 0.7478, + "step": 37425 + }, + { + "epoch": 0.96, + "learning_rate": 1.5910666393662635e-06, + "loss": 0.8945, + "step": 37426 + }, + { + "epoch": 0.96, + "learning_rate": 1.5910443195229402e-06, + "loss": 1.0225, + "step": 37427 + }, + { + "epoch": 0.96, + "learning_rate": 1.5910219992270814e-06, + "loss": 0.8789, + "step": 37428 + }, + { + "epoch": 0.96, + "learning_rate": 1.5909996784787043e-06, + "loss": 0.8003, + "step": 37429 + }, + { + "epoch": 0.96, + "learning_rate": 1.590977357277826e-06, + "loss": 0.8359, + "step": 37430 + }, + { + "epoch": 0.96, + "learning_rate": 1.5909550356244633e-06, + "loss": 0.8164, + "step": 37431 + }, + { + "epoch": 0.96, + "learning_rate": 1.5909327135186335e-06, + "loss": 0.8208, + "step": 37432 + }, + { + "epoch": 0.96, + "learning_rate": 1.5909103909603538e-06, + "loss": 0.6267, + "step": 37433 + }, + { + "epoch": 0.96, + "learning_rate": 1.590888067949641e-06, + "loss": 0.8442, + "step": 37434 + }, + { + "epoch": 0.96, + "learning_rate": 1.5908657444865128e-06, + "loss": 0.853, + "step": 37435 + }, + { + "epoch": 0.96, + "learning_rate": 1.5908434205709856e-06, + "loss": 0.6709, + "step": 37436 + }, + { + "epoch": 0.96, + "learning_rate": 1.5908210962030767e-06, + "loss": 0.8506, + "step": 37437 + }, + { + "epoch": 0.96, + "learning_rate": 1.5907987713828034e-06, + "loss": 0.7417, + "step": 37438 + }, + { + "epoch": 0.96, + "learning_rate": 1.5907764461101824e-06, + "loss": 0.4043, + "step": 37439 + }, + { + "epoch": 0.96, + "learning_rate": 1.5907541203852315e-06, + "loss": 0.9072, + "step": 37440 + }, + { + "epoch": 0.96, + "learning_rate": 1.5907317942079667e-06, + "loss": 0.9307, + "step": 37441 + }, + { + "epoch": 0.96, + "learning_rate": 1.5907094675784062e-06, + "loss": 0.6919, + "step": 37442 + }, + { + "epoch": 0.96, + "learning_rate": 1.5906871404965665e-06, + "loss": 0.8467, + "step": 37443 + }, + { + "epoch": 0.96, + "learning_rate": 1.5906648129624648e-06, + "loss": 0.783, + "step": 37444 + }, + { + "epoch": 0.96, + "learning_rate": 1.5906424849761185e-06, + "loss": 0.9072, + "step": 37445 + }, + { + "epoch": 0.96, + "learning_rate": 1.5906201565375442e-06, + "loss": 0.793, + "step": 37446 + }, + { + "epoch": 0.96, + "learning_rate": 1.590597827646759e-06, + "loss": 0.793, + "step": 37447 + }, + { + "epoch": 0.96, + "learning_rate": 1.5905754983037802e-06, + "loss": 0.8848, + "step": 37448 + }, + { + "epoch": 0.96, + "learning_rate": 1.590553168508625e-06, + "loss": 0.9854, + "step": 37449 + }, + { + "epoch": 0.96, + "learning_rate": 1.5905308382613108e-06, + "loss": 0.7588, + "step": 37450 + }, + { + "epoch": 0.96, + "learning_rate": 1.5905085075618536e-06, + "loss": 1.0186, + "step": 37451 + }, + { + "epoch": 0.96, + "learning_rate": 1.5904861764102715e-06, + "loss": 0.8828, + "step": 37452 + }, + { + "epoch": 0.96, + "learning_rate": 1.5904638448065812e-06, + "loss": 0.8965, + "step": 37453 + }, + { + "epoch": 0.96, + "learning_rate": 1.5904415127508001e-06, + "loss": 0.6196, + "step": 37454 + }, + { + "epoch": 0.96, + "learning_rate": 1.590419180242945e-06, + "loss": 0.7769, + "step": 37455 + }, + { + "epoch": 0.96, + "learning_rate": 1.590396847283033e-06, + "loss": 0.9238, + "step": 37456 + }, + { + "epoch": 0.96, + "learning_rate": 1.5903745138710813e-06, + "loss": 0.8223, + "step": 37457 + }, + { + "epoch": 0.96, + "learning_rate": 1.590352180007107e-06, + "loss": 0.8613, + "step": 37458 + }, + { + "epoch": 0.96, + "learning_rate": 1.5903298456911272e-06, + "loss": 0.8926, + "step": 37459 + }, + { + "epoch": 0.96, + "learning_rate": 1.590307510923159e-06, + "loss": 0.6538, + "step": 37460 + }, + { + "epoch": 0.96, + "learning_rate": 1.5902851757032196e-06, + "loss": 1.0029, + "step": 37461 + }, + { + "epoch": 0.96, + "learning_rate": 1.5902628400313257e-06, + "loss": 0.698, + "step": 37462 + }, + { + "epoch": 0.96, + "learning_rate": 1.590240503907495e-06, + "loss": 0.9668, + "step": 37463 + }, + { + "epoch": 0.96, + "learning_rate": 1.5902181673317438e-06, + "loss": 0.7705, + "step": 37464 + }, + { + "epoch": 0.96, + "learning_rate": 1.59019583030409e-06, + "loss": 0.8857, + "step": 37465 + }, + { + "epoch": 0.96, + "learning_rate": 1.5901734928245506e-06, + "loss": 0.9766, + "step": 37466 + }, + { + "epoch": 0.96, + "learning_rate": 1.5901511548931421e-06, + "loss": 0.7988, + "step": 37467 + }, + { + "epoch": 0.96, + "learning_rate": 1.5901288165098822e-06, + "loss": 0.7637, + "step": 37468 + }, + { + "epoch": 0.96, + "learning_rate": 1.5901064776747877e-06, + "loss": 1.0781, + "step": 37469 + }, + { + "epoch": 0.96, + "learning_rate": 1.590084138387876e-06, + "loss": 0.6128, + "step": 37470 + }, + { + "epoch": 0.96, + "learning_rate": 1.590061798649164e-06, + "loss": 0.7627, + "step": 37471 + }, + { + "epoch": 0.96, + "learning_rate": 1.5900394584586688e-06, + "loss": 0.9404, + "step": 37472 + }, + { + "epoch": 0.96, + "learning_rate": 1.5900171178164072e-06, + "loss": 0.8936, + "step": 37473 + }, + { + "epoch": 0.96, + "learning_rate": 1.5899947767223968e-06, + "loss": 0.8125, + "step": 37474 + }, + { + "epoch": 0.96, + "learning_rate": 1.5899724351766545e-06, + "loss": 0.7207, + "step": 37475 + }, + { + "epoch": 0.96, + "learning_rate": 1.5899500931791976e-06, + "loss": 0.7754, + "step": 37476 + }, + { + "epoch": 0.96, + "learning_rate": 1.5899277507300428e-06, + "loss": 0.96, + "step": 37477 + }, + { + "epoch": 0.96, + "learning_rate": 1.5899054078292076e-06, + "loss": 0.8994, + "step": 37478 + }, + { + "epoch": 0.96, + "learning_rate": 1.5898830644767089e-06, + "loss": 0.9805, + "step": 37479 + }, + { + "epoch": 0.96, + "learning_rate": 1.5898607206725641e-06, + "loss": 0.6145, + "step": 37480 + }, + { + "epoch": 0.96, + "learning_rate": 1.58983837641679e-06, + "loss": 0.7803, + "step": 37481 + }, + { + "epoch": 0.96, + "learning_rate": 1.5898160317094035e-06, + "loss": 1.0791, + "step": 37482 + }, + { + "epoch": 0.96, + "learning_rate": 1.589793686550422e-06, + "loss": 0.7817, + "step": 37483 + }, + { + "epoch": 0.96, + "learning_rate": 1.5897713409398627e-06, + "loss": 0.9619, + "step": 37484 + }, + { + "epoch": 0.96, + "learning_rate": 1.5897489948777428e-06, + "loss": 0.8818, + "step": 37485 + }, + { + "epoch": 0.96, + "learning_rate": 1.589726648364079e-06, + "loss": 0.8506, + "step": 37486 + }, + { + "epoch": 0.96, + "learning_rate": 1.5897043013988886e-06, + "loss": 1.0469, + "step": 37487 + }, + { + "epoch": 0.96, + "learning_rate": 1.5896819539821888e-06, + "loss": 0.958, + "step": 37488 + }, + { + "epoch": 0.96, + "learning_rate": 1.5896596061139967e-06, + "loss": 0.5791, + "step": 37489 + }, + { + "epoch": 0.96, + "learning_rate": 1.5896372577943294e-06, + "loss": 0.9131, + "step": 37490 + }, + { + "epoch": 0.96, + "learning_rate": 1.5896149090232038e-06, + "loss": 0.7627, + "step": 37491 + }, + { + "epoch": 0.96, + "learning_rate": 1.589592559800637e-06, + "loss": 0.9307, + "step": 37492 + }, + { + "epoch": 0.96, + "learning_rate": 1.5895702101266466e-06, + "loss": 0.8838, + "step": 37493 + }, + { + "epoch": 0.96, + "learning_rate": 1.5895478600012493e-06, + "loss": 0.8701, + "step": 37494 + }, + { + "epoch": 0.96, + "learning_rate": 1.5895255094244627e-06, + "loss": 0.7363, + "step": 37495 + }, + { + "epoch": 0.96, + "learning_rate": 1.5895031583963028e-06, + "loss": 0.9912, + "step": 37496 + }, + { + "epoch": 0.96, + "learning_rate": 1.589480806916788e-06, + "loss": 0.6338, + "step": 37497 + }, + { + "epoch": 0.96, + "learning_rate": 1.5894584549859345e-06, + "loss": 0.8262, + "step": 37498 + }, + { + "epoch": 0.96, + "learning_rate": 1.5894361026037597e-06, + "loss": 0.8457, + "step": 37499 + }, + { + "epoch": 0.96, + "learning_rate": 1.5894137497702814e-06, + "loss": 0.6797, + "step": 37500 + }, + { + "epoch": 0.96, + "learning_rate": 1.5893913964855154e-06, + "loss": 0.6147, + "step": 37501 + }, + { + "epoch": 0.96, + "learning_rate": 1.5893690427494799e-06, + "loss": 0.7104, + "step": 37502 + }, + { + "epoch": 0.96, + "learning_rate": 1.5893466885621916e-06, + "loss": 0.8799, + "step": 37503 + }, + { + "epoch": 0.96, + "learning_rate": 1.5893243339236672e-06, + "loss": 0.7046, + "step": 37504 + }, + { + "epoch": 0.96, + "learning_rate": 1.5893019788339248e-06, + "loss": 0.7607, + "step": 37505 + }, + { + "epoch": 0.96, + "learning_rate": 1.589279623292981e-06, + "loss": 0.8071, + "step": 37506 + }, + { + "epoch": 0.96, + "learning_rate": 1.5892572673008524e-06, + "loss": 0.79, + "step": 37507 + }, + { + "epoch": 0.96, + "learning_rate": 1.5892349108575569e-06, + "loss": 0.9082, + "step": 37508 + }, + { + "epoch": 0.96, + "learning_rate": 1.589212553963111e-06, + "loss": 0.7695, + "step": 37509 + }, + { + "epoch": 0.96, + "learning_rate": 1.5891901966175327e-06, + "loss": 0.9092, + "step": 37510 + }, + { + "epoch": 0.96, + "learning_rate": 1.5891678388208382e-06, + "loss": 0.6772, + "step": 37511 + }, + { + "epoch": 0.96, + "learning_rate": 1.589145480573045e-06, + "loss": 0.8037, + "step": 37512 + }, + { + "epoch": 0.96, + "learning_rate": 1.5891231218741705e-06, + "loss": 0.8232, + "step": 37513 + }, + { + "epoch": 0.96, + "learning_rate": 1.589100762724231e-06, + "loss": 1.1387, + "step": 37514 + }, + { + "epoch": 0.96, + "learning_rate": 1.5890784031232446e-06, + "loss": 0.8799, + "step": 37515 + }, + { + "epoch": 0.96, + "learning_rate": 1.5890560430712277e-06, + "loss": 0.6517, + "step": 37516 + }, + { + "epoch": 0.96, + "learning_rate": 1.589033682568198e-06, + "loss": 0.7627, + "step": 37517 + }, + { + "epoch": 0.96, + "learning_rate": 1.5890113216141718e-06, + "loss": 0.8447, + "step": 37518 + }, + { + "epoch": 0.96, + "learning_rate": 1.5889889602091669e-06, + "loss": 0.7881, + "step": 37519 + }, + { + "epoch": 0.96, + "learning_rate": 1.5889665983532004e-06, + "loss": 0.8955, + "step": 37520 + }, + { + "epoch": 0.96, + "learning_rate": 1.5889442360462892e-06, + "loss": 0.875, + "step": 37521 + }, + { + "epoch": 0.96, + "learning_rate": 1.5889218732884505e-06, + "loss": 0.7871, + "step": 37522 + }, + { + "epoch": 0.96, + "learning_rate": 1.5888995100797012e-06, + "loss": 0.6084, + "step": 37523 + }, + { + "epoch": 0.96, + "learning_rate": 1.5888771464200587e-06, + "loss": 0.8721, + "step": 37524 + }, + { + "epoch": 0.96, + "learning_rate": 1.5888547823095402e-06, + "loss": 0.6357, + "step": 37525 + }, + { + "epoch": 0.96, + "learning_rate": 1.5888324177481625e-06, + "loss": 0.5649, + "step": 37526 + }, + { + "epoch": 0.96, + "learning_rate": 1.5888100527359429e-06, + "loss": 0.6914, + "step": 37527 + }, + { + "epoch": 0.96, + "learning_rate": 1.5887876872728984e-06, + "loss": 0.9443, + "step": 37528 + }, + { + "epoch": 0.96, + "learning_rate": 1.5887653213590465e-06, + "loss": 0.875, + "step": 37529 + }, + { + "epoch": 0.96, + "learning_rate": 1.588742954994404e-06, + "loss": 0.9795, + "step": 37530 + }, + { + "epoch": 0.96, + "learning_rate": 1.588720588178988e-06, + "loss": 0.52, + "step": 37531 + }, + { + "epoch": 0.96, + "learning_rate": 1.5886982209128159e-06, + "loss": 0.9033, + "step": 37532 + }, + { + "epoch": 0.96, + "learning_rate": 1.5886758531959044e-06, + "loss": 0.7383, + "step": 37533 + }, + { + "epoch": 0.96, + "learning_rate": 1.588653485028271e-06, + "loss": 0.9287, + "step": 37534 + }, + { + "epoch": 0.96, + "learning_rate": 1.5886311164099327e-06, + "loss": 0.613, + "step": 37535 + }, + { + "epoch": 0.96, + "learning_rate": 1.5886087473409066e-06, + "loss": 0.7559, + "step": 37536 + }, + { + "epoch": 0.96, + "learning_rate": 1.5885863778212098e-06, + "loss": 0.7644, + "step": 37537 + }, + { + "epoch": 0.96, + "learning_rate": 1.5885640078508595e-06, + "loss": 0.7656, + "step": 37538 + }, + { + "epoch": 0.96, + "learning_rate": 1.5885416374298729e-06, + "loss": 0.7134, + "step": 37539 + }, + { + "epoch": 0.96, + "learning_rate": 1.5885192665582673e-06, + "loss": 0.8486, + "step": 37540 + }, + { + "epoch": 0.96, + "learning_rate": 1.588496895236059e-06, + "loss": 0.7578, + "step": 37541 + }, + { + "epoch": 0.96, + "learning_rate": 1.5884745234632657e-06, + "loss": 0.9941, + "step": 37542 + }, + { + "epoch": 0.96, + "learning_rate": 1.5884521512399048e-06, + "loss": 0.9189, + "step": 37543 + }, + { + "epoch": 0.96, + "learning_rate": 1.588429778565993e-06, + "loss": 0.8682, + "step": 37544 + }, + { + "epoch": 0.96, + "learning_rate": 1.5884074054415479e-06, + "loss": 0.9189, + "step": 37545 + }, + { + "epoch": 0.96, + "learning_rate": 1.588385031866586e-06, + "loss": 0.644, + "step": 37546 + }, + { + "epoch": 0.96, + "learning_rate": 1.5883626578411248e-06, + "loss": 0.9766, + "step": 37547 + }, + { + "epoch": 0.96, + "learning_rate": 1.5883402833651811e-06, + "loss": 0.8135, + "step": 37548 + }, + { + "epoch": 0.96, + "learning_rate": 1.5883179084387727e-06, + "loss": 0.8047, + "step": 37549 + }, + { + "epoch": 0.96, + "learning_rate": 1.588295533061916e-06, + "loss": 0.7188, + "step": 37550 + }, + { + "epoch": 0.96, + "learning_rate": 1.5882731572346288e-06, + "loss": 0.7915, + "step": 37551 + }, + { + "epoch": 0.96, + "learning_rate": 1.5882507809569277e-06, + "loss": 0.7319, + "step": 37552 + }, + { + "epoch": 0.96, + "learning_rate": 1.5882284042288298e-06, + "loss": 0.9189, + "step": 37553 + }, + { + "epoch": 0.96, + "learning_rate": 1.588206027050353e-06, + "loss": 0.8315, + "step": 37554 + }, + { + "epoch": 0.96, + "learning_rate": 1.5881836494215134e-06, + "loss": 0.9824, + "step": 37555 + }, + { + "epoch": 0.96, + "learning_rate": 1.588161271342329e-06, + "loss": 0.6086, + "step": 37556 + }, + { + "epoch": 0.96, + "learning_rate": 1.5881388928128163e-06, + "loss": 0.6714, + "step": 37557 + }, + { + "epoch": 0.96, + "learning_rate": 1.588116513832993e-06, + "loss": 0.6694, + "step": 37558 + }, + { + "epoch": 0.96, + "learning_rate": 1.5880941344028753e-06, + "loss": 0.6255, + "step": 37559 + }, + { + "epoch": 0.96, + "learning_rate": 1.5880717545224816e-06, + "loss": 0.7549, + "step": 37560 + }, + { + "epoch": 0.96, + "learning_rate": 1.5880493741918282e-06, + "loss": 0.7119, + "step": 37561 + }, + { + "epoch": 0.96, + "learning_rate": 1.5880269934109322e-06, + "loss": 0.6895, + "step": 37562 + }, + { + "epoch": 0.96, + "learning_rate": 1.5880046121798114e-06, + "loss": 0.9648, + "step": 37563 + }, + { + "epoch": 0.96, + "learning_rate": 1.5879822304984823e-06, + "loss": 0.834, + "step": 37564 + }, + { + "epoch": 0.96, + "learning_rate": 1.5879598483669621e-06, + "loss": 0.9697, + "step": 37565 + }, + { + "epoch": 0.96, + "learning_rate": 1.5879374657852683e-06, + "loss": 0.8164, + "step": 37566 + }, + { + "epoch": 0.96, + "learning_rate": 1.5879150827534175e-06, + "loss": 0.9756, + "step": 37567 + }, + { + "epoch": 0.96, + "learning_rate": 1.5878926992714274e-06, + "loss": 1.0293, + "step": 37568 + }, + { + "epoch": 0.96, + "learning_rate": 1.5878703153393147e-06, + "loss": 0.749, + "step": 37569 + }, + { + "epoch": 0.96, + "learning_rate": 1.5878479309570971e-06, + "loss": 0.7764, + "step": 37570 + }, + { + "epoch": 0.96, + "learning_rate": 1.5878255461247912e-06, + "loss": 0.9814, + "step": 37571 + }, + { + "epoch": 0.96, + "learning_rate": 1.5878031608424142e-06, + "loss": 0.8037, + "step": 37572 + }, + { + "epoch": 0.96, + "learning_rate": 1.5877807751099835e-06, + "loss": 1.04, + "step": 37573 + }, + { + "epoch": 0.96, + "learning_rate": 1.587758388927516e-06, + "loss": 0.9473, + "step": 37574 + }, + { + "epoch": 0.96, + "learning_rate": 1.587736002295029e-06, + "loss": 0.8418, + "step": 37575 + }, + { + "epoch": 0.96, + "learning_rate": 1.5877136152125394e-06, + "loss": 1.0293, + "step": 37576 + }, + { + "epoch": 0.96, + "learning_rate": 1.5876912276800644e-06, + "loss": 0.9668, + "step": 37577 + }, + { + "epoch": 0.96, + "learning_rate": 1.5876688396976214e-06, + "loss": 0.916, + "step": 37578 + }, + { + "epoch": 0.96, + "learning_rate": 1.5876464512652277e-06, + "loss": 0.8408, + "step": 37579 + }, + { + "epoch": 0.96, + "learning_rate": 1.5876240623829e-06, + "loss": 0.7422, + "step": 37580 + }, + { + "epoch": 0.96, + "learning_rate": 1.5876016730506554e-06, + "loss": 0.7246, + "step": 37581 + }, + { + "epoch": 0.96, + "learning_rate": 1.5875792832685111e-06, + "loss": 0.8384, + "step": 37582 + }, + { + "epoch": 0.96, + "learning_rate": 1.5875568930364845e-06, + "loss": 0.7817, + "step": 37583 + }, + { + "epoch": 0.96, + "learning_rate": 1.5875345023545928e-06, + "loss": 1.0693, + "step": 37584 + }, + { + "epoch": 0.96, + "learning_rate": 1.587512111222853e-06, + "loss": 0.9648, + "step": 37585 + }, + { + "epoch": 0.96, + "learning_rate": 1.5874897196412818e-06, + "loss": 0.7861, + "step": 37586 + }, + { + "epoch": 0.96, + "learning_rate": 1.5874673276098968e-06, + "loss": 0.8047, + "step": 37587 + }, + { + "epoch": 0.96, + "learning_rate": 1.5874449351287152e-06, + "loss": 1.002, + "step": 37588 + }, + { + "epoch": 0.96, + "learning_rate": 1.5874225421977539e-06, + "loss": 0.7769, + "step": 37589 + }, + { + "epoch": 0.96, + "learning_rate": 1.5874001488170303e-06, + "loss": 0.8105, + "step": 37590 + }, + { + "epoch": 0.96, + "learning_rate": 1.5873777549865617e-06, + "loss": 0.7153, + "step": 37591 + }, + { + "epoch": 0.96, + "learning_rate": 1.5873553607063644e-06, + "loss": 0.8652, + "step": 37592 + }, + { + "epoch": 0.96, + "learning_rate": 1.5873329659764565e-06, + "loss": 0.9941, + "step": 37593 + }, + { + "epoch": 0.96, + "learning_rate": 1.5873105707968546e-06, + "loss": 0.7422, + "step": 37594 + }, + { + "epoch": 0.96, + "learning_rate": 1.587288175167576e-06, + "loss": 0.9287, + "step": 37595 + }, + { + "epoch": 0.96, + "learning_rate": 1.5872657790886379e-06, + "loss": 0.7324, + "step": 37596 + }, + { + "epoch": 0.96, + "learning_rate": 1.5872433825600574e-06, + "loss": 0.8262, + "step": 37597 + }, + { + "epoch": 0.96, + "learning_rate": 1.5872209855818515e-06, + "loss": 0.8066, + "step": 37598 + }, + { + "epoch": 0.96, + "learning_rate": 1.5871985881540378e-06, + "loss": 0.8223, + "step": 37599 + }, + { + "epoch": 0.96, + "learning_rate": 1.5871761902766328e-06, + "loss": 0.6763, + "step": 37600 + }, + { + "epoch": 0.96, + "learning_rate": 1.587153791949654e-06, + "loss": 0.7861, + "step": 37601 + }, + { + "epoch": 0.96, + "learning_rate": 1.5871313931731188e-06, + "loss": 0.7354, + "step": 37602 + }, + { + "epoch": 0.96, + "learning_rate": 1.587108993947044e-06, + "loss": 0.9873, + "step": 37603 + }, + { + "epoch": 0.96, + "learning_rate": 1.5870865942714466e-06, + "loss": 0.6523, + "step": 37604 + }, + { + "epoch": 0.96, + "learning_rate": 1.5870641941463446e-06, + "loss": 1.0117, + "step": 37605 + }, + { + "epoch": 0.96, + "learning_rate": 1.5870417935717537e-06, + "loss": 0.9609, + "step": 37606 + }, + { + "epoch": 0.96, + "learning_rate": 1.5870193925476924e-06, + "loss": 0.9336, + "step": 37607 + }, + { + "epoch": 0.96, + "learning_rate": 1.5869969910741774e-06, + "loss": 0.8018, + "step": 37608 + }, + { + "epoch": 0.96, + "learning_rate": 1.5869745891512257e-06, + "loss": 0.8467, + "step": 37609 + }, + { + "epoch": 0.96, + "learning_rate": 1.5869521867788544e-06, + "loss": 0.9219, + "step": 37610 + }, + { + "epoch": 0.96, + "learning_rate": 1.5869297839570809e-06, + "loss": 0.9678, + "step": 37611 + }, + { + "epoch": 0.96, + "learning_rate": 1.5869073806859223e-06, + "loss": 0.9375, + "step": 37612 + }, + { + "epoch": 0.96, + "learning_rate": 1.5868849769653956e-06, + "loss": 0.7051, + "step": 37613 + }, + { + "epoch": 0.96, + "learning_rate": 1.586862572795518e-06, + "loss": 0.8721, + "step": 37614 + }, + { + "epoch": 0.96, + "learning_rate": 1.586840168176307e-06, + "loss": 0.8701, + "step": 37615 + }, + { + "epoch": 0.96, + "learning_rate": 1.5868177631077794e-06, + "loss": 0.8535, + "step": 37616 + }, + { + "epoch": 0.96, + "learning_rate": 1.5867953575899523e-06, + "loss": 0.8027, + "step": 37617 + }, + { + "epoch": 0.96, + "learning_rate": 1.586772951622843e-06, + "loss": 0.9043, + "step": 37618 + }, + { + "epoch": 0.96, + "learning_rate": 1.5867505452064686e-06, + "loss": 0.875, + "step": 37619 + }, + { + "epoch": 0.96, + "learning_rate": 1.5867281383408463e-06, + "loss": 0.7676, + "step": 37620 + }, + { + "epoch": 0.96, + "learning_rate": 1.5867057310259932e-06, + "loss": 0.8105, + "step": 37621 + }, + { + "epoch": 0.96, + "learning_rate": 1.5866833232619265e-06, + "loss": 0.8428, + "step": 37622 + }, + { + "epoch": 0.96, + "learning_rate": 1.5866609150486637e-06, + "loss": 0.7637, + "step": 37623 + }, + { + "epoch": 0.96, + "learning_rate": 1.586638506386221e-06, + "loss": 0.957, + "step": 37624 + }, + { + "epoch": 0.96, + "learning_rate": 1.5866160972746168e-06, + "loss": 0.7773, + "step": 37625 + }, + { + "epoch": 0.96, + "learning_rate": 1.5865936877138674e-06, + "loss": 0.6777, + "step": 37626 + }, + { + "epoch": 0.96, + "learning_rate": 1.58657127770399e-06, + "loss": 0.9424, + "step": 37627 + }, + { + "epoch": 0.96, + "learning_rate": 1.586548867245002e-06, + "loss": 0.8013, + "step": 37628 + }, + { + "epoch": 0.96, + "learning_rate": 1.5865264563369205e-06, + "loss": 0.8447, + "step": 37629 + }, + { + "epoch": 0.96, + "learning_rate": 1.5865040449797628e-06, + "loss": 0.6948, + "step": 37630 + }, + { + "epoch": 0.96, + "learning_rate": 1.586481633173546e-06, + "loss": 0.8955, + "step": 37631 + }, + { + "epoch": 0.96, + "learning_rate": 1.5864592209182867e-06, + "loss": 0.9756, + "step": 37632 + }, + { + "epoch": 0.96, + "learning_rate": 1.586436808214003e-06, + "loss": 0.7529, + "step": 37633 + }, + { + "epoch": 0.96, + "learning_rate": 1.5864143950607115e-06, + "loss": 0.8276, + "step": 37634 + }, + { + "epoch": 0.96, + "learning_rate": 1.5863919814584295e-06, + "loss": 0.916, + "step": 37635 + }, + { + "epoch": 0.96, + "learning_rate": 1.586369567407174e-06, + "loss": 0.9473, + "step": 37636 + }, + { + "epoch": 0.96, + "learning_rate": 1.5863471529069623e-06, + "loss": 0.7949, + "step": 37637 + }, + { + "epoch": 0.96, + "learning_rate": 1.5863247379578115e-06, + "loss": 0.7881, + "step": 37638 + }, + { + "epoch": 0.96, + "learning_rate": 1.586302322559739e-06, + "loss": 0.8359, + "step": 37639 + }, + { + "epoch": 0.96, + "learning_rate": 1.5862799067127616e-06, + "loss": 0.959, + "step": 37640 + }, + { + "epoch": 0.96, + "learning_rate": 1.5862574904168966e-06, + "loss": 0.9463, + "step": 37641 + }, + { + "epoch": 0.96, + "learning_rate": 1.5862350736721615e-06, + "loss": 0.6367, + "step": 37642 + }, + { + "epoch": 0.96, + "learning_rate": 1.5862126564785729e-06, + "loss": 0.6289, + "step": 37643 + }, + { + "epoch": 0.96, + "learning_rate": 1.5861902388361483e-06, + "loss": 0.9014, + "step": 37644 + }, + { + "epoch": 0.96, + "learning_rate": 1.5861678207449048e-06, + "loss": 1.0215, + "step": 37645 + }, + { + "epoch": 0.96, + "learning_rate": 1.5861454022048593e-06, + "loss": 0.6162, + "step": 37646 + }, + { + "epoch": 0.96, + "learning_rate": 1.5861229832160294e-06, + "loss": 1.0273, + "step": 37647 + }, + { + "epoch": 0.96, + "learning_rate": 1.5861005637784321e-06, + "loss": 0.9844, + "step": 37648 + }, + { + "epoch": 0.96, + "learning_rate": 1.5860781438920845e-06, + "loss": 0.9873, + "step": 37649 + }, + { + "epoch": 0.96, + "learning_rate": 1.586055723557004e-06, + "loss": 0.9551, + "step": 37650 + }, + { + "epoch": 0.97, + "learning_rate": 1.5860333027732075e-06, + "loss": 0.7979, + "step": 37651 + }, + { + "epoch": 0.97, + "learning_rate": 1.5860108815407123e-06, + "loss": 0.7822, + "step": 37652 + }, + { + "epoch": 0.97, + "learning_rate": 1.5859884598595353e-06, + "loss": 0.8926, + "step": 37653 + }, + { + "epoch": 0.97, + "learning_rate": 1.585966037729694e-06, + "loss": 0.8843, + "step": 37654 + }, + { + "epoch": 0.97, + "learning_rate": 1.5859436151512056e-06, + "loss": 0.833, + "step": 37655 + }, + { + "epoch": 0.97, + "learning_rate": 1.5859211921240869e-06, + "loss": 0.6255, + "step": 37656 + }, + { + "epoch": 0.97, + "learning_rate": 1.5858987686483553e-06, + "loss": 0.8018, + "step": 37657 + }, + { + "epoch": 0.97, + "learning_rate": 1.585876344724028e-06, + "loss": 1.0098, + "step": 37658 + }, + { + "epoch": 0.97, + "learning_rate": 1.5858539203511221e-06, + "loss": 0.7842, + "step": 37659 + }, + { + "epoch": 0.97, + "learning_rate": 1.5858314955296547e-06, + "loss": 0.7605, + "step": 37660 + }, + { + "epoch": 0.97, + "learning_rate": 1.5858090702596433e-06, + "loss": 0.9473, + "step": 37661 + }, + { + "epoch": 0.97, + "learning_rate": 1.5857866445411047e-06, + "loss": 1.0928, + "step": 37662 + }, + { + "epoch": 0.97, + "learning_rate": 1.5857642183740562e-06, + "loss": 0.7812, + "step": 37663 + }, + { + "epoch": 0.97, + "learning_rate": 1.5857417917585152e-06, + "loss": 1.1113, + "step": 37664 + }, + { + "epoch": 0.97, + "learning_rate": 1.5857193646944983e-06, + "loss": 1.0527, + "step": 37665 + }, + { + "epoch": 0.97, + "learning_rate": 1.585696937182023e-06, + "loss": 0.7979, + "step": 37666 + }, + { + "epoch": 0.97, + "learning_rate": 1.5856745092211066e-06, + "loss": 0.875, + "step": 37667 + }, + { + "epoch": 0.97, + "learning_rate": 1.5856520808117662e-06, + "loss": 0.9203, + "step": 37668 + }, + { + "epoch": 0.97, + "learning_rate": 1.5856296519540191e-06, + "loss": 0.6572, + "step": 37669 + }, + { + "epoch": 0.97, + "learning_rate": 1.585607222647882e-06, + "loss": 0.6187, + "step": 37670 + }, + { + "epoch": 0.97, + "learning_rate": 1.5855847928933726e-06, + "loss": 0.7163, + "step": 37671 + }, + { + "epoch": 0.97, + "learning_rate": 1.5855623626905078e-06, + "loss": 0.7642, + "step": 37672 + }, + { + "epoch": 0.97, + "learning_rate": 1.5855399320393046e-06, + "loss": 0.8848, + "step": 37673 + }, + { + "epoch": 0.97, + "learning_rate": 1.5855175009397806e-06, + "loss": 0.8965, + "step": 37674 + }, + { + "epoch": 0.97, + "learning_rate": 1.585495069391953e-06, + "loss": 0.6675, + "step": 37675 + }, + { + "epoch": 0.97, + "learning_rate": 1.585472637395838e-06, + "loss": 0.7783, + "step": 37676 + }, + { + "epoch": 0.97, + "learning_rate": 1.5854502049514542e-06, + "loss": 0.7417, + "step": 37677 + }, + { + "epoch": 0.97, + "learning_rate": 1.5854277720588178e-06, + "loss": 0.8105, + "step": 37678 + }, + { + "epoch": 0.97, + "learning_rate": 1.5854053387179466e-06, + "loss": 0.9414, + "step": 37679 + }, + { + "epoch": 0.97, + "learning_rate": 1.585382904928857e-06, + "loss": 0.8672, + "step": 37680 + }, + { + "epoch": 0.97, + "learning_rate": 1.585360470691567e-06, + "loss": 0.8828, + "step": 37681 + }, + { + "epoch": 0.97, + "learning_rate": 1.5853380360060933e-06, + "loss": 0.9082, + "step": 37682 + }, + { + "epoch": 0.97, + "learning_rate": 1.5853156008724532e-06, + "loss": 0.6533, + "step": 37683 + }, + { + "epoch": 0.97, + "learning_rate": 1.5852931652906636e-06, + "loss": 0.8013, + "step": 37684 + }, + { + "epoch": 0.97, + "learning_rate": 1.585270729260742e-06, + "loss": 0.8916, + "step": 37685 + }, + { + "epoch": 0.97, + "learning_rate": 1.5852482927827056e-06, + "loss": 0.748, + "step": 37686 + }, + { + "epoch": 0.97, + "learning_rate": 1.5852258558565716e-06, + "loss": 1.0273, + "step": 37687 + }, + { + "epoch": 0.97, + "learning_rate": 1.585203418482357e-06, + "loss": 0.7122, + "step": 37688 + }, + { + "epoch": 0.97, + "learning_rate": 1.5851809806600791e-06, + "loss": 0.8379, + "step": 37689 + }, + { + "epoch": 0.97, + "learning_rate": 1.585158542389755e-06, + "loss": 0.5376, + "step": 37690 + }, + { + "epoch": 0.97, + "learning_rate": 1.585136103671402e-06, + "loss": 0.8071, + "step": 37691 + }, + { + "epoch": 0.97, + "learning_rate": 1.585113664505037e-06, + "loss": 0.7505, + "step": 37692 + }, + { + "epoch": 0.97, + "learning_rate": 1.5850912248906774e-06, + "loss": 0.7769, + "step": 37693 + }, + { + "epoch": 0.97, + "learning_rate": 1.5850687848283405e-06, + "loss": 1.0928, + "step": 37694 + }, + { + "epoch": 0.97, + "learning_rate": 1.5850463443180433e-06, + "loss": 0.6582, + "step": 37695 + }, + { + "epoch": 0.97, + "learning_rate": 1.585023903359803e-06, + "loss": 0.8604, + "step": 37696 + }, + { + "epoch": 0.97, + "learning_rate": 1.5850014619536367e-06, + "loss": 0.9834, + "step": 37697 + }, + { + "epoch": 0.97, + "learning_rate": 1.5849790200995617e-06, + "loss": 0.6455, + "step": 37698 + }, + { + "epoch": 0.97, + "learning_rate": 1.5849565777975952e-06, + "loss": 0.5706, + "step": 37699 + }, + { + "epoch": 0.97, + "learning_rate": 1.5849341350477544e-06, + "loss": 0.8652, + "step": 37700 + }, + { + "epoch": 0.97, + "learning_rate": 1.5849116918500562e-06, + "loss": 1.0039, + "step": 37701 + }, + { + "epoch": 0.97, + "learning_rate": 1.5848892482045182e-06, + "loss": 0.8564, + "step": 37702 + }, + { + "epoch": 0.97, + "learning_rate": 1.5848668041111575e-06, + "loss": 0.9639, + "step": 37703 + }, + { + "epoch": 0.97, + "learning_rate": 1.5848443595699913e-06, + "loss": 0.7578, + "step": 37704 + }, + { + "epoch": 0.97, + "learning_rate": 1.5848219145810364e-06, + "loss": 0.9072, + "step": 37705 + }, + { + "epoch": 0.97, + "learning_rate": 1.58479946914431e-06, + "loss": 0.6245, + "step": 37706 + }, + { + "epoch": 0.97, + "learning_rate": 1.58477702325983e-06, + "loss": 0.8818, + "step": 37707 + }, + { + "epoch": 0.97, + "learning_rate": 1.584754576927613e-06, + "loss": 1.3623, + "step": 37708 + }, + { + "epoch": 0.97, + "learning_rate": 1.584732130147676e-06, + "loss": 0.9512, + "step": 37709 + }, + { + "epoch": 0.97, + "learning_rate": 1.5847096829200368e-06, + "loss": 0.9561, + "step": 37710 + }, + { + "epoch": 0.97, + "learning_rate": 1.5846872352447123e-06, + "loss": 0.7578, + "step": 37711 + }, + { + "epoch": 0.97, + "learning_rate": 1.5846647871217194e-06, + "loss": 0.8438, + "step": 37712 + }, + { + "epoch": 0.97, + "learning_rate": 1.5846423385510757e-06, + "loss": 0.9814, + "step": 37713 + }, + { + "epoch": 0.97, + "learning_rate": 1.5846198895327984e-06, + "loss": 0.8887, + "step": 37714 + }, + { + "epoch": 0.97, + "learning_rate": 1.5845974400669047e-06, + "loss": 0.8066, + "step": 37715 + }, + { + "epoch": 0.97, + "learning_rate": 1.5845749901534112e-06, + "loss": 0.7668, + "step": 37716 + }, + { + "epoch": 0.97, + "learning_rate": 1.5845525397923355e-06, + "loss": 0.7041, + "step": 37717 + }, + { + "epoch": 0.97, + "learning_rate": 1.584530088983695e-06, + "loss": 0.7969, + "step": 37718 + }, + { + "epoch": 0.97, + "learning_rate": 1.5845076377275065e-06, + "loss": 0.9956, + "step": 37719 + }, + { + "epoch": 0.97, + "learning_rate": 1.5844851860237877e-06, + "loss": 0.6997, + "step": 37720 + }, + { + "epoch": 0.97, + "learning_rate": 1.5844627338725554e-06, + "loss": 1.0693, + "step": 37721 + }, + { + "epoch": 0.97, + "learning_rate": 1.5844402812738266e-06, + "loss": 0.696, + "step": 37722 + }, + { + "epoch": 0.97, + "learning_rate": 1.584417828227619e-06, + "loss": 0.6357, + "step": 37723 + }, + { + "epoch": 0.97, + "learning_rate": 1.5843953747339494e-06, + "loss": 0.6619, + "step": 37724 + }, + { + "epoch": 0.97, + "learning_rate": 1.5843729207928354e-06, + "loss": 0.6421, + "step": 37725 + }, + { + "epoch": 0.97, + "learning_rate": 1.5843504664042934e-06, + "loss": 0.7197, + "step": 37726 + }, + { + "epoch": 0.97, + "learning_rate": 1.5843280115683414e-06, + "loss": 0.8242, + "step": 37727 + }, + { + "epoch": 0.97, + "learning_rate": 1.5843055562849964e-06, + "loss": 0.8965, + "step": 37728 + }, + { + "epoch": 0.97, + "learning_rate": 1.5842831005542756e-06, + "loss": 0.7617, + "step": 37729 + }, + { + "epoch": 0.97, + "learning_rate": 1.584260644376196e-06, + "loss": 0.6948, + "step": 37730 + }, + { + "epoch": 0.97, + "learning_rate": 1.5842381877507744e-06, + "loss": 0.7373, + "step": 37731 + }, + { + "epoch": 0.97, + "learning_rate": 1.584215730678029e-06, + "loss": 0.8193, + "step": 37732 + }, + { + "epoch": 0.97, + "learning_rate": 1.5841932731579766e-06, + "loss": 0.7383, + "step": 37733 + }, + { + "epoch": 0.97, + "learning_rate": 1.5841708151906338e-06, + "loss": 0.6143, + "step": 37734 + }, + { + "epoch": 0.97, + "learning_rate": 1.5841483567760186e-06, + "loss": 1.0527, + "step": 37735 + }, + { + "epoch": 0.97, + "learning_rate": 1.5841258979141476e-06, + "loss": 0.8682, + "step": 37736 + }, + { + "epoch": 0.97, + "learning_rate": 1.5841034386050388e-06, + "loss": 0.8711, + "step": 37737 + }, + { + "epoch": 0.97, + "learning_rate": 1.5840809788487082e-06, + "loss": 0.6533, + "step": 37738 + }, + { + "epoch": 0.97, + "learning_rate": 1.584058518645174e-06, + "loss": 0.8613, + "step": 37739 + }, + { + "epoch": 0.97, + "learning_rate": 1.584036057994453e-06, + "loss": 0.7617, + "step": 37740 + }, + { + "epoch": 0.97, + "learning_rate": 1.5840135968965625e-06, + "loss": 0.9277, + "step": 37741 + }, + { + "epoch": 0.97, + "learning_rate": 1.5839911353515194e-06, + "loss": 0.7744, + "step": 37742 + }, + { + "epoch": 0.97, + "learning_rate": 1.5839686733593414e-06, + "loss": 0.7197, + "step": 37743 + }, + { + "epoch": 0.97, + "learning_rate": 1.5839462109200454e-06, + "loss": 0.5415, + "step": 37744 + }, + { + "epoch": 0.97, + "learning_rate": 1.5839237480336488e-06, + "loss": 0.7324, + "step": 37745 + }, + { + "epoch": 0.97, + "learning_rate": 1.5839012847001682e-06, + "loss": 0.8535, + "step": 37746 + }, + { + "epoch": 0.97, + "learning_rate": 1.5838788209196214e-06, + "loss": 0.7874, + "step": 37747 + }, + { + "epoch": 0.97, + "learning_rate": 1.5838563566920256e-06, + "loss": 0.7998, + "step": 37748 + }, + { + "epoch": 0.97, + "learning_rate": 1.583833892017398e-06, + "loss": 0.9736, + "step": 37749 + }, + { + "epoch": 0.97, + "learning_rate": 1.583811426895755e-06, + "loss": 0.7832, + "step": 37750 + }, + { + "epoch": 0.97, + "learning_rate": 1.5837889613271149e-06, + "loss": 0.7776, + "step": 37751 + }, + { + "epoch": 0.97, + "learning_rate": 1.5837664953114941e-06, + "loss": 0.8955, + "step": 37752 + }, + { + "epoch": 0.97, + "learning_rate": 1.5837440288489106e-06, + "loss": 0.7344, + "step": 37753 + }, + { + "epoch": 0.97, + "learning_rate": 1.5837215619393809e-06, + "loss": 0.6343, + "step": 37754 + }, + { + "epoch": 0.97, + "learning_rate": 1.5836990945829224e-06, + "loss": 0.9482, + "step": 37755 + }, + { + "epoch": 0.97, + "learning_rate": 1.5836766267795523e-06, + "loss": 0.813, + "step": 37756 + }, + { + "epoch": 0.97, + "learning_rate": 1.583654158529288e-06, + "loss": 0.73, + "step": 37757 + }, + { + "epoch": 0.97, + "learning_rate": 1.5836316898321464e-06, + "loss": 0.9824, + "step": 37758 + }, + { + "epoch": 0.97, + "learning_rate": 1.583609220688145e-06, + "loss": 0.8228, + "step": 37759 + }, + { + "epoch": 0.97, + "learning_rate": 1.5835867510973009e-06, + "loss": 0.7246, + "step": 37760 + }, + { + "epoch": 0.97, + "learning_rate": 1.583564281059631e-06, + "loss": 0.7568, + "step": 37761 + }, + { + "epoch": 0.97, + "learning_rate": 1.583541810575153e-06, + "loss": 0.8057, + "step": 37762 + }, + { + "epoch": 0.97, + "learning_rate": 1.5835193396438837e-06, + "loss": 1.0527, + "step": 37763 + }, + { + "epoch": 0.97, + "learning_rate": 1.5834968682658407e-06, + "loss": 1.0645, + "step": 37764 + }, + { + "epoch": 0.97, + "learning_rate": 1.5834743964410408e-06, + "loss": 0.8101, + "step": 37765 + }, + { + "epoch": 0.97, + "learning_rate": 1.5834519241695015e-06, + "loss": 0.5063, + "step": 37766 + }, + { + "epoch": 0.97, + "learning_rate": 1.5834294514512396e-06, + "loss": 0.8848, + "step": 37767 + }, + { + "epoch": 0.97, + "learning_rate": 1.5834069782862728e-06, + "loss": 0.7949, + "step": 37768 + }, + { + "epoch": 0.97, + "learning_rate": 1.5833845046746184e-06, + "loss": 0.9453, + "step": 37769 + }, + { + "epoch": 0.97, + "learning_rate": 1.583362030616293e-06, + "loss": 0.7715, + "step": 37770 + }, + { + "epoch": 0.97, + "learning_rate": 1.583339556111314e-06, + "loss": 0.8867, + "step": 37771 + }, + { + "epoch": 0.97, + "learning_rate": 1.583317081159699e-06, + "loss": 0.8652, + "step": 37772 + }, + { + "epoch": 0.97, + "learning_rate": 1.5832946057614644e-06, + "loss": 0.8291, + "step": 37773 + }, + { + "epoch": 0.97, + "learning_rate": 1.5832721299166285e-06, + "loss": 1.0166, + "step": 37774 + }, + { + "epoch": 0.97, + "learning_rate": 1.5832496536252079e-06, + "loss": 1.1689, + "step": 37775 + }, + { + "epoch": 0.97, + "learning_rate": 1.5832271768872196e-06, + "loss": 0.8594, + "step": 37776 + }, + { + "epoch": 0.97, + "learning_rate": 1.5832046997026813e-06, + "loss": 0.6323, + "step": 37777 + }, + { + "epoch": 0.97, + "learning_rate": 1.5831822220716097e-06, + "loss": 0.959, + "step": 37778 + }, + { + "epoch": 0.97, + "learning_rate": 1.5831597439940225e-06, + "loss": 0.6938, + "step": 37779 + }, + { + "epoch": 0.97, + "learning_rate": 1.583137265469937e-06, + "loss": 0.9619, + "step": 37780 + }, + { + "epoch": 0.97, + "learning_rate": 1.5831147864993697e-06, + "loss": 1.0283, + "step": 37781 + }, + { + "epoch": 0.97, + "learning_rate": 1.583092307082338e-06, + "loss": 0.7764, + "step": 37782 + }, + { + "epoch": 0.97, + "learning_rate": 1.5830698272188596e-06, + "loss": 0.8003, + "step": 37783 + }, + { + "epoch": 0.97, + "learning_rate": 1.5830473469089518e-06, + "loss": 0.7373, + "step": 37784 + }, + { + "epoch": 0.97, + "learning_rate": 1.5830248661526308e-06, + "loss": 0.7861, + "step": 37785 + }, + { + "epoch": 0.97, + "learning_rate": 1.583002384949915e-06, + "loss": 0.9023, + "step": 37786 + }, + { + "epoch": 0.97, + "learning_rate": 1.582979903300821e-06, + "loss": 0.8887, + "step": 37787 + }, + { + "epoch": 0.97, + "learning_rate": 1.5829574212053658e-06, + "loss": 0.5959, + "step": 37788 + }, + { + "epoch": 0.97, + "learning_rate": 1.5829349386635671e-06, + "loss": 0.8467, + "step": 37789 + }, + { + "epoch": 0.97, + "learning_rate": 1.5829124556754422e-06, + "loss": 0.8018, + "step": 37790 + }, + { + "epoch": 0.97, + "learning_rate": 1.5828899722410073e-06, + "loss": 0.7969, + "step": 37791 + }, + { + "epoch": 0.97, + "learning_rate": 1.5828674883602807e-06, + "loss": 0.792, + "step": 37792 + }, + { + "epoch": 0.97, + "learning_rate": 1.5828450040332796e-06, + "loss": 0.8096, + "step": 37793 + }, + { + "epoch": 0.97, + "learning_rate": 1.5828225192600209e-06, + "loss": 0.791, + "step": 37794 + }, + { + "epoch": 0.97, + "learning_rate": 1.5828000340405212e-06, + "loss": 0.7808, + "step": 37795 + }, + { + "epoch": 0.97, + "learning_rate": 1.5827775483747987e-06, + "loss": 0.8613, + "step": 37796 + }, + { + "epoch": 0.97, + "learning_rate": 1.58275506226287e-06, + "loss": 1.0361, + "step": 37797 + }, + { + "epoch": 0.97, + "learning_rate": 1.5827325757047528e-06, + "loss": 0.7891, + "step": 37798 + }, + { + "epoch": 0.97, + "learning_rate": 1.5827100887004641e-06, + "loss": 0.5698, + "step": 37799 + }, + { + "epoch": 0.97, + "learning_rate": 1.5826876012500208e-06, + "loss": 0.79, + "step": 37800 + }, + { + "epoch": 0.97, + "learning_rate": 1.5826651133534407e-06, + "loss": 0.7637, + "step": 37801 + }, + { + "epoch": 0.97, + "learning_rate": 1.5826426250107402e-06, + "loss": 0.5571, + "step": 37802 + }, + { + "epoch": 0.97, + "learning_rate": 1.5826201362219375e-06, + "loss": 0.7861, + "step": 37803 + }, + { + "epoch": 0.97, + "learning_rate": 1.5825976469870494e-06, + "loss": 0.7065, + "step": 37804 + }, + { + "epoch": 0.97, + "learning_rate": 1.582575157306093e-06, + "loss": 0.7666, + "step": 37805 + }, + { + "epoch": 0.97, + "learning_rate": 1.5825526671790855e-06, + "loss": 0.998, + "step": 37806 + }, + { + "epoch": 0.97, + "learning_rate": 1.5825301766060441e-06, + "loss": 0.6924, + "step": 37807 + }, + { + "epoch": 0.97, + "learning_rate": 1.5825076855869863e-06, + "loss": 0.8682, + "step": 37808 + }, + { + "epoch": 0.97, + "learning_rate": 1.5824851941219293e-06, + "loss": 0.538, + "step": 37809 + }, + { + "epoch": 0.97, + "learning_rate": 1.58246270221089e-06, + "loss": 0.561, + "step": 37810 + }, + { + "epoch": 0.97, + "learning_rate": 1.5824402098538856e-06, + "loss": 0.7432, + "step": 37811 + }, + { + "epoch": 0.97, + "learning_rate": 1.5824177170509337e-06, + "loss": 0.6426, + "step": 37812 + }, + { + "epoch": 0.97, + "learning_rate": 1.5823952238020513e-06, + "loss": 0.6997, + "step": 37813 + }, + { + "epoch": 0.97, + "learning_rate": 1.5823727301072558e-06, + "loss": 0.8438, + "step": 37814 + }, + { + "epoch": 0.97, + "learning_rate": 1.582350235966564e-06, + "loss": 0.9102, + "step": 37815 + }, + { + "epoch": 0.97, + "learning_rate": 1.5823277413799936e-06, + "loss": 0.9199, + "step": 37816 + }, + { + "epoch": 0.97, + "learning_rate": 1.5823052463475614e-06, + "loss": 0.8779, + "step": 37817 + }, + { + "epoch": 0.97, + "learning_rate": 1.5822827508692851e-06, + "loss": 0.8662, + "step": 37818 + }, + { + "epoch": 0.97, + "learning_rate": 1.5822602549451815e-06, + "loss": 0.7197, + "step": 37819 + }, + { + "epoch": 0.97, + "learning_rate": 1.582237758575268e-06, + "loss": 0.9209, + "step": 37820 + }, + { + "epoch": 0.97, + "learning_rate": 1.582215261759562e-06, + "loss": 0.9141, + "step": 37821 + }, + { + "epoch": 0.97, + "learning_rate": 1.5821927644980804e-06, + "loss": 0.8755, + "step": 37822 + }, + { + "epoch": 0.97, + "learning_rate": 1.5821702667908406e-06, + "loss": 0.8379, + "step": 37823 + }, + { + "epoch": 0.97, + "learning_rate": 1.58214776863786e-06, + "loss": 0.8086, + "step": 37824 + }, + { + "epoch": 0.97, + "learning_rate": 1.5821252700391554e-06, + "loss": 0.7812, + "step": 37825 + }, + { + "epoch": 0.97, + "learning_rate": 1.5821027709947442e-06, + "loss": 0.7251, + "step": 37826 + }, + { + "epoch": 0.97, + "learning_rate": 1.5820802715046438e-06, + "loss": 0.8062, + "step": 37827 + }, + { + "epoch": 0.97, + "learning_rate": 1.5820577715688712e-06, + "loss": 0.7471, + "step": 37828 + }, + { + "epoch": 0.97, + "learning_rate": 1.582035271187444e-06, + "loss": 0.7783, + "step": 37829 + }, + { + "epoch": 0.97, + "learning_rate": 1.5820127703603786e-06, + "loss": 0.7295, + "step": 37830 + }, + { + "epoch": 0.97, + "learning_rate": 1.5819902690876931e-06, + "loss": 0.877, + "step": 37831 + }, + { + "epoch": 0.97, + "learning_rate": 1.5819677673694045e-06, + "loss": 0.7363, + "step": 37832 + }, + { + "epoch": 0.97, + "learning_rate": 1.58194526520553e-06, + "loss": 0.9756, + "step": 37833 + }, + { + "epoch": 0.97, + "learning_rate": 1.5819227625960868e-06, + "loss": 0.9648, + "step": 37834 + }, + { + "epoch": 0.97, + "learning_rate": 1.5819002595410917e-06, + "loss": 0.8911, + "step": 37835 + }, + { + "epoch": 0.97, + "learning_rate": 1.5818777560405628e-06, + "loss": 0.688, + "step": 37836 + }, + { + "epoch": 0.97, + "learning_rate": 1.5818552520945165e-06, + "loss": 0.9609, + "step": 37837 + }, + { + "epoch": 0.97, + "learning_rate": 1.5818327477029706e-06, + "loss": 0.9854, + "step": 37838 + }, + { + "epoch": 0.97, + "learning_rate": 1.5818102428659418e-06, + "loss": 0.8848, + "step": 37839 + }, + { + "epoch": 0.97, + "learning_rate": 1.581787737583448e-06, + "loss": 1.0439, + "step": 37840 + }, + { + "epoch": 0.97, + "learning_rate": 1.581765231855506e-06, + "loss": 1.4229, + "step": 37841 + }, + { + "epoch": 0.97, + "learning_rate": 1.5817427256821331e-06, + "loss": 1.1377, + "step": 37842 + }, + { + "epoch": 0.97, + "learning_rate": 1.5817202190633462e-06, + "loss": 0.9199, + "step": 37843 + }, + { + "epoch": 0.97, + "learning_rate": 1.5816977119991635e-06, + "loss": 0.8936, + "step": 37844 + }, + { + "epoch": 0.97, + "learning_rate": 1.5816752044896014e-06, + "loss": 0.8975, + "step": 37845 + }, + { + "epoch": 0.97, + "learning_rate": 1.581652696534677e-06, + "loss": 0.6406, + "step": 37846 + }, + { + "epoch": 0.97, + "learning_rate": 1.581630188134408e-06, + "loss": 0.9502, + "step": 37847 + }, + { + "epoch": 0.97, + "learning_rate": 1.5816076792888118e-06, + "loss": 0.9492, + "step": 37848 + }, + { + "epoch": 0.97, + "learning_rate": 1.5815851699979055e-06, + "loss": 0.707, + "step": 37849 + }, + { + "epoch": 0.97, + "learning_rate": 1.5815626602617055e-06, + "loss": 0.7175, + "step": 37850 + }, + { + "epoch": 0.97, + "learning_rate": 1.58154015008023e-06, + "loss": 0.563, + "step": 37851 + }, + { + "epoch": 0.97, + "learning_rate": 1.581517639453496e-06, + "loss": 1.1787, + "step": 37852 + }, + { + "epoch": 0.97, + "learning_rate": 1.5814951283815207e-06, + "loss": 0.7109, + "step": 37853 + }, + { + "epoch": 0.97, + "learning_rate": 1.5814726168643215e-06, + "loss": 0.9106, + "step": 37854 + }, + { + "epoch": 0.97, + "learning_rate": 1.5814501049019153e-06, + "loss": 0.7896, + "step": 37855 + }, + { + "epoch": 0.97, + "learning_rate": 1.5814275924943195e-06, + "loss": 0.6836, + "step": 37856 + }, + { + "epoch": 0.97, + "learning_rate": 1.5814050796415511e-06, + "loss": 0.9277, + "step": 37857 + }, + { + "epoch": 0.97, + "learning_rate": 1.5813825663436278e-06, + "loss": 0.8887, + "step": 37858 + }, + { + "epoch": 0.97, + "learning_rate": 1.5813600526005666e-06, + "loss": 0.5684, + "step": 37859 + }, + { + "epoch": 0.97, + "learning_rate": 1.5813375384123848e-06, + "loss": 0.9287, + "step": 37860 + }, + { + "epoch": 0.97, + "learning_rate": 1.5813150237790996e-06, + "loss": 0.9443, + "step": 37861 + }, + { + "epoch": 0.97, + "learning_rate": 1.5812925087007278e-06, + "loss": 0.9111, + "step": 37862 + }, + { + "epoch": 0.97, + "learning_rate": 1.5812699931772873e-06, + "loss": 0.8291, + "step": 37863 + }, + { + "epoch": 0.97, + "learning_rate": 1.5812474772087953e-06, + "loss": 0.8838, + "step": 37864 + }, + { + "epoch": 0.97, + "learning_rate": 1.5812249607952686e-06, + "loss": 1.0664, + "step": 37865 + }, + { + "epoch": 0.97, + "learning_rate": 1.5812024439367247e-06, + "loss": 0.8496, + "step": 37866 + }, + { + "epoch": 0.97, + "learning_rate": 1.5811799266331809e-06, + "loss": 0.792, + "step": 37867 + }, + { + "epoch": 0.97, + "learning_rate": 1.5811574088846542e-06, + "loss": 0.8838, + "step": 37868 + }, + { + "epoch": 0.97, + "learning_rate": 1.581134890691162e-06, + "loss": 0.9717, + "step": 37869 + }, + { + "epoch": 0.97, + "learning_rate": 1.581112372052722e-06, + "loss": 0.8818, + "step": 37870 + }, + { + "epoch": 0.97, + "learning_rate": 1.5810898529693505e-06, + "loss": 0.9707, + "step": 37871 + }, + { + "epoch": 0.97, + "learning_rate": 1.581067333441065e-06, + "loss": 1.0225, + "step": 37872 + }, + { + "epoch": 0.97, + "learning_rate": 1.5810448134678834e-06, + "loss": 0.8359, + "step": 37873 + }, + { + "epoch": 0.97, + "learning_rate": 1.5810222930498225e-06, + "loss": 0.8369, + "step": 37874 + }, + { + "epoch": 0.97, + "learning_rate": 1.5809997721868995e-06, + "loss": 0.8008, + "step": 37875 + }, + { + "epoch": 0.97, + "learning_rate": 1.5809772508791315e-06, + "loss": 0.8623, + "step": 37876 + }, + { + "epoch": 0.97, + "learning_rate": 1.5809547291265361e-06, + "loss": 0.7422, + "step": 37877 + }, + { + "epoch": 0.97, + "learning_rate": 1.5809322069291305e-06, + "loss": 0.7441, + "step": 37878 + }, + { + "epoch": 0.97, + "learning_rate": 1.5809096842869315e-06, + "loss": 0.7124, + "step": 37879 + }, + { + "epoch": 0.97, + "learning_rate": 1.580887161199957e-06, + "loss": 0.8076, + "step": 37880 + }, + { + "epoch": 0.97, + "learning_rate": 1.5808646376682236e-06, + "loss": 0.7542, + "step": 37881 + }, + { + "epoch": 0.97, + "learning_rate": 1.5808421136917489e-06, + "loss": 0.8271, + "step": 37882 + }, + { + "epoch": 0.97, + "learning_rate": 1.5808195892705504e-06, + "loss": 0.9395, + "step": 37883 + }, + { + "epoch": 0.97, + "learning_rate": 1.580797064404645e-06, + "loss": 0.8013, + "step": 37884 + }, + { + "epoch": 0.97, + "learning_rate": 1.5807745390940497e-06, + "loss": 1.1436, + "step": 37885 + }, + { + "epoch": 0.97, + "learning_rate": 1.580752013338782e-06, + "loss": 0.9258, + "step": 37886 + }, + { + "epoch": 0.97, + "learning_rate": 1.5807294871388595e-06, + "loss": 0.8335, + "step": 37887 + }, + { + "epoch": 0.97, + "learning_rate": 1.5807069604942988e-06, + "loss": 0.8203, + "step": 37888 + }, + { + "epoch": 0.97, + "learning_rate": 1.5806844334051178e-06, + "loss": 1.0723, + "step": 37889 + }, + { + "epoch": 0.97, + "learning_rate": 1.5806619058713332e-06, + "loss": 0.7812, + "step": 37890 + }, + { + "epoch": 0.97, + "learning_rate": 1.5806393778929628e-06, + "loss": 0.8301, + "step": 37891 + }, + { + "epoch": 0.97, + "learning_rate": 1.5806168494700232e-06, + "loss": 0.6631, + "step": 37892 + }, + { + "epoch": 0.97, + "learning_rate": 1.5805943206025321e-06, + "loss": 0.9375, + "step": 37893 + }, + { + "epoch": 0.97, + "learning_rate": 1.5805717912905067e-06, + "loss": 0.5706, + "step": 37894 + }, + { + "epoch": 0.97, + "learning_rate": 1.5805492615339639e-06, + "loss": 0.6938, + "step": 37895 + }, + { + "epoch": 0.97, + "learning_rate": 1.5805267313329217e-06, + "loss": 0.9814, + "step": 37896 + }, + { + "epoch": 0.97, + "learning_rate": 1.5805042006873964e-06, + "loss": 1.0332, + "step": 37897 + }, + { + "epoch": 0.97, + "learning_rate": 1.5804816695974056e-06, + "loss": 0.6846, + "step": 37898 + }, + { + "epoch": 0.97, + "learning_rate": 1.5804591380629675e-06, + "loss": 0.7009, + "step": 37899 + }, + { + "epoch": 0.97, + "learning_rate": 1.5804366060840976e-06, + "loss": 0.7549, + "step": 37900 + }, + { + "epoch": 0.97, + "learning_rate": 1.5804140736608147e-06, + "loss": 0.9365, + "step": 37901 + }, + { + "epoch": 0.97, + "learning_rate": 1.5803915407931351e-06, + "loss": 0.8057, + "step": 37902 + }, + { + "epoch": 0.97, + "learning_rate": 1.5803690074810767e-06, + "loss": 0.6455, + "step": 37903 + }, + { + "epoch": 0.97, + "learning_rate": 1.5803464737246564e-06, + "loss": 0.8301, + "step": 37904 + }, + { + "epoch": 0.97, + "learning_rate": 1.5803239395238912e-06, + "loss": 0.7979, + "step": 37905 + }, + { + "epoch": 0.97, + "learning_rate": 1.5803014048787987e-06, + "loss": 0.4968, + "step": 37906 + }, + { + "epoch": 0.97, + "learning_rate": 1.5802788697893962e-06, + "loss": 0.6704, + "step": 37907 + }, + { + "epoch": 0.97, + "learning_rate": 1.5802563342557008e-06, + "loss": 0.7158, + "step": 37908 + }, + { + "epoch": 0.97, + "learning_rate": 1.58023379827773e-06, + "loss": 0.7173, + "step": 37909 + }, + { + "epoch": 0.97, + "learning_rate": 1.5802112618555005e-06, + "loss": 0.835, + "step": 37910 + }, + { + "epoch": 0.97, + "learning_rate": 1.5801887249890303e-06, + "loss": 1.1035, + "step": 37911 + }, + { + "epoch": 0.97, + "learning_rate": 1.5801661876783362e-06, + "loss": 0.7578, + "step": 37912 + }, + { + "epoch": 0.97, + "learning_rate": 1.580143649923435e-06, + "loss": 1.0156, + "step": 37913 + }, + { + "epoch": 0.97, + "learning_rate": 1.5801211117243453e-06, + "loss": 0.8916, + "step": 37914 + }, + { + "epoch": 0.97, + "learning_rate": 1.580098573081083e-06, + "loss": 0.9434, + "step": 37915 + }, + { + "epoch": 0.97, + "learning_rate": 1.5800760339936661e-06, + "loss": 0.9668, + "step": 37916 + }, + { + "epoch": 0.97, + "learning_rate": 1.5800534944621115e-06, + "loss": 0.8447, + "step": 37917 + }, + { + "epoch": 0.97, + "learning_rate": 1.5800309544864366e-06, + "loss": 0.7373, + "step": 37918 + }, + { + "epoch": 0.97, + "learning_rate": 1.5800084140666589e-06, + "loss": 0.8154, + "step": 37919 + }, + { + "epoch": 0.97, + "learning_rate": 1.5799858732027952e-06, + "loss": 0.9238, + "step": 37920 + }, + { + "epoch": 0.97, + "learning_rate": 1.5799633318948632e-06, + "loss": 0.7407, + "step": 37921 + }, + { + "epoch": 0.97, + "learning_rate": 1.5799407901428797e-06, + "loss": 0.8848, + "step": 37922 + }, + { + "epoch": 0.97, + "learning_rate": 1.5799182479468623e-06, + "loss": 0.7485, + "step": 37923 + }, + { + "epoch": 0.97, + "learning_rate": 1.5798957053068285e-06, + "loss": 0.8428, + "step": 37924 + }, + { + "epoch": 0.97, + "learning_rate": 1.5798731622227948e-06, + "loss": 0.8506, + "step": 37925 + }, + { + "epoch": 0.97, + "learning_rate": 1.579850618694779e-06, + "loss": 0.9062, + "step": 37926 + }, + { + "epoch": 0.97, + "learning_rate": 1.579828074722798e-06, + "loss": 0.7759, + "step": 37927 + }, + { + "epoch": 0.97, + "learning_rate": 1.5798055303068695e-06, + "loss": 1.1309, + "step": 37928 + }, + { + "epoch": 0.97, + "learning_rate": 1.5797829854470107e-06, + "loss": 0.8906, + "step": 37929 + }, + { + "epoch": 0.97, + "learning_rate": 1.5797604401432387e-06, + "loss": 0.9014, + "step": 37930 + }, + { + "epoch": 0.97, + "learning_rate": 1.5797378943955707e-06, + "loss": 0.6875, + "step": 37931 + }, + { + "epoch": 0.97, + "learning_rate": 1.579715348204024e-06, + "loss": 0.8574, + "step": 37932 + }, + { + "epoch": 0.97, + "learning_rate": 1.5796928015686159e-06, + "loss": 0.8848, + "step": 37933 + }, + { + "epoch": 0.97, + "learning_rate": 1.579670254489364e-06, + "loss": 0.8682, + "step": 37934 + }, + { + "epoch": 0.97, + "learning_rate": 1.579647706966285e-06, + "loss": 0.5796, + "step": 37935 + }, + { + "epoch": 0.97, + "learning_rate": 1.5796251589993963e-06, + "loss": 0.959, + "step": 37936 + }, + { + "epoch": 0.97, + "learning_rate": 1.5796026105887155e-06, + "loss": 0.7072, + "step": 37937 + }, + { + "epoch": 0.97, + "learning_rate": 1.5795800617342595e-06, + "loss": 0.7129, + "step": 37938 + }, + { + "epoch": 0.97, + "learning_rate": 1.5795575124360457e-06, + "loss": 0.7852, + "step": 37939 + }, + { + "epoch": 0.97, + "learning_rate": 1.5795349626940913e-06, + "loss": 0.9336, + "step": 37940 + }, + { + "epoch": 0.97, + "learning_rate": 1.5795124125084137e-06, + "loss": 0.7502, + "step": 37941 + }, + { + "epoch": 0.97, + "learning_rate": 1.57948986187903e-06, + "loss": 0.917, + "step": 37942 + }, + { + "epoch": 0.97, + "learning_rate": 1.5794673108059574e-06, + "loss": 0.9375, + "step": 37943 + }, + { + "epoch": 0.97, + "learning_rate": 1.579444759289214e-06, + "loss": 1.0684, + "step": 37944 + }, + { + "epoch": 0.97, + "learning_rate": 1.579422207328816e-06, + "loss": 0.7197, + "step": 37945 + }, + { + "epoch": 0.97, + "learning_rate": 1.579399654924781e-06, + "loss": 0.9473, + "step": 37946 + }, + { + "epoch": 0.97, + "learning_rate": 1.5793771020771262e-06, + "loss": 0.7568, + "step": 37947 + }, + { + "epoch": 0.97, + "learning_rate": 1.579354548785869e-06, + "loss": 0.6597, + "step": 37948 + }, + { + "epoch": 0.97, + "learning_rate": 1.5793319950510271e-06, + "loss": 0.7646, + "step": 37949 + }, + { + "epoch": 0.97, + "learning_rate": 1.579309440872617e-06, + "loss": 0.7334, + "step": 37950 + }, + { + "epoch": 0.97, + "learning_rate": 1.579286886250656e-06, + "loss": 0.4927, + "step": 37951 + }, + { + "epoch": 0.97, + "learning_rate": 1.5792643311851622e-06, + "loss": 0.9297, + "step": 37952 + }, + { + "epoch": 0.97, + "learning_rate": 1.5792417756761522e-06, + "loss": 0.9473, + "step": 37953 + }, + { + "epoch": 0.97, + "learning_rate": 1.5792192197236433e-06, + "loss": 0.7397, + "step": 37954 + }, + { + "epoch": 0.97, + "learning_rate": 1.5791966633276528e-06, + "loss": 0.7949, + "step": 37955 + }, + { + "epoch": 0.97, + "learning_rate": 1.5791741064881982e-06, + "loss": 0.7393, + "step": 37956 + }, + { + "epoch": 0.97, + "learning_rate": 1.5791515492052966e-06, + "loss": 0.4741, + "step": 37957 + }, + { + "epoch": 0.97, + "learning_rate": 1.5791289914789654e-06, + "loss": 0.6208, + "step": 37958 + }, + { + "epoch": 0.97, + "learning_rate": 1.5791064333092216e-06, + "loss": 0.7568, + "step": 37959 + }, + { + "epoch": 0.97, + "learning_rate": 1.5790838746960826e-06, + "loss": 0.6938, + "step": 37960 + }, + { + "epoch": 0.97, + "learning_rate": 1.5790613156395658e-06, + "loss": 0.7344, + "step": 37961 + }, + { + "epoch": 0.97, + "learning_rate": 1.5790387561396883e-06, + "loss": 0.8616, + "step": 37962 + }, + { + "epoch": 0.97, + "learning_rate": 1.5790161961964677e-06, + "loss": 0.7607, + "step": 37963 + }, + { + "epoch": 0.97, + "learning_rate": 1.5789936358099208e-06, + "loss": 0.748, + "step": 37964 + }, + { + "epoch": 0.97, + "learning_rate": 1.578971074980065e-06, + "loss": 0.9043, + "step": 37965 + }, + { + "epoch": 0.97, + "learning_rate": 1.5789485137069178e-06, + "loss": 0.6482, + "step": 37966 + }, + { + "epoch": 0.97, + "learning_rate": 1.578925951990496e-06, + "loss": 0.604, + "step": 37967 + }, + { + "epoch": 0.97, + "learning_rate": 1.5789033898308177e-06, + "loss": 0.8691, + "step": 37968 + }, + { + "epoch": 0.97, + "learning_rate": 1.5788808272278998e-06, + "loss": 0.8228, + "step": 37969 + }, + { + "epoch": 0.97, + "learning_rate": 1.578858264181759e-06, + "loss": 0.8467, + "step": 37970 + }, + { + "epoch": 0.97, + "learning_rate": 1.5788357006924132e-06, + "loss": 0.7686, + "step": 37971 + }, + { + "epoch": 0.97, + "learning_rate": 1.5788131367598796e-06, + "loss": 0.8662, + "step": 37972 + }, + { + "epoch": 0.97, + "learning_rate": 1.5787905723841755e-06, + "loss": 0.8408, + "step": 37973 + }, + { + "epoch": 0.97, + "learning_rate": 1.5787680075653177e-06, + "loss": 0.7524, + "step": 37974 + }, + { + "epoch": 0.97, + "learning_rate": 1.578745442303324e-06, + "loss": 0.877, + "step": 37975 + }, + { + "epoch": 0.97, + "learning_rate": 1.578722876598212e-06, + "loss": 0.8535, + "step": 37976 + }, + { + "epoch": 0.97, + "learning_rate": 1.578700310449998e-06, + "loss": 0.8623, + "step": 37977 + }, + { + "epoch": 0.97, + "learning_rate": 1.5786777438586998e-06, + "loss": 0.7051, + "step": 37978 + }, + { + "epoch": 0.97, + "learning_rate": 1.5786551768243348e-06, + "loss": 1.1504, + "step": 37979 + }, + { + "epoch": 0.97, + "learning_rate": 1.5786326093469202e-06, + "loss": 0.7715, + "step": 37980 + }, + { + "epoch": 0.97, + "learning_rate": 1.578610041426473e-06, + "loss": 0.9707, + "step": 37981 + }, + { + "epoch": 0.97, + "learning_rate": 1.5785874730630106e-06, + "loss": 0.957, + "step": 37982 + }, + { + "epoch": 0.97, + "learning_rate": 1.578564904256551e-06, + "loss": 0.9785, + "step": 37983 + }, + { + "epoch": 0.97, + "learning_rate": 1.5785423350071104e-06, + "loss": 0.623, + "step": 37984 + }, + { + "epoch": 0.97, + "learning_rate": 1.5785197653147064e-06, + "loss": 1.0781, + "step": 37985 + }, + { + "epoch": 0.97, + "learning_rate": 1.5784971951793566e-06, + "loss": 0.7056, + "step": 37986 + }, + { + "epoch": 0.97, + "learning_rate": 1.5784746246010782e-06, + "loss": 0.6624, + "step": 37987 + }, + { + "epoch": 0.97, + "learning_rate": 1.5784520535798881e-06, + "loss": 0.8916, + "step": 37988 + }, + { + "epoch": 0.97, + "learning_rate": 1.5784294821158042e-06, + "loss": 1.0273, + "step": 37989 + }, + { + "epoch": 0.97, + "learning_rate": 1.578406910208843e-06, + "loss": 1.0645, + "step": 37990 + }, + { + "epoch": 0.97, + "learning_rate": 1.5783843378590227e-06, + "loss": 0.8184, + "step": 37991 + }, + { + "epoch": 0.97, + "learning_rate": 1.5783617650663596e-06, + "loss": 0.8945, + "step": 37992 + }, + { + "epoch": 0.97, + "learning_rate": 1.5783391918308722e-06, + "loss": 0.4985, + "step": 37993 + }, + { + "epoch": 0.97, + "learning_rate": 1.5783166181525766e-06, + "loss": 0.9199, + "step": 37994 + }, + { + "epoch": 0.97, + "learning_rate": 1.5782940440314906e-06, + "loss": 0.7754, + "step": 37995 + }, + { + "epoch": 0.97, + "learning_rate": 1.5782714694676314e-06, + "loss": 1.1816, + "step": 37996 + }, + { + "epoch": 0.97, + "learning_rate": 1.5782488944610164e-06, + "loss": 0.7202, + "step": 37997 + }, + { + "epoch": 0.97, + "learning_rate": 1.5782263190116626e-06, + "loss": 0.9785, + "step": 37998 + }, + { + "epoch": 0.97, + "learning_rate": 1.5782037431195878e-06, + "loss": 0.7593, + "step": 37999 + }, + { + "epoch": 0.97, + "learning_rate": 1.578181166784809e-06, + "loss": 1.0527, + "step": 38000 + }, + { + "epoch": 0.97, + "learning_rate": 1.5781585900073433e-06, + "loss": 0.7051, + "step": 38001 + }, + { + "epoch": 0.97, + "learning_rate": 1.5781360127872082e-06, + "loss": 0.9062, + "step": 38002 + }, + { + "epoch": 0.97, + "learning_rate": 1.578113435124421e-06, + "loss": 0.8184, + "step": 38003 + }, + { + "epoch": 0.97, + "learning_rate": 1.578090857018999e-06, + "loss": 0.8645, + "step": 38004 + }, + { + "epoch": 0.97, + "learning_rate": 1.578068278470959e-06, + "loss": 0.8647, + "step": 38005 + }, + { + "epoch": 0.97, + "learning_rate": 1.5780456994803188e-06, + "loss": 0.9307, + "step": 38006 + }, + { + "epoch": 0.97, + "learning_rate": 1.5780231200470959e-06, + "loss": 0.7871, + "step": 38007 + }, + { + "epoch": 0.97, + "learning_rate": 1.5780005401713076e-06, + "loss": 0.9639, + "step": 38008 + }, + { + "epoch": 0.97, + "learning_rate": 1.5779779598529702e-06, + "loss": 0.8291, + "step": 38009 + }, + { + "epoch": 0.97, + "learning_rate": 1.577955379092102e-06, + "loss": 0.9697, + "step": 38010 + }, + { + "epoch": 0.97, + "learning_rate": 1.5779327978887195e-06, + "loss": 0.7549, + "step": 38011 + }, + { + "epoch": 0.97, + "learning_rate": 1.5779102162428405e-06, + "loss": 0.874, + "step": 38012 + }, + { + "epoch": 0.97, + "learning_rate": 1.5778876341544827e-06, + "loss": 0.634, + "step": 38013 + }, + { + "epoch": 0.97, + "learning_rate": 1.5778650516236627e-06, + "loss": 0.5605, + "step": 38014 + }, + { + "epoch": 0.97, + "learning_rate": 1.577842468650398e-06, + "loss": 0.8887, + "step": 38015 + }, + { + "epoch": 0.97, + "learning_rate": 1.5778198852347058e-06, + "loss": 0.9189, + "step": 38016 + }, + { + "epoch": 0.97, + "learning_rate": 1.5777973013766036e-06, + "loss": 0.8311, + "step": 38017 + }, + { + "epoch": 0.97, + "learning_rate": 1.5777747170761085e-06, + "loss": 0.7134, + "step": 38018 + }, + { + "epoch": 0.97, + "learning_rate": 1.5777521323332378e-06, + "loss": 0.9004, + "step": 38019 + }, + { + "epoch": 0.97, + "learning_rate": 1.5777295471480087e-06, + "loss": 0.6577, + "step": 38020 + }, + { + "epoch": 0.97, + "learning_rate": 1.577706961520439e-06, + "loss": 0.9854, + "step": 38021 + }, + { + "epoch": 0.97, + "learning_rate": 1.5776843754505454e-06, + "loss": 0.7275, + "step": 38022 + }, + { + "epoch": 0.97, + "learning_rate": 1.5776617889383457e-06, + "loss": 0.6338, + "step": 38023 + }, + { + "epoch": 0.97, + "learning_rate": 1.5776392019838567e-06, + "loss": 0.9316, + "step": 38024 + }, + { + "epoch": 0.97, + "learning_rate": 1.5776166145870962e-06, + "loss": 0.7637, + "step": 38025 + }, + { + "epoch": 0.97, + "learning_rate": 1.577594026748081e-06, + "loss": 0.8369, + "step": 38026 + }, + { + "epoch": 0.97, + "learning_rate": 1.5775714384668283e-06, + "loss": 0.9824, + "step": 38027 + }, + { + "epoch": 0.97, + "learning_rate": 1.5775488497433563e-06, + "loss": 0.6836, + "step": 38028 + }, + { + "epoch": 0.97, + "learning_rate": 1.5775262605776815e-06, + "loss": 0.9824, + "step": 38029 + }, + { + "epoch": 0.97, + "learning_rate": 1.5775036709698213e-06, + "loss": 0.8604, + "step": 38030 + }, + { + "epoch": 0.97, + "learning_rate": 1.5774810809197932e-06, + "loss": 0.7998, + "step": 38031 + }, + { + "epoch": 0.97, + "learning_rate": 1.5774584904276141e-06, + "loss": 0.8965, + "step": 38032 + }, + { + "epoch": 0.97, + "learning_rate": 1.5774358994933018e-06, + "loss": 0.6987, + "step": 38033 + }, + { + "epoch": 0.97, + "learning_rate": 1.5774133081168737e-06, + "loss": 0.6963, + "step": 38034 + }, + { + "epoch": 0.97, + "learning_rate": 1.577390716298346e-06, + "loss": 0.7129, + "step": 38035 + }, + { + "epoch": 0.97, + "learning_rate": 1.5773681240377378e-06, + "loss": 0.752, + "step": 38036 + }, + { + "epoch": 0.97, + "learning_rate": 1.5773455313350644e-06, + "loss": 0.8911, + "step": 38037 + }, + { + "epoch": 0.97, + "learning_rate": 1.5773229381903447e-06, + "loss": 1.04, + "step": 38038 + }, + { + "epoch": 0.97, + "learning_rate": 1.5773003446035951e-06, + "loss": 0.7402, + "step": 38039 + }, + { + "epoch": 0.97, + "learning_rate": 1.5772777505748333e-06, + "loss": 0.8857, + "step": 38040 + }, + { + "epoch": 0.98, + "learning_rate": 1.5772551561040763e-06, + "loss": 0.6836, + "step": 38041 + }, + { + "epoch": 0.98, + "learning_rate": 1.5772325611913417e-06, + "loss": 0.957, + "step": 38042 + }, + { + "epoch": 0.98, + "learning_rate": 1.5772099658366468e-06, + "loss": 1.0156, + "step": 38043 + }, + { + "epoch": 0.98, + "learning_rate": 1.5771873700400086e-06, + "loss": 0.7383, + "step": 38044 + }, + { + "epoch": 0.98, + "learning_rate": 1.5771647738014445e-06, + "loss": 0.7935, + "step": 38045 + }, + { + "epoch": 0.98, + "learning_rate": 1.5771421771209719e-06, + "loss": 0.7656, + "step": 38046 + }, + { + "epoch": 0.98, + "learning_rate": 1.5771195799986083e-06, + "loss": 0.9277, + "step": 38047 + }, + { + "epoch": 0.98, + "learning_rate": 1.5770969824343707e-06, + "loss": 0.9468, + "step": 38048 + }, + { + "epoch": 0.98, + "learning_rate": 1.5770743844282763e-06, + "loss": 0.8779, + "step": 38049 + }, + { + "epoch": 0.98, + "learning_rate": 1.5770517859803428e-06, + "loss": 0.6479, + "step": 38050 + }, + { + "epoch": 0.98, + "learning_rate": 1.577029187090587e-06, + "loss": 0.8184, + "step": 38051 + }, + { + "epoch": 0.98, + "learning_rate": 1.5770065877590266e-06, + "loss": 0.8574, + "step": 38052 + }, + { + "epoch": 0.98, + "learning_rate": 1.576983987985679e-06, + "loss": 0.9375, + "step": 38053 + }, + { + "epoch": 0.98, + "learning_rate": 1.5769613877705612e-06, + "loss": 0.8564, + "step": 38054 + }, + { + "epoch": 0.98, + "learning_rate": 1.5769387871136903e-06, + "loss": 0.7363, + "step": 38055 + }, + { + "epoch": 0.98, + "learning_rate": 1.5769161860150841e-06, + "loss": 0.9648, + "step": 38056 + }, + { + "epoch": 0.98, + "learning_rate": 1.5768935844747598e-06, + "loss": 0.8906, + "step": 38057 + }, + { + "epoch": 0.98, + "learning_rate": 1.5768709824927346e-06, + "loss": 0.7236, + "step": 38058 + }, + { + "epoch": 0.98, + "learning_rate": 1.5768483800690256e-06, + "loss": 0.7856, + "step": 38059 + }, + { + "epoch": 0.98, + "learning_rate": 1.5768257772036505e-06, + "loss": 0.9082, + "step": 38060 + }, + { + "epoch": 0.98, + "learning_rate": 1.5768031738966264e-06, + "loss": 0.8242, + "step": 38061 + }, + { + "epoch": 0.98, + "learning_rate": 1.5767805701479704e-06, + "loss": 0.5286, + "step": 38062 + }, + { + "epoch": 0.98, + "learning_rate": 1.5767579659577003e-06, + "loss": 0.7817, + "step": 38063 + }, + { + "epoch": 0.98, + "learning_rate": 1.5767353613258332e-06, + "loss": 0.8091, + "step": 38064 + }, + { + "epoch": 0.98, + "learning_rate": 1.5767127562523864e-06, + "loss": 0.8467, + "step": 38065 + }, + { + "epoch": 0.98, + "learning_rate": 1.5766901507373768e-06, + "loss": 0.792, + "step": 38066 + }, + { + "epoch": 0.98, + "learning_rate": 1.5766675447808222e-06, + "loss": 0.6138, + "step": 38067 + }, + { + "epoch": 0.98, + "learning_rate": 1.5766449383827401e-06, + "loss": 0.5945, + "step": 38068 + }, + { + "epoch": 0.98, + "learning_rate": 1.576622331543147e-06, + "loss": 0.6875, + "step": 38069 + }, + { + "epoch": 0.98, + "learning_rate": 1.576599724262061e-06, + "loss": 1.04, + "step": 38070 + }, + { + "epoch": 0.98, + "learning_rate": 1.576577116539499e-06, + "loss": 0.9346, + "step": 38071 + }, + { + "epoch": 0.98, + "learning_rate": 1.5765545083754783e-06, + "loss": 0.8184, + "step": 38072 + }, + { + "epoch": 0.98, + "learning_rate": 1.5765318997700167e-06, + "loss": 0.5208, + "step": 38073 + }, + { + "epoch": 0.98, + "learning_rate": 1.576509290723131e-06, + "loss": 0.8555, + "step": 38074 + }, + { + "epoch": 0.98, + "learning_rate": 1.5764866812348383e-06, + "loss": 0.6509, + "step": 38075 + }, + { + "epoch": 0.98, + "learning_rate": 1.5764640713051564e-06, + "loss": 0.8242, + "step": 38076 + }, + { + "epoch": 0.98, + "learning_rate": 1.5764414609341027e-06, + "loss": 0.959, + "step": 38077 + }, + { + "epoch": 0.98, + "learning_rate": 1.5764188501216943e-06, + "loss": 0.9062, + "step": 38078 + }, + { + "epoch": 0.98, + "learning_rate": 1.5763962388679483e-06, + "loss": 1.1338, + "step": 38079 + }, + { + "epoch": 0.98, + "learning_rate": 1.5763736271728822e-06, + "loss": 0.8721, + "step": 38080 + }, + { + "epoch": 0.98, + "learning_rate": 1.5763510150365136e-06, + "loss": 0.8457, + "step": 38081 + }, + { + "epoch": 0.98, + "learning_rate": 1.5763284024588593e-06, + "loss": 0.9717, + "step": 38082 + }, + { + "epoch": 0.98, + "learning_rate": 1.5763057894399368e-06, + "loss": 0.707, + "step": 38083 + }, + { + "epoch": 0.98, + "learning_rate": 1.5762831759797635e-06, + "loss": 0.6724, + "step": 38084 + }, + { + "epoch": 0.98, + "learning_rate": 1.5762605620783566e-06, + "loss": 1.001, + "step": 38085 + }, + { + "epoch": 0.98, + "learning_rate": 1.5762379477357334e-06, + "loss": 0.7305, + "step": 38086 + }, + { + "epoch": 0.98, + "learning_rate": 1.5762153329519115e-06, + "loss": 0.9082, + "step": 38087 + }, + { + "epoch": 0.98, + "learning_rate": 1.5761927177269078e-06, + "loss": 0.8604, + "step": 38088 + }, + { + "epoch": 0.98, + "learning_rate": 1.5761701020607401e-06, + "loss": 0.6562, + "step": 38089 + }, + { + "epoch": 0.98, + "learning_rate": 1.5761474859534254e-06, + "loss": 0.7021, + "step": 38090 + }, + { + "epoch": 0.98, + "learning_rate": 1.576124869404981e-06, + "loss": 0.8115, + "step": 38091 + }, + { + "epoch": 0.98, + "learning_rate": 1.576102252415424e-06, + "loss": 0.9863, + "step": 38092 + }, + { + "epoch": 0.98, + "learning_rate": 1.5760796349847726e-06, + "loss": 0.8506, + "step": 38093 + }, + { + "epoch": 0.98, + "learning_rate": 1.5760570171130432e-06, + "loss": 1.0623, + "step": 38094 + }, + { + "epoch": 0.98, + "learning_rate": 1.5760343988002533e-06, + "loss": 0.957, + "step": 38095 + }, + { + "epoch": 0.98, + "learning_rate": 1.5760117800464206e-06, + "loss": 0.7832, + "step": 38096 + }, + { + "epoch": 0.98, + "learning_rate": 1.575989160851562e-06, + "loss": 0.9922, + "step": 38097 + }, + { + "epoch": 0.98, + "learning_rate": 1.5759665412156951e-06, + "loss": 0.7578, + "step": 38098 + }, + { + "epoch": 0.98, + "learning_rate": 1.5759439211388367e-06, + "loss": 0.9111, + "step": 38099 + }, + { + "epoch": 0.98, + "learning_rate": 1.575921300621005e-06, + "loss": 0.7881, + "step": 38100 + }, + { + "epoch": 0.98, + "learning_rate": 1.5758986796622167e-06, + "loss": 0.9531, + "step": 38101 + }, + { + "epoch": 0.98, + "learning_rate": 1.575876058262489e-06, + "loss": 0.6968, + "step": 38102 + }, + { + "epoch": 0.98, + "learning_rate": 1.57585343642184e-06, + "loss": 0.916, + "step": 38103 + }, + { + "epoch": 0.98, + "learning_rate": 1.5758308141402862e-06, + "loss": 0.7783, + "step": 38104 + }, + { + "epoch": 0.98, + "learning_rate": 1.5758081914178454e-06, + "loss": 0.915, + "step": 38105 + }, + { + "epoch": 0.98, + "learning_rate": 1.5757855682545344e-06, + "loss": 0.9609, + "step": 38106 + }, + { + "epoch": 0.98, + "learning_rate": 1.575762944650371e-06, + "loss": 1.0146, + "step": 38107 + }, + { + "epoch": 0.98, + "learning_rate": 1.5757403206053725e-06, + "loss": 0.7324, + "step": 38108 + }, + { + "epoch": 0.98, + "learning_rate": 1.5757176961195562e-06, + "loss": 0.8574, + "step": 38109 + }, + { + "epoch": 0.98, + "learning_rate": 1.575695071192939e-06, + "loss": 1.1904, + "step": 38110 + }, + { + "epoch": 0.98, + "learning_rate": 1.5756724458255387e-06, + "loss": 0.9482, + "step": 38111 + }, + { + "epoch": 0.98, + "learning_rate": 1.5756498200173727e-06, + "loss": 0.7588, + "step": 38112 + }, + { + "epoch": 0.98, + "learning_rate": 1.575627193768458e-06, + "loss": 0.9854, + "step": 38113 + }, + { + "epoch": 0.98, + "learning_rate": 1.575604567078812e-06, + "loss": 0.9619, + "step": 38114 + }, + { + "epoch": 0.98, + "learning_rate": 1.5755819399484518e-06, + "loss": 0.9082, + "step": 38115 + }, + { + "epoch": 0.98, + "learning_rate": 1.5755593123773951e-06, + "loss": 0.8809, + "step": 38116 + }, + { + "epoch": 0.98, + "learning_rate": 1.5755366843656593e-06, + "loss": 1.0283, + "step": 38117 + }, + { + "epoch": 0.98, + "learning_rate": 1.5755140559132617e-06, + "loss": 0.7173, + "step": 38118 + }, + { + "epoch": 0.98, + "learning_rate": 1.5754914270202188e-06, + "loss": 0.6445, + "step": 38119 + }, + { + "epoch": 0.98, + "learning_rate": 1.575468797686549e-06, + "loss": 0.6992, + "step": 38120 + }, + { + "epoch": 0.98, + "learning_rate": 1.575446167912269e-06, + "loss": 0.8018, + "step": 38121 + }, + { + "epoch": 0.98, + "learning_rate": 1.5754235376973965e-06, + "loss": 0.7393, + "step": 38122 + }, + { + "epoch": 0.98, + "learning_rate": 1.5754009070419487e-06, + "loss": 0.7607, + "step": 38123 + }, + { + "epoch": 0.98, + "learning_rate": 1.5753782759459427e-06, + "loss": 0.7832, + "step": 38124 + }, + { + "epoch": 0.98, + "learning_rate": 1.575355644409396e-06, + "loss": 0.8003, + "step": 38125 + }, + { + "epoch": 0.98, + "learning_rate": 1.5753330124323263e-06, + "loss": 0.7339, + "step": 38126 + }, + { + "epoch": 0.98, + "learning_rate": 1.5753103800147502e-06, + "loss": 0.6381, + "step": 38127 + }, + { + "epoch": 0.98, + "learning_rate": 1.5752877471566857e-06, + "loss": 0.7666, + "step": 38128 + }, + { + "epoch": 0.98, + "learning_rate": 1.5752651138581494e-06, + "loss": 0.6357, + "step": 38129 + }, + { + "epoch": 0.98, + "learning_rate": 1.5752424801191592e-06, + "loss": 0.8164, + "step": 38130 + }, + { + "epoch": 0.98, + "learning_rate": 1.5752198459397325e-06, + "loss": 0.8096, + "step": 38131 + }, + { + "epoch": 0.98, + "learning_rate": 1.5751972113198861e-06, + "loss": 0.7939, + "step": 38132 + }, + { + "epoch": 0.98, + "learning_rate": 1.5751745762596381e-06, + "loss": 0.8877, + "step": 38133 + }, + { + "epoch": 0.98, + "learning_rate": 1.575151940759005e-06, + "loss": 0.9297, + "step": 38134 + }, + { + "epoch": 0.98, + "learning_rate": 1.5751293048180045e-06, + "loss": 0.8091, + "step": 38135 + }, + { + "epoch": 0.98, + "learning_rate": 1.5751066684366542e-06, + "loss": 0.6289, + "step": 38136 + }, + { + "epoch": 0.98, + "learning_rate": 1.5750840316149709e-06, + "loss": 0.6936, + "step": 38137 + }, + { + "epoch": 0.98, + "learning_rate": 1.5750613943529723e-06, + "loss": 0.8262, + "step": 38138 + }, + { + "epoch": 0.98, + "learning_rate": 1.5750387566506758e-06, + "loss": 0.9717, + "step": 38139 + }, + { + "epoch": 0.98, + "learning_rate": 1.5750161185080982e-06, + "loss": 0.6611, + "step": 38140 + }, + { + "epoch": 0.98, + "learning_rate": 1.5749934799252574e-06, + "loss": 0.73, + "step": 38141 + }, + { + "epoch": 0.98, + "learning_rate": 1.5749708409021704e-06, + "loss": 0.6538, + "step": 38142 + }, + { + "epoch": 0.98, + "learning_rate": 1.5749482014388552e-06, + "loss": 0.5938, + "step": 38143 + }, + { + "epoch": 0.98, + "learning_rate": 1.574925561535328e-06, + "loss": 0.7725, + "step": 38144 + }, + { + "epoch": 0.98, + "learning_rate": 1.574902921191607e-06, + "loss": 0.9121, + "step": 38145 + }, + { + "epoch": 0.98, + "learning_rate": 1.5748802804077093e-06, + "loss": 0.8779, + "step": 38146 + }, + { + "epoch": 0.98, + "learning_rate": 1.574857639183652e-06, + "loss": 0.7617, + "step": 38147 + }, + { + "epoch": 0.98, + "learning_rate": 1.5748349975194529e-06, + "loss": 0.9043, + "step": 38148 + }, + { + "epoch": 0.98, + "learning_rate": 1.574812355415129e-06, + "loss": 0.8291, + "step": 38149 + }, + { + "epoch": 0.98, + "learning_rate": 1.5747897128706975e-06, + "loss": 0.8145, + "step": 38150 + }, + { + "epoch": 0.98, + "learning_rate": 1.5747670698861758e-06, + "loss": 0.8027, + "step": 38151 + }, + { + "epoch": 0.98, + "learning_rate": 1.5747444264615819e-06, + "loss": 0.6875, + "step": 38152 + }, + { + "epoch": 0.98, + "learning_rate": 1.5747217825969322e-06, + "loss": 0.7749, + "step": 38153 + }, + { + "epoch": 0.98, + "learning_rate": 1.5746991382922446e-06, + "loss": 0.9678, + "step": 38154 + }, + { + "epoch": 0.98, + "learning_rate": 1.5746764935475366e-06, + "loss": 0.8198, + "step": 38155 + }, + { + "epoch": 0.98, + "learning_rate": 1.5746538483628249e-06, + "loss": 0.8066, + "step": 38156 + }, + { + "epoch": 0.98, + "learning_rate": 1.5746312027381272e-06, + "loss": 0.7705, + "step": 38157 + }, + { + "epoch": 0.98, + "learning_rate": 1.574608556673461e-06, + "loss": 0.6714, + "step": 38158 + }, + { + "epoch": 0.98, + "learning_rate": 1.574585910168843e-06, + "loss": 1.0557, + "step": 38159 + }, + { + "epoch": 0.98, + "learning_rate": 1.5745632632242913e-06, + "loss": 0.8662, + "step": 38160 + }, + { + "epoch": 0.98, + "learning_rate": 1.574540615839823e-06, + "loss": 0.8779, + "step": 38161 + }, + { + "epoch": 0.98, + "learning_rate": 1.574517968015455e-06, + "loss": 0.8379, + "step": 38162 + }, + { + "epoch": 0.98, + "learning_rate": 1.5744953197512056e-06, + "loss": 0.8965, + "step": 38163 + }, + { + "epoch": 0.98, + "learning_rate": 1.5744726710470912e-06, + "loss": 0.9824, + "step": 38164 + }, + { + "epoch": 0.98, + "learning_rate": 1.5744500219031296e-06, + "loss": 0.9453, + "step": 38165 + }, + { + "epoch": 0.98, + "learning_rate": 1.5744273723193377e-06, + "loss": 0.873, + "step": 38166 + }, + { + "epoch": 0.98, + "learning_rate": 1.5744047222957336e-06, + "loss": 1.043, + "step": 38167 + }, + { + "epoch": 0.98, + "learning_rate": 1.5743820718323342e-06, + "loss": 1.1006, + "step": 38168 + }, + { + "epoch": 0.98, + "learning_rate": 1.5743594209291567e-06, + "loss": 0.8613, + "step": 38169 + }, + { + "epoch": 0.98, + "learning_rate": 1.5743367695862184e-06, + "loss": 0.7812, + "step": 38170 + }, + { + "epoch": 0.98, + "learning_rate": 1.5743141178035371e-06, + "loss": 0.918, + "step": 38171 + }, + { + "epoch": 0.98, + "learning_rate": 1.5742914655811298e-06, + "loss": 0.7676, + "step": 38172 + }, + { + "epoch": 0.98, + "learning_rate": 1.574268812919014e-06, + "loss": 0.8501, + "step": 38173 + }, + { + "epoch": 0.98, + "learning_rate": 1.574246159817207e-06, + "loss": 0.7375, + "step": 38174 + }, + { + "epoch": 0.98, + "learning_rate": 1.574223506275726e-06, + "loss": 0.5551, + "step": 38175 + }, + { + "epoch": 0.98, + "learning_rate": 1.5742008522945883e-06, + "loss": 0.9209, + "step": 38176 + }, + { + "epoch": 0.98, + "learning_rate": 1.5741781978738118e-06, + "loss": 0.8296, + "step": 38177 + }, + { + "epoch": 0.98, + "learning_rate": 1.5741555430134135e-06, + "loss": 0.9219, + "step": 38178 + }, + { + "epoch": 0.98, + "learning_rate": 1.5741328877134104e-06, + "loss": 0.7979, + "step": 38179 + }, + { + "epoch": 0.98, + "learning_rate": 1.5741102319738203e-06, + "loss": 0.5811, + "step": 38180 + }, + { + "epoch": 0.98, + "learning_rate": 1.5740875757946603e-06, + "loss": 0.8057, + "step": 38181 + }, + { + "epoch": 0.98, + "learning_rate": 1.5740649191759476e-06, + "loss": 0.8008, + "step": 38182 + }, + { + "epoch": 0.98, + "learning_rate": 1.5740422621177004e-06, + "loss": 1.0225, + "step": 38183 + }, + { + "epoch": 0.98, + "learning_rate": 1.574019604619935e-06, + "loss": 0.71, + "step": 38184 + }, + { + "epoch": 0.98, + "learning_rate": 1.5739969466826692e-06, + "loss": 0.8608, + "step": 38185 + }, + { + "epoch": 0.98, + "learning_rate": 1.5739742883059206e-06, + "loss": 0.8154, + "step": 38186 + }, + { + "epoch": 0.98, + "learning_rate": 1.573951629489706e-06, + "loss": 0.9062, + "step": 38187 + }, + { + "epoch": 0.98, + "learning_rate": 1.5739289702340432e-06, + "loss": 0.7812, + "step": 38188 + }, + { + "epoch": 0.98, + "learning_rate": 1.5739063105389492e-06, + "loss": 0.833, + "step": 38189 + }, + { + "epoch": 0.98, + "learning_rate": 1.5738836504044418e-06, + "loss": 0.9707, + "step": 38190 + }, + { + "epoch": 0.98, + "learning_rate": 1.5738609898305377e-06, + "loss": 0.9219, + "step": 38191 + }, + { + "epoch": 0.98, + "learning_rate": 1.573838328817255e-06, + "loss": 0.874, + "step": 38192 + }, + { + "epoch": 0.98, + "learning_rate": 1.5738156673646103e-06, + "loss": 0.8262, + "step": 38193 + }, + { + "epoch": 0.98, + "learning_rate": 1.5737930054726215e-06, + "loss": 0.8447, + "step": 38194 + }, + { + "epoch": 0.98, + "learning_rate": 1.573770343141306e-06, + "loss": 0.6987, + "step": 38195 + }, + { + "epoch": 0.98, + "learning_rate": 1.5737476803706807e-06, + "loss": 1.0078, + "step": 38196 + }, + { + "epoch": 0.98, + "learning_rate": 1.5737250171607631e-06, + "loss": 0.998, + "step": 38197 + }, + { + "epoch": 0.98, + "learning_rate": 1.573702353511571e-06, + "loss": 0.7588, + "step": 38198 + }, + { + "epoch": 0.98, + "learning_rate": 1.573679689423121e-06, + "loss": 0.9219, + "step": 38199 + }, + { + "epoch": 0.98, + "learning_rate": 1.5736570248954312e-06, + "loss": 0.7739, + "step": 38200 + }, + { + "epoch": 0.98, + "learning_rate": 1.5736343599285182e-06, + "loss": 0.7881, + "step": 38201 + }, + { + "epoch": 0.98, + "learning_rate": 1.5736116945224e-06, + "loss": 0.8926, + "step": 38202 + }, + { + "epoch": 0.98, + "learning_rate": 1.5735890286770936e-06, + "loss": 0.8789, + "step": 38203 + }, + { + "epoch": 0.98, + "learning_rate": 1.5735663623926165e-06, + "loss": 1.123, + "step": 38204 + }, + { + "epoch": 0.98, + "learning_rate": 1.5735436956689858e-06, + "loss": 0.7764, + "step": 38205 + }, + { + "epoch": 0.98, + "learning_rate": 1.5735210285062194e-06, + "loss": 0.959, + "step": 38206 + }, + { + "epoch": 0.98, + "learning_rate": 1.5734983609043341e-06, + "loss": 0.7539, + "step": 38207 + }, + { + "epoch": 0.98, + "learning_rate": 1.5734756928633476e-06, + "loss": 0.5684, + "step": 38208 + }, + { + "epoch": 0.98, + "learning_rate": 1.5734530243832772e-06, + "loss": 0.8362, + "step": 38209 + }, + { + "epoch": 0.98, + "learning_rate": 1.57343035546414e-06, + "loss": 0.9053, + "step": 38210 + }, + { + "epoch": 0.98, + "learning_rate": 1.5734076861059538e-06, + "loss": 0.8086, + "step": 38211 + }, + { + "epoch": 0.98, + "learning_rate": 1.5733850163087352e-06, + "loss": 0.7712, + "step": 38212 + }, + { + "epoch": 0.98, + "learning_rate": 1.5733623460725025e-06, + "loss": 0.7217, + "step": 38213 + }, + { + "epoch": 0.98, + "learning_rate": 1.5733396753972725e-06, + "loss": 0.7058, + "step": 38214 + }, + { + "epoch": 0.98, + "learning_rate": 1.5733170042830628e-06, + "loss": 0.9385, + "step": 38215 + }, + { + "epoch": 0.98, + "learning_rate": 1.5732943327298904e-06, + "loss": 0.8208, + "step": 38216 + }, + { + "epoch": 0.98, + "learning_rate": 1.573271660737773e-06, + "loss": 0.9004, + "step": 38217 + }, + { + "epoch": 0.98, + "learning_rate": 1.5732489883067279e-06, + "loss": 1.001, + "step": 38218 + }, + { + "epoch": 0.98, + "learning_rate": 1.5732263154367724e-06, + "loss": 0.7598, + "step": 38219 + }, + { + "epoch": 0.98, + "learning_rate": 1.5732036421279237e-06, + "loss": 0.7754, + "step": 38220 + }, + { + "epoch": 0.98, + "learning_rate": 1.5731809683801994e-06, + "loss": 0.9287, + "step": 38221 + }, + { + "epoch": 0.98, + "learning_rate": 1.5731582941936168e-06, + "loss": 0.8682, + "step": 38222 + }, + { + "epoch": 0.98, + "learning_rate": 1.5731356195681933e-06, + "loss": 0.9248, + "step": 38223 + }, + { + "epoch": 0.98, + "learning_rate": 1.5731129445039462e-06, + "loss": 1.0645, + "step": 38224 + }, + { + "epoch": 0.98, + "learning_rate": 1.573090269000893e-06, + "loss": 0.9355, + "step": 38225 + }, + { + "epoch": 0.98, + "learning_rate": 1.5730675930590506e-06, + "loss": 0.9434, + "step": 38226 + }, + { + "epoch": 0.98, + "learning_rate": 1.573044916678437e-06, + "loss": 0.6611, + "step": 38227 + }, + { + "epoch": 0.98, + "learning_rate": 1.5730222398590694e-06, + "loss": 0.7656, + "step": 38228 + }, + { + "epoch": 0.98, + "learning_rate": 1.5729995626009647e-06, + "loss": 0.957, + "step": 38229 + }, + { + "epoch": 0.98, + "learning_rate": 1.5729768849041406e-06, + "loss": 0.8379, + "step": 38230 + }, + { + "epoch": 0.98, + "learning_rate": 1.5729542067686143e-06, + "loss": 0.9258, + "step": 38231 + }, + { + "epoch": 0.98, + "learning_rate": 1.5729315281944034e-06, + "loss": 0.8818, + "step": 38232 + }, + { + "epoch": 0.98, + "learning_rate": 1.5729088491815255e-06, + "loss": 1.0537, + "step": 38233 + }, + { + "epoch": 0.98, + "learning_rate": 1.5728861697299975e-06, + "loss": 1.0176, + "step": 38234 + }, + { + "epoch": 0.98, + "learning_rate": 1.5728634898398366e-06, + "loss": 0.6978, + "step": 38235 + }, + { + "epoch": 0.98, + "learning_rate": 1.5728408095110606e-06, + "loss": 0.8105, + "step": 38236 + }, + { + "epoch": 0.98, + "learning_rate": 1.572818128743687e-06, + "loss": 0.9424, + "step": 38237 + }, + { + "epoch": 0.98, + "learning_rate": 1.5727954475377328e-06, + "loss": 0.8896, + "step": 38238 + }, + { + "epoch": 0.98, + "learning_rate": 1.5727727658932153e-06, + "loss": 0.7793, + "step": 38239 + }, + { + "epoch": 0.98, + "learning_rate": 1.5727500838101522e-06, + "loss": 1.0332, + "step": 38240 + }, + { + "epoch": 0.98, + "learning_rate": 1.5727274012885606e-06, + "loss": 0.8223, + "step": 38241 + }, + { + "epoch": 0.98, + "learning_rate": 1.572704718328458e-06, + "loss": 0.9746, + "step": 38242 + }, + { + "epoch": 0.98, + "learning_rate": 1.5726820349298616e-06, + "loss": 0.6729, + "step": 38243 + }, + { + "epoch": 0.98, + "learning_rate": 1.5726593510927889e-06, + "loss": 0.8271, + "step": 38244 + }, + { + "epoch": 0.98, + "learning_rate": 1.5726366668172574e-06, + "loss": 0.8091, + "step": 38245 + }, + { + "epoch": 0.98, + "learning_rate": 1.5726139821032841e-06, + "loss": 0.875, + "step": 38246 + }, + { + "epoch": 0.98, + "learning_rate": 1.572591296950887e-06, + "loss": 0.9736, + "step": 38247 + }, + { + "epoch": 0.98, + "learning_rate": 1.572568611360083e-06, + "loss": 0.8271, + "step": 38248 + }, + { + "epoch": 0.98, + "learning_rate": 1.5725459253308892e-06, + "loss": 0.8242, + "step": 38249 + }, + { + "epoch": 0.98, + "learning_rate": 1.5725232388633235e-06, + "loss": 0.8662, + "step": 38250 + }, + { + "epoch": 0.98, + "learning_rate": 1.572500551957403e-06, + "loss": 0.7988, + "step": 38251 + }, + { + "epoch": 0.98, + "learning_rate": 1.5724778646131453e-06, + "loss": 0.9863, + "step": 38252 + }, + { + "epoch": 0.98, + "learning_rate": 1.5724551768305677e-06, + "loss": 1.0166, + "step": 38253 + }, + { + "epoch": 0.98, + "learning_rate": 1.5724324886096874e-06, + "loss": 0.7153, + "step": 38254 + }, + { + "epoch": 0.98, + "learning_rate": 1.5724097999505218e-06, + "loss": 0.6957, + "step": 38255 + }, + { + "epoch": 0.98, + "learning_rate": 1.5723871108530884e-06, + "loss": 0.5254, + "step": 38256 + }, + { + "epoch": 0.98, + "learning_rate": 1.5723644213174046e-06, + "loss": 0.9502, + "step": 38257 + }, + { + "epoch": 0.98, + "learning_rate": 1.5723417313434874e-06, + "loss": 1.0957, + "step": 38258 + }, + { + "epoch": 0.98, + "learning_rate": 1.5723190409313547e-06, + "loss": 1.1123, + "step": 38259 + }, + { + "epoch": 0.98, + "learning_rate": 1.5722963500810234e-06, + "loss": 0.8545, + "step": 38260 + }, + { + "epoch": 0.98, + "learning_rate": 1.5722736587925113e-06, + "loss": 1.0264, + "step": 38261 + }, + { + "epoch": 0.98, + "learning_rate": 1.5722509670658357e-06, + "loss": 0.9785, + "step": 38262 + }, + { + "epoch": 0.98, + "learning_rate": 1.5722282749010133e-06, + "loss": 0.6809, + "step": 38263 + }, + { + "epoch": 0.98, + "learning_rate": 1.5722055822980625e-06, + "loss": 0.6904, + "step": 38264 + }, + { + "epoch": 0.98, + "learning_rate": 1.5721828892570002e-06, + "loss": 0.7529, + "step": 38265 + }, + { + "epoch": 0.98, + "learning_rate": 1.5721601957778434e-06, + "loss": 1.0059, + "step": 38266 + }, + { + "epoch": 0.98, + "learning_rate": 1.5721375018606104e-06, + "loss": 0.8291, + "step": 38267 + }, + { + "epoch": 0.98, + "learning_rate": 1.5721148075053176e-06, + "loss": 0.835, + "step": 38268 + }, + { + "epoch": 0.98, + "learning_rate": 1.5720921127119828e-06, + "loss": 0.7852, + "step": 38269 + }, + { + "epoch": 0.98, + "learning_rate": 1.5720694174806235e-06, + "loss": 0.7812, + "step": 38270 + }, + { + "epoch": 0.98, + "learning_rate": 1.572046721811257e-06, + "loss": 0.7041, + "step": 38271 + }, + { + "epoch": 0.98, + "learning_rate": 1.5720240257039006e-06, + "loss": 0.8555, + "step": 38272 + }, + { + "epoch": 0.98, + "learning_rate": 1.5720013291585716e-06, + "loss": 0.5342, + "step": 38273 + }, + { + "epoch": 0.98, + "learning_rate": 1.5719786321752877e-06, + "loss": 0.8838, + "step": 38274 + }, + { + "epoch": 0.98, + "learning_rate": 1.5719559347540658e-06, + "loss": 0.832, + "step": 38275 + }, + { + "epoch": 0.98, + "learning_rate": 1.5719332368949236e-06, + "loss": 0.5132, + "step": 38276 + }, + { + "epoch": 0.98, + "learning_rate": 1.5719105385978787e-06, + "loss": 0.6411, + "step": 38277 + }, + { + "epoch": 0.98, + "learning_rate": 1.5718878398629478e-06, + "loss": 0.7764, + "step": 38278 + }, + { + "epoch": 0.98, + "learning_rate": 1.571865140690149e-06, + "loss": 0.8223, + "step": 38279 + }, + { + "epoch": 0.98, + "learning_rate": 1.5718424410794992e-06, + "loss": 0.9131, + "step": 38280 + }, + { + "epoch": 0.98, + "learning_rate": 1.5718197410310159e-06, + "loss": 0.7734, + "step": 38281 + }, + { + "epoch": 0.98, + "learning_rate": 1.5717970405447165e-06, + "loss": 0.6001, + "step": 38282 + }, + { + "epoch": 0.98, + "learning_rate": 1.5717743396206186e-06, + "loss": 0.9551, + "step": 38283 + }, + { + "epoch": 0.98, + "learning_rate": 1.5717516382587392e-06, + "loss": 1.166, + "step": 38284 + }, + { + "epoch": 0.98, + "learning_rate": 1.5717289364590957e-06, + "loss": 0.7588, + "step": 38285 + }, + { + "epoch": 0.98, + "learning_rate": 1.571706234221706e-06, + "loss": 0.96, + "step": 38286 + }, + { + "epoch": 0.98, + "learning_rate": 1.571683531546587e-06, + "loss": 0.8296, + "step": 38287 + }, + { + "epoch": 0.98, + "learning_rate": 1.5716608284337562e-06, + "loss": 0.8105, + "step": 38288 + }, + { + "epoch": 0.98, + "learning_rate": 1.5716381248832308e-06, + "loss": 0.7656, + "step": 38289 + }, + { + "epoch": 0.98, + "learning_rate": 1.5716154208950287e-06, + "loss": 1.0039, + "step": 38290 + }, + { + "epoch": 0.98, + "learning_rate": 1.5715927164691668e-06, + "loss": 0.7861, + "step": 38291 + }, + { + "epoch": 0.98, + "learning_rate": 1.5715700116056627e-06, + "loss": 0.6968, + "step": 38292 + }, + { + "epoch": 0.98, + "learning_rate": 1.5715473063045335e-06, + "loss": 1.0586, + "step": 38293 + }, + { + "epoch": 0.98, + "learning_rate": 1.5715246005657972e-06, + "loss": 0.624, + "step": 38294 + }, + { + "epoch": 0.98, + "learning_rate": 1.5715018943894704e-06, + "loss": 0.8286, + "step": 38295 + }, + { + "epoch": 0.98, + "learning_rate": 1.571479187775571e-06, + "loss": 0.8296, + "step": 38296 + }, + { + "epoch": 0.98, + "learning_rate": 1.5714564807241164e-06, + "loss": 0.6782, + "step": 38297 + }, + { + "epoch": 0.98, + "learning_rate": 1.5714337732351238e-06, + "loss": 0.8896, + "step": 38298 + }, + { + "epoch": 0.98, + "learning_rate": 1.5714110653086104e-06, + "loss": 0.7617, + "step": 38299 + }, + { + "epoch": 0.98, + "learning_rate": 1.571388356944594e-06, + "loss": 0.9727, + "step": 38300 + }, + { + "epoch": 0.98, + "learning_rate": 1.5713656481430916e-06, + "loss": 0.8799, + "step": 38301 + }, + { + "epoch": 0.98, + "learning_rate": 1.5713429389041215e-06, + "loss": 1.0117, + "step": 38302 + }, + { + "epoch": 0.98, + "learning_rate": 1.5713202292276997e-06, + "loss": 1.0713, + "step": 38303 + }, + { + "epoch": 0.98, + "learning_rate": 1.5712975191138445e-06, + "loss": 0.834, + "step": 38304 + }, + { + "epoch": 0.98, + "learning_rate": 1.571274808562573e-06, + "loss": 0.7949, + "step": 38305 + }, + { + "epoch": 0.98, + "learning_rate": 1.5712520975739026e-06, + "loss": 0.5737, + "step": 38306 + }, + { + "epoch": 0.98, + "learning_rate": 1.5712293861478506e-06, + "loss": 0.8936, + "step": 38307 + }, + { + "epoch": 0.98, + "learning_rate": 1.5712066742844349e-06, + "loss": 0.8916, + "step": 38308 + }, + { + "epoch": 0.98, + "learning_rate": 1.5711839619836723e-06, + "loss": 0.8779, + "step": 38309 + }, + { + "epoch": 0.98, + "learning_rate": 1.5711612492455805e-06, + "loss": 0.7656, + "step": 38310 + }, + { + "epoch": 0.98, + "learning_rate": 1.5711385360701768e-06, + "loss": 0.8818, + "step": 38311 + }, + { + "epoch": 0.98, + "learning_rate": 1.5711158224574786e-06, + "loss": 0.7412, + "step": 38312 + }, + { + "epoch": 0.98, + "learning_rate": 1.5710931084075032e-06, + "loss": 1.0312, + "step": 38313 + }, + { + "epoch": 0.98, + "learning_rate": 1.571070393920268e-06, + "loss": 0.9639, + "step": 38314 + }, + { + "epoch": 0.98, + "learning_rate": 1.5710476789957906e-06, + "loss": 1.0225, + "step": 38315 + }, + { + "epoch": 0.98, + "learning_rate": 1.571024963634088e-06, + "loss": 0.6509, + "step": 38316 + }, + { + "epoch": 0.98, + "learning_rate": 1.5710022478351782e-06, + "loss": 0.9189, + "step": 38317 + }, + { + "epoch": 0.98, + "learning_rate": 1.5709795315990779e-06, + "loss": 0.832, + "step": 38318 + }, + { + "epoch": 0.98, + "learning_rate": 1.570956814925805e-06, + "loss": 0.7861, + "step": 38319 + }, + { + "epoch": 0.98, + "learning_rate": 1.5709340978153768e-06, + "loss": 0.7061, + "step": 38320 + }, + { + "epoch": 0.98, + "learning_rate": 1.5709113802678103e-06, + "loss": 1.0, + "step": 38321 + }, + { + "epoch": 0.98, + "learning_rate": 1.5708886622831238e-06, + "loss": 0.8052, + "step": 38322 + }, + { + "epoch": 0.98, + "learning_rate": 1.5708659438613335e-06, + "loss": 0.8008, + "step": 38323 + }, + { + "epoch": 0.98, + "learning_rate": 1.5708432250024575e-06, + "loss": 1.0107, + "step": 38324 + }, + { + "epoch": 0.98, + "learning_rate": 1.5708205057065134e-06, + "loss": 0.6838, + "step": 38325 + }, + { + "epoch": 0.98, + "learning_rate": 1.570797785973518e-06, + "loss": 1.002, + "step": 38326 + }, + { + "epoch": 0.98, + "learning_rate": 1.570775065803489e-06, + "loss": 0.7273, + "step": 38327 + }, + { + "epoch": 0.98, + "learning_rate": 1.570752345196444e-06, + "loss": 0.7148, + "step": 38328 + }, + { + "epoch": 0.98, + "learning_rate": 1.5707296241524e-06, + "loss": 0.7422, + "step": 38329 + }, + { + "epoch": 0.98, + "learning_rate": 1.5707069026713743e-06, + "loss": 0.9385, + "step": 38330 + }, + { + "epoch": 0.98, + "learning_rate": 1.570684180753385e-06, + "loss": 0.9863, + "step": 38331 + }, + { + "epoch": 0.98, + "learning_rate": 1.570661458398449e-06, + "loss": 0.8223, + "step": 38332 + }, + { + "epoch": 0.98, + "learning_rate": 1.5706387356065839e-06, + "loss": 0.7622, + "step": 38333 + }, + { + "epoch": 0.98, + "learning_rate": 1.5706160123778065e-06, + "loss": 0.791, + "step": 38334 + }, + { + "epoch": 0.98, + "learning_rate": 1.570593288712135e-06, + "loss": 0.7979, + "step": 38335 + }, + { + "epoch": 0.98, + "learning_rate": 1.570570564609586e-06, + "loss": 0.6597, + "step": 38336 + }, + { + "epoch": 0.98, + "learning_rate": 1.570547840070178e-06, + "loss": 0.8115, + "step": 38337 + }, + { + "epoch": 0.98, + "learning_rate": 1.5705251150939277e-06, + "loss": 0.8945, + "step": 38338 + }, + { + "epoch": 0.98, + "learning_rate": 1.570502389680852e-06, + "loss": 0.7476, + "step": 38339 + }, + { + "epoch": 0.98, + "learning_rate": 1.5704796638309692e-06, + "loss": 0.7324, + "step": 38340 + }, + { + "epoch": 0.98, + "learning_rate": 1.5704569375442964e-06, + "loss": 0.7393, + "step": 38341 + }, + { + "epoch": 0.98, + "learning_rate": 1.570434210820851e-06, + "loss": 0.769, + "step": 38342 + }, + { + "epoch": 0.98, + "learning_rate": 1.5704114836606502e-06, + "loss": 0.6943, + "step": 38343 + }, + { + "epoch": 0.98, + "learning_rate": 1.5703887560637114e-06, + "loss": 0.79, + "step": 38344 + }, + { + "epoch": 0.98, + "learning_rate": 1.5703660280300523e-06, + "loss": 0.8711, + "step": 38345 + }, + { + "epoch": 0.98, + "learning_rate": 1.5703432995596902e-06, + "loss": 1.0479, + "step": 38346 + }, + { + "epoch": 0.98, + "learning_rate": 1.5703205706526426e-06, + "loss": 0.73, + "step": 38347 + }, + { + "epoch": 0.98, + "learning_rate": 1.5702978413089266e-06, + "loss": 0.8047, + "step": 38348 + }, + { + "epoch": 0.98, + "learning_rate": 1.5702751115285598e-06, + "loss": 1.0039, + "step": 38349 + }, + { + "epoch": 0.98, + "learning_rate": 1.5702523813115597e-06, + "loss": 1.0044, + "step": 38350 + }, + { + "epoch": 0.98, + "learning_rate": 1.5702296506579434e-06, + "loss": 0.8525, + "step": 38351 + }, + { + "epoch": 0.98, + "learning_rate": 1.5702069195677283e-06, + "loss": 0.7026, + "step": 38352 + }, + { + "epoch": 0.98, + "learning_rate": 1.5701841880409323e-06, + "loss": 0.8086, + "step": 38353 + }, + { + "epoch": 0.98, + "learning_rate": 1.5701614560775723e-06, + "loss": 0.6416, + "step": 38354 + }, + { + "epoch": 0.98, + "learning_rate": 1.570138723677666e-06, + "loss": 0.9971, + "step": 38355 + }, + { + "epoch": 0.98, + "learning_rate": 1.5701159908412308e-06, + "loss": 0.6875, + "step": 38356 + }, + { + "epoch": 0.98, + "learning_rate": 1.5700932575682837e-06, + "loss": 0.917, + "step": 38357 + }, + { + "epoch": 0.98, + "learning_rate": 1.5700705238588426e-06, + "loss": 1.0078, + "step": 38358 + }, + { + "epoch": 0.98, + "learning_rate": 1.5700477897129246e-06, + "loss": 0.7783, + "step": 38359 + }, + { + "epoch": 0.98, + "learning_rate": 1.5700250551305474e-06, + "loss": 0.708, + "step": 38360 + }, + { + "epoch": 0.98, + "learning_rate": 1.5700023201117278e-06, + "loss": 0.9551, + "step": 38361 + }, + { + "epoch": 0.98, + "learning_rate": 1.5699795846564843e-06, + "loss": 0.7583, + "step": 38362 + }, + { + "epoch": 0.98, + "learning_rate": 1.5699568487648334e-06, + "loss": 0.8159, + "step": 38363 + }, + { + "epoch": 0.98, + "learning_rate": 1.5699341124367925e-06, + "loss": 1.0186, + "step": 38364 + }, + { + "epoch": 0.98, + "learning_rate": 1.5699113756723793e-06, + "loss": 0.8984, + "step": 38365 + }, + { + "epoch": 0.98, + "learning_rate": 1.5698886384716113e-06, + "loss": 0.8662, + "step": 38366 + }, + { + "epoch": 0.98, + "learning_rate": 1.5698659008345057e-06, + "loss": 0.7686, + "step": 38367 + }, + { + "epoch": 0.98, + "learning_rate": 1.5698431627610801e-06, + "loss": 0.7871, + "step": 38368 + }, + { + "epoch": 0.98, + "learning_rate": 1.5698204242513517e-06, + "loss": 1.0469, + "step": 38369 + }, + { + "epoch": 0.98, + "learning_rate": 1.569797685305338e-06, + "loss": 0.7803, + "step": 38370 + }, + { + "epoch": 0.98, + "learning_rate": 1.5697749459230565e-06, + "loss": 0.9648, + "step": 38371 + }, + { + "epoch": 0.98, + "learning_rate": 1.5697522061045243e-06, + "loss": 0.7451, + "step": 38372 + }, + { + "epoch": 0.98, + "learning_rate": 1.5697294658497594e-06, + "loss": 1.0557, + "step": 38373 + }, + { + "epoch": 0.98, + "learning_rate": 1.5697067251587784e-06, + "loss": 0.6348, + "step": 38374 + }, + { + "epoch": 0.98, + "learning_rate": 1.5696839840315993e-06, + "loss": 0.6748, + "step": 38375 + }, + { + "epoch": 0.98, + "learning_rate": 1.5696612424682396e-06, + "loss": 0.8965, + "step": 38376 + }, + { + "epoch": 0.98, + "learning_rate": 1.5696385004687166e-06, + "loss": 0.7583, + "step": 38377 + }, + { + "epoch": 0.98, + "learning_rate": 1.5696157580330472e-06, + "loss": 0.8779, + "step": 38378 + }, + { + "epoch": 0.98, + "learning_rate": 1.5695930151612492e-06, + "loss": 0.8535, + "step": 38379 + }, + { + "epoch": 0.98, + "learning_rate": 1.5695702718533402e-06, + "loss": 0.9141, + "step": 38380 + }, + { + "epoch": 0.98, + "learning_rate": 1.5695475281093373e-06, + "loss": 1.0098, + "step": 38381 + }, + { + "epoch": 0.98, + "learning_rate": 1.5695247839292582e-06, + "loss": 0.6743, + "step": 38382 + }, + { + "epoch": 0.98, + "learning_rate": 1.5695020393131202e-06, + "loss": 0.9971, + "step": 38383 + }, + { + "epoch": 0.98, + "learning_rate": 1.5694792942609402e-06, + "loss": 0.7417, + "step": 38384 + }, + { + "epoch": 0.98, + "learning_rate": 1.5694565487727366e-06, + "loss": 0.7988, + "step": 38385 + }, + { + "epoch": 0.98, + "learning_rate": 1.569433802848526e-06, + "loss": 0.8047, + "step": 38386 + }, + { + "epoch": 0.98, + "learning_rate": 1.5694110564883266e-06, + "loss": 0.9746, + "step": 38387 + }, + { + "epoch": 0.98, + "learning_rate": 1.5693883096921549e-06, + "loss": 0.9355, + "step": 38388 + }, + { + "epoch": 0.98, + "learning_rate": 1.5693655624600289e-06, + "loss": 0.5088, + "step": 38389 + }, + { + "epoch": 0.98, + "learning_rate": 1.5693428147919657e-06, + "loss": 0.8184, + "step": 38390 + }, + { + "epoch": 0.98, + "learning_rate": 1.569320066687983e-06, + "loss": 0.9277, + "step": 38391 + }, + { + "epoch": 0.98, + "learning_rate": 1.5692973181480982e-06, + "loss": 0.5264, + "step": 38392 + }, + { + "epoch": 0.98, + "learning_rate": 1.5692745691723286e-06, + "loss": 0.8086, + "step": 38393 + }, + { + "epoch": 0.98, + "learning_rate": 1.5692518197606917e-06, + "loss": 0.8359, + "step": 38394 + }, + { + "epoch": 0.98, + "learning_rate": 1.5692290699132045e-06, + "loss": 0.9863, + "step": 38395 + }, + { + "epoch": 0.98, + "learning_rate": 1.569206319629885e-06, + "loss": 0.8828, + "step": 38396 + }, + { + "epoch": 0.98, + "learning_rate": 1.5691835689107506e-06, + "loss": 0.8701, + "step": 38397 + }, + { + "epoch": 0.98, + "learning_rate": 1.5691608177558183e-06, + "loss": 0.7808, + "step": 38398 + }, + { + "epoch": 0.98, + "learning_rate": 1.569138066165106e-06, + "loss": 0.8125, + "step": 38399 + }, + { + "epoch": 0.98, + "learning_rate": 1.5691153141386303e-06, + "loss": 0.7686, + "step": 38400 + }, + { + "epoch": 0.98, + "learning_rate": 1.5690925616764095e-06, + "loss": 0.6494, + "step": 38401 + }, + { + "epoch": 0.98, + "learning_rate": 1.5690698087784609e-06, + "loss": 1.0742, + "step": 38402 + }, + { + "epoch": 0.98, + "learning_rate": 1.5690470554448014e-06, + "loss": 0.5983, + "step": 38403 + }, + { + "epoch": 0.98, + "learning_rate": 1.5690243016754487e-06, + "loss": 0.9248, + "step": 38404 + }, + { + "epoch": 0.98, + "learning_rate": 1.5690015474704204e-06, + "loss": 0.9082, + "step": 38405 + }, + { + "epoch": 0.98, + "learning_rate": 1.5689787928297339e-06, + "loss": 0.7773, + "step": 38406 + }, + { + "epoch": 0.98, + "learning_rate": 1.5689560377534062e-06, + "loss": 0.8423, + "step": 38407 + }, + { + "epoch": 0.98, + "learning_rate": 1.5689332822414552e-06, + "loss": 0.9365, + "step": 38408 + }, + { + "epoch": 0.98, + "learning_rate": 1.568910526293898e-06, + "loss": 0.7803, + "step": 38409 + }, + { + "epoch": 0.98, + "learning_rate": 1.5688877699107524e-06, + "loss": 0.7271, + "step": 38410 + }, + { + "epoch": 0.98, + "learning_rate": 1.5688650130920354e-06, + "loss": 0.915, + "step": 38411 + }, + { + "epoch": 0.98, + "learning_rate": 1.5688422558377647e-06, + "loss": 0.998, + "step": 38412 + }, + { + "epoch": 0.98, + "learning_rate": 1.568819498147958e-06, + "loss": 1.001, + "step": 38413 + }, + { + "epoch": 0.98, + "learning_rate": 1.5687967400226318e-06, + "loss": 0.812, + "step": 38414 + }, + { + "epoch": 0.98, + "learning_rate": 1.5687739814618041e-06, + "loss": 0.9219, + "step": 38415 + }, + { + "epoch": 0.98, + "learning_rate": 1.5687512224654927e-06, + "loss": 0.8408, + "step": 38416 + }, + { + "epoch": 0.98, + "learning_rate": 1.5687284630337146e-06, + "loss": 0.7715, + "step": 38417 + }, + { + "epoch": 0.98, + "learning_rate": 1.568705703166487e-06, + "loss": 0.7324, + "step": 38418 + }, + { + "epoch": 0.98, + "learning_rate": 1.5686829428638278e-06, + "loss": 0.9561, + "step": 38419 + }, + { + "epoch": 0.98, + "learning_rate": 1.568660182125754e-06, + "loss": 0.7686, + "step": 38420 + }, + { + "epoch": 0.98, + "learning_rate": 1.5686374209522835e-06, + "loss": 0.9678, + "step": 38421 + }, + { + "epoch": 0.98, + "learning_rate": 1.5686146593434333e-06, + "loss": 0.8633, + "step": 38422 + }, + { + "epoch": 0.98, + "learning_rate": 1.568591897299221e-06, + "loss": 0.9053, + "step": 38423 + }, + { + "epoch": 0.98, + "learning_rate": 1.568569134819664e-06, + "loss": 0.7866, + "step": 38424 + }, + { + "epoch": 0.98, + "learning_rate": 1.5685463719047797e-06, + "loss": 0.7466, + "step": 38425 + }, + { + "epoch": 0.98, + "learning_rate": 1.568523608554586e-06, + "loss": 0.8428, + "step": 38426 + }, + { + "epoch": 0.98, + "learning_rate": 1.5685008447690998e-06, + "loss": 0.7251, + "step": 38427 + }, + { + "epoch": 0.98, + "learning_rate": 1.5684780805483384e-06, + "loss": 1.2061, + "step": 38428 + }, + { + "epoch": 0.98, + "learning_rate": 1.5684553158923195e-06, + "loss": 0.8682, + "step": 38429 + }, + { + "epoch": 0.98, + "learning_rate": 1.5684325508010602e-06, + "loss": 0.7432, + "step": 38430 + }, + { + "epoch": 0.99, + "learning_rate": 1.5684097852745788e-06, + "loss": 0.9199, + "step": 38431 + }, + { + "epoch": 0.99, + "learning_rate": 1.568387019312892e-06, + "loss": 0.8911, + "step": 38432 + }, + { + "epoch": 0.99, + "learning_rate": 1.5683642529160172e-06, + "loss": 0.8652, + "step": 38433 + }, + { + "epoch": 0.99, + "learning_rate": 1.5683414860839723e-06, + "loss": 0.875, + "step": 38434 + }, + { + "epoch": 0.99, + "learning_rate": 1.5683187188167744e-06, + "loss": 0.8047, + "step": 38435 + }, + { + "epoch": 0.99, + "learning_rate": 1.5682959511144408e-06, + "loss": 0.6816, + "step": 38436 + }, + { + "epoch": 0.99, + "learning_rate": 1.5682731829769896e-06, + "loss": 0.7412, + "step": 38437 + }, + { + "epoch": 0.99, + "learning_rate": 1.5682504144044373e-06, + "loss": 1.0732, + "step": 38438 + }, + { + "epoch": 0.99, + "learning_rate": 1.5682276453968018e-06, + "loss": 0.8916, + "step": 38439 + }, + { + "epoch": 0.99, + "learning_rate": 1.5682048759541005e-06, + "loss": 0.9248, + "step": 38440 + }, + { + "epoch": 0.99, + "learning_rate": 1.5681821060763509e-06, + "loss": 0.748, + "step": 38441 + }, + { + "epoch": 0.99, + "learning_rate": 1.5681593357635708e-06, + "loss": 0.7773, + "step": 38442 + }, + { + "epoch": 0.99, + "learning_rate": 1.5681365650157767e-06, + "loss": 0.8599, + "step": 38443 + }, + { + "epoch": 0.99, + "learning_rate": 1.5681137938329866e-06, + "loss": 1.085, + "step": 38444 + }, + { + "epoch": 0.99, + "learning_rate": 1.5680910222152178e-06, + "loss": 0.9639, + "step": 38445 + }, + { + "epoch": 0.99, + "learning_rate": 1.5680682501624883e-06, + "loss": 0.8867, + "step": 38446 + }, + { + "epoch": 0.99, + "learning_rate": 1.5680454776748148e-06, + "loss": 0.6777, + "step": 38447 + }, + { + "epoch": 0.99, + "learning_rate": 1.568022704752215e-06, + "loss": 0.8232, + "step": 38448 + }, + { + "epoch": 0.99, + "learning_rate": 1.5679999313947063e-06, + "loss": 1.0078, + "step": 38449 + }, + { + "epoch": 0.99, + "learning_rate": 1.5679771576023062e-06, + "loss": 0.6704, + "step": 38450 + }, + { + "epoch": 0.99, + "learning_rate": 1.567954383375032e-06, + "loss": 0.6611, + "step": 38451 + }, + { + "epoch": 0.99, + "learning_rate": 1.5679316087129016e-06, + "loss": 0.835, + "step": 38452 + }, + { + "epoch": 0.99, + "learning_rate": 1.5679088336159319e-06, + "loss": 0.6758, + "step": 38453 + }, + { + "epoch": 0.99, + "learning_rate": 1.5678860580841401e-06, + "loss": 0.9824, + "step": 38454 + }, + { + "epoch": 0.99, + "learning_rate": 1.5678632821175445e-06, + "loss": 0.7949, + "step": 38455 + }, + { + "epoch": 0.99, + "learning_rate": 1.567840505716162e-06, + "loss": 0.9229, + "step": 38456 + }, + { + "epoch": 0.99, + "learning_rate": 1.5678177288800103e-06, + "loss": 0.9492, + "step": 38457 + }, + { + "epoch": 0.99, + "learning_rate": 1.5677949516091065e-06, + "loss": 0.6704, + "step": 38458 + }, + { + "epoch": 0.99, + "learning_rate": 1.5677721739034682e-06, + "loss": 0.9639, + "step": 38459 + }, + { + "epoch": 0.99, + "learning_rate": 1.567749395763113e-06, + "loss": 0.9395, + "step": 38460 + }, + { + "epoch": 0.99, + "learning_rate": 1.567726617188058e-06, + "loss": 0.75, + "step": 38461 + }, + { + "epoch": 0.99, + "learning_rate": 1.567703838178321e-06, + "loss": 0.8057, + "step": 38462 + }, + { + "epoch": 0.99, + "learning_rate": 1.567681058733919e-06, + "loss": 0.8916, + "step": 38463 + }, + { + "epoch": 0.99, + "learning_rate": 1.56765827885487e-06, + "loss": 0.8091, + "step": 38464 + }, + { + "epoch": 0.99, + "learning_rate": 1.567635498541191e-06, + "loss": 0.7349, + "step": 38465 + }, + { + "epoch": 0.99, + "learning_rate": 1.5676127177928998e-06, + "loss": 0.8496, + "step": 38466 + }, + { + "epoch": 0.99, + "learning_rate": 1.5675899366100134e-06, + "loss": 0.8447, + "step": 38467 + }, + { + "epoch": 0.99, + "learning_rate": 1.5675671549925495e-06, + "loss": 0.877, + "step": 38468 + }, + { + "epoch": 0.99, + "learning_rate": 1.5675443729405257e-06, + "loss": 0.8203, + "step": 38469 + }, + { + "epoch": 0.99, + "learning_rate": 1.5675215904539593e-06, + "loss": 0.5381, + "step": 38470 + }, + { + "epoch": 0.99, + "learning_rate": 1.5674988075328674e-06, + "loss": 0.8047, + "step": 38471 + }, + { + "epoch": 0.99, + "learning_rate": 1.567476024177268e-06, + "loss": 0.8779, + "step": 38472 + }, + { + "epoch": 0.99, + "learning_rate": 1.5674532403871781e-06, + "loss": 0.792, + "step": 38473 + }, + { + "epoch": 0.99, + "learning_rate": 1.5674304561626155e-06, + "loss": 0.8223, + "step": 38474 + }, + { + "epoch": 0.99, + "learning_rate": 1.5674076715035975e-06, + "loss": 0.6729, + "step": 38475 + }, + { + "epoch": 0.99, + "learning_rate": 1.5673848864101417e-06, + "loss": 1.0166, + "step": 38476 + }, + { + "epoch": 0.99, + "learning_rate": 1.5673621008822653e-06, + "loss": 0.9136, + "step": 38477 + }, + { + "epoch": 0.99, + "learning_rate": 1.5673393149199857e-06, + "loss": 0.8896, + "step": 38478 + }, + { + "epoch": 0.99, + "learning_rate": 1.5673165285233205e-06, + "loss": 0.6567, + "step": 38479 + }, + { + "epoch": 0.99, + "learning_rate": 1.5672937416922869e-06, + "loss": 0.9805, + "step": 38480 + }, + { + "epoch": 0.99, + "learning_rate": 1.567270954426903e-06, + "loss": 0.9561, + "step": 38481 + }, + { + "epoch": 0.99, + "learning_rate": 1.5672481667271854e-06, + "loss": 0.9385, + "step": 38482 + }, + { + "epoch": 0.99, + "learning_rate": 1.5672253785931523e-06, + "loss": 0.9688, + "step": 38483 + }, + { + "epoch": 0.99, + "learning_rate": 1.5672025900248207e-06, + "loss": 1.0107, + "step": 38484 + }, + { + "epoch": 0.99, + "learning_rate": 1.5671798010222078e-06, + "loss": 0.8418, + "step": 38485 + }, + { + "epoch": 0.99, + "learning_rate": 1.5671570115853322e-06, + "loss": 0.7305, + "step": 38486 + }, + { + "epoch": 0.99, + "learning_rate": 1.5671342217142099e-06, + "loss": 0.9521, + "step": 38487 + }, + { + "epoch": 0.99, + "learning_rate": 1.5671114314088595e-06, + "loss": 0.792, + "step": 38488 + }, + { + "epoch": 0.99, + "learning_rate": 1.5670886406692976e-06, + "loss": 0.5576, + "step": 38489 + }, + { + "epoch": 0.99, + "learning_rate": 1.5670658494955417e-06, + "loss": 0.6206, + "step": 38490 + }, + { + "epoch": 0.99, + "learning_rate": 1.56704305788761e-06, + "loss": 0.8447, + "step": 38491 + }, + { + "epoch": 0.99, + "learning_rate": 1.5670202658455196e-06, + "loss": 1.0352, + "step": 38492 + }, + { + "epoch": 0.99, + "learning_rate": 1.5669974733692876e-06, + "loss": 0.769, + "step": 38493 + }, + { + "epoch": 0.99, + "learning_rate": 1.5669746804589316e-06, + "loss": 0.8105, + "step": 38494 + }, + { + "epoch": 0.99, + "learning_rate": 1.5669518871144694e-06, + "loss": 0.8545, + "step": 38495 + }, + { + "epoch": 0.99, + "learning_rate": 1.566929093335918e-06, + "loss": 0.8438, + "step": 38496 + }, + { + "epoch": 0.99, + "learning_rate": 1.5669062991232952e-06, + "loss": 0.791, + "step": 38497 + }, + { + "epoch": 0.99, + "learning_rate": 1.5668835044766185e-06, + "loss": 0.8018, + "step": 38498 + }, + { + "epoch": 0.99, + "learning_rate": 1.566860709395905e-06, + "loss": 0.8867, + "step": 38499 + }, + { + "epoch": 0.99, + "learning_rate": 1.5668379138811722e-06, + "loss": 0.8525, + "step": 38500 + }, + { + "epoch": 0.99, + "learning_rate": 1.5668151179324379e-06, + "loss": 0.7979, + "step": 38501 + }, + { + "epoch": 0.99, + "learning_rate": 1.5667923215497193e-06, + "loss": 0.9297, + "step": 38502 + }, + { + "epoch": 0.99, + "learning_rate": 1.5667695247330337e-06, + "loss": 0.8162, + "step": 38503 + }, + { + "epoch": 0.99, + "learning_rate": 1.566746727482399e-06, + "loss": 0.9038, + "step": 38504 + }, + { + "epoch": 0.99, + "learning_rate": 1.566723929797832e-06, + "loss": 0.8145, + "step": 38505 + }, + { + "epoch": 0.99, + "learning_rate": 1.5667011316793506e-06, + "loss": 0.8125, + "step": 38506 + }, + { + "epoch": 0.99, + "learning_rate": 1.5666783331269726e-06, + "loss": 0.791, + "step": 38507 + }, + { + "epoch": 0.99, + "learning_rate": 1.5666555341407149e-06, + "loss": 0.6934, + "step": 38508 + }, + { + "epoch": 0.99, + "learning_rate": 1.5666327347205948e-06, + "loss": 1.0039, + "step": 38509 + }, + { + "epoch": 0.99, + "learning_rate": 1.5666099348666303e-06, + "loss": 0.6226, + "step": 38510 + }, + { + "epoch": 0.99, + "learning_rate": 1.5665871345788387e-06, + "loss": 0.8145, + "step": 38511 + }, + { + "epoch": 0.99, + "learning_rate": 1.5665643338572374e-06, + "loss": 0.897, + "step": 38512 + }, + { + "epoch": 0.99, + "learning_rate": 1.5665415327018437e-06, + "loss": 0.9961, + "step": 38513 + }, + { + "epoch": 0.99, + "learning_rate": 1.566518731112675e-06, + "loss": 0.8848, + "step": 38514 + }, + { + "epoch": 0.99, + "learning_rate": 1.5664959290897492e-06, + "loss": 0.6782, + "step": 38515 + }, + { + "epoch": 0.99, + "learning_rate": 1.5664731266330837e-06, + "loss": 0.5479, + "step": 38516 + }, + { + "epoch": 0.99, + "learning_rate": 1.5664503237426955e-06, + "loss": 0.7451, + "step": 38517 + }, + { + "epoch": 0.99, + "learning_rate": 1.5664275204186024e-06, + "loss": 0.6167, + "step": 38518 + }, + { + "epoch": 0.99, + "learning_rate": 1.5664047166608218e-06, + "loss": 0.9746, + "step": 38519 + }, + { + "epoch": 0.99, + "learning_rate": 1.5663819124693714e-06, + "loss": 0.8147, + "step": 38520 + }, + { + "epoch": 0.99, + "learning_rate": 1.566359107844268e-06, + "loss": 0.96, + "step": 38521 + }, + { + "epoch": 0.99, + "learning_rate": 1.5663363027855296e-06, + "loss": 0.9385, + "step": 38522 + }, + { + "epoch": 0.99, + "learning_rate": 1.5663134972931736e-06, + "loss": 0.7959, + "step": 38523 + }, + { + "epoch": 0.99, + "learning_rate": 1.5662906913672175e-06, + "loss": 1.0303, + "step": 38524 + }, + { + "epoch": 0.99, + "learning_rate": 1.5662678850076786e-06, + "loss": 0.7432, + "step": 38525 + }, + { + "epoch": 0.99, + "learning_rate": 1.5662450782145742e-06, + "loss": 0.7871, + "step": 38526 + }, + { + "epoch": 0.99, + "learning_rate": 1.5662222709879225e-06, + "loss": 0.9814, + "step": 38527 + }, + { + "epoch": 0.99, + "learning_rate": 1.5661994633277397e-06, + "loss": 0.8848, + "step": 38528 + }, + { + "epoch": 0.99, + "learning_rate": 1.5661766552340446e-06, + "loss": 0.8477, + "step": 38529 + }, + { + "epoch": 0.99, + "learning_rate": 1.5661538467068539e-06, + "loss": 0.877, + "step": 38530 + }, + { + "epoch": 0.99, + "learning_rate": 1.5661310377461852e-06, + "loss": 0.6816, + "step": 38531 + }, + { + "epoch": 0.99, + "learning_rate": 1.5661082283520558e-06, + "loss": 0.9775, + "step": 38532 + }, + { + "epoch": 0.99, + "learning_rate": 1.5660854185244836e-06, + "loss": 0.7456, + "step": 38533 + }, + { + "epoch": 0.99, + "learning_rate": 1.5660626082634857e-06, + "loss": 0.8359, + "step": 38534 + }, + { + "epoch": 0.99, + "learning_rate": 1.5660397975690797e-06, + "loss": 0.7119, + "step": 38535 + }, + { + "epoch": 0.99, + "learning_rate": 1.5660169864412831e-06, + "loss": 0.791, + "step": 38536 + }, + { + "epoch": 0.99, + "learning_rate": 1.5659941748801136e-06, + "loss": 0.998, + "step": 38537 + }, + { + "epoch": 0.99, + "learning_rate": 1.565971362885588e-06, + "loss": 0.7549, + "step": 38538 + }, + { + "epoch": 0.99, + "learning_rate": 1.5659485504577244e-06, + "loss": 0.7295, + "step": 38539 + }, + { + "epoch": 0.99, + "learning_rate": 1.5659257375965399e-06, + "loss": 0.6475, + "step": 38540 + }, + { + "epoch": 0.99, + "learning_rate": 1.5659029243020519e-06, + "loss": 0.8608, + "step": 38541 + }, + { + "epoch": 0.99, + "learning_rate": 1.5658801105742784e-06, + "loss": 0.6169, + "step": 38542 + }, + { + "epoch": 0.99, + "learning_rate": 1.5658572964132363e-06, + "loss": 0.7083, + "step": 38543 + }, + { + "epoch": 0.99, + "learning_rate": 1.5658344818189432e-06, + "loss": 0.9756, + "step": 38544 + }, + { + "epoch": 0.99, + "learning_rate": 1.5658116667914168e-06, + "loss": 0.7803, + "step": 38545 + }, + { + "epoch": 0.99, + "learning_rate": 1.5657888513306743e-06, + "loss": 0.793, + "step": 38546 + }, + { + "epoch": 0.99, + "learning_rate": 1.5657660354367334e-06, + "loss": 0.9854, + "step": 38547 + }, + { + "epoch": 0.99, + "learning_rate": 1.5657432191096116e-06, + "loss": 1.0713, + "step": 38548 + }, + { + "epoch": 0.99, + "learning_rate": 1.565720402349326e-06, + "loss": 0.9355, + "step": 38549 + }, + { + "epoch": 0.99, + "learning_rate": 1.5656975851558944e-06, + "loss": 0.8467, + "step": 38550 + }, + { + "epoch": 0.99, + "learning_rate": 1.5656747675293343e-06, + "loss": 0.9287, + "step": 38551 + }, + { + "epoch": 0.99, + "learning_rate": 1.5656519494696628e-06, + "loss": 0.8145, + "step": 38552 + }, + { + "epoch": 0.99, + "learning_rate": 1.5656291309768976e-06, + "loss": 1.1738, + "step": 38553 + }, + { + "epoch": 0.99, + "learning_rate": 1.5656063120510563e-06, + "loss": 0.9355, + "step": 38554 + }, + { + "epoch": 0.99, + "learning_rate": 1.5655834926921565e-06, + "loss": 0.8701, + "step": 38555 + }, + { + "epoch": 0.99, + "learning_rate": 1.5655606729002151e-06, + "loss": 0.5642, + "step": 38556 + }, + { + "epoch": 0.99, + "learning_rate": 1.5655378526752498e-06, + "loss": 0.7852, + "step": 38557 + }, + { + "epoch": 0.99, + "learning_rate": 1.5655150320172786e-06, + "loss": 0.7529, + "step": 38558 + }, + { + "epoch": 0.99, + "learning_rate": 1.565492210926318e-06, + "loss": 0.6914, + "step": 38559 + }, + { + "epoch": 0.99, + "learning_rate": 1.5654693894023865e-06, + "loss": 0.8389, + "step": 38560 + }, + { + "epoch": 0.99, + "learning_rate": 1.565446567445501e-06, + "loss": 0.7822, + "step": 38561 + }, + { + "epoch": 0.99, + "learning_rate": 1.5654237450556788e-06, + "loss": 0.8389, + "step": 38562 + }, + { + "epoch": 0.99, + "learning_rate": 1.565400922232938e-06, + "loss": 0.6885, + "step": 38563 + }, + { + "epoch": 0.99, + "learning_rate": 1.565378098977295e-06, + "loss": 1.1318, + "step": 38564 + }, + { + "epoch": 0.99, + "learning_rate": 1.565355275288769e-06, + "loss": 0.8184, + "step": 38565 + }, + { + "epoch": 0.99, + "learning_rate": 1.565332451167376e-06, + "loss": 1.0, + "step": 38566 + }, + { + "epoch": 0.99, + "learning_rate": 1.5653096266131337e-06, + "loss": 0.9111, + "step": 38567 + }, + { + "epoch": 0.99, + "learning_rate": 1.56528680162606e-06, + "loss": 0.9062, + "step": 38568 + }, + { + "epoch": 0.99, + "learning_rate": 1.5652639762061721e-06, + "loss": 0.8721, + "step": 38569 + }, + { + "epoch": 0.99, + "learning_rate": 1.5652411503534876e-06, + "loss": 0.7454, + "step": 38570 + }, + { + "epoch": 0.99, + "learning_rate": 1.5652183240680242e-06, + "loss": 0.8018, + "step": 38571 + }, + { + "epoch": 0.99, + "learning_rate": 1.565195497349799e-06, + "loss": 0.9316, + "step": 38572 + }, + { + "epoch": 0.99, + "learning_rate": 1.5651726701988292e-06, + "loss": 0.7725, + "step": 38573 + }, + { + "epoch": 0.99, + "learning_rate": 1.5651498426151331e-06, + "loss": 0.8408, + "step": 38574 + }, + { + "epoch": 0.99, + "learning_rate": 1.5651270145987276e-06, + "loss": 0.9658, + "step": 38575 + }, + { + "epoch": 0.99, + "learning_rate": 1.5651041861496305e-06, + "loss": 0.6729, + "step": 38576 + }, + { + "epoch": 0.99, + "learning_rate": 1.565081357267859e-06, + "loss": 0.8584, + "step": 38577 + }, + { + "epoch": 0.99, + "learning_rate": 1.5650585279534307e-06, + "loss": 0.8115, + "step": 38578 + }, + { + "epoch": 0.99, + "learning_rate": 1.5650356982063628e-06, + "loss": 0.9619, + "step": 38579 + }, + { + "epoch": 0.99, + "learning_rate": 1.5650128680266734e-06, + "loss": 0.9727, + "step": 38580 + }, + { + "epoch": 0.99, + "learning_rate": 1.5649900374143793e-06, + "loss": 0.7705, + "step": 38581 + }, + { + "epoch": 0.99, + "learning_rate": 1.5649672063694987e-06, + "loss": 0.8799, + "step": 38582 + }, + { + "epoch": 0.99, + "learning_rate": 1.5649443748920486e-06, + "loss": 0.7278, + "step": 38583 + }, + { + "epoch": 0.99, + "learning_rate": 1.5649215429820464e-06, + "loss": 0.6978, + "step": 38584 + }, + { + "epoch": 0.99, + "learning_rate": 1.5648987106395097e-06, + "loss": 0.8701, + "step": 38585 + }, + { + "epoch": 0.99, + "learning_rate": 1.5648758778644563e-06, + "loss": 1.0361, + "step": 38586 + }, + { + "epoch": 0.99, + "learning_rate": 1.5648530446569032e-06, + "loss": 0.8779, + "step": 38587 + }, + { + "epoch": 0.99, + "learning_rate": 1.564830211016868e-06, + "loss": 0.7095, + "step": 38588 + }, + { + "epoch": 0.99, + "learning_rate": 1.5648073769443686e-06, + "loss": 0.7334, + "step": 38589 + }, + { + "epoch": 0.99, + "learning_rate": 1.564784542439422e-06, + "loss": 0.9375, + "step": 38590 + }, + { + "epoch": 0.99, + "learning_rate": 1.564761707502046e-06, + "loss": 1.0703, + "step": 38591 + }, + { + "epoch": 0.99, + "learning_rate": 1.5647388721322576e-06, + "loss": 0.4651, + "step": 38592 + }, + { + "epoch": 0.99, + "learning_rate": 1.564716036330075e-06, + "loss": 0.7324, + "step": 38593 + }, + { + "epoch": 0.99, + "learning_rate": 1.564693200095515e-06, + "loss": 1.083, + "step": 38594 + }, + { + "epoch": 0.99, + "learning_rate": 1.5646703634285953e-06, + "loss": 1.0703, + "step": 38595 + }, + { + "epoch": 0.99, + "learning_rate": 1.5646475263293337e-06, + "loss": 0.874, + "step": 38596 + }, + { + "epoch": 0.99, + "learning_rate": 1.5646246887977475e-06, + "loss": 0.8667, + "step": 38597 + }, + { + "epoch": 0.99, + "learning_rate": 1.5646018508338541e-06, + "loss": 0.9277, + "step": 38598 + }, + { + "epoch": 0.99, + "learning_rate": 1.564579012437671e-06, + "loss": 0.7305, + "step": 38599 + }, + { + "epoch": 0.99, + "learning_rate": 1.5645561736092155e-06, + "loss": 0.9014, + "step": 38600 + }, + { + "epoch": 0.99, + "learning_rate": 1.5645333343485056e-06, + "loss": 0.8291, + "step": 38601 + }, + { + "epoch": 0.99, + "learning_rate": 1.5645104946555581e-06, + "loss": 1.0498, + "step": 38602 + }, + { + "epoch": 0.99, + "learning_rate": 1.5644876545303914e-06, + "loss": 0.9238, + "step": 38603 + }, + { + "epoch": 0.99, + "learning_rate": 1.5644648139730219e-06, + "loss": 1.0674, + "step": 38604 + }, + { + "epoch": 0.99, + "learning_rate": 1.564441972983468e-06, + "loss": 0.8564, + "step": 38605 + }, + { + "epoch": 0.99, + "learning_rate": 1.5644191315617468e-06, + "loss": 0.7646, + "step": 38606 + }, + { + "epoch": 0.99, + "learning_rate": 1.5643962897078758e-06, + "loss": 0.6841, + "step": 38607 + }, + { + "epoch": 0.99, + "learning_rate": 1.5643734474218723e-06, + "loss": 0.8428, + "step": 38608 + }, + { + "epoch": 0.99, + "learning_rate": 1.5643506047037543e-06, + "loss": 0.9023, + "step": 38609 + }, + { + "epoch": 0.99, + "learning_rate": 1.5643277615535388e-06, + "loss": 0.8037, + "step": 38610 + }, + { + "epoch": 0.99, + "learning_rate": 1.5643049179712437e-06, + "loss": 0.7842, + "step": 38611 + }, + { + "epoch": 0.99, + "learning_rate": 1.5642820739568862e-06, + "loss": 0.8428, + "step": 38612 + }, + { + "epoch": 0.99, + "learning_rate": 1.5642592295104837e-06, + "loss": 0.731, + "step": 38613 + }, + { + "epoch": 0.99, + "learning_rate": 1.564236384632054e-06, + "loss": 0.8984, + "step": 38614 + }, + { + "epoch": 0.99, + "learning_rate": 1.5642135393216143e-06, + "loss": 0.8975, + "step": 38615 + }, + { + "epoch": 0.99, + "learning_rate": 1.5641906935791825e-06, + "loss": 0.7798, + "step": 38616 + }, + { + "epoch": 0.99, + "learning_rate": 1.5641678474047754e-06, + "loss": 0.7871, + "step": 38617 + }, + { + "epoch": 0.99, + "learning_rate": 1.5641450007984113e-06, + "loss": 0.7349, + "step": 38618 + }, + { + "epoch": 0.99, + "learning_rate": 1.5641221537601072e-06, + "loss": 0.8594, + "step": 38619 + }, + { + "epoch": 0.99, + "learning_rate": 1.5640993062898807e-06, + "loss": 0.9258, + "step": 38620 + }, + { + "epoch": 0.99, + "learning_rate": 1.5640764583877496e-06, + "loss": 0.9033, + "step": 38621 + }, + { + "epoch": 0.99, + "learning_rate": 1.5640536100537305e-06, + "loss": 0.5669, + "step": 38622 + }, + { + "epoch": 0.99, + "learning_rate": 1.5640307612878418e-06, + "loss": 0.7725, + "step": 38623 + }, + { + "epoch": 0.99, + "learning_rate": 1.5640079120901009e-06, + "loss": 0.7568, + "step": 38624 + }, + { + "epoch": 0.99, + "learning_rate": 1.5639850624605246e-06, + "loss": 0.4331, + "step": 38625 + }, + { + "epoch": 0.99, + "learning_rate": 1.5639622123991311e-06, + "loss": 0.876, + "step": 38626 + }, + { + "epoch": 0.99, + "learning_rate": 1.5639393619059377e-06, + "loss": 0.8037, + "step": 38627 + }, + { + "epoch": 0.99, + "learning_rate": 1.5639165109809617e-06, + "loss": 0.8423, + "step": 38628 + }, + { + "epoch": 0.99, + "learning_rate": 1.5638936596242209e-06, + "loss": 0.7329, + "step": 38629 + }, + { + "epoch": 0.99, + "learning_rate": 1.5638708078357325e-06, + "loss": 0.731, + "step": 38630 + }, + { + "epoch": 0.99, + "learning_rate": 1.5638479556155147e-06, + "loss": 0.8359, + "step": 38631 + }, + { + "epoch": 0.99, + "learning_rate": 1.5638251029635838e-06, + "loss": 0.6528, + "step": 38632 + }, + { + "epoch": 0.99, + "learning_rate": 1.5638022498799584e-06, + "loss": 0.7837, + "step": 38633 + }, + { + "epoch": 0.99, + "learning_rate": 1.563779396364655e-06, + "loss": 0.7617, + "step": 38634 + }, + { + "epoch": 0.99, + "learning_rate": 1.5637565424176921e-06, + "loss": 0.9209, + "step": 38635 + }, + { + "epoch": 0.99, + "learning_rate": 1.5637336880390867e-06, + "loss": 0.6646, + "step": 38636 + }, + { + "epoch": 0.99, + "learning_rate": 1.5637108332288562e-06, + "loss": 0.9062, + "step": 38637 + }, + { + "epoch": 0.99, + "learning_rate": 1.5636879779870183e-06, + "loss": 0.7021, + "step": 38638 + }, + { + "epoch": 0.99, + "learning_rate": 1.5636651223135903e-06, + "loss": 0.7568, + "step": 38639 + }, + { + "epoch": 0.99, + "learning_rate": 1.5636422662085899e-06, + "loss": 0.6958, + "step": 38640 + }, + { + "epoch": 0.99, + "learning_rate": 1.563619409672035e-06, + "loss": 0.9609, + "step": 38641 + }, + { + "epoch": 0.99, + "learning_rate": 1.5635965527039421e-06, + "loss": 0.8262, + "step": 38642 + }, + { + "epoch": 0.99, + "learning_rate": 1.5635736953043293e-06, + "loss": 0.8447, + "step": 38643 + }, + { + "epoch": 0.99, + "learning_rate": 1.563550837473214e-06, + "loss": 0.7207, + "step": 38644 + }, + { + "epoch": 0.99, + "learning_rate": 1.5635279792106138e-06, + "loss": 0.877, + "step": 38645 + }, + { + "epoch": 0.99, + "learning_rate": 1.5635051205165462e-06, + "loss": 0.8447, + "step": 38646 + }, + { + "epoch": 0.99, + "learning_rate": 1.5634822613910286e-06, + "loss": 0.9287, + "step": 38647 + }, + { + "epoch": 0.99, + "learning_rate": 1.5634594018340784e-06, + "loss": 0.8906, + "step": 38648 + }, + { + "epoch": 0.99, + "learning_rate": 1.5634365418457133e-06, + "loss": 0.8027, + "step": 38649 + }, + { + "epoch": 0.99, + "learning_rate": 1.563413681425951e-06, + "loss": 0.9658, + "step": 38650 + }, + { + "epoch": 0.99, + "learning_rate": 1.5633908205748085e-06, + "loss": 0.7349, + "step": 38651 + }, + { + "epoch": 0.99, + "learning_rate": 1.5633679592923037e-06, + "loss": 0.8359, + "step": 38652 + }, + { + "epoch": 0.99, + "learning_rate": 1.563345097578454e-06, + "loss": 0.7441, + "step": 38653 + }, + { + "epoch": 0.99, + "learning_rate": 1.5633222354332766e-06, + "loss": 0.9053, + "step": 38654 + }, + { + "epoch": 0.99, + "learning_rate": 1.5632993728567895e-06, + "loss": 1.0596, + "step": 38655 + }, + { + "epoch": 0.99, + "learning_rate": 1.5632765098490099e-06, + "loss": 0.9072, + "step": 38656 + }, + { + "epoch": 0.99, + "learning_rate": 1.5632536464099552e-06, + "loss": 0.9189, + "step": 38657 + }, + { + "epoch": 0.99, + "learning_rate": 1.5632307825396434e-06, + "loss": 0.7476, + "step": 38658 + }, + { + "epoch": 0.99, + "learning_rate": 1.5632079182380915e-06, + "loss": 0.751, + "step": 38659 + }, + { + "epoch": 0.99, + "learning_rate": 1.5631850535053172e-06, + "loss": 0.7214, + "step": 38660 + }, + { + "epoch": 0.99, + "learning_rate": 1.5631621883413382e-06, + "loss": 0.7881, + "step": 38661 + }, + { + "epoch": 0.99, + "learning_rate": 1.5631393227461715e-06, + "loss": 0.8369, + "step": 38662 + }, + { + "epoch": 0.99, + "learning_rate": 1.5631164567198352e-06, + "loss": 0.79, + "step": 38663 + }, + { + "epoch": 0.99, + "learning_rate": 1.5630935902623464e-06, + "loss": 0.8447, + "step": 38664 + }, + { + "epoch": 0.99, + "learning_rate": 1.5630707233737223e-06, + "loss": 0.8276, + "step": 38665 + }, + { + "epoch": 0.99, + "learning_rate": 1.5630478560539815e-06, + "loss": 0.7627, + "step": 38666 + }, + { + "epoch": 0.99, + "learning_rate": 1.5630249883031405e-06, + "loss": 0.8164, + "step": 38667 + }, + { + "epoch": 0.99, + "learning_rate": 1.5630021201212174e-06, + "loss": 0.8584, + "step": 38668 + }, + { + "epoch": 0.99, + "learning_rate": 1.5629792515082292e-06, + "loss": 0.5271, + "step": 38669 + }, + { + "epoch": 0.99, + "learning_rate": 1.5629563824641938e-06, + "loss": 0.7173, + "step": 38670 + }, + { + "epoch": 0.99, + "learning_rate": 1.5629335129891286e-06, + "loss": 0.7891, + "step": 38671 + }, + { + "epoch": 0.99, + "learning_rate": 1.562910643083051e-06, + "loss": 0.8398, + "step": 38672 + }, + { + "epoch": 0.99, + "learning_rate": 1.5628877727459785e-06, + "loss": 1.1045, + "step": 38673 + }, + { + "epoch": 0.99, + "learning_rate": 1.562864901977929e-06, + "loss": 0.7649, + "step": 38674 + }, + { + "epoch": 0.99, + "learning_rate": 1.5628420307789195e-06, + "loss": 0.9004, + "step": 38675 + }, + { + "epoch": 0.99, + "learning_rate": 1.5628191591489681e-06, + "loss": 0.5166, + "step": 38676 + }, + { + "epoch": 0.99, + "learning_rate": 1.5627962870880915e-06, + "loss": 0.8125, + "step": 38677 + }, + { + "epoch": 0.99, + "learning_rate": 1.5627734145963078e-06, + "loss": 0.7144, + "step": 38678 + }, + { + "epoch": 0.99, + "learning_rate": 1.5627505416736347e-06, + "loss": 1.0791, + "step": 38679 + }, + { + "epoch": 0.99, + "learning_rate": 1.562727668320089e-06, + "loss": 0.79, + "step": 38680 + }, + { + "epoch": 0.99, + "learning_rate": 1.5627047945356887e-06, + "loss": 0.7173, + "step": 38681 + }, + { + "epoch": 0.99, + "learning_rate": 1.5626819203204513e-06, + "loss": 0.627, + "step": 38682 + }, + { + "epoch": 0.99, + "learning_rate": 1.562659045674394e-06, + "loss": 0.7139, + "step": 38683 + }, + { + "epoch": 0.99, + "learning_rate": 1.5626361705975345e-06, + "loss": 0.6406, + "step": 38684 + }, + { + "epoch": 0.99, + "learning_rate": 1.5626132950898907e-06, + "loss": 0.7495, + "step": 38685 + }, + { + "epoch": 0.99, + "learning_rate": 1.5625904191514797e-06, + "loss": 0.6714, + "step": 38686 + }, + { + "epoch": 0.99, + "learning_rate": 1.562567542782319e-06, + "loss": 0.8164, + "step": 38687 + }, + { + "epoch": 0.99, + "learning_rate": 1.5625446659824265e-06, + "loss": 0.7549, + "step": 38688 + }, + { + "epoch": 0.99, + "learning_rate": 1.5625217887518187e-06, + "loss": 0.4487, + "step": 38689 + }, + { + "epoch": 0.99, + "learning_rate": 1.5624989110905142e-06, + "loss": 0.8867, + "step": 38690 + }, + { + "epoch": 0.99, + "learning_rate": 1.5624760329985302e-06, + "loss": 0.7119, + "step": 38691 + }, + { + "epoch": 0.99, + "learning_rate": 1.5624531544758843e-06, + "loss": 1.0234, + "step": 38692 + }, + { + "epoch": 0.99, + "learning_rate": 1.5624302755225938e-06, + "loss": 0.8887, + "step": 38693 + }, + { + "epoch": 0.99, + "learning_rate": 1.562407396138676e-06, + "loss": 0.9521, + "step": 38694 + }, + { + "epoch": 0.99, + "learning_rate": 1.562384516324149e-06, + "loss": 0.8428, + "step": 38695 + }, + { + "epoch": 0.99, + "learning_rate": 1.5623616360790301e-06, + "loss": 0.7524, + "step": 38696 + }, + { + "epoch": 0.99, + "learning_rate": 1.5623387554033367e-06, + "loss": 1.0088, + "step": 38697 + }, + { + "epoch": 0.99, + "learning_rate": 1.5623158742970863e-06, + "loss": 0.9414, + "step": 38698 + }, + { + "epoch": 0.99, + "learning_rate": 1.5622929927602964e-06, + "loss": 0.7744, + "step": 38699 + }, + { + "epoch": 0.99, + "learning_rate": 1.5622701107929847e-06, + "loss": 0.7305, + "step": 38700 + }, + { + "epoch": 0.99, + "learning_rate": 1.5622472283951689e-06, + "loss": 0.7524, + "step": 38701 + }, + { + "epoch": 0.99, + "learning_rate": 1.5622243455668657e-06, + "loss": 0.8027, + "step": 38702 + }, + { + "epoch": 0.99, + "learning_rate": 1.5622014623080937e-06, + "loss": 0.8994, + "step": 38703 + }, + { + "epoch": 0.99, + "learning_rate": 1.5621785786188694e-06, + "loss": 0.7646, + "step": 38704 + }, + { + "epoch": 0.99, + "learning_rate": 1.5621556944992112e-06, + "loss": 0.4609, + "step": 38705 + }, + { + "epoch": 0.99, + "learning_rate": 1.5621328099491361e-06, + "loss": 0.6516, + "step": 38706 + }, + { + "epoch": 0.99, + "learning_rate": 1.562109924968662e-06, + "loss": 0.6338, + "step": 38707 + }, + { + "epoch": 0.99, + "learning_rate": 1.5620870395578059e-06, + "loss": 0.8477, + "step": 38708 + }, + { + "epoch": 0.99, + "learning_rate": 1.5620641537165856e-06, + "loss": 0.8535, + "step": 38709 + }, + { + "epoch": 0.99, + "learning_rate": 1.5620412674450185e-06, + "loss": 0.8491, + "step": 38710 + }, + { + "epoch": 0.99, + "learning_rate": 1.5620183807431223e-06, + "loss": 0.9043, + "step": 38711 + }, + { + "epoch": 0.99, + "learning_rate": 1.5619954936109148e-06, + "loss": 0.8306, + "step": 38712 + }, + { + "epoch": 0.99, + "learning_rate": 1.561972606048413e-06, + "loss": 0.7793, + "step": 38713 + }, + { + "epoch": 0.99, + "learning_rate": 1.5619497180556346e-06, + "loss": 0.8682, + "step": 38714 + }, + { + "epoch": 0.99, + "learning_rate": 1.5619268296325969e-06, + "loss": 0.8091, + "step": 38715 + }, + { + "epoch": 0.99, + "learning_rate": 1.5619039407793179e-06, + "loss": 0.8018, + "step": 38716 + }, + { + "epoch": 0.99, + "learning_rate": 1.561881051495815e-06, + "loss": 0.8613, + "step": 38717 + }, + { + "epoch": 0.99, + "learning_rate": 1.5618581617821053e-06, + "loss": 0.7745, + "step": 38718 + }, + { + "epoch": 0.99, + "learning_rate": 1.5618352716382069e-06, + "loss": 0.668, + "step": 38719 + }, + { + "epoch": 0.99, + "learning_rate": 1.561812381064137e-06, + "loss": 0.6682, + "step": 38720 + }, + { + "epoch": 0.99, + "learning_rate": 1.5617894900599134e-06, + "loss": 0.7769, + "step": 38721 + }, + { + "epoch": 0.99, + "learning_rate": 1.561766598625553e-06, + "loss": 1.0215, + "step": 38722 + }, + { + "epoch": 0.99, + "learning_rate": 1.5617437067610739e-06, + "loss": 0.8613, + "step": 38723 + }, + { + "epoch": 0.99, + "learning_rate": 1.5617208144664936e-06, + "loss": 0.6887, + "step": 38724 + }, + { + "epoch": 0.99, + "learning_rate": 1.5616979217418295e-06, + "loss": 0.8271, + "step": 38725 + }, + { + "epoch": 0.99, + "learning_rate": 1.561675028587099e-06, + "loss": 0.73, + "step": 38726 + }, + { + "epoch": 0.99, + "learning_rate": 1.56165213500232e-06, + "loss": 0.7979, + "step": 38727 + }, + { + "epoch": 0.99, + "learning_rate": 1.5616292409875093e-06, + "loss": 0.8418, + "step": 38728 + }, + { + "epoch": 0.99, + "learning_rate": 1.5616063465426855e-06, + "loss": 1.0039, + "step": 38729 + }, + { + "epoch": 0.99, + "learning_rate": 1.561583451667865e-06, + "loss": 0.8164, + "step": 38730 + }, + { + "epoch": 0.99, + "learning_rate": 1.5615605563630663e-06, + "loss": 0.731, + "step": 38731 + }, + { + "epoch": 0.99, + "learning_rate": 1.5615376606283064e-06, + "loss": 0.9707, + "step": 38732 + }, + { + "epoch": 0.99, + "learning_rate": 1.561514764463603e-06, + "loss": 0.6948, + "step": 38733 + }, + { + "epoch": 0.99, + "learning_rate": 1.5614918678689733e-06, + "loss": 0.9556, + "step": 38734 + }, + { + "epoch": 0.99, + "learning_rate": 1.561468970844435e-06, + "loss": 0.9126, + "step": 38735 + }, + { + "epoch": 0.99, + "learning_rate": 1.561446073390006e-06, + "loss": 0.9297, + "step": 38736 + }, + { + "epoch": 0.99, + "learning_rate": 1.5614231755057038e-06, + "loss": 0.5698, + "step": 38737 + }, + { + "epoch": 0.99, + "learning_rate": 1.5614002771915451e-06, + "loss": 0.7041, + "step": 38738 + }, + { + "epoch": 0.99, + "learning_rate": 1.5613773784475484e-06, + "loss": 0.8086, + "step": 38739 + }, + { + "epoch": 0.99, + "learning_rate": 1.5613544792737305e-06, + "loss": 0.8301, + "step": 38740 + }, + { + "epoch": 0.99, + "learning_rate": 1.5613315796701099e-06, + "loss": 0.7183, + "step": 38741 + }, + { + "epoch": 0.99, + "learning_rate": 1.5613086796367033e-06, + "loss": 0.9199, + "step": 38742 + }, + { + "epoch": 0.99, + "learning_rate": 1.561285779173528e-06, + "loss": 0.8545, + "step": 38743 + }, + { + "epoch": 0.99, + "learning_rate": 1.5612628782806025e-06, + "loss": 0.7959, + "step": 38744 + }, + { + "epoch": 0.99, + "learning_rate": 1.5612399769579434e-06, + "loss": 0.623, + "step": 38745 + }, + { + "epoch": 0.99, + "learning_rate": 1.5612170752055694e-06, + "loss": 0.8213, + "step": 38746 + }, + { + "epoch": 0.99, + "learning_rate": 1.5611941730234966e-06, + "loss": 0.6658, + "step": 38747 + }, + { + "epoch": 0.99, + "learning_rate": 1.5611712704117435e-06, + "loss": 0.6792, + "step": 38748 + }, + { + "epoch": 0.99, + "learning_rate": 1.5611483673703272e-06, + "loss": 0.6658, + "step": 38749 + }, + { + "epoch": 0.99, + "learning_rate": 1.5611254638992653e-06, + "loss": 0.9492, + "step": 38750 + }, + { + "epoch": 0.99, + "learning_rate": 1.5611025599985759e-06, + "loss": 1.0156, + "step": 38751 + }, + { + "epoch": 0.99, + "learning_rate": 1.5610796556682755e-06, + "loss": 0.7266, + "step": 38752 + }, + { + "epoch": 0.99, + "learning_rate": 1.5610567509083827e-06, + "loss": 0.8203, + "step": 38753 + }, + { + "epoch": 0.99, + "learning_rate": 1.5610338457189142e-06, + "loss": 0.7207, + "step": 38754 + }, + { + "epoch": 0.99, + "learning_rate": 1.561010940099888e-06, + "loss": 0.5134, + "step": 38755 + }, + { + "epoch": 0.99, + "learning_rate": 1.5609880340513215e-06, + "loss": 0.8379, + "step": 38756 + }, + { + "epoch": 0.99, + "learning_rate": 1.5609651275732323e-06, + "loss": 0.7632, + "step": 38757 + }, + { + "epoch": 0.99, + "learning_rate": 1.5609422206656379e-06, + "loss": 0.833, + "step": 38758 + }, + { + "epoch": 0.99, + "learning_rate": 1.5609193133285558e-06, + "loss": 0.793, + "step": 38759 + }, + { + "epoch": 0.99, + "learning_rate": 1.5608964055620035e-06, + "loss": 0.833, + "step": 38760 + }, + { + "epoch": 0.99, + "learning_rate": 1.560873497365999e-06, + "loss": 0.957, + "step": 38761 + }, + { + "epoch": 0.99, + "learning_rate": 1.560850588740559e-06, + "loss": 0.9746, + "step": 38762 + }, + { + "epoch": 0.99, + "learning_rate": 1.5608276796857016e-06, + "loss": 0.552, + "step": 38763 + }, + { + "epoch": 0.99, + "learning_rate": 1.5608047702014444e-06, + "loss": 0.6558, + "step": 38764 + }, + { + "epoch": 0.99, + "learning_rate": 1.5607818602878044e-06, + "loss": 0.6611, + "step": 38765 + }, + { + "epoch": 0.99, + "learning_rate": 1.5607589499448e-06, + "loss": 0.9717, + "step": 38766 + }, + { + "epoch": 0.99, + "learning_rate": 1.560736039172448e-06, + "loss": 0.6641, + "step": 38767 + }, + { + "epoch": 0.99, + "learning_rate": 1.560713127970766e-06, + "loss": 0.9736, + "step": 38768 + }, + { + "epoch": 0.99, + "learning_rate": 1.5606902163397723e-06, + "loss": 0.8633, + "step": 38769 + }, + { + "epoch": 0.99, + "learning_rate": 1.5606673042794833e-06, + "loss": 0.4866, + "step": 38770 + }, + { + "epoch": 0.99, + "learning_rate": 1.5606443917899176e-06, + "loss": 0.8662, + "step": 38771 + }, + { + "epoch": 0.99, + "learning_rate": 1.5606214788710918e-06, + "loss": 0.8223, + "step": 38772 + }, + { + "epoch": 0.99, + "learning_rate": 1.5605985655230243e-06, + "loss": 0.9023, + "step": 38773 + }, + { + "epoch": 0.99, + "learning_rate": 1.560575651745732e-06, + "loss": 0.8623, + "step": 38774 + }, + { + "epoch": 0.99, + "learning_rate": 1.560552737539233e-06, + "loss": 0.7778, + "step": 38775 + }, + { + "epoch": 0.99, + "learning_rate": 1.5605298229035443e-06, + "loss": 0.7236, + "step": 38776 + }, + { + "epoch": 0.99, + "learning_rate": 1.5605069078386838e-06, + "loss": 0.812, + "step": 38777 + }, + { + "epoch": 0.99, + "learning_rate": 1.5604839923446686e-06, + "loss": 0.8145, + "step": 38778 + }, + { + "epoch": 0.99, + "learning_rate": 1.5604610764215172e-06, + "loss": 0.7432, + "step": 38779 + }, + { + "epoch": 0.99, + "learning_rate": 1.560438160069246e-06, + "loss": 0.7959, + "step": 38780 + }, + { + "epoch": 0.99, + "learning_rate": 1.5604152432878733e-06, + "loss": 0.9082, + "step": 38781 + }, + { + "epoch": 0.99, + "learning_rate": 1.5603923260774163e-06, + "loss": 0.9492, + "step": 38782 + }, + { + "epoch": 0.99, + "learning_rate": 1.5603694084378926e-06, + "loss": 0.5933, + "step": 38783 + }, + { + "epoch": 0.99, + "learning_rate": 1.56034649036932e-06, + "loss": 1.0645, + "step": 38784 + }, + { + "epoch": 0.99, + "learning_rate": 1.5603235718717159e-06, + "loss": 0.7393, + "step": 38785 + }, + { + "epoch": 0.99, + "learning_rate": 1.5603006529450977e-06, + "loss": 0.623, + "step": 38786 + }, + { + "epoch": 0.99, + "learning_rate": 1.560277733589483e-06, + "loss": 0.8682, + "step": 38787 + }, + { + "epoch": 0.99, + "learning_rate": 1.5602548138048897e-06, + "loss": 0.7444, + "step": 38788 + }, + { + "epoch": 0.99, + "learning_rate": 1.5602318935913345e-06, + "loss": 0.9355, + "step": 38789 + }, + { + "epoch": 0.99, + "learning_rate": 1.560208972948836e-06, + "loss": 0.9229, + "step": 38790 + }, + { + "epoch": 0.99, + "learning_rate": 1.560186051877411e-06, + "loss": 0.8081, + "step": 38791 + }, + { + "epoch": 0.99, + "learning_rate": 1.5601631303770772e-06, + "loss": 0.9082, + "step": 38792 + }, + { + "epoch": 0.99, + "learning_rate": 1.5601402084478526e-06, + "loss": 0.958, + "step": 38793 + }, + { + "epoch": 0.99, + "learning_rate": 1.560117286089754e-06, + "loss": 0.6753, + "step": 38794 + }, + { + "epoch": 0.99, + "learning_rate": 1.5600943633027995e-06, + "loss": 0.7676, + "step": 38795 + }, + { + "epoch": 0.99, + "learning_rate": 1.560071440087007e-06, + "loss": 1.1025, + "step": 38796 + }, + { + "epoch": 0.99, + "learning_rate": 1.560048516442393e-06, + "loss": 0.8906, + "step": 38797 + }, + { + "epoch": 0.99, + "learning_rate": 1.5600255923689756e-06, + "loss": 0.6279, + "step": 38798 + }, + { + "epoch": 0.99, + "learning_rate": 1.5600026678667723e-06, + "loss": 0.8643, + "step": 38799 + }, + { + "epoch": 0.99, + "learning_rate": 1.559979742935801e-06, + "loss": 0.6885, + "step": 38800 + }, + { + "epoch": 0.99, + "learning_rate": 1.5599568175760788e-06, + "loss": 0.9438, + "step": 38801 + }, + { + "epoch": 0.99, + "learning_rate": 1.5599338917876234e-06, + "loss": 0.958, + "step": 38802 + }, + { + "epoch": 0.99, + "learning_rate": 1.5599109655704523e-06, + "loss": 0.96, + "step": 38803 + }, + { + "epoch": 0.99, + "learning_rate": 1.5598880389245834e-06, + "loss": 0.7954, + "step": 38804 + }, + { + "epoch": 0.99, + "learning_rate": 1.5598651118500338e-06, + "loss": 0.7969, + "step": 38805 + }, + { + "epoch": 0.99, + "learning_rate": 1.5598421843468212e-06, + "loss": 0.7417, + "step": 38806 + }, + { + "epoch": 0.99, + "learning_rate": 1.559819256414963e-06, + "loss": 0.8574, + "step": 38807 + }, + { + "epoch": 0.99, + "learning_rate": 1.5597963280544772e-06, + "loss": 0.877, + "step": 38808 + }, + { + "epoch": 0.99, + "learning_rate": 1.559773399265381e-06, + "loss": 0.8281, + "step": 38809 + }, + { + "epoch": 0.99, + "learning_rate": 1.559750470047692e-06, + "loss": 0.9531, + "step": 38810 + }, + { + "epoch": 0.99, + "learning_rate": 1.559727540401428e-06, + "loss": 0.9082, + "step": 38811 + }, + { + "epoch": 0.99, + "learning_rate": 1.5597046103266064e-06, + "loss": 0.8955, + "step": 38812 + }, + { + "epoch": 0.99, + "learning_rate": 1.5596816798232447e-06, + "loss": 0.6003, + "step": 38813 + }, + { + "epoch": 0.99, + "learning_rate": 1.5596587488913602e-06, + "loss": 0.9033, + "step": 38814 + }, + { + "epoch": 0.99, + "learning_rate": 1.5596358175309707e-06, + "loss": 0.8633, + "step": 38815 + }, + { + "epoch": 0.99, + "learning_rate": 1.5596128857420944e-06, + "loss": 0.6421, + "step": 38816 + }, + { + "epoch": 0.99, + "learning_rate": 1.5595899535247474e-06, + "loss": 0.8096, + "step": 38817 + }, + { + "epoch": 0.99, + "learning_rate": 1.5595670208789486e-06, + "loss": 1.0049, + "step": 38818 + }, + { + "epoch": 0.99, + "learning_rate": 1.5595440878047148e-06, + "loss": 0.8682, + "step": 38819 + }, + { + "epoch": 0.99, + "learning_rate": 1.5595211543020642e-06, + "loss": 0.9082, + "step": 38820 + }, + { + "epoch": 1.0, + "learning_rate": 1.559498220371014e-06, + "loss": 1.0254, + "step": 38821 + }, + { + "epoch": 1.0, + "learning_rate": 1.5594752860115813e-06, + "loss": 0.8184, + "step": 38822 + }, + { + "epoch": 1.0, + "learning_rate": 1.559452351223784e-06, + "loss": 0.5039, + "step": 38823 + }, + { + "epoch": 1.0, + "learning_rate": 1.55942941600764e-06, + "loss": 0.7378, + "step": 38824 + }, + { + "epoch": 1.0, + "learning_rate": 1.5594064803631667e-06, + "loss": 0.9668, + "step": 38825 + }, + { + "epoch": 1.0, + "learning_rate": 1.5593835442903816e-06, + "loss": 0.6909, + "step": 38826 + }, + { + "epoch": 1.0, + "learning_rate": 1.5593606077893021e-06, + "loss": 0.9844, + "step": 38827 + }, + { + "epoch": 1.0, + "learning_rate": 1.559337670859946e-06, + "loss": 0.9746, + "step": 38828 + }, + { + "epoch": 1.0, + "learning_rate": 1.5593147335023308e-06, + "loss": 0.7148, + "step": 38829 + }, + { + "epoch": 1.0, + "learning_rate": 1.5592917957164739e-06, + "loss": 0.8311, + "step": 38830 + }, + { + "epoch": 1.0, + "learning_rate": 1.5592688575023933e-06, + "loss": 0.9814, + "step": 38831 + }, + { + "epoch": 1.0, + "learning_rate": 1.559245918860106e-06, + "loss": 1.0566, + "step": 38832 + }, + { + "epoch": 1.0, + "learning_rate": 1.55922297978963e-06, + "loss": 0.9863, + "step": 38833 + }, + { + "epoch": 1.0, + "learning_rate": 1.5592000402909823e-06, + "loss": 0.793, + "step": 38834 + }, + { + "epoch": 1.0, + "learning_rate": 1.559177100364181e-06, + "loss": 0.7163, + "step": 38835 + }, + { + "epoch": 1.0, + "learning_rate": 1.5591541600092439e-06, + "loss": 0.5093, + "step": 38836 + }, + { + "epoch": 1.0, + "learning_rate": 1.5591312192261875e-06, + "loss": 0.8193, + "step": 38837 + }, + { + "epoch": 1.0, + "learning_rate": 1.5591082780150306e-06, + "loss": 0.7988, + "step": 38838 + }, + { + "epoch": 1.0, + "learning_rate": 1.55908533637579e-06, + "loss": 1.0645, + "step": 38839 + }, + { + "epoch": 1.0, + "learning_rate": 1.5590623943084832e-06, + "loss": 0.9541, + "step": 38840 + }, + { + "epoch": 1.0, + "learning_rate": 1.5590394518131284e-06, + "loss": 0.8643, + "step": 38841 + }, + { + "epoch": 1.0, + "learning_rate": 1.5590165088897427e-06, + "loss": 0.8574, + "step": 38842 + }, + { + "epoch": 1.0, + "learning_rate": 1.5589935655383437e-06, + "loss": 0.8662, + "step": 38843 + }, + { + "epoch": 1.0, + "learning_rate": 1.5589706217589492e-06, + "loss": 0.75, + "step": 38844 + }, + { + "epoch": 1.0, + "learning_rate": 1.5589476775515765e-06, + "loss": 0.7969, + "step": 38845 + }, + { + "epoch": 1.0, + "learning_rate": 1.558924732916243e-06, + "loss": 0.8398, + "step": 38846 + }, + { + "epoch": 1.0, + "learning_rate": 1.5589017878529669e-06, + "loss": 0.7419, + "step": 38847 + }, + { + "epoch": 1.0, + "learning_rate": 1.5588788423617652e-06, + "loss": 0.54, + "step": 38848 + }, + { + "epoch": 1.0, + "learning_rate": 1.5588558964426557e-06, + "loss": 0.8096, + "step": 38849 + }, + { + "epoch": 1.0, + "learning_rate": 1.5588329500956562e-06, + "loss": 0.7969, + "step": 38850 + }, + { + "epoch": 1.0, + "learning_rate": 1.5588100033207834e-06, + "loss": 0.9111, + "step": 38851 + }, + { + "epoch": 1.0, + "learning_rate": 1.5587870561180561e-06, + "loss": 0.8096, + "step": 38852 + }, + { + "epoch": 1.0, + "learning_rate": 1.558764108487491e-06, + "loss": 0.6445, + "step": 38853 + }, + { + "epoch": 1.0, + "learning_rate": 1.5587411604291056e-06, + "loss": 0.8232, + "step": 38854 + }, + { + "epoch": 1.0, + "learning_rate": 1.5587182119429182e-06, + "loss": 0.7705, + "step": 38855 + }, + { + "epoch": 1.0, + "learning_rate": 1.5586952630289457e-06, + "loss": 0.575, + "step": 38856 + }, + { + "epoch": 1.0, + "learning_rate": 1.5586723136872061e-06, + "loss": 0.8975, + "step": 38857 + }, + { + "epoch": 1.0, + "learning_rate": 1.5586493639177168e-06, + "loss": 0.6479, + "step": 38858 + }, + { + "epoch": 1.0, + "learning_rate": 1.5586264137204953e-06, + "loss": 0.8877, + "step": 38859 + }, + { + "epoch": 1.0, + "learning_rate": 1.5586034630955592e-06, + "loss": 0.9238, + "step": 38860 + }, + { + "epoch": 1.0, + "learning_rate": 1.5585805120429266e-06, + "loss": 0.9971, + "step": 38861 + }, + { + "epoch": 1.0, + "learning_rate": 1.558557560562614e-06, + "loss": 0.7666, + "step": 38862 + }, + { + "epoch": 1.0, + "learning_rate": 1.5585346086546397e-06, + "loss": 0.7397, + "step": 38863 + }, + { + "epoch": 1.0, + "learning_rate": 1.5585116563190211e-06, + "loss": 0.9297, + "step": 38864 + }, + { + "epoch": 1.0, + "learning_rate": 1.558488703555776e-06, + "loss": 0.7681, + "step": 38865 + }, + { + "epoch": 1.0, + "learning_rate": 1.5584657503649217e-06, + "loss": 0.8994, + "step": 38866 + }, + { + "epoch": 1.0, + "learning_rate": 1.5584427967464757e-06, + "loss": 0.9434, + "step": 38867 + }, + { + "epoch": 1.0, + "learning_rate": 1.5584198427004558e-06, + "loss": 0.8135, + "step": 38868 + }, + { + "epoch": 1.0, + "learning_rate": 1.5583968882268796e-06, + "loss": 0.9639, + "step": 38869 + }, + { + "epoch": 1.0, + "learning_rate": 1.5583739333257646e-06, + "loss": 0.8359, + "step": 38870 + }, + { + "epoch": 1.0, + "learning_rate": 1.5583509779971282e-06, + "loss": 0.9531, + "step": 38871 + }, + { + "epoch": 1.0, + "learning_rate": 1.558328022240988e-06, + "loss": 0.7246, + "step": 38872 + }, + { + "epoch": 1.0, + "learning_rate": 1.558305066057362e-06, + "loss": 0.9238, + "step": 38873 + }, + { + "epoch": 1.0, + "learning_rate": 1.5582821094462673e-06, + "loss": 0.6797, + "step": 38874 + }, + { + "epoch": 1.0, + "learning_rate": 1.558259152407722e-06, + "loss": 0.731, + "step": 38875 + }, + { + "epoch": 1.0, + "learning_rate": 1.558236194941743e-06, + "loss": 0.8545, + "step": 38876 + }, + { + "epoch": 1.0, + "learning_rate": 1.5582132370483482e-06, + "loss": 0.916, + "step": 38877 + }, + { + "epoch": 1.0, + "learning_rate": 1.5581902787275554e-06, + "loss": 0.7898, + "step": 38878 + }, + { + "epoch": 1.0, + "learning_rate": 1.5581673199793817e-06, + "loss": 0.8613, + "step": 38879 + }, + { + "epoch": 1.0, + "learning_rate": 1.5581443608038454e-06, + "loss": 0.71, + "step": 38880 + }, + { + "epoch": 1.0, + "learning_rate": 1.5581214012009634e-06, + "loss": 0.7925, + "step": 38881 + }, + { + "epoch": 1.0, + "learning_rate": 1.5580984411707535e-06, + "loss": 0.7427, + "step": 38882 + }, + { + "epoch": 1.0, + "learning_rate": 1.5580754807132328e-06, + "loss": 0.9673, + "step": 38883 + }, + { + "epoch": 1.0, + "learning_rate": 1.5580525198284198e-06, + "loss": 1.0625, + "step": 38884 + }, + { + "epoch": 1.0, + "learning_rate": 1.5580295585163318e-06, + "loss": 0.8447, + "step": 38885 + }, + { + "epoch": 1.0, + "learning_rate": 1.5580065967769862e-06, + "loss": 0.7485, + "step": 38886 + }, + { + "epoch": 1.0, + "learning_rate": 1.5579836346104002e-06, + "loss": 0.8237, + "step": 38887 + }, + { + "epoch": 1.0, + "learning_rate": 1.5579606720165921e-06, + "loss": 0.7344, + "step": 38888 + }, + { + "epoch": 1.0, + "learning_rate": 1.5579377089955792e-06, + "loss": 0.9062, + "step": 38889 + }, + { + "epoch": 1.0, + "learning_rate": 1.5579147455473791e-06, + "loss": 0.5581, + "step": 38890 + }, + { + "epoch": 1.0, + "learning_rate": 1.557891781672009e-06, + "loss": 0.9746, + "step": 38891 + }, + { + "epoch": 1.0, + "learning_rate": 1.5578688173694872e-06, + "loss": 0.9331, + "step": 38892 + }, + { + "epoch": 1.0, + "learning_rate": 1.5578458526398305e-06, + "loss": 0.6719, + "step": 38893 + }, + { + "epoch": 1.0, + "learning_rate": 1.5578228874830572e-06, + "loss": 0.8477, + "step": 38894 + }, + { + "epoch": 1.0, + "learning_rate": 1.5577999218991847e-06, + "loss": 0.7295, + "step": 38895 + }, + { + "epoch": 1.0, + "learning_rate": 1.5577769558882302e-06, + "loss": 1.0117, + "step": 38896 + }, + { + "epoch": 1.0, + "learning_rate": 1.5577539894502114e-06, + "loss": 0.6494, + "step": 38897 + }, + { + "epoch": 1.0, + "learning_rate": 1.557731022585146e-06, + "loss": 0.7686, + "step": 38898 + }, + { + "epoch": 1.0, + "learning_rate": 1.5577080552930516e-06, + "loss": 0.5503, + "step": 38899 + }, + { + "epoch": 1.0, + "learning_rate": 1.5576850875739465e-06, + "loss": 0.7549, + "step": 38900 + }, + { + "epoch": 1.0, + "learning_rate": 1.5576621194278468e-06, + "loss": 0.6912, + "step": 38901 + }, + { + "epoch": 1.0, + "learning_rate": 1.5576391508547713e-06, + "loss": 0.626, + "step": 38902 + }, + { + "epoch": 1.0, + "learning_rate": 1.5576161818547366e-06, + "loss": 0.9219, + "step": 38903 + }, + { + "epoch": 1.0, + "learning_rate": 1.5575932124277612e-06, + "loss": 0.7236, + "step": 38904 + }, + { + "epoch": 1.0, + "learning_rate": 1.5575702425738625e-06, + "loss": 1.0332, + "step": 38905 + }, + { + "epoch": 1.0, + "learning_rate": 1.5575472722930576e-06, + "loss": 0.5837, + "step": 38906 + }, + { + "epoch": 1.0, + "learning_rate": 1.5575243015853644e-06, + "loss": 0.7754, + "step": 38907 + }, + { + "epoch": 1.0, + "learning_rate": 1.5575013304508008e-06, + "loss": 0.8252, + "step": 38908 + }, + { + "epoch": 1.0, + "learning_rate": 1.5574783588893837e-06, + "loss": 0.9248, + "step": 38909 + }, + { + "epoch": 1.0, + "learning_rate": 1.557455386901131e-06, + "loss": 0.8271, + "step": 38910 + }, + { + "epoch": 1.0, + "learning_rate": 1.5574324144860605e-06, + "loss": 0.9668, + "step": 38911 + }, + { + "epoch": 1.0, + "learning_rate": 1.55740944164419e-06, + "loss": 0.8867, + "step": 38912 + }, + { + "epoch": 1.0, + "learning_rate": 1.557386468375536e-06, + "loss": 1.0098, + "step": 38913 + }, + { + "epoch": 1.0, + "learning_rate": 1.5573634946801173e-06, + "loss": 0.6523, + "step": 38914 + }, + { + "epoch": 1.0, + "learning_rate": 1.557340520557951e-06, + "loss": 1.0098, + "step": 38915 + }, + { + "epoch": 1.0, + "learning_rate": 1.5573175460090542e-06, + "loss": 0.9346, + "step": 38916 + }, + { + "epoch": 1.0, + "learning_rate": 1.5572945710334455e-06, + "loss": 0.8887, + "step": 38917 + }, + { + "epoch": 1.0, + "learning_rate": 1.5572715956311417e-06, + "loss": 0.8252, + "step": 38918 + }, + { + "epoch": 1.0, + "learning_rate": 1.5572486198021607e-06, + "loss": 0.6855, + "step": 38919 + }, + { + "epoch": 1.0, + "learning_rate": 1.5572256435465203e-06, + "loss": 0.8628, + "step": 38920 + }, + { + "epoch": 1.0, + "learning_rate": 1.5572026668642377e-06, + "loss": 0.9092, + "step": 38921 + }, + { + "epoch": 1.0, + "learning_rate": 1.5571796897553306e-06, + "loss": 0.7983, + "step": 38922 + }, + { + "epoch": 1.0, + "learning_rate": 1.5571567122198167e-06, + "loss": 1.0938, + "step": 38923 + }, + { + "epoch": 1.0, + "learning_rate": 1.5571337342577132e-06, + "loss": 0.7959, + "step": 38924 + }, + { + "epoch": 1.0, + "learning_rate": 1.5571107558690387e-06, + "loss": 0.9697, + "step": 38925 + }, + { + "epoch": 1.0, + "learning_rate": 1.5570877770538096e-06, + "loss": 0.9141, + "step": 38926 + }, + { + "epoch": 1.0, + "learning_rate": 1.557064797812044e-06, + "loss": 0.8447, + "step": 38927 + }, + { + "epoch": 1.0, + "learning_rate": 1.5570418181437597e-06, + "loss": 0.8945, + "step": 38928 + }, + { + "epoch": 1.0, + "learning_rate": 1.557018838048974e-06, + "loss": 0.7354, + "step": 38929 + }, + { + "epoch": 1.0, + "learning_rate": 1.5569958575277045e-06, + "loss": 0.7402, + "step": 38930 + }, + { + "epoch": 1.0, + "learning_rate": 1.556972876579969e-06, + "loss": 0.9219, + "step": 38931 + }, + { + "epoch": 1.0, + "learning_rate": 1.5569498952057849e-06, + "loss": 0.8545, + "step": 38932 + }, + { + "epoch": 1.0, + "learning_rate": 1.55692691340517e-06, + "loss": 0.9346, + "step": 38933 + }, + { + "epoch": 1.0, + "learning_rate": 1.5569039311781417e-06, + "loss": 0.832, + "step": 38934 + }, + { + "epoch": 1.0, + "learning_rate": 1.5568809485247174e-06, + "loss": 0.7603, + "step": 38935 + }, + { + "epoch": 1.0, + "learning_rate": 1.5568579654449154e-06, + "loss": 1.0693, + "step": 38936 + }, + { + "epoch": 1.0, + "learning_rate": 1.5568349819387527e-06, + "loss": 0.9473, + "step": 38937 + }, + { + "epoch": 1.0, + "learning_rate": 1.556811998006247e-06, + "loss": 0.7842, + "step": 38938 + }, + { + "epoch": 1.0, + "learning_rate": 1.556789013647416e-06, + "loss": 0.6128, + "step": 38939 + }, + { + "epoch": 1.0, + "learning_rate": 1.5567660288622773e-06, + "loss": 0.8252, + "step": 38940 + }, + { + "epoch": 1.0, + "learning_rate": 1.5567430436508485e-06, + "loss": 0.7295, + "step": 38941 + }, + { + "epoch": 1.0, + "learning_rate": 1.556720058013147e-06, + "loss": 0.9277, + "step": 38942 + }, + { + "epoch": 1.0, + "learning_rate": 1.5566970719491903e-06, + "loss": 0.8887, + "step": 38943 + }, + { + "epoch": 1.0, + "learning_rate": 1.5566740854589967e-06, + "loss": 0.7471, + "step": 38944 + }, + { + "epoch": 1.0, + "learning_rate": 1.5566510985425834e-06, + "loss": 0.6475, + "step": 38945 + }, + { + "epoch": 1.0, + "learning_rate": 1.5566281111999678e-06, + "loss": 0.8242, + "step": 38946 + }, + { + "epoch": 1.0, + "learning_rate": 1.5566051234311674e-06, + "loss": 0.9287, + "step": 38947 + }, + { + "epoch": 1.0, + "learning_rate": 1.5565821352362004e-06, + "loss": 0.5776, + "step": 38948 + }, + { + "epoch": 1.0, + "learning_rate": 1.5565591466150837e-06, + "loss": 0.7651, + "step": 38949 + }, + { + "epoch": 1.0, + "learning_rate": 1.5565361575678355e-06, + "loss": 0.6772, + "step": 38950 + }, + { + "epoch": 1.0, + "learning_rate": 1.5565131680944731e-06, + "loss": 0.9268, + "step": 38951 + }, + { + "epoch": 1.0, + "learning_rate": 1.5564901781950143e-06, + "loss": 0.8066, + "step": 38952 + }, + { + "epoch": 1.0, + "learning_rate": 1.5564671878694765e-06, + "loss": 0.6235, + "step": 38953 + }, + { + "epoch": 1.0, + "learning_rate": 1.556444197117877e-06, + "loss": 0.6943, + "step": 38954 + }, + { + "epoch": 1.0, + "learning_rate": 1.556421205940234e-06, + "loss": 0.6968, + "step": 38955 + }, + { + "epoch": 1.0, + "learning_rate": 1.556398214336565e-06, + "loss": 0.7529, + "step": 38956 + }, + { + "epoch": 1.0, + "learning_rate": 1.5563752223068876e-06, + "loss": 0.6217, + "step": 38957 + }, + { + "epoch": 1.0, + "learning_rate": 1.5563522298512188e-06, + "loss": 0.845, + "step": 38958 + }, + { + "epoch": 1.0, + "learning_rate": 1.556329236969577e-06, + "loss": 0.8364, + "step": 38959 + }, + { + "epoch": 1.0, + "learning_rate": 1.5563062436619797e-06, + "loss": 0.9424, + "step": 38960 + }, + { + "epoch": 1.0, + "learning_rate": 1.5562832499284438e-06, + "loss": 0.707, + "step": 38961 + }, + { + "epoch": 1.0, + "learning_rate": 1.5562602557689877e-06, + "loss": 0.7671, + "step": 38962 + }, + { + "epoch": 1.0, + "learning_rate": 1.5562372611836285e-06, + "loss": 0.6191, + "step": 38963 + }, + { + "epoch": 1.0, + "learning_rate": 1.5562142661723842e-06, + "loss": 0.9873, + "step": 38964 + }, + { + "epoch": 1.0, + "learning_rate": 1.5561912707352722e-06, + "loss": 0.4355, + "step": 38965 + }, + { + "epoch": 1.0, + "learning_rate": 1.5561682748723102e-06, + "loss": 0.958, + "step": 38966 + }, + { + "epoch": 1.0, + "learning_rate": 1.5561452785835154e-06, + "loss": 0.8555, + "step": 38967 + }, + { + "epoch": 1.0, + "learning_rate": 1.5561222818689057e-06, + "loss": 0.5605, + "step": 38968 + }, + { + "epoch": 1.0, + "learning_rate": 1.5560992847284991e-06, + "loss": 1.0469, + "step": 38969 + }, + { + "epoch": 1.0, + "learning_rate": 1.5560762871623128e-06, + "loss": 0.8032, + "step": 38970 + }, + { + "epoch": 1.0, + "learning_rate": 1.5560532891703645e-06, + "loss": 0.6294, + "step": 38971 + }, + { + "epoch": 1.0, + "learning_rate": 1.5560302907526713e-06, + "loss": 0.7207, + "step": 38972 + }, + { + "epoch": 1.0, + "learning_rate": 1.5560072919092514e-06, + "loss": 0.8174, + "step": 38973 + }, + { + "epoch": 1.0, + "learning_rate": 1.5559842926401227e-06, + "loss": 0.7979, + "step": 38974 + }, + { + "epoch": 1.0, + "learning_rate": 1.5559612929453023e-06, + "loss": 0.7676, + "step": 38975 + }, + { + "epoch": 1.0, + "learning_rate": 1.5559382928248076e-06, + "loss": 0.8223, + "step": 38976 + }, + { + "epoch": 1.0, + "learning_rate": 1.5559152922786569e-06, + "loss": 0.915, + "step": 38977 + }, + { + "epoch": 1.0, + "learning_rate": 1.555892291306867e-06, + "loss": 0.8789, + "step": 38978 + }, + { + "epoch": 1.0, + "learning_rate": 1.5558692899094562e-06, + "loss": 1.0479, + "step": 38979 + }, + { + "epoch": 1.0, + "learning_rate": 1.5558462880864418e-06, + "loss": 0.6592, + "step": 38980 + }, + { + "epoch": 1.0, + "learning_rate": 1.5558232858378414e-06, + "loss": 0.7261, + "step": 38981 + }, + { + "epoch": 1.0, + "learning_rate": 1.5558002831636725e-06, + "loss": 0.7463, + "step": 38982 + }, + { + "epoch": 1.0, + "learning_rate": 1.5557772800639533e-06, + "loss": 0.7305, + "step": 38983 + }, + { + "epoch": 1.0, + "learning_rate": 1.5557542765387006e-06, + "loss": 0.8403, + "step": 38984 + }, + { + "epoch": 1.0, + "learning_rate": 1.5557312725879327e-06, + "loss": 0.6982, + "step": 38985 + }, + { + "epoch": 1.0, + "learning_rate": 1.5557082682116667e-06, + "loss": 0.8213, + "step": 38986 + }, + { + "epoch": 1.0, + "learning_rate": 1.5556852634099205e-06, + "loss": 0.8779, + "step": 38987 + }, + { + "epoch": 1.0, + "learning_rate": 1.5556622581827117e-06, + "loss": 0.9658, + "step": 38988 + }, + { + "epoch": 1.0, + "learning_rate": 1.5556392525300578e-06, + "loss": 0.7812, + "step": 38989 + }, + { + "epoch": 1.0, + "learning_rate": 1.5556162464519766e-06, + "loss": 1.0293, + "step": 38990 + }, + { + "epoch": 1.0, + "learning_rate": 1.5555932399484854e-06, + "loss": 0.8198, + "step": 38991 + }, + { + "epoch": 1.0, + "learning_rate": 1.5555702330196021e-06, + "loss": 0.8994, + "step": 38992 + }, + { + "epoch": 1.0, + "learning_rate": 1.5555472256653445e-06, + "loss": 0.9023, + "step": 38993 + }, + { + "epoch": 1.0, + "learning_rate": 1.5555242178857295e-06, + "loss": 0.9492, + "step": 38994 + }, + { + "epoch": 1.0, + "learning_rate": 1.5555012096807754e-06, + "loss": 0.9395, + "step": 38995 + }, + { + "epoch": 1.0, + "learning_rate": 1.5554782010504992e-06, + "loss": 0.6084, + "step": 38996 + }, + { + "epoch": 1.0, + "learning_rate": 1.5554551919949193e-06, + "loss": 0.7036, + "step": 38997 + }, + { + "epoch": 1.0, + "learning_rate": 1.5554321825140529e-06, + "loss": 0.9014, + "step": 38998 + }, + { + "epoch": 1.0, + "learning_rate": 1.5554091726079172e-06, + "loss": 0.8135, + "step": 38999 + }, + { + "epoch": 1.0, + "learning_rate": 1.5553861622765306e-06, + "loss": 0.8291, + "step": 39000 + }, + { + "epoch": 1.0, + "learning_rate": 1.5553631515199101e-06, + "loss": 1.041, + "step": 39001 + }, + { + "epoch": 1.0, + "learning_rate": 1.5553401403380738e-06, + "loss": 0.7168, + "step": 39002 + }, + { + "epoch": 1.0, + "learning_rate": 1.5553171287310392e-06, + "loss": 0.7988, + "step": 39003 + }, + { + "epoch": 1.0, + "learning_rate": 1.5552941166988234e-06, + "loss": 0.7693, + "step": 39004 + }, + { + "epoch": 1.0, + "learning_rate": 1.5552711042414446e-06, + "loss": 0.7959, + "step": 39005 + }, + { + "epoch": 1.0, + "learning_rate": 1.5552480913589205e-06, + "loss": 1.0, + "step": 39006 + }, + { + "epoch": 1.0, + "learning_rate": 1.5552250780512682e-06, + "loss": 0.7466, + "step": 39007 + }, + { + "epoch": 1.0, + "learning_rate": 1.5552020643185056e-06, + "loss": 0.8721, + "step": 39008 + }, + { + "epoch": 1.0, + "learning_rate": 1.5551790501606501e-06, + "loss": 0.877, + "step": 39009 + }, + { + "epoch": 1.0, + "learning_rate": 1.5551560355777201e-06, + "loss": 0.8867, + "step": 39010 + }, + { + "epoch": 1.0, + "learning_rate": 1.5551330205697322e-06, + "loss": 0.7402, + "step": 39011 + }, + { + "epoch": 1.0, + "learning_rate": 1.5551100051367047e-06, + "loss": 0.6943, + "step": 39012 + }, + { + "epoch": 1.0, + "learning_rate": 1.5550869892786549e-06, + "loss": 0.8711, + "step": 39013 + }, + { + "epoch": 1.0, + "learning_rate": 1.5550639729956005e-06, + "loss": 0.8037, + "step": 39014 + }, + { + "epoch": 1.0, + "learning_rate": 1.5550409562875593e-06, + "loss": 0.9434, + "step": 39015 + }, + { + "epoch": 1.0, + "learning_rate": 1.5550179391545487e-06, + "loss": 0.7852, + "step": 39016 + }, + { + "epoch": 1.0, + "learning_rate": 1.554994921596586e-06, + "loss": 0.6829, + "step": 39017 + }, + { + "epoch": 1.0, + "learning_rate": 1.5549719036136897e-06, + "loss": 0.7891, + "step": 39018 + }, + { + "epoch": 1.0, + "learning_rate": 1.5549488852058766e-06, + "loss": 0.7266, + "step": 39019 + }, + { + "epoch": 1.0, + "learning_rate": 1.554925866373165e-06, + "loss": 0.7617, + "step": 39020 + }, + { + "epoch": 1.0, + "learning_rate": 1.554902847115572e-06, + "loss": 0.709, + "step": 39021 + }, + { + "epoch": 1.0, + "learning_rate": 1.5548798274331152e-06, + "loss": 0.6033, + "step": 39022 + }, + { + "epoch": 1.0, + "learning_rate": 1.5548568073258125e-06, + "loss": 0.6326, + "step": 39023 + }, + { + "epoch": 1.0, + "learning_rate": 1.5548337867936816e-06, + "loss": 0.6895, + "step": 39024 + }, + { + "epoch": 1.0, + "learning_rate": 1.55481076583674e-06, + "loss": 0.5718, + "step": 39025 + }, + { + "epoch": 1.0, + "learning_rate": 1.5547877444550053e-06, + "loss": 0.6528, + "step": 39026 + }, + { + "epoch": 1.0, + "learning_rate": 1.554764722648495e-06, + "loss": 0.8047, + "step": 39027 + }, + { + "epoch": 1.0, + "learning_rate": 1.554741700417227e-06, + "loss": 0.7305, + "step": 39028 + }, + { + "epoch": 1.0, + "learning_rate": 1.554718677761219e-06, + "loss": 0.6897, + "step": 39029 + }, + { + "epoch": 1.0, + "learning_rate": 1.5546956546804879e-06, + "loss": 0.5771, + "step": 39030 + }, + { + "epoch": 1.0, + "learning_rate": 1.5546726311750521e-06, + "loss": 0.7178, + "step": 39031 + }, + { + "epoch": 1.0, + "learning_rate": 1.5546496072449289e-06, + "loss": 0.7852, + "step": 39032 + }, + { + "epoch": 1.0, + "learning_rate": 1.5546265828901359e-06, + "loss": 0.6973, + "step": 39033 + }, + { + "epoch": 1.0, + "learning_rate": 1.554603558110691e-06, + "loss": 0.7324, + "step": 39034 + }, + { + "epoch": 1.0, + "learning_rate": 1.554580532906612e-06, + "loss": 0.7305, + "step": 39035 + }, + { + "epoch": 1.0, + "learning_rate": 1.5545575072779158e-06, + "loss": 0.6646, + "step": 39036 + }, + { + "epoch": 1.0, + "learning_rate": 1.5545344812246204e-06, + "loss": 0.7188, + "step": 39037 + }, + { + "epoch": 1.0, + "learning_rate": 1.5545114547467436e-06, + "loss": 0.7012, + "step": 39038 + }, + { + "epoch": 1.0, + "learning_rate": 1.5544884278443027e-06, + "loss": 0.667, + "step": 39039 + }, + { + "epoch": 1.0, + "learning_rate": 1.5544654005173156e-06, + "loss": 0.7207, + "step": 39040 + }, + { + "epoch": 1.0, + "learning_rate": 1.5544423727657998e-06, + "loss": 0.7188, + "step": 39041 + }, + { + "epoch": 1.0, + "learning_rate": 1.554419344589773e-06, + "loss": 0.7803, + "step": 39042 + }, + { + "epoch": 1.0, + "learning_rate": 1.5543963159892525e-06, + "loss": 0.47, + "step": 39043 + }, + { + "epoch": 1.0, + "learning_rate": 1.5543732869642568e-06, + "loss": 0.7314, + "step": 39044 + }, + { + "epoch": 1.0, + "learning_rate": 1.5543502575148027e-06, + "loss": 0.7969, + "step": 39045 + }, + { + "epoch": 1.0, + "learning_rate": 1.554327227640908e-06, + "loss": 0.6709, + "step": 39046 + }, + { + "epoch": 1.0, + "learning_rate": 1.5543041973425905e-06, + "loss": 0.6826, + "step": 39047 + }, + { + "epoch": 1.0, + "learning_rate": 1.5542811666198678e-06, + "loss": 0.6523, + "step": 39048 + }, + { + "epoch": 1.0, + "learning_rate": 1.5542581354727576e-06, + "loss": 0.624, + "step": 39049 + }, + { + "epoch": 1.0, + "learning_rate": 1.5542351039012772e-06, + "loss": 0.9346, + "step": 39050 + }, + { + "epoch": 1.0, + "learning_rate": 1.5542120719054445e-06, + "loss": 0.4854, + "step": 39051 + }, + { + "epoch": 1.0, + "learning_rate": 1.5541890394852773e-06, + "loss": 0.5947, + "step": 39052 + }, + { + "epoch": 1.0, + "learning_rate": 1.5541660066407927e-06, + "loss": 0.4493, + "step": 39053 + }, + { + "epoch": 1.0, + "learning_rate": 1.5541429733720088e-06, + "loss": 0.6431, + "step": 39054 + }, + { + "epoch": 1.0, + "learning_rate": 1.5541199396789436e-06, + "loss": 0.6187, + "step": 39055 + }, + { + "epoch": 1.0, + "learning_rate": 1.5540969055616135e-06, + "loss": 0.6377, + "step": 39056 + }, + { + "epoch": 1.0, + "learning_rate": 1.5540738710200375e-06, + "loss": 0.6558, + "step": 39057 + }, + { + "epoch": 1.0, + "learning_rate": 1.5540508360542322e-06, + "loss": 0.6567, + "step": 39058 + }, + { + "epoch": 1.0, + "learning_rate": 1.5540278006642158e-06, + "loss": 0.7207, + "step": 39059 + }, + { + "epoch": 1.0, + "learning_rate": 1.5540047648500058e-06, + "loss": 0.7651, + "step": 39060 + }, + { + "epoch": 1.0, + "learning_rate": 1.5539817286116197e-06, + "loss": 0.6479, + "step": 39061 + }, + { + "epoch": 1.0, + "learning_rate": 1.5539586919490755e-06, + "loss": 0.5249, + "step": 39062 + }, + { + "epoch": 1.0, + "learning_rate": 1.5539356548623903e-06, + "loss": 0.3691, + "step": 39063 + }, + { + "epoch": 1.0, + "learning_rate": 1.5539126173515822e-06, + "loss": 0.7324, + "step": 39064 + }, + { + "epoch": 1.0, + "learning_rate": 1.5538895794166687e-06, + "loss": 0.4797, + "step": 39065 + }, + { + "epoch": 1.0, + "learning_rate": 1.5538665410576672e-06, + "loss": 0.6865, + "step": 39066 + }, + { + "epoch": 1.0, + "learning_rate": 1.553843502274596e-06, + "loss": 0.7236, + "step": 39067 + }, + { + "epoch": 1.0, + "learning_rate": 1.5538204630674717e-06, + "loss": 0.6904, + "step": 39068 + }, + { + "epoch": 1.0, + "learning_rate": 1.553797423436313e-06, + "loss": 0.6719, + "step": 39069 + }, + { + "epoch": 1.0, + "learning_rate": 1.5537743833811373e-06, + "loss": 0.6592, + "step": 39070 + }, + { + "epoch": 1.0, + "learning_rate": 1.5537513429019615e-06, + "loss": 0.7002, + "step": 39071 + }, + { + "epoch": 1.0, + "learning_rate": 1.5537283019988036e-06, + "loss": 0.7598, + "step": 39072 + }, + { + "epoch": 1.0, + "learning_rate": 1.5537052606716817e-06, + "loss": 0.6465, + "step": 39073 + }, + { + "epoch": 1.0, + "learning_rate": 1.5536822189206133e-06, + "loss": 0.7471, + "step": 39074 + }, + { + "epoch": 1.0, + "learning_rate": 1.553659176745616e-06, + "loss": 0.4812, + "step": 39075 + }, + { + "epoch": 1.0, + "learning_rate": 1.553636134146707e-06, + "loss": 0.5994, + "step": 39076 + }, + { + "epoch": 1.0, + "learning_rate": 1.5536130911239042e-06, + "loss": 0.8574, + "step": 39077 + }, + { + "epoch": 1.0, + "learning_rate": 1.5535900476772255e-06, + "loss": 0.8984, + "step": 39078 + }, + { + "epoch": 1.0, + "learning_rate": 1.5535670038066884e-06, + "loss": 0.7021, + "step": 39079 + }, + { + "epoch": 1.0, + "learning_rate": 1.5535439595123102e-06, + "loss": 0.6157, + "step": 39080 + }, + { + "epoch": 1.0, + "learning_rate": 1.5535209147941094e-06, + "loss": 0.6167, + "step": 39081 + }, + { + "epoch": 1.0, + "learning_rate": 1.5534978696521023e-06, + "loss": 0.7852, + "step": 39082 + }, + { + "epoch": 1.0, + "learning_rate": 1.553474824086308e-06, + "loss": 0.8096, + "step": 39083 + }, + { + "epoch": 1.0, + "learning_rate": 1.5534517780967433e-06, + "loss": 0.541, + "step": 39084 + }, + { + "epoch": 1.0, + "learning_rate": 1.553428731683426e-06, + "loss": 0.8232, + "step": 39085 + }, + { + "epoch": 1.0, + "learning_rate": 1.5534056848463738e-06, + "loss": 0.5557, + "step": 39086 + }, + { + "epoch": 1.0, + "learning_rate": 1.5533826375856043e-06, + "loss": 0.7773, + "step": 39087 + }, + { + "epoch": 1.0, + "learning_rate": 1.553359589901135e-06, + "loss": 0.5508, + "step": 39088 + }, + { + "epoch": 1.0, + "learning_rate": 1.5533365417929835e-06, + "loss": 0.6958, + "step": 39089 + }, + { + "epoch": 1.0, + "learning_rate": 1.5533134932611682e-06, + "loss": 0.6875, + "step": 39090 + }, + { + "epoch": 1.0, + "learning_rate": 1.553290444305706e-06, + "loss": 0.7876, + "step": 39091 + }, + { + "epoch": 1.0, + "learning_rate": 1.5532673949266148e-06, + "loss": 0.6143, + "step": 39092 + }, + { + "epoch": 1.0, + "learning_rate": 1.553244345123912e-06, + "loss": 0.6807, + "step": 39093 + }, + { + "epoch": 1.0, + "learning_rate": 1.5532212948976156e-06, + "loss": 0.6182, + "step": 39094 + }, + { + "epoch": 1.0, + "learning_rate": 1.5531982442477432e-06, + "loss": 0.7139, + "step": 39095 + }, + { + "epoch": 1.0, + "learning_rate": 1.553175193174312e-06, + "loss": 0.7793, + "step": 39096 + }, + { + "epoch": 1.0, + "learning_rate": 1.5531521416773404e-06, + "loss": 0.8223, + "step": 39097 + }, + { + "epoch": 1.0, + "learning_rate": 1.5531290897568453e-06, + "loss": 0.6797, + "step": 39098 + }, + { + "epoch": 1.0, + "learning_rate": 1.553106037412845e-06, + "loss": 0.7207, + "step": 39099 + }, + { + "epoch": 1.0, + "learning_rate": 1.5530829846453566e-06, + "loss": 0.7646, + "step": 39100 + }, + { + "epoch": 1.0, + "learning_rate": 1.553059931454398e-06, + "loss": 0.5913, + "step": 39101 + }, + { + "epoch": 1.0, + "learning_rate": 1.5530368778399867e-06, + "loss": 0.8516, + "step": 39102 + }, + { + "epoch": 1.0, + "learning_rate": 1.5530138238021407e-06, + "loss": 0.8389, + "step": 39103 + }, + { + "epoch": 1.0, + "learning_rate": 1.5529907693408775e-06, + "loss": 0.7383, + "step": 39104 + }, + { + "epoch": 1.0, + "learning_rate": 1.5529677144562147e-06, + "loss": 0.6475, + "step": 39105 + }, + { + "epoch": 1.0, + "learning_rate": 1.5529446591481699e-06, + "loss": 0.5557, + "step": 39106 + }, + { + "epoch": 1.0, + "learning_rate": 1.5529216034167604e-06, + "loss": 0.793, + "step": 39107 + }, + { + "epoch": 1.0, + "learning_rate": 1.5528985472620048e-06, + "loss": 0.5508, + "step": 39108 + }, + { + "epoch": 1.0, + "learning_rate": 1.5528754906839198e-06, + "loss": 0.6016, + "step": 39109 + }, + { + "epoch": 1.0, + "learning_rate": 1.552852433682524e-06, + "loss": 0.6494, + "step": 39110 + }, + { + "epoch": 1.0, + "learning_rate": 1.552829376257834e-06, + "loss": 0.6895, + "step": 39111 + }, + { + "epoch": 1.0, + "learning_rate": 1.5528063184098683e-06, + "loss": 0.5325, + "step": 39112 + }, + { + "epoch": 1.0, + "learning_rate": 1.552783260138644e-06, + "loss": 0.5776, + "step": 39113 + }, + { + "epoch": 1.0, + "learning_rate": 1.5527602014441791e-06, + "loss": 0.7842, + "step": 39114 + }, + { + "epoch": 1.0, + "learning_rate": 1.552737142326491e-06, + "loss": 0.8076, + "step": 39115 + }, + { + "epoch": 1.0, + "learning_rate": 1.5527140827855977e-06, + "loss": 0.7334, + "step": 39116 + }, + { + "epoch": 1.0, + "learning_rate": 1.5526910228215165e-06, + "loss": 0.6416, + "step": 39117 + }, + { + "epoch": 1.0, + "learning_rate": 1.5526679624342651e-06, + "loss": 0.7148, + "step": 39118 + }, + { + "epoch": 1.0, + "learning_rate": 1.5526449016238615e-06, + "loss": 0.6445, + "step": 39119 + }, + { + "epoch": 1.0, + "learning_rate": 1.552621840390323e-06, + "loss": 0.7383, + "step": 39120 + }, + { + "epoch": 1.0, + "learning_rate": 1.552598778733667e-06, + "loss": 0.7622, + "step": 39121 + }, + { + "epoch": 1.0, + "learning_rate": 1.5525757166539122e-06, + "loss": 0.4534, + "step": 39122 + }, + { + "epoch": 1.0, + "learning_rate": 1.5525526541510748e-06, + "loss": 0.7383, + "step": 39123 + }, + { + "epoch": 1.0, + "learning_rate": 1.552529591225174e-06, + "loss": 0.6885, + "step": 39124 + }, + { + "epoch": 1.0, + "learning_rate": 1.5525065278762264e-06, + "loss": 0.5137, + "step": 39125 + }, + { + "epoch": 1.0, + "learning_rate": 1.55248346410425e-06, + "loss": 0.6528, + "step": 39126 + }, + { + "epoch": 1.0, + "learning_rate": 1.5524603999092623e-06, + "loss": 0.4695, + "step": 39127 + }, + { + "epoch": 1.0, + "learning_rate": 1.5524373352912813e-06, + "loss": 0.6782, + "step": 39128 + }, + { + "epoch": 1.0, + "learning_rate": 1.552414270250324e-06, + "loss": 0.8594, + "step": 39129 + }, + { + "epoch": 1.0, + "learning_rate": 1.5523912047864087e-06, + "loss": 0.7427, + "step": 39130 + }, + { + "epoch": 1.0, + "learning_rate": 1.552368138899553e-06, + "loss": 0.562, + "step": 39131 + }, + { + "epoch": 1.0, + "learning_rate": 1.5523450725897744e-06, + "loss": 0.8223, + "step": 39132 + }, + { + "epoch": 1.0, + "learning_rate": 1.5523220058570904e-06, + "loss": 0.5339, + "step": 39133 + }, + { + "epoch": 1.0, + "learning_rate": 1.5522989387015192e-06, + "loss": 0.6919, + "step": 39134 + }, + { + "epoch": 1.0, + "learning_rate": 1.5522758711230775e-06, + "loss": 0.708, + "step": 39135 + }, + { + "epoch": 1.0, + "learning_rate": 1.552252803121784e-06, + "loss": 0.7822, + "step": 39136 + }, + { + "epoch": 1.0, + "learning_rate": 1.5522297346976557e-06, + "loss": 0.6875, + "step": 39137 + }, + { + "epoch": 1.0, + "learning_rate": 1.5522066658507106e-06, + "loss": 0.6006, + "step": 39138 + }, + { + "epoch": 1.0, + "learning_rate": 1.5521835965809663e-06, + "loss": 0.6211, + "step": 39139 + }, + { + "epoch": 1.0, + "learning_rate": 1.5521605268884405e-06, + "loss": 0.2896, + "step": 39140 + }, + { + "epoch": 1.0, + "learning_rate": 1.5521374567731503e-06, + "loss": 0.6982, + "step": 39141 + }, + { + "epoch": 1.0, + "learning_rate": 1.5521143862351146e-06, + "loss": 0.8057, + "step": 39142 + }, + { + "epoch": 1.0, + "learning_rate": 1.5520913152743496e-06, + "loss": 0.5574, + "step": 39143 + }, + { + "epoch": 1.0, + "learning_rate": 1.5520682438908741e-06, + "loss": 0.5356, + "step": 39144 + }, + { + "epoch": 1.0, + "learning_rate": 1.5520451720847053e-06, + "loss": 0.4861, + "step": 39145 + }, + { + "epoch": 1.0, + "learning_rate": 1.5520220998558604e-06, + "loss": 0.7939, + "step": 39146 + }, + { + "epoch": 1.0, + "learning_rate": 1.5519990272043582e-06, + "loss": 0.5903, + "step": 39147 + }, + { + "epoch": 1.0, + "learning_rate": 1.5519759541302154e-06, + "loss": 0.6875, + "step": 39148 + }, + { + "epoch": 1.0, + "learning_rate": 1.55195288063345e-06, + "loss": 0.8525, + "step": 39149 + }, + { + "epoch": 1.0, + "learning_rate": 1.5519298067140797e-06, + "loss": 0.8418, + "step": 39150 + }, + { + "epoch": 1.0, + "learning_rate": 1.5519067323721223e-06, + "loss": 0.6963, + "step": 39151 + }, + { + "epoch": 1.0, + "learning_rate": 1.551883657607595e-06, + "loss": 0.6501, + "step": 39152 + }, + { + "epoch": 1.0, + "learning_rate": 1.5518605824205157e-06, + "loss": 0.6533, + "step": 39153 + }, + { + "epoch": 1.0, + "learning_rate": 1.5518375068109023e-06, + "loss": 0.7803, + "step": 39154 + }, + { + "epoch": 1.0, + "learning_rate": 1.5518144307787724e-06, + "loss": 0.5542, + "step": 39155 + }, + { + "epoch": 1.0, + "learning_rate": 1.5517913543241435e-06, + "loss": 0.6465, + "step": 39156 + }, + { + "epoch": 1.0, + "learning_rate": 1.5517682774470334e-06, + "loss": 0.6675, + "step": 39157 + }, + { + "epoch": 1.0, + "learning_rate": 1.5517452001474593e-06, + "loss": 0.5483, + "step": 39158 + }, + { + "epoch": 1.0, + "learning_rate": 1.5517221224254398e-06, + "loss": 0.5811, + "step": 39159 + }, + { + "epoch": 1.0, + "learning_rate": 1.5516990442809918e-06, + "loss": 0.6963, + "step": 39160 + }, + { + "epoch": 1.0, + "learning_rate": 1.551675965714133e-06, + "loss": 0.5317, + "step": 39161 + }, + { + "epoch": 1.0, + "learning_rate": 1.5516528867248818e-06, + "loss": 0.6846, + "step": 39162 + }, + { + "epoch": 1.0, + "learning_rate": 1.5516298073132547e-06, + "loss": 0.7207, + "step": 39163 + }, + { + "epoch": 1.0, + "learning_rate": 1.5516067274792706e-06, + "loss": 0.6377, + "step": 39164 + }, + { + "epoch": 1.0, + "learning_rate": 1.5515836472229462e-06, + "loss": 0.5239, + "step": 39165 + }, + { + "epoch": 1.0, + "learning_rate": 1.5515605665442998e-06, + "loss": 0.6963, + "step": 39166 + }, + { + "epoch": 1.0, + "learning_rate": 1.5515374854433487e-06, + "loss": 0.5217, + "step": 39167 + }, + { + "epoch": 1.0, + "learning_rate": 1.5515144039201106e-06, + "loss": 0.6904, + "step": 39168 + }, + { + "epoch": 1.0, + "learning_rate": 1.5514913219746038e-06, + "loss": 0.5059, + "step": 39169 + }, + { + "epoch": 1.0, + "learning_rate": 1.551468239606845e-06, + "loss": 0.5059, + "step": 39170 + }, + { + "epoch": 1.0, + "learning_rate": 1.5514451568168525e-06, + "loss": 0.6963, + "step": 39171 + }, + { + "epoch": 1.0, + "learning_rate": 1.5514220736046437e-06, + "loss": 0.6289, + "step": 39172 + }, + { + "epoch": 1.0, + "learning_rate": 1.5513989899702361e-06, + "loss": 0.6553, + "step": 39173 + }, + { + "epoch": 1.0, + "learning_rate": 1.551375905913648e-06, + "loss": 0.6309, + "step": 39174 + }, + { + "epoch": 1.0, + "learning_rate": 1.551352821434897e-06, + "loss": 0.5806, + "step": 39175 + }, + { + "epoch": 1.0, + "learning_rate": 1.5513297365339998e-06, + "loss": 0.7197, + "step": 39176 + }, + { + "epoch": 1.0, + "learning_rate": 1.5513066512109753e-06, + "loss": 0.8525, + "step": 39177 + }, + { + "epoch": 1.0, + "learning_rate": 1.5512835654658405e-06, + "loss": 0.6685, + "step": 39178 + }, + { + "epoch": 1.0, + "learning_rate": 1.5512604792986132e-06, + "loss": 0.5864, + "step": 39179 + }, + { + "epoch": 1.0, + "learning_rate": 1.5512373927093113e-06, + "loss": 0.7119, + "step": 39180 + }, + { + "epoch": 1.0, + "learning_rate": 1.551214305697952e-06, + "loss": 0.792, + "step": 39181 + }, + { + "epoch": 1.0, + "learning_rate": 1.5511912182645531e-06, + "loss": 0.6392, + "step": 39182 + }, + { + "epoch": 1.0, + "learning_rate": 1.5511681304091329e-06, + "loss": 0.3884, + "step": 39183 + }, + { + "epoch": 1.0, + "learning_rate": 1.5511450421317083e-06, + "loss": 0.7363, + "step": 39184 + }, + { + "epoch": 1.0, + "learning_rate": 1.5511219534322972e-06, + "loss": 0.6514, + "step": 39185 + }, + { + "epoch": 1.0, + "learning_rate": 1.5510988643109176e-06, + "loss": 0.5842, + "step": 39186 + }, + { + "epoch": 1.0, + "learning_rate": 1.5510757747675868e-06, + "loss": 0.6792, + "step": 39187 + }, + { + "epoch": 1.0, + "learning_rate": 1.5510526848023227e-06, + "loss": 0.603, + "step": 39188 + }, + { + "epoch": 1.0, + "learning_rate": 1.551029594415143e-06, + "loss": 0.4663, + "step": 39189 + }, + { + "epoch": 1.0, + "learning_rate": 1.551006503606065e-06, + "loss": 0.7393, + "step": 39190 + }, + { + "epoch": 1.0, + "learning_rate": 1.5509834123751069e-06, + "loss": 0.7021, + "step": 39191 + }, + { + "epoch": 1.0, + "learning_rate": 1.5509603207222859e-06, + "loss": 0.6211, + "step": 39192 + }, + { + "epoch": 1.0, + "learning_rate": 1.5509372286476202e-06, + "loss": 0.6055, + "step": 39193 + }, + { + "epoch": 1.0, + "learning_rate": 1.550914136151127e-06, + "loss": 0.5854, + "step": 39194 + }, + { + "epoch": 1.0, + "learning_rate": 1.5508910432328244e-06, + "loss": 0.4395, + "step": 39195 + }, + { + "epoch": 1.0, + "learning_rate": 1.5508679498927295e-06, + "loss": 0.6543, + "step": 39196 + }, + { + "epoch": 1.0, + "learning_rate": 1.5508448561308604e-06, + "loss": 0.5815, + "step": 39197 + }, + { + "epoch": 1.0, + "learning_rate": 1.550821761947235e-06, + "loss": 0.7129, + "step": 39198 + }, + { + "epoch": 1.0, + "learning_rate": 1.5507986673418705e-06, + "loss": 0.7134, + "step": 39199 + }, + { + "epoch": 1.0, + "learning_rate": 1.5507755723147851e-06, + "loss": 0.7881, + "step": 39200 + }, + { + "epoch": 1.0, + "learning_rate": 1.5507524768659957e-06, + "loss": 0.6021, + "step": 39201 + }, + { + "epoch": 1.0, + "learning_rate": 1.5507293809955207e-06, + "loss": 0.574, + "step": 39202 + }, + { + "epoch": 1.0, + "learning_rate": 1.5507062847033774e-06, + "loss": 0.6777, + "step": 39203 + }, + { + "epoch": 1.0, + "learning_rate": 1.5506831879895836e-06, + "loss": 0.5696, + "step": 39204 + }, + { + "epoch": 1.0, + "learning_rate": 1.5506600908541572e-06, + "loss": 0.543, + "step": 39205 + }, + { + "epoch": 1.0, + "learning_rate": 1.5506369932971155e-06, + "loss": 0.625, + "step": 39206 + }, + { + "epoch": 1.0, + "learning_rate": 1.5506138953184765e-06, + "loss": 0.6553, + "step": 39207 + }, + { + "epoch": 1.0, + "learning_rate": 1.5505907969182577e-06, + "loss": 0.709, + "step": 39208 + }, + { + "epoch": 1.0, + "learning_rate": 1.550567698096477e-06, + "loss": 0.6855, + "step": 39209 + }, + { + "epoch": 1.0, + "learning_rate": 1.5505445988531517e-06, + "loss": 0.6265, + "step": 39210 + }, + { + "epoch": 1.0, + "learning_rate": 1.5505214991883e-06, + "loss": 0.6172, + "step": 39211 + }, + { + "epoch": 1.01, + "learning_rate": 1.5504983991019392e-06, + "loss": 0.7666, + "step": 39212 + }, + { + "epoch": 1.01, + "learning_rate": 1.5504752985940867e-06, + "loss": 0.6504, + "step": 39213 + }, + { + "epoch": 1.01, + "learning_rate": 1.5504521976647613e-06, + "loss": 0.8174, + "step": 39214 + }, + { + "epoch": 1.01, + "learning_rate": 1.5504290963139795e-06, + "loss": 0.4951, + "step": 39215 + }, + { + "epoch": 1.01, + "learning_rate": 1.5504059945417593e-06, + "loss": 0.5669, + "step": 39216 + }, + { + "epoch": 1.01, + "learning_rate": 1.5503828923481189e-06, + "loss": 0.6646, + "step": 39217 + }, + { + "epoch": 1.01, + "learning_rate": 1.5503597897330754e-06, + "loss": 0.4766, + "step": 39218 + }, + { + "epoch": 1.01, + "learning_rate": 1.5503366866966468e-06, + "loss": 0.7241, + "step": 39219 + }, + { + "epoch": 1.01, + "learning_rate": 1.5503135832388508e-06, + "loss": 0.7017, + "step": 39220 + }, + { + "epoch": 1.01, + "learning_rate": 1.5502904793597047e-06, + "loss": 0.7393, + "step": 39221 + }, + { + "epoch": 1.01, + "learning_rate": 1.5502673750592268e-06, + "loss": 0.6816, + "step": 39222 + }, + { + "epoch": 1.01, + "learning_rate": 1.5502442703374343e-06, + "loss": 0.625, + "step": 39223 + }, + { + "epoch": 1.01, + "learning_rate": 1.5502211651943452e-06, + "loss": 0.5234, + "step": 39224 + }, + { + "epoch": 1.01, + "learning_rate": 1.5501980596299768e-06, + "loss": 0.5781, + "step": 39225 + }, + { + "epoch": 1.01, + "learning_rate": 1.5501749536443472e-06, + "loss": 0.6362, + "step": 39226 + }, + { + "epoch": 1.01, + "learning_rate": 1.5501518472374739e-06, + "loss": 0.5854, + "step": 39227 + }, + { + "epoch": 1.01, + "learning_rate": 1.5501287404093747e-06, + "loss": 0.4189, + "step": 39228 + }, + { + "epoch": 1.01, + "learning_rate": 1.5501056331600672e-06, + "loss": 0.8506, + "step": 39229 + }, + { + "epoch": 1.01, + "learning_rate": 1.5500825254895692e-06, + "loss": 0.5847, + "step": 39230 + }, + { + "epoch": 1.01, + "learning_rate": 1.550059417397898e-06, + "loss": 0.5999, + "step": 39231 + }, + { + "epoch": 1.01, + "learning_rate": 1.550036308885072e-06, + "loss": 0.8389, + "step": 39232 + }, + { + "epoch": 1.01, + "learning_rate": 1.5500131999511082e-06, + "loss": 0.8057, + "step": 39233 + }, + { + "epoch": 1.01, + "learning_rate": 1.5499900905960245e-06, + "loss": 0.5537, + "step": 39234 + }, + { + "epoch": 1.01, + "learning_rate": 1.549966980819839e-06, + "loss": 0.7744, + "step": 39235 + }, + { + "epoch": 1.01, + "learning_rate": 1.5499438706225689e-06, + "loss": 0.6758, + "step": 39236 + }, + { + "epoch": 1.01, + "learning_rate": 1.549920760004232e-06, + "loss": 0.6299, + "step": 39237 + }, + { + "epoch": 1.01, + "learning_rate": 1.5498976489648463e-06, + "loss": 0.6938, + "step": 39238 + }, + { + "epoch": 1.01, + "learning_rate": 1.5498745375044291e-06, + "loss": 0.7393, + "step": 39239 + }, + { + "epoch": 1.01, + "learning_rate": 1.5498514256229983e-06, + "loss": 0.8008, + "step": 39240 + }, + { + "epoch": 1.01, + "learning_rate": 1.5498283133205713e-06, + "loss": 0.6011, + "step": 39241 + }, + { + "epoch": 1.01, + "learning_rate": 1.5498052005971663e-06, + "loss": 0.6201, + "step": 39242 + }, + { + "epoch": 1.01, + "learning_rate": 1.5497820874528004e-06, + "loss": 0.7168, + "step": 39243 + }, + { + "epoch": 1.01, + "learning_rate": 1.5497589738874922e-06, + "loss": 0.4673, + "step": 39244 + }, + { + "epoch": 1.01, + "learning_rate": 1.5497358599012586e-06, + "loss": 0.4619, + "step": 39245 + }, + { + "epoch": 1.01, + "learning_rate": 1.5497127454941174e-06, + "loss": 0.7754, + "step": 39246 + }, + { + "epoch": 1.01, + "learning_rate": 1.5496896306660864e-06, + "loss": 0.9111, + "step": 39247 + }, + { + "epoch": 1.01, + "learning_rate": 1.5496665154171836e-06, + "loss": 0.6597, + "step": 39248 + }, + { + "epoch": 1.01, + "learning_rate": 1.5496433997474263e-06, + "loss": 0.5396, + "step": 39249 + }, + { + "epoch": 1.01, + "learning_rate": 1.5496202836568323e-06, + "loss": 0.6904, + "step": 39250 + }, + { + "epoch": 1.01, + "learning_rate": 1.5495971671454192e-06, + "loss": 0.5425, + "step": 39251 + }, + { + "epoch": 1.01, + "learning_rate": 1.5495740502132048e-06, + "loss": 0.6436, + "step": 39252 + }, + { + "epoch": 1.01, + "learning_rate": 1.5495509328602067e-06, + "loss": 0.6787, + "step": 39253 + }, + { + "epoch": 1.01, + "learning_rate": 1.5495278150864433e-06, + "loss": 0.7998, + "step": 39254 + }, + { + "epoch": 1.01, + "learning_rate": 1.5495046968919315e-06, + "loss": 0.5234, + "step": 39255 + }, + { + "epoch": 1.01, + "learning_rate": 1.5494815782766889e-06, + "loss": 0.6572, + "step": 39256 + }, + { + "epoch": 1.01, + "learning_rate": 1.5494584592407337e-06, + "loss": 0.7607, + "step": 39257 + }, + { + "epoch": 1.01, + "learning_rate": 1.5494353397840833e-06, + "loss": 0.687, + "step": 39258 + }, + { + "epoch": 1.01, + "learning_rate": 1.5494122199067559e-06, + "loss": 0.7969, + "step": 39259 + }, + { + "epoch": 1.01, + "learning_rate": 1.5493890996087684e-06, + "loss": 0.5337, + "step": 39260 + }, + { + "epoch": 1.01, + "learning_rate": 1.5493659788901393e-06, + "loss": 0.4785, + "step": 39261 + }, + { + "epoch": 1.01, + "learning_rate": 1.5493428577508857e-06, + "loss": 0.7002, + "step": 39262 + }, + { + "epoch": 1.01, + "learning_rate": 1.5493197361910256e-06, + "loss": 0.6338, + "step": 39263 + }, + { + "epoch": 1.01, + "learning_rate": 1.5492966142105766e-06, + "loss": 0.7051, + "step": 39264 + }, + { + "epoch": 1.01, + "learning_rate": 1.5492734918095564e-06, + "loss": 0.646, + "step": 39265 + }, + { + "epoch": 1.01, + "learning_rate": 1.5492503689879827e-06, + "loss": 0.4814, + "step": 39266 + }, + { + "epoch": 1.01, + "learning_rate": 1.5492272457458735e-06, + "loss": 0.6641, + "step": 39267 + }, + { + "epoch": 1.01, + "learning_rate": 1.5492041220832458e-06, + "loss": 0.6729, + "step": 39268 + }, + { + "epoch": 1.01, + "learning_rate": 1.5491809980001182e-06, + "loss": 0.6758, + "step": 39269 + }, + { + "epoch": 1.01, + "learning_rate": 1.5491578734965077e-06, + "loss": 0.5273, + "step": 39270 + }, + { + "epoch": 1.01, + "learning_rate": 1.5491347485724325e-06, + "loss": 0.5884, + "step": 39271 + }, + { + "epoch": 1.01, + "learning_rate": 1.54911162322791e-06, + "loss": 0.646, + "step": 39272 + }, + { + "epoch": 1.01, + "learning_rate": 1.549088497462958e-06, + "loss": 0.5542, + "step": 39273 + }, + { + "epoch": 1.01, + "learning_rate": 1.549065371277594e-06, + "loss": 0.5679, + "step": 39274 + }, + { + "epoch": 1.01, + "learning_rate": 1.549042244671836e-06, + "loss": 0.7373, + "step": 39275 + }, + { + "epoch": 1.01, + "learning_rate": 1.5490191176457014e-06, + "loss": 0.7783, + "step": 39276 + }, + { + "epoch": 1.01, + "learning_rate": 1.5489959901992084e-06, + "loss": 0.6787, + "step": 39277 + }, + { + "epoch": 1.01, + "learning_rate": 1.5489728623323744e-06, + "loss": 0.6113, + "step": 39278 + }, + { + "epoch": 1.01, + "learning_rate": 1.5489497340452173e-06, + "loss": 0.5825, + "step": 39279 + }, + { + "epoch": 1.01, + "learning_rate": 1.5489266053377543e-06, + "loss": 0.7666, + "step": 39280 + }, + { + "epoch": 1.01, + "learning_rate": 1.5489034762100034e-06, + "loss": 0.7539, + "step": 39281 + }, + { + "epoch": 1.01, + "learning_rate": 1.5488803466619825e-06, + "loss": 0.7393, + "step": 39282 + }, + { + "epoch": 1.01, + "learning_rate": 1.548857216693709e-06, + "loss": 0.6562, + "step": 39283 + }, + { + "epoch": 1.01, + "learning_rate": 1.5488340863052009e-06, + "loss": 0.749, + "step": 39284 + }, + { + "epoch": 1.01, + "learning_rate": 1.5488109554964758e-06, + "loss": 0.7734, + "step": 39285 + }, + { + "epoch": 1.01, + "learning_rate": 1.5487878242675514e-06, + "loss": 0.6064, + "step": 39286 + }, + { + "epoch": 1.01, + "learning_rate": 1.5487646926184454e-06, + "loss": 0.6499, + "step": 39287 + }, + { + "epoch": 1.01, + "learning_rate": 1.5487415605491754e-06, + "loss": 0.7539, + "step": 39288 + }, + { + "epoch": 1.01, + "learning_rate": 1.5487184280597595e-06, + "loss": 0.5132, + "step": 39289 + }, + { + "epoch": 1.01, + "learning_rate": 1.5486952951502148e-06, + "loss": 0.6035, + "step": 39290 + }, + { + "epoch": 1.01, + "learning_rate": 1.5486721618205594e-06, + "loss": 0.6533, + "step": 39291 + }, + { + "epoch": 1.01, + "learning_rate": 1.5486490280708112e-06, + "loss": 0.625, + "step": 39292 + }, + { + "epoch": 1.01, + "learning_rate": 1.5486258939009874e-06, + "loss": 0.5879, + "step": 39293 + }, + { + "epoch": 1.01, + "learning_rate": 1.548602759311106e-06, + "loss": 0.709, + "step": 39294 + }, + { + "epoch": 1.01, + "learning_rate": 1.5485796243011847e-06, + "loss": 0.7568, + "step": 39295 + }, + { + "epoch": 1.01, + "learning_rate": 1.5485564888712412e-06, + "loss": 0.7207, + "step": 39296 + }, + { + "epoch": 1.01, + "learning_rate": 1.5485333530212932e-06, + "loss": 0.7695, + "step": 39297 + }, + { + "epoch": 1.01, + "learning_rate": 1.5485102167513583e-06, + "loss": 0.7061, + "step": 39298 + }, + { + "epoch": 1.01, + "learning_rate": 1.5484870800614548e-06, + "loss": 0.7832, + "step": 39299 + }, + { + "epoch": 1.01, + "learning_rate": 1.5484639429515997e-06, + "loss": 0.7031, + "step": 39300 + }, + { + "epoch": 1.01, + "learning_rate": 1.548440805421811e-06, + "loss": 0.5811, + "step": 39301 + }, + { + "epoch": 1.01, + "learning_rate": 1.5484176674721064e-06, + "loss": 0.5823, + "step": 39302 + }, + { + "epoch": 1.01, + "learning_rate": 1.5483945291025035e-06, + "loss": 0.6924, + "step": 39303 + }, + { + "epoch": 1.01, + "learning_rate": 1.5483713903130204e-06, + "loss": 0.4331, + "step": 39304 + }, + { + "epoch": 1.01, + "learning_rate": 1.5483482511036744e-06, + "loss": 0.4541, + "step": 39305 + }, + { + "epoch": 1.01, + "learning_rate": 1.548325111474483e-06, + "loss": 0.5225, + "step": 39306 + }, + { + "epoch": 1.01, + "learning_rate": 1.5483019714254648e-06, + "loss": 0.6797, + "step": 39307 + }, + { + "epoch": 1.01, + "learning_rate": 1.5482788309566366e-06, + "loss": 0.6582, + "step": 39308 + }, + { + "epoch": 1.01, + "learning_rate": 1.548255690068017e-06, + "loss": 0.6787, + "step": 39309 + }, + { + "epoch": 1.01, + "learning_rate": 1.548232548759623e-06, + "loss": 0.7109, + "step": 39310 + }, + { + "epoch": 1.01, + "learning_rate": 1.5482094070314721e-06, + "loss": 0.6982, + "step": 39311 + }, + { + "epoch": 1.01, + "learning_rate": 1.5481862648835828e-06, + "loss": 0.6035, + "step": 39312 + }, + { + "epoch": 1.01, + "learning_rate": 1.5481631223159726e-06, + "loss": 0.5273, + "step": 39313 + }, + { + "epoch": 1.01, + "learning_rate": 1.5481399793286589e-06, + "loss": 0.7852, + "step": 39314 + }, + { + "epoch": 1.01, + "learning_rate": 1.54811683592166e-06, + "loss": 0.8955, + "step": 39315 + }, + { + "epoch": 1.01, + "learning_rate": 1.5480936920949929e-06, + "loss": 0.5042, + "step": 39316 + }, + { + "epoch": 1.01, + "learning_rate": 1.5480705478486758e-06, + "loss": 0.5596, + "step": 39317 + }, + { + "epoch": 1.01, + "learning_rate": 1.5480474031827261e-06, + "loss": 0.7051, + "step": 39318 + }, + { + "epoch": 1.01, + "learning_rate": 1.5480242580971618e-06, + "loss": 0.6309, + "step": 39319 + }, + { + "epoch": 1.01, + "learning_rate": 1.5480011125920007e-06, + "loss": 0.686, + "step": 39320 + }, + { + "epoch": 1.01, + "learning_rate": 1.54797796666726e-06, + "loss": 0.7578, + "step": 39321 + }, + { + "epoch": 1.01, + "learning_rate": 1.547954820322958e-06, + "loss": 0.6953, + "step": 39322 + }, + { + "epoch": 1.01, + "learning_rate": 1.547931673559112e-06, + "loss": 0.7188, + "step": 39323 + }, + { + "epoch": 1.01, + "learning_rate": 1.5479085263757403e-06, + "loss": 0.6406, + "step": 39324 + }, + { + "epoch": 1.01, + "learning_rate": 1.5478853787728601e-06, + "loss": 0.52, + "step": 39325 + }, + { + "epoch": 1.01, + "learning_rate": 1.5478622307504892e-06, + "loss": 0.792, + "step": 39326 + }, + { + "epoch": 1.01, + "learning_rate": 1.5478390823086452e-06, + "loss": 0.4535, + "step": 39327 + }, + { + "epoch": 1.01, + "learning_rate": 1.547815933447346e-06, + "loss": 0.645, + "step": 39328 + }, + { + "epoch": 1.01, + "learning_rate": 1.5477927841666096e-06, + "loss": 0.5908, + "step": 39329 + }, + { + "epoch": 1.01, + "learning_rate": 1.5477696344664532e-06, + "loss": 0.4561, + "step": 39330 + }, + { + "epoch": 1.01, + "learning_rate": 1.547746484346895e-06, + "loss": 0.533, + "step": 39331 + }, + { + "epoch": 1.01, + "learning_rate": 1.5477233338079526e-06, + "loss": 0.748, + "step": 39332 + }, + { + "epoch": 1.01, + "learning_rate": 1.5477001828496431e-06, + "loss": 0.7568, + "step": 39333 + }, + { + "epoch": 1.01, + "learning_rate": 1.5476770314719854e-06, + "loss": 0.6611, + "step": 39334 + }, + { + "epoch": 1.01, + "learning_rate": 1.5476538796749962e-06, + "loss": 0.7285, + "step": 39335 + }, + { + "epoch": 1.01, + "learning_rate": 1.5476307274586937e-06, + "loss": 0.6821, + "step": 39336 + }, + { + "epoch": 1.01, + "learning_rate": 1.5476075748230955e-06, + "loss": 0.5703, + "step": 39337 + }, + { + "epoch": 1.01, + "learning_rate": 1.5475844217682192e-06, + "loss": 0.6489, + "step": 39338 + }, + { + "epoch": 1.01, + "learning_rate": 1.5475612682940828e-06, + "loss": 0.7637, + "step": 39339 + }, + { + "epoch": 1.01, + "learning_rate": 1.5475381144007042e-06, + "loss": 0.8486, + "step": 39340 + }, + { + "epoch": 1.01, + "learning_rate": 1.5475149600881006e-06, + "loss": 0.665, + "step": 39341 + }, + { + "epoch": 1.01, + "learning_rate": 1.54749180535629e-06, + "loss": 0.6729, + "step": 39342 + }, + { + "epoch": 1.01, + "learning_rate": 1.5474686502052899e-06, + "loss": 0.6392, + "step": 39343 + }, + { + "epoch": 1.01, + "learning_rate": 1.5474454946351187e-06, + "loss": 0.8301, + "step": 39344 + }, + { + "epoch": 1.01, + "learning_rate": 1.547422338645793e-06, + "loss": 0.5115, + "step": 39345 + }, + { + "epoch": 1.01, + "learning_rate": 1.5473991822373319e-06, + "loss": 0.6797, + "step": 39346 + }, + { + "epoch": 1.01, + "learning_rate": 1.547376025409752e-06, + "loss": 0.6709, + "step": 39347 + }, + { + "epoch": 1.01, + "learning_rate": 1.5473528681630711e-06, + "loss": 0.5737, + "step": 39348 + }, + { + "epoch": 1.01, + "learning_rate": 1.547329710497308e-06, + "loss": 0.4753, + "step": 39349 + }, + { + "epoch": 1.01, + "learning_rate": 1.5473065524124795e-06, + "loss": 0.7021, + "step": 39350 + }, + { + "epoch": 1.01, + "learning_rate": 1.5472833939086033e-06, + "loss": 0.4125, + "step": 39351 + }, + { + "epoch": 1.01, + "learning_rate": 1.5472602349856975e-06, + "loss": 0.6187, + "step": 39352 + }, + { + "epoch": 1.01, + "learning_rate": 1.5472370756437797e-06, + "loss": 0.5249, + "step": 39353 + }, + { + "epoch": 1.01, + "learning_rate": 1.547213915882868e-06, + "loss": 0.6328, + "step": 39354 + }, + { + "epoch": 1.01, + "learning_rate": 1.5471907557029793e-06, + "loss": 0.6367, + "step": 39355 + }, + { + "epoch": 1.01, + "learning_rate": 1.5471675951041315e-06, + "loss": 0.5332, + "step": 39356 + }, + { + "epoch": 1.01, + "learning_rate": 1.5471444340863434e-06, + "loss": 0.6357, + "step": 39357 + }, + { + "epoch": 1.01, + "learning_rate": 1.5471212726496313e-06, + "loss": 0.5791, + "step": 39358 + }, + { + "epoch": 1.01, + "learning_rate": 1.5470981107940139e-06, + "loss": 0.6606, + "step": 39359 + }, + { + "epoch": 1.01, + "learning_rate": 1.547074948519509e-06, + "loss": 0.7324, + "step": 39360 + }, + { + "epoch": 1.01, + "learning_rate": 1.5470517858261334e-06, + "loss": 0.4526, + "step": 39361 + }, + { + "epoch": 1.01, + "learning_rate": 1.5470286227139059e-06, + "loss": 0.5967, + "step": 39362 + }, + { + "epoch": 1.01, + "learning_rate": 1.5470054591828433e-06, + "loss": 0.6294, + "step": 39363 + }, + { + "epoch": 1.01, + "learning_rate": 1.546982295232964e-06, + "loss": 0.6934, + "step": 39364 + }, + { + "epoch": 1.01, + "learning_rate": 1.5469591308642853e-06, + "loss": 0.6094, + "step": 39365 + }, + { + "epoch": 1.01, + "learning_rate": 1.546935966076825e-06, + "loss": 0.6479, + "step": 39366 + }, + { + "epoch": 1.01, + "learning_rate": 1.5469128008706014e-06, + "loss": 0.625, + "step": 39367 + }, + { + "epoch": 1.01, + "learning_rate": 1.5468896352456317e-06, + "loss": 0.7441, + "step": 39368 + }, + { + "epoch": 1.01, + "learning_rate": 1.5468664692019337e-06, + "loss": 0.8271, + "step": 39369 + }, + { + "epoch": 1.01, + "learning_rate": 1.5468433027395253e-06, + "loss": 0.8135, + "step": 39370 + }, + { + "epoch": 1.01, + "learning_rate": 1.5468201358584239e-06, + "loss": 0.5721, + "step": 39371 + }, + { + "epoch": 1.01, + "learning_rate": 1.5467969685586474e-06, + "loss": 0.7031, + "step": 39372 + }, + { + "epoch": 1.01, + "learning_rate": 1.5467738008402141e-06, + "loss": 0.5121, + "step": 39373 + }, + { + "epoch": 1.01, + "learning_rate": 1.546750632703141e-06, + "loss": 0.5312, + "step": 39374 + }, + { + "epoch": 1.01, + "learning_rate": 1.5467274641474458e-06, + "loss": 0.7559, + "step": 39375 + }, + { + "epoch": 1.01, + "learning_rate": 1.5467042951731468e-06, + "loss": 0.7666, + "step": 39376 + }, + { + "epoch": 1.01, + "learning_rate": 1.5466811257802615e-06, + "loss": 0.8477, + "step": 39377 + }, + { + "epoch": 1.01, + "learning_rate": 1.5466579559688073e-06, + "loss": 0.707, + "step": 39378 + }, + { + "epoch": 1.01, + "learning_rate": 1.546634785738803e-06, + "loss": 0.5469, + "step": 39379 + }, + { + "epoch": 1.01, + "learning_rate": 1.5466116150902647e-06, + "loss": 0.6011, + "step": 39380 + }, + { + "epoch": 1.01, + "learning_rate": 1.5465884440232114e-06, + "loss": 0.7266, + "step": 39381 + }, + { + "epoch": 1.01, + "learning_rate": 1.5465652725376603e-06, + "loss": 0.5845, + "step": 39382 + }, + { + "epoch": 1.01, + "learning_rate": 1.5465421006336295e-06, + "loss": 0.7256, + "step": 39383 + }, + { + "epoch": 1.01, + "learning_rate": 1.5465189283111364e-06, + "loss": 0.6982, + "step": 39384 + }, + { + "epoch": 1.01, + "learning_rate": 1.546495755570199e-06, + "loss": 0.6875, + "step": 39385 + }, + { + "epoch": 1.01, + "learning_rate": 1.5464725824108347e-06, + "loss": 0.707, + "step": 39386 + }, + { + "epoch": 1.01, + "learning_rate": 1.5464494088330616e-06, + "loss": 0.8086, + "step": 39387 + }, + { + "epoch": 1.01, + "learning_rate": 1.5464262348368974e-06, + "loss": 0.6875, + "step": 39388 + }, + { + "epoch": 1.01, + "learning_rate": 1.5464030604223597e-06, + "loss": 0.6646, + "step": 39389 + }, + { + "epoch": 1.01, + "learning_rate": 1.5463798855894664e-06, + "loss": 0.6694, + "step": 39390 + }, + { + "epoch": 1.01, + "learning_rate": 1.546356710338235e-06, + "loss": 0.7637, + "step": 39391 + }, + { + "epoch": 1.01, + "learning_rate": 1.5463335346686834e-06, + "loss": 0.7441, + "step": 39392 + }, + { + "epoch": 1.01, + "learning_rate": 1.5463103585808296e-06, + "loss": 0.4692, + "step": 39393 + }, + { + "epoch": 1.01, + "learning_rate": 1.5462871820746907e-06, + "loss": 0.7168, + "step": 39394 + }, + { + "epoch": 1.01, + "learning_rate": 1.546264005150285e-06, + "loss": 0.7139, + "step": 39395 + }, + { + "epoch": 1.01, + "learning_rate": 1.54624082780763e-06, + "loss": 0.6104, + "step": 39396 + }, + { + "epoch": 1.01, + "learning_rate": 1.5462176500467435e-06, + "loss": 0.7578, + "step": 39397 + }, + { + "epoch": 1.01, + "learning_rate": 1.5461944718676435e-06, + "loss": 0.8701, + "step": 39398 + }, + { + "epoch": 1.01, + "learning_rate": 1.5461712932703471e-06, + "loss": 0.6885, + "step": 39399 + }, + { + "epoch": 1.01, + "learning_rate": 1.546148114254873e-06, + "loss": 0.564, + "step": 39400 + }, + { + "epoch": 1.01, + "learning_rate": 1.546124934821238e-06, + "loss": 0.6982, + "step": 39401 + }, + { + "epoch": 1.01, + "learning_rate": 1.5461017549694605e-06, + "loss": 0.5913, + "step": 39402 + }, + { + "epoch": 1.01, + "learning_rate": 1.5460785746995574e-06, + "loss": 0.7183, + "step": 39403 + }, + { + "epoch": 1.01, + "learning_rate": 1.5460553940115477e-06, + "loss": 0.7158, + "step": 39404 + }, + { + "epoch": 1.01, + "learning_rate": 1.5460322129054482e-06, + "loss": 0.6875, + "step": 39405 + }, + { + "epoch": 1.01, + "learning_rate": 1.546009031381277e-06, + "loss": 0.5244, + "step": 39406 + }, + { + "epoch": 1.01, + "learning_rate": 1.5459858494390518e-06, + "loss": 0.6699, + "step": 39407 + }, + { + "epoch": 1.01, + "learning_rate": 1.5459626670787903e-06, + "loss": 0.6465, + "step": 39408 + }, + { + "epoch": 1.01, + "learning_rate": 1.5459394843005105e-06, + "loss": 0.6865, + "step": 39409 + }, + { + "epoch": 1.01, + "learning_rate": 1.5459163011042296e-06, + "loss": 0.667, + "step": 39410 + }, + { + "epoch": 1.01, + "learning_rate": 1.5458931174899658e-06, + "loss": 0.4849, + "step": 39411 + }, + { + "epoch": 1.01, + "learning_rate": 1.545869933457737e-06, + "loss": 0.5986, + "step": 39412 + }, + { + "epoch": 1.01, + "learning_rate": 1.5458467490075604e-06, + "loss": 0.645, + "step": 39413 + }, + { + "epoch": 1.01, + "learning_rate": 1.545823564139454e-06, + "loss": 0.7344, + "step": 39414 + }, + { + "epoch": 1.01, + "learning_rate": 1.5458003788534359e-06, + "loss": 0.5801, + "step": 39415 + }, + { + "epoch": 1.01, + "learning_rate": 1.5457771931495234e-06, + "loss": 0.6963, + "step": 39416 + }, + { + "epoch": 1.01, + "learning_rate": 1.5457540070277344e-06, + "loss": 0.5781, + "step": 39417 + }, + { + "epoch": 1.01, + "learning_rate": 1.5457308204880865e-06, + "loss": 0.5322, + "step": 39418 + }, + { + "epoch": 1.01, + "learning_rate": 1.5457076335305979e-06, + "loss": 0.8262, + "step": 39419 + }, + { + "epoch": 1.01, + "learning_rate": 1.545684446155286e-06, + "loss": 0.5881, + "step": 39420 + }, + { + "epoch": 1.01, + "learning_rate": 1.5456612583621684e-06, + "loss": 0.8135, + "step": 39421 + }, + { + "epoch": 1.01, + "learning_rate": 1.545638070151263e-06, + "loss": 0.792, + "step": 39422 + }, + { + "epoch": 1.01, + "learning_rate": 1.5456148815225877e-06, + "loss": 0.6465, + "step": 39423 + }, + { + "epoch": 1.01, + "learning_rate": 1.5455916924761604e-06, + "loss": 0.8281, + "step": 39424 + }, + { + "epoch": 1.01, + "learning_rate": 1.5455685030119985e-06, + "loss": 0.6309, + "step": 39425 + }, + { + "epoch": 1.01, + "learning_rate": 1.54554531313012e-06, + "loss": 0.6885, + "step": 39426 + }, + { + "epoch": 1.01, + "learning_rate": 1.5455221228305421e-06, + "loss": 0.5161, + "step": 39427 + }, + { + "epoch": 1.01, + "learning_rate": 1.5454989321132835e-06, + "loss": 0.7617, + "step": 39428 + }, + { + "epoch": 1.01, + "learning_rate": 1.5454757409783613e-06, + "loss": 0.79, + "step": 39429 + }, + { + "epoch": 1.01, + "learning_rate": 1.5454525494257933e-06, + "loss": 0.6787, + "step": 39430 + }, + { + "epoch": 1.01, + "learning_rate": 1.5454293574555974e-06, + "loss": 0.7432, + "step": 39431 + }, + { + "epoch": 1.01, + "learning_rate": 1.5454061650677913e-06, + "loss": 0.3538, + "step": 39432 + }, + { + "epoch": 1.01, + "learning_rate": 1.5453829722623927e-06, + "loss": 0.8047, + "step": 39433 + }, + { + "epoch": 1.01, + "learning_rate": 1.54535977903942e-06, + "loss": 0.5698, + "step": 39434 + }, + { + "epoch": 1.01, + "learning_rate": 1.5453365853988895e-06, + "loss": 0.5312, + "step": 39435 + }, + { + "epoch": 1.01, + "learning_rate": 1.5453133913408205e-06, + "loss": 0.624, + "step": 39436 + }, + { + "epoch": 1.01, + "learning_rate": 1.5452901968652298e-06, + "loss": 0.708, + "step": 39437 + }, + { + "epoch": 1.01, + "learning_rate": 1.5452670019721356e-06, + "loss": 0.6343, + "step": 39438 + }, + { + "epoch": 1.01, + "learning_rate": 1.5452438066615555e-06, + "loss": 0.832, + "step": 39439 + }, + { + "epoch": 1.01, + "learning_rate": 1.5452206109335072e-06, + "loss": 0.603, + "step": 39440 + }, + { + "epoch": 1.01, + "learning_rate": 1.5451974147880087e-06, + "loss": 0.6025, + "step": 39441 + }, + { + "epoch": 1.01, + "learning_rate": 1.5451742182250777e-06, + "loss": 0.7129, + "step": 39442 + }, + { + "epoch": 1.01, + "learning_rate": 1.5451510212447319e-06, + "loss": 0.6211, + "step": 39443 + }, + { + "epoch": 1.01, + "learning_rate": 1.5451278238469888e-06, + "loss": 0.5796, + "step": 39444 + }, + { + "epoch": 1.01, + "learning_rate": 1.5451046260318665e-06, + "loss": 0.6738, + "step": 39445 + }, + { + "epoch": 1.01, + "learning_rate": 1.5450814277993824e-06, + "loss": 0.6519, + "step": 39446 + }, + { + "epoch": 1.01, + "learning_rate": 1.545058229149555e-06, + "loss": 0.6777, + "step": 39447 + }, + { + "epoch": 1.01, + "learning_rate": 1.5450350300824011e-06, + "loss": 0.6265, + "step": 39448 + }, + { + "epoch": 1.01, + "learning_rate": 1.545011830597939e-06, + "loss": 0.5249, + "step": 39449 + }, + { + "epoch": 1.01, + "learning_rate": 1.5449886306961866e-06, + "loss": 0.6992, + "step": 39450 + }, + { + "epoch": 1.01, + "learning_rate": 1.5449654303771613e-06, + "loss": 0.7129, + "step": 39451 + }, + { + "epoch": 1.01, + "learning_rate": 1.5449422296408812e-06, + "loss": 0.7363, + "step": 39452 + }, + { + "epoch": 1.01, + "learning_rate": 1.544919028487364e-06, + "loss": 0.5791, + "step": 39453 + }, + { + "epoch": 1.01, + "learning_rate": 1.544895826916627e-06, + "loss": 0.8135, + "step": 39454 + }, + { + "epoch": 1.01, + "learning_rate": 1.5448726249286884e-06, + "loss": 0.5442, + "step": 39455 + }, + { + "epoch": 1.01, + "learning_rate": 1.544849422523566e-06, + "loss": 0.7881, + "step": 39456 + }, + { + "epoch": 1.01, + "learning_rate": 1.5448262197012774e-06, + "loss": 0.624, + "step": 39457 + }, + { + "epoch": 1.01, + "learning_rate": 1.5448030164618406e-06, + "loss": 0.7163, + "step": 39458 + }, + { + "epoch": 1.01, + "learning_rate": 1.544779812805273e-06, + "loss": 0.666, + "step": 39459 + }, + { + "epoch": 1.01, + "learning_rate": 1.5447566087315927e-06, + "loss": 0.8145, + "step": 39460 + }, + { + "epoch": 1.01, + "learning_rate": 1.5447334042408168e-06, + "loss": 0.6128, + "step": 39461 + }, + { + "epoch": 1.01, + "learning_rate": 1.544710199332964e-06, + "loss": 0.8145, + "step": 39462 + }, + { + "epoch": 1.01, + "learning_rate": 1.5446869940080517e-06, + "loss": 0.3967, + "step": 39463 + }, + { + "epoch": 1.01, + "learning_rate": 1.5446637882660975e-06, + "loss": 0.8828, + "step": 39464 + }, + { + "epoch": 1.01, + "learning_rate": 1.5446405821071194e-06, + "loss": 0.7754, + "step": 39465 + }, + { + "epoch": 1.01, + "learning_rate": 1.544617375531135e-06, + "loss": 0.6655, + "step": 39466 + }, + { + "epoch": 1.01, + "learning_rate": 1.544594168538162e-06, + "loss": 0.5762, + "step": 39467 + }, + { + "epoch": 1.01, + "learning_rate": 1.5445709611282186e-06, + "loss": 0.6401, + "step": 39468 + }, + { + "epoch": 1.01, + "learning_rate": 1.544547753301322e-06, + "loss": 0.5032, + "step": 39469 + }, + { + "epoch": 1.01, + "learning_rate": 1.54452454505749e-06, + "loss": 0.6509, + "step": 39470 + }, + { + "epoch": 1.01, + "learning_rate": 1.5445013363967409e-06, + "loss": 0.7529, + "step": 39471 + }, + { + "epoch": 1.01, + "learning_rate": 1.5444781273190919e-06, + "loss": 0.6104, + "step": 39472 + }, + { + "epoch": 1.01, + "learning_rate": 1.5444549178245614e-06, + "loss": 0.7148, + "step": 39473 + }, + { + "epoch": 1.01, + "learning_rate": 1.5444317079131667e-06, + "loss": 0.6914, + "step": 39474 + }, + { + "epoch": 1.01, + "learning_rate": 1.5444084975849254e-06, + "loss": 0.7207, + "step": 39475 + }, + { + "epoch": 1.01, + "learning_rate": 1.5443852868398558e-06, + "loss": 0.832, + "step": 39476 + }, + { + "epoch": 1.01, + "learning_rate": 1.5443620756779753e-06, + "loss": 0.5659, + "step": 39477 + }, + { + "epoch": 1.01, + "learning_rate": 1.544338864099302e-06, + "loss": 0.6157, + "step": 39478 + }, + { + "epoch": 1.01, + "learning_rate": 1.5443156521038532e-06, + "loss": 0.668, + "step": 39479 + }, + { + "epoch": 1.01, + "learning_rate": 1.544292439691647e-06, + "loss": 0.5029, + "step": 39480 + }, + { + "epoch": 1.01, + "learning_rate": 1.5442692268627013e-06, + "loss": 0.6719, + "step": 39481 + }, + { + "epoch": 1.01, + "learning_rate": 1.5442460136170333e-06, + "loss": 0.7373, + "step": 39482 + }, + { + "epoch": 1.01, + "learning_rate": 1.5442227999546616e-06, + "loss": 0.7402, + "step": 39483 + }, + { + "epoch": 1.01, + "learning_rate": 1.5441995858756034e-06, + "loss": 0.6768, + "step": 39484 + }, + { + "epoch": 1.01, + "learning_rate": 1.5441763713798764e-06, + "loss": 0.6416, + "step": 39485 + }, + { + "epoch": 1.01, + "learning_rate": 1.5441531564674985e-06, + "loss": 0.3284, + "step": 39486 + }, + { + "epoch": 1.01, + "learning_rate": 1.5441299411384878e-06, + "loss": 0.7549, + "step": 39487 + }, + { + "epoch": 1.01, + "learning_rate": 1.5441067253928618e-06, + "loss": 0.6406, + "step": 39488 + }, + { + "epoch": 1.01, + "learning_rate": 1.5440835092306386e-06, + "loss": 0.7476, + "step": 39489 + }, + { + "epoch": 1.01, + "learning_rate": 1.5440602926518352e-06, + "loss": 0.7129, + "step": 39490 + }, + { + "epoch": 1.01, + "learning_rate": 1.5440370756564699e-06, + "loss": 0.4922, + "step": 39491 + }, + { + "epoch": 1.01, + "learning_rate": 1.5440138582445603e-06, + "loss": 0.5835, + "step": 39492 + }, + { + "epoch": 1.01, + "learning_rate": 1.543990640416125e-06, + "loss": 0.583, + "step": 39493 + }, + { + "epoch": 1.01, + "learning_rate": 1.5439674221711804e-06, + "loss": 0.791, + "step": 39494 + }, + { + "epoch": 1.01, + "learning_rate": 1.5439442035097452e-06, + "loss": 0.5361, + "step": 39495 + }, + { + "epoch": 1.01, + "learning_rate": 1.543920984431837e-06, + "loss": 0.5791, + "step": 39496 + }, + { + "epoch": 1.01, + "learning_rate": 1.543897764937473e-06, + "loss": 0.5669, + "step": 39497 + }, + { + "epoch": 1.01, + "learning_rate": 1.543874545026672e-06, + "loss": 0.6694, + "step": 39498 + }, + { + "epoch": 1.01, + "learning_rate": 1.5438513246994514e-06, + "loss": 0.686, + "step": 39499 + }, + { + "epoch": 1.01, + "learning_rate": 1.5438281039558283e-06, + "loss": 0.8086, + "step": 39500 + }, + { + "epoch": 1.01, + "learning_rate": 1.5438048827958214e-06, + "loss": 0.5574, + "step": 39501 + }, + { + "epoch": 1.01, + "learning_rate": 1.543781661219448e-06, + "loss": 0.7158, + "step": 39502 + }, + { + "epoch": 1.01, + "learning_rate": 1.5437584392267262e-06, + "loss": 0.5977, + "step": 39503 + }, + { + "epoch": 1.01, + "learning_rate": 1.5437352168176733e-06, + "loss": 0.5265, + "step": 39504 + }, + { + "epoch": 1.01, + "learning_rate": 1.5437119939923075e-06, + "loss": 0.6089, + "step": 39505 + }, + { + "epoch": 1.01, + "learning_rate": 1.5436887707506464e-06, + "loss": 0.8115, + "step": 39506 + }, + { + "epoch": 1.01, + "learning_rate": 1.5436655470927078e-06, + "loss": 0.6426, + "step": 39507 + }, + { + "epoch": 1.01, + "learning_rate": 1.5436423230185094e-06, + "loss": 0.749, + "step": 39508 + }, + { + "epoch": 1.01, + "learning_rate": 1.5436190985280693e-06, + "loss": 0.6494, + "step": 39509 + }, + { + "epoch": 1.01, + "learning_rate": 1.5435958736214049e-06, + "loss": 0.6074, + "step": 39510 + }, + { + "epoch": 1.01, + "learning_rate": 1.5435726482985338e-06, + "loss": 0.7124, + "step": 39511 + }, + { + "epoch": 1.01, + "learning_rate": 1.5435494225594744e-06, + "loss": 0.2881, + "step": 39512 + }, + { + "epoch": 1.01, + "learning_rate": 1.5435261964042442e-06, + "loss": 0.5088, + "step": 39513 + }, + { + "epoch": 1.01, + "learning_rate": 1.5435029698328612e-06, + "loss": 0.5981, + "step": 39514 + }, + { + "epoch": 1.01, + "learning_rate": 1.543479742845343e-06, + "loss": 0.5273, + "step": 39515 + }, + { + "epoch": 1.01, + "learning_rate": 1.543456515441707e-06, + "loss": 0.6279, + "step": 39516 + }, + { + "epoch": 1.01, + "learning_rate": 1.5434332876219713e-06, + "loss": 0.6772, + "step": 39517 + }, + { + "epoch": 1.01, + "learning_rate": 1.543410059386154e-06, + "loss": 0.7314, + "step": 39518 + }, + { + "epoch": 1.01, + "learning_rate": 1.5433868307342723e-06, + "loss": 0.6797, + "step": 39519 + }, + { + "epoch": 1.01, + "learning_rate": 1.5433636016663444e-06, + "loss": 0.6621, + "step": 39520 + }, + { + "epoch": 1.01, + "learning_rate": 1.543340372182388e-06, + "loss": 0.5708, + "step": 39521 + }, + { + "epoch": 1.01, + "learning_rate": 1.5433171422824212e-06, + "loss": 0.6982, + "step": 39522 + }, + { + "epoch": 1.01, + "learning_rate": 1.5432939119664611e-06, + "loss": 0.748, + "step": 39523 + }, + { + "epoch": 1.01, + "learning_rate": 1.5432706812345262e-06, + "loss": 0.7104, + "step": 39524 + }, + { + "epoch": 1.01, + "learning_rate": 1.5432474500866335e-06, + "loss": 0.6348, + "step": 39525 + }, + { + "epoch": 1.01, + "learning_rate": 1.5432242185228013e-06, + "loss": 0.835, + "step": 39526 + }, + { + "epoch": 1.01, + "learning_rate": 1.5432009865430473e-06, + "loss": 0.4668, + "step": 39527 + }, + { + "epoch": 1.01, + "learning_rate": 1.5431777541473893e-06, + "loss": 0.6484, + "step": 39528 + }, + { + "epoch": 1.01, + "learning_rate": 1.543154521335845e-06, + "loss": 0.5493, + "step": 39529 + }, + { + "epoch": 1.01, + "learning_rate": 1.5431312881084324e-06, + "loss": 0.4585, + "step": 39530 + }, + { + "epoch": 1.01, + "learning_rate": 1.543108054465169e-06, + "loss": 0.5552, + "step": 39531 + }, + { + "epoch": 1.01, + "learning_rate": 1.5430848204060728e-06, + "loss": 0.6245, + "step": 39532 + }, + { + "epoch": 1.01, + "learning_rate": 1.5430615859311617e-06, + "loss": 0.6475, + "step": 39533 + }, + { + "epoch": 1.01, + "learning_rate": 1.5430383510404532e-06, + "loss": 0.6284, + "step": 39534 + }, + { + "epoch": 1.01, + "learning_rate": 1.543015115733965e-06, + "loss": 0.7686, + "step": 39535 + }, + { + "epoch": 1.01, + "learning_rate": 1.5429918800117152e-06, + "loss": 0.6445, + "step": 39536 + }, + { + "epoch": 1.01, + "learning_rate": 1.5429686438737214e-06, + "loss": 0.7578, + "step": 39537 + }, + { + "epoch": 1.01, + "learning_rate": 1.5429454073200018e-06, + "loss": 0.5591, + "step": 39538 + }, + { + "epoch": 1.01, + "learning_rate": 1.5429221703505736e-06, + "loss": 0.709, + "step": 39539 + }, + { + "epoch": 1.01, + "learning_rate": 1.5428989329654552e-06, + "loss": 0.3962, + "step": 39540 + }, + { + "epoch": 1.01, + "learning_rate": 1.5428756951646635e-06, + "loss": 0.5698, + "step": 39541 + }, + { + "epoch": 1.01, + "learning_rate": 1.5428524569482174e-06, + "loss": 0.7568, + "step": 39542 + }, + { + "epoch": 1.01, + "learning_rate": 1.5428292183161338e-06, + "loss": 0.5134, + "step": 39543 + }, + { + "epoch": 1.01, + "learning_rate": 1.5428059792684307e-06, + "loss": 0.6553, + "step": 39544 + }, + { + "epoch": 1.01, + "learning_rate": 1.5427827398051262e-06, + "loss": 0.6494, + "step": 39545 + }, + { + "epoch": 1.01, + "learning_rate": 1.542759499926238e-06, + "loss": 0.4629, + "step": 39546 + }, + { + "epoch": 1.01, + "learning_rate": 1.5427362596317837e-06, + "loss": 0.6479, + "step": 39547 + }, + { + "epoch": 1.01, + "learning_rate": 1.5427130189217813e-06, + "loss": 0.6914, + "step": 39548 + }, + { + "epoch": 1.01, + "learning_rate": 1.5426897777962484e-06, + "loss": 0.6309, + "step": 39549 + }, + { + "epoch": 1.01, + "learning_rate": 1.542666536255203e-06, + "loss": 0.707, + "step": 39550 + }, + { + "epoch": 1.01, + "learning_rate": 1.5426432942986627e-06, + "loss": 0.3663, + "step": 39551 + }, + { + "epoch": 1.01, + "learning_rate": 1.5426200519266452e-06, + "loss": 0.5469, + "step": 39552 + }, + { + "epoch": 1.01, + "learning_rate": 1.542596809139169e-06, + "loss": 0.7959, + "step": 39553 + }, + { + "epoch": 1.01, + "learning_rate": 1.542573565936251e-06, + "loss": 0.6104, + "step": 39554 + }, + { + "epoch": 1.01, + "learning_rate": 1.5425503223179093e-06, + "loss": 0.5142, + "step": 39555 + }, + { + "epoch": 1.01, + "learning_rate": 1.542527078284162e-06, + "loss": 0.7065, + "step": 39556 + }, + { + "epoch": 1.01, + "learning_rate": 1.5425038338350263e-06, + "loss": 0.4905, + "step": 39557 + }, + { + "epoch": 1.01, + "learning_rate": 1.5424805889705206e-06, + "loss": 0.6855, + "step": 39558 + }, + { + "epoch": 1.01, + "learning_rate": 1.5424573436906624e-06, + "loss": 0.6602, + "step": 39559 + }, + { + "epoch": 1.01, + "learning_rate": 1.5424340979954697e-06, + "loss": 0.5728, + "step": 39560 + }, + { + "epoch": 1.01, + "learning_rate": 1.54241085188496e-06, + "loss": 0.6377, + "step": 39561 + }, + { + "epoch": 1.01, + "learning_rate": 1.5423876053591514e-06, + "loss": 0.6758, + "step": 39562 + }, + { + "epoch": 1.01, + "learning_rate": 1.5423643584180615e-06, + "loss": 0.6123, + "step": 39563 + }, + { + "epoch": 1.01, + "learning_rate": 1.5423411110617082e-06, + "loss": 0.7617, + "step": 39564 + }, + { + "epoch": 1.01, + "learning_rate": 1.5423178632901087e-06, + "loss": 0.7148, + "step": 39565 + }, + { + "epoch": 1.01, + "learning_rate": 1.542294615103282e-06, + "loss": 0.9102, + "step": 39566 + }, + { + "epoch": 1.01, + "learning_rate": 1.542271366501245e-06, + "loss": 0.6611, + "step": 39567 + }, + { + "epoch": 1.01, + "learning_rate": 1.542248117484016e-06, + "loss": 0.6592, + "step": 39568 + }, + { + "epoch": 1.01, + "learning_rate": 1.5422248680516123e-06, + "loss": 0.5201, + "step": 39569 + }, + { + "epoch": 1.01, + "learning_rate": 1.5422016182040521e-06, + "loss": 0.7017, + "step": 39570 + }, + { + "epoch": 1.01, + "learning_rate": 1.5421783679413526e-06, + "loss": 0.7246, + "step": 39571 + }, + { + "epoch": 1.01, + "learning_rate": 1.5421551172635327e-06, + "loss": 0.6123, + "step": 39572 + }, + { + "epoch": 1.01, + "learning_rate": 1.5421318661706094e-06, + "loss": 0.5952, + "step": 39573 + }, + { + "epoch": 1.01, + "learning_rate": 1.5421086146626006e-06, + "loss": 0.8311, + "step": 39574 + }, + { + "epoch": 1.01, + "learning_rate": 1.5420853627395238e-06, + "loss": 0.7393, + "step": 39575 + }, + { + "epoch": 1.01, + "learning_rate": 1.5420621104013973e-06, + "loss": 0.5383, + "step": 39576 + }, + { + "epoch": 1.01, + "learning_rate": 1.542038857648239e-06, + "loss": 0.6729, + "step": 39577 + }, + { + "epoch": 1.01, + "learning_rate": 1.5420156044800666e-06, + "loss": 0.6021, + "step": 39578 + }, + { + "epoch": 1.01, + "learning_rate": 1.5419923508968976e-06, + "loss": 0.657, + "step": 39579 + }, + { + "epoch": 1.01, + "learning_rate": 1.5419690968987497e-06, + "loss": 0.8125, + "step": 39580 + }, + { + "epoch": 1.01, + "learning_rate": 1.5419458424856413e-06, + "loss": 0.6108, + "step": 39581 + }, + { + "epoch": 1.01, + "learning_rate": 1.5419225876575897e-06, + "loss": 0.4861, + "step": 39582 + }, + { + "epoch": 1.01, + "learning_rate": 1.541899332414613e-06, + "loss": 0.6226, + "step": 39583 + }, + { + "epoch": 1.01, + "learning_rate": 1.5418760767567291e-06, + "loss": 0.5786, + "step": 39584 + }, + { + "epoch": 1.01, + "learning_rate": 1.5418528206839554e-06, + "loss": 0.7139, + "step": 39585 + }, + { + "epoch": 1.01, + "learning_rate": 1.5418295641963097e-06, + "loss": 0.6182, + "step": 39586 + }, + { + "epoch": 1.01, + "learning_rate": 1.5418063072938104e-06, + "loss": 0.8721, + "step": 39587 + }, + { + "epoch": 1.01, + "learning_rate": 1.5417830499764749e-06, + "loss": 0.5786, + "step": 39588 + }, + { + "epoch": 1.01, + "learning_rate": 1.5417597922443206e-06, + "loss": 0.561, + "step": 39589 + }, + { + "epoch": 1.01, + "learning_rate": 1.541736534097366e-06, + "loss": 0.4556, + "step": 39590 + }, + { + "epoch": 1.01, + "learning_rate": 1.5417132755356287e-06, + "loss": 0.5474, + "step": 39591 + }, + { + "epoch": 1.01, + "learning_rate": 1.5416900165591264e-06, + "loss": 0.6992, + "step": 39592 + }, + { + "epoch": 1.01, + "learning_rate": 1.541666757167877e-06, + "loss": 0.6973, + "step": 39593 + }, + { + "epoch": 1.01, + "learning_rate": 1.5416434973618983e-06, + "loss": 0.7231, + "step": 39594 + }, + { + "epoch": 1.01, + "learning_rate": 1.5416202371412078e-06, + "loss": 0.667, + "step": 39595 + }, + { + "epoch": 1.01, + "learning_rate": 1.541596976505824e-06, + "loss": 0.6196, + "step": 39596 + }, + { + "epoch": 1.01, + "learning_rate": 1.541573715455764e-06, + "loss": 0.5181, + "step": 39597 + }, + { + "epoch": 1.01, + "learning_rate": 1.5415504539910465e-06, + "loss": 0.5696, + "step": 39598 + }, + { + "epoch": 1.01, + "learning_rate": 1.5415271921116882e-06, + "loss": 0.6533, + "step": 39599 + }, + { + "epoch": 1.01, + "learning_rate": 1.5415039298177073e-06, + "loss": 0.6963, + "step": 39600 + }, + { + "epoch": 1.01, + "learning_rate": 1.5414806671091218e-06, + "loss": 0.7129, + "step": 39601 + }, + { + "epoch": 1.02, + "learning_rate": 1.5414574039859497e-06, + "loss": 0.6797, + "step": 39602 + }, + { + "epoch": 1.02, + "learning_rate": 1.5414341404482083e-06, + "loss": 0.6892, + "step": 39603 + }, + { + "epoch": 1.02, + "learning_rate": 1.5414108764959158e-06, + "loss": 0.3457, + "step": 39604 + }, + { + "epoch": 1.02, + "learning_rate": 1.5413876121290899e-06, + "loss": 0.6206, + "step": 39605 + }, + { + "epoch": 1.02, + "learning_rate": 1.5413643473477484e-06, + "loss": 0.7773, + "step": 39606 + }, + { + "epoch": 1.02, + "learning_rate": 1.5413410821519091e-06, + "loss": 0.6655, + "step": 39607 + }, + { + "epoch": 1.02, + "learning_rate": 1.54131781654159e-06, + "loss": 0.7295, + "step": 39608 + }, + { + "epoch": 1.02, + "learning_rate": 1.5412945505168084e-06, + "loss": 0.793, + "step": 39609 + }, + { + "epoch": 1.02, + "learning_rate": 1.5412712840775825e-06, + "loss": 0.6299, + "step": 39610 + }, + { + "epoch": 1.02, + "learning_rate": 1.54124801722393e-06, + "loss": 0.7197, + "step": 39611 + }, + { + "epoch": 1.02, + "learning_rate": 1.5412247499558691e-06, + "loss": 0.7334, + "step": 39612 + }, + { + "epoch": 1.02, + "learning_rate": 1.5412014822734174e-06, + "loss": 0.5918, + "step": 39613 + }, + { + "epoch": 1.02, + "learning_rate": 1.5411782141765923e-06, + "loss": 0.5825, + "step": 39614 + }, + { + "epoch": 1.02, + "learning_rate": 1.5411549456654118e-06, + "loss": 0.7209, + "step": 39615 + }, + { + "epoch": 1.02, + "learning_rate": 1.5411316767398944e-06, + "loss": 0.5947, + "step": 39616 + }, + { + "epoch": 1.02, + "learning_rate": 1.5411084074000567e-06, + "loss": 0.7441, + "step": 39617 + }, + { + "epoch": 1.02, + "learning_rate": 1.5410851376459176e-06, + "loss": 0.5308, + "step": 39618 + }, + { + "epoch": 1.02, + "learning_rate": 1.5410618674774943e-06, + "loss": 0.6836, + "step": 39619 + }, + { + "epoch": 1.02, + "learning_rate": 1.541038596894805e-06, + "loss": 0.7568, + "step": 39620 + }, + { + "epoch": 1.02, + "learning_rate": 1.5410153258978672e-06, + "loss": 0.4019, + "step": 39621 + }, + { + "epoch": 1.02, + "learning_rate": 1.5409920544866987e-06, + "loss": 0.8086, + "step": 39622 + }, + { + "epoch": 1.02, + "learning_rate": 1.5409687826613178e-06, + "loss": 0.7026, + "step": 39623 + }, + { + "epoch": 1.02, + "learning_rate": 1.5409455104217416e-06, + "loss": 0.6052, + "step": 39624 + }, + { + "epoch": 1.02, + "learning_rate": 1.5409222377679885e-06, + "loss": 0.7563, + "step": 39625 + }, + { + "epoch": 1.02, + "learning_rate": 1.5408989647000761e-06, + "loss": 0.686, + "step": 39626 + }, + { + "epoch": 1.02, + "learning_rate": 1.540875691218022e-06, + "loss": 0.6011, + "step": 39627 + }, + { + "epoch": 1.02, + "learning_rate": 1.5408524173218446e-06, + "loss": 0.6538, + "step": 39628 + }, + { + "epoch": 1.02, + "learning_rate": 1.5408291430115612e-06, + "loss": 0.6436, + "step": 39629 + }, + { + "epoch": 1.02, + "learning_rate": 1.5408058682871897e-06, + "loss": 0.6772, + "step": 39630 + }, + { + "epoch": 1.02, + "learning_rate": 1.540782593148748e-06, + "loss": 0.752, + "step": 39631 + }, + { + "epoch": 1.02, + "learning_rate": 1.5407593175962543e-06, + "loss": 0.6709, + "step": 39632 + }, + { + "epoch": 1.02, + "learning_rate": 1.540736041629726e-06, + "loss": 0.5391, + "step": 39633 + }, + { + "epoch": 1.02, + "learning_rate": 1.5407127652491807e-06, + "loss": 0.2876, + "step": 39634 + }, + { + "epoch": 1.02, + "learning_rate": 1.5406894884546366e-06, + "loss": 0.5664, + "step": 39635 + }, + { + "epoch": 1.02, + "learning_rate": 1.5406662112461114e-06, + "loss": 0.5874, + "step": 39636 + }, + { + "epoch": 1.02, + "learning_rate": 1.5406429336236228e-06, + "loss": 0.6865, + "step": 39637 + }, + { + "epoch": 1.02, + "learning_rate": 1.5406196555871892e-06, + "loss": 0.6963, + "step": 39638 + }, + { + "epoch": 1.02, + "learning_rate": 1.5405963771368278e-06, + "loss": 0.71, + "step": 39639 + }, + { + "epoch": 1.02, + "learning_rate": 1.5405730982725565e-06, + "loss": 0.5669, + "step": 39640 + }, + { + "epoch": 1.02, + "learning_rate": 1.5405498189943932e-06, + "loss": 0.478, + "step": 39641 + }, + { + "epoch": 1.02, + "learning_rate": 1.5405265393023558e-06, + "loss": 0.573, + "step": 39642 + }, + { + "epoch": 1.02, + "learning_rate": 1.5405032591964623e-06, + "loss": 0.7383, + "step": 39643 + }, + { + "epoch": 1.02, + "learning_rate": 1.5404799786767299e-06, + "loss": 0.6973, + "step": 39644 + }, + { + "epoch": 1.02, + "learning_rate": 1.5404566977431772e-06, + "loss": 0.7148, + "step": 39645 + }, + { + "epoch": 1.02, + "learning_rate": 1.5404334163958214e-06, + "loss": 0.7012, + "step": 39646 + }, + { + "epoch": 1.02, + "learning_rate": 1.5404101346346808e-06, + "loss": 0.7498, + "step": 39647 + }, + { + "epoch": 1.02, + "learning_rate": 1.5403868524597727e-06, + "loss": 0.4644, + "step": 39648 + }, + { + "epoch": 1.02, + "learning_rate": 1.5403635698711156e-06, + "loss": 0.6348, + "step": 39649 + }, + { + "epoch": 1.02, + "learning_rate": 1.5403402868687266e-06, + "loss": 0.6982, + "step": 39650 + }, + { + "epoch": 1.02, + "learning_rate": 1.5403170034526242e-06, + "loss": 0.624, + "step": 39651 + }, + { + "epoch": 1.02, + "learning_rate": 1.5402937196228255e-06, + "loss": 0.6357, + "step": 39652 + }, + { + "epoch": 1.02, + "learning_rate": 1.5402704353793493e-06, + "loss": 0.6406, + "step": 39653 + }, + { + "epoch": 1.02, + "learning_rate": 1.5402471507222125e-06, + "loss": 0.6235, + "step": 39654 + }, + { + "epoch": 1.02, + "learning_rate": 1.5402238656514337e-06, + "loss": 0.512, + "step": 39655 + }, + { + "epoch": 1.02, + "learning_rate": 1.54020058016703e-06, + "loss": 0.4663, + "step": 39656 + }, + { + "epoch": 1.02, + "learning_rate": 1.5401772942690195e-06, + "loss": 0.688, + "step": 39657 + }, + { + "epoch": 1.02, + "learning_rate": 1.5401540079574202e-06, + "loss": 0.4658, + "step": 39658 + }, + { + "epoch": 1.02, + "learning_rate": 1.54013072123225e-06, + "loss": 0.7373, + "step": 39659 + }, + { + "epoch": 1.02, + "learning_rate": 1.540107434093526e-06, + "loss": 0.9561, + "step": 39660 + }, + { + "epoch": 1.02, + "learning_rate": 1.540084146541267e-06, + "loss": 0.6328, + "step": 39661 + }, + { + "epoch": 1.02, + "learning_rate": 1.5400608585754903e-06, + "loss": 0.6094, + "step": 39662 + }, + { + "epoch": 1.02, + "learning_rate": 1.5400375701962137e-06, + "loss": 0.7441, + "step": 39663 + }, + { + "epoch": 1.02, + "learning_rate": 1.5400142814034555e-06, + "loss": 0.4259, + "step": 39664 + }, + { + "epoch": 1.02, + "learning_rate": 1.5399909921972327e-06, + "loss": 0.5227, + "step": 39665 + }, + { + "epoch": 1.02, + "learning_rate": 1.5399677025775638e-06, + "loss": 0.5308, + "step": 39666 + }, + { + "epoch": 1.02, + "learning_rate": 1.5399444125444667e-06, + "loss": 0.6973, + "step": 39667 + }, + { + "epoch": 1.02, + "learning_rate": 1.5399211220979592e-06, + "loss": 0.7041, + "step": 39668 + }, + { + "epoch": 1.02, + "learning_rate": 1.5398978312380583e-06, + "loss": 0.6187, + "step": 39669 + }, + { + "epoch": 1.02, + "learning_rate": 1.5398745399647827e-06, + "loss": 0.5796, + "step": 39670 + }, + { + "epoch": 1.02, + "learning_rate": 1.53985124827815e-06, + "loss": 0.6128, + "step": 39671 + }, + { + "epoch": 1.02, + "learning_rate": 1.539827956178178e-06, + "loss": 0.7939, + "step": 39672 + }, + { + "epoch": 1.02, + "learning_rate": 1.539804663664885e-06, + "loss": 0.6338, + "step": 39673 + }, + { + "epoch": 1.02, + "learning_rate": 1.5397813707382881e-06, + "loss": 0.6572, + "step": 39674 + }, + { + "epoch": 1.02, + "learning_rate": 1.5397580773984048e-06, + "loss": 0.5439, + "step": 39675 + }, + { + "epoch": 1.02, + "learning_rate": 1.5397347836452546e-06, + "loss": 0.6611, + "step": 39676 + }, + { + "epoch": 1.02, + "learning_rate": 1.5397114894788535e-06, + "loss": 0.5444, + "step": 39677 + }, + { + "epoch": 1.02, + "learning_rate": 1.5396881948992206e-06, + "loss": 0.5586, + "step": 39678 + }, + { + "epoch": 1.02, + "learning_rate": 1.539664899906373e-06, + "loss": 0.8662, + "step": 39679 + }, + { + "epoch": 1.02, + "learning_rate": 1.5396416045003288e-06, + "loss": 0.8799, + "step": 39680 + }, + { + "epoch": 1.02, + "learning_rate": 1.539618308681106e-06, + "loss": 0.7588, + "step": 39681 + }, + { + "epoch": 1.02, + "learning_rate": 1.5395950124487222e-06, + "loss": 0.6182, + "step": 39682 + }, + { + "epoch": 1.02, + "learning_rate": 1.5395717158031954e-06, + "loss": 0.667, + "step": 39683 + }, + { + "epoch": 1.02, + "learning_rate": 1.539548418744543e-06, + "loss": 0.6641, + "step": 39684 + }, + { + "epoch": 1.02, + "learning_rate": 1.5395251212727836e-06, + "loss": 0.9258, + "step": 39685 + }, + { + "epoch": 1.02, + "learning_rate": 1.5395018233879345e-06, + "loss": 0.6572, + "step": 39686 + }, + { + "epoch": 1.02, + "learning_rate": 1.5394785250900135e-06, + "loss": 0.3918, + "step": 39687 + }, + { + "epoch": 1.02, + "learning_rate": 1.5394552263790388e-06, + "loss": 0.8779, + "step": 39688 + }, + { + "epoch": 1.02, + "learning_rate": 1.5394319272550278e-06, + "loss": 0.8486, + "step": 39689 + }, + { + "epoch": 1.02, + "learning_rate": 1.5394086277179988e-06, + "loss": 0.4287, + "step": 39690 + }, + { + "epoch": 1.02, + "learning_rate": 1.5393853277679693e-06, + "loss": 0.7275, + "step": 39691 + }, + { + "epoch": 1.02, + "learning_rate": 1.539362027404957e-06, + "loss": 0.5767, + "step": 39692 + }, + { + "epoch": 1.02, + "learning_rate": 1.5393387266289807e-06, + "loss": 0.9229, + "step": 39693 + }, + { + "epoch": 1.02, + "learning_rate": 1.539315425440057e-06, + "loss": 0.752, + "step": 39694 + }, + { + "epoch": 1.02, + "learning_rate": 1.5392921238382047e-06, + "loss": 0.5923, + "step": 39695 + }, + { + "epoch": 1.02, + "learning_rate": 1.5392688218234406e-06, + "loss": 0.5244, + "step": 39696 + }, + { + "epoch": 1.02, + "learning_rate": 1.5392455193957834e-06, + "loss": 0.5537, + "step": 39697 + }, + { + "epoch": 1.02, + "learning_rate": 1.539222216555251e-06, + "loss": 0.6494, + "step": 39698 + }, + { + "epoch": 1.02, + "learning_rate": 1.5391989133018607e-06, + "loss": 0.7246, + "step": 39699 + }, + { + "epoch": 1.02, + "learning_rate": 1.5391756096356306e-06, + "loss": 0.7119, + "step": 39700 + }, + { + "epoch": 1.02, + "learning_rate": 1.5391523055565787e-06, + "loss": 0.6611, + "step": 39701 + }, + { + "epoch": 1.02, + "learning_rate": 1.5391290010647223e-06, + "loss": 0.7432, + "step": 39702 + }, + { + "epoch": 1.02, + "learning_rate": 1.5391056961600798e-06, + "loss": 0.646, + "step": 39703 + }, + { + "epoch": 1.02, + "learning_rate": 1.539082390842669e-06, + "loss": 0.6313, + "step": 39704 + }, + { + "epoch": 1.02, + "learning_rate": 1.5390590851125075e-06, + "loss": 0.6084, + "step": 39705 + }, + { + "epoch": 1.02, + "learning_rate": 1.5390357789696132e-06, + "loss": 0.7988, + "step": 39706 + }, + { + "epoch": 1.02, + "learning_rate": 1.5390124724140038e-06, + "loss": 0.6045, + "step": 39707 + }, + { + "epoch": 1.02, + "learning_rate": 1.538989165445698e-06, + "loss": 0.6919, + "step": 39708 + }, + { + "epoch": 1.02, + "learning_rate": 1.5389658580647123e-06, + "loss": 0.667, + "step": 39709 + }, + { + "epoch": 1.02, + "learning_rate": 1.5389425502710656e-06, + "loss": 0.4604, + "step": 39710 + }, + { + "epoch": 1.02, + "learning_rate": 1.538919242064775e-06, + "loss": 0.7236, + "step": 39711 + }, + { + "epoch": 1.02, + "learning_rate": 1.5388959334458588e-06, + "loss": 0.6602, + "step": 39712 + }, + { + "epoch": 1.02, + "learning_rate": 1.5388726244143353e-06, + "loss": 0.7939, + "step": 39713 + }, + { + "epoch": 1.02, + "learning_rate": 1.5388493149702213e-06, + "loss": 0.6421, + "step": 39714 + }, + { + "epoch": 1.02, + "learning_rate": 1.538826005113535e-06, + "loss": 0.6479, + "step": 39715 + }, + { + "epoch": 1.02, + "learning_rate": 1.538802694844295e-06, + "loss": 0.6465, + "step": 39716 + }, + { + "epoch": 1.02, + "learning_rate": 1.538779384162518e-06, + "loss": 0.6484, + "step": 39717 + }, + { + "epoch": 1.02, + "learning_rate": 1.5387560730682228e-06, + "loss": 0.6758, + "step": 39718 + }, + { + "epoch": 1.02, + "learning_rate": 1.5387327615614267e-06, + "loss": 0.4387, + "step": 39719 + }, + { + "epoch": 1.02, + "learning_rate": 1.5387094496421478e-06, + "loss": 0.666, + "step": 39720 + }, + { + "epoch": 1.02, + "learning_rate": 1.5386861373104035e-06, + "loss": 0.6787, + "step": 39721 + }, + { + "epoch": 1.02, + "learning_rate": 1.5386628245662121e-06, + "loss": 0.6953, + "step": 39722 + }, + { + "epoch": 1.02, + "learning_rate": 1.5386395114095917e-06, + "loss": 0.6475, + "step": 39723 + }, + { + "epoch": 1.02, + "learning_rate": 1.5386161978405597e-06, + "loss": 0.5549, + "step": 39724 + }, + { + "epoch": 1.02, + "learning_rate": 1.5385928838591338e-06, + "loss": 0.5291, + "step": 39725 + }, + { + "epoch": 1.02, + "learning_rate": 1.538569569465332e-06, + "loss": 0.5413, + "step": 39726 + }, + { + "epoch": 1.02, + "learning_rate": 1.5385462546591725e-06, + "loss": 0.6494, + "step": 39727 + }, + { + "epoch": 1.02, + "learning_rate": 1.5385229394406728e-06, + "loss": 0.5918, + "step": 39728 + }, + { + "epoch": 1.02, + "learning_rate": 1.538499623809851e-06, + "loss": 0.6096, + "step": 39729 + }, + { + "epoch": 1.02, + "learning_rate": 1.5384763077667244e-06, + "loss": 0.5962, + "step": 39730 + }, + { + "epoch": 1.02, + "learning_rate": 1.5384529913113115e-06, + "loss": 0.7227, + "step": 39731 + }, + { + "epoch": 1.02, + "learning_rate": 1.53842967444363e-06, + "loss": 0.5532, + "step": 39732 + }, + { + "epoch": 1.02, + "learning_rate": 1.5384063571636978e-06, + "loss": 0.8193, + "step": 39733 + }, + { + "epoch": 1.02, + "learning_rate": 1.5383830394715322e-06, + "loss": 0.627, + "step": 39734 + }, + { + "epoch": 1.02, + "learning_rate": 1.5383597213671518e-06, + "loss": 0.6807, + "step": 39735 + }, + { + "epoch": 1.02, + "learning_rate": 1.5383364028505738e-06, + "loss": 0.6279, + "step": 39736 + }, + { + "epoch": 1.02, + "learning_rate": 1.5383130839218167e-06, + "loss": 0.7295, + "step": 39737 + }, + { + "epoch": 1.02, + "learning_rate": 1.5382897645808978e-06, + "loss": 0.7871, + "step": 39738 + }, + { + "epoch": 1.02, + "learning_rate": 1.5382664448278354e-06, + "loss": 0.6826, + "step": 39739 + }, + { + "epoch": 1.02, + "learning_rate": 1.5382431246626469e-06, + "loss": 0.7676, + "step": 39740 + }, + { + "epoch": 1.02, + "learning_rate": 1.5382198040853504e-06, + "loss": 0.5527, + "step": 39741 + }, + { + "epoch": 1.02, + "learning_rate": 1.5381964830959637e-06, + "loss": 0.6162, + "step": 39742 + }, + { + "epoch": 1.02, + "learning_rate": 1.538173161694505e-06, + "loss": 0.5879, + "step": 39743 + }, + { + "epoch": 1.02, + "learning_rate": 1.5381498398809915e-06, + "loss": 0.7925, + "step": 39744 + }, + { + "epoch": 1.02, + "learning_rate": 1.5381265176554416e-06, + "loss": 0.749, + "step": 39745 + }, + { + "epoch": 1.02, + "learning_rate": 1.5381031950178728e-06, + "loss": 0.624, + "step": 39746 + }, + { + "epoch": 1.02, + "learning_rate": 1.5380798719683034e-06, + "loss": 0.4929, + "step": 39747 + }, + { + "epoch": 1.02, + "learning_rate": 1.538056548506751e-06, + "loss": 0.7021, + "step": 39748 + }, + { + "epoch": 1.02, + "learning_rate": 1.5380332246332333e-06, + "loss": 0.6641, + "step": 39749 + }, + { + "epoch": 1.02, + "learning_rate": 1.5380099003477683e-06, + "loss": 0.707, + "step": 39750 + }, + { + "epoch": 1.02, + "learning_rate": 1.5379865756503737e-06, + "loss": 0.4799, + "step": 39751 + }, + { + "epoch": 1.02, + "learning_rate": 1.5379632505410677e-06, + "loss": 0.7026, + "step": 39752 + }, + { + "epoch": 1.02, + "learning_rate": 1.537939925019868e-06, + "loss": 0.613, + "step": 39753 + }, + { + "epoch": 1.02, + "learning_rate": 1.5379165990867924e-06, + "loss": 0.7354, + "step": 39754 + }, + { + "epoch": 1.02, + "learning_rate": 1.5378932727418589e-06, + "loss": 0.6504, + "step": 39755 + }, + { + "epoch": 1.02, + "learning_rate": 1.537869945985085e-06, + "loss": 0.8359, + "step": 39756 + }, + { + "epoch": 1.02, + "learning_rate": 1.537846618816489e-06, + "loss": 0.5002, + "step": 39757 + }, + { + "epoch": 1.02, + "learning_rate": 1.5378232912360884e-06, + "loss": 0.5215, + "step": 39758 + }, + { + "epoch": 1.02, + "learning_rate": 1.5377999632439013e-06, + "loss": 0.6191, + "step": 39759 + }, + { + "epoch": 1.02, + "learning_rate": 1.5377766348399457e-06, + "loss": 0.6177, + "step": 39760 + }, + { + "epoch": 1.02, + "learning_rate": 1.5377533060242388e-06, + "loss": 0.6001, + "step": 39761 + }, + { + "epoch": 1.02, + "learning_rate": 1.5377299767967995e-06, + "loss": 0.6094, + "step": 39762 + }, + { + "epoch": 1.02, + "learning_rate": 1.5377066471576447e-06, + "loss": 0.7329, + "step": 39763 + }, + { + "epoch": 1.02, + "learning_rate": 1.537683317106793e-06, + "loss": 0.8447, + "step": 39764 + }, + { + "epoch": 1.02, + "learning_rate": 1.5376599866442615e-06, + "loss": 0.6221, + "step": 39765 + }, + { + "epoch": 1.02, + "learning_rate": 1.5376366557700686e-06, + "loss": 0.6714, + "step": 39766 + }, + { + "epoch": 1.02, + "learning_rate": 1.5376133244842322e-06, + "loss": 0.6235, + "step": 39767 + }, + { + "epoch": 1.02, + "learning_rate": 1.53758999278677e-06, + "loss": 0.5508, + "step": 39768 + }, + { + "epoch": 1.02, + "learning_rate": 1.5375666606776995e-06, + "loss": 0.7393, + "step": 39769 + }, + { + "epoch": 1.02, + "learning_rate": 1.5375433281570392e-06, + "loss": 0.7363, + "step": 39770 + }, + { + "epoch": 1.02, + "learning_rate": 1.5375199952248067e-06, + "loss": 0.6006, + "step": 39771 + }, + { + "epoch": 1.02, + "learning_rate": 1.5374966618810197e-06, + "loss": 0.7109, + "step": 39772 + }, + { + "epoch": 1.02, + "learning_rate": 1.5374733281256964e-06, + "loss": 0.5229, + "step": 39773 + }, + { + "epoch": 1.02, + "learning_rate": 1.5374499939588543e-06, + "loss": 0.5679, + "step": 39774 + }, + { + "epoch": 1.02, + "learning_rate": 1.5374266593805115e-06, + "loss": 0.7305, + "step": 39775 + }, + { + "epoch": 1.02, + "learning_rate": 1.5374033243906862e-06, + "loss": 0.7139, + "step": 39776 + }, + { + "epoch": 1.02, + "learning_rate": 1.5373799889893954e-06, + "loss": 0.666, + "step": 39777 + }, + { + "epoch": 1.02, + "learning_rate": 1.5373566531766575e-06, + "loss": 0.6182, + "step": 39778 + }, + { + "epoch": 1.02, + "learning_rate": 1.5373333169524905e-06, + "loss": 0.5557, + "step": 39779 + }, + { + "epoch": 1.02, + "learning_rate": 1.5373099803169122e-06, + "loss": 0.6694, + "step": 39780 + }, + { + "epoch": 1.02, + "learning_rate": 1.5372866432699399e-06, + "loss": 0.5957, + "step": 39781 + }, + { + "epoch": 1.02, + "learning_rate": 1.5372633058115923e-06, + "loss": 0.6777, + "step": 39782 + }, + { + "epoch": 1.02, + "learning_rate": 1.5372399679418868e-06, + "loss": 0.6182, + "step": 39783 + }, + { + "epoch": 1.02, + "learning_rate": 1.537216629660841e-06, + "loss": 0.6401, + "step": 39784 + }, + { + "epoch": 1.02, + "learning_rate": 1.5371932909684738e-06, + "loss": 0.7803, + "step": 39785 + }, + { + "epoch": 1.02, + "learning_rate": 1.537169951864802e-06, + "loss": 0.7949, + "step": 39786 + }, + { + "epoch": 1.02, + "learning_rate": 1.537146612349844e-06, + "loss": 0.6692, + "step": 39787 + }, + { + "epoch": 1.02, + "learning_rate": 1.5371232724236177e-06, + "loss": 0.6338, + "step": 39788 + }, + { + "epoch": 1.02, + "learning_rate": 1.5370999320861403e-06, + "loss": 0.7607, + "step": 39789 + }, + { + "epoch": 1.02, + "learning_rate": 1.5370765913374304e-06, + "loss": 0.7012, + "step": 39790 + }, + { + "epoch": 1.02, + "learning_rate": 1.537053250177506e-06, + "loss": 0.6396, + "step": 39791 + }, + { + "epoch": 1.02, + "learning_rate": 1.5370299086063842e-06, + "loss": 0.6001, + "step": 39792 + }, + { + "epoch": 1.02, + "learning_rate": 1.5370065666240835e-06, + "loss": 0.6641, + "step": 39793 + }, + { + "epoch": 1.02, + "learning_rate": 1.5369832242306212e-06, + "loss": 0.6865, + "step": 39794 + }, + { + "epoch": 1.02, + "learning_rate": 1.536959881426016e-06, + "loss": 0.7095, + "step": 39795 + }, + { + "epoch": 1.02, + "learning_rate": 1.536936538210285e-06, + "loss": 0.71, + "step": 39796 + }, + { + "epoch": 1.02, + "learning_rate": 1.5369131945834465e-06, + "loss": 0.5776, + "step": 39797 + }, + { + "epoch": 1.02, + "learning_rate": 1.5368898505455183e-06, + "loss": 0.4871, + "step": 39798 + }, + { + "epoch": 1.02, + "learning_rate": 1.5368665060965182e-06, + "loss": 0.7754, + "step": 39799 + }, + { + "epoch": 1.02, + "learning_rate": 1.5368431612364643e-06, + "loss": 0.8975, + "step": 39800 + }, + { + "epoch": 1.02, + "learning_rate": 1.5368198159653739e-06, + "loss": 0.6309, + "step": 39801 + }, + { + "epoch": 1.02, + "learning_rate": 1.5367964702832656e-06, + "loss": 0.688, + "step": 39802 + }, + { + "epoch": 1.02, + "learning_rate": 1.5367731241901567e-06, + "loss": 0.7295, + "step": 39803 + }, + { + "epoch": 1.02, + "learning_rate": 1.5367497776860654e-06, + "loss": 0.7134, + "step": 39804 + }, + { + "epoch": 1.02, + "learning_rate": 1.5367264307710092e-06, + "loss": 0.751, + "step": 39805 + }, + { + "epoch": 1.02, + "learning_rate": 1.5367030834450064e-06, + "loss": 0.8047, + "step": 39806 + }, + { + "epoch": 1.02, + "learning_rate": 1.5366797357080752e-06, + "loss": 0.5901, + "step": 39807 + }, + { + "epoch": 1.02, + "learning_rate": 1.5366563875602326e-06, + "loss": 0.5474, + "step": 39808 + }, + { + "epoch": 1.02, + "learning_rate": 1.5366330390014968e-06, + "loss": 0.6614, + "step": 39809 + }, + { + "epoch": 1.02, + "learning_rate": 1.5366096900318857e-06, + "loss": 0.5698, + "step": 39810 + }, + { + "epoch": 1.02, + "learning_rate": 1.5365863406514175e-06, + "loss": 0.7891, + "step": 39811 + }, + { + "epoch": 1.02, + "learning_rate": 1.53656299086011e-06, + "loss": 0.5918, + "step": 39812 + }, + { + "epoch": 1.02, + "learning_rate": 1.5365396406579803e-06, + "loss": 0.6934, + "step": 39813 + }, + { + "epoch": 1.02, + "learning_rate": 1.5365162900450472e-06, + "loss": 0.6748, + "step": 39814 + }, + { + "epoch": 1.02, + "learning_rate": 1.5364929390213282e-06, + "loss": 0.7158, + "step": 39815 + }, + { + "epoch": 1.02, + "learning_rate": 1.5364695875868413e-06, + "loss": 0.5964, + "step": 39816 + }, + { + "epoch": 1.02, + "learning_rate": 1.5364462357416042e-06, + "loss": 0.6802, + "step": 39817 + }, + { + "epoch": 1.02, + "learning_rate": 1.5364228834856348e-06, + "loss": 0.6289, + "step": 39818 + }, + { + "epoch": 1.02, + "learning_rate": 1.5363995308189513e-06, + "loss": 0.7148, + "step": 39819 + }, + { + "epoch": 1.02, + "learning_rate": 1.5363761777415709e-06, + "loss": 0.6284, + "step": 39820 + }, + { + "epoch": 1.02, + "learning_rate": 1.5363528242535125e-06, + "loss": 0.5759, + "step": 39821 + }, + { + "epoch": 1.02, + "learning_rate": 1.536329470354793e-06, + "loss": 0.6553, + "step": 39822 + }, + { + "epoch": 1.02, + "learning_rate": 1.536306116045431e-06, + "loss": 0.7607, + "step": 39823 + }, + { + "epoch": 1.02, + "learning_rate": 1.5362827613254439e-06, + "loss": 0.6028, + "step": 39824 + }, + { + "epoch": 1.02, + "learning_rate": 1.5362594061948495e-06, + "loss": 0.7529, + "step": 39825 + }, + { + "epoch": 1.02, + "learning_rate": 1.5362360506536662e-06, + "loss": 0.7109, + "step": 39826 + }, + { + "epoch": 1.02, + "learning_rate": 1.5362126947019117e-06, + "loss": 0.6807, + "step": 39827 + }, + { + "epoch": 1.02, + "learning_rate": 1.5361893383396035e-06, + "loss": 0.7119, + "step": 39828 + }, + { + "epoch": 1.02, + "learning_rate": 1.5361659815667603e-06, + "loss": 0.6089, + "step": 39829 + }, + { + "epoch": 1.02, + "learning_rate": 1.5361426243833991e-06, + "loss": 0.6367, + "step": 39830 + }, + { + "epoch": 1.02, + "learning_rate": 1.5361192667895383e-06, + "loss": 0.7227, + "step": 39831 + }, + { + "epoch": 1.02, + "learning_rate": 1.5360959087851955e-06, + "loss": 0.709, + "step": 39832 + }, + { + "epoch": 1.02, + "learning_rate": 1.5360725503703886e-06, + "loss": 0.5898, + "step": 39833 + }, + { + "epoch": 1.02, + "learning_rate": 1.5360491915451354e-06, + "loss": 0.6582, + "step": 39834 + }, + { + "epoch": 1.02, + "learning_rate": 1.5360258323094547e-06, + "loss": 0.6504, + "step": 39835 + }, + { + "epoch": 1.02, + "learning_rate": 1.5360024726633628e-06, + "loss": 0.6865, + "step": 39836 + }, + { + "epoch": 1.02, + "learning_rate": 1.535979112606879e-06, + "loss": 0.9023, + "step": 39837 + }, + { + "epoch": 1.02, + "learning_rate": 1.5359557521400209e-06, + "loss": 0.6975, + "step": 39838 + }, + { + "epoch": 1.02, + "learning_rate": 1.5359323912628058e-06, + "loss": 0.6826, + "step": 39839 + }, + { + "epoch": 1.02, + "learning_rate": 1.5359090299752517e-06, + "loss": 0.5283, + "step": 39840 + }, + { + "epoch": 1.02, + "learning_rate": 1.535885668277377e-06, + "loss": 0.5005, + "step": 39841 + }, + { + "epoch": 1.02, + "learning_rate": 1.5358623061691991e-06, + "loss": 0.7832, + "step": 39842 + }, + { + "epoch": 1.02, + "learning_rate": 1.5358389436507361e-06, + "loss": 0.5991, + "step": 39843 + }, + { + "epoch": 1.02, + "learning_rate": 1.535815580722006e-06, + "loss": 0.7559, + "step": 39844 + }, + { + "epoch": 1.02, + "learning_rate": 1.5357922173830262e-06, + "loss": 0.8691, + "step": 39845 + }, + { + "epoch": 1.02, + "learning_rate": 1.5357688536338152e-06, + "loss": 0.7656, + "step": 39846 + }, + { + "epoch": 1.02, + "learning_rate": 1.5357454894743907e-06, + "loss": 0.7383, + "step": 39847 + }, + { + "epoch": 1.02, + "learning_rate": 1.5357221249047705e-06, + "loss": 0.7637, + "step": 39848 + }, + { + "epoch": 1.02, + "learning_rate": 1.5356987599249723e-06, + "loss": 0.6816, + "step": 39849 + }, + { + "epoch": 1.02, + "learning_rate": 1.5356753945350142e-06, + "loss": 0.834, + "step": 39850 + }, + { + "epoch": 1.02, + "learning_rate": 1.5356520287349142e-06, + "loss": 0.5518, + "step": 39851 + }, + { + "epoch": 1.02, + "learning_rate": 1.5356286625246903e-06, + "loss": 0.8203, + "step": 39852 + }, + { + "epoch": 1.02, + "learning_rate": 1.53560529590436e-06, + "loss": 0.6973, + "step": 39853 + }, + { + "epoch": 1.02, + "learning_rate": 1.5355819288739413e-06, + "loss": 0.6528, + "step": 39854 + }, + { + "epoch": 1.02, + "learning_rate": 1.5355585614334518e-06, + "loss": 0.6592, + "step": 39855 + }, + { + "epoch": 1.02, + "learning_rate": 1.53553519358291e-06, + "loss": 0.6421, + "step": 39856 + }, + { + "epoch": 1.02, + "learning_rate": 1.5355118253223341e-06, + "loss": 0.7949, + "step": 39857 + }, + { + "epoch": 1.02, + "learning_rate": 1.5354884566517408e-06, + "loss": 0.5146, + "step": 39858 + }, + { + "epoch": 1.02, + "learning_rate": 1.5354650875711486e-06, + "loss": 0.7031, + "step": 39859 + }, + { + "epoch": 1.02, + "learning_rate": 1.5354417180805754e-06, + "loss": 0.8262, + "step": 39860 + }, + { + "epoch": 1.02, + "learning_rate": 1.5354183481800394e-06, + "loss": 0.8018, + "step": 39861 + }, + { + "epoch": 1.02, + "learning_rate": 1.535394977869558e-06, + "loss": 0.7148, + "step": 39862 + }, + { + "epoch": 1.02, + "learning_rate": 1.5353716071491491e-06, + "loss": 0.6504, + "step": 39863 + }, + { + "epoch": 1.02, + "learning_rate": 1.535348236018831e-06, + "loss": 0.7983, + "step": 39864 + }, + { + "epoch": 1.02, + "learning_rate": 1.5353248644786212e-06, + "loss": 0.4907, + "step": 39865 + }, + { + "epoch": 1.02, + "learning_rate": 1.5353014925285382e-06, + "loss": 0.6396, + "step": 39866 + }, + { + "epoch": 1.02, + "learning_rate": 1.5352781201685991e-06, + "loss": 0.7568, + "step": 39867 + }, + { + "epoch": 1.02, + "learning_rate": 1.535254747398822e-06, + "loss": 0.749, + "step": 39868 + }, + { + "epoch": 1.02, + "learning_rate": 1.5352313742192253e-06, + "loss": 0.5503, + "step": 39869 + }, + { + "epoch": 1.02, + "learning_rate": 1.5352080006298263e-06, + "loss": 0.6826, + "step": 39870 + }, + { + "epoch": 1.02, + "learning_rate": 1.5351846266306434e-06, + "loss": 0.7217, + "step": 39871 + }, + { + "epoch": 1.02, + "learning_rate": 1.5351612522216941e-06, + "loss": 0.5281, + "step": 39872 + }, + { + "epoch": 1.02, + "learning_rate": 1.5351378774029967e-06, + "loss": 0.751, + "step": 39873 + }, + { + "epoch": 1.02, + "learning_rate": 1.5351145021745682e-06, + "loss": 0.5488, + "step": 39874 + }, + { + "epoch": 1.02, + "learning_rate": 1.5350911265364278e-06, + "loss": 0.5591, + "step": 39875 + }, + { + "epoch": 1.02, + "learning_rate": 1.5350677504885924e-06, + "loss": 0.6875, + "step": 39876 + }, + { + "epoch": 1.02, + "learning_rate": 1.5350443740310803e-06, + "loss": 0.8057, + "step": 39877 + }, + { + "epoch": 1.02, + "learning_rate": 1.5350209971639093e-06, + "loss": 0.6504, + "step": 39878 + }, + { + "epoch": 1.02, + "learning_rate": 1.5349976198870972e-06, + "loss": 0.8184, + "step": 39879 + }, + { + "epoch": 1.02, + "learning_rate": 1.5349742422006622e-06, + "loss": 0.6992, + "step": 39880 + }, + { + "epoch": 1.02, + "learning_rate": 1.5349508641046219e-06, + "loss": 0.439, + "step": 39881 + }, + { + "epoch": 1.02, + "learning_rate": 1.5349274855989944e-06, + "loss": 0.5938, + "step": 39882 + }, + { + "epoch": 1.02, + "learning_rate": 1.5349041066837974e-06, + "loss": 0.6719, + "step": 39883 + }, + { + "epoch": 1.02, + "learning_rate": 1.5348807273590492e-06, + "loss": 0.6079, + "step": 39884 + }, + { + "epoch": 1.02, + "learning_rate": 1.5348573476247674e-06, + "loss": 0.9473, + "step": 39885 + }, + { + "epoch": 1.02, + "learning_rate": 1.5348339674809694e-06, + "loss": 0.7949, + "step": 39886 + }, + { + "epoch": 1.02, + "learning_rate": 1.5348105869276743e-06, + "loss": 0.792, + "step": 39887 + }, + { + "epoch": 1.02, + "learning_rate": 1.5347872059648988e-06, + "loss": 0.687, + "step": 39888 + }, + { + "epoch": 1.02, + "learning_rate": 1.5347638245926615e-06, + "loss": 0.7988, + "step": 39889 + }, + { + "epoch": 1.02, + "learning_rate": 1.5347404428109801e-06, + "loss": 0.4424, + "step": 39890 + }, + { + "epoch": 1.02, + "learning_rate": 1.5347170606198724e-06, + "loss": 0.709, + "step": 39891 + }, + { + "epoch": 1.02, + "learning_rate": 1.5346936780193569e-06, + "loss": 0.689, + "step": 39892 + }, + { + "epoch": 1.02, + "learning_rate": 1.5346702950094508e-06, + "loss": 0.7031, + "step": 39893 + }, + { + "epoch": 1.02, + "learning_rate": 1.534646911590172e-06, + "loss": 0.6973, + "step": 39894 + }, + { + "epoch": 1.02, + "learning_rate": 1.534623527761539e-06, + "loss": 0.5742, + "step": 39895 + }, + { + "epoch": 1.02, + "learning_rate": 1.5346001435235691e-06, + "loss": 0.6748, + "step": 39896 + }, + { + "epoch": 1.02, + "learning_rate": 1.5345767588762808e-06, + "loss": 0.6206, + "step": 39897 + }, + { + "epoch": 1.02, + "learning_rate": 1.5345533738196914e-06, + "loss": 0.6533, + "step": 39898 + }, + { + "epoch": 1.02, + "learning_rate": 1.5345299883538188e-06, + "loss": 0.6084, + "step": 39899 + }, + { + "epoch": 1.02, + "learning_rate": 1.5345066024786815e-06, + "loss": 0.7607, + "step": 39900 + }, + { + "epoch": 1.02, + "learning_rate": 1.5344832161942968e-06, + "loss": 0.5151, + "step": 39901 + }, + { + "epoch": 1.02, + "learning_rate": 1.5344598295006835e-06, + "loss": 0.6392, + "step": 39902 + }, + { + "epoch": 1.02, + "learning_rate": 1.5344364423978583e-06, + "loss": 0.6885, + "step": 39903 + }, + { + "epoch": 1.02, + "learning_rate": 1.53441305488584e-06, + "loss": 0.5474, + "step": 39904 + }, + { + "epoch": 1.02, + "learning_rate": 1.5343896669646459e-06, + "loss": 0.5845, + "step": 39905 + }, + { + "epoch": 1.02, + "learning_rate": 1.5343662786342944e-06, + "loss": 0.6343, + "step": 39906 + }, + { + "epoch": 1.02, + "learning_rate": 1.5343428898948032e-06, + "loss": 0.6787, + "step": 39907 + }, + { + "epoch": 1.02, + "learning_rate": 1.53431950074619e-06, + "loss": 0.7168, + "step": 39908 + }, + { + "epoch": 1.02, + "learning_rate": 1.5342961111884733e-06, + "loss": 0.7129, + "step": 39909 + }, + { + "epoch": 1.02, + "learning_rate": 1.5342727212216703e-06, + "loss": 0.7734, + "step": 39910 + }, + { + "epoch": 1.02, + "learning_rate": 1.5342493308457995e-06, + "loss": 0.6191, + "step": 39911 + }, + { + "epoch": 1.02, + "learning_rate": 1.5342259400608783e-06, + "loss": 0.6465, + "step": 39912 + }, + { + "epoch": 1.02, + "learning_rate": 1.5342025488669253e-06, + "loss": 0.5762, + "step": 39913 + }, + { + "epoch": 1.02, + "learning_rate": 1.5341791572639572e-06, + "loss": 0.6621, + "step": 39914 + }, + { + "epoch": 1.02, + "learning_rate": 1.5341557652519934e-06, + "loss": 0.5371, + "step": 39915 + }, + { + "epoch": 1.02, + "learning_rate": 1.5341323728310509e-06, + "loss": 0.7539, + "step": 39916 + }, + { + "epoch": 1.02, + "learning_rate": 1.534108980001148e-06, + "loss": 0.3804, + "step": 39917 + }, + { + "epoch": 1.02, + "learning_rate": 1.534085586762302e-06, + "loss": 0.5312, + "step": 39918 + }, + { + "epoch": 1.02, + "learning_rate": 1.5340621931145314e-06, + "loss": 0.792, + "step": 39919 + }, + { + "epoch": 1.02, + "learning_rate": 1.534038799057854e-06, + "loss": 0.5249, + "step": 39920 + }, + { + "epoch": 1.02, + "learning_rate": 1.5340154045922874e-06, + "loss": 0.6099, + "step": 39921 + }, + { + "epoch": 1.02, + "learning_rate": 1.53399200971785e-06, + "loss": 0.5615, + "step": 39922 + }, + { + "epoch": 1.02, + "learning_rate": 1.5339686144345594e-06, + "loss": 0.5557, + "step": 39923 + }, + { + "epoch": 1.02, + "learning_rate": 1.5339452187424334e-06, + "loss": 0.6331, + "step": 39924 + }, + { + "epoch": 1.02, + "learning_rate": 1.5339218226414902e-06, + "loss": 0.7031, + "step": 39925 + }, + { + "epoch": 1.02, + "learning_rate": 1.5338984261317478e-06, + "loss": 0.5605, + "step": 39926 + }, + { + "epoch": 1.02, + "learning_rate": 1.5338750292132238e-06, + "loss": 0.6157, + "step": 39927 + }, + { + "epoch": 1.02, + "learning_rate": 1.5338516318859366e-06, + "loss": 0.4756, + "step": 39928 + }, + { + "epoch": 1.02, + "learning_rate": 1.5338282341499032e-06, + "loss": 0.5137, + "step": 39929 + }, + { + "epoch": 1.02, + "learning_rate": 1.5338048360051423e-06, + "loss": 0.7598, + "step": 39930 + }, + { + "epoch": 1.02, + "learning_rate": 1.5337814374516716e-06, + "loss": 0.3391, + "step": 39931 + }, + { + "epoch": 1.02, + "learning_rate": 1.533758038489509e-06, + "loss": 0.5732, + "step": 39932 + }, + { + "epoch": 1.02, + "learning_rate": 1.533734639118672e-06, + "loss": 0.8906, + "step": 39933 + }, + { + "epoch": 1.02, + "learning_rate": 1.5337112393391796e-06, + "loss": 0.7627, + "step": 39934 + }, + { + "epoch": 1.02, + "learning_rate": 1.5336878391510487e-06, + "loss": 0.6836, + "step": 39935 + }, + { + "epoch": 1.02, + "learning_rate": 1.5336644385542977e-06, + "loss": 0.6807, + "step": 39936 + }, + { + "epoch": 1.02, + "learning_rate": 1.5336410375489442e-06, + "loss": 0.6533, + "step": 39937 + }, + { + "epoch": 1.02, + "learning_rate": 1.5336176361350063e-06, + "loss": 0.6245, + "step": 39938 + }, + { + "epoch": 1.02, + "learning_rate": 1.533594234312502e-06, + "loss": 0.7783, + "step": 39939 + }, + { + "epoch": 1.02, + "learning_rate": 1.533570832081449e-06, + "loss": 0.6924, + "step": 39940 + }, + { + "epoch": 1.02, + "learning_rate": 1.5335474294418655e-06, + "loss": 0.6482, + "step": 39941 + }, + { + "epoch": 1.02, + "learning_rate": 1.5335240263937697e-06, + "loss": 0.6465, + "step": 39942 + }, + { + "epoch": 1.02, + "learning_rate": 1.5335006229371784e-06, + "loss": 0.5586, + "step": 39943 + }, + { + "epoch": 1.02, + "learning_rate": 1.5334772190721103e-06, + "loss": 0.5581, + "step": 39944 + }, + { + "epoch": 1.02, + "learning_rate": 1.5334538147985833e-06, + "loss": 0.8262, + "step": 39945 + }, + { + "epoch": 1.02, + "learning_rate": 1.5334304101166153e-06, + "loss": 0.5095, + "step": 39946 + }, + { + "epoch": 1.02, + "learning_rate": 1.5334070050262243e-06, + "loss": 0.6821, + "step": 39947 + }, + { + "epoch": 1.02, + "learning_rate": 1.533383599527428e-06, + "loss": 0.6934, + "step": 39948 + }, + { + "epoch": 1.02, + "learning_rate": 1.5333601936202442e-06, + "loss": 0.5542, + "step": 39949 + }, + { + "epoch": 1.02, + "learning_rate": 1.5333367873046914e-06, + "loss": 0.7803, + "step": 39950 + }, + { + "epoch": 1.02, + "learning_rate": 1.5333133805807866e-06, + "loss": 0.623, + "step": 39951 + }, + { + "epoch": 1.02, + "learning_rate": 1.5332899734485488e-06, + "loss": 0.7168, + "step": 39952 + }, + { + "epoch": 1.02, + "learning_rate": 1.5332665659079951e-06, + "loss": 0.7676, + "step": 39953 + }, + { + "epoch": 1.02, + "learning_rate": 1.5332431579591436e-06, + "loss": 0.7676, + "step": 39954 + }, + { + "epoch": 1.02, + "learning_rate": 1.5332197496020127e-06, + "loss": 0.548, + "step": 39955 + }, + { + "epoch": 1.02, + "learning_rate": 1.5331963408366196e-06, + "loss": 0.6362, + "step": 39956 + }, + { + "epoch": 1.02, + "learning_rate": 1.5331729316629828e-06, + "loss": 0.6045, + "step": 39957 + }, + { + "epoch": 1.02, + "learning_rate": 1.53314952208112e-06, + "loss": 0.5684, + "step": 39958 + }, + { + "epoch": 1.02, + "learning_rate": 1.533126112091049e-06, + "loss": 0.6631, + "step": 39959 + }, + { + "epoch": 1.02, + "learning_rate": 1.5331027016927878e-06, + "loss": 0.7109, + "step": 39960 + }, + { + "epoch": 1.02, + "learning_rate": 1.5330792908863548e-06, + "loss": 0.5767, + "step": 39961 + }, + { + "epoch": 1.02, + "learning_rate": 1.533055879671767e-06, + "loss": 0.7832, + "step": 39962 + }, + { + "epoch": 1.02, + "learning_rate": 1.5330324680490432e-06, + "loss": 0.6934, + "step": 39963 + }, + { + "epoch": 1.02, + "learning_rate": 1.5330090560182006e-06, + "loss": 0.4683, + "step": 39964 + }, + { + "epoch": 1.02, + "learning_rate": 1.5329856435792578e-06, + "loss": 0.708, + "step": 39965 + }, + { + "epoch": 1.02, + "learning_rate": 1.532962230732232e-06, + "loss": 1.0166, + "step": 39966 + }, + { + "epoch": 1.02, + "learning_rate": 1.532938817477142e-06, + "loss": 0.624, + "step": 39967 + }, + { + "epoch": 1.02, + "learning_rate": 1.5329154038140048e-06, + "loss": 0.7012, + "step": 39968 + }, + { + "epoch": 1.02, + "learning_rate": 1.5328919897428392e-06, + "loss": 0.7021, + "step": 39969 + }, + { + "epoch": 1.02, + "learning_rate": 1.5328685752636625e-06, + "loss": 0.5493, + "step": 39970 + }, + { + "epoch": 1.02, + "learning_rate": 1.5328451603764929e-06, + "loss": 0.3893, + "step": 39971 + }, + { + "epoch": 1.02, + "learning_rate": 1.5328217450813482e-06, + "loss": 0.7178, + "step": 39972 + }, + { + "epoch": 1.02, + "learning_rate": 1.532798329378246e-06, + "loss": 0.6191, + "step": 39973 + }, + { + "epoch": 1.02, + "learning_rate": 1.5327749132672051e-06, + "loss": 0.6021, + "step": 39974 + }, + { + "epoch": 1.02, + "learning_rate": 1.532751496748243e-06, + "loss": 0.4719, + "step": 39975 + }, + { + "epoch": 1.02, + "learning_rate": 1.5327280798213774e-06, + "loss": 0.3678, + "step": 39976 + }, + { + "epoch": 1.02, + "learning_rate": 1.5327046624866265e-06, + "loss": 0.7578, + "step": 39977 + }, + { + "epoch": 1.02, + "learning_rate": 1.5326812447440082e-06, + "loss": 0.6382, + "step": 39978 + }, + { + "epoch": 1.02, + "learning_rate": 1.5326578265935402e-06, + "loss": 0.7344, + "step": 39979 + }, + { + "epoch": 1.02, + "learning_rate": 1.5326344080352404e-06, + "loss": 0.6094, + "step": 39980 + }, + { + "epoch": 1.02, + "learning_rate": 1.532610989069127e-06, + "loss": 0.5164, + "step": 39981 + }, + { + "epoch": 1.02, + "learning_rate": 1.5325875696952184e-06, + "loss": 0.6621, + "step": 39982 + }, + { + "epoch": 1.02, + "learning_rate": 1.5325641499135316e-06, + "loss": 0.6401, + "step": 39983 + }, + { + "epoch": 1.02, + "learning_rate": 1.5325407297240848e-06, + "loss": 0.5835, + "step": 39984 + }, + { + "epoch": 1.02, + "learning_rate": 1.5325173091268959e-06, + "loss": 0.6631, + "step": 39985 + }, + { + "epoch": 1.02, + "learning_rate": 1.5324938881219835e-06, + "loss": 0.6211, + "step": 39986 + }, + { + "epoch": 1.02, + "learning_rate": 1.5324704667093648e-06, + "loss": 0.666, + "step": 39987 + }, + { + "epoch": 1.02, + "learning_rate": 1.532447044889058e-06, + "loss": 0.6143, + "step": 39988 + }, + { + "epoch": 1.02, + "learning_rate": 1.5324236226610807e-06, + "loss": 0.5378, + "step": 39989 + }, + { + "epoch": 1.02, + "learning_rate": 1.5324002000254515e-06, + "loss": 0.4078, + "step": 39990 + }, + { + "epoch": 1.02, + "learning_rate": 1.5323767769821876e-06, + "loss": 0.709, + "step": 39991 + }, + { + "epoch": 1.03, + "learning_rate": 1.5323533535313076e-06, + "loss": 0.5715, + "step": 39992 + }, + { + "epoch": 1.03, + "learning_rate": 1.5323299296728287e-06, + "loss": 0.6367, + "step": 39993 + }, + { + "epoch": 1.03, + "learning_rate": 1.5323065054067697e-06, + "loss": 0.574, + "step": 39994 + }, + { + "epoch": 1.03, + "learning_rate": 1.5322830807331476e-06, + "loss": 0.5374, + "step": 39995 + }, + { + "epoch": 1.03, + "learning_rate": 1.5322596556519814e-06, + "loss": 0.5913, + "step": 39996 + }, + { + "epoch": 1.03, + "learning_rate": 1.532236230163288e-06, + "loss": 0.6362, + "step": 39997 + }, + { + "epoch": 1.03, + "learning_rate": 1.5322128042670862e-06, + "loss": 0.6562, + "step": 39998 + }, + { + "epoch": 1.03, + "learning_rate": 1.5321893779633933e-06, + "loss": 0.8408, + "step": 39999 + }, + { + "epoch": 1.03, + "learning_rate": 1.5321659512522271e-06, + "loss": 0.4163, + "step": 40000 + }, + { + "epoch": 1.03, + "learning_rate": 1.5321425241336063e-06, + "loss": 0.6865, + "step": 40001 + }, + { + "epoch": 1.03, + "learning_rate": 1.5321190966075483e-06, + "loss": 0.6602, + "step": 40002 + }, + { + "epoch": 1.03, + "learning_rate": 1.5320956686740716e-06, + "loss": 0.6118, + "step": 40003 + }, + { + "epoch": 1.03, + "learning_rate": 1.5320722403331931e-06, + "loss": 0.7441, + "step": 40004 + }, + { + "epoch": 1.03, + "learning_rate": 1.5320488115849318e-06, + "loss": 0.751, + "step": 40005 + }, + { + "epoch": 1.03, + "learning_rate": 1.5320253824293047e-06, + "loss": 0.7861, + "step": 40006 + }, + { + "epoch": 1.03, + "learning_rate": 1.5320019528663309e-06, + "loss": 0.8857, + "step": 40007 + }, + { + "epoch": 1.03, + "learning_rate": 1.5319785228960272e-06, + "loss": 0.748, + "step": 40008 + }, + { + "epoch": 1.03, + "learning_rate": 1.531955092518412e-06, + "loss": 0.8262, + "step": 40009 + }, + { + "epoch": 1.03, + "learning_rate": 1.5319316617335033e-06, + "loss": 0.605, + "step": 40010 + }, + { + "epoch": 1.03, + "learning_rate": 1.5319082305413192e-06, + "loss": 0.7568, + "step": 40011 + }, + { + "epoch": 1.03, + "learning_rate": 1.5318847989418774e-06, + "loss": 0.7148, + "step": 40012 + }, + { + "epoch": 1.03, + "learning_rate": 1.5318613669351957e-06, + "loss": 0.5557, + "step": 40013 + }, + { + "epoch": 1.03, + "learning_rate": 1.531837934521292e-06, + "loss": 0.5977, + "step": 40014 + }, + { + "epoch": 1.03, + "learning_rate": 1.5318145017001846e-06, + "loss": 0.6162, + "step": 40015 + }, + { + "epoch": 1.03, + "learning_rate": 1.5317910684718913e-06, + "loss": 0.7354, + "step": 40016 + }, + { + "epoch": 1.03, + "learning_rate": 1.5317676348364304e-06, + "loss": 0.7217, + "step": 40017 + }, + { + "epoch": 1.03, + "learning_rate": 1.531744200793819e-06, + "loss": 0.7539, + "step": 40018 + }, + { + "epoch": 1.03, + "learning_rate": 1.5317207663440758e-06, + "loss": 0.7168, + "step": 40019 + }, + { + "epoch": 1.03, + "learning_rate": 1.5316973314872183e-06, + "loss": 0.7676, + "step": 40020 + }, + { + "epoch": 1.03, + "learning_rate": 1.5316738962232648e-06, + "loss": 0.3967, + "step": 40021 + }, + { + "epoch": 1.03, + "learning_rate": 1.5316504605522328e-06, + "loss": 0.6851, + "step": 40022 + }, + { + "epoch": 1.03, + "learning_rate": 1.5316270244741405e-06, + "loss": 0.6279, + "step": 40023 + }, + { + "epoch": 1.03, + "learning_rate": 1.531603587989006e-06, + "loss": 0.749, + "step": 40024 + }, + { + "epoch": 1.03, + "learning_rate": 1.531580151096847e-06, + "loss": 0.6885, + "step": 40025 + }, + { + "epoch": 1.03, + "learning_rate": 1.5315567137976815e-06, + "loss": 0.6621, + "step": 40026 + }, + { + "epoch": 1.03, + "learning_rate": 1.5315332760915273e-06, + "loss": 0.75, + "step": 40027 + }, + { + "epoch": 1.03, + "learning_rate": 1.5315098379784028e-06, + "loss": 0.7656, + "step": 40028 + }, + { + "epoch": 1.03, + "learning_rate": 1.5314863994583257e-06, + "loss": 0.7422, + "step": 40029 + }, + { + "epoch": 1.03, + "learning_rate": 1.5314629605313139e-06, + "loss": 0.7554, + "step": 40030 + }, + { + "epoch": 1.03, + "learning_rate": 1.531439521197385e-06, + "loss": 0.7061, + "step": 40031 + }, + { + "epoch": 1.03, + "learning_rate": 1.5314160814565576e-06, + "loss": 0.5337, + "step": 40032 + }, + { + "epoch": 1.03, + "learning_rate": 1.5313926413088491e-06, + "loss": 0.6836, + "step": 40033 + }, + { + "epoch": 1.03, + "learning_rate": 1.5313692007542777e-06, + "loss": 0.5894, + "step": 40034 + }, + { + "epoch": 1.03, + "learning_rate": 1.5313457597928613e-06, + "loss": 0.6274, + "step": 40035 + }, + { + "epoch": 1.03, + "learning_rate": 1.5313223184246184e-06, + "loss": 0.5244, + "step": 40036 + }, + { + "epoch": 1.03, + "learning_rate": 1.5312988766495663e-06, + "loss": 0.7549, + "step": 40037 + }, + { + "epoch": 1.03, + "learning_rate": 1.5312754344677228e-06, + "loss": 0.6191, + "step": 40038 + }, + { + "epoch": 1.03, + "learning_rate": 1.531251991879106e-06, + "loss": 0.7412, + "step": 40039 + }, + { + "epoch": 1.03, + "learning_rate": 1.5312285488837343e-06, + "loss": 0.6274, + "step": 40040 + }, + { + "epoch": 1.03, + "learning_rate": 1.531205105481625e-06, + "loss": 0.6226, + "step": 40041 + }, + { + "epoch": 1.03, + "learning_rate": 1.5311816616727967e-06, + "loss": 0.5518, + "step": 40042 + }, + { + "epoch": 1.03, + "learning_rate": 1.5311582174572667e-06, + "loss": 0.6279, + "step": 40043 + }, + { + "epoch": 1.03, + "learning_rate": 1.5311347728350533e-06, + "loss": 0.7998, + "step": 40044 + }, + { + "epoch": 1.03, + "learning_rate": 1.5311113278061748e-06, + "loss": 0.4695, + "step": 40045 + }, + { + "epoch": 1.03, + "learning_rate": 1.5310878823706488e-06, + "loss": 0.4496, + "step": 40046 + }, + { + "epoch": 1.03, + "learning_rate": 1.531064436528493e-06, + "loss": 0.6616, + "step": 40047 + }, + { + "epoch": 1.03, + "learning_rate": 1.5310409902797255e-06, + "loss": 0.7847, + "step": 40048 + }, + { + "epoch": 1.03, + "learning_rate": 1.5310175436243643e-06, + "loss": 0.3989, + "step": 40049 + }, + { + "epoch": 1.03, + "learning_rate": 1.5309940965624276e-06, + "loss": 0.7168, + "step": 40050 + }, + { + "epoch": 1.03, + "learning_rate": 1.5309706490939332e-06, + "loss": 0.6265, + "step": 40051 + }, + { + "epoch": 1.03, + "learning_rate": 1.5309472012188986e-06, + "loss": 0.7598, + "step": 40052 + }, + { + "epoch": 1.03, + "learning_rate": 1.5309237529373423e-06, + "loss": 0.7852, + "step": 40053 + }, + { + "epoch": 1.03, + "learning_rate": 1.530900304249282e-06, + "loss": 0.8076, + "step": 40054 + }, + { + "epoch": 1.03, + "learning_rate": 1.5308768551547362e-06, + "loss": 0.6206, + "step": 40055 + }, + { + "epoch": 1.03, + "learning_rate": 1.5308534056537221e-06, + "loss": 0.5889, + "step": 40056 + }, + { + "epoch": 1.03, + "learning_rate": 1.530829955746258e-06, + "loss": 0.5874, + "step": 40057 + }, + { + "epoch": 1.03, + "learning_rate": 1.5308065054323618e-06, + "loss": 0.5835, + "step": 40058 + }, + { + "epoch": 1.03, + "learning_rate": 1.5307830547120512e-06, + "loss": 0.7793, + "step": 40059 + }, + { + "epoch": 1.03, + "learning_rate": 1.5307596035853448e-06, + "loss": 0.4873, + "step": 40060 + }, + { + "epoch": 1.03, + "learning_rate": 1.53073615205226e-06, + "loss": 0.6042, + "step": 40061 + }, + { + "epoch": 1.03, + "learning_rate": 1.530712700112815e-06, + "loss": 0.6704, + "step": 40062 + }, + { + "epoch": 1.03, + "learning_rate": 1.5306892477670274e-06, + "loss": 0.5781, + "step": 40063 + }, + { + "epoch": 1.03, + "learning_rate": 1.530665795014916e-06, + "loss": 0.709, + "step": 40064 + }, + { + "epoch": 1.03, + "learning_rate": 1.530642341856498e-06, + "loss": 0.6172, + "step": 40065 + }, + { + "epoch": 1.03, + "learning_rate": 1.5306188882917913e-06, + "loss": 0.8125, + "step": 40066 + }, + { + "epoch": 1.03, + "learning_rate": 1.5305954343208143e-06, + "loss": 0.5051, + "step": 40067 + }, + { + "epoch": 1.03, + "learning_rate": 1.5305719799435849e-06, + "loss": 0.552, + "step": 40068 + }, + { + "epoch": 1.03, + "learning_rate": 1.5305485251601207e-06, + "loss": 0.5005, + "step": 40069 + }, + { + "epoch": 1.03, + "learning_rate": 1.53052506997044e-06, + "loss": 0.7725, + "step": 40070 + }, + { + "epoch": 1.03, + "learning_rate": 1.5305016143745606e-06, + "loss": 0.6914, + "step": 40071 + }, + { + "epoch": 1.03, + "learning_rate": 1.5304781583725007e-06, + "loss": 0.4951, + "step": 40072 + }, + { + "epoch": 1.03, + "learning_rate": 1.5304547019642777e-06, + "loss": 0.6904, + "step": 40073 + }, + { + "epoch": 1.03, + "learning_rate": 1.5304312451499102e-06, + "loss": 0.6763, + "step": 40074 + }, + { + "epoch": 1.03, + "learning_rate": 1.5304077879294158e-06, + "loss": 0.7197, + "step": 40075 + }, + { + "epoch": 1.03, + "learning_rate": 1.5303843303028127e-06, + "loss": 0.6592, + "step": 40076 + }, + { + "epoch": 1.03, + "learning_rate": 1.5303608722701183e-06, + "loss": 0.5654, + "step": 40077 + }, + { + "epoch": 1.03, + "learning_rate": 1.5303374138313515e-06, + "loss": 0.7197, + "step": 40078 + }, + { + "epoch": 1.03, + "learning_rate": 1.530313954986529e-06, + "loss": 0.8125, + "step": 40079 + }, + { + "epoch": 1.03, + "learning_rate": 1.53029049573567e-06, + "loss": 0.7539, + "step": 40080 + }, + { + "epoch": 1.03, + "learning_rate": 1.5302670360787921e-06, + "loss": 0.7021, + "step": 40081 + }, + { + "epoch": 1.03, + "learning_rate": 1.530243576015913e-06, + "loss": 0.7354, + "step": 40082 + }, + { + "epoch": 1.03, + "learning_rate": 1.5302201155470505e-06, + "loss": 0.7627, + "step": 40083 + }, + { + "epoch": 1.03, + "learning_rate": 1.530196654672223e-06, + "loss": 0.7998, + "step": 40084 + }, + { + "epoch": 1.03, + "learning_rate": 1.5301731933914483e-06, + "loss": 0.6699, + "step": 40085 + }, + { + "epoch": 1.03, + "learning_rate": 1.5301497317047444e-06, + "loss": 0.7012, + "step": 40086 + }, + { + "epoch": 1.03, + "learning_rate": 1.5301262696121294e-06, + "loss": 0.6523, + "step": 40087 + }, + { + "epoch": 1.03, + "learning_rate": 1.5301028071136207e-06, + "loss": 0.5261, + "step": 40088 + }, + { + "epoch": 1.03, + "learning_rate": 1.5300793442092368e-06, + "loss": 0.5742, + "step": 40089 + }, + { + "epoch": 1.03, + "learning_rate": 1.5300558808989957e-06, + "loss": 0.6553, + "step": 40090 + }, + { + "epoch": 1.03, + "learning_rate": 1.530032417182915e-06, + "loss": 0.4331, + "step": 40091 + }, + { + "epoch": 1.03, + "learning_rate": 1.530008953061013e-06, + "loss": 0.323, + "step": 40092 + }, + { + "epoch": 1.03, + "learning_rate": 1.5299854885333075e-06, + "loss": 0.6792, + "step": 40093 + }, + { + "epoch": 1.03, + "learning_rate": 1.5299620235998164e-06, + "loss": 0.8057, + "step": 40094 + }, + { + "epoch": 1.03, + "learning_rate": 1.5299385582605578e-06, + "loss": 0.5281, + "step": 40095 + }, + { + "epoch": 1.03, + "learning_rate": 1.5299150925155494e-06, + "loss": 0.5332, + "step": 40096 + }, + { + "epoch": 1.03, + "learning_rate": 1.5298916263648098e-06, + "loss": 0.6755, + "step": 40097 + }, + { + "epoch": 1.03, + "learning_rate": 1.5298681598083561e-06, + "loss": 0.5093, + "step": 40098 + }, + { + "epoch": 1.03, + "learning_rate": 1.529844692846207e-06, + "loss": 0.7188, + "step": 40099 + }, + { + "epoch": 1.03, + "learning_rate": 1.52982122547838e-06, + "loss": 0.6885, + "step": 40100 + }, + { + "epoch": 1.03, + "learning_rate": 1.5297977577048936e-06, + "loss": 0.8369, + "step": 40101 + }, + { + "epoch": 1.03, + "learning_rate": 1.5297742895257647e-06, + "loss": 0.5625, + "step": 40102 + }, + { + "epoch": 1.03, + "learning_rate": 1.5297508209410128e-06, + "loss": 0.5566, + "step": 40103 + }, + { + "epoch": 1.03, + "learning_rate": 1.5297273519506547e-06, + "loss": 0.5703, + "step": 40104 + }, + { + "epoch": 1.03, + "learning_rate": 1.5297038825547086e-06, + "loss": 0.6631, + "step": 40105 + }, + { + "epoch": 1.03, + "learning_rate": 1.5296804127531927e-06, + "loss": 0.7656, + "step": 40106 + }, + { + "epoch": 1.03, + "learning_rate": 1.5296569425461247e-06, + "loss": 0.6313, + "step": 40107 + }, + { + "epoch": 1.03, + "learning_rate": 1.5296334719335232e-06, + "loss": 0.6567, + "step": 40108 + }, + { + "epoch": 1.03, + "learning_rate": 1.5296100009154054e-06, + "loss": 0.5757, + "step": 40109 + }, + { + "epoch": 1.03, + "learning_rate": 1.5295865294917895e-06, + "loss": 0.5737, + "step": 40110 + }, + { + "epoch": 1.03, + "learning_rate": 1.5295630576626937e-06, + "loss": 0.7334, + "step": 40111 + }, + { + "epoch": 1.03, + "learning_rate": 1.5295395854281358e-06, + "loss": 0.835, + "step": 40112 + }, + { + "epoch": 1.03, + "learning_rate": 1.5295161127881336e-06, + "loss": 0.6582, + "step": 40113 + }, + { + "epoch": 1.03, + "learning_rate": 1.5294926397427052e-06, + "loss": 0.6304, + "step": 40114 + }, + { + "epoch": 1.03, + "learning_rate": 1.5294691662918688e-06, + "loss": 0.5928, + "step": 40115 + }, + { + "epoch": 1.03, + "learning_rate": 1.5294456924356425e-06, + "loss": 0.5762, + "step": 40116 + }, + { + "epoch": 1.03, + "learning_rate": 1.5294222181740437e-06, + "loss": 0.7495, + "step": 40117 + }, + { + "epoch": 1.03, + "learning_rate": 1.5293987435070908e-06, + "loss": 0.5037, + "step": 40118 + }, + { + "epoch": 1.03, + "learning_rate": 1.5293752684348013e-06, + "loss": 0.8096, + "step": 40119 + }, + { + "epoch": 1.03, + "learning_rate": 1.5293517929571938e-06, + "loss": 0.5322, + "step": 40120 + }, + { + "epoch": 1.03, + "learning_rate": 1.5293283170742859e-06, + "loss": 0.647, + "step": 40121 + }, + { + "epoch": 1.03, + "learning_rate": 1.5293048407860956e-06, + "loss": 0.5542, + "step": 40122 + }, + { + "epoch": 1.03, + "learning_rate": 1.529281364092641e-06, + "loss": 0.7148, + "step": 40123 + }, + { + "epoch": 1.03, + "learning_rate": 1.5292578869939398e-06, + "loss": 0.7383, + "step": 40124 + }, + { + "epoch": 1.03, + "learning_rate": 1.52923440949001e-06, + "loss": 0.8379, + "step": 40125 + }, + { + "epoch": 1.03, + "learning_rate": 1.5292109315808703e-06, + "loss": 0.6348, + "step": 40126 + }, + { + "epoch": 1.03, + "learning_rate": 1.5291874532665378e-06, + "loss": 0.7217, + "step": 40127 + }, + { + "epoch": 1.03, + "learning_rate": 1.5291639745470311e-06, + "loss": 0.6802, + "step": 40128 + }, + { + "epoch": 1.03, + "learning_rate": 1.5291404954223674e-06, + "loss": 0.6924, + "step": 40129 + }, + { + "epoch": 1.03, + "learning_rate": 1.5291170158925657e-06, + "loss": 0.5718, + "step": 40130 + }, + { + "epoch": 1.03, + "learning_rate": 1.5290935359576432e-06, + "loss": 0.6719, + "step": 40131 + }, + { + "epoch": 1.03, + "learning_rate": 1.5290700556176177e-06, + "loss": 0.7363, + "step": 40132 + }, + { + "epoch": 1.03, + "learning_rate": 1.529046574872508e-06, + "loss": 0.6514, + "step": 40133 + }, + { + "epoch": 1.03, + "learning_rate": 1.5290230937223316e-06, + "loss": 0.5811, + "step": 40134 + }, + { + "epoch": 1.03, + "learning_rate": 1.5289996121671064e-06, + "loss": 0.6733, + "step": 40135 + }, + { + "epoch": 1.03, + "learning_rate": 1.5289761302068506e-06, + "loss": 0.6104, + "step": 40136 + }, + { + "epoch": 1.03, + "learning_rate": 1.5289526478415825e-06, + "loss": 0.6777, + "step": 40137 + }, + { + "epoch": 1.03, + "learning_rate": 1.528929165071319e-06, + "loss": 0.6885, + "step": 40138 + }, + { + "epoch": 1.03, + "learning_rate": 1.5289056818960792e-06, + "loss": 0.5776, + "step": 40139 + }, + { + "epoch": 1.03, + "learning_rate": 1.5288821983158803e-06, + "loss": 0.8545, + "step": 40140 + }, + { + "epoch": 1.03, + "learning_rate": 1.5288587143307412e-06, + "loss": 0.457, + "step": 40141 + }, + { + "epoch": 1.03, + "learning_rate": 1.5288352299406789e-06, + "loss": 0.6465, + "step": 40142 + }, + { + "epoch": 1.03, + "learning_rate": 1.528811745145712e-06, + "loss": 0.6455, + "step": 40143 + }, + { + "epoch": 1.03, + "learning_rate": 1.5287882599458577e-06, + "loss": 0.7646, + "step": 40144 + }, + { + "epoch": 1.03, + "learning_rate": 1.528764774341135e-06, + "loss": 0.6675, + "step": 40145 + }, + { + "epoch": 1.03, + "learning_rate": 1.5287412883315617e-06, + "loss": 0.6582, + "step": 40146 + }, + { + "epoch": 1.03, + "learning_rate": 1.5287178019171552e-06, + "loss": 0.5874, + "step": 40147 + }, + { + "epoch": 1.03, + "learning_rate": 1.5286943150979334e-06, + "loss": 0.6685, + "step": 40148 + }, + { + "epoch": 1.03, + "learning_rate": 1.528670827873915e-06, + "loss": 0.6104, + "step": 40149 + }, + { + "epoch": 1.03, + "learning_rate": 1.5286473402451176e-06, + "loss": 0.7251, + "step": 40150 + }, + { + "epoch": 1.03, + "learning_rate": 1.5286238522115596e-06, + "loss": 0.7666, + "step": 40151 + }, + { + "epoch": 1.03, + "learning_rate": 1.5286003637732585e-06, + "loss": 0.6807, + "step": 40152 + }, + { + "epoch": 1.03, + "learning_rate": 1.528576874930232e-06, + "loss": 0.5703, + "step": 40153 + }, + { + "epoch": 1.03, + "learning_rate": 1.5285533856824988e-06, + "loss": 0.6128, + "step": 40154 + }, + { + "epoch": 1.03, + "learning_rate": 1.5285298960300765e-06, + "loss": 0.6221, + "step": 40155 + }, + { + "epoch": 1.03, + "learning_rate": 1.5285064059729833e-06, + "loss": 0.8599, + "step": 40156 + }, + { + "epoch": 1.03, + "learning_rate": 1.528482915511237e-06, + "loss": 0.8066, + "step": 40157 + }, + { + "epoch": 1.03, + "learning_rate": 1.5284594246448555e-06, + "loss": 0.5361, + "step": 40158 + }, + { + "epoch": 1.03, + "learning_rate": 1.5284359333738567e-06, + "loss": 0.7178, + "step": 40159 + }, + { + "epoch": 1.03, + "learning_rate": 1.5284124416982592e-06, + "loss": 0.6611, + "step": 40160 + }, + { + "epoch": 1.03, + "learning_rate": 1.5283889496180807e-06, + "loss": 0.606, + "step": 40161 + }, + { + "epoch": 1.03, + "learning_rate": 1.5283654571333387e-06, + "loss": 0.9414, + "step": 40162 + }, + { + "epoch": 1.03, + "learning_rate": 1.5283419642440518e-06, + "loss": 0.5947, + "step": 40163 + }, + { + "epoch": 1.03, + "learning_rate": 1.5283184709502375e-06, + "loss": 0.4712, + "step": 40164 + }, + { + "epoch": 1.03, + "learning_rate": 1.5282949772519143e-06, + "loss": 0.7412, + "step": 40165 + }, + { + "epoch": 1.03, + "learning_rate": 1.5282714831490999e-06, + "loss": 0.5288, + "step": 40166 + }, + { + "epoch": 1.03, + "learning_rate": 1.5282479886418122e-06, + "loss": 0.5126, + "step": 40167 + }, + { + "epoch": 1.03, + "learning_rate": 1.5282244937300694e-06, + "loss": 0.6416, + "step": 40168 + }, + { + "epoch": 1.03, + "learning_rate": 1.5282009984138894e-06, + "loss": 0.5874, + "step": 40169 + }, + { + "epoch": 1.03, + "learning_rate": 1.5281775026932899e-06, + "loss": 0.6611, + "step": 40170 + }, + { + "epoch": 1.03, + "learning_rate": 1.5281540065682897e-06, + "loss": 0.54, + "step": 40171 + }, + { + "epoch": 1.03, + "learning_rate": 1.5281305100389059e-06, + "loss": 0.709, + "step": 40172 + }, + { + "epoch": 1.03, + "learning_rate": 1.5281070131051568e-06, + "loss": 0.8408, + "step": 40173 + }, + { + "epoch": 1.03, + "learning_rate": 1.5280835157670606e-06, + "loss": 0.6865, + "step": 40174 + }, + { + "epoch": 1.03, + "learning_rate": 1.528060018024635e-06, + "loss": 0.6738, + "step": 40175 + }, + { + "epoch": 1.03, + "learning_rate": 1.5280365198778982e-06, + "loss": 0.3823, + "step": 40176 + }, + { + "epoch": 1.03, + "learning_rate": 1.5280130213268682e-06, + "loss": 0.7544, + "step": 40177 + }, + { + "epoch": 1.03, + "learning_rate": 1.5279895223715628e-06, + "loss": 0.5664, + "step": 40178 + }, + { + "epoch": 1.03, + "learning_rate": 1.5279660230120005e-06, + "loss": 0.6162, + "step": 40179 + }, + { + "epoch": 1.03, + "learning_rate": 1.5279425232481982e-06, + "loss": 0.6191, + "step": 40180 + }, + { + "epoch": 1.03, + "learning_rate": 1.5279190230801754e-06, + "loss": 0.5186, + "step": 40181 + }, + { + "epoch": 1.03, + "learning_rate": 1.5278955225079484e-06, + "loss": 0.8008, + "step": 40182 + }, + { + "epoch": 1.03, + "learning_rate": 1.5278720215315363e-06, + "loss": 0.5017, + "step": 40183 + }, + { + "epoch": 1.03, + "learning_rate": 1.527848520150957e-06, + "loss": 0.7334, + "step": 40184 + }, + { + "epoch": 1.03, + "learning_rate": 1.5278250183662284e-06, + "loss": 0.5752, + "step": 40185 + }, + { + "epoch": 1.03, + "learning_rate": 1.5278015161773687e-06, + "loss": 0.6768, + "step": 40186 + }, + { + "epoch": 1.03, + "learning_rate": 1.5277780135843953e-06, + "loss": 0.7422, + "step": 40187 + }, + { + "epoch": 1.03, + "learning_rate": 1.5277545105873269e-06, + "loss": 0.5889, + "step": 40188 + }, + { + "epoch": 1.03, + "learning_rate": 1.5277310071861807e-06, + "loss": 0.6367, + "step": 40189 + }, + { + "epoch": 1.03, + "learning_rate": 1.5277075033809753e-06, + "loss": 0.7256, + "step": 40190 + }, + { + "epoch": 1.03, + "learning_rate": 1.5276839991717288e-06, + "loss": 0.7124, + "step": 40191 + }, + { + "epoch": 1.03, + "learning_rate": 1.5276604945584586e-06, + "loss": 0.6123, + "step": 40192 + }, + { + "epoch": 1.03, + "learning_rate": 1.527636989541183e-06, + "loss": 0.7227, + "step": 40193 + }, + { + "epoch": 1.03, + "learning_rate": 1.52761348411992e-06, + "loss": 0.6694, + "step": 40194 + }, + { + "epoch": 1.03, + "learning_rate": 1.5275899782946877e-06, + "loss": 0.5752, + "step": 40195 + }, + { + "epoch": 1.03, + "learning_rate": 1.5275664720655042e-06, + "loss": 0.6543, + "step": 40196 + }, + { + "epoch": 1.03, + "learning_rate": 1.5275429654323871e-06, + "loss": 0.6265, + "step": 40197 + }, + { + "epoch": 1.03, + "learning_rate": 1.5275194583953548e-06, + "loss": 0.5386, + "step": 40198 + }, + { + "epoch": 1.03, + "learning_rate": 1.527495950954425e-06, + "loss": 0.6895, + "step": 40199 + }, + { + "epoch": 1.03, + "learning_rate": 1.5274724431096155e-06, + "loss": 0.5701, + "step": 40200 + }, + { + "epoch": 1.03, + "learning_rate": 1.5274489348609449e-06, + "loss": 0.5483, + "step": 40201 + }, + { + "epoch": 1.03, + "learning_rate": 1.527425426208431e-06, + "loss": 0.644, + "step": 40202 + }, + { + "epoch": 1.03, + "learning_rate": 1.5274019171520914e-06, + "loss": 0.5747, + "step": 40203 + }, + { + "epoch": 1.03, + "learning_rate": 1.5273784076919447e-06, + "loss": 0.6504, + "step": 40204 + }, + { + "epoch": 1.03, + "learning_rate": 1.5273548978280081e-06, + "loss": 0.7119, + "step": 40205 + }, + { + "epoch": 1.03, + "learning_rate": 1.5273313875603009e-06, + "loss": 0.6074, + "step": 40206 + }, + { + "epoch": 1.03, + "learning_rate": 1.5273078768888397e-06, + "loss": 0.6978, + "step": 40207 + }, + { + "epoch": 1.03, + "learning_rate": 1.5272843658136437e-06, + "loss": 0.5632, + "step": 40208 + }, + { + "epoch": 1.03, + "learning_rate": 1.5272608543347297e-06, + "loss": 0.542, + "step": 40209 + }, + { + "epoch": 1.03, + "learning_rate": 1.5272373424521162e-06, + "loss": 0.7427, + "step": 40210 + }, + { + "epoch": 1.03, + "learning_rate": 1.5272138301658219e-06, + "loss": 0.6611, + "step": 40211 + }, + { + "epoch": 1.03, + "learning_rate": 1.527190317475864e-06, + "loss": 0.7188, + "step": 40212 + }, + { + "epoch": 1.03, + "learning_rate": 1.5271668043822605e-06, + "loss": 0.7275, + "step": 40213 + }, + { + "epoch": 1.03, + "learning_rate": 1.5271432908850299e-06, + "loss": 0.7222, + "step": 40214 + }, + { + "epoch": 1.03, + "learning_rate": 1.5271197769841897e-06, + "loss": 0.6519, + "step": 40215 + }, + { + "epoch": 1.03, + "learning_rate": 1.527096262679758e-06, + "loss": 0.5625, + "step": 40216 + }, + { + "epoch": 1.03, + "learning_rate": 1.5270727479717533e-06, + "loss": 0.5977, + "step": 40217 + }, + { + "epoch": 1.03, + "learning_rate": 1.5270492328601931e-06, + "loss": 0.7637, + "step": 40218 + }, + { + "epoch": 1.03, + "learning_rate": 1.5270257173450956e-06, + "loss": 0.5923, + "step": 40219 + }, + { + "epoch": 1.03, + "learning_rate": 1.5270022014264785e-06, + "loss": 0.6992, + "step": 40220 + }, + { + "epoch": 1.03, + "learning_rate": 1.5269786851043604e-06, + "loss": 0.6003, + "step": 40221 + }, + { + "epoch": 1.03, + "learning_rate": 1.5269551683787586e-06, + "loss": 0.7041, + "step": 40222 + }, + { + "epoch": 1.03, + "learning_rate": 1.5269316512496916e-06, + "loss": 0.6816, + "step": 40223 + }, + { + "epoch": 1.03, + "learning_rate": 1.5269081337171772e-06, + "loss": 0.7109, + "step": 40224 + }, + { + "epoch": 1.03, + "learning_rate": 1.5268846157812337e-06, + "loss": 0.5659, + "step": 40225 + }, + { + "epoch": 1.03, + "learning_rate": 1.5268610974418788e-06, + "loss": 0.5107, + "step": 40226 + }, + { + "epoch": 1.03, + "learning_rate": 1.5268375786991303e-06, + "loss": 0.8135, + "step": 40227 + }, + { + "epoch": 1.03, + "learning_rate": 1.5268140595530069e-06, + "loss": 0.7715, + "step": 40228 + }, + { + "epoch": 1.03, + "learning_rate": 1.526790540003526e-06, + "loss": 0.5854, + "step": 40229 + }, + { + "epoch": 1.03, + "learning_rate": 1.5267670200507055e-06, + "loss": 0.7969, + "step": 40230 + }, + { + "epoch": 1.03, + "learning_rate": 1.5267434996945643e-06, + "loss": 0.8135, + "step": 40231 + }, + { + "epoch": 1.03, + "learning_rate": 1.5267199789351195e-06, + "loss": 0.7178, + "step": 40232 + }, + { + "epoch": 1.03, + "learning_rate": 1.5266964577723895e-06, + "loss": 0.7544, + "step": 40233 + }, + { + "epoch": 1.03, + "learning_rate": 1.5266729362063919e-06, + "loss": 0.6104, + "step": 40234 + }, + { + "epoch": 1.03, + "learning_rate": 1.5266494142371455e-06, + "loss": 0.4678, + "step": 40235 + }, + { + "epoch": 1.03, + "learning_rate": 1.5266258918646677e-06, + "loss": 0.7207, + "step": 40236 + }, + { + "epoch": 1.03, + "learning_rate": 1.5266023690889767e-06, + "loss": 0.5845, + "step": 40237 + }, + { + "epoch": 1.03, + "learning_rate": 1.5265788459100905e-06, + "loss": 0.5396, + "step": 40238 + }, + { + "epoch": 1.03, + "learning_rate": 1.526555322328027e-06, + "loss": 0.7246, + "step": 40239 + }, + { + "epoch": 1.03, + "learning_rate": 1.5265317983428042e-06, + "loss": 0.4397, + "step": 40240 + }, + { + "epoch": 1.03, + "learning_rate": 1.5265082739544405e-06, + "loss": 0.3918, + "step": 40241 + }, + { + "epoch": 1.03, + "learning_rate": 1.5264847491629536e-06, + "loss": 0.6133, + "step": 40242 + }, + { + "epoch": 1.03, + "learning_rate": 1.5264612239683615e-06, + "loss": 0.7148, + "step": 40243 + }, + { + "epoch": 1.03, + "learning_rate": 1.5264376983706822e-06, + "loss": 0.541, + "step": 40244 + }, + { + "epoch": 1.03, + "learning_rate": 1.5264141723699337e-06, + "loss": 0.6196, + "step": 40245 + }, + { + "epoch": 1.03, + "learning_rate": 1.526390645966134e-06, + "loss": 0.7207, + "step": 40246 + }, + { + "epoch": 1.03, + "learning_rate": 1.5263671191593012e-06, + "loss": 0.6348, + "step": 40247 + }, + { + "epoch": 1.03, + "learning_rate": 1.5263435919494536e-06, + "loss": 0.7075, + "step": 40248 + }, + { + "epoch": 1.03, + "learning_rate": 1.5263200643366086e-06, + "loss": 0.7871, + "step": 40249 + }, + { + "epoch": 1.03, + "learning_rate": 1.5262965363207845e-06, + "loss": 0.666, + "step": 40250 + }, + { + "epoch": 1.03, + "learning_rate": 1.5262730079019996e-06, + "loss": 0.4595, + "step": 40251 + }, + { + "epoch": 1.03, + "learning_rate": 1.5262494790802715e-06, + "loss": 0.7446, + "step": 40252 + }, + { + "epoch": 1.03, + "learning_rate": 1.5262259498556182e-06, + "loss": 0.4453, + "step": 40253 + }, + { + "epoch": 1.03, + "learning_rate": 1.5262024202280583e-06, + "loss": 0.5679, + "step": 40254 + }, + { + "epoch": 1.03, + "learning_rate": 1.5261788901976092e-06, + "loss": 0.5522, + "step": 40255 + }, + { + "epoch": 1.03, + "learning_rate": 1.5261553597642891e-06, + "loss": 0.7969, + "step": 40256 + }, + { + "epoch": 1.03, + "learning_rate": 1.5261318289281162e-06, + "loss": 0.7344, + "step": 40257 + }, + { + "epoch": 1.03, + "learning_rate": 1.5261082976891081e-06, + "loss": 0.6357, + "step": 40258 + }, + { + "epoch": 1.03, + "learning_rate": 1.5260847660472832e-06, + "loss": 0.7212, + "step": 40259 + }, + { + "epoch": 1.03, + "learning_rate": 1.5260612340026593e-06, + "loss": 0.6001, + "step": 40260 + }, + { + "epoch": 1.03, + "learning_rate": 1.5260377015552546e-06, + "loss": 0.5586, + "step": 40261 + }, + { + "epoch": 1.03, + "learning_rate": 1.5260141687050872e-06, + "loss": 0.6738, + "step": 40262 + }, + { + "epoch": 1.03, + "learning_rate": 1.5259906354521745e-06, + "loss": 0.7373, + "step": 40263 + }, + { + "epoch": 1.03, + "learning_rate": 1.5259671017965352e-06, + "loss": 0.5457, + "step": 40264 + }, + { + "epoch": 1.03, + "learning_rate": 1.525943567738187e-06, + "loss": 0.5225, + "step": 40265 + }, + { + "epoch": 1.03, + "learning_rate": 1.5259200332771477e-06, + "loss": 0.6738, + "step": 40266 + }, + { + "epoch": 1.03, + "learning_rate": 1.5258964984134362e-06, + "loss": 0.603, + "step": 40267 + }, + { + "epoch": 1.03, + "learning_rate": 1.5258729631470696e-06, + "loss": 0.7588, + "step": 40268 + }, + { + "epoch": 1.03, + "learning_rate": 1.5258494274780664e-06, + "loss": 0.5657, + "step": 40269 + }, + { + "epoch": 1.03, + "learning_rate": 1.5258258914064444e-06, + "loss": 0.6143, + "step": 40270 + }, + { + "epoch": 1.03, + "learning_rate": 1.525802354932222e-06, + "loss": 0.6338, + "step": 40271 + }, + { + "epoch": 1.03, + "learning_rate": 1.5257788180554164e-06, + "loss": 0.5596, + "step": 40272 + }, + { + "epoch": 1.03, + "learning_rate": 1.5257552807760463e-06, + "loss": 0.5576, + "step": 40273 + }, + { + "epoch": 1.03, + "learning_rate": 1.5257317430941294e-06, + "loss": 0.5352, + "step": 40274 + }, + { + "epoch": 1.03, + "learning_rate": 1.5257082050096842e-06, + "loss": 0.7744, + "step": 40275 + }, + { + "epoch": 1.03, + "learning_rate": 1.5256846665227283e-06, + "loss": 0.5674, + "step": 40276 + }, + { + "epoch": 1.03, + "learning_rate": 1.5256611276332797e-06, + "loss": 0.7041, + "step": 40277 + }, + { + "epoch": 1.03, + "learning_rate": 1.5256375883413566e-06, + "loss": 0.4795, + "step": 40278 + }, + { + "epoch": 1.03, + "learning_rate": 1.525614048646977e-06, + "loss": 0.5117, + "step": 40279 + }, + { + "epoch": 1.03, + "learning_rate": 1.525590508550159e-06, + "loss": 0.5342, + "step": 40280 + }, + { + "epoch": 1.03, + "learning_rate": 1.5255669680509207e-06, + "loss": 0.7861, + "step": 40281 + }, + { + "epoch": 1.03, + "learning_rate": 1.5255434271492795e-06, + "loss": 0.6157, + "step": 40282 + }, + { + "epoch": 1.03, + "learning_rate": 1.525519885845254e-06, + "loss": 0.7637, + "step": 40283 + }, + { + "epoch": 1.03, + "learning_rate": 1.5254963441388623e-06, + "loss": 0.5264, + "step": 40284 + }, + { + "epoch": 1.03, + "learning_rate": 1.525472802030122e-06, + "loss": 0.7969, + "step": 40285 + }, + { + "epoch": 1.03, + "learning_rate": 1.525449259519051e-06, + "loss": 0.6885, + "step": 40286 + }, + { + "epoch": 1.03, + "learning_rate": 1.5254257166056683e-06, + "loss": 0.6055, + "step": 40287 + }, + { + "epoch": 1.03, + "learning_rate": 1.5254021732899908e-06, + "loss": 0.5337, + "step": 40288 + }, + { + "epoch": 1.03, + "learning_rate": 1.5253786295720373e-06, + "loss": 0.5103, + "step": 40289 + }, + { + "epoch": 1.03, + "learning_rate": 1.5253550854518254e-06, + "loss": 0.6118, + "step": 40290 + }, + { + "epoch": 1.03, + "learning_rate": 1.5253315409293735e-06, + "loss": 0.6953, + "step": 40291 + }, + { + "epoch": 1.03, + "learning_rate": 1.5253079960046994e-06, + "loss": 0.6436, + "step": 40292 + }, + { + "epoch": 1.03, + "learning_rate": 1.525284450677821e-06, + "loss": 0.5806, + "step": 40293 + }, + { + "epoch": 1.03, + "learning_rate": 1.5252609049487562e-06, + "loss": 0.6138, + "step": 40294 + }, + { + "epoch": 1.03, + "learning_rate": 1.5252373588175234e-06, + "loss": 0.54, + "step": 40295 + }, + { + "epoch": 1.03, + "learning_rate": 1.5252138122841407e-06, + "loss": 0.7461, + "step": 40296 + }, + { + "epoch": 1.03, + "learning_rate": 1.5251902653486258e-06, + "loss": 0.6733, + "step": 40297 + }, + { + "epoch": 1.03, + "learning_rate": 1.5251667180109968e-06, + "loss": 0.6885, + "step": 40298 + }, + { + "epoch": 1.03, + "learning_rate": 1.5251431702712717e-06, + "loss": 0.7227, + "step": 40299 + }, + { + "epoch": 1.03, + "learning_rate": 1.5251196221294688e-06, + "loss": 0.7637, + "step": 40300 + }, + { + "epoch": 1.03, + "learning_rate": 1.5250960735856062e-06, + "loss": 0.7246, + "step": 40301 + }, + { + "epoch": 1.03, + "learning_rate": 1.5250725246397016e-06, + "loss": 0.5972, + "step": 40302 + }, + { + "epoch": 1.03, + "learning_rate": 1.5250489752917725e-06, + "loss": 0.6389, + "step": 40303 + }, + { + "epoch": 1.03, + "learning_rate": 1.5250254255418383e-06, + "loss": 0.5925, + "step": 40304 + }, + { + "epoch": 1.03, + "learning_rate": 1.5250018753899157e-06, + "loss": 0.7173, + "step": 40305 + }, + { + "epoch": 1.03, + "learning_rate": 1.5249783248360238e-06, + "loss": 0.8154, + "step": 40306 + }, + { + "epoch": 1.03, + "learning_rate": 1.5249547738801798e-06, + "loss": 0.6221, + "step": 40307 + }, + { + "epoch": 1.03, + "learning_rate": 1.5249312225224022e-06, + "loss": 0.751, + "step": 40308 + }, + { + "epoch": 1.03, + "learning_rate": 1.5249076707627086e-06, + "loss": 0.6816, + "step": 40309 + }, + { + "epoch": 1.03, + "learning_rate": 1.5248841186011179e-06, + "loss": 0.5701, + "step": 40310 + }, + { + "epoch": 1.03, + "learning_rate": 1.5248605660376473e-06, + "loss": 0.71, + "step": 40311 + }, + { + "epoch": 1.03, + "learning_rate": 1.524837013072315e-06, + "loss": 0.7207, + "step": 40312 + }, + { + "epoch": 1.03, + "learning_rate": 1.5248134597051393e-06, + "loss": 0.7822, + "step": 40313 + }, + { + "epoch": 1.03, + "learning_rate": 1.5247899059361378e-06, + "loss": 0.6758, + "step": 40314 + }, + { + "epoch": 1.03, + "learning_rate": 1.5247663517653288e-06, + "loss": 0.7402, + "step": 40315 + }, + { + "epoch": 1.03, + "learning_rate": 1.5247427971927306e-06, + "loss": 0.6343, + "step": 40316 + }, + { + "epoch": 1.03, + "learning_rate": 1.524719242218361e-06, + "loss": 0.7012, + "step": 40317 + }, + { + "epoch": 1.03, + "learning_rate": 1.5246956868422377e-06, + "loss": 0.7842, + "step": 40318 + }, + { + "epoch": 1.03, + "learning_rate": 1.5246721310643792e-06, + "loss": 0.4756, + "step": 40319 + }, + { + "epoch": 1.03, + "learning_rate": 1.5246485748848032e-06, + "loss": 0.79, + "step": 40320 + }, + { + "epoch": 1.03, + "learning_rate": 1.5246250183035282e-06, + "loss": 0.7021, + "step": 40321 + }, + { + "epoch": 1.03, + "learning_rate": 1.524601461320572e-06, + "loss": 0.4829, + "step": 40322 + }, + { + "epoch": 1.03, + "learning_rate": 1.5245779039359523e-06, + "loss": 0.8398, + "step": 40323 + }, + { + "epoch": 1.03, + "learning_rate": 1.5245543461496874e-06, + "loss": 0.668, + "step": 40324 + }, + { + "epoch": 1.03, + "learning_rate": 1.5245307879617957e-06, + "loss": 0.4725, + "step": 40325 + }, + { + "epoch": 1.03, + "learning_rate": 1.5245072293722947e-06, + "loss": 0.6436, + "step": 40326 + }, + { + "epoch": 1.03, + "learning_rate": 1.5244836703812025e-06, + "loss": 0.6104, + "step": 40327 + }, + { + "epoch": 1.03, + "learning_rate": 1.5244601109885373e-06, + "loss": 0.5908, + "step": 40328 + }, + { + "epoch": 1.03, + "learning_rate": 1.5244365511943173e-06, + "loss": 0.6895, + "step": 40329 + }, + { + "epoch": 1.03, + "learning_rate": 1.5244129909985604e-06, + "loss": 0.6528, + "step": 40330 + }, + { + "epoch": 1.03, + "learning_rate": 1.5243894304012841e-06, + "loss": 0.5469, + "step": 40331 + }, + { + "epoch": 1.03, + "learning_rate": 1.5243658694025074e-06, + "loss": 0.5938, + "step": 40332 + }, + { + "epoch": 1.03, + "learning_rate": 1.5243423080022475e-06, + "loss": 0.71, + "step": 40333 + }, + { + "epoch": 1.03, + "learning_rate": 1.5243187462005232e-06, + "loss": 0.6094, + "step": 40334 + }, + { + "epoch": 1.03, + "learning_rate": 1.5242951839973518e-06, + "loss": 0.4534, + "step": 40335 + }, + { + "epoch": 1.03, + "learning_rate": 1.524271621392752e-06, + "loss": 0.5657, + "step": 40336 + }, + { + "epoch": 1.03, + "learning_rate": 1.5242480583867415e-06, + "loss": 0.5425, + "step": 40337 + }, + { + "epoch": 1.03, + "learning_rate": 1.524224494979338e-06, + "loss": 0.7715, + "step": 40338 + }, + { + "epoch": 1.03, + "learning_rate": 1.52420093117056e-06, + "loss": 0.5151, + "step": 40339 + }, + { + "epoch": 1.03, + "learning_rate": 1.524177366960426e-06, + "loss": 0.4988, + "step": 40340 + }, + { + "epoch": 1.03, + "learning_rate": 1.524153802348953e-06, + "loss": 0.5723, + "step": 40341 + }, + { + "epoch": 1.03, + "learning_rate": 1.5241302373361597e-06, + "loss": 0.7637, + "step": 40342 + }, + { + "epoch": 1.03, + "learning_rate": 1.5241066719220639e-06, + "loss": 0.7871, + "step": 40343 + }, + { + "epoch": 1.03, + "learning_rate": 1.5240831061066837e-06, + "loss": 0.7754, + "step": 40344 + }, + { + "epoch": 1.03, + "learning_rate": 1.5240595398900373e-06, + "loss": 0.8291, + "step": 40345 + }, + { + "epoch": 1.03, + "learning_rate": 1.5240359732721425e-06, + "loss": 0.5913, + "step": 40346 + }, + { + "epoch": 1.03, + "learning_rate": 1.5240124062530173e-06, + "loss": 0.6699, + "step": 40347 + }, + { + "epoch": 1.03, + "learning_rate": 1.5239888388326803e-06, + "loss": 0.5947, + "step": 40348 + }, + { + "epoch": 1.03, + "learning_rate": 1.5239652710111485e-06, + "loss": 0.5684, + "step": 40349 + }, + { + "epoch": 1.03, + "learning_rate": 1.5239417027884411e-06, + "loss": 0.8799, + "step": 40350 + }, + { + "epoch": 1.03, + "learning_rate": 1.5239181341645754e-06, + "loss": 0.7676, + "step": 40351 + }, + { + "epoch": 1.03, + "learning_rate": 1.52389456513957e-06, + "loss": 0.541, + "step": 40352 + }, + { + "epoch": 1.03, + "learning_rate": 1.5238709957134424e-06, + "loss": 0.6797, + "step": 40353 + }, + { + "epoch": 1.03, + "learning_rate": 1.5238474258862107e-06, + "loss": 0.5947, + "step": 40354 + }, + { + "epoch": 1.03, + "learning_rate": 1.5238238556578934e-06, + "loss": 0.5814, + "step": 40355 + }, + { + "epoch": 1.03, + "learning_rate": 1.523800285028508e-06, + "loss": 0.6206, + "step": 40356 + }, + { + "epoch": 1.03, + "learning_rate": 1.5237767139980732e-06, + "loss": 0.5498, + "step": 40357 + }, + { + "epoch": 1.03, + "learning_rate": 1.5237531425666062e-06, + "loss": 0.6699, + "step": 40358 + }, + { + "epoch": 1.03, + "learning_rate": 1.5237295707341256e-06, + "loss": 0.4746, + "step": 40359 + }, + { + "epoch": 1.03, + "learning_rate": 1.5237059985006495e-06, + "loss": 0.6567, + "step": 40360 + }, + { + "epoch": 1.03, + "learning_rate": 1.523682425866196e-06, + "loss": 0.6768, + "step": 40361 + }, + { + "epoch": 1.03, + "learning_rate": 1.5236588528307826e-06, + "loss": 0.6885, + "step": 40362 + }, + { + "epoch": 1.03, + "learning_rate": 1.5236352793944275e-06, + "loss": 0.6006, + "step": 40363 + }, + { + "epoch": 1.03, + "learning_rate": 1.5236117055571494e-06, + "loss": 0.6377, + "step": 40364 + }, + { + "epoch": 1.03, + "learning_rate": 1.5235881313189659e-06, + "loss": 0.5483, + "step": 40365 + }, + { + "epoch": 1.03, + "learning_rate": 1.5235645566798948e-06, + "loss": 0.8823, + "step": 40366 + }, + { + "epoch": 1.03, + "learning_rate": 1.5235409816399544e-06, + "loss": 0.6074, + "step": 40367 + }, + { + "epoch": 1.03, + "learning_rate": 1.5235174061991628e-06, + "loss": 0.7422, + "step": 40368 + }, + { + "epoch": 1.03, + "learning_rate": 1.523493830357538e-06, + "loss": 0.4232, + "step": 40369 + }, + { + "epoch": 1.03, + "learning_rate": 1.5234702541150978e-06, + "loss": 0.7109, + "step": 40370 + }, + { + "epoch": 1.03, + "learning_rate": 1.523446677471861e-06, + "loss": 0.6235, + "step": 40371 + }, + { + "epoch": 1.03, + "learning_rate": 1.5234231004278449e-06, + "loss": 0.7852, + "step": 40372 + }, + { + "epoch": 1.03, + "learning_rate": 1.5233995229830678e-06, + "loss": 0.6987, + "step": 40373 + }, + { + "epoch": 1.03, + "learning_rate": 1.5233759451375473e-06, + "loss": 0.4094, + "step": 40374 + }, + { + "epoch": 1.03, + "learning_rate": 1.5233523668913026e-06, + "loss": 0.5972, + "step": 40375 + }, + { + "epoch": 1.03, + "learning_rate": 1.523328788244351e-06, + "loss": 0.7012, + "step": 40376 + }, + { + "epoch": 1.03, + "learning_rate": 1.5233052091967103e-06, + "loss": 0.5234, + "step": 40377 + }, + { + "epoch": 1.03, + "learning_rate": 1.523281629748399e-06, + "loss": 0.644, + "step": 40378 + }, + { + "epoch": 1.03, + "learning_rate": 1.5232580498994347e-06, + "loss": 0.6631, + "step": 40379 + }, + { + "epoch": 1.03, + "learning_rate": 1.5232344696498363e-06, + "loss": 0.6074, + "step": 40380 + }, + { + "epoch": 1.03, + "learning_rate": 1.523210888999621e-06, + "loss": 0.4011, + "step": 40381 + }, + { + "epoch": 1.04, + "learning_rate": 1.5231873079488074e-06, + "loss": 0.5046, + "step": 40382 + }, + { + "epoch": 1.04, + "learning_rate": 1.5231637264974131e-06, + "loss": 0.6401, + "step": 40383 + }, + { + "epoch": 1.04, + "learning_rate": 1.5231401446454567e-06, + "loss": 0.7139, + "step": 40384 + }, + { + "epoch": 1.04, + "learning_rate": 1.5231165623929555e-06, + "loss": 0.5261, + "step": 40385 + }, + { + "epoch": 1.04, + "learning_rate": 1.5230929797399283e-06, + "loss": 0.6899, + "step": 40386 + }, + { + "epoch": 1.04, + "learning_rate": 1.5230693966863925e-06, + "loss": 0.6279, + "step": 40387 + }, + { + "epoch": 1.04, + "learning_rate": 1.5230458132323669e-06, + "loss": 0.6777, + "step": 40388 + }, + { + "epoch": 1.04, + "learning_rate": 1.5230222293778692e-06, + "loss": 0.627, + "step": 40389 + }, + { + "epoch": 1.04, + "learning_rate": 1.5229986451229175e-06, + "loss": 0.5352, + "step": 40390 + }, + { + "epoch": 1.04, + "learning_rate": 1.5229750604675294e-06, + "loss": 0.7959, + "step": 40391 + }, + { + "epoch": 1.04, + "learning_rate": 1.5229514754117236e-06, + "loss": 0.6255, + "step": 40392 + }, + { + "epoch": 1.04, + "learning_rate": 1.5229278899555179e-06, + "loss": 0.6455, + "step": 40393 + }, + { + "epoch": 1.04, + "learning_rate": 1.5229043040989303e-06, + "loss": 0.6836, + "step": 40394 + }, + { + "epoch": 1.04, + "learning_rate": 1.522880717841979e-06, + "loss": 0.6016, + "step": 40395 + }, + { + "epoch": 1.04, + "learning_rate": 1.5228571311846817e-06, + "loss": 0.6416, + "step": 40396 + }, + { + "epoch": 1.04, + "learning_rate": 1.522833544127057e-06, + "loss": 0.5962, + "step": 40397 + }, + { + "epoch": 1.04, + "learning_rate": 1.5228099566691225e-06, + "loss": 0.6313, + "step": 40398 + }, + { + "epoch": 1.04, + "learning_rate": 1.5227863688108966e-06, + "loss": 0.7266, + "step": 40399 + }, + { + "epoch": 1.04, + "learning_rate": 1.5227627805523973e-06, + "loss": 0.6001, + "step": 40400 + }, + { + "epoch": 1.04, + "learning_rate": 1.5227391918936424e-06, + "loss": 0.5508, + "step": 40401 + }, + { + "epoch": 1.04, + "learning_rate": 1.52271560283465e-06, + "loss": 0.8496, + "step": 40402 + }, + { + "epoch": 1.04, + "learning_rate": 1.5226920133754387e-06, + "loss": 0.7344, + "step": 40403 + }, + { + "epoch": 1.04, + "learning_rate": 1.5226684235160258e-06, + "loss": 0.79, + "step": 40404 + }, + { + "epoch": 1.04, + "learning_rate": 1.52264483325643e-06, + "loss": 0.7139, + "step": 40405 + }, + { + "epoch": 1.04, + "learning_rate": 1.5226212425966689e-06, + "loss": 0.626, + "step": 40406 + }, + { + "epoch": 1.04, + "learning_rate": 1.522597651536761e-06, + "loss": 0.8154, + "step": 40407 + }, + { + "epoch": 1.04, + "learning_rate": 1.5225740600767238e-06, + "loss": 0.6572, + "step": 40408 + }, + { + "epoch": 1.04, + "learning_rate": 1.5225504682165759e-06, + "loss": 0.6587, + "step": 40409 + }, + { + "epoch": 1.04, + "learning_rate": 1.522526875956335e-06, + "loss": 0.5928, + "step": 40410 + }, + { + "epoch": 1.04, + "learning_rate": 1.5225032832960194e-06, + "loss": 0.6729, + "step": 40411 + }, + { + "epoch": 1.04, + "learning_rate": 1.522479690235647e-06, + "loss": 0.604, + "step": 40412 + }, + { + "epoch": 1.04, + "learning_rate": 1.5224560967752357e-06, + "loss": 0.5864, + "step": 40413 + }, + { + "epoch": 1.04, + "learning_rate": 1.5224325029148042e-06, + "loss": 0.709, + "step": 40414 + }, + { + "epoch": 1.04, + "learning_rate": 1.5224089086543702e-06, + "loss": 0.5889, + "step": 40415 + }, + { + "epoch": 1.04, + "learning_rate": 1.522385313993951e-06, + "loss": 0.6445, + "step": 40416 + }, + { + "epoch": 1.04, + "learning_rate": 1.5223617189335661e-06, + "loss": 0.7227, + "step": 40417 + }, + { + "epoch": 1.04, + "learning_rate": 1.5223381234732324e-06, + "loss": 0.7354, + "step": 40418 + }, + { + "epoch": 1.04, + "learning_rate": 1.522314527612969e-06, + "loss": 0.5986, + "step": 40419 + }, + { + "epoch": 1.04, + "learning_rate": 1.5222909313527929e-06, + "loss": 0.6914, + "step": 40420 + }, + { + "epoch": 1.04, + "learning_rate": 1.5222673346927227e-06, + "loss": 0.752, + "step": 40421 + }, + { + "epoch": 1.04, + "learning_rate": 1.5222437376327766e-06, + "loss": 0.5867, + "step": 40422 + }, + { + "epoch": 1.04, + "learning_rate": 1.5222201401729722e-06, + "loss": 0.793, + "step": 40423 + }, + { + "epoch": 1.04, + "learning_rate": 1.522196542313328e-06, + "loss": 0.5144, + "step": 40424 + }, + { + "epoch": 1.04, + "learning_rate": 1.5221729440538619e-06, + "loss": 0.583, + "step": 40425 + }, + { + "epoch": 1.04, + "learning_rate": 1.5221493453945922e-06, + "loss": 0.6421, + "step": 40426 + }, + { + "epoch": 1.04, + "learning_rate": 1.5221257463355364e-06, + "loss": 0.748, + "step": 40427 + }, + { + "epoch": 1.04, + "learning_rate": 1.5221021468767131e-06, + "loss": 0.6304, + "step": 40428 + }, + { + "epoch": 1.04, + "learning_rate": 1.52207854701814e-06, + "loss": 0.6172, + "step": 40429 + }, + { + "epoch": 1.04, + "learning_rate": 1.522054946759836e-06, + "loss": 0.6213, + "step": 40430 + }, + { + "epoch": 1.04, + "learning_rate": 1.522031346101818e-06, + "loss": 0.5044, + "step": 40431 + }, + { + "epoch": 1.04, + "learning_rate": 1.5220077450441044e-06, + "loss": 0.7559, + "step": 40432 + }, + { + "epoch": 1.04, + "learning_rate": 1.5219841435867139e-06, + "loss": 0.6606, + "step": 40433 + }, + { + "epoch": 1.04, + "learning_rate": 1.5219605417296642e-06, + "loss": 0.8555, + "step": 40434 + }, + { + "epoch": 1.04, + "learning_rate": 1.5219369394729729e-06, + "loss": 0.8516, + "step": 40435 + }, + { + "epoch": 1.04, + "learning_rate": 1.521913336816659e-06, + "loss": 0.6143, + "step": 40436 + }, + { + "epoch": 1.04, + "learning_rate": 1.5218897337607395e-06, + "loss": 0.4189, + "step": 40437 + }, + { + "epoch": 1.04, + "learning_rate": 1.5218661303052334e-06, + "loss": 0.7725, + "step": 40438 + }, + { + "epoch": 1.04, + "learning_rate": 1.521842526450158e-06, + "loss": 0.6233, + "step": 40439 + }, + { + "epoch": 1.04, + "learning_rate": 1.5218189221955323e-06, + "loss": 0.5842, + "step": 40440 + }, + { + "epoch": 1.04, + "learning_rate": 1.5217953175413735e-06, + "loss": 0.7676, + "step": 40441 + }, + { + "epoch": 1.04, + "learning_rate": 1.5217717124877e-06, + "loss": 0.7979, + "step": 40442 + }, + { + "epoch": 1.04, + "learning_rate": 1.5217481070345302e-06, + "loss": 0.6738, + "step": 40443 + }, + { + "epoch": 1.04, + "learning_rate": 1.5217245011818815e-06, + "loss": 0.7178, + "step": 40444 + }, + { + "epoch": 1.04, + "learning_rate": 1.5217008949297726e-06, + "loss": 0.7837, + "step": 40445 + }, + { + "epoch": 1.04, + "learning_rate": 1.5216772882782213e-06, + "loss": 0.5835, + "step": 40446 + }, + { + "epoch": 1.04, + "learning_rate": 1.5216536812272456e-06, + "loss": 0.6338, + "step": 40447 + }, + { + "epoch": 1.04, + "learning_rate": 1.5216300737768638e-06, + "loss": 0.7324, + "step": 40448 + }, + { + "epoch": 1.04, + "learning_rate": 1.5216064659270935e-06, + "loss": 0.6895, + "step": 40449 + }, + { + "epoch": 1.04, + "learning_rate": 1.5215828576779535e-06, + "loss": 0.8125, + "step": 40450 + }, + { + "epoch": 1.04, + "learning_rate": 1.5215592490294613e-06, + "loss": 0.7451, + "step": 40451 + }, + { + "epoch": 1.04, + "learning_rate": 1.5215356399816351e-06, + "loss": 0.6187, + "step": 40452 + }, + { + "epoch": 1.04, + "learning_rate": 1.521512030534493e-06, + "loss": 0.6387, + "step": 40453 + }, + { + "epoch": 1.04, + "learning_rate": 1.5214884206880534e-06, + "loss": 0.5664, + "step": 40454 + }, + { + "epoch": 1.04, + "learning_rate": 1.521464810442334e-06, + "loss": 0.603, + "step": 40455 + }, + { + "epoch": 1.04, + "learning_rate": 1.5214411997973528e-06, + "loss": 0.7222, + "step": 40456 + }, + { + "epoch": 1.04, + "learning_rate": 1.5214175887531283e-06, + "loss": 0.5889, + "step": 40457 + }, + { + "epoch": 1.04, + "learning_rate": 1.521393977309678e-06, + "loss": 0.5972, + "step": 40458 + }, + { + "epoch": 1.04, + "learning_rate": 1.5213703654670206e-06, + "loss": 0.6072, + "step": 40459 + }, + { + "epoch": 1.04, + "learning_rate": 1.5213467532251738e-06, + "loss": 0.7725, + "step": 40460 + }, + { + "epoch": 1.04, + "learning_rate": 1.5213231405841559e-06, + "loss": 0.668, + "step": 40461 + }, + { + "epoch": 1.04, + "learning_rate": 1.5212995275439843e-06, + "loss": 0.584, + "step": 40462 + }, + { + "epoch": 1.04, + "learning_rate": 1.5212759141046783e-06, + "loss": 0.6094, + "step": 40463 + }, + { + "epoch": 1.04, + "learning_rate": 1.521252300266255e-06, + "loss": 0.5981, + "step": 40464 + }, + { + "epoch": 1.04, + "learning_rate": 1.5212286860287326e-06, + "loss": 0.7305, + "step": 40465 + }, + { + "epoch": 1.04, + "learning_rate": 1.5212050713921297e-06, + "loss": 0.8506, + "step": 40466 + }, + { + "epoch": 1.04, + "learning_rate": 1.5211814563564639e-06, + "loss": 0.8486, + "step": 40467 + }, + { + "epoch": 1.04, + "learning_rate": 1.5211578409217534e-06, + "loss": 0.7109, + "step": 40468 + }, + { + "epoch": 1.04, + "learning_rate": 1.5211342250880161e-06, + "loss": 0.8027, + "step": 40469 + }, + { + "epoch": 1.04, + "learning_rate": 1.5211106088552708e-06, + "loss": 0.6729, + "step": 40470 + }, + { + "epoch": 1.04, + "learning_rate": 1.5210869922235347e-06, + "loss": 0.5884, + "step": 40471 + }, + { + "epoch": 1.04, + "learning_rate": 1.5210633751928264e-06, + "loss": 0.6777, + "step": 40472 + }, + { + "epoch": 1.04, + "learning_rate": 1.5210397577631636e-06, + "loss": 0.4399, + "step": 40473 + }, + { + "epoch": 1.04, + "learning_rate": 1.5210161399345646e-06, + "loss": 0.7061, + "step": 40474 + }, + { + "epoch": 1.04, + "learning_rate": 1.5209925217070478e-06, + "loss": 0.748, + "step": 40475 + }, + { + "epoch": 1.04, + "learning_rate": 1.520968903080631e-06, + "loss": 0.5837, + "step": 40476 + }, + { + "epoch": 1.04, + "learning_rate": 1.5209452840553319e-06, + "loss": 0.6499, + "step": 40477 + }, + { + "epoch": 1.04, + "learning_rate": 1.5209216646311693e-06, + "loss": 0.6855, + "step": 40478 + }, + { + "epoch": 1.04, + "learning_rate": 1.5208980448081607e-06, + "loss": 0.5562, + "step": 40479 + }, + { + "epoch": 1.04, + "learning_rate": 1.5208744245863248e-06, + "loss": 0.6074, + "step": 40480 + }, + { + "epoch": 1.04, + "learning_rate": 1.5208508039656788e-06, + "loss": 0.7148, + "step": 40481 + }, + { + "epoch": 1.04, + "learning_rate": 1.5208271829462417e-06, + "loss": 0.6978, + "step": 40482 + }, + { + "epoch": 1.04, + "learning_rate": 1.5208035615280308e-06, + "loss": 0.6479, + "step": 40483 + }, + { + "epoch": 1.04, + "learning_rate": 1.5207799397110648e-06, + "loss": 0.71, + "step": 40484 + }, + { + "epoch": 1.04, + "learning_rate": 1.5207563174953615e-06, + "loss": 0.6284, + "step": 40485 + }, + { + "epoch": 1.04, + "learning_rate": 1.5207326948809392e-06, + "loss": 0.5625, + "step": 40486 + }, + { + "epoch": 1.04, + "learning_rate": 1.5207090718678154e-06, + "loss": 0.6055, + "step": 40487 + }, + { + "epoch": 1.04, + "learning_rate": 1.520685448456009e-06, + "loss": 0.7305, + "step": 40488 + }, + { + "epoch": 1.04, + "learning_rate": 1.5206618246455375e-06, + "loss": 0.5854, + "step": 40489 + }, + { + "epoch": 1.04, + "learning_rate": 1.5206382004364193e-06, + "loss": 0.6509, + "step": 40490 + }, + { + "epoch": 1.04, + "learning_rate": 1.5206145758286724e-06, + "loss": 0.386, + "step": 40491 + }, + { + "epoch": 1.04, + "learning_rate": 1.5205909508223145e-06, + "loss": 0.7158, + "step": 40492 + }, + { + "epoch": 1.04, + "learning_rate": 1.5205673254173643e-06, + "loss": 0.8535, + "step": 40493 + }, + { + "epoch": 1.04, + "learning_rate": 1.5205436996138396e-06, + "loss": 0.5479, + "step": 40494 + }, + { + "epoch": 1.04, + "learning_rate": 1.5205200734117588e-06, + "loss": 0.7324, + "step": 40495 + }, + { + "epoch": 1.04, + "learning_rate": 1.5204964468111392e-06, + "loss": 0.563, + "step": 40496 + }, + { + "epoch": 1.04, + "learning_rate": 1.5204728198119997e-06, + "loss": 0.585, + "step": 40497 + }, + { + "epoch": 1.04, + "learning_rate": 1.5204491924143582e-06, + "loss": 0.6235, + "step": 40498 + }, + { + "epoch": 1.04, + "learning_rate": 1.5204255646182325e-06, + "loss": 0.6855, + "step": 40499 + }, + { + "epoch": 1.04, + "learning_rate": 1.520401936423641e-06, + "loss": 0.6653, + "step": 40500 + }, + { + "epoch": 1.04, + "learning_rate": 1.5203783078306018e-06, + "loss": 0.543, + "step": 40501 + }, + { + "epoch": 1.04, + "learning_rate": 1.5203546788391325e-06, + "loss": 0.5723, + "step": 40502 + }, + { + "epoch": 1.04, + "learning_rate": 1.5203310494492518e-06, + "loss": 0.5845, + "step": 40503 + }, + { + "epoch": 1.04, + "learning_rate": 1.5203074196609773e-06, + "loss": 0.7695, + "step": 40504 + }, + { + "epoch": 1.04, + "learning_rate": 1.5202837894743277e-06, + "loss": 0.6367, + "step": 40505 + }, + { + "epoch": 1.04, + "learning_rate": 1.5202601588893202e-06, + "loss": 0.7603, + "step": 40506 + }, + { + "epoch": 1.04, + "learning_rate": 1.5202365279059739e-06, + "loss": 0.8838, + "step": 40507 + }, + { + "epoch": 1.04, + "learning_rate": 1.5202128965243062e-06, + "loss": 0.4742, + "step": 40508 + }, + { + "epoch": 1.04, + "learning_rate": 1.5201892647443356e-06, + "loss": 0.7246, + "step": 40509 + }, + { + "epoch": 1.04, + "learning_rate": 1.5201656325660797e-06, + "loss": 0.8027, + "step": 40510 + }, + { + "epoch": 1.04, + "learning_rate": 1.520141999989557e-06, + "loss": 0.6396, + "step": 40511 + }, + { + "epoch": 1.04, + "learning_rate": 1.5201183670147855e-06, + "loss": 0.5498, + "step": 40512 + }, + { + "epoch": 1.04, + "learning_rate": 1.520094733641783e-06, + "loss": 0.7988, + "step": 40513 + }, + { + "epoch": 1.04, + "learning_rate": 1.5200710998705683e-06, + "loss": 0.708, + "step": 40514 + }, + { + "epoch": 1.04, + "learning_rate": 1.5200474657011592e-06, + "loss": 0.4792, + "step": 40515 + }, + { + "epoch": 1.04, + "learning_rate": 1.5200238311335733e-06, + "loss": 0.6484, + "step": 40516 + }, + { + "epoch": 1.04, + "learning_rate": 1.5200001961678291e-06, + "loss": 0.6699, + "step": 40517 + }, + { + "epoch": 1.04, + "learning_rate": 1.5199765608039447e-06, + "loss": 0.6582, + "step": 40518 + }, + { + "epoch": 1.04, + "learning_rate": 1.5199529250419384e-06, + "loss": 0.7158, + "step": 40519 + }, + { + "epoch": 1.04, + "learning_rate": 1.519929288881828e-06, + "loss": 0.4893, + "step": 40520 + }, + { + "epoch": 1.04, + "learning_rate": 1.5199056523236314e-06, + "loss": 0.6567, + "step": 40521 + }, + { + "epoch": 1.04, + "learning_rate": 1.519882015367367e-06, + "loss": 0.5781, + "step": 40522 + }, + { + "epoch": 1.04, + "learning_rate": 1.519858378013053e-06, + "loss": 0.7354, + "step": 40523 + }, + { + "epoch": 1.04, + "learning_rate": 1.5198347402607073e-06, + "loss": 0.5266, + "step": 40524 + }, + { + "epoch": 1.04, + "learning_rate": 1.519811102110348e-06, + "loss": 0.6797, + "step": 40525 + }, + { + "epoch": 1.04, + "learning_rate": 1.5197874635619932e-06, + "loss": 0.6914, + "step": 40526 + }, + { + "epoch": 1.04, + "learning_rate": 1.5197638246156607e-06, + "loss": 0.792, + "step": 40527 + }, + { + "epoch": 1.04, + "learning_rate": 1.5197401852713695e-06, + "loss": 0.5337, + "step": 40528 + }, + { + "epoch": 1.04, + "learning_rate": 1.5197165455291368e-06, + "loss": 0.6191, + "step": 40529 + }, + { + "epoch": 1.04, + "learning_rate": 1.5196929053889813e-06, + "loss": 0.6255, + "step": 40530 + }, + { + "epoch": 1.04, + "learning_rate": 1.5196692648509205e-06, + "loss": 0.4441, + "step": 40531 + }, + { + "epoch": 1.04, + "learning_rate": 1.5196456239149733e-06, + "loss": 0.6846, + "step": 40532 + }, + { + "epoch": 1.04, + "learning_rate": 1.519621982581157e-06, + "loss": 0.8418, + "step": 40533 + }, + { + "epoch": 1.04, + "learning_rate": 1.5195983408494901e-06, + "loss": 0.6123, + "step": 40534 + }, + { + "epoch": 1.04, + "learning_rate": 1.5195746987199909e-06, + "loss": 0.7637, + "step": 40535 + }, + { + "epoch": 1.04, + "learning_rate": 1.519551056192677e-06, + "loss": 0.6226, + "step": 40536 + }, + { + "epoch": 1.04, + "learning_rate": 1.5195274132675667e-06, + "loss": 0.8047, + "step": 40537 + }, + { + "epoch": 1.04, + "learning_rate": 1.519503769944678e-06, + "loss": 0.5977, + "step": 40538 + }, + { + "epoch": 1.04, + "learning_rate": 1.5194801262240296e-06, + "loss": 0.729, + "step": 40539 + }, + { + "epoch": 1.04, + "learning_rate": 1.519456482105639e-06, + "loss": 0.7217, + "step": 40540 + }, + { + "epoch": 1.04, + "learning_rate": 1.5194328375895244e-06, + "loss": 0.7568, + "step": 40541 + }, + { + "epoch": 1.04, + "learning_rate": 1.5194091926757037e-06, + "loss": 0.8535, + "step": 40542 + }, + { + "epoch": 1.04, + "learning_rate": 1.5193855473641954e-06, + "loss": 0.6567, + "step": 40543 + }, + { + "epoch": 1.04, + "learning_rate": 1.5193619016550175e-06, + "loss": 0.5603, + "step": 40544 + }, + { + "epoch": 1.04, + "learning_rate": 1.5193382555481887e-06, + "loss": 0.7842, + "step": 40545 + }, + { + "epoch": 1.04, + "learning_rate": 1.5193146090437257e-06, + "loss": 0.6572, + "step": 40546 + }, + { + "epoch": 1.04, + "learning_rate": 1.5192909621416477e-06, + "loss": 0.6709, + "step": 40547 + }, + { + "epoch": 1.04, + "learning_rate": 1.5192673148419722e-06, + "loss": 0.6309, + "step": 40548 + }, + { + "epoch": 1.04, + "learning_rate": 1.519243667144718e-06, + "loss": 0.6934, + "step": 40549 + }, + { + "epoch": 1.04, + "learning_rate": 1.5192200190499024e-06, + "loss": 0.6299, + "step": 40550 + }, + { + "epoch": 1.04, + "learning_rate": 1.5191963705575442e-06, + "loss": 0.6904, + "step": 40551 + }, + { + "epoch": 1.04, + "learning_rate": 1.5191727216676608e-06, + "loss": 0.5981, + "step": 40552 + }, + { + "epoch": 1.04, + "learning_rate": 1.5191490723802711e-06, + "loss": 0.5366, + "step": 40553 + }, + { + "epoch": 1.04, + "learning_rate": 1.5191254226953928e-06, + "loss": 0.8164, + "step": 40554 + }, + { + "epoch": 1.04, + "learning_rate": 1.5191017726130442e-06, + "loss": 0.6646, + "step": 40555 + }, + { + "epoch": 1.04, + "learning_rate": 1.519078122133243e-06, + "loss": 0.4154, + "step": 40556 + }, + { + "epoch": 1.04, + "learning_rate": 1.5190544712560073e-06, + "loss": 0.7529, + "step": 40557 + }, + { + "epoch": 1.04, + "learning_rate": 1.519030819981356e-06, + "loss": 0.8037, + "step": 40558 + }, + { + "epoch": 1.04, + "learning_rate": 1.5190071683093063e-06, + "loss": 0.7627, + "step": 40559 + }, + { + "epoch": 1.04, + "learning_rate": 1.5189835162398769e-06, + "loss": 0.5725, + "step": 40560 + }, + { + "epoch": 1.04, + "learning_rate": 1.5189598637730855e-06, + "loss": 0.4363, + "step": 40561 + }, + { + "epoch": 1.04, + "learning_rate": 1.5189362109089502e-06, + "loss": 0.7212, + "step": 40562 + }, + { + "epoch": 1.04, + "learning_rate": 1.5189125576474897e-06, + "loss": 0.8066, + "step": 40563 + }, + { + "epoch": 1.04, + "learning_rate": 1.5188889039887215e-06, + "loss": 0.5254, + "step": 40564 + }, + { + "epoch": 1.04, + "learning_rate": 1.5188652499326642e-06, + "loss": 0.6772, + "step": 40565 + }, + { + "epoch": 1.04, + "learning_rate": 1.5188415954793355e-06, + "loss": 0.7446, + "step": 40566 + }, + { + "epoch": 1.04, + "learning_rate": 1.5188179406287534e-06, + "loss": 0.6738, + "step": 40567 + }, + { + "epoch": 1.04, + "learning_rate": 1.5187942853809364e-06, + "loss": 0.5142, + "step": 40568 + }, + { + "epoch": 1.04, + "learning_rate": 1.5187706297359025e-06, + "loss": 0.5776, + "step": 40569 + }, + { + "epoch": 1.04, + "learning_rate": 1.51874697369367e-06, + "loss": 0.5347, + "step": 40570 + }, + { + "epoch": 1.04, + "learning_rate": 1.5187233172542564e-06, + "loss": 0.584, + "step": 40571 + }, + { + "epoch": 1.04, + "learning_rate": 1.5186996604176804e-06, + "loss": 0.7168, + "step": 40572 + }, + { + "epoch": 1.04, + "learning_rate": 1.51867600318396e-06, + "loss": 0.6387, + "step": 40573 + }, + { + "epoch": 1.04, + "learning_rate": 1.5186523455531131e-06, + "loss": 0.7197, + "step": 40574 + }, + { + "epoch": 1.04, + "learning_rate": 1.5186286875251582e-06, + "loss": 0.7529, + "step": 40575 + }, + { + "epoch": 1.04, + "learning_rate": 1.5186050291001126e-06, + "loss": 0.7148, + "step": 40576 + }, + { + "epoch": 1.04, + "learning_rate": 1.5185813702779955e-06, + "loss": 0.6631, + "step": 40577 + }, + { + "epoch": 1.04, + "learning_rate": 1.5185577110588243e-06, + "loss": 0.5537, + "step": 40578 + }, + { + "epoch": 1.04, + "learning_rate": 1.5185340514426172e-06, + "loss": 0.6113, + "step": 40579 + }, + { + "epoch": 1.04, + "learning_rate": 1.5185103914293926e-06, + "loss": 0.5679, + "step": 40580 + }, + { + "epoch": 1.04, + "learning_rate": 1.5184867310191686e-06, + "loss": 0.7261, + "step": 40581 + }, + { + "epoch": 1.04, + "learning_rate": 1.5184630702119628e-06, + "loss": 0.7031, + "step": 40582 + }, + { + "epoch": 1.04, + "learning_rate": 1.5184394090077936e-06, + "loss": 0.6582, + "step": 40583 + }, + { + "epoch": 1.04, + "learning_rate": 1.5184157474066794e-06, + "loss": 0.6929, + "step": 40584 + }, + { + "epoch": 1.04, + "learning_rate": 1.5183920854086383e-06, + "loss": 0.7725, + "step": 40585 + }, + { + "epoch": 1.04, + "learning_rate": 1.518368423013688e-06, + "loss": 0.709, + "step": 40586 + }, + { + "epoch": 1.04, + "learning_rate": 1.518344760221847e-06, + "loss": 0.7246, + "step": 40587 + }, + { + "epoch": 1.04, + "learning_rate": 1.5183210970331329e-06, + "loss": 0.8008, + "step": 40588 + }, + { + "epoch": 1.04, + "learning_rate": 1.5182974334475644e-06, + "loss": 0.5173, + "step": 40589 + }, + { + "epoch": 1.04, + "learning_rate": 1.5182737694651593e-06, + "loss": 0.6841, + "step": 40590 + }, + { + "epoch": 1.04, + "learning_rate": 1.518250105085936e-06, + "loss": 0.958, + "step": 40591 + }, + { + "epoch": 1.04, + "learning_rate": 1.5182264403099121e-06, + "loss": 0.7412, + "step": 40592 + }, + { + "epoch": 1.04, + "learning_rate": 1.5182027751371062e-06, + "loss": 0.5449, + "step": 40593 + }, + { + "epoch": 1.04, + "learning_rate": 1.5181791095675363e-06, + "loss": 0.5693, + "step": 40594 + }, + { + "epoch": 1.04, + "learning_rate": 1.5181554436012208e-06, + "loss": 0.4109, + "step": 40595 + }, + { + "epoch": 1.04, + "learning_rate": 1.5181317772381767e-06, + "loss": 0.8389, + "step": 40596 + }, + { + "epoch": 1.04, + "learning_rate": 1.5181081104784234e-06, + "loss": 0.6709, + "step": 40597 + }, + { + "epoch": 1.04, + "learning_rate": 1.5180844433219785e-06, + "loss": 0.5879, + "step": 40598 + }, + { + "epoch": 1.04, + "learning_rate": 1.5180607757688603e-06, + "loss": 0.5242, + "step": 40599 + }, + { + "epoch": 1.04, + "learning_rate": 1.5180371078190867e-06, + "loss": 0.5996, + "step": 40600 + }, + { + "epoch": 1.04, + "learning_rate": 1.5180134394726758e-06, + "loss": 0.7129, + "step": 40601 + }, + { + "epoch": 1.04, + "learning_rate": 1.517989770729646e-06, + "loss": 0.6602, + "step": 40602 + }, + { + "epoch": 1.04, + "learning_rate": 1.5179661015900149e-06, + "loss": 0.8359, + "step": 40603 + }, + { + "epoch": 1.04, + "learning_rate": 1.5179424320538015e-06, + "loss": 0.5215, + "step": 40604 + }, + { + "epoch": 1.04, + "learning_rate": 1.517918762121023e-06, + "loss": 0.8633, + "step": 40605 + }, + { + "epoch": 1.04, + "learning_rate": 1.5178950917916984e-06, + "loss": 0.6104, + "step": 40606 + }, + { + "epoch": 1.04, + "learning_rate": 1.5178714210658448e-06, + "loss": 0.7324, + "step": 40607 + }, + { + "epoch": 1.04, + "learning_rate": 1.517847749943481e-06, + "loss": 0.6309, + "step": 40608 + }, + { + "epoch": 1.04, + "learning_rate": 1.517824078424625e-06, + "loss": 0.5833, + "step": 40609 + }, + { + "epoch": 1.04, + "learning_rate": 1.5178004065092952e-06, + "loss": 0.6011, + "step": 40610 + }, + { + "epoch": 1.04, + "learning_rate": 1.517776734197509e-06, + "loss": 0.7578, + "step": 40611 + }, + { + "epoch": 1.04, + "learning_rate": 1.517753061489285e-06, + "loss": 0.5625, + "step": 40612 + }, + { + "epoch": 1.04, + "learning_rate": 1.5177293883846414e-06, + "loss": 0.6104, + "step": 40613 + }, + { + "epoch": 1.04, + "learning_rate": 1.5177057148835965e-06, + "loss": 0.5913, + "step": 40614 + }, + { + "epoch": 1.04, + "learning_rate": 1.517682040986168e-06, + "loss": 0.6514, + "step": 40615 + }, + { + "epoch": 1.04, + "learning_rate": 1.517658366692374e-06, + "loss": 0.4094, + "step": 40616 + }, + { + "epoch": 1.04, + "learning_rate": 1.5176346920022327e-06, + "loss": 0.5706, + "step": 40617 + }, + { + "epoch": 1.04, + "learning_rate": 1.5176110169157625e-06, + "loss": 0.4463, + "step": 40618 + }, + { + "epoch": 1.04, + "learning_rate": 1.5175873414329817e-06, + "loss": 0.873, + "step": 40619 + }, + { + "epoch": 1.04, + "learning_rate": 1.5175636655539076e-06, + "loss": 0.5612, + "step": 40620 + }, + { + "epoch": 1.04, + "learning_rate": 1.5175399892785588e-06, + "loss": 0.5791, + "step": 40621 + }, + { + "epoch": 1.04, + "learning_rate": 1.5175163126069533e-06, + "loss": 0.6953, + "step": 40622 + }, + { + "epoch": 1.04, + "learning_rate": 1.5174926355391095e-06, + "loss": 0.5542, + "step": 40623 + }, + { + "epoch": 1.04, + "learning_rate": 1.5174689580750456e-06, + "loss": 0.666, + "step": 40624 + }, + { + "epoch": 1.04, + "learning_rate": 1.5174452802147794e-06, + "loss": 0.7822, + "step": 40625 + }, + { + "epoch": 1.04, + "learning_rate": 1.517421601958329e-06, + "loss": 0.7017, + "step": 40626 + }, + { + "epoch": 1.04, + "learning_rate": 1.5173979233057129e-06, + "loss": 0.4827, + "step": 40627 + }, + { + "epoch": 1.04, + "learning_rate": 1.5173742442569485e-06, + "loss": 0.6201, + "step": 40628 + }, + { + "epoch": 1.04, + "learning_rate": 1.5173505648120553e-06, + "loss": 0.7764, + "step": 40629 + }, + { + "epoch": 1.04, + "learning_rate": 1.51732688497105e-06, + "loss": 0.7295, + "step": 40630 + }, + { + "epoch": 1.04, + "learning_rate": 1.5173032047339513e-06, + "loss": 0.4941, + "step": 40631 + }, + { + "epoch": 1.04, + "learning_rate": 1.5172795241007771e-06, + "loss": 0.6138, + "step": 40632 + }, + { + "epoch": 1.04, + "learning_rate": 1.5172558430715462e-06, + "loss": 0.6318, + "step": 40633 + }, + { + "epoch": 1.04, + "learning_rate": 1.5172321616462761e-06, + "loss": 0.707, + "step": 40634 + }, + { + "epoch": 1.04, + "learning_rate": 1.5172084798249853e-06, + "loss": 0.6091, + "step": 40635 + }, + { + "epoch": 1.04, + "learning_rate": 1.5171847976076918e-06, + "loss": 0.6162, + "step": 40636 + }, + { + "epoch": 1.04, + "learning_rate": 1.5171611149944133e-06, + "loss": 0.4878, + "step": 40637 + }, + { + "epoch": 1.04, + "learning_rate": 1.5171374319851683e-06, + "loss": 0.6738, + "step": 40638 + }, + { + "epoch": 1.04, + "learning_rate": 1.5171137485799753e-06, + "loss": 0.6689, + "step": 40639 + }, + { + "epoch": 1.04, + "learning_rate": 1.517090064778852e-06, + "loss": 0.6592, + "step": 40640 + }, + { + "epoch": 1.04, + "learning_rate": 1.5170663805818164e-06, + "loss": 0.6792, + "step": 40641 + }, + { + "epoch": 1.04, + "learning_rate": 1.5170426959888868e-06, + "loss": 0.5596, + "step": 40642 + }, + { + "epoch": 1.04, + "learning_rate": 1.5170190110000818e-06, + "loss": 0.6206, + "step": 40643 + }, + { + "epoch": 1.04, + "learning_rate": 1.516995325615419e-06, + "loss": 0.6875, + "step": 40644 + }, + { + "epoch": 1.04, + "learning_rate": 1.5169716398349163e-06, + "loss": 0.5596, + "step": 40645 + }, + { + "epoch": 1.04, + "learning_rate": 1.5169479536585925e-06, + "loss": 0.635, + "step": 40646 + }, + { + "epoch": 1.04, + "learning_rate": 1.5169242670864652e-06, + "loss": 0.7812, + "step": 40647 + }, + { + "epoch": 1.04, + "learning_rate": 1.5169005801185529e-06, + "loss": 0.6138, + "step": 40648 + }, + { + "epoch": 1.04, + "learning_rate": 1.5168768927548737e-06, + "loss": 0.6475, + "step": 40649 + }, + { + "epoch": 1.04, + "learning_rate": 1.5168532049954455e-06, + "loss": 0.8105, + "step": 40650 + }, + { + "epoch": 1.04, + "learning_rate": 1.5168295168402865e-06, + "loss": 0.7295, + "step": 40651 + }, + { + "epoch": 1.04, + "learning_rate": 1.5168058282894148e-06, + "loss": 0.6816, + "step": 40652 + }, + { + "epoch": 1.04, + "learning_rate": 1.5167821393428488e-06, + "loss": 0.5415, + "step": 40653 + }, + { + "epoch": 1.04, + "learning_rate": 1.5167584500006068e-06, + "loss": 0.7202, + "step": 40654 + }, + { + "epoch": 1.04, + "learning_rate": 1.5167347602627061e-06, + "loss": 0.7695, + "step": 40655 + }, + { + "epoch": 1.04, + "learning_rate": 1.516711070129166e-06, + "loss": 0.5864, + "step": 40656 + }, + { + "epoch": 1.04, + "learning_rate": 1.516687379600003e-06, + "loss": 0.7266, + "step": 40657 + }, + { + "epoch": 1.04, + "learning_rate": 1.516663688675237e-06, + "loss": 0.6562, + "step": 40658 + }, + { + "epoch": 1.04, + "learning_rate": 1.5166399973548854e-06, + "loss": 0.5327, + "step": 40659 + }, + { + "epoch": 1.04, + "learning_rate": 1.516616305638966e-06, + "loss": 0.6802, + "step": 40660 + }, + { + "epoch": 1.04, + "learning_rate": 1.5165926135274974e-06, + "loss": 0.5801, + "step": 40661 + }, + { + "epoch": 1.04, + "learning_rate": 1.5165689210204976e-06, + "loss": 0.6855, + "step": 40662 + }, + { + "epoch": 1.04, + "learning_rate": 1.5165452281179842e-06, + "loss": 0.6265, + "step": 40663 + }, + { + "epoch": 1.04, + "learning_rate": 1.5165215348199764e-06, + "loss": 0.6411, + "step": 40664 + }, + { + "epoch": 1.04, + "learning_rate": 1.5164978411264918e-06, + "loss": 0.6924, + "step": 40665 + }, + { + "epoch": 1.04, + "learning_rate": 1.5164741470375485e-06, + "loss": 0.6748, + "step": 40666 + }, + { + "epoch": 1.04, + "learning_rate": 1.5164504525531645e-06, + "loss": 0.603, + "step": 40667 + }, + { + "epoch": 1.04, + "learning_rate": 1.5164267576733586e-06, + "loss": 0.5645, + "step": 40668 + }, + { + "epoch": 1.04, + "learning_rate": 1.5164030623981484e-06, + "loss": 0.6924, + "step": 40669 + }, + { + "epoch": 1.04, + "learning_rate": 1.5163793667275514e-06, + "loss": 0.6157, + "step": 40670 + }, + { + "epoch": 1.04, + "learning_rate": 1.5163556706615873e-06, + "loss": 0.6704, + "step": 40671 + }, + { + "epoch": 1.04, + "learning_rate": 1.5163319742002728e-06, + "loss": 0.468, + "step": 40672 + }, + { + "epoch": 1.04, + "learning_rate": 1.5163082773436271e-06, + "loss": 0.6323, + "step": 40673 + }, + { + "epoch": 1.04, + "learning_rate": 1.5162845800916678e-06, + "loss": 0.3464, + "step": 40674 + }, + { + "epoch": 1.04, + "learning_rate": 1.516260882444413e-06, + "loss": 0.7324, + "step": 40675 + }, + { + "epoch": 1.04, + "learning_rate": 1.516237184401881e-06, + "loss": 0.6392, + "step": 40676 + }, + { + "epoch": 1.04, + "learning_rate": 1.5162134859640898e-06, + "loss": 0.5283, + "step": 40677 + }, + { + "epoch": 1.04, + "learning_rate": 1.516189787131058e-06, + "loss": 0.7129, + "step": 40678 + }, + { + "epoch": 1.04, + "learning_rate": 1.5161660879028034e-06, + "loss": 0.7451, + "step": 40679 + }, + { + "epoch": 1.04, + "learning_rate": 1.5161423882793436e-06, + "loss": 0.7393, + "step": 40680 + }, + { + "epoch": 1.04, + "learning_rate": 1.5161186882606977e-06, + "loss": 0.7754, + "step": 40681 + }, + { + "epoch": 1.04, + "learning_rate": 1.5160949878468836e-06, + "loss": 0.5835, + "step": 40682 + }, + { + "epoch": 1.04, + "learning_rate": 1.5160712870379192e-06, + "loss": 0.7178, + "step": 40683 + }, + { + "epoch": 1.04, + "learning_rate": 1.5160475858338227e-06, + "loss": 0.501, + "step": 40684 + }, + { + "epoch": 1.04, + "learning_rate": 1.5160238842346122e-06, + "loss": 0.7383, + "step": 40685 + }, + { + "epoch": 1.04, + "learning_rate": 1.5160001822403062e-06, + "loss": 0.6548, + "step": 40686 + }, + { + "epoch": 1.04, + "learning_rate": 1.5159764798509222e-06, + "loss": 0.7207, + "step": 40687 + }, + { + "epoch": 1.04, + "learning_rate": 1.515952777066479e-06, + "loss": 0.7793, + "step": 40688 + }, + { + "epoch": 1.04, + "learning_rate": 1.5159290738869946e-06, + "loss": 0.6846, + "step": 40689 + }, + { + "epoch": 1.04, + "learning_rate": 1.515905370312487e-06, + "loss": 0.834, + "step": 40690 + }, + { + "epoch": 1.04, + "learning_rate": 1.515881666342974e-06, + "loss": 0.6602, + "step": 40691 + }, + { + "epoch": 1.04, + "learning_rate": 1.5158579619784743e-06, + "loss": 0.6035, + "step": 40692 + }, + { + "epoch": 1.04, + "learning_rate": 1.515834257219006e-06, + "loss": 0.6626, + "step": 40693 + }, + { + "epoch": 1.04, + "learning_rate": 1.5158105520645874e-06, + "loss": 0.5815, + "step": 40694 + }, + { + "epoch": 1.04, + "learning_rate": 1.5157868465152358e-06, + "loss": 0.7373, + "step": 40695 + }, + { + "epoch": 1.04, + "learning_rate": 1.5157631405709702e-06, + "loss": 0.7004, + "step": 40696 + }, + { + "epoch": 1.04, + "learning_rate": 1.5157394342318084e-06, + "loss": 0.4197, + "step": 40697 + }, + { + "epoch": 1.04, + "learning_rate": 1.5157157274977688e-06, + "loss": 0.6709, + "step": 40698 + }, + { + "epoch": 1.04, + "learning_rate": 1.5156920203688693e-06, + "loss": 0.5474, + "step": 40699 + }, + { + "epoch": 1.04, + "learning_rate": 1.5156683128451282e-06, + "loss": 0.7676, + "step": 40700 + }, + { + "epoch": 1.04, + "learning_rate": 1.5156446049265634e-06, + "loss": 0.4626, + "step": 40701 + }, + { + "epoch": 1.04, + "learning_rate": 1.5156208966131933e-06, + "loss": 0.8271, + "step": 40702 + }, + { + "epoch": 1.04, + "learning_rate": 1.515597187905036e-06, + "loss": 0.6494, + "step": 40703 + }, + { + "epoch": 1.04, + "learning_rate": 1.5155734788021098e-06, + "loss": 0.5923, + "step": 40704 + }, + { + "epoch": 1.04, + "learning_rate": 1.5155497693044325e-06, + "loss": 0.4388, + "step": 40705 + }, + { + "epoch": 1.04, + "learning_rate": 1.5155260594120226e-06, + "loss": 0.6855, + "step": 40706 + }, + { + "epoch": 1.04, + "learning_rate": 1.5155023491248978e-06, + "loss": 0.6699, + "step": 40707 + }, + { + "epoch": 1.04, + "learning_rate": 1.515478638443077e-06, + "loss": 0.8887, + "step": 40708 + }, + { + "epoch": 1.04, + "learning_rate": 1.5154549273665774e-06, + "loss": 0.7793, + "step": 40709 + }, + { + "epoch": 1.04, + "learning_rate": 1.515431215895418e-06, + "loss": 0.6221, + "step": 40710 + }, + { + "epoch": 1.04, + "learning_rate": 1.5154075040296165e-06, + "loss": 0.6196, + "step": 40711 + }, + { + "epoch": 1.04, + "learning_rate": 1.5153837917691911e-06, + "loss": 0.6865, + "step": 40712 + }, + { + "epoch": 1.04, + "learning_rate": 1.5153600791141604e-06, + "loss": 0.77, + "step": 40713 + }, + { + "epoch": 1.04, + "learning_rate": 1.5153363660645417e-06, + "loss": 0.6646, + "step": 40714 + }, + { + "epoch": 1.04, + "learning_rate": 1.5153126526203539e-06, + "loss": 0.6078, + "step": 40715 + }, + { + "epoch": 1.04, + "learning_rate": 1.515288938781615e-06, + "loss": 0.6172, + "step": 40716 + }, + { + "epoch": 1.04, + "learning_rate": 1.5152652245483428e-06, + "loss": 0.6327, + "step": 40717 + }, + { + "epoch": 1.04, + "learning_rate": 1.5152415099205559e-06, + "loss": 0.6963, + "step": 40718 + }, + { + "epoch": 1.04, + "learning_rate": 1.5152177948982724e-06, + "loss": 0.5182, + "step": 40719 + }, + { + "epoch": 1.04, + "learning_rate": 1.51519407948151e-06, + "loss": 0.5972, + "step": 40720 + }, + { + "epoch": 1.04, + "learning_rate": 1.5151703636702873e-06, + "loss": 0.7148, + "step": 40721 + }, + { + "epoch": 1.04, + "learning_rate": 1.5151466474646224e-06, + "loss": 0.7803, + "step": 40722 + }, + { + "epoch": 1.04, + "learning_rate": 1.5151229308645331e-06, + "loss": 0.4995, + "step": 40723 + }, + { + "epoch": 1.04, + "learning_rate": 1.5150992138700383e-06, + "loss": 0.5889, + "step": 40724 + }, + { + "epoch": 1.04, + "learning_rate": 1.5150754964811555e-06, + "loss": 0.6587, + "step": 40725 + }, + { + "epoch": 1.04, + "learning_rate": 1.5150517786979032e-06, + "loss": 0.5825, + "step": 40726 + }, + { + "epoch": 1.04, + "learning_rate": 1.5150280605202993e-06, + "loss": 0.6348, + "step": 40727 + }, + { + "epoch": 1.04, + "learning_rate": 1.515004341948362e-06, + "loss": 0.7324, + "step": 40728 + }, + { + "epoch": 1.04, + "learning_rate": 1.5149806229821098e-06, + "loss": 0.6611, + "step": 40729 + }, + { + "epoch": 1.04, + "learning_rate": 1.5149569036215603e-06, + "loss": 0.7686, + "step": 40730 + }, + { + "epoch": 1.04, + "learning_rate": 1.5149331838667325e-06, + "loss": 0.7441, + "step": 40731 + }, + { + "epoch": 1.04, + "learning_rate": 1.5149094637176436e-06, + "loss": 0.6758, + "step": 40732 + }, + { + "epoch": 1.04, + "learning_rate": 1.5148857431743123e-06, + "loss": 0.6953, + "step": 40733 + }, + { + "epoch": 1.04, + "learning_rate": 1.5148620222367567e-06, + "loss": 0.3719, + "step": 40734 + }, + { + "epoch": 1.04, + "learning_rate": 1.5148383009049947e-06, + "loss": 0.7607, + "step": 40735 + }, + { + "epoch": 1.04, + "learning_rate": 1.514814579179045e-06, + "loss": 0.7256, + "step": 40736 + }, + { + "epoch": 1.04, + "learning_rate": 1.5147908570589252e-06, + "loss": 0.6411, + "step": 40737 + }, + { + "epoch": 1.04, + "learning_rate": 1.514767134544654e-06, + "loss": 0.5889, + "step": 40738 + }, + { + "epoch": 1.04, + "learning_rate": 1.5147434116362491e-06, + "loss": 0.6079, + "step": 40739 + }, + { + "epoch": 1.04, + "learning_rate": 1.514719688333729e-06, + "loss": 0.5657, + "step": 40740 + }, + { + "epoch": 1.04, + "learning_rate": 1.5146959646371116e-06, + "loss": 0.5122, + "step": 40741 + }, + { + "epoch": 1.04, + "learning_rate": 1.5146722405464152e-06, + "loss": 0.5728, + "step": 40742 + }, + { + "epoch": 1.04, + "learning_rate": 1.5146485160616575e-06, + "loss": 0.6924, + "step": 40743 + }, + { + "epoch": 1.04, + "learning_rate": 1.5146247911828578e-06, + "loss": 0.709, + "step": 40744 + }, + { + "epoch": 1.04, + "learning_rate": 1.514601065910033e-06, + "loss": 0.707, + "step": 40745 + }, + { + "epoch": 1.04, + "learning_rate": 1.514577340243202e-06, + "loss": 0.6709, + "step": 40746 + }, + { + "epoch": 1.04, + "learning_rate": 1.5145536141823829e-06, + "loss": 0.6875, + "step": 40747 + }, + { + "epoch": 1.04, + "learning_rate": 1.5145298877275936e-06, + "loss": 0.5759, + "step": 40748 + }, + { + "epoch": 1.04, + "learning_rate": 1.5145061608788528e-06, + "loss": 0.6621, + "step": 40749 + }, + { + "epoch": 1.04, + "learning_rate": 1.514482433636178e-06, + "loss": 0.4368, + "step": 40750 + }, + { + "epoch": 1.04, + "learning_rate": 1.5144587059995875e-06, + "loss": 0.8232, + "step": 40751 + }, + { + "epoch": 1.04, + "learning_rate": 1.5144349779691e-06, + "loss": 0.6914, + "step": 40752 + }, + { + "epoch": 1.04, + "learning_rate": 1.5144112495447327e-06, + "loss": 0.4951, + "step": 40753 + }, + { + "epoch": 1.04, + "learning_rate": 1.514387520726505e-06, + "loss": 0.6914, + "step": 40754 + }, + { + "epoch": 1.04, + "learning_rate": 1.5143637915144343e-06, + "loss": 0.5701, + "step": 40755 + }, + { + "epoch": 1.04, + "learning_rate": 1.5143400619085386e-06, + "loss": 0.541, + "step": 40756 + }, + { + "epoch": 1.04, + "learning_rate": 1.5143163319088364e-06, + "loss": 0.7432, + "step": 40757 + }, + { + "epoch": 1.04, + "learning_rate": 1.514292601515346e-06, + "loss": 0.7446, + "step": 40758 + }, + { + "epoch": 1.04, + "learning_rate": 1.5142688707280856e-06, + "loss": 0.7686, + "step": 40759 + }, + { + "epoch": 1.04, + "learning_rate": 1.5142451395470727e-06, + "loss": 0.6787, + "step": 40760 + }, + { + "epoch": 1.04, + "learning_rate": 1.5142214079723262e-06, + "loss": 0.6958, + "step": 40761 + }, + { + "epoch": 1.04, + "learning_rate": 1.514197676003864e-06, + "loss": 0.5496, + "step": 40762 + }, + { + "epoch": 1.04, + "learning_rate": 1.5141739436417042e-06, + "loss": 0.5255, + "step": 40763 + }, + { + "epoch": 1.04, + "learning_rate": 1.5141502108858652e-06, + "loss": 0.623, + "step": 40764 + }, + { + "epoch": 1.04, + "learning_rate": 1.5141264777363652e-06, + "loss": 0.6895, + "step": 40765 + }, + { + "epoch": 1.04, + "learning_rate": 1.5141027441932214e-06, + "loss": 0.7529, + "step": 40766 + }, + { + "epoch": 1.04, + "learning_rate": 1.5140790102564535e-06, + "loss": 0.7666, + "step": 40767 + }, + { + "epoch": 1.04, + "learning_rate": 1.5140552759260788e-06, + "loss": 0.6069, + "step": 40768 + }, + { + "epoch": 1.04, + "learning_rate": 1.5140315412021156e-06, + "loss": 0.6924, + "step": 40769 + }, + { + "epoch": 1.04, + "learning_rate": 1.514007806084582e-06, + "loss": 0.7178, + "step": 40770 + }, + { + "epoch": 1.04, + "learning_rate": 1.5139840705734966e-06, + "loss": 0.6953, + "step": 40771 + }, + { + "epoch": 1.05, + "learning_rate": 1.5139603346688764e-06, + "loss": 0.4707, + "step": 40772 + }, + { + "epoch": 1.05, + "learning_rate": 1.5139365983707412e-06, + "loss": 0.7373, + "step": 40773 + }, + { + "epoch": 1.05, + "learning_rate": 1.5139128616791084e-06, + "loss": 0.7305, + "step": 40774 + }, + { + "epoch": 1.05, + "learning_rate": 1.5138891245939958e-06, + "loss": 0.5679, + "step": 40775 + }, + { + "epoch": 1.05, + "learning_rate": 1.513865387115422e-06, + "loss": 0.7998, + "step": 40776 + }, + { + "epoch": 1.05, + "learning_rate": 1.5138416492434049e-06, + "loss": 0.5615, + "step": 40777 + }, + { + "epoch": 1.05, + "learning_rate": 1.5138179109779633e-06, + "loss": 0.6079, + "step": 40778 + }, + { + "epoch": 1.05, + "learning_rate": 1.5137941723191146e-06, + "loss": 0.6279, + "step": 40779 + }, + { + "epoch": 1.05, + "learning_rate": 1.5137704332668774e-06, + "loss": 0.4638, + "step": 40780 + }, + { + "epoch": 1.05, + "learning_rate": 1.5137466938212699e-06, + "loss": 0.4717, + "step": 40781 + }, + { + "epoch": 1.05, + "learning_rate": 1.51372295398231e-06, + "loss": 0.5195, + "step": 40782 + }, + { + "epoch": 1.05, + "learning_rate": 1.5136992137500161e-06, + "loss": 0.6592, + "step": 40783 + }, + { + "epoch": 1.05, + "learning_rate": 1.5136754731244068e-06, + "loss": 0.6914, + "step": 40784 + }, + { + "epoch": 1.05, + "learning_rate": 1.513651732105499e-06, + "loss": 0.7231, + "step": 40785 + }, + { + "epoch": 1.05, + "learning_rate": 1.5136279906933125e-06, + "loss": 0.5596, + "step": 40786 + }, + { + "epoch": 1.05, + "learning_rate": 1.513604248887864e-06, + "loss": 0.8047, + "step": 40787 + }, + { + "epoch": 1.05, + "learning_rate": 1.513580506689173e-06, + "loss": 0.647, + "step": 40788 + }, + { + "epoch": 1.05, + "learning_rate": 1.5135567640972564e-06, + "loss": 0.7881, + "step": 40789 + }, + { + "epoch": 1.05, + "learning_rate": 1.5135330211121336e-06, + "loss": 0.5747, + "step": 40790 + }, + { + "epoch": 1.05, + "learning_rate": 1.5135092777338216e-06, + "loss": 0.5747, + "step": 40791 + }, + { + "epoch": 1.05, + "learning_rate": 1.5134855339623393e-06, + "loss": 0.5957, + "step": 40792 + }, + { + "epoch": 1.05, + "learning_rate": 1.513461789797705e-06, + "loss": 0.7725, + "step": 40793 + }, + { + "epoch": 1.05, + "learning_rate": 1.5134380452399365e-06, + "loss": 0.6299, + "step": 40794 + }, + { + "epoch": 1.05, + "learning_rate": 1.5134143002890519e-06, + "loss": 0.6719, + "step": 40795 + }, + { + "epoch": 1.05, + "learning_rate": 1.5133905549450698e-06, + "loss": 0.5684, + "step": 40796 + }, + { + "epoch": 1.05, + "learning_rate": 1.5133668092080082e-06, + "loss": 0.5737, + "step": 40797 + }, + { + "epoch": 1.05, + "learning_rate": 1.513343063077885e-06, + "loss": 0.6768, + "step": 40798 + }, + { + "epoch": 1.05, + "learning_rate": 1.5133193165547187e-06, + "loss": 0.6709, + "step": 40799 + }, + { + "epoch": 1.05, + "learning_rate": 1.5132955696385272e-06, + "loss": 0.4805, + "step": 40800 + }, + { + "epoch": 1.05, + "learning_rate": 1.5132718223293292e-06, + "loss": 0.792, + "step": 40801 + }, + { + "epoch": 1.05, + "learning_rate": 1.5132480746271426e-06, + "loss": 0.8477, + "step": 40802 + }, + { + "epoch": 1.05, + "learning_rate": 1.5132243265319855e-06, + "loss": 0.6421, + "step": 40803 + }, + { + "epoch": 1.05, + "learning_rate": 1.513200578043876e-06, + "loss": 0.6592, + "step": 40804 + }, + { + "epoch": 1.05, + "learning_rate": 1.5131768291628326e-06, + "loss": 0.7969, + "step": 40805 + }, + { + "epoch": 1.05, + "learning_rate": 1.513153079888873e-06, + "loss": 0.3901, + "step": 40806 + }, + { + "epoch": 1.05, + "learning_rate": 1.513129330222016e-06, + "loss": 0.7324, + "step": 40807 + }, + { + "epoch": 1.05, + "learning_rate": 1.5131055801622791e-06, + "loss": 0.7148, + "step": 40808 + }, + { + "epoch": 1.05, + "learning_rate": 1.5130818297096815e-06, + "loss": 0.5369, + "step": 40809 + }, + { + "epoch": 1.05, + "learning_rate": 1.51305807886424e-06, + "loss": 0.561, + "step": 40810 + }, + { + "epoch": 1.05, + "learning_rate": 1.5130343276259741e-06, + "loss": 0.6865, + "step": 40811 + }, + { + "epoch": 1.05, + "learning_rate": 1.513010575994901e-06, + "loss": 0.5791, + "step": 40812 + }, + { + "epoch": 1.05, + "learning_rate": 1.5129868239710395e-06, + "loss": 0.7871, + "step": 40813 + }, + { + "epoch": 1.05, + "learning_rate": 1.5129630715544076e-06, + "loss": 0.4775, + "step": 40814 + }, + { + "epoch": 1.05, + "learning_rate": 1.5129393187450233e-06, + "loss": 0.6206, + "step": 40815 + }, + { + "epoch": 1.05, + "learning_rate": 1.512915565542905e-06, + "loss": 0.5046, + "step": 40816 + }, + { + "epoch": 1.05, + "learning_rate": 1.5128918119480706e-06, + "loss": 0.7822, + "step": 40817 + }, + { + "epoch": 1.05, + "learning_rate": 1.5128680579605388e-06, + "loss": 0.7441, + "step": 40818 + }, + { + "epoch": 1.05, + "learning_rate": 1.5128443035803277e-06, + "loss": 0.5386, + "step": 40819 + }, + { + "epoch": 1.05, + "learning_rate": 1.512820548807455e-06, + "loss": 0.6382, + "step": 40820 + }, + { + "epoch": 1.05, + "learning_rate": 1.5127967936419394e-06, + "loss": 0.6226, + "step": 40821 + }, + { + "epoch": 1.05, + "learning_rate": 1.5127730380837986e-06, + "loss": 0.6172, + "step": 40822 + }, + { + "epoch": 1.05, + "learning_rate": 1.5127492821330515e-06, + "loss": 0.7178, + "step": 40823 + }, + { + "epoch": 1.05, + "learning_rate": 1.5127255257897154e-06, + "loss": 0.7383, + "step": 40824 + }, + { + "epoch": 1.05, + "learning_rate": 1.512701769053809e-06, + "loss": 0.6294, + "step": 40825 + }, + { + "epoch": 1.05, + "learning_rate": 1.5126780119253506e-06, + "loss": 0.6162, + "step": 40826 + }, + { + "epoch": 1.05, + "learning_rate": 1.5126542544043579e-06, + "loss": 0.6016, + "step": 40827 + }, + { + "epoch": 1.05, + "learning_rate": 1.5126304964908499e-06, + "loss": 0.6851, + "step": 40828 + }, + { + "epoch": 1.05, + "learning_rate": 1.5126067381848442e-06, + "loss": 0.7578, + "step": 40829 + }, + { + "epoch": 1.05, + "learning_rate": 1.512582979486359e-06, + "loss": 0.6421, + "step": 40830 + }, + { + "epoch": 1.05, + "learning_rate": 1.5125592203954124e-06, + "loss": 0.6396, + "step": 40831 + }, + { + "epoch": 1.05, + "learning_rate": 1.5125354609120228e-06, + "loss": 0.7324, + "step": 40832 + }, + { + "epoch": 1.05, + "learning_rate": 1.5125117010362084e-06, + "loss": 0.7939, + "step": 40833 + }, + { + "epoch": 1.05, + "learning_rate": 1.5124879407679876e-06, + "loss": 0.5444, + "step": 40834 + }, + { + "epoch": 1.05, + "learning_rate": 1.5124641801073784e-06, + "loss": 0.6562, + "step": 40835 + }, + { + "epoch": 1.05, + "learning_rate": 1.5124404190543985e-06, + "loss": 0.7451, + "step": 40836 + }, + { + "epoch": 1.05, + "learning_rate": 1.5124166576090668e-06, + "loss": 0.7666, + "step": 40837 + }, + { + "epoch": 1.05, + "learning_rate": 1.5123928957714012e-06, + "loss": 0.5361, + "step": 40838 + }, + { + "epoch": 1.05, + "learning_rate": 1.51236913354142e-06, + "loss": 0.5386, + "step": 40839 + }, + { + "epoch": 1.05, + "learning_rate": 1.5123453709191412e-06, + "loss": 0.7012, + "step": 40840 + }, + { + "epoch": 1.05, + "learning_rate": 1.5123216079045832e-06, + "loss": 0.6143, + "step": 40841 + }, + { + "epoch": 1.05, + "learning_rate": 1.512297844497764e-06, + "loss": 0.6479, + "step": 40842 + }, + { + "epoch": 1.05, + "learning_rate": 1.5122740806987015e-06, + "loss": 0.6621, + "step": 40843 + }, + { + "epoch": 1.05, + "learning_rate": 1.5122503165074148e-06, + "loss": 0.5811, + "step": 40844 + }, + { + "epoch": 1.05, + "learning_rate": 1.5122265519239217e-06, + "loss": 0.752, + "step": 40845 + }, + { + "epoch": 1.05, + "learning_rate": 1.5122027869482399e-06, + "loss": 0.6162, + "step": 40846 + }, + { + "epoch": 1.05, + "learning_rate": 1.5121790215803882e-06, + "loss": 0.6821, + "step": 40847 + }, + { + "epoch": 1.05, + "learning_rate": 1.5121552558203848e-06, + "loss": 0.6709, + "step": 40848 + }, + { + "epoch": 1.05, + "learning_rate": 1.5121314896682472e-06, + "loss": 0.7061, + "step": 40849 + }, + { + "epoch": 1.05, + "learning_rate": 1.5121077231239942e-06, + "loss": 0.6328, + "step": 40850 + }, + { + "epoch": 1.05, + "learning_rate": 1.5120839561876442e-06, + "loss": 0.6553, + "step": 40851 + }, + { + "epoch": 1.05, + "learning_rate": 1.5120601888592144e-06, + "loss": 0.6445, + "step": 40852 + }, + { + "epoch": 1.05, + "learning_rate": 1.5120364211387243e-06, + "loss": 0.5884, + "step": 40853 + }, + { + "epoch": 1.05, + "learning_rate": 1.5120126530261913e-06, + "loss": 0.6309, + "step": 40854 + }, + { + "epoch": 1.05, + "learning_rate": 1.5119888845216338e-06, + "loss": 0.4473, + "step": 40855 + }, + { + "epoch": 1.05, + "learning_rate": 1.5119651156250695e-06, + "loss": 0.7188, + "step": 40856 + }, + { + "epoch": 1.05, + "learning_rate": 1.5119413463365174e-06, + "loss": 0.4597, + "step": 40857 + }, + { + "epoch": 1.05, + "learning_rate": 1.5119175766559954e-06, + "loss": 0.6655, + "step": 40858 + }, + { + "epoch": 1.05, + "learning_rate": 1.5118938065835217e-06, + "loss": 0.5879, + "step": 40859 + }, + { + "epoch": 1.05, + "learning_rate": 1.511870036119114e-06, + "loss": 0.584, + "step": 40860 + }, + { + "epoch": 1.05, + "learning_rate": 1.5118462652627914e-06, + "loss": 0.7256, + "step": 40861 + }, + { + "epoch": 1.05, + "learning_rate": 1.5118224940145714e-06, + "loss": 0.5811, + "step": 40862 + }, + { + "epoch": 1.05, + "learning_rate": 1.5117987223744727e-06, + "loss": 0.6885, + "step": 40863 + }, + { + "epoch": 1.05, + "learning_rate": 1.5117749503425133e-06, + "loss": 0.4565, + "step": 40864 + }, + { + "epoch": 1.05, + "learning_rate": 1.511751177918711e-06, + "loss": 0.5044, + "step": 40865 + }, + { + "epoch": 1.05, + "learning_rate": 1.5117274051030844e-06, + "loss": 0.6406, + "step": 40866 + }, + { + "epoch": 1.05, + "learning_rate": 1.511703631895652e-06, + "loss": 0.8564, + "step": 40867 + }, + { + "epoch": 1.05, + "learning_rate": 1.511679858296431e-06, + "loss": 0.7773, + "step": 40868 + }, + { + "epoch": 1.05, + "learning_rate": 1.5116560843054411e-06, + "loss": 0.5156, + "step": 40869 + }, + { + "epoch": 1.05, + "learning_rate": 1.5116323099226993e-06, + "loss": 0.7432, + "step": 40870 + }, + { + "epoch": 1.05, + "learning_rate": 1.511608535148224e-06, + "loss": 0.7021, + "step": 40871 + }, + { + "epoch": 1.05, + "learning_rate": 1.5115847599820336e-06, + "loss": 0.5596, + "step": 40872 + }, + { + "epoch": 1.05, + "learning_rate": 1.5115609844241464e-06, + "loss": 0.6697, + "step": 40873 + }, + { + "epoch": 1.05, + "learning_rate": 1.5115372084745808e-06, + "loss": 0.7168, + "step": 40874 + }, + { + "epoch": 1.05, + "learning_rate": 1.511513432133354e-06, + "loss": 0.6973, + "step": 40875 + }, + { + "epoch": 1.05, + "learning_rate": 1.5114896554004856e-06, + "loss": 0.8262, + "step": 40876 + }, + { + "epoch": 1.05, + "learning_rate": 1.5114658782759923e-06, + "loss": 0.6636, + "step": 40877 + }, + { + "epoch": 1.05, + "learning_rate": 1.5114421007598937e-06, + "loss": 0.7002, + "step": 40878 + }, + { + "epoch": 1.05, + "learning_rate": 1.511418322852207e-06, + "loss": 0.7998, + "step": 40879 + }, + { + "epoch": 1.05, + "learning_rate": 1.5113945445529513e-06, + "loss": 0.5688, + "step": 40880 + }, + { + "epoch": 1.05, + "learning_rate": 1.5113707658621438e-06, + "loss": 0.5159, + "step": 40881 + }, + { + "epoch": 1.05, + "learning_rate": 1.5113469867798037e-06, + "loss": 0.6943, + "step": 40882 + }, + { + "epoch": 1.05, + "learning_rate": 1.5113232073059481e-06, + "loss": 0.7061, + "step": 40883 + }, + { + "epoch": 1.05, + "learning_rate": 1.5112994274405964e-06, + "loss": 0.7158, + "step": 40884 + }, + { + "epoch": 1.05, + "learning_rate": 1.511275647183766e-06, + "loss": 0.6406, + "step": 40885 + }, + { + "epoch": 1.05, + "learning_rate": 1.5112518665354755e-06, + "loss": 0.6514, + "step": 40886 + }, + { + "epoch": 1.05, + "learning_rate": 1.5112280854957427e-06, + "loss": 0.6455, + "step": 40887 + }, + { + "epoch": 1.05, + "learning_rate": 1.511204304064586e-06, + "loss": 0.6699, + "step": 40888 + }, + { + "epoch": 1.05, + "learning_rate": 1.511180522242024e-06, + "loss": 0.7832, + "step": 40889 + }, + { + "epoch": 1.05, + "learning_rate": 1.5111567400280745e-06, + "loss": 0.5317, + "step": 40890 + }, + { + "epoch": 1.05, + "learning_rate": 1.5111329574227557e-06, + "loss": 0.5142, + "step": 40891 + }, + { + "epoch": 1.05, + "learning_rate": 1.5111091744260858e-06, + "loss": 0.6909, + "step": 40892 + }, + { + "epoch": 1.05, + "learning_rate": 1.511085391038083e-06, + "loss": 0.6367, + "step": 40893 + }, + { + "epoch": 1.05, + "learning_rate": 1.511061607258766e-06, + "loss": 0.6299, + "step": 40894 + }, + { + "epoch": 1.05, + "learning_rate": 1.5110378230881527e-06, + "loss": 0.8652, + "step": 40895 + }, + { + "epoch": 1.05, + "learning_rate": 1.5110140385262608e-06, + "loss": 0.6416, + "step": 40896 + }, + { + "epoch": 1.05, + "learning_rate": 1.5109902535731092e-06, + "loss": 0.5952, + "step": 40897 + }, + { + "epoch": 1.05, + "learning_rate": 1.5109664682287158e-06, + "loss": 0.6885, + "step": 40898 + }, + { + "epoch": 1.05, + "learning_rate": 1.5109426824930992e-06, + "loss": 0.6753, + "step": 40899 + }, + { + "epoch": 1.05, + "learning_rate": 1.510918896366277e-06, + "loss": 0.4346, + "step": 40900 + }, + { + "epoch": 1.05, + "learning_rate": 1.5108951098482674e-06, + "loss": 0.7061, + "step": 40901 + }, + { + "epoch": 1.05, + "learning_rate": 1.510871322939089e-06, + "loss": 0.7559, + "step": 40902 + }, + { + "epoch": 1.05, + "learning_rate": 1.5108475356387604e-06, + "loss": 0.5374, + "step": 40903 + }, + { + "epoch": 1.05, + "learning_rate": 1.5108237479472988e-06, + "loss": 0.6313, + "step": 40904 + }, + { + "epoch": 1.05, + "learning_rate": 1.5107999598647234e-06, + "loss": 0.6934, + "step": 40905 + }, + { + "epoch": 1.05, + "learning_rate": 1.5107761713910517e-06, + "loss": 0.6035, + "step": 40906 + }, + { + "epoch": 1.05, + "learning_rate": 1.5107523825263023e-06, + "loss": 0.525, + "step": 40907 + }, + { + "epoch": 1.05, + "learning_rate": 1.510728593270493e-06, + "loss": 0.5938, + "step": 40908 + }, + { + "epoch": 1.05, + "learning_rate": 1.5107048036236426e-06, + "loss": 0.7026, + "step": 40909 + }, + { + "epoch": 1.05, + "learning_rate": 1.5106810135857689e-06, + "loss": 0.6121, + "step": 40910 + }, + { + "epoch": 1.05, + "learning_rate": 1.5106572231568901e-06, + "loss": 0.709, + "step": 40911 + }, + { + "epoch": 1.05, + "learning_rate": 1.5106334323370246e-06, + "loss": 0.7432, + "step": 40912 + }, + { + "epoch": 1.05, + "learning_rate": 1.5106096411261909e-06, + "loss": 0.5933, + "step": 40913 + }, + { + "epoch": 1.05, + "learning_rate": 1.5105858495244066e-06, + "loss": 0.6885, + "step": 40914 + }, + { + "epoch": 1.05, + "learning_rate": 1.5105620575316899e-06, + "loss": 0.3085, + "step": 40915 + }, + { + "epoch": 1.05, + "learning_rate": 1.5105382651480599e-06, + "loss": 0.7354, + "step": 40916 + }, + { + "epoch": 1.05, + "learning_rate": 1.5105144723735337e-06, + "loss": 0.6348, + "step": 40917 + }, + { + "epoch": 1.05, + "learning_rate": 1.5104906792081305e-06, + "loss": 0.4229, + "step": 40918 + }, + { + "epoch": 1.05, + "learning_rate": 1.5104668856518677e-06, + "loss": 0.6953, + "step": 40919 + }, + { + "epoch": 1.05, + "learning_rate": 1.5104430917047641e-06, + "loss": 0.8242, + "step": 40920 + }, + { + "epoch": 1.05, + "learning_rate": 1.5104192973668375e-06, + "loss": 0.603, + "step": 40921 + }, + { + "epoch": 1.05, + "learning_rate": 1.5103955026381065e-06, + "loss": 0.5562, + "step": 40922 + }, + { + "epoch": 1.05, + "learning_rate": 1.510371707518589e-06, + "loss": 0.7109, + "step": 40923 + }, + { + "epoch": 1.05, + "learning_rate": 1.5103479120083034e-06, + "loss": 0.6758, + "step": 40924 + }, + { + "epoch": 1.05, + "learning_rate": 1.510324116107268e-06, + "loss": 0.6587, + "step": 40925 + }, + { + "epoch": 1.05, + "learning_rate": 1.5103003198155006e-06, + "loss": 0.6479, + "step": 40926 + }, + { + "epoch": 1.05, + "learning_rate": 1.5102765231330196e-06, + "loss": 0.5708, + "step": 40927 + }, + { + "epoch": 1.05, + "learning_rate": 1.5102527260598442e-06, + "loss": 0.5444, + "step": 40928 + }, + { + "epoch": 1.05, + "learning_rate": 1.5102289285959909e-06, + "loss": 0.8262, + "step": 40929 + }, + { + "epoch": 1.05, + "learning_rate": 1.510205130741479e-06, + "loss": 0.7402, + "step": 40930 + }, + { + "epoch": 1.05, + "learning_rate": 1.5101813324963264e-06, + "loss": 0.708, + "step": 40931 + }, + { + "epoch": 1.05, + "learning_rate": 1.5101575338605518e-06, + "loss": 0.5061, + "step": 40932 + }, + { + "epoch": 1.05, + "learning_rate": 1.5101337348341728e-06, + "loss": 0.4609, + "step": 40933 + }, + { + "epoch": 1.05, + "learning_rate": 1.5101099354172074e-06, + "loss": 0.5884, + "step": 40934 + }, + { + "epoch": 1.05, + "learning_rate": 1.5100861356096748e-06, + "loss": 0.6357, + "step": 40935 + }, + { + "epoch": 1.05, + "learning_rate": 1.5100623354115926e-06, + "loss": 0.7207, + "step": 40936 + }, + { + "epoch": 1.05, + "learning_rate": 1.510038534822979e-06, + "loss": 0.6924, + "step": 40937 + }, + { + "epoch": 1.05, + "learning_rate": 1.5100147338438527e-06, + "loss": 0.4478, + "step": 40938 + }, + { + "epoch": 1.05, + "learning_rate": 1.5099909324742312e-06, + "loss": 0.4559, + "step": 40939 + }, + { + "epoch": 1.05, + "learning_rate": 1.5099671307141332e-06, + "loss": 0.6191, + "step": 40940 + }, + { + "epoch": 1.05, + "learning_rate": 1.509943328563577e-06, + "loss": 0.6895, + "step": 40941 + }, + { + "epoch": 1.05, + "learning_rate": 1.5099195260225802e-06, + "loss": 0.5986, + "step": 40942 + }, + { + "epoch": 1.05, + "learning_rate": 1.5098957230911621e-06, + "loss": 0.6091, + "step": 40943 + }, + { + "epoch": 1.05, + "learning_rate": 1.5098719197693397e-06, + "loss": 0.623, + "step": 40944 + }, + { + "epoch": 1.05, + "learning_rate": 1.5098481160571321e-06, + "loss": 0.7773, + "step": 40945 + }, + { + "epoch": 1.05, + "learning_rate": 1.5098243119545573e-06, + "loss": 0.7256, + "step": 40946 + }, + { + "epoch": 1.05, + "learning_rate": 1.5098005074616333e-06, + "loss": 0.5786, + "step": 40947 + }, + { + "epoch": 1.05, + "learning_rate": 1.5097767025783786e-06, + "loss": 0.6924, + "step": 40948 + }, + { + "epoch": 1.05, + "learning_rate": 1.5097528973048114e-06, + "loss": 0.6831, + "step": 40949 + }, + { + "epoch": 1.05, + "learning_rate": 1.5097290916409495e-06, + "loss": 0.7363, + "step": 40950 + }, + { + "epoch": 1.05, + "learning_rate": 1.5097052855868119e-06, + "loss": 0.6333, + "step": 40951 + }, + { + "epoch": 1.05, + "learning_rate": 1.5096814791424159e-06, + "loss": 0.4749, + "step": 40952 + }, + { + "epoch": 1.05, + "learning_rate": 1.5096576723077808e-06, + "loss": 0.6616, + "step": 40953 + }, + { + "epoch": 1.05, + "learning_rate": 1.509633865082924e-06, + "loss": 0.6309, + "step": 40954 + }, + { + "epoch": 1.05, + "learning_rate": 1.5096100574678636e-06, + "loss": 0.7285, + "step": 40955 + }, + { + "epoch": 1.05, + "learning_rate": 1.5095862494626188e-06, + "loss": 0.5886, + "step": 40956 + }, + { + "epoch": 1.05, + "learning_rate": 1.509562441067207e-06, + "loss": 0.8682, + "step": 40957 + }, + { + "epoch": 1.05, + "learning_rate": 1.5095386322816468e-06, + "loss": 0.6372, + "step": 40958 + }, + { + "epoch": 1.05, + "learning_rate": 1.509514823105956e-06, + "loss": 0.7188, + "step": 40959 + }, + { + "epoch": 1.05, + "learning_rate": 1.5094910135401536e-06, + "loss": 0.5601, + "step": 40960 + }, + { + "epoch": 1.05, + "learning_rate": 1.509467203584257e-06, + "loss": 0.7085, + "step": 40961 + }, + { + "epoch": 1.05, + "learning_rate": 1.5094433932382846e-06, + "loss": 0.7344, + "step": 40962 + }, + { + "epoch": 1.05, + "learning_rate": 1.5094195825022552e-06, + "loss": 0.5518, + "step": 40963 + }, + { + "epoch": 1.05, + "learning_rate": 1.5093957713761865e-06, + "loss": 0.8359, + "step": 40964 + }, + { + "epoch": 1.05, + "learning_rate": 1.5093719598600969e-06, + "loss": 0.627, + "step": 40965 + }, + { + "epoch": 1.05, + "learning_rate": 1.5093481479540047e-06, + "loss": 0.5254, + "step": 40966 + }, + { + "epoch": 1.05, + "learning_rate": 1.5093243356579277e-06, + "loss": 0.6274, + "step": 40967 + }, + { + "epoch": 1.05, + "learning_rate": 1.5093005229718848e-06, + "loss": 0.5671, + "step": 40968 + }, + { + "epoch": 1.05, + "learning_rate": 1.5092767098958938e-06, + "loss": 0.5879, + "step": 40969 + }, + { + "epoch": 1.05, + "learning_rate": 1.5092528964299733e-06, + "loss": 0.437, + "step": 40970 + }, + { + "epoch": 1.05, + "learning_rate": 1.5092290825741409e-06, + "loss": 0.7026, + "step": 40971 + }, + { + "epoch": 1.05, + "learning_rate": 1.5092052683284156e-06, + "loss": 0.613, + "step": 40972 + }, + { + "epoch": 1.05, + "learning_rate": 1.509181453692815e-06, + "loss": 0.7168, + "step": 40973 + }, + { + "epoch": 1.05, + "learning_rate": 1.5091576386673577e-06, + "loss": 0.4756, + "step": 40974 + }, + { + "epoch": 1.05, + "learning_rate": 1.5091338232520614e-06, + "loss": 0.6602, + "step": 40975 + }, + { + "epoch": 1.05, + "learning_rate": 1.5091100074469448e-06, + "loss": 0.709, + "step": 40976 + }, + { + "epoch": 1.05, + "learning_rate": 1.5090861912520265e-06, + "loss": 0.623, + "step": 40977 + }, + { + "epoch": 1.05, + "learning_rate": 1.509062374667324e-06, + "loss": 0.7412, + "step": 40978 + }, + { + "epoch": 1.05, + "learning_rate": 1.509038557692856e-06, + "loss": 0.7334, + "step": 40979 + }, + { + "epoch": 1.05, + "learning_rate": 1.5090147403286407e-06, + "loss": 0.6323, + "step": 40980 + }, + { + "epoch": 1.05, + "learning_rate": 1.508990922574696e-06, + "loss": 0.6504, + "step": 40981 + }, + { + "epoch": 1.05, + "learning_rate": 1.5089671044310404e-06, + "loss": 0.7188, + "step": 40982 + }, + { + "epoch": 1.05, + "learning_rate": 1.508943285897692e-06, + "loss": 0.5151, + "step": 40983 + }, + { + "epoch": 1.05, + "learning_rate": 1.5089194669746691e-06, + "loss": 0.4414, + "step": 40984 + }, + { + "epoch": 1.05, + "learning_rate": 1.5088956476619906e-06, + "loss": 0.5049, + "step": 40985 + }, + { + "epoch": 1.05, + "learning_rate": 1.5088718279596733e-06, + "loss": 0.3945, + "step": 40986 + }, + { + "epoch": 1.05, + "learning_rate": 1.5088480078677366e-06, + "loss": 0.6167, + "step": 40987 + }, + { + "epoch": 1.05, + "learning_rate": 1.5088241873861981e-06, + "loss": 0.6914, + "step": 40988 + }, + { + "epoch": 1.05, + "learning_rate": 1.5088003665150768e-06, + "loss": 0.426, + "step": 40989 + }, + { + "epoch": 1.05, + "learning_rate": 1.50877654525439e-06, + "loss": 0.7471, + "step": 40990 + }, + { + "epoch": 1.05, + "learning_rate": 1.5087527236041568e-06, + "loss": 0.6914, + "step": 40991 + }, + { + "epoch": 1.05, + "learning_rate": 1.5087289015643947e-06, + "loss": 0.4526, + "step": 40992 + }, + { + "epoch": 1.05, + "learning_rate": 1.5087050791351227e-06, + "loss": 0.7583, + "step": 40993 + }, + { + "epoch": 1.05, + "learning_rate": 1.508681256316358e-06, + "loss": 0.4849, + "step": 40994 + }, + { + "epoch": 1.05, + "learning_rate": 1.5086574331081199e-06, + "loss": 0.8027, + "step": 40995 + }, + { + "epoch": 1.05, + "learning_rate": 1.5086336095104258e-06, + "loss": 0.7261, + "step": 40996 + }, + { + "epoch": 1.05, + "learning_rate": 1.5086097855232947e-06, + "loss": 0.6133, + "step": 40997 + }, + { + "epoch": 1.05, + "learning_rate": 1.5085859611467445e-06, + "loss": 0.6973, + "step": 40998 + }, + { + "epoch": 1.05, + "learning_rate": 1.508562136380793e-06, + "loss": 0.6592, + "step": 40999 + }, + { + "epoch": 1.05, + "learning_rate": 1.5085383112254592e-06, + "loss": 0.7031, + "step": 41000 + }, + { + "epoch": 1.05, + "learning_rate": 1.508514485680761e-06, + "loss": 0.5732, + "step": 41001 + }, + { + "epoch": 1.05, + "learning_rate": 1.5084906597467164e-06, + "loss": 0.7803, + "step": 41002 + }, + { + "epoch": 1.05, + "learning_rate": 1.5084668334233442e-06, + "loss": 0.5349, + "step": 41003 + }, + { + "epoch": 1.05, + "learning_rate": 1.508443006710662e-06, + "loss": 0.7617, + "step": 41004 + }, + { + "epoch": 1.05, + "learning_rate": 1.5084191796086887e-06, + "loss": 0.5884, + "step": 41005 + }, + { + "epoch": 1.05, + "learning_rate": 1.5083953521174419e-06, + "loss": 0.6914, + "step": 41006 + }, + { + "epoch": 1.05, + "learning_rate": 1.5083715242369404e-06, + "loss": 0.665, + "step": 41007 + }, + { + "epoch": 1.05, + "learning_rate": 1.508347695967202e-06, + "loss": 0.8057, + "step": 41008 + }, + { + "epoch": 1.05, + "learning_rate": 1.5083238673082456e-06, + "loss": 0.7939, + "step": 41009 + }, + { + "epoch": 1.05, + "learning_rate": 1.5083000382600886e-06, + "loss": 0.8203, + "step": 41010 + }, + { + "epoch": 1.05, + "learning_rate": 1.5082762088227493e-06, + "loss": 0.8223, + "step": 41011 + }, + { + "epoch": 1.05, + "learning_rate": 1.508252378996247e-06, + "loss": 0.6567, + "step": 41012 + }, + { + "epoch": 1.05, + "learning_rate": 1.5082285487805985e-06, + "loss": 0.6528, + "step": 41013 + }, + { + "epoch": 1.05, + "learning_rate": 1.5082047181758233e-06, + "loss": 0.7461, + "step": 41014 + }, + { + "epoch": 1.05, + "learning_rate": 1.508180887181939e-06, + "loss": 0.6787, + "step": 41015 + }, + { + "epoch": 1.05, + "learning_rate": 1.5081570557989638e-06, + "loss": 0.6924, + "step": 41016 + }, + { + "epoch": 1.05, + "learning_rate": 1.508133224026916e-06, + "loss": 0.6035, + "step": 41017 + }, + { + "epoch": 1.05, + "learning_rate": 1.5081093918658145e-06, + "loss": 0.6855, + "step": 41018 + }, + { + "epoch": 1.05, + "learning_rate": 1.5080855593156767e-06, + "loss": 0.667, + "step": 41019 + }, + { + "epoch": 1.05, + "learning_rate": 1.5080617263765213e-06, + "loss": 0.6904, + "step": 41020 + }, + { + "epoch": 1.05, + "learning_rate": 1.508037893048366e-06, + "loss": 0.6279, + "step": 41021 + }, + { + "epoch": 1.05, + "learning_rate": 1.5080140593312298e-06, + "loss": 0.7021, + "step": 41022 + }, + { + "epoch": 1.05, + "learning_rate": 1.5079902252251304e-06, + "loss": 0.7041, + "step": 41023 + }, + { + "epoch": 1.05, + "learning_rate": 1.5079663907300861e-06, + "loss": 0.7202, + "step": 41024 + }, + { + "epoch": 1.05, + "learning_rate": 1.5079425558461157e-06, + "loss": 0.5457, + "step": 41025 + }, + { + "epoch": 1.05, + "learning_rate": 1.5079187205732367e-06, + "loss": 0.6621, + "step": 41026 + }, + { + "epoch": 1.05, + "learning_rate": 1.5078948849114679e-06, + "loss": 0.601, + "step": 41027 + }, + { + "epoch": 1.05, + "learning_rate": 1.5078710488608273e-06, + "loss": 0.5752, + "step": 41028 + }, + { + "epoch": 1.05, + "learning_rate": 1.5078472124213332e-06, + "loss": 0.8096, + "step": 41029 + }, + { + "epoch": 1.05, + "learning_rate": 1.5078233755930037e-06, + "loss": 0.6265, + "step": 41030 + }, + { + "epoch": 1.05, + "learning_rate": 1.5077995383758575e-06, + "loss": 0.5765, + "step": 41031 + }, + { + "epoch": 1.05, + "learning_rate": 1.5077757007699118e-06, + "loss": 0.6812, + "step": 41032 + }, + { + "epoch": 1.05, + "learning_rate": 1.5077518627751866e-06, + "loss": 0.6875, + "step": 41033 + }, + { + "epoch": 1.05, + "learning_rate": 1.5077280243916985e-06, + "loss": 0.5818, + "step": 41034 + }, + { + "epoch": 1.05, + "learning_rate": 1.5077041856194668e-06, + "loss": 0.6365, + "step": 41035 + }, + { + "epoch": 1.05, + "learning_rate": 1.5076803464585091e-06, + "loss": 0.6299, + "step": 41036 + }, + { + "epoch": 1.05, + "learning_rate": 1.5076565069088439e-06, + "loss": 0.5894, + "step": 41037 + }, + { + "epoch": 1.05, + "learning_rate": 1.5076326669704896e-06, + "loss": 0.5615, + "step": 41038 + }, + { + "epoch": 1.05, + "learning_rate": 1.507608826643464e-06, + "loss": 0.6113, + "step": 41039 + }, + { + "epoch": 1.05, + "learning_rate": 1.507584985927786e-06, + "loss": 0.8296, + "step": 41040 + }, + { + "epoch": 1.05, + "learning_rate": 1.5075611448234732e-06, + "loss": 0.7061, + "step": 41041 + }, + { + "epoch": 1.05, + "learning_rate": 1.5075373033305443e-06, + "loss": 0.7676, + "step": 41042 + }, + { + "epoch": 1.05, + "learning_rate": 1.5075134614490174e-06, + "loss": 0.6885, + "step": 41043 + }, + { + "epoch": 1.05, + "learning_rate": 1.5074896191789108e-06, + "loss": 0.9189, + "step": 41044 + }, + { + "epoch": 1.05, + "learning_rate": 1.5074657765202429e-06, + "loss": 0.5974, + "step": 41045 + }, + { + "epoch": 1.05, + "learning_rate": 1.5074419334730318e-06, + "loss": 0.8115, + "step": 41046 + }, + { + "epoch": 1.05, + "learning_rate": 1.5074180900372954e-06, + "loss": 0.5282, + "step": 41047 + }, + { + "epoch": 1.05, + "learning_rate": 1.5073942462130528e-06, + "loss": 0.7754, + "step": 41048 + }, + { + "epoch": 1.05, + "learning_rate": 1.5073704020003212e-06, + "loss": 0.6499, + "step": 41049 + }, + { + "epoch": 1.05, + "learning_rate": 1.5073465573991198e-06, + "loss": 0.7393, + "step": 41050 + }, + { + "epoch": 1.05, + "learning_rate": 1.5073227124094663e-06, + "loss": 0.7319, + "step": 41051 + }, + { + "epoch": 1.05, + "learning_rate": 1.5072988670313792e-06, + "loss": 0.5659, + "step": 41052 + }, + { + "epoch": 1.05, + "learning_rate": 1.5072750212648766e-06, + "loss": 0.5674, + "step": 41053 + }, + { + "epoch": 1.05, + "learning_rate": 1.507251175109977e-06, + "loss": 0.5842, + "step": 41054 + }, + { + "epoch": 1.05, + "learning_rate": 1.507227328566698e-06, + "loss": 0.5361, + "step": 41055 + }, + { + "epoch": 1.05, + "learning_rate": 1.507203481635059e-06, + "loss": 0.613, + "step": 41056 + }, + { + "epoch": 1.05, + "learning_rate": 1.5071796343150774e-06, + "loss": 0.7017, + "step": 41057 + }, + { + "epoch": 1.05, + "learning_rate": 1.5071557866067717e-06, + "loss": 0.344, + "step": 41058 + }, + { + "epoch": 1.05, + "learning_rate": 1.5071319385101599e-06, + "loss": 0.5216, + "step": 41059 + }, + { + "epoch": 1.05, + "learning_rate": 1.507108090025261e-06, + "loss": 0.7227, + "step": 41060 + }, + { + "epoch": 1.05, + "learning_rate": 1.5070842411520922e-06, + "loss": 0.6914, + "step": 41061 + }, + { + "epoch": 1.05, + "learning_rate": 1.5070603918906727e-06, + "loss": 0.7686, + "step": 41062 + }, + { + "epoch": 1.05, + "learning_rate": 1.5070365422410202e-06, + "loss": 0.8623, + "step": 41063 + }, + { + "epoch": 1.05, + "learning_rate": 1.5070126922031532e-06, + "loss": 0.7178, + "step": 41064 + }, + { + "epoch": 1.05, + "learning_rate": 1.5069888417770898e-06, + "loss": 0.7744, + "step": 41065 + }, + { + "epoch": 1.05, + "learning_rate": 1.5069649909628484e-06, + "loss": 0.7402, + "step": 41066 + }, + { + "epoch": 1.05, + "learning_rate": 1.506941139760447e-06, + "loss": 0.6787, + "step": 41067 + }, + { + "epoch": 1.05, + "learning_rate": 1.5069172881699044e-06, + "loss": 0.7744, + "step": 41068 + }, + { + "epoch": 1.05, + "learning_rate": 1.5068934361912385e-06, + "loss": 0.7178, + "step": 41069 + }, + { + "epoch": 1.05, + "learning_rate": 1.5068695838244674e-06, + "loss": 0.5957, + "step": 41070 + }, + { + "epoch": 1.05, + "learning_rate": 1.50684573106961e-06, + "loss": 0.5835, + "step": 41071 + }, + { + "epoch": 1.05, + "learning_rate": 1.5068218779266834e-06, + "loss": 0.6294, + "step": 41072 + }, + { + "epoch": 1.05, + "learning_rate": 1.5067980243957075e-06, + "loss": 0.5151, + "step": 41073 + }, + { + "epoch": 1.05, + "learning_rate": 1.506774170476699e-06, + "loss": 0.6719, + "step": 41074 + }, + { + "epoch": 1.05, + "learning_rate": 1.506750316169677e-06, + "loss": 0.6025, + "step": 41075 + }, + { + "epoch": 1.05, + "learning_rate": 1.5067264614746593e-06, + "loss": 0.6689, + "step": 41076 + }, + { + "epoch": 1.05, + "learning_rate": 1.5067026063916651e-06, + "loss": 0.5641, + "step": 41077 + }, + { + "epoch": 1.05, + "learning_rate": 1.5066787509207116e-06, + "loss": 0.7139, + "step": 41078 + }, + { + "epoch": 1.05, + "learning_rate": 1.5066548950618174e-06, + "loss": 0.6836, + "step": 41079 + }, + { + "epoch": 1.05, + "learning_rate": 1.506631038815001e-06, + "loss": 0.6929, + "step": 41080 + }, + { + "epoch": 1.05, + "learning_rate": 1.5066071821802803e-06, + "loss": 0.791, + "step": 41081 + }, + { + "epoch": 1.05, + "learning_rate": 1.506583325157674e-06, + "loss": 0.5227, + "step": 41082 + }, + { + "epoch": 1.05, + "learning_rate": 1.5065594677472003e-06, + "loss": 0.5596, + "step": 41083 + }, + { + "epoch": 1.05, + "learning_rate": 1.506535609948877e-06, + "loss": 0.6992, + "step": 41084 + }, + { + "epoch": 1.05, + "learning_rate": 1.5065117517627227e-06, + "loss": 0.7266, + "step": 41085 + }, + { + "epoch": 1.05, + "learning_rate": 1.5064878931887557e-06, + "loss": 0.6738, + "step": 41086 + }, + { + "epoch": 1.05, + "learning_rate": 1.5064640342269943e-06, + "loss": 0.6514, + "step": 41087 + }, + { + "epoch": 1.05, + "learning_rate": 1.5064401748774566e-06, + "loss": 0.7661, + "step": 41088 + }, + { + "epoch": 1.05, + "learning_rate": 1.5064163151401608e-06, + "loss": 0.5529, + "step": 41089 + }, + { + "epoch": 1.05, + "learning_rate": 1.5063924550151254e-06, + "loss": 0.6592, + "step": 41090 + }, + { + "epoch": 1.05, + "learning_rate": 1.5063685945023688e-06, + "loss": 0.7432, + "step": 41091 + }, + { + "epoch": 1.05, + "learning_rate": 1.5063447336019089e-06, + "loss": 0.397, + "step": 41092 + }, + { + "epoch": 1.05, + "learning_rate": 1.506320872313764e-06, + "loss": 0.749, + "step": 41093 + }, + { + "epoch": 1.05, + "learning_rate": 1.5062970106379526e-06, + "loss": 0.6235, + "step": 41094 + }, + { + "epoch": 1.05, + "learning_rate": 1.5062731485744928e-06, + "loss": 0.5415, + "step": 41095 + }, + { + "epoch": 1.05, + "learning_rate": 1.506249286123403e-06, + "loss": 0.7402, + "step": 41096 + }, + { + "epoch": 1.05, + "learning_rate": 1.5062254232847016e-06, + "loss": 0.5063, + "step": 41097 + }, + { + "epoch": 1.05, + "learning_rate": 1.5062015600584065e-06, + "loss": 0.5596, + "step": 41098 + }, + { + "epoch": 1.05, + "learning_rate": 1.506177696444536e-06, + "loss": 0.4576, + "step": 41099 + }, + { + "epoch": 1.05, + "learning_rate": 1.5061538324431087e-06, + "loss": 0.7334, + "step": 41100 + }, + { + "epoch": 1.05, + "learning_rate": 1.5061299680541427e-06, + "loss": 0.4922, + "step": 41101 + }, + { + "epoch": 1.05, + "learning_rate": 1.506106103277656e-06, + "loss": 0.6636, + "step": 41102 + }, + { + "epoch": 1.05, + "learning_rate": 1.5060822381136674e-06, + "loss": 0.6533, + "step": 41103 + }, + { + "epoch": 1.05, + "learning_rate": 1.5060583725621947e-06, + "loss": 0.6541, + "step": 41104 + }, + { + "epoch": 1.05, + "learning_rate": 1.5060345066232562e-06, + "loss": 0.5908, + "step": 41105 + }, + { + "epoch": 1.05, + "learning_rate": 1.5060106402968708e-06, + "loss": 0.6211, + "step": 41106 + }, + { + "epoch": 1.05, + "learning_rate": 1.505986773583056e-06, + "loss": 0.6226, + "step": 41107 + }, + { + "epoch": 1.05, + "learning_rate": 1.5059629064818306e-06, + "loss": 0.583, + "step": 41108 + }, + { + "epoch": 1.05, + "learning_rate": 1.5059390389932126e-06, + "loss": 0.7959, + "step": 41109 + }, + { + "epoch": 1.05, + "learning_rate": 1.5059151711172204e-06, + "loss": 0.5872, + "step": 41110 + }, + { + "epoch": 1.05, + "learning_rate": 1.5058913028538722e-06, + "loss": 0.4971, + "step": 41111 + }, + { + "epoch": 1.05, + "learning_rate": 1.5058674342031861e-06, + "loss": 0.7251, + "step": 41112 + }, + { + "epoch": 1.05, + "learning_rate": 1.5058435651651807e-06, + "loss": 0.6055, + "step": 41113 + }, + { + "epoch": 1.05, + "learning_rate": 1.5058196957398742e-06, + "loss": 0.7344, + "step": 41114 + }, + { + "epoch": 1.05, + "learning_rate": 1.5057958259272847e-06, + "loss": 0.6372, + "step": 41115 + }, + { + "epoch": 1.05, + "learning_rate": 1.5057719557274307e-06, + "loss": 0.7246, + "step": 41116 + }, + { + "epoch": 1.05, + "learning_rate": 1.5057480851403304e-06, + "loss": 0.7324, + "step": 41117 + }, + { + "epoch": 1.05, + "learning_rate": 1.5057242141660017e-06, + "loss": 0.4961, + "step": 41118 + }, + { + "epoch": 1.05, + "learning_rate": 1.5057003428044636e-06, + "loss": 0.6113, + "step": 41119 + }, + { + "epoch": 1.05, + "learning_rate": 1.5056764710557336e-06, + "loss": 0.6631, + "step": 41120 + }, + { + "epoch": 1.05, + "learning_rate": 1.505652598919831e-06, + "loss": 0.7827, + "step": 41121 + }, + { + "epoch": 1.05, + "learning_rate": 1.5056287263967732e-06, + "loss": 0.4956, + "step": 41122 + }, + { + "epoch": 1.05, + "learning_rate": 1.5056048534865787e-06, + "loss": 0.5742, + "step": 41123 + }, + { + "epoch": 1.05, + "learning_rate": 1.5055809801892656e-06, + "loss": 0.4404, + "step": 41124 + }, + { + "epoch": 1.05, + "learning_rate": 1.5055571065048527e-06, + "loss": 0.7598, + "step": 41125 + }, + { + "epoch": 1.05, + "learning_rate": 1.5055332324333576e-06, + "loss": 0.5356, + "step": 41126 + }, + { + "epoch": 1.05, + "learning_rate": 1.5055093579747994e-06, + "loss": 0.6729, + "step": 41127 + }, + { + "epoch": 1.05, + "learning_rate": 1.5054854831291956e-06, + "loss": 0.7168, + "step": 41128 + }, + { + "epoch": 1.05, + "learning_rate": 1.5054616078965649e-06, + "loss": 0.8115, + "step": 41129 + }, + { + "epoch": 1.05, + "learning_rate": 1.5054377322769254e-06, + "loss": 0.6992, + "step": 41130 + }, + { + "epoch": 1.05, + "learning_rate": 1.5054138562702957e-06, + "loss": 0.7529, + "step": 41131 + }, + { + "epoch": 1.05, + "learning_rate": 1.5053899798766935e-06, + "loss": 0.6138, + "step": 41132 + }, + { + "epoch": 1.05, + "learning_rate": 1.5053661030961378e-06, + "loss": 0.875, + "step": 41133 + }, + { + "epoch": 1.05, + "learning_rate": 1.5053422259286467e-06, + "loss": 0.5342, + "step": 41134 + }, + { + "epoch": 1.05, + "learning_rate": 1.5053183483742374e-06, + "loss": 0.7412, + "step": 41135 + }, + { + "epoch": 1.05, + "learning_rate": 1.50529447043293e-06, + "loss": 0.5659, + "step": 41136 + }, + { + "epoch": 1.05, + "learning_rate": 1.5052705921047414e-06, + "loss": 0.7783, + "step": 41137 + }, + { + "epoch": 1.05, + "learning_rate": 1.5052467133896904e-06, + "loss": 0.6328, + "step": 41138 + }, + { + "epoch": 1.05, + "learning_rate": 1.5052228342877954e-06, + "loss": 0.6709, + "step": 41139 + }, + { + "epoch": 1.05, + "learning_rate": 1.5051989547990742e-06, + "loss": 0.7178, + "step": 41140 + }, + { + "epoch": 1.05, + "learning_rate": 1.5051750749235454e-06, + "loss": 0.4744, + "step": 41141 + }, + { + "epoch": 1.05, + "learning_rate": 1.5051511946612276e-06, + "loss": 0.6133, + "step": 41142 + }, + { + "epoch": 1.05, + "learning_rate": 1.5051273140121388e-06, + "loss": 0.5653, + "step": 41143 + }, + { + "epoch": 1.05, + "learning_rate": 1.5051034329762971e-06, + "loss": 0.6482, + "step": 41144 + }, + { + "epoch": 1.05, + "learning_rate": 1.5050795515537205e-06, + "loss": 0.6748, + "step": 41145 + }, + { + "epoch": 1.05, + "learning_rate": 1.505055669744428e-06, + "loss": 0.623, + "step": 41146 + }, + { + "epoch": 1.05, + "learning_rate": 1.5050317875484377e-06, + "loss": 0.8301, + "step": 41147 + }, + { + "epoch": 1.05, + "learning_rate": 1.505007904965768e-06, + "loss": 0.4917, + "step": 41148 + }, + { + "epoch": 1.05, + "learning_rate": 1.5049840219964366e-06, + "loss": 0.6416, + "step": 41149 + }, + { + "epoch": 1.05, + "learning_rate": 1.5049601386404622e-06, + "loss": 0.7949, + "step": 41150 + }, + { + "epoch": 1.05, + "learning_rate": 1.504936254897863e-06, + "loss": 0.6855, + "step": 41151 + }, + { + "epoch": 1.05, + "learning_rate": 1.5049123707686576e-06, + "loss": 0.6709, + "step": 41152 + }, + { + "epoch": 1.05, + "learning_rate": 1.5048884862528638e-06, + "loss": 0.7217, + "step": 41153 + }, + { + "epoch": 1.05, + "learning_rate": 1.5048646013505003e-06, + "loss": 0.6562, + "step": 41154 + }, + { + "epoch": 1.05, + "learning_rate": 1.5048407160615849e-06, + "loss": 0.75, + "step": 41155 + }, + { + "epoch": 1.05, + "learning_rate": 1.5048168303861363e-06, + "loss": 0.5427, + "step": 41156 + }, + { + "epoch": 1.05, + "learning_rate": 1.5047929443241726e-06, + "loss": 0.6992, + "step": 41157 + }, + { + "epoch": 1.05, + "learning_rate": 1.5047690578757123e-06, + "loss": 0.9092, + "step": 41158 + }, + { + "epoch": 1.05, + "learning_rate": 1.5047451710407734e-06, + "loss": 0.6426, + "step": 41159 + }, + { + "epoch": 1.05, + "learning_rate": 1.5047212838193743e-06, + "loss": 0.7197, + "step": 41160 + }, + { + "epoch": 1.05, + "learning_rate": 1.5046973962115334e-06, + "loss": 0.6943, + "step": 41161 + }, + { + "epoch": 1.06, + "learning_rate": 1.504673508217269e-06, + "loss": 0.7139, + "step": 41162 + }, + { + "epoch": 1.06, + "learning_rate": 1.5046496198365995e-06, + "loss": 0.5835, + "step": 41163 + }, + { + "epoch": 1.06, + "learning_rate": 1.5046257310695425e-06, + "loss": 0.6274, + "step": 41164 + }, + { + "epoch": 1.06, + "learning_rate": 1.5046018419161173e-06, + "loss": 0.6758, + "step": 41165 + }, + { + "epoch": 1.06, + "learning_rate": 1.5045779523763412e-06, + "loss": 0.7734, + "step": 41166 + }, + { + "epoch": 1.06, + "learning_rate": 1.5045540624502331e-06, + "loss": 0.6982, + "step": 41167 + }, + { + "epoch": 1.06, + "learning_rate": 1.5045301721378113e-06, + "loss": 0.7363, + "step": 41168 + }, + { + "epoch": 1.06, + "learning_rate": 1.5045062814390938e-06, + "loss": 0.6807, + "step": 41169 + }, + { + "epoch": 1.06, + "learning_rate": 1.504482390354099e-06, + "loss": 0.6348, + "step": 41170 + }, + { + "epoch": 1.06, + "learning_rate": 1.5044584988828453e-06, + "loss": 0.5718, + "step": 41171 + }, + { + "epoch": 1.06, + "learning_rate": 1.5044346070253509e-06, + "loss": 0.6914, + "step": 41172 + }, + { + "epoch": 1.06, + "learning_rate": 1.5044107147816342e-06, + "loss": 0.5442, + "step": 41173 + }, + { + "epoch": 1.06, + "learning_rate": 1.5043868221517136e-06, + "loss": 0.6724, + "step": 41174 + }, + { + "epoch": 1.06, + "learning_rate": 1.5043629291356068e-06, + "loss": 0.7373, + "step": 41175 + }, + { + "epoch": 1.06, + "learning_rate": 1.5043390357333325e-06, + "loss": 0.6865, + "step": 41176 + }, + { + "epoch": 1.06, + "learning_rate": 1.5043151419449092e-06, + "loss": 0.583, + "step": 41177 + }, + { + "epoch": 1.06, + "learning_rate": 1.5042912477703551e-06, + "loss": 0.7676, + "step": 41178 + }, + { + "epoch": 1.06, + "learning_rate": 1.504267353209688e-06, + "loss": 0.4966, + "step": 41179 + }, + { + "epoch": 1.06, + "learning_rate": 1.5042434582629269e-06, + "loss": 0.77, + "step": 41180 + }, + { + "epoch": 1.06, + "learning_rate": 1.5042195629300898e-06, + "loss": 0.5913, + "step": 41181 + }, + { + "epoch": 1.06, + "learning_rate": 1.5041956672111945e-06, + "loss": 0.668, + "step": 41182 + }, + { + "epoch": 1.06, + "learning_rate": 1.5041717711062602e-06, + "loss": 0.6387, + "step": 41183 + }, + { + "epoch": 1.06, + "learning_rate": 1.5041478746153046e-06, + "loss": 0.7275, + "step": 41184 + }, + { + "epoch": 1.06, + "learning_rate": 1.504123977738346e-06, + "loss": 0.4414, + "step": 41185 + }, + { + "epoch": 1.06, + "learning_rate": 1.5041000804754034e-06, + "loss": 0.5537, + "step": 41186 + }, + { + "epoch": 1.06, + "learning_rate": 1.504076182826494e-06, + "loss": 0.6816, + "step": 41187 + }, + { + "epoch": 1.06, + "learning_rate": 1.504052284791637e-06, + "loss": 0.7139, + "step": 41188 + }, + { + "epoch": 1.06, + "learning_rate": 1.5040283863708503e-06, + "loss": 0.562, + "step": 41189 + }, + { + "epoch": 1.06, + "learning_rate": 1.5040044875641519e-06, + "loss": 0.6792, + "step": 41190 + }, + { + "epoch": 1.06, + "learning_rate": 1.5039805883715605e-06, + "loss": 0.6069, + "step": 41191 + }, + { + "epoch": 1.06, + "learning_rate": 1.5039566887930947e-06, + "loss": 0.6992, + "step": 41192 + }, + { + "epoch": 1.06, + "learning_rate": 1.5039327888287722e-06, + "loss": 0.6738, + "step": 41193 + }, + { + "epoch": 1.06, + "learning_rate": 1.5039088884786117e-06, + "loss": 0.5554, + "step": 41194 + }, + { + "epoch": 1.06, + "learning_rate": 1.5038849877426312e-06, + "loss": 0.6074, + "step": 41195 + }, + { + "epoch": 1.06, + "learning_rate": 1.5038610866208493e-06, + "loss": 0.624, + "step": 41196 + }, + { + "epoch": 1.06, + "learning_rate": 1.5038371851132837e-06, + "loss": 0.6572, + "step": 41197 + }, + { + "epoch": 1.06, + "learning_rate": 1.5038132832199536e-06, + "loss": 0.7598, + "step": 41198 + }, + { + "epoch": 1.06, + "learning_rate": 1.5037893809408763e-06, + "loss": 0.7549, + "step": 41199 + }, + { + "epoch": 1.06, + "learning_rate": 1.5037654782760712e-06, + "loss": 0.6069, + "step": 41200 + }, + { + "epoch": 1.06, + "learning_rate": 1.5037415752255558e-06, + "loss": 0.5508, + "step": 41201 + }, + { + "epoch": 1.06, + "learning_rate": 1.5037176717893485e-06, + "loss": 0.6436, + "step": 41202 + }, + { + "epoch": 1.06, + "learning_rate": 1.5036937679674682e-06, + "loss": 0.459, + "step": 41203 + }, + { + "epoch": 1.06, + "learning_rate": 1.5036698637599323e-06, + "loss": 0.748, + "step": 41204 + }, + { + "epoch": 1.06, + "learning_rate": 1.5036459591667597e-06, + "loss": 0.603, + "step": 41205 + }, + { + "epoch": 1.06, + "learning_rate": 1.5036220541879683e-06, + "loss": 0.7891, + "step": 41206 + }, + { + "epoch": 1.06, + "learning_rate": 1.5035981488235769e-06, + "loss": 0.6174, + "step": 41207 + }, + { + "epoch": 1.06, + "learning_rate": 1.5035742430736037e-06, + "loss": 0.6646, + "step": 41208 + }, + { + "epoch": 1.06, + "learning_rate": 1.503550336938067e-06, + "loss": 0.8125, + "step": 41209 + }, + { + "epoch": 1.06, + "learning_rate": 1.5035264304169842e-06, + "loss": 0.6533, + "step": 41210 + }, + { + "epoch": 1.06, + "learning_rate": 1.5035025235103749e-06, + "loss": 0.6313, + "step": 41211 + }, + { + "epoch": 1.06, + "learning_rate": 1.503478616218257e-06, + "loss": 0.6875, + "step": 41212 + }, + { + "epoch": 1.06, + "learning_rate": 1.5034547085406483e-06, + "loss": 0.7607, + "step": 41213 + }, + { + "epoch": 1.06, + "learning_rate": 1.5034308004775676e-06, + "loss": 0.752, + "step": 41214 + }, + { + "epoch": 1.06, + "learning_rate": 1.5034068920290332e-06, + "loss": 0.5107, + "step": 41215 + }, + { + "epoch": 1.06, + "learning_rate": 1.503382983195063e-06, + "loss": 0.5435, + "step": 41216 + }, + { + "epoch": 1.06, + "learning_rate": 1.503359073975676e-06, + "loss": 0.6284, + "step": 41217 + }, + { + "epoch": 1.06, + "learning_rate": 1.50333516437089e-06, + "loss": 0.6455, + "step": 41218 + }, + { + "epoch": 1.06, + "learning_rate": 1.5033112543807231e-06, + "loss": 0.7295, + "step": 41219 + }, + { + "epoch": 1.06, + "learning_rate": 1.5032873440051943e-06, + "loss": 0.5996, + "step": 41220 + }, + { + "epoch": 1.06, + "learning_rate": 1.5032634332443212e-06, + "loss": 0.7402, + "step": 41221 + }, + { + "epoch": 1.06, + "learning_rate": 1.5032395220981227e-06, + "loss": 0.6685, + "step": 41222 + }, + { + "epoch": 1.06, + "learning_rate": 1.5032156105666167e-06, + "loss": 0.5669, + "step": 41223 + }, + { + "epoch": 1.06, + "learning_rate": 1.5031916986498217e-06, + "loss": 0.6196, + "step": 41224 + }, + { + "epoch": 1.06, + "learning_rate": 1.5031677863477556e-06, + "loss": 0.5254, + "step": 41225 + }, + { + "epoch": 1.06, + "learning_rate": 1.5031438736604376e-06, + "loss": 0.8623, + "step": 41226 + }, + { + "epoch": 1.06, + "learning_rate": 1.5031199605878852e-06, + "loss": 0.6689, + "step": 41227 + }, + { + "epoch": 1.06, + "learning_rate": 1.5030960471301172e-06, + "loss": 0.7119, + "step": 41228 + }, + { + "epoch": 1.06, + "learning_rate": 1.5030721332871515e-06, + "loss": 0.5323, + "step": 41229 + }, + { + "epoch": 1.06, + "learning_rate": 1.5030482190590066e-06, + "loss": 0.7119, + "step": 41230 + }, + { + "epoch": 1.06, + "learning_rate": 1.5030243044457008e-06, + "loss": 0.7725, + "step": 41231 + }, + { + "epoch": 1.06, + "learning_rate": 1.5030003894472528e-06, + "loss": 0.6846, + "step": 41232 + }, + { + "epoch": 1.06, + "learning_rate": 1.50297647406368e-06, + "loss": 0.8213, + "step": 41233 + }, + { + "epoch": 1.06, + "learning_rate": 1.5029525582950014e-06, + "loss": 0.5723, + "step": 41234 + }, + { + "epoch": 1.06, + "learning_rate": 1.502928642141235e-06, + "loss": 0.7178, + "step": 41235 + }, + { + "epoch": 1.06, + "learning_rate": 1.5029047256023994e-06, + "loss": 0.5952, + "step": 41236 + }, + { + "epoch": 1.06, + "learning_rate": 1.5028808086785129e-06, + "loss": 0.7764, + "step": 41237 + }, + { + "epoch": 1.06, + "learning_rate": 1.5028568913695936e-06, + "loss": 0.7119, + "step": 41238 + }, + { + "epoch": 1.06, + "learning_rate": 1.5028329736756597e-06, + "loss": 0.6299, + "step": 41239 + }, + { + "epoch": 1.06, + "learning_rate": 1.5028090555967302e-06, + "loss": 0.6201, + "step": 41240 + }, + { + "epoch": 1.06, + "learning_rate": 1.5027851371328226e-06, + "loss": 0.5515, + "step": 41241 + }, + { + "epoch": 1.06, + "learning_rate": 1.5027612182839555e-06, + "loss": 0.5957, + "step": 41242 + }, + { + "epoch": 1.06, + "learning_rate": 1.5027372990501474e-06, + "loss": 0.6748, + "step": 41243 + }, + { + "epoch": 1.06, + "learning_rate": 1.5027133794314165e-06, + "loss": 0.6309, + "step": 41244 + }, + { + "epoch": 1.06, + "learning_rate": 1.5026894594277809e-06, + "loss": 0.5625, + "step": 41245 + }, + { + "epoch": 1.06, + "learning_rate": 1.5026655390392592e-06, + "loss": 0.7441, + "step": 41246 + }, + { + "epoch": 1.06, + "learning_rate": 1.5026416182658697e-06, + "loss": 0.6948, + "step": 41247 + }, + { + "epoch": 1.06, + "learning_rate": 1.5026176971076303e-06, + "loss": 0.7061, + "step": 41248 + }, + { + "epoch": 1.06, + "learning_rate": 1.50259377556456e-06, + "loss": 0.7627, + "step": 41249 + }, + { + "epoch": 1.06, + "learning_rate": 1.5025698536366764e-06, + "loss": 0.749, + "step": 41250 + }, + { + "epoch": 1.06, + "learning_rate": 1.5025459313239982e-06, + "loss": 0.6504, + "step": 41251 + }, + { + "epoch": 1.06, + "learning_rate": 1.5025220086265441e-06, + "loss": 0.5811, + "step": 41252 + }, + { + "epoch": 1.06, + "learning_rate": 1.502498085544332e-06, + "loss": 0.6221, + "step": 41253 + }, + { + "epoch": 1.06, + "learning_rate": 1.5024741620773797e-06, + "loss": 0.708, + "step": 41254 + }, + { + "epoch": 1.06, + "learning_rate": 1.5024502382257065e-06, + "loss": 0.605, + "step": 41255 + }, + { + "epoch": 1.06, + "learning_rate": 1.5024263139893299e-06, + "loss": 0.6211, + "step": 41256 + }, + { + "epoch": 1.06, + "learning_rate": 1.502402389368269e-06, + "loss": 0.6792, + "step": 41257 + }, + { + "epoch": 1.06, + "learning_rate": 1.5023784643625413e-06, + "loss": 0.6108, + "step": 41258 + }, + { + "epoch": 1.06, + "learning_rate": 1.5023545389721658e-06, + "loss": 0.5796, + "step": 41259 + }, + { + "epoch": 1.06, + "learning_rate": 1.5023306131971602e-06, + "loss": 0.7656, + "step": 41260 + }, + { + "epoch": 1.06, + "learning_rate": 1.5023066870375437e-06, + "loss": 0.7334, + "step": 41261 + }, + { + "epoch": 1.06, + "learning_rate": 1.5022827604933335e-06, + "loss": 0.5796, + "step": 41262 + }, + { + "epoch": 1.06, + "learning_rate": 1.5022588335645488e-06, + "loss": 0.7134, + "step": 41263 + }, + { + "epoch": 1.06, + "learning_rate": 1.5022349062512075e-06, + "loss": 0.7969, + "step": 41264 + }, + { + "epoch": 1.06, + "learning_rate": 1.5022109785533279e-06, + "loss": 0.6436, + "step": 41265 + }, + { + "epoch": 1.06, + "learning_rate": 1.5021870504709283e-06, + "loss": 0.7969, + "step": 41266 + }, + { + "epoch": 1.06, + "learning_rate": 1.5021631220040277e-06, + "loss": 0.5903, + "step": 41267 + }, + { + "epoch": 1.06, + "learning_rate": 1.5021391931526438e-06, + "loss": 0.5469, + "step": 41268 + }, + { + "epoch": 1.06, + "learning_rate": 1.5021152639167943e-06, + "loss": 0.7568, + "step": 41269 + }, + { + "epoch": 1.06, + "learning_rate": 1.502091334296499e-06, + "loss": 0.6758, + "step": 41270 + }, + { + "epoch": 1.06, + "learning_rate": 1.5020674042917754e-06, + "loss": 0.6689, + "step": 41271 + }, + { + "epoch": 1.06, + "learning_rate": 1.5020434739026417e-06, + "loss": 0.835, + "step": 41272 + }, + { + "epoch": 1.06, + "learning_rate": 1.5020195431291162e-06, + "loss": 0.6128, + "step": 41273 + }, + { + "epoch": 1.06, + "learning_rate": 1.5019956119712175e-06, + "loss": 0.4376, + "step": 41274 + }, + { + "epoch": 1.06, + "learning_rate": 1.501971680428964e-06, + "loss": 0.6807, + "step": 41275 + }, + { + "epoch": 1.06, + "learning_rate": 1.501947748502374e-06, + "loss": 0.7158, + "step": 41276 + }, + { + "epoch": 1.06, + "learning_rate": 1.5019238161914656e-06, + "loss": 0.4878, + "step": 41277 + }, + { + "epoch": 1.06, + "learning_rate": 1.501899883496257e-06, + "loss": 0.6108, + "step": 41278 + }, + { + "epoch": 1.06, + "learning_rate": 1.5018759504167667e-06, + "loss": 0.6221, + "step": 41279 + }, + { + "epoch": 1.06, + "learning_rate": 1.5018520169530133e-06, + "loss": 0.7578, + "step": 41280 + }, + { + "epoch": 1.06, + "learning_rate": 1.5018280831050148e-06, + "loss": 0.7949, + "step": 41281 + }, + { + "epoch": 1.06, + "learning_rate": 1.50180414887279e-06, + "loss": 0.6133, + "step": 41282 + }, + { + "epoch": 1.06, + "learning_rate": 1.5017802142563562e-06, + "loss": 0.7227, + "step": 41283 + }, + { + "epoch": 1.06, + "learning_rate": 1.5017562792557327e-06, + "loss": 0.7012, + "step": 41284 + }, + { + "epoch": 1.06, + "learning_rate": 1.5017323438709371e-06, + "loss": 0.7227, + "step": 41285 + }, + { + "epoch": 1.06, + "learning_rate": 1.5017084081019884e-06, + "loss": 0.6523, + "step": 41286 + }, + { + "epoch": 1.06, + "learning_rate": 1.5016844719489048e-06, + "loss": 0.7334, + "step": 41287 + }, + { + "epoch": 1.06, + "learning_rate": 1.5016605354117044e-06, + "loss": 0.7881, + "step": 41288 + }, + { + "epoch": 1.06, + "learning_rate": 1.5016365984904053e-06, + "loss": 0.8613, + "step": 41289 + }, + { + "epoch": 1.06, + "learning_rate": 1.5016126611850263e-06, + "loss": 0.6885, + "step": 41290 + }, + { + "epoch": 1.06, + "learning_rate": 1.5015887234955854e-06, + "loss": 0.7578, + "step": 41291 + }, + { + "epoch": 1.06, + "learning_rate": 1.5015647854221017e-06, + "loss": 0.5039, + "step": 41292 + }, + { + "epoch": 1.06, + "learning_rate": 1.5015408469645925e-06, + "loss": 0.3525, + "step": 41293 + }, + { + "epoch": 1.06, + "learning_rate": 1.5015169081230763e-06, + "loss": 0.8584, + "step": 41294 + }, + { + "epoch": 1.06, + "learning_rate": 1.5014929688975719e-06, + "loss": 0.4824, + "step": 41295 + }, + { + "epoch": 1.06, + "learning_rate": 1.5014690292880974e-06, + "loss": 0.7549, + "step": 41296 + }, + { + "epoch": 1.06, + "learning_rate": 1.501445089294671e-06, + "loss": 0.6924, + "step": 41297 + }, + { + "epoch": 1.06, + "learning_rate": 1.5014211489173115e-06, + "loss": 0.7773, + "step": 41298 + }, + { + "epoch": 1.06, + "learning_rate": 1.5013972081560366e-06, + "loss": 0.7852, + "step": 41299 + }, + { + "epoch": 1.06, + "learning_rate": 1.5013732670108647e-06, + "loss": 0.665, + "step": 41300 + }, + { + "epoch": 1.06, + "learning_rate": 1.5013493254818146e-06, + "loss": 0.5952, + "step": 41301 + }, + { + "epoch": 1.06, + "learning_rate": 1.5013253835689046e-06, + "loss": 0.6846, + "step": 41302 + }, + { + "epoch": 1.06, + "learning_rate": 1.5013014412721525e-06, + "loss": 0.6582, + "step": 41303 + }, + { + "epoch": 1.06, + "learning_rate": 1.5012774985915767e-06, + "loss": 0.7529, + "step": 41304 + }, + { + "epoch": 1.06, + "learning_rate": 1.5012535555271964e-06, + "loss": 0.4633, + "step": 41305 + }, + { + "epoch": 1.06, + "learning_rate": 1.5012296120790286e-06, + "loss": 0.8984, + "step": 41306 + }, + { + "epoch": 1.06, + "learning_rate": 1.501205668247093e-06, + "loss": 0.8154, + "step": 41307 + }, + { + "epoch": 1.06, + "learning_rate": 1.5011817240314068e-06, + "loss": 0.6567, + "step": 41308 + }, + { + "epoch": 1.06, + "learning_rate": 1.501157779431989e-06, + "loss": 0.8584, + "step": 41309 + }, + { + "epoch": 1.06, + "learning_rate": 1.5011338344488578e-06, + "loss": 0.6528, + "step": 41310 + }, + { + "epoch": 1.06, + "learning_rate": 1.5011098890820312e-06, + "loss": 0.6016, + "step": 41311 + }, + { + "epoch": 1.06, + "learning_rate": 1.5010859433315281e-06, + "loss": 0.665, + "step": 41312 + }, + { + "epoch": 1.06, + "learning_rate": 1.5010619971973663e-06, + "loss": 0.5742, + "step": 41313 + }, + { + "epoch": 1.06, + "learning_rate": 1.5010380506795644e-06, + "loss": 0.7334, + "step": 41314 + }, + { + "epoch": 1.06, + "learning_rate": 1.5010141037781407e-06, + "loss": 0.6289, + "step": 41315 + }, + { + "epoch": 1.06, + "learning_rate": 1.5009901564931138e-06, + "loss": 0.6396, + "step": 41316 + }, + { + "epoch": 1.06, + "learning_rate": 1.5009662088245016e-06, + "loss": 0.564, + "step": 41317 + }, + { + "epoch": 1.06, + "learning_rate": 1.5009422607723226e-06, + "loss": 0.5542, + "step": 41318 + }, + { + "epoch": 1.06, + "learning_rate": 1.5009183123365948e-06, + "loss": 0.6333, + "step": 41319 + }, + { + "epoch": 1.06, + "learning_rate": 1.5008943635173375e-06, + "loss": 0.748, + "step": 41320 + }, + { + "epoch": 1.06, + "learning_rate": 1.5008704143145679e-06, + "loss": 0.522, + "step": 41321 + }, + { + "epoch": 1.06, + "learning_rate": 1.5008464647283055e-06, + "loss": 0.5845, + "step": 41322 + }, + { + "epoch": 1.06, + "learning_rate": 1.5008225147585674e-06, + "loss": 0.6436, + "step": 41323 + }, + { + "epoch": 1.06, + "learning_rate": 1.5007985644053726e-06, + "loss": 0.4241, + "step": 41324 + }, + { + "epoch": 1.06, + "learning_rate": 1.5007746136687395e-06, + "loss": 0.625, + "step": 41325 + }, + { + "epoch": 1.06, + "learning_rate": 1.5007506625486864e-06, + "loss": 0.7871, + "step": 41326 + }, + { + "epoch": 1.06, + "learning_rate": 1.5007267110452312e-06, + "loss": 0.4075, + "step": 41327 + }, + { + "epoch": 1.06, + "learning_rate": 1.5007027591583929e-06, + "loss": 0.5542, + "step": 41328 + }, + { + "epoch": 1.06, + "learning_rate": 1.5006788068881893e-06, + "loss": 0.6816, + "step": 41329 + }, + { + "epoch": 1.06, + "learning_rate": 1.5006548542346394e-06, + "loss": 0.7373, + "step": 41330 + }, + { + "epoch": 1.06, + "learning_rate": 1.5006309011977604e-06, + "loss": 0.5786, + "step": 41331 + }, + { + "epoch": 1.06, + "learning_rate": 1.5006069477775718e-06, + "loss": 0.6445, + "step": 41332 + }, + { + "epoch": 1.06, + "learning_rate": 1.5005829939740914e-06, + "loss": 0.5735, + "step": 41333 + }, + { + "epoch": 1.06, + "learning_rate": 1.5005590397873377e-06, + "loss": 0.668, + "step": 41334 + }, + { + "epoch": 1.06, + "learning_rate": 1.500535085217329e-06, + "loss": 0.5762, + "step": 41335 + }, + { + "epoch": 1.06, + "learning_rate": 1.5005111302640833e-06, + "loss": 0.4728, + "step": 41336 + }, + { + "epoch": 1.06, + "learning_rate": 1.5004871749276196e-06, + "loss": 0.7871, + "step": 41337 + }, + { + "epoch": 1.06, + "learning_rate": 1.5004632192079556e-06, + "loss": 0.519, + "step": 41338 + }, + { + "epoch": 1.06, + "learning_rate": 1.50043926310511e-06, + "loss": 0.6426, + "step": 41339 + }, + { + "epoch": 1.06, + "learning_rate": 1.500415306619101e-06, + "loss": 0.6953, + "step": 41340 + }, + { + "epoch": 1.06, + "learning_rate": 1.5003913497499472e-06, + "loss": 0.5585, + "step": 41341 + }, + { + "epoch": 1.06, + "learning_rate": 1.5003673924976665e-06, + "loss": 0.7734, + "step": 41342 + }, + { + "epoch": 1.06, + "learning_rate": 1.500343434862278e-06, + "loss": 0.8047, + "step": 41343 + }, + { + "epoch": 1.06, + "learning_rate": 1.5003194768437987e-06, + "loss": 0.7891, + "step": 41344 + }, + { + "epoch": 1.06, + "learning_rate": 1.5002955184422485e-06, + "loss": 0.5605, + "step": 41345 + }, + { + "epoch": 1.06, + "learning_rate": 1.5002715596576448e-06, + "loss": 0.6387, + "step": 41346 + }, + { + "epoch": 1.06, + "learning_rate": 1.5002476004900064e-06, + "loss": 0.6338, + "step": 41347 + }, + { + "epoch": 1.06, + "learning_rate": 1.500223640939351e-06, + "loss": 0.6821, + "step": 41348 + }, + { + "epoch": 1.06, + "learning_rate": 1.5001996810056974e-06, + "loss": 0.5094, + "step": 41349 + }, + { + "epoch": 1.06, + "learning_rate": 1.500175720689064e-06, + "loss": 0.7051, + "step": 41350 + }, + { + "epoch": 1.06, + "learning_rate": 1.5001517599894692e-06, + "loss": 0.749, + "step": 41351 + }, + { + "epoch": 1.06, + "learning_rate": 1.5001277989069312e-06, + "loss": 0.4705, + "step": 41352 + }, + { + "epoch": 1.06, + "learning_rate": 1.5001038374414684e-06, + "loss": 0.582, + "step": 41353 + }, + { + "epoch": 1.06, + "learning_rate": 1.5000798755930986e-06, + "loss": 0.7393, + "step": 41354 + }, + { + "epoch": 1.06, + "learning_rate": 1.500055913361841e-06, + "loss": 0.6465, + "step": 41355 + }, + { + "epoch": 1.06, + "learning_rate": 1.5000319507477134e-06, + "loss": 0.4669, + "step": 41356 + }, + { + "epoch": 1.06, + "learning_rate": 1.5000079877507345e-06, + "loss": 0.7236, + "step": 41357 + }, + { + "epoch": 1.06, + "learning_rate": 1.4999840243709226e-06, + "loss": 0.6362, + "step": 41358 + }, + { + "epoch": 1.06, + "learning_rate": 1.4999600606082957e-06, + "loss": 0.8145, + "step": 41359 + }, + { + "epoch": 1.06, + "learning_rate": 1.4999360964628723e-06, + "loss": 0.7061, + "step": 41360 + }, + { + "epoch": 1.06, + "learning_rate": 1.499912131934671e-06, + "loss": 0.6924, + "step": 41361 + }, + { + "epoch": 1.06, + "learning_rate": 1.49988816702371e-06, + "loss": 0.5386, + "step": 41362 + }, + { + "epoch": 1.06, + "learning_rate": 1.4998642017300074e-06, + "loss": 0.5039, + "step": 41363 + }, + { + "epoch": 1.06, + "learning_rate": 1.4998402360535821e-06, + "loss": 0.5682, + "step": 41364 + }, + { + "epoch": 1.06, + "learning_rate": 1.4998162699944517e-06, + "loss": 0.6338, + "step": 41365 + }, + { + "epoch": 1.06, + "learning_rate": 1.4997923035526352e-06, + "loss": 0.6885, + "step": 41366 + }, + { + "epoch": 1.06, + "learning_rate": 1.4997683367281505e-06, + "loss": 0.6064, + "step": 41367 + }, + { + "epoch": 1.06, + "learning_rate": 1.4997443695210167e-06, + "loss": 0.6265, + "step": 41368 + }, + { + "epoch": 1.06, + "learning_rate": 1.4997204019312511e-06, + "loss": 0.6276, + "step": 41369 + }, + { + "epoch": 1.06, + "learning_rate": 1.4996964339588727e-06, + "loss": 0.7065, + "step": 41370 + }, + { + "epoch": 1.06, + "learning_rate": 1.4996724656038997e-06, + "loss": 0.7197, + "step": 41371 + }, + { + "epoch": 1.06, + "learning_rate": 1.4996484968663508e-06, + "loss": 0.7026, + "step": 41372 + }, + { + "epoch": 1.06, + "learning_rate": 1.4996245277462434e-06, + "loss": 0.5566, + "step": 41373 + }, + { + "epoch": 1.06, + "learning_rate": 1.4996005582435968e-06, + "loss": 0.708, + "step": 41374 + }, + { + "epoch": 1.06, + "learning_rate": 1.499576588358429e-06, + "loss": 0.4985, + "step": 41375 + }, + { + "epoch": 1.06, + "learning_rate": 1.4995526180907586e-06, + "loss": 0.6699, + "step": 41376 + }, + { + "epoch": 1.06, + "learning_rate": 1.4995286474406035e-06, + "loss": 0.6191, + "step": 41377 + }, + { + "epoch": 1.06, + "learning_rate": 1.4995046764079821e-06, + "loss": 0.6265, + "step": 41378 + }, + { + "epoch": 1.06, + "learning_rate": 1.4994807049929133e-06, + "loss": 0.5952, + "step": 41379 + }, + { + "epoch": 1.06, + "learning_rate": 1.499456733195415e-06, + "loss": 0.6895, + "step": 41380 + }, + { + "epoch": 1.06, + "learning_rate": 1.4994327610155055e-06, + "loss": 0.582, + "step": 41381 + }, + { + "epoch": 1.06, + "learning_rate": 1.4994087884532034e-06, + "loss": 0.7285, + "step": 41382 + }, + { + "epoch": 1.06, + "learning_rate": 1.4993848155085269e-06, + "loss": 0.7217, + "step": 41383 + }, + { + "epoch": 1.06, + "learning_rate": 1.4993608421814944e-06, + "loss": 0.6021, + "step": 41384 + }, + { + "epoch": 1.06, + "learning_rate": 1.4993368684721244e-06, + "loss": 0.7363, + "step": 41385 + }, + { + "epoch": 1.06, + "learning_rate": 1.4993128943804349e-06, + "loss": 0.6895, + "step": 41386 + }, + { + "epoch": 1.06, + "learning_rate": 1.4992889199064448e-06, + "loss": 0.5649, + "step": 41387 + }, + { + "epoch": 1.06, + "learning_rate": 1.499264945050172e-06, + "loss": 0.625, + "step": 41388 + }, + { + "epoch": 1.06, + "learning_rate": 1.4992409698116348e-06, + "loss": 0.7744, + "step": 41389 + }, + { + "epoch": 1.06, + "learning_rate": 1.499216994190852e-06, + "loss": 0.6541, + "step": 41390 + }, + { + "epoch": 1.06, + "learning_rate": 1.4991930181878417e-06, + "loss": 0.4128, + "step": 41391 + }, + { + "epoch": 1.06, + "learning_rate": 1.499169041802622e-06, + "loss": 0.6143, + "step": 41392 + }, + { + "epoch": 1.06, + "learning_rate": 1.4991450650352119e-06, + "loss": 0.562, + "step": 41393 + }, + { + "epoch": 1.06, + "learning_rate": 1.4991210878856288e-06, + "loss": 0.7256, + "step": 41394 + }, + { + "epoch": 1.06, + "learning_rate": 1.4990971103538921e-06, + "loss": 0.7676, + "step": 41395 + }, + { + "epoch": 1.06, + "learning_rate": 1.4990731324400193e-06, + "loss": 0.686, + "step": 41396 + }, + { + "epoch": 1.06, + "learning_rate": 1.4990491541440299e-06, + "loss": 0.5718, + "step": 41397 + }, + { + "epoch": 1.06, + "learning_rate": 1.4990251754659409e-06, + "loss": 0.6562, + "step": 41398 + }, + { + "epoch": 1.06, + "learning_rate": 1.4990011964057714e-06, + "loss": 0.5648, + "step": 41399 + }, + { + "epoch": 1.06, + "learning_rate": 1.4989772169635395e-06, + "loss": 0.7812, + "step": 41400 + }, + { + "epoch": 1.06, + "learning_rate": 1.498953237139264e-06, + "loss": 0.6455, + "step": 41401 + }, + { + "epoch": 1.06, + "learning_rate": 1.4989292569329625e-06, + "loss": 0.6865, + "step": 41402 + }, + { + "epoch": 1.06, + "learning_rate": 1.498905276344654e-06, + "loss": 0.5457, + "step": 41403 + }, + { + "epoch": 1.06, + "learning_rate": 1.4988812953743568e-06, + "loss": 0.6084, + "step": 41404 + }, + { + "epoch": 1.06, + "learning_rate": 1.498857314022089e-06, + "loss": 0.6807, + "step": 41405 + }, + { + "epoch": 1.06, + "learning_rate": 1.4988333322878692e-06, + "loss": 0.5271, + "step": 41406 + }, + { + "epoch": 1.06, + "learning_rate": 1.4988093501717156e-06, + "loss": 0.6641, + "step": 41407 + }, + { + "epoch": 1.06, + "learning_rate": 1.498785367673647e-06, + "loss": 0.8018, + "step": 41408 + }, + { + "epoch": 1.06, + "learning_rate": 1.4987613847936807e-06, + "loss": 0.6895, + "step": 41409 + }, + { + "epoch": 1.06, + "learning_rate": 1.4987374015318359e-06, + "loss": 0.3518, + "step": 41410 + }, + { + "epoch": 1.06, + "learning_rate": 1.4987134178881312e-06, + "loss": 0.7314, + "step": 41411 + }, + { + "epoch": 1.06, + "learning_rate": 1.4986894338625843e-06, + "loss": 0.6821, + "step": 41412 + }, + { + "epoch": 1.06, + "learning_rate": 1.4986654494552138e-06, + "loss": 0.7949, + "step": 41413 + }, + { + "epoch": 1.06, + "learning_rate": 1.498641464666038e-06, + "loss": 0.623, + "step": 41414 + }, + { + "epoch": 1.06, + "learning_rate": 1.4986174794950754e-06, + "loss": 0.7124, + "step": 41415 + }, + { + "epoch": 1.06, + "learning_rate": 1.4985934939423446e-06, + "loss": 0.8145, + "step": 41416 + }, + { + "epoch": 1.06, + "learning_rate": 1.4985695080078635e-06, + "loss": 0.6704, + "step": 41417 + }, + { + "epoch": 1.06, + "learning_rate": 1.4985455216916509e-06, + "loss": 0.8018, + "step": 41418 + }, + { + "epoch": 1.06, + "learning_rate": 1.4985215349937246e-06, + "loss": 0.6021, + "step": 41419 + }, + { + "epoch": 1.06, + "learning_rate": 1.4984975479141034e-06, + "loss": 0.5583, + "step": 41420 + }, + { + "epoch": 1.06, + "learning_rate": 1.4984735604528053e-06, + "loss": 0.501, + "step": 41421 + }, + { + "epoch": 1.06, + "learning_rate": 1.498449572609849e-06, + "loss": 0.6636, + "step": 41422 + }, + { + "epoch": 1.06, + "learning_rate": 1.4984255843852532e-06, + "loss": 0.5757, + "step": 41423 + }, + { + "epoch": 1.06, + "learning_rate": 1.4984015957790358e-06, + "loss": 0.8193, + "step": 41424 + }, + { + "epoch": 1.06, + "learning_rate": 1.4983776067912145e-06, + "loss": 0.604, + "step": 41425 + }, + { + "epoch": 1.06, + "learning_rate": 1.498353617421809e-06, + "loss": 0.5515, + "step": 41426 + }, + { + "epoch": 1.06, + "learning_rate": 1.498329627670837e-06, + "loss": 0.8125, + "step": 41427 + }, + { + "epoch": 1.06, + "learning_rate": 1.4983056375383167e-06, + "loss": 0.7617, + "step": 41428 + }, + { + "epoch": 1.06, + "learning_rate": 1.498281647024267e-06, + "loss": 0.4036, + "step": 41429 + }, + { + "epoch": 1.06, + "learning_rate": 1.4982576561287056e-06, + "loss": 0.7412, + "step": 41430 + }, + { + "epoch": 1.06, + "learning_rate": 1.4982336648516514e-06, + "loss": 0.6196, + "step": 41431 + }, + { + "epoch": 1.06, + "learning_rate": 1.4982096731931226e-06, + "loss": 0.6362, + "step": 41432 + }, + { + "epoch": 1.06, + "learning_rate": 1.4981856811531378e-06, + "loss": 0.6621, + "step": 41433 + }, + { + "epoch": 1.06, + "learning_rate": 1.4981616887317148e-06, + "loss": 0.7285, + "step": 41434 + }, + { + "epoch": 1.06, + "learning_rate": 1.4981376959288724e-06, + "loss": 0.8096, + "step": 41435 + }, + { + "epoch": 1.06, + "learning_rate": 1.4981137027446286e-06, + "loss": 0.8066, + "step": 41436 + }, + { + "epoch": 1.06, + "learning_rate": 1.4980897091790026e-06, + "loss": 0.6064, + "step": 41437 + }, + { + "epoch": 1.06, + "learning_rate": 1.4980657152320118e-06, + "loss": 0.7178, + "step": 41438 + }, + { + "epoch": 1.06, + "learning_rate": 1.4980417209036751e-06, + "loss": 0.7451, + "step": 41439 + }, + { + "epoch": 1.06, + "learning_rate": 1.4980177261940106e-06, + "loss": 0.604, + "step": 41440 + }, + { + "epoch": 1.06, + "learning_rate": 1.497993731103037e-06, + "loss": 0.5498, + "step": 41441 + }, + { + "epoch": 1.06, + "learning_rate": 1.4979697356307726e-06, + "loss": 0.5134, + "step": 41442 + }, + { + "epoch": 1.06, + "learning_rate": 1.4979457397772354e-06, + "loss": 0.4766, + "step": 41443 + }, + { + "epoch": 1.06, + "learning_rate": 1.4979217435424442e-06, + "loss": 0.6294, + "step": 41444 + }, + { + "epoch": 1.06, + "learning_rate": 1.497897746926417e-06, + "loss": 0.655, + "step": 41445 + }, + { + "epoch": 1.06, + "learning_rate": 1.4978737499291727e-06, + "loss": 0.7773, + "step": 41446 + }, + { + "epoch": 1.06, + "learning_rate": 1.497849752550729e-06, + "loss": 0.5762, + "step": 41447 + }, + { + "epoch": 1.06, + "learning_rate": 1.4978257547911054e-06, + "loss": 0.5662, + "step": 41448 + }, + { + "epoch": 1.06, + "learning_rate": 1.4978017566503188e-06, + "loss": 0.6509, + "step": 41449 + }, + { + "epoch": 1.06, + "learning_rate": 1.4977777581283887e-06, + "loss": 0.5474, + "step": 41450 + }, + { + "epoch": 1.06, + "learning_rate": 1.4977537592253327e-06, + "loss": 0.5825, + "step": 41451 + }, + { + "epoch": 1.06, + "learning_rate": 1.4977297599411696e-06, + "loss": 0.6924, + "step": 41452 + }, + { + "epoch": 1.06, + "learning_rate": 1.4977057602759178e-06, + "loss": 0.6797, + "step": 41453 + }, + { + "epoch": 1.06, + "learning_rate": 1.4976817602295957e-06, + "loss": 0.6675, + "step": 41454 + }, + { + "epoch": 1.06, + "learning_rate": 1.4976577598022214e-06, + "loss": 0.6094, + "step": 41455 + }, + { + "epoch": 1.06, + "learning_rate": 1.4976337589938133e-06, + "loss": 0.7627, + "step": 41456 + }, + { + "epoch": 1.06, + "learning_rate": 1.4976097578043901e-06, + "loss": 0.5693, + "step": 41457 + }, + { + "epoch": 1.06, + "learning_rate": 1.49758575623397e-06, + "loss": 0.3447, + "step": 41458 + }, + { + "epoch": 1.06, + "learning_rate": 1.497561754282571e-06, + "loss": 0.6089, + "step": 41459 + }, + { + "epoch": 1.06, + "learning_rate": 1.4975377519502127e-06, + "loss": 0.5181, + "step": 41460 + }, + { + "epoch": 1.06, + "learning_rate": 1.4975137492369116e-06, + "loss": 0.7373, + "step": 41461 + }, + { + "epoch": 1.06, + "learning_rate": 1.4974897461426881e-06, + "loss": 0.6055, + "step": 41462 + }, + { + "epoch": 1.06, + "learning_rate": 1.497465742667559e-06, + "loss": 0.6631, + "step": 41463 + }, + { + "epoch": 1.06, + "learning_rate": 1.4974417388115432e-06, + "loss": 0.6172, + "step": 41464 + }, + { + "epoch": 1.06, + "learning_rate": 1.4974177345746593e-06, + "loss": 0.6699, + "step": 41465 + }, + { + "epoch": 1.06, + "learning_rate": 1.4973937299569252e-06, + "loss": 0.7393, + "step": 41466 + }, + { + "epoch": 1.06, + "learning_rate": 1.49736972495836e-06, + "loss": 0.6675, + "step": 41467 + }, + { + "epoch": 1.06, + "learning_rate": 1.4973457195789815e-06, + "loss": 0.7803, + "step": 41468 + }, + { + "epoch": 1.06, + "learning_rate": 1.4973217138188083e-06, + "loss": 0.6973, + "step": 41469 + }, + { + "epoch": 1.06, + "learning_rate": 1.4972977076778588e-06, + "loss": 0.7549, + "step": 41470 + }, + { + "epoch": 1.06, + "learning_rate": 1.4972737011561512e-06, + "loss": 0.6377, + "step": 41471 + }, + { + "epoch": 1.06, + "learning_rate": 1.497249694253704e-06, + "loss": 0.667, + "step": 41472 + }, + { + "epoch": 1.06, + "learning_rate": 1.4972256869705357e-06, + "loss": 0.6982, + "step": 41473 + }, + { + "epoch": 1.06, + "learning_rate": 1.4972016793066641e-06, + "loss": 0.5723, + "step": 41474 + }, + { + "epoch": 1.06, + "learning_rate": 1.4971776712621087e-06, + "loss": 0.5896, + "step": 41475 + }, + { + "epoch": 1.06, + "learning_rate": 1.4971536628368866e-06, + "loss": 0.5933, + "step": 41476 + }, + { + "epoch": 1.06, + "learning_rate": 1.4971296540310175e-06, + "loss": 0.5605, + "step": 41477 + }, + { + "epoch": 1.06, + "learning_rate": 1.4971056448445185e-06, + "loss": 0.5103, + "step": 41478 + }, + { + "epoch": 1.06, + "learning_rate": 1.497081635277409e-06, + "loss": 0.4292, + "step": 41479 + }, + { + "epoch": 1.06, + "learning_rate": 1.4970576253297065e-06, + "loss": 0.5977, + "step": 41480 + }, + { + "epoch": 1.06, + "learning_rate": 1.49703361500143e-06, + "loss": 0.501, + "step": 41481 + }, + { + "epoch": 1.06, + "learning_rate": 1.497009604292598e-06, + "loss": 0.6548, + "step": 41482 + }, + { + "epoch": 1.06, + "learning_rate": 1.4969855932032282e-06, + "loss": 0.7197, + "step": 41483 + }, + { + "epoch": 1.06, + "learning_rate": 1.4969615817333394e-06, + "loss": 0.7988, + "step": 41484 + }, + { + "epoch": 1.06, + "learning_rate": 1.4969375698829501e-06, + "loss": 0.6826, + "step": 41485 + }, + { + "epoch": 1.06, + "learning_rate": 1.4969135576520783e-06, + "loss": 0.5371, + "step": 41486 + }, + { + "epoch": 1.06, + "learning_rate": 1.4968895450407432e-06, + "loss": 0.6899, + "step": 41487 + }, + { + "epoch": 1.06, + "learning_rate": 1.4968655320489622e-06, + "loss": 0.7256, + "step": 41488 + }, + { + "epoch": 1.06, + "learning_rate": 1.4968415186767542e-06, + "loss": 0.6211, + "step": 41489 + }, + { + "epoch": 1.06, + "learning_rate": 1.4968175049241377e-06, + "loss": 0.6128, + "step": 41490 + }, + { + "epoch": 1.06, + "learning_rate": 1.4967934907911306e-06, + "loss": 0.5215, + "step": 41491 + }, + { + "epoch": 1.06, + "learning_rate": 1.4967694762777517e-06, + "loss": 0.6553, + "step": 41492 + }, + { + "epoch": 1.06, + "learning_rate": 1.4967454613840192e-06, + "loss": 0.6057, + "step": 41493 + }, + { + "epoch": 1.06, + "learning_rate": 1.4967214461099515e-06, + "loss": 0.96, + "step": 41494 + }, + { + "epoch": 1.06, + "learning_rate": 1.496697430455567e-06, + "loss": 0.7305, + "step": 41495 + }, + { + "epoch": 1.06, + "learning_rate": 1.4966734144208842e-06, + "loss": 0.645, + "step": 41496 + }, + { + "epoch": 1.06, + "learning_rate": 1.4966493980059216e-06, + "loss": 0.7461, + "step": 41497 + }, + { + "epoch": 1.06, + "learning_rate": 1.496625381210697e-06, + "loss": 0.4624, + "step": 41498 + }, + { + "epoch": 1.06, + "learning_rate": 1.4966013640352294e-06, + "loss": 0.7798, + "step": 41499 + }, + { + "epoch": 1.06, + "learning_rate": 1.496577346479537e-06, + "loss": 0.7295, + "step": 41500 + }, + { + "epoch": 1.06, + "learning_rate": 1.4965533285436381e-06, + "loss": 0.709, + "step": 41501 + }, + { + "epoch": 1.06, + "learning_rate": 1.4965293102275514e-06, + "loss": 0.6772, + "step": 41502 + }, + { + "epoch": 1.06, + "learning_rate": 1.4965052915312947e-06, + "loss": 0.6729, + "step": 41503 + }, + { + "epoch": 1.06, + "learning_rate": 1.4964812724548868e-06, + "loss": 0.7812, + "step": 41504 + }, + { + "epoch": 1.06, + "learning_rate": 1.496457252998346e-06, + "loss": 0.7383, + "step": 41505 + }, + { + "epoch": 1.06, + "learning_rate": 1.496433233161691e-06, + "loss": 0.7031, + "step": 41506 + }, + { + "epoch": 1.06, + "learning_rate": 1.4964092129449393e-06, + "loss": 0.7173, + "step": 41507 + }, + { + "epoch": 1.06, + "learning_rate": 1.4963851923481103e-06, + "loss": 0.3887, + "step": 41508 + }, + { + "epoch": 1.06, + "learning_rate": 1.4963611713712218e-06, + "loss": 0.6064, + "step": 41509 + }, + { + "epoch": 1.06, + "learning_rate": 1.4963371500142925e-06, + "loss": 0.5459, + "step": 41510 + }, + { + "epoch": 1.06, + "learning_rate": 1.496313128277341e-06, + "loss": 0.6689, + "step": 41511 + }, + { + "epoch": 1.06, + "learning_rate": 1.496289106160385e-06, + "loss": 0.7134, + "step": 41512 + }, + { + "epoch": 1.06, + "learning_rate": 1.496265083663443e-06, + "loss": 0.6172, + "step": 41513 + }, + { + "epoch": 1.06, + "learning_rate": 1.4962410607865339e-06, + "loss": 0.7109, + "step": 41514 + }, + { + "epoch": 1.06, + "learning_rate": 1.4962170375296758e-06, + "loss": 0.6411, + "step": 41515 + }, + { + "epoch": 1.06, + "learning_rate": 1.4961930138928874e-06, + "loss": 0.7661, + "step": 41516 + }, + { + "epoch": 1.06, + "learning_rate": 1.4961689898761866e-06, + "loss": 0.7378, + "step": 41517 + }, + { + "epoch": 1.06, + "learning_rate": 1.4961449654795919e-06, + "loss": 0.6108, + "step": 41518 + }, + { + "epoch": 1.06, + "learning_rate": 1.496120940703122e-06, + "loss": 0.7139, + "step": 41519 + }, + { + "epoch": 1.06, + "learning_rate": 1.4960969155467948e-06, + "loss": 0.8672, + "step": 41520 + }, + { + "epoch": 1.06, + "learning_rate": 1.4960728900106297e-06, + "loss": 0.7334, + "step": 41521 + }, + { + "epoch": 1.06, + "learning_rate": 1.4960488640946438e-06, + "loss": 0.5369, + "step": 41522 + }, + { + "epoch": 1.06, + "learning_rate": 1.4960248377988562e-06, + "loss": 0.8369, + "step": 41523 + }, + { + "epoch": 1.06, + "learning_rate": 1.496000811123285e-06, + "loss": 0.7314, + "step": 41524 + }, + { + "epoch": 1.06, + "learning_rate": 1.4959767840679492e-06, + "loss": 0.5894, + "step": 41525 + }, + { + "epoch": 1.06, + "learning_rate": 1.4959527566328667e-06, + "loss": 0.512, + "step": 41526 + }, + { + "epoch": 1.06, + "learning_rate": 1.495928728818056e-06, + "loss": 0.6709, + "step": 41527 + }, + { + "epoch": 1.06, + "learning_rate": 1.495904700623535e-06, + "loss": 0.7456, + "step": 41528 + }, + { + "epoch": 1.06, + "learning_rate": 1.495880672049323e-06, + "loss": 0.6768, + "step": 41529 + }, + { + "epoch": 1.06, + "learning_rate": 1.495856643095438e-06, + "loss": 0.7627, + "step": 41530 + }, + { + "epoch": 1.06, + "learning_rate": 1.4958326137618985e-06, + "loss": 0.7021, + "step": 41531 + }, + { + "epoch": 1.06, + "learning_rate": 1.4958085840487225e-06, + "loss": 0.6216, + "step": 41532 + }, + { + "epoch": 1.06, + "learning_rate": 1.4957845539559287e-06, + "loss": 0.7168, + "step": 41533 + }, + { + "epoch": 1.06, + "learning_rate": 1.4957605234835353e-06, + "loss": 0.7832, + "step": 41534 + }, + { + "epoch": 1.06, + "learning_rate": 1.495736492631561e-06, + "loss": 0.5513, + "step": 41535 + }, + { + "epoch": 1.06, + "learning_rate": 1.4957124614000241e-06, + "loss": 0.6201, + "step": 41536 + }, + { + "epoch": 1.06, + "learning_rate": 1.495688429788943e-06, + "loss": 0.709, + "step": 41537 + }, + { + "epoch": 1.06, + "learning_rate": 1.495664397798336e-06, + "loss": 0.7275, + "step": 41538 + }, + { + "epoch": 1.06, + "learning_rate": 1.4956403654282214e-06, + "loss": 0.7002, + "step": 41539 + }, + { + "epoch": 1.06, + "learning_rate": 1.4956163326786179e-06, + "loss": 0.58, + "step": 41540 + }, + { + "epoch": 1.06, + "learning_rate": 1.495592299549544e-06, + "loss": 0.793, + "step": 41541 + }, + { + "epoch": 1.06, + "learning_rate": 1.4955682660410176e-06, + "loss": 0.5601, + "step": 41542 + }, + { + "epoch": 1.06, + "learning_rate": 1.4955442321530574e-06, + "loss": 0.521, + "step": 41543 + }, + { + "epoch": 1.06, + "learning_rate": 1.495520197885682e-06, + "loss": 0.7471, + "step": 41544 + }, + { + "epoch": 1.06, + "learning_rate": 1.495496163238909e-06, + "loss": 0.665, + "step": 41545 + }, + { + "epoch": 1.06, + "learning_rate": 1.495472128212758e-06, + "loss": 0.7505, + "step": 41546 + }, + { + "epoch": 1.06, + "learning_rate": 1.4954480928072464e-06, + "loss": 0.7783, + "step": 41547 + }, + { + "epoch": 1.06, + "learning_rate": 1.4954240570223933e-06, + "loss": 0.6064, + "step": 41548 + }, + { + "epoch": 1.06, + "learning_rate": 1.4954000208582163e-06, + "loss": 0.489, + "step": 41549 + }, + { + "epoch": 1.06, + "learning_rate": 1.4953759843147346e-06, + "loss": 0.7744, + "step": 41550 + }, + { + "epoch": 1.06, + "learning_rate": 1.4953519473919664e-06, + "loss": 0.6934, + "step": 41551 + }, + { + "epoch": 1.06, + "learning_rate": 1.4953279100899298e-06, + "loss": 0.707, + "step": 41552 + }, + { + "epoch": 1.07, + "learning_rate": 1.4953038724086434e-06, + "loss": 0.6084, + "step": 41553 + }, + { + "epoch": 1.07, + "learning_rate": 1.4952798343481257e-06, + "loss": 0.5947, + "step": 41554 + }, + { + "epoch": 1.07, + "learning_rate": 1.4952557959083947e-06, + "loss": 0.6348, + "step": 41555 + }, + { + "epoch": 1.07, + "learning_rate": 1.4952317570894695e-06, + "loss": 0.7354, + "step": 41556 + }, + { + "epoch": 1.07, + "learning_rate": 1.4952077178913677e-06, + "loss": 0.5366, + "step": 41557 + }, + { + "epoch": 1.07, + "learning_rate": 1.4951836783141086e-06, + "loss": 0.6416, + "step": 41558 + }, + { + "epoch": 1.07, + "learning_rate": 1.4951596383577099e-06, + "loss": 0.5903, + "step": 41559 + }, + { + "epoch": 1.07, + "learning_rate": 1.4951355980221902e-06, + "loss": 0.7217, + "step": 41560 + }, + { + "epoch": 1.07, + "learning_rate": 1.495111557307568e-06, + "loss": 0.52, + "step": 41561 + }, + { + "epoch": 1.07, + "learning_rate": 1.4950875162138615e-06, + "loss": 0.7007, + "step": 41562 + }, + { + "epoch": 1.07, + "learning_rate": 1.4950634747410896e-06, + "loss": 0.7432, + "step": 41563 + }, + { + "epoch": 1.07, + "learning_rate": 1.49503943288927e-06, + "loss": 0.7285, + "step": 41564 + }, + { + "epoch": 1.07, + "learning_rate": 1.4950153906584216e-06, + "loss": 0.7256, + "step": 41565 + }, + { + "epoch": 1.07, + "learning_rate": 1.4949913480485628e-06, + "loss": 0.73, + "step": 41566 + }, + { + "epoch": 1.07, + "learning_rate": 1.4949673050597116e-06, + "loss": 0.6494, + "step": 41567 + }, + { + "epoch": 1.07, + "learning_rate": 1.494943261691887e-06, + "loss": 0.6782, + "step": 41568 + }, + { + "epoch": 1.07, + "learning_rate": 1.4949192179451069e-06, + "loss": 0.5757, + "step": 41569 + }, + { + "epoch": 1.07, + "learning_rate": 1.4948951738193899e-06, + "loss": 0.748, + "step": 41570 + }, + { + "epoch": 1.07, + "learning_rate": 1.4948711293147548e-06, + "loss": 0.7539, + "step": 41571 + }, + { + "epoch": 1.07, + "learning_rate": 1.4948470844312192e-06, + "loss": 0.6777, + "step": 41572 + }, + { + "epoch": 1.07, + "learning_rate": 1.494823039168802e-06, + "loss": 0.5796, + "step": 41573 + }, + { + "epoch": 1.07, + "learning_rate": 1.4947989935275214e-06, + "loss": 0.603, + "step": 41574 + }, + { + "epoch": 1.07, + "learning_rate": 1.4947749475073964e-06, + "loss": 0.6826, + "step": 41575 + }, + { + "epoch": 1.07, + "learning_rate": 1.4947509011084447e-06, + "loss": 0.6638, + "step": 41576 + }, + { + "epoch": 1.07, + "learning_rate": 1.4947268543306851e-06, + "loss": 0.5757, + "step": 41577 + }, + { + "epoch": 1.07, + "learning_rate": 1.4947028071741358e-06, + "loss": 0.5508, + "step": 41578 + }, + { + "epoch": 1.07, + "learning_rate": 1.4946787596388153e-06, + "loss": 0.6494, + "step": 41579 + }, + { + "epoch": 1.07, + "learning_rate": 1.494654711724742e-06, + "loss": 0.6353, + "step": 41580 + }, + { + "epoch": 1.07, + "learning_rate": 1.4946306634319343e-06, + "loss": 0.6689, + "step": 41581 + }, + { + "epoch": 1.07, + "learning_rate": 1.4946066147604108e-06, + "loss": 0.3774, + "step": 41582 + }, + { + "epoch": 1.07, + "learning_rate": 1.4945825657101895e-06, + "loss": 0.7549, + "step": 41583 + }, + { + "epoch": 1.07, + "learning_rate": 1.4945585162812894e-06, + "loss": 0.585, + "step": 41584 + }, + { + "epoch": 1.07, + "learning_rate": 1.4945344664737283e-06, + "loss": 0.6392, + "step": 41585 + }, + { + "epoch": 1.07, + "learning_rate": 1.4945104162875253e-06, + "loss": 0.6904, + "step": 41586 + }, + { + "epoch": 1.07, + "learning_rate": 1.494486365722698e-06, + "loss": 0.5527, + "step": 41587 + }, + { + "epoch": 1.07, + "learning_rate": 1.4944623147792656e-06, + "loss": 0.7002, + "step": 41588 + }, + { + "epoch": 1.07, + "learning_rate": 1.4944382634572458e-06, + "loss": 0.5947, + "step": 41589 + }, + { + "epoch": 1.07, + "learning_rate": 1.4944142117566573e-06, + "loss": 0.6309, + "step": 41590 + }, + { + "epoch": 1.07, + "learning_rate": 1.494390159677519e-06, + "loss": 0.6426, + "step": 41591 + }, + { + "epoch": 1.07, + "learning_rate": 1.4943661072198487e-06, + "loss": 0.6748, + "step": 41592 + }, + { + "epoch": 1.07, + "learning_rate": 1.494342054383665e-06, + "loss": 0.8389, + "step": 41593 + }, + { + "epoch": 1.07, + "learning_rate": 1.4943180011689863e-06, + "loss": 0.6797, + "step": 41594 + }, + { + "epoch": 1.07, + "learning_rate": 1.4942939475758308e-06, + "loss": 0.5854, + "step": 41595 + }, + { + "epoch": 1.07, + "learning_rate": 1.4942698936042176e-06, + "loss": 0.7588, + "step": 41596 + }, + { + "epoch": 1.07, + "learning_rate": 1.494245839254164e-06, + "loss": 0.6553, + "step": 41597 + }, + { + "epoch": 1.07, + "learning_rate": 1.4942217845256897e-06, + "loss": 0.875, + "step": 41598 + }, + { + "epoch": 1.07, + "learning_rate": 1.4941977294188122e-06, + "loss": 0.6904, + "step": 41599 + }, + { + "epoch": 1.07, + "learning_rate": 1.4941736739335505e-06, + "loss": 0.7324, + "step": 41600 + }, + { + "epoch": 1.07, + "learning_rate": 1.4941496180699226e-06, + "loss": 0.5, + "step": 41601 + }, + { + "epoch": 1.07, + "learning_rate": 1.4941255618279469e-06, + "loss": 0.6338, + "step": 41602 + }, + { + "epoch": 1.07, + "learning_rate": 1.4941015052076422e-06, + "loss": 0.7441, + "step": 41603 + }, + { + "epoch": 1.07, + "learning_rate": 1.4940774482090265e-06, + "loss": 0.6875, + "step": 41604 + }, + { + "epoch": 1.07, + "learning_rate": 1.4940533908321187e-06, + "loss": 0.6538, + "step": 41605 + }, + { + "epoch": 1.07, + "learning_rate": 1.4940293330769366e-06, + "loss": 0.7275, + "step": 41606 + }, + { + "epoch": 1.07, + "learning_rate": 1.4940052749434993e-06, + "loss": 0.7148, + "step": 41607 + }, + { + "epoch": 1.07, + "learning_rate": 1.4939812164318247e-06, + "loss": 0.7646, + "step": 41608 + }, + { + "epoch": 1.07, + "learning_rate": 1.4939571575419314e-06, + "loss": 0.5688, + "step": 41609 + }, + { + "epoch": 1.07, + "learning_rate": 1.4939330982738377e-06, + "loss": 0.6279, + "step": 41610 + }, + { + "epoch": 1.07, + "learning_rate": 1.4939090386275624e-06, + "loss": 0.7559, + "step": 41611 + }, + { + "epoch": 1.07, + "learning_rate": 1.4938849786031234e-06, + "loss": 0.5771, + "step": 41612 + }, + { + "epoch": 1.07, + "learning_rate": 1.4938609182005394e-06, + "loss": 0.5469, + "step": 41613 + }, + { + "epoch": 1.07, + "learning_rate": 1.4938368574198289e-06, + "loss": 0.7598, + "step": 41614 + }, + { + "epoch": 1.07, + "learning_rate": 1.4938127962610103e-06, + "loss": 0.645, + "step": 41615 + }, + { + "epoch": 1.07, + "learning_rate": 1.4937887347241018e-06, + "loss": 0.479, + "step": 41616 + }, + { + "epoch": 1.07, + "learning_rate": 1.4937646728091223e-06, + "loss": 0.7031, + "step": 41617 + }, + { + "epoch": 1.07, + "learning_rate": 1.4937406105160895e-06, + "loss": 0.6528, + "step": 41618 + }, + { + "epoch": 1.07, + "learning_rate": 1.4937165478450223e-06, + "loss": 0.4648, + "step": 41619 + }, + { + "epoch": 1.07, + "learning_rate": 1.493692484795939e-06, + "loss": 0.7773, + "step": 41620 + }, + { + "epoch": 1.07, + "learning_rate": 1.4936684213688584e-06, + "loss": 0.8271, + "step": 41621 + }, + { + "epoch": 1.07, + "learning_rate": 1.4936443575637983e-06, + "loss": 0.6289, + "step": 41622 + }, + { + "epoch": 1.07, + "learning_rate": 1.4936202933807773e-06, + "loss": 0.7412, + "step": 41623 + }, + { + "epoch": 1.07, + "learning_rate": 1.493596228819814e-06, + "loss": 0.4797, + "step": 41624 + }, + { + "epoch": 1.07, + "learning_rate": 1.4935721638809269e-06, + "loss": 0.5742, + "step": 41625 + }, + { + "epoch": 1.07, + "learning_rate": 1.4935480985641345e-06, + "loss": 0.7959, + "step": 41626 + }, + { + "epoch": 1.07, + "learning_rate": 1.4935240328694544e-06, + "loss": 0.6431, + "step": 41627 + }, + { + "epoch": 1.07, + "learning_rate": 1.4934999667969062e-06, + "loss": 0.4561, + "step": 41628 + }, + { + "epoch": 1.07, + "learning_rate": 1.4934759003465074e-06, + "loss": 0.624, + "step": 41629 + }, + { + "epoch": 1.07, + "learning_rate": 1.493451833518277e-06, + "loss": 0.7939, + "step": 41630 + }, + { + "epoch": 1.07, + "learning_rate": 1.4934277663122332e-06, + "loss": 0.7793, + "step": 41631 + }, + { + "epoch": 1.07, + "learning_rate": 1.4934036987283946e-06, + "loss": 0.5767, + "step": 41632 + }, + { + "epoch": 1.07, + "learning_rate": 1.493379630766779e-06, + "loss": 0.6611, + "step": 41633 + }, + { + "epoch": 1.07, + "learning_rate": 1.493355562427406e-06, + "loss": 0.5885, + "step": 41634 + }, + { + "epoch": 1.07, + "learning_rate": 1.4933314937102926e-06, + "loss": 0.707, + "step": 41635 + }, + { + "epoch": 1.07, + "learning_rate": 1.4933074246154586e-06, + "loss": 0.666, + "step": 41636 + }, + { + "epoch": 1.07, + "learning_rate": 1.4932833551429214e-06, + "loss": 0.6382, + "step": 41637 + }, + { + "epoch": 1.07, + "learning_rate": 1.4932592852927e-06, + "loss": 0.8574, + "step": 41638 + }, + { + "epoch": 1.07, + "learning_rate": 1.4932352150648125e-06, + "loss": 0.7119, + "step": 41639 + }, + { + "epoch": 1.07, + "learning_rate": 1.4932111444592775e-06, + "loss": 0.7021, + "step": 41640 + }, + { + "epoch": 1.07, + "learning_rate": 1.4931870734761134e-06, + "loss": 0.584, + "step": 41641 + }, + { + "epoch": 1.07, + "learning_rate": 1.4931630021153388e-06, + "loss": 0.6205, + "step": 41642 + }, + { + "epoch": 1.07, + "learning_rate": 1.4931389303769717e-06, + "loss": 0.667, + "step": 41643 + }, + { + "epoch": 1.07, + "learning_rate": 1.4931148582610308e-06, + "loss": 0.7144, + "step": 41644 + }, + { + "epoch": 1.07, + "learning_rate": 1.4930907857675345e-06, + "loss": 0.7754, + "step": 41645 + }, + { + "epoch": 1.07, + "learning_rate": 1.4930667128965015e-06, + "loss": 0.5442, + "step": 41646 + }, + { + "epoch": 1.07, + "learning_rate": 1.49304263964795e-06, + "loss": 0.7764, + "step": 41647 + }, + { + "epoch": 1.07, + "learning_rate": 1.4930185660218983e-06, + "loss": 0.7461, + "step": 41648 + }, + { + "epoch": 1.07, + "learning_rate": 1.492994492018365e-06, + "loss": 0.5488, + "step": 41649 + }, + { + "epoch": 1.07, + "learning_rate": 1.4929704176373685e-06, + "loss": 0.5464, + "step": 41650 + }, + { + "epoch": 1.07, + "learning_rate": 1.4929463428789272e-06, + "loss": 0.4419, + "step": 41651 + }, + { + "epoch": 1.07, + "learning_rate": 1.4929222677430596e-06, + "loss": 0.6641, + "step": 41652 + }, + { + "epoch": 1.07, + "learning_rate": 1.492898192229784e-06, + "loss": 0.636, + "step": 41653 + }, + { + "epoch": 1.07, + "learning_rate": 1.4928741163391188e-06, + "loss": 0.4785, + "step": 41654 + }, + { + "epoch": 1.07, + "learning_rate": 1.4928500400710828e-06, + "loss": 0.7109, + "step": 41655 + }, + { + "epoch": 1.07, + "learning_rate": 1.4928259634256942e-06, + "loss": 0.5408, + "step": 41656 + }, + { + "epoch": 1.07, + "learning_rate": 1.4928018864029713e-06, + "loss": 0.6299, + "step": 41657 + }, + { + "epoch": 1.07, + "learning_rate": 1.4927778090029324e-06, + "loss": 0.646, + "step": 41658 + }, + { + "epoch": 1.07, + "learning_rate": 1.4927537312255967e-06, + "loss": 0.7236, + "step": 41659 + }, + { + "epoch": 1.07, + "learning_rate": 1.4927296530709816e-06, + "loss": 0.8037, + "step": 41660 + }, + { + "epoch": 1.07, + "learning_rate": 1.4927055745391066e-06, + "loss": 0.4487, + "step": 41661 + }, + { + "epoch": 1.07, + "learning_rate": 1.492681495629989e-06, + "loss": 0.5522, + "step": 41662 + }, + { + "epoch": 1.07, + "learning_rate": 1.4926574163436485e-06, + "loss": 0.5688, + "step": 41663 + }, + { + "epoch": 1.07, + "learning_rate": 1.4926333366801024e-06, + "loss": 0.7656, + "step": 41664 + }, + { + "epoch": 1.07, + "learning_rate": 1.4926092566393697e-06, + "loss": 0.6318, + "step": 41665 + }, + { + "epoch": 1.07, + "learning_rate": 1.492585176221469e-06, + "loss": 0.7471, + "step": 41666 + }, + { + "epoch": 1.07, + "learning_rate": 1.4925610954264181e-06, + "loss": 0.6748, + "step": 41667 + }, + { + "epoch": 1.07, + "learning_rate": 1.492537014254236e-06, + "loss": 0.5645, + "step": 41668 + }, + { + "epoch": 1.07, + "learning_rate": 1.4925129327049409e-06, + "loss": 0.8018, + "step": 41669 + }, + { + "epoch": 1.07, + "learning_rate": 1.4924888507785513e-06, + "loss": 0.8936, + "step": 41670 + }, + { + "epoch": 1.07, + "learning_rate": 1.4924647684750857e-06, + "loss": 0.8926, + "step": 41671 + }, + { + "epoch": 1.07, + "learning_rate": 1.4924406857945624e-06, + "loss": 0.6758, + "step": 41672 + }, + { + "epoch": 1.07, + "learning_rate": 1.4924166027369997e-06, + "loss": 0.6958, + "step": 41673 + }, + { + "epoch": 1.07, + "learning_rate": 1.4923925193024168e-06, + "loss": 0.6289, + "step": 41674 + }, + { + "epoch": 1.07, + "learning_rate": 1.492368435490831e-06, + "loss": 0.6816, + "step": 41675 + }, + { + "epoch": 1.07, + "learning_rate": 1.492344351302262e-06, + "loss": 0.6323, + "step": 41676 + }, + { + "epoch": 1.07, + "learning_rate": 1.492320266736727e-06, + "loss": 0.6172, + "step": 41677 + }, + { + "epoch": 1.07, + "learning_rate": 1.4922961817942451e-06, + "loss": 0.6885, + "step": 41678 + }, + { + "epoch": 1.07, + "learning_rate": 1.4922720964748345e-06, + "loss": 0.8594, + "step": 41679 + }, + { + "epoch": 1.07, + "learning_rate": 1.4922480107785143e-06, + "loss": 0.79, + "step": 41680 + }, + { + "epoch": 1.07, + "learning_rate": 1.4922239247053022e-06, + "loss": 0.7051, + "step": 41681 + }, + { + "epoch": 1.07, + "learning_rate": 1.492199838255217e-06, + "loss": 0.6504, + "step": 41682 + }, + { + "epoch": 1.07, + "learning_rate": 1.4921757514282765e-06, + "loss": 0.6978, + "step": 41683 + }, + { + "epoch": 1.07, + "learning_rate": 1.4921516642245002e-06, + "loss": 0.5483, + "step": 41684 + }, + { + "epoch": 1.07, + "learning_rate": 1.4921275766439057e-06, + "loss": 0.7158, + "step": 41685 + }, + { + "epoch": 1.07, + "learning_rate": 1.492103488686512e-06, + "loss": 0.5518, + "step": 41686 + }, + { + "epoch": 1.07, + "learning_rate": 1.492079400352337e-06, + "loss": 0.4708, + "step": 41687 + }, + { + "epoch": 1.07, + "learning_rate": 1.4920553116413997e-06, + "loss": 0.5195, + "step": 41688 + }, + { + "epoch": 1.07, + "learning_rate": 1.492031222553718e-06, + "loss": 0.6548, + "step": 41689 + }, + { + "epoch": 1.07, + "learning_rate": 1.4920071330893107e-06, + "loss": 0.5996, + "step": 41690 + }, + { + "epoch": 1.07, + "learning_rate": 1.4919830432481964e-06, + "loss": 0.6167, + "step": 41691 + }, + { + "epoch": 1.07, + "learning_rate": 1.491958953030393e-06, + "loss": 0.6445, + "step": 41692 + }, + { + "epoch": 1.07, + "learning_rate": 1.4919348624359195e-06, + "loss": 0.5537, + "step": 41693 + }, + { + "epoch": 1.07, + "learning_rate": 1.4919107714647937e-06, + "loss": 0.7063, + "step": 41694 + }, + { + "epoch": 1.07, + "learning_rate": 1.4918866801170346e-06, + "loss": 0.6523, + "step": 41695 + }, + { + "epoch": 1.07, + "learning_rate": 1.4918625883926608e-06, + "loss": 0.5083, + "step": 41696 + }, + { + "epoch": 1.07, + "learning_rate": 1.4918384962916903e-06, + "loss": 0.3982, + "step": 41697 + }, + { + "epoch": 1.07, + "learning_rate": 1.4918144038141413e-06, + "loss": 0.7842, + "step": 41698 + }, + { + "epoch": 1.07, + "learning_rate": 1.4917903109600331e-06, + "loss": 0.8232, + "step": 41699 + }, + { + "epoch": 1.07, + "learning_rate": 1.4917662177293835e-06, + "loss": 0.665, + "step": 41700 + }, + { + "epoch": 1.07, + "learning_rate": 1.4917421241222114e-06, + "loss": 0.6094, + "step": 41701 + }, + { + "epoch": 1.07, + "learning_rate": 1.4917180301385344e-06, + "loss": 0.7148, + "step": 41702 + }, + { + "epoch": 1.07, + "learning_rate": 1.491693935778372e-06, + "loss": 0.7246, + "step": 41703 + }, + { + "epoch": 1.07, + "learning_rate": 1.4916698410417418e-06, + "loss": 0.6582, + "step": 41704 + }, + { + "epoch": 1.07, + "learning_rate": 1.4916457459286629e-06, + "loss": 0.6943, + "step": 41705 + }, + { + "epoch": 1.07, + "learning_rate": 1.4916216504391531e-06, + "loss": 0.7539, + "step": 41706 + }, + { + "epoch": 1.07, + "learning_rate": 1.4915975545732317e-06, + "loss": 0.5225, + "step": 41707 + }, + { + "epoch": 1.07, + "learning_rate": 1.4915734583309164e-06, + "loss": 0.7275, + "step": 41708 + }, + { + "epoch": 1.07, + "learning_rate": 1.4915493617122258e-06, + "loss": 0.6611, + "step": 41709 + }, + { + "epoch": 1.07, + "learning_rate": 1.4915252647171785e-06, + "loss": 0.665, + "step": 41710 + }, + { + "epoch": 1.07, + "learning_rate": 1.491501167345793e-06, + "loss": 0.7246, + "step": 41711 + }, + { + "epoch": 1.07, + "learning_rate": 1.4914770695980876e-06, + "loss": 0.519, + "step": 41712 + }, + { + "epoch": 1.07, + "learning_rate": 1.491452971474081e-06, + "loss": 0.5977, + "step": 41713 + }, + { + "epoch": 1.07, + "learning_rate": 1.4914288729737912e-06, + "loss": 0.5356, + "step": 41714 + }, + { + "epoch": 1.07, + "learning_rate": 1.491404774097237e-06, + "loss": 0.5596, + "step": 41715 + }, + { + "epoch": 1.07, + "learning_rate": 1.4913806748444368e-06, + "loss": 0.8066, + "step": 41716 + }, + { + "epoch": 1.07, + "learning_rate": 1.4913565752154087e-06, + "loss": 0.5991, + "step": 41717 + }, + { + "epoch": 1.07, + "learning_rate": 1.491332475210172e-06, + "loss": 0.6074, + "step": 41718 + }, + { + "epoch": 1.07, + "learning_rate": 1.4913083748287441e-06, + "loss": 0.4719, + "step": 41719 + }, + { + "epoch": 1.07, + "learning_rate": 1.4912842740711441e-06, + "loss": 0.5559, + "step": 41720 + }, + { + "epoch": 1.07, + "learning_rate": 1.4912601729373906e-06, + "loss": 0.5442, + "step": 41721 + }, + { + "epoch": 1.07, + "learning_rate": 1.4912360714275019e-06, + "loss": 0.5618, + "step": 41722 + }, + { + "epoch": 1.07, + "learning_rate": 1.4912119695414958e-06, + "loss": 0.7275, + "step": 41723 + }, + { + "epoch": 1.07, + "learning_rate": 1.4911878672793916e-06, + "loss": 0.7773, + "step": 41724 + }, + { + "epoch": 1.07, + "learning_rate": 1.4911637646412072e-06, + "loss": 0.9468, + "step": 41725 + }, + { + "epoch": 1.07, + "learning_rate": 1.4911396616269615e-06, + "loss": 0.6167, + "step": 41726 + }, + { + "epoch": 1.07, + "learning_rate": 1.4911155582366728e-06, + "loss": 0.5669, + "step": 41727 + }, + { + "epoch": 1.07, + "learning_rate": 1.4910914544703594e-06, + "loss": 0.6309, + "step": 41728 + }, + { + "epoch": 1.07, + "learning_rate": 1.4910673503280395e-06, + "loss": 0.7197, + "step": 41729 + }, + { + "epoch": 1.07, + "learning_rate": 1.4910432458097324e-06, + "loss": 0.5957, + "step": 41730 + }, + { + "epoch": 1.07, + "learning_rate": 1.491019140915456e-06, + "loss": 0.6953, + "step": 41731 + }, + { + "epoch": 1.07, + "learning_rate": 1.4909950356452287e-06, + "loss": 0.6338, + "step": 41732 + }, + { + "epoch": 1.07, + "learning_rate": 1.4909709299990691e-06, + "loss": 0.791, + "step": 41733 + }, + { + "epoch": 1.07, + "learning_rate": 1.4909468239769959e-06, + "loss": 0.7412, + "step": 41734 + }, + { + "epoch": 1.07, + "learning_rate": 1.4909227175790266e-06, + "loss": 0.626, + "step": 41735 + }, + { + "epoch": 1.07, + "learning_rate": 1.490898610805181e-06, + "loss": 0.6621, + "step": 41736 + }, + { + "epoch": 1.07, + "learning_rate": 1.4908745036554766e-06, + "loss": 0.7148, + "step": 41737 + }, + { + "epoch": 1.07, + "learning_rate": 1.4908503961299324e-06, + "loss": 0.6089, + "step": 41738 + }, + { + "epoch": 1.07, + "learning_rate": 1.4908262882285664e-06, + "loss": 0.6401, + "step": 41739 + }, + { + "epoch": 1.07, + "learning_rate": 1.4908021799513975e-06, + "loss": 0.6309, + "step": 41740 + }, + { + "epoch": 1.07, + "learning_rate": 1.4907780712984438e-06, + "loss": 0.6626, + "step": 41741 + }, + { + "epoch": 1.07, + "learning_rate": 1.490753962269724e-06, + "loss": 0.5771, + "step": 41742 + }, + { + "epoch": 1.07, + "learning_rate": 1.490729852865256e-06, + "loss": 0.7539, + "step": 41743 + }, + { + "epoch": 1.07, + "learning_rate": 1.4907057430850592e-06, + "loss": 0.873, + "step": 41744 + }, + { + "epoch": 1.07, + "learning_rate": 1.4906816329291514e-06, + "loss": 0.5703, + "step": 41745 + }, + { + "epoch": 1.07, + "learning_rate": 1.4906575223975516e-06, + "loss": 0.7861, + "step": 41746 + }, + { + "epoch": 1.07, + "learning_rate": 1.4906334114902774e-06, + "loss": 0.6172, + "step": 41747 + }, + { + "epoch": 1.07, + "learning_rate": 1.4906093002073478e-06, + "loss": 0.4729, + "step": 41748 + }, + { + "epoch": 1.07, + "learning_rate": 1.4905851885487814e-06, + "loss": 0.7178, + "step": 41749 + }, + { + "epoch": 1.07, + "learning_rate": 1.4905610765145965e-06, + "loss": 0.665, + "step": 41750 + }, + { + "epoch": 1.07, + "learning_rate": 1.4905369641048116e-06, + "loss": 0.7197, + "step": 41751 + }, + { + "epoch": 1.07, + "learning_rate": 1.4905128513194448e-06, + "loss": 0.6836, + "step": 41752 + }, + { + "epoch": 1.07, + "learning_rate": 1.4904887381585152e-06, + "loss": 0.7153, + "step": 41753 + }, + { + "epoch": 1.07, + "learning_rate": 1.4904646246220404e-06, + "loss": 0.7803, + "step": 41754 + }, + { + "epoch": 1.07, + "learning_rate": 1.49044051071004e-06, + "loss": 0.751, + "step": 41755 + }, + { + "epoch": 1.07, + "learning_rate": 1.4904163964225315e-06, + "loss": 0.6709, + "step": 41756 + }, + { + "epoch": 1.07, + "learning_rate": 1.490392281759534e-06, + "loss": 0.5449, + "step": 41757 + }, + { + "epoch": 1.07, + "learning_rate": 1.4903681667210653e-06, + "loss": 0.5425, + "step": 41758 + }, + { + "epoch": 1.07, + "learning_rate": 1.4903440513071445e-06, + "loss": 0.5708, + "step": 41759 + }, + { + "epoch": 1.07, + "learning_rate": 1.4903199355177895e-06, + "loss": 0.5353, + "step": 41760 + }, + { + "epoch": 1.07, + "learning_rate": 1.4902958193530195e-06, + "loss": 0.7461, + "step": 41761 + }, + { + "epoch": 1.07, + "learning_rate": 1.4902717028128524e-06, + "loss": 0.8672, + "step": 41762 + }, + { + "epoch": 1.07, + "learning_rate": 1.4902475858973068e-06, + "loss": 0.7686, + "step": 41763 + }, + { + "epoch": 1.07, + "learning_rate": 1.490223468606401e-06, + "loss": 0.7188, + "step": 41764 + }, + { + "epoch": 1.07, + "learning_rate": 1.4901993509401535e-06, + "loss": 0.438, + "step": 41765 + }, + { + "epoch": 1.07, + "learning_rate": 1.4901752328985835e-06, + "loss": 0.5953, + "step": 41766 + }, + { + "epoch": 1.07, + "learning_rate": 1.4901511144817085e-06, + "loss": 0.6382, + "step": 41767 + }, + { + "epoch": 1.07, + "learning_rate": 1.4901269956895472e-06, + "loss": 0.5697, + "step": 41768 + }, + { + "epoch": 1.07, + "learning_rate": 1.4901028765221183e-06, + "loss": 0.5781, + "step": 41769 + }, + { + "epoch": 1.07, + "learning_rate": 1.4900787569794402e-06, + "loss": 0.4413, + "step": 41770 + }, + { + "epoch": 1.07, + "learning_rate": 1.4900546370615315e-06, + "loss": 0.7471, + "step": 41771 + }, + { + "epoch": 1.07, + "learning_rate": 1.4900305167684104e-06, + "loss": 0.7373, + "step": 41772 + }, + { + "epoch": 1.07, + "learning_rate": 1.4900063961000952e-06, + "loss": 0.6924, + "step": 41773 + }, + { + "epoch": 1.07, + "learning_rate": 1.489982275056605e-06, + "loss": 0.5596, + "step": 41774 + }, + { + "epoch": 1.07, + "learning_rate": 1.4899581536379575e-06, + "loss": 0.7139, + "step": 41775 + }, + { + "epoch": 1.07, + "learning_rate": 1.489934031844172e-06, + "loss": 0.5732, + "step": 41776 + }, + { + "epoch": 1.07, + "learning_rate": 1.4899099096752663e-06, + "loss": 0.5972, + "step": 41777 + }, + { + "epoch": 1.07, + "learning_rate": 1.4898857871312591e-06, + "loss": 0.7578, + "step": 41778 + }, + { + "epoch": 1.07, + "learning_rate": 1.4898616642121688e-06, + "loss": 0.748, + "step": 41779 + }, + { + "epoch": 1.07, + "learning_rate": 1.4898375409180142e-06, + "loss": 0.6963, + "step": 41780 + }, + { + "epoch": 1.07, + "learning_rate": 1.4898134172488136e-06, + "loss": 0.688, + "step": 41781 + }, + { + "epoch": 1.07, + "learning_rate": 1.4897892932045849e-06, + "loss": 0.7236, + "step": 41782 + }, + { + "epoch": 1.07, + "learning_rate": 1.4897651687853473e-06, + "loss": 0.627, + "step": 41783 + }, + { + "epoch": 1.07, + "learning_rate": 1.4897410439911192e-06, + "loss": 0.6582, + "step": 41784 + }, + { + "epoch": 1.07, + "learning_rate": 1.4897169188219185e-06, + "loss": 0.5158, + "step": 41785 + }, + { + "epoch": 1.07, + "learning_rate": 1.4896927932777645e-06, + "loss": 0.6021, + "step": 41786 + }, + { + "epoch": 1.07, + "learning_rate": 1.489668667358675e-06, + "loss": 0.4599, + "step": 41787 + }, + { + "epoch": 1.07, + "learning_rate": 1.4896445410646688e-06, + "loss": 0.8564, + "step": 41788 + }, + { + "epoch": 1.07, + "learning_rate": 1.4896204143957645e-06, + "loss": 0.708, + "step": 41789 + }, + { + "epoch": 1.07, + "learning_rate": 1.48959628735198e-06, + "loss": 0.7676, + "step": 41790 + }, + { + "epoch": 1.07, + "learning_rate": 1.4895721599333344e-06, + "loss": 0.5881, + "step": 41791 + }, + { + "epoch": 1.07, + "learning_rate": 1.4895480321398456e-06, + "loss": 0.6777, + "step": 41792 + }, + { + "epoch": 1.07, + "learning_rate": 1.489523903971533e-06, + "loss": 0.7793, + "step": 41793 + }, + { + "epoch": 1.07, + "learning_rate": 1.4894997754284138e-06, + "loss": 0.6895, + "step": 41794 + }, + { + "epoch": 1.07, + "learning_rate": 1.4894756465105074e-06, + "loss": 0.7148, + "step": 41795 + }, + { + "epoch": 1.07, + "learning_rate": 1.489451517217832e-06, + "loss": 0.8672, + "step": 41796 + }, + { + "epoch": 1.07, + "learning_rate": 1.489427387550406e-06, + "loss": 0.6826, + "step": 41797 + }, + { + "epoch": 1.07, + "learning_rate": 1.489403257508248e-06, + "loss": 0.5647, + "step": 41798 + }, + { + "epoch": 1.07, + "learning_rate": 1.4893791270913765e-06, + "loss": 0.5542, + "step": 41799 + }, + { + "epoch": 1.07, + "learning_rate": 1.4893549962998097e-06, + "loss": 0.4858, + "step": 41800 + }, + { + "epoch": 1.07, + "learning_rate": 1.4893308651335662e-06, + "loss": 0.6943, + "step": 41801 + }, + { + "epoch": 1.07, + "learning_rate": 1.489306733592665e-06, + "loss": 0.4407, + "step": 41802 + }, + { + "epoch": 1.07, + "learning_rate": 1.489282601677124e-06, + "loss": 0.2802, + "step": 41803 + }, + { + "epoch": 1.07, + "learning_rate": 1.4892584693869616e-06, + "loss": 0.7139, + "step": 41804 + }, + { + "epoch": 1.07, + "learning_rate": 1.4892343367221967e-06, + "loss": 0.6733, + "step": 41805 + }, + { + "epoch": 1.07, + "learning_rate": 1.4892102036828476e-06, + "loss": 0.751, + "step": 41806 + }, + { + "epoch": 1.07, + "learning_rate": 1.4891860702689325e-06, + "loss": 0.4595, + "step": 41807 + }, + { + "epoch": 1.07, + "learning_rate": 1.4891619364804702e-06, + "loss": 0.7134, + "step": 41808 + }, + { + "epoch": 1.07, + "learning_rate": 1.489137802317479e-06, + "loss": 0.6738, + "step": 41809 + }, + { + "epoch": 1.07, + "learning_rate": 1.4891136677799778e-06, + "loss": 0.7979, + "step": 41810 + }, + { + "epoch": 1.07, + "learning_rate": 1.4890895328679845e-06, + "loss": 0.7471, + "step": 41811 + }, + { + "epoch": 1.07, + "learning_rate": 1.489065397581518e-06, + "loss": 0.6904, + "step": 41812 + }, + { + "epoch": 1.07, + "learning_rate": 1.4890412619205964e-06, + "loss": 0.584, + "step": 41813 + }, + { + "epoch": 1.07, + "learning_rate": 1.4890171258852384e-06, + "loss": 0.835, + "step": 41814 + }, + { + "epoch": 1.07, + "learning_rate": 1.4889929894754626e-06, + "loss": 0.7681, + "step": 41815 + }, + { + "epoch": 1.07, + "learning_rate": 1.4889688526912875e-06, + "loss": 0.7705, + "step": 41816 + }, + { + "epoch": 1.07, + "learning_rate": 1.4889447155327311e-06, + "loss": 0.5972, + "step": 41817 + }, + { + "epoch": 1.07, + "learning_rate": 1.4889205779998123e-06, + "loss": 0.7344, + "step": 41818 + }, + { + "epoch": 1.07, + "learning_rate": 1.4888964400925494e-06, + "loss": 0.5732, + "step": 41819 + }, + { + "epoch": 1.07, + "learning_rate": 1.4888723018109615e-06, + "loss": 0.625, + "step": 41820 + }, + { + "epoch": 1.07, + "learning_rate": 1.488848163155066e-06, + "loss": 0.3882, + "step": 41821 + }, + { + "epoch": 1.07, + "learning_rate": 1.4888240241248822e-06, + "loss": 0.6313, + "step": 41822 + }, + { + "epoch": 1.07, + "learning_rate": 1.4887998847204282e-06, + "loss": 0.7354, + "step": 41823 + }, + { + "epoch": 1.07, + "learning_rate": 1.4887757449417227e-06, + "loss": 0.6567, + "step": 41824 + }, + { + "epoch": 1.07, + "learning_rate": 1.488751604788784e-06, + "loss": 0.6836, + "step": 41825 + }, + { + "epoch": 1.07, + "learning_rate": 1.4887274642616308e-06, + "loss": 0.7373, + "step": 41826 + }, + { + "epoch": 1.07, + "learning_rate": 1.4887033233602814e-06, + "loss": 0.7246, + "step": 41827 + }, + { + "epoch": 1.07, + "learning_rate": 1.4886791820847542e-06, + "loss": 0.8145, + "step": 41828 + }, + { + "epoch": 1.07, + "learning_rate": 1.4886550404350679e-06, + "loss": 0.6016, + "step": 41829 + }, + { + "epoch": 1.07, + "learning_rate": 1.488630898411241e-06, + "loss": 0.71, + "step": 41830 + }, + { + "epoch": 1.07, + "learning_rate": 1.4886067560132918e-06, + "loss": 0.8369, + "step": 41831 + }, + { + "epoch": 1.07, + "learning_rate": 1.4885826132412388e-06, + "loss": 0.7285, + "step": 41832 + }, + { + "epoch": 1.07, + "learning_rate": 1.4885584700951008e-06, + "loss": 0.7383, + "step": 41833 + }, + { + "epoch": 1.07, + "learning_rate": 1.4885343265748957e-06, + "loss": 0.5518, + "step": 41834 + }, + { + "epoch": 1.07, + "learning_rate": 1.4885101826806428e-06, + "loss": 0.6016, + "step": 41835 + }, + { + "epoch": 1.07, + "learning_rate": 1.4884860384123596e-06, + "loss": 0.7139, + "step": 41836 + }, + { + "epoch": 1.07, + "learning_rate": 1.4884618937700656e-06, + "loss": 0.7754, + "step": 41837 + }, + { + "epoch": 1.07, + "learning_rate": 1.4884377487537782e-06, + "loss": 0.707, + "step": 41838 + }, + { + "epoch": 1.07, + "learning_rate": 1.4884136033635168e-06, + "loss": 0.7881, + "step": 41839 + }, + { + "epoch": 1.07, + "learning_rate": 1.4883894575993e-06, + "loss": 0.3092, + "step": 41840 + }, + { + "epoch": 1.07, + "learning_rate": 1.4883653114611451e-06, + "loss": 0.7646, + "step": 41841 + }, + { + "epoch": 1.07, + "learning_rate": 1.4883411649490717e-06, + "loss": 0.6406, + "step": 41842 + }, + { + "epoch": 1.07, + "learning_rate": 1.488317018063098e-06, + "loss": 0.584, + "step": 41843 + }, + { + "epoch": 1.07, + "learning_rate": 1.4882928708032422e-06, + "loss": 0.7314, + "step": 41844 + }, + { + "epoch": 1.07, + "learning_rate": 1.488268723169523e-06, + "loss": 0.749, + "step": 41845 + }, + { + "epoch": 1.07, + "learning_rate": 1.488244575161959e-06, + "loss": 0.5767, + "step": 41846 + }, + { + "epoch": 1.07, + "learning_rate": 1.4882204267805688e-06, + "loss": 0.5923, + "step": 41847 + }, + { + "epoch": 1.07, + "learning_rate": 1.4881962780253702e-06, + "loss": 0.7012, + "step": 41848 + }, + { + "epoch": 1.07, + "learning_rate": 1.4881721288963825e-06, + "loss": 0.6514, + "step": 41849 + }, + { + "epoch": 1.07, + "learning_rate": 1.4881479793936235e-06, + "loss": 0.6177, + "step": 41850 + }, + { + "epoch": 1.07, + "learning_rate": 1.4881238295171123e-06, + "loss": 0.665, + "step": 41851 + }, + { + "epoch": 1.07, + "learning_rate": 1.4880996792668673e-06, + "loss": 0.6943, + "step": 41852 + }, + { + "epoch": 1.07, + "learning_rate": 1.4880755286429062e-06, + "loss": 0.5811, + "step": 41853 + }, + { + "epoch": 1.07, + "learning_rate": 1.4880513776452488e-06, + "loss": 0.8086, + "step": 41854 + }, + { + "epoch": 1.07, + "learning_rate": 1.4880272262739127e-06, + "loss": 0.5933, + "step": 41855 + }, + { + "epoch": 1.07, + "learning_rate": 1.4880030745289165e-06, + "loss": 0.6777, + "step": 41856 + }, + { + "epoch": 1.07, + "learning_rate": 1.4879789224102788e-06, + "loss": 0.5605, + "step": 41857 + }, + { + "epoch": 1.07, + "learning_rate": 1.487954769918018e-06, + "loss": 0.7393, + "step": 41858 + }, + { + "epoch": 1.07, + "learning_rate": 1.4879306170521526e-06, + "loss": 0.5464, + "step": 41859 + }, + { + "epoch": 1.07, + "learning_rate": 1.4879064638127017e-06, + "loss": 0.5249, + "step": 41860 + }, + { + "epoch": 1.07, + "learning_rate": 1.4878823101996827e-06, + "loss": 0.6099, + "step": 41861 + }, + { + "epoch": 1.07, + "learning_rate": 1.487858156213115e-06, + "loss": 0.6611, + "step": 41862 + }, + { + "epoch": 1.07, + "learning_rate": 1.4878340018530161e-06, + "loss": 0.7842, + "step": 41863 + }, + { + "epoch": 1.07, + "learning_rate": 1.4878098471194058e-06, + "loss": 0.6885, + "step": 41864 + }, + { + "epoch": 1.07, + "learning_rate": 1.4877856920123018e-06, + "loss": 0.7197, + "step": 41865 + }, + { + "epoch": 1.07, + "learning_rate": 1.4877615365317228e-06, + "loss": 0.4634, + "step": 41866 + }, + { + "epoch": 1.07, + "learning_rate": 1.487737380677687e-06, + "loss": 0.5483, + "step": 41867 + }, + { + "epoch": 1.07, + "learning_rate": 1.4877132244502131e-06, + "loss": 0.625, + "step": 41868 + }, + { + "epoch": 1.07, + "learning_rate": 1.4876890678493195e-06, + "loss": 0.6201, + "step": 41869 + }, + { + "epoch": 1.07, + "learning_rate": 1.4876649108750252e-06, + "loss": 0.709, + "step": 41870 + }, + { + "epoch": 1.07, + "learning_rate": 1.4876407535273482e-06, + "loss": 0.6133, + "step": 41871 + }, + { + "epoch": 1.07, + "learning_rate": 1.4876165958063067e-06, + "loss": 0.7041, + "step": 41872 + }, + { + "epoch": 1.07, + "learning_rate": 1.48759243771192e-06, + "loss": 0.6362, + "step": 41873 + }, + { + "epoch": 1.07, + "learning_rate": 1.487568279244206e-06, + "loss": 0.751, + "step": 41874 + }, + { + "epoch": 1.07, + "learning_rate": 1.4875441204031838e-06, + "loss": 0.5938, + "step": 41875 + }, + { + "epoch": 1.07, + "learning_rate": 1.4875199611888708e-06, + "loss": 0.6616, + "step": 41876 + }, + { + "epoch": 1.07, + "learning_rate": 1.4874958016012865e-06, + "loss": 0.6821, + "step": 41877 + }, + { + "epoch": 1.07, + "learning_rate": 1.4874716416404493e-06, + "loss": 0.7148, + "step": 41878 + }, + { + "epoch": 1.07, + "learning_rate": 1.4874474813063772e-06, + "loss": 0.8066, + "step": 41879 + }, + { + "epoch": 1.07, + "learning_rate": 1.487423320599089e-06, + "loss": 0.6899, + "step": 41880 + }, + { + "epoch": 1.07, + "learning_rate": 1.4873991595186035e-06, + "loss": 0.5864, + "step": 41881 + }, + { + "epoch": 1.07, + "learning_rate": 1.4873749980649385e-06, + "loss": 0.7178, + "step": 41882 + }, + { + "epoch": 1.07, + "learning_rate": 1.4873508362381131e-06, + "loss": 0.6277, + "step": 41883 + }, + { + "epoch": 1.07, + "learning_rate": 1.4873266740381454e-06, + "loss": 0.6597, + "step": 41884 + }, + { + "epoch": 1.07, + "learning_rate": 1.4873025114650544e-06, + "loss": 0.7637, + "step": 41885 + }, + { + "epoch": 1.07, + "learning_rate": 1.4872783485188578e-06, + "loss": 0.5664, + "step": 41886 + }, + { + "epoch": 1.07, + "learning_rate": 1.4872541851995748e-06, + "loss": 0.5452, + "step": 41887 + }, + { + "epoch": 1.07, + "learning_rate": 1.4872300215072235e-06, + "loss": 0.6904, + "step": 41888 + }, + { + "epoch": 1.07, + "learning_rate": 1.4872058574418229e-06, + "loss": 0.3972, + "step": 41889 + }, + { + "epoch": 1.07, + "learning_rate": 1.4871816930033912e-06, + "loss": 0.6895, + "step": 41890 + }, + { + "epoch": 1.07, + "learning_rate": 1.4871575281919464e-06, + "loss": 0.4902, + "step": 41891 + }, + { + "epoch": 1.07, + "learning_rate": 1.487133363007508e-06, + "loss": 0.5049, + "step": 41892 + }, + { + "epoch": 1.07, + "learning_rate": 1.4871091974500938e-06, + "loss": 0.7354, + "step": 41893 + }, + { + "epoch": 1.07, + "learning_rate": 1.4870850315197224e-06, + "loss": 0.4302, + "step": 41894 + }, + { + "epoch": 1.07, + "learning_rate": 1.4870608652164122e-06, + "loss": 0.7803, + "step": 41895 + }, + { + "epoch": 1.07, + "learning_rate": 1.4870366985401824e-06, + "loss": 0.5481, + "step": 41896 + }, + { + "epoch": 1.07, + "learning_rate": 1.4870125314910506e-06, + "loss": 0.6328, + "step": 41897 + }, + { + "epoch": 1.07, + "learning_rate": 1.486988364069036e-06, + "loss": 0.6509, + "step": 41898 + }, + { + "epoch": 1.07, + "learning_rate": 1.4869641962741565e-06, + "loss": 0.6309, + "step": 41899 + }, + { + "epoch": 1.07, + "learning_rate": 1.486940028106431e-06, + "loss": 0.7998, + "step": 41900 + }, + { + "epoch": 1.07, + "learning_rate": 1.4869158595658779e-06, + "loss": 0.6553, + "step": 41901 + }, + { + "epoch": 1.07, + "learning_rate": 1.4868916906525157e-06, + "loss": 0.4331, + "step": 41902 + }, + { + "epoch": 1.07, + "learning_rate": 1.486867521366363e-06, + "loss": 0.8115, + "step": 41903 + }, + { + "epoch": 1.07, + "learning_rate": 1.4868433517074382e-06, + "loss": 0.5479, + "step": 41904 + }, + { + "epoch": 1.07, + "learning_rate": 1.4868191816757598e-06, + "loss": 0.6699, + "step": 41905 + }, + { + "epoch": 1.07, + "learning_rate": 1.4867950112713465e-06, + "loss": 0.5781, + "step": 41906 + }, + { + "epoch": 1.07, + "learning_rate": 1.4867708404942164e-06, + "loss": 0.708, + "step": 41907 + }, + { + "epoch": 1.07, + "learning_rate": 1.4867466693443884e-06, + "loss": 0.7036, + "step": 41908 + }, + { + "epoch": 1.07, + "learning_rate": 1.4867224978218808e-06, + "loss": 0.6748, + "step": 41909 + }, + { + "epoch": 1.07, + "learning_rate": 1.4866983259267123e-06, + "loss": 0.7891, + "step": 41910 + }, + { + "epoch": 1.07, + "learning_rate": 1.486674153658901e-06, + "loss": 0.5693, + "step": 41911 + }, + { + "epoch": 1.07, + "learning_rate": 1.486649981018466e-06, + "loss": 0.7119, + "step": 41912 + }, + { + "epoch": 1.07, + "learning_rate": 1.4866258080054254e-06, + "loss": 0.7773, + "step": 41913 + }, + { + "epoch": 1.07, + "learning_rate": 1.4866016346197976e-06, + "loss": 0.7324, + "step": 41914 + }, + { + "epoch": 1.07, + "learning_rate": 1.4865774608616013e-06, + "loss": 0.6567, + "step": 41915 + }, + { + "epoch": 1.07, + "learning_rate": 1.4865532867308552e-06, + "loss": 0.7095, + "step": 41916 + }, + { + "epoch": 1.07, + "learning_rate": 1.4865291122275777e-06, + "loss": 0.623, + "step": 41917 + }, + { + "epoch": 1.07, + "learning_rate": 1.4865049373517869e-06, + "loss": 0.6055, + "step": 41918 + }, + { + "epoch": 1.07, + "learning_rate": 1.4864807621035019e-06, + "loss": 0.6709, + "step": 41919 + }, + { + "epoch": 1.07, + "learning_rate": 1.4864565864827407e-06, + "loss": 0.8232, + "step": 41920 + }, + { + "epoch": 1.07, + "learning_rate": 1.4864324104895225e-06, + "loss": 0.6414, + "step": 41921 + }, + { + "epoch": 1.07, + "learning_rate": 1.4864082341238649e-06, + "loss": 0.707, + "step": 41922 + }, + { + "epoch": 1.07, + "learning_rate": 1.486384057385787e-06, + "loss": 0.5718, + "step": 41923 + }, + { + "epoch": 1.07, + "learning_rate": 1.4863598802753073e-06, + "loss": 0.8096, + "step": 41924 + }, + { + "epoch": 1.07, + "learning_rate": 1.4863357027924444e-06, + "loss": 0.6094, + "step": 41925 + }, + { + "epoch": 1.07, + "learning_rate": 1.4863115249372163e-06, + "loss": 0.6895, + "step": 41926 + }, + { + "epoch": 1.07, + "learning_rate": 1.4862873467096418e-06, + "loss": 0.5781, + "step": 41927 + }, + { + "epoch": 1.07, + "learning_rate": 1.4862631681097396e-06, + "loss": 0.6777, + "step": 41928 + }, + { + "epoch": 1.07, + "learning_rate": 1.486238989137528e-06, + "loss": 0.5205, + "step": 41929 + }, + { + "epoch": 1.07, + "learning_rate": 1.4862148097930256e-06, + "loss": 0.7627, + "step": 41930 + }, + { + "epoch": 1.07, + "learning_rate": 1.4861906300762507e-06, + "loss": 0.7305, + "step": 41931 + }, + { + "epoch": 1.07, + "learning_rate": 1.4861664499872222e-06, + "loss": 0.7354, + "step": 41932 + }, + { + "epoch": 1.07, + "learning_rate": 1.4861422695259585e-06, + "loss": 0.5077, + "step": 41933 + }, + { + "epoch": 1.07, + "learning_rate": 1.4861180886924776e-06, + "loss": 0.7119, + "step": 41934 + }, + { + "epoch": 1.07, + "learning_rate": 1.4860939074867988e-06, + "loss": 0.8135, + "step": 41935 + }, + { + "epoch": 1.07, + "learning_rate": 1.48606972590894e-06, + "loss": 0.6768, + "step": 41936 + }, + { + "epoch": 1.07, + "learning_rate": 1.4860455439589203e-06, + "loss": 0.7373, + "step": 41937 + }, + { + "epoch": 1.07, + "learning_rate": 1.4860213616367576e-06, + "loss": 0.6255, + "step": 41938 + }, + { + "epoch": 1.07, + "learning_rate": 1.4859971789424709e-06, + "loss": 0.6875, + "step": 41939 + }, + { + "epoch": 1.07, + "learning_rate": 1.4859729958760784e-06, + "loss": 0.6504, + "step": 41940 + }, + { + "epoch": 1.07, + "learning_rate": 1.4859488124375985e-06, + "loss": 0.6162, + "step": 41941 + }, + { + "epoch": 1.07, + "learning_rate": 1.4859246286270502e-06, + "loss": 0.7881, + "step": 41942 + }, + { + "epoch": 1.08, + "learning_rate": 1.4859004444444515e-06, + "loss": 0.6006, + "step": 41943 + }, + { + "epoch": 1.08, + "learning_rate": 1.4858762598898214e-06, + "loss": 0.583, + "step": 41944 + }, + { + "epoch": 1.08, + "learning_rate": 1.4858520749631781e-06, + "loss": 0.4937, + "step": 41945 + }, + { + "epoch": 1.08, + "learning_rate": 1.4858278896645404e-06, + "loss": 0.7861, + "step": 41946 + }, + { + "epoch": 1.08, + "learning_rate": 1.4858037039939265e-06, + "loss": 0.7056, + "step": 41947 + }, + { + "epoch": 1.08, + "learning_rate": 1.485779517951355e-06, + "loss": 0.6709, + "step": 41948 + }, + { + "epoch": 1.08, + "learning_rate": 1.4857553315368443e-06, + "loss": 0.6367, + "step": 41949 + }, + { + "epoch": 1.08, + "learning_rate": 1.4857311447504135e-06, + "loss": 0.769, + "step": 41950 + }, + { + "epoch": 1.08, + "learning_rate": 1.4857069575920804e-06, + "loss": 0.4055, + "step": 41951 + }, + { + "epoch": 1.08, + "learning_rate": 1.4856827700618639e-06, + "loss": 0.582, + "step": 41952 + }, + { + "epoch": 1.08, + "learning_rate": 1.4856585821597823e-06, + "loss": 0.5582, + "step": 41953 + }, + { + "epoch": 1.08, + "learning_rate": 1.4856343938858545e-06, + "loss": 0.7192, + "step": 41954 + }, + { + "epoch": 1.08, + "learning_rate": 1.4856102052400986e-06, + "loss": 0.6763, + "step": 41955 + }, + { + "epoch": 1.08, + "learning_rate": 1.4855860162225332e-06, + "loss": 0.6709, + "step": 41956 + }, + { + "epoch": 1.08, + "learning_rate": 1.485561826833177e-06, + "loss": 0.7031, + "step": 41957 + }, + { + "epoch": 1.08, + "learning_rate": 1.4855376370720487e-06, + "loss": 0.6807, + "step": 41958 + }, + { + "epoch": 1.08, + "learning_rate": 1.485513446939166e-06, + "loss": 0.5718, + "step": 41959 + }, + { + "epoch": 1.08, + "learning_rate": 1.4854892564345484e-06, + "loss": 0.7236, + "step": 41960 + }, + { + "epoch": 1.08, + "learning_rate": 1.485465065558214e-06, + "loss": 0.8721, + "step": 41961 + }, + { + "epoch": 1.08, + "learning_rate": 1.4854408743101812e-06, + "loss": 0.6895, + "step": 41962 + }, + { + "epoch": 1.08, + "learning_rate": 1.4854166826904688e-06, + "loss": 0.6514, + "step": 41963 + }, + { + "epoch": 1.08, + "learning_rate": 1.485392490699095e-06, + "loss": 0.7373, + "step": 41964 + }, + { + "epoch": 1.08, + "learning_rate": 1.4853682983360787e-06, + "loss": 0.563, + "step": 41965 + }, + { + "epoch": 1.08, + "learning_rate": 1.4853441056014376e-06, + "loss": 0.6455, + "step": 41966 + }, + { + "epoch": 1.08, + "learning_rate": 1.4853199124951916e-06, + "loss": 0.4392, + "step": 41967 + }, + { + "epoch": 1.08, + "learning_rate": 1.4852957190173578e-06, + "loss": 0.5444, + "step": 41968 + }, + { + "epoch": 1.08, + "learning_rate": 1.485271525167956e-06, + "loss": 0.5957, + "step": 41969 + }, + { + "epoch": 1.08, + "learning_rate": 1.4852473309470037e-06, + "loss": 0.625, + "step": 41970 + }, + { + "epoch": 1.08, + "learning_rate": 1.4852231363545202e-06, + "loss": 0.7441, + "step": 41971 + }, + { + "epoch": 1.08, + "learning_rate": 1.4851989413905233e-06, + "loss": 0.6733, + "step": 41972 + }, + { + "epoch": 1.08, + "learning_rate": 1.4851747460550322e-06, + "loss": 0.5386, + "step": 41973 + }, + { + "epoch": 1.08, + "learning_rate": 1.4851505503480646e-06, + "loss": 0.7373, + "step": 41974 + }, + { + "epoch": 1.08, + "learning_rate": 1.4851263542696399e-06, + "loss": 0.8125, + "step": 41975 + }, + { + "epoch": 1.08, + "learning_rate": 1.4851021578197761e-06, + "loss": 0.5791, + "step": 41976 + }, + { + "epoch": 1.08, + "learning_rate": 1.4850779609984923e-06, + "loss": 0.4792, + "step": 41977 + }, + { + "epoch": 1.08, + "learning_rate": 1.485053763805806e-06, + "loss": 0.7393, + "step": 41978 + }, + { + "epoch": 1.08, + "learning_rate": 1.4850295662417367e-06, + "loss": 0.6597, + "step": 41979 + }, + { + "epoch": 1.08, + "learning_rate": 1.4850053683063023e-06, + "loss": 0.5229, + "step": 41980 + }, + { + "epoch": 1.08, + "learning_rate": 1.484981169999522e-06, + "loss": 0.5625, + "step": 41981 + }, + { + "epoch": 1.08, + "learning_rate": 1.4849569713214137e-06, + "loss": 0.6738, + "step": 41982 + }, + { + "epoch": 1.08, + "learning_rate": 1.4849327722719963e-06, + "loss": 0.7969, + "step": 41983 + }, + { + "epoch": 1.08, + "learning_rate": 1.4849085728512877e-06, + "loss": 0.6299, + "step": 41984 + }, + { + "epoch": 1.08, + "learning_rate": 1.4848843730593073e-06, + "loss": 0.5039, + "step": 41985 + }, + { + "epoch": 1.08, + "learning_rate": 1.4848601728960733e-06, + "loss": 0.6055, + "step": 41986 + }, + { + "epoch": 1.08, + "learning_rate": 1.4848359723616037e-06, + "loss": 0.5308, + "step": 41987 + }, + { + "epoch": 1.08, + "learning_rate": 1.4848117714559178e-06, + "loss": 0.916, + "step": 41988 + }, + { + "epoch": 1.08, + "learning_rate": 1.4847875701790337e-06, + "loss": 0.7119, + "step": 41989 + }, + { + "epoch": 1.08, + "learning_rate": 1.4847633685309707e-06, + "loss": 0.4678, + "step": 41990 + }, + { + "epoch": 1.08, + "learning_rate": 1.484739166511746e-06, + "loss": 0.6589, + "step": 41991 + }, + { + "epoch": 1.08, + "learning_rate": 1.484714964121379e-06, + "loss": 0.6626, + "step": 41992 + }, + { + "epoch": 1.08, + "learning_rate": 1.4846907613598876e-06, + "loss": 0.5366, + "step": 41993 + }, + { + "epoch": 1.08, + "learning_rate": 1.4846665582272913e-06, + "loss": 0.8652, + "step": 41994 + }, + { + "epoch": 1.08, + "learning_rate": 1.484642354723608e-06, + "loss": 0.5137, + "step": 41995 + }, + { + "epoch": 1.08, + "learning_rate": 1.4846181508488565e-06, + "loss": 0.8223, + "step": 41996 + }, + { + "epoch": 1.08, + "learning_rate": 1.4845939466030548e-06, + "loss": 0.6245, + "step": 41997 + }, + { + "epoch": 1.08, + "learning_rate": 1.484569741986222e-06, + "loss": 0.561, + "step": 41998 + }, + { + "epoch": 1.08, + "learning_rate": 1.484545536998376e-06, + "loss": 0.4436, + "step": 41999 + }, + { + "epoch": 1.08, + "learning_rate": 1.4845213316395367e-06, + "loss": 0.7236, + "step": 42000 + }, + { + "epoch": 1.08, + "learning_rate": 1.484497125909721e-06, + "loss": 0.6636, + "step": 42001 + }, + { + "epoch": 1.08, + "learning_rate": 1.4844729198089483e-06, + "loss": 0.7354, + "step": 42002 + }, + { + "epoch": 1.08, + "learning_rate": 1.4844487133372368e-06, + "loss": 0.6479, + "step": 42003 + }, + { + "epoch": 1.08, + "learning_rate": 1.4844245064946055e-06, + "loss": 0.7495, + "step": 42004 + }, + { + "epoch": 1.08, + "learning_rate": 1.4844002992810725e-06, + "loss": 0.6724, + "step": 42005 + }, + { + "epoch": 1.08, + "learning_rate": 1.4843760916966561e-06, + "loss": 0.6689, + "step": 42006 + }, + { + "epoch": 1.08, + "learning_rate": 1.4843518837413757e-06, + "loss": 0.8955, + "step": 42007 + }, + { + "epoch": 1.08, + "learning_rate": 1.484327675415249e-06, + "loss": 0.7998, + "step": 42008 + }, + { + "epoch": 1.08, + "learning_rate": 1.4843034667182952e-06, + "loss": 0.6401, + "step": 42009 + }, + { + "epoch": 1.08, + "learning_rate": 1.4842792576505323e-06, + "loss": 0.7734, + "step": 42010 + }, + { + "epoch": 1.08, + "learning_rate": 1.484255048211979e-06, + "loss": 0.7725, + "step": 42011 + }, + { + "epoch": 1.08, + "learning_rate": 1.484230838402654e-06, + "loss": 0.5476, + "step": 42012 + }, + { + "epoch": 1.08, + "learning_rate": 1.4842066282225755e-06, + "loss": 0.751, + "step": 42013 + }, + { + "epoch": 1.08, + "learning_rate": 1.4841824176717625e-06, + "loss": 0.8242, + "step": 42014 + }, + { + "epoch": 1.08, + "learning_rate": 1.4841582067502333e-06, + "loss": 0.752, + "step": 42015 + }, + { + "epoch": 1.08, + "learning_rate": 1.4841339954580063e-06, + "loss": 0.6924, + "step": 42016 + }, + { + "epoch": 1.08, + "learning_rate": 1.4841097837951002e-06, + "loss": 0.6143, + "step": 42017 + }, + { + "epoch": 1.08, + "learning_rate": 1.4840855717615334e-06, + "loss": 0.7041, + "step": 42018 + }, + { + "epoch": 1.08, + "learning_rate": 1.4840613593573245e-06, + "loss": 0.6943, + "step": 42019 + }, + { + "epoch": 1.08, + "learning_rate": 1.4840371465824925e-06, + "loss": 0.5537, + "step": 42020 + }, + { + "epoch": 1.08, + "learning_rate": 1.484012933437055e-06, + "loss": 0.5405, + "step": 42021 + }, + { + "epoch": 1.08, + "learning_rate": 1.4839887199210312e-06, + "loss": 0.6116, + "step": 42022 + }, + { + "epoch": 1.08, + "learning_rate": 1.4839645060344396e-06, + "loss": 0.6309, + "step": 42023 + }, + { + "epoch": 1.08, + "learning_rate": 1.4839402917772985e-06, + "loss": 0.6709, + "step": 42024 + }, + { + "epoch": 1.08, + "learning_rate": 1.4839160771496268e-06, + "loss": 0.6973, + "step": 42025 + }, + { + "epoch": 1.08, + "learning_rate": 1.4838918621514427e-06, + "loss": 0.6455, + "step": 42026 + }, + { + "epoch": 1.08, + "learning_rate": 1.4838676467827648e-06, + "loss": 0.6475, + "step": 42027 + }, + { + "epoch": 1.08, + "learning_rate": 1.4838434310436116e-06, + "loss": 0.708, + "step": 42028 + }, + { + "epoch": 1.08, + "learning_rate": 1.483819214934002e-06, + "loss": 0.4229, + "step": 42029 + }, + { + "epoch": 1.08, + "learning_rate": 1.4837949984539541e-06, + "loss": 0.5586, + "step": 42030 + }, + { + "epoch": 1.08, + "learning_rate": 1.4837707816034865e-06, + "loss": 0.6401, + "step": 42031 + }, + { + "epoch": 1.08, + "learning_rate": 1.483746564382618e-06, + "loss": 0.5293, + "step": 42032 + }, + { + "epoch": 1.08, + "learning_rate": 1.4837223467913668e-06, + "loss": 0.7139, + "step": 42033 + }, + { + "epoch": 1.08, + "learning_rate": 1.4836981288297519e-06, + "loss": 0.6265, + "step": 42034 + }, + { + "epoch": 1.08, + "learning_rate": 1.4836739104977916e-06, + "loss": 0.6833, + "step": 42035 + }, + { + "epoch": 1.08, + "learning_rate": 1.4836496917955044e-06, + "loss": 0.6328, + "step": 42036 + }, + { + "epoch": 1.08, + "learning_rate": 1.4836254727229087e-06, + "loss": 0.6831, + "step": 42037 + }, + { + "epoch": 1.08, + "learning_rate": 1.4836012532800232e-06, + "loss": 0.5681, + "step": 42038 + }, + { + "epoch": 1.08, + "learning_rate": 1.4835770334668664e-06, + "loss": 0.5815, + "step": 42039 + }, + { + "epoch": 1.08, + "learning_rate": 1.4835528132834576e-06, + "loss": 0.6621, + "step": 42040 + }, + { + "epoch": 1.08, + "learning_rate": 1.4835285927298138e-06, + "loss": 0.5713, + "step": 42041 + }, + { + "epoch": 1.08, + "learning_rate": 1.4835043718059548e-06, + "loss": 0.5444, + "step": 42042 + }, + { + "epoch": 1.08, + "learning_rate": 1.4834801505118985e-06, + "loss": 0.6719, + "step": 42043 + }, + { + "epoch": 1.08, + "learning_rate": 1.483455928847664e-06, + "loss": 0.4604, + "step": 42044 + }, + { + "epoch": 1.08, + "learning_rate": 1.4834317068132692e-06, + "loss": 0.6011, + "step": 42045 + }, + { + "epoch": 1.08, + "learning_rate": 1.4834074844087335e-06, + "loss": 0.7402, + "step": 42046 + }, + { + "epoch": 1.08, + "learning_rate": 1.4833832616340743e-06, + "loss": 0.6909, + "step": 42047 + }, + { + "epoch": 1.08, + "learning_rate": 1.4833590384893112e-06, + "loss": 0.6289, + "step": 42048 + }, + { + "epoch": 1.08, + "learning_rate": 1.4833348149744618e-06, + "loss": 0.5894, + "step": 42049 + }, + { + "epoch": 1.08, + "learning_rate": 1.4833105910895456e-06, + "loss": 0.7314, + "step": 42050 + }, + { + "epoch": 1.08, + "learning_rate": 1.4832863668345804e-06, + "loss": 0.5645, + "step": 42051 + }, + { + "epoch": 1.08, + "learning_rate": 1.4832621422095853e-06, + "loss": 0.7578, + "step": 42052 + }, + { + "epoch": 1.08, + "learning_rate": 1.4832379172145785e-06, + "loss": 0.7197, + "step": 42053 + }, + { + "epoch": 1.08, + "learning_rate": 1.4832136918495785e-06, + "loss": 0.554, + "step": 42054 + }, + { + "epoch": 1.08, + "learning_rate": 1.4831894661146046e-06, + "loss": 0.4246, + "step": 42055 + }, + { + "epoch": 1.08, + "learning_rate": 1.483165240009674e-06, + "loss": 0.7476, + "step": 42056 + }, + { + "epoch": 1.08, + "learning_rate": 1.4831410135348063e-06, + "loss": 0.7568, + "step": 42057 + }, + { + "epoch": 1.08, + "learning_rate": 1.4831167866900197e-06, + "loss": 0.7168, + "step": 42058 + }, + { + "epoch": 1.08, + "learning_rate": 1.483092559475333e-06, + "loss": 0.7422, + "step": 42059 + }, + { + "epoch": 1.08, + "learning_rate": 1.4830683318907644e-06, + "loss": 0.7275, + "step": 42060 + }, + { + "epoch": 1.08, + "learning_rate": 1.4830441039363327e-06, + "loss": 0.7871, + "step": 42061 + }, + { + "epoch": 1.08, + "learning_rate": 1.4830198756120559e-06, + "loss": 0.6201, + "step": 42062 + }, + { + "epoch": 1.08, + "learning_rate": 1.4829956469179534e-06, + "loss": 0.5591, + "step": 42063 + }, + { + "epoch": 1.08, + "learning_rate": 1.4829714178540432e-06, + "loss": 0.5518, + "step": 42064 + }, + { + "epoch": 1.08, + "learning_rate": 1.4829471884203442e-06, + "loss": 0.5908, + "step": 42065 + }, + { + "epoch": 1.08, + "learning_rate": 1.4829229586168743e-06, + "loss": 0.7529, + "step": 42066 + }, + { + "epoch": 1.08, + "learning_rate": 1.4828987284436528e-06, + "loss": 0.6689, + "step": 42067 + }, + { + "epoch": 1.08, + "learning_rate": 1.4828744979006977e-06, + "loss": 0.7168, + "step": 42068 + }, + { + "epoch": 1.08, + "learning_rate": 1.4828502669880284e-06, + "loss": 0.7227, + "step": 42069 + }, + { + "epoch": 1.08, + "learning_rate": 1.4828260357056624e-06, + "loss": 0.707, + "step": 42070 + }, + { + "epoch": 1.08, + "learning_rate": 1.4828018040536185e-06, + "loss": 0.6108, + "step": 42071 + }, + { + "epoch": 1.08, + "learning_rate": 1.482777572031916e-06, + "loss": 0.479, + "step": 42072 + }, + { + "epoch": 1.08, + "learning_rate": 1.4827533396405727e-06, + "loss": 0.5481, + "step": 42073 + }, + { + "epoch": 1.08, + "learning_rate": 1.482729106879607e-06, + "loss": 0.6455, + "step": 42074 + }, + { + "epoch": 1.08, + "learning_rate": 1.4827048737490382e-06, + "loss": 0.6067, + "step": 42075 + }, + { + "epoch": 1.08, + "learning_rate": 1.4826806402488844e-06, + "loss": 0.668, + "step": 42076 + }, + { + "epoch": 1.08, + "learning_rate": 1.4826564063791642e-06, + "loss": 0.6167, + "step": 42077 + }, + { + "epoch": 1.08, + "learning_rate": 1.4826321721398962e-06, + "loss": 0.5781, + "step": 42078 + }, + { + "epoch": 1.08, + "learning_rate": 1.4826079375310989e-06, + "loss": 0.7344, + "step": 42079 + }, + { + "epoch": 1.08, + "learning_rate": 1.4825837025527912e-06, + "loss": 0.7158, + "step": 42080 + }, + { + "epoch": 1.08, + "learning_rate": 1.4825594672049911e-06, + "loss": 0.5781, + "step": 42081 + }, + { + "epoch": 1.08, + "learning_rate": 1.4825352314877173e-06, + "loss": 0.6982, + "step": 42082 + }, + { + "epoch": 1.08, + "learning_rate": 1.4825109954009885e-06, + "loss": 0.7451, + "step": 42083 + }, + { + "epoch": 1.08, + "learning_rate": 1.4824867589448234e-06, + "loss": 0.6123, + "step": 42084 + }, + { + "epoch": 1.08, + "learning_rate": 1.4824625221192402e-06, + "loss": 0.5974, + "step": 42085 + }, + { + "epoch": 1.08, + "learning_rate": 1.4824382849242575e-06, + "loss": 0.6653, + "step": 42086 + }, + { + "epoch": 1.08, + "learning_rate": 1.4824140473598944e-06, + "loss": 0.8574, + "step": 42087 + }, + { + "epoch": 1.08, + "learning_rate": 1.4823898094261687e-06, + "loss": 0.7417, + "step": 42088 + }, + { + "epoch": 1.08, + "learning_rate": 1.4823655711230994e-06, + "loss": 0.7031, + "step": 42089 + }, + { + "epoch": 1.08, + "learning_rate": 1.482341332450705e-06, + "loss": 0.603, + "step": 42090 + }, + { + "epoch": 1.08, + "learning_rate": 1.482317093409004e-06, + "loss": 0.6875, + "step": 42091 + }, + { + "epoch": 1.08, + "learning_rate": 1.482292853998015e-06, + "loss": 0.6572, + "step": 42092 + }, + { + "epoch": 1.08, + "learning_rate": 1.4822686142177566e-06, + "loss": 0.6924, + "step": 42093 + }, + { + "epoch": 1.08, + "learning_rate": 1.4822443740682471e-06, + "loss": 0.6221, + "step": 42094 + }, + { + "epoch": 1.08, + "learning_rate": 1.4822201335495055e-06, + "loss": 0.5801, + "step": 42095 + }, + { + "epoch": 1.08, + "learning_rate": 1.4821958926615498e-06, + "loss": 0.6938, + "step": 42096 + }, + { + "epoch": 1.08, + "learning_rate": 1.482171651404399e-06, + "loss": 0.6038, + "step": 42097 + }, + { + "epoch": 1.08, + "learning_rate": 1.4821474097780714e-06, + "loss": 0.5703, + "step": 42098 + }, + { + "epoch": 1.08, + "learning_rate": 1.4821231677825863e-06, + "loss": 0.6289, + "step": 42099 + }, + { + "epoch": 1.08, + "learning_rate": 1.4820989254179612e-06, + "loss": 0.6636, + "step": 42100 + }, + { + "epoch": 1.08, + "learning_rate": 1.4820746826842152e-06, + "loss": 0.6084, + "step": 42101 + }, + { + "epoch": 1.08, + "learning_rate": 1.4820504395813666e-06, + "loss": 0.5149, + "step": 42102 + }, + { + "epoch": 1.08, + "learning_rate": 1.4820261961094342e-06, + "loss": 0.5894, + "step": 42103 + }, + { + "epoch": 1.08, + "learning_rate": 1.4820019522684369e-06, + "loss": 0.7715, + "step": 42104 + }, + { + "epoch": 1.08, + "learning_rate": 1.4819777080583925e-06, + "loss": 0.792, + "step": 42105 + }, + { + "epoch": 1.08, + "learning_rate": 1.48195346347932e-06, + "loss": 0.709, + "step": 42106 + }, + { + "epoch": 1.08, + "learning_rate": 1.481929218531238e-06, + "loss": 0.6616, + "step": 42107 + }, + { + "epoch": 1.08, + "learning_rate": 1.4819049732141645e-06, + "loss": 0.6865, + "step": 42108 + }, + { + "epoch": 1.08, + "learning_rate": 1.4818807275281193e-06, + "loss": 0.7334, + "step": 42109 + }, + { + "epoch": 1.08, + "learning_rate": 1.4818564814731195e-06, + "loss": 0.6108, + "step": 42110 + }, + { + "epoch": 1.08, + "learning_rate": 1.4818322350491848e-06, + "loss": 0.6292, + "step": 42111 + }, + { + "epoch": 1.08, + "learning_rate": 1.481807988256333e-06, + "loss": 0.7207, + "step": 42112 + }, + { + "epoch": 1.08, + "learning_rate": 1.481783741094583e-06, + "loss": 0.6963, + "step": 42113 + }, + { + "epoch": 1.08, + "learning_rate": 1.4817594935639538e-06, + "loss": 0.5156, + "step": 42114 + }, + { + "epoch": 1.08, + "learning_rate": 1.481735245664463e-06, + "loss": 0.7393, + "step": 42115 + }, + { + "epoch": 1.08, + "learning_rate": 1.4817109973961297e-06, + "loss": 0.6328, + "step": 42116 + }, + { + "epoch": 1.08, + "learning_rate": 1.4816867487589728e-06, + "loss": 0.5444, + "step": 42117 + }, + { + "epoch": 1.08, + "learning_rate": 1.4816624997530101e-06, + "loss": 0.791, + "step": 42118 + }, + { + "epoch": 1.08, + "learning_rate": 1.4816382503782607e-06, + "loss": 0.75, + "step": 42119 + }, + { + "epoch": 1.08, + "learning_rate": 1.4816140006347433e-06, + "loss": 0.6306, + "step": 42120 + }, + { + "epoch": 1.08, + "learning_rate": 1.4815897505224758e-06, + "loss": 0.5361, + "step": 42121 + }, + { + "epoch": 1.08, + "learning_rate": 1.4815655000414772e-06, + "loss": 0.8086, + "step": 42122 + }, + { + "epoch": 1.08, + "learning_rate": 1.4815412491917663e-06, + "loss": 0.5166, + "step": 42123 + }, + { + "epoch": 1.08, + "learning_rate": 1.4815169979733614e-06, + "loss": 0.6865, + "step": 42124 + }, + { + "epoch": 1.08, + "learning_rate": 1.481492746386281e-06, + "loss": 0.7354, + "step": 42125 + }, + { + "epoch": 1.08, + "learning_rate": 1.4814684944305437e-06, + "loss": 0.5967, + "step": 42126 + }, + { + "epoch": 1.08, + "learning_rate": 1.4814442421061678e-06, + "loss": 0.6152, + "step": 42127 + }, + { + "epoch": 1.08, + "learning_rate": 1.4814199894131726e-06, + "loss": 0.6069, + "step": 42128 + }, + { + "epoch": 1.08, + "learning_rate": 1.4813957363515764e-06, + "loss": 0.4907, + "step": 42129 + }, + { + "epoch": 1.08, + "learning_rate": 1.4813714829213974e-06, + "loss": 0.5889, + "step": 42130 + }, + { + "epoch": 1.08, + "learning_rate": 1.4813472291226542e-06, + "loss": 0.7461, + "step": 42131 + }, + { + "epoch": 1.08, + "learning_rate": 1.481322974955366e-06, + "loss": 0.6357, + "step": 42132 + }, + { + "epoch": 1.08, + "learning_rate": 1.4812987204195504e-06, + "loss": 0.4663, + "step": 42133 + }, + { + "epoch": 1.08, + "learning_rate": 1.4812744655152268e-06, + "loss": 0.5537, + "step": 42134 + }, + { + "epoch": 1.08, + "learning_rate": 1.4812502102424136e-06, + "loss": 0.5271, + "step": 42135 + }, + { + "epoch": 1.08, + "learning_rate": 1.481225954601129e-06, + "loss": 0.6387, + "step": 42136 + }, + { + "epoch": 1.08, + "learning_rate": 1.4812016985913918e-06, + "loss": 0.6602, + "step": 42137 + }, + { + "epoch": 1.08, + "learning_rate": 1.4811774422132209e-06, + "loss": 0.6885, + "step": 42138 + }, + { + "epoch": 1.08, + "learning_rate": 1.4811531854666343e-06, + "loss": 0.6309, + "step": 42139 + }, + { + "epoch": 1.08, + "learning_rate": 1.4811289283516506e-06, + "loss": 0.605, + "step": 42140 + }, + { + "epoch": 1.08, + "learning_rate": 1.4811046708682891e-06, + "loss": 0.7559, + "step": 42141 + }, + { + "epoch": 1.08, + "learning_rate": 1.4810804130165674e-06, + "loss": 0.7227, + "step": 42142 + }, + { + "epoch": 1.08, + "learning_rate": 1.481056154796505e-06, + "loss": 0.9766, + "step": 42143 + }, + { + "epoch": 1.08, + "learning_rate": 1.4810318962081198e-06, + "loss": 0.9121, + "step": 42144 + }, + { + "epoch": 1.08, + "learning_rate": 1.4810076372514307e-06, + "loss": 0.6533, + "step": 42145 + }, + { + "epoch": 1.08, + "learning_rate": 1.480983377926456e-06, + "loss": 0.6104, + "step": 42146 + }, + { + "epoch": 1.08, + "learning_rate": 1.4809591182332147e-06, + "loss": 0.4158, + "step": 42147 + }, + { + "epoch": 1.08, + "learning_rate": 1.4809348581717246e-06, + "loss": 0.6418, + "step": 42148 + }, + { + "epoch": 1.08, + "learning_rate": 1.4809105977420054e-06, + "loss": 0.489, + "step": 42149 + }, + { + "epoch": 1.08, + "learning_rate": 1.4808863369440746e-06, + "loss": 0.4556, + "step": 42150 + }, + { + "epoch": 1.08, + "learning_rate": 1.4808620757779515e-06, + "loss": 0.7446, + "step": 42151 + }, + { + "epoch": 1.08, + "learning_rate": 1.4808378142436543e-06, + "loss": 0.7021, + "step": 42152 + }, + { + "epoch": 1.08, + "learning_rate": 1.4808135523412017e-06, + "loss": 0.5723, + "step": 42153 + }, + { + "epoch": 1.08, + "learning_rate": 1.4807892900706125e-06, + "loss": 0.6263, + "step": 42154 + }, + { + "epoch": 1.08, + "learning_rate": 1.480765027431905e-06, + "loss": 0.7573, + "step": 42155 + }, + { + "epoch": 1.08, + "learning_rate": 1.4807407644250976e-06, + "loss": 0.8369, + "step": 42156 + }, + { + "epoch": 1.08, + "learning_rate": 1.4807165010502093e-06, + "loss": 0.7119, + "step": 42157 + }, + { + "epoch": 1.08, + "learning_rate": 1.4806922373072582e-06, + "loss": 0.6121, + "step": 42158 + }, + { + "epoch": 1.08, + "learning_rate": 1.4806679731962635e-06, + "loss": 0.6416, + "step": 42159 + }, + { + "epoch": 1.08, + "learning_rate": 1.4806437087172432e-06, + "loss": 0.5149, + "step": 42160 + }, + { + "epoch": 1.08, + "learning_rate": 1.480619443870216e-06, + "loss": 0.6069, + "step": 42161 + }, + { + "epoch": 1.08, + "learning_rate": 1.4805951786552009e-06, + "loss": 0.7236, + "step": 42162 + }, + { + "epoch": 1.08, + "learning_rate": 1.4805709130722162e-06, + "loss": 0.5801, + "step": 42163 + }, + { + "epoch": 1.08, + "learning_rate": 1.4805466471212803e-06, + "loss": 0.4141, + "step": 42164 + }, + { + "epoch": 1.08, + "learning_rate": 1.4805223808024118e-06, + "loss": 0.7627, + "step": 42165 + }, + { + "epoch": 1.08, + "learning_rate": 1.4804981141156297e-06, + "loss": 0.6885, + "step": 42166 + }, + { + "epoch": 1.08, + "learning_rate": 1.4804738470609518e-06, + "loss": 0.7578, + "step": 42167 + }, + { + "epoch": 1.08, + "learning_rate": 1.4804495796383975e-06, + "loss": 0.6084, + "step": 42168 + }, + { + "epoch": 1.08, + "learning_rate": 1.4804253118479853e-06, + "loss": 0.6445, + "step": 42169 + }, + { + "epoch": 1.08, + "learning_rate": 1.4804010436897331e-06, + "loss": 0.6973, + "step": 42170 + }, + { + "epoch": 1.08, + "learning_rate": 1.48037677516366e-06, + "loss": 0.7373, + "step": 42171 + }, + { + "epoch": 1.08, + "learning_rate": 1.4803525062697846e-06, + "loss": 0.7144, + "step": 42172 + }, + { + "epoch": 1.08, + "learning_rate": 1.4803282370081255e-06, + "loss": 0.6367, + "step": 42173 + }, + { + "epoch": 1.08, + "learning_rate": 1.480303967378701e-06, + "loss": 0.6143, + "step": 42174 + }, + { + "epoch": 1.08, + "learning_rate": 1.4802796973815297e-06, + "loss": 0.5984, + "step": 42175 + }, + { + "epoch": 1.08, + "learning_rate": 1.4802554270166305e-06, + "loss": 0.8105, + "step": 42176 + }, + { + "epoch": 1.08, + "learning_rate": 1.4802311562840218e-06, + "loss": 0.7783, + "step": 42177 + }, + { + "epoch": 1.08, + "learning_rate": 1.4802068851837222e-06, + "loss": 0.436, + "step": 42178 + }, + { + "epoch": 1.08, + "learning_rate": 1.4801826137157502e-06, + "loss": 0.5981, + "step": 42179 + }, + { + "epoch": 1.08, + "learning_rate": 1.4801583418801244e-06, + "loss": 0.6348, + "step": 42180 + }, + { + "epoch": 1.08, + "learning_rate": 1.4801340696768634e-06, + "loss": 0.6411, + "step": 42181 + }, + { + "epoch": 1.08, + "learning_rate": 1.4801097971059862e-06, + "loss": 0.6855, + "step": 42182 + }, + { + "epoch": 1.08, + "learning_rate": 1.4800855241675105e-06, + "loss": 0.7129, + "step": 42183 + }, + { + "epoch": 1.08, + "learning_rate": 1.4800612508614557e-06, + "loss": 0.6025, + "step": 42184 + }, + { + "epoch": 1.08, + "learning_rate": 1.4800369771878401e-06, + "loss": 0.5432, + "step": 42185 + }, + { + "epoch": 1.08, + "learning_rate": 1.480012703146682e-06, + "loss": 0.501, + "step": 42186 + }, + { + "epoch": 1.08, + "learning_rate": 1.4799884287380005e-06, + "loss": 0.6289, + "step": 42187 + }, + { + "epoch": 1.08, + "learning_rate": 1.4799641539618134e-06, + "loss": 0.708, + "step": 42188 + }, + { + "epoch": 1.08, + "learning_rate": 1.4799398788181407e-06, + "loss": 0.7578, + "step": 42189 + }, + { + "epoch": 1.08, + "learning_rate": 1.4799156033069994e-06, + "loss": 0.7422, + "step": 42190 + }, + { + "epoch": 1.08, + "learning_rate": 1.4798913274284091e-06, + "loss": 0.6006, + "step": 42191 + }, + { + "epoch": 1.08, + "learning_rate": 1.4798670511823878e-06, + "loss": 0.7617, + "step": 42192 + }, + { + "epoch": 1.08, + "learning_rate": 1.4798427745689547e-06, + "loss": 0.6133, + "step": 42193 + }, + { + "epoch": 1.08, + "learning_rate": 1.479818497588128e-06, + "loss": 0.8047, + "step": 42194 + }, + { + "epoch": 1.08, + "learning_rate": 1.4797942202399263e-06, + "loss": 0.6924, + "step": 42195 + }, + { + "epoch": 1.08, + "learning_rate": 1.479769942524368e-06, + "loss": 0.6318, + "step": 42196 + }, + { + "epoch": 1.08, + "learning_rate": 1.4797456644414723e-06, + "loss": 0.7358, + "step": 42197 + }, + { + "epoch": 1.08, + "learning_rate": 1.4797213859912572e-06, + "loss": 0.5391, + "step": 42198 + }, + { + "epoch": 1.08, + "learning_rate": 1.4796971071737417e-06, + "loss": 0.8091, + "step": 42199 + }, + { + "epoch": 1.08, + "learning_rate": 1.4796728279889438e-06, + "loss": 0.5557, + "step": 42200 + }, + { + "epoch": 1.08, + "learning_rate": 1.4796485484368826e-06, + "loss": 0.6768, + "step": 42201 + }, + { + "epoch": 1.08, + "learning_rate": 1.4796242685175767e-06, + "loss": 0.6514, + "step": 42202 + }, + { + "epoch": 1.08, + "learning_rate": 1.4795999882310443e-06, + "loss": 0.5515, + "step": 42203 + }, + { + "epoch": 1.08, + "learning_rate": 1.4795757075773045e-06, + "loss": 0.6561, + "step": 42204 + }, + { + "epoch": 1.08, + "learning_rate": 1.4795514265563755e-06, + "loss": 0.6416, + "step": 42205 + }, + { + "epoch": 1.08, + "learning_rate": 1.479527145168276e-06, + "loss": 0.7686, + "step": 42206 + }, + { + "epoch": 1.08, + "learning_rate": 1.4795028634130246e-06, + "loss": 0.6458, + "step": 42207 + }, + { + "epoch": 1.08, + "learning_rate": 1.47947858129064e-06, + "loss": 0.6138, + "step": 42208 + }, + { + "epoch": 1.08, + "learning_rate": 1.479454298801141e-06, + "loss": 0.7588, + "step": 42209 + }, + { + "epoch": 1.08, + "learning_rate": 1.4794300159445454e-06, + "loss": 0.6748, + "step": 42210 + }, + { + "epoch": 1.08, + "learning_rate": 1.4794057327208725e-06, + "loss": 0.8027, + "step": 42211 + }, + { + "epoch": 1.08, + "learning_rate": 1.4793814491301406e-06, + "loss": 0.509, + "step": 42212 + }, + { + "epoch": 1.08, + "learning_rate": 1.4793571651723682e-06, + "loss": 0.7773, + "step": 42213 + }, + { + "epoch": 1.08, + "learning_rate": 1.4793328808475746e-06, + "loss": 0.6958, + "step": 42214 + }, + { + "epoch": 1.08, + "learning_rate": 1.4793085961557774e-06, + "loss": 0.6196, + "step": 42215 + }, + { + "epoch": 1.08, + "learning_rate": 1.4792843110969958e-06, + "loss": 0.5088, + "step": 42216 + }, + { + "epoch": 1.08, + "learning_rate": 1.4792600256712479e-06, + "loss": 0.5864, + "step": 42217 + }, + { + "epoch": 1.08, + "learning_rate": 1.479235739878553e-06, + "loss": 0.645, + "step": 42218 + }, + { + "epoch": 1.08, + "learning_rate": 1.4792114537189293e-06, + "loss": 0.6924, + "step": 42219 + }, + { + "epoch": 1.08, + "learning_rate": 1.4791871671923956e-06, + "loss": 0.7002, + "step": 42220 + }, + { + "epoch": 1.08, + "learning_rate": 1.47916288029897e-06, + "loss": 0.6084, + "step": 42221 + }, + { + "epoch": 1.08, + "learning_rate": 1.4791385930386716e-06, + "loss": 0.6772, + "step": 42222 + }, + { + "epoch": 1.08, + "learning_rate": 1.4791143054115185e-06, + "loss": 0.5947, + "step": 42223 + }, + { + "epoch": 1.08, + "learning_rate": 1.47909001741753e-06, + "loss": 0.7065, + "step": 42224 + }, + { + "epoch": 1.08, + "learning_rate": 1.4790657290567241e-06, + "loss": 0.6245, + "step": 42225 + }, + { + "epoch": 1.08, + "learning_rate": 1.4790414403291199e-06, + "loss": 0.5791, + "step": 42226 + }, + { + "epoch": 1.08, + "learning_rate": 1.479017151234735e-06, + "loss": 0.5742, + "step": 42227 + }, + { + "epoch": 1.08, + "learning_rate": 1.4789928617735895e-06, + "loss": 0.6465, + "step": 42228 + }, + { + "epoch": 1.08, + "learning_rate": 1.4789685719457008e-06, + "loss": 0.6157, + "step": 42229 + }, + { + "epoch": 1.08, + "learning_rate": 1.4789442817510878e-06, + "loss": 0.3962, + "step": 42230 + }, + { + "epoch": 1.08, + "learning_rate": 1.4789199911897692e-06, + "loss": 0.5757, + "step": 42231 + }, + { + "epoch": 1.08, + "learning_rate": 1.4788957002617637e-06, + "loss": 0.7656, + "step": 42232 + }, + { + "epoch": 1.08, + "learning_rate": 1.4788714089670897e-06, + "loss": 0.7231, + "step": 42233 + }, + { + "epoch": 1.08, + "learning_rate": 1.478847117305766e-06, + "loss": 0.7266, + "step": 42234 + }, + { + "epoch": 1.08, + "learning_rate": 1.478822825277811e-06, + "loss": 0.707, + "step": 42235 + }, + { + "epoch": 1.08, + "learning_rate": 1.4787985328832433e-06, + "loss": 0.6895, + "step": 42236 + }, + { + "epoch": 1.08, + "learning_rate": 1.4787742401220817e-06, + "loss": 0.5552, + "step": 42237 + }, + { + "epoch": 1.08, + "learning_rate": 1.4787499469943447e-06, + "loss": 0.5625, + "step": 42238 + }, + { + "epoch": 1.08, + "learning_rate": 1.4787256535000509e-06, + "loss": 0.7339, + "step": 42239 + }, + { + "epoch": 1.08, + "learning_rate": 1.4787013596392188e-06, + "loss": 0.6396, + "step": 42240 + }, + { + "epoch": 1.08, + "learning_rate": 1.4786770654118673e-06, + "loss": 0.6509, + "step": 42241 + }, + { + "epoch": 1.08, + "learning_rate": 1.4786527708180144e-06, + "loss": 0.6045, + "step": 42242 + }, + { + "epoch": 1.08, + "learning_rate": 1.4786284758576793e-06, + "loss": 0.6523, + "step": 42243 + }, + { + "epoch": 1.08, + "learning_rate": 1.4786041805308803e-06, + "loss": 0.6611, + "step": 42244 + }, + { + "epoch": 1.08, + "learning_rate": 1.4785798848376364e-06, + "loss": 0.9355, + "step": 42245 + }, + { + "epoch": 1.08, + "learning_rate": 1.4785555887779652e-06, + "loss": 0.486, + "step": 42246 + }, + { + "epoch": 1.08, + "learning_rate": 1.4785312923518866e-06, + "loss": 0.5337, + "step": 42247 + }, + { + "epoch": 1.08, + "learning_rate": 1.4785069955594182e-06, + "loss": 0.6396, + "step": 42248 + }, + { + "epoch": 1.08, + "learning_rate": 1.4784826984005793e-06, + "loss": 0.6846, + "step": 42249 + }, + { + "epoch": 1.08, + "learning_rate": 1.4784584008753882e-06, + "loss": 0.6602, + "step": 42250 + }, + { + "epoch": 1.08, + "learning_rate": 1.4784341029838632e-06, + "loss": 0.625, + "step": 42251 + }, + { + "epoch": 1.08, + "learning_rate": 1.4784098047260236e-06, + "loss": 0.6836, + "step": 42252 + }, + { + "epoch": 1.08, + "learning_rate": 1.4783855061018873e-06, + "loss": 0.5625, + "step": 42253 + }, + { + "epoch": 1.08, + "learning_rate": 1.4783612071114734e-06, + "loss": 0.5382, + "step": 42254 + }, + { + "epoch": 1.08, + "learning_rate": 1.4783369077548002e-06, + "loss": 0.6465, + "step": 42255 + }, + { + "epoch": 1.08, + "learning_rate": 1.4783126080318864e-06, + "loss": 0.792, + "step": 42256 + }, + { + "epoch": 1.08, + "learning_rate": 1.4782883079427508e-06, + "loss": 0.7354, + "step": 42257 + }, + { + "epoch": 1.08, + "learning_rate": 1.4782640074874119e-06, + "loss": 0.6758, + "step": 42258 + }, + { + "epoch": 1.08, + "learning_rate": 1.4782397066658879e-06, + "loss": 0.7383, + "step": 42259 + }, + { + "epoch": 1.08, + "learning_rate": 1.4782154054781981e-06, + "loss": 0.7515, + "step": 42260 + }, + { + "epoch": 1.08, + "learning_rate": 1.4781911039243604e-06, + "loss": 0.6494, + "step": 42261 + }, + { + "epoch": 1.08, + "learning_rate": 1.478166802004394e-06, + "loss": 0.5547, + "step": 42262 + }, + { + "epoch": 1.08, + "learning_rate": 1.478142499718317e-06, + "loss": 0.526, + "step": 42263 + }, + { + "epoch": 1.08, + "learning_rate": 1.4781181970661487e-06, + "loss": 0.6289, + "step": 42264 + }, + { + "epoch": 1.08, + "learning_rate": 1.478093894047907e-06, + "loss": 0.5952, + "step": 42265 + }, + { + "epoch": 1.08, + "learning_rate": 1.4780695906636108e-06, + "loss": 0.7935, + "step": 42266 + }, + { + "epoch": 1.08, + "learning_rate": 1.4780452869132786e-06, + "loss": 0.5791, + "step": 42267 + }, + { + "epoch": 1.08, + "learning_rate": 1.4780209827969294e-06, + "loss": 0.8789, + "step": 42268 + }, + { + "epoch": 1.08, + "learning_rate": 1.4779966783145814e-06, + "loss": 0.6328, + "step": 42269 + }, + { + "epoch": 1.08, + "learning_rate": 1.4779723734662534e-06, + "loss": 0.4565, + "step": 42270 + }, + { + "epoch": 1.08, + "learning_rate": 1.4779480682519637e-06, + "loss": 0.5232, + "step": 42271 + }, + { + "epoch": 1.08, + "learning_rate": 1.4779237626717313e-06, + "loss": 0.6069, + "step": 42272 + }, + { + "epoch": 1.08, + "learning_rate": 1.4778994567255746e-06, + "loss": 0.6611, + "step": 42273 + }, + { + "epoch": 1.08, + "learning_rate": 1.4778751504135123e-06, + "loss": 0.6162, + "step": 42274 + }, + { + "epoch": 1.08, + "learning_rate": 1.4778508437355627e-06, + "loss": 0.7686, + "step": 42275 + }, + { + "epoch": 1.08, + "learning_rate": 1.477826536691745e-06, + "loss": 0.5908, + "step": 42276 + }, + { + "epoch": 1.08, + "learning_rate": 1.4778022292820776e-06, + "loss": 0.6821, + "step": 42277 + }, + { + "epoch": 1.08, + "learning_rate": 1.4777779215065786e-06, + "loss": 0.6011, + "step": 42278 + }, + { + "epoch": 1.08, + "learning_rate": 1.4777536133652675e-06, + "loss": 0.6509, + "step": 42279 + }, + { + "epoch": 1.08, + "learning_rate": 1.477729304858162e-06, + "loss": 0.627, + "step": 42280 + }, + { + "epoch": 1.08, + "learning_rate": 1.4777049959852815e-06, + "loss": 0.3833, + "step": 42281 + }, + { + "epoch": 1.08, + "learning_rate": 1.4776806867466437e-06, + "loss": 0.748, + "step": 42282 + }, + { + "epoch": 1.08, + "learning_rate": 1.4776563771422682e-06, + "loss": 0.4172, + "step": 42283 + }, + { + "epoch": 1.08, + "learning_rate": 1.4776320671721732e-06, + "loss": 0.6353, + "step": 42284 + }, + { + "epoch": 1.08, + "learning_rate": 1.477607756836377e-06, + "loss": 0.665, + "step": 42285 + }, + { + "epoch": 1.08, + "learning_rate": 1.4775834461348988e-06, + "loss": 0.6631, + "step": 42286 + }, + { + "epoch": 1.08, + "learning_rate": 1.4775591350677569e-06, + "loss": 0.7471, + "step": 42287 + }, + { + "epoch": 1.08, + "learning_rate": 1.4775348236349696e-06, + "loss": 0.7344, + "step": 42288 + }, + { + "epoch": 1.08, + "learning_rate": 1.4775105118365564e-06, + "loss": 0.564, + "step": 42289 + }, + { + "epoch": 1.08, + "learning_rate": 1.4774861996725347e-06, + "loss": 0.7979, + "step": 42290 + }, + { + "epoch": 1.08, + "learning_rate": 1.4774618871429243e-06, + "loss": 0.4644, + "step": 42291 + }, + { + "epoch": 1.08, + "learning_rate": 1.4774375742477427e-06, + "loss": 0.5474, + "step": 42292 + }, + { + "epoch": 1.08, + "learning_rate": 1.4774132609870097e-06, + "loss": 0.7402, + "step": 42293 + }, + { + "epoch": 1.08, + "learning_rate": 1.4773889473607431e-06, + "loss": 0.6724, + "step": 42294 + }, + { + "epoch": 1.08, + "learning_rate": 1.4773646333689616e-06, + "loss": 0.5525, + "step": 42295 + }, + { + "epoch": 1.08, + "learning_rate": 1.4773403190116842e-06, + "loss": 0.4722, + "step": 42296 + }, + { + "epoch": 1.08, + "learning_rate": 1.477316004288929e-06, + "loss": 0.6006, + "step": 42297 + }, + { + "epoch": 1.08, + "learning_rate": 1.477291689200715e-06, + "loss": 0.6958, + "step": 42298 + }, + { + "epoch": 1.08, + "learning_rate": 1.477267373747061e-06, + "loss": 0.6489, + "step": 42299 + }, + { + "epoch": 1.08, + "learning_rate": 1.4772430579279852e-06, + "loss": 0.6504, + "step": 42300 + }, + { + "epoch": 1.08, + "learning_rate": 1.4772187417435057e-06, + "loss": 0.5977, + "step": 42301 + }, + { + "epoch": 1.08, + "learning_rate": 1.4771944251936423e-06, + "loss": 0.6855, + "step": 42302 + }, + { + "epoch": 1.08, + "learning_rate": 1.477170108278413e-06, + "loss": 0.5869, + "step": 42303 + }, + { + "epoch": 1.08, + "learning_rate": 1.4771457909978367e-06, + "loss": 0.7305, + "step": 42304 + }, + { + "epoch": 1.08, + "learning_rate": 1.4771214733519315e-06, + "loss": 0.5654, + "step": 42305 + }, + { + "epoch": 1.08, + "learning_rate": 1.4770971553407166e-06, + "loss": 0.709, + "step": 42306 + }, + { + "epoch": 1.08, + "learning_rate": 1.47707283696421e-06, + "loss": 0.7949, + "step": 42307 + }, + { + "epoch": 1.08, + "learning_rate": 1.4770485182224309e-06, + "loss": 0.6401, + "step": 42308 + }, + { + "epoch": 1.08, + "learning_rate": 1.4770241991153975e-06, + "loss": 0.6533, + "step": 42309 + }, + { + "epoch": 1.08, + "learning_rate": 1.476999879643129e-06, + "loss": 0.48, + "step": 42310 + }, + { + "epoch": 1.08, + "learning_rate": 1.476975559805643e-06, + "loss": 0.3845, + "step": 42311 + }, + { + "epoch": 1.08, + "learning_rate": 1.4769512396029594e-06, + "loss": 0.5918, + "step": 42312 + }, + { + "epoch": 1.08, + "learning_rate": 1.4769269190350957e-06, + "loss": 0.6382, + "step": 42313 + }, + { + "epoch": 1.08, + "learning_rate": 1.4769025981020712e-06, + "loss": 0.5212, + "step": 42314 + }, + { + "epoch": 1.08, + "learning_rate": 1.4768782768039043e-06, + "loss": 0.6714, + "step": 42315 + }, + { + "epoch": 1.08, + "learning_rate": 1.4768539551406136e-06, + "loss": 0.542, + "step": 42316 + }, + { + "epoch": 1.08, + "learning_rate": 1.4768296331122177e-06, + "loss": 0.6621, + "step": 42317 + }, + { + "epoch": 1.08, + "learning_rate": 1.4768053107187352e-06, + "loss": 0.7266, + "step": 42318 + }, + { + "epoch": 1.08, + "learning_rate": 1.476780987960185e-06, + "loss": 0.5415, + "step": 42319 + }, + { + "epoch": 1.08, + "learning_rate": 1.4767566648365856e-06, + "loss": 0.6289, + "step": 42320 + }, + { + "epoch": 1.08, + "learning_rate": 1.4767323413479553e-06, + "loss": 0.7852, + "step": 42321 + }, + { + "epoch": 1.08, + "learning_rate": 1.476708017494313e-06, + "loss": 0.5659, + "step": 42322 + }, + { + "epoch": 1.08, + "learning_rate": 1.4766836932756773e-06, + "loss": 0.4863, + "step": 42323 + }, + { + "epoch": 1.08, + "learning_rate": 1.4766593686920668e-06, + "loss": 0.6152, + "step": 42324 + }, + { + "epoch": 1.08, + "learning_rate": 1.4766350437435003e-06, + "loss": 0.5269, + "step": 42325 + }, + { + "epoch": 1.08, + "learning_rate": 1.4766107184299962e-06, + "loss": 0.6895, + "step": 42326 + }, + { + "epoch": 1.08, + "learning_rate": 1.4765863927515731e-06, + "loss": 0.6621, + "step": 42327 + }, + { + "epoch": 1.08, + "learning_rate": 1.4765620667082494e-06, + "loss": 0.7109, + "step": 42328 + }, + { + "epoch": 1.08, + "learning_rate": 1.4765377403000448e-06, + "loss": 0.667, + "step": 42329 + }, + { + "epoch": 1.08, + "learning_rate": 1.4765134135269767e-06, + "loss": 0.7686, + "step": 42330 + }, + { + "epoch": 1.08, + "learning_rate": 1.4764890863890642e-06, + "loss": 0.5378, + "step": 42331 + }, + { + "epoch": 1.08, + "learning_rate": 1.476464758886326e-06, + "loss": 0.5464, + "step": 42332 + }, + { + "epoch": 1.09, + "learning_rate": 1.4764404310187806e-06, + "loss": 0.5884, + "step": 42333 + }, + { + "epoch": 1.09, + "learning_rate": 1.4764161027864467e-06, + "loss": 0.6719, + "step": 42334 + }, + { + "epoch": 1.09, + "learning_rate": 1.476391774189343e-06, + "loss": 0.7222, + "step": 42335 + }, + { + "epoch": 1.09, + "learning_rate": 1.4763674452274878e-06, + "loss": 0.5112, + "step": 42336 + }, + { + "epoch": 1.09, + "learning_rate": 1.4763431159009002e-06, + "loss": 0.6421, + "step": 42337 + }, + { + "epoch": 1.09, + "learning_rate": 1.476318786209598e-06, + "loss": 0.7637, + "step": 42338 + }, + { + "epoch": 1.09, + "learning_rate": 1.4762944561536011e-06, + "loss": 0.6309, + "step": 42339 + }, + { + "epoch": 1.09, + "learning_rate": 1.4762701257329271e-06, + "loss": 0.6816, + "step": 42340 + }, + { + "epoch": 1.09, + "learning_rate": 1.4762457949475949e-06, + "loss": 0.5789, + "step": 42341 + }, + { + "epoch": 1.09, + "learning_rate": 1.4762214637976236e-06, + "loss": 0.5991, + "step": 42342 + }, + { + "epoch": 1.09, + "learning_rate": 1.476197132283031e-06, + "loss": 0.7051, + "step": 42343 + }, + { + "epoch": 1.09, + "learning_rate": 1.4761728004038365e-06, + "loss": 0.4785, + "step": 42344 + }, + { + "epoch": 1.09, + "learning_rate": 1.476148468160058e-06, + "loss": 0.7314, + "step": 42345 + }, + { + "epoch": 1.09, + "learning_rate": 1.4761241355517146e-06, + "loss": 0.7969, + "step": 42346 + }, + { + "epoch": 1.09, + "learning_rate": 1.476099802578825e-06, + "loss": 0.4631, + "step": 42347 + }, + { + "epoch": 1.09, + "learning_rate": 1.4760754692414078e-06, + "loss": 0.5002, + "step": 42348 + }, + { + "epoch": 1.09, + "learning_rate": 1.476051135539481e-06, + "loss": 0.6191, + "step": 42349 + }, + { + "epoch": 1.09, + "learning_rate": 1.4760268014730644e-06, + "loss": 0.5791, + "step": 42350 + }, + { + "epoch": 1.09, + "learning_rate": 1.4760024670421753e-06, + "loss": 0.7725, + "step": 42351 + }, + { + "epoch": 1.09, + "learning_rate": 1.4759781322468335e-06, + "loss": 0.7402, + "step": 42352 + }, + { + "epoch": 1.09, + "learning_rate": 1.4759537970870567e-06, + "loss": 0.6763, + "step": 42353 + }, + { + "epoch": 1.09, + "learning_rate": 1.4759294615628646e-06, + "loss": 0.7036, + "step": 42354 + }, + { + "epoch": 1.09, + "learning_rate": 1.4759051256742744e-06, + "loss": 0.6787, + "step": 42355 + }, + { + "epoch": 1.09, + "learning_rate": 1.4758807894213061e-06, + "loss": 0.7197, + "step": 42356 + }, + { + "epoch": 1.09, + "learning_rate": 1.4758564528039776e-06, + "loss": 0.5933, + "step": 42357 + }, + { + "epoch": 1.09, + "learning_rate": 1.4758321158223077e-06, + "loss": 0.5381, + "step": 42358 + }, + { + "epoch": 1.09, + "learning_rate": 1.475807778476315e-06, + "loss": 0.5295, + "step": 42359 + }, + { + "epoch": 1.09, + "learning_rate": 1.4757834407660183e-06, + "loss": 0.4236, + "step": 42360 + }, + { + "epoch": 1.09, + "learning_rate": 1.4757591026914357e-06, + "loss": 0.8574, + "step": 42361 + }, + { + "epoch": 1.09, + "learning_rate": 1.4757347642525867e-06, + "loss": 0.708, + "step": 42362 + }, + { + "epoch": 1.09, + "learning_rate": 1.4757104254494892e-06, + "loss": 0.5554, + "step": 42363 + }, + { + "epoch": 1.09, + "learning_rate": 1.4756860862821624e-06, + "loss": 0.6968, + "step": 42364 + }, + { + "epoch": 1.09, + "learning_rate": 1.4756617467506243e-06, + "loss": 0.7163, + "step": 42365 + }, + { + "epoch": 1.09, + "learning_rate": 1.475637406854894e-06, + "loss": 0.5918, + "step": 42366 + }, + { + "epoch": 1.09, + "learning_rate": 1.47561306659499e-06, + "loss": 0.6621, + "step": 42367 + }, + { + "epoch": 1.09, + "learning_rate": 1.4755887259709305e-06, + "loss": 0.5522, + "step": 42368 + }, + { + "epoch": 1.09, + "learning_rate": 1.4755643849827355e-06, + "loss": 0.6299, + "step": 42369 + }, + { + "epoch": 1.09, + "learning_rate": 1.475540043630422e-06, + "loss": 0.6787, + "step": 42370 + }, + { + "epoch": 1.09, + "learning_rate": 1.4755157019140097e-06, + "loss": 0.7236, + "step": 42371 + }, + { + "epoch": 1.09, + "learning_rate": 1.4754913598335166e-06, + "loss": 0.6821, + "step": 42372 + }, + { + "epoch": 1.09, + "learning_rate": 1.4754670173889618e-06, + "loss": 0.5908, + "step": 42373 + }, + { + "epoch": 1.09, + "learning_rate": 1.4754426745803638e-06, + "loss": 0.5, + "step": 42374 + }, + { + "epoch": 1.09, + "learning_rate": 1.4754183314077413e-06, + "loss": 0.6699, + "step": 42375 + }, + { + "epoch": 1.09, + "learning_rate": 1.4753939878711126e-06, + "loss": 0.4185, + "step": 42376 + }, + { + "epoch": 1.09, + "learning_rate": 1.4753696439704969e-06, + "loss": 0.6963, + "step": 42377 + }, + { + "epoch": 1.09, + "learning_rate": 1.4753452997059122e-06, + "loss": 0.8369, + "step": 42378 + }, + { + "epoch": 1.09, + "learning_rate": 1.4753209550773777e-06, + "loss": 0.4895, + "step": 42379 + }, + { + "epoch": 1.09, + "learning_rate": 1.4752966100849115e-06, + "loss": 0.7178, + "step": 42380 + }, + { + "epoch": 1.09, + "learning_rate": 1.4752722647285329e-06, + "loss": 0.6489, + "step": 42381 + }, + { + "epoch": 1.09, + "learning_rate": 1.4752479190082598e-06, + "loss": 0.7295, + "step": 42382 + }, + { + "epoch": 1.09, + "learning_rate": 1.4752235729241115e-06, + "loss": 0.5669, + "step": 42383 + }, + { + "epoch": 1.09, + "learning_rate": 1.4751992264761064e-06, + "loss": 0.749, + "step": 42384 + }, + { + "epoch": 1.09, + "learning_rate": 1.4751748796642628e-06, + "loss": 0.7627, + "step": 42385 + }, + { + "epoch": 1.09, + "learning_rate": 1.4751505324886e-06, + "loss": 0.7891, + "step": 42386 + }, + { + "epoch": 1.09, + "learning_rate": 1.475126184949136e-06, + "loss": 0.5298, + "step": 42387 + }, + { + "epoch": 1.09, + "learning_rate": 1.4751018370458898e-06, + "loss": 0.6641, + "step": 42388 + }, + { + "epoch": 1.09, + "learning_rate": 1.4750774887788802e-06, + "loss": 0.7734, + "step": 42389 + }, + { + "epoch": 1.09, + "learning_rate": 1.4750531401481254e-06, + "loss": 0.6299, + "step": 42390 + }, + { + "epoch": 1.09, + "learning_rate": 1.4750287911536444e-06, + "loss": 0.7412, + "step": 42391 + }, + { + "epoch": 1.09, + "learning_rate": 1.4750044417954554e-06, + "loss": 0.6377, + "step": 42392 + }, + { + "epoch": 1.09, + "learning_rate": 1.4749800920735776e-06, + "loss": 0.7549, + "step": 42393 + }, + { + "epoch": 1.09, + "learning_rate": 1.4749557419880293e-06, + "loss": 0.7773, + "step": 42394 + }, + { + "epoch": 1.09, + "learning_rate": 1.4749313915388291e-06, + "loss": 0.6475, + "step": 42395 + }, + { + "epoch": 1.09, + "learning_rate": 1.474907040725996e-06, + "loss": 0.5576, + "step": 42396 + }, + { + "epoch": 1.09, + "learning_rate": 1.4748826895495482e-06, + "loss": 0.6265, + "step": 42397 + }, + { + "epoch": 1.09, + "learning_rate": 1.4748583380095049e-06, + "loss": 0.6172, + "step": 42398 + }, + { + "epoch": 1.09, + "learning_rate": 1.474833986105884e-06, + "loss": 0.6689, + "step": 42399 + }, + { + "epoch": 1.09, + "learning_rate": 1.474809633838705e-06, + "loss": 0.626, + "step": 42400 + }, + { + "epoch": 1.09, + "learning_rate": 1.4747852812079855e-06, + "loss": 0.7744, + "step": 42401 + }, + { + "epoch": 1.09, + "learning_rate": 1.4747609282137451e-06, + "loss": 0.606, + "step": 42402 + }, + { + "epoch": 1.09, + "learning_rate": 1.4747365748560023e-06, + "loss": 0.79, + "step": 42403 + }, + { + "epoch": 1.09, + "learning_rate": 1.474712221134775e-06, + "loss": 0.6328, + "step": 42404 + }, + { + "epoch": 1.09, + "learning_rate": 1.474687867050083e-06, + "loss": 0.6875, + "step": 42405 + }, + { + "epoch": 1.09, + "learning_rate": 1.474663512601944e-06, + "loss": 0.8184, + "step": 42406 + }, + { + "epoch": 1.09, + "learning_rate": 1.4746391577903767e-06, + "loss": 0.6001, + "step": 42407 + }, + { + "epoch": 1.09, + "learning_rate": 1.4746148026154003e-06, + "loss": 0.5586, + "step": 42408 + }, + { + "epoch": 1.09, + "learning_rate": 1.4745904470770334e-06, + "loss": 0.8447, + "step": 42409 + }, + { + "epoch": 1.09, + "learning_rate": 1.474566091175294e-06, + "loss": 0.6499, + "step": 42410 + }, + { + "epoch": 1.09, + "learning_rate": 1.4745417349102015e-06, + "loss": 0.8096, + "step": 42411 + }, + { + "epoch": 1.09, + "learning_rate": 1.474517378281774e-06, + "loss": 0.6855, + "step": 42412 + }, + { + "epoch": 1.09, + "learning_rate": 1.4744930212900307e-06, + "loss": 0.5942, + "step": 42413 + }, + { + "epoch": 1.09, + "learning_rate": 1.4744686639349894e-06, + "loss": 0.6377, + "step": 42414 + }, + { + "epoch": 1.09, + "learning_rate": 1.4744443062166693e-06, + "loss": 0.6777, + "step": 42415 + }, + { + "epoch": 1.09, + "learning_rate": 1.4744199481350892e-06, + "loss": 0.5728, + "step": 42416 + }, + { + "epoch": 1.09, + "learning_rate": 1.4743955896902675e-06, + "loss": 0.5243, + "step": 42417 + }, + { + "epoch": 1.09, + "learning_rate": 1.4743712308822232e-06, + "loss": 0.646, + "step": 42418 + }, + { + "epoch": 1.09, + "learning_rate": 1.4743468717109746e-06, + "loss": 0.6357, + "step": 42419 + }, + { + "epoch": 1.09, + "learning_rate": 1.4743225121765402e-06, + "loss": 0.5752, + "step": 42420 + }, + { + "epoch": 1.09, + "learning_rate": 1.4742981522789388e-06, + "loss": 0.5176, + "step": 42421 + }, + { + "epoch": 1.09, + "learning_rate": 1.4742737920181892e-06, + "loss": 0.5011, + "step": 42422 + }, + { + "epoch": 1.09, + "learning_rate": 1.4742494313943102e-06, + "loss": 0.7144, + "step": 42423 + }, + { + "epoch": 1.09, + "learning_rate": 1.4742250704073198e-06, + "loss": 0.75, + "step": 42424 + }, + { + "epoch": 1.09, + "learning_rate": 1.4742007090572375e-06, + "loss": 0.5737, + "step": 42425 + }, + { + "epoch": 1.09, + "learning_rate": 1.474176347344081e-06, + "loss": 0.6875, + "step": 42426 + }, + { + "epoch": 1.09, + "learning_rate": 1.47415198526787e-06, + "loss": 0.6748, + "step": 42427 + }, + { + "epoch": 1.09, + "learning_rate": 1.4741276228286223e-06, + "loss": 0.8887, + "step": 42428 + }, + { + "epoch": 1.09, + "learning_rate": 1.4741032600263567e-06, + "loss": 0.6147, + "step": 42429 + }, + { + "epoch": 1.09, + "learning_rate": 1.4740788968610925e-06, + "loss": 0.627, + "step": 42430 + }, + { + "epoch": 1.09, + "learning_rate": 1.4740545333328477e-06, + "loss": 0.8496, + "step": 42431 + }, + { + "epoch": 1.09, + "learning_rate": 1.4740301694416411e-06, + "loss": 0.6787, + "step": 42432 + }, + { + "epoch": 1.09, + "learning_rate": 1.4740058051874916e-06, + "loss": 0.6094, + "step": 42433 + }, + { + "epoch": 1.09, + "learning_rate": 1.4739814405704174e-06, + "loss": 0.8516, + "step": 42434 + }, + { + "epoch": 1.09, + "learning_rate": 1.4739570755904373e-06, + "loss": 0.7852, + "step": 42435 + }, + { + "epoch": 1.09, + "learning_rate": 1.4739327102475704e-06, + "loss": 0.7178, + "step": 42436 + }, + { + "epoch": 1.09, + "learning_rate": 1.4739083445418347e-06, + "loss": 0.6611, + "step": 42437 + }, + { + "epoch": 1.09, + "learning_rate": 1.4738839784732497e-06, + "loss": 0.6357, + "step": 42438 + }, + { + "epoch": 1.09, + "learning_rate": 1.4738596120418329e-06, + "loss": 0.6504, + "step": 42439 + }, + { + "epoch": 1.09, + "learning_rate": 1.4738352452476039e-06, + "loss": 0.5635, + "step": 42440 + }, + { + "epoch": 1.09, + "learning_rate": 1.473810878090581e-06, + "loss": 0.6184, + "step": 42441 + }, + { + "epoch": 1.09, + "learning_rate": 1.473786510570783e-06, + "loss": 0.603, + "step": 42442 + }, + { + "epoch": 1.09, + "learning_rate": 1.4737621426882283e-06, + "loss": 0.6851, + "step": 42443 + }, + { + "epoch": 1.09, + "learning_rate": 1.4737377744429357e-06, + "loss": 0.4866, + "step": 42444 + }, + { + "epoch": 1.09, + "learning_rate": 1.473713405834924e-06, + "loss": 0.5554, + "step": 42445 + }, + { + "epoch": 1.09, + "learning_rate": 1.4736890368642116e-06, + "loss": 0.6816, + "step": 42446 + }, + { + "epoch": 1.09, + "learning_rate": 1.4736646675308171e-06, + "loss": 0.7007, + "step": 42447 + }, + { + "epoch": 1.09, + "learning_rate": 1.4736402978347598e-06, + "loss": 0.6924, + "step": 42448 + }, + { + "epoch": 1.09, + "learning_rate": 1.4736159277760578e-06, + "loss": 0.6304, + "step": 42449 + }, + { + "epoch": 1.09, + "learning_rate": 1.4735915573547297e-06, + "loss": 0.5864, + "step": 42450 + }, + { + "epoch": 1.09, + "learning_rate": 1.473567186570794e-06, + "loss": 0.6943, + "step": 42451 + }, + { + "epoch": 1.09, + "learning_rate": 1.4735428154242705e-06, + "loss": 0.4619, + "step": 42452 + }, + { + "epoch": 1.09, + "learning_rate": 1.4735184439151764e-06, + "loss": 0.7803, + "step": 42453 + }, + { + "epoch": 1.09, + "learning_rate": 1.4734940720435312e-06, + "loss": 0.6621, + "step": 42454 + }, + { + "epoch": 1.09, + "learning_rate": 1.4734696998093532e-06, + "loss": 0.7061, + "step": 42455 + }, + { + "epoch": 1.09, + "learning_rate": 1.4734453272126615e-06, + "loss": 0.6602, + "step": 42456 + }, + { + "epoch": 1.09, + "learning_rate": 1.4734209542534743e-06, + "loss": 0.665, + "step": 42457 + }, + { + "epoch": 1.09, + "learning_rate": 1.4733965809318106e-06, + "loss": 0.6719, + "step": 42458 + }, + { + "epoch": 1.09, + "learning_rate": 1.4733722072476888e-06, + "loss": 0.6543, + "step": 42459 + }, + { + "epoch": 1.09, + "learning_rate": 1.4733478332011275e-06, + "loss": 0.6113, + "step": 42460 + }, + { + "epoch": 1.09, + "learning_rate": 1.4733234587921458e-06, + "loss": 0.4686, + "step": 42461 + }, + { + "epoch": 1.09, + "learning_rate": 1.4732990840207618e-06, + "loss": 0.5649, + "step": 42462 + }, + { + "epoch": 1.09, + "learning_rate": 1.473274708886995e-06, + "loss": 0.7148, + "step": 42463 + }, + { + "epoch": 1.09, + "learning_rate": 1.473250333390863e-06, + "loss": 0.4263, + "step": 42464 + }, + { + "epoch": 1.09, + "learning_rate": 1.4732259575323852e-06, + "loss": 0.8359, + "step": 42465 + }, + { + "epoch": 1.09, + "learning_rate": 1.4732015813115796e-06, + "loss": 0.7832, + "step": 42466 + }, + { + "epoch": 1.09, + "learning_rate": 1.473177204728466e-06, + "loss": 0.6196, + "step": 42467 + }, + { + "epoch": 1.09, + "learning_rate": 1.473152827783062e-06, + "loss": 0.4861, + "step": 42468 + }, + { + "epoch": 1.09, + "learning_rate": 1.4731284504753869e-06, + "loss": 0.5991, + "step": 42469 + }, + { + "epoch": 1.09, + "learning_rate": 1.4731040728054587e-06, + "loss": 0.6294, + "step": 42470 + }, + { + "epoch": 1.09, + "learning_rate": 1.4730796947732968e-06, + "loss": 0.8447, + "step": 42471 + }, + { + "epoch": 1.09, + "learning_rate": 1.4730553163789192e-06, + "loss": 0.426, + "step": 42472 + }, + { + "epoch": 1.09, + "learning_rate": 1.4730309376223452e-06, + "loss": 0.6646, + "step": 42473 + }, + { + "epoch": 1.09, + "learning_rate": 1.473006558503593e-06, + "loss": 0.5962, + "step": 42474 + }, + { + "epoch": 1.09, + "learning_rate": 1.4729821790226816e-06, + "loss": 0.9072, + "step": 42475 + }, + { + "epoch": 1.09, + "learning_rate": 1.472957799179629e-06, + "loss": 0.7275, + "step": 42476 + }, + { + "epoch": 1.09, + "learning_rate": 1.4729334189744549e-06, + "loss": 0.7354, + "step": 42477 + }, + { + "epoch": 1.09, + "learning_rate": 1.4729090384071773e-06, + "loss": 0.6396, + "step": 42478 + }, + { + "epoch": 1.09, + "learning_rate": 1.472884657477815e-06, + "loss": 0.6436, + "step": 42479 + }, + { + "epoch": 1.09, + "learning_rate": 1.4728602761863867e-06, + "loss": 0.6362, + "step": 42480 + }, + { + "epoch": 1.09, + "learning_rate": 1.4728358945329107e-06, + "loss": 0.7295, + "step": 42481 + }, + { + "epoch": 1.09, + "learning_rate": 1.4728115125174064e-06, + "loss": 0.6914, + "step": 42482 + }, + { + "epoch": 1.09, + "learning_rate": 1.472787130139892e-06, + "loss": 0.6777, + "step": 42483 + }, + { + "epoch": 1.09, + "learning_rate": 1.472762747400386e-06, + "loss": 0.646, + "step": 42484 + }, + { + "epoch": 1.09, + "learning_rate": 1.4727383642989075e-06, + "loss": 0.6138, + "step": 42485 + }, + { + "epoch": 1.09, + "learning_rate": 1.472713980835475e-06, + "loss": 0.8223, + "step": 42486 + }, + { + "epoch": 1.09, + "learning_rate": 1.472689597010107e-06, + "loss": 0.699, + "step": 42487 + }, + { + "epoch": 1.09, + "learning_rate": 1.4726652128228225e-06, + "loss": 0.5913, + "step": 42488 + }, + { + "epoch": 1.09, + "learning_rate": 1.4726408282736395e-06, + "loss": 0.6914, + "step": 42489 + }, + { + "epoch": 1.09, + "learning_rate": 1.4726164433625777e-06, + "loss": 0.7041, + "step": 42490 + }, + { + "epoch": 1.09, + "learning_rate": 1.472592058089655e-06, + "loss": 0.7305, + "step": 42491 + }, + { + "epoch": 1.09, + "learning_rate": 1.4725676724548903e-06, + "loss": 0.4193, + "step": 42492 + }, + { + "epoch": 1.09, + "learning_rate": 1.4725432864583022e-06, + "loss": 0.6123, + "step": 42493 + }, + { + "epoch": 1.09, + "learning_rate": 1.4725189000999095e-06, + "loss": 0.6904, + "step": 42494 + }, + { + "epoch": 1.09, + "learning_rate": 1.4724945133797308e-06, + "loss": 0.7021, + "step": 42495 + }, + { + "epoch": 1.09, + "learning_rate": 1.472470126297785e-06, + "loss": 0.4614, + "step": 42496 + }, + { + "epoch": 1.09, + "learning_rate": 1.47244573885409e-06, + "loss": 0.749, + "step": 42497 + }, + { + "epoch": 1.09, + "learning_rate": 1.4724213510486656e-06, + "loss": 0.6338, + "step": 42498 + }, + { + "epoch": 1.09, + "learning_rate": 1.4723969628815295e-06, + "loss": 0.3422, + "step": 42499 + }, + { + "epoch": 1.09, + "learning_rate": 1.4723725743527008e-06, + "loss": 0.5723, + "step": 42500 + }, + { + "epoch": 1.09, + "learning_rate": 1.4723481854621984e-06, + "loss": 0.5537, + "step": 42501 + }, + { + "epoch": 1.09, + "learning_rate": 1.4723237962100405e-06, + "loss": 0.5674, + "step": 42502 + }, + { + "epoch": 1.09, + "learning_rate": 1.4722994065962464e-06, + "loss": 0.5908, + "step": 42503 + }, + { + "epoch": 1.09, + "learning_rate": 1.4722750166208337e-06, + "loss": 0.6416, + "step": 42504 + }, + { + "epoch": 1.09, + "learning_rate": 1.4722506262838224e-06, + "loss": 0.6113, + "step": 42505 + }, + { + "epoch": 1.09, + "learning_rate": 1.47222623558523e-06, + "loss": 0.6855, + "step": 42506 + }, + { + "epoch": 1.09, + "learning_rate": 1.4722018445250757e-06, + "loss": 0.6719, + "step": 42507 + }, + { + "epoch": 1.09, + "learning_rate": 1.4721774531033784e-06, + "loss": 0.5283, + "step": 42508 + }, + { + "epoch": 1.09, + "learning_rate": 1.4721530613201566e-06, + "loss": 0.5308, + "step": 42509 + }, + { + "epoch": 1.09, + "learning_rate": 1.4721286691754283e-06, + "loss": 0.6597, + "step": 42510 + }, + { + "epoch": 1.09, + "learning_rate": 1.4721042766692135e-06, + "loss": 0.6416, + "step": 42511 + }, + { + "epoch": 1.09, + "learning_rate": 1.4720798838015297e-06, + "loss": 0.5972, + "step": 42512 + }, + { + "epoch": 1.09, + "learning_rate": 1.4720554905723964e-06, + "loss": 0.6445, + "step": 42513 + }, + { + "epoch": 1.09, + "learning_rate": 1.4720310969818319e-06, + "loss": 0.751, + "step": 42514 + }, + { + "epoch": 1.09, + "learning_rate": 1.4720067030298549e-06, + "loss": 0.6533, + "step": 42515 + }, + { + "epoch": 1.09, + "learning_rate": 1.4719823087164838e-06, + "loss": 0.6406, + "step": 42516 + }, + { + "epoch": 1.09, + "learning_rate": 1.4719579140417376e-06, + "loss": 0.5649, + "step": 42517 + }, + { + "epoch": 1.09, + "learning_rate": 1.4719335190056353e-06, + "loss": 0.7363, + "step": 42518 + }, + { + "epoch": 1.09, + "learning_rate": 1.4719091236081946e-06, + "loss": 0.6729, + "step": 42519 + }, + { + "epoch": 1.09, + "learning_rate": 1.4718847278494351e-06, + "loss": 0.7148, + "step": 42520 + }, + { + "epoch": 1.09, + "learning_rate": 1.471860331729375e-06, + "loss": 0.6758, + "step": 42521 + }, + { + "epoch": 1.09, + "learning_rate": 1.4718359352480333e-06, + "loss": 0.6553, + "step": 42522 + }, + { + "epoch": 1.09, + "learning_rate": 1.471811538405429e-06, + "loss": 0.6191, + "step": 42523 + }, + { + "epoch": 1.09, + "learning_rate": 1.4717871412015797e-06, + "loss": 0.7725, + "step": 42524 + }, + { + "epoch": 1.09, + "learning_rate": 1.4717627436365045e-06, + "loss": 0.6768, + "step": 42525 + }, + { + "epoch": 1.09, + "learning_rate": 1.4717383457102226e-06, + "loss": 0.6675, + "step": 42526 + }, + { + "epoch": 1.09, + "learning_rate": 1.4717139474227521e-06, + "loss": 0.5093, + "step": 42527 + }, + { + "epoch": 1.09, + "learning_rate": 1.4716895487741125e-06, + "loss": 0.5569, + "step": 42528 + }, + { + "epoch": 1.09, + "learning_rate": 1.4716651497643214e-06, + "loss": 0.4795, + "step": 42529 + }, + { + "epoch": 1.09, + "learning_rate": 1.4716407503933981e-06, + "loss": 0.769, + "step": 42530 + }, + { + "epoch": 1.09, + "learning_rate": 1.471616350661361e-06, + "loss": 0.6392, + "step": 42531 + }, + { + "epoch": 1.09, + "learning_rate": 1.4715919505682293e-06, + "loss": 0.6172, + "step": 42532 + }, + { + "epoch": 1.09, + "learning_rate": 1.4715675501140213e-06, + "loss": 0.7476, + "step": 42533 + }, + { + "epoch": 1.09, + "learning_rate": 1.4715431492987552e-06, + "loss": 0.7686, + "step": 42534 + }, + { + "epoch": 1.09, + "learning_rate": 1.4715187481224507e-06, + "loss": 0.6489, + "step": 42535 + }, + { + "epoch": 1.09, + "learning_rate": 1.4714943465851257e-06, + "loss": 0.5303, + "step": 42536 + }, + { + "epoch": 1.09, + "learning_rate": 1.4714699446867993e-06, + "loss": 0.6406, + "step": 42537 + }, + { + "epoch": 1.09, + "learning_rate": 1.4714455424274902e-06, + "loss": 0.5889, + "step": 42538 + }, + { + "epoch": 1.09, + "learning_rate": 1.4714211398072168e-06, + "loss": 0.6914, + "step": 42539 + }, + { + "epoch": 1.09, + "learning_rate": 1.4713967368259978e-06, + "loss": 0.6997, + "step": 42540 + }, + { + "epoch": 1.09, + "learning_rate": 1.4713723334838516e-06, + "loss": 0.7236, + "step": 42541 + }, + { + "epoch": 1.09, + "learning_rate": 1.471347929780798e-06, + "loss": 0.7061, + "step": 42542 + }, + { + "epoch": 1.09, + "learning_rate": 1.4713235257168549e-06, + "loss": 0.2991, + "step": 42543 + }, + { + "epoch": 1.09, + "learning_rate": 1.4712991212920405e-06, + "loss": 0.5244, + "step": 42544 + }, + { + "epoch": 1.09, + "learning_rate": 1.4712747165063743e-06, + "loss": 0.5596, + "step": 42545 + }, + { + "epoch": 1.09, + "learning_rate": 1.471250311359875e-06, + "loss": 0.5991, + "step": 42546 + }, + { + "epoch": 1.09, + "learning_rate": 1.4712259058525607e-06, + "loss": 0.7188, + "step": 42547 + }, + { + "epoch": 1.09, + "learning_rate": 1.4712014999844505e-06, + "loss": 0.8076, + "step": 42548 + }, + { + "epoch": 1.09, + "learning_rate": 1.471177093755563e-06, + "loss": 0.7529, + "step": 42549 + }, + { + "epoch": 1.09, + "learning_rate": 1.4711526871659168e-06, + "loss": 0.6719, + "step": 42550 + }, + { + "epoch": 1.09, + "learning_rate": 1.4711282802155308e-06, + "loss": 0.9199, + "step": 42551 + }, + { + "epoch": 1.09, + "learning_rate": 1.471103872904423e-06, + "loss": 0.55, + "step": 42552 + }, + { + "epoch": 1.09, + "learning_rate": 1.4710794652326136e-06, + "loss": 0.5576, + "step": 42553 + }, + { + "epoch": 1.09, + "learning_rate": 1.4710550572001195e-06, + "loss": 0.7324, + "step": 42554 + }, + { + "epoch": 1.09, + "learning_rate": 1.4710306488069606e-06, + "loss": 0.7666, + "step": 42555 + }, + { + "epoch": 1.09, + "learning_rate": 1.4710062400531549e-06, + "loss": 0.5645, + "step": 42556 + }, + { + "epoch": 1.09, + "learning_rate": 1.4709818309387214e-06, + "loss": 0.5645, + "step": 42557 + }, + { + "epoch": 1.09, + "learning_rate": 1.4709574214636792e-06, + "loss": 0.5435, + "step": 42558 + }, + { + "epoch": 1.09, + "learning_rate": 1.4709330116280463e-06, + "loss": 0.7344, + "step": 42559 + }, + { + "epoch": 1.09, + "learning_rate": 1.4709086014318413e-06, + "loss": 0.5947, + "step": 42560 + }, + { + "epoch": 1.09, + "learning_rate": 1.4708841908750837e-06, + "loss": 0.7393, + "step": 42561 + }, + { + "epoch": 1.09, + "learning_rate": 1.4708597799577915e-06, + "loss": 0.5801, + "step": 42562 + }, + { + "epoch": 1.09, + "learning_rate": 1.4708353686799838e-06, + "loss": 0.3936, + "step": 42563 + }, + { + "epoch": 1.09, + "learning_rate": 1.470810957041679e-06, + "loss": 0.6338, + "step": 42564 + }, + { + "epoch": 1.09, + "learning_rate": 1.4707865450428956e-06, + "loss": 0.5845, + "step": 42565 + }, + { + "epoch": 1.09, + "learning_rate": 1.470762132683653e-06, + "loss": 0.5449, + "step": 42566 + }, + { + "epoch": 1.09, + "learning_rate": 1.4707377199639693e-06, + "loss": 0.542, + "step": 42567 + }, + { + "epoch": 1.09, + "learning_rate": 1.4707133068838636e-06, + "loss": 0.5957, + "step": 42568 + }, + { + "epoch": 1.09, + "learning_rate": 1.4706888934433542e-06, + "loss": 0.6299, + "step": 42569 + }, + { + "epoch": 1.09, + "learning_rate": 1.4706644796424598e-06, + "loss": 0.6504, + "step": 42570 + }, + { + "epoch": 1.09, + "learning_rate": 1.4706400654811995e-06, + "loss": 0.7568, + "step": 42571 + }, + { + "epoch": 1.09, + "learning_rate": 1.4706156509595915e-06, + "loss": 0.708, + "step": 42572 + }, + { + "epoch": 1.09, + "learning_rate": 1.4705912360776548e-06, + "loss": 0.509, + "step": 42573 + }, + { + "epoch": 1.09, + "learning_rate": 1.4705668208354083e-06, + "loss": 0.6455, + "step": 42574 + }, + { + "epoch": 1.09, + "learning_rate": 1.4705424052328702e-06, + "loss": 0.6182, + "step": 42575 + }, + { + "epoch": 1.09, + "learning_rate": 1.4705179892700594e-06, + "loss": 0.7666, + "step": 42576 + }, + { + "epoch": 1.09, + "learning_rate": 1.4704935729469948e-06, + "loss": 0.5767, + "step": 42577 + }, + { + "epoch": 1.09, + "learning_rate": 1.4704691562636948e-06, + "loss": 0.6045, + "step": 42578 + }, + { + "epoch": 1.09, + "learning_rate": 1.470444739220178e-06, + "loss": 0.5737, + "step": 42579 + }, + { + "epoch": 1.09, + "learning_rate": 1.4704203218164636e-06, + "loss": 0.3473, + "step": 42580 + }, + { + "epoch": 1.09, + "learning_rate": 1.4703959040525697e-06, + "loss": 0.7314, + "step": 42581 + }, + { + "epoch": 1.09, + "learning_rate": 1.4703714859285158e-06, + "loss": 0.7881, + "step": 42582 + }, + { + "epoch": 1.09, + "learning_rate": 1.4703470674443195e-06, + "loss": 0.7441, + "step": 42583 + }, + { + "epoch": 1.09, + "learning_rate": 1.4703226486000002e-06, + "loss": 0.6719, + "step": 42584 + }, + { + "epoch": 1.09, + "learning_rate": 1.4702982293955766e-06, + "loss": 0.9395, + "step": 42585 + }, + { + "epoch": 1.09, + "learning_rate": 1.4702738098310671e-06, + "loss": 0.7627, + "step": 42586 + }, + { + "epoch": 1.09, + "learning_rate": 1.4702493899064907e-06, + "loss": 0.6523, + "step": 42587 + }, + { + "epoch": 1.09, + "learning_rate": 1.4702249696218664e-06, + "loss": 0.8301, + "step": 42588 + }, + { + "epoch": 1.09, + "learning_rate": 1.4702005489772117e-06, + "loss": 0.5208, + "step": 42589 + }, + { + "epoch": 1.09, + "learning_rate": 1.4701761279725463e-06, + "loss": 0.7793, + "step": 42590 + }, + { + "epoch": 1.09, + "learning_rate": 1.470151706607889e-06, + "loss": 0.752, + "step": 42591 + }, + { + "epoch": 1.09, + "learning_rate": 1.4701272848832576e-06, + "loss": 0.5269, + "step": 42592 + }, + { + "epoch": 1.09, + "learning_rate": 1.470102862798672e-06, + "loss": 0.6094, + "step": 42593 + }, + { + "epoch": 1.09, + "learning_rate": 1.4700784403541498e-06, + "loss": 0.6838, + "step": 42594 + }, + { + "epoch": 1.09, + "learning_rate": 1.4700540175497103e-06, + "loss": 0.4852, + "step": 42595 + }, + { + "epoch": 1.09, + "learning_rate": 1.4700295943853717e-06, + "loss": 0.5752, + "step": 42596 + }, + { + "epoch": 1.09, + "learning_rate": 1.4700051708611536e-06, + "loss": 0.5361, + "step": 42597 + }, + { + "epoch": 1.09, + "learning_rate": 1.469980746977074e-06, + "loss": 0.5928, + "step": 42598 + }, + { + "epoch": 1.09, + "learning_rate": 1.4699563227331518e-06, + "loss": 0.6367, + "step": 42599 + }, + { + "epoch": 1.09, + "learning_rate": 1.4699318981294052e-06, + "loss": 0.6211, + "step": 42600 + }, + { + "epoch": 1.09, + "learning_rate": 1.4699074731658541e-06, + "loss": 0.6211, + "step": 42601 + }, + { + "epoch": 1.09, + "learning_rate": 1.4698830478425156e-06, + "loss": 0.7388, + "step": 42602 + }, + { + "epoch": 1.09, + "learning_rate": 1.46985862215941e-06, + "loss": 0.6738, + "step": 42603 + }, + { + "epoch": 1.09, + "learning_rate": 1.469834196116555e-06, + "loss": 0.5503, + "step": 42604 + }, + { + "epoch": 1.09, + "learning_rate": 1.4698097697139694e-06, + "loss": 0.6191, + "step": 42605 + }, + { + "epoch": 1.09, + "learning_rate": 1.4697853429516723e-06, + "loss": 0.8223, + "step": 42606 + }, + { + "epoch": 1.09, + "learning_rate": 1.469760915829682e-06, + "loss": 0.606, + "step": 42607 + }, + { + "epoch": 1.09, + "learning_rate": 1.4697364883480174e-06, + "loss": 0.5356, + "step": 42608 + }, + { + "epoch": 1.09, + "learning_rate": 1.469712060506697e-06, + "loss": 0.8896, + "step": 42609 + }, + { + "epoch": 1.09, + "learning_rate": 1.4696876323057398e-06, + "loss": 0.6387, + "step": 42610 + }, + { + "epoch": 1.09, + "learning_rate": 1.4696632037451644e-06, + "loss": 0.6245, + "step": 42611 + }, + { + "epoch": 1.09, + "learning_rate": 1.4696387748249897e-06, + "loss": 0.6882, + "step": 42612 + }, + { + "epoch": 1.09, + "learning_rate": 1.4696143455452342e-06, + "loss": 0.6221, + "step": 42613 + }, + { + "epoch": 1.09, + "learning_rate": 1.4695899159059162e-06, + "loss": 0.6589, + "step": 42614 + }, + { + "epoch": 1.09, + "learning_rate": 1.4695654859070547e-06, + "loss": 0.748, + "step": 42615 + }, + { + "epoch": 1.09, + "learning_rate": 1.4695410555486692e-06, + "loss": 0.8232, + "step": 42616 + }, + { + "epoch": 1.09, + "learning_rate": 1.469516624830777e-06, + "loss": 0.4525, + "step": 42617 + }, + { + "epoch": 1.09, + "learning_rate": 1.469492193753398e-06, + "loss": 0.6021, + "step": 42618 + }, + { + "epoch": 1.09, + "learning_rate": 1.4694677623165502e-06, + "loss": 0.5413, + "step": 42619 + }, + { + "epoch": 1.09, + "learning_rate": 1.4694433305202524e-06, + "loss": 0.6904, + "step": 42620 + }, + { + "epoch": 1.09, + "learning_rate": 1.4694188983645234e-06, + "loss": 0.4419, + "step": 42621 + }, + { + "epoch": 1.09, + "learning_rate": 1.4693944658493822e-06, + "loss": 0.7441, + "step": 42622 + }, + { + "epoch": 1.09, + "learning_rate": 1.4693700329748472e-06, + "loss": 0.7295, + "step": 42623 + }, + { + "epoch": 1.09, + "learning_rate": 1.4693455997409372e-06, + "loss": 0.6348, + "step": 42624 + }, + { + "epoch": 1.09, + "learning_rate": 1.4693211661476706e-06, + "loss": 0.6431, + "step": 42625 + }, + { + "epoch": 1.09, + "learning_rate": 1.4692967321950665e-06, + "loss": 0.6416, + "step": 42626 + }, + { + "epoch": 1.09, + "learning_rate": 1.4692722978831433e-06, + "loss": 0.5781, + "step": 42627 + }, + { + "epoch": 1.09, + "learning_rate": 1.4692478632119202e-06, + "loss": 0.7256, + "step": 42628 + }, + { + "epoch": 1.09, + "learning_rate": 1.4692234281814155e-06, + "loss": 0.5469, + "step": 42629 + }, + { + "epoch": 1.09, + "learning_rate": 1.4691989927916478e-06, + "loss": 0.6963, + "step": 42630 + }, + { + "epoch": 1.09, + "learning_rate": 1.4691745570426362e-06, + "loss": 0.751, + "step": 42631 + }, + { + "epoch": 1.09, + "learning_rate": 1.469150120934399e-06, + "loss": 0.7793, + "step": 42632 + }, + { + "epoch": 1.09, + "learning_rate": 1.4691256844669555e-06, + "loss": 0.6587, + "step": 42633 + }, + { + "epoch": 1.09, + "learning_rate": 1.4691012476403235e-06, + "loss": 0.4192, + "step": 42634 + }, + { + "epoch": 1.09, + "learning_rate": 1.4690768104545227e-06, + "loss": 0.6133, + "step": 42635 + }, + { + "epoch": 1.09, + "learning_rate": 1.4690523729095712e-06, + "loss": 0.457, + "step": 42636 + }, + { + "epoch": 1.09, + "learning_rate": 1.4690279350054878e-06, + "loss": 0.6528, + "step": 42637 + }, + { + "epoch": 1.09, + "learning_rate": 1.4690034967422916e-06, + "loss": 0.4824, + "step": 42638 + }, + { + "epoch": 1.09, + "learning_rate": 1.4689790581200007e-06, + "loss": 0.7891, + "step": 42639 + }, + { + "epoch": 1.09, + "learning_rate": 1.468954619138634e-06, + "loss": 0.5083, + "step": 42640 + }, + { + "epoch": 1.09, + "learning_rate": 1.4689301797982103e-06, + "loss": 0.4224, + "step": 42641 + }, + { + "epoch": 1.09, + "learning_rate": 1.4689057400987485e-06, + "loss": 0.7412, + "step": 42642 + }, + { + "epoch": 1.09, + "learning_rate": 1.4688813000402673e-06, + "loss": 0.6445, + "step": 42643 + }, + { + "epoch": 1.09, + "learning_rate": 1.4688568596227851e-06, + "loss": 0.8594, + "step": 42644 + }, + { + "epoch": 1.09, + "learning_rate": 1.4688324188463207e-06, + "loss": 0.5498, + "step": 42645 + }, + { + "epoch": 1.09, + "learning_rate": 1.4688079777108926e-06, + "loss": 0.7495, + "step": 42646 + }, + { + "epoch": 1.09, + "learning_rate": 1.4687835362165203e-06, + "loss": 0.7153, + "step": 42647 + }, + { + "epoch": 1.09, + "learning_rate": 1.4687590943632218e-06, + "loss": 0.6101, + "step": 42648 + }, + { + "epoch": 1.09, + "learning_rate": 1.468734652151016e-06, + "loss": 0.7275, + "step": 42649 + }, + { + "epoch": 1.09, + "learning_rate": 1.4687102095799216e-06, + "loss": 0.6201, + "step": 42650 + }, + { + "epoch": 1.09, + "learning_rate": 1.4686857666499574e-06, + "loss": 0.5278, + "step": 42651 + }, + { + "epoch": 1.09, + "learning_rate": 1.4686613233611418e-06, + "loss": 0.7715, + "step": 42652 + }, + { + "epoch": 1.09, + "learning_rate": 1.468636879713494e-06, + "loss": 0.7759, + "step": 42653 + }, + { + "epoch": 1.09, + "learning_rate": 1.4686124357070327e-06, + "loss": 0.751, + "step": 42654 + }, + { + "epoch": 1.09, + "learning_rate": 1.468587991341776e-06, + "loss": 0.3052, + "step": 42655 + }, + { + "epoch": 1.09, + "learning_rate": 1.4685635466177434e-06, + "loss": 0.7744, + "step": 42656 + }, + { + "epoch": 1.09, + "learning_rate": 1.4685391015349528e-06, + "loss": 0.6411, + "step": 42657 + }, + { + "epoch": 1.09, + "learning_rate": 1.468514656093424e-06, + "loss": 0.6221, + "step": 42658 + }, + { + "epoch": 1.09, + "learning_rate": 1.4684902102931745e-06, + "loss": 0.7148, + "step": 42659 + }, + { + "epoch": 1.09, + "learning_rate": 1.4684657641342237e-06, + "loss": 0.6572, + "step": 42660 + }, + { + "epoch": 1.09, + "learning_rate": 1.4684413176165903e-06, + "loss": 0.4521, + "step": 42661 + }, + { + "epoch": 1.09, + "learning_rate": 1.4684168707402928e-06, + "loss": 0.4071, + "step": 42662 + }, + { + "epoch": 1.09, + "learning_rate": 1.4683924235053502e-06, + "loss": 0.5024, + "step": 42663 + }, + { + "epoch": 1.09, + "learning_rate": 1.4683679759117812e-06, + "loss": 0.6445, + "step": 42664 + }, + { + "epoch": 1.09, + "learning_rate": 1.4683435279596039e-06, + "loss": 0.6807, + "step": 42665 + }, + { + "epoch": 1.09, + "learning_rate": 1.4683190796488379e-06, + "loss": 0.719, + "step": 42666 + }, + { + "epoch": 1.09, + "learning_rate": 1.4682946309795013e-06, + "loss": 0.6719, + "step": 42667 + }, + { + "epoch": 1.09, + "learning_rate": 1.4682701819516133e-06, + "loss": 0.5898, + "step": 42668 + }, + { + "epoch": 1.09, + "learning_rate": 1.4682457325651921e-06, + "loss": 0.7217, + "step": 42669 + }, + { + "epoch": 1.09, + "learning_rate": 1.4682212828202566e-06, + "loss": 0.7354, + "step": 42670 + }, + { + "epoch": 1.09, + "learning_rate": 1.4681968327168257e-06, + "loss": 0.7373, + "step": 42671 + }, + { + "epoch": 1.09, + "learning_rate": 1.4681723822549181e-06, + "loss": 0.6162, + "step": 42672 + }, + { + "epoch": 1.09, + "learning_rate": 1.4681479314345526e-06, + "loss": 0.7012, + "step": 42673 + }, + { + "epoch": 1.09, + "learning_rate": 1.4681234802557474e-06, + "loss": 0.7886, + "step": 42674 + }, + { + "epoch": 1.09, + "learning_rate": 1.4680990287185218e-06, + "loss": 0.7881, + "step": 42675 + }, + { + "epoch": 1.09, + "learning_rate": 1.468074576822894e-06, + "loss": 0.5938, + "step": 42676 + }, + { + "epoch": 1.09, + "learning_rate": 1.4680501245688833e-06, + "loss": 0.7383, + "step": 42677 + }, + { + "epoch": 1.09, + "learning_rate": 1.4680256719565082e-06, + "loss": 0.5376, + "step": 42678 + }, + { + "epoch": 1.09, + "learning_rate": 1.4680012189857873e-06, + "loss": 0.6548, + "step": 42679 + }, + { + "epoch": 1.09, + "learning_rate": 1.467976765656739e-06, + "loss": 0.6758, + "step": 42680 + }, + { + "epoch": 1.09, + "learning_rate": 1.467952311969383e-06, + "loss": 0.7856, + "step": 42681 + }, + { + "epoch": 1.09, + "learning_rate": 1.4679278579237368e-06, + "loss": 0.6575, + "step": 42682 + }, + { + "epoch": 1.09, + "learning_rate": 1.4679034035198206e-06, + "loss": 0.7432, + "step": 42683 + }, + { + "epoch": 1.09, + "learning_rate": 1.4678789487576515e-06, + "loss": 0.5918, + "step": 42684 + }, + { + "epoch": 1.09, + "learning_rate": 1.4678544936372495e-06, + "loss": 0.668, + "step": 42685 + }, + { + "epoch": 1.09, + "learning_rate": 1.4678300381586324e-06, + "loss": 0.7012, + "step": 42686 + }, + { + "epoch": 1.09, + "learning_rate": 1.4678055823218197e-06, + "loss": 0.6777, + "step": 42687 + }, + { + "epoch": 1.09, + "learning_rate": 1.4677811261268295e-06, + "loss": 0.665, + "step": 42688 + }, + { + "epoch": 1.09, + "learning_rate": 1.4677566695736812e-06, + "loss": 0.6421, + "step": 42689 + }, + { + "epoch": 1.09, + "learning_rate": 1.4677322126623928e-06, + "loss": 0.6084, + "step": 42690 + }, + { + "epoch": 1.09, + "learning_rate": 1.4677077553929835e-06, + "loss": 0.5723, + "step": 42691 + }, + { + "epoch": 1.09, + "learning_rate": 1.4676832977654717e-06, + "loss": 0.6807, + "step": 42692 + }, + { + "epoch": 1.09, + "learning_rate": 1.4676588397798766e-06, + "loss": 0.5913, + "step": 42693 + }, + { + "epoch": 1.09, + "learning_rate": 1.4676343814362163e-06, + "loss": 0.5547, + "step": 42694 + }, + { + "epoch": 1.09, + "learning_rate": 1.46760992273451e-06, + "loss": 0.5386, + "step": 42695 + }, + { + "epoch": 1.09, + "learning_rate": 1.4675854636747761e-06, + "loss": 0.563, + "step": 42696 + }, + { + "epoch": 1.09, + "learning_rate": 1.467561004257034e-06, + "loss": 0.6265, + "step": 42697 + }, + { + "epoch": 1.09, + "learning_rate": 1.4675365444813014e-06, + "loss": 0.6758, + "step": 42698 + }, + { + "epoch": 1.09, + "learning_rate": 1.467512084347598e-06, + "loss": 0.8301, + "step": 42699 + }, + { + "epoch": 1.09, + "learning_rate": 1.4674876238559416e-06, + "loss": 0.7305, + "step": 42700 + }, + { + "epoch": 1.09, + "learning_rate": 1.4674631630063517e-06, + "loss": 0.3906, + "step": 42701 + }, + { + "epoch": 1.09, + "learning_rate": 1.467438701798847e-06, + "loss": 0.7383, + "step": 42702 + }, + { + "epoch": 1.09, + "learning_rate": 1.4674142402334458e-06, + "loss": 0.5132, + "step": 42703 + }, + { + "epoch": 1.09, + "learning_rate": 1.4673897783101668e-06, + "loss": 0.5647, + "step": 42704 + }, + { + "epoch": 1.09, + "learning_rate": 1.467365316029029e-06, + "loss": 0.5293, + "step": 42705 + }, + { + "epoch": 1.09, + "learning_rate": 1.467340853390051e-06, + "loss": 0.8896, + "step": 42706 + }, + { + "epoch": 1.09, + "learning_rate": 1.4673163903932518e-06, + "loss": 0.4717, + "step": 42707 + }, + { + "epoch": 1.09, + "learning_rate": 1.46729192703865e-06, + "loss": 0.5479, + "step": 42708 + }, + { + "epoch": 1.09, + "learning_rate": 1.4672674633262641e-06, + "loss": 0.6699, + "step": 42709 + }, + { + "epoch": 1.09, + "learning_rate": 1.467242999256113e-06, + "loss": 0.7725, + "step": 42710 + }, + { + "epoch": 1.09, + "learning_rate": 1.4672185348282153e-06, + "loss": 0.6758, + "step": 42711 + }, + { + "epoch": 1.09, + "learning_rate": 1.4671940700425905e-06, + "loss": 0.7021, + "step": 42712 + }, + { + "epoch": 1.09, + "learning_rate": 1.4671696048992559e-06, + "loss": 0.5923, + "step": 42713 + }, + { + "epoch": 1.09, + "learning_rate": 1.4671451393982315e-06, + "loss": 0.562, + "step": 42714 + }, + { + "epoch": 1.09, + "learning_rate": 1.4671206735395352e-06, + "loss": 0.5356, + "step": 42715 + }, + { + "epoch": 1.09, + "learning_rate": 1.4670962073231863e-06, + "loss": 0.3748, + "step": 42716 + }, + { + "epoch": 1.09, + "learning_rate": 1.4670717407492033e-06, + "loss": 0.5991, + "step": 42717 + }, + { + "epoch": 1.09, + "learning_rate": 1.4670472738176044e-06, + "loss": 0.6226, + "step": 42718 + }, + { + "epoch": 1.09, + "learning_rate": 1.4670228065284097e-06, + "loss": 0.6128, + "step": 42719 + }, + { + "epoch": 1.09, + "learning_rate": 1.4669983388816368e-06, + "loss": 0.7305, + "step": 42720 + }, + { + "epoch": 1.09, + "learning_rate": 1.4669738708773046e-06, + "loss": 0.5967, + "step": 42721 + }, + { + "epoch": 1.09, + "learning_rate": 1.4669494025154322e-06, + "loss": 0.8164, + "step": 42722 + }, + { + "epoch": 1.1, + "learning_rate": 1.466924933796038e-06, + "loss": 0.4971, + "step": 42723 + }, + { + "epoch": 1.1, + "learning_rate": 1.4669004647191408e-06, + "loss": 0.7485, + "step": 42724 + }, + { + "epoch": 1.1, + "learning_rate": 1.4668759952847593e-06, + "loss": 0.9453, + "step": 42725 + }, + { + "epoch": 1.1, + "learning_rate": 1.4668515254929123e-06, + "loss": 0.4524, + "step": 42726 + }, + { + "epoch": 1.1, + "learning_rate": 1.4668270553436191e-06, + "loss": 0.5347, + "step": 42727 + }, + { + "epoch": 1.1, + "learning_rate": 1.4668025848368975e-06, + "loss": 0.5759, + "step": 42728 + }, + { + "epoch": 1.1, + "learning_rate": 1.4667781139727665e-06, + "loss": 0.7046, + "step": 42729 + }, + { + "epoch": 1.1, + "learning_rate": 1.466753642751245e-06, + "loss": 0.7705, + "step": 42730 + }, + { + "epoch": 1.1, + "learning_rate": 1.4667291711723516e-06, + "loss": 0.7412, + "step": 42731 + }, + { + "epoch": 1.1, + "learning_rate": 1.4667046992361056e-06, + "loss": 0.5195, + "step": 42732 + }, + { + "epoch": 1.1, + "learning_rate": 1.4666802269425248e-06, + "loss": 0.6943, + "step": 42733 + }, + { + "epoch": 1.1, + "learning_rate": 1.4666557542916287e-06, + "loss": 0.7852, + "step": 42734 + }, + { + "epoch": 1.1, + "learning_rate": 1.4666312812834356e-06, + "loss": 0.5444, + "step": 42735 + }, + { + "epoch": 1.1, + "learning_rate": 1.4666068079179642e-06, + "loss": 0.6523, + "step": 42736 + }, + { + "epoch": 1.1, + "learning_rate": 1.4665823341952338e-06, + "loss": 0.4487, + "step": 42737 + }, + { + "epoch": 1.1, + "learning_rate": 1.4665578601152629e-06, + "loss": 0.7168, + "step": 42738 + }, + { + "epoch": 1.1, + "learning_rate": 1.4665333856780697e-06, + "loss": 0.6436, + "step": 42739 + }, + { + "epoch": 1.1, + "learning_rate": 1.4665089108836735e-06, + "loss": 0.7607, + "step": 42740 + }, + { + "epoch": 1.1, + "learning_rate": 1.4664844357320927e-06, + "loss": 0.6226, + "step": 42741 + }, + { + "epoch": 1.1, + "learning_rate": 1.4664599602233466e-06, + "loss": 0.8262, + "step": 42742 + }, + { + "epoch": 1.1, + "learning_rate": 1.4664354843574528e-06, + "loss": 0.6729, + "step": 42743 + }, + { + "epoch": 1.1, + "learning_rate": 1.4664110081344317e-06, + "loss": 0.7344, + "step": 42744 + }, + { + "epoch": 1.1, + "learning_rate": 1.4663865315543005e-06, + "loss": 0.5496, + "step": 42745 + }, + { + "epoch": 1.1, + "learning_rate": 1.466362054617079e-06, + "loss": 0.6152, + "step": 42746 + }, + { + "epoch": 1.1, + "learning_rate": 1.4663375773227853e-06, + "loss": 0.7588, + "step": 42747 + }, + { + "epoch": 1.1, + "learning_rate": 1.4663130996714384e-06, + "loss": 0.8438, + "step": 42748 + }, + { + "epoch": 1.1, + "learning_rate": 1.4662886216630567e-06, + "loss": 0.5176, + "step": 42749 + }, + { + "epoch": 1.1, + "learning_rate": 1.4662641432976598e-06, + "loss": 0.6987, + "step": 42750 + }, + { + "epoch": 1.1, + "learning_rate": 1.4662396645752653e-06, + "loss": 0.5643, + "step": 42751 + }, + { + "epoch": 1.1, + "learning_rate": 1.4662151854958933e-06, + "loss": 0.791, + "step": 42752 + }, + { + "epoch": 1.1, + "learning_rate": 1.466190706059561e-06, + "loss": 0.548, + "step": 42753 + }, + { + "epoch": 1.1, + "learning_rate": 1.4661662262662884e-06, + "loss": 0.5142, + "step": 42754 + }, + { + "epoch": 1.1, + "learning_rate": 1.4661417461160933e-06, + "loss": 0.7363, + "step": 42755 + }, + { + "epoch": 1.1, + "learning_rate": 1.4661172656089954e-06, + "loss": 0.6479, + "step": 42756 + }, + { + "epoch": 1.1, + "learning_rate": 1.4660927847450126e-06, + "loss": 0.7666, + "step": 42757 + }, + { + "epoch": 1.1, + "learning_rate": 1.4660683035241642e-06, + "loss": 0.6191, + "step": 42758 + }, + { + "epoch": 1.1, + "learning_rate": 1.4660438219464685e-06, + "loss": 0.6738, + "step": 42759 + }, + { + "epoch": 1.1, + "learning_rate": 1.4660193400119447e-06, + "loss": 0.6973, + "step": 42760 + }, + { + "epoch": 1.1, + "learning_rate": 1.465994857720611e-06, + "loss": 0.8506, + "step": 42761 + }, + { + "epoch": 1.1, + "learning_rate": 1.465970375072487e-06, + "loss": 0.7969, + "step": 42762 + }, + { + "epoch": 1.1, + "learning_rate": 1.4659458920675907e-06, + "loss": 0.4927, + "step": 42763 + }, + { + "epoch": 1.1, + "learning_rate": 1.465921408705941e-06, + "loss": 0.5603, + "step": 42764 + }, + { + "epoch": 1.1, + "learning_rate": 1.4658969249875566e-06, + "loss": 0.6924, + "step": 42765 + }, + { + "epoch": 1.1, + "learning_rate": 1.4658724409124563e-06, + "loss": 0.6777, + "step": 42766 + }, + { + "epoch": 1.1, + "learning_rate": 1.4658479564806591e-06, + "loss": 0.5757, + "step": 42767 + }, + { + "epoch": 1.1, + "learning_rate": 1.4658234716921834e-06, + "loss": 0.603, + "step": 42768 + }, + { + "epoch": 1.1, + "learning_rate": 1.4657989865470481e-06, + "loss": 0.6328, + "step": 42769 + }, + { + "epoch": 1.1, + "learning_rate": 1.4657745010452717e-06, + "loss": 0.7705, + "step": 42770 + }, + { + "epoch": 1.1, + "learning_rate": 1.4657500151868735e-06, + "loss": 0.8018, + "step": 42771 + }, + { + "epoch": 1.1, + "learning_rate": 1.465725528971872e-06, + "loss": 0.6455, + "step": 42772 + }, + { + "epoch": 1.1, + "learning_rate": 1.465701042400286e-06, + "loss": 0.6631, + "step": 42773 + }, + { + "epoch": 1.1, + "learning_rate": 1.4656765554721338e-06, + "loss": 0.6396, + "step": 42774 + }, + { + "epoch": 1.1, + "learning_rate": 1.4656520681874344e-06, + "loss": 0.6768, + "step": 42775 + }, + { + "epoch": 1.1, + "learning_rate": 1.4656275805462065e-06, + "loss": 0.7461, + "step": 42776 + }, + { + "epoch": 1.1, + "learning_rate": 1.4656030925484697e-06, + "loss": 0.6342, + "step": 42777 + }, + { + "epoch": 1.1, + "learning_rate": 1.4655786041942415e-06, + "loss": 0.6558, + "step": 42778 + }, + { + "epoch": 1.1, + "learning_rate": 1.4655541154835413e-06, + "loss": 0.66, + "step": 42779 + }, + { + "epoch": 1.1, + "learning_rate": 1.4655296264163875e-06, + "loss": 0.6655, + "step": 42780 + }, + { + "epoch": 1.1, + "learning_rate": 1.465505136992799e-06, + "loss": 0.7168, + "step": 42781 + }, + { + "epoch": 1.1, + "learning_rate": 1.4654806472127952e-06, + "loss": 0.5083, + "step": 42782 + }, + { + "epoch": 1.1, + "learning_rate": 1.465456157076394e-06, + "loss": 0.8008, + "step": 42783 + }, + { + "epoch": 1.1, + "learning_rate": 1.4654316665836142e-06, + "loss": 0.8652, + "step": 42784 + }, + { + "epoch": 1.1, + "learning_rate": 1.4654071757344748e-06, + "loss": 0.665, + "step": 42785 + }, + { + "epoch": 1.1, + "learning_rate": 1.4653826845289948e-06, + "loss": 0.5708, + "step": 42786 + }, + { + "epoch": 1.1, + "learning_rate": 1.4653581929671926e-06, + "loss": 0.6377, + "step": 42787 + }, + { + "epoch": 1.1, + "learning_rate": 1.465333701049087e-06, + "loss": 0.6992, + "step": 42788 + }, + { + "epoch": 1.1, + "learning_rate": 1.4653092087746965e-06, + "loss": 0.4055, + "step": 42789 + }, + { + "epoch": 1.1, + "learning_rate": 1.4652847161440405e-06, + "loss": 0.7065, + "step": 42790 + }, + { + "epoch": 1.1, + "learning_rate": 1.4652602231571369e-06, + "loss": 0.8213, + "step": 42791 + }, + { + "epoch": 1.1, + "learning_rate": 1.4652357298140057e-06, + "loss": 0.7607, + "step": 42792 + }, + { + "epoch": 1.1, + "learning_rate": 1.4652112361146642e-06, + "loss": 0.7119, + "step": 42793 + }, + { + "epoch": 1.1, + "learning_rate": 1.4651867420591324e-06, + "loss": 0.6411, + "step": 42794 + }, + { + "epoch": 1.1, + "learning_rate": 1.4651622476474279e-06, + "loss": 0.6582, + "step": 42795 + }, + { + "epoch": 1.1, + "learning_rate": 1.4651377528795706e-06, + "loss": 0.7012, + "step": 42796 + }, + { + "epoch": 1.1, + "learning_rate": 1.4651132577555785e-06, + "loss": 0.5624, + "step": 42797 + }, + { + "epoch": 1.1, + "learning_rate": 1.4650887622754706e-06, + "loss": 0.3966, + "step": 42798 + }, + { + "epoch": 1.1, + "learning_rate": 1.4650642664392655e-06, + "loss": 0.623, + "step": 42799 + }, + { + "epoch": 1.1, + "learning_rate": 1.4650397702469821e-06, + "loss": 0.5547, + "step": 42800 + }, + { + "epoch": 1.1, + "learning_rate": 1.465015273698639e-06, + "loss": 0.5732, + "step": 42801 + }, + { + "epoch": 1.1, + "learning_rate": 1.4649907767942558e-06, + "loss": 0.4348, + "step": 42802 + }, + { + "epoch": 1.1, + "learning_rate": 1.4649662795338498e-06, + "loss": 0.6602, + "step": 42803 + }, + { + "epoch": 1.1, + "learning_rate": 1.4649417819174409e-06, + "loss": 0.6152, + "step": 42804 + }, + { + "epoch": 1.1, + "learning_rate": 1.464917283945047e-06, + "loss": 0.7104, + "step": 42805 + }, + { + "epoch": 1.1, + "learning_rate": 1.4648927856166878e-06, + "loss": 0.623, + "step": 42806 + }, + { + "epoch": 1.1, + "learning_rate": 1.4648682869323814e-06, + "loss": 0.6567, + "step": 42807 + }, + { + "epoch": 1.1, + "learning_rate": 1.4648437878921464e-06, + "loss": 0.7949, + "step": 42808 + }, + { + "epoch": 1.1, + "learning_rate": 1.4648192884960022e-06, + "loss": 0.5835, + "step": 42809 + }, + { + "epoch": 1.1, + "learning_rate": 1.4647947887439671e-06, + "loss": 0.6694, + "step": 42810 + }, + { + "epoch": 1.1, + "learning_rate": 1.4647702886360603e-06, + "loss": 0.6841, + "step": 42811 + }, + { + "epoch": 1.1, + "learning_rate": 1.4647457881723e-06, + "loss": 0.6357, + "step": 42812 + }, + { + "epoch": 1.1, + "learning_rate": 1.4647212873527055e-06, + "loss": 0.7002, + "step": 42813 + }, + { + "epoch": 1.1, + "learning_rate": 1.464696786177295e-06, + "loss": 0.5874, + "step": 42814 + }, + { + "epoch": 1.1, + "learning_rate": 1.4646722846460877e-06, + "loss": 0.748, + "step": 42815 + }, + { + "epoch": 1.1, + "learning_rate": 1.4646477827591019e-06, + "loss": 0.8037, + "step": 42816 + }, + { + "epoch": 1.1, + "learning_rate": 1.4646232805163573e-06, + "loss": 0.5713, + "step": 42817 + }, + { + "epoch": 1.1, + "learning_rate": 1.4645987779178712e-06, + "loss": 0.5967, + "step": 42818 + }, + { + "epoch": 1.1, + "learning_rate": 1.4645742749636637e-06, + "loss": 0.5522, + "step": 42819 + }, + { + "epoch": 1.1, + "learning_rate": 1.4645497716537527e-06, + "loss": 0.478, + "step": 42820 + }, + { + "epoch": 1.1, + "learning_rate": 1.4645252679881577e-06, + "loss": 0.5962, + "step": 42821 + }, + { + "epoch": 1.1, + "learning_rate": 1.4645007639668968e-06, + "loss": 0.7734, + "step": 42822 + }, + { + "epoch": 1.1, + "learning_rate": 1.4644762595899892e-06, + "loss": 0.7744, + "step": 42823 + }, + { + "epoch": 1.1, + "learning_rate": 1.4644517548574534e-06, + "loss": 0.6914, + "step": 42824 + }, + { + "epoch": 1.1, + "learning_rate": 1.4644272497693081e-06, + "loss": 0.668, + "step": 42825 + }, + { + "epoch": 1.1, + "learning_rate": 1.4644027443255725e-06, + "loss": 0.5439, + "step": 42826 + }, + { + "epoch": 1.1, + "learning_rate": 1.464378238526265e-06, + "loss": 0.5918, + "step": 42827 + }, + { + "epoch": 1.1, + "learning_rate": 1.464353732371404e-06, + "loss": 0.6504, + "step": 42828 + }, + { + "epoch": 1.1, + "learning_rate": 1.4643292258610091e-06, + "loss": 0.5562, + "step": 42829 + }, + { + "epoch": 1.1, + "learning_rate": 1.4643047189950988e-06, + "loss": 0.708, + "step": 42830 + }, + { + "epoch": 1.1, + "learning_rate": 1.4642802117736913e-06, + "loss": 0.666, + "step": 42831 + }, + { + "epoch": 1.1, + "learning_rate": 1.4642557041968061e-06, + "loss": 0.5688, + "step": 42832 + }, + { + "epoch": 1.1, + "learning_rate": 1.4642311962644617e-06, + "loss": 0.6792, + "step": 42833 + }, + { + "epoch": 1.1, + "learning_rate": 1.4642066879766765e-06, + "loss": 0.7969, + "step": 42834 + }, + { + "epoch": 1.1, + "learning_rate": 1.4641821793334698e-06, + "loss": 0.7935, + "step": 42835 + }, + { + "epoch": 1.1, + "learning_rate": 1.4641576703348602e-06, + "loss": 0.6709, + "step": 42836 + }, + { + "epoch": 1.1, + "learning_rate": 1.4641331609808662e-06, + "loss": 0.7676, + "step": 42837 + }, + { + "epoch": 1.1, + "learning_rate": 1.4641086512715073e-06, + "loss": 0.5276, + "step": 42838 + }, + { + "epoch": 1.1, + "learning_rate": 1.464084141206801e-06, + "loss": 0.5996, + "step": 42839 + }, + { + "epoch": 1.1, + "learning_rate": 1.4640596307867674e-06, + "loss": 0.6826, + "step": 42840 + }, + { + "epoch": 1.1, + "learning_rate": 1.4640351200114244e-06, + "loss": 0.7227, + "step": 42841 + }, + { + "epoch": 1.1, + "learning_rate": 1.4640106088807913e-06, + "loss": 0.7461, + "step": 42842 + }, + { + "epoch": 1.1, + "learning_rate": 1.463986097394886e-06, + "loss": 0.6558, + "step": 42843 + }, + { + "epoch": 1.1, + "learning_rate": 1.4639615855537287e-06, + "loss": 0.6792, + "step": 42844 + }, + { + "epoch": 1.1, + "learning_rate": 1.4639370733573367e-06, + "loss": 0.4608, + "step": 42845 + }, + { + "epoch": 1.1, + "learning_rate": 1.4639125608057296e-06, + "loss": 0.6958, + "step": 42846 + }, + { + "epoch": 1.1, + "learning_rate": 1.4638880478989262e-06, + "loss": 0.6826, + "step": 42847 + }, + { + "epoch": 1.1, + "learning_rate": 1.463863534636945e-06, + "loss": 0.8281, + "step": 42848 + }, + { + "epoch": 1.1, + "learning_rate": 1.4638390210198045e-06, + "loss": 0.6768, + "step": 42849 + }, + { + "epoch": 1.1, + "learning_rate": 1.4638145070475241e-06, + "loss": 0.6152, + "step": 42850 + }, + { + "epoch": 1.1, + "learning_rate": 1.463789992720122e-06, + "loss": 0.7881, + "step": 42851 + }, + { + "epoch": 1.1, + "learning_rate": 1.4637654780376174e-06, + "loss": 0.6074, + "step": 42852 + }, + { + "epoch": 1.1, + "learning_rate": 1.4637409630000291e-06, + "loss": 0.6875, + "step": 42853 + }, + { + "epoch": 1.1, + "learning_rate": 1.4637164476073753e-06, + "loss": 0.7451, + "step": 42854 + }, + { + "epoch": 1.1, + "learning_rate": 1.4636919318596755e-06, + "loss": 0.75, + "step": 42855 + }, + { + "epoch": 1.1, + "learning_rate": 1.463667415756948e-06, + "loss": 0.4863, + "step": 42856 + }, + { + "epoch": 1.1, + "learning_rate": 1.4636428992992116e-06, + "loss": 0.5736, + "step": 42857 + }, + { + "epoch": 1.1, + "learning_rate": 1.463618382486485e-06, + "loss": 0.3523, + "step": 42858 + }, + { + "epoch": 1.1, + "learning_rate": 1.4635938653187871e-06, + "loss": 0.582, + "step": 42859 + }, + { + "epoch": 1.1, + "learning_rate": 1.4635693477961368e-06, + "loss": 0.5579, + "step": 42860 + }, + { + "epoch": 1.1, + "learning_rate": 1.463544829918553e-06, + "loss": 0.6228, + "step": 42861 + }, + { + "epoch": 1.1, + "learning_rate": 1.4635203116860543e-06, + "loss": 0.5052, + "step": 42862 + }, + { + "epoch": 1.1, + "learning_rate": 1.463495793098659e-06, + "loss": 0.6396, + "step": 42863 + }, + { + "epoch": 1.1, + "learning_rate": 1.4634712741563862e-06, + "loss": 0.6477, + "step": 42864 + }, + { + "epoch": 1.1, + "learning_rate": 1.4634467548592552e-06, + "loss": 0.7402, + "step": 42865 + }, + { + "epoch": 1.1, + "learning_rate": 1.4634222352072841e-06, + "loss": 0.6963, + "step": 42866 + }, + { + "epoch": 1.1, + "learning_rate": 1.4633977152004922e-06, + "loss": 0.8154, + "step": 42867 + }, + { + "epoch": 1.1, + "learning_rate": 1.4633731948388974e-06, + "loss": 0.5996, + "step": 42868 + }, + { + "epoch": 1.1, + "learning_rate": 1.4633486741225193e-06, + "loss": 0.7041, + "step": 42869 + }, + { + "epoch": 1.1, + "learning_rate": 1.4633241530513764e-06, + "loss": 0.6729, + "step": 42870 + }, + { + "epoch": 1.1, + "learning_rate": 1.4632996316254877e-06, + "loss": 0.709, + "step": 42871 + }, + { + "epoch": 1.1, + "learning_rate": 1.4632751098448718e-06, + "loss": 0.6709, + "step": 42872 + }, + { + "epoch": 1.1, + "learning_rate": 1.4632505877095473e-06, + "loss": 0.7163, + "step": 42873 + }, + { + "epoch": 1.1, + "learning_rate": 1.4632260652195332e-06, + "loss": 0.583, + "step": 42874 + }, + { + "epoch": 1.1, + "learning_rate": 1.463201542374848e-06, + "loss": 0.5049, + "step": 42875 + }, + { + "epoch": 1.1, + "learning_rate": 1.463177019175511e-06, + "loss": 0.7642, + "step": 42876 + }, + { + "epoch": 1.1, + "learning_rate": 1.4631524956215405e-06, + "loss": 0.5513, + "step": 42877 + }, + { + "epoch": 1.1, + "learning_rate": 1.4631279717129554e-06, + "loss": 0.6562, + "step": 42878 + }, + { + "epoch": 1.1, + "learning_rate": 1.4631034474497744e-06, + "loss": 0.4863, + "step": 42879 + }, + { + "epoch": 1.1, + "learning_rate": 1.4630789228320163e-06, + "loss": 0.6177, + "step": 42880 + }, + { + "epoch": 1.1, + "learning_rate": 1.4630543978597004e-06, + "loss": 0.6035, + "step": 42881 + }, + { + "epoch": 1.1, + "learning_rate": 1.4630298725328449e-06, + "loss": 0.7002, + "step": 42882 + }, + { + "epoch": 1.1, + "learning_rate": 1.4630053468514686e-06, + "loss": 0.3999, + "step": 42883 + }, + { + "epoch": 1.1, + "learning_rate": 1.4629808208155903e-06, + "loss": 0.6045, + "step": 42884 + }, + { + "epoch": 1.1, + "learning_rate": 1.462956294425229e-06, + "loss": 0.5986, + "step": 42885 + }, + { + "epoch": 1.1, + "learning_rate": 1.4629317676804033e-06, + "loss": 0.5093, + "step": 42886 + }, + { + "epoch": 1.1, + "learning_rate": 1.4629072405811322e-06, + "loss": 0.5981, + "step": 42887 + }, + { + "epoch": 1.1, + "learning_rate": 1.462882713127434e-06, + "loss": 0.7227, + "step": 42888 + }, + { + "epoch": 1.1, + "learning_rate": 1.462858185319328e-06, + "loss": 0.7988, + "step": 42889 + }, + { + "epoch": 1.1, + "learning_rate": 1.4628336571568328e-06, + "loss": 0.5225, + "step": 42890 + }, + { + "epoch": 1.1, + "learning_rate": 1.4628091286399671e-06, + "loss": 0.593, + "step": 42891 + }, + { + "epoch": 1.1, + "learning_rate": 1.4627845997687499e-06, + "loss": 0.6501, + "step": 42892 + }, + { + "epoch": 1.1, + "learning_rate": 1.4627600705431995e-06, + "loss": 0.5986, + "step": 42893 + }, + { + "epoch": 1.1, + "learning_rate": 1.4627355409633354e-06, + "loss": 0.6943, + "step": 42894 + }, + { + "epoch": 1.1, + "learning_rate": 1.4627110110291754e-06, + "loss": 0.7607, + "step": 42895 + }, + { + "epoch": 1.1, + "learning_rate": 1.462686480740739e-06, + "loss": 0.6162, + "step": 42896 + }, + { + "epoch": 1.1, + "learning_rate": 1.4626619500980454e-06, + "loss": 0.7646, + "step": 42897 + }, + { + "epoch": 1.1, + "learning_rate": 1.462637419101112e-06, + "loss": 0.7378, + "step": 42898 + }, + { + "epoch": 1.1, + "learning_rate": 1.4626128877499588e-06, + "loss": 0.5435, + "step": 42899 + }, + { + "epoch": 1.1, + "learning_rate": 1.4625883560446042e-06, + "loss": 0.6748, + "step": 42900 + }, + { + "epoch": 1.1, + "learning_rate": 1.462563823985067e-06, + "loss": 0.75, + "step": 42901 + }, + { + "epoch": 1.1, + "learning_rate": 1.4625392915713662e-06, + "loss": 0.6963, + "step": 42902 + }, + { + "epoch": 1.1, + "learning_rate": 1.46251475880352e-06, + "loss": 0.6333, + "step": 42903 + }, + { + "epoch": 1.1, + "learning_rate": 1.4624902256815475e-06, + "loss": 0.8789, + "step": 42904 + }, + { + "epoch": 1.1, + "learning_rate": 1.4624656922054674e-06, + "loss": 0.626, + "step": 42905 + }, + { + "epoch": 1.1, + "learning_rate": 1.4624411583752987e-06, + "loss": 0.7754, + "step": 42906 + }, + { + "epoch": 1.1, + "learning_rate": 1.4624166241910603e-06, + "loss": 0.5952, + "step": 42907 + }, + { + "epoch": 1.1, + "learning_rate": 1.4623920896527703e-06, + "loss": 0.698, + "step": 42908 + }, + { + "epoch": 1.1, + "learning_rate": 1.4623675547604486e-06, + "loss": 0.7305, + "step": 42909 + }, + { + "epoch": 1.1, + "learning_rate": 1.4623430195141126e-06, + "loss": 0.749, + "step": 42910 + }, + { + "epoch": 1.1, + "learning_rate": 1.4623184839137823e-06, + "loss": 0.6294, + "step": 42911 + }, + { + "epoch": 1.1, + "learning_rate": 1.4622939479594759e-06, + "loss": 0.6533, + "step": 42912 + }, + { + "epoch": 1.1, + "learning_rate": 1.4622694116512121e-06, + "loss": 0.5737, + "step": 42913 + }, + { + "epoch": 1.1, + "learning_rate": 1.46224487498901e-06, + "loss": 0.7393, + "step": 42914 + }, + { + "epoch": 1.1, + "learning_rate": 1.4622203379728884e-06, + "loss": 0.6895, + "step": 42915 + }, + { + "epoch": 1.1, + "learning_rate": 1.4621958006028657e-06, + "loss": 0.5347, + "step": 42916 + }, + { + "epoch": 1.1, + "learning_rate": 1.462171262878961e-06, + "loss": 0.5554, + "step": 42917 + }, + { + "epoch": 1.1, + "learning_rate": 1.462146724801193e-06, + "loss": 0.833, + "step": 42918 + }, + { + "epoch": 1.1, + "learning_rate": 1.4621221863695805e-06, + "loss": 0.668, + "step": 42919 + }, + { + "epoch": 1.1, + "learning_rate": 1.4620976475841423e-06, + "loss": 0.6226, + "step": 42920 + }, + { + "epoch": 1.1, + "learning_rate": 1.462073108444897e-06, + "loss": 0.6138, + "step": 42921 + }, + { + "epoch": 1.1, + "learning_rate": 1.462048568951864e-06, + "loss": 0.8682, + "step": 42922 + }, + { + "epoch": 1.1, + "learning_rate": 1.4620240291050615e-06, + "loss": 0.6895, + "step": 42923 + }, + { + "epoch": 1.1, + "learning_rate": 1.4619994889045081e-06, + "loss": 0.6223, + "step": 42924 + }, + { + "epoch": 1.1, + "learning_rate": 1.4619749483502233e-06, + "loss": 0.5752, + "step": 42925 + }, + { + "epoch": 1.1, + "learning_rate": 1.4619504074422252e-06, + "loss": 0.8066, + "step": 42926 + }, + { + "epoch": 1.1, + "learning_rate": 1.4619258661805334e-06, + "loss": 0.6147, + "step": 42927 + }, + { + "epoch": 1.1, + "learning_rate": 1.4619013245651659e-06, + "loss": 0.752, + "step": 42928 + }, + { + "epoch": 1.1, + "learning_rate": 1.4618767825961418e-06, + "loss": 0.7969, + "step": 42929 + }, + { + "epoch": 1.1, + "learning_rate": 1.46185224027348e-06, + "loss": 0.8291, + "step": 42930 + }, + { + "epoch": 1.1, + "learning_rate": 1.4618276975971988e-06, + "loss": 0.6577, + "step": 42931 + }, + { + "epoch": 1.1, + "learning_rate": 1.461803154567318e-06, + "loss": 0.6089, + "step": 42932 + }, + { + "epoch": 1.1, + "learning_rate": 1.4617786111838552e-06, + "loss": 0.7529, + "step": 42933 + }, + { + "epoch": 1.1, + "learning_rate": 1.46175406744683e-06, + "loss": 0.6572, + "step": 42934 + }, + { + "epoch": 1.1, + "learning_rate": 1.461729523356261e-06, + "loss": 0.8398, + "step": 42935 + }, + { + "epoch": 1.1, + "learning_rate": 1.461704978912167e-06, + "loss": 0.6216, + "step": 42936 + }, + { + "epoch": 1.1, + "learning_rate": 1.4616804341145664e-06, + "loss": 0.5586, + "step": 42937 + }, + { + "epoch": 1.1, + "learning_rate": 1.4616558889634788e-06, + "loss": 0.6094, + "step": 42938 + }, + { + "epoch": 1.1, + "learning_rate": 1.4616313434589218e-06, + "loss": 0.7065, + "step": 42939 + }, + { + "epoch": 1.1, + "learning_rate": 1.4616067976009153e-06, + "loss": 0.7773, + "step": 42940 + }, + { + "epoch": 1.1, + "learning_rate": 1.4615822513894778e-06, + "loss": 0.4971, + "step": 42941 + }, + { + "epoch": 1.1, + "learning_rate": 1.4615577048246279e-06, + "loss": 0.6948, + "step": 42942 + }, + { + "epoch": 1.1, + "learning_rate": 1.4615331579063845e-06, + "loss": 0.6523, + "step": 42943 + }, + { + "epoch": 1.1, + "learning_rate": 1.4615086106347663e-06, + "loss": 0.626, + "step": 42944 + }, + { + "epoch": 1.1, + "learning_rate": 1.4614840630097923e-06, + "loss": 0.6826, + "step": 42945 + }, + { + "epoch": 1.1, + "learning_rate": 1.4614595150314811e-06, + "loss": 0.7588, + "step": 42946 + }, + { + "epoch": 1.1, + "learning_rate": 1.4614349666998518e-06, + "loss": 0.5205, + "step": 42947 + }, + { + "epoch": 1.1, + "learning_rate": 1.4614104180149228e-06, + "loss": 0.6621, + "step": 42948 + }, + { + "epoch": 1.1, + "learning_rate": 1.461385868976713e-06, + "loss": 0.6694, + "step": 42949 + }, + { + "epoch": 1.1, + "learning_rate": 1.461361319585241e-06, + "loss": 0.873, + "step": 42950 + }, + { + "epoch": 1.1, + "learning_rate": 1.4613367698405262e-06, + "loss": 0.5923, + "step": 42951 + }, + { + "epoch": 1.1, + "learning_rate": 1.461312219742587e-06, + "loss": 0.6431, + "step": 42952 + }, + { + "epoch": 1.1, + "learning_rate": 1.4612876692914424e-06, + "loss": 0.6401, + "step": 42953 + }, + { + "epoch": 1.1, + "learning_rate": 1.4612631184871108e-06, + "loss": 0.6411, + "step": 42954 + }, + { + "epoch": 1.1, + "learning_rate": 1.4612385673296113e-06, + "loss": 0.644, + "step": 42955 + }, + { + "epoch": 1.1, + "learning_rate": 1.4612140158189625e-06, + "loss": 0.7891, + "step": 42956 + }, + { + "epoch": 1.1, + "learning_rate": 1.4611894639551837e-06, + "loss": 0.584, + "step": 42957 + }, + { + "epoch": 1.1, + "learning_rate": 1.461164911738293e-06, + "loss": 0.6211, + "step": 42958 + }, + { + "epoch": 1.1, + "learning_rate": 1.4611403591683095e-06, + "loss": 0.6152, + "step": 42959 + }, + { + "epoch": 1.1, + "learning_rate": 1.4611158062452523e-06, + "loss": 0.4648, + "step": 42960 + }, + { + "epoch": 1.1, + "learning_rate": 1.4610912529691396e-06, + "loss": 0.6365, + "step": 42961 + }, + { + "epoch": 1.1, + "learning_rate": 1.4610666993399909e-06, + "loss": 0.6523, + "step": 42962 + }, + { + "epoch": 1.1, + "learning_rate": 1.4610421453578244e-06, + "loss": 0.7334, + "step": 42963 + }, + { + "epoch": 1.1, + "learning_rate": 1.4610175910226592e-06, + "loss": 0.7031, + "step": 42964 + }, + { + "epoch": 1.1, + "learning_rate": 1.4609930363345143e-06, + "loss": 0.604, + "step": 42965 + }, + { + "epoch": 1.1, + "learning_rate": 1.4609684812934075e-06, + "loss": 0.8154, + "step": 42966 + }, + { + "epoch": 1.1, + "learning_rate": 1.460943925899359e-06, + "loss": 0.542, + "step": 42967 + }, + { + "epoch": 1.1, + "learning_rate": 1.4609193701523868e-06, + "loss": 0.7856, + "step": 42968 + }, + { + "epoch": 1.1, + "learning_rate": 1.4608948140525096e-06, + "loss": 0.603, + "step": 42969 + }, + { + "epoch": 1.1, + "learning_rate": 1.4608702575997466e-06, + "loss": 0.623, + "step": 42970 + }, + { + "epoch": 1.1, + "learning_rate": 1.4608457007941165e-06, + "loss": 0.7607, + "step": 42971 + }, + { + "epoch": 1.1, + "learning_rate": 1.4608211436356379e-06, + "loss": 0.6685, + "step": 42972 + }, + { + "epoch": 1.1, + "learning_rate": 1.4607965861243296e-06, + "loss": 0.6562, + "step": 42973 + }, + { + "epoch": 1.1, + "learning_rate": 1.4607720282602109e-06, + "loss": 0.6161, + "step": 42974 + }, + { + "epoch": 1.1, + "learning_rate": 1.4607474700433e-06, + "loss": 0.8242, + "step": 42975 + }, + { + "epoch": 1.1, + "learning_rate": 1.4607229114736162e-06, + "loss": 0.7109, + "step": 42976 + }, + { + "epoch": 1.1, + "learning_rate": 1.4606983525511779e-06, + "loss": 0.5647, + "step": 42977 + }, + { + "epoch": 1.1, + "learning_rate": 1.4606737932760037e-06, + "loss": 0.7012, + "step": 42978 + }, + { + "epoch": 1.1, + "learning_rate": 1.4606492336481134e-06, + "loss": 0.6953, + "step": 42979 + }, + { + "epoch": 1.1, + "learning_rate": 1.4606246736675247e-06, + "loss": 0.6836, + "step": 42980 + }, + { + "epoch": 1.1, + "learning_rate": 1.460600113334257e-06, + "loss": 0.5184, + "step": 42981 + }, + { + "epoch": 1.1, + "learning_rate": 1.4605755526483293e-06, + "loss": 0.665, + "step": 42982 + }, + { + "epoch": 1.1, + "learning_rate": 1.4605509916097596e-06, + "loss": 0.75, + "step": 42983 + }, + { + "epoch": 1.1, + "learning_rate": 1.460526430218567e-06, + "loss": 0.6992, + "step": 42984 + }, + { + "epoch": 1.1, + "learning_rate": 1.460501868474771e-06, + "loss": 0.5952, + "step": 42985 + }, + { + "epoch": 1.1, + "learning_rate": 1.4604773063783898e-06, + "loss": 0.6777, + "step": 42986 + }, + { + "epoch": 1.1, + "learning_rate": 1.4604527439294423e-06, + "loss": 0.6858, + "step": 42987 + }, + { + "epoch": 1.1, + "learning_rate": 1.4604281811279472e-06, + "loss": 0.6719, + "step": 42988 + }, + { + "epoch": 1.1, + "learning_rate": 1.4604036179739235e-06, + "loss": 0.7656, + "step": 42989 + }, + { + "epoch": 1.1, + "learning_rate": 1.4603790544673895e-06, + "loss": 0.6099, + "step": 42990 + }, + { + "epoch": 1.1, + "learning_rate": 1.4603544906083652e-06, + "loss": 0.7812, + "step": 42991 + }, + { + "epoch": 1.1, + "learning_rate": 1.4603299263968681e-06, + "loss": 0.7061, + "step": 42992 + }, + { + "epoch": 1.1, + "learning_rate": 1.4603053618329177e-06, + "loss": 0.5762, + "step": 42993 + }, + { + "epoch": 1.1, + "learning_rate": 1.4602807969165325e-06, + "loss": 0.7285, + "step": 42994 + }, + { + "epoch": 1.1, + "learning_rate": 1.4602562316477316e-06, + "loss": 0.7061, + "step": 42995 + }, + { + "epoch": 1.1, + "learning_rate": 1.4602316660265336e-06, + "loss": 0.5737, + "step": 42996 + }, + { + "epoch": 1.1, + "learning_rate": 1.4602071000529575e-06, + "loss": 0.71, + "step": 42997 + }, + { + "epoch": 1.1, + "learning_rate": 1.4601825337270218e-06, + "loss": 0.6694, + "step": 42998 + }, + { + "epoch": 1.1, + "learning_rate": 1.4601579670487456e-06, + "loss": 0.6992, + "step": 42999 + }, + { + "epoch": 1.1, + "learning_rate": 1.4601334000181475e-06, + "loss": 0.4534, + "step": 43000 + }, + { + "epoch": 1.1, + "learning_rate": 1.4601088326352468e-06, + "loss": 0.6143, + "step": 43001 + }, + { + "epoch": 1.1, + "learning_rate": 1.4600842649000615e-06, + "loss": 0.8281, + "step": 43002 + }, + { + "epoch": 1.1, + "learning_rate": 1.4600596968126111e-06, + "loss": 0.6846, + "step": 43003 + }, + { + "epoch": 1.1, + "learning_rate": 1.460035128372914e-06, + "loss": 0.6304, + "step": 43004 + }, + { + "epoch": 1.1, + "learning_rate": 1.460010559580989e-06, + "loss": 0.6611, + "step": 43005 + }, + { + "epoch": 1.1, + "learning_rate": 1.4599859904368555e-06, + "loss": 0.6499, + "step": 43006 + }, + { + "epoch": 1.1, + "learning_rate": 1.4599614209405312e-06, + "loss": 0.4458, + "step": 43007 + }, + { + "epoch": 1.1, + "learning_rate": 1.4599368510920362e-06, + "loss": 0.6099, + "step": 43008 + }, + { + "epoch": 1.1, + "learning_rate": 1.4599122808913885e-06, + "loss": 0.6519, + "step": 43009 + }, + { + "epoch": 1.1, + "learning_rate": 1.4598877103386072e-06, + "loss": 0.4739, + "step": 43010 + }, + { + "epoch": 1.1, + "learning_rate": 1.459863139433711e-06, + "loss": 0.5663, + "step": 43011 + }, + { + "epoch": 1.1, + "learning_rate": 1.4598385681767187e-06, + "loss": 0.606, + "step": 43012 + }, + { + "epoch": 1.1, + "learning_rate": 1.4598139965676488e-06, + "loss": 0.7012, + "step": 43013 + }, + { + "epoch": 1.1, + "learning_rate": 1.459789424606521e-06, + "loss": 0.6152, + "step": 43014 + }, + { + "epoch": 1.1, + "learning_rate": 1.4597648522933533e-06, + "loss": 0.6201, + "step": 43015 + }, + { + "epoch": 1.1, + "learning_rate": 1.459740279628165e-06, + "loss": 0.6689, + "step": 43016 + }, + { + "epoch": 1.1, + "learning_rate": 1.4597157066109746e-06, + "loss": 0.7852, + "step": 43017 + }, + { + "epoch": 1.1, + "learning_rate": 1.459691133241801e-06, + "loss": 0.6313, + "step": 43018 + }, + { + "epoch": 1.1, + "learning_rate": 1.459666559520663e-06, + "loss": 0.874, + "step": 43019 + }, + { + "epoch": 1.1, + "learning_rate": 1.4596419854475795e-06, + "loss": 0.6953, + "step": 43020 + }, + { + "epoch": 1.1, + "learning_rate": 1.4596174110225691e-06, + "loss": 0.751, + "step": 43021 + }, + { + "epoch": 1.1, + "learning_rate": 1.459592836245651e-06, + "loss": 0.7803, + "step": 43022 + }, + { + "epoch": 1.1, + "learning_rate": 1.4595682611168439e-06, + "loss": 0.7852, + "step": 43023 + }, + { + "epoch": 1.1, + "learning_rate": 1.4595436856361664e-06, + "loss": 0.7178, + "step": 43024 + }, + { + "epoch": 1.1, + "learning_rate": 1.459519109803637e-06, + "loss": 0.6963, + "step": 43025 + }, + { + "epoch": 1.1, + "learning_rate": 1.4594945336192757e-06, + "loss": 0.543, + "step": 43026 + }, + { + "epoch": 1.1, + "learning_rate": 1.4594699570831002e-06, + "loss": 0.7139, + "step": 43027 + }, + { + "epoch": 1.1, + "learning_rate": 1.4594453801951297e-06, + "loss": 0.791, + "step": 43028 + }, + { + "epoch": 1.1, + "learning_rate": 1.4594208029553827e-06, + "loss": 0.5742, + "step": 43029 + }, + { + "epoch": 1.1, + "learning_rate": 1.4593962253638787e-06, + "loss": 0.709, + "step": 43030 + }, + { + "epoch": 1.1, + "learning_rate": 1.459371647420636e-06, + "loss": 0.7734, + "step": 43031 + }, + { + "epoch": 1.1, + "learning_rate": 1.4593470691256735e-06, + "loss": 0.4727, + "step": 43032 + }, + { + "epoch": 1.1, + "learning_rate": 1.4593224904790103e-06, + "loss": 0.5889, + "step": 43033 + }, + { + "epoch": 1.1, + "learning_rate": 1.4592979114806644e-06, + "loss": 0.5042, + "step": 43034 + }, + { + "epoch": 1.1, + "learning_rate": 1.4592733321306559e-06, + "loss": 0.5967, + "step": 43035 + }, + { + "epoch": 1.1, + "learning_rate": 1.4592487524290027e-06, + "loss": 0.6807, + "step": 43036 + }, + { + "epoch": 1.1, + "learning_rate": 1.4592241723757239e-06, + "loss": 0.5337, + "step": 43037 + }, + { + "epoch": 1.1, + "learning_rate": 1.459199591970838e-06, + "loss": 0.6445, + "step": 43038 + }, + { + "epoch": 1.1, + "learning_rate": 1.4591750112143644e-06, + "loss": 0.7861, + "step": 43039 + }, + { + "epoch": 1.1, + "learning_rate": 1.4591504301063214e-06, + "loss": 0.7695, + "step": 43040 + }, + { + "epoch": 1.1, + "learning_rate": 1.4591258486467284e-06, + "loss": 0.7007, + "step": 43041 + }, + { + "epoch": 1.1, + "learning_rate": 1.4591012668356034e-06, + "loss": 0.5815, + "step": 43042 + }, + { + "epoch": 1.1, + "learning_rate": 1.4590766846729658e-06, + "loss": 0.6904, + "step": 43043 + }, + { + "epoch": 1.1, + "learning_rate": 1.4590521021588342e-06, + "loss": 0.7881, + "step": 43044 + }, + { + "epoch": 1.1, + "learning_rate": 1.4590275192932277e-06, + "loss": 0.7158, + "step": 43045 + }, + { + "epoch": 1.1, + "learning_rate": 1.4590029360761648e-06, + "loss": 0.5063, + "step": 43046 + }, + { + "epoch": 1.1, + "learning_rate": 1.4589783525076647e-06, + "loss": 0.6572, + "step": 43047 + }, + { + "epoch": 1.1, + "learning_rate": 1.4589537685877457e-06, + "loss": 0.6992, + "step": 43048 + }, + { + "epoch": 1.1, + "learning_rate": 1.458929184316427e-06, + "loss": 0.6777, + "step": 43049 + }, + { + "epoch": 1.1, + "learning_rate": 1.4589045996937272e-06, + "loss": 0.7075, + "step": 43050 + }, + { + "epoch": 1.1, + "learning_rate": 1.4588800147196655e-06, + "loss": 0.6484, + "step": 43051 + }, + { + "epoch": 1.1, + "learning_rate": 1.4588554293942603e-06, + "loss": 0.751, + "step": 43052 + }, + { + "epoch": 1.1, + "learning_rate": 1.4588308437175308e-06, + "loss": 0.709, + "step": 43053 + }, + { + "epoch": 1.1, + "learning_rate": 1.4588062576894952e-06, + "loss": 0.5879, + "step": 43054 + }, + { + "epoch": 1.1, + "learning_rate": 1.4587816713101733e-06, + "loss": 0.6943, + "step": 43055 + }, + { + "epoch": 1.1, + "learning_rate": 1.4587570845795832e-06, + "loss": 0.71, + "step": 43056 + }, + { + "epoch": 1.1, + "learning_rate": 1.4587324974977436e-06, + "loss": 0.5811, + "step": 43057 + }, + { + "epoch": 1.1, + "learning_rate": 1.4587079100646737e-06, + "loss": 0.4819, + "step": 43058 + }, + { + "epoch": 1.1, + "learning_rate": 1.4586833222803922e-06, + "loss": 0.7686, + "step": 43059 + }, + { + "epoch": 1.1, + "learning_rate": 1.4586587341449184e-06, + "loss": 0.6475, + "step": 43060 + }, + { + "epoch": 1.1, + "learning_rate": 1.4586341456582702e-06, + "loss": 0.7363, + "step": 43061 + }, + { + "epoch": 1.1, + "learning_rate": 1.4586095568204673e-06, + "loss": 0.6943, + "step": 43062 + }, + { + "epoch": 1.1, + "learning_rate": 1.4585849676315277e-06, + "loss": 0.6538, + "step": 43063 + }, + { + "epoch": 1.1, + "learning_rate": 1.4585603780914712e-06, + "loss": 0.6211, + "step": 43064 + }, + { + "epoch": 1.1, + "learning_rate": 1.4585357882003158e-06, + "loss": 0.6689, + "step": 43065 + }, + { + "epoch": 1.1, + "learning_rate": 1.4585111979580808e-06, + "loss": 0.7393, + "step": 43066 + }, + { + "epoch": 1.1, + "learning_rate": 1.4584866073647848e-06, + "loss": 0.6396, + "step": 43067 + }, + { + "epoch": 1.1, + "learning_rate": 1.4584620164204466e-06, + "loss": 0.5938, + "step": 43068 + }, + { + "epoch": 1.1, + "learning_rate": 1.458437425125085e-06, + "loss": 0.511, + "step": 43069 + }, + { + "epoch": 1.1, + "learning_rate": 1.458412833478719e-06, + "loss": 0.5962, + "step": 43070 + }, + { + "epoch": 1.1, + "learning_rate": 1.4583882414813677e-06, + "loss": 0.6938, + "step": 43071 + }, + { + "epoch": 1.1, + "learning_rate": 1.4583636491330492e-06, + "loss": 0.5347, + "step": 43072 + }, + { + "epoch": 1.1, + "learning_rate": 1.458339056433783e-06, + "loss": 0.8008, + "step": 43073 + }, + { + "epoch": 1.1, + "learning_rate": 1.4583144633835875e-06, + "loss": 0.6494, + "step": 43074 + }, + { + "epoch": 1.1, + "learning_rate": 1.4582898699824816e-06, + "loss": 0.8926, + "step": 43075 + }, + { + "epoch": 1.1, + "learning_rate": 1.4582652762304846e-06, + "loss": 0.5312, + "step": 43076 + }, + { + "epoch": 1.1, + "learning_rate": 1.4582406821276147e-06, + "loss": 0.459, + "step": 43077 + }, + { + "epoch": 1.1, + "learning_rate": 1.458216087673891e-06, + "loss": 0.6294, + "step": 43078 + }, + { + "epoch": 1.1, + "learning_rate": 1.4581914928693323e-06, + "loss": 0.6475, + "step": 43079 + }, + { + "epoch": 1.1, + "learning_rate": 1.4581668977139572e-06, + "loss": 0.7036, + "step": 43080 + }, + { + "epoch": 1.1, + "learning_rate": 1.4581423022077854e-06, + "loss": 0.7656, + "step": 43081 + }, + { + "epoch": 1.1, + "learning_rate": 1.4581177063508346e-06, + "loss": 0.5913, + "step": 43082 + }, + { + "epoch": 1.1, + "learning_rate": 1.4580931101431243e-06, + "loss": 0.6807, + "step": 43083 + }, + { + "epoch": 1.1, + "learning_rate": 1.458068513584673e-06, + "loss": 0.6182, + "step": 43084 + }, + { + "epoch": 1.1, + "learning_rate": 1.4580439166754998e-06, + "loss": 0.6494, + "step": 43085 + }, + { + "epoch": 1.1, + "learning_rate": 1.4580193194156235e-06, + "loss": 0.7256, + "step": 43086 + }, + { + "epoch": 1.1, + "learning_rate": 1.457994721805063e-06, + "loss": 0.7422, + "step": 43087 + }, + { + "epoch": 1.1, + "learning_rate": 1.4579701238438369e-06, + "loss": 0.7842, + "step": 43088 + }, + { + "epoch": 1.1, + "learning_rate": 1.457945525531964e-06, + "loss": 0.4829, + "step": 43089 + }, + { + "epoch": 1.1, + "learning_rate": 1.4579209268694632e-06, + "loss": 0.75, + "step": 43090 + }, + { + "epoch": 1.1, + "learning_rate": 1.4578963278563539e-06, + "loss": 0.5791, + "step": 43091 + }, + { + "epoch": 1.1, + "learning_rate": 1.4578717284926538e-06, + "loss": 0.7383, + "step": 43092 + }, + { + "epoch": 1.1, + "learning_rate": 1.4578471287783827e-06, + "loss": 0.5801, + "step": 43093 + }, + { + "epoch": 1.1, + "learning_rate": 1.457822528713559e-06, + "loss": 0.4785, + "step": 43094 + }, + { + "epoch": 1.1, + "learning_rate": 1.457797928298202e-06, + "loss": 0.48, + "step": 43095 + }, + { + "epoch": 1.1, + "learning_rate": 1.4577733275323297e-06, + "loss": 0.458, + "step": 43096 + }, + { + "epoch": 1.1, + "learning_rate": 1.4577487264159613e-06, + "loss": 0.5933, + "step": 43097 + }, + { + "epoch": 1.1, + "learning_rate": 1.4577241249491162e-06, + "loss": 0.7227, + "step": 43098 + }, + { + "epoch": 1.1, + "learning_rate": 1.4576995231318128e-06, + "loss": 0.6533, + "step": 43099 + }, + { + "epoch": 1.1, + "learning_rate": 1.4576749209640695e-06, + "loss": 0.7588, + "step": 43100 + }, + { + "epoch": 1.1, + "learning_rate": 1.457650318445906e-06, + "loss": 0.6812, + "step": 43101 + }, + { + "epoch": 1.1, + "learning_rate": 1.4576257155773404e-06, + "loss": 0.5466, + "step": 43102 + }, + { + "epoch": 1.1, + "learning_rate": 1.4576011123583917e-06, + "loss": 0.7236, + "step": 43103 + }, + { + "epoch": 1.1, + "learning_rate": 1.4575765087890793e-06, + "loss": 0.6274, + "step": 43104 + }, + { + "epoch": 1.1, + "learning_rate": 1.4575519048694211e-06, + "loss": 0.5586, + "step": 43105 + }, + { + "epoch": 1.1, + "learning_rate": 1.4575273005994371e-06, + "loss": 0.7549, + "step": 43106 + }, + { + "epoch": 1.1, + "learning_rate": 1.457502695979145e-06, + "loss": 0.6724, + "step": 43107 + }, + { + "epoch": 1.1, + "learning_rate": 1.4574780910085642e-06, + "loss": 0.623, + "step": 43108 + }, + { + "epoch": 1.1, + "learning_rate": 1.4574534856877136e-06, + "loss": 0.7314, + "step": 43109 + }, + { + "epoch": 1.1, + "learning_rate": 1.4574288800166118e-06, + "loss": 0.7949, + "step": 43110 + }, + { + "epoch": 1.1, + "learning_rate": 1.4574042739952779e-06, + "loss": 0.751, + "step": 43111 + }, + { + "epoch": 1.1, + "learning_rate": 1.4573796676237303e-06, + "loss": 0.5382, + "step": 43112 + }, + { + "epoch": 1.11, + "learning_rate": 1.4573550609019883e-06, + "loss": 0.5798, + "step": 43113 + }, + { + "epoch": 1.11, + "learning_rate": 1.4573304538300705e-06, + "loss": 0.7441, + "step": 43114 + }, + { + "epoch": 1.11, + "learning_rate": 1.4573058464079957e-06, + "loss": 0.4563, + "step": 43115 + }, + { + "epoch": 1.11, + "learning_rate": 1.457281238635783e-06, + "loss": 0.772, + "step": 43116 + }, + { + "epoch": 1.11, + "learning_rate": 1.457256630513451e-06, + "loss": 0.623, + "step": 43117 + }, + { + "epoch": 1.11, + "learning_rate": 1.4572320220410187e-06, + "loss": 0.6914, + "step": 43118 + }, + { + "epoch": 1.11, + "learning_rate": 1.4572074132185047e-06, + "loss": 0.5283, + "step": 43119 + }, + { + "epoch": 1.11, + "learning_rate": 1.4571828040459281e-06, + "loss": 0.5957, + "step": 43120 + }, + { + "epoch": 1.11, + "learning_rate": 1.4571581945233077e-06, + "loss": 0.6548, + "step": 43121 + }, + { + "epoch": 1.11, + "learning_rate": 1.4571335846506622e-06, + "loss": 0.7578, + "step": 43122 + }, + { + "epoch": 1.11, + "learning_rate": 1.457108974428011e-06, + "loss": 0.6758, + "step": 43123 + }, + { + "epoch": 1.11, + "learning_rate": 1.457084363855372e-06, + "loss": 0.6674, + "step": 43124 + }, + { + "epoch": 1.11, + "learning_rate": 1.4570597529327644e-06, + "loss": 0.6865, + "step": 43125 + }, + { + "epoch": 1.11, + "learning_rate": 1.4570351416602074e-06, + "loss": 0.4265, + "step": 43126 + }, + { + "epoch": 1.11, + "learning_rate": 1.4570105300377197e-06, + "loss": 0.6914, + "step": 43127 + }, + { + "epoch": 1.11, + "learning_rate": 1.4569859180653197e-06, + "loss": 0.7485, + "step": 43128 + }, + { + "epoch": 1.11, + "learning_rate": 1.456961305743027e-06, + "loss": 0.6289, + "step": 43129 + }, + { + "epoch": 1.11, + "learning_rate": 1.4569366930708596e-06, + "loss": 0.6514, + "step": 43130 + }, + { + "epoch": 1.11, + "learning_rate": 1.4569120800488373e-06, + "loss": 0.749, + "step": 43131 + }, + { + "epoch": 1.11, + "learning_rate": 1.4568874666769782e-06, + "loss": 0.6318, + "step": 43132 + }, + { + "epoch": 1.11, + "learning_rate": 1.4568628529553012e-06, + "loss": 0.6299, + "step": 43133 + }, + { + "epoch": 1.11, + "learning_rate": 1.4568382388838255e-06, + "loss": 0.6787, + "step": 43134 + }, + { + "epoch": 1.11, + "learning_rate": 1.4568136244625698e-06, + "loss": 0.4829, + "step": 43135 + }, + { + "epoch": 1.11, + "learning_rate": 1.4567890096915529e-06, + "loss": 0.4071, + "step": 43136 + }, + { + "epoch": 1.11, + "learning_rate": 1.4567643945707935e-06, + "loss": 0.7344, + "step": 43137 + }, + { + "epoch": 1.11, + "learning_rate": 1.4567397791003107e-06, + "loss": 0.5967, + "step": 43138 + }, + { + "epoch": 1.11, + "learning_rate": 1.4567151632801233e-06, + "loss": 0.8242, + "step": 43139 + }, + { + "epoch": 1.11, + "learning_rate": 1.4566905471102499e-06, + "loss": 0.6172, + "step": 43140 + }, + { + "epoch": 1.11, + "learning_rate": 1.4566659305907098e-06, + "loss": 0.6445, + "step": 43141 + }, + { + "epoch": 1.11, + "learning_rate": 1.4566413137215215e-06, + "loss": 0.7373, + "step": 43142 + }, + { + "epoch": 1.11, + "learning_rate": 1.4566166965027038e-06, + "loss": 0.7061, + "step": 43143 + }, + { + "epoch": 1.11, + "learning_rate": 1.456592078934276e-06, + "loss": 0.5913, + "step": 43144 + }, + { + "epoch": 1.11, + "learning_rate": 1.4565674610162564e-06, + "loss": 0.4614, + "step": 43145 + }, + { + "epoch": 1.11, + "learning_rate": 1.4565428427486644e-06, + "loss": 0.4019, + "step": 43146 + }, + { + "epoch": 1.11, + "learning_rate": 1.4565182241315182e-06, + "loss": 0.6191, + "step": 43147 + }, + { + "epoch": 1.11, + "learning_rate": 1.4564936051648372e-06, + "loss": 0.6357, + "step": 43148 + }, + { + "epoch": 1.11, + "learning_rate": 1.4564689858486395e-06, + "loss": 0.752, + "step": 43149 + }, + { + "epoch": 1.11, + "learning_rate": 1.456444366182945e-06, + "loss": 0.6299, + "step": 43150 + }, + { + "epoch": 1.11, + "learning_rate": 1.456419746167772e-06, + "loss": 0.6309, + "step": 43151 + }, + { + "epoch": 1.11, + "learning_rate": 1.4563951258031394e-06, + "loss": 0.6836, + "step": 43152 + }, + { + "epoch": 1.11, + "learning_rate": 1.456370505089066e-06, + "loss": 0.7842, + "step": 43153 + }, + { + "epoch": 1.11, + "learning_rate": 1.4563458840255706e-06, + "loss": 0.6138, + "step": 43154 + }, + { + "epoch": 1.11, + "learning_rate": 1.4563212626126723e-06, + "loss": 0.8066, + "step": 43155 + }, + { + "epoch": 1.11, + "learning_rate": 1.4562966408503898e-06, + "loss": 0.8438, + "step": 43156 + }, + { + "epoch": 1.11, + "learning_rate": 1.4562720187387418e-06, + "loss": 0.6641, + "step": 43157 + }, + { + "epoch": 1.11, + "learning_rate": 1.4562473962777473e-06, + "loss": 0.6797, + "step": 43158 + }, + { + "epoch": 1.11, + "learning_rate": 1.456222773467425e-06, + "loss": 0.6504, + "step": 43159 + }, + { + "epoch": 1.11, + "learning_rate": 1.4561981503077942e-06, + "loss": 0.7109, + "step": 43160 + }, + { + "epoch": 1.11, + "learning_rate": 1.4561735267988734e-06, + "loss": 0.561, + "step": 43161 + }, + { + "epoch": 1.11, + "learning_rate": 1.4561489029406814e-06, + "loss": 0.7607, + "step": 43162 + }, + { + "epoch": 1.11, + "learning_rate": 1.4561242787332374e-06, + "loss": 0.5938, + "step": 43163 + }, + { + "epoch": 1.11, + "learning_rate": 1.4560996541765595e-06, + "loss": 0.6777, + "step": 43164 + }, + { + "epoch": 1.11, + "learning_rate": 1.4560750292706673e-06, + "loss": 0.6572, + "step": 43165 + }, + { + "epoch": 1.11, + "learning_rate": 1.4560504040155797e-06, + "loss": 0.5825, + "step": 43166 + }, + { + "epoch": 1.11, + "learning_rate": 1.456025778411315e-06, + "loss": 0.4756, + "step": 43167 + }, + { + "epoch": 1.11, + "learning_rate": 1.4560011524578923e-06, + "loss": 0.8066, + "step": 43168 + }, + { + "epoch": 1.11, + "learning_rate": 1.4559765261553307e-06, + "loss": 0.562, + "step": 43169 + }, + { + "epoch": 1.11, + "learning_rate": 1.4559518995036486e-06, + "loss": 0.5105, + "step": 43170 + }, + { + "epoch": 1.11, + "learning_rate": 1.4559272725028656e-06, + "loss": 0.6265, + "step": 43171 + }, + { + "epoch": 1.11, + "learning_rate": 1.4559026451529994e-06, + "loss": 0.6069, + "step": 43172 + }, + { + "epoch": 1.11, + "learning_rate": 1.45587801745407e-06, + "loss": 0.7051, + "step": 43173 + }, + { + "epoch": 1.11, + "learning_rate": 1.4558533894060955e-06, + "loss": 0.6323, + "step": 43174 + }, + { + "epoch": 1.11, + "learning_rate": 1.455828761009095e-06, + "loss": 0.7422, + "step": 43175 + }, + { + "epoch": 1.11, + "learning_rate": 1.4558041322630874e-06, + "loss": 1.04, + "step": 43176 + }, + { + "epoch": 1.11, + "learning_rate": 1.4557795031680918e-06, + "loss": 0.6719, + "step": 43177 + }, + { + "epoch": 1.11, + "learning_rate": 1.4557548737241263e-06, + "loss": 0.7256, + "step": 43178 + }, + { + "epoch": 1.11, + "learning_rate": 1.4557302439312107e-06, + "loss": 0.6152, + "step": 43179 + }, + { + "epoch": 1.11, + "learning_rate": 1.4557056137893632e-06, + "loss": 0.5073, + "step": 43180 + }, + { + "epoch": 1.11, + "learning_rate": 1.455680983298603e-06, + "loss": 0.4922, + "step": 43181 + }, + { + "epoch": 1.11, + "learning_rate": 1.4556563524589484e-06, + "loss": 0.7432, + "step": 43182 + }, + { + "epoch": 1.11, + "learning_rate": 1.4556317212704191e-06, + "loss": 0.79, + "step": 43183 + }, + { + "epoch": 1.11, + "learning_rate": 1.4556070897330334e-06, + "loss": 0.5591, + "step": 43184 + }, + { + "epoch": 1.11, + "learning_rate": 1.4555824578468103e-06, + "loss": 0.7285, + "step": 43185 + }, + { + "epoch": 1.11, + "learning_rate": 1.4555578256117688e-06, + "loss": 0.7188, + "step": 43186 + }, + { + "epoch": 1.11, + "learning_rate": 1.4555331930279276e-06, + "loss": 0.7285, + "step": 43187 + }, + { + "epoch": 1.11, + "learning_rate": 1.4555085600953054e-06, + "loss": 0.457, + "step": 43188 + }, + { + "epoch": 1.11, + "learning_rate": 1.4554839268139214e-06, + "loss": 0.7666, + "step": 43189 + }, + { + "epoch": 1.11, + "learning_rate": 1.4554592931837942e-06, + "loss": 0.6948, + "step": 43190 + }, + { + "epoch": 1.11, + "learning_rate": 1.455434659204943e-06, + "loss": 0.71, + "step": 43191 + }, + { + "epoch": 1.11, + "learning_rate": 1.4554100248773862e-06, + "loss": 0.6064, + "step": 43192 + }, + { + "epoch": 1.11, + "learning_rate": 1.4553853902011426e-06, + "loss": 0.5933, + "step": 43193 + }, + { + "epoch": 1.11, + "learning_rate": 1.4553607551762319e-06, + "loss": 0.5388, + "step": 43194 + }, + { + "epoch": 1.11, + "learning_rate": 1.4553361198026718e-06, + "loss": 0.5454, + "step": 43195 + }, + { + "epoch": 1.11, + "learning_rate": 1.4553114840804825e-06, + "loss": 0.665, + "step": 43196 + }, + { + "epoch": 1.11, + "learning_rate": 1.4552868480096816e-06, + "loss": 0.7144, + "step": 43197 + }, + { + "epoch": 1.11, + "learning_rate": 1.4552622115902889e-06, + "loss": 0.7695, + "step": 43198 + }, + { + "epoch": 1.11, + "learning_rate": 1.4552375748223224e-06, + "loss": 0.6426, + "step": 43199 + }, + { + "epoch": 1.11, + "learning_rate": 1.4552129377058017e-06, + "loss": 0.54, + "step": 43200 + }, + { + "epoch": 1.11, + "learning_rate": 1.4551883002407454e-06, + "loss": 0.502, + "step": 43201 + }, + { + "epoch": 1.11, + "learning_rate": 1.4551636624271724e-06, + "loss": 0.7178, + "step": 43202 + }, + { + "epoch": 1.11, + "learning_rate": 1.4551390242651011e-06, + "loss": 0.6816, + "step": 43203 + }, + { + "epoch": 1.11, + "learning_rate": 1.4551143857545514e-06, + "loss": 0.7109, + "step": 43204 + }, + { + "epoch": 1.11, + "learning_rate": 1.455089746895541e-06, + "loss": 0.6025, + "step": 43205 + }, + { + "epoch": 1.11, + "learning_rate": 1.4550651076880898e-06, + "loss": 0.7783, + "step": 43206 + }, + { + "epoch": 1.11, + "learning_rate": 1.4550404681322158e-06, + "loss": 0.666, + "step": 43207 + }, + { + "epoch": 1.11, + "learning_rate": 1.4550158282279381e-06, + "loss": 0.749, + "step": 43208 + }, + { + "epoch": 1.11, + "learning_rate": 1.4549911879752758e-06, + "loss": 0.7168, + "step": 43209 + }, + { + "epoch": 1.11, + "learning_rate": 1.454966547374248e-06, + "loss": 0.6919, + "step": 43210 + }, + { + "epoch": 1.11, + "learning_rate": 1.4549419064248732e-06, + "loss": 0.792, + "step": 43211 + }, + { + "epoch": 1.11, + "learning_rate": 1.45491726512717e-06, + "loss": 0.6562, + "step": 43212 + }, + { + "epoch": 1.11, + "learning_rate": 1.4548926234811576e-06, + "loss": 0.7192, + "step": 43213 + }, + { + "epoch": 1.11, + "learning_rate": 1.4548679814868549e-06, + "loss": 0.7275, + "step": 43214 + }, + { + "epoch": 1.11, + "learning_rate": 1.4548433391442806e-06, + "loss": 0.5225, + "step": 43215 + }, + { + "epoch": 1.11, + "learning_rate": 1.4548186964534539e-06, + "loss": 0.5889, + "step": 43216 + }, + { + "epoch": 1.11, + "learning_rate": 1.4547940534143935e-06, + "loss": 0.6982, + "step": 43217 + }, + { + "epoch": 1.11, + "learning_rate": 1.454769410027118e-06, + "loss": 0.7266, + "step": 43218 + }, + { + "epoch": 1.11, + "learning_rate": 1.4547447662916466e-06, + "loss": 0.6357, + "step": 43219 + }, + { + "epoch": 1.11, + "learning_rate": 1.4547201222079976e-06, + "loss": 0.623, + "step": 43220 + }, + { + "epoch": 1.11, + "learning_rate": 1.4546954777761912e-06, + "loss": 0.6309, + "step": 43221 + }, + { + "epoch": 1.11, + "learning_rate": 1.4546708329962445e-06, + "loss": 0.6162, + "step": 43222 + }, + { + "epoch": 1.11, + "learning_rate": 1.4546461878681778e-06, + "loss": 0.5232, + "step": 43223 + }, + { + "epoch": 1.11, + "learning_rate": 1.454621542392009e-06, + "loss": 0.7393, + "step": 43224 + }, + { + "epoch": 1.11, + "learning_rate": 1.4545968965677577e-06, + "loss": 0.593, + "step": 43225 + }, + { + "epoch": 1.11, + "learning_rate": 1.4545722503954426e-06, + "loss": 0.6167, + "step": 43226 + }, + { + "epoch": 1.11, + "learning_rate": 1.4545476038750822e-06, + "loss": 0.7412, + "step": 43227 + }, + { + "epoch": 1.11, + "learning_rate": 1.4545229570066955e-06, + "loss": 0.6689, + "step": 43228 + }, + { + "epoch": 1.11, + "learning_rate": 1.4544983097903013e-06, + "loss": 0.5774, + "step": 43229 + }, + { + "epoch": 1.11, + "learning_rate": 1.4544736622259191e-06, + "loss": 0.6411, + "step": 43230 + }, + { + "epoch": 1.11, + "learning_rate": 1.454449014313567e-06, + "loss": 0.7441, + "step": 43231 + }, + { + "epoch": 1.11, + "learning_rate": 1.4544243660532645e-06, + "loss": 0.5542, + "step": 43232 + }, + { + "epoch": 1.11, + "learning_rate": 1.4543997174450298e-06, + "loss": 0.6768, + "step": 43233 + }, + { + "epoch": 1.11, + "learning_rate": 1.4543750684888822e-06, + "loss": 0.5493, + "step": 43234 + }, + { + "epoch": 1.11, + "learning_rate": 1.4543504191848408e-06, + "loss": 0.7158, + "step": 43235 + }, + { + "epoch": 1.11, + "learning_rate": 1.454325769532924e-06, + "loss": 0.8149, + "step": 43236 + }, + { + "epoch": 1.11, + "learning_rate": 1.4543011195331506e-06, + "loss": 0.7222, + "step": 43237 + }, + { + "epoch": 1.11, + "learning_rate": 1.4542764691855403e-06, + "loss": 0.5701, + "step": 43238 + }, + { + "epoch": 1.11, + "learning_rate": 1.454251818490111e-06, + "loss": 0.7832, + "step": 43239 + }, + { + "epoch": 1.11, + "learning_rate": 1.454227167446882e-06, + "loss": 0.3538, + "step": 43240 + }, + { + "epoch": 1.11, + "learning_rate": 1.4542025160558722e-06, + "loss": 0.6855, + "step": 43241 + }, + { + "epoch": 1.11, + "learning_rate": 1.4541778643171003e-06, + "loss": 0.7676, + "step": 43242 + }, + { + "epoch": 1.11, + "learning_rate": 1.4541532122305853e-06, + "loss": 0.7471, + "step": 43243 + }, + { + "epoch": 1.11, + "learning_rate": 1.4541285597963462e-06, + "loss": 0.7251, + "step": 43244 + }, + { + "epoch": 1.11, + "learning_rate": 1.4541039070144017e-06, + "loss": 0.6606, + "step": 43245 + }, + { + "epoch": 1.11, + "learning_rate": 1.4540792538847708e-06, + "loss": 0.5488, + "step": 43246 + }, + { + "epoch": 1.11, + "learning_rate": 1.454054600407472e-06, + "loss": 0.603, + "step": 43247 + }, + { + "epoch": 1.11, + "learning_rate": 1.4540299465825249e-06, + "loss": 0.623, + "step": 43248 + }, + { + "epoch": 1.11, + "learning_rate": 1.4540052924099475e-06, + "loss": 0.4971, + "step": 43249 + }, + { + "epoch": 1.11, + "learning_rate": 1.4539806378897595e-06, + "loss": 0.8608, + "step": 43250 + }, + { + "epoch": 1.11, + "learning_rate": 1.453955983021979e-06, + "loss": 0.6143, + "step": 43251 + }, + { + "epoch": 1.11, + "learning_rate": 1.4539313278066257e-06, + "loss": 0.6807, + "step": 43252 + }, + { + "epoch": 1.11, + "learning_rate": 1.4539066722437179e-06, + "loss": 0.6846, + "step": 43253 + }, + { + "epoch": 1.11, + "learning_rate": 1.4538820163332746e-06, + "loss": 0.5742, + "step": 43254 + }, + { + "epoch": 1.11, + "learning_rate": 1.4538573600753147e-06, + "loss": 0.6836, + "step": 43255 + }, + { + "epoch": 1.11, + "learning_rate": 1.453832703469857e-06, + "loss": 0.5028, + "step": 43256 + }, + { + "epoch": 1.11, + "learning_rate": 1.4538080465169206e-06, + "loss": 0.3142, + "step": 43257 + }, + { + "epoch": 1.11, + "learning_rate": 1.453783389216524e-06, + "loss": 0.6328, + "step": 43258 + }, + { + "epoch": 1.11, + "learning_rate": 1.4537587315686866e-06, + "loss": 0.5645, + "step": 43259 + }, + { + "epoch": 1.11, + "learning_rate": 1.4537340735734269e-06, + "loss": 0.6602, + "step": 43260 + }, + { + "epoch": 1.11, + "learning_rate": 1.4537094152307643e-06, + "loss": 0.5444, + "step": 43261 + }, + { + "epoch": 1.11, + "learning_rate": 1.4536847565407167e-06, + "loss": 0.7305, + "step": 43262 + }, + { + "epoch": 1.11, + "learning_rate": 1.4536600975033037e-06, + "loss": 0.5551, + "step": 43263 + }, + { + "epoch": 1.11, + "learning_rate": 1.453635438118544e-06, + "loss": 0.8408, + "step": 43264 + }, + { + "epoch": 1.11, + "learning_rate": 1.4536107783864565e-06, + "loss": 0.6982, + "step": 43265 + }, + { + "epoch": 1.11, + "learning_rate": 1.4535861183070604e-06, + "loss": 0.5776, + "step": 43266 + }, + { + "epoch": 1.11, + "learning_rate": 1.4535614578803739e-06, + "loss": 0.7129, + "step": 43267 + }, + { + "epoch": 1.11, + "learning_rate": 1.4535367971064162e-06, + "loss": 0.7339, + "step": 43268 + }, + { + "epoch": 1.11, + "learning_rate": 1.4535121359852065e-06, + "loss": 0.6294, + "step": 43269 + }, + { + "epoch": 1.11, + "learning_rate": 1.4534874745167632e-06, + "loss": 0.5767, + "step": 43270 + }, + { + "epoch": 1.11, + "learning_rate": 1.4534628127011056e-06, + "loss": 0.8213, + "step": 43271 + }, + { + "epoch": 1.11, + "learning_rate": 1.4534381505382522e-06, + "loss": 0.6562, + "step": 43272 + }, + { + "epoch": 1.11, + "learning_rate": 1.4534134880282222e-06, + "loss": 0.7168, + "step": 43273 + }, + { + "epoch": 1.11, + "learning_rate": 1.453388825171034e-06, + "loss": 0.7744, + "step": 43274 + }, + { + "epoch": 1.11, + "learning_rate": 1.453364161966707e-06, + "loss": 0.6836, + "step": 43275 + }, + { + "epoch": 1.11, + "learning_rate": 1.4533394984152603e-06, + "loss": 0.4434, + "step": 43276 + }, + { + "epoch": 1.11, + "learning_rate": 1.4533148345167119e-06, + "loss": 0.5762, + "step": 43277 + }, + { + "epoch": 1.11, + "learning_rate": 1.4532901702710815e-06, + "loss": 0.4429, + "step": 43278 + }, + { + "epoch": 1.11, + "learning_rate": 1.4532655056783877e-06, + "loss": 0.5566, + "step": 43279 + }, + { + "epoch": 1.11, + "learning_rate": 1.4532408407386492e-06, + "loss": 0.6465, + "step": 43280 + }, + { + "epoch": 1.11, + "learning_rate": 1.4532161754518847e-06, + "loss": 0.6465, + "step": 43281 + }, + { + "epoch": 1.11, + "learning_rate": 1.4531915098181137e-06, + "loss": 0.6758, + "step": 43282 + }, + { + "epoch": 1.11, + "learning_rate": 1.4531668438373548e-06, + "loss": 0.4976, + "step": 43283 + }, + { + "epoch": 1.11, + "learning_rate": 1.4531421775096268e-06, + "loss": 0.4596, + "step": 43284 + }, + { + "epoch": 1.11, + "learning_rate": 1.4531175108349489e-06, + "loss": 0.584, + "step": 43285 + }, + { + "epoch": 1.11, + "learning_rate": 1.4530928438133398e-06, + "loss": 0.7754, + "step": 43286 + }, + { + "epoch": 1.11, + "learning_rate": 1.4530681764448177e-06, + "loss": 0.4597, + "step": 43287 + }, + { + "epoch": 1.11, + "learning_rate": 1.453043508729403e-06, + "loss": 0.8428, + "step": 43288 + }, + { + "epoch": 1.11, + "learning_rate": 1.453018840667113e-06, + "loss": 0.6709, + "step": 43289 + }, + { + "epoch": 1.11, + "learning_rate": 1.4529941722579678e-06, + "loss": 0.4946, + "step": 43290 + }, + { + "epoch": 1.11, + "learning_rate": 1.4529695035019855e-06, + "loss": 0.6177, + "step": 43291 + }, + { + "epoch": 1.11, + "learning_rate": 1.4529448343991856e-06, + "loss": 0.5996, + "step": 43292 + }, + { + "epoch": 1.11, + "learning_rate": 1.4529201649495862e-06, + "loss": 0.6147, + "step": 43293 + }, + { + "epoch": 1.11, + "learning_rate": 1.452895495153207e-06, + "loss": 0.5522, + "step": 43294 + }, + { + "epoch": 1.11, + "learning_rate": 1.4528708250100666e-06, + "loss": 0.6899, + "step": 43295 + }, + { + "epoch": 1.11, + "learning_rate": 1.4528461545201833e-06, + "loss": 0.4421, + "step": 43296 + }, + { + "epoch": 1.11, + "learning_rate": 1.4528214836835772e-06, + "loss": 0.6377, + "step": 43297 + }, + { + "epoch": 1.11, + "learning_rate": 1.4527968125002663e-06, + "loss": 0.8203, + "step": 43298 + }, + { + "epoch": 1.11, + "learning_rate": 1.4527721409702693e-06, + "loss": 0.6318, + "step": 43299 + }, + { + "epoch": 1.11, + "learning_rate": 1.4527474690936058e-06, + "loss": 0.6309, + "step": 43300 + }, + { + "epoch": 1.11, + "learning_rate": 1.4527227968702946e-06, + "loss": 0.7427, + "step": 43301 + }, + { + "epoch": 1.11, + "learning_rate": 1.452698124300354e-06, + "loss": 0.6265, + "step": 43302 + }, + { + "epoch": 1.11, + "learning_rate": 1.4526734513838036e-06, + "loss": 0.4612, + "step": 43303 + }, + { + "epoch": 1.11, + "learning_rate": 1.4526487781206615e-06, + "loss": 0.6353, + "step": 43304 + }, + { + "epoch": 1.11, + "learning_rate": 1.4526241045109475e-06, + "loss": 0.8379, + "step": 43305 + }, + { + "epoch": 1.11, + "learning_rate": 1.4525994305546799e-06, + "loss": 0.7275, + "step": 43306 + }, + { + "epoch": 1.11, + "learning_rate": 1.4525747562518777e-06, + "loss": 0.5474, + "step": 43307 + }, + { + "epoch": 1.11, + "learning_rate": 1.4525500816025595e-06, + "loss": 0.7803, + "step": 43308 + }, + { + "epoch": 1.11, + "learning_rate": 1.4525254066067448e-06, + "loss": 0.6309, + "step": 43309 + }, + { + "epoch": 1.11, + "learning_rate": 1.4525007312644524e-06, + "loss": 0.6533, + "step": 43310 + }, + { + "epoch": 1.11, + "learning_rate": 1.452476055575701e-06, + "loss": 0.5112, + "step": 43311 + }, + { + "epoch": 1.11, + "learning_rate": 1.452451379540509e-06, + "loss": 0.834, + "step": 43312 + }, + { + "epoch": 1.11, + "learning_rate": 1.4524267031588962e-06, + "loss": 0.6592, + "step": 43313 + }, + { + "epoch": 1.11, + "learning_rate": 1.4524020264308808e-06, + "loss": 0.7012, + "step": 43314 + }, + { + "epoch": 1.11, + "learning_rate": 1.4523773493564824e-06, + "loss": 0.665, + "step": 43315 + }, + { + "epoch": 1.11, + "learning_rate": 1.452352671935719e-06, + "loss": 0.7871, + "step": 43316 + }, + { + "epoch": 1.11, + "learning_rate": 1.4523279941686103e-06, + "loss": 0.6274, + "step": 43317 + }, + { + "epoch": 1.11, + "learning_rate": 1.4523033160551745e-06, + "loss": 0.6475, + "step": 43318 + }, + { + "epoch": 1.11, + "learning_rate": 1.4522786375954313e-06, + "loss": 0.8066, + "step": 43319 + }, + { + "epoch": 1.11, + "learning_rate": 1.4522539587893986e-06, + "loss": 0.6162, + "step": 43320 + }, + { + "epoch": 1.11, + "learning_rate": 1.4522292796370963e-06, + "loss": 0.4448, + "step": 43321 + }, + { + "epoch": 1.11, + "learning_rate": 1.4522046001385426e-06, + "loss": 0.6885, + "step": 43322 + }, + { + "epoch": 1.11, + "learning_rate": 1.4521799202937566e-06, + "loss": 0.7354, + "step": 43323 + }, + { + "epoch": 1.11, + "learning_rate": 1.4521552401027575e-06, + "loss": 0.6709, + "step": 43324 + }, + { + "epoch": 1.11, + "learning_rate": 1.4521305595655637e-06, + "loss": 0.5547, + "step": 43325 + }, + { + "epoch": 1.11, + "learning_rate": 1.4521058786821944e-06, + "loss": 0.7305, + "step": 43326 + }, + { + "epoch": 1.11, + "learning_rate": 1.4520811974526683e-06, + "loss": 0.6826, + "step": 43327 + }, + { + "epoch": 1.11, + "learning_rate": 1.4520565158770045e-06, + "loss": 0.6152, + "step": 43328 + }, + { + "epoch": 1.11, + "learning_rate": 1.4520318339552217e-06, + "loss": 0.6523, + "step": 43329 + }, + { + "epoch": 1.11, + "learning_rate": 1.4520071516873393e-06, + "loss": 0.9326, + "step": 43330 + }, + { + "epoch": 1.11, + "learning_rate": 1.4519824690733756e-06, + "loss": 0.6494, + "step": 43331 + }, + { + "epoch": 1.11, + "learning_rate": 1.4519577861133495e-06, + "loss": 0.5127, + "step": 43332 + }, + { + "epoch": 1.11, + "learning_rate": 1.45193310280728e-06, + "loss": 0.6572, + "step": 43333 + }, + { + "epoch": 1.11, + "learning_rate": 1.4519084191551866e-06, + "loss": 0.7256, + "step": 43334 + }, + { + "epoch": 1.11, + "learning_rate": 1.4518837351570873e-06, + "loss": 0.8135, + "step": 43335 + }, + { + "epoch": 1.11, + "learning_rate": 1.4518590508130018e-06, + "loss": 0.8115, + "step": 43336 + }, + { + "epoch": 1.11, + "learning_rate": 1.4518343661229483e-06, + "loss": 0.6084, + "step": 43337 + }, + { + "epoch": 1.11, + "learning_rate": 1.4518096810869461e-06, + "loss": 0.8896, + "step": 43338 + }, + { + "epoch": 1.11, + "learning_rate": 1.4517849957050136e-06, + "loss": 0.707, + "step": 43339 + }, + { + "epoch": 1.11, + "learning_rate": 1.4517603099771706e-06, + "loss": 0.7549, + "step": 43340 + }, + { + "epoch": 1.11, + "learning_rate": 1.4517356239034356e-06, + "loss": 0.6204, + "step": 43341 + }, + { + "epoch": 1.11, + "learning_rate": 1.4517109374838273e-06, + "loss": 0.7012, + "step": 43342 + }, + { + "epoch": 1.11, + "learning_rate": 1.4516862507183643e-06, + "loss": 0.6045, + "step": 43343 + }, + { + "epoch": 1.11, + "learning_rate": 1.4516615636070662e-06, + "loss": 0.6577, + "step": 43344 + }, + { + "epoch": 1.11, + "learning_rate": 1.4516368761499517e-06, + "loss": 0.6348, + "step": 43345 + }, + { + "epoch": 1.11, + "learning_rate": 1.4516121883470393e-06, + "loss": 0.48, + "step": 43346 + }, + { + "epoch": 1.11, + "learning_rate": 1.4515875001983484e-06, + "loss": 0.6934, + "step": 43347 + }, + { + "epoch": 1.11, + "learning_rate": 1.4515628117038976e-06, + "loss": 0.5889, + "step": 43348 + }, + { + "epoch": 1.11, + "learning_rate": 1.451538122863706e-06, + "loss": 0.752, + "step": 43349 + }, + { + "epoch": 1.11, + "learning_rate": 1.4515134336777925e-06, + "loss": 0.6475, + "step": 43350 + }, + { + "epoch": 1.11, + "learning_rate": 1.4514887441461761e-06, + "loss": 0.6201, + "step": 43351 + }, + { + "epoch": 1.11, + "learning_rate": 1.4514640542688752e-06, + "loss": 0.6772, + "step": 43352 + }, + { + "epoch": 1.11, + "learning_rate": 1.4514393640459092e-06, + "loss": 0.564, + "step": 43353 + }, + { + "epoch": 1.11, + "learning_rate": 1.4514146734772967e-06, + "loss": 0.4103, + "step": 43354 + }, + { + "epoch": 1.11, + "learning_rate": 1.4513899825630572e-06, + "loss": 0.5125, + "step": 43355 + }, + { + "epoch": 1.11, + "learning_rate": 1.4513652913032085e-06, + "loss": 0.6445, + "step": 43356 + }, + { + "epoch": 1.11, + "learning_rate": 1.4513405996977705e-06, + "loss": 0.5894, + "step": 43357 + }, + { + "epoch": 1.11, + "learning_rate": 1.4513159077467616e-06, + "loss": 0.5415, + "step": 43358 + }, + { + "epoch": 1.11, + "learning_rate": 1.451291215450201e-06, + "loss": 0.6855, + "step": 43359 + }, + { + "epoch": 1.11, + "learning_rate": 1.4512665228081074e-06, + "loss": 0.561, + "step": 43360 + }, + { + "epoch": 1.11, + "learning_rate": 1.4512418298204998e-06, + "loss": 0.7285, + "step": 43361 + }, + { + "epoch": 1.11, + "learning_rate": 1.451217136487397e-06, + "loss": 0.6841, + "step": 43362 + }, + { + "epoch": 1.11, + "learning_rate": 1.4511924428088183e-06, + "loss": 0.6982, + "step": 43363 + }, + { + "epoch": 1.11, + "learning_rate": 1.4511677487847818e-06, + "loss": 0.6279, + "step": 43364 + }, + { + "epoch": 1.11, + "learning_rate": 1.4511430544153071e-06, + "loss": 0.7139, + "step": 43365 + }, + { + "epoch": 1.11, + "learning_rate": 1.451118359700413e-06, + "loss": 0.4182, + "step": 43366 + }, + { + "epoch": 1.11, + "learning_rate": 1.4510936646401181e-06, + "loss": 0.5615, + "step": 43367 + }, + { + "epoch": 1.11, + "learning_rate": 1.4510689692344417e-06, + "loss": 0.6211, + "step": 43368 + }, + { + "epoch": 1.11, + "learning_rate": 1.4510442734834027e-06, + "loss": 0.488, + "step": 43369 + }, + { + "epoch": 1.11, + "learning_rate": 1.4510195773870197e-06, + "loss": 0.6943, + "step": 43370 + }, + { + "epoch": 1.11, + "learning_rate": 1.4509948809453117e-06, + "loss": 0.6865, + "step": 43371 + }, + { + "epoch": 1.11, + "learning_rate": 1.4509701841582978e-06, + "loss": 0.7734, + "step": 43372 + }, + { + "epoch": 1.11, + "learning_rate": 1.4509454870259964e-06, + "loss": 0.5435, + "step": 43373 + }, + { + "epoch": 1.11, + "learning_rate": 1.450920789548427e-06, + "loss": 0.4783, + "step": 43374 + }, + { + "epoch": 1.11, + "learning_rate": 1.4508960917256083e-06, + "loss": 0.7017, + "step": 43375 + }, + { + "epoch": 1.11, + "learning_rate": 1.450871393557559e-06, + "loss": 0.7036, + "step": 43376 + }, + { + "epoch": 1.11, + "learning_rate": 1.4508466950442986e-06, + "loss": 0.668, + "step": 43377 + }, + { + "epoch": 1.11, + "learning_rate": 1.4508219961858455e-06, + "loss": 0.5732, + "step": 43378 + }, + { + "epoch": 1.11, + "learning_rate": 1.4507972969822184e-06, + "loss": 0.665, + "step": 43379 + }, + { + "epoch": 1.11, + "learning_rate": 1.450772597433437e-06, + "loss": 0.8369, + "step": 43380 + }, + { + "epoch": 1.11, + "learning_rate": 1.4507478975395193e-06, + "loss": 0.6123, + "step": 43381 + }, + { + "epoch": 1.11, + "learning_rate": 1.4507231973004853e-06, + "loss": 0.6523, + "step": 43382 + }, + { + "epoch": 1.11, + "learning_rate": 1.4506984967163525e-06, + "loss": 0.5049, + "step": 43383 + }, + { + "epoch": 1.11, + "learning_rate": 1.450673795787141e-06, + "loss": 0.668, + "step": 43384 + }, + { + "epoch": 1.11, + "learning_rate": 1.4506490945128693e-06, + "loss": 0.4988, + "step": 43385 + }, + { + "epoch": 1.11, + "learning_rate": 1.4506243928935561e-06, + "loss": 0.7881, + "step": 43386 + }, + { + "epoch": 1.11, + "learning_rate": 1.4505996909292208e-06, + "loss": 0.5918, + "step": 43387 + }, + { + "epoch": 1.11, + "learning_rate": 1.4505749886198818e-06, + "loss": 0.7256, + "step": 43388 + }, + { + "epoch": 1.11, + "learning_rate": 1.4505502859655584e-06, + "loss": 0.5239, + "step": 43389 + }, + { + "epoch": 1.11, + "learning_rate": 1.4505255829662693e-06, + "loss": 0.4097, + "step": 43390 + }, + { + "epoch": 1.11, + "learning_rate": 1.4505008796220335e-06, + "loss": 0.5283, + "step": 43391 + }, + { + "epoch": 1.11, + "learning_rate": 1.4504761759328698e-06, + "loss": 0.6973, + "step": 43392 + }, + { + "epoch": 1.11, + "learning_rate": 1.4504514718987974e-06, + "loss": 0.7949, + "step": 43393 + }, + { + "epoch": 1.11, + "learning_rate": 1.4504267675198346e-06, + "loss": 0.6406, + "step": 43394 + }, + { + "epoch": 1.11, + "learning_rate": 1.4504020627960013e-06, + "loss": 0.563, + "step": 43395 + }, + { + "epoch": 1.11, + "learning_rate": 1.4503773577273155e-06, + "loss": 0.6934, + "step": 43396 + }, + { + "epoch": 1.11, + "learning_rate": 1.4503526523137968e-06, + "loss": 0.6326, + "step": 43397 + }, + { + "epoch": 1.11, + "learning_rate": 1.4503279465554635e-06, + "loss": 0.5283, + "step": 43398 + }, + { + "epoch": 1.11, + "learning_rate": 1.4503032404523347e-06, + "loss": 0.791, + "step": 43399 + }, + { + "epoch": 1.11, + "learning_rate": 1.4502785340044297e-06, + "loss": 0.6326, + "step": 43400 + }, + { + "epoch": 1.11, + "learning_rate": 1.450253827211767e-06, + "loss": 0.4858, + "step": 43401 + }, + { + "epoch": 1.11, + "learning_rate": 1.4502291200743655e-06, + "loss": 0.7495, + "step": 43402 + }, + { + "epoch": 1.11, + "learning_rate": 1.4502044125922446e-06, + "loss": 0.4309, + "step": 43403 + }, + { + "epoch": 1.11, + "learning_rate": 1.4501797047654223e-06, + "loss": 0.7988, + "step": 43404 + }, + { + "epoch": 1.11, + "learning_rate": 1.4501549965939189e-06, + "loss": 0.645, + "step": 43405 + }, + { + "epoch": 1.11, + "learning_rate": 1.450130288077752e-06, + "loss": 0.4819, + "step": 43406 + }, + { + "epoch": 1.11, + "learning_rate": 1.4501055792169411e-06, + "loss": 0.5322, + "step": 43407 + }, + { + "epoch": 1.11, + "learning_rate": 1.450080870011505e-06, + "loss": 0.5029, + "step": 43408 + }, + { + "epoch": 1.11, + "learning_rate": 1.4500561604614628e-06, + "loss": 0.7432, + "step": 43409 + }, + { + "epoch": 1.11, + "learning_rate": 1.4500314505668332e-06, + "loss": 0.6709, + "step": 43410 + }, + { + "epoch": 1.11, + "learning_rate": 1.4500067403276353e-06, + "loss": 0.5615, + "step": 43411 + }, + { + "epoch": 1.11, + "learning_rate": 1.4499820297438879e-06, + "loss": 0.6313, + "step": 43412 + }, + { + "epoch": 1.11, + "learning_rate": 1.4499573188156098e-06, + "loss": 0.6172, + "step": 43413 + }, + { + "epoch": 1.11, + "learning_rate": 1.44993260754282e-06, + "loss": 0.6216, + "step": 43414 + }, + { + "epoch": 1.11, + "learning_rate": 1.449907895925538e-06, + "loss": 0.6006, + "step": 43415 + }, + { + "epoch": 1.11, + "learning_rate": 1.449883183963782e-06, + "loss": 0.6299, + "step": 43416 + }, + { + "epoch": 1.11, + "learning_rate": 1.449858471657571e-06, + "loss": 0.5493, + "step": 43417 + }, + { + "epoch": 1.11, + "learning_rate": 1.4498337590069241e-06, + "loss": 0.6494, + "step": 43418 + }, + { + "epoch": 1.11, + "learning_rate": 1.4498090460118602e-06, + "loss": 0.835, + "step": 43419 + }, + { + "epoch": 1.11, + "learning_rate": 1.4497843326723983e-06, + "loss": 0.6909, + "step": 43420 + }, + { + "epoch": 1.11, + "learning_rate": 1.449759618988557e-06, + "loss": 0.8105, + "step": 43421 + }, + { + "epoch": 1.11, + "learning_rate": 1.4497349049603556e-06, + "loss": 0.8662, + "step": 43422 + }, + { + "epoch": 1.11, + "learning_rate": 1.4497101905878127e-06, + "loss": 0.7393, + "step": 43423 + }, + { + "epoch": 1.11, + "learning_rate": 1.4496854758709477e-06, + "loss": 0.6147, + "step": 43424 + }, + { + "epoch": 1.11, + "learning_rate": 1.4496607608097788e-06, + "loss": 0.4421, + "step": 43425 + }, + { + "epoch": 1.11, + "learning_rate": 1.4496360454043255e-06, + "loss": 0.6807, + "step": 43426 + }, + { + "epoch": 1.11, + "learning_rate": 1.4496113296546067e-06, + "loss": 0.6689, + "step": 43427 + }, + { + "epoch": 1.11, + "learning_rate": 1.4495866135606408e-06, + "loss": 0.7148, + "step": 43428 + }, + { + "epoch": 1.11, + "learning_rate": 1.4495618971224475e-06, + "loss": 0.6709, + "step": 43429 + }, + { + "epoch": 1.11, + "learning_rate": 1.4495371803400452e-06, + "loss": 0.5698, + "step": 43430 + }, + { + "epoch": 1.11, + "learning_rate": 1.449512463213453e-06, + "loss": 0.5945, + "step": 43431 + }, + { + "epoch": 1.11, + "learning_rate": 1.4494877457426897e-06, + "loss": 0.4497, + "step": 43432 + }, + { + "epoch": 1.11, + "learning_rate": 1.4494630279277741e-06, + "loss": 0.6753, + "step": 43433 + }, + { + "epoch": 1.11, + "learning_rate": 1.4494383097687258e-06, + "loss": 0.7441, + "step": 43434 + }, + { + "epoch": 1.11, + "learning_rate": 1.449413591265563e-06, + "loss": 0.8945, + "step": 43435 + }, + { + "epoch": 1.11, + "learning_rate": 1.4493888724183046e-06, + "loss": 0.6406, + "step": 43436 + }, + { + "epoch": 1.11, + "learning_rate": 1.4493641532269702e-06, + "loss": 0.7051, + "step": 43437 + }, + { + "epoch": 1.11, + "learning_rate": 1.449339433691578e-06, + "loss": 0.6104, + "step": 43438 + }, + { + "epoch": 1.11, + "learning_rate": 1.4493147138121476e-06, + "loss": 0.5122, + "step": 43439 + }, + { + "epoch": 1.11, + "learning_rate": 1.4492899935886975e-06, + "loss": 0.4868, + "step": 43440 + }, + { + "epoch": 1.11, + "learning_rate": 1.4492652730212467e-06, + "loss": 0.626, + "step": 43441 + }, + { + "epoch": 1.11, + "learning_rate": 1.449240552109814e-06, + "loss": 0.5557, + "step": 43442 + }, + { + "epoch": 1.11, + "learning_rate": 1.4492158308544187e-06, + "loss": 0.6353, + "step": 43443 + }, + { + "epoch": 1.11, + "learning_rate": 1.449191109255079e-06, + "loss": 0.6633, + "step": 43444 + }, + { + "epoch": 1.11, + "learning_rate": 1.449166387311815e-06, + "loss": 0.5557, + "step": 43445 + }, + { + "epoch": 1.11, + "learning_rate": 1.4491416650246447e-06, + "loss": 0.4902, + "step": 43446 + }, + { + "epoch": 1.11, + "learning_rate": 1.4491169423935873e-06, + "loss": 0.6797, + "step": 43447 + }, + { + "epoch": 1.11, + "learning_rate": 1.4490922194186611e-06, + "loss": 0.7559, + "step": 43448 + }, + { + "epoch": 1.11, + "learning_rate": 1.4490674960998864e-06, + "loss": 0.6323, + "step": 43449 + }, + { + "epoch": 1.11, + "learning_rate": 1.4490427724372811e-06, + "loss": 0.6729, + "step": 43450 + }, + { + "epoch": 1.11, + "learning_rate": 1.4490180484308645e-06, + "loss": 0.7188, + "step": 43451 + }, + { + "epoch": 1.11, + "learning_rate": 1.4489933240806553e-06, + "loss": 0.6616, + "step": 43452 + }, + { + "epoch": 1.11, + "learning_rate": 1.4489685993866728e-06, + "loss": 0.6445, + "step": 43453 + }, + { + "epoch": 1.11, + "learning_rate": 1.4489438743489354e-06, + "loss": 0.6865, + "step": 43454 + }, + { + "epoch": 1.11, + "learning_rate": 1.4489191489674624e-06, + "loss": 0.6572, + "step": 43455 + }, + { + "epoch": 1.11, + "learning_rate": 1.4488944232422726e-06, + "loss": 0.3762, + "step": 43456 + }, + { + "epoch": 1.11, + "learning_rate": 1.448869697173385e-06, + "loss": 0.7476, + "step": 43457 + }, + { + "epoch": 1.11, + "learning_rate": 1.4488449707608186e-06, + "loss": 0.7705, + "step": 43458 + }, + { + "epoch": 1.11, + "learning_rate": 1.448820244004592e-06, + "loss": 0.7217, + "step": 43459 + }, + { + "epoch": 1.11, + "learning_rate": 1.4487955169047248e-06, + "loss": 0.7734, + "step": 43460 + }, + { + "epoch": 1.11, + "learning_rate": 1.448770789461235e-06, + "loss": 0.644, + "step": 43461 + }, + { + "epoch": 1.11, + "learning_rate": 1.4487460616741424e-06, + "loss": 0.542, + "step": 43462 + }, + { + "epoch": 1.11, + "learning_rate": 1.4487213335434654e-06, + "loss": 0.6729, + "step": 43463 + }, + { + "epoch": 1.11, + "learning_rate": 1.4486966050692234e-06, + "loss": 0.6228, + "step": 43464 + }, + { + "epoch": 1.11, + "learning_rate": 1.4486718762514348e-06, + "loss": 0.75, + "step": 43465 + }, + { + "epoch": 1.11, + "learning_rate": 1.448647147090119e-06, + "loss": 0.5933, + "step": 43466 + }, + { + "epoch": 1.11, + "learning_rate": 1.4486224175852941e-06, + "loss": 0.7422, + "step": 43467 + }, + { + "epoch": 1.11, + "learning_rate": 1.4485976877369802e-06, + "loss": 0.7227, + "step": 43468 + }, + { + "epoch": 1.11, + "learning_rate": 1.4485729575451955e-06, + "loss": 0.562, + "step": 43469 + }, + { + "epoch": 1.11, + "learning_rate": 1.4485482270099593e-06, + "loss": 0.7861, + "step": 43470 + }, + { + "epoch": 1.11, + "learning_rate": 1.4485234961312902e-06, + "loss": 0.7056, + "step": 43471 + }, + { + "epoch": 1.11, + "learning_rate": 1.4484987649092072e-06, + "loss": 0.561, + "step": 43472 + }, + { + "epoch": 1.11, + "learning_rate": 1.4484740333437295e-06, + "loss": 0.7715, + "step": 43473 + }, + { + "epoch": 1.11, + "learning_rate": 1.4484493014348758e-06, + "loss": 0.6997, + "step": 43474 + }, + { + "epoch": 1.11, + "learning_rate": 1.448424569182665e-06, + "loss": 0.5601, + "step": 43475 + }, + { + "epoch": 1.11, + "learning_rate": 1.4483998365871162e-06, + "loss": 0.6611, + "step": 43476 + }, + { + "epoch": 1.11, + "learning_rate": 1.448375103648248e-06, + "loss": 0.7051, + "step": 43477 + }, + { + "epoch": 1.11, + "learning_rate": 1.44835037036608e-06, + "loss": 0.6997, + "step": 43478 + }, + { + "epoch": 1.11, + "learning_rate": 1.4483256367406304e-06, + "loss": 0.6504, + "step": 43479 + }, + { + "epoch": 1.11, + "learning_rate": 1.4483009027719188e-06, + "loss": 0.605, + "step": 43480 + }, + { + "epoch": 1.11, + "learning_rate": 1.4482761684599638e-06, + "loss": 0.668, + "step": 43481 + }, + { + "epoch": 1.11, + "learning_rate": 1.448251433804784e-06, + "loss": 0.5635, + "step": 43482 + }, + { + "epoch": 1.11, + "learning_rate": 1.448226698806399e-06, + "loss": 0.7461, + "step": 43483 + }, + { + "epoch": 1.11, + "learning_rate": 1.4482019634648273e-06, + "loss": 0.5959, + "step": 43484 + }, + { + "epoch": 1.11, + "learning_rate": 1.4481772277800882e-06, + "loss": 0.75, + "step": 43485 + }, + { + "epoch": 1.11, + "learning_rate": 1.4481524917522e-06, + "loss": 0.624, + "step": 43486 + }, + { + "epoch": 1.11, + "learning_rate": 1.4481277553811823e-06, + "loss": 0.5664, + "step": 43487 + }, + { + "epoch": 1.11, + "learning_rate": 1.4481030186670536e-06, + "loss": 0.6787, + "step": 43488 + }, + { + "epoch": 1.11, + "learning_rate": 1.448078281609833e-06, + "loss": 0.6401, + "step": 43489 + }, + { + "epoch": 1.11, + "learning_rate": 1.4480535442095398e-06, + "loss": 0.458, + "step": 43490 + }, + { + "epoch": 1.11, + "learning_rate": 1.4480288064661926e-06, + "loss": 0.4121, + "step": 43491 + }, + { + "epoch": 1.11, + "learning_rate": 1.44800406837981e-06, + "loss": 0.5654, + "step": 43492 + }, + { + "epoch": 1.11, + "learning_rate": 1.4479793299504114e-06, + "loss": 0.6475, + "step": 43493 + }, + { + "epoch": 1.11, + "learning_rate": 1.4479545911780155e-06, + "loss": 0.6006, + "step": 43494 + }, + { + "epoch": 1.11, + "learning_rate": 1.447929852062642e-06, + "loss": 0.7861, + "step": 43495 + }, + { + "epoch": 1.11, + "learning_rate": 1.4479051126043085e-06, + "loss": 0.6982, + "step": 43496 + }, + { + "epoch": 1.11, + "learning_rate": 1.4478803728030352e-06, + "loss": 0.6494, + "step": 43497 + }, + { + "epoch": 1.11, + "learning_rate": 1.4478556326588397e-06, + "loss": 0.7617, + "step": 43498 + }, + { + "epoch": 1.11, + "learning_rate": 1.4478308921717425e-06, + "loss": 0.4883, + "step": 43499 + }, + { + "epoch": 1.11, + "learning_rate": 1.4478061513417614e-06, + "loss": 0.6582, + "step": 43500 + }, + { + "epoch": 1.11, + "learning_rate": 1.4477814101689156e-06, + "loss": 0.5845, + "step": 43501 + }, + { + "epoch": 1.11, + "learning_rate": 1.4477566686532245e-06, + "loss": 0.563, + "step": 43502 + }, + { + "epoch": 1.12, + "learning_rate": 1.4477319267947065e-06, + "loss": 0.6445, + "step": 43503 + }, + { + "epoch": 1.12, + "learning_rate": 1.447707184593381e-06, + "loss": 0.5485, + "step": 43504 + }, + { + "epoch": 1.12, + "learning_rate": 1.4476824420492666e-06, + "loss": 0.4941, + "step": 43505 + }, + { + "epoch": 1.12, + "learning_rate": 1.4476576991623822e-06, + "loss": 0.6069, + "step": 43506 + }, + { + "epoch": 1.12, + "learning_rate": 1.4476329559327469e-06, + "loss": 0.6885, + "step": 43507 + }, + { + "epoch": 1.12, + "learning_rate": 1.4476082123603798e-06, + "loss": 0.5491, + "step": 43508 + }, + { + "epoch": 1.12, + "learning_rate": 1.4475834684452995e-06, + "loss": 0.7739, + "step": 43509 + }, + { + "epoch": 1.12, + "learning_rate": 1.4475587241875254e-06, + "loss": 0.5957, + "step": 43510 + }, + { + "epoch": 1.12, + "learning_rate": 1.4475339795870758e-06, + "loss": 0.6938, + "step": 43511 + }, + { + "epoch": 1.12, + "learning_rate": 1.44750923464397e-06, + "loss": 0.5322, + "step": 43512 + }, + { + "epoch": 1.12, + "learning_rate": 1.4474844893582272e-06, + "loss": 0.4863, + "step": 43513 + }, + { + "epoch": 1.12, + "learning_rate": 1.447459743729866e-06, + "loss": 0.7295, + "step": 43514 + }, + { + "epoch": 1.12, + "learning_rate": 1.4474349977589056e-06, + "loss": 0.7695, + "step": 43515 + }, + { + "epoch": 1.12, + "learning_rate": 1.4474102514453645e-06, + "loss": 0.6938, + "step": 43516 + }, + { + "epoch": 1.12, + "learning_rate": 1.447385504789262e-06, + "loss": 0.7627, + "step": 43517 + }, + { + "epoch": 1.12, + "learning_rate": 1.4473607577906173e-06, + "loss": 0.6431, + "step": 43518 + }, + { + "epoch": 1.12, + "learning_rate": 1.4473360104494487e-06, + "loss": 0.6543, + "step": 43519 + }, + { + "epoch": 1.12, + "learning_rate": 1.4473112627657757e-06, + "loss": 0.6904, + "step": 43520 + }, + { + "epoch": 1.12, + "learning_rate": 1.447286514739617e-06, + "loss": 0.6924, + "step": 43521 + }, + { + "epoch": 1.12, + "learning_rate": 1.4472617663709916e-06, + "loss": 0.3418, + "step": 43522 + }, + { + "epoch": 1.12, + "learning_rate": 1.4472370176599183e-06, + "loss": 0.6885, + "step": 43523 + }, + { + "epoch": 1.12, + "learning_rate": 1.447212268606416e-06, + "loss": 0.5415, + "step": 43524 + }, + { + "epoch": 1.12, + "learning_rate": 1.4471875192105042e-06, + "loss": 0.5796, + "step": 43525 + }, + { + "epoch": 1.12, + "learning_rate": 1.4471627694722012e-06, + "loss": 0.6655, + "step": 43526 + }, + { + "epoch": 1.12, + "learning_rate": 1.4471380193915266e-06, + "loss": 0.7383, + "step": 43527 + }, + { + "epoch": 1.12, + "learning_rate": 1.4471132689684987e-06, + "loss": 0.6279, + "step": 43528 + }, + { + "epoch": 1.12, + "learning_rate": 1.4470885182031367e-06, + "loss": 0.6021, + "step": 43529 + }, + { + "epoch": 1.12, + "learning_rate": 1.4470637670954598e-06, + "loss": 0.5139, + "step": 43530 + }, + { + "epoch": 1.12, + "learning_rate": 1.4470390156454866e-06, + "loss": 0.6504, + "step": 43531 + }, + { + "epoch": 1.12, + "learning_rate": 1.447014263853236e-06, + "loss": 0.5454, + "step": 43532 + }, + { + "epoch": 1.12, + "learning_rate": 1.4469895117187274e-06, + "loss": 0.8311, + "step": 43533 + }, + { + "epoch": 1.12, + "learning_rate": 1.4469647592419794e-06, + "loss": 0.707, + "step": 43534 + }, + { + "epoch": 1.12, + "learning_rate": 1.4469400064230111e-06, + "loss": 0.7612, + "step": 43535 + }, + { + "epoch": 1.12, + "learning_rate": 1.4469152532618414e-06, + "loss": 0.7559, + "step": 43536 + }, + { + "epoch": 1.12, + "learning_rate": 1.446890499758489e-06, + "loss": 0.6147, + "step": 43537 + }, + { + "epoch": 1.12, + "learning_rate": 1.4468657459129732e-06, + "loss": 0.6543, + "step": 43538 + }, + { + "epoch": 1.12, + "learning_rate": 1.4468409917253128e-06, + "loss": 0.5835, + "step": 43539 + }, + { + "epoch": 1.12, + "learning_rate": 1.446816237195527e-06, + "loss": 0.7617, + "step": 43540 + }, + { + "epoch": 1.12, + "learning_rate": 1.4467914823236346e-06, + "loss": 0.7295, + "step": 43541 + }, + { + "epoch": 1.12, + "learning_rate": 1.446766727109654e-06, + "loss": 0.5854, + "step": 43542 + }, + { + "epoch": 1.12, + "learning_rate": 1.4467419715536054e-06, + "loss": 0.5977, + "step": 43543 + }, + { + "epoch": 1.12, + "learning_rate": 1.4467172156555062e-06, + "loss": 0.322, + "step": 43544 + }, + { + "epoch": 1.12, + "learning_rate": 1.4466924594153768e-06, + "loss": 0.7471, + "step": 43545 + }, + { + "epoch": 1.12, + "learning_rate": 1.4466677028332354e-06, + "loss": 0.8486, + "step": 43546 + }, + { + "epoch": 1.12, + "learning_rate": 1.446642945909101e-06, + "loss": 0.7031, + "step": 43547 + }, + { + "epoch": 1.12, + "learning_rate": 1.4466181886429926e-06, + "loss": 0.7334, + "step": 43548 + }, + { + "epoch": 1.12, + "learning_rate": 1.446593431034929e-06, + "loss": 0.6621, + "step": 43549 + }, + { + "epoch": 1.12, + "learning_rate": 1.4465686730849301e-06, + "loss": 0.749, + "step": 43550 + }, + { + "epoch": 1.12, + "learning_rate": 1.446543914793013e-06, + "loss": 0.625, + "step": 43551 + }, + { + "epoch": 1.12, + "learning_rate": 1.4465191561591986e-06, + "loss": 0.5874, + "step": 43552 + }, + { + "epoch": 1.12, + "learning_rate": 1.4464943971835045e-06, + "loss": 0.488, + "step": 43553 + }, + { + "epoch": 1.12, + "learning_rate": 1.4464696378659507e-06, + "loss": 0.7305, + "step": 43554 + }, + { + "epoch": 1.12, + "learning_rate": 1.4464448782065553e-06, + "loss": 0.667, + "step": 43555 + }, + { + "epoch": 1.12, + "learning_rate": 1.4464201182053377e-06, + "loss": 0.7646, + "step": 43556 + }, + { + "epoch": 1.12, + "learning_rate": 1.4463953578623164e-06, + "loss": 0.5659, + "step": 43557 + }, + { + "epoch": 1.12, + "learning_rate": 1.446370597177511e-06, + "loss": 0.583, + "step": 43558 + }, + { + "epoch": 1.12, + "learning_rate": 1.44634583615094e-06, + "loss": 0.583, + "step": 43559 + }, + { + "epoch": 1.12, + "learning_rate": 1.446321074782623e-06, + "loss": 0.707, + "step": 43560 + }, + { + "epoch": 1.12, + "learning_rate": 1.4462963130725781e-06, + "loss": 0.6138, + "step": 43561 + }, + { + "epoch": 1.12, + "learning_rate": 1.4462715510208246e-06, + "loss": 0.6196, + "step": 43562 + }, + { + "epoch": 1.12, + "learning_rate": 1.4462467886273815e-06, + "loss": 0.6191, + "step": 43563 + }, + { + "epoch": 1.12, + "learning_rate": 1.4462220258922677e-06, + "loss": 0.5869, + "step": 43564 + }, + { + "epoch": 1.12, + "learning_rate": 1.4461972628155024e-06, + "loss": 0.5791, + "step": 43565 + }, + { + "epoch": 1.12, + "learning_rate": 1.446172499397104e-06, + "loss": 0.5874, + "step": 43566 + }, + { + "epoch": 1.12, + "learning_rate": 1.4461477356370923e-06, + "loss": 0.6841, + "step": 43567 + }, + { + "epoch": 1.12, + "learning_rate": 1.4461229715354858e-06, + "loss": 0.834, + "step": 43568 + }, + { + "epoch": 1.12, + "learning_rate": 1.4460982070923028e-06, + "loss": 0.6001, + "step": 43569 + }, + { + "epoch": 1.12, + "learning_rate": 1.4460734423075636e-06, + "loss": 0.6128, + "step": 43570 + }, + { + "epoch": 1.12, + "learning_rate": 1.4460486771812863e-06, + "loss": 0.748, + "step": 43571 + }, + { + "epoch": 1.12, + "learning_rate": 1.4460239117134898e-06, + "loss": 0.7891, + "step": 43572 + }, + { + "epoch": 1.12, + "learning_rate": 1.4459991459041937e-06, + "loss": 0.8091, + "step": 43573 + }, + { + "epoch": 1.12, + "learning_rate": 1.4459743797534162e-06, + "loss": 0.5488, + "step": 43574 + }, + { + "epoch": 1.12, + "learning_rate": 1.445949613261177e-06, + "loss": 0.5884, + "step": 43575 + }, + { + "epoch": 1.12, + "learning_rate": 1.4459248464274943e-06, + "loss": 0.7002, + "step": 43576 + }, + { + "epoch": 1.12, + "learning_rate": 1.4459000792523876e-06, + "loss": 0.709, + "step": 43577 + }, + { + "epoch": 1.12, + "learning_rate": 1.4458753117358757e-06, + "loss": 0.5532, + "step": 43578 + }, + { + "epoch": 1.12, + "learning_rate": 1.4458505438779779e-06, + "loss": 0.8389, + "step": 43579 + }, + { + "epoch": 1.12, + "learning_rate": 1.4458257756787125e-06, + "loss": 0.6206, + "step": 43580 + }, + { + "epoch": 1.12, + "learning_rate": 1.445801007138099e-06, + "loss": 0.7861, + "step": 43581 + }, + { + "epoch": 1.12, + "learning_rate": 1.4457762382561557e-06, + "loss": 0.7812, + "step": 43582 + }, + { + "epoch": 1.12, + "learning_rate": 1.4457514690329022e-06, + "loss": 0.5543, + "step": 43583 + }, + { + "epoch": 1.12, + "learning_rate": 1.4457266994683575e-06, + "loss": 0.6426, + "step": 43584 + }, + { + "epoch": 1.12, + "learning_rate": 1.4457019295625403e-06, + "loss": 0.5845, + "step": 43585 + }, + { + "epoch": 1.12, + "learning_rate": 1.4456771593154696e-06, + "loss": 0.7422, + "step": 43586 + }, + { + "epoch": 1.12, + "learning_rate": 1.4456523887271645e-06, + "loss": 0.748, + "step": 43587 + }, + { + "epoch": 1.12, + "learning_rate": 1.4456276177976436e-06, + "loss": 0.6665, + "step": 43588 + }, + { + "epoch": 1.12, + "learning_rate": 1.4456028465269264e-06, + "loss": 0.5874, + "step": 43589 + }, + { + "epoch": 1.12, + "learning_rate": 1.4455780749150315e-06, + "loss": 0.6079, + "step": 43590 + }, + { + "epoch": 1.12, + "learning_rate": 1.445553302961978e-06, + "loss": 0.8584, + "step": 43591 + }, + { + "epoch": 1.12, + "learning_rate": 1.4455285306677846e-06, + "loss": 0.6221, + "step": 43592 + }, + { + "epoch": 1.12, + "learning_rate": 1.4455037580324704e-06, + "loss": 0.7627, + "step": 43593 + }, + { + "epoch": 1.12, + "learning_rate": 1.4454789850560552e-06, + "loss": 0.5264, + "step": 43594 + }, + { + "epoch": 1.12, + "learning_rate": 1.4454542117385566e-06, + "loss": 0.6729, + "step": 43595 + }, + { + "epoch": 1.12, + "learning_rate": 1.4454294380799942e-06, + "loss": 0.7354, + "step": 43596 + }, + { + "epoch": 1.12, + "learning_rate": 1.445404664080387e-06, + "loss": 0.6333, + "step": 43597 + }, + { + "epoch": 1.12, + "learning_rate": 1.4453798897397543e-06, + "loss": 0.6953, + "step": 43598 + }, + { + "epoch": 1.12, + "learning_rate": 1.4453551150581142e-06, + "loss": 0.667, + "step": 43599 + }, + { + "epoch": 1.12, + "learning_rate": 1.4453303400354866e-06, + "loss": 0.6602, + "step": 43600 + }, + { + "epoch": 1.12, + "learning_rate": 1.4453055646718896e-06, + "loss": 0.6611, + "step": 43601 + }, + { + "epoch": 1.12, + "learning_rate": 1.445280788967343e-06, + "loss": 0.7578, + "step": 43602 + }, + { + "epoch": 1.12, + "learning_rate": 1.445256012921865e-06, + "loss": 0.7109, + "step": 43603 + }, + { + "epoch": 1.12, + "learning_rate": 1.4452312365354753e-06, + "loss": 0.6436, + "step": 43604 + }, + { + "epoch": 1.12, + "learning_rate": 1.4452064598081924e-06, + "loss": 0.7241, + "step": 43605 + }, + { + "epoch": 1.12, + "learning_rate": 1.4451816827400353e-06, + "loss": 0.6631, + "step": 43606 + }, + { + "epoch": 1.12, + "learning_rate": 1.445156905331023e-06, + "loss": 0.6797, + "step": 43607 + }, + { + "epoch": 1.12, + "learning_rate": 1.4451321275811748e-06, + "loss": 0.6963, + "step": 43608 + }, + { + "epoch": 1.12, + "learning_rate": 1.445107349490509e-06, + "loss": 0.687, + "step": 43609 + }, + { + "epoch": 1.12, + "learning_rate": 1.4450825710590453e-06, + "loss": 0.5273, + "step": 43610 + }, + { + "epoch": 1.12, + "learning_rate": 1.4450577922868021e-06, + "loss": 0.5474, + "step": 43611 + }, + { + "epoch": 1.12, + "learning_rate": 1.4450330131737988e-06, + "loss": 0.5068, + "step": 43612 + }, + { + "epoch": 1.12, + "learning_rate": 1.445008233720054e-06, + "loss": 0.6182, + "step": 43613 + }, + { + "epoch": 1.12, + "learning_rate": 1.4449834539255871e-06, + "loss": 0.5635, + "step": 43614 + }, + { + "epoch": 1.12, + "learning_rate": 1.4449586737904169e-06, + "loss": 0.626, + "step": 43615 + }, + { + "epoch": 1.12, + "learning_rate": 1.444933893314562e-06, + "loss": 0.4861, + "step": 43616 + }, + { + "epoch": 1.12, + "learning_rate": 1.4449091124980418e-06, + "loss": 0.7656, + "step": 43617 + }, + { + "epoch": 1.12, + "learning_rate": 1.444884331340875e-06, + "loss": 0.5908, + "step": 43618 + }, + { + "epoch": 1.12, + "learning_rate": 1.4448595498430812e-06, + "loss": 0.6099, + "step": 43619 + }, + { + "epoch": 1.12, + "learning_rate": 1.4448347680046784e-06, + "loss": 0.6367, + "step": 43620 + }, + { + "epoch": 1.12, + "learning_rate": 1.444809985825686e-06, + "loss": 0.5488, + "step": 43621 + }, + { + "epoch": 1.12, + "learning_rate": 1.4447852033061233e-06, + "loss": 0.6436, + "step": 43622 + }, + { + "epoch": 1.12, + "learning_rate": 1.4447604204460091e-06, + "loss": 0.6992, + "step": 43623 + }, + { + "epoch": 1.12, + "learning_rate": 1.4447356372453623e-06, + "loss": 0.5459, + "step": 43624 + }, + { + "epoch": 1.12, + "learning_rate": 1.4447108537042018e-06, + "loss": 0.6772, + "step": 43625 + }, + { + "epoch": 1.12, + "learning_rate": 1.4446860698225466e-06, + "loss": 0.6729, + "step": 43626 + }, + { + "epoch": 1.12, + "learning_rate": 1.4446612856004157e-06, + "loss": 0.7012, + "step": 43627 + }, + { + "epoch": 1.12, + "learning_rate": 1.4446365010378281e-06, + "loss": 0.6191, + "step": 43628 + }, + { + "epoch": 1.12, + "learning_rate": 1.4446117161348028e-06, + "loss": 0.6436, + "step": 43629 + }, + { + "epoch": 1.12, + "learning_rate": 1.4445869308913587e-06, + "loss": 0.6172, + "step": 43630 + }, + { + "epoch": 1.12, + "learning_rate": 1.4445621453075152e-06, + "loss": 0.6279, + "step": 43631 + }, + { + "epoch": 1.12, + "learning_rate": 1.4445373593832904e-06, + "loss": 0.6289, + "step": 43632 + }, + { + "epoch": 1.12, + "learning_rate": 1.444512573118704e-06, + "loss": 0.6499, + "step": 43633 + }, + { + "epoch": 1.12, + "learning_rate": 1.444487786513775e-06, + "loss": 0.668, + "step": 43634 + }, + { + "epoch": 1.12, + "learning_rate": 1.4444629995685216e-06, + "loss": 0.4231, + "step": 43635 + }, + { + "epoch": 1.12, + "learning_rate": 1.4444382122829636e-06, + "loss": 0.4988, + "step": 43636 + }, + { + "epoch": 1.12, + "learning_rate": 1.4444134246571196e-06, + "loss": 0.6426, + "step": 43637 + }, + { + "epoch": 1.12, + "learning_rate": 1.444388636691009e-06, + "loss": 0.6006, + "step": 43638 + }, + { + "epoch": 1.12, + "learning_rate": 1.4443638483846504e-06, + "loss": 0.7773, + "step": 43639 + }, + { + "epoch": 1.12, + "learning_rate": 1.4443390597380628e-06, + "loss": 0.5815, + "step": 43640 + }, + { + "epoch": 1.12, + "learning_rate": 1.4443142707512648e-06, + "loss": 0.5688, + "step": 43641 + }, + { + "epoch": 1.12, + "learning_rate": 1.444289481424276e-06, + "loss": 0.7065, + "step": 43642 + }, + { + "epoch": 1.12, + "learning_rate": 1.4442646917571153e-06, + "loss": 0.499, + "step": 43643 + }, + { + "epoch": 1.12, + "learning_rate": 1.4442399017498017e-06, + "loss": 0.8125, + "step": 43644 + }, + { + "epoch": 1.12, + "learning_rate": 1.4442151114023537e-06, + "loss": 0.6455, + "step": 43645 + }, + { + "epoch": 1.12, + "learning_rate": 1.4441903207147907e-06, + "loss": 0.5664, + "step": 43646 + }, + { + "epoch": 1.12, + "learning_rate": 1.4441655296871316e-06, + "loss": 0.6084, + "step": 43647 + }, + { + "epoch": 1.12, + "learning_rate": 1.4441407383193956e-06, + "loss": 0.5842, + "step": 43648 + }, + { + "epoch": 1.12, + "learning_rate": 1.4441159466116013e-06, + "loss": 0.3658, + "step": 43649 + }, + { + "epoch": 1.12, + "learning_rate": 1.4440911545637677e-06, + "loss": 0.2881, + "step": 43650 + }, + { + "epoch": 1.12, + "learning_rate": 1.4440663621759142e-06, + "loss": 0.5967, + "step": 43651 + }, + { + "epoch": 1.12, + "learning_rate": 1.4440415694480592e-06, + "loss": 0.5098, + "step": 43652 + }, + { + "epoch": 1.12, + "learning_rate": 1.4440167763802222e-06, + "loss": 0.6729, + "step": 43653 + }, + { + "epoch": 1.12, + "learning_rate": 1.4439919829724218e-06, + "loss": 0.5118, + "step": 43654 + }, + { + "epoch": 1.12, + "learning_rate": 1.4439671892246773e-06, + "loss": 0.4617, + "step": 43655 + }, + { + "epoch": 1.12, + "learning_rate": 1.4439423951370076e-06, + "loss": 0.7739, + "step": 43656 + }, + { + "epoch": 1.12, + "learning_rate": 1.4439176007094313e-06, + "loss": 0.7188, + "step": 43657 + }, + { + "epoch": 1.12, + "learning_rate": 1.443892805941968e-06, + "loss": 0.4492, + "step": 43658 + }, + { + "epoch": 1.12, + "learning_rate": 1.4438680108346367e-06, + "loss": 0.6173, + "step": 43659 + }, + { + "epoch": 1.12, + "learning_rate": 1.4438432153874553e-06, + "loss": 0.5, + "step": 43660 + }, + { + "epoch": 1.12, + "learning_rate": 1.4438184196004441e-06, + "loss": 0.5708, + "step": 43661 + }, + { + "epoch": 1.12, + "learning_rate": 1.4437936234736213e-06, + "loss": 0.7227, + "step": 43662 + }, + { + "epoch": 1.12, + "learning_rate": 1.4437688270070064e-06, + "loss": 0.8242, + "step": 43663 + }, + { + "epoch": 1.12, + "learning_rate": 1.443744030200618e-06, + "loss": 0.7451, + "step": 43664 + }, + { + "epoch": 1.12, + "learning_rate": 1.443719233054475e-06, + "loss": 0.79, + "step": 43665 + }, + { + "epoch": 1.12, + "learning_rate": 1.4436944355685968e-06, + "loss": 0.5947, + "step": 43666 + }, + { + "epoch": 1.12, + "learning_rate": 1.443669637743002e-06, + "loss": 0.5615, + "step": 43667 + }, + { + "epoch": 1.12, + "learning_rate": 1.4436448395777099e-06, + "loss": 0.7441, + "step": 43668 + }, + { + "epoch": 1.12, + "learning_rate": 1.4436200410727396e-06, + "loss": 0.6289, + "step": 43669 + }, + { + "epoch": 1.12, + "learning_rate": 1.4435952422281093e-06, + "loss": 0.5898, + "step": 43670 + }, + { + "epoch": 1.12, + "learning_rate": 1.4435704430438387e-06, + "loss": 0.7207, + "step": 43671 + }, + { + "epoch": 1.12, + "learning_rate": 1.4435456435199464e-06, + "loss": 0.6548, + "step": 43672 + }, + { + "epoch": 1.12, + "learning_rate": 1.4435208436564522e-06, + "loss": 0.5913, + "step": 43673 + }, + { + "epoch": 1.12, + "learning_rate": 1.4434960434533741e-06, + "loss": 0.6328, + "step": 43674 + }, + { + "epoch": 1.12, + "learning_rate": 1.4434712429107316e-06, + "loss": 0.6138, + "step": 43675 + }, + { + "epoch": 1.12, + "learning_rate": 1.4434464420285432e-06, + "loss": 0.7188, + "step": 43676 + }, + { + "epoch": 1.12, + "learning_rate": 1.4434216408068287e-06, + "loss": 0.4454, + "step": 43677 + }, + { + "epoch": 1.12, + "learning_rate": 1.4433968392456064e-06, + "loss": 0.7695, + "step": 43678 + }, + { + "epoch": 1.12, + "learning_rate": 1.4433720373448956e-06, + "loss": 0.6914, + "step": 43679 + }, + { + "epoch": 1.12, + "learning_rate": 1.4433472351047154e-06, + "loss": 0.6479, + "step": 43680 + }, + { + "epoch": 1.12, + "learning_rate": 1.443322432525084e-06, + "loss": 0.4321, + "step": 43681 + }, + { + "epoch": 1.12, + "learning_rate": 1.4432976296060218e-06, + "loss": 0.6099, + "step": 43682 + }, + { + "epoch": 1.12, + "learning_rate": 1.4432728263475462e-06, + "loss": 0.791, + "step": 43683 + }, + { + "epoch": 1.12, + "learning_rate": 1.4432480227496777e-06, + "loss": 0.6406, + "step": 43684 + }, + { + "epoch": 1.12, + "learning_rate": 1.443223218812434e-06, + "loss": 0.6068, + "step": 43685 + }, + { + "epoch": 1.12, + "learning_rate": 1.4431984145358351e-06, + "loss": 0.7256, + "step": 43686 + }, + { + "epoch": 1.12, + "learning_rate": 1.4431736099198993e-06, + "loss": 0.4917, + "step": 43687 + }, + { + "epoch": 1.12, + "learning_rate": 1.4431488049646458e-06, + "loss": 0.8232, + "step": 43688 + }, + { + "epoch": 1.12, + "learning_rate": 1.4431239996700938e-06, + "loss": 0.6553, + "step": 43689 + }, + { + "epoch": 1.12, + "learning_rate": 1.4430991940362622e-06, + "loss": 0.627, + "step": 43690 + }, + { + "epoch": 1.12, + "learning_rate": 1.4430743880631697e-06, + "loss": 0.6294, + "step": 43691 + }, + { + "epoch": 1.12, + "learning_rate": 1.4430495817508356e-06, + "loss": 0.6221, + "step": 43692 + }, + { + "epoch": 1.12, + "learning_rate": 1.4430247750992788e-06, + "loss": 0.4822, + "step": 43693 + }, + { + "epoch": 1.12, + "learning_rate": 1.4429999681085186e-06, + "loss": 0.7012, + "step": 43694 + }, + { + "epoch": 1.12, + "learning_rate": 1.442975160778573e-06, + "loss": 0.667, + "step": 43695 + }, + { + "epoch": 1.12, + "learning_rate": 1.4429503531094625e-06, + "loss": 0.7354, + "step": 43696 + }, + { + "epoch": 1.12, + "learning_rate": 1.4429255451012048e-06, + "loss": 0.6055, + "step": 43697 + }, + { + "epoch": 1.12, + "learning_rate": 1.4429007367538194e-06, + "loss": 0.5664, + "step": 43698 + }, + { + "epoch": 1.12, + "learning_rate": 1.4428759280673255e-06, + "loss": 0.7051, + "step": 43699 + }, + { + "epoch": 1.12, + "learning_rate": 1.4428511190417414e-06, + "loss": 0.5581, + "step": 43700 + }, + { + "epoch": 1.12, + "learning_rate": 1.442826309677087e-06, + "loss": 0.6206, + "step": 43701 + }, + { + "epoch": 1.12, + "learning_rate": 1.4428014999733808e-06, + "loss": 0.7607, + "step": 43702 + }, + { + "epoch": 1.12, + "learning_rate": 1.4427766899306417e-06, + "loss": 0.7157, + "step": 43703 + }, + { + "epoch": 1.12, + "learning_rate": 1.4427518795488888e-06, + "loss": 0.666, + "step": 43704 + }, + { + "epoch": 1.12, + "learning_rate": 1.4427270688281415e-06, + "loss": 0.6284, + "step": 43705 + }, + { + "epoch": 1.12, + "learning_rate": 1.4427022577684181e-06, + "loss": 0.6631, + "step": 43706 + }, + { + "epoch": 1.12, + "learning_rate": 1.442677446369738e-06, + "loss": 0.6162, + "step": 43707 + }, + { + "epoch": 1.12, + "learning_rate": 1.44265263463212e-06, + "loss": 0.6689, + "step": 43708 + }, + { + "epoch": 1.12, + "learning_rate": 1.4426278225555836e-06, + "loss": 0.6069, + "step": 43709 + }, + { + "epoch": 1.12, + "learning_rate": 1.4426030101401472e-06, + "loss": 0.7344, + "step": 43710 + }, + { + "epoch": 1.12, + "learning_rate": 1.44257819738583e-06, + "loss": 0.7959, + "step": 43711 + }, + { + "epoch": 1.12, + "learning_rate": 1.442553384292651e-06, + "loss": 0.7305, + "step": 43712 + }, + { + "epoch": 1.12, + "learning_rate": 1.4425285708606293e-06, + "loss": 0.6797, + "step": 43713 + }, + { + "epoch": 1.12, + "learning_rate": 1.442503757089784e-06, + "loss": 0.4652, + "step": 43714 + }, + { + "epoch": 1.12, + "learning_rate": 1.4424789429801338e-06, + "loss": 0.5029, + "step": 43715 + }, + { + "epoch": 1.12, + "learning_rate": 1.4424541285316976e-06, + "loss": 0.7988, + "step": 43716 + }, + { + "epoch": 1.12, + "learning_rate": 1.442429313744495e-06, + "loss": 0.7192, + "step": 43717 + }, + { + "epoch": 1.12, + "learning_rate": 1.4424044986185443e-06, + "loss": 0.6982, + "step": 43718 + }, + { + "epoch": 1.12, + "learning_rate": 1.4423796831538648e-06, + "loss": 0.666, + "step": 43719 + }, + { + "epoch": 1.12, + "learning_rate": 1.4423548673504758e-06, + "loss": 0.5835, + "step": 43720 + }, + { + "epoch": 1.12, + "learning_rate": 1.4423300512083957e-06, + "loss": 0.7422, + "step": 43721 + }, + { + "epoch": 1.12, + "learning_rate": 1.4423052347276442e-06, + "loss": 0.6523, + "step": 43722 + }, + { + "epoch": 1.12, + "learning_rate": 1.4422804179082395e-06, + "loss": 0.7139, + "step": 43723 + }, + { + "epoch": 1.12, + "learning_rate": 1.4422556007502014e-06, + "loss": 0.6592, + "step": 43724 + }, + { + "epoch": 1.12, + "learning_rate": 1.442230783253548e-06, + "loss": 0.6685, + "step": 43725 + }, + { + "epoch": 1.12, + "learning_rate": 1.4422059654182995e-06, + "loss": 0.7793, + "step": 43726 + }, + { + "epoch": 1.12, + "learning_rate": 1.4421811472444737e-06, + "loss": 0.7422, + "step": 43727 + }, + { + "epoch": 1.12, + "learning_rate": 1.44215632873209e-06, + "loss": 0.6797, + "step": 43728 + }, + { + "epoch": 1.12, + "learning_rate": 1.4421315098811681e-06, + "loss": 0.6562, + "step": 43729 + }, + { + "epoch": 1.12, + "learning_rate": 1.4421066906917263e-06, + "loss": 0.5293, + "step": 43730 + }, + { + "epoch": 1.12, + "learning_rate": 1.4420818711637835e-06, + "loss": 0.4006, + "step": 43731 + }, + { + "epoch": 1.12, + "learning_rate": 1.442057051297359e-06, + "loss": 0.5669, + "step": 43732 + }, + { + "epoch": 1.12, + "learning_rate": 1.4420322310924717e-06, + "loss": 0.6504, + "step": 43733 + }, + { + "epoch": 1.12, + "learning_rate": 1.442007410549141e-06, + "loss": 0.7051, + "step": 43734 + }, + { + "epoch": 1.12, + "learning_rate": 1.4419825896673853e-06, + "loss": 0.8555, + "step": 43735 + }, + { + "epoch": 1.12, + "learning_rate": 1.4419577684472237e-06, + "loss": 0.5437, + "step": 43736 + }, + { + "epoch": 1.12, + "learning_rate": 1.4419329468886754e-06, + "loss": 0.6348, + "step": 43737 + }, + { + "epoch": 1.12, + "learning_rate": 1.4419081249917595e-06, + "loss": 0.6277, + "step": 43738 + }, + { + "epoch": 1.12, + "learning_rate": 1.441883302756495e-06, + "loss": 0.6685, + "step": 43739 + }, + { + "epoch": 1.12, + "learning_rate": 1.4418584801829005e-06, + "loss": 0.6846, + "step": 43740 + }, + { + "epoch": 1.12, + "learning_rate": 1.4418336572709952e-06, + "loss": 0.7031, + "step": 43741 + }, + { + "epoch": 1.12, + "learning_rate": 1.4418088340207987e-06, + "loss": 0.6067, + "step": 43742 + }, + { + "epoch": 1.12, + "learning_rate": 1.441784010432329e-06, + "loss": 0.8193, + "step": 43743 + }, + { + "epoch": 1.12, + "learning_rate": 1.4417591865056057e-06, + "loss": 0.5859, + "step": 43744 + }, + { + "epoch": 1.12, + "learning_rate": 1.441734362240648e-06, + "loss": 0.7305, + "step": 43745 + }, + { + "epoch": 1.12, + "learning_rate": 1.4417095376374741e-06, + "loss": 0.637, + "step": 43746 + }, + { + "epoch": 1.12, + "learning_rate": 1.4416847126961039e-06, + "loss": 0.6699, + "step": 43747 + }, + { + "epoch": 1.12, + "learning_rate": 1.441659887416556e-06, + "loss": 0.5869, + "step": 43748 + }, + { + "epoch": 1.12, + "learning_rate": 1.4416350617988494e-06, + "loss": 0.7363, + "step": 43749 + }, + { + "epoch": 1.12, + "learning_rate": 1.4416102358430028e-06, + "loss": 0.7734, + "step": 43750 + }, + { + "epoch": 1.12, + "learning_rate": 1.4415854095490362e-06, + "loss": 0.6113, + "step": 43751 + }, + { + "epoch": 1.12, + "learning_rate": 1.4415605829169672e-06, + "loss": 0.3911, + "step": 43752 + }, + { + "epoch": 1.12, + "learning_rate": 1.441535755946816e-06, + "loss": 0.5938, + "step": 43753 + }, + { + "epoch": 1.12, + "learning_rate": 1.4415109286386011e-06, + "loss": 0.4639, + "step": 43754 + }, + { + "epoch": 1.12, + "learning_rate": 1.4414861009923417e-06, + "loss": 0.6904, + "step": 43755 + }, + { + "epoch": 1.12, + "learning_rate": 1.4414612730080567e-06, + "loss": 0.6338, + "step": 43756 + }, + { + "epoch": 1.12, + "learning_rate": 1.441436444685765e-06, + "loss": 0.4238, + "step": 43757 + }, + { + "epoch": 1.12, + "learning_rate": 1.4414116160254856e-06, + "loss": 0.7363, + "step": 43758 + }, + { + "epoch": 1.12, + "learning_rate": 1.441386787027238e-06, + "loss": 0.6855, + "step": 43759 + }, + { + "epoch": 1.12, + "learning_rate": 1.4413619576910402e-06, + "loss": 0.6187, + "step": 43760 + }, + { + "epoch": 1.12, + "learning_rate": 1.4413371280169124e-06, + "loss": 0.7695, + "step": 43761 + }, + { + "epoch": 1.12, + "learning_rate": 1.4413122980048728e-06, + "loss": 0.625, + "step": 43762 + }, + { + "epoch": 1.12, + "learning_rate": 1.441287467654941e-06, + "loss": 0.6279, + "step": 43763 + }, + { + "epoch": 1.12, + "learning_rate": 1.4412626369671353e-06, + "loss": 0.7598, + "step": 43764 + }, + { + "epoch": 1.12, + "learning_rate": 1.441237805941475e-06, + "loss": 0.7666, + "step": 43765 + }, + { + "epoch": 1.12, + "learning_rate": 1.4412129745779796e-06, + "loss": 0.6675, + "step": 43766 + }, + { + "epoch": 1.12, + "learning_rate": 1.4411881428766675e-06, + "loss": 0.7607, + "step": 43767 + }, + { + "epoch": 1.12, + "learning_rate": 1.4411633108375578e-06, + "loss": 0.6499, + "step": 43768 + }, + { + "epoch": 1.12, + "learning_rate": 1.4411384784606698e-06, + "loss": 0.4534, + "step": 43769 + }, + { + "epoch": 1.12, + "learning_rate": 1.4411136457460225e-06, + "loss": 0.6631, + "step": 43770 + }, + { + "epoch": 1.12, + "learning_rate": 1.4410888126936341e-06, + "loss": 0.6895, + "step": 43771 + }, + { + "epoch": 1.12, + "learning_rate": 1.441063979303525e-06, + "loss": 0.5791, + "step": 43772 + }, + { + "epoch": 1.12, + "learning_rate": 1.4410391455757131e-06, + "loss": 0.51, + "step": 43773 + }, + { + "epoch": 1.12, + "learning_rate": 1.4410143115102185e-06, + "loss": 0.5608, + "step": 43774 + }, + { + "epoch": 1.12, + "learning_rate": 1.4409894771070587e-06, + "loss": 0.6592, + "step": 43775 + }, + { + "epoch": 1.12, + "learning_rate": 1.440964642366254e-06, + "loss": 0.6743, + "step": 43776 + }, + { + "epoch": 1.12, + "learning_rate": 1.4409398072878226e-06, + "loss": 0.5508, + "step": 43777 + }, + { + "epoch": 1.12, + "learning_rate": 1.4409149718717841e-06, + "loss": 0.665, + "step": 43778 + }, + { + "epoch": 1.12, + "learning_rate": 1.4408901361181571e-06, + "loss": 0.7637, + "step": 43779 + }, + { + "epoch": 1.12, + "learning_rate": 1.440865300026961e-06, + "loss": 0.6587, + "step": 43780 + }, + { + "epoch": 1.12, + "learning_rate": 1.4408404635982144e-06, + "loss": 0.6782, + "step": 43781 + }, + { + "epoch": 1.12, + "learning_rate": 1.4408156268319367e-06, + "loss": 0.3733, + "step": 43782 + }, + { + "epoch": 1.12, + "learning_rate": 1.4407907897281466e-06, + "loss": 0.5415, + "step": 43783 + }, + { + "epoch": 1.12, + "learning_rate": 1.4407659522868636e-06, + "loss": 0.625, + "step": 43784 + }, + { + "epoch": 1.12, + "learning_rate": 1.4407411145081061e-06, + "loss": 0.7153, + "step": 43785 + }, + { + "epoch": 1.12, + "learning_rate": 1.4407162763918933e-06, + "loss": 0.5588, + "step": 43786 + }, + { + "epoch": 1.12, + "learning_rate": 1.4406914379382444e-06, + "loss": 0.8379, + "step": 43787 + }, + { + "epoch": 1.12, + "learning_rate": 1.4406665991471784e-06, + "loss": 0.5264, + "step": 43788 + }, + { + "epoch": 1.12, + "learning_rate": 1.4406417600187144e-06, + "loss": 0.6099, + "step": 43789 + }, + { + "epoch": 1.12, + "learning_rate": 1.4406169205528709e-06, + "loss": 0.75, + "step": 43790 + }, + { + "epoch": 1.12, + "learning_rate": 1.4405920807496674e-06, + "loss": 0.6255, + "step": 43791 + }, + { + "epoch": 1.12, + "learning_rate": 1.440567240609123e-06, + "loss": 0.7344, + "step": 43792 + }, + { + "epoch": 1.12, + "learning_rate": 1.4405424001312563e-06, + "loss": 0.5596, + "step": 43793 + }, + { + "epoch": 1.12, + "learning_rate": 1.4405175593160867e-06, + "loss": 0.5928, + "step": 43794 + }, + { + "epoch": 1.12, + "learning_rate": 1.440492718163633e-06, + "loss": 0.7832, + "step": 43795 + }, + { + "epoch": 1.12, + "learning_rate": 1.4404678766739142e-06, + "loss": 0.7217, + "step": 43796 + }, + { + "epoch": 1.12, + "learning_rate": 1.4404430348469496e-06, + "loss": 0.6836, + "step": 43797 + }, + { + "epoch": 1.12, + "learning_rate": 1.4404181926827576e-06, + "loss": 0.6472, + "step": 43798 + }, + { + "epoch": 1.12, + "learning_rate": 1.4403933501813582e-06, + "loss": 0.582, + "step": 43799 + }, + { + "epoch": 1.12, + "learning_rate": 1.4403685073427697e-06, + "loss": 0.7412, + "step": 43800 + }, + { + "epoch": 1.12, + "learning_rate": 1.440343664167011e-06, + "loss": 0.5474, + "step": 43801 + }, + { + "epoch": 1.12, + "learning_rate": 1.4403188206541016e-06, + "loss": 0.7158, + "step": 43802 + }, + { + "epoch": 1.12, + "learning_rate": 1.4402939768040604e-06, + "loss": 0.5518, + "step": 43803 + }, + { + "epoch": 1.12, + "learning_rate": 1.4402691326169062e-06, + "loss": 0.8018, + "step": 43804 + }, + { + "epoch": 1.12, + "learning_rate": 1.4402442880926583e-06, + "loss": 0.5437, + "step": 43805 + }, + { + "epoch": 1.12, + "learning_rate": 1.4402194432313354e-06, + "loss": 0.6982, + "step": 43806 + }, + { + "epoch": 1.12, + "learning_rate": 1.4401945980329569e-06, + "loss": 0.6061, + "step": 43807 + }, + { + "epoch": 1.12, + "learning_rate": 1.4401697524975414e-06, + "loss": 0.6479, + "step": 43808 + }, + { + "epoch": 1.12, + "learning_rate": 1.4401449066251084e-06, + "loss": 0.7935, + "step": 43809 + }, + { + "epoch": 1.12, + "learning_rate": 1.4401200604156767e-06, + "loss": 0.7188, + "step": 43810 + }, + { + "epoch": 1.12, + "learning_rate": 1.4400952138692653e-06, + "loss": 0.6909, + "step": 43811 + }, + { + "epoch": 1.12, + "learning_rate": 1.4400703669858928e-06, + "loss": 0.4805, + "step": 43812 + }, + { + "epoch": 1.12, + "learning_rate": 1.4400455197655791e-06, + "loss": 0.5132, + "step": 43813 + }, + { + "epoch": 1.12, + "learning_rate": 1.4400206722083428e-06, + "loss": 0.5547, + "step": 43814 + }, + { + "epoch": 1.12, + "learning_rate": 1.4399958243142027e-06, + "loss": 0.6709, + "step": 43815 + }, + { + "epoch": 1.12, + "learning_rate": 1.4399709760831781e-06, + "loss": 0.749, + "step": 43816 + }, + { + "epoch": 1.12, + "learning_rate": 1.439946127515288e-06, + "loss": 0.7085, + "step": 43817 + }, + { + "epoch": 1.12, + "learning_rate": 1.4399212786105514e-06, + "loss": 0.6016, + "step": 43818 + }, + { + "epoch": 1.12, + "learning_rate": 1.4398964293689873e-06, + "loss": 0.708, + "step": 43819 + }, + { + "epoch": 1.12, + "learning_rate": 1.4398715797906147e-06, + "loss": 0.6172, + "step": 43820 + }, + { + "epoch": 1.12, + "learning_rate": 1.4398467298754526e-06, + "loss": 0.5625, + "step": 43821 + }, + { + "epoch": 1.12, + "learning_rate": 1.43982187962352e-06, + "loss": 0.6479, + "step": 43822 + }, + { + "epoch": 1.12, + "learning_rate": 1.439797029034836e-06, + "loss": 0.6694, + "step": 43823 + }, + { + "epoch": 1.12, + "learning_rate": 1.4397721781094202e-06, + "loss": 0.6729, + "step": 43824 + }, + { + "epoch": 1.12, + "learning_rate": 1.4397473268472903e-06, + "loss": 0.6709, + "step": 43825 + }, + { + "epoch": 1.12, + "learning_rate": 1.4397224752484666e-06, + "loss": 0.6729, + "step": 43826 + }, + { + "epoch": 1.12, + "learning_rate": 1.4396976233129674e-06, + "loss": 0.6782, + "step": 43827 + }, + { + "epoch": 1.12, + "learning_rate": 1.439672771040812e-06, + "loss": 0.5425, + "step": 43828 + }, + { + "epoch": 1.12, + "learning_rate": 1.4396479184320193e-06, + "loss": 0.542, + "step": 43829 + }, + { + "epoch": 1.12, + "learning_rate": 1.4396230654866086e-06, + "loss": 0.5144, + "step": 43830 + }, + { + "epoch": 1.12, + "learning_rate": 1.4395982122045985e-06, + "loss": 0.6699, + "step": 43831 + }, + { + "epoch": 1.12, + "learning_rate": 1.4395733585860086e-06, + "loss": 0.7148, + "step": 43832 + }, + { + "epoch": 1.12, + "learning_rate": 1.4395485046308571e-06, + "loss": 0.5571, + "step": 43833 + }, + { + "epoch": 1.12, + "learning_rate": 1.4395236503391638e-06, + "loss": 0.6709, + "step": 43834 + }, + { + "epoch": 1.12, + "learning_rate": 1.4394987957109477e-06, + "loss": 0.6807, + "step": 43835 + }, + { + "epoch": 1.12, + "learning_rate": 1.439473940746227e-06, + "loss": 0.6709, + "step": 43836 + }, + { + "epoch": 1.12, + "learning_rate": 1.4394490854450216e-06, + "loss": 0.8389, + "step": 43837 + }, + { + "epoch": 1.12, + "learning_rate": 1.4394242298073503e-06, + "loss": 0.7002, + "step": 43838 + }, + { + "epoch": 1.12, + "learning_rate": 1.4393993738332321e-06, + "loss": 0.7324, + "step": 43839 + }, + { + "epoch": 1.12, + "learning_rate": 1.439374517522686e-06, + "loss": 0.5957, + "step": 43840 + }, + { + "epoch": 1.12, + "learning_rate": 1.439349660875731e-06, + "loss": 0.5425, + "step": 43841 + }, + { + "epoch": 1.12, + "learning_rate": 1.439324803892386e-06, + "loss": 0.8438, + "step": 43842 + }, + { + "epoch": 1.12, + "learning_rate": 1.4392999465726704e-06, + "loss": 0.5474, + "step": 43843 + }, + { + "epoch": 1.12, + "learning_rate": 1.439275088916603e-06, + "loss": 0.9287, + "step": 43844 + }, + { + "epoch": 1.12, + "learning_rate": 1.439250230924203e-06, + "loss": 0.7588, + "step": 43845 + }, + { + "epoch": 1.12, + "learning_rate": 1.439225372595489e-06, + "loss": 0.5232, + "step": 43846 + }, + { + "epoch": 1.12, + "learning_rate": 1.4392005139304803e-06, + "loss": 0.6895, + "step": 43847 + }, + { + "epoch": 1.12, + "learning_rate": 1.4391756549291963e-06, + "loss": 0.6631, + "step": 43848 + }, + { + "epoch": 1.12, + "learning_rate": 1.4391507955916557e-06, + "loss": 0.7246, + "step": 43849 + }, + { + "epoch": 1.12, + "learning_rate": 1.4391259359178772e-06, + "loss": 0.7549, + "step": 43850 + }, + { + "epoch": 1.12, + "learning_rate": 1.4391010759078803e-06, + "loss": 0.7539, + "step": 43851 + }, + { + "epoch": 1.12, + "learning_rate": 1.4390762155616838e-06, + "loss": 0.7334, + "step": 43852 + }, + { + "epoch": 1.12, + "learning_rate": 1.439051354879307e-06, + "loss": 0.792, + "step": 43853 + }, + { + "epoch": 1.12, + "learning_rate": 1.4390264938607688e-06, + "loss": 0.7432, + "step": 43854 + }, + { + "epoch": 1.12, + "learning_rate": 1.439001632506088e-06, + "loss": 0.6973, + "step": 43855 + }, + { + "epoch": 1.12, + "learning_rate": 1.4389767708152837e-06, + "loss": 0.5479, + "step": 43856 + }, + { + "epoch": 1.12, + "learning_rate": 1.4389519087883754e-06, + "loss": 0.583, + "step": 43857 + }, + { + "epoch": 1.12, + "learning_rate": 1.4389270464253818e-06, + "loss": 0.6206, + "step": 43858 + }, + { + "epoch": 1.12, + "learning_rate": 1.4389021837263217e-06, + "loss": 0.6787, + "step": 43859 + }, + { + "epoch": 1.12, + "learning_rate": 1.4388773206912149e-06, + "loss": 0.6699, + "step": 43860 + }, + { + "epoch": 1.12, + "learning_rate": 1.4388524573200793e-06, + "loss": 0.626, + "step": 43861 + }, + { + "epoch": 1.12, + "learning_rate": 1.4388275936129348e-06, + "loss": 0.5544, + "step": 43862 + }, + { + "epoch": 1.12, + "learning_rate": 1.4388027295698003e-06, + "loss": 0.4041, + "step": 43863 + }, + { + "epoch": 1.12, + "learning_rate": 1.4387778651906948e-06, + "loss": 0.5547, + "step": 43864 + }, + { + "epoch": 1.12, + "learning_rate": 1.438753000475637e-06, + "loss": 0.7349, + "step": 43865 + }, + { + "epoch": 1.12, + "learning_rate": 1.4387281354246464e-06, + "loss": 0.6567, + "step": 43866 + }, + { + "epoch": 1.12, + "learning_rate": 1.4387032700377416e-06, + "loss": 0.7012, + "step": 43867 + }, + { + "epoch": 1.12, + "learning_rate": 1.4386784043149418e-06, + "loss": 0.668, + "step": 43868 + }, + { + "epoch": 1.12, + "learning_rate": 1.4386535382562665e-06, + "loss": 0.6499, + "step": 43869 + }, + { + "epoch": 1.12, + "learning_rate": 1.4386286718617343e-06, + "loss": 0.8408, + "step": 43870 + }, + { + "epoch": 1.12, + "learning_rate": 1.438603805131364e-06, + "loss": 0.6123, + "step": 43871 + }, + { + "epoch": 1.12, + "learning_rate": 1.438578938065175e-06, + "loss": 0.6914, + "step": 43872 + }, + { + "epoch": 1.12, + "learning_rate": 1.4385540706631867e-06, + "loss": 0.7529, + "step": 43873 + }, + { + "epoch": 1.12, + "learning_rate": 1.4385292029254173e-06, + "loss": 0.8809, + "step": 43874 + }, + { + "epoch": 1.12, + "learning_rate": 1.4385043348518862e-06, + "loss": 0.6641, + "step": 43875 + }, + { + "epoch": 1.12, + "learning_rate": 1.4384794664426127e-06, + "loss": 0.4795, + "step": 43876 + }, + { + "epoch": 1.12, + "learning_rate": 1.4384545976976155e-06, + "loss": 0.5559, + "step": 43877 + }, + { + "epoch": 1.12, + "learning_rate": 1.4384297286169141e-06, + "loss": 0.4841, + "step": 43878 + }, + { + "epoch": 1.12, + "learning_rate": 1.4384048592005268e-06, + "loss": 0.4594, + "step": 43879 + }, + { + "epoch": 1.12, + "learning_rate": 1.4383799894484732e-06, + "loss": 0.8701, + "step": 43880 + }, + { + "epoch": 1.12, + "learning_rate": 1.438355119360772e-06, + "loss": 0.8125, + "step": 43881 + }, + { + "epoch": 1.12, + "learning_rate": 1.4383302489374428e-06, + "loss": 0.7012, + "step": 43882 + }, + { + "epoch": 1.12, + "learning_rate": 1.4383053781785044e-06, + "loss": 0.5688, + "step": 43883 + }, + { + "epoch": 1.12, + "learning_rate": 1.4382805070839755e-06, + "loss": 0.7842, + "step": 43884 + }, + { + "epoch": 1.12, + "learning_rate": 1.438255635653875e-06, + "loss": 0.7988, + "step": 43885 + }, + { + "epoch": 1.12, + "learning_rate": 1.4382307638882228e-06, + "loss": 0.6953, + "step": 43886 + }, + { + "epoch": 1.12, + "learning_rate": 1.4382058917870373e-06, + "loss": 0.6807, + "step": 43887 + }, + { + "epoch": 1.12, + "learning_rate": 1.4381810193503378e-06, + "loss": 0.5415, + "step": 43888 + }, + { + "epoch": 1.12, + "learning_rate": 1.4381561465781432e-06, + "loss": 0.6233, + "step": 43889 + }, + { + "epoch": 1.12, + "learning_rate": 1.4381312734704723e-06, + "loss": 0.5354, + "step": 43890 + }, + { + "epoch": 1.12, + "learning_rate": 1.438106400027345e-06, + "loss": 0.6284, + "step": 43891 + }, + { + "epoch": 1.12, + "learning_rate": 1.438081526248779e-06, + "loss": 0.519, + "step": 43892 + }, + { + "epoch": 1.12, + "learning_rate": 1.438056652134795e-06, + "loss": 0.7188, + "step": 43893 + }, + { + "epoch": 1.13, + "learning_rate": 1.4380317776854106e-06, + "loss": 0.6211, + "step": 43894 + }, + { + "epoch": 1.13, + "learning_rate": 1.4380069029006454e-06, + "loss": 0.5021, + "step": 43895 + }, + { + "epoch": 1.13, + "learning_rate": 1.4379820277805186e-06, + "loss": 0.5933, + "step": 43896 + }, + { + "epoch": 1.13, + "learning_rate": 1.4379571523250491e-06, + "loss": 0.7646, + "step": 43897 + }, + { + "epoch": 1.13, + "learning_rate": 1.4379322765342559e-06, + "loss": 0.4951, + "step": 43898 + }, + { + "epoch": 1.13, + "learning_rate": 1.4379074004081583e-06, + "loss": 0.411, + "step": 43899 + }, + { + "epoch": 1.13, + "learning_rate": 1.437882523946775e-06, + "loss": 0.5957, + "step": 43900 + }, + { + "epoch": 1.13, + "learning_rate": 1.437857647150125e-06, + "loss": 0.7314, + "step": 43901 + }, + { + "epoch": 1.13, + "learning_rate": 1.4378327700182276e-06, + "loss": 0.6992, + "step": 43902 + }, + { + "epoch": 1.13, + "learning_rate": 1.437807892551102e-06, + "loss": 0.6348, + "step": 43903 + }, + { + "epoch": 1.13, + "learning_rate": 1.4377830147487668e-06, + "loss": 0.6802, + "step": 43904 + }, + { + "epoch": 1.13, + "learning_rate": 1.4377581366112412e-06, + "loss": 0.5403, + "step": 43905 + }, + { + "epoch": 1.13, + "learning_rate": 1.4377332581385447e-06, + "loss": 0.7441, + "step": 43906 + }, + { + "epoch": 1.13, + "learning_rate": 1.4377083793306955e-06, + "loss": 0.5757, + "step": 43907 + }, + { + "epoch": 1.13, + "learning_rate": 1.4376835001877136e-06, + "loss": 0.6582, + "step": 43908 + }, + { + "epoch": 1.13, + "learning_rate": 1.4376586207096174e-06, + "loss": 0.5825, + "step": 43909 + }, + { + "epoch": 1.13, + "learning_rate": 1.437633740896426e-06, + "loss": 0.5947, + "step": 43910 + }, + { + "epoch": 1.13, + "learning_rate": 1.4376088607481585e-06, + "loss": 0.8027, + "step": 43911 + }, + { + "epoch": 1.13, + "learning_rate": 1.437583980264834e-06, + "loss": 0.3591, + "step": 43912 + }, + { + "epoch": 1.13, + "learning_rate": 1.437559099446472e-06, + "loss": 0.7422, + "step": 43913 + }, + { + "epoch": 1.13, + "learning_rate": 1.437534218293091e-06, + "loss": 0.5415, + "step": 43914 + }, + { + "epoch": 1.13, + "learning_rate": 1.4375093368047097e-06, + "loss": 0.5908, + "step": 43915 + }, + { + "epoch": 1.13, + "learning_rate": 1.4374844549813482e-06, + "loss": 0.5405, + "step": 43916 + }, + { + "epoch": 1.13, + "learning_rate": 1.4374595728230243e-06, + "loss": 0.5605, + "step": 43917 + }, + { + "epoch": 1.13, + "learning_rate": 1.4374346903297584e-06, + "loss": 0.5283, + "step": 43918 + }, + { + "epoch": 1.13, + "learning_rate": 1.4374098075015685e-06, + "loss": 0.6421, + "step": 43919 + }, + { + "epoch": 1.13, + "learning_rate": 1.437384924338474e-06, + "loss": 0.6455, + "step": 43920 + }, + { + "epoch": 1.13, + "learning_rate": 1.437360040840494e-06, + "loss": 0.4819, + "step": 43921 + }, + { + "epoch": 1.13, + "learning_rate": 1.4373351570076478e-06, + "loss": 0.6138, + "step": 43922 + }, + { + "epoch": 1.13, + "learning_rate": 1.437310272839954e-06, + "loss": 0.5288, + "step": 43923 + }, + { + "epoch": 1.13, + "learning_rate": 1.4372853883374316e-06, + "loss": 0.5938, + "step": 43924 + }, + { + "epoch": 1.13, + "learning_rate": 1.4372605035001005e-06, + "loss": 0.6572, + "step": 43925 + }, + { + "epoch": 1.13, + "learning_rate": 1.4372356183279784e-06, + "loss": 0.6826, + "step": 43926 + }, + { + "epoch": 1.13, + "learning_rate": 1.4372107328210853e-06, + "loss": 0.6064, + "step": 43927 + }, + { + "epoch": 1.13, + "learning_rate": 1.4371858469794404e-06, + "loss": 0.6714, + "step": 43928 + }, + { + "epoch": 1.13, + "learning_rate": 1.4371609608030624e-06, + "loss": 0.6147, + "step": 43929 + }, + { + "epoch": 1.13, + "learning_rate": 1.4371360742919699e-06, + "loss": 0.5889, + "step": 43930 + }, + { + "epoch": 1.13, + "learning_rate": 1.4371111874461829e-06, + "loss": 0.751, + "step": 43931 + }, + { + "epoch": 1.13, + "learning_rate": 1.4370863002657191e-06, + "loss": 0.6338, + "step": 43932 + }, + { + "epoch": 1.13, + "learning_rate": 1.4370614127505995e-06, + "loss": 0.7842, + "step": 43933 + }, + { + "epoch": 1.13, + "learning_rate": 1.4370365249008415e-06, + "loss": 0.5171, + "step": 43934 + }, + { + "epoch": 1.13, + "learning_rate": 1.4370116367164648e-06, + "loss": 0.4404, + "step": 43935 + }, + { + "epoch": 1.13, + "learning_rate": 1.4369867481974884e-06, + "loss": 0.5359, + "step": 43936 + }, + { + "epoch": 1.13, + "learning_rate": 1.4369618593439312e-06, + "loss": 0.7363, + "step": 43937 + }, + { + "epoch": 1.13, + "learning_rate": 1.4369369701558128e-06, + "loss": 0.4412, + "step": 43938 + }, + { + "epoch": 1.13, + "learning_rate": 1.4369120806331516e-06, + "loss": 0.6606, + "step": 43939 + }, + { + "epoch": 1.13, + "learning_rate": 1.4368871907759667e-06, + "loss": 0.6738, + "step": 43940 + }, + { + "epoch": 1.13, + "learning_rate": 1.4368623005842776e-06, + "loss": 0.7041, + "step": 43941 + }, + { + "epoch": 1.13, + "learning_rate": 1.4368374100581032e-06, + "loss": 0.7676, + "step": 43942 + }, + { + "epoch": 1.13, + "learning_rate": 1.4368125191974622e-06, + "loss": 0.7129, + "step": 43943 + }, + { + "epoch": 1.13, + "learning_rate": 1.4367876280023742e-06, + "loss": 0.5952, + "step": 43944 + }, + { + "epoch": 1.13, + "learning_rate": 1.4367627364728581e-06, + "loss": 0.6543, + "step": 43945 + }, + { + "epoch": 1.13, + "learning_rate": 1.4367378446089324e-06, + "loss": 0.6826, + "step": 43946 + }, + { + "epoch": 1.13, + "learning_rate": 1.436712952410617e-06, + "loss": 0.6914, + "step": 43947 + }, + { + "epoch": 1.13, + "learning_rate": 1.4366880598779305e-06, + "loss": 0.5537, + "step": 43948 + }, + { + "epoch": 1.13, + "learning_rate": 1.436663167010892e-06, + "loss": 0.8682, + "step": 43949 + }, + { + "epoch": 1.13, + "learning_rate": 1.4366382738095206e-06, + "loss": 0.627, + "step": 43950 + }, + { + "epoch": 1.13, + "learning_rate": 1.4366133802738351e-06, + "loss": 0.6343, + "step": 43951 + }, + { + "epoch": 1.13, + "learning_rate": 1.436588486403855e-06, + "loss": 0.5044, + "step": 43952 + }, + { + "epoch": 1.13, + "learning_rate": 1.4365635921995993e-06, + "loss": 0.7295, + "step": 43953 + }, + { + "epoch": 1.13, + "learning_rate": 1.436538697661087e-06, + "loss": 0.5986, + "step": 43954 + }, + { + "epoch": 1.13, + "learning_rate": 1.4365138027883368e-06, + "loss": 0.7266, + "step": 43955 + }, + { + "epoch": 1.13, + "learning_rate": 1.4364889075813683e-06, + "loss": 0.8623, + "step": 43956 + }, + { + "epoch": 1.13, + "learning_rate": 1.4364640120402e-06, + "loss": 0.5146, + "step": 43957 + }, + { + "epoch": 1.13, + "learning_rate": 1.4364391161648516e-06, + "loss": 0.6055, + "step": 43958 + }, + { + "epoch": 1.13, + "learning_rate": 1.4364142199553417e-06, + "loss": 0.4651, + "step": 43959 + }, + { + "epoch": 1.13, + "learning_rate": 1.4363893234116894e-06, + "loss": 0.626, + "step": 43960 + }, + { + "epoch": 1.13, + "learning_rate": 1.4363644265339141e-06, + "loss": 0.5974, + "step": 43961 + }, + { + "epoch": 1.13, + "learning_rate": 1.4363395293220344e-06, + "loss": 0.6719, + "step": 43962 + }, + { + "epoch": 1.13, + "learning_rate": 1.43631463177607e-06, + "loss": 0.666, + "step": 43963 + }, + { + "epoch": 1.13, + "learning_rate": 1.4362897338960391e-06, + "loss": 0.7959, + "step": 43964 + }, + { + "epoch": 1.13, + "learning_rate": 1.4362648356819614e-06, + "loss": 0.5149, + "step": 43965 + }, + { + "epoch": 1.13, + "learning_rate": 1.4362399371338556e-06, + "loss": 0.6104, + "step": 43966 + }, + { + "epoch": 1.13, + "learning_rate": 1.4362150382517408e-06, + "loss": 0.4878, + "step": 43967 + }, + { + "epoch": 1.13, + "learning_rate": 1.4361901390356366e-06, + "loss": 0.6348, + "step": 43968 + }, + { + "epoch": 1.13, + "learning_rate": 1.4361652394855618e-06, + "loss": 0.6045, + "step": 43969 + }, + { + "epoch": 1.13, + "learning_rate": 1.4361403396015349e-06, + "loss": 0.7002, + "step": 43970 + }, + { + "epoch": 1.13, + "learning_rate": 1.4361154393835756e-06, + "loss": 0.3394, + "step": 43971 + }, + { + "epoch": 1.13, + "learning_rate": 1.4360905388317024e-06, + "loss": 0.6045, + "step": 43972 + }, + { + "epoch": 1.13, + "learning_rate": 1.4360656379459353e-06, + "loss": 0.7441, + "step": 43973 + }, + { + "epoch": 1.13, + "learning_rate": 1.4360407367262925e-06, + "loss": 0.8057, + "step": 43974 + }, + { + "epoch": 1.13, + "learning_rate": 1.4360158351727933e-06, + "loss": 0.7422, + "step": 43975 + }, + { + "epoch": 1.13, + "learning_rate": 1.435990933285457e-06, + "loss": 0.6343, + "step": 43976 + }, + { + "epoch": 1.13, + "learning_rate": 1.4359660310643023e-06, + "loss": 0.5942, + "step": 43977 + }, + { + "epoch": 1.13, + "learning_rate": 1.4359411285093486e-06, + "loss": 0.5869, + "step": 43978 + }, + { + "epoch": 1.13, + "learning_rate": 1.435916225620615e-06, + "loss": 0.6396, + "step": 43979 + }, + { + "epoch": 1.13, + "learning_rate": 1.4358913223981198e-06, + "loss": 0.583, + "step": 43980 + }, + { + "epoch": 1.13, + "learning_rate": 1.4358664188418832e-06, + "loss": 0.5044, + "step": 43981 + }, + { + "epoch": 1.13, + "learning_rate": 1.4358415149519235e-06, + "loss": 0.876, + "step": 43982 + }, + { + "epoch": 1.13, + "learning_rate": 1.4358166107282603e-06, + "loss": 0.7988, + "step": 43983 + }, + { + "epoch": 1.13, + "learning_rate": 1.435791706170912e-06, + "loss": 0.8213, + "step": 43984 + }, + { + "epoch": 1.13, + "learning_rate": 1.435766801279898e-06, + "loss": 0.688, + "step": 43985 + }, + { + "epoch": 1.13, + "learning_rate": 1.4357418960552376e-06, + "loss": 0.7148, + "step": 43986 + }, + { + "epoch": 1.13, + "learning_rate": 1.4357169904969494e-06, + "loss": 0.7256, + "step": 43987 + }, + { + "epoch": 1.13, + "learning_rate": 1.4356920846050532e-06, + "loss": 0.7319, + "step": 43988 + }, + { + "epoch": 1.13, + "learning_rate": 1.4356671783795671e-06, + "loss": 0.7549, + "step": 43989 + }, + { + "epoch": 1.13, + "learning_rate": 1.435642271820511e-06, + "loss": 0.4607, + "step": 43990 + }, + { + "epoch": 1.13, + "learning_rate": 1.4356173649279038e-06, + "loss": 0.5918, + "step": 43991 + }, + { + "epoch": 1.13, + "learning_rate": 1.435592457701764e-06, + "loss": 0.5488, + "step": 43992 + }, + { + "epoch": 1.13, + "learning_rate": 1.4355675501421113e-06, + "loss": 0.6143, + "step": 43993 + }, + { + "epoch": 1.13, + "learning_rate": 1.4355426422489645e-06, + "loss": 0.6128, + "step": 43994 + }, + { + "epoch": 1.13, + "learning_rate": 1.4355177340223426e-06, + "loss": 0.7012, + "step": 43995 + }, + { + "epoch": 1.13, + "learning_rate": 1.435492825462265e-06, + "loss": 0.5085, + "step": 43996 + }, + { + "epoch": 1.13, + "learning_rate": 1.4354679165687504e-06, + "loss": 0.6543, + "step": 43997 + }, + { + "epoch": 1.13, + "learning_rate": 1.4354430073418183e-06, + "loss": 0.6229, + "step": 43998 + }, + { + "epoch": 1.13, + "learning_rate": 1.4354180977814872e-06, + "loss": 0.6577, + "step": 43999 + }, + { + "epoch": 1.13, + "learning_rate": 1.4353931878877767e-06, + "loss": 0.6982, + "step": 44000 + }, + { + "epoch": 1.13, + "learning_rate": 1.4353682776607055e-06, + "loss": 0.8232, + "step": 44001 + }, + { + "epoch": 1.13, + "learning_rate": 1.435343367100293e-06, + "loss": 0.6748, + "step": 44002 + }, + { + "epoch": 1.13, + "learning_rate": 1.4353184562065582e-06, + "loss": 0.7129, + "step": 44003 + }, + { + "epoch": 1.13, + "learning_rate": 1.4352935449795198e-06, + "loss": 0.6094, + "step": 44004 + }, + { + "epoch": 1.13, + "learning_rate": 1.4352686334191973e-06, + "loss": 0.5919, + "step": 44005 + }, + { + "epoch": 1.13, + "learning_rate": 1.4352437215256095e-06, + "loss": 0.6787, + "step": 44006 + }, + { + "epoch": 1.13, + "learning_rate": 1.4352188092987756e-06, + "loss": 0.6611, + "step": 44007 + }, + { + "epoch": 1.13, + "learning_rate": 1.435193896738715e-06, + "loss": 0.6768, + "step": 44008 + }, + { + "epoch": 1.13, + "learning_rate": 1.435168983845446e-06, + "loss": 0.6895, + "step": 44009 + }, + { + "epoch": 1.13, + "learning_rate": 1.4351440706189884e-06, + "loss": 0.7578, + "step": 44010 + }, + { + "epoch": 1.13, + "learning_rate": 1.4351191570593607e-06, + "loss": 0.6313, + "step": 44011 + }, + { + "epoch": 1.13, + "learning_rate": 1.4350942431665824e-06, + "loss": 0.6118, + "step": 44012 + }, + { + "epoch": 1.13, + "learning_rate": 1.4350693289406726e-06, + "loss": 0.5435, + "step": 44013 + }, + { + "epoch": 1.13, + "learning_rate": 1.43504441438165e-06, + "loss": 0.6455, + "step": 44014 + }, + { + "epoch": 1.13, + "learning_rate": 1.4350194994895341e-06, + "loss": 0.6055, + "step": 44015 + }, + { + "epoch": 1.13, + "learning_rate": 1.4349945842643436e-06, + "loss": 0.7119, + "step": 44016 + }, + { + "epoch": 1.13, + "learning_rate": 1.434969668706098e-06, + "loss": 0.7793, + "step": 44017 + }, + { + "epoch": 1.13, + "learning_rate": 1.434944752814816e-06, + "loss": 0.792, + "step": 44018 + }, + { + "epoch": 1.13, + "learning_rate": 1.4349198365905166e-06, + "loss": 0.4829, + "step": 44019 + }, + { + "epoch": 1.13, + "learning_rate": 1.4348949200332192e-06, + "loss": 0.7441, + "step": 44020 + }, + { + "epoch": 1.13, + "learning_rate": 1.4348700031429429e-06, + "loss": 0.835, + "step": 44021 + }, + { + "epoch": 1.13, + "learning_rate": 1.4348450859197062e-06, + "loss": 0.7471, + "step": 44022 + }, + { + "epoch": 1.13, + "learning_rate": 1.4348201683635295e-06, + "loss": 0.8716, + "step": 44023 + }, + { + "epoch": 1.13, + "learning_rate": 1.4347952504744303e-06, + "loss": 0.7568, + "step": 44024 + }, + { + "epoch": 1.13, + "learning_rate": 1.4347703322524285e-06, + "loss": 0.6826, + "step": 44025 + }, + { + "epoch": 1.13, + "learning_rate": 1.4347454136975427e-06, + "loss": 0.585, + "step": 44026 + }, + { + "epoch": 1.13, + "learning_rate": 1.434720494809793e-06, + "loss": 0.6729, + "step": 44027 + }, + { + "epoch": 1.13, + "learning_rate": 1.4346955755891973e-06, + "loss": 0.4553, + "step": 44028 + }, + { + "epoch": 1.13, + "learning_rate": 1.4346706560357756e-06, + "loss": 0.7861, + "step": 44029 + }, + { + "epoch": 1.13, + "learning_rate": 1.434645736149546e-06, + "loss": 0.7578, + "step": 44030 + }, + { + "epoch": 1.13, + "learning_rate": 1.4346208159305286e-06, + "loss": 0.7402, + "step": 44031 + }, + { + "epoch": 1.13, + "learning_rate": 1.434595895378742e-06, + "loss": 0.6006, + "step": 44032 + }, + { + "epoch": 1.13, + "learning_rate": 1.4345709744942051e-06, + "loss": 0.4878, + "step": 44033 + }, + { + "epoch": 1.13, + "learning_rate": 1.4345460532769375e-06, + "loss": 0.7412, + "step": 44034 + }, + { + "epoch": 1.13, + "learning_rate": 1.4345211317269579e-06, + "loss": 0.6465, + "step": 44035 + }, + { + "epoch": 1.13, + "learning_rate": 1.434496209844285e-06, + "loss": 0.6377, + "step": 44036 + }, + { + "epoch": 1.13, + "learning_rate": 1.4344712876289386e-06, + "loss": 0.6836, + "step": 44037 + }, + { + "epoch": 1.13, + "learning_rate": 1.4344463650809377e-06, + "loss": 0.7607, + "step": 44038 + }, + { + "epoch": 1.13, + "learning_rate": 1.4344214422003009e-06, + "loss": 0.6416, + "step": 44039 + }, + { + "epoch": 1.13, + "learning_rate": 1.434396518987048e-06, + "loss": 0.7559, + "step": 44040 + }, + { + "epoch": 1.13, + "learning_rate": 1.4343715954411972e-06, + "loss": 0.6792, + "step": 44041 + }, + { + "epoch": 1.13, + "learning_rate": 1.434346671562768e-06, + "loss": 0.7427, + "step": 44042 + }, + { + "epoch": 1.13, + "learning_rate": 1.4343217473517802e-06, + "loss": 0.5381, + "step": 44043 + }, + { + "epoch": 1.13, + "learning_rate": 1.4342968228082516e-06, + "loss": 0.418, + "step": 44044 + }, + { + "epoch": 1.13, + "learning_rate": 1.434271897932202e-06, + "loss": 0.6445, + "step": 44045 + }, + { + "epoch": 1.13, + "learning_rate": 1.4342469727236506e-06, + "loss": 0.5198, + "step": 44046 + }, + { + "epoch": 1.13, + "learning_rate": 1.4342220471826159e-06, + "loss": 0.7783, + "step": 44047 + }, + { + "epoch": 1.13, + "learning_rate": 1.4341971213091177e-06, + "loss": 0.5786, + "step": 44048 + }, + { + "epoch": 1.13, + "learning_rate": 1.4341721951031745e-06, + "loss": 0.7451, + "step": 44049 + }, + { + "epoch": 1.13, + "learning_rate": 1.4341472685648057e-06, + "loss": 0.7173, + "step": 44050 + }, + { + "epoch": 1.13, + "learning_rate": 1.4341223416940302e-06, + "loss": 0.4885, + "step": 44051 + }, + { + "epoch": 1.13, + "learning_rate": 1.4340974144908673e-06, + "loss": 0.7339, + "step": 44052 + }, + { + "epoch": 1.13, + "learning_rate": 1.434072486955336e-06, + "loss": 0.7539, + "step": 44053 + }, + { + "epoch": 1.13, + "learning_rate": 1.4340475590874555e-06, + "loss": 0.6323, + "step": 44054 + }, + { + "epoch": 1.13, + "learning_rate": 1.4340226308872442e-06, + "loss": 0.624, + "step": 44055 + }, + { + "epoch": 1.13, + "learning_rate": 1.4339977023547222e-06, + "loss": 0.709, + "step": 44056 + }, + { + "epoch": 1.13, + "learning_rate": 1.433972773489908e-06, + "loss": 0.5669, + "step": 44057 + }, + { + "epoch": 1.13, + "learning_rate": 1.4339478442928208e-06, + "loss": 0.5742, + "step": 44058 + }, + { + "epoch": 1.13, + "learning_rate": 1.4339229147634798e-06, + "loss": 0.6367, + "step": 44059 + }, + { + "epoch": 1.13, + "learning_rate": 1.4338979849019036e-06, + "loss": 0.6655, + "step": 44060 + }, + { + "epoch": 1.13, + "learning_rate": 1.433873054708112e-06, + "loss": 0.52, + "step": 44061 + }, + { + "epoch": 1.13, + "learning_rate": 1.4338481241821233e-06, + "loss": 0.5085, + "step": 44062 + }, + { + "epoch": 1.13, + "learning_rate": 1.433823193323958e-06, + "loss": 0.5037, + "step": 44063 + }, + { + "epoch": 1.13, + "learning_rate": 1.4337982621336334e-06, + "loss": 0.3794, + "step": 44064 + }, + { + "epoch": 1.13, + "learning_rate": 1.4337733306111696e-06, + "loss": 0.6201, + "step": 44065 + }, + { + "epoch": 1.13, + "learning_rate": 1.4337483987565854e-06, + "loss": 0.4041, + "step": 44066 + }, + { + "epoch": 1.13, + "learning_rate": 1.4337234665699002e-06, + "loss": 0.8418, + "step": 44067 + }, + { + "epoch": 1.13, + "learning_rate": 1.433698534051133e-06, + "loss": 0.7197, + "step": 44068 + }, + { + "epoch": 1.13, + "learning_rate": 1.4336736012003025e-06, + "loss": 0.584, + "step": 44069 + }, + { + "epoch": 1.13, + "learning_rate": 1.4336486680174282e-06, + "loss": 0.811, + "step": 44070 + }, + { + "epoch": 1.13, + "learning_rate": 1.433623734502529e-06, + "loss": 0.583, + "step": 44071 + }, + { + "epoch": 1.13, + "learning_rate": 1.4335988006556238e-06, + "loss": 0.3262, + "step": 44072 + }, + { + "epoch": 1.13, + "learning_rate": 1.4335738664767328e-06, + "loss": 0.6445, + "step": 44073 + }, + { + "epoch": 1.13, + "learning_rate": 1.4335489319658734e-06, + "loss": 0.5625, + "step": 44074 + }, + { + "epoch": 1.13, + "learning_rate": 1.4335239971230659e-06, + "loss": 0.6206, + "step": 44075 + }, + { + "epoch": 1.13, + "learning_rate": 1.4334990619483288e-06, + "loss": 0.4939, + "step": 44076 + }, + { + "epoch": 1.13, + "learning_rate": 1.4334741264416814e-06, + "loss": 0.6514, + "step": 44077 + }, + { + "epoch": 1.13, + "learning_rate": 1.433449190603143e-06, + "loss": 0.6025, + "step": 44078 + }, + { + "epoch": 1.13, + "learning_rate": 1.4334242544327322e-06, + "loss": 0.7266, + "step": 44079 + }, + { + "epoch": 1.13, + "learning_rate": 1.4333993179304685e-06, + "loss": 0.7617, + "step": 44080 + }, + { + "epoch": 1.13, + "learning_rate": 1.433374381096371e-06, + "loss": 0.5259, + "step": 44081 + }, + { + "epoch": 1.13, + "learning_rate": 1.4333494439304583e-06, + "loss": 0.6567, + "step": 44082 + }, + { + "epoch": 1.13, + "learning_rate": 1.4333245064327503e-06, + "loss": 0.7783, + "step": 44083 + }, + { + "epoch": 1.13, + "learning_rate": 1.4332995686032654e-06, + "loss": 0.7787, + "step": 44084 + }, + { + "epoch": 1.13, + "learning_rate": 1.4332746304420229e-06, + "loss": 0.6958, + "step": 44085 + }, + { + "epoch": 1.13, + "learning_rate": 1.433249691949042e-06, + "loss": 0.7295, + "step": 44086 + }, + { + "epoch": 1.13, + "learning_rate": 1.4332247531243417e-06, + "loss": 0.7451, + "step": 44087 + }, + { + "epoch": 1.13, + "learning_rate": 1.4331998139679416e-06, + "loss": 0.5317, + "step": 44088 + }, + { + "epoch": 1.13, + "learning_rate": 1.4331748744798596e-06, + "loss": 0.5057, + "step": 44089 + }, + { + "epoch": 1.13, + "learning_rate": 1.433149934660116e-06, + "loss": 0.6514, + "step": 44090 + }, + { + "epoch": 1.13, + "learning_rate": 1.4331249945087292e-06, + "loss": 0.8447, + "step": 44091 + }, + { + "epoch": 1.13, + "learning_rate": 1.4331000540257185e-06, + "loss": 0.6553, + "step": 44092 + }, + { + "epoch": 1.13, + "learning_rate": 1.4330751132111032e-06, + "loss": 0.6987, + "step": 44093 + }, + { + "epoch": 1.13, + "learning_rate": 1.4330501720649022e-06, + "loss": 0.5635, + "step": 44094 + }, + { + "epoch": 1.13, + "learning_rate": 1.4330252305871341e-06, + "loss": 0.6123, + "step": 44095 + }, + { + "epoch": 1.13, + "learning_rate": 1.433000288777819e-06, + "loss": 0.7109, + "step": 44096 + }, + { + "epoch": 1.13, + "learning_rate": 1.4329753466369751e-06, + "loss": 0.6855, + "step": 44097 + }, + { + "epoch": 1.13, + "learning_rate": 1.4329504041646225e-06, + "loss": 0.7168, + "step": 44098 + }, + { + "epoch": 1.13, + "learning_rate": 1.4329254613607793e-06, + "loss": 0.6079, + "step": 44099 + }, + { + "epoch": 1.13, + "learning_rate": 1.432900518225465e-06, + "loss": 0.5303, + "step": 44100 + }, + { + "epoch": 1.13, + "learning_rate": 1.4328755747586984e-06, + "loss": 0.6382, + "step": 44101 + }, + { + "epoch": 1.13, + "learning_rate": 1.4328506309604993e-06, + "loss": 0.8174, + "step": 44102 + }, + { + "epoch": 1.13, + "learning_rate": 1.4328256868308862e-06, + "loss": 0.7383, + "step": 44103 + }, + { + "epoch": 1.13, + "learning_rate": 1.4328007423698783e-06, + "loss": 0.6455, + "step": 44104 + }, + { + "epoch": 1.13, + "learning_rate": 1.432775797577495e-06, + "loss": 0.8096, + "step": 44105 + }, + { + "epoch": 1.13, + "learning_rate": 1.4327508524537548e-06, + "loss": 0.8574, + "step": 44106 + }, + { + "epoch": 1.13, + "learning_rate": 1.4327259069986775e-06, + "loss": 0.7061, + "step": 44107 + }, + { + "epoch": 1.13, + "learning_rate": 1.4327009612122818e-06, + "loss": 0.709, + "step": 44108 + }, + { + "epoch": 1.13, + "learning_rate": 1.4326760150945869e-06, + "loss": 0.7979, + "step": 44109 + }, + { + "epoch": 1.13, + "learning_rate": 1.4326510686456117e-06, + "loss": 0.7607, + "step": 44110 + }, + { + "epoch": 1.13, + "learning_rate": 1.4326261218653757e-06, + "loss": 0.6523, + "step": 44111 + }, + { + "epoch": 1.13, + "learning_rate": 1.4326011747538975e-06, + "loss": 0.7422, + "step": 44112 + }, + { + "epoch": 1.13, + "learning_rate": 1.432576227311197e-06, + "loss": 0.6992, + "step": 44113 + }, + { + "epoch": 1.13, + "learning_rate": 1.432551279537292e-06, + "loss": 0.6387, + "step": 44114 + }, + { + "epoch": 1.13, + "learning_rate": 1.4325263314322032e-06, + "loss": 0.5723, + "step": 44115 + }, + { + "epoch": 1.13, + "learning_rate": 1.432501382995948e-06, + "loss": 0.6377, + "step": 44116 + }, + { + "epoch": 1.13, + "learning_rate": 1.4324764342285472e-06, + "loss": 0.6631, + "step": 44117 + }, + { + "epoch": 1.13, + "learning_rate": 1.4324514851300186e-06, + "loss": 0.7148, + "step": 44118 + }, + { + "epoch": 1.13, + "learning_rate": 1.432426535700382e-06, + "loss": 0.7998, + "step": 44119 + }, + { + "epoch": 1.13, + "learning_rate": 1.432401585939656e-06, + "loss": 0.6577, + "step": 44120 + }, + { + "epoch": 1.13, + "learning_rate": 1.4323766358478602e-06, + "loss": 0.7285, + "step": 44121 + }, + { + "epoch": 1.13, + "learning_rate": 1.4323516854250132e-06, + "loss": 0.7617, + "step": 44122 + }, + { + "epoch": 1.13, + "learning_rate": 1.432326734671135e-06, + "loss": 0.5635, + "step": 44123 + }, + { + "epoch": 1.13, + "learning_rate": 1.4323017835862436e-06, + "loss": 0.5353, + "step": 44124 + }, + { + "epoch": 1.13, + "learning_rate": 1.432276832170359e-06, + "loss": 0.7354, + "step": 44125 + }, + { + "epoch": 1.13, + "learning_rate": 1.4322518804234993e-06, + "loss": 0.627, + "step": 44126 + }, + { + "epoch": 1.13, + "learning_rate": 1.4322269283456846e-06, + "loss": 0.8125, + "step": 44127 + }, + { + "epoch": 1.13, + "learning_rate": 1.432201975936934e-06, + "loss": 0.6621, + "step": 44128 + }, + { + "epoch": 1.13, + "learning_rate": 1.4321770231972655e-06, + "loss": 0.4941, + "step": 44129 + }, + { + "epoch": 1.13, + "learning_rate": 1.4321520701266994e-06, + "loss": 0.834, + "step": 44130 + }, + { + "epoch": 1.13, + "learning_rate": 1.4321271167252537e-06, + "loss": 0.7529, + "step": 44131 + }, + { + "epoch": 1.13, + "learning_rate": 1.4321021629929488e-06, + "loss": 0.5182, + "step": 44132 + }, + { + "epoch": 1.13, + "learning_rate": 1.432077208929803e-06, + "loss": 0.6698, + "step": 44133 + }, + { + "epoch": 1.13, + "learning_rate": 1.4320522545358356e-06, + "loss": 0.793, + "step": 44134 + }, + { + "epoch": 1.13, + "learning_rate": 1.4320272998110654e-06, + "loss": 0.6748, + "step": 44135 + }, + { + "epoch": 1.13, + "learning_rate": 1.4320023447555121e-06, + "loss": 0.6738, + "step": 44136 + }, + { + "epoch": 1.13, + "learning_rate": 1.431977389369194e-06, + "loss": 0.5967, + "step": 44137 + }, + { + "epoch": 1.13, + "learning_rate": 1.4319524336521315e-06, + "loss": 0.5518, + "step": 44138 + }, + { + "epoch": 1.13, + "learning_rate": 1.431927477604342e-06, + "loss": 0.5586, + "step": 44139 + }, + { + "epoch": 1.13, + "learning_rate": 1.4319025212258458e-06, + "loss": 0.6465, + "step": 44140 + }, + { + "epoch": 1.13, + "learning_rate": 1.4318775645166617e-06, + "loss": 0.6133, + "step": 44141 + }, + { + "epoch": 1.13, + "learning_rate": 1.431852607476809e-06, + "loss": 0.6689, + "step": 44142 + }, + { + "epoch": 1.13, + "learning_rate": 1.4318276501063062e-06, + "loss": 0.6001, + "step": 44143 + }, + { + "epoch": 1.13, + "learning_rate": 1.4318026924051734e-06, + "loss": 0.5176, + "step": 44144 + }, + { + "epoch": 1.13, + "learning_rate": 1.4317777343734286e-06, + "loss": 0.6455, + "step": 44145 + }, + { + "epoch": 1.13, + "learning_rate": 1.4317527760110917e-06, + "loss": 0.6987, + "step": 44146 + }, + { + "epoch": 1.13, + "learning_rate": 1.4317278173181814e-06, + "loss": 0.6777, + "step": 44147 + }, + { + "epoch": 1.13, + "learning_rate": 1.431702858294717e-06, + "loss": 0.6479, + "step": 44148 + }, + { + "epoch": 1.13, + "learning_rate": 1.4316778989407176e-06, + "loss": 0.6328, + "step": 44149 + }, + { + "epoch": 1.13, + "learning_rate": 1.4316529392562023e-06, + "loss": 0.7148, + "step": 44150 + }, + { + "epoch": 1.13, + "learning_rate": 1.4316279792411902e-06, + "loss": 0.6675, + "step": 44151 + }, + { + "epoch": 1.13, + "learning_rate": 1.4316030188957004e-06, + "loss": 0.7754, + "step": 44152 + }, + { + "epoch": 1.13, + "learning_rate": 1.4315780582197521e-06, + "loss": 0.5217, + "step": 44153 + }, + { + "epoch": 1.13, + "learning_rate": 1.4315530972133642e-06, + "loss": 0.6138, + "step": 44154 + }, + { + "epoch": 1.13, + "learning_rate": 1.4315281358765561e-06, + "loss": 0.5688, + "step": 44155 + }, + { + "epoch": 1.13, + "learning_rate": 1.4315031742093464e-06, + "loss": 0.5968, + "step": 44156 + }, + { + "epoch": 1.13, + "learning_rate": 1.431478212211755e-06, + "loss": 0.6475, + "step": 44157 + }, + { + "epoch": 1.13, + "learning_rate": 1.4314532498838004e-06, + "loss": 0.605, + "step": 44158 + }, + { + "epoch": 1.13, + "learning_rate": 1.431428287225502e-06, + "loss": 0.5669, + "step": 44159 + }, + { + "epoch": 1.13, + "learning_rate": 1.4314033242368784e-06, + "loss": 0.7412, + "step": 44160 + }, + { + "epoch": 1.13, + "learning_rate": 1.4313783609179493e-06, + "loss": 0.5176, + "step": 44161 + }, + { + "epoch": 1.13, + "learning_rate": 1.4313533972687337e-06, + "loss": 0.7646, + "step": 44162 + }, + { + "epoch": 1.13, + "learning_rate": 1.4313284332892508e-06, + "loss": 0.9551, + "step": 44163 + }, + { + "epoch": 1.13, + "learning_rate": 1.4313034689795193e-06, + "loss": 0.697, + "step": 44164 + }, + { + "epoch": 1.13, + "learning_rate": 1.4312785043395587e-06, + "loss": 0.5043, + "step": 44165 + }, + { + "epoch": 1.13, + "learning_rate": 1.4312535393693876e-06, + "loss": 0.6445, + "step": 44166 + }, + { + "epoch": 1.13, + "learning_rate": 1.431228574069026e-06, + "loss": 0.6807, + "step": 44167 + }, + { + "epoch": 1.13, + "learning_rate": 1.4312036084384923e-06, + "loss": 0.2842, + "step": 44168 + }, + { + "epoch": 1.13, + "learning_rate": 1.4311786424778058e-06, + "loss": 0.5378, + "step": 44169 + }, + { + "epoch": 1.13, + "learning_rate": 1.4311536761869857e-06, + "loss": 0.5957, + "step": 44170 + }, + { + "epoch": 1.13, + "learning_rate": 1.4311287095660512e-06, + "loss": 0.7461, + "step": 44171 + }, + { + "epoch": 1.13, + "learning_rate": 1.4311037426150213e-06, + "loss": 0.6143, + "step": 44172 + }, + { + "epoch": 1.13, + "learning_rate": 1.4310787753339147e-06, + "loss": 0.707, + "step": 44173 + }, + { + "epoch": 1.13, + "learning_rate": 1.4310538077227512e-06, + "loss": 0.7783, + "step": 44174 + }, + { + "epoch": 1.13, + "learning_rate": 1.4310288397815493e-06, + "loss": 0.7217, + "step": 44175 + }, + { + "epoch": 1.13, + "learning_rate": 1.4310038715103288e-06, + "loss": 0.7002, + "step": 44176 + }, + { + "epoch": 1.13, + "learning_rate": 1.4309789029091085e-06, + "loss": 0.5928, + "step": 44177 + }, + { + "epoch": 1.13, + "learning_rate": 1.4309539339779072e-06, + "loss": 0.8125, + "step": 44178 + }, + { + "epoch": 1.13, + "learning_rate": 1.4309289647167442e-06, + "loss": 0.6064, + "step": 44179 + }, + { + "epoch": 1.13, + "learning_rate": 1.430903995125639e-06, + "loss": 0.5884, + "step": 44180 + }, + { + "epoch": 1.13, + "learning_rate": 1.43087902520461e-06, + "loss": 0.5439, + "step": 44181 + }, + { + "epoch": 1.13, + "learning_rate": 1.4308540549536775e-06, + "loss": 0.666, + "step": 44182 + }, + { + "epoch": 1.13, + "learning_rate": 1.4308290843728592e-06, + "loss": 0.6826, + "step": 44183 + }, + { + "epoch": 1.13, + "learning_rate": 1.4308041134621752e-06, + "loss": 0.7305, + "step": 44184 + }, + { + "epoch": 1.13, + "learning_rate": 1.430779142221644e-06, + "loss": 0.7041, + "step": 44185 + }, + { + "epoch": 1.13, + "learning_rate": 1.4307541706512854e-06, + "loss": 0.6328, + "step": 44186 + }, + { + "epoch": 1.13, + "learning_rate": 1.4307291987511179e-06, + "loss": 0.5923, + "step": 44187 + }, + { + "epoch": 1.13, + "learning_rate": 1.430704226521161e-06, + "loss": 0.6182, + "step": 44188 + }, + { + "epoch": 1.13, + "learning_rate": 1.4306792539614334e-06, + "loss": 0.6797, + "step": 44189 + }, + { + "epoch": 1.13, + "learning_rate": 1.4306542810719546e-06, + "loss": 0.7627, + "step": 44190 + }, + { + "epoch": 1.13, + "learning_rate": 1.4306293078527437e-06, + "loss": 0.499, + "step": 44191 + }, + { + "epoch": 1.13, + "learning_rate": 1.4306043343038199e-06, + "loss": 0.624, + "step": 44192 + }, + { + "epoch": 1.13, + "learning_rate": 1.4305793604252019e-06, + "loss": 0.6646, + "step": 44193 + }, + { + "epoch": 1.13, + "learning_rate": 1.4305543862169089e-06, + "loss": 0.5522, + "step": 44194 + }, + { + "epoch": 1.13, + "learning_rate": 1.4305294116789608e-06, + "loss": 0.4971, + "step": 44195 + }, + { + "epoch": 1.13, + "learning_rate": 1.4305044368113757e-06, + "loss": 0.7207, + "step": 44196 + }, + { + "epoch": 1.13, + "learning_rate": 1.4304794616141735e-06, + "loss": 0.6177, + "step": 44197 + }, + { + "epoch": 1.13, + "learning_rate": 1.4304544860873727e-06, + "loss": 0.6543, + "step": 44198 + }, + { + "epoch": 1.13, + "learning_rate": 1.4304295102309927e-06, + "loss": 0.7178, + "step": 44199 + }, + { + "epoch": 1.13, + "learning_rate": 1.4304045340450524e-06, + "loss": 0.5107, + "step": 44200 + }, + { + "epoch": 1.13, + "learning_rate": 1.4303795575295713e-06, + "loss": 0.7275, + "step": 44201 + }, + { + "epoch": 1.13, + "learning_rate": 1.4303545806845687e-06, + "loss": 0.6523, + "step": 44202 + }, + { + "epoch": 1.13, + "learning_rate": 1.4303296035100631e-06, + "loss": 0.7314, + "step": 44203 + }, + { + "epoch": 1.13, + "learning_rate": 1.4303046260060738e-06, + "loss": 0.5933, + "step": 44204 + }, + { + "epoch": 1.13, + "learning_rate": 1.4302796481726202e-06, + "loss": 0.6821, + "step": 44205 + }, + { + "epoch": 1.13, + "learning_rate": 1.4302546700097212e-06, + "loss": 0.7188, + "step": 44206 + }, + { + "epoch": 1.13, + "learning_rate": 1.4302296915173962e-06, + "loss": 0.7734, + "step": 44207 + }, + { + "epoch": 1.13, + "learning_rate": 1.4302047126956637e-06, + "loss": 0.5981, + "step": 44208 + }, + { + "epoch": 1.13, + "learning_rate": 1.4301797335445437e-06, + "loss": 0.5488, + "step": 44209 + }, + { + "epoch": 1.13, + "learning_rate": 1.4301547540640544e-06, + "loss": 0.6611, + "step": 44210 + }, + { + "epoch": 1.13, + "learning_rate": 1.4301297742542156e-06, + "loss": 0.709, + "step": 44211 + }, + { + "epoch": 1.13, + "learning_rate": 1.4301047941150465e-06, + "loss": 0.8447, + "step": 44212 + }, + { + "epoch": 1.13, + "learning_rate": 1.4300798136465653e-06, + "loss": 0.6807, + "step": 44213 + }, + { + "epoch": 1.13, + "learning_rate": 1.4300548328487922e-06, + "loss": 0.7197, + "step": 44214 + }, + { + "epoch": 1.13, + "learning_rate": 1.4300298517217458e-06, + "loss": 0.731, + "step": 44215 + }, + { + "epoch": 1.13, + "learning_rate": 1.4300048702654453e-06, + "loss": 0.7051, + "step": 44216 + }, + { + "epoch": 1.13, + "learning_rate": 1.42997988847991e-06, + "loss": 0.5603, + "step": 44217 + }, + { + "epoch": 1.13, + "learning_rate": 1.4299549063651586e-06, + "loss": 0.5225, + "step": 44218 + }, + { + "epoch": 1.13, + "learning_rate": 1.4299299239212105e-06, + "loss": 0.6768, + "step": 44219 + }, + { + "epoch": 1.13, + "learning_rate": 1.429904941148085e-06, + "loss": 0.5557, + "step": 44220 + }, + { + "epoch": 1.13, + "learning_rate": 1.4298799580458008e-06, + "loss": 0.624, + "step": 44221 + }, + { + "epoch": 1.13, + "learning_rate": 1.4298549746143778e-06, + "loss": 0.5713, + "step": 44222 + }, + { + "epoch": 1.13, + "learning_rate": 1.429829990853834e-06, + "loss": 0.7598, + "step": 44223 + }, + { + "epoch": 1.13, + "learning_rate": 1.4298050067641895e-06, + "loss": 0.6982, + "step": 44224 + }, + { + "epoch": 1.13, + "learning_rate": 1.429780022345463e-06, + "loss": 0.6621, + "step": 44225 + }, + { + "epoch": 1.13, + "learning_rate": 1.4297550375976738e-06, + "loss": 0.6108, + "step": 44226 + }, + { + "epoch": 1.13, + "learning_rate": 1.4297300525208406e-06, + "loss": 0.5669, + "step": 44227 + }, + { + "epoch": 1.13, + "learning_rate": 1.4297050671149834e-06, + "loss": 0.574, + "step": 44228 + }, + { + "epoch": 1.13, + "learning_rate": 1.4296800813801201e-06, + "loss": 0.6611, + "step": 44229 + }, + { + "epoch": 1.13, + "learning_rate": 1.4296550953162712e-06, + "loss": 0.5063, + "step": 44230 + }, + { + "epoch": 1.13, + "learning_rate": 1.4296301089234546e-06, + "loss": 0.5537, + "step": 44231 + }, + { + "epoch": 1.13, + "learning_rate": 1.4296051222016902e-06, + "loss": 0.6982, + "step": 44232 + }, + { + "epoch": 1.13, + "learning_rate": 1.429580135150997e-06, + "loss": 0.834, + "step": 44233 + }, + { + "epoch": 1.13, + "learning_rate": 1.429555147771394e-06, + "loss": 0.605, + "step": 44234 + }, + { + "epoch": 1.13, + "learning_rate": 1.4295301600629004e-06, + "loss": 0.625, + "step": 44235 + }, + { + "epoch": 1.13, + "learning_rate": 1.4295051720255352e-06, + "loss": 0.793, + "step": 44236 + }, + { + "epoch": 1.13, + "learning_rate": 1.4294801836593178e-06, + "loss": 0.6089, + "step": 44237 + }, + { + "epoch": 1.13, + "learning_rate": 1.429455194964267e-06, + "loss": 0.5757, + "step": 44238 + }, + { + "epoch": 1.13, + "learning_rate": 1.4294302059404022e-06, + "loss": 0.5209, + "step": 44239 + }, + { + "epoch": 1.13, + "learning_rate": 1.4294052165877423e-06, + "loss": 0.4795, + "step": 44240 + }, + { + "epoch": 1.13, + "learning_rate": 1.4293802269063067e-06, + "loss": 0.7451, + "step": 44241 + }, + { + "epoch": 1.13, + "learning_rate": 1.4293552368961143e-06, + "loss": 0.7881, + "step": 44242 + }, + { + "epoch": 1.13, + "learning_rate": 1.4293302465571847e-06, + "loss": 0.7373, + "step": 44243 + }, + { + "epoch": 1.13, + "learning_rate": 1.4293052558895361e-06, + "loss": 0.5981, + "step": 44244 + }, + { + "epoch": 1.13, + "learning_rate": 1.4292802648931886e-06, + "loss": 0.7222, + "step": 44245 + }, + { + "epoch": 1.13, + "learning_rate": 1.429255273568161e-06, + "loss": 0.4907, + "step": 44246 + }, + { + "epoch": 1.13, + "learning_rate": 1.429230281914472e-06, + "loss": 0.5269, + "step": 44247 + }, + { + "epoch": 1.13, + "learning_rate": 1.4292052899321414e-06, + "loss": 0.5947, + "step": 44248 + }, + { + "epoch": 1.13, + "learning_rate": 1.4291802976211881e-06, + "loss": 0.7393, + "step": 44249 + }, + { + "epoch": 1.13, + "learning_rate": 1.429155304981631e-06, + "loss": 0.7656, + "step": 44250 + }, + { + "epoch": 1.13, + "learning_rate": 1.4291303120134895e-06, + "loss": 0.6465, + "step": 44251 + }, + { + "epoch": 1.13, + "learning_rate": 1.4291053187167826e-06, + "loss": 0.7012, + "step": 44252 + }, + { + "epoch": 1.13, + "learning_rate": 1.4290803250915296e-06, + "loss": 0.5879, + "step": 44253 + }, + { + "epoch": 1.13, + "learning_rate": 1.4290553311377492e-06, + "loss": 0.7578, + "step": 44254 + }, + { + "epoch": 1.13, + "learning_rate": 1.4290303368554613e-06, + "loss": 0.6455, + "step": 44255 + }, + { + "epoch": 1.13, + "learning_rate": 1.4290053422446842e-06, + "loss": 0.6646, + "step": 44256 + }, + { + "epoch": 1.13, + "learning_rate": 1.4289803473054375e-06, + "loss": 0.6165, + "step": 44257 + }, + { + "epoch": 1.13, + "learning_rate": 1.4289553520377406e-06, + "loss": 0.4331, + "step": 44258 + }, + { + "epoch": 1.13, + "learning_rate": 1.428930356441612e-06, + "loss": 0.54, + "step": 44259 + }, + { + "epoch": 1.13, + "learning_rate": 1.4289053605170714e-06, + "loss": 0.5234, + "step": 44260 + }, + { + "epoch": 1.13, + "learning_rate": 1.4288803642641374e-06, + "loss": 0.5591, + "step": 44261 + }, + { + "epoch": 1.13, + "learning_rate": 1.4288553676828297e-06, + "loss": 0.479, + "step": 44262 + }, + { + "epoch": 1.13, + "learning_rate": 1.4288303707731668e-06, + "loss": 0.4382, + "step": 44263 + }, + { + "epoch": 1.13, + "learning_rate": 1.4288053735351686e-06, + "loss": 0.5406, + "step": 44264 + }, + { + "epoch": 1.13, + "learning_rate": 1.4287803759688535e-06, + "loss": 0.5291, + "step": 44265 + }, + { + "epoch": 1.13, + "learning_rate": 1.4287553780742415e-06, + "loss": 0.7832, + "step": 44266 + }, + { + "epoch": 1.13, + "learning_rate": 1.4287303798513507e-06, + "loss": 0.4524, + "step": 44267 + }, + { + "epoch": 1.13, + "learning_rate": 1.428705381300201e-06, + "loss": 0.8389, + "step": 44268 + }, + { + "epoch": 1.13, + "learning_rate": 1.4286803824208112e-06, + "loss": 0.4666, + "step": 44269 + }, + { + "epoch": 1.13, + "learning_rate": 1.4286553832132008e-06, + "loss": 0.627, + "step": 44270 + }, + { + "epoch": 1.13, + "learning_rate": 1.428630383677388e-06, + "loss": 0.6946, + "step": 44271 + }, + { + "epoch": 1.13, + "learning_rate": 1.4286053838133936e-06, + "loss": 0.792, + "step": 44272 + }, + { + "epoch": 1.13, + "learning_rate": 1.428580383621235e-06, + "loss": 0.5703, + "step": 44273 + }, + { + "epoch": 1.13, + "learning_rate": 1.4285553831009325e-06, + "loss": 0.5352, + "step": 44274 + }, + { + "epoch": 1.13, + "learning_rate": 1.4285303822525046e-06, + "loss": 0.6104, + "step": 44275 + }, + { + "epoch": 1.13, + "learning_rate": 1.428505381075971e-06, + "loss": 0.6709, + "step": 44276 + }, + { + "epoch": 1.13, + "learning_rate": 1.4284803795713502e-06, + "loss": 0.7056, + "step": 44277 + }, + { + "epoch": 1.13, + "learning_rate": 1.4284553777386618e-06, + "loss": 0.6367, + "step": 44278 + }, + { + "epoch": 1.13, + "learning_rate": 1.4284303755779248e-06, + "loss": 0.6094, + "step": 44279 + }, + { + "epoch": 1.13, + "learning_rate": 1.4284053730891583e-06, + "loss": 0.7402, + "step": 44280 + }, + { + "epoch": 1.13, + "learning_rate": 1.4283803702723816e-06, + "loss": 0.6523, + "step": 44281 + }, + { + "epoch": 1.13, + "learning_rate": 1.428355367127614e-06, + "loss": 0.6729, + "step": 44282 + }, + { + "epoch": 1.13, + "learning_rate": 1.428330363654874e-06, + "loss": 0.5771, + "step": 44283 + }, + { + "epoch": 1.14, + "learning_rate": 1.428305359854181e-06, + "loss": 0.8066, + "step": 44284 + }, + { + "epoch": 1.14, + "learning_rate": 1.4282803557255548e-06, + "loss": 0.5801, + "step": 44285 + }, + { + "epoch": 1.14, + "learning_rate": 1.4282553512690137e-06, + "loss": 0.6294, + "step": 44286 + }, + { + "epoch": 1.14, + "learning_rate": 1.4282303464845775e-06, + "loss": 0.644, + "step": 44287 + }, + { + "epoch": 1.14, + "learning_rate": 1.4282053413722646e-06, + "loss": 0.7744, + "step": 44288 + }, + { + "epoch": 1.14, + "learning_rate": 1.4281803359320948e-06, + "loss": 0.5835, + "step": 44289 + }, + { + "epoch": 1.14, + "learning_rate": 1.4281553301640867e-06, + "loss": 0.7656, + "step": 44290 + }, + { + "epoch": 1.14, + "learning_rate": 1.42813032406826e-06, + "loss": 0.6602, + "step": 44291 + }, + { + "epoch": 1.14, + "learning_rate": 1.4281053176446336e-06, + "loss": 0.7793, + "step": 44292 + }, + { + "epoch": 1.14, + "learning_rate": 1.4280803108932266e-06, + "loss": 0.6028, + "step": 44293 + }, + { + "epoch": 1.14, + "learning_rate": 1.4280553038140583e-06, + "loss": 0.834, + "step": 44294 + }, + { + "epoch": 1.14, + "learning_rate": 1.4280302964071475e-06, + "loss": 0.5098, + "step": 44295 + }, + { + "epoch": 1.14, + "learning_rate": 1.4280052886725137e-06, + "loss": 0.6533, + "step": 44296 + }, + { + "epoch": 1.14, + "learning_rate": 1.4279802806101762e-06, + "loss": 0.6523, + "step": 44297 + }, + { + "epoch": 1.14, + "learning_rate": 1.4279552722201535e-06, + "loss": 0.8213, + "step": 44298 + }, + { + "epoch": 1.14, + "learning_rate": 1.4279302635024656e-06, + "loss": 0.4563, + "step": 44299 + }, + { + "epoch": 1.14, + "learning_rate": 1.4279052544571305e-06, + "loss": 0.5405, + "step": 44300 + }, + { + "epoch": 1.14, + "learning_rate": 1.4278802450841685e-06, + "loss": 0.5757, + "step": 44301 + }, + { + "epoch": 1.14, + "learning_rate": 1.427855235383598e-06, + "loss": 0.6758, + "step": 44302 + }, + { + "epoch": 1.14, + "learning_rate": 1.4278302253554385e-06, + "loss": 0.4941, + "step": 44303 + }, + { + "epoch": 1.14, + "learning_rate": 1.4278052149997093e-06, + "loss": 0.4082, + "step": 44304 + }, + { + "epoch": 1.14, + "learning_rate": 1.427780204316429e-06, + "loss": 0.5508, + "step": 44305 + }, + { + "epoch": 1.14, + "learning_rate": 1.4277551933056172e-06, + "loss": 0.9014, + "step": 44306 + }, + { + "epoch": 1.14, + "learning_rate": 1.4277301819672928e-06, + "loss": 0.6611, + "step": 44307 + }, + { + "epoch": 1.14, + "learning_rate": 1.4277051703014754e-06, + "loss": 0.7183, + "step": 44308 + }, + { + "epoch": 1.14, + "learning_rate": 1.4276801583081835e-06, + "loss": 0.6128, + "step": 44309 + }, + { + "epoch": 1.14, + "learning_rate": 1.4276551459874366e-06, + "loss": 0.5083, + "step": 44310 + }, + { + "epoch": 1.14, + "learning_rate": 1.4276301333392537e-06, + "loss": 0.6167, + "step": 44311 + }, + { + "epoch": 1.14, + "learning_rate": 1.4276051203636548e-06, + "loss": 0.5935, + "step": 44312 + }, + { + "epoch": 1.14, + "learning_rate": 1.4275801070606576e-06, + "loss": 0.4456, + "step": 44313 + }, + { + "epoch": 1.14, + "learning_rate": 1.427555093430282e-06, + "loss": 0.5576, + "step": 44314 + }, + { + "epoch": 1.14, + "learning_rate": 1.4275300794725472e-06, + "loss": 0.6602, + "step": 44315 + }, + { + "epoch": 1.14, + "learning_rate": 1.4275050651874725e-06, + "loss": 0.7266, + "step": 44316 + }, + { + "epoch": 1.14, + "learning_rate": 1.4274800505750769e-06, + "loss": 0.7021, + "step": 44317 + }, + { + "epoch": 1.14, + "learning_rate": 1.4274550356353793e-06, + "loss": 0.6328, + "step": 44318 + }, + { + "epoch": 1.14, + "learning_rate": 1.4274300203683987e-06, + "loss": 0.6147, + "step": 44319 + }, + { + "epoch": 1.14, + "learning_rate": 1.4274050047741551e-06, + "loss": 0.5063, + "step": 44320 + }, + { + "epoch": 1.14, + "learning_rate": 1.4273799888526665e-06, + "loss": 0.7852, + "step": 44321 + }, + { + "epoch": 1.14, + "learning_rate": 1.4273549726039534e-06, + "loss": 0.707, + "step": 44322 + }, + { + "epoch": 1.14, + "learning_rate": 1.427329956028034e-06, + "loss": 0.8604, + "step": 44323 + }, + { + "epoch": 1.14, + "learning_rate": 1.4273049391249277e-06, + "loss": 0.6592, + "step": 44324 + }, + { + "epoch": 1.14, + "learning_rate": 1.4272799218946533e-06, + "loss": 0.6592, + "step": 44325 + }, + { + "epoch": 1.14, + "learning_rate": 1.427254904337231e-06, + "loss": 0.6279, + "step": 44326 + }, + { + "epoch": 1.14, + "learning_rate": 1.4272298864526788e-06, + "loss": 0.7197, + "step": 44327 + }, + { + "epoch": 1.14, + "learning_rate": 1.4272048682410164e-06, + "loss": 0.728, + "step": 44328 + }, + { + "epoch": 1.14, + "learning_rate": 1.4271798497022629e-06, + "loss": 0.6396, + "step": 44329 + }, + { + "epoch": 1.14, + "learning_rate": 1.4271548308364373e-06, + "loss": 0.603, + "step": 44330 + }, + { + "epoch": 1.14, + "learning_rate": 1.427129811643559e-06, + "loss": 0.6145, + "step": 44331 + }, + { + "epoch": 1.14, + "learning_rate": 1.4271047921236472e-06, + "loss": 0.3169, + "step": 44332 + }, + { + "epoch": 1.14, + "learning_rate": 1.4270797722767208e-06, + "loss": 0.749, + "step": 44333 + }, + { + "epoch": 1.14, + "learning_rate": 1.427054752102799e-06, + "loss": 0.6484, + "step": 44334 + }, + { + "epoch": 1.14, + "learning_rate": 1.427029731601901e-06, + "loss": 0.7871, + "step": 44335 + }, + { + "epoch": 1.14, + "learning_rate": 1.427004710774046e-06, + "loss": 0.4808, + "step": 44336 + }, + { + "epoch": 1.14, + "learning_rate": 1.4269796896192533e-06, + "loss": 0.7134, + "step": 44337 + }, + { + "epoch": 1.14, + "learning_rate": 1.4269546681375416e-06, + "loss": 0.6797, + "step": 44338 + }, + { + "epoch": 1.14, + "learning_rate": 1.4269296463289304e-06, + "loss": 0.4907, + "step": 44339 + }, + { + "epoch": 1.14, + "learning_rate": 1.426904624193439e-06, + "loss": 0.7153, + "step": 44340 + }, + { + "epoch": 1.14, + "learning_rate": 1.426879601731086e-06, + "loss": 0.6611, + "step": 44341 + }, + { + "epoch": 1.14, + "learning_rate": 1.4268545789418914e-06, + "loss": 0.6855, + "step": 44342 + }, + { + "epoch": 1.14, + "learning_rate": 1.4268295558258734e-06, + "loss": 0.8154, + "step": 44343 + }, + { + "epoch": 1.14, + "learning_rate": 1.4268045323830518e-06, + "loss": 0.7305, + "step": 44344 + }, + { + "epoch": 1.14, + "learning_rate": 1.4267795086134459e-06, + "loss": 0.7969, + "step": 44345 + }, + { + "epoch": 1.14, + "learning_rate": 1.4267544845170741e-06, + "loss": 0.8291, + "step": 44346 + }, + { + "epoch": 1.14, + "learning_rate": 1.426729460093956e-06, + "loss": 0.8408, + "step": 44347 + }, + { + "epoch": 1.14, + "learning_rate": 1.426704435344111e-06, + "loss": 0.7334, + "step": 44348 + }, + { + "epoch": 1.14, + "learning_rate": 1.4266794102675581e-06, + "loss": 0.606, + "step": 44349 + }, + { + "epoch": 1.14, + "learning_rate": 1.4266543848643164e-06, + "loss": 0.6943, + "step": 44350 + }, + { + "epoch": 1.14, + "learning_rate": 1.426629359134405e-06, + "loss": 0.626, + "step": 44351 + }, + { + "epoch": 1.14, + "learning_rate": 1.4266043330778431e-06, + "loss": 0.7139, + "step": 44352 + }, + { + "epoch": 1.14, + "learning_rate": 1.4265793066946497e-06, + "loss": 0.5408, + "step": 44353 + }, + { + "epoch": 1.14, + "learning_rate": 1.4265542799848444e-06, + "loss": 0.6455, + "step": 44354 + }, + { + "epoch": 1.14, + "learning_rate": 1.426529252948446e-06, + "loss": 0.5405, + "step": 44355 + }, + { + "epoch": 1.14, + "learning_rate": 1.4265042255854738e-06, + "loss": 0.5854, + "step": 44356 + }, + { + "epoch": 1.14, + "learning_rate": 1.4264791978959468e-06, + "loss": 0.509, + "step": 44357 + }, + { + "epoch": 1.14, + "learning_rate": 1.4264541698798844e-06, + "loss": 0.6328, + "step": 44358 + }, + { + "epoch": 1.14, + "learning_rate": 1.4264291415373056e-06, + "loss": 0.5903, + "step": 44359 + }, + { + "epoch": 1.14, + "learning_rate": 1.4264041128682296e-06, + "loss": 0.5137, + "step": 44360 + }, + { + "epoch": 1.14, + "learning_rate": 1.4263790838726754e-06, + "loss": 0.709, + "step": 44361 + }, + { + "epoch": 1.14, + "learning_rate": 1.426354054550663e-06, + "loss": 0.7246, + "step": 44362 + }, + { + "epoch": 1.14, + "learning_rate": 1.4263290249022104e-06, + "loss": 0.6616, + "step": 44363 + }, + { + "epoch": 1.14, + "learning_rate": 1.4263039949273373e-06, + "loss": 0.7065, + "step": 44364 + }, + { + "epoch": 1.14, + "learning_rate": 1.4262789646260627e-06, + "loss": 0.4616, + "step": 44365 + }, + { + "epoch": 1.14, + "learning_rate": 1.426253933998406e-06, + "loss": 0.7568, + "step": 44366 + }, + { + "epoch": 1.14, + "learning_rate": 1.4262289030443866e-06, + "loss": 0.7295, + "step": 44367 + }, + { + "epoch": 1.14, + "learning_rate": 1.426203871764023e-06, + "loss": 0.4946, + "step": 44368 + }, + { + "epoch": 1.14, + "learning_rate": 1.4261788401573348e-06, + "loss": 0.6875, + "step": 44369 + }, + { + "epoch": 1.14, + "learning_rate": 1.4261538082243409e-06, + "loss": 0.6367, + "step": 44370 + }, + { + "epoch": 1.14, + "learning_rate": 1.4261287759650607e-06, + "loss": 0.6006, + "step": 44371 + }, + { + "epoch": 1.14, + "learning_rate": 1.4261037433795132e-06, + "loss": 0.5771, + "step": 44372 + }, + { + "epoch": 1.14, + "learning_rate": 1.4260787104677179e-06, + "loss": 0.449, + "step": 44373 + }, + { + "epoch": 1.14, + "learning_rate": 1.4260536772296935e-06, + "loss": 0.7656, + "step": 44374 + }, + { + "epoch": 1.14, + "learning_rate": 1.4260286436654596e-06, + "loss": 0.6729, + "step": 44375 + }, + { + "epoch": 1.14, + "learning_rate": 1.426003609775035e-06, + "loss": 0.6484, + "step": 44376 + }, + { + "epoch": 1.14, + "learning_rate": 1.4259785755584392e-06, + "loss": 0.5574, + "step": 44377 + }, + { + "epoch": 1.14, + "learning_rate": 1.4259535410156908e-06, + "loss": 0.7373, + "step": 44378 + }, + { + "epoch": 1.14, + "learning_rate": 1.42592850614681e-06, + "loss": 0.8604, + "step": 44379 + }, + { + "epoch": 1.14, + "learning_rate": 1.4259034709518146e-06, + "loss": 0.7627, + "step": 44380 + }, + { + "epoch": 1.14, + "learning_rate": 1.425878435430725e-06, + "loss": 0.751, + "step": 44381 + }, + { + "epoch": 1.14, + "learning_rate": 1.4258533995835596e-06, + "loss": 0.707, + "step": 44382 + }, + { + "epoch": 1.14, + "learning_rate": 1.4258283634103382e-06, + "loss": 0.5405, + "step": 44383 + }, + { + "epoch": 1.14, + "learning_rate": 1.4258033269110792e-06, + "loss": 0.6279, + "step": 44384 + }, + { + "epoch": 1.14, + "learning_rate": 1.425778290085802e-06, + "loss": 0.4811, + "step": 44385 + }, + { + "epoch": 1.14, + "learning_rate": 1.4257532529345264e-06, + "loss": 0.7725, + "step": 44386 + }, + { + "epoch": 1.14, + "learning_rate": 1.425728215457271e-06, + "loss": 0.7432, + "step": 44387 + }, + { + "epoch": 1.14, + "learning_rate": 1.425703177654055e-06, + "loss": 0.6035, + "step": 44388 + }, + { + "epoch": 1.14, + "learning_rate": 1.4256781395248978e-06, + "loss": 0.8525, + "step": 44389 + }, + { + "epoch": 1.14, + "learning_rate": 1.4256531010698184e-06, + "loss": 0.5005, + "step": 44390 + }, + { + "epoch": 1.14, + "learning_rate": 1.425628062288836e-06, + "loss": 0.6436, + "step": 44391 + }, + { + "epoch": 1.14, + "learning_rate": 1.4256030231819696e-06, + "loss": 0.7959, + "step": 44392 + }, + { + "epoch": 1.14, + "learning_rate": 1.4255779837492386e-06, + "loss": 0.7383, + "step": 44393 + }, + { + "epoch": 1.14, + "learning_rate": 1.4255529439906622e-06, + "loss": 0.6914, + "step": 44394 + }, + { + "epoch": 1.14, + "learning_rate": 1.425527903906259e-06, + "loss": 0.5504, + "step": 44395 + }, + { + "epoch": 1.14, + "learning_rate": 1.425502863496049e-06, + "loss": 0.5854, + "step": 44396 + }, + { + "epoch": 1.14, + "learning_rate": 1.4254778227600515e-06, + "loss": 0.6582, + "step": 44397 + }, + { + "epoch": 1.14, + "learning_rate": 1.4254527816982847e-06, + "loss": 0.6875, + "step": 44398 + }, + { + "epoch": 1.14, + "learning_rate": 1.4254277403107681e-06, + "loss": 0.5049, + "step": 44399 + }, + { + "epoch": 1.14, + "learning_rate": 1.4254026985975214e-06, + "loss": 0.7227, + "step": 44400 + }, + { + "epoch": 1.14, + "learning_rate": 1.4253776565585632e-06, + "loss": 0.5518, + "step": 44401 + }, + { + "epoch": 1.14, + "learning_rate": 1.4253526141939132e-06, + "loss": 0.5903, + "step": 44402 + }, + { + "epoch": 1.14, + "learning_rate": 1.42532757150359e-06, + "loss": 0.468, + "step": 44403 + }, + { + "epoch": 1.14, + "learning_rate": 1.425302528487613e-06, + "loss": 0.4937, + "step": 44404 + }, + { + "epoch": 1.14, + "learning_rate": 1.4252774851460015e-06, + "loss": 0.5916, + "step": 44405 + }, + { + "epoch": 1.14, + "learning_rate": 1.4252524414787745e-06, + "loss": 0.7202, + "step": 44406 + }, + { + "epoch": 1.14, + "learning_rate": 1.4252273974859514e-06, + "loss": 0.7451, + "step": 44407 + }, + { + "epoch": 1.14, + "learning_rate": 1.4252023531675513e-06, + "loss": 0.666, + "step": 44408 + }, + { + "epoch": 1.14, + "learning_rate": 1.425177308523593e-06, + "loss": 0.6367, + "step": 44409 + }, + { + "epoch": 1.14, + "learning_rate": 1.4251522635540962e-06, + "loss": 0.7295, + "step": 44410 + }, + { + "epoch": 1.14, + "learning_rate": 1.4251272182590796e-06, + "loss": 0.5283, + "step": 44411 + }, + { + "epoch": 1.14, + "learning_rate": 1.425102172638563e-06, + "loss": 0.4761, + "step": 44412 + }, + { + "epoch": 1.14, + "learning_rate": 1.4250771266925652e-06, + "loss": 0.6443, + "step": 44413 + }, + { + "epoch": 1.14, + "learning_rate": 1.4250520804211053e-06, + "loss": 0.7588, + "step": 44414 + }, + { + "epoch": 1.14, + "learning_rate": 1.4250270338242023e-06, + "loss": 0.6826, + "step": 44415 + }, + { + "epoch": 1.14, + "learning_rate": 1.425001986901876e-06, + "loss": 0.6943, + "step": 44416 + }, + { + "epoch": 1.14, + "learning_rate": 1.4249769396541451e-06, + "loss": 0.7827, + "step": 44417 + }, + { + "epoch": 1.14, + "learning_rate": 1.4249518920810285e-06, + "loss": 0.9541, + "step": 44418 + }, + { + "epoch": 1.14, + "learning_rate": 1.4249268441825465e-06, + "loss": 0.5547, + "step": 44419 + }, + { + "epoch": 1.14, + "learning_rate": 1.4249017959587172e-06, + "loss": 0.7129, + "step": 44420 + }, + { + "epoch": 1.14, + "learning_rate": 1.42487674740956e-06, + "loss": 0.4912, + "step": 44421 + }, + { + "epoch": 1.14, + "learning_rate": 1.4248516985350945e-06, + "loss": 0.6284, + "step": 44422 + }, + { + "epoch": 1.14, + "learning_rate": 1.4248266493353396e-06, + "loss": 0.6611, + "step": 44423 + }, + { + "epoch": 1.14, + "learning_rate": 1.424801599810314e-06, + "loss": 0.5986, + "step": 44424 + }, + { + "epoch": 1.14, + "learning_rate": 1.4247765499600378e-06, + "loss": 0.7285, + "step": 44425 + }, + { + "epoch": 1.14, + "learning_rate": 1.4247514997845294e-06, + "loss": 0.6416, + "step": 44426 + }, + { + "epoch": 1.14, + "learning_rate": 1.4247264492838088e-06, + "loss": 0.6816, + "step": 44427 + }, + { + "epoch": 1.14, + "learning_rate": 1.4247013984578942e-06, + "loss": 0.7793, + "step": 44428 + }, + { + "epoch": 1.14, + "learning_rate": 1.4246763473068055e-06, + "loss": 0.6934, + "step": 44429 + }, + { + "epoch": 1.14, + "learning_rate": 1.4246512958305615e-06, + "loss": 0.6348, + "step": 44430 + }, + { + "epoch": 1.14, + "learning_rate": 1.4246262440291816e-06, + "loss": 0.7109, + "step": 44431 + }, + { + "epoch": 1.14, + "learning_rate": 1.424601191902685e-06, + "loss": 0.7578, + "step": 44432 + }, + { + "epoch": 1.14, + "learning_rate": 1.4245761394510908e-06, + "loss": 0.75, + "step": 44433 + }, + { + "epoch": 1.14, + "learning_rate": 1.424551086674418e-06, + "loss": 0.5503, + "step": 44434 + }, + { + "epoch": 1.14, + "learning_rate": 1.4245260335726861e-06, + "loss": 0.6016, + "step": 44435 + }, + { + "epoch": 1.14, + "learning_rate": 1.424500980145914e-06, + "loss": 0.4985, + "step": 44436 + }, + { + "epoch": 1.14, + "learning_rate": 1.424475926394121e-06, + "loss": 0.5508, + "step": 44437 + }, + { + "epoch": 1.14, + "learning_rate": 1.4244508723173267e-06, + "loss": 0.6689, + "step": 44438 + }, + { + "epoch": 1.14, + "learning_rate": 1.4244258179155495e-06, + "loss": 0.5837, + "step": 44439 + }, + { + "epoch": 1.14, + "learning_rate": 1.4244007631888091e-06, + "loss": 0.6958, + "step": 44440 + }, + { + "epoch": 1.14, + "learning_rate": 1.4243757081371245e-06, + "loss": 0.6274, + "step": 44441 + }, + { + "epoch": 1.14, + "learning_rate": 1.4243506527605149e-06, + "loss": 0.5225, + "step": 44442 + }, + { + "epoch": 1.14, + "learning_rate": 1.4243255970589995e-06, + "loss": 0.624, + "step": 44443 + }, + { + "epoch": 1.14, + "learning_rate": 1.4243005410325977e-06, + "loss": 0.4739, + "step": 44444 + }, + { + "epoch": 1.14, + "learning_rate": 1.4242754846813282e-06, + "loss": 0.6191, + "step": 44445 + }, + { + "epoch": 1.14, + "learning_rate": 1.4242504280052108e-06, + "loss": 0.6353, + "step": 44446 + }, + { + "epoch": 1.14, + "learning_rate": 1.4242253710042643e-06, + "loss": 0.4824, + "step": 44447 + }, + { + "epoch": 1.14, + "learning_rate": 1.4242003136785077e-06, + "loss": 0.709, + "step": 44448 + }, + { + "epoch": 1.14, + "learning_rate": 1.4241752560279604e-06, + "loss": 0.6777, + "step": 44449 + }, + { + "epoch": 1.14, + "learning_rate": 1.4241501980526419e-06, + "loss": 0.7051, + "step": 44450 + }, + { + "epoch": 1.14, + "learning_rate": 1.4241251397525709e-06, + "loss": 0.5513, + "step": 44451 + }, + { + "epoch": 1.14, + "learning_rate": 1.424100081127767e-06, + "loss": 0.5205, + "step": 44452 + }, + { + "epoch": 1.14, + "learning_rate": 1.4240750221782486e-06, + "loss": 0.6855, + "step": 44453 + }, + { + "epoch": 1.14, + "learning_rate": 1.4240499629040362e-06, + "loss": 0.6807, + "step": 44454 + }, + { + "epoch": 1.14, + "learning_rate": 1.4240249033051477e-06, + "loss": 0.7163, + "step": 44455 + }, + { + "epoch": 1.14, + "learning_rate": 1.423999843381603e-06, + "loss": 0.7754, + "step": 44456 + }, + { + "epoch": 1.14, + "learning_rate": 1.4239747831334212e-06, + "loss": 0.6152, + "step": 44457 + }, + { + "epoch": 1.14, + "learning_rate": 1.4239497225606214e-06, + "loss": 0.6543, + "step": 44458 + }, + { + "epoch": 1.14, + "learning_rate": 1.4239246616632228e-06, + "loss": 0.6235, + "step": 44459 + }, + { + "epoch": 1.14, + "learning_rate": 1.4238996004412445e-06, + "loss": 0.7246, + "step": 44460 + }, + { + "epoch": 1.14, + "learning_rate": 1.4238745388947054e-06, + "loss": 0.6924, + "step": 44461 + }, + { + "epoch": 1.14, + "learning_rate": 1.4238494770236255e-06, + "loss": 0.7148, + "step": 44462 + }, + { + "epoch": 1.14, + "learning_rate": 1.4238244148280237e-06, + "loss": 0.584, + "step": 44463 + }, + { + "epoch": 1.14, + "learning_rate": 1.4237993523079185e-06, + "loss": 0.748, + "step": 44464 + }, + { + "epoch": 1.14, + "learning_rate": 1.4237742894633302e-06, + "loss": 0.4231, + "step": 44465 + }, + { + "epoch": 1.14, + "learning_rate": 1.4237492262942771e-06, + "loss": 0.6357, + "step": 44466 + }, + { + "epoch": 1.14, + "learning_rate": 1.423724162800779e-06, + "loss": 0.5603, + "step": 44467 + }, + { + "epoch": 1.14, + "learning_rate": 1.4236990989828544e-06, + "loss": 0.7598, + "step": 44468 + }, + { + "epoch": 1.14, + "learning_rate": 1.423674034840523e-06, + "loss": 0.7832, + "step": 44469 + }, + { + "epoch": 1.14, + "learning_rate": 1.4236489703738039e-06, + "loss": 0.7998, + "step": 44470 + }, + { + "epoch": 1.14, + "learning_rate": 1.4236239055827163e-06, + "loss": 0.6465, + "step": 44471 + }, + { + "epoch": 1.14, + "learning_rate": 1.4235988404672793e-06, + "loss": 0.7637, + "step": 44472 + }, + { + "epoch": 1.14, + "learning_rate": 1.4235737750275123e-06, + "loss": 0.6569, + "step": 44473 + }, + { + "epoch": 1.14, + "learning_rate": 1.423548709263434e-06, + "loss": 0.6396, + "step": 44474 + }, + { + "epoch": 1.14, + "learning_rate": 1.423523643175064e-06, + "loss": 0.7305, + "step": 44475 + }, + { + "epoch": 1.14, + "learning_rate": 1.4234985767624217e-06, + "loss": 0.5957, + "step": 44476 + }, + { + "epoch": 1.14, + "learning_rate": 1.423473510025526e-06, + "loss": 0.79, + "step": 44477 + }, + { + "epoch": 1.14, + "learning_rate": 1.4234484429643959e-06, + "loss": 0.4849, + "step": 44478 + }, + { + "epoch": 1.14, + "learning_rate": 1.423423375579051e-06, + "loss": 0.7661, + "step": 44479 + }, + { + "epoch": 1.14, + "learning_rate": 1.42339830786951e-06, + "loss": 0.8301, + "step": 44480 + }, + { + "epoch": 1.14, + "learning_rate": 1.4233732398357924e-06, + "loss": 0.4739, + "step": 44481 + }, + { + "epoch": 1.14, + "learning_rate": 1.4233481714779177e-06, + "loss": 0.6763, + "step": 44482 + }, + { + "epoch": 1.14, + "learning_rate": 1.4233231027959045e-06, + "loss": 0.5913, + "step": 44483 + }, + { + "epoch": 1.14, + "learning_rate": 1.4232980337897724e-06, + "loss": 0.6191, + "step": 44484 + }, + { + "epoch": 1.14, + "learning_rate": 1.4232729644595403e-06, + "loss": 0.7607, + "step": 44485 + }, + { + "epoch": 1.14, + "learning_rate": 1.4232478948052277e-06, + "loss": 0.7183, + "step": 44486 + }, + { + "epoch": 1.14, + "learning_rate": 1.4232228248268536e-06, + "loss": 0.7529, + "step": 44487 + }, + { + "epoch": 1.14, + "learning_rate": 1.4231977545244374e-06, + "loss": 0.6904, + "step": 44488 + }, + { + "epoch": 1.14, + "learning_rate": 1.4231726838979978e-06, + "loss": 0.5615, + "step": 44489 + }, + { + "epoch": 1.14, + "learning_rate": 1.4231476129475547e-06, + "loss": 0.5455, + "step": 44490 + }, + { + "epoch": 1.14, + "learning_rate": 1.4231225416731268e-06, + "loss": 0.374, + "step": 44491 + }, + { + "epoch": 1.14, + "learning_rate": 1.4230974700747334e-06, + "loss": 0.7588, + "step": 44492 + }, + { + "epoch": 1.14, + "learning_rate": 1.4230723981523935e-06, + "loss": 0.5371, + "step": 44493 + }, + { + "epoch": 1.14, + "learning_rate": 1.4230473259061268e-06, + "loss": 0.79, + "step": 44494 + }, + { + "epoch": 1.14, + "learning_rate": 1.4230222533359522e-06, + "loss": 0.7871, + "step": 44495 + }, + { + "epoch": 1.14, + "learning_rate": 1.422997180441889e-06, + "loss": 0.5591, + "step": 44496 + }, + { + "epoch": 1.14, + "learning_rate": 1.422972107223956e-06, + "loss": 0.6074, + "step": 44497 + }, + { + "epoch": 1.14, + "learning_rate": 1.422947033682173e-06, + "loss": 0.6777, + "step": 44498 + }, + { + "epoch": 1.14, + "learning_rate": 1.4229219598165585e-06, + "loss": 0.6426, + "step": 44499 + }, + { + "epoch": 1.14, + "learning_rate": 1.4228968856271324e-06, + "loss": 0.749, + "step": 44500 + }, + { + "epoch": 1.14, + "learning_rate": 1.4228718111139137e-06, + "loss": 0.6953, + "step": 44501 + }, + { + "epoch": 1.14, + "learning_rate": 1.4228467362769212e-06, + "loss": 0.52, + "step": 44502 + }, + { + "epoch": 1.14, + "learning_rate": 1.4228216611161745e-06, + "loss": 0.6134, + "step": 44503 + }, + { + "epoch": 1.14, + "learning_rate": 1.422796585631693e-06, + "loss": 0.7144, + "step": 44504 + }, + { + "epoch": 1.14, + "learning_rate": 1.4227715098234952e-06, + "loss": 0.7822, + "step": 44505 + }, + { + "epoch": 1.14, + "learning_rate": 1.4227464336916008e-06, + "loss": 0.4243, + "step": 44506 + }, + { + "epoch": 1.14, + "learning_rate": 1.4227213572360294e-06, + "loss": 0.6592, + "step": 44507 + }, + { + "epoch": 1.14, + "learning_rate": 1.4226962804567987e-06, + "loss": 0.5779, + "step": 44508 + }, + { + "epoch": 1.14, + "learning_rate": 1.4226712033539297e-06, + "loss": 0.5117, + "step": 44509 + }, + { + "epoch": 1.14, + "learning_rate": 1.4226461259274402e-06, + "loss": 0.751, + "step": 44510 + }, + { + "epoch": 1.14, + "learning_rate": 1.4226210481773508e-06, + "loss": 0.6104, + "step": 44511 + }, + { + "epoch": 1.14, + "learning_rate": 1.422595970103679e-06, + "loss": 0.6714, + "step": 44512 + }, + { + "epoch": 1.14, + "learning_rate": 1.4225708917064457e-06, + "loss": 0.5098, + "step": 44513 + }, + { + "epoch": 1.14, + "learning_rate": 1.4225458129856686e-06, + "loss": 0.627, + "step": 44514 + }, + { + "epoch": 1.14, + "learning_rate": 1.4225207339413681e-06, + "loss": 0.7393, + "step": 44515 + }, + { + "epoch": 1.14, + "learning_rate": 1.4224956545735627e-06, + "loss": 0.542, + "step": 44516 + }, + { + "epoch": 1.14, + "learning_rate": 1.4224705748822718e-06, + "loss": 0.748, + "step": 44517 + }, + { + "epoch": 1.14, + "learning_rate": 1.4224454948675146e-06, + "loss": 0.6504, + "step": 44518 + }, + { + "epoch": 1.14, + "learning_rate": 1.4224204145293103e-06, + "loss": 0.646, + "step": 44519 + }, + { + "epoch": 1.14, + "learning_rate": 1.4223953338676781e-06, + "loss": 0.7959, + "step": 44520 + }, + { + "epoch": 1.14, + "learning_rate": 1.4223702528826376e-06, + "loss": 0.7617, + "step": 44521 + }, + { + "epoch": 1.14, + "learning_rate": 1.4223451715742072e-06, + "loss": 0.5753, + "step": 44522 + }, + { + "epoch": 1.14, + "learning_rate": 1.4223200899424066e-06, + "loss": 0.5669, + "step": 44523 + }, + { + "epoch": 1.14, + "learning_rate": 1.422295007987255e-06, + "loss": 0.8174, + "step": 44524 + }, + { + "epoch": 1.14, + "learning_rate": 1.4222699257087713e-06, + "loss": 0.7314, + "step": 44525 + }, + { + "epoch": 1.14, + "learning_rate": 1.422244843106975e-06, + "loss": 0.5649, + "step": 44526 + }, + { + "epoch": 1.14, + "learning_rate": 1.4222197601818853e-06, + "loss": 0.5718, + "step": 44527 + }, + { + "epoch": 1.14, + "learning_rate": 1.4221946769335214e-06, + "loss": 0.8105, + "step": 44528 + }, + { + "epoch": 1.14, + "learning_rate": 1.4221695933619025e-06, + "loss": 0.7471, + "step": 44529 + }, + { + "epoch": 1.14, + "learning_rate": 1.4221445094670477e-06, + "loss": 0.7061, + "step": 44530 + }, + { + "epoch": 1.14, + "learning_rate": 1.4221194252489764e-06, + "loss": 0.6924, + "step": 44531 + }, + { + "epoch": 1.14, + "learning_rate": 1.4220943407077074e-06, + "loss": 0.6885, + "step": 44532 + }, + { + "epoch": 1.14, + "learning_rate": 1.4220692558432601e-06, + "loss": 0.6099, + "step": 44533 + }, + { + "epoch": 1.14, + "learning_rate": 1.4220441706556541e-06, + "loss": 0.7246, + "step": 44534 + }, + { + "epoch": 1.14, + "learning_rate": 1.4220190851449078e-06, + "loss": 0.6162, + "step": 44535 + }, + { + "epoch": 1.14, + "learning_rate": 1.4219939993110418e-06, + "loss": 0.7402, + "step": 44536 + }, + { + "epoch": 1.14, + "learning_rate": 1.4219689131540735e-06, + "loss": 0.6587, + "step": 44537 + }, + { + "epoch": 1.14, + "learning_rate": 1.4219438266740236e-06, + "loss": 0.5862, + "step": 44538 + }, + { + "epoch": 1.14, + "learning_rate": 1.42191873987091e-06, + "loss": 0.6865, + "step": 44539 + }, + { + "epoch": 1.14, + "learning_rate": 1.4218936527447534e-06, + "loss": 0.5752, + "step": 44540 + }, + { + "epoch": 1.14, + "learning_rate": 1.421868565295572e-06, + "loss": 0.7109, + "step": 44541 + }, + { + "epoch": 1.14, + "learning_rate": 1.4218434775233852e-06, + "loss": 0.7812, + "step": 44542 + }, + { + "epoch": 1.14, + "learning_rate": 1.4218183894282118e-06, + "loss": 0.5386, + "step": 44543 + }, + { + "epoch": 1.14, + "learning_rate": 1.421793301010072e-06, + "loss": 0.6191, + "step": 44544 + }, + { + "epoch": 1.14, + "learning_rate": 1.4217682122689842e-06, + "loss": 0.6636, + "step": 44545 + }, + { + "epoch": 1.14, + "learning_rate": 1.4217431232049681e-06, + "loss": 0.6533, + "step": 44546 + }, + { + "epoch": 1.14, + "learning_rate": 1.4217180338180426e-06, + "loss": 0.665, + "step": 44547 + }, + { + "epoch": 1.14, + "learning_rate": 1.4216929441082268e-06, + "loss": 0.6143, + "step": 44548 + }, + { + "epoch": 1.14, + "learning_rate": 1.4216678540755402e-06, + "loss": 0.3352, + "step": 44549 + }, + { + "epoch": 1.14, + "learning_rate": 1.4216427637200022e-06, + "loss": 0.5474, + "step": 44550 + }, + { + "epoch": 1.14, + "learning_rate": 1.4216176730416316e-06, + "loss": 0.7061, + "step": 44551 + }, + { + "epoch": 1.14, + "learning_rate": 1.4215925820404474e-06, + "loss": 0.6836, + "step": 44552 + }, + { + "epoch": 1.14, + "learning_rate": 1.4215674907164695e-06, + "loss": 0.6787, + "step": 44553 + }, + { + "epoch": 1.14, + "learning_rate": 1.4215423990697163e-06, + "loss": 0.4646, + "step": 44554 + }, + { + "epoch": 1.14, + "learning_rate": 1.421517307100208e-06, + "loss": 0.667, + "step": 44555 + }, + { + "epoch": 1.14, + "learning_rate": 1.4214922148079631e-06, + "loss": 0.6191, + "step": 44556 + }, + { + "epoch": 1.14, + "learning_rate": 1.421467122193001e-06, + "loss": 0.5786, + "step": 44557 + }, + { + "epoch": 1.14, + "learning_rate": 1.4214420292553406e-06, + "loss": 0.5615, + "step": 44558 + }, + { + "epoch": 1.14, + "learning_rate": 1.421416935995002e-06, + "loss": 0.6362, + "step": 44559 + }, + { + "epoch": 1.14, + "learning_rate": 1.4213918424120033e-06, + "loss": 0.6152, + "step": 44560 + }, + { + "epoch": 1.14, + "learning_rate": 1.4213667485063647e-06, + "loss": 0.7095, + "step": 44561 + }, + { + "epoch": 1.14, + "learning_rate": 1.4213416542781044e-06, + "loss": 0.7021, + "step": 44562 + }, + { + "epoch": 1.14, + "learning_rate": 1.4213165597272427e-06, + "loss": 0.5376, + "step": 44563 + }, + { + "epoch": 1.14, + "learning_rate": 1.421291464853798e-06, + "loss": 0.6279, + "step": 44564 + }, + { + "epoch": 1.14, + "learning_rate": 1.4212663696577898e-06, + "loss": 0.5603, + "step": 44565 + }, + { + "epoch": 1.14, + "learning_rate": 1.4212412741392377e-06, + "loss": 0.7402, + "step": 44566 + }, + { + "epoch": 1.14, + "learning_rate": 1.42121617829816e-06, + "loss": 0.6265, + "step": 44567 + }, + { + "epoch": 1.14, + "learning_rate": 1.4211910821345767e-06, + "loss": 0.6445, + "step": 44568 + }, + { + "epoch": 1.14, + "learning_rate": 1.4211659856485066e-06, + "loss": 0.8271, + "step": 44569 + }, + { + "epoch": 1.14, + "learning_rate": 1.421140888839969e-06, + "loss": 0.4941, + "step": 44570 + }, + { + "epoch": 1.14, + "learning_rate": 1.4211157917089836e-06, + "loss": 0.8398, + "step": 44571 + }, + { + "epoch": 1.14, + "learning_rate": 1.4210906942555689e-06, + "loss": 0.6562, + "step": 44572 + }, + { + "epoch": 1.14, + "learning_rate": 1.4210655964797442e-06, + "loss": 0.7424, + "step": 44573 + }, + { + "epoch": 1.14, + "learning_rate": 1.4210404983815295e-06, + "loss": 0.5317, + "step": 44574 + }, + { + "epoch": 1.14, + "learning_rate": 1.4210153999609429e-06, + "loss": 0.5747, + "step": 44575 + }, + { + "epoch": 1.14, + "learning_rate": 1.4209903012180046e-06, + "loss": 0.6748, + "step": 44576 + }, + { + "epoch": 1.14, + "learning_rate": 1.4209652021527332e-06, + "loss": 0.6035, + "step": 44577 + }, + { + "epoch": 1.14, + "learning_rate": 1.4209401027651482e-06, + "loss": 0.5112, + "step": 44578 + }, + { + "epoch": 1.14, + "learning_rate": 1.4209150030552684e-06, + "loss": 0.5354, + "step": 44579 + }, + { + "epoch": 1.14, + "learning_rate": 1.4208899030231135e-06, + "loss": 0.5981, + "step": 44580 + }, + { + "epoch": 1.14, + "learning_rate": 1.420864802668703e-06, + "loss": 0.7578, + "step": 44581 + }, + { + "epoch": 1.14, + "learning_rate": 1.4208397019920553e-06, + "loss": 0.5298, + "step": 44582 + }, + { + "epoch": 1.14, + "learning_rate": 1.4208146009931898e-06, + "loss": 0.5747, + "step": 44583 + }, + { + "epoch": 1.14, + "learning_rate": 1.420789499672126e-06, + "loss": 0.5809, + "step": 44584 + }, + { + "epoch": 1.14, + "learning_rate": 1.420764398028883e-06, + "loss": 0.7148, + "step": 44585 + }, + { + "epoch": 1.14, + "learning_rate": 1.4207392960634805e-06, + "loss": 0.5696, + "step": 44586 + }, + { + "epoch": 1.14, + "learning_rate": 1.4207141937759367e-06, + "loss": 0.5629, + "step": 44587 + }, + { + "epoch": 1.14, + "learning_rate": 1.4206890911662719e-06, + "loss": 0.7031, + "step": 44588 + }, + { + "epoch": 1.14, + "learning_rate": 1.4206639882345045e-06, + "loss": 0.5737, + "step": 44589 + }, + { + "epoch": 1.14, + "learning_rate": 1.420638884980654e-06, + "loss": 0.6147, + "step": 44590 + }, + { + "epoch": 1.14, + "learning_rate": 1.4206137814047396e-06, + "loss": 0.5303, + "step": 44591 + }, + { + "epoch": 1.14, + "learning_rate": 1.4205886775067806e-06, + "loss": 0.6279, + "step": 44592 + }, + { + "epoch": 1.14, + "learning_rate": 1.4205635732867964e-06, + "loss": 0.5967, + "step": 44593 + }, + { + "epoch": 1.14, + "learning_rate": 1.4205384687448058e-06, + "loss": 0.542, + "step": 44594 + }, + { + "epoch": 1.14, + "learning_rate": 1.4205133638808282e-06, + "loss": 0.7979, + "step": 44595 + }, + { + "epoch": 1.14, + "learning_rate": 1.420488258694883e-06, + "loss": 0.6235, + "step": 44596 + }, + { + "epoch": 1.14, + "learning_rate": 1.4204631531869896e-06, + "loss": 0.6074, + "step": 44597 + }, + { + "epoch": 1.14, + "learning_rate": 1.4204380473571663e-06, + "loss": 0.6743, + "step": 44598 + }, + { + "epoch": 1.14, + "learning_rate": 1.420412941205433e-06, + "loss": 0.7324, + "step": 44599 + }, + { + "epoch": 1.14, + "learning_rate": 1.4203878347318088e-06, + "loss": 0.8203, + "step": 44600 + }, + { + "epoch": 1.14, + "learning_rate": 1.4203627279363136e-06, + "loss": 0.5957, + "step": 44601 + }, + { + "epoch": 1.14, + "learning_rate": 1.4203376208189655e-06, + "loss": 0.6279, + "step": 44602 + }, + { + "epoch": 1.14, + "learning_rate": 1.4203125133797841e-06, + "loss": 0.834, + "step": 44603 + }, + { + "epoch": 1.14, + "learning_rate": 1.4202874056187888e-06, + "loss": 0.6611, + "step": 44604 + }, + { + "epoch": 1.14, + "learning_rate": 1.420262297535999e-06, + "loss": 0.7021, + "step": 44605 + }, + { + "epoch": 1.14, + "learning_rate": 1.4202371891314336e-06, + "loss": 0.7041, + "step": 44606 + }, + { + "epoch": 1.14, + "learning_rate": 1.4202120804051119e-06, + "loss": 0.5972, + "step": 44607 + }, + { + "epoch": 1.14, + "learning_rate": 1.4201869713570528e-06, + "loss": 0.7627, + "step": 44608 + }, + { + "epoch": 1.14, + "learning_rate": 1.4201618619872762e-06, + "loss": 0.7002, + "step": 44609 + }, + { + "epoch": 1.14, + "learning_rate": 1.4201367522958007e-06, + "loss": 0.6865, + "step": 44610 + }, + { + "epoch": 1.14, + "learning_rate": 1.4201116422826465e-06, + "loss": 0.7041, + "step": 44611 + }, + { + "epoch": 1.14, + "learning_rate": 1.4200865319478315e-06, + "loss": 0.7686, + "step": 44612 + }, + { + "epoch": 1.14, + "learning_rate": 1.4200614212913756e-06, + "loss": 0.8037, + "step": 44613 + }, + { + "epoch": 1.14, + "learning_rate": 1.420036310313298e-06, + "loss": 0.8721, + "step": 44614 + }, + { + "epoch": 1.14, + "learning_rate": 1.4200111990136182e-06, + "loss": 0.627, + "step": 44615 + }, + { + "epoch": 1.14, + "learning_rate": 1.4199860873923548e-06, + "loss": 0.8135, + "step": 44616 + }, + { + "epoch": 1.14, + "learning_rate": 1.4199609754495273e-06, + "loss": 0.6494, + "step": 44617 + }, + { + "epoch": 1.14, + "learning_rate": 1.4199358631851554e-06, + "loss": 0.6201, + "step": 44618 + }, + { + "epoch": 1.14, + "learning_rate": 1.4199107505992576e-06, + "loss": 0.6992, + "step": 44619 + }, + { + "epoch": 1.14, + "learning_rate": 1.4198856376918536e-06, + "loss": 0.5649, + "step": 44620 + }, + { + "epoch": 1.14, + "learning_rate": 1.4198605244629625e-06, + "loss": 0.7324, + "step": 44621 + }, + { + "epoch": 1.14, + "learning_rate": 1.4198354109126033e-06, + "loss": 0.6914, + "step": 44622 + }, + { + "epoch": 1.14, + "learning_rate": 1.4198102970407956e-06, + "loss": 0.5962, + "step": 44623 + }, + { + "epoch": 1.14, + "learning_rate": 1.4197851828475585e-06, + "loss": 0.6113, + "step": 44624 + }, + { + "epoch": 1.14, + "learning_rate": 1.419760068332911e-06, + "loss": 0.6406, + "step": 44625 + }, + { + "epoch": 1.14, + "learning_rate": 1.4197349534968727e-06, + "loss": 0.7227, + "step": 44626 + }, + { + "epoch": 1.14, + "learning_rate": 1.4197098383394625e-06, + "loss": 0.6709, + "step": 44627 + }, + { + "epoch": 1.14, + "learning_rate": 1.4196847228607e-06, + "loss": 0.543, + "step": 44628 + }, + { + "epoch": 1.14, + "learning_rate": 1.419659607060604e-06, + "loss": 0.562, + "step": 44629 + }, + { + "epoch": 1.14, + "learning_rate": 1.419634490939194e-06, + "loss": 0.5542, + "step": 44630 + }, + { + "epoch": 1.14, + "learning_rate": 1.4196093744964893e-06, + "loss": 0.4481, + "step": 44631 + }, + { + "epoch": 1.14, + "learning_rate": 1.4195842577325087e-06, + "loss": 0.5962, + "step": 44632 + }, + { + "epoch": 1.14, + "learning_rate": 1.4195591406472718e-06, + "loss": 0.7314, + "step": 44633 + }, + { + "epoch": 1.14, + "learning_rate": 1.419534023240798e-06, + "loss": 0.6763, + "step": 44634 + }, + { + "epoch": 1.14, + "learning_rate": 1.419508905513106e-06, + "loss": 0.7231, + "step": 44635 + }, + { + "epoch": 1.14, + "learning_rate": 1.4194837874642154e-06, + "loss": 0.6592, + "step": 44636 + }, + { + "epoch": 1.14, + "learning_rate": 1.4194586690941454e-06, + "loss": 0.5723, + "step": 44637 + }, + { + "epoch": 1.14, + "learning_rate": 1.4194335504029152e-06, + "loss": 0.6133, + "step": 44638 + }, + { + "epoch": 1.14, + "learning_rate": 1.419408431390544e-06, + "loss": 0.5598, + "step": 44639 + }, + { + "epoch": 1.14, + "learning_rate": 1.419383312057051e-06, + "loss": 0.959, + "step": 44640 + }, + { + "epoch": 1.14, + "learning_rate": 1.4193581924024555e-06, + "loss": 0.6006, + "step": 44641 + }, + { + "epoch": 1.14, + "learning_rate": 1.419333072426777e-06, + "loss": 0.6426, + "step": 44642 + }, + { + "epoch": 1.14, + "learning_rate": 1.4193079521300341e-06, + "loss": 0.5337, + "step": 44643 + }, + { + "epoch": 1.14, + "learning_rate": 1.4192828315122463e-06, + "loss": 0.6582, + "step": 44644 + }, + { + "epoch": 1.14, + "learning_rate": 1.419257710573433e-06, + "loss": 0.7725, + "step": 44645 + }, + { + "epoch": 1.14, + "learning_rate": 1.4192325893136136e-06, + "loss": 0.6133, + "step": 44646 + }, + { + "epoch": 1.14, + "learning_rate": 1.419207467732807e-06, + "loss": 0.8711, + "step": 44647 + }, + { + "epoch": 1.14, + "learning_rate": 1.4191823458310324e-06, + "loss": 0.6768, + "step": 44648 + }, + { + "epoch": 1.14, + "learning_rate": 1.419157223608309e-06, + "loss": 0.5649, + "step": 44649 + }, + { + "epoch": 1.14, + "learning_rate": 1.4191321010646563e-06, + "loss": 0.3986, + "step": 44650 + }, + { + "epoch": 1.14, + "learning_rate": 1.419106978200094e-06, + "loss": 0.5996, + "step": 44651 + }, + { + "epoch": 1.14, + "learning_rate": 1.41908185501464e-06, + "loss": 0.7461, + "step": 44652 + }, + { + "epoch": 1.14, + "learning_rate": 1.4190567315083146e-06, + "loss": 0.6172, + "step": 44653 + }, + { + "epoch": 1.14, + "learning_rate": 1.4190316076811365e-06, + "loss": 0.6108, + "step": 44654 + }, + { + "epoch": 1.14, + "learning_rate": 1.4190064835331255e-06, + "loss": 0.6787, + "step": 44655 + }, + { + "epoch": 1.14, + "learning_rate": 1.4189813590643005e-06, + "loss": 0.606, + "step": 44656 + }, + { + "epoch": 1.14, + "learning_rate": 1.4189562342746807e-06, + "loss": 0.7129, + "step": 44657 + }, + { + "epoch": 1.14, + "learning_rate": 1.418931109164285e-06, + "loss": 0.5579, + "step": 44658 + }, + { + "epoch": 1.14, + "learning_rate": 1.4189059837331331e-06, + "loss": 0.5898, + "step": 44659 + }, + { + "epoch": 1.14, + "learning_rate": 1.4188808579812443e-06, + "loss": 0.7324, + "step": 44660 + }, + { + "epoch": 1.14, + "learning_rate": 1.4188557319086378e-06, + "loss": 0.3969, + "step": 44661 + }, + { + "epoch": 1.14, + "learning_rate": 1.4188306055153328e-06, + "loss": 0.5024, + "step": 44662 + }, + { + "epoch": 1.14, + "learning_rate": 1.418805478801348e-06, + "loss": 0.5162, + "step": 44663 + }, + { + "epoch": 1.14, + "learning_rate": 1.4187803517667036e-06, + "loss": 0.6646, + "step": 44664 + }, + { + "epoch": 1.14, + "learning_rate": 1.418755224411418e-06, + "loss": 0.5327, + "step": 44665 + }, + { + "epoch": 1.14, + "learning_rate": 1.418730096735511e-06, + "loss": 0.8945, + "step": 44666 + }, + { + "epoch": 1.14, + "learning_rate": 1.4187049687390016e-06, + "loss": 0.7676, + "step": 44667 + }, + { + "epoch": 1.14, + "learning_rate": 1.4186798404219092e-06, + "loss": 0.7295, + "step": 44668 + }, + { + "epoch": 1.14, + "learning_rate": 1.4186547117842524e-06, + "loss": 0.4385, + "step": 44669 + }, + { + "epoch": 1.14, + "learning_rate": 1.4186295828260515e-06, + "loss": 0.6653, + "step": 44670 + }, + { + "epoch": 1.14, + "learning_rate": 1.4186044535473248e-06, + "loss": 0.6177, + "step": 44671 + }, + { + "epoch": 1.14, + "learning_rate": 1.4185793239480922e-06, + "loss": 0.6709, + "step": 44672 + }, + { + "epoch": 1.14, + "learning_rate": 1.4185541940283723e-06, + "loss": 0.6489, + "step": 44673 + }, + { + "epoch": 1.15, + "learning_rate": 1.4185290637881848e-06, + "loss": 0.6094, + "step": 44674 + }, + { + "epoch": 1.15, + "learning_rate": 1.418503933227549e-06, + "loss": 0.3733, + "step": 44675 + }, + { + "epoch": 1.15, + "learning_rate": 1.4184788023464841e-06, + "loss": 0.7129, + "step": 44676 + }, + { + "epoch": 1.15, + "learning_rate": 1.4184536711450089e-06, + "loss": 0.6226, + "step": 44677 + }, + { + "epoch": 1.15, + "learning_rate": 1.4184285396231432e-06, + "loss": 0.6582, + "step": 44678 + }, + { + "epoch": 1.15, + "learning_rate": 1.4184034077809057e-06, + "loss": 0.749, + "step": 44679 + }, + { + "epoch": 1.15, + "learning_rate": 1.4183782756183162e-06, + "loss": 0.4324, + "step": 44680 + }, + { + "epoch": 1.15, + "learning_rate": 1.418353143135394e-06, + "loss": 0.7012, + "step": 44681 + }, + { + "epoch": 1.15, + "learning_rate": 1.4183280103321574e-06, + "loss": 0.8408, + "step": 44682 + }, + { + "epoch": 1.15, + "learning_rate": 1.4183028772086265e-06, + "loss": 0.6084, + "step": 44683 + }, + { + "epoch": 1.15, + "learning_rate": 1.4182777437648207e-06, + "loss": 0.4895, + "step": 44684 + }, + { + "epoch": 1.15, + "learning_rate": 1.4182526100007582e-06, + "loss": 0.6836, + "step": 44685 + }, + { + "epoch": 1.15, + "learning_rate": 1.4182274759164594e-06, + "loss": 0.4919, + "step": 44686 + }, + { + "epoch": 1.15, + "learning_rate": 1.4182023415119429e-06, + "loss": 0.6812, + "step": 44687 + }, + { + "epoch": 1.15, + "learning_rate": 1.418177206787228e-06, + "loss": 0.7188, + "step": 44688 + }, + { + "epoch": 1.15, + "learning_rate": 1.418152071742334e-06, + "loss": 0.3073, + "step": 44689 + }, + { + "epoch": 1.15, + "learning_rate": 1.4181269363772802e-06, + "loss": 0.6865, + "step": 44690 + }, + { + "epoch": 1.15, + "learning_rate": 1.4181018006920865e-06, + "loss": 0.4351, + "step": 44691 + }, + { + "epoch": 1.15, + "learning_rate": 1.4180766646867706e-06, + "loss": 0.689, + "step": 44692 + }, + { + "epoch": 1.15, + "learning_rate": 1.418051528361353e-06, + "loss": 0.6738, + "step": 44693 + }, + { + "epoch": 1.15, + "learning_rate": 1.4180263917158525e-06, + "loss": 0.5063, + "step": 44694 + }, + { + "epoch": 1.15, + "learning_rate": 1.4180012547502884e-06, + "loss": 0.6191, + "step": 44695 + }, + { + "epoch": 1.15, + "learning_rate": 1.41797611746468e-06, + "loss": 0.3837, + "step": 44696 + }, + { + "epoch": 1.15, + "learning_rate": 1.4179509798590468e-06, + "loss": 0.665, + "step": 44697 + }, + { + "epoch": 1.15, + "learning_rate": 1.4179258419334073e-06, + "loss": 0.5234, + "step": 44698 + }, + { + "epoch": 1.15, + "learning_rate": 1.4179007036877813e-06, + "loss": 0.6641, + "step": 44699 + }, + { + "epoch": 1.15, + "learning_rate": 1.4178755651221879e-06, + "loss": 0.6089, + "step": 44700 + }, + { + "epoch": 1.15, + "learning_rate": 1.4178504262366468e-06, + "loss": 0.5596, + "step": 44701 + }, + { + "epoch": 1.15, + "learning_rate": 1.4178252870311765e-06, + "loss": 0.7793, + "step": 44702 + }, + { + "epoch": 1.15, + "learning_rate": 1.4178001475057966e-06, + "loss": 0.5172, + "step": 44703 + }, + { + "epoch": 1.15, + "learning_rate": 1.4177750076605261e-06, + "loss": 0.668, + "step": 44704 + }, + { + "epoch": 1.15, + "learning_rate": 1.417749867495385e-06, + "loss": 0.8926, + "step": 44705 + }, + { + "epoch": 1.15, + "learning_rate": 1.4177247270103918e-06, + "loss": 0.3403, + "step": 44706 + }, + { + "epoch": 1.15, + "learning_rate": 1.4176995862055658e-06, + "loss": 0.7158, + "step": 44707 + }, + { + "epoch": 1.15, + "learning_rate": 1.4176744450809265e-06, + "loss": 0.6428, + "step": 44708 + }, + { + "epoch": 1.15, + "learning_rate": 1.4176493036364932e-06, + "loss": 0.6963, + "step": 44709 + }, + { + "epoch": 1.15, + "learning_rate": 1.417624161872285e-06, + "loss": 0.6953, + "step": 44710 + }, + { + "epoch": 1.15, + "learning_rate": 1.4175990197883214e-06, + "loss": 0.749, + "step": 44711 + }, + { + "epoch": 1.15, + "learning_rate": 1.4175738773846213e-06, + "loss": 0.6914, + "step": 44712 + }, + { + "epoch": 1.15, + "learning_rate": 1.4175487346612038e-06, + "loss": 0.7041, + "step": 44713 + }, + { + "epoch": 1.15, + "learning_rate": 1.4175235916180887e-06, + "loss": 0.8408, + "step": 44714 + }, + { + "epoch": 1.15, + "learning_rate": 1.417498448255295e-06, + "loss": 0.7178, + "step": 44715 + }, + { + "epoch": 1.15, + "learning_rate": 1.417473304572842e-06, + "loss": 0.4995, + "step": 44716 + }, + { + "epoch": 1.15, + "learning_rate": 1.4174481605707488e-06, + "loss": 0.5476, + "step": 44717 + }, + { + "epoch": 1.15, + "learning_rate": 1.4174230162490345e-06, + "loss": 0.791, + "step": 44718 + }, + { + "epoch": 1.15, + "learning_rate": 1.4173978716077186e-06, + "loss": 0.6143, + "step": 44719 + }, + { + "epoch": 1.15, + "learning_rate": 1.4173727266468208e-06, + "loss": 0.6704, + "step": 44720 + }, + { + "epoch": 1.15, + "learning_rate": 1.4173475813663596e-06, + "loss": 0.6313, + "step": 44721 + }, + { + "epoch": 1.15, + "learning_rate": 1.4173224357663547e-06, + "loss": 0.6709, + "step": 44722 + }, + { + "epoch": 1.15, + "learning_rate": 1.417297289846825e-06, + "loss": 0.6313, + "step": 44723 + }, + { + "epoch": 1.15, + "learning_rate": 1.41727214360779e-06, + "loss": 0.6514, + "step": 44724 + }, + { + "epoch": 1.15, + "learning_rate": 1.4172469970492688e-06, + "loss": 0.8662, + "step": 44725 + }, + { + "epoch": 1.15, + "learning_rate": 1.4172218501712809e-06, + "loss": 0.7529, + "step": 44726 + }, + { + "epoch": 1.15, + "learning_rate": 1.4171967029738455e-06, + "loss": 0.6509, + "step": 44727 + }, + { + "epoch": 1.15, + "learning_rate": 1.4171715554569815e-06, + "loss": 0.8652, + "step": 44728 + }, + { + "epoch": 1.15, + "learning_rate": 1.4171464076207088e-06, + "loss": 0.5933, + "step": 44729 + }, + { + "epoch": 1.15, + "learning_rate": 1.4171212594650462e-06, + "loss": 0.6069, + "step": 44730 + }, + { + "epoch": 1.15, + "learning_rate": 1.4170961109900128e-06, + "loss": 0.6465, + "step": 44731 + }, + { + "epoch": 1.15, + "learning_rate": 1.417070962195628e-06, + "loss": 0.6816, + "step": 44732 + }, + { + "epoch": 1.15, + "learning_rate": 1.4170458130819115e-06, + "loss": 0.6929, + "step": 44733 + }, + { + "epoch": 1.15, + "learning_rate": 1.4170206636488817e-06, + "loss": 0.6875, + "step": 44734 + }, + { + "epoch": 1.15, + "learning_rate": 1.4169955138965588e-06, + "loss": 0.7617, + "step": 44735 + }, + { + "epoch": 1.15, + "learning_rate": 1.4169703638249617e-06, + "loss": 0.7578, + "step": 44736 + }, + { + "epoch": 1.15, + "learning_rate": 1.4169452134341094e-06, + "loss": 0.6797, + "step": 44737 + }, + { + "epoch": 1.15, + "learning_rate": 1.416920062724021e-06, + "loss": 0.7148, + "step": 44738 + }, + { + "epoch": 1.15, + "learning_rate": 1.4168949116947165e-06, + "loss": 0.8213, + "step": 44739 + }, + { + "epoch": 1.15, + "learning_rate": 1.4168697603462145e-06, + "loss": 0.625, + "step": 44740 + }, + { + "epoch": 1.15, + "learning_rate": 1.4168446086785348e-06, + "loss": 0.6387, + "step": 44741 + }, + { + "epoch": 1.15, + "learning_rate": 1.416819456691696e-06, + "loss": 0.7354, + "step": 44742 + }, + { + "epoch": 1.15, + "learning_rate": 1.4167943043857179e-06, + "loss": 0.7793, + "step": 44743 + }, + { + "epoch": 1.15, + "learning_rate": 1.4167691517606192e-06, + "loss": 0.5833, + "step": 44744 + }, + { + "epoch": 1.15, + "learning_rate": 1.41674399881642e-06, + "loss": 0.6631, + "step": 44745 + }, + { + "epoch": 1.15, + "learning_rate": 1.416718845553139e-06, + "loss": 0.8682, + "step": 44746 + }, + { + "epoch": 1.15, + "learning_rate": 1.4166936919707955e-06, + "loss": 0.6611, + "step": 44747 + }, + { + "epoch": 1.15, + "learning_rate": 1.4166685380694086e-06, + "loss": 0.5615, + "step": 44748 + }, + { + "epoch": 1.15, + "learning_rate": 1.416643383848998e-06, + "loss": 0.4495, + "step": 44749 + }, + { + "epoch": 1.15, + "learning_rate": 1.4166182293095826e-06, + "loss": 0.6064, + "step": 44750 + }, + { + "epoch": 1.15, + "learning_rate": 1.4165930744511818e-06, + "loss": 0.7969, + "step": 44751 + }, + { + "epoch": 1.15, + "learning_rate": 1.416567919273815e-06, + "loss": 0.9141, + "step": 44752 + }, + { + "epoch": 1.15, + "learning_rate": 1.416542763777501e-06, + "loss": 0.7734, + "step": 44753 + }, + { + "epoch": 1.15, + "learning_rate": 1.4165176079622594e-06, + "loss": 0.6074, + "step": 44754 + }, + { + "epoch": 1.15, + "learning_rate": 1.4164924518281093e-06, + "loss": 0.4822, + "step": 44755 + }, + { + "epoch": 1.15, + "learning_rate": 1.4164672953750708e-06, + "loss": 0.7344, + "step": 44756 + }, + { + "epoch": 1.15, + "learning_rate": 1.4164421386031616e-06, + "loss": 0.7026, + "step": 44757 + }, + { + "epoch": 1.15, + "learning_rate": 1.4164169815124024e-06, + "loss": 0.6143, + "step": 44758 + }, + { + "epoch": 1.15, + "learning_rate": 1.4163918241028115e-06, + "loss": 0.6406, + "step": 44759 + }, + { + "epoch": 1.15, + "learning_rate": 1.416366666374409e-06, + "loss": 0.5439, + "step": 44760 + }, + { + "epoch": 1.15, + "learning_rate": 1.416341508327213e-06, + "loss": 0.6865, + "step": 44761 + }, + { + "epoch": 1.15, + "learning_rate": 1.416316349961244e-06, + "loss": 0.6855, + "step": 44762 + }, + { + "epoch": 1.15, + "learning_rate": 1.41629119127652e-06, + "loss": 0.7334, + "step": 44763 + }, + { + "epoch": 1.15, + "learning_rate": 1.4162660322730617e-06, + "loss": 0.6689, + "step": 44764 + }, + { + "epoch": 1.15, + "learning_rate": 1.4162408729508874e-06, + "loss": 0.708, + "step": 44765 + }, + { + "epoch": 1.15, + "learning_rate": 1.4162157133100168e-06, + "loss": 0.7151, + "step": 44766 + }, + { + "epoch": 1.15, + "learning_rate": 1.4161905533504686e-06, + "loss": 0.5715, + "step": 44767 + }, + { + "epoch": 1.15, + "learning_rate": 1.4161653930722625e-06, + "loss": 0.7061, + "step": 44768 + }, + { + "epoch": 1.15, + "learning_rate": 1.416140232475418e-06, + "loss": 0.6318, + "step": 44769 + }, + { + "epoch": 1.15, + "learning_rate": 1.4161150715599538e-06, + "loss": 0.5518, + "step": 44770 + }, + { + "epoch": 1.15, + "learning_rate": 1.4160899103258897e-06, + "loss": 0.5361, + "step": 44771 + }, + { + "epoch": 1.15, + "learning_rate": 1.4160647487732442e-06, + "loss": 0.5317, + "step": 44772 + }, + { + "epoch": 1.15, + "learning_rate": 1.4160395869020375e-06, + "loss": 0.6533, + "step": 44773 + }, + { + "epoch": 1.15, + "learning_rate": 1.416014424712288e-06, + "loss": 0.7178, + "step": 44774 + }, + { + "epoch": 1.15, + "learning_rate": 1.415989262204016e-06, + "loss": 0.5835, + "step": 44775 + }, + { + "epoch": 1.15, + "learning_rate": 1.4159640993772394e-06, + "loss": 0.5697, + "step": 44776 + }, + { + "epoch": 1.15, + "learning_rate": 1.4159389362319787e-06, + "loss": 0.6821, + "step": 44777 + }, + { + "epoch": 1.15, + "learning_rate": 1.4159137727682526e-06, + "loss": 0.5605, + "step": 44778 + }, + { + "epoch": 1.15, + "learning_rate": 1.4158886089860804e-06, + "loss": 0.7793, + "step": 44779 + }, + { + "epoch": 1.15, + "learning_rate": 1.4158634448854815e-06, + "loss": 0.501, + "step": 44780 + }, + { + "epoch": 1.15, + "learning_rate": 1.415838280466475e-06, + "loss": 0.5723, + "step": 44781 + }, + { + "epoch": 1.15, + "learning_rate": 1.4158131157290803e-06, + "loss": 0.6226, + "step": 44782 + }, + { + "epoch": 1.15, + "learning_rate": 1.4157879506733166e-06, + "loss": 0.7715, + "step": 44783 + }, + { + "epoch": 1.15, + "learning_rate": 1.4157627852992028e-06, + "loss": 0.6025, + "step": 44784 + }, + { + "epoch": 1.15, + "learning_rate": 1.4157376196067594e-06, + "loss": 0.6602, + "step": 44785 + }, + { + "epoch": 1.15, + "learning_rate": 1.4157124535960044e-06, + "loss": 0.749, + "step": 44786 + }, + { + "epoch": 1.15, + "learning_rate": 1.4156872872669575e-06, + "loss": 0.3882, + "step": 44787 + }, + { + "epoch": 1.15, + "learning_rate": 1.4156621206196375e-06, + "loss": 0.6631, + "step": 44788 + }, + { + "epoch": 1.15, + "learning_rate": 1.4156369536540646e-06, + "loss": 0.606, + "step": 44789 + }, + { + "epoch": 1.15, + "learning_rate": 1.4156117863702576e-06, + "loss": 0.7324, + "step": 44790 + }, + { + "epoch": 1.15, + "learning_rate": 1.4155866187682358e-06, + "loss": 0.6973, + "step": 44791 + }, + { + "epoch": 1.15, + "learning_rate": 1.4155614508480182e-06, + "loss": 0.6738, + "step": 44792 + }, + { + "epoch": 1.15, + "learning_rate": 1.4155362826096244e-06, + "loss": 0.6904, + "step": 44793 + }, + { + "epoch": 1.15, + "learning_rate": 1.4155111140530735e-06, + "loss": 0.7354, + "step": 44794 + }, + { + "epoch": 1.15, + "learning_rate": 1.415485945178385e-06, + "loss": 0.6372, + "step": 44795 + }, + { + "epoch": 1.15, + "learning_rate": 1.4154607759855778e-06, + "loss": 0.8086, + "step": 44796 + }, + { + "epoch": 1.15, + "learning_rate": 1.4154356064746718e-06, + "loss": 0.7168, + "step": 44797 + }, + { + "epoch": 1.15, + "learning_rate": 1.4154104366456854e-06, + "loss": 0.7656, + "step": 44798 + }, + { + "epoch": 1.15, + "learning_rate": 1.4153852664986385e-06, + "loss": 0.8057, + "step": 44799 + }, + { + "epoch": 1.15, + "learning_rate": 1.4153600960335505e-06, + "loss": 0.6802, + "step": 44800 + }, + { + "epoch": 1.15, + "learning_rate": 1.4153349252504399e-06, + "loss": 0.7695, + "step": 44801 + }, + { + "epoch": 1.15, + "learning_rate": 1.4153097541493267e-06, + "loss": 0.6758, + "step": 44802 + }, + { + "epoch": 1.15, + "learning_rate": 1.4152845827302299e-06, + "loss": 0.5994, + "step": 44803 + }, + { + "epoch": 1.15, + "learning_rate": 1.4152594109931685e-06, + "loss": 0.606, + "step": 44804 + }, + { + "epoch": 1.15, + "learning_rate": 1.4152342389381626e-06, + "loss": 0.5669, + "step": 44805 + }, + { + "epoch": 1.15, + "learning_rate": 1.4152090665652307e-06, + "loss": 0.7529, + "step": 44806 + }, + { + "epoch": 1.15, + "learning_rate": 1.415183893874392e-06, + "loss": 0.6333, + "step": 44807 + }, + { + "epoch": 1.15, + "learning_rate": 1.4151587208656666e-06, + "loss": 0.6719, + "step": 44808 + }, + { + "epoch": 1.15, + "learning_rate": 1.4151335475390728e-06, + "loss": 0.5396, + "step": 44809 + }, + { + "epoch": 1.15, + "learning_rate": 1.4151083738946307e-06, + "loss": 0.6763, + "step": 44810 + }, + { + "epoch": 1.15, + "learning_rate": 1.4150831999323592e-06, + "loss": 0.6016, + "step": 44811 + }, + { + "epoch": 1.15, + "learning_rate": 1.4150580256522773e-06, + "loss": 0.6423, + "step": 44812 + }, + { + "epoch": 1.15, + "learning_rate": 1.4150328510544048e-06, + "loss": 0.519, + "step": 44813 + }, + { + "epoch": 1.15, + "learning_rate": 1.4150076761387606e-06, + "loss": 0.5471, + "step": 44814 + }, + { + "epoch": 1.15, + "learning_rate": 1.414982500905364e-06, + "loss": 0.6836, + "step": 44815 + }, + { + "epoch": 1.15, + "learning_rate": 1.4149573253542344e-06, + "loss": 0.4561, + "step": 44816 + }, + { + "epoch": 1.15, + "learning_rate": 1.4149321494853912e-06, + "loss": 0.6196, + "step": 44817 + }, + { + "epoch": 1.15, + "learning_rate": 1.4149069732988535e-06, + "loss": 0.5215, + "step": 44818 + }, + { + "epoch": 1.15, + "learning_rate": 1.4148817967946404e-06, + "loss": 0.6406, + "step": 44819 + }, + { + "epoch": 1.15, + "learning_rate": 1.4148566199727719e-06, + "loss": 0.6455, + "step": 44820 + }, + { + "epoch": 1.15, + "learning_rate": 1.4148314428332665e-06, + "loss": 0.6038, + "step": 44821 + }, + { + "epoch": 1.15, + "learning_rate": 1.4148062653761434e-06, + "loss": 0.707, + "step": 44822 + }, + { + "epoch": 1.15, + "learning_rate": 1.4147810876014225e-06, + "loss": 0.7695, + "step": 44823 + }, + { + "epoch": 1.15, + "learning_rate": 1.4147559095091227e-06, + "loss": 0.6279, + "step": 44824 + }, + { + "epoch": 1.15, + "learning_rate": 1.4147307310992638e-06, + "loss": 0.8379, + "step": 44825 + }, + { + "epoch": 1.15, + "learning_rate": 1.414705552371864e-06, + "loss": 0.7559, + "step": 44826 + }, + { + "epoch": 1.15, + "learning_rate": 1.4146803733269437e-06, + "loss": 0.5786, + "step": 44827 + }, + { + "epoch": 1.15, + "learning_rate": 1.4146551939645215e-06, + "loss": 0.6577, + "step": 44828 + }, + { + "epoch": 1.15, + "learning_rate": 1.4146300142846168e-06, + "loss": 0.6104, + "step": 44829 + }, + { + "epoch": 1.15, + "learning_rate": 1.4146048342872491e-06, + "loss": 0.6387, + "step": 44830 + }, + { + "epoch": 1.15, + "learning_rate": 1.4145796539724376e-06, + "loss": 0.6475, + "step": 44831 + }, + { + "epoch": 1.15, + "learning_rate": 1.4145544733402016e-06, + "loss": 0.7305, + "step": 44832 + }, + { + "epoch": 1.15, + "learning_rate": 1.41452929239056e-06, + "loss": 0.7246, + "step": 44833 + }, + { + "epoch": 1.15, + "learning_rate": 1.4145041111235325e-06, + "loss": 0.418, + "step": 44834 + }, + { + "epoch": 1.15, + "learning_rate": 1.4144789295391385e-06, + "loss": 0.447, + "step": 44835 + }, + { + "epoch": 1.15, + "learning_rate": 1.4144537476373967e-06, + "loss": 0.6475, + "step": 44836 + }, + { + "epoch": 1.15, + "learning_rate": 1.414428565418327e-06, + "loss": 0.5347, + "step": 44837 + }, + { + "epoch": 1.15, + "learning_rate": 1.4144033828819482e-06, + "loss": 0.6025, + "step": 44838 + }, + { + "epoch": 1.15, + "learning_rate": 1.4143782000282798e-06, + "loss": 0.4529, + "step": 44839 + }, + { + "epoch": 1.15, + "learning_rate": 1.4143530168573411e-06, + "loss": 0.6343, + "step": 44840 + }, + { + "epoch": 1.15, + "learning_rate": 1.4143278333691514e-06, + "loss": 0.6143, + "step": 44841 + }, + { + "epoch": 1.15, + "learning_rate": 1.41430264956373e-06, + "loss": 0.5972, + "step": 44842 + }, + { + "epoch": 1.15, + "learning_rate": 1.4142774654410958e-06, + "loss": 0.5928, + "step": 44843 + }, + { + "epoch": 1.15, + "learning_rate": 1.4142522810012686e-06, + "loss": 0.7119, + "step": 44844 + }, + { + "epoch": 1.15, + "learning_rate": 1.4142270962442676e-06, + "loss": 0.6992, + "step": 44845 + }, + { + "epoch": 1.15, + "learning_rate": 1.4142019111701117e-06, + "loss": 0.8701, + "step": 44846 + }, + { + "epoch": 1.15, + "learning_rate": 1.4141767257788206e-06, + "loss": 0.709, + "step": 44847 + }, + { + "epoch": 1.15, + "learning_rate": 1.4141515400704136e-06, + "loss": 0.4609, + "step": 44848 + }, + { + "epoch": 1.15, + "learning_rate": 1.4141263540449093e-06, + "loss": 0.6179, + "step": 44849 + }, + { + "epoch": 1.15, + "learning_rate": 1.414101167702328e-06, + "loss": 0.6387, + "step": 44850 + }, + { + "epoch": 1.15, + "learning_rate": 1.4140759810426883e-06, + "loss": 0.7266, + "step": 44851 + }, + { + "epoch": 1.15, + "learning_rate": 1.4140507940660097e-06, + "loss": 0.6436, + "step": 44852 + }, + { + "epoch": 1.15, + "learning_rate": 1.4140256067723112e-06, + "loss": 0.6084, + "step": 44853 + }, + { + "epoch": 1.15, + "learning_rate": 1.4140004191616127e-06, + "loss": 0.5122, + "step": 44854 + }, + { + "epoch": 1.15, + "learning_rate": 1.413975231233933e-06, + "loss": 0.7461, + "step": 44855 + }, + { + "epoch": 1.15, + "learning_rate": 1.4139500429892915e-06, + "loss": 0.521, + "step": 44856 + }, + { + "epoch": 1.15, + "learning_rate": 1.4139248544277073e-06, + "loss": 0.6025, + "step": 44857 + }, + { + "epoch": 1.15, + "learning_rate": 1.4138996655492e-06, + "loss": 0.7109, + "step": 44858 + }, + { + "epoch": 1.15, + "learning_rate": 1.4138744763537884e-06, + "loss": 0.5225, + "step": 44859 + }, + { + "epoch": 1.15, + "learning_rate": 1.4138492868414927e-06, + "loss": 0.6436, + "step": 44860 + }, + { + "epoch": 1.15, + "learning_rate": 1.4138240970123315e-06, + "loss": 0.6074, + "step": 44861 + }, + { + "epoch": 1.15, + "learning_rate": 1.4137989068663239e-06, + "loss": 0.5435, + "step": 44862 + }, + { + "epoch": 1.15, + "learning_rate": 1.4137737164034897e-06, + "loss": 0.5798, + "step": 44863 + }, + { + "epoch": 1.15, + "learning_rate": 1.413748525623848e-06, + "loss": 0.6836, + "step": 44864 + }, + { + "epoch": 1.15, + "learning_rate": 1.4137233345274185e-06, + "loss": 0.6445, + "step": 44865 + }, + { + "epoch": 1.15, + "learning_rate": 1.4136981431142195e-06, + "loss": 0.4985, + "step": 44866 + }, + { + "epoch": 1.15, + "learning_rate": 1.413672951384271e-06, + "loss": 0.603, + "step": 44867 + }, + { + "epoch": 1.15, + "learning_rate": 1.4136477593375922e-06, + "loss": 0.5757, + "step": 44868 + }, + { + "epoch": 1.15, + "learning_rate": 1.4136225669742023e-06, + "loss": 0.5835, + "step": 44869 + }, + { + "epoch": 1.15, + "learning_rate": 1.4135973742941207e-06, + "loss": 0.6582, + "step": 44870 + }, + { + "epoch": 1.15, + "learning_rate": 1.4135721812973667e-06, + "loss": 0.7266, + "step": 44871 + }, + { + "epoch": 1.15, + "learning_rate": 1.413546987983959e-06, + "loss": 0.562, + "step": 44872 + }, + { + "epoch": 1.15, + "learning_rate": 1.4135217943539179e-06, + "loss": 0.6924, + "step": 44873 + }, + { + "epoch": 1.15, + "learning_rate": 1.4134966004072618e-06, + "loss": 0.5381, + "step": 44874 + }, + { + "epoch": 1.15, + "learning_rate": 1.4134714061440108e-06, + "loss": 0.6934, + "step": 44875 + }, + { + "epoch": 1.15, + "learning_rate": 1.4134462115641834e-06, + "loss": 0.6934, + "step": 44876 + }, + { + "epoch": 1.15, + "learning_rate": 1.4134210166677994e-06, + "loss": 0.646, + "step": 44877 + }, + { + "epoch": 1.15, + "learning_rate": 1.4133958214548777e-06, + "loss": 0.5903, + "step": 44878 + }, + { + "epoch": 1.15, + "learning_rate": 1.413370625925438e-06, + "loss": 0.6948, + "step": 44879 + }, + { + "epoch": 1.15, + "learning_rate": 1.4133454300794995e-06, + "loss": 0.6272, + "step": 44880 + }, + { + "epoch": 1.15, + "learning_rate": 1.4133202339170814e-06, + "loss": 0.7607, + "step": 44881 + }, + { + "epoch": 1.15, + "learning_rate": 1.413295037438203e-06, + "loss": 0.7949, + "step": 44882 + }, + { + "epoch": 1.15, + "learning_rate": 1.4132698406428836e-06, + "loss": 0.4907, + "step": 44883 + }, + { + "epoch": 1.15, + "learning_rate": 1.4132446435311423e-06, + "loss": 0.7646, + "step": 44884 + }, + { + "epoch": 1.15, + "learning_rate": 1.4132194461029987e-06, + "loss": 0.6804, + "step": 44885 + }, + { + "epoch": 1.15, + "learning_rate": 1.4131942483584721e-06, + "loss": 0.6172, + "step": 44886 + }, + { + "epoch": 1.15, + "learning_rate": 1.4131690502975816e-06, + "loss": 0.6387, + "step": 44887 + }, + { + "epoch": 1.15, + "learning_rate": 1.4131438519203464e-06, + "loss": 0.6758, + "step": 44888 + }, + { + "epoch": 1.15, + "learning_rate": 1.4131186532267857e-06, + "loss": 0.6489, + "step": 44889 + }, + { + "epoch": 1.15, + "learning_rate": 1.4130934542169199e-06, + "loss": 0.5928, + "step": 44890 + }, + { + "epoch": 1.15, + "learning_rate": 1.4130682548907669e-06, + "loss": 0.6812, + "step": 44891 + }, + { + "epoch": 1.15, + "learning_rate": 1.4130430552483465e-06, + "loss": 0.668, + "step": 44892 + }, + { + "epoch": 1.15, + "learning_rate": 1.413017855289678e-06, + "loss": 0.6514, + "step": 44893 + }, + { + "epoch": 1.15, + "learning_rate": 1.4129926550147807e-06, + "loss": 0.5815, + "step": 44894 + }, + { + "epoch": 1.15, + "learning_rate": 1.4129674544236742e-06, + "loss": 0.8105, + "step": 44895 + }, + { + "epoch": 1.15, + "learning_rate": 1.4129422535163772e-06, + "loss": 0.5151, + "step": 44896 + }, + { + "epoch": 1.15, + "learning_rate": 1.4129170522929094e-06, + "loss": 0.5864, + "step": 44897 + }, + { + "epoch": 1.15, + "learning_rate": 1.4128918507532903e-06, + "loss": 0.7764, + "step": 44898 + }, + { + "epoch": 1.15, + "learning_rate": 1.4128666488975385e-06, + "loss": 0.7812, + "step": 44899 + }, + { + "epoch": 1.15, + "learning_rate": 1.412841446725674e-06, + "loss": 0.585, + "step": 44900 + }, + { + "epoch": 1.15, + "learning_rate": 1.4128162442377157e-06, + "loss": 0.6689, + "step": 44901 + }, + { + "epoch": 1.15, + "learning_rate": 1.4127910414336828e-06, + "loss": 0.752, + "step": 44902 + }, + { + "epoch": 1.15, + "learning_rate": 1.4127658383135947e-06, + "loss": 0.7695, + "step": 44903 + }, + { + "epoch": 1.15, + "learning_rate": 1.412740634877471e-06, + "loss": 0.5869, + "step": 44904 + }, + { + "epoch": 1.15, + "learning_rate": 1.4127154311253308e-06, + "loss": 0.8359, + "step": 44905 + }, + { + "epoch": 1.15, + "learning_rate": 1.4126902270571932e-06, + "loss": 0.6348, + "step": 44906 + }, + { + "epoch": 1.15, + "learning_rate": 1.4126650226730776e-06, + "loss": 0.4883, + "step": 44907 + }, + { + "epoch": 1.15, + "learning_rate": 1.4126398179730034e-06, + "loss": 0.6826, + "step": 44908 + }, + { + "epoch": 1.15, + "learning_rate": 1.4126146129569902e-06, + "loss": 0.6758, + "step": 44909 + }, + { + "epoch": 1.15, + "learning_rate": 1.4125894076250568e-06, + "loss": 0.6885, + "step": 44910 + }, + { + "epoch": 1.15, + "learning_rate": 1.4125642019772226e-06, + "loss": 0.7012, + "step": 44911 + }, + { + "epoch": 1.15, + "learning_rate": 1.412538996013507e-06, + "loss": 0.605, + "step": 44912 + }, + { + "epoch": 1.15, + "learning_rate": 1.4125137897339292e-06, + "loss": 0.5356, + "step": 44913 + }, + { + "epoch": 1.15, + "learning_rate": 1.4124885831385085e-06, + "loss": 0.5957, + "step": 44914 + }, + { + "epoch": 1.15, + "learning_rate": 1.4124633762272646e-06, + "loss": 0.5806, + "step": 44915 + }, + { + "epoch": 1.15, + "learning_rate": 1.4124381690002163e-06, + "loss": 0.6846, + "step": 44916 + }, + { + "epoch": 1.15, + "learning_rate": 1.4124129614573827e-06, + "loss": 0.7397, + "step": 44917 + }, + { + "epoch": 1.15, + "learning_rate": 1.4123877535987839e-06, + "loss": 0.6572, + "step": 44918 + }, + { + "epoch": 1.15, + "learning_rate": 1.4123625454244385e-06, + "loss": 0.6577, + "step": 44919 + }, + { + "epoch": 1.15, + "learning_rate": 1.4123373369343662e-06, + "loss": 0.6489, + "step": 44920 + }, + { + "epoch": 1.15, + "learning_rate": 1.4123121281285863e-06, + "loss": 0.6836, + "step": 44921 + }, + { + "epoch": 1.15, + "learning_rate": 1.4122869190071175e-06, + "loss": 0.5425, + "step": 44922 + }, + { + "epoch": 1.15, + "learning_rate": 1.41226170956998e-06, + "loss": 0.728, + "step": 44923 + }, + { + "epoch": 1.15, + "learning_rate": 1.4122364998171924e-06, + "loss": 0.6113, + "step": 44924 + }, + { + "epoch": 1.15, + "learning_rate": 1.4122112897487744e-06, + "loss": 0.5396, + "step": 44925 + }, + { + "epoch": 1.15, + "learning_rate": 1.412186079364745e-06, + "loss": 0.7715, + "step": 44926 + }, + { + "epoch": 1.15, + "learning_rate": 1.412160868665124e-06, + "loss": 0.6055, + "step": 44927 + }, + { + "epoch": 1.15, + "learning_rate": 1.4121356576499301e-06, + "loss": 0.7568, + "step": 44928 + }, + { + "epoch": 1.15, + "learning_rate": 1.4121104463191832e-06, + "loss": 0.7598, + "step": 44929 + }, + { + "epoch": 1.15, + "learning_rate": 1.412085234672902e-06, + "loss": 0.6138, + "step": 44930 + }, + { + "epoch": 1.15, + "learning_rate": 1.412060022711106e-06, + "loss": 0.623, + "step": 44931 + }, + { + "epoch": 1.15, + "learning_rate": 1.4120348104338148e-06, + "loss": 0.7607, + "step": 44932 + }, + { + "epoch": 1.15, + "learning_rate": 1.4120095978410471e-06, + "loss": 0.4796, + "step": 44933 + }, + { + "epoch": 1.15, + "learning_rate": 1.411984384932823e-06, + "loss": 0.5295, + "step": 44934 + }, + { + "epoch": 1.15, + "learning_rate": 1.4119591717091614e-06, + "loss": 0.7773, + "step": 44935 + }, + { + "epoch": 1.15, + "learning_rate": 1.4119339581700818e-06, + "loss": 0.5801, + "step": 44936 + }, + { + "epoch": 1.15, + "learning_rate": 1.4119087443156027e-06, + "loss": 0.5203, + "step": 44937 + }, + { + "epoch": 1.15, + "learning_rate": 1.4118835301457443e-06, + "loss": 0.6309, + "step": 44938 + }, + { + "epoch": 1.15, + "learning_rate": 1.4118583156605257e-06, + "loss": 0.7578, + "step": 44939 + }, + { + "epoch": 1.15, + "learning_rate": 1.4118331008599663e-06, + "loss": 0.7061, + "step": 44940 + }, + { + "epoch": 1.15, + "learning_rate": 1.4118078857440849e-06, + "loss": 0.6953, + "step": 44941 + }, + { + "epoch": 1.15, + "learning_rate": 1.4117826703129012e-06, + "loss": 0.7441, + "step": 44942 + }, + { + "epoch": 1.15, + "learning_rate": 1.4117574545664344e-06, + "loss": 0.6304, + "step": 44943 + }, + { + "epoch": 1.15, + "learning_rate": 1.4117322385047042e-06, + "loss": 0.6494, + "step": 44944 + }, + { + "epoch": 1.15, + "learning_rate": 1.4117070221277292e-06, + "loss": 0.646, + "step": 44945 + }, + { + "epoch": 1.15, + "learning_rate": 1.4116818054355292e-06, + "loss": 0.7266, + "step": 44946 + }, + { + "epoch": 1.15, + "learning_rate": 1.4116565884281233e-06, + "loss": 0.7422, + "step": 44947 + }, + { + "epoch": 1.15, + "learning_rate": 1.411631371105531e-06, + "loss": 0.6694, + "step": 44948 + }, + { + "epoch": 1.15, + "learning_rate": 1.4116061534677711e-06, + "loss": 0.7627, + "step": 44949 + }, + { + "epoch": 1.15, + "learning_rate": 1.4115809355148638e-06, + "loss": 0.5083, + "step": 44950 + }, + { + "epoch": 1.15, + "learning_rate": 1.4115557172468275e-06, + "loss": 0.7646, + "step": 44951 + }, + { + "epoch": 1.15, + "learning_rate": 1.4115304986636823e-06, + "loss": 0.5598, + "step": 44952 + }, + { + "epoch": 1.15, + "learning_rate": 1.4115052797654467e-06, + "loss": 0.647, + "step": 44953 + }, + { + "epoch": 1.15, + "learning_rate": 1.4114800605521408e-06, + "loss": 0.6875, + "step": 44954 + }, + { + "epoch": 1.15, + "learning_rate": 1.4114548410237833e-06, + "loss": 0.6279, + "step": 44955 + }, + { + "epoch": 1.15, + "learning_rate": 1.411429621180394e-06, + "loss": 0.5518, + "step": 44956 + }, + { + "epoch": 1.15, + "learning_rate": 1.4114044010219917e-06, + "loss": 0.8145, + "step": 44957 + }, + { + "epoch": 1.15, + "learning_rate": 1.411379180548596e-06, + "loss": 0.6182, + "step": 44958 + }, + { + "epoch": 1.15, + "learning_rate": 1.4113539597602264e-06, + "loss": 0.5605, + "step": 44959 + }, + { + "epoch": 1.15, + "learning_rate": 1.411328738656902e-06, + "loss": 0.7637, + "step": 44960 + }, + { + "epoch": 1.15, + "learning_rate": 1.4113035172386419e-06, + "loss": 0.6934, + "step": 44961 + }, + { + "epoch": 1.15, + "learning_rate": 1.4112782955054653e-06, + "loss": 0.6816, + "step": 44962 + }, + { + "epoch": 1.15, + "learning_rate": 1.4112530734573924e-06, + "loss": 0.7354, + "step": 44963 + }, + { + "epoch": 1.15, + "learning_rate": 1.4112278510944415e-06, + "loss": 0.6572, + "step": 44964 + }, + { + "epoch": 1.15, + "learning_rate": 1.4112026284166328e-06, + "loss": 0.5806, + "step": 44965 + }, + { + "epoch": 1.15, + "learning_rate": 1.4111774054239847e-06, + "loss": 0.5698, + "step": 44966 + }, + { + "epoch": 1.15, + "learning_rate": 1.4111521821165173e-06, + "loss": 0.5557, + "step": 44967 + }, + { + "epoch": 1.15, + "learning_rate": 1.4111269584942491e-06, + "loss": 0.7109, + "step": 44968 + }, + { + "epoch": 1.15, + "learning_rate": 1.4111017345572006e-06, + "loss": 0.5967, + "step": 44969 + }, + { + "epoch": 1.15, + "learning_rate": 1.41107651030539e-06, + "loss": 0.5447, + "step": 44970 + }, + { + "epoch": 1.15, + "learning_rate": 1.411051285738837e-06, + "loss": 0.7158, + "step": 44971 + }, + { + "epoch": 1.15, + "learning_rate": 1.4110260608575607e-06, + "loss": 0.8164, + "step": 44972 + }, + { + "epoch": 1.15, + "learning_rate": 1.4110008356615813e-06, + "loss": 0.7266, + "step": 44973 + }, + { + "epoch": 1.15, + "learning_rate": 1.4109756101509169e-06, + "loss": 0.6113, + "step": 44974 + }, + { + "epoch": 1.15, + "learning_rate": 1.4109503843255875e-06, + "loss": 0.5991, + "step": 44975 + }, + { + "epoch": 1.15, + "learning_rate": 1.4109251581856123e-06, + "loss": 0.5947, + "step": 44976 + }, + { + "epoch": 1.15, + "learning_rate": 1.4108999317310106e-06, + "loss": 0.8076, + "step": 44977 + }, + { + "epoch": 1.15, + "learning_rate": 1.410874704961802e-06, + "loss": 0.6582, + "step": 44978 + }, + { + "epoch": 1.15, + "learning_rate": 1.4108494778780048e-06, + "loss": 0.665, + "step": 44979 + }, + { + "epoch": 1.15, + "learning_rate": 1.41082425047964e-06, + "loss": 0.5928, + "step": 44980 + }, + { + "epoch": 1.15, + "learning_rate": 1.4107990227667255e-06, + "loss": 0.5574, + "step": 44981 + }, + { + "epoch": 1.15, + "learning_rate": 1.410773794739281e-06, + "loss": 0.6929, + "step": 44982 + }, + { + "epoch": 1.15, + "learning_rate": 1.4107485663973257e-06, + "loss": 0.5396, + "step": 44983 + }, + { + "epoch": 1.15, + "learning_rate": 1.4107233377408796e-06, + "loss": 0.7217, + "step": 44984 + }, + { + "epoch": 1.15, + "learning_rate": 1.4106981087699614e-06, + "loss": 0.6221, + "step": 44985 + }, + { + "epoch": 1.15, + "learning_rate": 1.4106728794845904e-06, + "loss": 0.7617, + "step": 44986 + }, + { + "epoch": 1.15, + "learning_rate": 1.410647649884786e-06, + "loss": 0.7256, + "step": 44987 + }, + { + "epoch": 1.15, + "learning_rate": 1.4106224199705678e-06, + "loss": 0.5981, + "step": 44988 + }, + { + "epoch": 1.15, + "learning_rate": 1.4105971897419547e-06, + "loss": 0.7051, + "step": 44989 + }, + { + "epoch": 1.15, + "learning_rate": 1.4105719591989665e-06, + "loss": 0.6011, + "step": 44990 + }, + { + "epoch": 1.15, + "learning_rate": 1.410546728341622e-06, + "loss": 0.5747, + "step": 44991 + }, + { + "epoch": 1.15, + "learning_rate": 1.4105214971699407e-06, + "loss": 0.6455, + "step": 44992 + }, + { + "epoch": 1.15, + "learning_rate": 1.4104962656839418e-06, + "loss": 0.7563, + "step": 44993 + }, + { + "epoch": 1.15, + "learning_rate": 1.4104710338836452e-06, + "loss": 0.6841, + "step": 44994 + }, + { + "epoch": 1.15, + "learning_rate": 1.4104458017690696e-06, + "loss": 0.7246, + "step": 44995 + }, + { + "epoch": 1.15, + "learning_rate": 1.4104205693402346e-06, + "loss": 0.5278, + "step": 44996 + }, + { + "epoch": 1.15, + "learning_rate": 1.4103953365971592e-06, + "loss": 0.5007, + "step": 44997 + }, + { + "epoch": 1.15, + "learning_rate": 1.4103701035398632e-06, + "loss": 0.6885, + "step": 44998 + }, + { + "epoch": 1.15, + "learning_rate": 1.4103448701683656e-06, + "loss": 0.6797, + "step": 44999 + }, + { + "epoch": 1.15, + "learning_rate": 1.410319636482686e-06, + "loss": 0.6338, + "step": 45000 + }, + { + "epoch": 1.15, + "learning_rate": 1.4102944024828434e-06, + "loss": 0.6562, + "step": 45001 + }, + { + "epoch": 1.15, + "learning_rate": 1.410269168168857e-06, + "loss": 0.5942, + "step": 45002 + }, + { + "epoch": 1.15, + "learning_rate": 1.4102439335407466e-06, + "loss": 0.6252, + "step": 45003 + }, + { + "epoch": 1.15, + "learning_rate": 1.410218698598531e-06, + "loss": 0.7583, + "step": 45004 + }, + { + "epoch": 1.15, + "learning_rate": 1.4101934633422303e-06, + "loss": 0.5679, + "step": 45005 + }, + { + "epoch": 1.15, + "learning_rate": 1.410168227771863e-06, + "loss": 0.6484, + "step": 45006 + }, + { + "epoch": 1.15, + "learning_rate": 1.410142991887449e-06, + "loss": 0.5605, + "step": 45007 + }, + { + "epoch": 1.15, + "learning_rate": 1.4101177556890069e-06, + "loss": 0.6035, + "step": 45008 + }, + { + "epoch": 1.15, + "learning_rate": 1.410092519176557e-06, + "loss": 0.5923, + "step": 45009 + }, + { + "epoch": 1.15, + "learning_rate": 1.4100672823501179e-06, + "loss": 0.7168, + "step": 45010 + }, + { + "epoch": 1.15, + "learning_rate": 1.410042045209709e-06, + "loss": 0.6016, + "step": 45011 + }, + { + "epoch": 1.15, + "learning_rate": 1.4100168077553498e-06, + "loss": 0.4954, + "step": 45012 + }, + { + "epoch": 1.15, + "learning_rate": 1.4099915699870598e-06, + "loss": 0.5942, + "step": 45013 + }, + { + "epoch": 1.15, + "learning_rate": 1.4099663319048578e-06, + "loss": 0.5781, + "step": 45014 + }, + { + "epoch": 1.15, + "learning_rate": 1.4099410935087637e-06, + "loss": 0.6719, + "step": 45015 + }, + { + "epoch": 1.15, + "learning_rate": 1.4099158547987965e-06, + "loss": 0.7363, + "step": 45016 + }, + { + "epoch": 1.15, + "learning_rate": 1.4098906157749756e-06, + "loss": 0.6924, + "step": 45017 + }, + { + "epoch": 1.15, + "learning_rate": 1.4098653764373204e-06, + "loss": 0.6357, + "step": 45018 + }, + { + "epoch": 1.15, + "learning_rate": 1.4098401367858496e-06, + "loss": 0.6235, + "step": 45019 + }, + { + "epoch": 1.15, + "learning_rate": 1.4098148968205836e-06, + "loss": 0.6738, + "step": 45020 + }, + { + "epoch": 1.15, + "learning_rate": 1.409789656541541e-06, + "loss": 0.6016, + "step": 45021 + }, + { + "epoch": 1.15, + "learning_rate": 1.4097644159487415e-06, + "loss": 0.5259, + "step": 45022 + }, + { + "epoch": 1.15, + "learning_rate": 1.4097391750422038e-06, + "loss": 0.4688, + "step": 45023 + }, + { + "epoch": 1.15, + "learning_rate": 1.409713933821948e-06, + "loss": 0.833, + "step": 45024 + }, + { + "epoch": 1.15, + "learning_rate": 1.409688692287993e-06, + "loss": 0.6904, + "step": 45025 + }, + { + "epoch": 1.15, + "learning_rate": 1.4096634504403582e-06, + "loss": 0.6914, + "step": 45026 + }, + { + "epoch": 1.15, + "learning_rate": 1.4096382082790628e-06, + "loss": 0.6416, + "step": 45027 + }, + { + "epoch": 1.15, + "learning_rate": 1.4096129658041262e-06, + "loss": 0.7256, + "step": 45028 + }, + { + "epoch": 1.15, + "learning_rate": 1.4095877230155679e-06, + "loss": 0.6528, + "step": 45029 + }, + { + "epoch": 1.15, + "learning_rate": 1.4095624799134075e-06, + "loss": 0.5918, + "step": 45030 + }, + { + "epoch": 1.15, + "learning_rate": 1.4095372364976634e-06, + "loss": 0.6865, + "step": 45031 + }, + { + "epoch": 1.15, + "learning_rate": 1.4095119927683558e-06, + "loss": 0.4747, + "step": 45032 + }, + { + "epoch": 1.15, + "learning_rate": 1.4094867487255036e-06, + "loss": 0.7725, + "step": 45033 + }, + { + "epoch": 1.15, + "learning_rate": 1.409461504369126e-06, + "loss": 0.4197, + "step": 45034 + }, + { + "epoch": 1.15, + "learning_rate": 1.4094362596992428e-06, + "loss": 0.6289, + "step": 45035 + }, + { + "epoch": 1.15, + "learning_rate": 1.4094110147158732e-06, + "loss": 0.5137, + "step": 45036 + }, + { + "epoch": 1.15, + "learning_rate": 1.409385769419036e-06, + "loss": 0.5521, + "step": 45037 + }, + { + "epoch": 1.15, + "learning_rate": 1.4093605238087514e-06, + "loss": 0.562, + "step": 45038 + }, + { + "epoch": 1.15, + "learning_rate": 1.4093352778850378e-06, + "loss": 0.4897, + "step": 45039 + }, + { + "epoch": 1.15, + "learning_rate": 1.4093100316479155e-06, + "loss": 0.3964, + "step": 45040 + }, + { + "epoch": 1.15, + "learning_rate": 1.409284785097403e-06, + "loss": 0.6313, + "step": 45041 + }, + { + "epoch": 1.15, + "learning_rate": 1.40925953823352e-06, + "loss": 0.7183, + "step": 45042 + }, + { + "epoch": 1.15, + "learning_rate": 1.4092342910562857e-06, + "loss": 0.533, + "step": 45043 + }, + { + "epoch": 1.15, + "learning_rate": 1.4092090435657196e-06, + "loss": 0.6636, + "step": 45044 + }, + { + "epoch": 1.15, + "learning_rate": 1.4091837957618413e-06, + "loss": 0.748, + "step": 45045 + }, + { + "epoch": 1.15, + "learning_rate": 1.4091585476446694e-06, + "loss": 0.7842, + "step": 45046 + }, + { + "epoch": 1.15, + "learning_rate": 1.4091332992142237e-06, + "loss": 0.5273, + "step": 45047 + }, + { + "epoch": 1.15, + "learning_rate": 1.4091080504705236e-06, + "loss": 0.8467, + "step": 45048 + }, + { + "epoch": 1.15, + "learning_rate": 1.409082801413588e-06, + "loss": 0.5986, + "step": 45049 + }, + { + "epoch": 1.15, + "learning_rate": 1.4090575520434366e-06, + "loss": 0.7549, + "step": 45050 + }, + { + "epoch": 1.15, + "learning_rate": 1.4090323023600888e-06, + "loss": 0.7793, + "step": 45051 + }, + { + "epoch": 1.15, + "learning_rate": 1.4090070523635636e-06, + "loss": 0.667, + "step": 45052 + }, + { + "epoch": 1.15, + "learning_rate": 1.4089818020538804e-06, + "loss": 0.71, + "step": 45053 + }, + { + "epoch": 1.15, + "learning_rate": 1.408956551431059e-06, + "loss": 0.6108, + "step": 45054 + }, + { + "epoch": 1.15, + "learning_rate": 1.4089313004951183e-06, + "loss": 0.4354, + "step": 45055 + }, + { + "epoch": 1.15, + "learning_rate": 1.4089060492460775e-06, + "loss": 0.7607, + "step": 45056 + }, + { + "epoch": 1.15, + "learning_rate": 1.4088807976839561e-06, + "loss": 0.54, + "step": 45057 + }, + { + "epoch": 1.15, + "learning_rate": 1.4088555458087735e-06, + "loss": 0.6904, + "step": 45058 + }, + { + "epoch": 1.15, + "learning_rate": 1.408830293620549e-06, + "loss": 0.7412, + "step": 45059 + }, + { + "epoch": 1.15, + "learning_rate": 1.4088050411193022e-06, + "loss": 0.6089, + "step": 45060 + }, + { + "epoch": 1.15, + "learning_rate": 1.4087797883050518e-06, + "loss": 0.5427, + "step": 45061 + }, + { + "epoch": 1.15, + "learning_rate": 1.408754535177818e-06, + "loss": 0.7285, + "step": 45062 + }, + { + "epoch": 1.15, + "learning_rate": 1.4087292817376193e-06, + "loss": 0.751, + "step": 45063 + }, + { + "epoch": 1.16, + "learning_rate": 1.4087040279844755e-06, + "loss": 0.6296, + "step": 45064 + }, + { + "epoch": 1.16, + "learning_rate": 1.4086787739184058e-06, + "loss": 0.7568, + "step": 45065 + }, + { + "epoch": 1.16, + "learning_rate": 1.4086535195394296e-06, + "loss": 0.6543, + "step": 45066 + }, + { + "epoch": 1.16, + "learning_rate": 1.4086282648475657e-06, + "loss": 0.8018, + "step": 45067 + }, + { + "epoch": 1.16, + "learning_rate": 1.4086030098428346e-06, + "loss": 0.7119, + "step": 45068 + }, + { + "epoch": 1.16, + "learning_rate": 1.4085777545252548e-06, + "loss": 0.7744, + "step": 45069 + }, + { + "epoch": 1.16, + "learning_rate": 1.4085524988948456e-06, + "loss": 0.5093, + "step": 45070 + }, + { + "epoch": 1.16, + "learning_rate": 1.4085272429516266e-06, + "loss": 0.6274, + "step": 45071 + }, + { + "epoch": 1.16, + "learning_rate": 1.4085019866956173e-06, + "loss": 0.7041, + "step": 45072 + }, + { + "epoch": 1.16, + "learning_rate": 1.4084767301268366e-06, + "loss": 0.6558, + "step": 45073 + }, + { + "epoch": 1.16, + "learning_rate": 1.4084514732453041e-06, + "loss": 0.7148, + "step": 45074 + }, + { + "epoch": 1.16, + "learning_rate": 1.4084262160510392e-06, + "loss": 0.7314, + "step": 45075 + }, + { + "epoch": 1.16, + "learning_rate": 1.408400958544061e-06, + "loss": 0.5225, + "step": 45076 + }, + { + "epoch": 1.16, + "learning_rate": 1.4083757007243886e-06, + "loss": 0.6602, + "step": 45077 + }, + { + "epoch": 1.16, + "learning_rate": 1.4083504425920423e-06, + "loss": 0.7168, + "step": 45078 + }, + { + "epoch": 1.16, + "learning_rate": 1.4083251841470407e-06, + "loss": 0.6443, + "step": 45079 + }, + { + "epoch": 1.16, + "learning_rate": 1.4082999253894033e-06, + "loss": 0.6348, + "step": 45080 + }, + { + "epoch": 1.16, + "learning_rate": 1.4082746663191492e-06, + "loss": 0.7334, + "step": 45081 + }, + { + "epoch": 1.16, + "learning_rate": 1.408249406936298e-06, + "loss": 0.666, + "step": 45082 + }, + { + "epoch": 1.16, + "learning_rate": 1.408224147240869e-06, + "loss": 0.6304, + "step": 45083 + }, + { + "epoch": 1.16, + "learning_rate": 1.4081988872328816e-06, + "loss": 0.5162, + "step": 45084 + }, + { + "epoch": 1.16, + "learning_rate": 1.4081736269123552e-06, + "loss": 0.6514, + "step": 45085 + }, + { + "epoch": 1.16, + "learning_rate": 1.4081483662793087e-06, + "loss": 0.6206, + "step": 45086 + }, + { + "epoch": 1.16, + "learning_rate": 1.408123105333762e-06, + "loss": 0.623, + "step": 45087 + }, + { + "epoch": 1.16, + "learning_rate": 1.4080978440757342e-06, + "loss": 0.6392, + "step": 45088 + }, + { + "epoch": 1.16, + "learning_rate": 1.4080725825052448e-06, + "loss": 0.6096, + "step": 45089 + }, + { + "epoch": 1.16, + "learning_rate": 1.4080473206223128e-06, + "loss": 0.6729, + "step": 45090 + }, + { + "epoch": 1.16, + "learning_rate": 1.4080220584269578e-06, + "loss": 0.7305, + "step": 45091 + }, + { + "epoch": 1.16, + "learning_rate": 1.407996795919199e-06, + "loss": 0.6318, + "step": 45092 + }, + { + "epoch": 1.16, + "learning_rate": 1.4079715330990557e-06, + "loss": 0.4385, + "step": 45093 + }, + { + "epoch": 1.16, + "learning_rate": 1.4079462699665477e-06, + "loss": 0.5986, + "step": 45094 + }, + { + "epoch": 1.16, + "learning_rate": 1.4079210065216938e-06, + "loss": 0.7402, + "step": 45095 + }, + { + "epoch": 1.16, + "learning_rate": 1.4078957427645132e-06, + "loss": 0.7148, + "step": 45096 + }, + { + "epoch": 1.16, + "learning_rate": 1.4078704786950263e-06, + "loss": 0.5693, + "step": 45097 + }, + { + "epoch": 1.16, + "learning_rate": 1.407845214313251e-06, + "loss": 0.7041, + "step": 45098 + }, + { + "epoch": 1.16, + "learning_rate": 1.4078199496192081e-06, + "loss": 0.7949, + "step": 45099 + }, + { + "epoch": 1.16, + "learning_rate": 1.4077946846129157e-06, + "loss": 0.6934, + "step": 45100 + }, + { + "epoch": 1.16, + "learning_rate": 1.407769419294394e-06, + "loss": 0.8213, + "step": 45101 + }, + { + "epoch": 1.16, + "learning_rate": 1.4077441536636614e-06, + "loss": 0.6963, + "step": 45102 + }, + { + "epoch": 1.16, + "learning_rate": 1.4077188877207385e-06, + "loss": 0.7139, + "step": 45103 + }, + { + "epoch": 1.16, + "learning_rate": 1.4076936214656438e-06, + "loss": 0.5791, + "step": 45104 + }, + { + "epoch": 1.16, + "learning_rate": 1.4076683548983965e-06, + "loss": 0.748, + "step": 45105 + }, + { + "epoch": 1.16, + "learning_rate": 1.4076430880190166e-06, + "loss": 0.5645, + "step": 45106 + }, + { + "epoch": 1.16, + "learning_rate": 1.4076178208275234e-06, + "loss": 0.5383, + "step": 45107 + }, + { + "epoch": 1.16, + "learning_rate": 1.4075925533239355e-06, + "loss": 0.5645, + "step": 45108 + }, + { + "epoch": 1.16, + "learning_rate": 1.407567285508273e-06, + "loss": 0.6084, + "step": 45109 + }, + { + "epoch": 1.16, + "learning_rate": 1.4075420173805549e-06, + "loss": 0.4785, + "step": 45110 + }, + { + "epoch": 1.16, + "learning_rate": 1.4075167489408004e-06, + "loss": 0.7051, + "step": 45111 + }, + { + "epoch": 1.16, + "learning_rate": 1.4074914801890293e-06, + "loss": 0.7529, + "step": 45112 + }, + { + "epoch": 1.16, + "learning_rate": 1.4074662111252607e-06, + "loss": 0.3707, + "step": 45113 + }, + { + "epoch": 1.16, + "learning_rate": 1.407440941749514e-06, + "loss": 0.6689, + "step": 45114 + }, + { + "epoch": 1.16, + "learning_rate": 1.4074156720618082e-06, + "loss": 0.7178, + "step": 45115 + }, + { + "epoch": 1.16, + "learning_rate": 1.4073904020621635e-06, + "loss": 0.6914, + "step": 45116 + }, + { + "epoch": 1.16, + "learning_rate": 1.4073651317505981e-06, + "loss": 0.624, + "step": 45117 + }, + { + "epoch": 1.16, + "learning_rate": 1.4073398611271324e-06, + "loss": 0.5703, + "step": 45118 + }, + { + "epoch": 1.16, + "learning_rate": 1.407314590191785e-06, + "loss": 0.6777, + "step": 45119 + }, + { + "epoch": 1.16, + "learning_rate": 1.4072893189445758e-06, + "loss": 0.7119, + "step": 45120 + }, + { + "epoch": 1.16, + "learning_rate": 1.4072640473855236e-06, + "loss": 0.7861, + "step": 45121 + }, + { + "epoch": 1.16, + "learning_rate": 1.4072387755146483e-06, + "loss": 0.7949, + "step": 45122 + }, + { + "epoch": 1.16, + "learning_rate": 1.407213503331969e-06, + "loss": 0.6846, + "step": 45123 + }, + { + "epoch": 1.16, + "learning_rate": 1.4071882308375052e-06, + "loss": 0.7373, + "step": 45124 + }, + { + "epoch": 1.16, + "learning_rate": 1.4071629580312756e-06, + "loss": 0.7109, + "step": 45125 + }, + { + "epoch": 1.16, + "learning_rate": 1.4071376849133003e-06, + "loss": 0.4751, + "step": 45126 + }, + { + "epoch": 1.16, + "learning_rate": 1.4071124114835983e-06, + "loss": 0.7168, + "step": 45127 + }, + { + "epoch": 1.16, + "learning_rate": 1.4070871377421894e-06, + "loss": 0.6377, + "step": 45128 + }, + { + "epoch": 1.16, + "learning_rate": 1.4070618636890923e-06, + "loss": 0.562, + "step": 45129 + }, + { + "epoch": 1.16, + "learning_rate": 1.4070365893243265e-06, + "loss": 0.7607, + "step": 45130 + }, + { + "epoch": 1.16, + "learning_rate": 1.4070113146479116e-06, + "loss": 0.6611, + "step": 45131 + }, + { + "epoch": 1.16, + "learning_rate": 1.406986039659867e-06, + "loss": 0.4856, + "step": 45132 + }, + { + "epoch": 1.16, + "learning_rate": 1.4069607643602118e-06, + "loss": 0.707, + "step": 45133 + }, + { + "epoch": 1.16, + "learning_rate": 1.4069354887489656e-06, + "loss": 0.5532, + "step": 45134 + }, + { + "epoch": 1.16, + "learning_rate": 1.4069102128261477e-06, + "loss": 0.6504, + "step": 45135 + }, + { + "epoch": 1.16, + "learning_rate": 1.4068849365917768e-06, + "loss": 0.6426, + "step": 45136 + }, + { + "epoch": 1.16, + "learning_rate": 1.4068596600458732e-06, + "loss": 0.5996, + "step": 45137 + }, + { + "epoch": 1.16, + "learning_rate": 1.4068343831884559e-06, + "loss": 0.6348, + "step": 45138 + }, + { + "epoch": 1.16, + "learning_rate": 1.4068091060195445e-06, + "loss": 0.3792, + "step": 45139 + }, + { + "epoch": 1.16, + "learning_rate": 1.4067838285391575e-06, + "loss": 0.7827, + "step": 45140 + }, + { + "epoch": 1.16, + "learning_rate": 1.4067585507473152e-06, + "loss": 0.4424, + "step": 45141 + }, + { + "epoch": 1.16, + "learning_rate": 1.4067332726440362e-06, + "loss": 0.604, + "step": 45142 + }, + { + "epoch": 1.16, + "learning_rate": 1.4067079942293405e-06, + "loss": 0.5859, + "step": 45143 + }, + { + "epoch": 1.16, + "learning_rate": 1.4066827155032472e-06, + "loss": 0.6279, + "step": 45144 + }, + { + "epoch": 1.16, + "learning_rate": 1.4066574364657758e-06, + "loss": 0.7188, + "step": 45145 + }, + { + "epoch": 1.16, + "learning_rate": 1.4066321571169453e-06, + "loss": 0.5034, + "step": 45146 + }, + { + "epoch": 1.16, + "learning_rate": 1.4066068774567753e-06, + "loss": 0.6729, + "step": 45147 + }, + { + "epoch": 1.16, + "learning_rate": 1.4065815974852847e-06, + "loss": 0.563, + "step": 45148 + }, + { + "epoch": 1.16, + "learning_rate": 1.4065563172024939e-06, + "loss": 0.5864, + "step": 45149 + }, + { + "epoch": 1.16, + "learning_rate": 1.4065310366084214e-06, + "loss": 0.7646, + "step": 45150 + }, + { + "epoch": 1.16, + "learning_rate": 1.4065057557030867e-06, + "loss": 0.5017, + "step": 45151 + }, + { + "epoch": 1.16, + "learning_rate": 1.4064804744865094e-06, + "loss": 0.5679, + "step": 45152 + }, + { + "epoch": 1.16, + "learning_rate": 1.4064551929587086e-06, + "loss": 0.7285, + "step": 45153 + }, + { + "epoch": 1.16, + "learning_rate": 1.4064299111197035e-06, + "loss": 0.5767, + "step": 45154 + }, + { + "epoch": 1.16, + "learning_rate": 1.406404628969514e-06, + "loss": 0.4088, + "step": 45155 + }, + { + "epoch": 1.16, + "learning_rate": 1.406379346508159e-06, + "loss": 0.7183, + "step": 45156 + }, + { + "epoch": 1.16, + "learning_rate": 1.406354063735658e-06, + "loss": 0.4924, + "step": 45157 + }, + { + "epoch": 1.16, + "learning_rate": 1.4063287806520305e-06, + "loss": 0.5747, + "step": 45158 + }, + { + "epoch": 1.16, + "learning_rate": 1.4063034972572959e-06, + "loss": 0.7393, + "step": 45159 + }, + { + "epoch": 1.16, + "learning_rate": 1.4062782135514733e-06, + "loss": 0.7305, + "step": 45160 + }, + { + "epoch": 1.16, + "learning_rate": 1.406252929534582e-06, + "loss": 0.7881, + "step": 45161 + }, + { + "epoch": 1.16, + "learning_rate": 1.4062276452066415e-06, + "loss": 0.6602, + "step": 45162 + }, + { + "epoch": 1.16, + "learning_rate": 1.4062023605676712e-06, + "loss": 0.6914, + "step": 45163 + }, + { + "epoch": 1.16, + "learning_rate": 1.4061770756176907e-06, + "loss": 0.668, + "step": 45164 + }, + { + "epoch": 1.16, + "learning_rate": 1.4061517903567186e-06, + "loss": 0.5327, + "step": 45165 + }, + { + "epoch": 1.16, + "learning_rate": 1.4061265047847752e-06, + "loss": 0.8604, + "step": 45166 + }, + { + "epoch": 1.16, + "learning_rate": 1.4061012189018791e-06, + "loss": 0.6328, + "step": 45167 + }, + { + "epoch": 1.16, + "learning_rate": 1.4060759327080502e-06, + "loss": 0.5225, + "step": 45168 + }, + { + "epoch": 1.16, + "learning_rate": 1.4060506462033075e-06, + "loss": 0.7139, + "step": 45169 + }, + { + "epoch": 1.16, + "learning_rate": 1.4060253593876706e-06, + "loss": 0.707, + "step": 45170 + }, + { + "epoch": 1.16, + "learning_rate": 1.4060000722611585e-06, + "loss": 0.3513, + "step": 45171 + }, + { + "epoch": 1.16, + "learning_rate": 1.405974784823791e-06, + "loss": 0.5635, + "step": 45172 + }, + { + "epoch": 1.16, + "learning_rate": 1.4059494970755871e-06, + "loss": 0.6558, + "step": 45173 + }, + { + "epoch": 1.16, + "learning_rate": 1.4059242090165667e-06, + "loss": 0.53, + "step": 45174 + }, + { + "epoch": 1.16, + "learning_rate": 1.4058989206467487e-06, + "loss": 0.7705, + "step": 45175 + }, + { + "epoch": 1.16, + "learning_rate": 1.4058736319661524e-06, + "loss": 0.6323, + "step": 45176 + }, + { + "epoch": 1.16, + "learning_rate": 1.4058483429747973e-06, + "loss": 0.6875, + "step": 45177 + }, + { + "epoch": 1.16, + "learning_rate": 1.4058230536727028e-06, + "loss": 0.6357, + "step": 45178 + }, + { + "epoch": 1.16, + "learning_rate": 1.4057977640598883e-06, + "loss": 0.6191, + "step": 45179 + }, + { + "epoch": 1.16, + "learning_rate": 1.4057724741363732e-06, + "loss": 0.6963, + "step": 45180 + }, + { + "epoch": 1.16, + "learning_rate": 1.4057471839021768e-06, + "loss": 0.7812, + "step": 45181 + }, + { + "epoch": 1.16, + "learning_rate": 1.4057218933573182e-06, + "loss": 0.6533, + "step": 45182 + }, + { + "epoch": 1.16, + "learning_rate": 1.4056966025018172e-06, + "loss": 0.4683, + "step": 45183 + }, + { + "epoch": 1.16, + "learning_rate": 1.4056713113356929e-06, + "loss": 0.6475, + "step": 45184 + }, + { + "epoch": 1.16, + "learning_rate": 1.4056460198589648e-06, + "loss": 0.7354, + "step": 45185 + }, + { + "epoch": 1.16, + "learning_rate": 1.4056207280716522e-06, + "loss": 0.5444, + "step": 45186 + }, + { + "epoch": 1.16, + "learning_rate": 1.4055954359737743e-06, + "loss": 0.6143, + "step": 45187 + }, + { + "epoch": 1.16, + "learning_rate": 1.4055701435653504e-06, + "loss": 0.5815, + "step": 45188 + }, + { + "epoch": 1.16, + "learning_rate": 1.4055448508464006e-06, + "loss": 0.5795, + "step": 45189 + }, + { + "epoch": 1.16, + "learning_rate": 1.4055195578169436e-06, + "loss": 0.5981, + "step": 45190 + }, + { + "epoch": 1.16, + "learning_rate": 1.4054942644769989e-06, + "loss": 0.4917, + "step": 45191 + }, + { + "epoch": 1.16, + "learning_rate": 1.4054689708265856e-06, + "loss": 0.6514, + "step": 45192 + }, + { + "epoch": 1.16, + "learning_rate": 1.4054436768657237e-06, + "loss": 0.5356, + "step": 45193 + }, + { + "epoch": 1.16, + "learning_rate": 1.4054183825944324e-06, + "loss": 0.7822, + "step": 45194 + }, + { + "epoch": 1.16, + "learning_rate": 1.4053930880127305e-06, + "loss": 0.7656, + "step": 45195 + }, + { + "epoch": 1.16, + "learning_rate": 1.405367793120638e-06, + "loss": 0.8301, + "step": 45196 + }, + { + "epoch": 1.16, + "learning_rate": 1.4053424979181738e-06, + "loss": 0.8926, + "step": 45197 + }, + { + "epoch": 1.16, + "learning_rate": 1.4053172024053574e-06, + "loss": 0.6118, + "step": 45198 + }, + { + "epoch": 1.16, + "learning_rate": 1.4052919065822085e-06, + "loss": 0.5137, + "step": 45199 + }, + { + "epoch": 1.16, + "learning_rate": 1.4052666104487463e-06, + "loss": 0.6904, + "step": 45200 + }, + { + "epoch": 1.16, + "learning_rate": 1.4052413140049897e-06, + "loss": 0.6777, + "step": 45201 + }, + { + "epoch": 1.16, + "learning_rate": 1.4052160172509588e-06, + "loss": 0.6699, + "step": 45202 + }, + { + "epoch": 1.16, + "learning_rate": 1.4051907201866724e-06, + "loss": 0.585, + "step": 45203 + }, + { + "epoch": 1.16, + "learning_rate": 1.4051654228121505e-06, + "loss": 0.6409, + "step": 45204 + }, + { + "epoch": 1.16, + "learning_rate": 1.4051401251274118e-06, + "loss": 0.5038, + "step": 45205 + }, + { + "epoch": 1.16, + "learning_rate": 1.405114827132476e-06, + "loss": 0.6602, + "step": 45206 + }, + { + "epoch": 1.16, + "learning_rate": 1.4050895288273621e-06, + "loss": 0.5537, + "step": 45207 + }, + { + "epoch": 1.16, + "learning_rate": 1.40506423021209e-06, + "loss": 0.6465, + "step": 45208 + }, + { + "epoch": 1.16, + "learning_rate": 1.4050389312866791e-06, + "loss": 0.5903, + "step": 45209 + }, + { + "epoch": 1.16, + "learning_rate": 1.4050136320511483e-06, + "loss": 0.8564, + "step": 45210 + }, + { + "epoch": 1.16, + "learning_rate": 1.404988332505517e-06, + "loss": 0.5503, + "step": 45211 + }, + { + "epoch": 1.16, + "learning_rate": 1.404963032649805e-06, + "loss": 0.7163, + "step": 45212 + }, + { + "epoch": 1.16, + "learning_rate": 1.404937732484031e-06, + "loss": 0.623, + "step": 45213 + }, + { + "epoch": 1.16, + "learning_rate": 1.4049124320082152e-06, + "loss": 0.7578, + "step": 45214 + }, + { + "epoch": 1.16, + "learning_rate": 1.4048871312223767e-06, + "loss": 0.4048, + "step": 45215 + }, + { + "epoch": 1.16, + "learning_rate": 1.4048618301265348e-06, + "loss": 0.6484, + "step": 45216 + }, + { + "epoch": 1.16, + "learning_rate": 1.4048365287207082e-06, + "loss": 0.6265, + "step": 45217 + }, + { + "epoch": 1.16, + "learning_rate": 1.4048112270049175e-06, + "loss": 0.7324, + "step": 45218 + }, + { + "epoch": 1.16, + "learning_rate": 1.4047859249791812e-06, + "loss": 0.7363, + "step": 45219 + }, + { + "epoch": 1.16, + "learning_rate": 1.4047606226435186e-06, + "loss": 0.8291, + "step": 45220 + }, + { + "epoch": 1.16, + "learning_rate": 1.4047353199979498e-06, + "loss": 0.6982, + "step": 45221 + }, + { + "epoch": 1.16, + "learning_rate": 1.4047100170424936e-06, + "loss": 0.6196, + "step": 45222 + }, + { + "epoch": 1.16, + "learning_rate": 1.4046847137771699e-06, + "loss": 0.8574, + "step": 45223 + }, + { + "epoch": 1.16, + "learning_rate": 1.4046594102019975e-06, + "loss": 0.6138, + "step": 45224 + }, + { + "epoch": 1.16, + "learning_rate": 1.404634106316996e-06, + "loss": 0.7188, + "step": 45225 + }, + { + "epoch": 1.16, + "learning_rate": 1.4046088021221847e-06, + "loss": 0.3544, + "step": 45226 + }, + { + "epoch": 1.16, + "learning_rate": 1.404583497617583e-06, + "loss": 0.5675, + "step": 45227 + }, + { + "epoch": 1.16, + "learning_rate": 1.4045581928032105e-06, + "loss": 0.5605, + "step": 45228 + }, + { + "epoch": 1.16, + "learning_rate": 1.4045328876790863e-06, + "loss": 0.6763, + "step": 45229 + }, + { + "epoch": 1.16, + "learning_rate": 1.4045075822452298e-06, + "loss": 0.7412, + "step": 45230 + }, + { + "epoch": 1.16, + "learning_rate": 1.4044822765016607e-06, + "loss": 0.3661, + "step": 45231 + }, + { + "epoch": 1.16, + "learning_rate": 1.4044569704483977e-06, + "loss": 0.6484, + "step": 45232 + }, + { + "epoch": 1.16, + "learning_rate": 1.404431664085461e-06, + "loss": 0.606, + "step": 45233 + }, + { + "epoch": 1.16, + "learning_rate": 1.4044063574128692e-06, + "loss": 0.5452, + "step": 45234 + }, + { + "epoch": 1.16, + "learning_rate": 1.4043810504306425e-06, + "loss": 0.6543, + "step": 45235 + }, + { + "epoch": 1.16, + "learning_rate": 1.4043557431387996e-06, + "loss": 0.5464, + "step": 45236 + }, + { + "epoch": 1.16, + "learning_rate": 1.40433043553736e-06, + "loss": 0.5933, + "step": 45237 + }, + { + "epoch": 1.16, + "learning_rate": 1.404305127626343e-06, + "loss": 0.7139, + "step": 45238 + }, + { + "epoch": 1.16, + "learning_rate": 1.4042798194057686e-06, + "loss": 0.582, + "step": 45239 + }, + { + "epoch": 1.16, + "learning_rate": 1.4042545108756557e-06, + "loss": 0.6855, + "step": 45240 + }, + { + "epoch": 1.16, + "learning_rate": 1.4042292020360233e-06, + "loss": 0.8262, + "step": 45241 + }, + { + "epoch": 1.16, + "learning_rate": 1.4042038928868915e-06, + "loss": 0.6797, + "step": 45242 + }, + { + "epoch": 1.16, + "learning_rate": 1.4041785834282793e-06, + "loss": 0.5569, + "step": 45243 + }, + { + "epoch": 1.16, + "learning_rate": 1.4041532736602061e-06, + "loss": 0.7246, + "step": 45244 + }, + { + "epoch": 1.16, + "learning_rate": 1.4041279635826915e-06, + "loss": 0.7295, + "step": 45245 + }, + { + "epoch": 1.16, + "learning_rate": 1.4041026531957544e-06, + "loss": 0.7275, + "step": 45246 + }, + { + "epoch": 1.16, + "learning_rate": 1.4040773424994147e-06, + "loss": 0.5103, + "step": 45247 + }, + { + "epoch": 1.16, + "learning_rate": 1.4040520314936914e-06, + "loss": 0.6621, + "step": 45248 + }, + { + "epoch": 1.16, + "learning_rate": 1.4040267201786043e-06, + "loss": 0.6899, + "step": 45249 + }, + { + "epoch": 1.16, + "learning_rate": 1.4040014085541724e-06, + "loss": 0.6143, + "step": 45250 + }, + { + "epoch": 1.16, + "learning_rate": 1.4039760966204151e-06, + "loss": 0.6914, + "step": 45251 + }, + { + "epoch": 1.16, + "learning_rate": 1.403950784377352e-06, + "loss": 0.5613, + "step": 45252 + }, + { + "epoch": 1.16, + "learning_rate": 1.4039254718250022e-06, + "loss": 0.6074, + "step": 45253 + }, + { + "epoch": 1.16, + "learning_rate": 1.4039001589633854e-06, + "loss": 0.7197, + "step": 45254 + }, + { + "epoch": 1.16, + "learning_rate": 1.4038748457925206e-06, + "loss": 0.7793, + "step": 45255 + }, + { + "epoch": 1.16, + "learning_rate": 1.4038495323124278e-06, + "loss": 0.5576, + "step": 45256 + }, + { + "epoch": 1.16, + "learning_rate": 1.4038242185231254e-06, + "loss": 0.5693, + "step": 45257 + }, + { + "epoch": 1.16, + "learning_rate": 1.403798904424634e-06, + "loss": 0.6357, + "step": 45258 + }, + { + "epoch": 1.16, + "learning_rate": 1.4037735900169721e-06, + "loss": 0.8887, + "step": 45259 + }, + { + "epoch": 1.16, + "learning_rate": 1.4037482753001594e-06, + "loss": 0.6411, + "step": 45260 + }, + { + "epoch": 1.16, + "learning_rate": 1.403722960274215e-06, + "loss": 0.5966, + "step": 45261 + }, + { + "epoch": 1.16, + "learning_rate": 1.4036976449391585e-06, + "loss": 0.6064, + "step": 45262 + }, + { + "epoch": 1.16, + "learning_rate": 1.4036723292950092e-06, + "loss": 0.6787, + "step": 45263 + }, + { + "epoch": 1.16, + "learning_rate": 1.4036470133417869e-06, + "loss": 0.7339, + "step": 45264 + }, + { + "epoch": 1.16, + "learning_rate": 1.4036216970795104e-06, + "loss": 0.6992, + "step": 45265 + }, + { + "epoch": 1.16, + "learning_rate": 1.4035963805081992e-06, + "loss": 0.8965, + "step": 45266 + }, + { + "epoch": 1.16, + "learning_rate": 1.403571063627873e-06, + "loss": 0.4575, + "step": 45267 + }, + { + "epoch": 1.16, + "learning_rate": 1.403545746438551e-06, + "loss": 0.5488, + "step": 45268 + }, + { + "epoch": 1.16, + "learning_rate": 1.4035204289402527e-06, + "loss": 0.5938, + "step": 45269 + }, + { + "epoch": 1.16, + "learning_rate": 1.403495111132997e-06, + "loss": 0.6157, + "step": 45270 + }, + { + "epoch": 1.16, + "learning_rate": 1.403469793016804e-06, + "loss": 0.626, + "step": 45271 + }, + { + "epoch": 1.16, + "learning_rate": 1.4034444745916925e-06, + "loss": 0.792, + "step": 45272 + }, + { + "epoch": 1.16, + "learning_rate": 1.4034191558576822e-06, + "loss": 0.71, + "step": 45273 + }, + { + "epoch": 1.16, + "learning_rate": 1.4033938368147926e-06, + "loss": 0.7251, + "step": 45274 + }, + { + "epoch": 1.16, + "learning_rate": 1.4033685174630427e-06, + "loss": 0.6611, + "step": 45275 + }, + { + "epoch": 1.16, + "learning_rate": 1.4033431978024522e-06, + "loss": 0.5198, + "step": 45276 + }, + { + "epoch": 1.16, + "learning_rate": 1.40331787783304e-06, + "loss": 0.6714, + "step": 45277 + }, + { + "epoch": 1.16, + "learning_rate": 1.403292557554826e-06, + "loss": 0.8408, + "step": 45278 + }, + { + "epoch": 1.16, + "learning_rate": 1.4032672369678297e-06, + "loss": 0.6211, + "step": 45279 + }, + { + "epoch": 1.16, + "learning_rate": 1.4032419160720702e-06, + "loss": 0.6221, + "step": 45280 + }, + { + "epoch": 1.16, + "learning_rate": 1.4032165948675667e-06, + "loss": 0.7305, + "step": 45281 + }, + { + "epoch": 1.16, + "learning_rate": 1.4031912733543388e-06, + "loss": 0.5921, + "step": 45282 + }, + { + "epoch": 1.16, + "learning_rate": 1.403165951532406e-06, + "loss": 0.835, + "step": 45283 + }, + { + "epoch": 1.16, + "learning_rate": 1.4031406294017874e-06, + "loss": 0.4893, + "step": 45284 + }, + { + "epoch": 1.16, + "learning_rate": 1.4031153069625026e-06, + "loss": 0.3792, + "step": 45285 + }, + { + "epoch": 1.16, + "learning_rate": 1.4030899842145709e-06, + "loss": 0.752, + "step": 45286 + }, + { + "epoch": 1.16, + "learning_rate": 1.4030646611580119e-06, + "loss": 0.5669, + "step": 45287 + }, + { + "epoch": 1.16, + "learning_rate": 1.4030393377928447e-06, + "loss": 0.6318, + "step": 45288 + }, + { + "epoch": 1.16, + "learning_rate": 1.403014014119089e-06, + "loss": 0.6602, + "step": 45289 + }, + { + "epoch": 1.16, + "learning_rate": 1.4029886901367638e-06, + "loss": 0.7217, + "step": 45290 + }, + { + "epoch": 1.16, + "learning_rate": 1.4029633658458885e-06, + "loss": 0.4653, + "step": 45291 + }, + { + "epoch": 1.16, + "learning_rate": 1.4029380412464832e-06, + "loss": 0.5088, + "step": 45292 + }, + { + "epoch": 1.16, + "learning_rate": 1.4029127163385664e-06, + "loss": 0.5913, + "step": 45293 + }, + { + "epoch": 1.16, + "learning_rate": 1.402887391122158e-06, + "loss": 0.5613, + "step": 45294 + }, + { + "epoch": 1.16, + "learning_rate": 1.4028620655972771e-06, + "loss": 0.4177, + "step": 45295 + }, + { + "epoch": 1.16, + "learning_rate": 1.4028367397639436e-06, + "loss": 0.6738, + "step": 45296 + }, + { + "epoch": 1.16, + "learning_rate": 1.4028114136221761e-06, + "loss": 0.6406, + "step": 45297 + }, + { + "epoch": 1.16, + "learning_rate": 1.4027860871719945e-06, + "loss": 0.6221, + "step": 45298 + }, + { + "epoch": 1.16, + "learning_rate": 1.4027607604134185e-06, + "loss": 0.7676, + "step": 45299 + }, + { + "epoch": 1.16, + "learning_rate": 1.4027354333464668e-06, + "loss": 0.689, + "step": 45300 + }, + { + "epoch": 1.16, + "learning_rate": 1.4027101059711591e-06, + "loss": 0.5161, + "step": 45301 + }, + { + "epoch": 1.16, + "learning_rate": 1.4026847782875147e-06, + "loss": 0.7314, + "step": 45302 + }, + { + "epoch": 1.16, + "learning_rate": 1.402659450295553e-06, + "loss": 0.6143, + "step": 45303 + }, + { + "epoch": 1.16, + "learning_rate": 1.4026341219952937e-06, + "loss": 0.5442, + "step": 45304 + }, + { + "epoch": 1.16, + "learning_rate": 1.402608793386756e-06, + "loss": 0.6416, + "step": 45305 + }, + { + "epoch": 1.16, + "learning_rate": 1.4025834644699592e-06, + "loss": 0.8262, + "step": 45306 + }, + { + "epoch": 1.16, + "learning_rate": 1.4025581352449227e-06, + "loss": 0.5027, + "step": 45307 + }, + { + "epoch": 1.16, + "learning_rate": 1.402532805711666e-06, + "loss": 0.6865, + "step": 45308 + }, + { + "epoch": 1.16, + "learning_rate": 1.4025074758702084e-06, + "loss": 0.6406, + "step": 45309 + }, + { + "epoch": 1.16, + "learning_rate": 1.4024821457205693e-06, + "loss": 0.5742, + "step": 45310 + }, + { + "epoch": 1.16, + "learning_rate": 1.4024568152627683e-06, + "loss": 0.7705, + "step": 45311 + }, + { + "epoch": 1.16, + "learning_rate": 1.4024314844968244e-06, + "loss": 0.7168, + "step": 45312 + }, + { + "epoch": 1.16, + "learning_rate": 1.4024061534227574e-06, + "loss": 0.5674, + "step": 45313 + }, + { + "epoch": 1.16, + "learning_rate": 1.4023808220405866e-06, + "loss": 0.6196, + "step": 45314 + }, + { + "epoch": 1.16, + "learning_rate": 1.4023554903503311e-06, + "loss": 0.7212, + "step": 45315 + }, + { + "epoch": 1.16, + "learning_rate": 1.4023301583520104e-06, + "loss": 0.6001, + "step": 45316 + }, + { + "epoch": 1.16, + "learning_rate": 1.4023048260456443e-06, + "loss": 0.6875, + "step": 45317 + }, + { + "epoch": 1.16, + "learning_rate": 1.4022794934312513e-06, + "loss": 0.7148, + "step": 45318 + }, + { + "epoch": 1.16, + "learning_rate": 1.4022541605088523e-06, + "loss": 0.6611, + "step": 45319 + }, + { + "epoch": 1.16, + "learning_rate": 1.4022288272784652e-06, + "loss": 0.7041, + "step": 45320 + }, + { + "epoch": 1.16, + "learning_rate": 1.4022034937401102e-06, + "loss": 0.7275, + "step": 45321 + }, + { + "epoch": 1.16, + "learning_rate": 1.4021781598938063e-06, + "loss": 0.7637, + "step": 45322 + }, + { + "epoch": 1.16, + "learning_rate": 1.4021528257395732e-06, + "loss": 0.8198, + "step": 45323 + }, + { + "epoch": 1.16, + "learning_rate": 1.4021274912774302e-06, + "loss": 0.6016, + "step": 45324 + }, + { + "epoch": 1.16, + "learning_rate": 1.4021021565073965e-06, + "loss": 0.667, + "step": 45325 + }, + { + "epoch": 1.16, + "learning_rate": 1.4020768214294916e-06, + "loss": 0.6934, + "step": 45326 + }, + { + "epoch": 1.16, + "learning_rate": 1.4020514860437351e-06, + "loss": 0.5918, + "step": 45327 + }, + { + "epoch": 1.16, + "learning_rate": 1.4020261503501463e-06, + "loss": 0.6895, + "step": 45328 + }, + { + "epoch": 1.16, + "learning_rate": 1.4020008143487445e-06, + "loss": 0.6387, + "step": 45329 + }, + { + "epoch": 1.16, + "learning_rate": 1.4019754780395493e-06, + "loss": 0.4182, + "step": 45330 + }, + { + "epoch": 1.16, + "learning_rate": 1.4019501414225798e-06, + "loss": 0.7314, + "step": 45331 + }, + { + "epoch": 1.16, + "learning_rate": 1.4019248044978557e-06, + "loss": 0.6846, + "step": 45332 + }, + { + "epoch": 1.16, + "learning_rate": 1.4018994672653963e-06, + "loss": 0.6763, + "step": 45333 + }, + { + "epoch": 1.16, + "learning_rate": 1.4018741297252209e-06, + "loss": 0.7021, + "step": 45334 + }, + { + "epoch": 1.16, + "learning_rate": 1.4018487918773488e-06, + "loss": 0.5869, + "step": 45335 + }, + { + "epoch": 1.16, + "learning_rate": 1.4018234537217997e-06, + "loss": 0.7432, + "step": 45336 + }, + { + "epoch": 1.16, + "learning_rate": 1.4017981152585927e-06, + "loss": 0.749, + "step": 45337 + }, + { + "epoch": 1.16, + "learning_rate": 1.4017727764877474e-06, + "loss": 0.6782, + "step": 45338 + }, + { + "epoch": 1.16, + "learning_rate": 1.4017474374092832e-06, + "loss": 0.626, + "step": 45339 + }, + { + "epoch": 1.16, + "learning_rate": 1.4017220980232197e-06, + "loss": 0.5068, + "step": 45340 + }, + { + "epoch": 1.16, + "learning_rate": 1.4016967583295758e-06, + "loss": 0.5497, + "step": 45341 + }, + { + "epoch": 1.16, + "learning_rate": 1.4016714183283713e-06, + "loss": 0.5142, + "step": 45342 + }, + { + "epoch": 1.16, + "learning_rate": 1.401646078019625e-06, + "loss": 0.5654, + "step": 45343 + }, + { + "epoch": 1.16, + "learning_rate": 1.4016207374033575e-06, + "loss": 0.8232, + "step": 45344 + }, + { + "epoch": 1.16, + "learning_rate": 1.401595396479587e-06, + "loss": 0.707, + "step": 45345 + }, + { + "epoch": 1.16, + "learning_rate": 1.4015700552483335e-06, + "loss": 0.564, + "step": 45346 + }, + { + "epoch": 1.16, + "learning_rate": 1.4015447137096162e-06, + "loss": 0.6514, + "step": 45347 + }, + { + "epoch": 1.16, + "learning_rate": 1.401519371863455e-06, + "loss": 0.4707, + "step": 45348 + }, + { + "epoch": 1.16, + "learning_rate": 1.4014940297098683e-06, + "loss": 0.5083, + "step": 45349 + }, + { + "epoch": 1.16, + "learning_rate": 1.4014686872488763e-06, + "loss": 0.6079, + "step": 45350 + }, + { + "epoch": 1.16, + "learning_rate": 1.4014433444804982e-06, + "loss": 0.668, + "step": 45351 + }, + { + "epoch": 1.16, + "learning_rate": 1.4014180014047534e-06, + "loss": 0.6008, + "step": 45352 + }, + { + "epoch": 1.16, + "learning_rate": 1.4013926580216613e-06, + "loss": 0.5908, + "step": 45353 + }, + { + "epoch": 1.16, + "learning_rate": 1.4013673143312412e-06, + "loss": 0.6289, + "step": 45354 + }, + { + "epoch": 1.16, + "learning_rate": 1.4013419703335127e-06, + "loss": 0.6348, + "step": 45355 + }, + { + "epoch": 1.16, + "learning_rate": 1.401316626028495e-06, + "loss": 0.8374, + "step": 45356 + }, + { + "epoch": 1.16, + "learning_rate": 1.4012912814162077e-06, + "loss": 0.6042, + "step": 45357 + }, + { + "epoch": 1.16, + "learning_rate": 1.4012659364966702e-06, + "loss": 0.6001, + "step": 45358 + }, + { + "epoch": 1.16, + "learning_rate": 1.4012405912699017e-06, + "loss": 0.5889, + "step": 45359 + }, + { + "epoch": 1.16, + "learning_rate": 1.4012152457359217e-06, + "loss": 0.6768, + "step": 45360 + }, + { + "epoch": 1.16, + "learning_rate": 1.4011898998947498e-06, + "loss": 0.7119, + "step": 45361 + }, + { + "epoch": 1.16, + "learning_rate": 1.4011645537464049e-06, + "loss": 0.5259, + "step": 45362 + }, + { + "epoch": 1.16, + "learning_rate": 1.4011392072909072e-06, + "loss": 0.5181, + "step": 45363 + }, + { + "epoch": 1.16, + "learning_rate": 1.4011138605282753e-06, + "loss": 0.8818, + "step": 45364 + }, + { + "epoch": 1.16, + "learning_rate": 1.4010885134585294e-06, + "loss": 0.6318, + "step": 45365 + }, + { + "epoch": 1.16, + "learning_rate": 1.4010631660816879e-06, + "loss": 0.7715, + "step": 45366 + }, + { + "epoch": 1.16, + "learning_rate": 1.401037818397771e-06, + "loss": 0.5645, + "step": 45367 + }, + { + "epoch": 1.16, + "learning_rate": 1.401012470406798e-06, + "loss": 0.4395, + "step": 45368 + }, + { + "epoch": 1.16, + "learning_rate": 1.4009871221087881e-06, + "loss": 0.6846, + "step": 45369 + }, + { + "epoch": 1.16, + "learning_rate": 1.400961773503761e-06, + "loss": 0.6816, + "step": 45370 + }, + { + "epoch": 1.16, + "learning_rate": 1.4009364245917357e-06, + "loss": 0.5776, + "step": 45371 + }, + { + "epoch": 1.16, + "learning_rate": 1.4009110753727316e-06, + "loss": 0.5942, + "step": 45372 + }, + { + "epoch": 1.16, + "learning_rate": 1.4008857258467685e-06, + "loss": 0.5654, + "step": 45373 + }, + { + "epoch": 1.16, + "learning_rate": 1.400860376013866e-06, + "loss": 0.6538, + "step": 45374 + }, + { + "epoch": 1.16, + "learning_rate": 1.4008350258740426e-06, + "loss": 0.8242, + "step": 45375 + }, + { + "epoch": 1.16, + "learning_rate": 1.4008096754273186e-06, + "loss": 0.728, + "step": 45376 + }, + { + "epoch": 1.16, + "learning_rate": 1.4007843246737127e-06, + "loss": 0.5078, + "step": 45377 + }, + { + "epoch": 1.16, + "learning_rate": 1.4007589736132452e-06, + "loss": 0.6055, + "step": 45378 + }, + { + "epoch": 1.16, + "learning_rate": 1.4007336222459345e-06, + "loss": 0.7529, + "step": 45379 + }, + { + "epoch": 1.16, + "learning_rate": 1.4007082705718007e-06, + "loss": 0.6602, + "step": 45380 + }, + { + "epoch": 1.16, + "learning_rate": 1.4006829185908631e-06, + "loss": 0.7295, + "step": 45381 + }, + { + "epoch": 1.16, + "learning_rate": 1.4006575663031408e-06, + "loss": 0.8618, + "step": 45382 + }, + { + "epoch": 1.16, + "learning_rate": 1.4006322137086536e-06, + "loss": 0.7139, + "step": 45383 + }, + { + "epoch": 1.16, + "learning_rate": 1.400606860807421e-06, + "loss": 0.8281, + "step": 45384 + }, + { + "epoch": 1.16, + "learning_rate": 1.4005815075994614e-06, + "loss": 0.5752, + "step": 45385 + }, + { + "epoch": 1.16, + "learning_rate": 1.4005561540847954e-06, + "loss": 0.6621, + "step": 45386 + }, + { + "epoch": 1.16, + "learning_rate": 1.400530800263442e-06, + "loss": 0.6533, + "step": 45387 + }, + { + "epoch": 1.16, + "learning_rate": 1.4005054461354207e-06, + "loss": 0.6982, + "step": 45388 + }, + { + "epoch": 1.16, + "learning_rate": 1.4004800917007504e-06, + "loss": 0.7339, + "step": 45389 + }, + { + "epoch": 1.16, + "learning_rate": 1.4004547369594513e-06, + "loss": 0.5654, + "step": 45390 + }, + { + "epoch": 1.16, + "learning_rate": 1.400429381911542e-06, + "loss": 0.5038, + "step": 45391 + }, + { + "epoch": 1.16, + "learning_rate": 1.4004040265570427e-06, + "loss": 0.75, + "step": 45392 + }, + { + "epoch": 1.16, + "learning_rate": 1.4003786708959725e-06, + "loss": 0.5137, + "step": 45393 + }, + { + "epoch": 1.16, + "learning_rate": 1.4003533149283505e-06, + "loss": 0.6592, + "step": 45394 + }, + { + "epoch": 1.16, + "learning_rate": 1.4003279586541963e-06, + "loss": 0.5684, + "step": 45395 + }, + { + "epoch": 1.16, + "learning_rate": 1.4003026020735297e-06, + "loss": 0.7148, + "step": 45396 + }, + { + "epoch": 1.16, + "learning_rate": 1.4002772451863696e-06, + "loss": 0.604, + "step": 45397 + }, + { + "epoch": 1.16, + "learning_rate": 1.4002518879927356e-06, + "loss": 0.7568, + "step": 45398 + }, + { + "epoch": 1.16, + "learning_rate": 1.4002265304926475e-06, + "loss": 0.835, + "step": 45399 + }, + { + "epoch": 1.16, + "learning_rate": 1.4002011726861238e-06, + "loss": 0.6655, + "step": 45400 + }, + { + "epoch": 1.16, + "learning_rate": 1.4001758145731848e-06, + "loss": 0.7051, + "step": 45401 + }, + { + "epoch": 1.16, + "learning_rate": 1.4001504561538494e-06, + "loss": 0.5015, + "step": 45402 + }, + { + "epoch": 1.16, + "learning_rate": 1.4001250974281375e-06, + "loss": 0.8047, + "step": 45403 + }, + { + "epoch": 1.16, + "learning_rate": 1.400099738396068e-06, + "loss": 0.833, + "step": 45404 + }, + { + "epoch": 1.16, + "learning_rate": 1.4000743790576606e-06, + "loss": 0.5393, + "step": 45405 + }, + { + "epoch": 1.16, + "learning_rate": 1.4000490194129345e-06, + "loss": 0.4946, + "step": 45406 + }, + { + "epoch": 1.16, + "learning_rate": 1.4000236594619092e-06, + "loss": 0.7363, + "step": 45407 + }, + { + "epoch": 1.16, + "learning_rate": 1.3999982992046044e-06, + "loss": 0.7266, + "step": 45408 + }, + { + "epoch": 1.16, + "learning_rate": 1.3999729386410394e-06, + "loss": 0.5439, + "step": 45409 + }, + { + "epoch": 1.16, + "learning_rate": 1.399947577771233e-06, + "loss": 0.7627, + "step": 45410 + }, + { + "epoch": 1.16, + "learning_rate": 1.3999222165952059e-06, + "loss": 0.7783, + "step": 45411 + }, + { + "epoch": 1.16, + "learning_rate": 1.399896855112976e-06, + "loss": 0.6367, + "step": 45412 + }, + { + "epoch": 1.16, + "learning_rate": 1.399871493324564e-06, + "loss": 0.6191, + "step": 45413 + }, + { + "epoch": 1.16, + "learning_rate": 1.3998461312299884e-06, + "loss": 0.7041, + "step": 45414 + }, + { + "epoch": 1.16, + "learning_rate": 1.399820768829269e-06, + "loss": 0.9307, + "step": 45415 + }, + { + "epoch": 1.16, + "learning_rate": 1.3997954061224255e-06, + "loss": 0.6865, + "step": 45416 + }, + { + "epoch": 1.16, + "learning_rate": 1.399770043109477e-06, + "loss": 0.5117, + "step": 45417 + }, + { + "epoch": 1.16, + "learning_rate": 1.3997446797904428e-06, + "loss": 0.7393, + "step": 45418 + }, + { + "epoch": 1.16, + "learning_rate": 1.3997193161653424e-06, + "loss": 0.749, + "step": 45419 + }, + { + "epoch": 1.16, + "learning_rate": 1.3996939522341957e-06, + "loss": 0.7324, + "step": 45420 + }, + { + "epoch": 1.16, + "learning_rate": 1.3996685879970213e-06, + "loss": 0.7715, + "step": 45421 + }, + { + "epoch": 1.16, + "learning_rate": 1.3996432234538393e-06, + "loss": 0.8594, + "step": 45422 + }, + { + "epoch": 1.16, + "learning_rate": 1.3996178586046688e-06, + "loss": 0.6787, + "step": 45423 + }, + { + "epoch": 1.16, + "learning_rate": 1.3995924934495294e-06, + "loss": 0.7744, + "step": 45424 + }, + { + "epoch": 1.16, + "learning_rate": 1.39956712798844e-06, + "loss": 0.6172, + "step": 45425 + }, + { + "epoch": 1.16, + "learning_rate": 1.3995417622214207e-06, + "loss": 0.667, + "step": 45426 + }, + { + "epoch": 1.16, + "learning_rate": 1.3995163961484907e-06, + "loss": 0.6514, + "step": 45427 + }, + { + "epoch": 1.16, + "learning_rate": 1.3994910297696697e-06, + "loss": 0.75, + "step": 45428 + }, + { + "epoch": 1.16, + "learning_rate": 1.399465663084976e-06, + "loss": 0.6206, + "step": 45429 + }, + { + "epoch": 1.16, + "learning_rate": 1.3994402960944304e-06, + "loss": 0.4434, + "step": 45430 + }, + { + "epoch": 1.16, + "learning_rate": 1.3994149287980512e-06, + "loss": 0.7627, + "step": 45431 + }, + { + "epoch": 1.16, + "learning_rate": 1.3993895611958588e-06, + "loss": 0.4473, + "step": 45432 + }, + { + "epoch": 1.16, + "learning_rate": 1.3993641932878721e-06, + "loss": 0.6416, + "step": 45433 + }, + { + "epoch": 1.16, + "learning_rate": 1.3993388250741107e-06, + "loss": 0.6035, + "step": 45434 + }, + { + "epoch": 1.16, + "learning_rate": 1.3993134565545938e-06, + "loss": 0.7129, + "step": 45435 + }, + { + "epoch": 1.16, + "learning_rate": 1.3992880877293407e-06, + "loss": 0.686, + "step": 45436 + }, + { + "epoch": 1.16, + "learning_rate": 1.3992627185983711e-06, + "loss": 0.2832, + "step": 45437 + }, + { + "epoch": 1.16, + "learning_rate": 1.3992373491617047e-06, + "loss": 0.5327, + "step": 45438 + }, + { + "epoch": 1.16, + "learning_rate": 1.3992119794193607e-06, + "loss": 0.7656, + "step": 45439 + }, + { + "epoch": 1.16, + "learning_rate": 1.3991866093713582e-06, + "loss": 0.5737, + "step": 45440 + }, + { + "epoch": 1.16, + "learning_rate": 1.399161239017717e-06, + "loss": 0.5122, + "step": 45441 + }, + { + "epoch": 1.16, + "learning_rate": 1.3991358683584563e-06, + "loss": 0.6401, + "step": 45442 + }, + { + "epoch": 1.16, + "learning_rate": 1.3991104973935956e-06, + "loss": 0.6602, + "step": 45443 + }, + { + "epoch": 1.16, + "learning_rate": 1.3990851261231545e-06, + "loss": 0.6736, + "step": 45444 + }, + { + "epoch": 1.16, + "learning_rate": 1.3990597545471521e-06, + "loss": 0.6362, + "step": 45445 + }, + { + "epoch": 1.16, + "learning_rate": 1.3990343826656079e-06, + "loss": 0.7412, + "step": 45446 + }, + { + "epoch": 1.16, + "learning_rate": 1.3990090104785416e-06, + "loss": 0.6104, + "step": 45447 + }, + { + "epoch": 1.16, + "learning_rate": 1.3989836379859723e-06, + "loss": 0.6582, + "step": 45448 + }, + { + "epoch": 1.16, + "learning_rate": 1.39895826518792e-06, + "loss": 0.5195, + "step": 45449 + }, + { + "epoch": 1.16, + "learning_rate": 1.398932892084403e-06, + "loss": 0.835, + "step": 45450 + }, + { + "epoch": 1.16, + "learning_rate": 1.398907518675442e-06, + "loss": 0.7568, + "step": 45451 + }, + { + "epoch": 1.16, + "learning_rate": 1.3988821449610555e-06, + "loss": 0.6665, + "step": 45452 + }, + { + "epoch": 1.16, + "learning_rate": 1.3988567709412638e-06, + "loss": 0.6704, + "step": 45453 + }, + { + "epoch": 1.17, + "learning_rate": 1.3988313966160852e-06, + "loss": 0.5801, + "step": 45454 + }, + { + "epoch": 1.17, + "learning_rate": 1.3988060219855402e-06, + "loss": 0.6377, + "step": 45455 + }, + { + "epoch": 1.17, + "learning_rate": 1.3987806470496474e-06, + "loss": 0.5771, + "step": 45456 + }, + { + "epoch": 1.17, + "learning_rate": 1.3987552718084268e-06, + "loss": 0.3979, + "step": 45457 + }, + { + "epoch": 1.17, + "learning_rate": 1.3987298962618976e-06, + "loss": 0.4705, + "step": 45458 + }, + { + "epoch": 1.17, + "learning_rate": 1.3987045204100793e-06, + "loss": 0.7441, + "step": 45459 + }, + { + "epoch": 1.17, + "learning_rate": 1.3986791442529914e-06, + "loss": 0.4351, + "step": 45460 + }, + { + "epoch": 1.17, + "learning_rate": 1.398653767790653e-06, + "loss": 0.5762, + "step": 45461 + }, + { + "epoch": 1.17, + "learning_rate": 1.3986283910230836e-06, + "loss": 0.5601, + "step": 45462 + }, + { + "epoch": 1.17, + "learning_rate": 1.3986030139503028e-06, + "loss": 0.7373, + "step": 45463 + }, + { + "epoch": 1.17, + "learning_rate": 1.3985776365723302e-06, + "loss": 0.6396, + "step": 45464 + }, + { + "epoch": 1.17, + "learning_rate": 1.398552258889185e-06, + "loss": 0.5781, + "step": 45465 + }, + { + "epoch": 1.17, + "learning_rate": 1.3985268809008866e-06, + "loss": 0.6587, + "step": 45466 + }, + { + "epoch": 1.17, + "learning_rate": 1.3985015026074545e-06, + "loss": 0.6934, + "step": 45467 + }, + { + "epoch": 1.17, + "learning_rate": 1.3984761240089085e-06, + "loss": 0.7412, + "step": 45468 + }, + { + "epoch": 1.17, + "learning_rate": 1.398450745105267e-06, + "loss": 0.749, + "step": 45469 + }, + { + "epoch": 1.17, + "learning_rate": 1.3984253658965503e-06, + "loss": 0.8057, + "step": 45470 + }, + { + "epoch": 1.17, + "learning_rate": 1.3983999863827778e-06, + "loss": 0.749, + "step": 45471 + }, + { + "epoch": 1.17, + "learning_rate": 1.3983746065639688e-06, + "loss": 0.6812, + "step": 45472 + }, + { + "epoch": 1.17, + "learning_rate": 1.3983492264401423e-06, + "loss": 0.5708, + "step": 45473 + }, + { + "epoch": 1.17, + "learning_rate": 1.3983238460113186e-06, + "loss": 0.6489, + "step": 45474 + }, + { + "epoch": 1.17, + "learning_rate": 1.3982984652775162e-06, + "loss": 0.5903, + "step": 45475 + }, + { + "epoch": 1.17, + "learning_rate": 1.3982730842387553e-06, + "loss": 0.5493, + "step": 45476 + }, + { + "epoch": 1.17, + "learning_rate": 1.3982477028950547e-06, + "loss": 0.5894, + "step": 45477 + }, + { + "epoch": 1.17, + "learning_rate": 1.3982223212464345e-06, + "loss": 0.5923, + "step": 45478 + }, + { + "epoch": 1.17, + "learning_rate": 1.3981969392929135e-06, + "loss": 0.6973, + "step": 45479 + }, + { + "epoch": 1.17, + "learning_rate": 1.3981715570345118e-06, + "loss": 0.7852, + "step": 45480 + }, + { + "epoch": 1.17, + "learning_rate": 1.3981461744712478e-06, + "loss": 0.7383, + "step": 45481 + }, + { + "epoch": 1.17, + "learning_rate": 1.398120791603142e-06, + "loss": 0.5811, + "step": 45482 + }, + { + "epoch": 1.17, + "learning_rate": 1.3980954084302136e-06, + "loss": 0.6396, + "step": 45483 + }, + { + "epoch": 1.17, + "learning_rate": 1.3980700249524815e-06, + "loss": 0.5488, + "step": 45484 + }, + { + "epoch": 1.17, + "learning_rate": 1.3980446411699655e-06, + "loss": 0.6699, + "step": 45485 + }, + { + "epoch": 1.17, + "learning_rate": 1.3980192570826853e-06, + "loss": 0.5737, + "step": 45486 + }, + { + "epoch": 1.17, + "learning_rate": 1.3979938726906597e-06, + "loss": 0.707, + "step": 45487 + }, + { + "epoch": 1.17, + "learning_rate": 1.3979684879939088e-06, + "loss": 0.6162, + "step": 45488 + }, + { + "epoch": 1.17, + "learning_rate": 1.3979431029924518e-06, + "loss": 0.7041, + "step": 45489 + }, + { + "epoch": 1.17, + "learning_rate": 1.3979177176863078e-06, + "loss": 0.6104, + "step": 45490 + }, + { + "epoch": 1.17, + "learning_rate": 1.3978923320754966e-06, + "loss": 0.7061, + "step": 45491 + }, + { + "epoch": 1.17, + "learning_rate": 1.3978669461600373e-06, + "loss": 0.7134, + "step": 45492 + }, + { + "epoch": 1.17, + "learning_rate": 1.39784155993995e-06, + "loss": 0.7969, + "step": 45493 + }, + { + "epoch": 1.17, + "learning_rate": 1.3978161734152533e-06, + "loss": 0.5679, + "step": 45494 + }, + { + "epoch": 1.17, + "learning_rate": 1.3977907865859675e-06, + "loss": 0.5698, + "step": 45495 + }, + { + "epoch": 1.17, + "learning_rate": 1.397765399452111e-06, + "loss": 0.7842, + "step": 45496 + }, + { + "epoch": 1.17, + "learning_rate": 1.3977400120137044e-06, + "loss": 0.647, + "step": 45497 + }, + { + "epoch": 1.17, + "learning_rate": 1.3977146242707662e-06, + "loss": 0.7314, + "step": 45498 + }, + { + "epoch": 1.17, + "learning_rate": 1.3976892362233163e-06, + "loss": 0.5522, + "step": 45499 + }, + { + "epoch": 1.17, + "learning_rate": 1.397663847871374e-06, + "loss": 0.7236, + "step": 45500 + }, + { + "epoch": 1.17, + "learning_rate": 1.397638459214959e-06, + "loss": 0.7393, + "step": 45501 + }, + { + "epoch": 1.17, + "learning_rate": 1.3976130702540903e-06, + "loss": 0.623, + "step": 45502 + }, + { + "epoch": 1.17, + "learning_rate": 1.3975876809887877e-06, + "loss": 0.5688, + "step": 45503 + }, + { + "epoch": 1.17, + "learning_rate": 1.3975622914190703e-06, + "loss": 0.7334, + "step": 45504 + }, + { + "epoch": 1.17, + "learning_rate": 1.3975369015449578e-06, + "loss": 0.5999, + "step": 45505 + }, + { + "epoch": 1.17, + "learning_rate": 1.3975115113664695e-06, + "loss": 0.6343, + "step": 45506 + }, + { + "epoch": 1.17, + "learning_rate": 1.397486120883625e-06, + "loss": 0.6025, + "step": 45507 + }, + { + "epoch": 1.17, + "learning_rate": 1.3974607300964438e-06, + "loss": 0.6685, + "step": 45508 + }, + { + "epoch": 1.17, + "learning_rate": 1.397435339004945e-06, + "loss": 0.541, + "step": 45509 + }, + { + "epoch": 1.17, + "learning_rate": 1.3974099476091483e-06, + "loss": 0.5566, + "step": 45510 + }, + { + "epoch": 1.17, + "learning_rate": 1.397384555909073e-06, + "loss": 0.6494, + "step": 45511 + }, + { + "epoch": 1.17, + "learning_rate": 1.3973591639047387e-06, + "loss": 0.4639, + "step": 45512 + }, + { + "epoch": 1.17, + "learning_rate": 1.3973337715961648e-06, + "loss": 0.7168, + "step": 45513 + }, + { + "epoch": 1.17, + "learning_rate": 1.3973083789833706e-06, + "loss": 0.6831, + "step": 45514 + }, + { + "epoch": 1.17, + "learning_rate": 1.3972829860663757e-06, + "loss": 0.707, + "step": 45515 + }, + { + "epoch": 1.17, + "learning_rate": 1.3972575928451996e-06, + "loss": 0.7188, + "step": 45516 + }, + { + "epoch": 1.17, + "learning_rate": 1.3972321993198612e-06, + "loss": 0.7285, + "step": 45517 + }, + { + "epoch": 1.17, + "learning_rate": 1.3972068054903812e-06, + "loss": 0.7876, + "step": 45518 + }, + { + "epoch": 1.17, + "learning_rate": 1.3971814113567772e-06, + "loss": 0.5796, + "step": 45519 + }, + { + "epoch": 1.17, + "learning_rate": 1.3971560169190704e-06, + "loss": 0.6526, + "step": 45520 + }, + { + "epoch": 1.17, + "learning_rate": 1.3971306221772792e-06, + "loss": 0.6499, + "step": 45521 + }, + { + "epoch": 1.17, + "learning_rate": 1.3971052271314235e-06, + "loss": 0.6519, + "step": 45522 + }, + { + "epoch": 1.17, + "learning_rate": 1.3970798317815225e-06, + "loss": 0.5947, + "step": 45523 + }, + { + "epoch": 1.17, + "learning_rate": 1.3970544361275956e-06, + "loss": 0.5757, + "step": 45524 + }, + { + "epoch": 1.17, + "learning_rate": 1.3970290401696624e-06, + "loss": 0.5381, + "step": 45525 + }, + { + "epoch": 1.17, + "learning_rate": 1.3970036439077425e-06, + "loss": 0.6729, + "step": 45526 + }, + { + "epoch": 1.17, + "learning_rate": 1.396978247341855e-06, + "loss": 0.7334, + "step": 45527 + }, + { + "epoch": 1.17, + "learning_rate": 1.3969528504720197e-06, + "loss": 0.7197, + "step": 45528 + }, + { + "epoch": 1.17, + "learning_rate": 1.3969274532982556e-06, + "loss": 0.5708, + "step": 45529 + }, + { + "epoch": 1.17, + "learning_rate": 1.3969020558205827e-06, + "loss": 0.5249, + "step": 45530 + }, + { + "epoch": 1.17, + "learning_rate": 1.3968766580390198e-06, + "loss": 0.6172, + "step": 45531 + }, + { + "epoch": 1.17, + "learning_rate": 1.396851259953587e-06, + "loss": 0.6758, + "step": 45532 + }, + { + "epoch": 1.17, + "learning_rate": 1.3968258615643031e-06, + "loss": 0.6865, + "step": 45533 + }, + { + "epoch": 1.17, + "learning_rate": 1.3968004628711883e-06, + "loss": 0.582, + "step": 45534 + }, + { + "epoch": 1.17, + "learning_rate": 1.3967750638742612e-06, + "loss": 0.594, + "step": 45535 + }, + { + "epoch": 1.17, + "learning_rate": 1.396749664573542e-06, + "loss": 0.6875, + "step": 45536 + }, + { + "epoch": 1.17, + "learning_rate": 1.3967242649690496e-06, + "loss": 0.5432, + "step": 45537 + }, + { + "epoch": 1.17, + "learning_rate": 1.396698865060804e-06, + "loss": 0.5913, + "step": 45538 + }, + { + "epoch": 1.17, + "learning_rate": 1.396673464848824e-06, + "loss": 0.6382, + "step": 45539 + }, + { + "epoch": 1.17, + "learning_rate": 1.3966480643331296e-06, + "loss": 0.4805, + "step": 45540 + }, + { + "epoch": 1.17, + "learning_rate": 1.3966226635137397e-06, + "loss": 0.7119, + "step": 45541 + }, + { + "epoch": 1.17, + "learning_rate": 1.3965972623906744e-06, + "loss": 0.4362, + "step": 45542 + }, + { + "epoch": 1.17, + "learning_rate": 1.3965718609639528e-06, + "loss": 0.7529, + "step": 45543 + }, + { + "epoch": 1.17, + "learning_rate": 1.396546459233594e-06, + "loss": 0.7773, + "step": 45544 + }, + { + "epoch": 1.17, + "learning_rate": 1.3965210571996183e-06, + "loss": 0.6218, + "step": 45545 + }, + { + "epoch": 1.17, + "learning_rate": 1.396495654862044e-06, + "loss": 0.6855, + "step": 45546 + }, + { + "epoch": 1.17, + "learning_rate": 1.3964702522208918e-06, + "loss": 0.6858, + "step": 45547 + }, + { + "epoch": 1.17, + "learning_rate": 1.3964448492761804e-06, + "loss": 0.4717, + "step": 45548 + }, + { + "epoch": 1.17, + "learning_rate": 1.3964194460279295e-06, + "loss": 0.5479, + "step": 45549 + }, + { + "epoch": 1.17, + "learning_rate": 1.3963940424761582e-06, + "loss": 0.6626, + "step": 45550 + }, + { + "epoch": 1.17, + "learning_rate": 1.3963686386208864e-06, + "loss": 0.6016, + "step": 45551 + }, + { + "epoch": 1.17, + "learning_rate": 1.3963432344621331e-06, + "loss": 0.5146, + "step": 45552 + }, + { + "epoch": 1.17, + "learning_rate": 1.3963178299999182e-06, + "loss": 0.5493, + "step": 45553 + }, + { + "epoch": 1.17, + "learning_rate": 1.3962924252342612e-06, + "loss": 0.6099, + "step": 45554 + }, + { + "epoch": 1.17, + "learning_rate": 1.396267020165181e-06, + "loss": 0.6226, + "step": 45555 + }, + { + "epoch": 1.17, + "learning_rate": 1.3962416147926975e-06, + "loss": 0.7207, + "step": 45556 + }, + { + "epoch": 1.17, + "learning_rate": 1.3962162091168299e-06, + "loss": 0.5981, + "step": 45557 + }, + { + "epoch": 1.17, + "learning_rate": 1.396190803137598e-06, + "loss": 0.6287, + "step": 45558 + }, + { + "epoch": 1.17, + "learning_rate": 1.3961653968550206e-06, + "loss": 0.6816, + "step": 45559 + }, + { + "epoch": 1.17, + "learning_rate": 1.396139990269118e-06, + "loss": 0.6379, + "step": 45560 + }, + { + "epoch": 1.17, + "learning_rate": 1.396114583379909e-06, + "loss": 0.7109, + "step": 45561 + }, + { + "epoch": 1.17, + "learning_rate": 1.3960891761874134e-06, + "loss": 0.6367, + "step": 45562 + }, + { + "epoch": 1.17, + "learning_rate": 1.3960637686916506e-06, + "loss": 0.5977, + "step": 45563 + }, + { + "epoch": 1.17, + "learning_rate": 1.3960383608926398e-06, + "loss": 0.6758, + "step": 45564 + }, + { + "epoch": 1.17, + "learning_rate": 1.3960129527904006e-06, + "loss": 0.5906, + "step": 45565 + }, + { + "epoch": 1.17, + "learning_rate": 1.3959875443849525e-06, + "loss": 0.6167, + "step": 45566 + }, + { + "epoch": 1.17, + "learning_rate": 1.395962135676315e-06, + "loss": 0.5981, + "step": 45567 + }, + { + "epoch": 1.17, + "learning_rate": 1.3959367266645076e-06, + "loss": 0.6675, + "step": 45568 + }, + { + "epoch": 1.17, + "learning_rate": 1.3959113173495497e-06, + "loss": 0.8135, + "step": 45569 + }, + { + "epoch": 1.17, + "learning_rate": 1.3958859077314605e-06, + "loss": 0.6934, + "step": 45570 + }, + { + "epoch": 1.17, + "learning_rate": 1.3958604978102594e-06, + "loss": 0.6353, + "step": 45571 + }, + { + "epoch": 1.17, + "learning_rate": 1.3958350875859668e-06, + "loss": 0.6323, + "step": 45572 + }, + { + "epoch": 1.17, + "learning_rate": 1.395809677058601e-06, + "loss": 0.7031, + "step": 45573 + }, + { + "epoch": 1.17, + "learning_rate": 1.395784266228182e-06, + "loss": 0.4314, + "step": 45574 + }, + { + "epoch": 1.17, + "learning_rate": 1.3957588550947292e-06, + "loss": 0.3771, + "step": 45575 + }, + { + "epoch": 1.17, + "learning_rate": 1.3957334436582625e-06, + "loss": 0.6445, + "step": 45576 + }, + { + "epoch": 1.17, + "learning_rate": 1.3957080319188002e-06, + "loss": 0.5264, + "step": 45577 + }, + { + "epoch": 1.17, + "learning_rate": 1.3956826198763627e-06, + "loss": 0.6797, + "step": 45578 + }, + { + "epoch": 1.17, + "learning_rate": 1.3956572075309693e-06, + "loss": 0.6162, + "step": 45579 + }, + { + "epoch": 1.17, + "learning_rate": 1.3956317948826392e-06, + "loss": 0.6904, + "step": 45580 + }, + { + "epoch": 1.17, + "learning_rate": 1.3956063819313921e-06, + "loss": 0.582, + "step": 45581 + }, + { + "epoch": 1.17, + "learning_rate": 1.3955809686772475e-06, + "loss": 0.6836, + "step": 45582 + }, + { + "epoch": 1.17, + "learning_rate": 1.395555555120225e-06, + "loss": 0.7188, + "step": 45583 + }, + { + "epoch": 1.17, + "learning_rate": 1.3955301412603434e-06, + "loss": 0.6211, + "step": 45584 + }, + { + "epoch": 1.17, + "learning_rate": 1.3955047270976226e-06, + "loss": 0.5752, + "step": 45585 + }, + { + "epoch": 1.17, + "learning_rate": 1.3954793126320818e-06, + "loss": 0.728, + "step": 45586 + }, + { + "epoch": 1.17, + "learning_rate": 1.3954538978637409e-06, + "loss": 0.627, + "step": 45587 + }, + { + "epoch": 1.17, + "learning_rate": 1.3954284827926195e-06, + "loss": 0.5918, + "step": 45588 + }, + { + "epoch": 1.17, + "learning_rate": 1.3954030674187363e-06, + "loss": 0.6104, + "step": 45589 + }, + { + "epoch": 1.17, + "learning_rate": 1.395377651742111e-06, + "loss": 0.6631, + "step": 45590 + }, + { + "epoch": 1.17, + "learning_rate": 1.3953522357627636e-06, + "loss": 0.6123, + "step": 45591 + }, + { + "epoch": 1.17, + "learning_rate": 1.3953268194807128e-06, + "loss": 0.5737, + "step": 45592 + }, + { + "epoch": 1.17, + "learning_rate": 1.395301402895979e-06, + "loss": 0.79, + "step": 45593 + }, + { + "epoch": 1.17, + "learning_rate": 1.3952759860085804e-06, + "loss": 0.6846, + "step": 45594 + }, + { + "epoch": 1.17, + "learning_rate": 1.3952505688185375e-06, + "loss": 0.7246, + "step": 45595 + }, + { + "epoch": 1.17, + "learning_rate": 1.3952251513258693e-06, + "loss": 0.6768, + "step": 45596 + }, + { + "epoch": 1.17, + "learning_rate": 1.3951997335305956e-06, + "loss": 0.6357, + "step": 45597 + }, + { + "epoch": 1.17, + "learning_rate": 1.3951743154327355e-06, + "loss": 0.3943, + "step": 45598 + }, + { + "epoch": 1.17, + "learning_rate": 1.3951488970323084e-06, + "loss": 0.752, + "step": 45599 + }, + { + "epoch": 1.17, + "learning_rate": 1.3951234783293343e-06, + "loss": 0.5776, + "step": 45600 + }, + { + "epoch": 1.17, + "learning_rate": 1.395098059323832e-06, + "loss": 0.6084, + "step": 45601 + }, + { + "epoch": 1.17, + "learning_rate": 1.3950726400158216e-06, + "loss": 0.5137, + "step": 45602 + }, + { + "epoch": 1.17, + "learning_rate": 1.3950472204053222e-06, + "loss": 0.5991, + "step": 45603 + }, + { + "epoch": 1.17, + "learning_rate": 1.395021800492353e-06, + "loss": 0.5083, + "step": 45604 + }, + { + "epoch": 1.17, + "learning_rate": 1.394996380276934e-06, + "loss": 0.7578, + "step": 45605 + }, + { + "epoch": 1.17, + "learning_rate": 1.3949709597590844e-06, + "loss": 0.481, + "step": 45606 + }, + { + "epoch": 1.17, + "learning_rate": 1.3949455389388236e-06, + "loss": 0.585, + "step": 45607 + }, + { + "epoch": 1.17, + "learning_rate": 1.3949201178161715e-06, + "loss": 0.6475, + "step": 45608 + }, + { + "epoch": 1.17, + "learning_rate": 1.394894696391147e-06, + "loss": 0.6406, + "step": 45609 + }, + { + "epoch": 1.17, + "learning_rate": 1.3948692746637699e-06, + "loss": 0.7236, + "step": 45610 + }, + { + "epoch": 1.17, + "learning_rate": 1.3948438526340592e-06, + "loss": 0.6816, + "step": 45611 + }, + { + "epoch": 1.17, + "learning_rate": 1.394818430302035e-06, + "loss": 0.7441, + "step": 45612 + }, + { + "epoch": 1.17, + "learning_rate": 1.3947930076677166e-06, + "loss": 0.5759, + "step": 45613 + }, + { + "epoch": 1.17, + "learning_rate": 1.3947675847311232e-06, + "loss": 0.4761, + "step": 45614 + }, + { + "epoch": 1.17, + "learning_rate": 1.394742161492274e-06, + "loss": 0.7148, + "step": 45615 + }, + { + "epoch": 1.17, + "learning_rate": 1.3947167379511894e-06, + "loss": 0.7959, + "step": 45616 + }, + { + "epoch": 1.17, + "learning_rate": 1.3946913141078883e-06, + "loss": 0.6812, + "step": 45617 + }, + { + "epoch": 1.17, + "learning_rate": 1.39466588996239e-06, + "loss": 0.373, + "step": 45618 + }, + { + "epoch": 1.17, + "learning_rate": 1.3946404655147143e-06, + "loss": 0.6699, + "step": 45619 + }, + { + "epoch": 1.17, + "learning_rate": 1.3946150407648806e-06, + "loss": 0.5039, + "step": 45620 + }, + { + "epoch": 1.17, + "learning_rate": 1.3945896157129083e-06, + "loss": 0.7812, + "step": 45621 + }, + { + "epoch": 1.17, + "learning_rate": 1.3945641903588168e-06, + "loss": 0.6165, + "step": 45622 + }, + { + "epoch": 1.17, + "learning_rate": 1.3945387647026259e-06, + "loss": 0.5657, + "step": 45623 + }, + { + "epoch": 1.17, + "learning_rate": 1.3945133387443542e-06, + "loss": 0.5245, + "step": 45624 + }, + { + "epoch": 1.17, + "learning_rate": 1.3944879124840223e-06, + "loss": 0.6968, + "step": 45625 + }, + { + "epoch": 1.17, + "learning_rate": 1.3944624859216488e-06, + "loss": 0.7178, + "step": 45626 + }, + { + "epoch": 1.17, + "learning_rate": 1.394437059057254e-06, + "loss": 0.4956, + "step": 45627 + }, + { + "epoch": 1.17, + "learning_rate": 1.3944116318908566e-06, + "loss": 0.585, + "step": 45628 + }, + { + "epoch": 1.17, + "learning_rate": 1.3943862044224764e-06, + "loss": 0.5464, + "step": 45629 + }, + { + "epoch": 1.17, + "learning_rate": 1.3943607766521325e-06, + "loss": 0.6084, + "step": 45630 + }, + { + "epoch": 1.17, + "learning_rate": 1.3943353485798451e-06, + "loss": 0.6545, + "step": 45631 + }, + { + "epoch": 1.17, + "learning_rate": 1.3943099202056328e-06, + "loss": 0.5825, + "step": 45632 + }, + { + "epoch": 1.17, + "learning_rate": 1.3942844915295162e-06, + "loss": 0.606, + "step": 45633 + }, + { + "epoch": 1.17, + "learning_rate": 1.3942590625515136e-06, + "loss": 0.6572, + "step": 45634 + }, + { + "epoch": 1.17, + "learning_rate": 1.3942336332716452e-06, + "loss": 0.6289, + "step": 45635 + }, + { + "epoch": 1.17, + "learning_rate": 1.3942082036899299e-06, + "loss": 0.6157, + "step": 45636 + }, + { + "epoch": 1.17, + "learning_rate": 1.3941827738063879e-06, + "loss": 0.6675, + "step": 45637 + }, + { + "epoch": 1.17, + "learning_rate": 1.394157343621038e-06, + "loss": 0.5254, + "step": 45638 + }, + { + "epoch": 1.17, + "learning_rate": 1.3941319131339002e-06, + "loss": 0.7812, + "step": 45639 + }, + { + "epoch": 1.17, + "learning_rate": 1.3941064823449933e-06, + "loss": 0.5996, + "step": 45640 + }, + { + "epoch": 1.17, + "learning_rate": 1.3940810512543374e-06, + "loss": 0.5757, + "step": 45641 + }, + { + "epoch": 1.17, + "learning_rate": 1.3940556198619517e-06, + "loss": 0.5713, + "step": 45642 + }, + { + "epoch": 1.17, + "learning_rate": 1.394030188167856e-06, + "loss": 0.748, + "step": 45643 + }, + { + "epoch": 1.17, + "learning_rate": 1.3940047561720695e-06, + "loss": 0.5156, + "step": 45644 + }, + { + "epoch": 1.17, + "learning_rate": 1.3939793238746115e-06, + "loss": 0.7461, + "step": 45645 + }, + { + "epoch": 1.17, + "learning_rate": 1.3939538912755015e-06, + "loss": 0.7061, + "step": 45646 + }, + { + "epoch": 1.17, + "learning_rate": 1.3939284583747594e-06, + "loss": 0.5596, + "step": 45647 + }, + { + "epoch": 1.17, + "learning_rate": 1.3939030251724044e-06, + "loss": 0.4932, + "step": 45648 + }, + { + "epoch": 1.17, + "learning_rate": 1.3938775916684556e-06, + "loss": 0.5269, + "step": 45649 + }, + { + "epoch": 1.17, + "learning_rate": 1.3938521578629331e-06, + "loss": 0.5435, + "step": 45650 + }, + { + "epoch": 1.17, + "learning_rate": 1.393826723755856e-06, + "loss": 0.6289, + "step": 45651 + }, + { + "epoch": 1.17, + "learning_rate": 1.3938012893472441e-06, + "loss": 0.6455, + "step": 45652 + }, + { + "epoch": 1.17, + "learning_rate": 1.3937758546371166e-06, + "loss": 0.4929, + "step": 45653 + }, + { + "epoch": 1.17, + "learning_rate": 1.393750419625493e-06, + "loss": 0.7153, + "step": 45654 + }, + { + "epoch": 1.17, + "learning_rate": 1.3937249843123926e-06, + "loss": 0.5046, + "step": 45655 + }, + { + "epoch": 1.17, + "learning_rate": 1.3936995486978354e-06, + "loss": 0.6387, + "step": 45656 + }, + { + "epoch": 1.17, + "learning_rate": 1.3936741127818406e-06, + "loss": 0.6172, + "step": 45657 + }, + { + "epoch": 1.17, + "learning_rate": 1.3936486765644272e-06, + "loss": 0.6021, + "step": 45658 + }, + { + "epoch": 1.17, + "learning_rate": 1.3936232400456154e-06, + "loss": 0.6704, + "step": 45659 + }, + { + "epoch": 1.17, + "learning_rate": 1.3935978032254245e-06, + "loss": 0.7036, + "step": 45660 + }, + { + "epoch": 1.17, + "learning_rate": 1.3935723661038734e-06, + "loss": 0.8088, + "step": 45661 + }, + { + "epoch": 1.17, + "learning_rate": 1.3935469286809824e-06, + "loss": 0.6973, + "step": 45662 + }, + { + "epoch": 1.17, + "learning_rate": 1.3935214909567708e-06, + "loss": 0.5098, + "step": 45663 + }, + { + "epoch": 1.17, + "learning_rate": 1.3934960529312574e-06, + "loss": 0.751, + "step": 45664 + }, + { + "epoch": 1.17, + "learning_rate": 1.3934706146044626e-06, + "loss": 0.6465, + "step": 45665 + }, + { + "epoch": 1.17, + "learning_rate": 1.3934451759764053e-06, + "loss": 0.627, + "step": 45666 + }, + { + "epoch": 1.17, + "learning_rate": 1.393419737047105e-06, + "loss": 0.6021, + "step": 45667 + }, + { + "epoch": 1.17, + "learning_rate": 1.3933942978165813e-06, + "loss": 0.3449, + "step": 45668 + }, + { + "epoch": 1.17, + "learning_rate": 1.3933688582848538e-06, + "loss": 0.7666, + "step": 45669 + }, + { + "epoch": 1.17, + "learning_rate": 1.3933434184519416e-06, + "loss": 0.5762, + "step": 45670 + }, + { + "epoch": 1.17, + "learning_rate": 1.3933179783178648e-06, + "loss": 0.6899, + "step": 45671 + }, + { + "epoch": 1.17, + "learning_rate": 1.3932925378826424e-06, + "loss": 0.4536, + "step": 45672 + }, + { + "epoch": 1.17, + "learning_rate": 1.3932670971462939e-06, + "loss": 0.7441, + "step": 45673 + }, + { + "epoch": 1.17, + "learning_rate": 1.3932416561088388e-06, + "loss": 0.6201, + "step": 45674 + }, + { + "epoch": 1.17, + "learning_rate": 1.3932162147702969e-06, + "loss": 0.6538, + "step": 45675 + }, + { + "epoch": 1.17, + "learning_rate": 1.3931907731306872e-06, + "loss": 0.458, + "step": 45676 + }, + { + "epoch": 1.17, + "learning_rate": 1.3931653311900295e-06, + "loss": 0.7207, + "step": 45677 + }, + { + "epoch": 1.17, + "learning_rate": 1.393139888948343e-06, + "loss": 0.5552, + "step": 45678 + }, + { + "epoch": 1.17, + "learning_rate": 1.3931144464056476e-06, + "loss": 0.4907, + "step": 45679 + }, + { + "epoch": 1.17, + "learning_rate": 1.3930890035619624e-06, + "loss": 0.6094, + "step": 45680 + }, + { + "epoch": 1.17, + "learning_rate": 1.393063560417307e-06, + "loss": 0.6934, + "step": 45681 + }, + { + "epoch": 1.17, + "learning_rate": 1.3930381169717012e-06, + "loss": 0.5713, + "step": 45682 + }, + { + "epoch": 1.17, + "learning_rate": 1.3930126732251642e-06, + "loss": 0.7246, + "step": 45683 + }, + { + "epoch": 1.17, + "learning_rate": 1.392987229177715e-06, + "loss": 0.592, + "step": 45684 + }, + { + "epoch": 1.17, + "learning_rate": 1.3929617848293737e-06, + "loss": 0.707, + "step": 45685 + }, + { + "epoch": 1.17, + "learning_rate": 1.3929363401801596e-06, + "loss": 0.7827, + "step": 45686 + }, + { + "epoch": 1.17, + "learning_rate": 1.3929108952300925e-06, + "loss": 0.6016, + "step": 45687 + }, + { + "epoch": 1.17, + "learning_rate": 1.3928854499791916e-06, + "loss": 0.7642, + "step": 45688 + }, + { + "epoch": 1.17, + "learning_rate": 1.392860004427476e-06, + "loss": 0.541, + "step": 45689 + }, + { + "epoch": 1.17, + "learning_rate": 1.392834558574966e-06, + "loss": 0.7266, + "step": 45690 + }, + { + "epoch": 1.17, + "learning_rate": 1.3928091124216802e-06, + "loss": 0.6479, + "step": 45691 + }, + { + "epoch": 1.17, + "learning_rate": 1.3927836659676388e-06, + "loss": 0.6299, + "step": 45692 + }, + { + "epoch": 1.17, + "learning_rate": 1.3927582192128608e-06, + "loss": 0.6001, + "step": 45693 + }, + { + "epoch": 1.17, + "learning_rate": 1.3927327721573661e-06, + "loss": 0.8467, + "step": 45694 + }, + { + "epoch": 1.17, + "learning_rate": 1.3927073248011739e-06, + "loss": 0.624, + "step": 45695 + }, + { + "epoch": 1.17, + "learning_rate": 1.392681877144304e-06, + "loss": 0.6758, + "step": 45696 + }, + { + "epoch": 1.17, + "learning_rate": 1.3926564291867753e-06, + "loss": 0.5371, + "step": 45697 + }, + { + "epoch": 1.17, + "learning_rate": 1.3926309809286077e-06, + "loss": 0.8203, + "step": 45698 + }, + { + "epoch": 1.17, + "learning_rate": 1.3926055323698205e-06, + "loss": 0.6484, + "step": 45699 + }, + { + "epoch": 1.17, + "learning_rate": 1.3925800835104336e-06, + "loss": 0.5555, + "step": 45700 + }, + { + "epoch": 1.17, + "learning_rate": 1.392554634350466e-06, + "loss": 0.5771, + "step": 45701 + }, + { + "epoch": 1.17, + "learning_rate": 1.3925291848899375e-06, + "loss": 0.6494, + "step": 45702 + }, + { + "epoch": 1.17, + "learning_rate": 1.392503735128867e-06, + "loss": 0.5718, + "step": 45703 + }, + { + "epoch": 1.17, + "learning_rate": 1.392478285067275e-06, + "loss": 0.7744, + "step": 45704 + }, + { + "epoch": 1.17, + "learning_rate": 1.3924528347051801e-06, + "loss": 0.6592, + "step": 45705 + }, + { + "epoch": 1.17, + "learning_rate": 1.3924273840426022e-06, + "loss": 0.6567, + "step": 45706 + }, + { + "epoch": 1.17, + "learning_rate": 1.3924019330795609e-06, + "loss": 0.7129, + "step": 45707 + }, + { + "epoch": 1.17, + "learning_rate": 1.392376481816075e-06, + "loss": 0.748, + "step": 45708 + }, + { + "epoch": 1.17, + "learning_rate": 1.392351030252165e-06, + "loss": 0.6035, + "step": 45709 + }, + { + "epoch": 1.17, + "learning_rate": 1.3923255783878496e-06, + "loss": 0.7773, + "step": 45710 + }, + { + "epoch": 1.17, + "learning_rate": 1.3923001262231483e-06, + "loss": 0.6738, + "step": 45711 + }, + { + "epoch": 1.17, + "learning_rate": 1.3922746737580813e-06, + "loss": 0.6875, + "step": 45712 + }, + { + "epoch": 1.17, + "learning_rate": 1.3922492209926676e-06, + "loss": 0.7275, + "step": 45713 + }, + { + "epoch": 1.17, + "learning_rate": 1.3922237679269263e-06, + "loss": 0.749, + "step": 45714 + }, + { + "epoch": 1.17, + "learning_rate": 1.3921983145608775e-06, + "loss": 0.5508, + "step": 45715 + }, + { + "epoch": 1.17, + "learning_rate": 1.3921728608945405e-06, + "loss": 0.6582, + "step": 45716 + }, + { + "epoch": 1.17, + "learning_rate": 1.392147406927935e-06, + "loss": 0.7988, + "step": 45717 + }, + { + "epoch": 1.17, + "learning_rate": 1.39212195266108e-06, + "loss": 0.6836, + "step": 45718 + }, + { + "epoch": 1.17, + "learning_rate": 1.3920964980939952e-06, + "loss": 0.6792, + "step": 45719 + }, + { + "epoch": 1.17, + "learning_rate": 1.3920710432267e-06, + "loss": 0.7344, + "step": 45720 + }, + { + "epoch": 1.17, + "learning_rate": 1.3920455880592143e-06, + "loss": 0.752, + "step": 45721 + }, + { + "epoch": 1.17, + "learning_rate": 1.3920201325915576e-06, + "loss": 0.8096, + "step": 45722 + }, + { + "epoch": 1.17, + "learning_rate": 1.3919946768237488e-06, + "loss": 0.7588, + "step": 45723 + }, + { + "epoch": 1.17, + "learning_rate": 1.3919692207558074e-06, + "loss": 0.3494, + "step": 45724 + }, + { + "epoch": 1.17, + "learning_rate": 1.3919437643877536e-06, + "loss": 0.6479, + "step": 45725 + }, + { + "epoch": 1.17, + "learning_rate": 1.3919183077196061e-06, + "loss": 0.3804, + "step": 45726 + }, + { + "epoch": 1.17, + "learning_rate": 1.3918928507513852e-06, + "loss": 0.7812, + "step": 45727 + }, + { + "epoch": 1.17, + "learning_rate": 1.39186739348311e-06, + "loss": 0.5781, + "step": 45728 + }, + { + "epoch": 1.17, + "learning_rate": 1.3918419359147997e-06, + "loss": 0.7666, + "step": 45729 + }, + { + "epoch": 1.17, + "learning_rate": 1.3918164780464737e-06, + "loss": 0.4678, + "step": 45730 + }, + { + "epoch": 1.17, + "learning_rate": 1.3917910198781526e-06, + "loss": 0.4873, + "step": 45731 + }, + { + "epoch": 1.17, + "learning_rate": 1.391765561409855e-06, + "loss": 0.7617, + "step": 45732 + }, + { + "epoch": 1.17, + "learning_rate": 1.3917401026416e-06, + "loss": 0.6826, + "step": 45733 + }, + { + "epoch": 1.17, + "learning_rate": 1.3917146435734079e-06, + "loss": 0.6924, + "step": 45734 + }, + { + "epoch": 1.17, + "learning_rate": 1.3916891842052978e-06, + "loss": 0.5142, + "step": 45735 + }, + { + "epoch": 1.17, + "learning_rate": 1.3916637245372896e-06, + "loss": 0.7129, + "step": 45736 + }, + { + "epoch": 1.17, + "learning_rate": 1.3916382645694023e-06, + "loss": 0.6797, + "step": 45737 + }, + { + "epoch": 1.17, + "learning_rate": 1.3916128043016558e-06, + "loss": 0.363, + "step": 45738 + }, + { + "epoch": 1.17, + "learning_rate": 1.391587343734069e-06, + "loss": 0.6475, + "step": 45739 + }, + { + "epoch": 1.17, + "learning_rate": 1.391561882866662e-06, + "loss": 0.5591, + "step": 45740 + }, + { + "epoch": 1.17, + "learning_rate": 1.3915364216994538e-06, + "loss": 0.5767, + "step": 45741 + }, + { + "epoch": 1.17, + "learning_rate": 1.3915109602324647e-06, + "loss": 0.6431, + "step": 45742 + }, + { + "epoch": 1.17, + "learning_rate": 1.3914854984657132e-06, + "loss": 0.6064, + "step": 45743 + }, + { + "epoch": 1.17, + "learning_rate": 1.3914600363992196e-06, + "loss": 0.6699, + "step": 45744 + }, + { + "epoch": 1.17, + "learning_rate": 1.3914345740330027e-06, + "loss": 0.4727, + "step": 45745 + }, + { + "epoch": 1.17, + "learning_rate": 1.3914091113670825e-06, + "loss": 0.7207, + "step": 45746 + }, + { + "epoch": 1.17, + "learning_rate": 1.3913836484014785e-06, + "loss": 0.5217, + "step": 45747 + }, + { + "epoch": 1.17, + "learning_rate": 1.3913581851362099e-06, + "loss": 0.7148, + "step": 45748 + }, + { + "epoch": 1.17, + "learning_rate": 1.3913327215712961e-06, + "loss": 0.6729, + "step": 45749 + }, + { + "epoch": 1.17, + "learning_rate": 1.391307257706757e-06, + "loss": 0.8076, + "step": 45750 + }, + { + "epoch": 1.17, + "learning_rate": 1.3912817935426119e-06, + "loss": 0.5205, + "step": 45751 + }, + { + "epoch": 1.17, + "learning_rate": 1.3912563290788806e-06, + "loss": 0.7393, + "step": 45752 + }, + { + "epoch": 1.17, + "learning_rate": 1.391230864315582e-06, + "loss": 0.6055, + "step": 45753 + }, + { + "epoch": 1.17, + "learning_rate": 1.391205399252736e-06, + "loss": 0.7236, + "step": 45754 + }, + { + "epoch": 1.17, + "learning_rate": 1.3911799338903621e-06, + "loss": 0.8398, + "step": 45755 + }, + { + "epoch": 1.17, + "learning_rate": 1.3911544682284796e-06, + "loss": 0.6003, + "step": 45756 + }, + { + "epoch": 1.17, + "learning_rate": 1.3911290022671085e-06, + "loss": 0.5625, + "step": 45757 + }, + { + "epoch": 1.17, + "learning_rate": 1.3911035360062672e-06, + "loss": 0.8428, + "step": 45758 + }, + { + "epoch": 1.17, + "learning_rate": 1.3910780694459765e-06, + "loss": 0.915, + "step": 45759 + }, + { + "epoch": 1.17, + "learning_rate": 1.391052602586255e-06, + "loss": 0.6621, + "step": 45760 + }, + { + "epoch": 1.17, + "learning_rate": 1.3910271354271227e-06, + "loss": 0.5728, + "step": 45761 + }, + { + "epoch": 1.17, + "learning_rate": 1.3910016679685988e-06, + "loss": 0.7197, + "step": 45762 + }, + { + "epoch": 1.17, + "learning_rate": 1.3909762002107028e-06, + "loss": 0.5767, + "step": 45763 + }, + { + "epoch": 1.17, + "learning_rate": 1.3909507321534543e-06, + "loss": 0.6802, + "step": 45764 + }, + { + "epoch": 1.17, + "learning_rate": 1.3909252637968729e-06, + "loss": 0.6973, + "step": 45765 + }, + { + "epoch": 1.17, + "learning_rate": 1.390899795140978e-06, + "loss": 0.7266, + "step": 45766 + }, + { + "epoch": 1.17, + "learning_rate": 1.3908743261857894e-06, + "loss": 0.6035, + "step": 45767 + }, + { + "epoch": 1.17, + "learning_rate": 1.390848856931326e-06, + "loss": 0.5737, + "step": 45768 + }, + { + "epoch": 1.17, + "learning_rate": 1.3908233873776074e-06, + "loss": 0.541, + "step": 45769 + }, + { + "epoch": 1.17, + "learning_rate": 1.3907979175246533e-06, + "loss": 0.6689, + "step": 45770 + }, + { + "epoch": 1.17, + "learning_rate": 1.3907724473724836e-06, + "loss": 0.7012, + "step": 45771 + }, + { + "epoch": 1.17, + "learning_rate": 1.3907469769211172e-06, + "loss": 0.6172, + "step": 45772 + }, + { + "epoch": 1.17, + "learning_rate": 1.390721506170574e-06, + "loss": 0.3445, + "step": 45773 + }, + { + "epoch": 1.17, + "learning_rate": 1.3906960351208729e-06, + "loss": 0.7969, + "step": 45774 + }, + { + "epoch": 1.17, + "learning_rate": 1.3906705637720342e-06, + "loss": 0.8486, + "step": 45775 + }, + { + "epoch": 1.17, + "learning_rate": 1.3906450921240767e-06, + "loss": 0.5977, + "step": 45776 + }, + { + "epoch": 1.17, + "learning_rate": 1.3906196201770205e-06, + "loss": 0.5845, + "step": 45777 + }, + { + "epoch": 1.17, + "learning_rate": 1.3905941479308847e-06, + "loss": 0.7227, + "step": 45778 + }, + { + "epoch": 1.17, + "learning_rate": 1.3905686753856887e-06, + "loss": 0.6357, + "step": 45779 + }, + { + "epoch": 1.17, + "learning_rate": 1.3905432025414526e-06, + "loss": 0.5752, + "step": 45780 + }, + { + "epoch": 1.17, + "learning_rate": 1.3905177293981952e-06, + "loss": 0.5935, + "step": 45781 + }, + { + "epoch": 1.17, + "learning_rate": 1.3904922559559366e-06, + "loss": 0.6016, + "step": 45782 + }, + { + "epoch": 1.17, + "learning_rate": 1.3904667822146958e-06, + "loss": 0.5352, + "step": 45783 + }, + { + "epoch": 1.17, + "learning_rate": 1.3904413081744928e-06, + "loss": 0.7598, + "step": 45784 + }, + { + "epoch": 1.17, + "learning_rate": 1.3904158338353464e-06, + "loss": 0.5986, + "step": 45785 + }, + { + "epoch": 1.17, + "learning_rate": 1.3903903591972773e-06, + "loss": 0.4248, + "step": 45786 + }, + { + "epoch": 1.17, + "learning_rate": 1.3903648842603035e-06, + "loss": 0.6797, + "step": 45787 + }, + { + "epoch": 1.17, + "learning_rate": 1.3903394090244458e-06, + "loss": 0.6924, + "step": 45788 + }, + { + "epoch": 1.17, + "learning_rate": 1.3903139334897228e-06, + "loss": 0.6846, + "step": 45789 + }, + { + "epoch": 1.17, + "learning_rate": 1.3902884576561547e-06, + "loss": 0.7695, + "step": 45790 + }, + { + "epoch": 1.17, + "learning_rate": 1.39026298152376e-06, + "loss": 0.5356, + "step": 45791 + }, + { + "epoch": 1.17, + "learning_rate": 1.3902375050925596e-06, + "loss": 0.7061, + "step": 45792 + }, + { + "epoch": 1.17, + "learning_rate": 1.390212028362572e-06, + "loss": 0.6709, + "step": 45793 + }, + { + "epoch": 1.17, + "learning_rate": 1.390186551333817e-06, + "loss": 0.5413, + "step": 45794 + }, + { + "epoch": 1.17, + "learning_rate": 1.390161074006314e-06, + "loss": 0.551, + "step": 45795 + }, + { + "epoch": 1.17, + "learning_rate": 1.390135596380083e-06, + "loss": 0.6084, + "step": 45796 + }, + { + "epoch": 1.17, + "learning_rate": 1.3901101184551429e-06, + "loss": 0.6943, + "step": 45797 + }, + { + "epoch": 1.17, + "learning_rate": 1.3900846402315132e-06, + "loss": 0.8203, + "step": 45798 + }, + { + "epoch": 1.17, + "learning_rate": 1.390059161709214e-06, + "loss": 0.6787, + "step": 45799 + }, + { + "epoch": 1.17, + "learning_rate": 1.390033682888264e-06, + "loss": 0.7559, + "step": 45800 + }, + { + "epoch": 1.17, + "learning_rate": 1.3900082037686833e-06, + "loss": 0.7217, + "step": 45801 + }, + { + "epoch": 1.17, + "learning_rate": 1.3899827243504913e-06, + "loss": 0.4277, + "step": 45802 + }, + { + "epoch": 1.17, + "learning_rate": 1.3899572446337079e-06, + "loss": 0.7021, + "step": 45803 + }, + { + "epoch": 1.17, + "learning_rate": 1.3899317646183515e-06, + "loss": 0.6221, + "step": 45804 + }, + { + "epoch": 1.17, + "learning_rate": 1.3899062843044424e-06, + "loss": 0.6729, + "step": 45805 + }, + { + "epoch": 1.17, + "learning_rate": 1.389880803692e-06, + "loss": 0.6099, + "step": 45806 + }, + { + "epoch": 1.17, + "learning_rate": 1.3898553227810444e-06, + "loss": 0.5547, + "step": 45807 + }, + { + "epoch": 1.17, + "learning_rate": 1.3898298415715937e-06, + "loss": 0.8008, + "step": 45808 + }, + { + "epoch": 1.17, + "learning_rate": 1.3898043600636687e-06, + "loss": 0.749, + "step": 45809 + }, + { + "epoch": 1.17, + "learning_rate": 1.389778878257288e-06, + "loss": 0.4429, + "step": 45810 + }, + { + "epoch": 1.17, + "learning_rate": 1.3897533961524718e-06, + "loss": 0.5859, + "step": 45811 + }, + { + "epoch": 1.17, + "learning_rate": 1.3897279137492395e-06, + "loss": 0.5083, + "step": 45812 + }, + { + "epoch": 1.17, + "learning_rate": 1.3897024310476103e-06, + "loss": 0.4363, + "step": 45813 + }, + { + "epoch": 1.17, + "learning_rate": 1.3896769480476037e-06, + "loss": 0.5625, + "step": 45814 + }, + { + "epoch": 1.17, + "learning_rate": 1.3896514647492397e-06, + "loss": 0.627, + "step": 45815 + }, + { + "epoch": 1.17, + "learning_rate": 1.389625981152537e-06, + "loss": 0.6353, + "step": 45816 + }, + { + "epoch": 1.17, + "learning_rate": 1.3896004972575162e-06, + "loss": 0.6973, + "step": 45817 + }, + { + "epoch": 1.17, + "learning_rate": 1.3895750130641959e-06, + "loss": 0.6816, + "step": 45818 + }, + { + "epoch": 1.17, + "learning_rate": 1.389549528572596e-06, + "loss": 0.6128, + "step": 45819 + }, + { + "epoch": 1.17, + "learning_rate": 1.3895240437827358e-06, + "loss": 0.5715, + "step": 45820 + }, + { + "epoch": 1.17, + "learning_rate": 1.389498558694635e-06, + "loss": 0.6519, + "step": 45821 + }, + { + "epoch": 1.17, + "learning_rate": 1.3894730733083133e-06, + "loss": 0.5312, + "step": 45822 + }, + { + "epoch": 1.17, + "learning_rate": 1.3894475876237897e-06, + "loss": 0.7266, + "step": 45823 + }, + { + "epoch": 1.17, + "learning_rate": 1.389422101641084e-06, + "loss": 0.7637, + "step": 45824 + }, + { + "epoch": 1.17, + "learning_rate": 1.3893966153602157e-06, + "loss": 0.6074, + "step": 45825 + }, + { + "epoch": 1.17, + "learning_rate": 1.3893711287812046e-06, + "loss": 0.5728, + "step": 45826 + }, + { + "epoch": 1.17, + "learning_rate": 1.3893456419040699e-06, + "loss": 0.5391, + "step": 45827 + }, + { + "epoch": 1.17, + "learning_rate": 1.3893201547288308e-06, + "loss": 0.5376, + "step": 45828 + }, + { + "epoch": 1.17, + "learning_rate": 1.3892946672555073e-06, + "loss": 0.8647, + "step": 45829 + }, + { + "epoch": 1.17, + "learning_rate": 1.389269179484119e-06, + "loss": 0.605, + "step": 45830 + }, + { + "epoch": 1.17, + "learning_rate": 1.3892436914146848e-06, + "loss": 0.667, + "step": 45831 + }, + { + "epoch": 1.17, + "learning_rate": 1.389218203047225e-06, + "loss": 0.6621, + "step": 45832 + }, + { + "epoch": 1.17, + "learning_rate": 1.3891927143817586e-06, + "loss": 0.4666, + "step": 45833 + }, + { + "epoch": 1.17, + "learning_rate": 1.389167225418305e-06, + "loss": 0.6484, + "step": 45834 + }, + { + "epoch": 1.17, + "learning_rate": 1.389141736156884e-06, + "loss": 0.5615, + "step": 45835 + }, + { + "epoch": 1.17, + "learning_rate": 1.3891162465975153e-06, + "loss": 0.7305, + "step": 45836 + }, + { + "epoch": 1.17, + "learning_rate": 1.3890907567402182e-06, + "loss": 0.6763, + "step": 45837 + }, + { + "epoch": 1.17, + "learning_rate": 1.389065266585012e-06, + "loss": 0.6177, + "step": 45838 + }, + { + "epoch": 1.17, + "learning_rate": 1.3890397761319163e-06, + "loss": 0.5869, + "step": 45839 + }, + { + "epoch": 1.17, + "learning_rate": 1.389014285380951e-06, + "loss": 0.6528, + "step": 45840 + }, + { + "epoch": 1.17, + "learning_rate": 1.388988794332135e-06, + "loss": 0.5129, + "step": 45841 + }, + { + "epoch": 1.17, + "learning_rate": 1.3889633029854886e-06, + "loss": 0.6519, + "step": 45842 + }, + { + "epoch": 1.17, + "learning_rate": 1.388937811341031e-06, + "loss": 0.624, + "step": 45843 + }, + { + "epoch": 1.18, + "learning_rate": 1.3889123193987808e-06, + "loss": 0.6426, + "step": 45844 + }, + { + "epoch": 1.18, + "learning_rate": 1.388886827158759e-06, + "loss": 0.5225, + "step": 45845 + }, + { + "epoch": 1.18, + "learning_rate": 1.3888613346209843e-06, + "loss": 0.6326, + "step": 45846 + }, + { + "epoch": 1.18, + "learning_rate": 1.3888358417854764e-06, + "loss": 0.5713, + "step": 45847 + }, + { + "epoch": 1.18, + "learning_rate": 1.3888103486522545e-06, + "loss": 0.8242, + "step": 45848 + }, + { + "epoch": 1.18, + "learning_rate": 1.3887848552213388e-06, + "loss": 0.7998, + "step": 45849 + }, + { + "epoch": 1.18, + "learning_rate": 1.3887593614927479e-06, + "loss": 0.561, + "step": 45850 + }, + { + "epoch": 1.18, + "learning_rate": 1.3887338674665024e-06, + "loss": 0.6626, + "step": 45851 + }, + { + "epoch": 1.18, + "learning_rate": 1.388708373142621e-06, + "loss": 0.5645, + "step": 45852 + }, + { + "epoch": 1.18, + "learning_rate": 1.3886828785211235e-06, + "loss": 0.4171, + "step": 45853 + }, + { + "epoch": 1.18, + "learning_rate": 1.3886573836020291e-06, + "loss": 0.5039, + "step": 45854 + }, + { + "epoch": 1.18, + "learning_rate": 1.3886318883853578e-06, + "loss": 0.4299, + "step": 45855 + }, + { + "epoch": 1.18, + "learning_rate": 1.3886063928711292e-06, + "loss": 0.6221, + "step": 45856 + }, + { + "epoch": 1.18, + "learning_rate": 1.3885808970593624e-06, + "loss": 0.7383, + "step": 45857 + }, + { + "epoch": 1.18, + "learning_rate": 1.3885554009500768e-06, + "loss": 0.6611, + "step": 45858 + }, + { + "epoch": 1.18, + "learning_rate": 1.3885299045432926e-06, + "loss": 0.4666, + "step": 45859 + }, + { + "epoch": 1.18, + "learning_rate": 1.3885044078390286e-06, + "loss": 0.7031, + "step": 45860 + }, + { + "epoch": 1.18, + "learning_rate": 1.3884789108373046e-06, + "loss": 0.6504, + "step": 45861 + }, + { + "epoch": 1.18, + "learning_rate": 1.3884534135381408e-06, + "loss": 0.5596, + "step": 45862 + }, + { + "epoch": 1.18, + "learning_rate": 1.3884279159415555e-06, + "loss": 0.6543, + "step": 45863 + }, + { + "epoch": 1.18, + "learning_rate": 1.388402418047569e-06, + "loss": 0.6309, + "step": 45864 + }, + { + "epoch": 1.18, + "learning_rate": 1.3883769198562005e-06, + "loss": 0.6016, + "step": 45865 + }, + { + "epoch": 1.18, + "learning_rate": 1.3883514213674693e-06, + "loss": 0.573, + "step": 45866 + }, + { + "epoch": 1.18, + "learning_rate": 1.388325922581396e-06, + "loss": 0.5493, + "step": 45867 + }, + { + "epoch": 1.18, + "learning_rate": 1.388300423497999e-06, + "loss": 0.454, + "step": 45868 + }, + { + "epoch": 1.18, + "learning_rate": 1.3882749241172982e-06, + "loss": 0.8516, + "step": 45869 + }, + { + "epoch": 1.18, + "learning_rate": 1.3882494244393132e-06, + "loss": 0.5156, + "step": 45870 + }, + { + "epoch": 1.18, + "learning_rate": 1.3882239244640634e-06, + "loss": 0.5239, + "step": 45871 + }, + { + "epoch": 1.18, + "learning_rate": 1.3881984241915687e-06, + "loss": 0.7295, + "step": 45872 + }, + { + "epoch": 1.18, + "learning_rate": 1.388172923621848e-06, + "loss": 0.7505, + "step": 45873 + }, + { + "epoch": 1.18, + "learning_rate": 1.3881474227549215e-06, + "loss": 0.6543, + "step": 45874 + }, + { + "epoch": 1.18, + "learning_rate": 1.388121921590808e-06, + "loss": 0.709, + "step": 45875 + }, + { + "epoch": 1.18, + "learning_rate": 1.3880964201295275e-06, + "loss": 0.6309, + "step": 45876 + }, + { + "epoch": 1.18, + "learning_rate": 1.3880709183710994e-06, + "loss": 0.6836, + "step": 45877 + }, + { + "epoch": 1.18, + "learning_rate": 1.3880454163155434e-06, + "loss": 0.6289, + "step": 45878 + }, + { + "epoch": 1.18, + "learning_rate": 1.3880199139628785e-06, + "loss": 0.5742, + "step": 45879 + }, + { + "epoch": 1.18, + "learning_rate": 1.387994411313125e-06, + "loss": 0.6755, + "step": 45880 + }, + { + "epoch": 1.18, + "learning_rate": 1.3879689083663015e-06, + "loss": 0.9258, + "step": 45881 + }, + { + "epoch": 1.18, + "learning_rate": 1.3879434051224288e-06, + "loss": 0.5415, + "step": 45882 + }, + { + "epoch": 1.18, + "learning_rate": 1.3879179015815253e-06, + "loss": 0.7402, + "step": 45883 + }, + { + "epoch": 1.18, + "learning_rate": 1.3878923977436108e-06, + "loss": 0.7686, + "step": 45884 + }, + { + "epoch": 1.18, + "learning_rate": 1.3878668936087047e-06, + "loss": 0.5693, + "step": 45885 + }, + { + "epoch": 1.18, + "learning_rate": 1.3878413891768272e-06, + "loss": 0.7627, + "step": 45886 + }, + { + "epoch": 1.18, + "learning_rate": 1.3878158844479973e-06, + "loss": 0.5869, + "step": 45887 + }, + { + "epoch": 1.18, + "learning_rate": 1.3877903794222343e-06, + "loss": 0.5422, + "step": 45888 + }, + { + "epoch": 1.18, + "learning_rate": 1.3877648740995585e-06, + "loss": 0.4636, + "step": 45889 + }, + { + "epoch": 1.18, + "learning_rate": 1.3877393684799885e-06, + "loss": 0.6172, + "step": 45890 + }, + { + "epoch": 1.18, + "learning_rate": 1.3877138625635447e-06, + "loss": 0.666, + "step": 45891 + }, + { + "epoch": 1.18, + "learning_rate": 1.3876883563502462e-06, + "loss": 0.7217, + "step": 45892 + }, + { + "epoch": 1.18, + "learning_rate": 1.3876628498401124e-06, + "loss": 0.7188, + "step": 45893 + }, + { + "epoch": 1.18, + "learning_rate": 1.387637343033163e-06, + "loss": 0.8701, + "step": 45894 + }, + { + "epoch": 1.18, + "learning_rate": 1.3876118359294174e-06, + "loss": 0.5825, + "step": 45895 + }, + { + "epoch": 1.18, + "learning_rate": 1.3875863285288952e-06, + "loss": 0.6763, + "step": 45896 + }, + { + "epoch": 1.18, + "learning_rate": 1.3875608208316163e-06, + "loss": 0.5469, + "step": 45897 + }, + { + "epoch": 1.18, + "learning_rate": 1.3875353128375998e-06, + "loss": 0.6455, + "step": 45898 + }, + { + "epoch": 1.18, + "learning_rate": 1.3875098045468653e-06, + "loss": 0.5049, + "step": 45899 + }, + { + "epoch": 1.18, + "learning_rate": 1.387484295959432e-06, + "loss": 0.5204, + "step": 45900 + }, + { + "epoch": 1.18, + "learning_rate": 1.38745878707532e-06, + "loss": 0.6533, + "step": 45901 + }, + { + "epoch": 1.18, + "learning_rate": 1.387433277894549e-06, + "loss": 0.6611, + "step": 45902 + }, + { + "epoch": 1.18, + "learning_rate": 1.387407768417138e-06, + "loss": 0.6265, + "step": 45903 + }, + { + "epoch": 1.18, + "learning_rate": 1.3873822586431062e-06, + "loss": 0.6357, + "step": 45904 + }, + { + "epoch": 1.18, + "learning_rate": 1.3873567485724743e-06, + "loss": 0.6689, + "step": 45905 + }, + { + "epoch": 1.18, + "learning_rate": 1.3873312382052605e-06, + "loss": 0.7085, + "step": 45906 + }, + { + "epoch": 1.18, + "learning_rate": 1.3873057275414855e-06, + "loss": 0.5869, + "step": 45907 + }, + { + "epoch": 1.18, + "learning_rate": 1.3872802165811682e-06, + "loss": 0.749, + "step": 45908 + }, + { + "epoch": 1.18, + "learning_rate": 1.3872547053243282e-06, + "loss": 0.6548, + "step": 45909 + }, + { + "epoch": 1.18, + "learning_rate": 1.3872291937709848e-06, + "loss": 0.7383, + "step": 45910 + }, + { + "epoch": 1.18, + "learning_rate": 1.387203681921158e-06, + "loss": 0.6729, + "step": 45911 + }, + { + "epoch": 1.18, + "learning_rate": 1.3871781697748674e-06, + "loss": 0.791, + "step": 45912 + }, + { + "epoch": 1.18, + "learning_rate": 1.387152657332132e-06, + "loss": 0.5637, + "step": 45913 + }, + { + "epoch": 1.18, + "learning_rate": 1.3871271445929718e-06, + "loss": 0.6401, + "step": 45914 + }, + { + "epoch": 1.18, + "learning_rate": 1.3871016315574058e-06, + "loss": 0.6436, + "step": 45915 + }, + { + "epoch": 1.18, + "learning_rate": 1.3870761182254541e-06, + "loss": 0.7109, + "step": 45916 + }, + { + "epoch": 1.18, + "learning_rate": 1.3870506045971362e-06, + "loss": 0.8037, + "step": 45917 + }, + { + "epoch": 1.18, + "learning_rate": 1.3870250906724713e-06, + "loss": 0.7246, + "step": 45918 + }, + { + "epoch": 1.18, + "learning_rate": 1.386999576451479e-06, + "loss": 0.7598, + "step": 45919 + }, + { + "epoch": 1.18, + "learning_rate": 1.386974061934179e-06, + "loss": 0.6509, + "step": 45920 + }, + { + "epoch": 1.18, + "learning_rate": 1.3869485471205906e-06, + "loss": 0.7754, + "step": 45921 + }, + { + "epoch": 1.18, + "learning_rate": 1.386923032010734e-06, + "loss": 0.6895, + "step": 45922 + }, + { + "epoch": 1.18, + "learning_rate": 1.3868975166046275e-06, + "loss": 0.5659, + "step": 45923 + }, + { + "epoch": 1.18, + "learning_rate": 1.3868720009022918e-06, + "loss": 0.7441, + "step": 45924 + }, + { + "epoch": 1.18, + "learning_rate": 1.3868464849037457e-06, + "loss": 0.3533, + "step": 45925 + }, + { + "epoch": 1.18, + "learning_rate": 1.3868209686090093e-06, + "loss": 0.8779, + "step": 45926 + }, + { + "epoch": 1.18, + "learning_rate": 1.386795452018102e-06, + "loss": 0.6685, + "step": 45927 + }, + { + "epoch": 1.18, + "learning_rate": 1.386769935131043e-06, + "loss": 0.6689, + "step": 45928 + }, + { + "epoch": 1.18, + "learning_rate": 1.386744417947852e-06, + "loss": 0.7871, + "step": 45929 + }, + { + "epoch": 1.18, + "learning_rate": 1.3867189004685487e-06, + "loss": 0.5449, + "step": 45930 + }, + { + "epoch": 1.18, + "learning_rate": 1.3866933826931524e-06, + "loss": 0.7754, + "step": 45931 + }, + { + "epoch": 1.18, + "learning_rate": 1.3866678646216827e-06, + "loss": 0.6021, + "step": 45932 + }, + { + "epoch": 1.18, + "learning_rate": 1.3866423462541595e-06, + "loss": 0.7256, + "step": 45933 + }, + { + "epoch": 1.18, + "learning_rate": 1.386616827590602e-06, + "loss": 0.626, + "step": 45934 + }, + { + "epoch": 1.18, + "learning_rate": 1.3865913086310294e-06, + "loss": 0.5591, + "step": 45935 + }, + { + "epoch": 1.18, + "learning_rate": 1.3865657893754618e-06, + "loss": 0.7354, + "step": 45936 + }, + { + "epoch": 1.18, + "learning_rate": 1.3865402698239187e-06, + "loss": 0.7549, + "step": 45937 + }, + { + "epoch": 1.18, + "learning_rate": 1.3865147499764194e-06, + "loss": 0.7773, + "step": 45938 + }, + { + "epoch": 1.18, + "learning_rate": 1.3864892298329834e-06, + "loss": 0.9307, + "step": 45939 + }, + { + "epoch": 1.18, + "learning_rate": 1.3864637093936303e-06, + "loss": 0.5386, + "step": 45940 + }, + { + "epoch": 1.18, + "learning_rate": 1.3864381886583803e-06, + "loss": 0.6245, + "step": 45941 + }, + { + "epoch": 1.18, + "learning_rate": 1.3864126676272517e-06, + "loss": 0.6982, + "step": 45942 + }, + { + "epoch": 1.18, + "learning_rate": 1.386387146300265e-06, + "loss": 0.5601, + "step": 45943 + }, + { + "epoch": 1.18, + "learning_rate": 1.3863616246774393e-06, + "loss": 0.5659, + "step": 45944 + }, + { + "epoch": 1.18, + "learning_rate": 1.3863361027587944e-06, + "loss": 0.7256, + "step": 45945 + }, + { + "epoch": 1.18, + "learning_rate": 1.3863105805443496e-06, + "loss": 0.627, + "step": 45946 + }, + { + "epoch": 1.18, + "learning_rate": 1.3862850580341246e-06, + "loss": 0.4199, + "step": 45947 + }, + { + "epoch": 1.18, + "learning_rate": 1.3862595352281388e-06, + "loss": 0.6929, + "step": 45948 + }, + { + "epoch": 1.18, + "learning_rate": 1.386234012126412e-06, + "loss": 0.5891, + "step": 45949 + }, + { + "epoch": 1.18, + "learning_rate": 1.3862084887289634e-06, + "loss": 0.5669, + "step": 45950 + }, + { + "epoch": 1.18, + "learning_rate": 1.3861829650358129e-06, + "loss": 0.6465, + "step": 45951 + }, + { + "epoch": 1.18, + "learning_rate": 1.3861574410469797e-06, + "loss": 0.5771, + "step": 45952 + }, + { + "epoch": 1.18, + "learning_rate": 1.3861319167624837e-06, + "loss": 0.5784, + "step": 45953 + }, + { + "epoch": 1.18, + "learning_rate": 1.386106392182344e-06, + "loss": 0.5991, + "step": 45954 + }, + { + "epoch": 1.18, + "learning_rate": 1.3860808673065805e-06, + "loss": 0.5588, + "step": 45955 + }, + { + "epoch": 1.18, + "learning_rate": 1.3860553421352127e-06, + "loss": 0.7285, + "step": 45956 + }, + { + "epoch": 1.18, + "learning_rate": 1.3860298166682598e-06, + "loss": 0.7018, + "step": 45957 + }, + { + "epoch": 1.18, + "learning_rate": 1.386004290905742e-06, + "loss": 0.6812, + "step": 45958 + }, + { + "epoch": 1.18, + "learning_rate": 1.3859787648476782e-06, + "loss": 0.6553, + "step": 45959 + }, + { + "epoch": 1.18, + "learning_rate": 1.3859532384940882e-06, + "loss": 0.7363, + "step": 45960 + }, + { + "epoch": 1.18, + "learning_rate": 1.3859277118449918e-06, + "loss": 0.5803, + "step": 45961 + }, + { + "epoch": 1.18, + "learning_rate": 1.385902184900408e-06, + "loss": 0.6748, + "step": 45962 + }, + { + "epoch": 1.18, + "learning_rate": 1.385876657660357e-06, + "loss": 0.7852, + "step": 45963 + }, + { + "epoch": 1.18, + "learning_rate": 1.3858511301248576e-06, + "loss": 0.5786, + "step": 45964 + }, + { + "epoch": 1.18, + "learning_rate": 1.3858256022939298e-06, + "loss": 0.5791, + "step": 45965 + }, + { + "epoch": 1.18, + "learning_rate": 1.3858000741675935e-06, + "loss": 0.6338, + "step": 45966 + }, + { + "epoch": 1.18, + "learning_rate": 1.3857745457458672e-06, + "loss": 0.7773, + "step": 45967 + }, + { + "epoch": 1.18, + "learning_rate": 1.3857490170287716e-06, + "loss": 0.5581, + "step": 45968 + }, + { + "epoch": 1.18, + "learning_rate": 1.3857234880163253e-06, + "loss": 0.5811, + "step": 45969 + }, + { + "epoch": 1.18, + "learning_rate": 1.3856979587085485e-06, + "loss": 0.5059, + "step": 45970 + }, + { + "epoch": 1.18, + "learning_rate": 1.3856724291054604e-06, + "loss": 0.748, + "step": 45971 + }, + { + "epoch": 1.18, + "learning_rate": 1.3856468992070808e-06, + "loss": 0.5146, + "step": 45972 + }, + { + "epoch": 1.18, + "learning_rate": 1.385621369013429e-06, + "loss": 0.6333, + "step": 45973 + }, + { + "epoch": 1.18, + "learning_rate": 1.3855958385245248e-06, + "loss": 0.6675, + "step": 45974 + }, + { + "epoch": 1.18, + "learning_rate": 1.3855703077403874e-06, + "loss": 0.6934, + "step": 45975 + }, + { + "epoch": 1.18, + "learning_rate": 1.3855447766610365e-06, + "loss": 0.6162, + "step": 45976 + }, + { + "epoch": 1.18, + "learning_rate": 1.385519245286492e-06, + "loss": 0.7188, + "step": 45977 + }, + { + "epoch": 1.18, + "learning_rate": 1.3854937136167726e-06, + "loss": 0.6543, + "step": 45978 + }, + { + "epoch": 1.18, + "learning_rate": 1.3854681816518988e-06, + "loss": 0.7695, + "step": 45979 + }, + { + "epoch": 1.18, + "learning_rate": 1.3854426493918897e-06, + "loss": 0.7822, + "step": 45980 + }, + { + "epoch": 1.18, + "learning_rate": 1.385417116836765e-06, + "loss": 0.8047, + "step": 45981 + }, + { + "epoch": 1.18, + "learning_rate": 1.3853915839865437e-06, + "loss": 0.6846, + "step": 45982 + }, + { + "epoch": 1.18, + "learning_rate": 1.3853660508412462e-06, + "loss": 0.7295, + "step": 45983 + }, + { + "epoch": 1.18, + "learning_rate": 1.3853405174008914e-06, + "loss": 0.6299, + "step": 45984 + }, + { + "epoch": 1.18, + "learning_rate": 1.3853149836654993e-06, + "loss": 0.6714, + "step": 45985 + }, + { + "epoch": 1.18, + "learning_rate": 1.385289449635089e-06, + "loss": 0.3748, + "step": 45986 + }, + { + "epoch": 1.18, + "learning_rate": 1.3852639153096805e-06, + "loss": 0.7773, + "step": 45987 + }, + { + "epoch": 1.18, + "learning_rate": 1.3852383806892932e-06, + "loss": 0.7715, + "step": 45988 + }, + { + "epoch": 1.18, + "learning_rate": 1.3852128457739463e-06, + "loss": 0.5566, + "step": 45989 + }, + { + "epoch": 1.18, + "learning_rate": 1.3851873105636598e-06, + "loss": 0.7041, + "step": 45990 + }, + { + "epoch": 1.18, + "learning_rate": 1.3851617750584531e-06, + "loss": 0.6016, + "step": 45991 + }, + { + "epoch": 1.18, + "learning_rate": 1.3851362392583456e-06, + "loss": 0.6318, + "step": 45992 + }, + { + "epoch": 1.18, + "learning_rate": 1.3851107031633571e-06, + "loss": 0.45, + "step": 45993 + }, + { + "epoch": 1.18, + "learning_rate": 1.3850851667735072e-06, + "loss": 0.6797, + "step": 45994 + }, + { + "epoch": 1.18, + "learning_rate": 1.385059630088815e-06, + "loss": 0.7256, + "step": 45995 + }, + { + "epoch": 1.18, + "learning_rate": 1.3850340931093005e-06, + "loss": 0.5879, + "step": 45996 + }, + { + "epoch": 1.18, + "learning_rate": 1.385008555834983e-06, + "loss": 0.7422, + "step": 45997 + }, + { + "epoch": 1.18, + "learning_rate": 1.384983018265882e-06, + "loss": 0.7666, + "step": 45998 + }, + { + "epoch": 1.18, + "learning_rate": 1.3849574804020177e-06, + "loss": 0.4695, + "step": 45999 + }, + { + "epoch": 1.18, + "learning_rate": 1.3849319422434088e-06, + "loss": 0.6826, + "step": 46000 + }, + { + "epoch": 1.18, + "learning_rate": 1.3849064037900754e-06, + "loss": 0.6602, + "step": 46001 + }, + { + "epoch": 1.18, + "learning_rate": 1.3848808650420368e-06, + "loss": 0.8262, + "step": 46002 + }, + { + "epoch": 1.18, + "learning_rate": 1.3848553259993122e-06, + "loss": 0.5532, + "step": 46003 + }, + { + "epoch": 1.18, + "learning_rate": 1.384829786661922e-06, + "loss": 0.6797, + "step": 46004 + }, + { + "epoch": 1.18, + "learning_rate": 1.3848042470298853e-06, + "loss": 0.6797, + "step": 46005 + }, + { + "epoch": 1.18, + "learning_rate": 1.384778707103222e-06, + "loss": 0.6602, + "step": 46006 + }, + { + "epoch": 1.18, + "learning_rate": 1.3847531668819508e-06, + "loss": 0.748, + "step": 46007 + }, + { + "epoch": 1.18, + "learning_rate": 1.384727626366092e-06, + "loss": 0.6499, + "step": 46008 + }, + { + "epoch": 1.18, + "learning_rate": 1.3847020855556647e-06, + "loss": 0.563, + "step": 46009 + }, + { + "epoch": 1.18, + "learning_rate": 1.3846765444506892e-06, + "loss": 0.4871, + "step": 46010 + }, + { + "epoch": 1.18, + "learning_rate": 1.3846510030511842e-06, + "loss": 0.625, + "step": 46011 + }, + { + "epoch": 1.18, + "learning_rate": 1.38462546135717e-06, + "loss": 0.5859, + "step": 46012 + }, + { + "epoch": 1.18, + "learning_rate": 1.3845999193686652e-06, + "loss": 0.752, + "step": 46013 + }, + { + "epoch": 1.18, + "learning_rate": 1.3845743770856903e-06, + "loss": 0.5894, + "step": 46014 + }, + { + "epoch": 1.18, + "learning_rate": 1.3845488345082642e-06, + "loss": 0.6846, + "step": 46015 + }, + { + "epoch": 1.18, + "learning_rate": 1.3845232916364071e-06, + "loss": 0.6929, + "step": 46016 + }, + { + "epoch": 1.18, + "learning_rate": 1.384497748470138e-06, + "loss": 0.6221, + "step": 46017 + }, + { + "epoch": 1.18, + "learning_rate": 1.3844722050094765e-06, + "loss": 0.6787, + "step": 46018 + }, + { + "epoch": 1.18, + "learning_rate": 1.3844466612544426e-06, + "loss": 0.3318, + "step": 46019 + }, + { + "epoch": 1.18, + "learning_rate": 1.3844211172050555e-06, + "loss": 0.7002, + "step": 46020 + }, + { + "epoch": 1.18, + "learning_rate": 1.3843955728613347e-06, + "loss": 0.6953, + "step": 46021 + }, + { + "epoch": 1.18, + "learning_rate": 1.3843700282232999e-06, + "loss": 0.6895, + "step": 46022 + }, + { + "epoch": 1.18, + "learning_rate": 1.3843444832909708e-06, + "loss": 0.6797, + "step": 46023 + }, + { + "epoch": 1.18, + "learning_rate": 1.3843189380643666e-06, + "loss": 0.6992, + "step": 46024 + }, + { + "epoch": 1.18, + "learning_rate": 1.3842933925435071e-06, + "loss": 0.7603, + "step": 46025 + }, + { + "epoch": 1.18, + "learning_rate": 1.3842678467284122e-06, + "loss": 0.7144, + "step": 46026 + }, + { + "epoch": 1.18, + "learning_rate": 1.3842423006191006e-06, + "loss": 0.46, + "step": 46027 + }, + { + "epoch": 1.18, + "learning_rate": 1.3842167542155926e-06, + "loss": 0.4443, + "step": 46028 + }, + { + "epoch": 1.18, + "learning_rate": 1.3841912075179073e-06, + "loss": 0.541, + "step": 46029 + }, + { + "epoch": 1.18, + "learning_rate": 1.3841656605260644e-06, + "loss": 0.6582, + "step": 46030 + }, + { + "epoch": 1.18, + "learning_rate": 1.384140113240084e-06, + "loss": 0.6064, + "step": 46031 + }, + { + "epoch": 1.18, + "learning_rate": 1.3841145656599848e-06, + "loss": 0.6514, + "step": 46032 + }, + { + "epoch": 1.18, + "learning_rate": 1.3840890177857868e-06, + "loss": 0.6016, + "step": 46033 + }, + { + "epoch": 1.18, + "learning_rate": 1.3840634696175092e-06, + "loss": 0.7529, + "step": 46034 + }, + { + "epoch": 1.18, + "learning_rate": 1.3840379211551722e-06, + "loss": 0.5181, + "step": 46035 + }, + { + "epoch": 1.18, + "learning_rate": 1.3840123723987952e-06, + "loss": 0.5381, + "step": 46036 + }, + { + "epoch": 1.18, + "learning_rate": 1.3839868233483975e-06, + "loss": 0.566, + "step": 46037 + }, + { + "epoch": 1.18, + "learning_rate": 1.3839612740039983e-06, + "loss": 0.7134, + "step": 46038 + }, + { + "epoch": 1.18, + "learning_rate": 1.3839357243656182e-06, + "loss": 0.4961, + "step": 46039 + }, + { + "epoch": 1.18, + "learning_rate": 1.3839101744332758e-06, + "loss": 0.5344, + "step": 46040 + }, + { + "epoch": 1.18, + "learning_rate": 1.383884624206991e-06, + "loss": 0.7656, + "step": 46041 + }, + { + "epoch": 1.18, + "learning_rate": 1.3838590736867837e-06, + "loss": 0.7559, + "step": 46042 + }, + { + "epoch": 1.18, + "learning_rate": 1.3838335228726729e-06, + "loss": 0.6748, + "step": 46043 + }, + { + "epoch": 1.18, + "learning_rate": 1.3838079717646785e-06, + "loss": 0.6621, + "step": 46044 + }, + { + "epoch": 1.18, + "learning_rate": 1.38378242036282e-06, + "loss": 0.7261, + "step": 46045 + }, + { + "epoch": 1.18, + "learning_rate": 1.3837568686671168e-06, + "loss": 0.5962, + "step": 46046 + }, + { + "epoch": 1.18, + "learning_rate": 1.3837313166775887e-06, + "loss": 0.6523, + "step": 46047 + }, + { + "epoch": 1.18, + "learning_rate": 1.3837057643942554e-06, + "loss": 0.5171, + "step": 46048 + }, + { + "epoch": 1.18, + "learning_rate": 1.3836802118171357e-06, + "loss": 0.5742, + "step": 46049 + }, + { + "epoch": 1.18, + "learning_rate": 1.3836546589462504e-06, + "loss": 0.5635, + "step": 46050 + }, + { + "epoch": 1.18, + "learning_rate": 1.383629105781618e-06, + "loss": 0.7354, + "step": 46051 + }, + { + "epoch": 1.18, + "learning_rate": 1.3836035523232586e-06, + "loss": 0.7393, + "step": 46052 + }, + { + "epoch": 1.18, + "learning_rate": 1.3835779985711914e-06, + "loss": 0.5771, + "step": 46053 + }, + { + "epoch": 1.18, + "learning_rate": 1.383552444525436e-06, + "loss": 0.7158, + "step": 46054 + }, + { + "epoch": 1.18, + "learning_rate": 1.3835268901860121e-06, + "loss": 0.5796, + "step": 46055 + }, + { + "epoch": 1.18, + "learning_rate": 1.38350133555294e-06, + "loss": 0.8086, + "step": 46056 + }, + { + "epoch": 1.18, + "learning_rate": 1.3834757806262381e-06, + "loss": 0.5513, + "step": 46057 + }, + { + "epoch": 1.18, + "learning_rate": 1.3834502254059263e-06, + "loss": 0.832, + "step": 46058 + }, + { + "epoch": 1.18, + "learning_rate": 1.3834246698920241e-06, + "loss": 0.5542, + "step": 46059 + }, + { + "epoch": 1.18, + "learning_rate": 1.3833991140845518e-06, + "loss": 0.5254, + "step": 46060 + }, + { + "epoch": 1.18, + "learning_rate": 1.3833735579835284e-06, + "loss": 0.6699, + "step": 46061 + }, + { + "epoch": 1.18, + "learning_rate": 1.3833480015889733e-06, + "loss": 0.6035, + "step": 46062 + }, + { + "epoch": 1.18, + "learning_rate": 1.3833224449009062e-06, + "loss": 0.5776, + "step": 46063 + }, + { + "epoch": 1.18, + "learning_rate": 1.3832968879193469e-06, + "loss": 0.5693, + "step": 46064 + }, + { + "epoch": 1.18, + "learning_rate": 1.3832713306443144e-06, + "loss": 0.5378, + "step": 46065 + }, + { + "epoch": 1.18, + "learning_rate": 1.3832457730758292e-06, + "loss": 0.7881, + "step": 46066 + }, + { + "epoch": 1.18, + "learning_rate": 1.38322021521391e-06, + "loss": 0.666, + "step": 46067 + }, + { + "epoch": 1.18, + "learning_rate": 1.383194657058577e-06, + "loss": 0.8047, + "step": 46068 + }, + { + "epoch": 1.18, + "learning_rate": 1.3831690986098492e-06, + "loss": 0.7412, + "step": 46069 + }, + { + "epoch": 1.18, + "learning_rate": 1.3831435398677463e-06, + "loss": 0.6523, + "step": 46070 + }, + { + "epoch": 1.18, + "learning_rate": 1.3831179808322886e-06, + "loss": 0.7568, + "step": 46071 + }, + { + "epoch": 1.18, + "learning_rate": 1.3830924215034945e-06, + "loss": 0.8223, + "step": 46072 + }, + { + "epoch": 1.18, + "learning_rate": 1.3830668618813843e-06, + "loss": 0.6797, + "step": 46073 + }, + { + "epoch": 1.18, + "learning_rate": 1.3830413019659775e-06, + "loss": 0.6514, + "step": 46074 + }, + { + "epoch": 1.18, + "learning_rate": 1.3830157417572934e-06, + "loss": 0.5938, + "step": 46075 + }, + { + "epoch": 1.18, + "learning_rate": 1.3829901812553518e-06, + "loss": 0.3806, + "step": 46076 + }, + { + "epoch": 1.18, + "learning_rate": 1.3829646204601726e-06, + "loss": 0.6475, + "step": 46077 + }, + { + "epoch": 1.18, + "learning_rate": 1.3829390593717747e-06, + "loss": 0.4324, + "step": 46078 + }, + { + "epoch": 1.18, + "learning_rate": 1.382913497990178e-06, + "loss": 0.5596, + "step": 46079 + }, + { + "epoch": 1.18, + "learning_rate": 1.382887936315402e-06, + "loss": 0.6494, + "step": 46080 + }, + { + "epoch": 1.18, + "learning_rate": 1.3828623743474665e-06, + "loss": 0.7422, + "step": 46081 + }, + { + "epoch": 1.18, + "learning_rate": 1.3828368120863906e-06, + "loss": 0.7549, + "step": 46082 + }, + { + "epoch": 1.18, + "learning_rate": 1.3828112495321944e-06, + "loss": 0.769, + "step": 46083 + }, + { + "epoch": 1.18, + "learning_rate": 1.382785686684897e-06, + "loss": 0.6084, + "step": 46084 + }, + { + "epoch": 1.18, + "learning_rate": 1.3827601235445183e-06, + "loss": 0.7031, + "step": 46085 + }, + { + "epoch": 1.18, + "learning_rate": 1.3827345601110781e-06, + "loss": 0.7598, + "step": 46086 + }, + { + "epoch": 1.18, + "learning_rate": 1.382708996384595e-06, + "loss": 0.6953, + "step": 46087 + }, + { + "epoch": 1.18, + "learning_rate": 1.3826834323650898e-06, + "loss": 0.6621, + "step": 46088 + }, + { + "epoch": 1.18, + "learning_rate": 1.3826578680525812e-06, + "loss": 0.5112, + "step": 46089 + }, + { + "epoch": 1.18, + "learning_rate": 1.382632303447089e-06, + "loss": 0.8457, + "step": 46090 + }, + { + "epoch": 1.18, + "learning_rate": 1.3826067385486332e-06, + "loss": 0.7251, + "step": 46091 + }, + { + "epoch": 1.18, + "learning_rate": 1.3825811733572329e-06, + "loss": 0.6045, + "step": 46092 + }, + { + "epoch": 1.18, + "learning_rate": 1.3825556078729074e-06, + "loss": 0.6602, + "step": 46093 + }, + { + "epoch": 1.18, + "learning_rate": 1.3825300420956768e-06, + "loss": 0.792, + "step": 46094 + }, + { + "epoch": 1.18, + "learning_rate": 1.3825044760255607e-06, + "loss": 0.7168, + "step": 46095 + }, + { + "epoch": 1.18, + "learning_rate": 1.3824789096625788e-06, + "loss": 0.6646, + "step": 46096 + }, + { + "epoch": 1.18, + "learning_rate": 1.38245334300675e-06, + "loss": 0.5419, + "step": 46097 + }, + { + "epoch": 1.18, + "learning_rate": 1.3824277760580942e-06, + "loss": 0.6763, + "step": 46098 + }, + { + "epoch": 1.18, + "learning_rate": 1.3824022088166309e-06, + "loss": 0.5781, + "step": 46099 + }, + { + "epoch": 1.18, + "learning_rate": 1.3823766412823802e-06, + "loss": 0.4438, + "step": 46100 + }, + { + "epoch": 1.18, + "learning_rate": 1.3823510734553615e-06, + "loss": 0.5898, + "step": 46101 + }, + { + "epoch": 1.18, + "learning_rate": 1.3823255053355938e-06, + "loss": 0.5049, + "step": 46102 + }, + { + "epoch": 1.18, + "learning_rate": 1.3822999369230968e-06, + "loss": 0.6494, + "step": 46103 + }, + { + "epoch": 1.18, + "learning_rate": 1.3822743682178906e-06, + "loss": 0.5463, + "step": 46104 + }, + { + "epoch": 1.18, + "learning_rate": 1.3822487992199943e-06, + "loss": 0.583, + "step": 46105 + }, + { + "epoch": 1.18, + "learning_rate": 1.382223229929428e-06, + "loss": 0.6885, + "step": 46106 + }, + { + "epoch": 1.18, + "learning_rate": 1.3821976603462108e-06, + "loss": 0.7207, + "step": 46107 + }, + { + "epoch": 1.18, + "learning_rate": 1.3821720904703623e-06, + "loss": 0.667, + "step": 46108 + }, + { + "epoch": 1.18, + "learning_rate": 1.3821465203019025e-06, + "loss": 0.6147, + "step": 46109 + }, + { + "epoch": 1.18, + "learning_rate": 1.3821209498408504e-06, + "loss": 0.6255, + "step": 46110 + }, + { + "epoch": 1.18, + "learning_rate": 1.3820953790872261e-06, + "loss": 0.5923, + "step": 46111 + }, + { + "epoch": 1.18, + "learning_rate": 1.3820698080410487e-06, + "loss": 0.4932, + "step": 46112 + }, + { + "epoch": 1.18, + "learning_rate": 1.3820442367023381e-06, + "loss": 0.6426, + "step": 46113 + }, + { + "epoch": 1.18, + "learning_rate": 1.3820186650711136e-06, + "loss": 0.646, + "step": 46114 + }, + { + "epoch": 1.18, + "learning_rate": 1.3819930931473953e-06, + "loss": 0.5297, + "step": 46115 + }, + { + "epoch": 1.18, + "learning_rate": 1.3819675209312026e-06, + "loss": 0.7041, + "step": 46116 + }, + { + "epoch": 1.18, + "learning_rate": 1.3819419484225544e-06, + "loss": 0.6709, + "step": 46117 + }, + { + "epoch": 1.18, + "learning_rate": 1.381916375621471e-06, + "loss": 0.665, + "step": 46118 + }, + { + "epoch": 1.18, + "learning_rate": 1.381890802527972e-06, + "loss": 0.4744, + "step": 46119 + }, + { + "epoch": 1.18, + "learning_rate": 1.3818652291420767e-06, + "loss": 0.6279, + "step": 46120 + }, + { + "epoch": 1.18, + "learning_rate": 1.3818396554638048e-06, + "loss": 0.7002, + "step": 46121 + }, + { + "epoch": 1.18, + "learning_rate": 1.3818140814931756e-06, + "loss": 0.5981, + "step": 46122 + }, + { + "epoch": 1.18, + "learning_rate": 1.3817885072302091e-06, + "loss": 0.666, + "step": 46123 + }, + { + "epoch": 1.18, + "learning_rate": 1.3817629326749246e-06, + "loss": 0.7021, + "step": 46124 + }, + { + "epoch": 1.18, + "learning_rate": 1.381737357827342e-06, + "loss": 0.5532, + "step": 46125 + }, + { + "epoch": 1.18, + "learning_rate": 1.3817117826874803e-06, + "loss": 0.7119, + "step": 46126 + }, + { + "epoch": 1.18, + "learning_rate": 1.3816862072553598e-06, + "loss": 0.6831, + "step": 46127 + }, + { + "epoch": 1.18, + "learning_rate": 1.3816606315309993e-06, + "loss": 0.4307, + "step": 46128 + }, + { + "epoch": 1.18, + "learning_rate": 1.3816350555144192e-06, + "loss": 0.3828, + "step": 46129 + }, + { + "epoch": 1.18, + "learning_rate": 1.3816094792056382e-06, + "loss": 0.4521, + "step": 46130 + }, + { + "epoch": 1.18, + "learning_rate": 1.381583902604677e-06, + "loss": 0.6528, + "step": 46131 + }, + { + "epoch": 1.18, + "learning_rate": 1.3815583257115542e-06, + "loss": 0.8389, + "step": 46132 + }, + { + "epoch": 1.18, + "learning_rate": 1.3815327485262898e-06, + "loss": 0.7021, + "step": 46133 + }, + { + "epoch": 1.18, + "learning_rate": 1.3815071710489033e-06, + "loss": 0.6245, + "step": 46134 + }, + { + "epoch": 1.18, + "learning_rate": 1.3814815932794144e-06, + "loss": 0.7192, + "step": 46135 + }, + { + "epoch": 1.18, + "learning_rate": 1.3814560152178425e-06, + "loss": 0.6797, + "step": 46136 + }, + { + "epoch": 1.18, + "learning_rate": 1.3814304368642069e-06, + "loss": 0.6084, + "step": 46137 + }, + { + "epoch": 1.18, + "learning_rate": 1.381404858218528e-06, + "loss": 0.8994, + "step": 46138 + }, + { + "epoch": 1.18, + "learning_rate": 1.3813792792808248e-06, + "loss": 0.7773, + "step": 46139 + }, + { + "epoch": 1.18, + "learning_rate": 1.3813537000511172e-06, + "loss": 0.4563, + "step": 46140 + }, + { + "epoch": 1.18, + "learning_rate": 1.3813281205294246e-06, + "loss": 0.6416, + "step": 46141 + }, + { + "epoch": 1.18, + "learning_rate": 1.3813025407157663e-06, + "loss": 0.5757, + "step": 46142 + }, + { + "epoch": 1.18, + "learning_rate": 1.3812769606101622e-06, + "loss": 0.8057, + "step": 46143 + }, + { + "epoch": 1.18, + "learning_rate": 1.3812513802126322e-06, + "loss": 0.7344, + "step": 46144 + }, + { + "epoch": 1.18, + "learning_rate": 1.3812257995231952e-06, + "loss": 0.6924, + "step": 46145 + }, + { + "epoch": 1.18, + "learning_rate": 1.3812002185418715e-06, + "loss": 0.6953, + "step": 46146 + }, + { + "epoch": 1.18, + "learning_rate": 1.3811746372686801e-06, + "loss": 0.3853, + "step": 46147 + }, + { + "epoch": 1.18, + "learning_rate": 1.3811490557036406e-06, + "loss": 0.5433, + "step": 46148 + }, + { + "epoch": 1.18, + "learning_rate": 1.381123473846773e-06, + "loss": 0.6855, + "step": 46149 + }, + { + "epoch": 1.18, + "learning_rate": 1.3810978916980969e-06, + "loss": 0.5131, + "step": 46150 + }, + { + "epoch": 1.18, + "learning_rate": 1.3810723092576315e-06, + "loss": 0.5811, + "step": 46151 + }, + { + "epoch": 1.18, + "learning_rate": 1.3810467265253964e-06, + "loss": 0.6719, + "step": 46152 + }, + { + "epoch": 1.18, + "learning_rate": 1.3810211435014115e-06, + "loss": 0.6396, + "step": 46153 + }, + { + "epoch": 1.18, + "learning_rate": 1.3809955601856963e-06, + "loss": 0.686, + "step": 46154 + }, + { + "epoch": 1.18, + "learning_rate": 1.38096997657827e-06, + "loss": 0.6733, + "step": 46155 + }, + { + "epoch": 1.18, + "learning_rate": 1.3809443926791526e-06, + "loss": 0.7852, + "step": 46156 + }, + { + "epoch": 1.18, + "learning_rate": 1.3809188084883639e-06, + "loss": 0.7671, + "step": 46157 + }, + { + "epoch": 1.18, + "learning_rate": 1.3808932240059228e-06, + "loss": 0.5449, + "step": 46158 + }, + { + "epoch": 1.18, + "learning_rate": 1.3808676392318494e-06, + "loss": 0.4705, + "step": 46159 + }, + { + "epoch": 1.18, + "learning_rate": 1.3808420541661631e-06, + "loss": 0.7256, + "step": 46160 + }, + { + "epoch": 1.18, + "learning_rate": 1.380816468808884e-06, + "loss": 0.6177, + "step": 46161 + }, + { + "epoch": 1.18, + "learning_rate": 1.3807908831600308e-06, + "loss": 0.6042, + "step": 46162 + }, + { + "epoch": 1.18, + "learning_rate": 1.3807652972196238e-06, + "loss": 0.5913, + "step": 46163 + }, + { + "epoch": 1.18, + "learning_rate": 1.380739710987682e-06, + "loss": 0.6636, + "step": 46164 + }, + { + "epoch": 1.18, + "learning_rate": 1.3807141244642255e-06, + "loss": 0.7358, + "step": 46165 + }, + { + "epoch": 1.18, + "learning_rate": 1.3806885376492736e-06, + "loss": 0.6484, + "step": 46166 + }, + { + "epoch": 1.18, + "learning_rate": 1.3806629505428463e-06, + "loss": 0.6279, + "step": 46167 + }, + { + "epoch": 1.18, + "learning_rate": 1.3806373631449626e-06, + "loss": 0.6118, + "step": 46168 + }, + { + "epoch": 1.18, + "learning_rate": 1.3806117754556423e-06, + "loss": 0.748, + "step": 46169 + }, + { + "epoch": 1.18, + "learning_rate": 1.3805861874749053e-06, + "loss": 0.6318, + "step": 46170 + }, + { + "epoch": 1.18, + "learning_rate": 1.3805605992027709e-06, + "loss": 0.6943, + "step": 46171 + }, + { + "epoch": 1.18, + "learning_rate": 1.3805350106392586e-06, + "loss": 0.6851, + "step": 46172 + }, + { + "epoch": 1.18, + "learning_rate": 1.3805094217843882e-06, + "loss": 0.6216, + "step": 46173 + }, + { + "epoch": 1.18, + "learning_rate": 1.3804838326381791e-06, + "loss": 0.6318, + "step": 46174 + }, + { + "epoch": 1.18, + "learning_rate": 1.3804582432006513e-06, + "loss": 0.585, + "step": 46175 + }, + { + "epoch": 1.18, + "learning_rate": 1.380432653471824e-06, + "loss": 0.6108, + "step": 46176 + }, + { + "epoch": 1.18, + "learning_rate": 1.3804070634517168e-06, + "loss": 0.7344, + "step": 46177 + }, + { + "epoch": 1.18, + "learning_rate": 1.3803814731403495e-06, + "loss": 0.5537, + "step": 46178 + }, + { + "epoch": 1.18, + "learning_rate": 1.3803558825377416e-06, + "loss": 0.5952, + "step": 46179 + }, + { + "epoch": 1.18, + "learning_rate": 1.3803302916439128e-06, + "loss": 0.6484, + "step": 46180 + }, + { + "epoch": 1.18, + "learning_rate": 1.3803047004588827e-06, + "loss": 0.7231, + "step": 46181 + }, + { + "epoch": 1.18, + "learning_rate": 1.3802791089826704e-06, + "loss": 0.7549, + "step": 46182 + }, + { + "epoch": 1.18, + "learning_rate": 1.380253517215296e-06, + "loss": 0.6416, + "step": 46183 + }, + { + "epoch": 1.18, + "learning_rate": 1.380227925156779e-06, + "loss": 0.4795, + "step": 46184 + }, + { + "epoch": 1.18, + "learning_rate": 1.3802023328071389e-06, + "loss": 0.6587, + "step": 46185 + }, + { + "epoch": 1.18, + "learning_rate": 1.3801767401663956e-06, + "loss": 0.6021, + "step": 46186 + }, + { + "epoch": 1.18, + "learning_rate": 1.3801511472345683e-06, + "loss": 0.7129, + "step": 46187 + }, + { + "epoch": 1.18, + "learning_rate": 1.3801255540116764e-06, + "loss": 0.6396, + "step": 46188 + }, + { + "epoch": 1.18, + "learning_rate": 1.3800999604977403e-06, + "loss": 0.6709, + "step": 46189 + }, + { + "epoch": 1.18, + "learning_rate": 1.380074366692779e-06, + "loss": 0.4937, + "step": 46190 + }, + { + "epoch": 1.18, + "learning_rate": 1.3800487725968122e-06, + "loss": 0.7441, + "step": 46191 + }, + { + "epoch": 1.18, + "learning_rate": 1.3800231782098598e-06, + "loss": 0.6104, + "step": 46192 + }, + { + "epoch": 1.18, + "learning_rate": 1.3799975835319407e-06, + "loss": 0.7114, + "step": 46193 + }, + { + "epoch": 1.18, + "learning_rate": 1.3799719885630753e-06, + "loss": 0.6311, + "step": 46194 + }, + { + "epoch": 1.18, + "learning_rate": 1.3799463933032822e-06, + "loss": 0.5425, + "step": 46195 + }, + { + "epoch": 1.18, + "learning_rate": 1.3799207977525825e-06, + "loss": 0.6934, + "step": 46196 + }, + { + "epoch": 1.18, + "learning_rate": 1.3798952019109945e-06, + "loss": 0.6875, + "step": 46197 + }, + { + "epoch": 1.18, + "learning_rate": 1.379869605778538e-06, + "loss": 0.593, + "step": 46198 + }, + { + "epoch": 1.18, + "learning_rate": 1.379844009355233e-06, + "loss": 0.5986, + "step": 46199 + }, + { + "epoch": 1.18, + "learning_rate": 1.3798184126410987e-06, + "loss": 0.6099, + "step": 46200 + }, + { + "epoch": 1.18, + "learning_rate": 1.3797928156361552e-06, + "loss": 0.4824, + "step": 46201 + }, + { + "epoch": 1.18, + "learning_rate": 1.3797672183404217e-06, + "loss": 0.7959, + "step": 46202 + }, + { + "epoch": 1.18, + "learning_rate": 1.3797416207539179e-06, + "loss": 0.748, + "step": 46203 + }, + { + "epoch": 1.18, + "learning_rate": 1.3797160228766634e-06, + "loss": 0.7295, + "step": 46204 + }, + { + "epoch": 1.18, + "learning_rate": 1.3796904247086776e-06, + "loss": 0.5879, + "step": 46205 + }, + { + "epoch": 1.18, + "learning_rate": 1.3796648262499808e-06, + "loss": 0.6167, + "step": 46206 + }, + { + "epoch": 1.18, + "learning_rate": 1.3796392275005918e-06, + "loss": 0.6797, + "step": 46207 + }, + { + "epoch": 1.18, + "learning_rate": 1.37961362846053e-06, + "loss": 0.6211, + "step": 46208 + }, + { + "epoch": 1.18, + "learning_rate": 1.3795880291298162e-06, + "loss": 0.7129, + "step": 46209 + }, + { + "epoch": 1.18, + "learning_rate": 1.379562429508469e-06, + "loss": 0.4956, + "step": 46210 + }, + { + "epoch": 1.18, + "learning_rate": 1.379536829596509e-06, + "loss": 0.7686, + "step": 46211 + }, + { + "epoch": 1.18, + "learning_rate": 1.3795112293939542e-06, + "loss": 0.7852, + "step": 46212 + }, + { + "epoch": 1.18, + "learning_rate": 1.3794856289008255e-06, + "loss": 0.5259, + "step": 46213 + }, + { + "epoch": 1.18, + "learning_rate": 1.3794600281171418e-06, + "loss": 0.6953, + "step": 46214 + }, + { + "epoch": 1.18, + "learning_rate": 1.3794344270429235e-06, + "loss": 0.7017, + "step": 46215 + }, + { + "epoch": 1.18, + "learning_rate": 1.3794088256781892e-06, + "loss": 0.6621, + "step": 46216 + }, + { + "epoch": 1.18, + "learning_rate": 1.3793832240229595e-06, + "loss": 0.6934, + "step": 46217 + }, + { + "epoch": 1.18, + "learning_rate": 1.3793576220772529e-06, + "loss": 0.8701, + "step": 46218 + }, + { + "epoch": 1.18, + "learning_rate": 1.37933201984109e-06, + "loss": 0.686, + "step": 46219 + }, + { + "epoch": 1.18, + "learning_rate": 1.37930641731449e-06, + "loss": 0.6577, + "step": 46220 + }, + { + "epoch": 1.18, + "learning_rate": 1.3792808144974725e-06, + "loss": 0.6582, + "step": 46221 + }, + { + "epoch": 1.18, + "learning_rate": 1.3792552113900571e-06, + "loss": 0.6797, + "step": 46222 + }, + { + "epoch": 1.18, + "learning_rate": 1.3792296079922633e-06, + "loss": 0.7402, + "step": 46223 + }, + { + "epoch": 1.18, + "learning_rate": 1.379204004304111e-06, + "loss": 0.5576, + "step": 46224 + }, + { + "epoch": 1.18, + "learning_rate": 1.3791784003256196e-06, + "loss": 0.6328, + "step": 46225 + }, + { + "epoch": 1.18, + "learning_rate": 1.3791527960568087e-06, + "loss": 0.833, + "step": 46226 + }, + { + "epoch": 1.18, + "learning_rate": 1.379127191497698e-06, + "loss": 0.7759, + "step": 46227 + }, + { + "epoch": 1.18, + "learning_rate": 1.379101586648307e-06, + "loss": 0.7017, + "step": 46228 + }, + { + "epoch": 1.18, + "learning_rate": 1.3790759815086552e-06, + "loss": 0.5684, + "step": 46229 + }, + { + "epoch": 1.18, + "learning_rate": 1.3790503760787627e-06, + "loss": 0.5352, + "step": 46230 + }, + { + "epoch": 1.18, + "learning_rate": 1.3790247703586487e-06, + "loss": 0.5864, + "step": 46231 + }, + { + "epoch": 1.18, + "learning_rate": 1.3789991643483325e-06, + "loss": 0.7158, + "step": 46232 + }, + { + "epoch": 1.18, + "learning_rate": 1.3789735580478343e-06, + "loss": 0.5815, + "step": 46233 + }, + { + "epoch": 1.19, + "learning_rate": 1.3789479514571736e-06, + "loss": 0.626, + "step": 46234 + }, + { + "epoch": 1.19, + "learning_rate": 1.3789223445763695e-06, + "loss": 0.7549, + "step": 46235 + }, + { + "epoch": 1.19, + "learning_rate": 1.3788967374054424e-06, + "loss": 0.7686, + "step": 46236 + }, + { + "epoch": 1.19, + "learning_rate": 1.3788711299444113e-06, + "loss": 0.603, + "step": 46237 + }, + { + "epoch": 1.19, + "learning_rate": 1.3788455221932959e-06, + "loss": 0.6265, + "step": 46238 + }, + { + "epoch": 1.19, + "learning_rate": 1.378819914152116e-06, + "loss": 0.6689, + "step": 46239 + }, + { + "epoch": 1.19, + "learning_rate": 1.3787943058208912e-06, + "loss": 0.4475, + "step": 46240 + }, + { + "epoch": 1.19, + "learning_rate": 1.378768697199641e-06, + "loss": 0.6807, + "step": 46241 + }, + { + "epoch": 1.19, + "learning_rate": 1.3787430882883851e-06, + "loss": 0.7783, + "step": 46242 + }, + { + "epoch": 1.19, + "learning_rate": 1.3787174790871428e-06, + "loss": 0.668, + "step": 46243 + }, + { + "epoch": 1.19, + "learning_rate": 1.378691869595934e-06, + "loss": 0.6362, + "step": 46244 + }, + { + "epoch": 1.19, + "learning_rate": 1.3786662598147783e-06, + "loss": 0.687, + "step": 46245 + }, + { + "epoch": 1.19, + "learning_rate": 1.3786406497436951e-06, + "loss": 0.5752, + "step": 46246 + }, + { + "epoch": 1.19, + "learning_rate": 1.3786150393827044e-06, + "loss": 0.6992, + "step": 46247 + }, + { + "epoch": 1.19, + "learning_rate": 1.3785894287318255e-06, + "loss": 0.4724, + "step": 46248 + }, + { + "epoch": 1.19, + "learning_rate": 1.378563817791078e-06, + "loss": 0.6177, + "step": 46249 + }, + { + "epoch": 1.19, + "learning_rate": 1.3785382065604816e-06, + "loss": 0.5898, + "step": 46250 + }, + { + "epoch": 1.19, + "learning_rate": 1.378512595040056e-06, + "loss": 0.8047, + "step": 46251 + }, + { + "epoch": 1.19, + "learning_rate": 1.3784869832298205e-06, + "loss": 0.6655, + "step": 46252 + }, + { + "epoch": 1.19, + "learning_rate": 1.3784613711297953e-06, + "loss": 0.666, + "step": 46253 + }, + { + "epoch": 1.19, + "learning_rate": 1.378435758739999e-06, + "loss": 0.5156, + "step": 46254 + }, + { + "epoch": 1.19, + "learning_rate": 1.3784101460604527e-06, + "loss": 0.7432, + "step": 46255 + }, + { + "epoch": 1.19, + "learning_rate": 1.3783845330911745e-06, + "loss": 0.5151, + "step": 46256 + }, + { + "epoch": 1.19, + "learning_rate": 1.378358919832185e-06, + "loss": 0.6177, + "step": 46257 + }, + { + "epoch": 1.19, + "learning_rate": 1.378333306283503e-06, + "loss": 0.6431, + "step": 46258 + }, + { + "epoch": 1.19, + "learning_rate": 1.378307692445149e-06, + "loss": 0.6523, + "step": 46259 + }, + { + "epoch": 1.19, + "learning_rate": 1.3782820783171423e-06, + "loss": 0.583, + "step": 46260 + }, + { + "epoch": 1.19, + "learning_rate": 1.3782564638995021e-06, + "loss": 0.6079, + "step": 46261 + }, + { + "epoch": 1.19, + "learning_rate": 1.3782308491922485e-06, + "loss": 0.5913, + "step": 46262 + }, + { + "epoch": 1.19, + "learning_rate": 1.3782052341954009e-06, + "loss": 0.6006, + "step": 46263 + }, + { + "epoch": 1.19, + "learning_rate": 1.3781796189089788e-06, + "loss": 0.5684, + "step": 46264 + }, + { + "epoch": 1.19, + "learning_rate": 1.3781540033330022e-06, + "loss": 0.5913, + "step": 46265 + }, + { + "epoch": 1.19, + "learning_rate": 1.3781283874674903e-06, + "loss": 0.7725, + "step": 46266 + }, + { + "epoch": 1.19, + "learning_rate": 1.3781027713124628e-06, + "loss": 0.6865, + "step": 46267 + }, + { + "epoch": 1.19, + "learning_rate": 1.3780771548679395e-06, + "loss": 0.6553, + "step": 46268 + }, + { + "epoch": 1.19, + "learning_rate": 1.3780515381339402e-06, + "loss": 0.479, + "step": 46269 + }, + { + "epoch": 1.19, + "learning_rate": 1.3780259211104839e-06, + "loss": 0.6538, + "step": 46270 + }, + { + "epoch": 1.19, + "learning_rate": 1.3780003037975903e-06, + "loss": 0.7021, + "step": 46271 + }, + { + "epoch": 1.19, + "learning_rate": 1.3779746861952797e-06, + "loss": 0.4985, + "step": 46272 + }, + { + "epoch": 1.19, + "learning_rate": 1.3779490683035708e-06, + "loss": 0.665, + "step": 46273 + }, + { + "epoch": 1.19, + "learning_rate": 1.377923450122484e-06, + "loss": 0.6455, + "step": 46274 + }, + { + "epoch": 1.19, + "learning_rate": 1.3778978316520386e-06, + "loss": 0.6382, + "step": 46275 + }, + { + "epoch": 1.19, + "learning_rate": 1.3778722128922545e-06, + "loss": 0.5172, + "step": 46276 + }, + { + "epoch": 1.19, + "learning_rate": 1.3778465938431505e-06, + "loss": 0.6484, + "step": 46277 + }, + { + "epoch": 1.19, + "learning_rate": 1.377820974504747e-06, + "loss": 0.584, + "step": 46278 + }, + { + "epoch": 1.19, + "learning_rate": 1.377795354877063e-06, + "loss": 0.6033, + "step": 46279 + }, + { + "epoch": 1.19, + "learning_rate": 1.377769734960119e-06, + "loss": 0.5352, + "step": 46280 + }, + { + "epoch": 1.19, + "learning_rate": 1.3777441147539338e-06, + "loss": 0.667, + "step": 46281 + }, + { + "epoch": 1.19, + "learning_rate": 1.377718494258527e-06, + "loss": 0.5796, + "step": 46282 + }, + { + "epoch": 1.19, + "learning_rate": 1.377692873473919e-06, + "loss": 0.5571, + "step": 46283 + }, + { + "epoch": 1.19, + "learning_rate": 1.377667252400129e-06, + "loss": 0.7285, + "step": 46284 + }, + { + "epoch": 1.19, + "learning_rate": 1.3776416310371762e-06, + "loss": 0.5615, + "step": 46285 + }, + { + "epoch": 1.19, + "learning_rate": 1.3776160093850808e-06, + "loss": 0.749, + "step": 46286 + }, + { + "epoch": 1.19, + "learning_rate": 1.377590387443862e-06, + "loss": 0.7324, + "step": 46287 + }, + { + "epoch": 1.19, + "learning_rate": 1.3775647652135397e-06, + "loss": 0.7773, + "step": 46288 + }, + { + "epoch": 1.19, + "learning_rate": 1.3775391426941332e-06, + "loss": 0.5967, + "step": 46289 + }, + { + "epoch": 1.19, + "learning_rate": 1.3775135198856625e-06, + "loss": 0.667, + "step": 46290 + }, + { + "epoch": 1.19, + "learning_rate": 1.377487896788147e-06, + "loss": 0.625, + "step": 46291 + }, + { + "epoch": 1.19, + "learning_rate": 1.3774622734016067e-06, + "loss": 0.6436, + "step": 46292 + }, + { + "epoch": 1.19, + "learning_rate": 1.3774366497260605e-06, + "loss": 0.7148, + "step": 46293 + }, + { + "epoch": 1.19, + "learning_rate": 1.3774110257615286e-06, + "loss": 0.834, + "step": 46294 + }, + { + "epoch": 1.19, + "learning_rate": 1.3773854015080307e-06, + "loss": 0.5376, + "step": 46295 + }, + { + "epoch": 1.19, + "learning_rate": 1.3773597769655855e-06, + "loss": 0.585, + "step": 46296 + }, + { + "epoch": 1.19, + "learning_rate": 1.3773341521342138e-06, + "loss": 0.6597, + "step": 46297 + }, + { + "epoch": 1.19, + "learning_rate": 1.3773085270139344e-06, + "loss": 0.7354, + "step": 46298 + }, + { + "epoch": 1.19, + "learning_rate": 1.3772829016047674e-06, + "loss": 0.3857, + "step": 46299 + }, + { + "epoch": 1.19, + "learning_rate": 1.3772572759067323e-06, + "loss": 0.9062, + "step": 46300 + }, + { + "epoch": 1.19, + "learning_rate": 1.3772316499198484e-06, + "loss": 0.5396, + "step": 46301 + }, + { + "epoch": 1.19, + "learning_rate": 1.3772060236441356e-06, + "loss": 0.4641, + "step": 46302 + }, + { + "epoch": 1.19, + "learning_rate": 1.3771803970796135e-06, + "loss": 0.7031, + "step": 46303 + }, + { + "epoch": 1.19, + "learning_rate": 1.3771547702263018e-06, + "loss": 0.7852, + "step": 46304 + }, + { + "epoch": 1.19, + "learning_rate": 1.3771291430842203e-06, + "loss": 0.4868, + "step": 46305 + }, + { + "epoch": 1.19, + "learning_rate": 1.377103515653388e-06, + "loss": 0.6357, + "step": 46306 + }, + { + "epoch": 1.19, + "learning_rate": 1.3770778879338249e-06, + "loss": 0.6533, + "step": 46307 + }, + { + "epoch": 1.19, + "learning_rate": 1.3770522599255504e-06, + "loss": 0.6621, + "step": 46308 + }, + { + "epoch": 1.19, + "learning_rate": 1.377026631628585e-06, + "loss": 0.5723, + "step": 46309 + }, + { + "epoch": 1.19, + "learning_rate": 1.3770010030429472e-06, + "loss": 0.6641, + "step": 46310 + }, + { + "epoch": 1.19, + "learning_rate": 1.3769753741686567e-06, + "loss": 0.5914, + "step": 46311 + }, + { + "epoch": 1.19, + "learning_rate": 1.3769497450057338e-06, + "loss": 0.5479, + "step": 46312 + }, + { + "epoch": 1.19, + "learning_rate": 1.376924115554198e-06, + "loss": 0.4705, + "step": 46313 + }, + { + "epoch": 1.19, + "learning_rate": 1.3768984858140686e-06, + "loss": 0.71, + "step": 46314 + }, + { + "epoch": 1.19, + "learning_rate": 1.3768728557853653e-06, + "loss": 0.6177, + "step": 46315 + }, + { + "epoch": 1.19, + "learning_rate": 1.376847225468108e-06, + "loss": 0.6709, + "step": 46316 + }, + { + "epoch": 1.19, + "learning_rate": 1.3768215948623158e-06, + "loss": 0.613, + "step": 46317 + }, + { + "epoch": 1.19, + "learning_rate": 1.376795963968009e-06, + "loss": 0.8154, + "step": 46318 + }, + { + "epoch": 1.19, + "learning_rate": 1.3767703327852066e-06, + "loss": 0.666, + "step": 46319 + }, + { + "epoch": 1.19, + "learning_rate": 1.3767447013139286e-06, + "loss": 0.8779, + "step": 46320 + }, + { + "epoch": 1.19, + "learning_rate": 1.3767190695541943e-06, + "loss": 0.6494, + "step": 46321 + }, + { + "epoch": 1.19, + "learning_rate": 1.3766934375060237e-06, + "loss": 0.7793, + "step": 46322 + }, + { + "epoch": 1.19, + "learning_rate": 1.3766678051694363e-06, + "loss": 0.3867, + "step": 46323 + }, + { + "epoch": 1.19, + "learning_rate": 1.3766421725444516e-06, + "loss": 0.6082, + "step": 46324 + }, + { + "epoch": 1.19, + "learning_rate": 1.3766165396310894e-06, + "loss": 0.4414, + "step": 46325 + }, + { + "epoch": 1.19, + "learning_rate": 1.376590906429369e-06, + "loss": 0.7344, + "step": 46326 + }, + { + "epoch": 1.19, + "learning_rate": 1.3765652729393105e-06, + "loss": 0.5479, + "step": 46327 + }, + { + "epoch": 1.19, + "learning_rate": 1.3765396391609333e-06, + "loss": 0.6938, + "step": 46328 + }, + { + "epoch": 1.19, + "learning_rate": 1.3765140050942567e-06, + "loss": 0.7188, + "step": 46329 + }, + { + "epoch": 1.19, + "learning_rate": 1.376488370739301e-06, + "loss": 0.499, + "step": 46330 + }, + { + "epoch": 1.19, + "learning_rate": 1.3764627360960853e-06, + "loss": 0.5615, + "step": 46331 + }, + { + "epoch": 1.19, + "learning_rate": 1.3764371011646294e-06, + "loss": 0.6074, + "step": 46332 + }, + { + "epoch": 1.19, + "learning_rate": 1.3764114659449528e-06, + "loss": 0.5171, + "step": 46333 + }, + { + "epoch": 1.19, + "learning_rate": 1.3763858304370755e-06, + "loss": 0.4863, + "step": 46334 + }, + { + "epoch": 1.19, + "learning_rate": 1.3763601946410168e-06, + "loss": 0.708, + "step": 46335 + }, + { + "epoch": 1.19, + "learning_rate": 1.3763345585567963e-06, + "loss": 0.5132, + "step": 46336 + }, + { + "epoch": 1.19, + "learning_rate": 1.3763089221844338e-06, + "loss": 0.6309, + "step": 46337 + }, + { + "epoch": 1.19, + "learning_rate": 1.3762832855239486e-06, + "loss": 0.564, + "step": 46338 + }, + { + "epoch": 1.19, + "learning_rate": 1.376257648575361e-06, + "loss": 0.6611, + "step": 46339 + }, + { + "epoch": 1.19, + "learning_rate": 1.37623201133869e-06, + "loss": 0.464, + "step": 46340 + }, + { + "epoch": 1.19, + "learning_rate": 1.3762063738139554e-06, + "loss": 0.6709, + "step": 46341 + }, + { + "epoch": 1.19, + "learning_rate": 1.376180736001177e-06, + "loss": 0.5986, + "step": 46342 + }, + { + "epoch": 1.19, + "learning_rate": 1.3761550979003743e-06, + "loss": 0.7373, + "step": 46343 + }, + { + "epoch": 1.19, + "learning_rate": 1.376129459511567e-06, + "loss": 0.7666, + "step": 46344 + }, + { + "epoch": 1.19, + "learning_rate": 1.3761038208347748e-06, + "loss": 0.7964, + "step": 46345 + }, + { + "epoch": 1.19, + "learning_rate": 1.376078181870017e-06, + "loss": 0.665, + "step": 46346 + }, + { + "epoch": 1.19, + "learning_rate": 1.3760525426173132e-06, + "loss": 0.7969, + "step": 46347 + }, + { + "epoch": 1.19, + "learning_rate": 1.3760269030766835e-06, + "loss": 0.7539, + "step": 46348 + }, + { + "epoch": 1.19, + "learning_rate": 1.3760012632481473e-06, + "loss": 0.6567, + "step": 46349 + }, + { + "epoch": 1.19, + "learning_rate": 1.3759756231317242e-06, + "loss": 0.6602, + "step": 46350 + }, + { + "epoch": 1.19, + "learning_rate": 1.3759499827274339e-06, + "loss": 0.7217, + "step": 46351 + }, + { + "epoch": 1.19, + "learning_rate": 1.3759243420352959e-06, + "loss": 0.6357, + "step": 46352 + }, + { + "epoch": 1.19, + "learning_rate": 1.37589870105533e-06, + "loss": 0.7148, + "step": 46353 + }, + { + "epoch": 1.19, + "learning_rate": 1.3758730597875556e-06, + "loss": 0.3622, + "step": 46354 + }, + { + "epoch": 1.19, + "learning_rate": 1.3758474182319927e-06, + "loss": 0.8242, + "step": 46355 + }, + { + "epoch": 1.19, + "learning_rate": 1.3758217763886607e-06, + "loss": 0.5908, + "step": 46356 + }, + { + "epoch": 1.19, + "learning_rate": 1.3757961342575789e-06, + "loss": 0.5151, + "step": 46357 + }, + { + "epoch": 1.19, + "learning_rate": 1.3757704918387676e-06, + "loss": 0.5889, + "step": 46358 + }, + { + "epoch": 1.19, + "learning_rate": 1.3757448491322462e-06, + "loss": 0.7725, + "step": 46359 + }, + { + "epoch": 1.19, + "learning_rate": 1.375719206138034e-06, + "loss": 0.5466, + "step": 46360 + }, + { + "epoch": 1.19, + "learning_rate": 1.3756935628561508e-06, + "loss": 0.8428, + "step": 46361 + }, + { + "epoch": 1.19, + "learning_rate": 1.3756679192866165e-06, + "loss": 0.8096, + "step": 46362 + }, + { + "epoch": 1.19, + "learning_rate": 1.3756422754294503e-06, + "loss": 0.6909, + "step": 46363 + }, + { + "epoch": 1.19, + "learning_rate": 1.3756166312846724e-06, + "loss": 0.6143, + "step": 46364 + }, + { + "epoch": 1.19, + "learning_rate": 1.375590986852302e-06, + "loss": 0.667, + "step": 46365 + }, + { + "epoch": 1.19, + "learning_rate": 1.3755653421323591e-06, + "loss": 0.6484, + "step": 46366 + }, + { + "epoch": 1.19, + "learning_rate": 1.3755396971248627e-06, + "loss": 0.7412, + "step": 46367 + }, + { + "epoch": 1.19, + "learning_rate": 1.3755140518298331e-06, + "loss": 0.4711, + "step": 46368 + }, + { + "epoch": 1.19, + "learning_rate": 1.3754884062472894e-06, + "loss": 0.6543, + "step": 46369 + }, + { + "epoch": 1.19, + "learning_rate": 1.375462760377252e-06, + "loss": 0.6279, + "step": 46370 + }, + { + "epoch": 1.19, + "learning_rate": 1.3754371142197394e-06, + "loss": 0.7305, + "step": 46371 + }, + { + "epoch": 1.19, + "learning_rate": 1.3754114677747721e-06, + "loss": 0.5688, + "step": 46372 + }, + { + "epoch": 1.19, + "learning_rate": 1.3753858210423693e-06, + "loss": 0.6875, + "step": 46373 + }, + { + "epoch": 1.19, + "learning_rate": 1.3753601740225514e-06, + "loss": 0.6836, + "step": 46374 + }, + { + "epoch": 1.19, + "learning_rate": 1.3753345267153372e-06, + "loss": 0.6699, + "step": 46375 + }, + { + "epoch": 1.19, + "learning_rate": 1.3753088791207466e-06, + "loss": 0.6748, + "step": 46376 + }, + { + "epoch": 1.19, + "learning_rate": 1.375283231238799e-06, + "loss": 0.7227, + "step": 46377 + }, + { + "epoch": 1.19, + "learning_rate": 1.3752575830695145e-06, + "loss": 0.667, + "step": 46378 + }, + { + "epoch": 1.19, + "learning_rate": 1.3752319346129124e-06, + "loss": 0.6716, + "step": 46379 + }, + { + "epoch": 1.19, + "learning_rate": 1.3752062858690126e-06, + "loss": 0.6538, + "step": 46380 + }, + { + "epoch": 1.19, + "learning_rate": 1.3751806368378346e-06, + "loss": 0.5703, + "step": 46381 + }, + { + "epoch": 1.19, + "learning_rate": 1.375154987519398e-06, + "loss": 0.6641, + "step": 46382 + }, + { + "epoch": 1.19, + "learning_rate": 1.3751293379137226e-06, + "loss": 0.8145, + "step": 46383 + }, + { + "epoch": 1.19, + "learning_rate": 1.3751036880208275e-06, + "loss": 0.7168, + "step": 46384 + }, + { + "epoch": 1.19, + "learning_rate": 1.3750780378407334e-06, + "loss": 0.584, + "step": 46385 + }, + { + "epoch": 1.19, + "learning_rate": 1.3750523873734587e-06, + "loss": 0.5604, + "step": 46386 + }, + { + "epoch": 1.19, + "learning_rate": 1.375026736619024e-06, + "loss": 0.7227, + "step": 46387 + }, + { + "epoch": 1.19, + "learning_rate": 1.3750010855774484e-06, + "loss": 0.5801, + "step": 46388 + }, + { + "epoch": 1.19, + "learning_rate": 1.3749754342487516e-06, + "loss": 0.7168, + "step": 46389 + }, + { + "epoch": 1.19, + "learning_rate": 1.3749497826329538e-06, + "loss": 0.7129, + "step": 46390 + }, + { + "epoch": 1.19, + "learning_rate": 1.3749241307300738e-06, + "loss": 0.5906, + "step": 46391 + }, + { + "epoch": 1.19, + "learning_rate": 1.3748984785401317e-06, + "loss": 0.4727, + "step": 46392 + }, + { + "epoch": 1.19, + "learning_rate": 1.374872826063147e-06, + "loss": 0.749, + "step": 46393 + }, + { + "epoch": 1.19, + "learning_rate": 1.3748471732991393e-06, + "loss": 0.5818, + "step": 46394 + }, + { + "epoch": 1.19, + "learning_rate": 1.374821520248129e-06, + "loss": 0.6768, + "step": 46395 + }, + { + "epoch": 1.19, + "learning_rate": 1.3747958669101346e-06, + "loss": 0.5884, + "step": 46396 + }, + { + "epoch": 1.19, + "learning_rate": 1.3747702132851763e-06, + "loss": 0.7678, + "step": 46397 + }, + { + "epoch": 1.19, + "learning_rate": 1.3747445593732736e-06, + "loss": 0.6084, + "step": 46398 + }, + { + "epoch": 1.19, + "learning_rate": 1.3747189051744462e-06, + "loss": 0.668, + "step": 46399 + }, + { + "epoch": 1.19, + "learning_rate": 1.374693250688714e-06, + "loss": 0.7153, + "step": 46400 + }, + { + "epoch": 1.19, + "learning_rate": 1.3746675959160962e-06, + "loss": 0.6963, + "step": 46401 + }, + { + "epoch": 1.19, + "learning_rate": 1.3746419408566127e-06, + "loss": 0.6079, + "step": 46402 + }, + { + "epoch": 1.19, + "learning_rate": 1.3746162855102832e-06, + "loss": 0.6523, + "step": 46403 + }, + { + "epoch": 1.19, + "learning_rate": 1.3745906298771273e-06, + "loss": 0.7139, + "step": 46404 + }, + { + "epoch": 1.19, + "learning_rate": 1.3745649739571642e-06, + "loss": 0.7705, + "step": 46405 + }, + { + "epoch": 1.19, + "learning_rate": 1.3745393177504144e-06, + "loss": 0.7446, + "step": 46406 + }, + { + "epoch": 1.19, + "learning_rate": 1.3745136612568967e-06, + "loss": 0.6611, + "step": 46407 + }, + { + "epoch": 1.19, + "learning_rate": 1.3744880044766314e-06, + "loss": 0.6255, + "step": 46408 + }, + { + "epoch": 1.19, + "learning_rate": 1.3744623474096374e-06, + "loss": 0.6079, + "step": 46409 + }, + { + "epoch": 1.19, + "learning_rate": 1.3744366900559353e-06, + "loss": 0.6572, + "step": 46410 + }, + { + "epoch": 1.19, + "learning_rate": 1.3744110324155441e-06, + "loss": 0.5571, + "step": 46411 + }, + { + "epoch": 1.19, + "learning_rate": 1.3743853744884835e-06, + "loss": 0.5903, + "step": 46412 + }, + { + "epoch": 1.19, + "learning_rate": 1.3743597162747732e-06, + "loss": 0.6968, + "step": 46413 + }, + { + "epoch": 1.19, + "learning_rate": 1.3743340577744328e-06, + "loss": 0.5469, + "step": 46414 + }, + { + "epoch": 1.19, + "learning_rate": 1.3743083989874823e-06, + "loss": 0.7842, + "step": 46415 + }, + { + "epoch": 1.19, + "learning_rate": 1.3742827399139412e-06, + "loss": 0.6177, + "step": 46416 + }, + { + "epoch": 1.19, + "learning_rate": 1.3742570805538285e-06, + "loss": 0.4458, + "step": 46417 + }, + { + "epoch": 1.19, + "learning_rate": 1.3742314209071646e-06, + "loss": 0.6348, + "step": 46418 + }, + { + "epoch": 1.19, + "learning_rate": 1.3742057609739687e-06, + "loss": 0.6875, + "step": 46419 + }, + { + "epoch": 1.19, + "learning_rate": 1.374180100754261e-06, + "loss": 0.7915, + "step": 46420 + }, + { + "epoch": 1.19, + "learning_rate": 1.3741544402480606e-06, + "loss": 0.8682, + "step": 46421 + }, + { + "epoch": 1.19, + "learning_rate": 1.3741287794553878e-06, + "loss": 0.5703, + "step": 46422 + }, + { + "epoch": 1.19, + "learning_rate": 1.3741031183762611e-06, + "loss": 0.6357, + "step": 46423 + }, + { + "epoch": 1.19, + "learning_rate": 1.3740774570107012e-06, + "loss": 0.708, + "step": 46424 + }, + { + "epoch": 1.19, + "learning_rate": 1.3740517953587274e-06, + "loss": 0.6885, + "step": 46425 + }, + { + "epoch": 1.19, + "learning_rate": 1.3740261334203593e-06, + "loss": 0.5391, + "step": 46426 + }, + { + "epoch": 1.19, + "learning_rate": 1.3740004711956166e-06, + "loss": 0.5996, + "step": 46427 + }, + { + "epoch": 1.19, + "learning_rate": 1.3739748086845189e-06, + "loss": 0.4547, + "step": 46428 + }, + { + "epoch": 1.19, + "learning_rate": 1.373949145887086e-06, + "loss": 0.6958, + "step": 46429 + }, + { + "epoch": 1.19, + "learning_rate": 1.3739234828033372e-06, + "loss": 0.7354, + "step": 46430 + }, + { + "epoch": 1.19, + "learning_rate": 1.3738978194332926e-06, + "loss": 0.6592, + "step": 46431 + }, + { + "epoch": 1.19, + "learning_rate": 1.3738721557769715e-06, + "loss": 0.5762, + "step": 46432 + }, + { + "epoch": 1.19, + "learning_rate": 1.3738464918343938e-06, + "loss": 0.7656, + "step": 46433 + }, + { + "epoch": 1.19, + "learning_rate": 1.373820827605579e-06, + "loss": 0.6304, + "step": 46434 + }, + { + "epoch": 1.19, + "learning_rate": 1.373795163090547e-06, + "loss": 0.6333, + "step": 46435 + }, + { + "epoch": 1.19, + "learning_rate": 1.3737694982893166e-06, + "loss": 0.7476, + "step": 46436 + }, + { + "epoch": 1.19, + "learning_rate": 1.3737438332019085e-06, + "loss": 0.7368, + "step": 46437 + }, + { + "epoch": 1.19, + "learning_rate": 1.373718167828342e-06, + "loss": 0.582, + "step": 46438 + }, + { + "epoch": 1.19, + "learning_rate": 1.3736925021686366e-06, + "loss": 0.9189, + "step": 46439 + }, + { + "epoch": 1.19, + "learning_rate": 1.3736668362228119e-06, + "loss": 0.6172, + "step": 46440 + }, + { + "epoch": 1.19, + "learning_rate": 1.373641169990888e-06, + "loss": 0.6675, + "step": 46441 + }, + { + "epoch": 1.19, + "learning_rate": 1.3736155034728838e-06, + "loss": 0.5894, + "step": 46442 + }, + { + "epoch": 1.19, + "learning_rate": 1.3735898366688196e-06, + "loss": 0.5884, + "step": 46443 + }, + { + "epoch": 1.19, + "learning_rate": 1.3735641695787147e-06, + "loss": 0.5874, + "step": 46444 + }, + { + "epoch": 1.19, + "learning_rate": 1.373538502202589e-06, + "loss": 0.564, + "step": 46445 + }, + { + "epoch": 1.19, + "learning_rate": 1.3735128345404623e-06, + "loss": 0.7559, + "step": 46446 + }, + { + "epoch": 1.19, + "learning_rate": 1.3734871665923537e-06, + "loss": 0.563, + "step": 46447 + }, + { + "epoch": 1.19, + "learning_rate": 1.3734614983582832e-06, + "loss": 0.6323, + "step": 46448 + }, + { + "epoch": 1.19, + "learning_rate": 1.3734358298382707e-06, + "loss": 0.707, + "step": 46449 + }, + { + "epoch": 1.19, + "learning_rate": 1.3734101610323352e-06, + "loss": 0.8271, + "step": 46450 + }, + { + "epoch": 1.19, + "learning_rate": 1.373384491940497e-06, + "loss": 0.6416, + "step": 46451 + }, + { + "epoch": 1.19, + "learning_rate": 1.3733588225627752e-06, + "loss": 0.7939, + "step": 46452 + }, + { + "epoch": 1.19, + "learning_rate": 1.3733331528991897e-06, + "loss": 0.54, + "step": 46453 + }, + { + "epoch": 1.19, + "learning_rate": 1.3733074829497601e-06, + "loss": 0.5542, + "step": 46454 + }, + { + "epoch": 1.19, + "learning_rate": 1.3732818127145065e-06, + "loss": 0.7197, + "step": 46455 + }, + { + "epoch": 1.19, + "learning_rate": 1.3732561421934481e-06, + "loss": 0.6523, + "step": 46456 + }, + { + "epoch": 1.19, + "learning_rate": 1.3732304713866044e-06, + "loss": 0.5643, + "step": 46457 + }, + { + "epoch": 1.19, + "learning_rate": 1.3732048002939953e-06, + "loss": 0.6064, + "step": 46458 + }, + { + "epoch": 1.19, + "learning_rate": 1.3731791289156404e-06, + "loss": 0.7812, + "step": 46459 + }, + { + "epoch": 1.19, + "learning_rate": 1.37315345725156e-06, + "loss": 0.71, + "step": 46460 + }, + { + "epoch": 1.19, + "learning_rate": 1.3731277853017723e-06, + "loss": 0.6846, + "step": 46461 + }, + { + "epoch": 1.19, + "learning_rate": 1.3731021130662983e-06, + "loss": 0.8594, + "step": 46462 + }, + { + "epoch": 1.19, + "learning_rate": 1.3730764405451569e-06, + "loss": 0.7471, + "step": 46463 + }, + { + "epoch": 1.19, + "learning_rate": 1.3730507677383684e-06, + "loss": 0.4617, + "step": 46464 + }, + { + "epoch": 1.19, + "learning_rate": 1.3730250946459518e-06, + "loss": 0.6162, + "step": 46465 + }, + { + "epoch": 1.19, + "learning_rate": 1.372999421267927e-06, + "loss": 0.6816, + "step": 46466 + }, + { + "epoch": 1.19, + "learning_rate": 1.372973747604314e-06, + "loss": 0.5654, + "step": 46467 + }, + { + "epoch": 1.19, + "learning_rate": 1.372948073655132e-06, + "loss": 0.6235, + "step": 46468 + }, + { + "epoch": 1.19, + "learning_rate": 1.3729223994204007e-06, + "loss": 0.5713, + "step": 46469 + }, + { + "epoch": 1.19, + "learning_rate": 1.3728967249001398e-06, + "loss": 0.6167, + "step": 46470 + }, + { + "epoch": 1.19, + "learning_rate": 1.3728710500943695e-06, + "loss": 0.646, + "step": 46471 + }, + { + "epoch": 1.19, + "learning_rate": 1.3728453750031084e-06, + "loss": 0.7607, + "step": 46472 + }, + { + "epoch": 1.19, + "learning_rate": 1.372819699626377e-06, + "loss": 0.7393, + "step": 46473 + }, + { + "epoch": 1.19, + "learning_rate": 1.3727940239641944e-06, + "loss": 0.6182, + "step": 46474 + }, + { + "epoch": 1.19, + "learning_rate": 1.3727683480165813e-06, + "loss": 0.5801, + "step": 46475 + }, + { + "epoch": 1.19, + "learning_rate": 1.372742671783556e-06, + "loss": 0.6743, + "step": 46476 + }, + { + "epoch": 1.19, + "learning_rate": 1.372716995265139e-06, + "loss": 0.6294, + "step": 46477 + }, + { + "epoch": 1.19, + "learning_rate": 1.3726913184613493e-06, + "loss": 0.6953, + "step": 46478 + }, + { + "epoch": 1.19, + "learning_rate": 1.3726656413722074e-06, + "loss": 0.5188, + "step": 46479 + }, + { + "epoch": 1.19, + "learning_rate": 1.3726399639977326e-06, + "loss": 0.7549, + "step": 46480 + }, + { + "epoch": 1.19, + "learning_rate": 1.3726142863379447e-06, + "loss": 0.6953, + "step": 46481 + }, + { + "epoch": 1.19, + "learning_rate": 1.3725886083928625e-06, + "loss": 0.7788, + "step": 46482 + }, + { + "epoch": 1.19, + "learning_rate": 1.372562930162507e-06, + "loss": 0.6875, + "step": 46483 + }, + { + "epoch": 1.19, + "learning_rate": 1.3725372516468968e-06, + "loss": 0.4331, + "step": 46484 + }, + { + "epoch": 1.19, + "learning_rate": 1.3725115728460523e-06, + "loss": 0.6855, + "step": 46485 + }, + { + "epoch": 1.19, + "learning_rate": 1.3724858937599924e-06, + "loss": 0.6938, + "step": 46486 + }, + { + "epoch": 1.19, + "learning_rate": 1.3724602143887376e-06, + "loss": 0.4797, + "step": 46487 + }, + { + "epoch": 1.19, + "learning_rate": 1.3724345347323067e-06, + "loss": 0.6475, + "step": 46488 + }, + { + "epoch": 1.19, + "learning_rate": 1.37240885479072e-06, + "loss": 0.7217, + "step": 46489 + }, + { + "epoch": 1.19, + "learning_rate": 1.372383174563997e-06, + "loss": 0.5977, + "step": 46490 + }, + { + "epoch": 1.19, + "learning_rate": 1.3723574940521575e-06, + "loss": 0.7227, + "step": 46491 + }, + { + "epoch": 1.19, + "learning_rate": 1.3723318132552206e-06, + "loss": 0.5747, + "step": 46492 + }, + { + "epoch": 1.19, + "learning_rate": 1.3723061321732066e-06, + "loss": 0.5688, + "step": 46493 + }, + { + "epoch": 1.19, + "learning_rate": 1.372280450806135e-06, + "loss": 0.6855, + "step": 46494 + }, + { + "epoch": 1.19, + "learning_rate": 1.3722547691540252e-06, + "loss": 0.5981, + "step": 46495 + }, + { + "epoch": 1.19, + "learning_rate": 1.372229087216897e-06, + "loss": 0.6494, + "step": 46496 + }, + { + "epoch": 1.19, + "learning_rate": 1.3722034049947701e-06, + "loss": 0.7354, + "step": 46497 + }, + { + "epoch": 1.19, + "learning_rate": 1.3721777224876642e-06, + "loss": 0.6455, + "step": 46498 + }, + { + "epoch": 1.19, + "learning_rate": 1.372152039695599e-06, + "loss": 0.7773, + "step": 46499 + }, + { + "epoch": 1.19, + "learning_rate": 1.3721263566185944e-06, + "loss": 0.6455, + "step": 46500 + }, + { + "epoch": 1.19, + "learning_rate": 1.3721006732566692e-06, + "loss": 0.7065, + "step": 46501 + }, + { + "epoch": 1.19, + "learning_rate": 1.372074989609844e-06, + "loss": 0.6807, + "step": 46502 + }, + { + "epoch": 1.19, + "learning_rate": 1.372049305678138e-06, + "loss": 0.7764, + "step": 46503 + }, + { + "epoch": 1.19, + "learning_rate": 1.3720236214615709e-06, + "loss": 0.7627, + "step": 46504 + }, + { + "epoch": 1.19, + "learning_rate": 1.3719979369601623e-06, + "loss": 0.875, + "step": 46505 + }, + { + "epoch": 1.19, + "learning_rate": 1.3719722521739324e-06, + "loss": 0.6396, + "step": 46506 + }, + { + "epoch": 1.19, + "learning_rate": 1.3719465671028999e-06, + "loss": 0.4226, + "step": 46507 + }, + { + "epoch": 1.19, + "learning_rate": 1.3719208817470854e-06, + "loss": 0.6357, + "step": 46508 + }, + { + "epoch": 1.19, + "learning_rate": 1.3718951961065077e-06, + "loss": 0.6753, + "step": 46509 + }, + { + "epoch": 1.19, + "learning_rate": 1.3718695101811874e-06, + "loss": 0.624, + "step": 46510 + }, + { + "epoch": 1.19, + "learning_rate": 1.3718438239711438e-06, + "loss": 0.6318, + "step": 46511 + }, + { + "epoch": 1.19, + "learning_rate": 1.3718181374763965e-06, + "loss": 0.8262, + "step": 46512 + }, + { + "epoch": 1.19, + "learning_rate": 1.3717924506969646e-06, + "loss": 0.647, + "step": 46513 + }, + { + "epoch": 1.19, + "learning_rate": 1.3717667636328689e-06, + "loss": 0.6626, + "step": 46514 + }, + { + "epoch": 1.19, + "learning_rate": 1.3717410762841282e-06, + "loss": 0.7109, + "step": 46515 + }, + { + "epoch": 1.19, + "learning_rate": 1.3717153886507623e-06, + "loss": 0.5303, + "step": 46516 + }, + { + "epoch": 1.19, + "learning_rate": 1.3716897007327911e-06, + "loss": 0.7295, + "step": 46517 + }, + { + "epoch": 1.19, + "learning_rate": 1.3716640125302344e-06, + "loss": 0.748, + "step": 46518 + }, + { + "epoch": 1.19, + "learning_rate": 1.3716383240431117e-06, + "loss": 0.6255, + "step": 46519 + }, + { + "epoch": 1.19, + "learning_rate": 1.3716126352714426e-06, + "loss": 0.4932, + "step": 46520 + }, + { + "epoch": 1.19, + "learning_rate": 1.3715869462152467e-06, + "loss": 0.5425, + "step": 46521 + }, + { + "epoch": 1.19, + "learning_rate": 1.3715612568745435e-06, + "loss": 0.7266, + "step": 46522 + }, + { + "epoch": 1.19, + "learning_rate": 1.3715355672493534e-06, + "loss": 0.8799, + "step": 46523 + }, + { + "epoch": 1.19, + "learning_rate": 1.3715098773396952e-06, + "loss": 0.6323, + "step": 46524 + }, + { + "epoch": 1.19, + "learning_rate": 1.3714841871455893e-06, + "loss": 0.5298, + "step": 46525 + }, + { + "epoch": 1.19, + "learning_rate": 1.3714584966670549e-06, + "loss": 0.584, + "step": 46526 + }, + { + "epoch": 1.19, + "learning_rate": 1.3714328059041117e-06, + "loss": 0.5024, + "step": 46527 + }, + { + "epoch": 1.19, + "learning_rate": 1.3714071148567794e-06, + "loss": 0.7393, + "step": 46528 + }, + { + "epoch": 1.19, + "learning_rate": 1.371381423525078e-06, + "loss": 0.6655, + "step": 46529 + }, + { + "epoch": 1.19, + "learning_rate": 1.371355731909027e-06, + "loss": 0.6807, + "step": 46530 + }, + { + "epoch": 1.19, + "learning_rate": 1.371330040008646e-06, + "loss": 0.6074, + "step": 46531 + }, + { + "epoch": 1.19, + "learning_rate": 1.3713043478239542e-06, + "loss": 0.4897, + "step": 46532 + }, + { + "epoch": 1.19, + "learning_rate": 1.371278655354972e-06, + "loss": 0.7061, + "step": 46533 + }, + { + "epoch": 1.19, + "learning_rate": 1.3712529626017188e-06, + "loss": 0.728, + "step": 46534 + }, + { + "epoch": 1.19, + "learning_rate": 1.3712272695642144e-06, + "loss": 0.6699, + "step": 46535 + }, + { + "epoch": 1.19, + "learning_rate": 1.3712015762424783e-06, + "loss": 0.668, + "step": 46536 + }, + { + "epoch": 1.19, + "learning_rate": 1.37117588263653e-06, + "loss": 0.5786, + "step": 46537 + }, + { + "epoch": 1.19, + "learning_rate": 1.3711501887463896e-06, + "loss": 0.4648, + "step": 46538 + }, + { + "epoch": 1.19, + "learning_rate": 1.3711244945720765e-06, + "loss": 0.623, + "step": 46539 + }, + { + "epoch": 1.19, + "learning_rate": 1.3710988001136108e-06, + "loss": 0.8164, + "step": 46540 + }, + { + "epoch": 1.19, + "learning_rate": 1.3710731053710113e-06, + "loss": 0.7285, + "step": 46541 + }, + { + "epoch": 1.19, + "learning_rate": 1.3710474103442985e-06, + "loss": 0.687, + "step": 46542 + }, + { + "epoch": 1.19, + "learning_rate": 1.3710217150334912e-06, + "loss": 0.5708, + "step": 46543 + }, + { + "epoch": 1.19, + "learning_rate": 1.3709960194386105e-06, + "loss": 0.4312, + "step": 46544 + }, + { + "epoch": 1.19, + "learning_rate": 1.3709703235596748e-06, + "loss": 0.6567, + "step": 46545 + }, + { + "epoch": 1.19, + "learning_rate": 1.370944627396704e-06, + "loss": 0.6494, + "step": 46546 + }, + { + "epoch": 1.19, + "learning_rate": 1.370918930949718e-06, + "loss": 0.646, + "step": 46547 + }, + { + "epoch": 1.19, + "learning_rate": 1.3708932342187366e-06, + "loss": 0.6377, + "step": 46548 + }, + { + "epoch": 1.19, + "learning_rate": 1.3708675372037791e-06, + "loss": 0.6167, + "step": 46549 + }, + { + "epoch": 1.19, + "learning_rate": 1.3708418399048657e-06, + "loss": 0.5125, + "step": 46550 + }, + { + "epoch": 1.19, + "learning_rate": 1.3708161423220154e-06, + "loss": 0.4064, + "step": 46551 + }, + { + "epoch": 1.19, + "learning_rate": 1.3707904444552488e-06, + "loss": 0.5664, + "step": 46552 + }, + { + "epoch": 1.19, + "learning_rate": 1.3707647463045845e-06, + "loss": 0.6987, + "step": 46553 + }, + { + "epoch": 1.19, + "learning_rate": 1.3707390478700427e-06, + "loss": 0.6074, + "step": 46554 + }, + { + "epoch": 1.19, + "learning_rate": 1.3707133491516431e-06, + "loss": 0.5466, + "step": 46555 + }, + { + "epoch": 1.19, + "learning_rate": 1.3706876501494053e-06, + "loss": 0.6279, + "step": 46556 + }, + { + "epoch": 1.19, + "learning_rate": 1.3706619508633492e-06, + "loss": 0.6221, + "step": 46557 + }, + { + "epoch": 1.19, + "learning_rate": 1.3706362512934943e-06, + "loss": 0.709, + "step": 46558 + }, + { + "epoch": 1.19, + "learning_rate": 1.3706105514398603e-06, + "loss": 0.7383, + "step": 46559 + }, + { + "epoch": 1.19, + "learning_rate": 1.3705848513024664e-06, + "loss": 0.7314, + "step": 46560 + }, + { + "epoch": 1.19, + "learning_rate": 1.3705591508813332e-06, + "loss": 0.6689, + "step": 46561 + }, + { + "epoch": 1.19, + "learning_rate": 1.3705334501764796e-06, + "loss": 0.5898, + "step": 46562 + }, + { + "epoch": 1.19, + "learning_rate": 1.3705077491879258e-06, + "loss": 0.4801, + "step": 46563 + }, + { + "epoch": 1.19, + "learning_rate": 1.3704820479156911e-06, + "loss": 0.5811, + "step": 46564 + }, + { + "epoch": 1.19, + "learning_rate": 1.3704563463597953e-06, + "loss": 0.5554, + "step": 46565 + }, + { + "epoch": 1.19, + "learning_rate": 1.3704306445202583e-06, + "loss": 0.4849, + "step": 46566 + }, + { + "epoch": 1.19, + "learning_rate": 1.3704049423970994e-06, + "loss": 0.9092, + "step": 46567 + }, + { + "epoch": 1.19, + "learning_rate": 1.3703792399903384e-06, + "loss": 0.6519, + "step": 46568 + }, + { + "epoch": 1.19, + "learning_rate": 1.3703535372999955e-06, + "loss": 0.3479, + "step": 46569 + }, + { + "epoch": 1.19, + "learning_rate": 1.3703278343260895e-06, + "loss": 0.4893, + "step": 46570 + }, + { + "epoch": 1.19, + "learning_rate": 1.3703021310686406e-06, + "loss": 0.6362, + "step": 46571 + }, + { + "epoch": 1.19, + "learning_rate": 1.3702764275276685e-06, + "loss": 0.6494, + "step": 46572 + }, + { + "epoch": 1.19, + "learning_rate": 1.3702507237031925e-06, + "loss": 0.6406, + "step": 46573 + }, + { + "epoch": 1.19, + "learning_rate": 1.3702250195952328e-06, + "loss": 0.4285, + "step": 46574 + }, + { + "epoch": 1.19, + "learning_rate": 1.3701993152038088e-06, + "loss": 0.9062, + "step": 46575 + }, + { + "epoch": 1.19, + "learning_rate": 1.3701736105289401e-06, + "loss": 0.8184, + "step": 46576 + }, + { + "epoch": 1.19, + "learning_rate": 1.3701479055706466e-06, + "loss": 0.707, + "step": 46577 + }, + { + "epoch": 1.19, + "learning_rate": 1.3701222003289474e-06, + "loss": 0.6328, + "step": 46578 + }, + { + "epoch": 1.19, + "learning_rate": 1.3700964948038633e-06, + "loss": 0.8262, + "step": 46579 + }, + { + "epoch": 1.19, + "learning_rate": 1.3700707889954131e-06, + "loss": 0.5933, + "step": 46580 + }, + { + "epoch": 1.19, + "learning_rate": 1.3700450829036165e-06, + "loss": 0.605, + "step": 46581 + }, + { + "epoch": 1.19, + "learning_rate": 1.3700193765284937e-06, + "loss": 0.7646, + "step": 46582 + }, + { + "epoch": 1.19, + "learning_rate": 1.3699936698700638e-06, + "loss": 0.708, + "step": 46583 + }, + { + "epoch": 1.19, + "learning_rate": 1.369967962928347e-06, + "loss": 0.6313, + "step": 46584 + }, + { + "epoch": 1.19, + "learning_rate": 1.369942255703363e-06, + "loss": 0.6631, + "step": 46585 + }, + { + "epoch": 1.19, + "learning_rate": 1.3699165481951307e-06, + "loss": 0.7222, + "step": 46586 + }, + { + "epoch": 1.19, + "learning_rate": 1.3698908404036705e-06, + "loss": 0.4873, + "step": 46587 + }, + { + "epoch": 1.19, + "learning_rate": 1.3698651323290017e-06, + "loss": 0.4934, + "step": 46588 + }, + { + "epoch": 1.19, + "learning_rate": 1.3698394239711446e-06, + "loss": 0.7725, + "step": 46589 + }, + { + "epoch": 1.19, + "learning_rate": 1.3698137153301183e-06, + "loss": 0.6089, + "step": 46590 + }, + { + "epoch": 1.19, + "learning_rate": 1.3697880064059423e-06, + "loss": 0.6973, + "step": 46591 + }, + { + "epoch": 1.19, + "learning_rate": 1.3697622971986372e-06, + "loss": 0.6885, + "step": 46592 + }, + { + "epoch": 1.19, + "learning_rate": 1.3697365877082217e-06, + "loss": 0.7598, + "step": 46593 + }, + { + "epoch": 1.19, + "learning_rate": 1.3697108779347163e-06, + "loss": 0.3716, + "step": 46594 + }, + { + "epoch": 1.19, + "learning_rate": 1.3696851678781397e-06, + "loss": 0.7646, + "step": 46595 + }, + { + "epoch": 1.19, + "learning_rate": 1.3696594575385126e-06, + "loss": 0.7314, + "step": 46596 + }, + { + "epoch": 1.19, + "learning_rate": 1.369633746915854e-06, + "loss": 0.5815, + "step": 46597 + }, + { + "epoch": 1.19, + "learning_rate": 1.3696080360101838e-06, + "loss": 0.7178, + "step": 46598 + }, + { + "epoch": 1.19, + "learning_rate": 1.3695823248215218e-06, + "loss": 0.6089, + "step": 46599 + }, + { + "epoch": 1.19, + "learning_rate": 1.3695566133498877e-06, + "loss": 0.5283, + "step": 46600 + }, + { + "epoch": 1.19, + "learning_rate": 1.3695309015953013e-06, + "loss": 0.9424, + "step": 46601 + }, + { + "epoch": 1.19, + "learning_rate": 1.3695051895577816e-06, + "loss": 0.4424, + "step": 46602 + }, + { + "epoch": 1.19, + "learning_rate": 1.369479477237349e-06, + "loss": 0.8486, + "step": 46603 + }, + { + "epoch": 1.19, + "learning_rate": 1.369453764634023e-06, + "loss": 0.6855, + "step": 46604 + }, + { + "epoch": 1.19, + "learning_rate": 1.3694280517478233e-06, + "loss": 0.6934, + "step": 46605 + }, + { + "epoch": 1.19, + "learning_rate": 1.3694023385787693e-06, + "loss": 0.7383, + "step": 46606 + }, + { + "epoch": 1.19, + "learning_rate": 1.369376625126881e-06, + "loss": 0.6768, + "step": 46607 + }, + { + "epoch": 1.19, + "learning_rate": 1.369350911392178e-06, + "loss": 0.6089, + "step": 46608 + }, + { + "epoch": 1.19, + "learning_rate": 1.3693251973746801e-06, + "loss": 0.5654, + "step": 46609 + }, + { + "epoch": 1.19, + "learning_rate": 1.3692994830744069e-06, + "loss": 0.7324, + "step": 46610 + }, + { + "epoch": 1.19, + "learning_rate": 1.369273768491378e-06, + "loss": 0.6128, + "step": 46611 + }, + { + "epoch": 1.19, + "learning_rate": 1.3692480536256131e-06, + "loss": 0.6895, + "step": 46612 + }, + { + "epoch": 1.19, + "learning_rate": 1.369222338477132e-06, + "loss": 0.6377, + "step": 46613 + }, + { + "epoch": 1.19, + "learning_rate": 1.3691966230459544e-06, + "loss": 0.5249, + "step": 46614 + }, + { + "epoch": 1.19, + "learning_rate": 1.3691709073320998e-06, + "loss": 0.6807, + "step": 46615 + }, + { + "epoch": 1.19, + "learning_rate": 1.3691451913355878e-06, + "loss": 0.7402, + "step": 46616 + }, + { + "epoch": 1.19, + "learning_rate": 1.3691194750564388e-06, + "loss": 0.6494, + "step": 46617 + }, + { + "epoch": 1.19, + "learning_rate": 1.3690937584946716e-06, + "loss": 0.6841, + "step": 46618 + }, + { + "epoch": 1.19, + "learning_rate": 1.3690680416503067e-06, + "loss": 0.793, + "step": 46619 + }, + { + "epoch": 1.19, + "learning_rate": 1.369042324523363e-06, + "loss": 0.5338, + "step": 46620 + }, + { + "epoch": 1.19, + "learning_rate": 1.3690166071138606e-06, + "loss": 0.7852, + "step": 46621 + }, + { + "epoch": 1.19, + "learning_rate": 1.368990889421819e-06, + "loss": 0.6216, + "step": 46622 + }, + { + "epoch": 1.19, + "learning_rate": 1.3689651714472583e-06, + "loss": 0.7168, + "step": 46623 + }, + { + "epoch": 1.19, + "learning_rate": 1.3689394531901979e-06, + "loss": 0.6338, + "step": 46624 + }, + { + "epoch": 1.2, + "learning_rate": 1.3689137346506575e-06, + "loss": 0.7969, + "step": 46625 + }, + { + "epoch": 1.2, + "learning_rate": 1.368888015828657e-06, + "loss": 0.5879, + "step": 46626 + }, + { + "epoch": 1.2, + "learning_rate": 1.3688622967242155e-06, + "loss": 0.5059, + "step": 46627 + }, + { + "epoch": 1.2, + "learning_rate": 1.3688365773373533e-06, + "loss": 0.5491, + "step": 46628 + }, + { + "epoch": 1.2, + "learning_rate": 1.36881085766809e-06, + "loss": 0.6509, + "step": 46629 + }, + { + "epoch": 1.2, + "learning_rate": 1.3687851377164451e-06, + "loss": 0.8428, + "step": 46630 + }, + { + "epoch": 1.2, + "learning_rate": 1.3687594174824384e-06, + "loss": 0.8594, + "step": 46631 + }, + { + "epoch": 1.2, + "learning_rate": 1.3687336969660893e-06, + "loss": 0.5383, + "step": 46632 + }, + { + "epoch": 1.2, + "learning_rate": 1.368707976167418e-06, + "loss": 0.8096, + "step": 46633 + }, + { + "epoch": 1.2, + "learning_rate": 1.3686822550864444e-06, + "loss": 0.647, + "step": 46634 + }, + { + "epoch": 1.2, + "learning_rate": 1.368656533723187e-06, + "loss": 0.7598, + "step": 46635 + }, + { + "epoch": 1.2, + "learning_rate": 1.3686308120776669e-06, + "loss": 0.6328, + "step": 46636 + }, + { + "epoch": 1.2, + "learning_rate": 1.3686050901499028e-06, + "loss": 0.707, + "step": 46637 + }, + { + "epoch": 1.2, + "learning_rate": 1.3685793679399145e-06, + "loss": 0.7725, + "step": 46638 + }, + { + "epoch": 1.2, + "learning_rate": 1.3685536454477221e-06, + "loss": 0.6309, + "step": 46639 + }, + { + "epoch": 1.2, + "learning_rate": 1.3685279226733454e-06, + "loss": 0.6963, + "step": 46640 + }, + { + "epoch": 1.2, + "learning_rate": 1.3685021996168034e-06, + "loss": 0.7168, + "step": 46641 + }, + { + "epoch": 1.2, + "learning_rate": 1.3684764762781164e-06, + "loss": 0.5991, + "step": 46642 + }, + { + "epoch": 1.2, + "learning_rate": 1.368450752657304e-06, + "loss": 0.4997, + "step": 46643 + }, + { + "epoch": 1.2, + "learning_rate": 1.3684250287543858e-06, + "loss": 0.7412, + "step": 46644 + }, + { + "epoch": 1.2, + "learning_rate": 1.3683993045693814e-06, + "loss": 0.6299, + "step": 46645 + }, + { + "epoch": 1.2, + "learning_rate": 1.3683735801023103e-06, + "loss": 0.5947, + "step": 46646 + }, + { + "epoch": 1.2, + "learning_rate": 1.368347855353193e-06, + "loss": 0.5562, + "step": 46647 + }, + { + "epoch": 1.2, + "learning_rate": 1.3683221303220484e-06, + "loss": 0.6565, + "step": 46648 + }, + { + "epoch": 1.2, + "learning_rate": 1.3682964050088967e-06, + "loss": 0.8281, + "step": 46649 + }, + { + "epoch": 1.2, + "learning_rate": 1.368270679413757e-06, + "loss": 0.5488, + "step": 46650 + }, + { + "epoch": 1.2, + "learning_rate": 1.3682449535366498e-06, + "loss": 0.7266, + "step": 46651 + }, + { + "epoch": 1.2, + "learning_rate": 1.3682192273775938e-06, + "loss": 0.6169, + "step": 46652 + }, + { + "epoch": 1.2, + "learning_rate": 1.3681935009366099e-06, + "loss": 0.522, + "step": 46653 + }, + { + "epoch": 1.2, + "learning_rate": 1.368167774213717e-06, + "loss": 0.572, + "step": 46654 + }, + { + "epoch": 1.2, + "learning_rate": 1.368142047208935e-06, + "loss": 0.5627, + "step": 46655 + }, + { + "epoch": 1.2, + "learning_rate": 1.3681163199222832e-06, + "loss": 0.6562, + "step": 46656 + }, + { + "epoch": 1.2, + "learning_rate": 1.368090592353782e-06, + "loss": 0.5376, + "step": 46657 + }, + { + "epoch": 1.2, + "learning_rate": 1.3680648645034504e-06, + "loss": 0.6362, + "step": 46658 + }, + { + "epoch": 1.2, + "learning_rate": 1.3680391363713091e-06, + "loss": 0.6504, + "step": 46659 + }, + { + "epoch": 1.2, + "learning_rate": 1.3680134079573767e-06, + "loss": 0.6772, + "step": 46660 + }, + { + "epoch": 1.2, + "learning_rate": 1.3679876792616734e-06, + "loss": 0.7275, + "step": 46661 + }, + { + "epoch": 1.2, + "learning_rate": 1.3679619502842186e-06, + "loss": 0.6328, + "step": 46662 + }, + { + "epoch": 1.2, + "learning_rate": 1.3679362210250326e-06, + "loss": 0.6699, + "step": 46663 + }, + { + "epoch": 1.2, + "learning_rate": 1.367910491484135e-06, + "loss": 0.7627, + "step": 46664 + }, + { + "epoch": 1.2, + "learning_rate": 1.367884761661545e-06, + "loss": 0.7236, + "step": 46665 + }, + { + "epoch": 1.2, + "learning_rate": 1.3678590315572822e-06, + "loss": 0.6709, + "step": 46666 + }, + { + "epoch": 1.2, + "learning_rate": 1.3678333011713669e-06, + "loss": 0.6187, + "step": 46667 + }, + { + "epoch": 1.2, + "learning_rate": 1.3678075705038186e-06, + "loss": 0.6855, + "step": 46668 + }, + { + "epoch": 1.2, + "learning_rate": 1.367781839554657e-06, + "loss": 0.6709, + "step": 46669 + }, + { + "epoch": 1.2, + "learning_rate": 1.3677561083239017e-06, + "loss": 0.665, + "step": 46670 + }, + { + "epoch": 1.2, + "learning_rate": 1.3677303768115725e-06, + "loss": 0.5366, + "step": 46671 + }, + { + "epoch": 1.2, + "learning_rate": 1.367704645017689e-06, + "loss": 0.5684, + "step": 46672 + }, + { + "epoch": 1.2, + "learning_rate": 1.3676789129422708e-06, + "loss": 0.7637, + "step": 46673 + }, + { + "epoch": 1.2, + "learning_rate": 1.3676531805853381e-06, + "loss": 0.521, + "step": 46674 + }, + { + "epoch": 1.2, + "learning_rate": 1.3676274479469102e-06, + "loss": 0.7729, + "step": 46675 + }, + { + "epoch": 1.2, + "learning_rate": 1.3676017150270068e-06, + "loss": 0.7012, + "step": 46676 + }, + { + "epoch": 1.2, + "learning_rate": 1.3675759818256473e-06, + "loss": 0.7041, + "step": 46677 + }, + { + "epoch": 1.2, + "learning_rate": 1.3675502483428525e-06, + "loss": 0.6621, + "step": 46678 + }, + { + "epoch": 1.2, + "learning_rate": 1.3675245145786408e-06, + "loss": 0.627, + "step": 46679 + }, + { + "epoch": 1.2, + "learning_rate": 1.3674987805330328e-06, + "loss": 0.7227, + "step": 46680 + }, + { + "epoch": 1.2, + "learning_rate": 1.3674730462060478e-06, + "loss": 0.6294, + "step": 46681 + }, + { + "epoch": 1.2, + "learning_rate": 1.3674473115977056e-06, + "loss": 0.6201, + "step": 46682 + }, + { + "epoch": 1.2, + "learning_rate": 1.3674215767080257e-06, + "loss": 0.6389, + "step": 46683 + }, + { + "epoch": 1.2, + "learning_rate": 1.3673958415370283e-06, + "loss": 0.7715, + "step": 46684 + }, + { + "epoch": 1.2, + "learning_rate": 1.3673701060847325e-06, + "loss": 0.5518, + "step": 46685 + }, + { + "epoch": 1.2, + "learning_rate": 1.3673443703511585e-06, + "loss": 0.7598, + "step": 46686 + }, + { + "epoch": 1.2, + "learning_rate": 1.3673186343363257e-06, + "loss": 0.7275, + "step": 46687 + }, + { + "epoch": 1.2, + "learning_rate": 1.367292898040254e-06, + "loss": 0.5459, + "step": 46688 + }, + { + "epoch": 1.2, + "learning_rate": 1.367267161462963e-06, + "loss": 0.6187, + "step": 46689 + }, + { + "epoch": 1.2, + "learning_rate": 1.3672414246044723e-06, + "loss": 0.6924, + "step": 46690 + }, + { + "epoch": 1.2, + "learning_rate": 1.3672156874648018e-06, + "loss": 0.6299, + "step": 46691 + }, + { + "epoch": 1.2, + "learning_rate": 1.3671899500439712e-06, + "loss": 0.8027, + "step": 46692 + }, + { + "epoch": 1.2, + "learning_rate": 1.367164212342e-06, + "loss": 0.6377, + "step": 46693 + }, + { + "epoch": 1.2, + "learning_rate": 1.367138474358908e-06, + "loss": 0.5796, + "step": 46694 + }, + { + "epoch": 1.2, + "learning_rate": 1.3671127360947153e-06, + "loss": 0.6475, + "step": 46695 + }, + { + "epoch": 1.2, + "learning_rate": 1.3670869975494408e-06, + "loss": 0.709, + "step": 46696 + }, + { + "epoch": 1.2, + "learning_rate": 1.3670612587231051e-06, + "loss": 0.7471, + "step": 46697 + }, + { + "epoch": 1.2, + "learning_rate": 1.367035519615727e-06, + "loss": 0.7358, + "step": 46698 + }, + { + "epoch": 1.2, + "learning_rate": 1.3670097802273272e-06, + "loss": 0.7656, + "step": 46699 + }, + { + "epoch": 1.2, + "learning_rate": 1.3669840405579244e-06, + "loss": 0.7119, + "step": 46700 + }, + { + "epoch": 1.2, + "learning_rate": 1.3669583006075394e-06, + "loss": 0.5219, + "step": 46701 + }, + { + "epoch": 1.2, + "learning_rate": 1.3669325603761908e-06, + "loss": 0.6265, + "step": 46702 + }, + { + "epoch": 1.2, + "learning_rate": 1.366906819863899e-06, + "loss": 0.6655, + "step": 46703 + }, + { + "epoch": 1.2, + "learning_rate": 1.3668810790706835e-06, + "loss": 0.3828, + "step": 46704 + }, + { + "epoch": 1.2, + "learning_rate": 1.3668553379965642e-06, + "loss": 0.7061, + "step": 46705 + }, + { + "epoch": 1.2, + "learning_rate": 1.36682959664156e-06, + "loss": 0.7061, + "step": 46706 + }, + { + "epoch": 1.2, + "learning_rate": 1.366803855005692e-06, + "loss": 0.439, + "step": 46707 + }, + { + "epoch": 1.2, + "learning_rate": 1.3667781130889786e-06, + "loss": 0.7505, + "step": 46708 + }, + { + "epoch": 1.2, + "learning_rate": 1.3667523708914406e-06, + "loss": 0.6689, + "step": 46709 + }, + { + "epoch": 1.2, + "learning_rate": 1.3667266284130967e-06, + "loss": 0.708, + "step": 46710 + }, + { + "epoch": 1.2, + "learning_rate": 1.3667008856539671e-06, + "loss": 0.6545, + "step": 46711 + }, + { + "epoch": 1.2, + "learning_rate": 1.3666751426140716e-06, + "loss": 0.6636, + "step": 46712 + }, + { + "epoch": 1.2, + "learning_rate": 1.3666493992934301e-06, + "loss": 0.749, + "step": 46713 + }, + { + "epoch": 1.2, + "learning_rate": 1.3666236556920616e-06, + "loss": 0.6077, + "step": 46714 + }, + { + "epoch": 1.2, + "learning_rate": 1.3665979118099864e-06, + "loss": 0.6021, + "step": 46715 + }, + { + "epoch": 1.2, + "learning_rate": 1.3665721676472241e-06, + "loss": 0.5234, + "step": 46716 + }, + { + "epoch": 1.2, + "learning_rate": 1.3665464232037941e-06, + "loss": 0.585, + "step": 46717 + }, + { + "epoch": 1.2, + "learning_rate": 1.3665206784797165e-06, + "loss": 0.5115, + "step": 46718 + }, + { + "epoch": 1.2, + "learning_rate": 1.366494933475011e-06, + "loss": 0.6328, + "step": 46719 + }, + { + "epoch": 1.2, + "learning_rate": 1.3664691881896973e-06, + "loss": 0.6339, + "step": 46720 + }, + { + "epoch": 1.2, + "learning_rate": 1.3664434426237944e-06, + "loss": 0.4727, + "step": 46721 + }, + { + "epoch": 1.2, + "learning_rate": 1.3664176967773232e-06, + "loss": 0.5259, + "step": 46722 + }, + { + "epoch": 1.2, + "learning_rate": 1.3663919506503025e-06, + "loss": 0.4097, + "step": 46723 + }, + { + "epoch": 1.2, + "learning_rate": 1.3663662042427526e-06, + "loss": 0.708, + "step": 46724 + }, + { + "epoch": 1.2, + "learning_rate": 1.3663404575546927e-06, + "loss": 0.6729, + "step": 46725 + }, + { + "epoch": 1.2, + "learning_rate": 1.3663147105861427e-06, + "loss": 0.436, + "step": 46726 + }, + { + "epoch": 1.2, + "learning_rate": 1.3662889633371223e-06, + "loss": 0.8047, + "step": 46727 + }, + { + "epoch": 1.2, + "learning_rate": 1.3662632158076517e-06, + "loss": 0.5044, + "step": 46728 + }, + { + "epoch": 1.2, + "learning_rate": 1.3662374679977502e-06, + "loss": 0.5986, + "step": 46729 + }, + { + "epoch": 1.2, + "learning_rate": 1.3662117199074372e-06, + "loss": 0.7764, + "step": 46730 + }, + { + "epoch": 1.2, + "learning_rate": 1.3661859715367328e-06, + "loss": 0.6113, + "step": 46731 + }, + { + "epoch": 1.2, + "learning_rate": 1.3661602228856567e-06, + "loss": 0.7119, + "step": 46732 + }, + { + "epoch": 1.2, + "learning_rate": 1.3661344739542285e-06, + "loss": 0.7549, + "step": 46733 + }, + { + "epoch": 1.2, + "learning_rate": 1.3661087247424678e-06, + "loss": 0.7695, + "step": 46734 + }, + { + "epoch": 1.2, + "learning_rate": 1.366082975250395e-06, + "loss": 0.5557, + "step": 46735 + }, + { + "epoch": 1.2, + "learning_rate": 1.3660572254780286e-06, + "loss": 0.6621, + "step": 46736 + }, + { + "epoch": 1.2, + "learning_rate": 1.3660314754253893e-06, + "loss": 0.6943, + "step": 46737 + }, + { + "epoch": 1.2, + "learning_rate": 1.3660057250924969e-06, + "loss": 0.7568, + "step": 46738 + }, + { + "epoch": 1.2, + "learning_rate": 1.3659799744793704e-06, + "loss": 0.7588, + "step": 46739 + }, + { + "epoch": 1.2, + "learning_rate": 1.3659542235860297e-06, + "loss": 0.6123, + "step": 46740 + }, + { + "epoch": 1.2, + "learning_rate": 1.3659284724124952e-06, + "loss": 0.7676, + "step": 46741 + }, + { + "epoch": 1.2, + "learning_rate": 1.3659027209587854e-06, + "loss": 0.5859, + "step": 46742 + }, + { + "epoch": 1.2, + "learning_rate": 1.3658769692249213e-06, + "loss": 0.6709, + "step": 46743 + }, + { + "epoch": 1.2, + "learning_rate": 1.3658512172109219e-06, + "loss": 0.7363, + "step": 46744 + }, + { + "epoch": 1.2, + "learning_rate": 1.3658254649168068e-06, + "loss": 0.7207, + "step": 46745 + }, + { + "epoch": 1.2, + "learning_rate": 1.3657997123425962e-06, + "loss": 0.6128, + "step": 46746 + }, + { + "epoch": 1.2, + "learning_rate": 1.3657739594883096e-06, + "loss": 0.6465, + "step": 46747 + }, + { + "epoch": 1.2, + "learning_rate": 1.3657482063539662e-06, + "loss": 0.5767, + "step": 46748 + }, + { + "epoch": 1.2, + "learning_rate": 1.365722452939587e-06, + "loss": 0.5449, + "step": 46749 + }, + { + "epoch": 1.2, + "learning_rate": 1.3656966992451903e-06, + "loss": 0.5967, + "step": 46750 + }, + { + "epoch": 1.2, + "learning_rate": 1.365670945270797e-06, + "loss": 0.6099, + "step": 46751 + }, + { + "epoch": 1.2, + "learning_rate": 1.3656451910164257e-06, + "loss": 0.5615, + "step": 46752 + }, + { + "epoch": 1.2, + "learning_rate": 1.3656194364820972e-06, + "loss": 0.5693, + "step": 46753 + }, + { + "epoch": 1.2, + "learning_rate": 1.3655936816678304e-06, + "loss": 0.6504, + "step": 46754 + }, + { + "epoch": 1.2, + "learning_rate": 1.3655679265736455e-06, + "loss": 0.6157, + "step": 46755 + }, + { + "epoch": 1.2, + "learning_rate": 1.3655421711995619e-06, + "loss": 0.6279, + "step": 46756 + }, + { + "epoch": 1.2, + "learning_rate": 1.3655164155455996e-06, + "loss": 0.7109, + "step": 46757 + }, + { + "epoch": 1.2, + "learning_rate": 1.3654906596117778e-06, + "loss": 0.6602, + "step": 46758 + }, + { + "epoch": 1.2, + "learning_rate": 1.365464903398117e-06, + "loss": 0.6299, + "step": 46759 + }, + { + "epoch": 1.2, + "learning_rate": 1.3654391469046367e-06, + "loss": 0.5801, + "step": 46760 + }, + { + "epoch": 1.2, + "learning_rate": 1.3654133901313557e-06, + "loss": 0.5645, + "step": 46761 + }, + { + "epoch": 1.2, + "learning_rate": 1.365387633078295e-06, + "loss": 0.6489, + "step": 46762 + }, + { + "epoch": 1.2, + "learning_rate": 1.3653618757454739e-06, + "loss": 0.7139, + "step": 46763 + }, + { + "epoch": 1.2, + "learning_rate": 1.3653361181329122e-06, + "loss": 0.7197, + "step": 46764 + }, + { + "epoch": 1.2, + "learning_rate": 1.365310360240629e-06, + "loss": 0.6177, + "step": 46765 + }, + { + "epoch": 1.2, + "learning_rate": 1.3652846020686445e-06, + "loss": 0.9541, + "step": 46766 + }, + { + "epoch": 1.2, + "learning_rate": 1.3652588436169783e-06, + "loss": 0.4197, + "step": 46767 + }, + { + "epoch": 1.2, + "learning_rate": 1.3652330848856505e-06, + "loss": 0.6912, + "step": 46768 + }, + { + "epoch": 1.2, + "learning_rate": 1.3652073258746804e-06, + "loss": 0.7207, + "step": 46769 + }, + { + "epoch": 1.2, + "learning_rate": 1.3651815665840878e-06, + "loss": 0.6514, + "step": 46770 + }, + { + "epoch": 1.2, + "learning_rate": 1.3651558070138921e-06, + "loss": 0.666, + "step": 46771 + }, + { + "epoch": 1.2, + "learning_rate": 1.365130047164114e-06, + "loss": 0.5088, + "step": 46772 + }, + { + "epoch": 1.2, + "learning_rate": 1.3651042870347722e-06, + "loss": 0.6636, + "step": 46773 + }, + { + "epoch": 1.2, + "learning_rate": 1.3650785266258874e-06, + "loss": 0.7295, + "step": 46774 + }, + { + "epoch": 1.2, + "learning_rate": 1.3650527659374782e-06, + "loss": 0.6528, + "step": 46775 + }, + { + "epoch": 1.2, + "learning_rate": 1.365027004969565e-06, + "loss": 0.604, + "step": 46776 + }, + { + "epoch": 1.2, + "learning_rate": 1.3650012437221672e-06, + "loss": 0.576, + "step": 46777 + }, + { + "epoch": 1.2, + "learning_rate": 1.3649754821953053e-06, + "loss": 0.6089, + "step": 46778 + }, + { + "epoch": 1.2, + "learning_rate": 1.364949720388998e-06, + "loss": 0.7129, + "step": 46779 + }, + { + "epoch": 1.2, + "learning_rate": 1.3649239583032655e-06, + "loss": 0.6147, + "step": 46780 + }, + { + "epoch": 1.2, + "learning_rate": 1.3648981959381277e-06, + "loss": 0.791, + "step": 46781 + }, + { + "epoch": 1.2, + "learning_rate": 1.3648724332936042e-06, + "loss": 0.791, + "step": 46782 + }, + { + "epoch": 1.2, + "learning_rate": 1.3648466703697144e-06, + "loss": 0.5728, + "step": 46783 + }, + { + "epoch": 1.2, + "learning_rate": 1.3648209071664782e-06, + "loss": 0.752, + "step": 46784 + }, + { + "epoch": 1.2, + "learning_rate": 1.364795143683916e-06, + "loss": 0.7148, + "step": 46785 + }, + { + "epoch": 1.2, + "learning_rate": 1.364769379922046e-06, + "loss": 0.7109, + "step": 46786 + }, + { + "epoch": 1.2, + "learning_rate": 1.3647436158808897e-06, + "loss": 0.8301, + "step": 46787 + }, + { + "epoch": 1.2, + "learning_rate": 1.3647178515604653e-06, + "loss": 0.625, + "step": 46788 + }, + { + "epoch": 1.2, + "learning_rate": 1.3646920869607938e-06, + "loss": 0.7188, + "step": 46789 + }, + { + "epoch": 1.2, + "learning_rate": 1.3646663220818942e-06, + "loss": 0.6704, + "step": 46790 + }, + { + "epoch": 1.2, + "learning_rate": 1.3646405569237862e-06, + "loss": 0.8359, + "step": 46791 + }, + { + "epoch": 1.2, + "learning_rate": 1.3646147914864896e-06, + "loss": 0.7075, + "step": 46792 + }, + { + "epoch": 1.2, + "learning_rate": 1.3645890257700244e-06, + "loss": 0.6934, + "step": 46793 + }, + { + "epoch": 1.2, + "learning_rate": 1.3645632597744103e-06, + "loss": 0.6387, + "step": 46794 + }, + { + "epoch": 1.2, + "learning_rate": 1.3645374934996668e-06, + "loss": 0.7222, + "step": 46795 + }, + { + "epoch": 1.2, + "learning_rate": 1.3645117269458135e-06, + "loss": 0.6108, + "step": 46796 + }, + { + "epoch": 1.2, + "learning_rate": 1.3644859601128704e-06, + "loss": 0.6338, + "step": 46797 + }, + { + "epoch": 1.2, + "learning_rate": 1.364460193000857e-06, + "loss": 0.7402, + "step": 46798 + }, + { + "epoch": 1.2, + "learning_rate": 1.3644344256097937e-06, + "loss": 0.7793, + "step": 46799 + }, + { + "epoch": 1.2, + "learning_rate": 1.3644086579396994e-06, + "loss": 0.6265, + "step": 46800 + }, + { + "epoch": 1.2, + "learning_rate": 1.3643828899905941e-06, + "loss": 0.6504, + "step": 46801 + }, + { + "epoch": 1.2, + "learning_rate": 1.3643571217624974e-06, + "loss": 0.6719, + "step": 46802 + }, + { + "epoch": 1.2, + "learning_rate": 1.3643313532554297e-06, + "loss": 0.5928, + "step": 46803 + }, + { + "epoch": 1.2, + "learning_rate": 1.36430558446941e-06, + "loss": 0.6504, + "step": 46804 + }, + { + "epoch": 1.2, + "learning_rate": 1.3642798154044582e-06, + "loss": 0.5654, + "step": 46805 + }, + { + "epoch": 1.2, + "learning_rate": 1.364254046060594e-06, + "loss": 0.6245, + "step": 46806 + }, + { + "epoch": 1.2, + "learning_rate": 1.3642282764378371e-06, + "loss": 0.6802, + "step": 46807 + }, + { + "epoch": 1.2, + "learning_rate": 1.3642025065362078e-06, + "loss": 0.5396, + "step": 46808 + }, + { + "epoch": 1.2, + "learning_rate": 1.3641767363557254e-06, + "loss": 0.6318, + "step": 46809 + }, + { + "epoch": 1.2, + "learning_rate": 1.3641509658964094e-06, + "loss": 0.6104, + "step": 46810 + }, + { + "epoch": 1.2, + "learning_rate": 1.3641251951582798e-06, + "loss": 0.4448, + "step": 46811 + }, + { + "epoch": 1.2, + "learning_rate": 1.364099424141356e-06, + "loss": 0.3718, + "step": 46812 + }, + { + "epoch": 1.2, + "learning_rate": 1.3640736528456581e-06, + "loss": 0.645, + "step": 46813 + }, + { + "epoch": 1.2, + "learning_rate": 1.3640478812712063e-06, + "loss": 0.5898, + "step": 46814 + }, + { + "epoch": 1.2, + "learning_rate": 1.3640221094180193e-06, + "loss": 0.6924, + "step": 46815 + }, + { + "epoch": 1.2, + "learning_rate": 1.3639963372861175e-06, + "loss": 0.6274, + "step": 46816 + }, + { + "epoch": 1.2, + "learning_rate": 1.3639705648755203e-06, + "loss": 0.4985, + "step": 46817 + }, + { + "epoch": 1.2, + "learning_rate": 1.3639447921862476e-06, + "loss": 0.5876, + "step": 46818 + }, + { + "epoch": 1.2, + "learning_rate": 1.363919019218319e-06, + "loss": 0.6943, + "step": 46819 + }, + { + "epoch": 1.2, + "learning_rate": 1.3638932459717547e-06, + "loss": 0.6953, + "step": 46820 + }, + { + "epoch": 1.2, + "learning_rate": 1.3638674724465737e-06, + "loss": 0.7061, + "step": 46821 + }, + { + "epoch": 1.2, + "learning_rate": 1.3638416986427964e-06, + "loss": 0.7285, + "step": 46822 + }, + { + "epoch": 1.2, + "learning_rate": 1.3638159245604416e-06, + "loss": 0.5811, + "step": 46823 + }, + { + "epoch": 1.2, + "learning_rate": 1.3637901501995303e-06, + "loss": 0.5562, + "step": 46824 + }, + { + "epoch": 1.2, + "learning_rate": 1.3637643755600817e-06, + "loss": 0.6602, + "step": 46825 + }, + { + "epoch": 1.2, + "learning_rate": 1.363738600642115e-06, + "loss": 0.5479, + "step": 46826 + }, + { + "epoch": 1.2, + "learning_rate": 1.3637128254456507e-06, + "loss": 0.5669, + "step": 46827 + }, + { + "epoch": 1.2, + "learning_rate": 1.3636870499707081e-06, + "loss": 0.6118, + "step": 46828 + }, + { + "epoch": 1.2, + "learning_rate": 1.363661274217307e-06, + "loss": 0.626, + "step": 46829 + }, + { + "epoch": 1.2, + "learning_rate": 1.3636354981854672e-06, + "loss": 0.5923, + "step": 46830 + }, + { + "epoch": 1.2, + "learning_rate": 1.3636097218752086e-06, + "loss": 0.7354, + "step": 46831 + }, + { + "epoch": 1.2, + "learning_rate": 1.3635839452865505e-06, + "loss": 0.6763, + "step": 46832 + }, + { + "epoch": 1.2, + "learning_rate": 1.3635581684195132e-06, + "loss": 0.6533, + "step": 46833 + }, + { + "epoch": 1.2, + "learning_rate": 1.3635323912741158e-06, + "loss": 0.8633, + "step": 46834 + }, + { + "epoch": 1.2, + "learning_rate": 1.3635066138503786e-06, + "loss": 0.7139, + "step": 46835 + }, + { + "epoch": 1.2, + "learning_rate": 1.3634808361483209e-06, + "loss": 0.5557, + "step": 46836 + }, + { + "epoch": 1.2, + "learning_rate": 1.3634550581679628e-06, + "loss": 0.7437, + "step": 46837 + }, + { + "epoch": 1.2, + "learning_rate": 1.3634292799093237e-06, + "loss": 0.8486, + "step": 46838 + }, + { + "epoch": 1.2, + "learning_rate": 1.3634035013724237e-06, + "loss": 0.6641, + "step": 46839 + }, + { + "epoch": 1.2, + "learning_rate": 1.3633777225572823e-06, + "loss": 0.4103, + "step": 46840 + }, + { + "epoch": 1.2, + "learning_rate": 1.363351943463919e-06, + "loss": 0.751, + "step": 46841 + }, + { + "epoch": 1.2, + "learning_rate": 1.363326164092354e-06, + "loss": 0.7246, + "step": 46842 + }, + { + "epoch": 1.2, + "learning_rate": 1.363300384442607e-06, + "loss": 0.8174, + "step": 46843 + }, + { + "epoch": 1.2, + "learning_rate": 1.3632746045146976e-06, + "loss": 0.5508, + "step": 46844 + }, + { + "epoch": 1.2, + "learning_rate": 1.3632488243086455e-06, + "loss": 0.6362, + "step": 46845 + }, + { + "epoch": 1.2, + "learning_rate": 1.3632230438244703e-06, + "loss": 0.532, + "step": 46846 + }, + { + "epoch": 1.2, + "learning_rate": 1.3631972630621922e-06, + "loss": 0.5852, + "step": 46847 + }, + { + "epoch": 1.2, + "learning_rate": 1.3631714820218308e-06, + "loss": 0.7285, + "step": 46848 + }, + { + "epoch": 1.2, + "learning_rate": 1.363145700703405e-06, + "loss": 0.627, + "step": 46849 + }, + { + "epoch": 1.2, + "learning_rate": 1.3631199191069359e-06, + "loss": 0.5933, + "step": 46850 + }, + { + "epoch": 1.2, + "learning_rate": 1.363094137232442e-06, + "loss": 0.6777, + "step": 46851 + }, + { + "epoch": 1.2, + "learning_rate": 1.3630683550799442e-06, + "loss": 0.6523, + "step": 46852 + }, + { + "epoch": 1.2, + "learning_rate": 1.3630425726494614e-06, + "loss": 0.5942, + "step": 46853 + }, + { + "epoch": 1.2, + "learning_rate": 1.3630167899410137e-06, + "loss": 0.7329, + "step": 46854 + }, + { + "epoch": 1.2, + "learning_rate": 1.3629910069546204e-06, + "loss": 0.7393, + "step": 46855 + }, + { + "epoch": 1.2, + "learning_rate": 1.362965223690302e-06, + "loss": 0.6484, + "step": 46856 + }, + { + "epoch": 1.2, + "learning_rate": 1.3629394401480773e-06, + "loss": 0.6719, + "step": 46857 + }, + { + "epoch": 1.2, + "learning_rate": 1.3629136563279672e-06, + "loss": 0.667, + "step": 46858 + }, + { + "epoch": 1.2, + "learning_rate": 1.3628878722299904e-06, + "loss": 0.584, + "step": 46859 + }, + { + "epoch": 1.2, + "learning_rate": 1.3628620878541672e-06, + "loss": 0.6504, + "step": 46860 + }, + { + "epoch": 1.2, + "learning_rate": 1.362836303200517e-06, + "loss": 0.5942, + "step": 46861 + }, + { + "epoch": 1.2, + "learning_rate": 1.36281051826906e-06, + "loss": 0.6016, + "step": 46862 + }, + { + "epoch": 1.2, + "learning_rate": 1.3627847330598154e-06, + "loss": 0.7119, + "step": 46863 + }, + { + "epoch": 1.2, + "learning_rate": 1.3627589475728034e-06, + "loss": 0.791, + "step": 46864 + }, + { + "epoch": 1.2, + "learning_rate": 1.3627331618080434e-06, + "loss": 0.5581, + "step": 46865 + }, + { + "epoch": 1.2, + "learning_rate": 1.3627073757655554e-06, + "loss": 0.6006, + "step": 46866 + }, + { + "epoch": 1.2, + "learning_rate": 1.362681589445359e-06, + "loss": 0.5942, + "step": 46867 + }, + { + "epoch": 1.2, + "learning_rate": 1.362655802847474e-06, + "loss": 0.707, + "step": 46868 + }, + { + "epoch": 1.2, + "learning_rate": 1.36263001597192e-06, + "loss": 0.7217, + "step": 46869 + }, + { + "epoch": 1.2, + "learning_rate": 1.362604228818717e-06, + "loss": 0.6836, + "step": 46870 + }, + { + "epoch": 1.2, + "learning_rate": 1.3625784413878845e-06, + "loss": 0.7319, + "step": 46871 + }, + { + "epoch": 1.2, + "learning_rate": 1.3625526536794426e-06, + "loss": 0.7637, + "step": 46872 + }, + { + "epoch": 1.2, + "learning_rate": 1.3625268656934108e-06, + "loss": 0.6904, + "step": 46873 + }, + { + "epoch": 1.2, + "learning_rate": 1.3625010774298085e-06, + "loss": 0.6865, + "step": 46874 + }, + { + "epoch": 1.2, + "learning_rate": 1.3624752888886562e-06, + "loss": 0.8066, + "step": 46875 + }, + { + "epoch": 1.2, + "learning_rate": 1.3624495000699728e-06, + "loss": 0.6611, + "step": 46876 + }, + { + "epoch": 1.2, + "learning_rate": 1.3624237109737788e-06, + "loss": 0.7305, + "step": 46877 + }, + { + "epoch": 1.2, + "learning_rate": 1.3623979216000937e-06, + "loss": 0.6821, + "step": 46878 + }, + { + "epoch": 1.2, + "learning_rate": 1.362372131948937e-06, + "loss": 0.5469, + "step": 46879 + }, + { + "epoch": 1.2, + "learning_rate": 1.3623463420203284e-06, + "loss": 0.792, + "step": 46880 + }, + { + "epoch": 1.2, + "learning_rate": 1.3623205518142883e-06, + "loss": 0.6904, + "step": 46881 + }, + { + "epoch": 1.2, + "learning_rate": 1.3622947613308358e-06, + "loss": 0.6797, + "step": 46882 + }, + { + "epoch": 1.2, + "learning_rate": 1.362268970569991e-06, + "loss": 0.772, + "step": 46883 + }, + { + "epoch": 1.2, + "learning_rate": 1.3622431795317733e-06, + "loss": 0.6465, + "step": 46884 + }, + { + "epoch": 1.2, + "learning_rate": 1.3622173882162029e-06, + "loss": 0.5469, + "step": 46885 + }, + { + "epoch": 1.2, + "learning_rate": 1.3621915966232988e-06, + "loss": 0.7476, + "step": 46886 + }, + { + "epoch": 1.2, + "learning_rate": 1.362165804753082e-06, + "loss": 0.7334, + "step": 46887 + }, + { + "epoch": 1.2, + "learning_rate": 1.362140012605571e-06, + "loss": 0.6631, + "step": 46888 + }, + { + "epoch": 1.2, + "learning_rate": 1.362114220180786e-06, + "loss": 0.6714, + "step": 46889 + }, + { + "epoch": 1.2, + "learning_rate": 1.362088427478747e-06, + "loss": 0.7295, + "step": 46890 + }, + { + "epoch": 1.2, + "learning_rate": 1.3620626344994738e-06, + "loss": 0.6694, + "step": 46891 + }, + { + "epoch": 1.2, + "learning_rate": 1.3620368412429853e-06, + "loss": 0.7129, + "step": 46892 + }, + { + "epoch": 1.2, + "learning_rate": 1.362011047709302e-06, + "loss": 0.7061, + "step": 46893 + }, + { + "epoch": 1.2, + "learning_rate": 1.3619852538984438e-06, + "loss": 0.5574, + "step": 46894 + }, + { + "epoch": 1.2, + "learning_rate": 1.3619594598104297e-06, + "loss": 0.6304, + "step": 46895 + }, + { + "epoch": 1.2, + "learning_rate": 1.3619336654452802e-06, + "loss": 0.5562, + "step": 46896 + }, + { + "epoch": 1.2, + "learning_rate": 1.3619078708030146e-06, + "loss": 0.7402, + "step": 46897 + }, + { + "epoch": 1.2, + "learning_rate": 1.361882075883653e-06, + "loss": 0.6025, + "step": 46898 + }, + { + "epoch": 1.2, + "learning_rate": 1.3618562806872146e-06, + "loss": 0.6553, + "step": 46899 + }, + { + "epoch": 1.2, + "learning_rate": 1.3618304852137197e-06, + "loss": 0.7783, + "step": 46900 + }, + { + "epoch": 1.2, + "learning_rate": 1.3618046894631877e-06, + "loss": 0.6948, + "step": 46901 + }, + { + "epoch": 1.2, + "learning_rate": 1.3617788934356386e-06, + "loss": 0.5688, + "step": 46902 + }, + { + "epoch": 1.2, + "learning_rate": 1.3617530971310922e-06, + "loss": 0.5547, + "step": 46903 + }, + { + "epoch": 1.2, + "learning_rate": 1.361727300549568e-06, + "loss": 0.7344, + "step": 46904 + }, + { + "epoch": 1.2, + "learning_rate": 1.3617015036910856e-06, + "loss": 0.4812, + "step": 46905 + }, + { + "epoch": 1.2, + "learning_rate": 1.361675706555665e-06, + "loss": 0.7012, + "step": 46906 + }, + { + "epoch": 1.2, + "learning_rate": 1.361649909143326e-06, + "loss": 0.6345, + "step": 46907 + }, + { + "epoch": 1.2, + "learning_rate": 1.3616241114540886e-06, + "loss": 0.6333, + "step": 46908 + }, + { + "epoch": 1.2, + "learning_rate": 1.3615983134879718e-06, + "loss": 0.6357, + "step": 46909 + }, + { + "epoch": 1.2, + "learning_rate": 1.3615725152449962e-06, + "loss": 0.7002, + "step": 46910 + }, + { + "epoch": 1.2, + "learning_rate": 1.3615467167251805e-06, + "loss": 0.6689, + "step": 46911 + }, + { + "epoch": 1.2, + "learning_rate": 1.3615209179285459e-06, + "loss": 0.6602, + "step": 46912 + }, + { + "epoch": 1.2, + "learning_rate": 1.3614951188551112e-06, + "loss": 0.668, + "step": 46913 + }, + { + "epoch": 1.2, + "learning_rate": 1.3614693195048958e-06, + "loss": 0.667, + "step": 46914 + }, + { + "epoch": 1.2, + "learning_rate": 1.3614435198779204e-06, + "loss": 0.7075, + "step": 46915 + }, + { + "epoch": 1.2, + "learning_rate": 1.3614177199742042e-06, + "loss": 0.5098, + "step": 46916 + }, + { + "epoch": 1.2, + "learning_rate": 1.3613919197937669e-06, + "loss": 0.6638, + "step": 46917 + }, + { + "epoch": 1.2, + "learning_rate": 1.361366119336629e-06, + "loss": 0.575, + "step": 46918 + }, + { + "epoch": 1.2, + "learning_rate": 1.361340318602809e-06, + "loss": 0.6538, + "step": 46919 + }, + { + "epoch": 1.2, + "learning_rate": 1.3613145175923274e-06, + "loss": 0.666, + "step": 46920 + }, + { + "epoch": 1.2, + "learning_rate": 1.3612887163052043e-06, + "loss": 0.7324, + "step": 46921 + }, + { + "epoch": 1.2, + "learning_rate": 1.3612629147414587e-06, + "loss": 0.4885, + "step": 46922 + }, + { + "epoch": 1.2, + "learning_rate": 1.361237112901111e-06, + "loss": 0.488, + "step": 46923 + }, + { + "epoch": 1.2, + "learning_rate": 1.3612113107841805e-06, + "loss": 0.7188, + "step": 46924 + }, + { + "epoch": 1.2, + "learning_rate": 1.361185508390687e-06, + "loss": 0.4207, + "step": 46925 + }, + { + "epoch": 1.2, + "learning_rate": 1.3611597057206504e-06, + "loss": 0.6123, + "step": 46926 + }, + { + "epoch": 1.2, + "learning_rate": 1.3611339027740904e-06, + "loss": 0.8213, + "step": 46927 + }, + { + "epoch": 1.2, + "learning_rate": 1.3611080995510271e-06, + "loss": 0.6035, + "step": 46928 + }, + { + "epoch": 1.2, + "learning_rate": 1.3610822960514796e-06, + "loss": 0.6914, + "step": 46929 + }, + { + "epoch": 1.2, + "learning_rate": 1.361056492275468e-06, + "loss": 0.5552, + "step": 46930 + }, + { + "epoch": 1.2, + "learning_rate": 1.3610306882230122e-06, + "loss": 0.6323, + "step": 46931 + }, + { + "epoch": 1.2, + "learning_rate": 1.3610048838941316e-06, + "loss": 0.6562, + "step": 46932 + }, + { + "epoch": 1.2, + "learning_rate": 1.3609790792888465e-06, + "loss": 0.7246, + "step": 46933 + }, + { + "epoch": 1.2, + "learning_rate": 1.3609532744071758e-06, + "loss": 0.6978, + "step": 46934 + }, + { + "epoch": 1.2, + "learning_rate": 1.3609274692491403e-06, + "loss": 0.5278, + "step": 46935 + }, + { + "epoch": 1.2, + "learning_rate": 1.3609016638147588e-06, + "loss": 0.6846, + "step": 46936 + }, + { + "epoch": 1.2, + "learning_rate": 1.360875858104052e-06, + "loss": 0.7021, + "step": 46937 + }, + { + "epoch": 1.2, + "learning_rate": 1.3608500521170388e-06, + "loss": 0.4946, + "step": 46938 + }, + { + "epoch": 1.2, + "learning_rate": 1.360824245853739e-06, + "loss": 0.6367, + "step": 46939 + }, + { + "epoch": 1.2, + "learning_rate": 1.3607984393141733e-06, + "loss": 0.6372, + "step": 46940 + }, + { + "epoch": 1.2, + "learning_rate": 1.3607726324983603e-06, + "loss": 0.5531, + "step": 46941 + }, + { + "epoch": 1.2, + "learning_rate": 1.3607468254063207e-06, + "loss": 0.6709, + "step": 46942 + }, + { + "epoch": 1.2, + "learning_rate": 1.3607210180380737e-06, + "loss": 0.6621, + "step": 46943 + }, + { + "epoch": 1.2, + "learning_rate": 1.3606952103936392e-06, + "loss": 0.6455, + "step": 46944 + }, + { + "epoch": 1.2, + "learning_rate": 1.360669402473037e-06, + "loss": 0.7725, + "step": 46945 + }, + { + "epoch": 1.2, + "learning_rate": 1.3606435942762868e-06, + "loss": 0.6943, + "step": 46946 + }, + { + "epoch": 1.2, + "learning_rate": 1.360617785803408e-06, + "loss": 0.7188, + "step": 46947 + }, + { + "epoch": 1.2, + "learning_rate": 1.3605919770544214e-06, + "loss": 0.7578, + "step": 46948 + }, + { + "epoch": 1.2, + "learning_rate": 1.360566168029346e-06, + "loss": 0.624, + "step": 46949 + }, + { + "epoch": 1.2, + "learning_rate": 1.3605403587282012e-06, + "loss": 0.6367, + "step": 46950 + }, + { + "epoch": 1.2, + "learning_rate": 1.3605145491510074e-06, + "loss": 0.5203, + "step": 46951 + }, + { + "epoch": 1.2, + "learning_rate": 1.3604887392977844e-06, + "loss": 0.8994, + "step": 46952 + }, + { + "epoch": 1.2, + "learning_rate": 1.3604629291685518e-06, + "loss": 0.6436, + "step": 46953 + }, + { + "epoch": 1.2, + "learning_rate": 1.360437118763329e-06, + "loss": 0.6846, + "step": 46954 + }, + { + "epoch": 1.2, + "learning_rate": 1.360411308082136e-06, + "loss": 0.6514, + "step": 46955 + }, + { + "epoch": 1.2, + "learning_rate": 1.360385497124993e-06, + "loss": 0.7546, + "step": 46956 + }, + { + "epoch": 1.2, + "learning_rate": 1.360359685891919e-06, + "loss": 0.647, + "step": 46957 + }, + { + "epoch": 1.2, + "learning_rate": 1.3603338743829345e-06, + "loss": 0.5474, + "step": 46958 + }, + { + "epoch": 1.2, + "learning_rate": 1.360308062598059e-06, + "loss": 0.6582, + "step": 46959 + }, + { + "epoch": 1.2, + "learning_rate": 1.3602822505373117e-06, + "loss": 0.6787, + "step": 46960 + }, + { + "epoch": 1.2, + "learning_rate": 1.3602564382007132e-06, + "loss": 0.6343, + "step": 46961 + }, + { + "epoch": 1.2, + "learning_rate": 1.360230625588283e-06, + "loss": 0.6445, + "step": 46962 + }, + { + "epoch": 1.2, + "learning_rate": 1.3602048127000405e-06, + "loss": 0.7959, + "step": 46963 + }, + { + "epoch": 1.2, + "learning_rate": 1.3601789995360057e-06, + "loss": 0.626, + "step": 46964 + }, + { + "epoch": 1.2, + "learning_rate": 1.3601531860961987e-06, + "loss": 0.6055, + "step": 46965 + }, + { + "epoch": 1.2, + "learning_rate": 1.3601273723806387e-06, + "loss": 0.4773, + "step": 46966 + }, + { + "epoch": 1.2, + "learning_rate": 1.360101558389346e-06, + "loss": 0.5835, + "step": 46967 + }, + { + "epoch": 1.2, + "learning_rate": 1.3600757441223402e-06, + "loss": 0.7969, + "step": 46968 + }, + { + "epoch": 1.2, + "learning_rate": 1.3600499295796406e-06, + "loss": 0.625, + "step": 46969 + }, + { + "epoch": 1.2, + "learning_rate": 1.3600241147612672e-06, + "loss": 0.6694, + "step": 46970 + }, + { + "epoch": 1.2, + "learning_rate": 1.3599982996672404e-06, + "loss": 0.6919, + "step": 46971 + }, + { + "epoch": 1.2, + "learning_rate": 1.3599724842975788e-06, + "loss": 0.5168, + "step": 46972 + }, + { + "epoch": 1.2, + "learning_rate": 1.3599466686523037e-06, + "loss": 0.7607, + "step": 46973 + }, + { + "epoch": 1.2, + "learning_rate": 1.3599208527314332e-06, + "loss": 0.6914, + "step": 46974 + }, + { + "epoch": 1.2, + "learning_rate": 1.3598950365349882e-06, + "loss": 0.7266, + "step": 46975 + }, + { + "epoch": 1.2, + "learning_rate": 1.359869220062988e-06, + "loss": 0.5884, + "step": 46976 + }, + { + "epoch": 1.2, + "learning_rate": 1.3598434033154527e-06, + "loss": 0.5507, + "step": 46977 + }, + { + "epoch": 1.2, + "learning_rate": 1.3598175862924016e-06, + "loss": 0.5356, + "step": 46978 + }, + { + "epoch": 1.2, + "learning_rate": 1.3597917689938548e-06, + "loss": 0.6768, + "step": 46979 + }, + { + "epoch": 1.2, + "learning_rate": 1.3597659514198318e-06, + "loss": 0.6074, + "step": 46980 + }, + { + "epoch": 1.2, + "learning_rate": 1.359740133570353e-06, + "loss": 0.6445, + "step": 46981 + }, + { + "epoch": 1.2, + "learning_rate": 1.3597143154454373e-06, + "loss": 0.5713, + "step": 46982 + }, + { + "epoch": 1.2, + "learning_rate": 1.3596884970451053e-06, + "loss": 0.6763, + "step": 46983 + }, + { + "epoch": 1.2, + "learning_rate": 1.3596626783693758e-06, + "loss": 0.5283, + "step": 46984 + }, + { + "epoch": 1.2, + "learning_rate": 1.3596368594182694e-06, + "loss": 0.7803, + "step": 46985 + }, + { + "epoch": 1.2, + "learning_rate": 1.3596110401918058e-06, + "loss": 0.7588, + "step": 46986 + }, + { + "epoch": 1.2, + "learning_rate": 1.3595852206900043e-06, + "loss": 0.676, + "step": 46987 + }, + { + "epoch": 1.2, + "learning_rate": 1.3595594009128853e-06, + "loss": 0.7227, + "step": 46988 + }, + { + "epoch": 1.2, + "learning_rate": 1.3595335808604679e-06, + "loss": 0.6377, + "step": 46989 + }, + { + "epoch": 1.2, + "learning_rate": 1.3595077605327721e-06, + "loss": 0.4775, + "step": 46990 + }, + { + "epoch": 1.2, + "learning_rate": 1.3594819399298176e-06, + "loss": 0.8164, + "step": 46991 + }, + { + "epoch": 1.2, + "learning_rate": 1.3594561190516248e-06, + "loss": 0.7246, + "step": 46992 + }, + { + "epoch": 1.2, + "learning_rate": 1.3594302978982128e-06, + "loss": 0.6123, + "step": 46993 + }, + { + "epoch": 1.2, + "learning_rate": 1.3594044764696016e-06, + "loss": 0.6929, + "step": 46994 + }, + { + "epoch": 1.2, + "learning_rate": 1.3593786547658107e-06, + "loss": 0.5942, + "step": 46995 + }, + { + "epoch": 1.2, + "learning_rate": 1.3593528327868602e-06, + "loss": 0.8545, + "step": 46996 + }, + { + "epoch": 1.2, + "learning_rate": 1.3593270105327695e-06, + "loss": 0.5234, + "step": 46997 + }, + { + "epoch": 1.2, + "learning_rate": 1.3593011880035592e-06, + "loss": 0.4441, + "step": 46998 + }, + { + "epoch": 1.2, + "learning_rate": 1.359275365199248e-06, + "loss": 0.7852, + "step": 46999 + }, + { + "epoch": 1.2, + "learning_rate": 1.3592495421198562e-06, + "loss": 0.7559, + "step": 47000 + }, + { + "epoch": 1.2, + "learning_rate": 1.3592237187654036e-06, + "loss": 0.6914, + "step": 47001 + }, + { + "epoch": 1.2, + "learning_rate": 1.3591978951359102e-06, + "loss": 0.7178, + "step": 47002 + }, + { + "epoch": 1.2, + "learning_rate": 1.3591720712313955e-06, + "loss": 0.7744, + "step": 47003 + }, + { + "epoch": 1.2, + "learning_rate": 1.3591462470518788e-06, + "loss": 0.6797, + "step": 47004 + }, + { + "epoch": 1.2, + "learning_rate": 1.3591204225973804e-06, + "loss": 0.6289, + "step": 47005 + }, + { + "epoch": 1.2, + "learning_rate": 1.3590945978679202e-06, + "loss": 0.6753, + "step": 47006 + }, + { + "epoch": 1.2, + "learning_rate": 1.3590687728635177e-06, + "loss": 0.6997, + "step": 47007 + }, + { + "epoch": 1.2, + "learning_rate": 1.359042947584193e-06, + "loss": 0.6108, + "step": 47008 + }, + { + "epoch": 1.2, + "learning_rate": 1.3590171220299656e-06, + "loss": 0.563, + "step": 47009 + }, + { + "epoch": 1.2, + "learning_rate": 1.358991296200855e-06, + "loss": 0.6289, + "step": 47010 + }, + { + "epoch": 1.2, + "learning_rate": 1.3589654700968814e-06, + "loss": 0.6914, + "step": 47011 + }, + { + "epoch": 1.2, + "learning_rate": 1.3589396437180645e-06, + "loss": 0.833, + "step": 47012 + }, + { + "epoch": 1.2, + "learning_rate": 1.3589138170644241e-06, + "loss": 0.5352, + "step": 47013 + }, + { + "epoch": 1.2, + "learning_rate": 1.3588879901359796e-06, + "loss": 0.5586, + "step": 47014 + }, + { + "epoch": 1.21, + "learning_rate": 1.3588621629327514e-06, + "loss": 0.708, + "step": 47015 + }, + { + "epoch": 1.21, + "learning_rate": 1.3588363354547584e-06, + "loss": 0.5698, + "step": 47016 + }, + { + "epoch": 1.21, + "learning_rate": 1.3588105077020215e-06, + "loss": 0.6875, + "step": 47017 + }, + { + "epoch": 1.21, + "learning_rate": 1.3587846796745597e-06, + "loss": 0.5615, + "step": 47018 + }, + { + "epoch": 1.21, + "learning_rate": 1.358758851372393e-06, + "loss": 0.7754, + "step": 47019 + }, + { + "epoch": 1.21, + "learning_rate": 1.3587330227955411e-06, + "loss": 0.6763, + "step": 47020 + }, + { + "epoch": 1.21, + "learning_rate": 1.3587071939440237e-06, + "loss": 0.5547, + "step": 47021 + }, + { + "epoch": 1.21, + "learning_rate": 1.3586813648178609e-06, + "loss": 0.6724, + "step": 47022 + }, + { + "epoch": 1.21, + "learning_rate": 1.3586555354170722e-06, + "loss": 0.7588, + "step": 47023 + }, + { + "epoch": 1.21, + "learning_rate": 1.3586297057416776e-06, + "loss": 0.7246, + "step": 47024 + }, + { + "epoch": 1.21, + "learning_rate": 1.3586038757916965e-06, + "loss": 0.5735, + "step": 47025 + }, + { + "epoch": 1.21, + "learning_rate": 1.3585780455671488e-06, + "loss": 0.4934, + "step": 47026 + }, + { + "epoch": 1.21, + "learning_rate": 1.3585522150680546e-06, + "loss": 0.7471, + "step": 47027 + }, + { + "epoch": 1.21, + "learning_rate": 1.3585263842944335e-06, + "loss": 0.6387, + "step": 47028 + }, + { + "epoch": 1.21, + "learning_rate": 1.3585005532463049e-06, + "loss": 0.4403, + "step": 47029 + }, + { + "epoch": 1.21, + "learning_rate": 1.3584747219236893e-06, + "loss": 0.7129, + "step": 47030 + }, + { + "epoch": 1.21, + "learning_rate": 1.3584488903266058e-06, + "loss": 0.6177, + "step": 47031 + }, + { + "epoch": 1.21, + "learning_rate": 1.3584230584550746e-06, + "loss": 0.7197, + "step": 47032 + }, + { + "epoch": 1.21, + "learning_rate": 1.3583972263091154e-06, + "loss": 0.5186, + "step": 47033 + }, + { + "epoch": 1.21, + "learning_rate": 1.358371393888748e-06, + "loss": 0.4417, + "step": 47034 + }, + { + "epoch": 1.21, + "learning_rate": 1.3583455611939917e-06, + "loss": 0.7139, + "step": 47035 + }, + { + "epoch": 1.21, + "learning_rate": 1.358319728224867e-06, + "loss": 0.6826, + "step": 47036 + }, + { + "epoch": 1.21, + "learning_rate": 1.3582938949813934e-06, + "loss": 0.7314, + "step": 47037 + }, + { + "epoch": 1.21, + "learning_rate": 1.358268061463591e-06, + "loss": 0.5228, + "step": 47038 + }, + { + "epoch": 1.21, + "learning_rate": 1.3582422276714783e-06, + "loss": 0.749, + "step": 47039 + }, + { + "epoch": 1.21, + "learning_rate": 1.3582163936050765e-06, + "loss": 0.6084, + "step": 47040 + }, + { + "epoch": 1.21, + "learning_rate": 1.3581905592644046e-06, + "loss": 0.5762, + "step": 47041 + }, + { + "epoch": 1.21, + "learning_rate": 1.3581647246494832e-06, + "loss": 0.5703, + "step": 47042 + }, + { + "epoch": 1.21, + "learning_rate": 1.3581388897603312e-06, + "loss": 0.6533, + "step": 47043 + }, + { + "epoch": 1.21, + "learning_rate": 1.358113054596969e-06, + "loss": 0.4531, + "step": 47044 + }, + { + "epoch": 1.21, + "learning_rate": 1.3580872191594157e-06, + "loss": 0.7227, + "step": 47045 + }, + { + "epoch": 1.21, + "learning_rate": 1.3580613834476916e-06, + "loss": 0.6797, + "step": 47046 + }, + { + "epoch": 1.21, + "learning_rate": 1.3580355474618164e-06, + "loss": 0.665, + "step": 47047 + }, + { + "epoch": 1.21, + "learning_rate": 1.3580097112018098e-06, + "loss": 0.6621, + "step": 47048 + }, + { + "epoch": 1.21, + "learning_rate": 1.3579838746676916e-06, + "loss": 0.564, + "step": 47049 + }, + { + "epoch": 1.21, + "learning_rate": 1.3579580378594817e-06, + "loss": 0.3911, + "step": 47050 + }, + { + "epoch": 1.21, + "learning_rate": 1.3579322007771998e-06, + "loss": 0.749, + "step": 47051 + }, + { + "epoch": 1.21, + "learning_rate": 1.3579063634208655e-06, + "loss": 0.5708, + "step": 47052 + }, + { + "epoch": 1.21, + "learning_rate": 1.3578805257904994e-06, + "loss": 0.5405, + "step": 47053 + }, + { + "epoch": 1.21, + "learning_rate": 1.3578546878861197e-06, + "loss": 0.7578, + "step": 47054 + }, + { + "epoch": 1.21, + "learning_rate": 1.3578288497077478e-06, + "loss": 0.6025, + "step": 47055 + }, + { + "epoch": 1.21, + "learning_rate": 1.3578030112554024e-06, + "loss": 0.7285, + "step": 47056 + }, + { + "epoch": 1.21, + "learning_rate": 1.357777172529104e-06, + "loss": 0.6709, + "step": 47057 + }, + { + "epoch": 1.21, + "learning_rate": 1.357751333528872e-06, + "loss": 0.5142, + "step": 47058 + }, + { + "epoch": 1.21, + "learning_rate": 1.357725494254726e-06, + "loss": 0.6396, + "step": 47059 + }, + { + "epoch": 1.21, + "learning_rate": 1.357699654706686e-06, + "loss": 0.7383, + "step": 47060 + }, + { + "epoch": 1.21, + "learning_rate": 1.357673814884772e-06, + "loss": 0.791, + "step": 47061 + }, + { + "epoch": 1.21, + "learning_rate": 1.3576479747890037e-06, + "loss": 0.6689, + "step": 47062 + }, + { + "epoch": 1.21, + "learning_rate": 1.357622134419401e-06, + "loss": 0.7861, + "step": 47063 + }, + { + "epoch": 1.21, + "learning_rate": 1.3575962937759831e-06, + "loss": 0.5149, + "step": 47064 + }, + { + "epoch": 1.21, + "learning_rate": 1.3575704528587704e-06, + "loss": 0.5942, + "step": 47065 + }, + { + "epoch": 1.21, + "learning_rate": 1.357544611667782e-06, + "loss": 0.5305, + "step": 47066 + }, + { + "epoch": 1.21, + "learning_rate": 1.3575187702030387e-06, + "loss": 0.6553, + "step": 47067 + }, + { + "epoch": 1.21, + "learning_rate": 1.3574929284645596e-06, + "loss": 0.6816, + "step": 47068 + }, + { + "epoch": 1.21, + "learning_rate": 1.357467086452364e-06, + "loss": 0.499, + "step": 47069 + }, + { + "epoch": 1.21, + "learning_rate": 1.357441244166473e-06, + "loss": 0.6504, + "step": 47070 + }, + { + "epoch": 1.21, + "learning_rate": 1.3574154016069054e-06, + "loss": 0.5835, + "step": 47071 + }, + { + "epoch": 1.21, + "learning_rate": 1.3573895587736813e-06, + "loss": 0.5366, + "step": 47072 + }, + { + "epoch": 1.21, + "learning_rate": 1.3573637156668202e-06, + "loss": 0.7588, + "step": 47073 + }, + { + "epoch": 1.21, + "learning_rate": 1.3573378722863427e-06, + "loss": 0.6016, + "step": 47074 + }, + { + "epoch": 1.21, + "learning_rate": 1.3573120286322674e-06, + "loss": 0.7598, + "step": 47075 + }, + { + "epoch": 1.21, + "learning_rate": 1.3572861847046151e-06, + "loss": 0.7607, + "step": 47076 + }, + { + "epoch": 1.21, + "learning_rate": 1.357260340503405e-06, + "loss": 0.6802, + "step": 47077 + }, + { + "epoch": 1.21, + "learning_rate": 1.3572344960286575e-06, + "loss": 0.7129, + "step": 47078 + }, + { + "epoch": 1.21, + "learning_rate": 1.3572086512803915e-06, + "loss": 0.6479, + "step": 47079 + }, + { + "epoch": 1.21, + "learning_rate": 1.3571828062586275e-06, + "loss": 0.5781, + "step": 47080 + }, + { + "epoch": 1.21, + "learning_rate": 1.3571569609633846e-06, + "loss": 0.5933, + "step": 47081 + }, + { + "epoch": 1.21, + "learning_rate": 1.3571311153946837e-06, + "loss": 0.5835, + "step": 47082 + }, + { + "epoch": 1.21, + "learning_rate": 1.3571052695525436e-06, + "loss": 0.6704, + "step": 47083 + }, + { + "epoch": 1.21, + "learning_rate": 1.3570794234369844e-06, + "loss": 0.6543, + "step": 47084 + }, + { + "epoch": 1.21, + "learning_rate": 1.3570535770480259e-06, + "loss": 0.4556, + "step": 47085 + }, + { + "epoch": 1.21, + "learning_rate": 1.357027730385688e-06, + "loss": 0.5669, + "step": 47086 + }, + { + "epoch": 1.21, + "learning_rate": 1.3570018834499903e-06, + "loss": 0.6123, + "step": 47087 + }, + { + "epoch": 1.21, + "learning_rate": 1.356976036240953e-06, + "loss": 0.4368, + "step": 47088 + }, + { + "epoch": 1.21, + "learning_rate": 1.3569501887585951e-06, + "loss": 0.4926, + "step": 47089 + }, + { + "epoch": 1.21, + "learning_rate": 1.356924341002937e-06, + "loss": 0.6777, + "step": 47090 + }, + { + "epoch": 1.21, + "learning_rate": 1.3568984929739982e-06, + "loss": 0.4597, + "step": 47091 + }, + { + "epoch": 1.21, + "learning_rate": 1.356872644671799e-06, + "loss": 0.7173, + "step": 47092 + }, + { + "epoch": 1.21, + "learning_rate": 1.3568467960963585e-06, + "loss": 0.6299, + "step": 47093 + }, + { + "epoch": 1.21, + "learning_rate": 1.3568209472476967e-06, + "loss": 0.7354, + "step": 47094 + }, + { + "epoch": 1.21, + "learning_rate": 1.356795098125834e-06, + "loss": 0.6982, + "step": 47095 + }, + { + "epoch": 1.21, + "learning_rate": 1.3567692487307892e-06, + "loss": 0.6631, + "step": 47096 + }, + { + "epoch": 1.21, + "learning_rate": 1.3567433990625829e-06, + "loss": 0.6069, + "step": 47097 + }, + { + "epoch": 1.21, + "learning_rate": 1.3567175491212347e-06, + "loss": 0.707, + "step": 47098 + }, + { + "epoch": 1.21, + "learning_rate": 1.356691698906764e-06, + "loss": 0.4517, + "step": 47099 + }, + { + "epoch": 1.21, + "learning_rate": 1.356665848419191e-06, + "loss": 0.7822, + "step": 47100 + }, + { + "epoch": 1.21, + "learning_rate": 1.3566399976585353e-06, + "loss": 0.6501, + "step": 47101 + }, + { + "epoch": 1.21, + "learning_rate": 1.3566141466248167e-06, + "loss": 0.4916, + "step": 47102 + }, + { + "epoch": 1.21, + "learning_rate": 1.3565882953180552e-06, + "loss": 0.5762, + "step": 47103 + }, + { + "epoch": 1.21, + "learning_rate": 1.3565624437382704e-06, + "loss": 0.6338, + "step": 47104 + }, + { + "epoch": 1.21, + "learning_rate": 1.356536591885482e-06, + "loss": 0.5742, + "step": 47105 + }, + { + "epoch": 1.21, + "learning_rate": 1.35651073975971e-06, + "loss": 0.4518, + "step": 47106 + }, + { + "epoch": 1.21, + "learning_rate": 1.356484887360974e-06, + "loss": 0.6797, + "step": 47107 + }, + { + "epoch": 1.21, + "learning_rate": 1.3564590346892941e-06, + "loss": 0.5532, + "step": 47108 + }, + { + "epoch": 1.21, + "learning_rate": 1.35643318174469e-06, + "loss": 0.7734, + "step": 47109 + }, + { + "epoch": 1.21, + "learning_rate": 1.3564073285271812e-06, + "loss": 0.6006, + "step": 47110 + }, + { + "epoch": 1.21, + "learning_rate": 1.3563814750367878e-06, + "loss": 0.6431, + "step": 47111 + }, + { + "epoch": 1.21, + "learning_rate": 1.3563556212735293e-06, + "loss": 0.5144, + "step": 47112 + }, + { + "epoch": 1.21, + "learning_rate": 1.3563297672374258e-06, + "loss": 0.6514, + "step": 47113 + }, + { + "epoch": 1.21, + "learning_rate": 1.3563039129284972e-06, + "loss": 0.4938, + "step": 47114 + }, + { + "epoch": 1.21, + "learning_rate": 1.3562780583467629e-06, + "loss": 0.7632, + "step": 47115 + }, + { + "epoch": 1.21, + "learning_rate": 1.3562522034922426e-06, + "loss": 0.7183, + "step": 47116 + }, + { + "epoch": 1.21, + "learning_rate": 1.3562263483649567e-06, + "loss": 0.6318, + "step": 47117 + }, + { + "epoch": 1.21, + "learning_rate": 1.3562004929649246e-06, + "loss": 0.5854, + "step": 47118 + }, + { + "epoch": 1.21, + "learning_rate": 1.356174637292166e-06, + "loss": 0.7598, + "step": 47119 + }, + { + "epoch": 1.21, + "learning_rate": 1.3561487813467012e-06, + "loss": 0.6855, + "step": 47120 + }, + { + "epoch": 1.21, + "learning_rate": 1.3561229251285494e-06, + "loss": 0.5201, + "step": 47121 + }, + { + "epoch": 1.21, + "learning_rate": 1.3560970686377307e-06, + "loss": 0.877, + "step": 47122 + }, + { + "epoch": 1.21, + "learning_rate": 1.356071211874265e-06, + "loss": 0.6904, + "step": 47123 + }, + { + "epoch": 1.21, + "learning_rate": 1.356045354838172e-06, + "loss": 0.5317, + "step": 47124 + }, + { + "epoch": 1.21, + "learning_rate": 1.3560194975294709e-06, + "loss": 0.7197, + "step": 47125 + }, + { + "epoch": 1.21, + "learning_rate": 1.3559936399481826e-06, + "loss": 0.6113, + "step": 47126 + }, + { + "epoch": 1.21, + "learning_rate": 1.355967782094326e-06, + "loss": 0.7014, + "step": 47127 + }, + { + "epoch": 1.21, + "learning_rate": 1.3559419239679214e-06, + "loss": 0.5869, + "step": 47128 + }, + { + "epoch": 1.21, + "learning_rate": 1.3559160655689886e-06, + "loss": 0.7949, + "step": 47129 + }, + { + "epoch": 1.21, + "learning_rate": 1.3558902068975469e-06, + "loss": 0.5298, + "step": 47130 + }, + { + "epoch": 1.21, + "learning_rate": 1.3558643479536165e-06, + "loss": 0.6025, + "step": 47131 + }, + { + "epoch": 1.21, + "learning_rate": 1.3558384887372173e-06, + "loss": 0.8848, + "step": 47132 + }, + { + "epoch": 1.21, + "learning_rate": 1.3558126292483687e-06, + "loss": 0.6729, + "step": 47133 + }, + { + "epoch": 1.21, + "learning_rate": 1.355786769487091e-06, + "loss": 0.7168, + "step": 47134 + }, + { + "epoch": 1.21, + "learning_rate": 1.3557609094534036e-06, + "loss": 0.4663, + "step": 47135 + }, + { + "epoch": 1.21, + "learning_rate": 1.3557350491473263e-06, + "loss": 0.6304, + "step": 47136 + }, + { + "epoch": 1.21, + "learning_rate": 1.3557091885688795e-06, + "loss": 0.6113, + "step": 47137 + }, + { + "epoch": 1.21, + "learning_rate": 1.355683327718082e-06, + "loss": 0.7637, + "step": 47138 + }, + { + "epoch": 1.21, + "learning_rate": 1.3556574665949543e-06, + "loss": 0.5059, + "step": 47139 + }, + { + "epoch": 1.21, + "learning_rate": 1.3556316051995158e-06, + "loss": 0.7104, + "step": 47140 + }, + { + "epoch": 1.21, + "learning_rate": 1.355605743531787e-06, + "loss": 0.7949, + "step": 47141 + }, + { + "epoch": 1.21, + "learning_rate": 1.355579881591787e-06, + "loss": 0.6782, + "step": 47142 + }, + { + "epoch": 1.21, + "learning_rate": 1.355554019379536e-06, + "loss": 0.5762, + "step": 47143 + }, + { + "epoch": 1.21, + "learning_rate": 1.3555281568950532e-06, + "loss": 0.6724, + "step": 47144 + }, + { + "epoch": 1.21, + "learning_rate": 1.355502294138359e-06, + "loss": 0.5684, + "step": 47145 + }, + { + "epoch": 1.21, + "learning_rate": 1.3554764311094732e-06, + "loss": 0.5034, + "step": 47146 + }, + { + "epoch": 1.21, + "learning_rate": 1.3554505678084156e-06, + "loss": 0.7827, + "step": 47147 + }, + { + "epoch": 1.21, + "learning_rate": 1.3554247042352056e-06, + "loss": 0.6899, + "step": 47148 + }, + { + "epoch": 1.21, + "learning_rate": 1.3553988403898634e-06, + "loss": 0.667, + "step": 47149 + }, + { + "epoch": 1.21, + "learning_rate": 1.3553729762724083e-06, + "loss": 0.5884, + "step": 47150 + }, + { + "epoch": 1.21, + "learning_rate": 1.3553471118828608e-06, + "loss": 0.6592, + "step": 47151 + }, + { + "epoch": 1.21, + "learning_rate": 1.3553212472212402e-06, + "loss": 0.5728, + "step": 47152 + }, + { + "epoch": 1.21, + "learning_rate": 1.3552953822875668e-06, + "loss": 0.717, + "step": 47153 + }, + { + "epoch": 1.21, + "learning_rate": 1.3552695170818596e-06, + "loss": 0.6602, + "step": 47154 + }, + { + "epoch": 1.21, + "learning_rate": 1.3552436516041393e-06, + "loss": 0.6284, + "step": 47155 + }, + { + "epoch": 1.21, + "learning_rate": 1.3552177858544248e-06, + "loss": 0.624, + "step": 47156 + }, + { + "epoch": 1.21, + "learning_rate": 1.3551919198327367e-06, + "loss": 0.6191, + "step": 47157 + }, + { + "epoch": 1.21, + "learning_rate": 1.3551660535390943e-06, + "loss": 0.6372, + "step": 47158 + }, + { + "epoch": 1.21, + "learning_rate": 1.3551401869735174e-06, + "loss": 0.572, + "step": 47159 + }, + { + "epoch": 1.21, + "learning_rate": 1.3551143201360265e-06, + "loss": 0.6362, + "step": 47160 + }, + { + "epoch": 1.21, + "learning_rate": 1.3550884530266403e-06, + "loss": 0.7012, + "step": 47161 + }, + { + "epoch": 1.21, + "learning_rate": 1.3550625856453799e-06, + "loss": 0.8115, + "step": 47162 + }, + { + "epoch": 1.21, + "learning_rate": 1.355036717992264e-06, + "loss": 0.5994, + "step": 47163 + }, + { + "epoch": 1.21, + "learning_rate": 1.3550108500673128e-06, + "loss": 0.5446, + "step": 47164 + }, + { + "epoch": 1.21, + "learning_rate": 1.3549849818705461e-06, + "loss": 0.8359, + "step": 47165 + }, + { + "epoch": 1.21, + "learning_rate": 1.3549591134019838e-06, + "loss": 0.6768, + "step": 47166 + }, + { + "epoch": 1.21, + "learning_rate": 1.3549332446616454e-06, + "loss": 0.5354, + "step": 47167 + }, + { + "epoch": 1.21, + "learning_rate": 1.3549073756495516e-06, + "loss": 0.7168, + "step": 47168 + }, + { + "epoch": 1.21, + "learning_rate": 1.3548815063657209e-06, + "loss": 0.6348, + "step": 47169 + }, + { + "epoch": 1.21, + "learning_rate": 1.354855636810174e-06, + "loss": 0.5312, + "step": 47170 + }, + { + "epoch": 1.21, + "learning_rate": 1.35482976698293e-06, + "loss": 0.6328, + "step": 47171 + }, + { + "epoch": 1.21, + "learning_rate": 1.35480389688401e-06, + "loss": 0.4346, + "step": 47172 + }, + { + "epoch": 1.21, + "learning_rate": 1.3547780265134322e-06, + "loss": 0.5049, + "step": 47173 + }, + { + "epoch": 1.21, + "learning_rate": 1.3547521558712176e-06, + "loss": 0.7158, + "step": 47174 + }, + { + "epoch": 1.21, + "learning_rate": 1.3547262849573854e-06, + "loss": 0.5918, + "step": 47175 + }, + { + "epoch": 1.21, + "learning_rate": 1.3547004137719558e-06, + "loss": 0.7061, + "step": 47176 + }, + { + "epoch": 1.21, + "learning_rate": 1.3546745423149483e-06, + "loss": 0.7954, + "step": 47177 + }, + { + "epoch": 1.21, + "learning_rate": 1.354648670586383e-06, + "loss": 0.8486, + "step": 47178 + }, + { + "epoch": 1.21, + "learning_rate": 1.354622798586279e-06, + "loss": 0.5283, + "step": 47179 + }, + { + "epoch": 1.21, + "learning_rate": 1.354596926314657e-06, + "loss": 0.707, + "step": 47180 + }, + { + "epoch": 1.21, + "learning_rate": 1.3545710537715365e-06, + "loss": 0.7617, + "step": 47181 + }, + { + "epoch": 1.21, + "learning_rate": 1.354545180956937e-06, + "loss": 0.6519, + "step": 47182 + }, + { + "epoch": 1.21, + "learning_rate": 1.3545193078708788e-06, + "loss": 0.7793, + "step": 47183 + }, + { + "epoch": 1.21, + "learning_rate": 1.3544934345133812e-06, + "loss": 0.6724, + "step": 47184 + }, + { + "epoch": 1.21, + "learning_rate": 1.3544675608844646e-06, + "loss": 0.7119, + "step": 47185 + }, + { + "epoch": 1.21, + "learning_rate": 1.3544416869841482e-06, + "loss": 0.6621, + "step": 47186 + }, + { + "epoch": 1.21, + "learning_rate": 1.3544158128124523e-06, + "loss": 0.8545, + "step": 47187 + }, + { + "epoch": 1.21, + "learning_rate": 1.3543899383693964e-06, + "loss": 0.6514, + "step": 47188 + }, + { + "epoch": 1.21, + "learning_rate": 1.3543640636550005e-06, + "loss": 0.7559, + "step": 47189 + }, + { + "epoch": 1.21, + "learning_rate": 1.3543381886692843e-06, + "loss": 0.5964, + "step": 47190 + }, + { + "epoch": 1.21, + "learning_rate": 1.3543123134122676e-06, + "loss": 0.7861, + "step": 47191 + }, + { + "epoch": 1.21, + "learning_rate": 1.3542864378839703e-06, + "loss": 0.6895, + "step": 47192 + }, + { + "epoch": 1.21, + "learning_rate": 1.3542605620844123e-06, + "loss": 0.543, + "step": 47193 + }, + { + "epoch": 1.21, + "learning_rate": 1.3542346860136128e-06, + "loss": 0.668, + "step": 47194 + }, + { + "epoch": 1.21, + "learning_rate": 1.3542088096715925e-06, + "loss": 0.6455, + "step": 47195 + }, + { + "epoch": 1.21, + "learning_rate": 1.3541829330583706e-06, + "loss": 0.6616, + "step": 47196 + }, + { + "epoch": 1.21, + "learning_rate": 1.3541570561739674e-06, + "loss": 0.6904, + "step": 47197 + }, + { + "epoch": 1.21, + "learning_rate": 1.3541311790184022e-06, + "loss": 0.752, + "step": 47198 + }, + { + "epoch": 1.21, + "learning_rate": 1.3541053015916952e-06, + "loss": 0.7402, + "step": 47199 + }, + { + "epoch": 1.21, + "learning_rate": 1.3540794238938657e-06, + "loss": 0.5176, + "step": 47200 + }, + { + "epoch": 1.21, + "learning_rate": 1.3540535459249342e-06, + "loss": 0.6074, + "step": 47201 + }, + { + "epoch": 1.21, + "learning_rate": 1.3540276676849201e-06, + "loss": 0.709, + "step": 47202 + }, + { + "epoch": 1.21, + "learning_rate": 1.3540017891738432e-06, + "loss": 0.5273, + "step": 47203 + }, + { + "epoch": 1.21, + "learning_rate": 1.3539759103917235e-06, + "loss": 0.6289, + "step": 47204 + }, + { + "epoch": 1.21, + "learning_rate": 1.3539500313385809e-06, + "loss": 0.563, + "step": 47205 + }, + { + "epoch": 1.21, + "learning_rate": 1.3539241520144347e-06, + "loss": 0.6895, + "step": 47206 + }, + { + "epoch": 1.21, + "learning_rate": 1.3538982724193054e-06, + "loss": 0.6802, + "step": 47207 + }, + { + "epoch": 1.21, + "learning_rate": 1.3538723925532121e-06, + "loss": 0.6357, + "step": 47208 + }, + { + "epoch": 1.21, + "learning_rate": 1.353846512416175e-06, + "loss": 0.5571, + "step": 47209 + }, + { + "epoch": 1.21, + "learning_rate": 1.3538206320082143e-06, + "loss": 0.6602, + "step": 47210 + }, + { + "epoch": 1.21, + "learning_rate": 1.3537947513293488e-06, + "loss": 0.5371, + "step": 47211 + }, + { + "epoch": 1.21, + "learning_rate": 1.3537688703795995e-06, + "loss": 0.5542, + "step": 47212 + }, + { + "epoch": 1.21, + "learning_rate": 1.3537429891589854e-06, + "loss": 0.6514, + "step": 47213 + }, + { + "epoch": 1.21, + "learning_rate": 1.3537171076675267e-06, + "loss": 0.7207, + "step": 47214 + }, + { + "epoch": 1.21, + "learning_rate": 1.3536912259052426e-06, + "loss": 0.6494, + "step": 47215 + }, + { + "epoch": 1.21, + "learning_rate": 1.3536653438721538e-06, + "loss": 0.3652, + "step": 47216 + }, + { + "epoch": 1.21, + "learning_rate": 1.3536394615682799e-06, + "loss": 0.749, + "step": 47217 + }, + { + "epoch": 1.21, + "learning_rate": 1.3536135789936403e-06, + "loss": 0.561, + "step": 47218 + }, + { + "epoch": 1.21, + "learning_rate": 1.3535876961482548e-06, + "loss": 0.6006, + "step": 47219 + }, + { + "epoch": 1.21, + "learning_rate": 1.3535618130321438e-06, + "loss": 0.5864, + "step": 47220 + }, + { + "epoch": 1.21, + "learning_rate": 1.3535359296453265e-06, + "loss": 0.5703, + "step": 47221 + }, + { + "epoch": 1.21, + "learning_rate": 1.3535100459878233e-06, + "loss": 0.5713, + "step": 47222 + }, + { + "epoch": 1.21, + "learning_rate": 1.3534841620596535e-06, + "loss": 0.6387, + "step": 47223 + }, + { + "epoch": 1.21, + "learning_rate": 1.3534582778608372e-06, + "loss": 0.7402, + "step": 47224 + }, + { + "epoch": 1.21, + "learning_rate": 1.3534323933913944e-06, + "loss": 0.5723, + "step": 47225 + }, + { + "epoch": 1.21, + "learning_rate": 1.3534065086513441e-06, + "loss": 0.75, + "step": 47226 + }, + { + "epoch": 1.21, + "learning_rate": 1.353380623640707e-06, + "loss": 0.7485, + "step": 47227 + }, + { + "epoch": 1.21, + "learning_rate": 1.3533547383595026e-06, + "loss": 0.5532, + "step": 47228 + }, + { + "epoch": 1.21, + "learning_rate": 1.3533288528077508e-06, + "loss": 0.6465, + "step": 47229 + }, + { + "epoch": 1.21, + "learning_rate": 1.3533029669854712e-06, + "loss": 0.8955, + "step": 47230 + }, + { + "epoch": 1.21, + "learning_rate": 1.353277080892684e-06, + "loss": 0.7007, + "step": 47231 + }, + { + "epoch": 1.21, + "learning_rate": 1.3532511945294085e-06, + "loss": 0.7949, + "step": 47232 + }, + { + "epoch": 1.21, + "learning_rate": 1.353225307895665e-06, + "loss": 0.6753, + "step": 47233 + }, + { + "epoch": 1.21, + "learning_rate": 1.3531994209914729e-06, + "loss": 0.6504, + "step": 47234 + }, + { + "epoch": 1.21, + "learning_rate": 1.3531735338168524e-06, + "loss": 0.6768, + "step": 47235 + }, + { + "epoch": 1.21, + "learning_rate": 1.353147646371823e-06, + "loss": 0.6909, + "step": 47236 + }, + { + "epoch": 1.21, + "learning_rate": 1.3531217586564052e-06, + "loss": 0.646, + "step": 47237 + }, + { + "epoch": 1.21, + "learning_rate": 1.3530958706706176e-06, + "loss": 0.5923, + "step": 47238 + }, + { + "epoch": 1.21, + "learning_rate": 1.3530699824144814e-06, + "loss": 0.5652, + "step": 47239 + }, + { + "epoch": 1.21, + "learning_rate": 1.3530440938880151e-06, + "loss": 0.6357, + "step": 47240 + }, + { + "epoch": 1.21, + "learning_rate": 1.3530182050912395e-06, + "loss": 0.6489, + "step": 47241 + }, + { + "epoch": 1.21, + "learning_rate": 1.3529923160241742e-06, + "loss": 0.6719, + "step": 47242 + }, + { + "epoch": 1.21, + "learning_rate": 1.352966426686839e-06, + "loss": 0.5923, + "step": 47243 + }, + { + "epoch": 1.21, + "learning_rate": 1.3529405370792533e-06, + "loss": 0.8174, + "step": 47244 + }, + { + "epoch": 1.21, + "learning_rate": 1.3529146472014374e-06, + "loss": 0.5869, + "step": 47245 + }, + { + "epoch": 1.21, + "learning_rate": 1.352888757053411e-06, + "loss": 0.7305, + "step": 47246 + }, + { + "epoch": 1.21, + "learning_rate": 1.3528628666351938e-06, + "loss": 0.6963, + "step": 47247 + }, + { + "epoch": 1.21, + "learning_rate": 1.352836975946806e-06, + "loss": 0.4856, + "step": 47248 + }, + { + "epoch": 1.21, + "learning_rate": 1.3528110849882665e-06, + "loss": 0.4458, + "step": 47249 + }, + { + "epoch": 1.21, + "learning_rate": 1.3527851937595964e-06, + "loss": 0.6621, + "step": 47250 + }, + { + "epoch": 1.21, + "learning_rate": 1.3527593022608147e-06, + "loss": 0.4629, + "step": 47251 + }, + { + "epoch": 1.21, + "learning_rate": 1.3527334104919418e-06, + "loss": 0.4685, + "step": 47252 + }, + { + "epoch": 1.21, + "learning_rate": 1.3527075184529965e-06, + "loss": 0.6494, + "step": 47253 + }, + { + "epoch": 1.21, + "learning_rate": 1.3526816261439997e-06, + "loss": 0.6387, + "step": 47254 + }, + { + "epoch": 1.21, + "learning_rate": 1.3526557335649704e-06, + "loss": 0.6055, + "step": 47255 + }, + { + "epoch": 1.21, + "learning_rate": 1.3526298407159294e-06, + "loss": 0.479, + "step": 47256 + }, + { + "epoch": 1.21, + "learning_rate": 1.3526039475968956e-06, + "loss": 0.5815, + "step": 47257 + }, + { + "epoch": 1.21, + "learning_rate": 1.3525780542078892e-06, + "loss": 0.5942, + "step": 47258 + }, + { + "epoch": 1.21, + "learning_rate": 1.35255216054893e-06, + "loss": 0.7637, + "step": 47259 + }, + { + "epoch": 1.21, + "learning_rate": 1.3525262666200378e-06, + "loss": 0.5747, + "step": 47260 + }, + { + "epoch": 1.21, + "learning_rate": 1.3525003724212323e-06, + "loss": 0.5918, + "step": 47261 + }, + { + "epoch": 1.21, + "learning_rate": 1.3524744779525339e-06, + "loss": 0.7207, + "step": 47262 + }, + { + "epoch": 1.21, + "learning_rate": 1.3524485832139617e-06, + "loss": 0.5685, + "step": 47263 + }, + { + "epoch": 1.21, + "learning_rate": 1.3524226882055358e-06, + "loss": 0.7217, + "step": 47264 + }, + { + "epoch": 1.21, + "learning_rate": 1.3523967929272762e-06, + "loss": 0.646, + "step": 47265 + }, + { + "epoch": 1.21, + "learning_rate": 1.3523708973792024e-06, + "loss": 0.5083, + "step": 47266 + }, + { + "epoch": 1.21, + "learning_rate": 1.3523450015613347e-06, + "loss": 0.7285, + "step": 47267 + }, + { + "epoch": 1.21, + "learning_rate": 1.3523191054736925e-06, + "loss": 0.5603, + "step": 47268 + }, + { + "epoch": 1.21, + "learning_rate": 1.3522932091162955e-06, + "loss": 0.7046, + "step": 47269 + }, + { + "epoch": 1.21, + "learning_rate": 1.3522673124891642e-06, + "loss": 0.572, + "step": 47270 + }, + { + "epoch": 1.21, + "learning_rate": 1.3522414155923176e-06, + "loss": 0.6309, + "step": 47271 + }, + { + "epoch": 1.21, + "learning_rate": 1.3522155184257763e-06, + "loss": 0.605, + "step": 47272 + }, + { + "epoch": 1.21, + "learning_rate": 1.3521896209895596e-06, + "loss": 0.5378, + "step": 47273 + }, + { + "epoch": 1.21, + "learning_rate": 1.3521637232836874e-06, + "loss": 0.7617, + "step": 47274 + }, + { + "epoch": 1.21, + "learning_rate": 1.3521378253081796e-06, + "loss": 0.6455, + "step": 47275 + }, + { + "epoch": 1.21, + "learning_rate": 1.3521119270630564e-06, + "loss": 0.6436, + "step": 47276 + }, + { + "epoch": 1.21, + "learning_rate": 1.3520860285483372e-06, + "loss": 0.8193, + "step": 47277 + }, + { + "epoch": 1.21, + "learning_rate": 1.3520601297640418e-06, + "loss": 0.6816, + "step": 47278 + }, + { + "epoch": 1.21, + "learning_rate": 1.3520342307101901e-06, + "loss": 0.7188, + "step": 47279 + }, + { + "epoch": 1.21, + "learning_rate": 1.3520083313868018e-06, + "loss": 0.5571, + "step": 47280 + }, + { + "epoch": 1.21, + "learning_rate": 1.3519824317938973e-06, + "loss": 0.626, + "step": 47281 + }, + { + "epoch": 1.21, + "learning_rate": 1.351956531931496e-06, + "loss": 0.752, + "step": 47282 + }, + { + "epoch": 1.21, + "learning_rate": 1.3519306317996177e-06, + "loss": 0.7803, + "step": 47283 + }, + { + "epoch": 1.21, + "learning_rate": 1.3519047313982821e-06, + "loss": 0.7246, + "step": 47284 + }, + { + "epoch": 1.21, + "learning_rate": 1.3518788307275096e-06, + "loss": 0.606, + "step": 47285 + }, + { + "epoch": 1.21, + "learning_rate": 1.3518529297873192e-06, + "loss": 0.5508, + "step": 47286 + }, + { + "epoch": 1.21, + "learning_rate": 1.3518270285777317e-06, + "loss": 0.5342, + "step": 47287 + }, + { + "epoch": 1.21, + "learning_rate": 1.3518011270987658e-06, + "loss": 0.6479, + "step": 47288 + }, + { + "epoch": 1.21, + "learning_rate": 1.3517752253504427e-06, + "loss": 0.6943, + "step": 47289 + }, + { + "epoch": 1.21, + "learning_rate": 1.3517493233327808e-06, + "loss": 0.7441, + "step": 47290 + }, + { + "epoch": 1.21, + "learning_rate": 1.3517234210458008e-06, + "loss": 0.6367, + "step": 47291 + }, + { + "epoch": 1.21, + "learning_rate": 1.3516975184895226e-06, + "loss": 0.7412, + "step": 47292 + }, + { + "epoch": 1.21, + "learning_rate": 1.3516716156639656e-06, + "loss": 0.6914, + "step": 47293 + }, + { + "epoch": 1.21, + "learning_rate": 1.3516457125691497e-06, + "loss": 0.5273, + "step": 47294 + }, + { + "epoch": 1.21, + "learning_rate": 1.3516198092050951e-06, + "loss": 0.7217, + "step": 47295 + }, + { + "epoch": 1.21, + "learning_rate": 1.3515939055718213e-06, + "loss": 0.6841, + "step": 47296 + }, + { + "epoch": 1.21, + "learning_rate": 1.3515680016693483e-06, + "loss": 0.6958, + "step": 47297 + }, + { + "epoch": 1.21, + "learning_rate": 1.3515420974976956e-06, + "loss": 0.7178, + "step": 47298 + }, + { + "epoch": 1.21, + "learning_rate": 1.3515161930568834e-06, + "loss": 0.5942, + "step": 47299 + }, + { + "epoch": 1.21, + "learning_rate": 1.3514902883469314e-06, + "loss": 0.5842, + "step": 47300 + }, + { + "epoch": 1.21, + "learning_rate": 1.3514643833678594e-06, + "loss": 0.5293, + "step": 47301 + }, + { + "epoch": 1.21, + "learning_rate": 1.3514384781196878e-06, + "loss": 0.6846, + "step": 47302 + }, + { + "epoch": 1.21, + "learning_rate": 1.3514125726024352e-06, + "loss": 0.5327, + "step": 47303 + }, + { + "epoch": 1.21, + "learning_rate": 1.3513866668161224e-06, + "loss": 0.6719, + "step": 47304 + }, + { + "epoch": 1.21, + "learning_rate": 1.3513607607607688e-06, + "loss": 0.6758, + "step": 47305 + }, + { + "epoch": 1.21, + "learning_rate": 1.3513348544363949e-06, + "loss": 0.9121, + "step": 47306 + }, + { + "epoch": 1.21, + "learning_rate": 1.3513089478430197e-06, + "loss": 0.8076, + "step": 47307 + }, + { + "epoch": 1.21, + "learning_rate": 1.3512830409806638e-06, + "loss": 0.7549, + "step": 47308 + }, + { + "epoch": 1.21, + "learning_rate": 1.3512571338493461e-06, + "loss": 0.6963, + "step": 47309 + }, + { + "epoch": 1.21, + "learning_rate": 1.3512312264490872e-06, + "loss": 0.7178, + "step": 47310 + }, + { + "epoch": 1.21, + "learning_rate": 1.3512053187799065e-06, + "loss": 0.708, + "step": 47311 + }, + { + "epoch": 1.21, + "learning_rate": 1.3511794108418243e-06, + "loss": 0.5747, + "step": 47312 + }, + { + "epoch": 1.21, + "learning_rate": 1.3511535026348603e-06, + "loss": 0.7798, + "step": 47313 + }, + { + "epoch": 1.21, + "learning_rate": 1.3511275941590338e-06, + "loss": 0.6265, + "step": 47314 + }, + { + "epoch": 1.21, + "learning_rate": 1.351101685414365e-06, + "loss": 0.6758, + "step": 47315 + }, + { + "epoch": 1.21, + "learning_rate": 1.3510757764008745e-06, + "loss": 0.8125, + "step": 47316 + }, + { + "epoch": 1.21, + "learning_rate": 1.3510498671185808e-06, + "loss": 0.5757, + "step": 47317 + }, + { + "epoch": 1.21, + "learning_rate": 1.3510239575675045e-06, + "loss": 0.6353, + "step": 47318 + }, + { + "epoch": 1.21, + "learning_rate": 1.3509980477476653e-06, + "loss": 0.8291, + "step": 47319 + }, + { + "epoch": 1.21, + "learning_rate": 1.3509721376590828e-06, + "loss": 0.6719, + "step": 47320 + }, + { + "epoch": 1.21, + "learning_rate": 1.3509462273017772e-06, + "loss": 0.7861, + "step": 47321 + }, + { + "epoch": 1.21, + "learning_rate": 1.3509203166757685e-06, + "loss": 0.7109, + "step": 47322 + }, + { + "epoch": 1.21, + "learning_rate": 1.3508944057810762e-06, + "loss": 0.6245, + "step": 47323 + }, + { + "epoch": 1.21, + "learning_rate": 1.35086849461772e-06, + "loss": 0.7705, + "step": 47324 + }, + { + "epoch": 1.21, + "learning_rate": 1.35084258318572e-06, + "loss": 0.6025, + "step": 47325 + }, + { + "epoch": 1.21, + "learning_rate": 1.3508166714850958e-06, + "loss": 0.6895, + "step": 47326 + }, + { + "epoch": 1.21, + "learning_rate": 1.350790759515868e-06, + "loss": 0.7148, + "step": 47327 + }, + { + "epoch": 1.21, + "learning_rate": 1.350764847278055e-06, + "loss": 0.4709, + "step": 47328 + }, + { + "epoch": 1.21, + "learning_rate": 1.350738934771678e-06, + "loss": 0.6016, + "step": 47329 + }, + { + "epoch": 1.21, + "learning_rate": 1.3507130219967561e-06, + "loss": 0.6846, + "step": 47330 + }, + { + "epoch": 1.21, + "learning_rate": 1.3506871089533096e-06, + "loss": 0.8291, + "step": 47331 + }, + { + "epoch": 1.21, + "learning_rate": 1.350661195641358e-06, + "loss": 0.8213, + "step": 47332 + }, + { + "epoch": 1.21, + "learning_rate": 1.3506352820609213e-06, + "loss": 0.5308, + "step": 47333 + }, + { + "epoch": 1.21, + "learning_rate": 1.350609368212019e-06, + "loss": 0.6787, + "step": 47334 + }, + { + "epoch": 1.21, + "learning_rate": 1.3505834540946718e-06, + "loss": 0.5518, + "step": 47335 + }, + { + "epoch": 1.21, + "learning_rate": 1.3505575397088982e-06, + "loss": 0.8291, + "step": 47336 + }, + { + "epoch": 1.21, + "learning_rate": 1.3505316250547195e-06, + "loss": 0.8252, + "step": 47337 + }, + { + "epoch": 1.21, + "learning_rate": 1.3505057101321545e-06, + "loss": 0.7979, + "step": 47338 + }, + { + "epoch": 1.21, + "learning_rate": 1.3504797949412234e-06, + "loss": 0.7139, + "step": 47339 + }, + { + "epoch": 1.21, + "learning_rate": 1.3504538794819462e-06, + "loss": 0.6094, + "step": 47340 + }, + { + "epoch": 1.21, + "learning_rate": 1.3504279637543425e-06, + "loss": 0.6362, + "step": 47341 + }, + { + "epoch": 1.21, + "learning_rate": 1.3504020477584322e-06, + "loss": 0.7725, + "step": 47342 + }, + { + "epoch": 1.21, + "learning_rate": 1.350376131494235e-06, + "loss": 0.6641, + "step": 47343 + }, + { + "epoch": 1.21, + "learning_rate": 1.3503502149617712e-06, + "loss": 0.605, + "step": 47344 + }, + { + "epoch": 1.21, + "learning_rate": 1.35032429816106e-06, + "loss": 0.7783, + "step": 47345 + }, + { + "epoch": 1.21, + "learning_rate": 1.350298381092122e-06, + "loss": 0.8047, + "step": 47346 + }, + { + "epoch": 1.21, + "learning_rate": 1.3502724637549765e-06, + "loss": 0.6421, + "step": 47347 + }, + { + "epoch": 1.21, + "learning_rate": 1.3502465461496435e-06, + "loss": 0.6572, + "step": 47348 + }, + { + "epoch": 1.21, + "learning_rate": 1.3502206282761426e-06, + "loss": 0.6982, + "step": 47349 + }, + { + "epoch": 1.21, + "learning_rate": 1.350194710134494e-06, + "loss": 0.6909, + "step": 47350 + }, + { + "epoch": 1.21, + "learning_rate": 1.3501687917247173e-06, + "loss": 0.4829, + "step": 47351 + }, + { + "epoch": 1.21, + "learning_rate": 1.3501428730468329e-06, + "loss": 0.6855, + "step": 47352 + }, + { + "epoch": 1.21, + "learning_rate": 1.35011695410086e-06, + "loss": 0.5479, + "step": 47353 + }, + { + "epoch": 1.21, + "learning_rate": 1.3500910348868184e-06, + "loss": 0.5417, + "step": 47354 + }, + { + "epoch": 1.21, + "learning_rate": 1.3500651154047282e-06, + "loss": 0.6025, + "step": 47355 + }, + { + "epoch": 1.21, + "learning_rate": 1.3500391956546095e-06, + "loss": 0.7939, + "step": 47356 + }, + { + "epoch": 1.21, + "learning_rate": 1.350013275636482e-06, + "loss": 0.6924, + "step": 47357 + }, + { + "epoch": 1.21, + "learning_rate": 1.3499873553503652e-06, + "loss": 0.6489, + "step": 47358 + }, + { + "epoch": 1.21, + "learning_rate": 1.3499614347962788e-06, + "loss": 0.7266, + "step": 47359 + }, + { + "epoch": 1.21, + "learning_rate": 1.3499355139742437e-06, + "loss": 0.7314, + "step": 47360 + }, + { + "epoch": 1.21, + "learning_rate": 1.3499095928842785e-06, + "loss": 0.6699, + "step": 47361 + }, + { + "epoch": 1.21, + "learning_rate": 1.349883671526404e-06, + "loss": 0.6802, + "step": 47362 + }, + { + "epoch": 1.21, + "learning_rate": 1.3498577499006397e-06, + "loss": 0.667, + "step": 47363 + }, + { + "epoch": 1.21, + "learning_rate": 1.349831828007005e-06, + "loss": 0.6292, + "step": 47364 + }, + { + "epoch": 1.21, + "learning_rate": 1.3498059058455205e-06, + "loss": 0.5076, + "step": 47365 + }, + { + "epoch": 1.21, + "learning_rate": 1.3497799834162054e-06, + "loss": 0.5469, + "step": 47366 + }, + { + "epoch": 1.21, + "learning_rate": 1.3497540607190803e-06, + "loss": 0.5933, + "step": 47367 + }, + { + "epoch": 1.21, + "learning_rate": 1.3497281377541643e-06, + "loss": 0.6216, + "step": 47368 + }, + { + "epoch": 1.21, + "learning_rate": 1.3497022145214777e-06, + "loss": 0.5342, + "step": 47369 + }, + { + "epoch": 1.21, + "learning_rate": 1.3496762910210397e-06, + "loss": 0.6436, + "step": 47370 + }, + { + "epoch": 1.21, + "learning_rate": 1.3496503672528711e-06, + "loss": 0.7422, + "step": 47371 + }, + { + "epoch": 1.21, + "learning_rate": 1.3496244432169914e-06, + "loss": 0.7178, + "step": 47372 + }, + { + "epoch": 1.21, + "learning_rate": 1.3495985189134203e-06, + "loss": 0.4924, + "step": 47373 + }, + { + "epoch": 1.21, + "learning_rate": 1.3495725943421775e-06, + "loss": 0.6548, + "step": 47374 + }, + { + "epoch": 1.21, + "learning_rate": 1.3495466695032828e-06, + "loss": 0.6497, + "step": 47375 + }, + { + "epoch": 1.21, + "learning_rate": 1.3495207443967566e-06, + "loss": 0.6973, + "step": 47376 + }, + { + "epoch": 1.21, + "learning_rate": 1.3494948190226184e-06, + "loss": 0.7842, + "step": 47377 + }, + { + "epoch": 1.21, + "learning_rate": 1.3494688933808881e-06, + "loss": 0.6509, + "step": 47378 + }, + { + "epoch": 1.21, + "learning_rate": 1.3494429674715857e-06, + "loss": 0.585, + "step": 47379 + }, + { + "epoch": 1.21, + "learning_rate": 1.3494170412947307e-06, + "loss": 0.6729, + "step": 47380 + }, + { + "epoch": 1.21, + "learning_rate": 1.3493911148503433e-06, + "loss": 0.77, + "step": 47381 + }, + { + "epoch": 1.21, + "learning_rate": 1.349365188138443e-06, + "loss": 0.6904, + "step": 47382 + }, + { + "epoch": 1.21, + "learning_rate": 1.3493392611590497e-06, + "loss": 0.751, + "step": 47383 + }, + { + "epoch": 1.21, + "learning_rate": 1.3493133339121837e-06, + "loss": 0.6572, + "step": 47384 + }, + { + "epoch": 1.21, + "learning_rate": 1.349287406397864e-06, + "loss": 0.6416, + "step": 47385 + }, + { + "epoch": 1.21, + "learning_rate": 1.3492614786161116e-06, + "loss": 0.7417, + "step": 47386 + }, + { + "epoch": 1.21, + "learning_rate": 1.3492355505669458e-06, + "loss": 0.6621, + "step": 47387 + }, + { + "epoch": 1.21, + "learning_rate": 1.3492096222503862e-06, + "loss": 0.6787, + "step": 47388 + }, + { + "epoch": 1.21, + "learning_rate": 1.3491836936664527e-06, + "loss": 0.7705, + "step": 47389 + }, + { + "epoch": 1.21, + "learning_rate": 1.3491577648151653e-06, + "loss": 0.4617, + "step": 47390 + }, + { + "epoch": 1.21, + "learning_rate": 1.3491318356965437e-06, + "loss": 0.5, + "step": 47391 + }, + { + "epoch": 1.21, + "learning_rate": 1.3491059063106086e-06, + "loss": 0.5928, + "step": 47392 + }, + { + "epoch": 1.21, + "learning_rate": 1.3490799766573786e-06, + "loss": 0.7061, + "step": 47393 + }, + { + "epoch": 1.21, + "learning_rate": 1.3490540467368743e-06, + "loss": 0.561, + "step": 47394 + }, + { + "epoch": 1.21, + "learning_rate": 1.3490281165491152e-06, + "loss": 0.4934, + "step": 47395 + }, + { + "epoch": 1.21, + "learning_rate": 1.3490021860941215e-06, + "loss": 0.7354, + "step": 47396 + }, + { + "epoch": 1.21, + "learning_rate": 1.3489762553719128e-06, + "loss": 0.8457, + "step": 47397 + }, + { + "epoch": 1.21, + "learning_rate": 1.3489503243825092e-06, + "loss": 0.6133, + "step": 47398 + }, + { + "epoch": 1.21, + "learning_rate": 1.34892439312593e-06, + "loss": 0.6494, + "step": 47399 + }, + { + "epoch": 1.21, + "learning_rate": 1.3488984616021957e-06, + "loss": 0.7666, + "step": 47400 + }, + { + "epoch": 1.21, + "learning_rate": 1.3488725298113257e-06, + "loss": 0.7129, + "step": 47401 + }, + { + "epoch": 1.21, + "learning_rate": 1.3488465977533404e-06, + "loss": 0.5168, + "step": 47402 + }, + { + "epoch": 1.21, + "learning_rate": 1.348820665428259e-06, + "loss": 0.8516, + "step": 47403 + }, + { + "epoch": 1.21, + "learning_rate": 1.3487947328361018e-06, + "loss": 0.7012, + "step": 47404 + }, + { + "epoch": 1.22, + "learning_rate": 1.3487687999768885e-06, + "loss": 0.5303, + "step": 47405 + }, + { + "epoch": 1.22, + "learning_rate": 1.348742866850639e-06, + "loss": 0.7852, + "step": 47406 + }, + { + "epoch": 1.22, + "learning_rate": 1.3487169334573728e-06, + "loss": 0.7607, + "step": 47407 + }, + { + "epoch": 1.22, + "learning_rate": 1.3486909997971103e-06, + "loss": 0.6943, + "step": 47408 + }, + { + "epoch": 1.22, + "learning_rate": 1.3486650658698712e-06, + "loss": 0.5093, + "step": 47409 + }, + { + "epoch": 1.22, + "learning_rate": 1.348639131675675e-06, + "loss": 0.7402, + "step": 47410 + }, + { + "epoch": 1.22, + "learning_rate": 1.3486131972145422e-06, + "loss": 0.7354, + "step": 47411 + }, + { + "epoch": 1.22, + "learning_rate": 1.3485872624864922e-06, + "loss": 0.54, + "step": 47412 + }, + { + "epoch": 1.22, + "learning_rate": 1.3485613274915452e-06, + "loss": 0.7012, + "step": 47413 + }, + { + "epoch": 1.22, + "learning_rate": 1.3485353922297204e-06, + "loss": 0.7158, + "step": 47414 + }, + { + "epoch": 1.22, + "learning_rate": 1.3485094567010384e-06, + "loss": 0.6182, + "step": 47415 + }, + { + "epoch": 1.22, + "learning_rate": 1.3484835209055185e-06, + "loss": 0.6958, + "step": 47416 + }, + { + "epoch": 1.22, + "learning_rate": 1.3484575848431812e-06, + "loss": 0.6206, + "step": 47417 + }, + { + "epoch": 1.22, + "learning_rate": 1.3484316485140451e-06, + "loss": 0.7178, + "step": 47418 + }, + { + "epoch": 1.22, + "learning_rate": 1.3484057119181318e-06, + "loss": 0.6689, + "step": 47419 + }, + { + "epoch": 1.22, + "learning_rate": 1.3483797750554598e-06, + "loss": 0.5825, + "step": 47420 + }, + { + "epoch": 1.22, + "learning_rate": 1.3483538379260497e-06, + "loss": 0.4431, + "step": 47421 + }, + { + "epoch": 1.22, + "learning_rate": 1.3483279005299208e-06, + "loss": 0.6543, + "step": 47422 + }, + { + "epoch": 1.22, + "learning_rate": 1.3483019628670932e-06, + "loss": 0.645, + "step": 47423 + }, + { + "epoch": 1.22, + "learning_rate": 1.348276024937587e-06, + "loss": 0.7305, + "step": 47424 + }, + { + "epoch": 1.22, + "learning_rate": 1.348250086741422e-06, + "loss": 0.7383, + "step": 47425 + }, + { + "epoch": 1.22, + "learning_rate": 1.3482241482786177e-06, + "loss": 0.5647, + "step": 47426 + }, + { + "epoch": 1.22, + "learning_rate": 1.3481982095491942e-06, + "loss": 0.5081, + "step": 47427 + }, + { + "epoch": 1.22, + "learning_rate": 1.3481722705531712e-06, + "loss": 0.7222, + "step": 47428 + }, + { + "epoch": 1.22, + "learning_rate": 1.348146331290569e-06, + "loss": 0.5591, + "step": 47429 + }, + { + "epoch": 1.22, + "learning_rate": 1.348120391761407e-06, + "loss": 0.7471, + "step": 47430 + }, + { + "epoch": 1.22, + "learning_rate": 1.3480944519657054e-06, + "loss": 0.6846, + "step": 47431 + }, + { + "epoch": 1.22, + "learning_rate": 1.3480685119034835e-06, + "loss": 0.6313, + "step": 47432 + }, + { + "epoch": 1.22, + "learning_rate": 1.3480425715747618e-06, + "loss": 0.6963, + "step": 47433 + }, + { + "epoch": 1.22, + "learning_rate": 1.34801663097956e-06, + "loss": 0.6992, + "step": 47434 + }, + { + "epoch": 1.22, + "learning_rate": 1.3479906901178976e-06, + "loss": 0.3842, + "step": 47435 + }, + { + "epoch": 1.22, + "learning_rate": 1.3479647489897951e-06, + "loss": 0.6831, + "step": 47436 + }, + { + "epoch": 1.22, + "learning_rate": 1.3479388075952716e-06, + "loss": 0.7061, + "step": 47437 + }, + { + "epoch": 1.22, + "learning_rate": 1.3479128659343477e-06, + "loss": 0.7363, + "step": 47438 + }, + { + "epoch": 1.22, + "learning_rate": 1.3478869240070425e-06, + "loss": 0.6582, + "step": 47439 + }, + { + "epoch": 1.22, + "learning_rate": 1.3478609818133766e-06, + "loss": 0.79, + "step": 47440 + }, + { + "epoch": 1.22, + "learning_rate": 1.3478350393533694e-06, + "loss": 0.7803, + "step": 47441 + }, + { + "epoch": 1.22, + "learning_rate": 1.3478090966270411e-06, + "loss": 0.4846, + "step": 47442 + }, + { + "epoch": 1.22, + "learning_rate": 1.3477831536344112e-06, + "loss": 0.6958, + "step": 47443 + }, + { + "epoch": 1.22, + "learning_rate": 1.3477572103754997e-06, + "loss": 0.7529, + "step": 47444 + }, + { + "epoch": 1.22, + "learning_rate": 1.3477312668503266e-06, + "loss": 0.7246, + "step": 47445 + }, + { + "epoch": 1.22, + "learning_rate": 1.3477053230589117e-06, + "loss": 0.7002, + "step": 47446 + }, + { + "epoch": 1.22, + "learning_rate": 1.3476793790012749e-06, + "loss": 0.5586, + "step": 47447 + }, + { + "epoch": 1.22, + "learning_rate": 1.3476534346774357e-06, + "loss": 0.6602, + "step": 47448 + }, + { + "epoch": 1.22, + "learning_rate": 1.3476274900874142e-06, + "loss": 0.6519, + "step": 47449 + }, + { + "epoch": 1.22, + "learning_rate": 1.3476015452312307e-06, + "loss": 0.7324, + "step": 47450 + }, + { + "epoch": 1.22, + "learning_rate": 1.3475756001089045e-06, + "loss": 0.5347, + "step": 47451 + }, + { + "epoch": 1.22, + "learning_rate": 1.3475496547204554e-06, + "loss": 0.709, + "step": 47452 + }, + { + "epoch": 1.22, + "learning_rate": 1.347523709065904e-06, + "loss": 0.479, + "step": 47453 + }, + { + "epoch": 1.22, + "learning_rate": 1.3474977631452692e-06, + "loss": 0.6533, + "step": 47454 + }, + { + "epoch": 1.22, + "learning_rate": 1.3474718169585716e-06, + "loss": 0.5874, + "step": 47455 + }, + { + "epoch": 1.22, + "learning_rate": 1.3474458705058307e-06, + "loss": 0.5566, + "step": 47456 + }, + { + "epoch": 1.22, + "learning_rate": 1.3474199237870668e-06, + "loss": 0.5864, + "step": 47457 + }, + { + "epoch": 1.22, + "learning_rate": 1.3473939768022988e-06, + "loss": 0.5188, + "step": 47458 + }, + { + "epoch": 1.22, + "learning_rate": 1.3473680295515478e-06, + "loss": 0.6523, + "step": 47459 + }, + { + "epoch": 1.22, + "learning_rate": 1.3473420820348327e-06, + "loss": 0.6963, + "step": 47460 + }, + { + "epoch": 1.22, + "learning_rate": 1.347316134252174e-06, + "loss": 0.8037, + "step": 47461 + }, + { + "epoch": 1.22, + "learning_rate": 1.3472901862035913e-06, + "loss": 0.6313, + "step": 47462 + }, + { + "epoch": 1.22, + "learning_rate": 1.3472642378891044e-06, + "loss": 0.502, + "step": 47463 + }, + { + "epoch": 1.22, + "learning_rate": 1.3472382893087328e-06, + "loss": 0.8955, + "step": 47464 + }, + { + "epoch": 1.22, + "learning_rate": 1.3472123404624972e-06, + "loss": 0.7524, + "step": 47465 + }, + { + "epoch": 1.22, + "learning_rate": 1.3471863913504174e-06, + "loss": 0.667, + "step": 47466 + }, + { + "epoch": 1.22, + "learning_rate": 1.3471604419725126e-06, + "loss": 0.793, + "step": 47467 + }, + { + "epoch": 1.22, + "learning_rate": 1.3471344923288031e-06, + "loss": 0.5996, + "step": 47468 + }, + { + "epoch": 1.22, + "learning_rate": 1.3471085424193085e-06, + "loss": 0.5537, + "step": 47469 + }, + { + "epoch": 1.22, + "learning_rate": 1.3470825922440488e-06, + "loss": 0.7134, + "step": 47470 + }, + { + "epoch": 1.22, + "learning_rate": 1.3470566418030443e-06, + "loss": 0.6914, + "step": 47471 + }, + { + "epoch": 1.22, + "learning_rate": 1.3470306910963142e-06, + "loss": 0.5293, + "step": 47472 + }, + { + "epoch": 1.22, + "learning_rate": 1.3470047401238786e-06, + "loss": 0.6631, + "step": 47473 + }, + { + "epoch": 1.22, + "learning_rate": 1.3469787888857575e-06, + "loss": 0.5215, + "step": 47474 + }, + { + "epoch": 1.22, + "learning_rate": 1.3469528373819707e-06, + "loss": 0.6709, + "step": 47475 + }, + { + "epoch": 1.22, + "learning_rate": 1.3469268856125384e-06, + "loss": 0.5007, + "step": 47476 + }, + { + "epoch": 1.22, + "learning_rate": 1.3469009335774798e-06, + "loss": 0.6182, + "step": 47477 + }, + { + "epoch": 1.22, + "learning_rate": 1.3468749812768152e-06, + "loss": 0.7656, + "step": 47478 + }, + { + "epoch": 1.22, + "learning_rate": 1.3468490287105642e-06, + "loss": 0.6235, + "step": 47479 + }, + { + "epoch": 1.22, + "learning_rate": 1.346823075878747e-06, + "loss": 0.5405, + "step": 47480 + }, + { + "epoch": 1.22, + "learning_rate": 1.3467971227813836e-06, + "loss": 0.4829, + "step": 47481 + }, + { + "epoch": 1.22, + "learning_rate": 1.3467711694184932e-06, + "loss": 0.5459, + "step": 47482 + }, + { + "epoch": 1.22, + "learning_rate": 1.346745215790096e-06, + "loss": 0.6582, + "step": 47483 + }, + { + "epoch": 1.22, + "learning_rate": 1.3467192618962122e-06, + "loss": 0.7383, + "step": 47484 + }, + { + "epoch": 1.22, + "learning_rate": 1.3466933077368612e-06, + "loss": 0.5869, + "step": 47485 + }, + { + "epoch": 1.22, + "learning_rate": 1.3466673533120635e-06, + "loss": 0.5957, + "step": 47486 + }, + { + "epoch": 1.22, + "learning_rate": 1.3466413986218382e-06, + "loss": 0.5154, + "step": 47487 + }, + { + "epoch": 1.22, + "learning_rate": 1.3466154436662053e-06, + "loss": 0.8252, + "step": 47488 + }, + { + "epoch": 1.22, + "learning_rate": 1.346589488445185e-06, + "loss": 0.5625, + "step": 47489 + }, + { + "epoch": 1.22, + "learning_rate": 1.3465635329587973e-06, + "loss": 0.5713, + "step": 47490 + }, + { + "epoch": 1.22, + "learning_rate": 1.3465375772070616e-06, + "loss": 0.6357, + "step": 47491 + }, + { + "epoch": 1.22, + "learning_rate": 1.3465116211899982e-06, + "loss": 0.6089, + "step": 47492 + }, + { + "epoch": 1.22, + "learning_rate": 1.3464856649076267e-06, + "loss": 0.627, + "step": 47493 + }, + { + "epoch": 1.22, + "learning_rate": 1.3464597083599673e-06, + "loss": 0.5679, + "step": 47494 + }, + { + "epoch": 1.22, + "learning_rate": 1.3464337515470392e-06, + "loss": 0.584, + "step": 47495 + }, + { + "epoch": 1.22, + "learning_rate": 1.346407794468863e-06, + "loss": 0.646, + "step": 47496 + }, + { + "epoch": 1.22, + "learning_rate": 1.3463818371254583e-06, + "loss": 0.5332, + "step": 47497 + }, + { + "epoch": 1.22, + "learning_rate": 1.3463558795168448e-06, + "loss": 0.5571, + "step": 47498 + }, + { + "epoch": 1.22, + "learning_rate": 1.3463299216430426e-06, + "loss": 0.5625, + "step": 47499 + }, + { + "epoch": 1.22, + "learning_rate": 1.3463039635040714e-06, + "loss": 0.6455, + "step": 47500 + }, + { + "epoch": 1.22, + "learning_rate": 1.3462780050999514e-06, + "loss": 0.9385, + "step": 47501 + }, + { + "epoch": 1.22, + "learning_rate": 1.346252046430702e-06, + "loss": 0.5225, + "step": 47502 + }, + { + "epoch": 1.22, + "learning_rate": 1.3462260874963435e-06, + "loss": 0.686, + "step": 47503 + }, + { + "epoch": 1.22, + "learning_rate": 1.3462001282968956e-06, + "loss": 0.562, + "step": 47504 + }, + { + "epoch": 1.22, + "learning_rate": 1.3461741688323782e-06, + "loss": 0.6069, + "step": 47505 + }, + { + "epoch": 1.22, + "learning_rate": 1.3461482091028111e-06, + "loss": 0.4933, + "step": 47506 + }, + { + "epoch": 1.22, + "learning_rate": 1.3461222491082142e-06, + "loss": 0.6074, + "step": 47507 + }, + { + "epoch": 1.22, + "learning_rate": 1.3460962888486074e-06, + "loss": 0.8037, + "step": 47508 + }, + { + "epoch": 1.22, + "learning_rate": 1.3460703283240107e-06, + "loss": 0.583, + "step": 47509 + }, + { + "epoch": 1.22, + "learning_rate": 1.3460443675344437e-06, + "loss": 0.583, + "step": 47510 + }, + { + "epoch": 1.22, + "learning_rate": 1.3460184064799267e-06, + "loss": 0.8223, + "step": 47511 + }, + { + "epoch": 1.22, + "learning_rate": 1.345992445160479e-06, + "loss": 0.7114, + "step": 47512 + }, + { + "epoch": 1.22, + "learning_rate": 1.345966483576121e-06, + "loss": 0.5825, + "step": 47513 + }, + { + "epoch": 1.22, + "learning_rate": 1.3459405217268722e-06, + "loss": 0.6875, + "step": 47514 + }, + { + "epoch": 1.22, + "learning_rate": 1.3459145596127528e-06, + "loss": 0.7275, + "step": 47515 + }, + { + "epoch": 1.22, + "learning_rate": 1.3458885972337825e-06, + "loss": 0.7109, + "step": 47516 + }, + { + "epoch": 1.22, + "learning_rate": 1.345862634589981e-06, + "loss": 0.6162, + "step": 47517 + }, + { + "epoch": 1.22, + "learning_rate": 1.3458366716813688e-06, + "loss": 0.5308, + "step": 47518 + }, + { + "epoch": 1.22, + "learning_rate": 1.3458107085079648e-06, + "loss": 0.5967, + "step": 47519 + }, + { + "epoch": 1.22, + "learning_rate": 1.34578474506979e-06, + "loss": 0.8008, + "step": 47520 + }, + { + "epoch": 1.22, + "learning_rate": 1.3457587813668637e-06, + "loss": 0.7539, + "step": 47521 + }, + { + "epoch": 1.22, + "learning_rate": 1.3457328173992056e-06, + "loss": 0.6118, + "step": 47522 + }, + { + "epoch": 1.22, + "learning_rate": 1.3457068531668357e-06, + "loss": 0.7168, + "step": 47523 + }, + { + "epoch": 1.22, + "learning_rate": 1.345680888669774e-06, + "loss": 0.5405, + "step": 47524 + }, + { + "epoch": 1.22, + "learning_rate": 1.3456549239080402e-06, + "loss": 0.6267, + "step": 47525 + }, + { + "epoch": 1.22, + "learning_rate": 1.3456289588816547e-06, + "loss": 0.6157, + "step": 47526 + }, + { + "epoch": 1.22, + "learning_rate": 1.3456029935906365e-06, + "loss": 0.4988, + "step": 47527 + }, + { + "epoch": 1.22, + "learning_rate": 1.3455770280350066e-06, + "loss": 0.668, + "step": 47528 + }, + { + "epoch": 1.22, + "learning_rate": 1.3455510622147836e-06, + "loss": 0.5237, + "step": 47529 + }, + { + "epoch": 1.22, + "learning_rate": 1.3455250961299885e-06, + "loss": 0.312, + "step": 47530 + }, + { + "epoch": 1.22, + "learning_rate": 1.3454991297806406e-06, + "loss": 0.6851, + "step": 47531 + }, + { + "epoch": 1.22, + "learning_rate": 1.34547316316676e-06, + "loss": 0.7217, + "step": 47532 + }, + { + "epoch": 1.22, + "learning_rate": 1.3454471962883662e-06, + "loss": 0.6978, + "step": 47533 + }, + { + "epoch": 1.22, + "learning_rate": 1.3454212291454797e-06, + "loss": 0.7363, + "step": 47534 + }, + { + "epoch": 1.22, + "learning_rate": 1.3453952617381197e-06, + "loss": 0.7441, + "step": 47535 + }, + { + "epoch": 1.22, + "learning_rate": 1.3453692940663067e-06, + "loss": 0.5156, + "step": 47536 + }, + { + "epoch": 1.22, + "learning_rate": 1.3453433261300603e-06, + "loss": 0.5654, + "step": 47537 + }, + { + "epoch": 1.22, + "learning_rate": 1.3453173579294004e-06, + "loss": 0.5342, + "step": 47538 + }, + { + "epoch": 1.22, + "learning_rate": 1.3452913894643465e-06, + "loss": 0.5679, + "step": 47539 + }, + { + "epoch": 1.22, + "learning_rate": 1.3452654207349192e-06, + "loss": 0.7109, + "step": 47540 + }, + { + "epoch": 1.22, + "learning_rate": 1.3452394517411383e-06, + "loss": 0.5972, + "step": 47541 + }, + { + "epoch": 1.22, + "learning_rate": 1.3452134824830231e-06, + "loss": 0.7207, + "step": 47542 + }, + { + "epoch": 1.22, + "learning_rate": 1.3451875129605937e-06, + "loss": 0.7559, + "step": 47543 + }, + { + "epoch": 1.22, + "learning_rate": 1.34516154317387e-06, + "loss": 0.707, + "step": 47544 + }, + { + "epoch": 1.22, + "learning_rate": 1.3451355731228723e-06, + "loss": 0.4878, + "step": 47545 + }, + { + "epoch": 1.22, + "learning_rate": 1.3451096028076202e-06, + "loss": 0.6099, + "step": 47546 + }, + { + "epoch": 1.22, + "learning_rate": 1.3450836322281337e-06, + "loss": 0.5679, + "step": 47547 + }, + { + "epoch": 1.22, + "learning_rate": 1.345057661384432e-06, + "loss": 0.436, + "step": 47548 + }, + { + "epoch": 1.22, + "learning_rate": 1.3450316902765357e-06, + "loss": 0.7344, + "step": 47549 + }, + { + "epoch": 1.22, + "learning_rate": 1.3450057189044644e-06, + "loss": 0.7188, + "step": 47550 + }, + { + "epoch": 1.22, + "learning_rate": 1.3449797472682388e-06, + "loss": 0.666, + "step": 47551 + }, + { + "epoch": 1.22, + "learning_rate": 1.3449537753678772e-06, + "loss": 0.6406, + "step": 47552 + }, + { + "epoch": 1.22, + "learning_rate": 1.3449278032034008e-06, + "loss": 0.6956, + "step": 47553 + }, + { + "epoch": 1.22, + "learning_rate": 1.3449018307748288e-06, + "loss": 0.7803, + "step": 47554 + }, + { + "epoch": 1.22, + "learning_rate": 1.3448758580821814e-06, + "loss": 0.6191, + "step": 47555 + }, + { + "epoch": 1.22, + "learning_rate": 1.3448498851254786e-06, + "loss": 0.7021, + "step": 47556 + }, + { + "epoch": 1.22, + "learning_rate": 1.34482391190474e-06, + "loss": 0.6118, + "step": 47557 + }, + { + "epoch": 1.22, + "learning_rate": 1.3447979384199854e-06, + "loss": 0.6572, + "step": 47558 + }, + { + "epoch": 1.22, + "learning_rate": 1.344771964671235e-06, + "loss": 0.5342, + "step": 47559 + }, + { + "epoch": 1.22, + "learning_rate": 1.3447459906585086e-06, + "loss": 0.6274, + "step": 47560 + }, + { + "epoch": 1.22, + "learning_rate": 1.344720016381826e-06, + "loss": 0.6694, + "step": 47561 + }, + { + "epoch": 1.22, + "learning_rate": 1.3446940418412072e-06, + "loss": 0.6133, + "step": 47562 + }, + { + "epoch": 1.22, + "learning_rate": 1.3446680670366718e-06, + "loss": 0.6807, + "step": 47563 + }, + { + "epoch": 1.22, + "learning_rate": 1.34464209196824e-06, + "loss": 0.6001, + "step": 47564 + }, + { + "epoch": 1.22, + "learning_rate": 1.3446161166359318e-06, + "loss": 0.5615, + "step": 47565 + }, + { + "epoch": 1.22, + "learning_rate": 1.344590141039767e-06, + "loss": 0.6494, + "step": 47566 + }, + { + "epoch": 1.22, + "learning_rate": 1.344564165179765e-06, + "loss": 0.6357, + "step": 47567 + }, + { + "epoch": 1.22, + "learning_rate": 1.3445381890559463e-06, + "loss": 0.6963, + "step": 47568 + }, + { + "epoch": 1.22, + "learning_rate": 1.3445122126683304e-06, + "loss": 0.5884, + "step": 47569 + }, + { + "epoch": 1.22, + "learning_rate": 1.3444862360169373e-06, + "loss": 0.6133, + "step": 47570 + }, + { + "epoch": 1.22, + "learning_rate": 1.344460259101787e-06, + "loss": 0.627, + "step": 47571 + }, + { + "epoch": 1.22, + "learning_rate": 1.3444342819228995e-06, + "loss": 0.6982, + "step": 47572 + }, + { + "epoch": 1.22, + "learning_rate": 1.3444083044802942e-06, + "loss": 0.7334, + "step": 47573 + }, + { + "epoch": 1.22, + "learning_rate": 1.3443823267739916e-06, + "loss": 0.7324, + "step": 47574 + }, + { + "epoch": 1.22, + "learning_rate": 1.344356348804011e-06, + "loss": 0.6968, + "step": 47575 + }, + { + "epoch": 1.22, + "learning_rate": 1.3443303705703728e-06, + "loss": 0.6184, + "step": 47576 + }, + { + "epoch": 1.22, + "learning_rate": 1.3443043920730964e-06, + "loss": 0.5089, + "step": 47577 + }, + { + "epoch": 1.22, + "learning_rate": 1.3442784133122023e-06, + "loss": 0.5269, + "step": 47578 + }, + { + "epoch": 1.22, + "learning_rate": 1.3442524342877098e-06, + "loss": 0.7402, + "step": 47579 + }, + { + "epoch": 1.22, + "learning_rate": 1.344226454999639e-06, + "loss": 0.6934, + "step": 47580 + }, + { + "epoch": 1.22, + "learning_rate": 1.3442004754480102e-06, + "loss": 0.5771, + "step": 47581 + }, + { + "epoch": 1.22, + "learning_rate": 1.3441744956328426e-06, + "loss": 0.6812, + "step": 47582 + }, + { + "epoch": 1.22, + "learning_rate": 1.3441485155541566e-06, + "loss": 0.5767, + "step": 47583 + }, + { + "epoch": 1.22, + "learning_rate": 1.3441225352119718e-06, + "loss": 0.6836, + "step": 47584 + }, + { + "epoch": 1.22, + "learning_rate": 1.344096554606308e-06, + "loss": 0.5659, + "step": 47585 + }, + { + "epoch": 1.22, + "learning_rate": 1.3440705737371855e-06, + "loss": 0.6375, + "step": 47586 + }, + { + "epoch": 1.22, + "learning_rate": 1.3440445926046241e-06, + "loss": 0.5491, + "step": 47587 + }, + { + "epoch": 1.22, + "learning_rate": 1.3440186112086433e-06, + "loss": 0.7349, + "step": 47588 + }, + { + "epoch": 1.22, + "learning_rate": 1.3439926295492636e-06, + "loss": 0.5776, + "step": 47589 + }, + { + "epoch": 1.22, + "learning_rate": 1.343966647626504e-06, + "loss": 0.6504, + "step": 47590 + }, + { + "epoch": 1.22, + "learning_rate": 1.3439406654403857e-06, + "loss": 0.6406, + "step": 47591 + }, + { + "epoch": 1.22, + "learning_rate": 1.3439146829909276e-06, + "loss": 0.7329, + "step": 47592 + }, + { + "epoch": 1.22, + "learning_rate": 1.3438887002781496e-06, + "loss": 0.7695, + "step": 47593 + }, + { + "epoch": 1.22, + "learning_rate": 1.3438627173020718e-06, + "loss": 0.6089, + "step": 47594 + }, + { + "epoch": 1.22, + "learning_rate": 1.3438367340627143e-06, + "loss": 0.728, + "step": 47595 + }, + { + "epoch": 1.22, + "learning_rate": 1.3438107505600971e-06, + "loss": 0.7656, + "step": 47596 + }, + { + "epoch": 1.22, + "learning_rate": 1.3437847667942395e-06, + "loss": 0.7144, + "step": 47597 + }, + { + "epoch": 1.22, + "learning_rate": 1.3437587827651614e-06, + "loss": 0.6992, + "step": 47598 + }, + { + "epoch": 1.22, + "learning_rate": 1.3437327984728834e-06, + "loss": 0.5791, + "step": 47599 + }, + { + "epoch": 1.22, + "learning_rate": 1.343706813917425e-06, + "loss": 0.6855, + "step": 47600 + }, + { + "epoch": 1.22, + "learning_rate": 1.3436808290988061e-06, + "loss": 0.5059, + "step": 47601 + }, + { + "epoch": 1.22, + "learning_rate": 1.3436548440170466e-06, + "loss": 0.6821, + "step": 47602 + }, + { + "epoch": 1.22, + "learning_rate": 1.3436288586721664e-06, + "loss": 0.7002, + "step": 47603 + }, + { + "epoch": 1.22, + "learning_rate": 1.343602873064185e-06, + "loss": 0.7021, + "step": 47604 + }, + { + "epoch": 1.22, + "learning_rate": 1.3435768871931231e-06, + "loss": 0.5928, + "step": 47605 + }, + { + "epoch": 1.22, + "learning_rate": 1.3435509010590003e-06, + "loss": 0.7227, + "step": 47606 + }, + { + "epoch": 1.22, + "learning_rate": 1.3435249146618359e-06, + "loss": 0.666, + "step": 47607 + }, + { + "epoch": 1.22, + "learning_rate": 1.3434989280016505e-06, + "loss": 0.5293, + "step": 47608 + }, + { + "epoch": 1.22, + "learning_rate": 1.3434729410784638e-06, + "loss": 0.5815, + "step": 47609 + }, + { + "epoch": 1.22, + "learning_rate": 1.3434469538922955e-06, + "loss": 0.6631, + "step": 47610 + }, + { + "epoch": 1.22, + "learning_rate": 1.343420966443166e-06, + "loss": 0.6748, + "step": 47611 + }, + { + "epoch": 1.22, + "learning_rate": 1.3433949787310946e-06, + "loss": 0.7412, + "step": 47612 + }, + { + "epoch": 1.22, + "learning_rate": 1.3433689907561015e-06, + "loss": 0.5986, + "step": 47613 + }, + { + "epoch": 1.22, + "learning_rate": 1.3433430025182063e-06, + "loss": 0.6611, + "step": 47614 + }, + { + "epoch": 1.22, + "learning_rate": 1.3433170140174294e-06, + "loss": 0.7656, + "step": 47615 + }, + { + "epoch": 1.22, + "learning_rate": 1.3432910252537908e-06, + "loss": 0.6069, + "step": 47616 + }, + { + "epoch": 1.22, + "learning_rate": 1.3432650362273095e-06, + "loss": 0.6758, + "step": 47617 + }, + { + "epoch": 1.22, + "learning_rate": 1.343239046938006e-06, + "loss": 0.6387, + "step": 47618 + }, + { + "epoch": 1.22, + "learning_rate": 1.3432130573859003e-06, + "loss": 0.7314, + "step": 47619 + }, + { + "epoch": 1.22, + "learning_rate": 1.3431870675710121e-06, + "loss": 0.5708, + "step": 47620 + }, + { + "epoch": 1.22, + "learning_rate": 1.3431610774933618e-06, + "loss": 0.8008, + "step": 47621 + }, + { + "epoch": 1.22, + "learning_rate": 1.3431350871529682e-06, + "loss": 0.7729, + "step": 47622 + }, + { + "epoch": 1.22, + "learning_rate": 1.343109096549852e-06, + "loss": 0.625, + "step": 47623 + }, + { + "epoch": 1.22, + "learning_rate": 1.343083105684033e-06, + "loss": 0.5093, + "step": 47624 + }, + { + "epoch": 1.22, + "learning_rate": 1.343057114555531e-06, + "loss": 0.9043, + "step": 47625 + }, + { + "epoch": 1.22, + "learning_rate": 1.3430311231643661e-06, + "loss": 0.7188, + "step": 47626 + }, + { + "epoch": 1.22, + "learning_rate": 1.343005131510558e-06, + "loss": 0.6406, + "step": 47627 + }, + { + "epoch": 1.22, + "learning_rate": 1.3429791395941266e-06, + "loss": 0.5864, + "step": 47628 + }, + { + "epoch": 1.22, + "learning_rate": 1.3429531474150918e-06, + "loss": 0.5857, + "step": 47629 + }, + { + "epoch": 1.22, + "learning_rate": 1.3429271549734733e-06, + "loss": 0.7012, + "step": 47630 + }, + { + "epoch": 1.22, + "learning_rate": 1.3429011622692915e-06, + "loss": 0.5464, + "step": 47631 + }, + { + "epoch": 1.22, + "learning_rate": 1.342875169302566e-06, + "loss": 0.5054, + "step": 47632 + }, + { + "epoch": 1.22, + "learning_rate": 1.342849176073317e-06, + "loss": 0.6738, + "step": 47633 + }, + { + "epoch": 1.22, + "learning_rate": 1.3428231825815636e-06, + "loss": 0.6279, + "step": 47634 + }, + { + "epoch": 1.22, + "learning_rate": 1.3427971888273268e-06, + "loss": 0.6416, + "step": 47635 + }, + { + "epoch": 1.22, + "learning_rate": 1.3427711948106258e-06, + "loss": 0.7554, + "step": 47636 + }, + { + "epoch": 1.22, + "learning_rate": 1.3427452005314805e-06, + "loss": 0.834, + "step": 47637 + }, + { + "epoch": 1.22, + "learning_rate": 1.342719205989911e-06, + "loss": 0.7627, + "step": 47638 + }, + { + "epoch": 1.22, + "learning_rate": 1.3426932111859372e-06, + "loss": 0.5801, + "step": 47639 + }, + { + "epoch": 1.22, + "learning_rate": 1.3426672161195792e-06, + "loss": 0.6758, + "step": 47640 + }, + { + "epoch": 1.22, + "learning_rate": 1.3426412207908565e-06, + "loss": 0.6602, + "step": 47641 + }, + { + "epoch": 1.22, + "learning_rate": 1.3426152251997892e-06, + "loss": 0.5342, + "step": 47642 + }, + { + "epoch": 1.22, + "learning_rate": 1.342589229346397e-06, + "loss": 0.5525, + "step": 47643 + }, + { + "epoch": 1.22, + "learning_rate": 1.3425632332307e-06, + "loss": 0.5334, + "step": 47644 + }, + { + "epoch": 1.22, + "learning_rate": 1.3425372368527183e-06, + "loss": 0.6313, + "step": 47645 + }, + { + "epoch": 1.22, + "learning_rate": 1.3425112402124714e-06, + "loss": 0.5317, + "step": 47646 + }, + { + "epoch": 1.22, + "learning_rate": 1.3424852433099795e-06, + "loss": 0.7529, + "step": 47647 + }, + { + "epoch": 1.22, + "learning_rate": 1.3424592461452622e-06, + "loss": 0.8477, + "step": 47648 + }, + { + "epoch": 1.22, + "learning_rate": 1.3424332487183398e-06, + "loss": 0.644, + "step": 47649 + }, + { + "epoch": 1.22, + "learning_rate": 1.342407251029232e-06, + "loss": 0.5557, + "step": 47650 + }, + { + "epoch": 1.22, + "learning_rate": 1.3423812530779585e-06, + "loss": 0.6484, + "step": 47651 + }, + { + "epoch": 1.22, + "learning_rate": 1.3423552548645398e-06, + "loss": 0.7148, + "step": 47652 + }, + { + "epoch": 1.22, + "learning_rate": 1.342329256388995e-06, + "loss": 0.5259, + "step": 47653 + }, + { + "epoch": 1.22, + "learning_rate": 1.342303257651345e-06, + "loss": 0.5342, + "step": 47654 + }, + { + "epoch": 1.22, + "learning_rate": 1.3422772586516084e-06, + "loss": 0.5923, + "step": 47655 + }, + { + "epoch": 1.22, + "learning_rate": 1.3422512593898066e-06, + "loss": 0.7227, + "step": 47656 + }, + { + "epoch": 1.22, + "learning_rate": 1.3422252598659583e-06, + "loss": 0.6006, + "step": 47657 + }, + { + "epoch": 1.22, + "learning_rate": 1.342199260080084e-06, + "loss": 0.4448, + "step": 47658 + }, + { + "epoch": 1.22, + "learning_rate": 1.3421732600322032e-06, + "loss": 0.7148, + "step": 47659 + }, + { + "epoch": 1.22, + "learning_rate": 1.3421472597223362e-06, + "loss": 0.5291, + "step": 47660 + }, + { + "epoch": 1.22, + "learning_rate": 1.342121259150503e-06, + "loss": 0.6943, + "step": 47661 + }, + { + "epoch": 1.22, + "learning_rate": 1.3420952583167232e-06, + "loss": 0.71, + "step": 47662 + }, + { + "epoch": 1.22, + "learning_rate": 1.3420692572210163e-06, + "loss": 0.8076, + "step": 47663 + }, + { + "epoch": 1.22, + "learning_rate": 1.3420432558634035e-06, + "loss": 0.4449, + "step": 47664 + }, + { + "epoch": 1.22, + "learning_rate": 1.3420172542439033e-06, + "loss": 0.6392, + "step": 47665 + }, + { + "epoch": 1.22, + "learning_rate": 1.3419912523625365e-06, + "loss": 0.5742, + "step": 47666 + }, + { + "epoch": 1.22, + "learning_rate": 1.3419652502193226e-06, + "loss": 0.7617, + "step": 47667 + }, + { + "epoch": 1.22, + "learning_rate": 1.3419392478142818e-06, + "loss": 0.6548, + "step": 47668 + }, + { + "epoch": 1.22, + "learning_rate": 1.3419132451474336e-06, + "loss": 0.7246, + "step": 47669 + }, + { + "epoch": 1.22, + "learning_rate": 1.341887242218798e-06, + "loss": 0.6997, + "step": 47670 + }, + { + "epoch": 1.22, + "learning_rate": 1.3418612390283956e-06, + "loss": 0.8535, + "step": 47671 + }, + { + "epoch": 1.22, + "learning_rate": 1.3418352355762454e-06, + "loss": 0.4897, + "step": 47672 + }, + { + "epoch": 1.22, + "learning_rate": 1.341809231862368e-06, + "loss": 0.6572, + "step": 47673 + }, + { + "epoch": 1.22, + "learning_rate": 1.3417832278867828e-06, + "loss": 0.5825, + "step": 47674 + }, + { + "epoch": 1.22, + "learning_rate": 1.3417572236495097e-06, + "loss": 0.8179, + "step": 47675 + }, + { + "epoch": 1.22, + "learning_rate": 1.341731219150569e-06, + "loss": 0.6787, + "step": 47676 + }, + { + "epoch": 1.22, + "learning_rate": 1.3417052143899804e-06, + "loss": 0.7236, + "step": 47677 + }, + { + "epoch": 1.22, + "learning_rate": 1.3416792093677636e-06, + "loss": 0.5474, + "step": 47678 + }, + { + "epoch": 1.22, + "learning_rate": 1.341653204083939e-06, + "loss": 0.7578, + "step": 47679 + }, + { + "epoch": 1.22, + "learning_rate": 1.3416271985385262e-06, + "loss": 0.5967, + "step": 47680 + }, + { + "epoch": 1.22, + "learning_rate": 1.3416011927315454e-06, + "loss": 0.728, + "step": 47681 + }, + { + "epoch": 1.22, + "learning_rate": 1.3415751866630159e-06, + "loss": 0.7568, + "step": 47682 + }, + { + "epoch": 1.22, + "learning_rate": 1.3415491803329582e-06, + "loss": 0.6021, + "step": 47683 + }, + { + "epoch": 1.22, + "learning_rate": 1.3415231737413917e-06, + "loss": 0.668, + "step": 47684 + }, + { + "epoch": 1.22, + "learning_rate": 1.341497166888337e-06, + "loss": 0.6111, + "step": 47685 + }, + { + "epoch": 1.22, + "learning_rate": 1.3414711597738136e-06, + "loss": 0.7959, + "step": 47686 + }, + { + "epoch": 1.22, + "learning_rate": 1.341445152397841e-06, + "loss": 0.7217, + "step": 47687 + }, + { + "epoch": 1.22, + "learning_rate": 1.3414191447604399e-06, + "loss": 0.752, + "step": 47688 + }, + { + "epoch": 1.22, + "learning_rate": 1.3413931368616297e-06, + "loss": 0.8281, + "step": 47689 + }, + { + "epoch": 1.22, + "learning_rate": 1.3413671287014305e-06, + "loss": 0.5454, + "step": 47690 + }, + { + "epoch": 1.22, + "learning_rate": 1.3413411202798625e-06, + "loss": 0.6475, + "step": 47691 + }, + { + "epoch": 1.22, + "learning_rate": 1.341315111596945e-06, + "loss": 0.6047, + "step": 47692 + }, + { + "epoch": 1.22, + "learning_rate": 1.3412891026526984e-06, + "loss": 0.7559, + "step": 47693 + }, + { + "epoch": 1.22, + "learning_rate": 1.3412630934471422e-06, + "loss": 0.7744, + "step": 47694 + }, + { + "epoch": 1.22, + "learning_rate": 1.3412370839802968e-06, + "loss": 0.6208, + "step": 47695 + }, + { + "epoch": 1.22, + "learning_rate": 1.3412110742521815e-06, + "loss": 0.7451, + "step": 47696 + }, + { + "epoch": 1.22, + "learning_rate": 1.3411850642628165e-06, + "loss": 0.519, + "step": 47697 + }, + { + "epoch": 1.22, + "learning_rate": 1.3411590540122224e-06, + "loss": 0.4883, + "step": 47698 + }, + { + "epoch": 1.22, + "learning_rate": 1.341133043500418e-06, + "loss": 0.5957, + "step": 47699 + }, + { + "epoch": 1.22, + "learning_rate": 1.341107032727424e-06, + "loss": 0.7236, + "step": 47700 + }, + { + "epoch": 1.22, + "learning_rate": 1.3410810216932597e-06, + "loss": 0.7139, + "step": 47701 + }, + { + "epoch": 1.22, + "learning_rate": 1.3410550103979456e-06, + "loss": 0.8838, + "step": 47702 + }, + { + "epoch": 1.22, + "learning_rate": 1.3410289988415013e-06, + "loss": 0.2537, + "step": 47703 + }, + { + "epoch": 1.22, + "learning_rate": 1.3410029870239468e-06, + "loss": 0.6123, + "step": 47704 + }, + { + "epoch": 1.22, + "learning_rate": 1.340976974945302e-06, + "loss": 0.6182, + "step": 47705 + }, + { + "epoch": 1.22, + "learning_rate": 1.340950962605587e-06, + "loss": 0.6626, + "step": 47706 + }, + { + "epoch": 1.22, + "learning_rate": 1.3409249500048211e-06, + "loss": 0.6377, + "step": 47707 + }, + { + "epoch": 1.22, + "learning_rate": 1.340898937143025e-06, + "loss": 0.623, + "step": 47708 + }, + { + "epoch": 1.22, + "learning_rate": 1.3408729240202178e-06, + "loss": 0.6689, + "step": 47709 + }, + { + "epoch": 1.22, + "learning_rate": 1.3408469106364202e-06, + "loss": 0.6865, + "step": 47710 + }, + { + "epoch": 1.22, + "learning_rate": 1.3408208969916519e-06, + "loss": 0.7842, + "step": 47711 + }, + { + "epoch": 1.22, + "learning_rate": 1.3407948830859327e-06, + "loss": 0.6289, + "step": 47712 + }, + { + "epoch": 1.22, + "learning_rate": 1.3407688689192822e-06, + "loss": 0.6724, + "step": 47713 + }, + { + "epoch": 1.22, + "learning_rate": 1.340742854491721e-06, + "loss": 0.4648, + "step": 47714 + }, + { + "epoch": 1.22, + "learning_rate": 1.3407168398032684e-06, + "loss": 0.6606, + "step": 47715 + }, + { + "epoch": 1.22, + "learning_rate": 1.3406908248539446e-06, + "loss": 0.6611, + "step": 47716 + }, + { + "epoch": 1.22, + "learning_rate": 1.3406648096437699e-06, + "loss": 0.5879, + "step": 47717 + }, + { + "epoch": 1.22, + "learning_rate": 1.3406387941727632e-06, + "loss": 0.5698, + "step": 47718 + }, + { + "epoch": 1.22, + "learning_rate": 1.3406127784409456e-06, + "loss": 0.5986, + "step": 47719 + }, + { + "epoch": 1.22, + "learning_rate": 1.340586762448336e-06, + "loss": 0.877, + "step": 47720 + }, + { + "epoch": 1.22, + "learning_rate": 1.340560746194955e-06, + "loss": 0.7017, + "step": 47721 + }, + { + "epoch": 1.22, + "learning_rate": 1.3405347296808222e-06, + "loss": 0.6875, + "step": 47722 + }, + { + "epoch": 1.22, + "learning_rate": 1.340508712905958e-06, + "loss": 0.6699, + "step": 47723 + }, + { + "epoch": 1.22, + "learning_rate": 1.3404826958703813e-06, + "loss": 0.6611, + "step": 47724 + }, + { + "epoch": 1.22, + "learning_rate": 1.3404566785741133e-06, + "loss": 0.645, + "step": 47725 + }, + { + "epoch": 1.22, + "learning_rate": 1.340430661017173e-06, + "loss": 0.4539, + "step": 47726 + }, + { + "epoch": 1.22, + "learning_rate": 1.3404046431995806e-06, + "loss": 0.6646, + "step": 47727 + }, + { + "epoch": 1.22, + "learning_rate": 1.3403786251213559e-06, + "loss": 0.5815, + "step": 47728 + }, + { + "epoch": 1.22, + "learning_rate": 1.340352606782519e-06, + "loss": 0.6943, + "step": 47729 + }, + { + "epoch": 1.22, + "learning_rate": 1.3403265881830898e-06, + "loss": 0.7637, + "step": 47730 + }, + { + "epoch": 1.22, + "learning_rate": 1.3403005693230882e-06, + "loss": 0.6714, + "step": 47731 + }, + { + "epoch": 1.22, + "learning_rate": 1.340274550202534e-06, + "loss": 0.6318, + "step": 47732 + }, + { + "epoch": 1.22, + "learning_rate": 1.3402485308214472e-06, + "loss": 0.6216, + "step": 47733 + }, + { + "epoch": 1.22, + "learning_rate": 1.3402225111798477e-06, + "loss": 0.7744, + "step": 47734 + }, + { + "epoch": 1.22, + "learning_rate": 1.3401964912777556e-06, + "loss": 0.6172, + "step": 47735 + }, + { + "epoch": 1.22, + "learning_rate": 1.3401704711151908e-06, + "loss": 0.5933, + "step": 47736 + }, + { + "epoch": 1.22, + "learning_rate": 1.3401444506921733e-06, + "loss": 0.6289, + "step": 47737 + }, + { + "epoch": 1.22, + "learning_rate": 1.3401184300087224e-06, + "loss": 0.8311, + "step": 47738 + }, + { + "epoch": 1.22, + "learning_rate": 1.3400924090648586e-06, + "loss": 0.6553, + "step": 47739 + }, + { + "epoch": 1.22, + "learning_rate": 1.3400663878606016e-06, + "loss": 0.7178, + "step": 47740 + }, + { + "epoch": 1.22, + "learning_rate": 1.3400403663959714e-06, + "loss": 0.6294, + "step": 47741 + }, + { + "epoch": 1.22, + "learning_rate": 1.3400143446709882e-06, + "loss": 0.5378, + "step": 47742 + }, + { + "epoch": 1.22, + "learning_rate": 1.3399883226856711e-06, + "loss": 0.6885, + "step": 47743 + }, + { + "epoch": 1.22, + "learning_rate": 1.3399623004400412e-06, + "loss": 0.6785, + "step": 47744 + }, + { + "epoch": 1.22, + "learning_rate": 1.3399362779341175e-06, + "loss": 0.4929, + "step": 47745 + }, + { + "epoch": 1.22, + "learning_rate": 1.3399102551679202e-06, + "loss": 0.6641, + "step": 47746 + }, + { + "epoch": 1.22, + "learning_rate": 1.3398842321414692e-06, + "loss": 0.6865, + "step": 47747 + }, + { + "epoch": 1.22, + "learning_rate": 1.3398582088547847e-06, + "loss": 0.709, + "step": 47748 + }, + { + "epoch": 1.22, + "learning_rate": 1.339832185307886e-06, + "loss": 0.7686, + "step": 47749 + }, + { + "epoch": 1.22, + "learning_rate": 1.3398061615007941e-06, + "loss": 0.6821, + "step": 47750 + }, + { + "epoch": 1.22, + "learning_rate": 1.3397801374335277e-06, + "loss": 0.5898, + "step": 47751 + }, + { + "epoch": 1.22, + "learning_rate": 1.3397541131061073e-06, + "loss": 0.6846, + "step": 47752 + }, + { + "epoch": 1.22, + "learning_rate": 1.3397280885185528e-06, + "loss": 0.6475, + "step": 47753 + }, + { + "epoch": 1.22, + "learning_rate": 1.3397020636708844e-06, + "loss": 0.6616, + "step": 47754 + }, + { + "epoch": 1.22, + "learning_rate": 1.3396760385631217e-06, + "loss": 0.7393, + "step": 47755 + }, + { + "epoch": 1.22, + "learning_rate": 1.3396500131952846e-06, + "loss": 0.6953, + "step": 47756 + }, + { + "epoch": 1.22, + "learning_rate": 1.3396239875673928e-06, + "loss": 0.8008, + "step": 47757 + }, + { + "epoch": 1.22, + "learning_rate": 1.3395979616794667e-06, + "loss": 0.5342, + "step": 47758 + }, + { + "epoch": 1.22, + "learning_rate": 1.3395719355315263e-06, + "loss": 0.636, + "step": 47759 + }, + { + "epoch": 1.22, + "learning_rate": 1.339545909123591e-06, + "loss": 0.6372, + "step": 47760 + }, + { + "epoch": 1.22, + "learning_rate": 1.3395198824556812e-06, + "loss": 0.6172, + "step": 47761 + }, + { + "epoch": 1.22, + "learning_rate": 1.3394938555278166e-06, + "loss": 0.6509, + "step": 47762 + }, + { + "epoch": 1.22, + "learning_rate": 1.3394678283400168e-06, + "loss": 0.5488, + "step": 47763 + }, + { + "epoch": 1.22, + "learning_rate": 1.3394418008923027e-06, + "loss": 0.6865, + "step": 47764 + }, + { + "epoch": 1.22, + "learning_rate": 1.3394157731846934e-06, + "loss": 0.8228, + "step": 47765 + }, + { + "epoch": 1.22, + "learning_rate": 1.339389745217209e-06, + "loss": 0.6182, + "step": 47766 + }, + { + "epoch": 1.22, + "learning_rate": 1.3393637169898695e-06, + "loss": 0.5708, + "step": 47767 + }, + { + "epoch": 1.22, + "learning_rate": 1.3393376885026945e-06, + "loss": 0.6543, + "step": 47768 + }, + { + "epoch": 1.22, + "learning_rate": 1.3393116597557047e-06, + "loss": 0.7314, + "step": 47769 + }, + { + "epoch": 1.22, + "learning_rate": 1.3392856307489196e-06, + "loss": 0.5785, + "step": 47770 + }, + { + "epoch": 1.22, + "learning_rate": 1.3392596014823587e-06, + "loss": 0.6763, + "step": 47771 + }, + { + "epoch": 1.22, + "learning_rate": 1.3392335719560424e-06, + "loss": 0.833, + "step": 47772 + }, + { + "epoch": 1.22, + "learning_rate": 1.3392075421699907e-06, + "loss": 0.6377, + "step": 47773 + }, + { + "epoch": 1.22, + "learning_rate": 1.3391815121242232e-06, + "loss": 0.5469, + "step": 47774 + }, + { + "epoch": 1.22, + "learning_rate": 1.3391554818187605e-06, + "loss": 0.6685, + "step": 47775 + }, + { + "epoch": 1.22, + "learning_rate": 1.3391294512536216e-06, + "loss": 0.6206, + "step": 47776 + }, + { + "epoch": 1.22, + "learning_rate": 1.3391034204288269e-06, + "loss": 0.6123, + "step": 47777 + }, + { + "epoch": 1.22, + "learning_rate": 1.3390773893443962e-06, + "loss": 0.7246, + "step": 47778 + }, + { + "epoch": 1.22, + "learning_rate": 1.3390513580003498e-06, + "loss": 0.5771, + "step": 47779 + }, + { + "epoch": 1.22, + "learning_rate": 1.3390253263967072e-06, + "loss": 0.8062, + "step": 47780 + }, + { + "epoch": 1.22, + "learning_rate": 1.3389992945334887e-06, + "loss": 0.604, + "step": 47781 + }, + { + "epoch": 1.22, + "learning_rate": 1.3389732624107138e-06, + "loss": 0.5923, + "step": 47782 + }, + { + "epoch": 1.22, + "learning_rate": 1.3389472300284027e-06, + "loss": 0.7383, + "step": 47783 + }, + { + "epoch": 1.22, + "learning_rate": 1.3389211973865752e-06, + "loss": 0.7803, + "step": 47784 + }, + { + "epoch": 1.22, + "learning_rate": 1.3388951644852514e-06, + "loss": 0.6768, + "step": 47785 + }, + { + "epoch": 1.22, + "learning_rate": 1.3388691313244515e-06, + "loss": 0.625, + "step": 47786 + }, + { + "epoch": 1.22, + "learning_rate": 1.3388430979041947e-06, + "loss": 0.6768, + "step": 47787 + }, + { + "epoch": 1.22, + "learning_rate": 1.3388170642245013e-06, + "loss": 0.7646, + "step": 47788 + }, + { + "epoch": 1.22, + "learning_rate": 1.3387910302853913e-06, + "loss": 0.8066, + "step": 47789 + }, + { + "epoch": 1.22, + "learning_rate": 1.338764996086885e-06, + "loss": 0.6299, + "step": 47790 + }, + { + "epoch": 1.22, + "learning_rate": 1.3387389616290016e-06, + "loss": 0.6318, + "step": 47791 + }, + { + "epoch": 1.22, + "learning_rate": 1.3387129269117612e-06, + "loss": 0.7783, + "step": 47792 + }, + { + "epoch": 1.22, + "learning_rate": 1.3386868919351839e-06, + "loss": 0.6475, + "step": 47793 + }, + { + "epoch": 1.22, + "learning_rate": 1.33866085669929e-06, + "loss": 0.5759, + "step": 47794 + }, + { + "epoch": 1.23, + "learning_rate": 1.3386348212040987e-06, + "loss": 0.7578, + "step": 47795 + }, + { + "epoch": 1.23, + "learning_rate": 1.3386087854496305e-06, + "loss": 0.6504, + "step": 47796 + }, + { + "epoch": 1.23, + "learning_rate": 1.3385827494359047e-06, + "loss": 0.6108, + "step": 47797 + }, + { + "epoch": 1.23, + "learning_rate": 1.338556713162942e-06, + "loss": 0.7148, + "step": 47798 + }, + { + "epoch": 1.23, + "learning_rate": 1.338530676630762e-06, + "loss": 0.6206, + "step": 47799 + }, + { + "epoch": 1.23, + "learning_rate": 1.3385046398393848e-06, + "loss": 0.5034, + "step": 47800 + }, + { + "epoch": 1.23, + "learning_rate": 1.3384786027888298e-06, + "loss": 0.6201, + "step": 47801 + }, + { + "epoch": 1.23, + "learning_rate": 1.3384525654791174e-06, + "loss": 0.7188, + "step": 47802 + }, + { + "epoch": 1.23, + "learning_rate": 1.3384265279102675e-06, + "loss": 0.5347, + "step": 47803 + }, + { + "epoch": 1.23, + "learning_rate": 1.3384004900823e-06, + "loss": 0.5781, + "step": 47804 + }, + { + "epoch": 1.23, + "learning_rate": 1.3383744519952346e-06, + "loss": 0.6724, + "step": 47805 + }, + { + "epoch": 1.23, + "learning_rate": 1.3383484136490916e-06, + "loss": 0.5522, + "step": 47806 + }, + { + "epoch": 1.23, + "learning_rate": 1.3383223750438908e-06, + "loss": 0.7529, + "step": 47807 + }, + { + "epoch": 1.23, + "learning_rate": 1.3382963361796519e-06, + "loss": 0.7588, + "step": 47808 + }, + { + "epoch": 1.23, + "learning_rate": 1.3382702970563953e-06, + "loss": 0.7715, + "step": 47809 + }, + { + "epoch": 1.23, + "learning_rate": 1.3382442576741407e-06, + "loss": 0.6562, + "step": 47810 + }, + { + "epoch": 1.23, + "learning_rate": 1.338218218032908e-06, + "loss": 0.646, + "step": 47811 + }, + { + "epoch": 1.23, + "learning_rate": 1.338192178132717e-06, + "loss": 0.8008, + "step": 47812 + }, + { + "epoch": 1.23, + "learning_rate": 1.338166137973588e-06, + "loss": 0.5906, + "step": 47813 + }, + { + "epoch": 1.23, + "learning_rate": 1.3381400975555406e-06, + "loss": 0.7383, + "step": 47814 + }, + { + "epoch": 1.23, + "learning_rate": 1.3381140568785952e-06, + "loss": 0.707, + "step": 47815 + }, + { + "epoch": 1.23, + "learning_rate": 1.338088015942771e-06, + "loss": 0.5522, + "step": 47816 + }, + { + "epoch": 1.23, + "learning_rate": 1.3380619747480883e-06, + "loss": 0.5986, + "step": 47817 + }, + { + "epoch": 1.23, + "learning_rate": 1.3380359332945673e-06, + "loss": 0.604, + "step": 47818 + }, + { + "epoch": 1.23, + "learning_rate": 1.3380098915822277e-06, + "loss": 0.7432, + "step": 47819 + }, + { + "epoch": 1.23, + "learning_rate": 1.3379838496110895e-06, + "loss": 0.6296, + "step": 47820 + }, + { + "epoch": 1.23, + "learning_rate": 1.3379578073811728e-06, + "loss": 0.7471, + "step": 47821 + }, + { + "epoch": 1.23, + "learning_rate": 1.3379317648924968e-06, + "loss": 0.6396, + "step": 47822 + }, + { + "epoch": 1.23, + "learning_rate": 1.3379057221450825e-06, + "loss": 0.4263, + "step": 47823 + }, + { + "epoch": 1.23, + "learning_rate": 1.337879679138949e-06, + "loss": 0.5232, + "step": 47824 + }, + { + "epoch": 1.23, + "learning_rate": 1.3378536358741168e-06, + "loss": 0.6504, + "step": 47825 + }, + { + "epoch": 1.23, + "learning_rate": 1.3378275923506054e-06, + "loss": 0.7153, + "step": 47826 + }, + { + "epoch": 1.23, + "learning_rate": 1.3378015485684354e-06, + "loss": 0.5132, + "step": 47827 + }, + { + "epoch": 1.23, + "learning_rate": 1.3377755045276255e-06, + "loss": 0.6807, + "step": 47828 + }, + { + "epoch": 1.23, + "learning_rate": 1.337749460228197e-06, + "loss": 0.6973, + "step": 47829 + }, + { + "epoch": 1.23, + "learning_rate": 1.3377234156701693e-06, + "loss": 0.4907, + "step": 47830 + }, + { + "epoch": 1.23, + "learning_rate": 1.337697370853562e-06, + "loss": 0.6616, + "step": 47831 + }, + { + "epoch": 1.23, + "learning_rate": 1.3376713257783955e-06, + "loss": 0.748, + "step": 47832 + }, + { + "epoch": 1.23, + "learning_rate": 1.3376452804446894e-06, + "loss": 0.5129, + "step": 47833 + }, + { + "epoch": 1.23, + "learning_rate": 1.3376192348524641e-06, + "loss": 0.7119, + "step": 47834 + }, + { + "epoch": 1.23, + "learning_rate": 1.3375931890017393e-06, + "loss": 0.708, + "step": 47835 + }, + { + "epoch": 1.23, + "learning_rate": 1.3375671428925349e-06, + "loss": 0.6221, + "step": 47836 + }, + { + "epoch": 1.23, + "learning_rate": 1.3375410965248706e-06, + "loss": 0.6533, + "step": 47837 + }, + { + "epoch": 1.23, + "learning_rate": 1.337515049898767e-06, + "loss": 0.6533, + "step": 47838 + }, + { + "epoch": 1.23, + "learning_rate": 1.3374890030142432e-06, + "loss": 0.7876, + "step": 47839 + }, + { + "epoch": 1.23, + "learning_rate": 1.33746295587132e-06, + "loss": 0.6914, + "step": 47840 + }, + { + "epoch": 1.23, + "learning_rate": 1.3374369084700166e-06, + "loss": 0.7705, + "step": 47841 + }, + { + "epoch": 1.23, + "learning_rate": 1.3374108608103536e-06, + "loss": 0.5605, + "step": 47842 + }, + { + "epoch": 1.23, + "learning_rate": 1.3373848128923501e-06, + "loss": 0.7139, + "step": 47843 + }, + { + "epoch": 1.23, + "learning_rate": 1.3373587647160273e-06, + "loss": 0.7754, + "step": 47844 + }, + { + "epoch": 1.23, + "learning_rate": 1.3373327162814038e-06, + "loss": 0.5366, + "step": 47845 + }, + { + "epoch": 1.23, + "learning_rate": 1.3373066675885005e-06, + "loss": 0.6177, + "step": 47846 + }, + { + "epoch": 1.23, + "learning_rate": 1.3372806186373367e-06, + "loss": 0.8486, + "step": 47847 + }, + { + "epoch": 1.23, + "learning_rate": 1.3372545694279328e-06, + "loss": 0.7109, + "step": 47848 + }, + { + "epoch": 1.23, + "learning_rate": 1.3372285199603087e-06, + "loss": 0.5869, + "step": 47849 + }, + { + "epoch": 1.23, + "learning_rate": 1.3372024702344839e-06, + "loss": 0.6489, + "step": 47850 + }, + { + "epoch": 1.23, + "learning_rate": 1.337176420250479e-06, + "loss": 0.8379, + "step": 47851 + }, + { + "epoch": 1.23, + "learning_rate": 1.3371503700083133e-06, + "loss": 0.6455, + "step": 47852 + }, + { + "epoch": 1.23, + "learning_rate": 1.3371243195080073e-06, + "loss": 0.7842, + "step": 47853 + }, + { + "epoch": 1.23, + "learning_rate": 1.337098268749581e-06, + "loss": 0.5139, + "step": 47854 + }, + { + "epoch": 1.23, + "learning_rate": 1.3370722177330536e-06, + "loss": 0.7227, + "step": 47855 + }, + { + "epoch": 1.23, + "learning_rate": 1.3370461664584456e-06, + "loss": 0.4407, + "step": 47856 + }, + { + "epoch": 1.23, + "learning_rate": 1.3370201149257767e-06, + "loss": 0.5625, + "step": 47857 + }, + { + "epoch": 1.23, + "learning_rate": 1.336994063135067e-06, + "loss": 0.5251, + "step": 47858 + }, + { + "epoch": 1.23, + "learning_rate": 1.3369680110863368e-06, + "loss": 0.6138, + "step": 47859 + }, + { + "epoch": 1.23, + "learning_rate": 1.3369419587796055e-06, + "loss": 0.752, + "step": 47860 + }, + { + "epoch": 1.23, + "learning_rate": 1.3369159062148933e-06, + "loss": 0.7461, + "step": 47861 + }, + { + "epoch": 1.23, + "learning_rate": 1.3368898533922199e-06, + "loss": 0.6758, + "step": 47862 + }, + { + "epoch": 1.23, + "learning_rate": 1.3368638003116057e-06, + "loss": 0.6768, + "step": 47863 + }, + { + "epoch": 1.23, + "learning_rate": 1.3368377469730702e-06, + "loss": 0.6431, + "step": 47864 + }, + { + "epoch": 1.23, + "learning_rate": 1.3368116933766339e-06, + "loss": 0.7227, + "step": 47865 + }, + { + "epoch": 1.23, + "learning_rate": 1.3367856395223158e-06, + "loss": 0.666, + "step": 47866 + }, + { + "epoch": 1.23, + "learning_rate": 1.3367595854101366e-06, + "loss": 0.834, + "step": 47867 + }, + { + "epoch": 1.23, + "learning_rate": 1.336733531040116e-06, + "loss": 0.6475, + "step": 47868 + }, + { + "epoch": 1.23, + "learning_rate": 1.336707476412274e-06, + "loss": 0.7957, + "step": 47869 + }, + { + "epoch": 1.23, + "learning_rate": 1.336681421526631e-06, + "loss": 0.6465, + "step": 47870 + }, + { + "epoch": 1.23, + "learning_rate": 1.3366553663832063e-06, + "loss": 0.6123, + "step": 47871 + }, + { + "epoch": 1.23, + "learning_rate": 1.3366293109820198e-06, + "loss": 0.46, + "step": 47872 + }, + { + "epoch": 1.23, + "learning_rate": 1.336603255323092e-06, + "loss": 0.7617, + "step": 47873 + }, + { + "epoch": 1.23, + "learning_rate": 1.3365771994064422e-06, + "loss": 0.5649, + "step": 47874 + }, + { + "epoch": 1.23, + "learning_rate": 1.336551143232091e-06, + "loss": 0.8428, + "step": 47875 + }, + { + "epoch": 1.23, + "learning_rate": 1.3365250868000582e-06, + "loss": 0.6265, + "step": 47876 + }, + { + "epoch": 1.23, + "learning_rate": 1.3364990301103634e-06, + "loss": 0.7168, + "step": 47877 + }, + { + "epoch": 1.23, + "learning_rate": 1.3364729731630269e-06, + "loss": 0.6084, + "step": 47878 + }, + { + "epoch": 1.23, + "learning_rate": 1.3364469159580682e-06, + "loss": 0.79, + "step": 47879 + }, + { + "epoch": 1.23, + "learning_rate": 1.336420858495508e-06, + "loss": 0.6514, + "step": 47880 + }, + { + "epoch": 1.23, + "learning_rate": 1.3363948007753655e-06, + "loss": 0.6855, + "step": 47881 + }, + { + "epoch": 1.23, + "learning_rate": 1.3363687427976612e-06, + "loss": 0.6479, + "step": 47882 + }, + { + "epoch": 1.23, + "learning_rate": 1.3363426845624147e-06, + "loss": 0.6281, + "step": 47883 + }, + { + "epoch": 1.23, + "learning_rate": 1.3363166260696462e-06, + "loss": 0.5923, + "step": 47884 + }, + { + "epoch": 1.23, + "learning_rate": 1.3362905673193755e-06, + "loss": 0.9531, + "step": 47885 + }, + { + "epoch": 1.23, + "learning_rate": 1.3362645083116224e-06, + "loss": 0.7344, + "step": 47886 + }, + { + "epoch": 1.23, + "learning_rate": 1.3362384490464069e-06, + "loss": 0.6401, + "step": 47887 + }, + { + "epoch": 1.23, + "learning_rate": 1.3362123895237494e-06, + "loss": 0.6982, + "step": 47888 + }, + { + "epoch": 1.23, + "learning_rate": 1.3361863297436694e-06, + "loss": 0.7588, + "step": 47889 + }, + { + "epoch": 1.23, + "learning_rate": 1.336160269706187e-06, + "loss": 0.7295, + "step": 47890 + }, + { + "epoch": 1.23, + "learning_rate": 1.336134209411322e-06, + "loss": 0.7285, + "step": 47891 + }, + { + "epoch": 1.23, + "learning_rate": 1.3361081488590948e-06, + "loss": 0.5039, + "step": 47892 + }, + { + "epoch": 1.23, + "learning_rate": 1.3360820880495248e-06, + "loss": 0.6147, + "step": 47893 + }, + { + "epoch": 1.23, + "learning_rate": 1.3360560269826325e-06, + "loss": 0.8154, + "step": 47894 + }, + { + "epoch": 1.23, + "learning_rate": 1.3360299656584372e-06, + "loss": 0.7168, + "step": 47895 + }, + { + "epoch": 1.23, + "learning_rate": 1.3360039040769593e-06, + "loss": 0.5345, + "step": 47896 + }, + { + "epoch": 1.23, + "learning_rate": 1.3359778422382188e-06, + "loss": 0.6426, + "step": 47897 + }, + { + "epoch": 1.23, + "learning_rate": 1.3359517801422352e-06, + "loss": 0.4607, + "step": 47898 + }, + { + "epoch": 1.23, + "learning_rate": 1.335925717789029e-06, + "loss": 0.7705, + "step": 47899 + }, + { + "epoch": 1.23, + "learning_rate": 1.33589965517862e-06, + "loss": 0.8408, + "step": 47900 + }, + { + "epoch": 1.23, + "learning_rate": 1.335873592311028e-06, + "loss": 0.2503, + "step": 47901 + }, + { + "epoch": 1.23, + "learning_rate": 1.335847529186273e-06, + "loss": 0.5664, + "step": 47902 + }, + { + "epoch": 1.23, + "learning_rate": 1.3358214658043751e-06, + "loss": 0.7061, + "step": 47903 + }, + { + "epoch": 1.23, + "learning_rate": 1.335795402165354e-06, + "loss": 0.6738, + "step": 47904 + }, + { + "epoch": 1.23, + "learning_rate": 1.3357693382692302e-06, + "loss": 0.8096, + "step": 47905 + }, + { + "epoch": 1.23, + "learning_rate": 1.3357432741160226e-06, + "loss": 0.7402, + "step": 47906 + }, + { + "epoch": 1.23, + "learning_rate": 1.3357172097057521e-06, + "loss": 0.6748, + "step": 47907 + }, + { + "epoch": 1.23, + "learning_rate": 1.3356911450384383e-06, + "loss": 0.7554, + "step": 47908 + }, + { + "epoch": 1.23, + "learning_rate": 1.3356650801141014e-06, + "loss": 0.6729, + "step": 47909 + }, + { + "epoch": 1.23, + "learning_rate": 1.3356390149327612e-06, + "loss": 0.5745, + "step": 47910 + }, + { + "epoch": 1.23, + "learning_rate": 1.3356129494944377e-06, + "loss": 0.6904, + "step": 47911 + }, + { + "epoch": 1.23, + "learning_rate": 1.3355868837991503e-06, + "loss": 0.6489, + "step": 47912 + }, + { + "epoch": 1.23, + "learning_rate": 1.33556081784692e-06, + "loss": 0.6699, + "step": 47913 + }, + { + "epoch": 1.23, + "learning_rate": 1.3355347516377658e-06, + "loss": 0.6787, + "step": 47914 + }, + { + "epoch": 1.23, + "learning_rate": 1.3355086851717084e-06, + "loss": 0.646, + "step": 47915 + }, + { + "epoch": 1.23, + "learning_rate": 1.3354826184487674e-06, + "loss": 0.71, + "step": 47916 + }, + { + "epoch": 1.23, + "learning_rate": 1.3354565514689625e-06, + "loss": 0.7031, + "step": 47917 + }, + { + "epoch": 1.23, + "learning_rate": 1.3354304842323142e-06, + "loss": 0.7036, + "step": 47918 + }, + { + "epoch": 1.23, + "learning_rate": 1.3354044167388424e-06, + "loss": 0.7109, + "step": 47919 + }, + { + "epoch": 1.23, + "learning_rate": 1.3353783489885664e-06, + "loss": 0.6836, + "step": 47920 + }, + { + "epoch": 1.23, + "learning_rate": 1.3353522809815067e-06, + "loss": 0.7544, + "step": 47921 + }, + { + "epoch": 1.23, + "learning_rate": 1.3353262127176833e-06, + "loss": 0.6299, + "step": 47922 + }, + { + "epoch": 1.23, + "learning_rate": 1.335300144197116e-06, + "loss": 0.7324, + "step": 47923 + }, + { + "epoch": 1.23, + "learning_rate": 1.335274075419825e-06, + "loss": 0.6479, + "step": 47924 + }, + { + "epoch": 1.23, + "learning_rate": 1.3352480063858299e-06, + "loss": 0.5059, + "step": 47925 + }, + { + "epoch": 1.23, + "learning_rate": 1.3352219370951508e-06, + "loss": 0.6582, + "step": 47926 + }, + { + "epoch": 1.23, + "learning_rate": 1.3351958675478074e-06, + "loss": 0.7197, + "step": 47927 + }, + { + "epoch": 1.23, + "learning_rate": 1.3351697977438203e-06, + "loss": 0.7354, + "step": 47928 + }, + { + "epoch": 1.23, + "learning_rate": 1.335143727683209e-06, + "loss": 0.5642, + "step": 47929 + }, + { + "epoch": 1.23, + "learning_rate": 1.335117657365994e-06, + "loss": 0.5176, + "step": 47930 + }, + { + "epoch": 1.23, + "learning_rate": 1.335091586792194e-06, + "loss": 0.7197, + "step": 47931 + }, + { + "epoch": 1.23, + "learning_rate": 1.3350655159618304e-06, + "loss": 0.5596, + "step": 47932 + }, + { + "epoch": 1.23, + "learning_rate": 1.335039444874922e-06, + "loss": 0.7314, + "step": 47933 + }, + { + "epoch": 1.23, + "learning_rate": 1.3350133735314897e-06, + "loss": 0.5508, + "step": 47934 + }, + { + "epoch": 1.23, + "learning_rate": 1.3349873019315532e-06, + "loss": 0.5557, + "step": 47935 + }, + { + "epoch": 1.23, + "learning_rate": 1.3349612300751321e-06, + "loss": 0.7422, + "step": 47936 + }, + { + "epoch": 1.23, + "learning_rate": 1.3349351579622464e-06, + "loss": 0.5918, + "step": 47937 + }, + { + "epoch": 1.23, + "learning_rate": 1.3349090855929167e-06, + "loss": 0.6704, + "step": 47938 + }, + { + "epoch": 1.23, + "learning_rate": 1.334883012967162e-06, + "loss": 0.7134, + "step": 47939 + }, + { + "epoch": 1.23, + "learning_rate": 1.334856940085003e-06, + "loss": 0.7002, + "step": 47940 + }, + { + "epoch": 1.23, + "learning_rate": 1.3348308669464596e-06, + "loss": 0.4358, + "step": 47941 + }, + { + "epoch": 1.23, + "learning_rate": 1.3348047935515513e-06, + "loss": 0.7207, + "step": 47942 + }, + { + "epoch": 1.23, + "learning_rate": 1.3347787199002987e-06, + "loss": 0.8242, + "step": 47943 + }, + { + "epoch": 1.23, + "learning_rate": 1.334752645992721e-06, + "loss": 0.4603, + "step": 47944 + }, + { + "epoch": 1.23, + "learning_rate": 1.3347265718288391e-06, + "loss": 0.668, + "step": 47945 + }, + { + "epoch": 1.23, + "learning_rate": 1.3347004974086721e-06, + "loss": 0.4412, + "step": 47946 + }, + { + "epoch": 1.23, + "learning_rate": 1.3346744227322404e-06, + "loss": 0.752, + "step": 47947 + }, + { + "epoch": 1.23, + "learning_rate": 1.3346483477995638e-06, + "loss": 0.5725, + "step": 47948 + }, + { + "epoch": 1.23, + "learning_rate": 1.3346222726106627e-06, + "loss": 0.6738, + "step": 47949 + }, + { + "epoch": 1.23, + "learning_rate": 1.3345961971655564e-06, + "loss": 0.6133, + "step": 47950 + }, + { + "epoch": 1.23, + "learning_rate": 1.3345701214642654e-06, + "loss": 0.4146, + "step": 47951 + }, + { + "epoch": 1.23, + "learning_rate": 1.3345440455068091e-06, + "loss": 0.5581, + "step": 47952 + }, + { + "epoch": 1.23, + "learning_rate": 1.334517969293208e-06, + "loss": 0.7559, + "step": 47953 + }, + { + "epoch": 1.23, + "learning_rate": 1.334491892823482e-06, + "loss": 0.7061, + "step": 47954 + }, + { + "epoch": 1.23, + "learning_rate": 1.334465816097651e-06, + "loss": 0.6157, + "step": 47955 + }, + { + "epoch": 1.23, + "learning_rate": 1.3344397391157345e-06, + "loss": 0.7104, + "step": 47956 + }, + { + "epoch": 1.23, + "learning_rate": 1.3344136618777531e-06, + "loss": 0.7559, + "step": 47957 + }, + { + "epoch": 1.23, + "learning_rate": 1.3343875843837262e-06, + "loss": 0.5698, + "step": 47958 + }, + { + "epoch": 1.23, + "learning_rate": 1.3343615066336747e-06, + "loss": 0.6421, + "step": 47959 + }, + { + "epoch": 1.23, + "learning_rate": 1.3343354286276176e-06, + "loss": 0.6299, + "step": 47960 + }, + { + "epoch": 1.23, + "learning_rate": 1.3343093503655753e-06, + "loss": 0.6934, + "step": 47961 + }, + { + "epoch": 1.23, + "learning_rate": 1.3342832718475677e-06, + "loss": 0.6768, + "step": 47962 + }, + { + "epoch": 1.23, + "learning_rate": 1.334257193073615e-06, + "loss": 0.7373, + "step": 47963 + }, + { + "epoch": 1.23, + "learning_rate": 1.3342311140437366e-06, + "loss": 0.5352, + "step": 47964 + }, + { + "epoch": 1.23, + "learning_rate": 1.3342050347579527e-06, + "loss": 0.6611, + "step": 47965 + }, + { + "epoch": 1.23, + "learning_rate": 1.3341789552162838e-06, + "loss": 0.708, + "step": 47966 + }, + { + "epoch": 1.23, + "learning_rate": 1.3341528754187493e-06, + "loss": 0.5266, + "step": 47967 + }, + { + "epoch": 1.23, + "learning_rate": 1.3341267953653691e-06, + "loss": 0.4386, + "step": 47968 + }, + { + "epoch": 1.23, + "learning_rate": 1.3341007150561634e-06, + "loss": 0.7085, + "step": 47969 + }, + { + "epoch": 1.23, + "learning_rate": 1.3340746344911526e-06, + "loss": 0.6914, + "step": 47970 + }, + { + "epoch": 1.23, + "learning_rate": 1.3340485536703557e-06, + "loss": 0.7383, + "step": 47971 + }, + { + "epoch": 1.23, + "learning_rate": 1.3340224725937934e-06, + "loss": 0.7295, + "step": 47972 + }, + { + "epoch": 1.23, + "learning_rate": 1.3339963912614854e-06, + "loss": 0.5806, + "step": 47973 + }, + { + "epoch": 1.23, + "learning_rate": 1.3339703096734518e-06, + "loss": 0.6689, + "step": 47974 + }, + { + "epoch": 1.23, + "learning_rate": 1.3339442278297127e-06, + "loss": 0.5256, + "step": 47975 + }, + { + "epoch": 1.23, + "learning_rate": 1.3339181457302876e-06, + "loss": 0.4756, + "step": 47976 + }, + { + "epoch": 1.23, + "learning_rate": 1.3338920633751964e-06, + "loss": 0.6543, + "step": 47977 + }, + { + "epoch": 1.23, + "learning_rate": 1.3338659807644598e-06, + "loss": 0.4434, + "step": 47978 + }, + { + "epoch": 1.23, + "learning_rate": 1.3338398978980972e-06, + "loss": 0.7314, + "step": 47979 + }, + { + "epoch": 1.23, + "learning_rate": 1.333813814776129e-06, + "loss": 0.6084, + "step": 47980 + }, + { + "epoch": 1.23, + "learning_rate": 1.3337877313985746e-06, + "loss": 0.5676, + "step": 47981 + }, + { + "epoch": 1.23, + "learning_rate": 1.3337616477654545e-06, + "loss": 0.7803, + "step": 47982 + }, + { + "epoch": 1.23, + "learning_rate": 1.3337355638767881e-06, + "loss": 0.5623, + "step": 47983 + }, + { + "epoch": 1.23, + "learning_rate": 1.3337094797325963e-06, + "loss": 0.6294, + "step": 47984 + }, + { + "epoch": 1.23, + "learning_rate": 1.3336833953328984e-06, + "loss": 0.71, + "step": 47985 + }, + { + "epoch": 1.23, + "learning_rate": 1.333657310677714e-06, + "loss": 0.7119, + "step": 47986 + }, + { + "epoch": 1.23, + "learning_rate": 1.3336312257670638e-06, + "loss": 0.6455, + "step": 47987 + }, + { + "epoch": 1.23, + "learning_rate": 1.3336051406009674e-06, + "loss": 0.6582, + "step": 47988 + }, + { + "epoch": 1.23, + "learning_rate": 1.333579055179445e-06, + "loss": 0.4951, + "step": 47989 + }, + { + "epoch": 1.23, + "learning_rate": 1.3335529695025165e-06, + "loss": 0.532, + "step": 47990 + }, + { + "epoch": 1.23, + "learning_rate": 1.3335268835702019e-06, + "loss": 0.6807, + "step": 47991 + }, + { + "epoch": 1.23, + "learning_rate": 1.333500797382521e-06, + "loss": 0.5803, + "step": 47992 + }, + { + "epoch": 1.23, + "learning_rate": 1.3334747109394938e-06, + "loss": 0.6719, + "step": 47993 + }, + { + "epoch": 1.23, + "learning_rate": 1.3334486242411403e-06, + "loss": 0.5967, + "step": 47994 + }, + { + "epoch": 1.23, + "learning_rate": 1.3334225372874808e-06, + "loss": 0.5586, + "step": 47995 + }, + { + "epoch": 1.23, + "learning_rate": 1.3333964500785348e-06, + "loss": 0.6719, + "step": 47996 + }, + { + "epoch": 1.23, + "learning_rate": 1.3333703626143224e-06, + "loss": 0.4644, + "step": 47997 + }, + { + "epoch": 1.23, + "learning_rate": 1.3333442748948637e-06, + "loss": 0.7168, + "step": 47998 + }, + { + "epoch": 1.23, + "learning_rate": 1.3333181869201786e-06, + "loss": 0.6025, + "step": 47999 + }, + { + "epoch": 1.23, + "learning_rate": 1.3332920986902873e-06, + "loss": 0.4795, + "step": 48000 + }, + { + "epoch": 1.23, + "learning_rate": 1.3332660102052096e-06, + "loss": 0.4429, + "step": 48001 + }, + { + "epoch": 1.23, + "learning_rate": 1.333239921464965e-06, + "loss": 0.5771, + "step": 48002 + }, + { + "epoch": 1.23, + "learning_rate": 1.3332138324695743e-06, + "loss": 0.5076, + "step": 48003 + }, + { + "epoch": 1.23, + "learning_rate": 1.3331877432190568e-06, + "loss": 0.6621, + "step": 48004 + }, + { + "epoch": 1.23, + "learning_rate": 1.333161653713433e-06, + "loss": 0.645, + "step": 48005 + }, + { + "epoch": 1.23, + "learning_rate": 1.3331355639527227e-06, + "loss": 0.5466, + "step": 48006 + }, + { + "epoch": 1.23, + "learning_rate": 1.3331094739369454e-06, + "loss": 0.7637, + "step": 48007 + }, + { + "epoch": 1.23, + "learning_rate": 1.3330833836661217e-06, + "loss": 0.5864, + "step": 48008 + }, + { + "epoch": 1.23, + "learning_rate": 1.3330572931402718e-06, + "loss": 0.7305, + "step": 48009 + }, + { + "epoch": 1.23, + "learning_rate": 1.3330312023594148e-06, + "loss": 0.5913, + "step": 48010 + }, + { + "epoch": 1.23, + "learning_rate": 1.333005111323571e-06, + "loss": 0.7734, + "step": 48011 + }, + { + "epoch": 1.23, + "learning_rate": 1.3329790200327608e-06, + "loss": 0.5488, + "step": 48012 + }, + { + "epoch": 1.23, + "learning_rate": 1.3329529284870036e-06, + "loss": 0.6289, + "step": 48013 + }, + { + "epoch": 1.23, + "learning_rate": 1.3329268366863202e-06, + "loss": 0.8311, + "step": 48014 + }, + { + "epoch": 1.23, + "learning_rate": 1.3329007446307295e-06, + "loss": 0.4629, + "step": 48015 + }, + { + "epoch": 1.23, + "learning_rate": 1.332874652320252e-06, + "loss": 0.7031, + "step": 48016 + }, + { + "epoch": 1.23, + "learning_rate": 1.332848559754908e-06, + "loss": 0.3967, + "step": 48017 + }, + { + "epoch": 1.23, + "learning_rate": 1.332822466934717e-06, + "loss": 0.6509, + "step": 48018 + }, + { + "epoch": 1.23, + "learning_rate": 1.3327963738596993e-06, + "loss": 0.5166, + "step": 48019 + }, + { + "epoch": 1.23, + "learning_rate": 1.3327702805298743e-06, + "loss": 0.728, + "step": 48020 + }, + { + "epoch": 1.23, + "learning_rate": 1.3327441869452627e-06, + "loss": 0.5691, + "step": 48021 + }, + { + "epoch": 1.23, + "learning_rate": 1.332718093105884e-06, + "loss": 0.7295, + "step": 48022 + }, + { + "epoch": 1.23, + "learning_rate": 1.3326919990117586e-06, + "loss": 0.7031, + "step": 48023 + }, + { + "epoch": 1.23, + "learning_rate": 1.3326659046629064e-06, + "loss": 0.6914, + "step": 48024 + }, + { + "epoch": 1.23, + "learning_rate": 1.3326398100593469e-06, + "loss": 0.6143, + "step": 48025 + }, + { + "epoch": 1.23, + "learning_rate": 1.3326137152011003e-06, + "loss": 0.5919, + "step": 48026 + }, + { + "epoch": 1.23, + "learning_rate": 1.3325876200881867e-06, + "loss": 0.8198, + "step": 48027 + }, + { + "epoch": 1.23, + "learning_rate": 1.3325615247206263e-06, + "loss": 0.6597, + "step": 48028 + }, + { + "epoch": 1.23, + "learning_rate": 1.3325354290984388e-06, + "loss": 0.7588, + "step": 48029 + }, + { + "epoch": 1.23, + "learning_rate": 1.332509333221644e-06, + "loss": 0.75, + "step": 48030 + }, + { + "epoch": 1.23, + "learning_rate": 1.3324832370902624e-06, + "loss": 0.5684, + "step": 48031 + }, + { + "epoch": 1.23, + "learning_rate": 1.3324571407043133e-06, + "loss": 0.6973, + "step": 48032 + }, + { + "epoch": 1.23, + "learning_rate": 1.332431044063817e-06, + "loss": 0.5669, + "step": 48033 + }, + { + "epoch": 1.23, + "learning_rate": 1.332404947168794e-06, + "loss": 0.48, + "step": 48034 + }, + { + "epoch": 1.23, + "learning_rate": 1.3323788500192637e-06, + "loss": 0.6597, + "step": 48035 + }, + { + "epoch": 1.23, + "learning_rate": 1.3323527526152458e-06, + "loss": 0.5735, + "step": 48036 + }, + { + "epoch": 1.23, + "learning_rate": 1.332326654956761e-06, + "loss": 0.5488, + "step": 48037 + }, + { + "epoch": 1.23, + "learning_rate": 1.3323005570438288e-06, + "loss": 0.7461, + "step": 48038 + }, + { + "epoch": 1.23, + "learning_rate": 1.33227445887647e-06, + "loss": 0.5083, + "step": 48039 + }, + { + "epoch": 1.23, + "learning_rate": 1.332248360454703e-06, + "loss": 0.6807, + "step": 48040 + }, + { + "epoch": 1.23, + "learning_rate": 1.3322222617785492e-06, + "loss": 0.6025, + "step": 48041 + }, + { + "epoch": 1.23, + "learning_rate": 1.3321961628480278e-06, + "loss": 0.6602, + "step": 48042 + }, + { + "epoch": 1.23, + "learning_rate": 1.332170063663159e-06, + "loss": 0.7266, + "step": 48043 + }, + { + "epoch": 1.23, + "learning_rate": 1.3321439642239635e-06, + "loss": 0.7539, + "step": 48044 + }, + { + "epoch": 1.23, + "learning_rate": 1.3321178645304602e-06, + "loss": 0.5908, + "step": 48045 + }, + { + "epoch": 1.23, + "learning_rate": 1.3320917645826694e-06, + "loss": 0.5146, + "step": 48046 + }, + { + "epoch": 1.23, + "learning_rate": 1.3320656643806116e-06, + "loss": 0.6064, + "step": 48047 + }, + { + "epoch": 1.23, + "learning_rate": 1.332039563924306e-06, + "loss": 0.7002, + "step": 48048 + }, + { + "epoch": 1.23, + "learning_rate": 1.3320134632137733e-06, + "loss": 0.7163, + "step": 48049 + }, + { + "epoch": 1.23, + "learning_rate": 1.331987362249033e-06, + "loss": 0.6626, + "step": 48050 + }, + { + "epoch": 1.23, + "learning_rate": 1.3319612610301051e-06, + "loss": 0.5933, + "step": 48051 + }, + { + "epoch": 1.23, + "learning_rate": 1.3319351595570098e-06, + "loss": 0.5098, + "step": 48052 + }, + { + "epoch": 1.23, + "learning_rate": 1.331909057829767e-06, + "loss": 0.4561, + "step": 48053 + }, + { + "epoch": 1.23, + "learning_rate": 1.331882955848397e-06, + "loss": 0.5938, + "step": 48054 + }, + { + "epoch": 1.23, + "learning_rate": 1.3318568536129192e-06, + "loss": 0.6001, + "step": 48055 + }, + { + "epoch": 1.23, + "learning_rate": 1.331830751123354e-06, + "loss": 0.5532, + "step": 48056 + }, + { + "epoch": 1.23, + "learning_rate": 1.3318046483797209e-06, + "loss": 0.7676, + "step": 48057 + }, + { + "epoch": 1.23, + "learning_rate": 1.3317785453820408e-06, + "loss": 0.5425, + "step": 48058 + }, + { + "epoch": 1.23, + "learning_rate": 1.3317524421303327e-06, + "loss": 0.751, + "step": 48059 + }, + { + "epoch": 1.23, + "learning_rate": 1.3317263386246173e-06, + "loss": 0.748, + "step": 48060 + }, + { + "epoch": 1.23, + "learning_rate": 1.331700234864914e-06, + "loss": 0.5284, + "step": 48061 + }, + { + "epoch": 1.23, + "learning_rate": 1.3316741308512434e-06, + "loss": 0.4646, + "step": 48062 + }, + { + "epoch": 1.23, + "learning_rate": 1.3316480265836248e-06, + "loss": 0.7266, + "step": 48063 + }, + { + "epoch": 1.23, + "learning_rate": 1.331621922062079e-06, + "loss": 0.7188, + "step": 48064 + }, + { + "epoch": 1.23, + "learning_rate": 1.331595817286625e-06, + "loss": 0.6621, + "step": 48065 + }, + { + "epoch": 1.23, + "learning_rate": 1.3315697122572838e-06, + "loss": 0.6992, + "step": 48066 + }, + { + "epoch": 1.23, + "learning_rate": 1.3315436069740746e-06, + "loss": 0.6069, + "step": 48067 + }, + { + "epoch": 1.23, + "learning_rate": 1.331517501437018e-06, + "loss": 0.6133, + "step": 48068 + }, + { + "epoch": 1.23, + "learning_rate": 1.3314913956461336e-06, + "loss": 0.6157, + "step": 48069 + }, + { + "epoch": 1.23, + "learning_rate": 1.3314652896014413e-06, + "loss": 0.7144, + "step": 48070 + }, + { + "epoch": 1.23, + "learning_rate": 1.3314391833029613e-06, + "loss": 0.7168, + "step": 48071 + }, + { + "epoch": 1.23, + "learning_rate": 1.3314130767507137e-06, + "loss": 0.7197, + "step": 48072 + }, + { + "epoch": 1.23, + "learning_rate": 1.3313869699447182e-06, + "loss": 0.707, + "step": 48073 + }, + { + "epoch": 1.23, + "learning_rate": 1.331360862884995e-06, + "loss": 0.6167, + "step": 48074 + }, + { + "epoch": 1.23, + "learning_rate": 1.3313347555715641e-06, + "loss": 0.7002, + "step": 48075 + }, + { + "epoch": 1.23, + "learning_rate": 1.3313086480044453e-06, + "loss": 0.6831, + "step": 48076 + }, + { + "epoch": 1.23, + "learning_rate": 1.331282540183659e-06, + "loss": 0.6807, + "step": 48077 + }, + { + "epoch": 1.23, + "learning_rate": 1.3312564321092243e-06, + "loss": 0.7285, + "step": 48078 + }, + { + "epoch": 1.23, + "learning_rate": 1.3312303237811624e-06, + "loss": 0.8096, + "step": 48079 + }, + { + "epoch": 1.23, + "learning_rate": 1.3312042151994924e-06, + "loss": 0.6128, + "step": 48080 + }, + { + "epoch": 1.23, + "learning_rate": 1.3311781063642346e-06, + "loss": 0.8462, + "step": 48081 + }, + { + "epoch": 1.23, + "learning_rate": 1.3311519972754086e-06, + "loss": 0.6616, + "step": 48082 + }, + { + "epoch": 1.23, + "learning_rate": 1.3311258879330352e-06, + "loss": 0.7598, + "step": 48083 + }, + { + "epoch": 1.23, + "learning_rate": 1.3310997783371338e-06, + "loss": 0.6855, + "step": 48084 + }, + { + "epoch": 1.23, + "learning_rate": 1.3310736684877246e-06, + "loss": 0.833, + "step": 48085 + }, + { + "epoch": 1.23, + "learning_rate": 1.3310475583848276e-06, + "loss": 0.7085, + "step": 48086 + }, + { + "epoch": 1.23, + "learning_rate": 1.3310214480284626e-06, + "loss": 0.6396, + "step": 48087 + }, + { + "epoch": 1.23, + "learning_rate": 1.3309953374186494e-06, + "loss": 0.6299, + "step": 48088 + }, + { + "epoch": 1.23, + "learning_rate": 1.3309692265554086e-06, + "loss": 0.6226, + "step": 48089 + }, + { + "epoch": 1.23, + "learning_rate": 1.3309431154387597e-06, + "loss": 0.6465, + "step": 48090 + }, + { + "epoch": 1.23, + "learning_rate": 1.3309170040687233e-06, + "loss": 0.6406, + "step": 48091 + }, + { + "epoch": 1.23, + "learning_rate": 1.3308908924453183e-06, + "loss": 0.7041, + "step": 48092 + }, + { + "epoch": 1.23, + "learning_rate": 1.3308647805685658e-06, + "loss": 0.8477, + "step": 48093 + }, + { + "epoch": 1.23, + "learning_rate": 1.3308386684384854e-06, + "loss": 0.5391, + "step": 48094 + }, + { + "epoch": 1.23, + "learning_rate": 1.3308125560550966e-06, + "loss": 0.7979, + "step": 48095 + }, + { + "epoch": 1.23, + "learning_rate": 1.3307864434184204e-06, + "loss": 0.4949, + "step": 48096 + }, + { + "epoch": 1.23, + "learning_rate": 1.3307603305284758e-06, + "loss": 0.8525, + "step": 48097 + }, + { + "epoch": 1.23, + "learning_rate": 1.3307342173852833e-06, + "loss": 0.5361, + "step": 48098 + }, + { + "epoch": 1.23, + "learning_rate": 1.330708103988863e-06, + "loss": 0.5391, + "step": 48099 + }, + { + "epoch": 1.23, + "learning_rate": 1.3306819903392347e-06, + "loss": 0.6396, + "step": 48100 + }, + { + "epoch": 1.23, + "learning_rate": 1.3306558764364181e-06, + "loss": 0.5918, + "step": 48101 + }, + { + "epoch": 1.23, + "learning_rate": 1.330629762280434e-06, + "loss": 0.7002, + "step": 48102 + }, + { + "epoch": 1.23, + "learning_rate": 1.3306036478713015e-06, + "loss": 0.5566, + "step": 48103 + }, + { + "epoch": 1.23, + "learning_rate": 1.330577533209041e-06, + "loss": 0.5786, + "step": 48104 + }, + { + "epoch": 1.23, + "learning_rate": 1.3305514182936729e-06, + "loss": 0.455, + "step": 48105 + }, + { + "epoch": 1.23, + "learning_rate": 1.3305253031252165e-06, + "loss": 0.5171, + "step": 48106 + }, + { + "epoch": 1.23, + "learning_rate": 1.3304991877036918e-06, + "loss": 0.6328, + "step": 48107 + }, + { + "epoch": 1.23, + "learning_rate": 1.3304730720291192e-06, + "loss": 0.6396, + "step": 48108 + }, + { + "epoch": 1.23, + "learning_rate": 1.330446956101519e-06, + "loss": 0.6523, + "step": 48109 + }, + { + "epoch": 1.23, + "learning_rate": 1.3304208399209104e-06, + "loss": 0.6748, + "step": 48110 + }, + { + "epoch": 1.23, + "learning_rate": 1.3303947234873135e-06, + "loss": 0.6787, + "step": 48111 + }, + { + "epoch": 1.23, + "learning_rate": 1.3303686068007492e-06, + "loss": 0.6914, + "step": 48112 + }, + { + "epoch": 1.23, + "learning_rate": 1.3303424898612363e-06, + "loss": 0.5142, + "step": 48113 + }, + { + "epoch": 1.23, + "learning_rate": 1.3303163726687955e-06, + "loss": 0.5137, + "step": 48114 + }, + { + "epoch": 1.23, + "learning_rate": 1.3302902552234468e-06, + "loss": 0.7422, + "step": 48115 + }, + { + "epoch": 1.23, + "learning_rate": 1.33026413752521e-06, + "loss": 0.5513, + "step": 48116 + }, + { + "epoch": 1.23, + "learning_rate": 1.330238019574105e-06, + "loss": 0.5874, + "step": 48117 + }, + { + "epoch": 1.23, + "learning_rate": 1.330211901370152e-06, + "loss": 0.7559, + "step": 48118 + }, + { + "epoch": 1.23, + "learning_rate": 1.330185782913371e-06, + "loss": 0.6226, + "step": 48119 + }, + { + "epoch": 1.23, + "learning_rate": 1.3301596642037815e-06, + "loss": 0.6934, + "step": 48120 + }, + { + "epoch": 1.23, + "learning_rate": 1.3301335452414044e-06, + "loss": 0.5776, + "step": 48121 + }, + { + "epoch": 1.23, + "learning_rate": 1.330107426026259e-06, + "loss": 0.7578, + "step": 48122 + }, + { + "epoch": 1.23, + "learning_rate": 1.3300813065583655e-06, + "loss": 0.7998, + "step": 48123 + }, + { + "epoch": 1.23, + "learning_rate": 1.3300551868377442e-06, + "loss": 0.7529, + "step": 48124 + }, + { + "epoch": 1.23, + "learning_rate": 1.3300290668644147e-06, + "loss": 0.9248, + "step": 48125 + }, + { + "epoch": 1.23, + "learning_rate": 1.3300029466383972e-06, + "loss": 0.6821, + "step": 48126 + }, + { + "epoch": 1.23, + "learning_rate": 1.3299768261597114e-06, + "loss": 0.5786, + "step": 48127 + }, + { + "epoch": 1.23, + "learning_rate": 1.3299507054283776e-06, + "loss": 0.5952, + "step": 48128 + }, + { + "epoch": 1.23, + "learning_rate": 1.329924584444416e-06, + "loss": 0.752, + "step": 48129 + }, + { + "epoch": 1.23, + "learning_rate": 1.3298984632078458e-06, + "loss": 0.5386, + "step": 48130 + }, + { + "epoch": 1.23, + "learning_rate": 1.3298723417186879e-06, + "loss": 0.6479, + "step": 48131 + }, + { + "epoch": 1.23, + "learning_rate": 1.3298462199769615e-06, + "loss": 0.6382, + "step": 48132 + }, + { + "epoch": 1.23, + "learning_rate": 1.3298200979826875e-06, + "loss": 0.6196, + "step": 48133 + }, + { + "epoch": 1.23, + "learning_rate": 1.329793975735885e-06, + "loss": 0.6133, + "step": 48134 + }, + { + "epoch": 1.23, + "learning_rate": 1.3297678532365747e-06, + "loss": 0.7002, + "step": 48135 + }, + { + "epoch": 1.23, + "learning_rate": 1.3297417304847761e-06, + "loss": 0.7852, + "step": 48136 + }, + { + "epoch": 1.23, + "learning_rate": 1.3297156074805099e-06, + "loss": 0.6099, + "step": 48137 + }, + { + "epoch": 1.23, + "learning_rate": 1.3296894842237951e-06, + "loss": 0.6885, + "step": 48138 + }, + { + "epoch": 1.23, + "learning_rate": 1.3296633607146523e-06, + "loss": 0.6562, + "step": 48139 + }, + { + "epoch": 1.23, + "learning_rate": 1.3296372369531017e-06, + "loss": 0.6211, + "step": 48140 + }, + { + "epoch": 1.23, + "learning_rate": 1.3296111129391628e-06, + "loss": 0.6509, + "step": 48141 + }, + { + "epoch": 1.23, + "learning_rate": 1.3295849886728558e-06, + "loss": 0.6758, + "step": 48142 + }, + { + "epoch": 1.23, + "learning_rate": 1.329558864154201e-06, + "loss": 0.668, + "step": 48143 + }, + { + "epoch": 1.23, + "learning_rate": 1.329532739383218e-06, + "loss": 0.9385, + "step": 48144 + }, + { + "epoch": 1.23, + "learning_rate": 1.3295066143599267e-06, + "loss": 0.6709, + "step": 48145 + }, + { + "epoch": 1.23, + "learning_rate": 1.3294804890843475e-06, + "loss": 0.5469, + "step": 48146 + }, + { + "epoch": 1.23, + "learning_rate": 1.3294543635565e-06, + "loss": 0.7373, + "step": 48147 + }, + { + "epoch": 1.23, + "learning_rate": 1.329428237776405e-06, + "loss": 0.6929, + "step": 48148 + }, + { + "epoch": 1.23, + "learning_rate": 1.3294021117440817e-06, + "loss": 0.7236, + "step": 48149 + }, + { + "epoch": 1.23, + "learning_rate": 1.3293759854595503e-06, + "loss": 0.6504, + "step": 48150 + }, + { + "epoch": 1.23, + "learning_rate": 1.3293498589228307e-06, + "loss": 0.7764, + "step": 48151 + }, + { + "epoch": 1.23, + "learning_rate": 1.3293237321339433e-06, + "loss": 0.573, + "step": 48152 + }, + { + "epoch": 1.23, + "learning_rate": 1.3292976050929077e-06, + "loss": 0.6416, + "step": 48153 + }, + { + "epoch": 1.23, + "learning_rate": 1.3292714777997443e-06, + "loss": 0.5337, + "step": 48154 + }, + { + "epoch": 1.23, + "learning_rate": 1.3292453502544725e-06, + "loss": 0.5669, + "step": 48155 + }, + { + "epoch": 1.23, + "learning_rate": 1.329219222457113e-06, + "loss": 0.9121, + "step": 48156 + }, + { + "epoch": 1.23, + "learning_rate": 1.3291930944076853e-06, + "loss": 0.7354, + "step": 48157 + }, + { + "epoch": 1.23, + "learning_rate": 1.3291669661062094e-06, + "loss": 0.6602, + "step": 48158 + }, + { + "epoch": 1.23, + "learning_rate": 1.329140837552706e-06, + "loss": 0.5757, + "step": 48159 + }, + { + "epoch": 1.23, + "learning_rate": 1.3291147087471943e-06, + "loss": 0.5754, + "step": 48160 + }, + { + "epoch": 1.23, + "learning_rate": 1.3290885796896945e-06, + "loss": 0.6436, + "step": 48161 + }, + { + "epoch": 1.23, + "learning_rate": 1.3290624503802268e-06, + "loss": 0.6055, + "step": 48162 + }, + { + "epoch": 1.23, + "learning_rate": 1.329036320818811e-06, + "loss": 0.7207, + "step": 48163 + }, + { + "epoch": 1.23, + "learning_rate": 1.3290101910054677e-06, + "loss": 0.6611, + "step": 48164 + }, + { + "epoch": 1.23, + "learning_rate": 1.328984060940216e-06, + "loss": 0.8027, + "step": 48165 + }, + { + "epoch": 1.23, + "learning_rate": 1.3289579306230763e-06, + "loss": 0.9043, + "step": 48166 + }, + { + "epoch": 1.23, + "learning_rate": 1.3289318000540687e-06, + "loss": 0.7578, + "step": 48167 + }, + { + "epoch": 1.23, + "learning_rate": 1.328905669233213e-06, + "loss": 0.5898, + "step": 48168 + }, + { + "epoch": 1.23, + "learning_rate": 1.32887953816053e-06, + "loss": 0.6445, + "step": 48169 + }, + { + "epoch": 1.23, + "learning_rate": 1.3288534068360383e-06, + "loss": 0.6523, + "step": 48170 + }, + { + "epoch": 1.23, + "learning_rate": 1.3288272752597592e-06, + "loss": 0.6279, + "step": 48171 + }, + { + "epoch": 1.23, + "learning_rate": 1.3288011434317116e-06, + "loss": 0.5586, + "step": 48172 + }, + { + "epoch": 1.23, + "learning_rate": 1.3287750113519168e-06, + "loss": 0.7559, + "step": 48173 + }, + { + "epoch": 1.23, + "learning_rate": 1.3287488790203936e-06, + "loss": 0.6582, + "step": 48174 + }, + { + "epoch": 1.23, + "learning_rate": 1.3287227464371626e-06, + "loss": 0.5737, + "step": 48175 + }, + { + "epoch": 1.23, + "learning_rate": 1.3286966136022438e-06, + "loss": 0.5557, + "step": 48176 + }, + { + "epoch": 1.23, + "learning_rate": 1.328670480515657e-06, + "loss": 0.6484, + "step": 48177 + }, + { + "epoch": 1.23, + "learning_rate": 1.3286443471774222e-06, + "loss": 0.5081, + "step": 48178 + }, + { + "epoch": 1.23, + "learning_rate": 1.32861821358756e-06, + "loss": 0.7275, + "step": 48179 + }, + { + "epoch": 1.23, + "learning_rate": 1.3285920797460897e-06, + "loss": 0.5913, + "step": 48180 + }, + { + "epoch": 1.23, + "learning_rate": 1.3285659456530314e-06, + "loss": 0.4437, + "step": 48181 + }, + { + "epoch": 1.23, + "learning_rate": 1.3285398113084053e-06, + "loss": 0.4731, + "step": 48182 + }, + { + "epoch": 1.23, + "learning_rate": 1.3285136767122316e-06, + "loss": 0.5879, + "step": 48183 + }, + { + "epoch": 1.23, + "learning_rate": 1.3284875418645298e-06, + "loss": 0.6123, + "step": 48184 + }, + { + "epoch": 1.24, + "learning_rate": 1.3284614067653204e-06, + "loss": 0.4252, + "step": 48185 + }, + { + "epoch": 1.24, + "learning_rate": 1.328435271414623e-06, + "loss": 0.6641, + "step": 48186 + }, + { + "epoch": 1.24, + "learning_rate": 1.328409135812458e-06, + "loss": 0.6045, + "step": 48187 + }, + { + "epoch": 1.24, + "learning_rate": 1.328382999958845e-06, + "loss": 0.4954, + "step": 48188 + }, + { + "epoch": 1.24, + "learning_rate": 1.3283568638538045e-06, + "loss": 0.5015, + "step": 48189 + }, + { + "epoch": 1.24, + "learning_rate": 1.3283307274973564e-06, + "loss": 0.5273, + "step": 48190 + }, + { + "epoch": 1.24, + "learning_rate": 1.32830459088952e-06, + "loss": 0.6113, + "step": 48191 + }, + { + "epoch": 1.24, + "learning_rate": 1.3282784540303162e-06, + "loss": 0.7637, + "step": 48192 + }, + { + "epoch": 1.24, + "learning_rate": 1.3282523169197646e-06, + "loss": 0.6875, + "step": 48193 + }, + { + "epoch": 1.24, + "learning_rate": 1.3282261795578858e-06, + "loss": 0.6436, + "step": 48194 + }, + { + "epoch": 1.24, + "learning_rate": 1.3282000419446987e-06, + "loss": 0.7827, + "step": 48195 + }, + { + "epoch": 1.24, + "learning_rate": 1.328173904080224e-06, + "loss": 0.5181, + "step": 48196 + }, + { + "epoch": 1.24, + "learning_rate": 1.3281477659644815e-06, + "loss": 0.8447, + "step": 48197 + }, + { + "epoch": 1.24, + "learning_rate": 1.3281216275974916e-06, + "loss": 0.7158, + "step": 48198 + }, + { + "epoch": 1.24, + "learning_rate": 1.3280954889792743e-06, + "loss": 0.4353, + "step": 48199 + }, + { + "epoch": 1.24, + "learning_rate": 1.328069350109849e-06, + "loss": 0.6104, + "step": 48200 + }, + { + "epoch": 1.24, + "learning_rate": 1.328043210989236e-06, + "loss": 0.6245, + "step": 48201 + }, + { + "epoch": 1.24, + "learning_rate": 1.3280170716174557e-06, + "loss": 0.7559, + "step": 48202 + }, + { + "epoch": 1.24, + "learning_rate": 1.3279909319945275e-06, + "loss": 0.626, + "step": 48203 + }, + { + "epoch": 1.24, + "learning_rate": 1.3279647921204722e-06, + "loss": 0.5037, + "step": 48204 + }, + { + "epoch": 1.24, + "learning_rate": 1.3279386519953088e-06, + "loss": 0.7402, + "step": 48205 + }, + { + "epoch": 1.24, + "learning_rate": 1.3279125116190583e-06, + "loss": 0.7773, + "step": 48206 + }, + { + "epoch": 1.24, + "learning_rate": 1.3278863709917398e-06, + "loss": 0.6421, + "step": 48207 + }, + { + "epoch": 1.24, + "learning_rate": 1.327860230113374e-06, + "loss": 0.6489, + "step": 48208 + }, + { + "epoch": 1.24, + "learning_rate": 1.327834088983981e-06, + "loss": 0.441, + "step": 48209 + }, + { + "epoch": 1.24, + "learning_rate": 1.32780794760358e-06, + "loss": 0.6885, + "step": 48210 + }, + { + "epoch": 1.24, + "learning_rate": 1.327781805972192e-06, + "loss": 0.5615, + "step": 48211 + }, + { + "epoch": 1.24, + "learning_rate": 1.3277556640898362e-06, + "loss": 0.5322, + "step": 48212 + }, + { + "epoch": 1.24, + "learning_rate": 1.327729521956533e-06, + "loss": 0.5513, + "step": 48213 + }, + { + "epoch": 1.24, + "learning_rate": 1.3277033795723026e-06, + "loss": 0.6296, + "step": 48214 + }, + { + "epoch": 1.24, + "learning_rate": 1.3276772369371647e-06, + "loss": 0.6758, + "step": 48215 + }, + { + "epoch": 1.24, + "learning_rate": 1.3276510940511392e-06, + "loss": 0.7109, + "step": 48216 + }, + { + "epoch": 1.24, + "learning_rate": 1.3276249509142466e-06, + "loss": 0.7412, + "step": 48217 + }, + { + "epoch": 1.24, + "learning_rate": 1.3275988075265064e-06, + "loss": 0.6582, + "step": 48218 + }, + { + "epoch": 1.24, + "learning_rate": 1.3275726638879392e-06, + "loss": 0.5535, + "step": 48219 + }, + { + "epoch": 1.24, + "learning_rate": 1.3275465199985643e-06, + "loss": 0.7275, + "step": 48220 + }, + { + "epoch": 1.24, + "learning_rate": 1.3275203758584024e-06, + "loss": 0.7178, + "step": 48221 + }, + { + "epoch": 1.24, + "learning_rate": 1.327494231467473e-06, + "loss": 0.5657, + "step": 48222 + }, + { + "epoch": 1.24, + "learning_rate": 1.3274680868257962e-06, + "loss": 0.7383, + "step": 48223 + }, + { + "epoch": 1.24, + "learning_rate": 1.3274419419333924e-06, + "loss": 0.7268, + "step": 48224 + }, + { + "epoch": 1.24, + "learning_rate": 1.3274157967902812e-06, + "loss": 0.543, + "step": 48225 + }, + { + "epoch": 1.24, + "learning_rate": 1.3273896513964828e-06, + "loss": 0.6401, + "step": 48226 + }, + { + "epoch": 1.24, + "learning_rate": 1.3273635057520173e-06, + "loss": 0.6821, + "step": 48227 + }, + { + "epoch": 1.24, + "learning_rate": 1.3273373598569043e-06, + "loss": 0.8086, + "step": 48228 + }, + { + "epoch": 1.24, + "learning_rate": 1.3273112137111645e-06, + "loss": 0.481, + "step": 48229 + }, + { + "epoch": 1.24, + "learning_rate": 1.3272850673148177e-06, + "loss": 0.6294, + "step": 48230 + }, + { + "epoch": 1.24, + "learning_rate": 1.3272589206678832e-06, + "loss": 0.7085, + "step": 48231 + }, + { + "epoch": 1.24, + "learning_rate": 1.3272327737703821e-06, + "loss": 0.8604, + "step": 48232 + }, + { + "epoch": 1.24, + "learning_rate": 1.3272066266223338e-06, + "loss": 0.5605, + "step": 48233 + }, + { + "epoch": 1.24, + "learning_rate": 1.3271804792237584e-06, + "loss": 0.627, + "step": 48234 + }, + { + "epoch": 1.24, + "learning_rate": 1.3271543315746759e-06, + "loss": 0.5566, + "step": 48235 + }, + { + "epoch": 1.24, + "learning_rate": 1.3271281836751062e-06, + "loss": 0.606, + "step": 48236 + }, + { + "epoch": 1.24, + "learning_rate": 1.3271020355250696e-06, + "loss": 0.5962, + "step": 48237 + }, + { + "epoch": 1.24, + "learning_rate": 1.3270758871245861e-06, + "loss": 0.6948, + "step": 48238 + }, + { + "epoch": 1.24, + "learning_rate": 1.3270497384736758e-06, + "loss": 0.6426, + "step": 48239 + }, + { + "epoch": 1.24, + "learning_rate": 1.3270235895723585e-06, + "loss": 0.6011, + "step": 48240 + }, + { + "epoch": 1.24, + "learning_rate": 1.3269974404206541e-06, + "loss": 0.6484, + "step": 48241 + }, + { + "epoch": 1.24, + "learning_rate": 1.326971291018583e-06, + "loss": 0.7314, + "step": 48242 + }, + { + "epoch": 1.24, + "learning_rate": 1.3269451413661646e-06, + "loss": 0.5327, + "step": 48243 + }, + { + "epoch": 1.24, + "learning_rate": 1.3269189914634197e-06, + "loss": 0.5972, + "step": 48244 + }, + { + "epoch": 1.24, + "learning_rate": 1.326892841310368e-06, + "loss": 0.6768, + "step": 48245 + }, + { + "epoch": 1.24, + "learning_rate": 1.3268666909070292e-06, + "loss": 0.5625, + "step": 48246 + }, + { + "epoch": 1.24, + "learning_rate": 1.3268405402534236e-06, + "loss": 0.561, + "step": 48247 + }, + { + "epoch": 1.24, + "learning_rate": 1.3268143893495713e-06, + "loss": 0.6328, + "step": 48248 + }, + { + "epoch": 1.24, + "learning_rate": 1.3267882381954927e-06, + "loss": 0.7422, + "step": 48249 + }, + { + "epoch": 1.24, + "learning_rate": 1.326762086791207e-06, + "loss": 0.4951, + "step": 48250 + }, + { + "epoch": 1.24, + "learning_rate": 1.3267359351367344e-06, + "loss": 0.5393, + "step": 48251 + }, + { + "epoch": 1.24, + "learning_rate": 1.3267097832320952e-06, + "loss": 0.4546, + "step": 48252 + }, + { + "epoch": 1.24, + "learning_rate": 1.3266836310773095e-06, + "loss": 0.7686, + "step": 48253 + }, + { + "epoch": 1.24, + "learning_rate": 1.3266574786723973e-06, + "loss": 0.3999, + "step": 48254 + }, + { + "epoch": 1.24, + "learning_rate": 1.3266313260173782e-06, + "loss": 0.665, + "step": 48255 + }, + { + "epoch": 1.24, + "learning_rate": 1.3266051731122725e-06, + "loss": 0.6357, + "step": 48256 + }, + { + "epoch": 1.24, + "learning_rate": 1.3265790199571006e-06, + "loss": 0.6616, + "step": 48257 + }, + { + "epoch": 1.24, + "learning_rate": 1.3265528665518816e-06, + "loss": 0.8867, + "step": 48258 + }, + { + "epoch": 1.24, + "learning_rate": 1.3265267128966367e-06, + "loss": 0.4722, + "step": 48259 + }, + { + "epoch": 1.24, + "learning_rate": 1.326500558991385e-06, + "loss": 0.5122, + "step": 48260 + }, + { + "epoch": 1.24, + "learning_rate": 1.3264744048361467e-06, + "loss": 0.7158, + "step": 48261 + }, + { + "epoch": 1.24, + "learning_rate": 1.326448250430942e-06, + "loss": 0.6514, + "step": 48262 + }, + { + "epoch": 1.24, + "learning_rate": 1.326422095775791e-06, + "loss": 0.6484, + "step": 48263 + }, + { + "epoch": 1.24, + "learning_rate": 1.3263959408707137e-06, + "loss": 0.5796, + "step": 48264 + }, + { + "epoch": 1.24, + "learning_rate": 1.32636978571573e-06, + "loss": 0.6221, + "step": 48265 + }, + { + "epoch": 1.24, + "learning_rate": 1.32634363031086e-06, + "loss": 0.5092, + "step": 48266 + }, + { + "epoch": 1.24, + "learning_rate": 1.3263174746561233e-06, + "loss": 0.592, + "step": 48267 + }, + { + "epoch": 1.24, + "learning_rate": 1.3262913187515405e-06, + "loss": 0.8154, + "step": 48268 + }, + { + "epoch": 1.24, + "learning_rate": 1.326265162597132e-06, + "loss": 0.6426, + "step": 48269 + }, + { + "epoch": 1.24, + "learning_rate": 1.3262390061929166e-06, + "loss": 0.5088, + "step": 48270 + }, + { + "epoch": 1.24, + "learning_rate": 1.3262128495389154e-06, + "loss": 0.7793, + "step": 48271 + }, + { + "epoch": 1.24, + "learning_rate": 1.3261866926351476e-06, + "loss": 0.7681, + "step": 48272 + }, + { + "epoch": 1.24, + "learning_rate": 1.326160535481634e-06, + "loss": 0.7529, + "step": 48273 + }, + { + "epoch": 1.24, + "learning_rate": 1.326134378078394e-06, + "loss": 0.5874, + "step": 48274 + }, + { + "epoch": 1.24, + "learning_rate": 1.3261082204254482e-06, + "loss": 0.6489, + "step": 48275 + }, + { + "epoch": 1.24, + "learning_rate": 1.326082062522816e-06, + "loss": 0.8223, + "step": 48276 + }, + { + "epoch": 1.24, + "learning_rate": 1.3260559043705183e-06, + "loss": 0.7295, + "step": 48277 + }, + { + "epoch": 1.24, + "learning_rate": 1.3260297459685738e-06, + "loss": 0.6953, + "step": 48278 + }, + { + "epoch": 1.24, + "learning_rate": 1.3260035873170039e-06, + "loss": 0.7393, + "step": 48279 + }, + { + "epoch": 1.24, + "learning_rate": 1.325977428415828e-06, + "loss": 0.7432, + "step": 48280 + }, + { + "epoch": 1.24, + "learning_rate": 1.3259512692650659e-06, + "loss": 0.6699, + "step": 48281 + }, + { + "epoch": 1.24, + "learning_rate": 1.3259251098647378e-06, + "loss": 0.6992, + "step": 48282 + }, + { + "epoch": 1.24, + "learning_rate": 1.3258989502148642e-06, + "loss": 0.6611, + "step": 48283 + }, + { + "epoch": 1.24, + "learning_rate": 1.325872790315465e-06, + "loss": 0.6631, + "step": 48284 + }, + { + "epoch": 1.24, + "learning_rate": 1.3258466301665593e-06, + "loss": 0.4667, + "step": 48285 + }, + { + "epoch": 1.24, + "learning_rate": 1.3258204697681684e-06, + "loss": 0.7104, + "step": 48286 + }, + { + "epoch": 1.24, + "learning_rate": 1.3257943091203112e-06, + "loss": 0.8486, + "step": 48287 + }, + { + "epoch": 1.24, + "learning_rate": 1.3257681482230087e-06, + "loss": 0.623, + "step": 48288 + }, + { + "epoch": 1.24, + "learning_rate": 1.3257419870762804e-06, + "loss": 0.4692, + "step": 48289 + }, + { + "epoch": 1.24, + "learning_rate": 1.3257158256801467e-06, + "loss": 0.7573, + "step": 48290 + }, + { + "epoch": 1.24, + "learning_rate": 1.325689664034627e-06, + "loss": 0.707, + "step": 48291 + }, + { + "epoch": 1.24, + "learning_rate": 1.3256635021397418e-06, + "loss": 0.6104, + "step": 48292 + }, + { + "epoch": 1.24, + "learning_rate": 1.3256373399955107e-06, + "loss": 0.5054, + "step": 48293 + }, + { + "epoch": 1.24, + "learning_rate": 1.3256111776019548e-06, + "loss": 0.5364, + "step": 48294 + }, + { + "epoch": 1.24, + "learning_rate": 1.3255850149590928e-06, + "loss": 0.4692, + "step": 48295 + }, + { + "epoch": 1.24, + "learning_rate": 1.3255588520669453e-06, + "loss": 0.6807, + "step": 48296 + }, + { + "epoch": 1.24, + "learning_rate": 1.3255326889255324e-06, + "loss": 0.6299, + "step": 48297 + }, + { + "epoch": 1.24, + "learning_rate": 1.3255065255348745e-06, + "loss": 0.8086, + "step": 48298 + }, + { + "epoch": 1.24, + "learning_rate": 1.325480361894991e-06, + "loss": 0.6675, + "step": 48299 + }, + { + "epoch": 1.24, + "learning_rate": 1.325454198005902e-06, + "loss": 0.5801, + "step": 48300 + }, + { + "epoch": 1.24, + "learning_rate": 1.325428033867628e-06, + "loss": 0.4958, + "step": 48301 + }, + { + "epoch": 1.24, + "learning_rate": 1.3254018694801882e-06, + "loss": 0.6426, + "step": 48302 + }, + { + "epoch": 1.24, + "learning_rate": 1.3253757048436035e-06, + "loss": 0.6621, + "step": 48303 + }, + { + "epoch": 1.24, + "learning_rate": 1.3253495399578937e-06, + "loss": 0.6367, + "step": 48304 + }, + { + "epoch": 1.24, + "learning_rate": 1.3253233748230788e-06, + "loss": 0.8623, + "step": 48305 + }, + { + "epoch": 1.24, + "learning_rate": 1.3252972094391783e-06, + "loss": 0.5547, + "step": 48306 + }, + { + "epoch": 1.24, + "learning_rate": 1.3252710438062129e-06, + "loss": 0.4512, + "step": 48307 + }, + { + "epoch": 1.24, + "learning_rate": 1.3252448779242026e-06, + "loss": 0.6621, + "step": 48308 + }, + { + "epoch": 1.24, + "learning_rate": 1.325218711793167e-06, + "loss": 0.6719, + "step": 48309 + }, + { + "epoch": 1.24, + "learning_rate": 1.3251925454131265e-06, + "loss": 0.5635, + "step": 48310 + }, + { + "epoch": 1.24, + "learning_rate": 1.325166378784101e-06, + "loss": 0.4644, + "step": 48311 + }, + { + "epoch": 1.24, + "learning_rate": 1.3251402119061104e-06, + "loss": 0.5212, + "step": 48312 + }, + { + "epoch": 1.24, + "learning_rate": 1.3251140447791754e-06, + "loss": 0.7178, + "step": 48313 + }, + { + "epoch": 1.24, + "learning_rate": 1.325087877403315e-06, + "loss": 0.6001, + "step": 48314 + }, + { + "epoch": 1.24, + "learning_rate": 1.3250617097785498e-06, + "loss": 0.5017, + "step": 48315 + }, + { + "epoch": 1.24, + "learning_rate": 1.3250355419049e-06, + "loss": 0.6875, + "step": 48316 + }, + { + "epoch": 1.24, + "learning_rate": 1.3250093737823853e-06, + "loss": 0.6992, + "step": 48317 + }, + { + "epoch": 1.24, + "learning_rate": 1.3249832054110259e-06, + "loss": 0.7754, + "step": 48318 + }, + { + "epoch": 1.24, + "learning_rate": 1.3249570367908419e-06, + "loss": 0.6719, + "step": 48319 + }, + { + "epoch": 1.24, + "learning_rate": 1.3249308679218531e-06, + "loss": 0.6343, + "step": 48320 + }, + { + "epoch": 1.24, + "learning_rate": 1.3249046988040796e-06, + "loss": 0.5771, + "step": 48321 + }, + { + "epoch": 1.24, + "learning_rate": 1.3248785294375418e-06, + "loss": 0.8311, + "step": 48322 + }, + { + "epoch": 1.24, + "learning_rate": 1.3248523598222592e-06, + "loss": 0.7983, + "step": 48323 + }, + { + "epoch": 1.24, + "learning_rate": 1.3248261899582522e-06, + "loss": 0.606, + "step": 48324 + }, + { + "epoch": 1.24, + "learning_rate": 1.3248000198455407e-06, + "loss": 0.7227, + "step": 48325 + }, + { + "epoch": 1.24, + "learning_rate": 1.3247738494841447e-06, + "loss": 0.6416, + "step": 48326 + }, + { + "epoch": 1.24, + "learning_rate": 1.3247476788740844e-06, + "loss": 0.7231, + "step": 48327 + }, + { + "epoch": 1.24, + "learning_rate": 1.3247215080153797e-06, + "loss": 0.6211, + "step": 48328 + }, + { + "epoch": 1.24, + "learning_rate": 1.3246953369080507e-06, + "loss": 0.4946, + "step": 48329 + }, + { + "epoch": 1.24, + "learning_rate": 1.3246691655521173e-06, + "loss": 0.5518, + "step": 48330 + }, + { + "epoch": 1.24, + "learning_rate": 1.3246429939475997e-06, + "loss": 0.708, + "step": 48331 + }, + { + "epoch": 1.24, + "learning_rate": 1.3246168220945179e-06, + "loss": 0.7256, + "step": 48332 + }, + { + "epoch": 1.24, + "learning_rate": 1.324590649992892e-06, + "loss": 0.3894, + "step": 48333 + }, + { + "epoch": 1.24, + "learning_rate": 1.3245644776427421e-06, + "loss": 0.5703, + "step": 48334 + }, + { + "epoch": 1.24, + "learning_rate": 1.3245383050440878e-06, + "loss": 0.5269, + "step": 48335 + }, + { + "epoch": 1.24, + "learning_rate": 1.3245121321969495e-06, + "loss": 0.5371, + "step": 48336 + }, + { + "epoch": 1.24, + "learning_rate": 1.324485959101347e-06, + "loss": 0.4856, + "step": 48337 + }, + { + "epoch": 1.24, + "learning_rate": 1.324459785757301e-06, + "loss": 0.708, + "step": 48338 + }, + { + "epoch": 1.24, + "learning_rate": 1.3244336121648306e-06, + "loss": 0.542, + "step": 48339 + }, + { + "epoch": 1.24, + "learning_rate": 1.3244074383239567e-06, + "loss": 0.7168, + "step": 48340 + }, + { + "epoch": 1.24, + "learning_rate": 1.3243812642346988e-06, + "loss": 0.6709, + "step": 48341 + }, + { + "epoch": 1.24, + "learning_rate": 1.324355089897077e-06, + "loss": 0.6382, + "step": 48342 + }, + { + "epoch": 1.24, + "learning_rate": 1.3243289153111115e-06, + "loss": 0.6455, + "step": 48343 + }, + { + "epoch": 1.24, + "learning_rate": 1.324302740476822e-06, + "loss": 0.6958, + "step": 48344 + }, + { + "epoch": 1.24, + "learning_rate": 1.3242765653942292e-06, + "loss": 0.4833, + "step": 48345 + }, + { + "epoch": 1.24, + "learning_rate": 1.3242503900633523e-06, + "loss": 0.666, + "step": 48346 + }, + { + "epoch": 1.24, + "learning_rate": 1.3242242144842122e-06, + "loss": 0.6011, + "step": 48347 + }, + { + "epoch": 1.24, + "learning_rate": 1.3241980386568284e-06, + "loss": 0.5591, + "step": 48348 + }, + { + "epoch": 1.24, + "learning_rate": 1.324171862581221e-06, + "loss": 0.606, + "step": 48349 + }, + { + "epoch": 1.24, + "learning_rate": 1.32414568625741e-06, + "loss": 0.6694, + "step": 48350 + }, + { + "epoch": 1.24, + "learning_rate": 1.3241195096854158e-06, + "loss": 0.6968, + "step": 48351 + }, + { + "epoch": 1.24, + "learning_rate": 1.3240933328652578e-06, + "loss": 0.5645, + "step": 48352 + }, + { + "epoch": 1.24, + "learning_rate": 1.3240671557969573e-06, + "loss": 0.4745, + "step": 48353 + }, + { + "epoch": 1.24, + "learning_rate": 1.3240409784805327e-06, + "loss": 0.6875, + "step": 48354 + }, + { + "epoch": 1.24, + "learning_rate": 1.324014800916005e-06, + "loss": 0.6455, + "step": 48355 + }, + { + "epoch": 1.24, + "learning_rate": 1.323988623103394e-06, + "loss": 0.4712, + "step": 48356 + }, + { + "epoch": 1.24, + "learning_rate": 1.32396244504272e-06, + "loss": 0.5073, + "step": 48357 + }, + { + "epoch": 1.24, + "learning_rate": 1.323936266734003e-06, + "loss": 0.7178, + "step": 48358 + }, + { + "epoch": 1.24, + "learning_rate": 1.3239100881772627e-06, + "loss": 0.7314, + "step": 48359 + }, + { + "epoch": 1.24, + "learning_rate": 1.323883909372519e-06, + "loss": 0.647, + "step": 48360 + }, + { + "epoch": 1.24, + "learning_rate": 1.323857730319793e-06, + "loss": 0.5396, + "step": 48361 + }, + { + "epoch": 1.24, + "learning_rate": 1.3238315510191033e-06, + "loss": 0.8525, + "step": 48362 + }, + { + "epoch": 1.24, + "learning_rate": 1.323805371470471e-06, + "loss": 0.472, + "step": 48363 + }, + { + "epoch": 1.24, + "learning_rate": 1.3237791916739159e-06, + "loss": 0.6597, + "step": 48364 + }, + { + "epoch": 1.24, + "learning_rate": 1.3237530116294578e-06, + "loss": 0.6396, + "step": 48365 + }, + { + "epoch": 1.24, + "learning_rate": 1.323726831337117e-06, + "loss": 0.7256, + "step": 48366 + }, + { + "epoch": 1.24, + "learning_rate": 1.3237006507969133e-06, + "loss": 0.5425, + "step": 48367 + }, + { + "epoch": 1.24, + "learning_rate": 1.3236744700088674e-06, + "loss": 0.7246, + "step": 48368 + }, + { + "epoch": 1.24, + "learning_rate": 1.3236482889729981e-06, + "loss": 0.5762, + "step": 48369 + }, + { + "epoch": 1.24, + "learning_rate": 1.3236221076893266e-06, + "loss": 0.6768, + "step": 48370 + }, + { + "epoch": 1.24, + "learning_rate": 1.3235959261578725e-06, + "loss": 0.5464, + "step": 48371 + }, + { + "epoch": 1.24, + "learning_rate": 1.3235697443786558e-06, + "loss": 0.5959, + "step": 48372 + }, + { + "epoch": 1.24, + "learning_rate": 1.3235435623516967e-06, + "loss": 0.7119, + "step": 48373 + }, + { + "epoch": 1.24, + "learning_rate": 1.3235173800770153e-06, + "loss": 0.479, + "step": 48374 + }, + { + "epoch": 1.24, + "learning_rate": 1.3234911975546313e-06, + "loss": 0.665, + "step": 48375 + }, + { + "epoch": 1.24, + "learning_rate": 1.323465014784565e-06, + "loss": 0.7578, + "step": 48376 + }, + { + "epoch": 1.24, + "learning_rate": 1.3234388317668361e-06, + "loss": 0.7017, + "step": 48377 + }, + { + "epoch": 1.24, + "learning_rate": 1.3234126485014656e-06, + "loss": 0.6294, + "step": 48378 + }, + { + "epoch": 1.24, + "learning_rate": 1.3233864649884728e-06, + "loss": 0.4189, + "step": 48379 + }, + { + "epoch": 1.24, + "learning_rate": 1.3233602812278774e-06, + "loss": 0.5696, + "step": 48380 + }, + { + "epoch": 1.24, + "learning_rate": 1.3233340972197002e-06, + "loss": 0.5552, + "step": 48381 + }, + { + "epoch": 1.24, + "learning_rate": 1.323307912963961e-06, + "loss": 0.6228, + "step": 48382 + }, + { + "epoch": 1.24, + "learning_rate": 1.3232817284606797e-06, + "loss": 0.7559, + "step": 48383 + }, + { + "epoch": 1.24, + "learning_rate": 1.3232555437098764e-06, + "loss": 0.7529, + "step": 48384 + }, + { + "epoch": 1.24, + "learning_rate": 1.3232293587115713e-06, + "loss": 0.7881, + "step": 48385 + }, + { + "epoch": 1.24, + "learning_rate": 1.3232031734657843e-06, + "loss": 0.7158, + "step": 48386 + }, + { + "epoch": 1.24, + "learning_rate": 1.3231769879725354e-06, + "loss": 0.6504, + "step": 48387 + }, + { + "epoch": 1.24, + "learning_rate": 1.323150802231845e-06, + "loss": 0.7197, + "step": 48388 + }, + { + "epoch": 1.24, + "learning_rate": 1.3231246162437327e-06, + "loss": 0.6021, + "step": 48389 + }, + { + "epoch": 1.24, + "learning_rate": 1.3230984300082187e-06, + "loss": 0.5129, + "step": 48390 + }, + { + "epoch": 1.24, + "learning_rate": 1.323072243525323e-06, + "loss": 0.6787, + "step": 48391 + }, + { + "epoch": 1.24, + "learning_rate": 1.3230460567950656e-06, + "loss": 0.6357, + "step": 48392 + }, + { + "epoch": 1.24, + "learning_rate": 1.3230198698174673e-06, + "loss": 0.6416, + "step": 48393 + }, + { + "epoch": 1.24, + "learning_rate": 1.3229936825925472e-06, + "loss": 0.5806, + "step": 48394 + }, + { + "epoch": 1.24, + "learning_rate": 1.3229674951203257e-06, + "loss": 0.7246, + "step": 48395 + }, + { + "epoch": 1.24, + "learning_rate": 1.3229413074008227e-06, + "loss": 0.6162, + "step": 48396 + }, + { + "epoch": 1.24, + "learning_rate": 1.3229151194340586e-06, + "loss": 0.6438, + "step": 48397 + }, + { + "epoch": 1.24, + "learning_rate": 1.3228889312200533e-06, + "loss": 0.6904, + "step": 48398 + }, + { + "epoch": 1.24, + "learning_rate": 1.3228627427588266e-06, + "loss": 0.6318, + "step": 48399 + }, + { + "epoch": 1.24, + "learning_rate": 1.3228365540503988e-06, + "loss": 0.5708, + "step": 48400 + }, + { + "epoch": 1.24, + "learning_rate": 1.3228103650947898e-06, + "loss": 0.5649, + "step": 48401 + }, + { + "epoch": 1.24, + "learning_rate": 1.3227841758920197e-06, + "loss": 0.7754, + "step": 48402 + }, + { + "epoch": 1.24, + "learning_rate": 1.322757986442109e-06, + "loss": 0.7695, + "step": 48403 + }, + { + "epoch": 1.24, + "learning_rate": 1.322731796745077e-06, + "loss": 0.5765, + "step": 48404 + }, + { + "epoch": 1.24, + "learning_rate": 1.3227056068009443e-06, + "loss": 0.5244, + "step": 48405 + }, + { + "epoch": 1.24, + "learning_rate": 1.3226794166097307e-06, + "loss": 0.6885, + "step": 48406 + }, + { + "epoch": 1.24, + "learning_rate": 1.322653226171456e-06, + "loss": 0.708, + "step": 48407 + }, + { + "epoch": 1.24, + "learning_rate": 1.322627035486141e-06, + "loss": 0.5552, + "step": 48408 + }, + { + "epoch": 1.24, + "learning_rate": 1.3226008445538051e-06, + "loss": 0.6787, + "step": 48409 + }, + { + "epoch": 1.24, + "learning_rate": 1.3225746533744685e-06, + "loss": 0.6504, + "step": 48410 + }, + { + "epoch": 1.24, + "learning_rate": 1.3225484619481513e-06, + "loss": 0.6533, + "step": 48411 + }, + { + "epoch": 1.24, + "learning_rate": 1.3225222702748738e-06, + "loss": 0.7085, + "step": 48412 + }, + { + "epoch": 1.24, + "learning_rate": 1.3224960783546557e-06, + "loss": 0.5872, + "step": 48413 + }, + { + "epoch": 1.24, + "learning_rate": 1.3224698861875175e-06, + "loss": 0.5591, + "step": 48414 + }, + { + "epoch": 1.24, + "learning_rate": 1.3224436937734783e-06, + "loss": 0.6484, + "step": 48415 + }, + { + "epoch": 1.24, + "learning_rate": 1.3224175011125593e-06, + "loss": 0.6035, + "step": 48416 + }, + { + "epoch": 1.24, + "learning_rate": 1.3223913082047798e-06, + "loss": 0.6768, + "step": 48417 + }, + { + "epoch": 1.24, + "learning_rate": 1.3223651150501605e-06, + "loss": 0.7158, + "step": 48418 + }, + { + "epoch": 1.24, + "learning_rate": 1.3223389216487204e-06, + "loss": 0.5535, + "step": 48419 + }, + { + "epoch": 1.24, + "learning_rate": 1.3223127280004807e-06, + "loss": 0.7656, + "step": 48420 + }, + { + "epoch": 1.24, + "learning_rate": 1.3222865341054606e-06, + "loss": 0.7832, + "step": 48421 + }, + { + "epoch": 1.24, + "learning_rate": 1.3222603399636807e-06, + "loss": 0.7324, + "step": 48422 + }, + { + "epoch": 1.24, + "learning_rate": 1.322234145575161e-06, + "loss": 0.5796, + "step": 48423 + }, + { + "epoch": 1.24, + "learning_rate": 1.3222079509399216e-06, + "loss": 0.6982, + "step": 48424 + }, + { + "epoch": 1.24, + "learning_rate": 1.3221817560579819e-06, + "loss": 0.7686, + "step": 48425 + }, + { + "epoch": 1.24, + "learning_rate": 1.3221555609293626e-06, + "loss": 0.5298, + "step": 48426 + }, + { + "epoch": 1.24, + "learning_rate": 1.3221293655540836e-06, + "loss": 0.6533, + "step": 48427 + }, + { + "epoch": 1.24, + "learning_rate": 1.322103169932165e-06, + "loss": 0.6548, + "step": 48428 + }, + { + "epoch": 1.24, + "learning_rate": 1.322076974063627e-06, + "loss": 0.6714, + "step": 48429 + }, + { + "epoch": 1.24, + "learning_rate": 1.3220507779484894e-06, + "loss": 0.5193, + "step": 48430 + }, + { + "epoch": 1.24, + "learning_rate": 1.3220245815867718e-06, + "loss": 0.6294, + "step": 48431 + }, + { + "epoch": 1.24, + "learning_rate": 1.3219983849784955e-06, + "loss": 0.6465, + "step": 48432 + }, + { + "epoch": 1.24, + "learning_rate": 1.3219721881236796e-06, + "loss": 0.6445, + "step": 48433 + }, + { + "epoch": 1.24, + "learning_rate": 1.321945991022344e-06, + "loss": 0.5669, + "step": 48434 + }, + { + "epoch": 1.24, + "learning_rate": 1.3219197936745096e-06, + "loss": 0.6187, + "step": 48435 + }, + { + "epoch": 1.24, + "learning_rate": 1.321893596080196e-06, + "loss": 0.6899, + "step": 48436 + }, + { + "epoch": 1.24, + "learning_rate": 1.3218673982394233e-06, + "loss": 0.5508, + "step": 48437 + }, + { + "epoch": 1.24, + "learning_rate": 1.3218412001522116e-06, + "loss": 0.6191, + "step": 48438 + }, + { + "epoch": 1.24, + "learning_rate": 1.3218150018185806e-06, + "loss": 0.835, + "step": 48439 + }, + { + "epoch": 1.24, + "learning_rate": 1.3217888032385507e-06, + "loss": 0.8096, + "step": 48440 + }, + { + "epoch": 1.24, + "learning_rate": 1.321762604412142e-06, + "loss": 0.5991, + "step": 48441 + }, + { + "epoch": 1.24, + "learning_rate": 1.3217364053393743e-06, + "loss": 0.5051, + "step": 48442 + }, + { + "epoch": 1.24, + "learning_rate": 1.3217102060202682e-06, + "loss": 0.4775, + "step": 48443 + }, + { + "epoch": 1.24, + "learning_rate": 1.3216840064548431e-06, + "loss": 0.9229, + "step": 48444 + }, + { + "epoch": 1.24, + "learning_rate": 1.3216578066431195e-06, + "loss": 0.7295, + "step": 48445 + }, + { + "epoch": 1.24, + "learning_rate": 1.321631606585117e-06, + "loss": 0.5776, + "step": 48446 + }, + { + "epoch": 1.24, + "learning_rate": 1.3216054062808563e-06, + "loss": 0.5718, + "step": 48447 + }, + { + "epoch": 1.24, + "learning_rate": 1.321579205730357e-06, + "loss": 0.7222, + "step": 48448 + }, + { + "epoch": 1.24, + "learning_rate": 1.3215530049336395e-06, + "loss": 0.3511, + "step": 48449 + }, + { + "epoch": 1.24, + "learning_rate": 1.3215268038907232e-06, + "loss": 0.5806, + "step": 48450 + }, + { + "epoch": 1.24, + "learning_rate": 1.3215006026016291e-06, + "loss": 0.5093, + "step": 48451 + }, + { + "epoch": 1.24, + "learning_rate": 1.3214744010663762e-06, + "loss": 0.4346, + "step": 48452 + }, + { + "epoch": 1.24, + "learning_rate": 1.3214481992849857e-06, + "loss": 0.5269, + "step": 48453 + }, + { + "epoch": 1.24, + "learning_rate": 1.3214219972574769e-06, + "loss": 0.6104, + "step": 48454 + }, + { + "epoch": 1.24, + "learning_rate": 1.3213957949838698e-06, + "loss": 0.6387, + "step": 48455 + }, + { + "epoch": 1.24, + "learning_rate": 1.321369592464185e-06, + "loss": 0.5781, + "step": 48456 + }, + { + "epoch": 1.24, + "learning_rate": 1.3213433896984425e-06, + "loss": 0.6064, + "step": 48457 + }, + { + "epoch": 1.24, + "learning_rate": 1.321317186686662e-06, + "loss": 0.7773, + "step": 48458 + }, + { + "epoch": 1.24, + "learning_rate": 1.3212909834288633e-06, + "loss": 0.7236, + "step": 48459 + }, + { + "epoch": 1.24, + "learning_rate": 1.3212647799250671e-06, + "loss": 0.6533, + "step": 48460 + }, + { + "epoch": 1.24, + "learning_rate": 1.3212385761752934e-06, + "loss": 0.5194, + "step": 48461 + }, + { + "epoch": 1.24, + "learning_rate": 1.3212123721795618e-06, + "loss": 0.7764, + "step": 48462 + }, + { + "epoch": 1.24, + "learning_rate": 1.3211861679378927e-06, + "loss": 0.5518, + "step": 48463 + }, + { + "epoch": 1.24, + "learning_rate": 1.3211599634503065e-06, + "loss": 0.7319, + "step": 48464 + }, + { + "epoch": 1.24, + "learning_rate": 1.3211337587168226e-06, + "loss": 0.605, + "step": 48465 + }, + { + "epoch": 1.24, + "learning_rate": 1.3211075537374613e-06, + "loss": 0.7793, + "step": 48466 + }, + { + "epoch": 1.24, + "learning_rate": 1.3210813485122428e-06, + "loss": 0.7124, + "step": 48467 + }, + { + "epoch": 1.24, + "learning_rate": 1.3210551430411871e-06, + "loss": 0.752, + "step": 48468 + }, + { + "epoch": 1.24, + "learning_rate": 1.3210289373243143e-06, + "loss": 0.7109, + "step": 48469 + }, + { + "epoch": 1.24, + "learning_rate": 1.3210027313616443e-06, + "loss": 0.7358, + "step": 48470 + }, + { + "epoch": 1.24, + "learning_rate": 1.320976525153197e-06, + "loss": 0.6245, + "step": 48471 + }, + { + "epoch": 1.24, + "learning_rate": 1.320950318698993e-06, + "loss": 0.6699, + "step": 48472 + }, + { + "epoch": 1.24, + "learning_rate": 1.3209241119990523e-06, + "loss": 0.5859, + "step": 48473 + }, + { + "epoch": 1.24, + "learning_rate": 1.3208979050533945e-06, + "loss": 0.7715, + "step": 48474 + }, + { + "epoch": 1.24, + "learning_rate": 1.32087169786204e-06, + "loss": 0.6274, + "step": 48475 + }, + { + "epoch": 1.24, + "learning_rate": 1.320845490425009e-06, + "loss": 0.6782, + "step": 48476 + }, + { + "epoch": 1.24, + "learning_rate": 1.3208192827423208e-06, + "loss": 0.7773, + "step": 48477 + }, + { + "epoch": 1.24, + "learning_rate": 1.3207930748139963e-06, + "loss": 0.3983, + "step": 48478 + }, + { + "epoch": 1.24, + "learning_rate": 1.3207668666400556e-06, + "loss": 0.6187, + "step": 48479 + }, + { + "epoch": 1.24, + "learning_rate": 1.320740658220518e-06, + "loss": 0.7334, + "step": 48480 + }, + { + "epoch": 1.24, + "learning_rate": 1.3207144495554045e-06, + "loss": 0.6699, + "step": 48481 + }, + { + "epoch": 1.24, + "learning_rate": 1.3206882406447342e-06, + "loss": 0.6353, + "step": 48482 + }, + { + "epoch": 1.24, + "learning_rate": 1.320662031488528e-06, + "loss": 0.7812, + "step": 48483 + }, + { + "epoch": 1.24, + "learning_rate": 1.3206358220868057e-06, + "loss": 0.6699, + "step": 48484 + }, + { + "epoch": 1.24, + "learning_rate": 1.320609612439587e-06, + "loss": 0.7051, + "step": 48485 + }, + { + "epoch": 1.24, + "learning_rate": 1.3205834025468924e-06, + "loss": 0.7754, + "step": 48486 + }, + { + "epoch": 1.24, + "learning_rate": 1.3205571924087417e-06, + "loss": 0.6523, + "step": 48487 + }, + { + "epoch": 1.24, + "learning_rate": 1.3205309820251552e-06, + "loss": 0.7627, + "step": 48488 + }, + { + "epoch": 1.24, + "learning_rate": 1.3205047713961532e-06, + "loss": 0.665, + "step": 48489 + }, + { + "epoch": 1.24, + "learning_rate": 1.320478560521755e-06, + "loss": 0.6338, + "step": 48490 + }, + { + "epoch": 1.24, + "learning_rate": 1.3204523494019812e-06, + "loss": 0.7061, + "step": 48491 + }, + { + "epoch": 1.24, + "learning_rate": 1.3204261380368515e-06, + "loss": 0.6719, + "step": 48492 + }, + { + "epoch": 1.24, + "learning_rate": 1.320399926426387e-06, + "loss": 0.8164, + "step": 48493 + }, + { + "epoch": 1.24, + "learning_rate": 1.3203737145706063e-06, + "loss": 0.7603, + "step": 48494 + }, + { + "epoch": 1.24, + "learning_rate": 1.3203475024695305e-06, + "loss": 0.709, + "step": 48495 + }, + { + "epoch": 1.24, + "learning_rate": 1.3203212901231792e-06, + "loss": 0.7051, + "step": 48496 + }, + { + "epoch": 1.24, + "learning_rate": 1.3202950775315726e-06, + "loss": 0.6372, + "step": 48497 + }, + { + "epoch": 1.24, + "learning_rate": 1.3202688646947311e-06, + "loss": 0.6895, + "step": 48498 + }, + { + "epoch": 1.24, + "learning_rate": 1.3202426516126739e-06, + "loss": 0.6855, + "step": 48499 + }, + { + "epoch": 1.24, + "learning_rate": 1.3202164382854221e-06, + "loss": 0.4741, + "step": 48500 + }, + { + "epoch": 1.24, + "learning_rate": 1.320190224712995e-06, + "loss": 0.7725, + "step": 48501 + }, + { + "epoch": 1.24, + "learning_rate": 1.3201640108954133e-06, + "loss": 0.6514, + "step": 48502 + }, + { + "epoch": 1.24, + "learning_rate": 1.3201377968326965e-06, + "loss": 0.6826, + "step": 48503 + }, + { + "epoch": 1.24, + "learning_rate": 1.320111582524865e-06, + "loss": 0.4556, + "step": 48504 + }, + { + "epoch": 1.24, + "learning_rate": 1.3200853679719388e-06, + "loss": 0.748, + "step": 48505 + }, + { + "epoch": 1.24, + "learning_rate": 1.3200591531739378e-06, + "loss": 0.5835, + "step": 48506 + }, + { + "epoch": 1.24, + "learning_rate": 1.3200329381308822e-06, + "loss": 0.793, + "step": 48507 + }, + { + "epoch": 1.24, + "learning_rate": 1.3200067228427924e-06, + "loss": 0.75, + "step": 48508 + }, + { + "epoch": 1.24, + "learning_rate": 1.319980507309688e-06, + "loss": 0.6953, + "step": 48509 + }, + { + "epoch": 1.24, + "learning_rate": 1.3199542915315892e-06, + "loss": 0.7119, + "step": 48510 + }, + { + "epoch": 1.24, + "learning_rate": 1.319928075508516e-06, + "loss": 0.7119, + "step": 48511 + }, + { + "epoch": 1.24, + "learning_rate": 1.3199018592404887e-06, + "loss": 0.7173, + "step": 48512 + }, + { + "epoch": 1.24, + "learning_rate": 1.3198756427275274e-06, + "loss": 0.7295, + "step": 48513 + }, + { + "epoch": 1.24, + "learning_rate": 1.319849425969652e-06, + "loss": 0.6816, + "step": 48514 + }, + { + "epoch": 1.24, + "learning_rate": 1.3198232089668824e-06, + "loss": 0.5649, + "step": 48515 + }, + { + "epoch": 1.24, + "learning_rate": 1.3197969917192388e-06, + "loss": 0.665, + "step": 48516 + }, + { + "epoch": 1.24, + "learning_rate": 1.3197707742267415e-06, + "loss": 0.7559, + "step": 48517 + }, + { + "epoch": 1.24, + "learning_rate": 1.3197445564894104e-06, + "loss": 0.6514, + "step": 48518 + }, + { + "epoch": 1.24, + "learning_rate": 1.3197183385072659e-06, + "loss": 0.7285, + "step": 48519 + }, + { + "epoch": 1.24, + "learning_rate": 1.3196921202803275e-06, + "loss": 0.6621, + "step": 48520 + }, + { + "epoch": 1.24, + "learning_rate": 1.3196659018086155e-06, + "loss": 0.5938, + "step": 48521 + }, + { + "epoch": 1.24, + "learning_rate": 1.31963968309215e-06, + "loss": 0.6553, + "step": 48522 + }, + { + "epoch": 1.24, + "learning_rate": 1.3196134641309513e-06, + "loss": 0.7207, + "step": 48523 + }, + { + "epoch": 1.24, + "learning_rate": 1.319587244925039e-06, + "loss": 0.5845, + "step": 48524 + }, + { + "epoch": 1.24, + "learning_rate": 1.3195610254744335e-06, + "loss": 0.5977, + "step": 48525 + }, + { + "epoch": 1.24, + "learning_rate": 1.3195348057791549e-06, + "loss": 0.6221, + "step": 48526 + }, + { + "epoch": 1.24, + "learning_rate": 1.3195085858392232e-06, + "loss": 0.4696, + "step": 48527 + }, + { + "epoch": 1.24, + "learning_rate": 1.3194823656546585e-06, + "loss": 0.4653, + "step": 48528 + }, + { + "epoch": 1.24, + "learning_rate": 1.3194561452254809e-06, + "loss": 0.5582, + "step": 48529 + }, + { + "epoch": 1.24, + "learning_rate": 1.3194299245517102e-06, + "loss": 0.7393, + "step": 48530 + }, + { + "epoch": 1.24, + "learning_rate": 1.319403703633367e-06, + "loss": 0.7998, + "step": 48531 + }, + { + "epoch": 1.24, + "learning_rate": 1.3193774824704703e-06, + "loss": 0.5552, + "step": 48532 + }, + { + "epoch": 1.24, + "learning_rate": 1.319351261063042e-06, + "loss": 0.7617, + "step": 48533 + }, + { + "epoch": 1.24, + "learning_rate": 1.3193250394111006e-06, + "loss": 0.6738, + "step": 48534 + }, + { + "epoch": 1.24, + "learning_rate": 1.3192988175146668e-06, + "loss": 0.7163, + "step": 48535 + }, + { + "epoch": 1.24, + "learning_rate": 1.3192725953737603e-06, + "loss": 0.5396, + "step": 48536 + }, + { + "epoch": 1.24, + "learning_rate": 1.3192463729884018e-06, + "loss": 0.6719, + "step": 48537 + }, + { + "epoch": 1.24, + "learning_rate": 1.319220150358611e-06, + "loss": 0.449, + "step": 48538 + }, + { + "epoch": 1.24, + "learning_rate": 1.3191939274844079e-06, + "loss": 0.6128, + "step": 48539 + }, + { + "epoch": 1.24, + "learning_rate": 1.3191677043658125e-06, + "loss": 0.7339, + "step": 48540 + }, + { + "epoch": 1.24, + "learning_rate": 1.3191414810028454e-06, + "loss": 0.6484, + "step": 48541 + }, + { + "epoch": 1.24, + "learning_rate": 1.3191152573955262e-06, + "loss": 0.6313, + "step": 48542 + }, + { + "epoch": 1.24, + "learning_rate": 1.3190890335438751e-06, + "loss": 0.8506, + "step": 48543 + }, + { + "epoch": 1.24, + "learning_rate": 1.3190628094479124e-06, + "loss": 0.6797, + "step": 48544 + }, + { + "epoch": 1.24, + "learning_rate": 1.3190365851076575e-06, + "loss": 0.5576, + "step": 48545 + }, + { + "epoch": 1.24, + "learning_rate": 1.3190103605231312e-06, + "loss": 0.7466, + "step": 48546 + }, + { + "epoch": 1.24, + "learning_rate": 1.3189841356943537e-06, + "loss": 0.7539, + "step": 48547 + }, + { + "epoch": 1.24, + "learning_rate": 1.3189579106213444e-06, + "loss": 0.8506, + "step": 48548 + }, + { + "epoch": 1.24, + "learning_rate": 1.3189316853041236e-06, + "loss": 0.6465, + "step": 48549 + }, + { + "epoch": 1.24, + "learning_rate": 1.3189054597427115e-06, + "loss": 0.6743, + "step": 48550 + }, + { + "epoch": 1.24, + "learning_rate": 1.3188792339371282e-06, + "loss": 0.5601, + "step": 48551 + }, + { + "epoch": 1.24, + "learning_rate": 1.318853007887394e-06, + "loss": 0.6748, + "step": 48552 + }, + { + "epoch": 1.24, + "learning_rate": 1.3188267815935283e-06, + "loss": 0.7344, + "step": 48553 + }, + { + "epoch": 1.24, + "learning_rate": 1.3188005550555518e-06, + "loss": 0.4763, + "step": 48554 + }, + { + "epoch": 1.24, + "learning_rate": 1.3187743282734843e-06, + "loss": 0.8262, + "step": 48555 + }, + { + "epoch": 1.24, + "learning_rate": 1.318748101247346e-06, + "loss": 0.7842, + "step": 48556 + }, + { + "epoch": 1.24, + "learning_rate": 1.318721873977157e-06, + "loss": 0.5503, + "step": 48557 + }, + { + "epoch": 1.24, + "learning_rate": 1.3186956464629372e-06, + "loss": 0.6436, + "step": 48558 + }, + { + "epoch": 1.24, + "learning_rate": 1.3186694187047068e-06, + "loss": 0.6377, + "step": 48559 + }, + { + "epoch": 1.24, + "learning_rate": 1.318643190702486e-06, + "loss": 0.5073, + "step": 48560 + }, + { + "epoch": 1.24, + "learning_rate": 1.3186169624562946e-06, + "loss": 0.7734, + "step": 48561 + }, + { + "epoch": 1.24, + "learning_rate": 1.318590733966153e-06, + "loss": 0.6025, + "step": 48562 + }, + { + "epoch": 1.24, + "learning_rate": 1.3185645052320812e-06, + "loss": 0.7598, + "step": 48563 + }, + { + "epoch": 1.24, + "learning_rate": 1.3185382762540988e-06, + "loss": 0.667, + "step": 48564 + }, + { + "epoch": 1.24, + "learning_rate": 1.3185120470322266e-06, + "loss": 0.7246, + "step": 48565 + }, + { + "epoch": 1.24, + "learning_rate": 1.3184858175664845e-06, + "loss": 0.5588, + "step": 48566 + }, + { + "epoch": 1.24, + "learning_rate": 1.318459587856892e-06, + "loss": 0.4885, + "step": 48567 + }, + { + "epoch": 1.24, + "learning_rate": 1.31843335790347e-06, + "loss": 0.7402, + "step": 48568 + }, + { + "epoch": 1.24, + "learning_rate": 1.3184071277062384e-06, + "loss": 0.5933, + "step": 48569 + }, + { + "epoch": 1.24, + "learning_rate": 1.3183808972652166e-06, + "loss": 0.5811, + "step": 48570 + }, + { + "epoch": 1.24, + "learning_rate": 1.3183546665804255e-06, + "loss": 0.6421, + "step": 48571 + }, + { + "epoch": 1.24, + "learning_rate": 1.3183284356518847e-06, + "loss": 0.5625, + "step": 48572 + }, + { + "epoch": 1.24, + "learning_rate": 1.3183022044796145e-06, + "loss": 0.7373, + "step": 48573 + }, + { + "epoch": 1.24, + "learning_rate": 1.318275973063635e-06, + "loss": 0.6772, + "step": 48574 + }, + { + "epoch": 1.25, + "learning_rate": 1.3182497414039664e-06, + "loss": 0.6758, + "step": 48575 + }, + { + "epoch": 1.25, + "learning_rate": 1.3182235095006282e-06, + "loss": 0.6113, + "step": 48576 + }, + { + "epoch": 1.25, + "learning_rate": 1.3181972773536412e-06, + "loss": 0.5178, + "step": 48577 + }, + { + "epoch": 1.25, + "learning_rate": 1.3181710449630251e-06, + "loss": 0.6729, + "step": 48578 + }, + { + "epoch": 1.25, + "learning_rate": 1.3181448123288003e-06, + "loss": 0.6973, + "step": 48579 + }, + { + "epoch": 1.25, + "learning_rate": 1.3181185794509858e-06, + "loss": 0.6128, + "step": 48580 + }, + { + "epoch": 1.25, + "learning_rate": 1.3180923463296035e-06, + "loss": 0.792, + "step": 48581 + }, + { + "epoch": 1.25, + "learning_rate": 1.3180661129646719e-06, + "loss": 0.6553, + "step": 48582 + }, + { + "epoch": 1.25, + "learning_rate": 1.3180398793562121e-06, + "loss": 0.6206, + "step": 48583 + }, + { + "epoch": 1.25, + "learning_rate": 1.3180136455042436e-06, + "loss": 0.6475, + "step": 48584 + }, + { + "epoch": 1.25, + "learning_rate": 1.3179874114087869e-06, + "loss": 0.6821, + "step": 48585 + }, + { + "epoch": 1.25, + "learning_rate": 1.3179611770698614e-06, + "loss": 0.7632, + "step": 48586 + }, + { + "epoch": 1.25, + "learning_rate": 1.317934942487488e-06, + "loss": 0.665, + "step": 48587 + }, + { + "epoch": 1.25, + "learning_rate": 1.3179087076616863e-06, + "loss": 0.6709, + "step": 48588 + }, + { + "epoch": 1.25, + "learning_rate": 1.3178824725924763e-06, + "loss": 0.5054, + "step": 48589 + }, + { + "epoch": 1.25, + "learning_rate": 1.3178562372798786e-06, + "loss": 0.6367, + "step": 48590 + }, + { + "epoch": 1.25, + "learning_rate": 1.317830001723913e-06, + "loss": 0.7012, + "step": 48591 + }, + { + "epoch": 1.25, + "learning_rate": 1.3178037659245997e-06, + "loss": 0.6904, + "step": 48592 + }, + { + "epoch": 1.25, + "learning_rate": 1.3177775298819587e-06, + "loss": 0.4622, + "step": 48593 + }, + { + "epoch": 1.25, + "learning_rate": 1.3177512935960098e-06, + "loss": 0.6406, + "step": 48594 + }, + { + "epoch": 1.25, + "learning_rate": 1.3177250570667734e-06, + "loss": 0.7959, + "step": 48595 + }, + { + "epoch": 1.25, + "learning_rate": 1.3176988202942695e-06, + "loss": 0.5688, + "step": 48596 + }, + { + "epoch": 1.25, + "learning_rate": 1.317672583278518e-06, + "loss": 0.6982, + "step": 48597 + }, + { + "epoch": 1.25, + "learning_rate": 1.3176463460195399e-06, + "loss": 0.6582, + "step": 48598 + }, + { + "epoch": 1.25, + "learning_rate": 1.317620108517354e-06, + "loss": 0.6162, + "step": 48599 + }, + { + "epoch": 1.25, + "learning_rate": 1.317593870771981e-06, + "loss": 0.7451, + "step": 48600 + }, + { + "epoch": 1.25, + "learning_rate": 1.317567632783441e-06, + "loss": 0.4327, + "step": 48601 + }, + { + "epoch": 1.25, + "learning_rate": 1.3175413945517546e-06, + "loss": 0.5898, + "step": 48602 + }, + { + "epoch": 1.25, + "learning_rate": 1.3175151560769409e-06, + "loss": 0.6484, + "step": 48603 + }, + { + "epoch": 1.25, + "learning_rate": 1.3174889173590206e-06, + "loss": 0.6724, + "step": 48604 + }, + { + "epoch": 1.25, + "learning_rate": 1.3174626783980134e-06, + "loss": 0.5508, + "step": 48605 + }, + { + "epoch": 1.25, + "learning_rate": 1.3174364391939399e-06, + "loss": 0.6621, + "step": 48606 + }, + { + "epoch": 1.25, + "learning_rate": 1.3174101997468198e-06, + "loss": 0.6738, + "step": 48607 + }, + { + "epoch": 1.25, + "learning_rate": 1.3173839600566732e-06, + "loss": 0.6406, + "step": 48608 + }, + { + "epoch": 1.25, + "learning_rate": 1.3173577201235205e-06, + "loss": 0.6895, + "step": 48609 + }, + { + "epoch": 1.25, + "learning_rate": 1.3173314799473814e-06, + "loss": 0.7354, + "step": 48610 + }, + { + "epoch": 1.25, + "learning_rate": 1.317305239528276e-06, + "loss": 0.5493, + "step": 48611 + }, + { + "epoch": 1.25, + "learning_rate": 1.317278998866225e-06, + "loss": 0.6299, + "step": 48612 + }, + { + "epoch": 1.25, + "learning_rate": 1.3172527579612478e-06, + "loss": 0.6724, + "step": 48613 + }, + { + "epoch": 1.25, + "learning_rate": 1.3172265168133648e-06, + "loss": 0.8135, + "step": 48614 + }, + { + "epoch": 1.25, + "learning_rate": 1.317200275422596e-06, + "loss": 0.5236, + "step": 48615 + }, + { + "epoch": 1.25, + "learning_rate": 1.3171740337889616e-06, + "loss": 0.5723, + "step": 48616 + }, + { + "epoch": 1.25, + "learning_rate": 1.3171477919124818e-06, + "loss": 0.6943, + "step": 48617 + }, + { + "epoch": 1.25, + "learning_rate": 1.3171215497931762e-06, + "loss": 0.509, + "step": 48618 + }, + { + "epoch": 1.25, + "learning_rate": 1.3170953074310655e-06, + "loss": 0.8379, + "step": 48619 + }, + { + "epoch": 1.25, + "learning_rate": 1.3170690648261693e-06, + "loss": 0.6867, + "step": 48620 + }, + { + "epoch": 1.25, + "learning_rate": 1.317042821978508e-06, + "loss": 0.418, + "step": 48621 + }, + { + "epoch": 1.25, + "learning_rate": 1.3170165788881016e-06, + "loss": 0.625, + "step": 48622 + }, + { + "epoch": 1.25, + "learning_rate": 1.31699033555497e-06, + "loss": 0.6073, + "step": 48623 + }, + { + "epoch": 1.25, + "learning_rate": 1.3169640919791336e-06, + "loss": 0.667, + "step": 48624 + }, + { + "epoch": 1.25, + "learning_rate": 1.3169378481606124e-06, + "loss": 0.5664, + "step": 48625 + }, + { + "epoch": 1.25, + "learning_rate": 1.3169116040994264e-06, + "loss": 0.6743, + "step": 48626 + }, + { + "epoch": 1.25, + "learning_rate": 1.316885359795596e-06, + "loss": 0.7402, + "step": 48627 + }, + { + "epoch": 1.25, + "learning_rate": 1.3168591152491406e-06, + "loss": 0.6836, + "step": 48628 + }, + { + "epoch": 1.25, + "learning_rate": 1.316832870460081e-06, + "loss": 0.8105, + "step": 48629 + }, + { + "epoch": 1.25, + "learning_rate": 1.3168066254284371e-06, + "loss": 0.2849, + "step": 48630 + }, + { + "epoch": 1.25, + "learning_rate": 1.316780380154229e-06, + "loss": 0.7207, + "step": 48631 + }, + { + "epoch": 1.25, + "learning_rate": 1.3167541346374767e-06, + "loss": 0.6943, + "step": 48632 + }, + { + "epoch": 1.25, + "learning_rate": 1.3167278888782e-06, + "loss": 0.6855, + "step": 48633 + }, + { + "epoch": 1.25, + "learning_rate": 1.3167016428764195e-06, + "loss": 0.6458, + "step": 48634 + }, + { + "epoch": 1.25, + "learning_rate": 1.316675396632155e-06, + "loss": 0.75, + "step": 48635 + }, + { + "epoch": 1.25, + "learning_rate": 1.3166491501454269e-06, + "loss": 0.5869, + "step": 48636 + }, + { + "epoch": 1.25, + "learning_rate": 1.3166229034162553e-06, + "loss": 0.7295, + "step": 48637 + }, + { + "epoch": 1.25, + "learning_rate": 1.3165966564446599e-06, + "loss": 0.6597, + "step": 48638 + }, + { + "epoch": 1.25, + "learning_rate": 1.3165704092306606e-06, + "loss": 0.7061, + "step": 48639 + }, + { + "epoch": 1.25, + "learning_rate": 1.3165441617742783e-06, + "loss": 0.5977, + "step": 48640 + }, + { + "epoch": 1.25, + "learning_rate": 1.3165179140755327e-06, + "loss": 0.6826, + "step": 48641 + }, + { + "epoch": 1.25, + "learning_rate": 1.316491666134444e-06, + "loss": 0.7402, + "step": 48642 + }, + { + "epoch": 1.25, + "learning_rate": 1.316465417951032e-06, + "loss": 0.752, + "step": 48643 + }, + { + "epoch": 1.25, + "learning_rate": 1.316439169525317e-06, + "loss": 0.4702, + "step": 48644 + }, + { + "epoch": 1.25, + "learning_rate": 1.316412920857319e-06, + "loss": 0.6562, + "step": 48645 + }, + { + "epoch": 1.25, + "learning_rate": 1.3163866719470583e-06, + "loss": 0.6357, + "step": 48646 + }, + { + "epoch": 1.25, + "learning_rate": 1.3163604227945548e-06, + "loss": 0.5603, + "step": 48647 + }, + { + "epoch": 1.25, + "learning_rate": 1.3163341733998288e-06, + "loss": 0.5505, + "step": 48648 + }, + { + "epoch": 1.25, + "learning_rate": 1.3163079237629e-06, + "loss": 0.5532, + "step": 48649 + }, + { + "epoch": 1.25, + "learning_rate": 1.316281673883789e-06, + "loss": 0.5981, + "step": 48650 + }, + { + "epoch": 1.25, + "learning_rate": 1.3162554237625153e-06, + "loss": 0.5757, + "step": 48651 + }, + { + "epoch": 1.25, + "learning_rate": 1.3162291733990997e-06, + "loss": 0.7031, + "step": 48652 + }, + { + "epoch": 1.25, + "learning_rate": 1.316202922793562e-06, + "loss": 0.7793, + "step": 48653 + }, + { + "epoch": 1.25, + "learning_rate": 1.316176671945922e-06, + "loss": 0.6963, + "step": 48654 + }, + { + "epoch": 1.25, + "learning_rate": 1.3161504208562005e-06, + "loss": 0.5942, + "step": 48655 + }, + { + "epoch": 1.25, + "learning_rate": 1.316124169524417e-06, + "loss": 0.585, + "step": 48656 + }, + { + "epoch": 1.25, + "learning_rate": 1.3160979179505918e-06, + "loss": 0.7568, + "step": 48657 + }, + { + "epoch": 1.25, + "learning_rate": 1.3160716661347446e-06, + "loss": 0.7559, + "step": 48658 + }, + { + "epoch": 1.25, + "learning_rate": 1.3160454140768962e-06, + "loss": 0.541, + "step": 48659 + }, + { + "epoch": 1.25, + "learning_rate": 1.3160191617770663e-06, + "loss": 0.5762, + "step": 48660 + }, + { + "epoch": 1.25, + "learning_rate": 1.3159929092352748e-06, + "loss": 0.7334, + "step": 48661 + }, + { + "epoch": 1.25, + "learning_rate": 1.3159666564515424e-06, + "loss": 0.7559, + "step": 48662 + }, + { + "epoch": 1.25, + "learning_rate": 1.3159404034258887e-06, + "loss": 0.5828, + "step": 48663 + }, + { + "epoch": 1.25, + "learning_rate": 1.315914150158334e-06, + "loss": 0.749, + "step": 48664 + }, + { + "epoch": 1.25, + "learning_rate": 1.3158878966488983e-06, + "loss": 0.7051, + "step": 48665 + }, + { + "epoch": 1.25, + "learning_rate": 1.3158616428976016e-06, + "loss": 0.6191, + "step": 48666 + }, + { + "epoch": 1.25, + "learning_rate": 1.3158353889044648e-06, + "loss": 0.7012, + "step": 48667 + }, + { + "epoch": 1.25, + "learning_rate": 1.3158091346695066e-06, + "loss": 0.7998, + "step": 48668 + }, + { + "epoch": 1.25, + "learning_rate": 1.3157828801927484e-06, + "loss": 0.4409, + "step": 48669 + }, + { + "epoch": 1.25, + "learning_rate": 1.3157566254742093e-06, + "loss": 0.6904, + "step": 48670 + }, + { + "epoch": 1.25, + "learning_rate": 1.3157303705139101e-06, + "loss": 0.4756, + "step": 48671 + }, + { + "epoch": 1.25, + "learning_rate": 1.315704115311871e-06, + "loss": 0.5881, + "step": 48672 + }, + { + "epoch": 1.25, + "learning_rate": 1.3156778598681116e-06, + "loss": 0.6328, + "step": 48673 + }, + { + "epoch": 1.25, + "learning_rate": 1.3156516041826518e-06, + "loss": 0.6182, + "step": 48674 + }, + { + "epoch": 1.25, + "learning_rate": 1.3156253482555124e-06, + "loss": 0.6152, + "step": 48675 + }, + { + "epoch": 1.25, + "learning_rate": 1.3155990920867131e-06, + "loss": 0.4816, + "step": 48676 + }, + { + "epoch": 1.25, + "learning_rate": 1.315572835676274e-06, + "loss": 0.6377, + "step": 48677 + }, + { + "epoch": 1.25, + "learning_rate": 1.3155465790242154e-06, + "loss": 0.5483, + "step": 48678 + }, + { + "epoch": 1.25, + "learning_rate": 1.3155203221305574e-06, + "loss": 0.7764, + "step": 48679 + }, + { + "epoch": 1.25, + "learning_rate": 1.3154940649953198e-06, + "loss": 0.7422, + "step": 48680 + }, + { + "epoch": 1.25, + "learning_rate": 1.315467807618523e-06, + "loss": 0.5481, + "step": 48681 + }, + { + "epoch": 1.25, + "learning_rate": 1.3154415500001873e-06, + "loss": 0.5801, + "step": 48682 + }, + { + "epoch": 1.25, + "learning_rate": 1.3154152921403321e-06, + "loss": 0.6335, + "step": 48683 + }, + { + "epoch": 1.25, + "learning_rate": 1.3153890340389779e-06, + "loss": 0.5703, + "step": 48684 + }, + { + "epoch": 1.25, + "learning_rate": 1.315362775696145e-06, + "loss": 0.4458, + "step": 48685 + }, + { + "epoch": 1.25, + "learning_rate": 1.3153365171118532e-06, + "loss": 0.7178, + "step": 48686 + }, + { + "epoch": 1.25, + "learning_rate": 1.315310258286123e-06, + "loss": 0.5352, + "step": 48687 + }, + { + "epoch": 1.25, + "learning_rate": 1.315283999218974e-06, + "loss": 0.6406, + "step": 48688 + }, + { + "epoch": 1.25, + "learning_rate": 1.3152577399104264e-06, + "loss": 0.5762, + "step": 48689 + }, + { + "epoch": 1.25, + "learning_rate": 1.3152314803605006e-06, + "loss": 0.6289, + "step": 48690 + }, + { + "epoch": 1.25, + "learning_rate": 1.3152052205692163e-06, + "loss": 0.5122, + "step": 48691 + }, + { + "epoch": 1.25, + "learning_rate": 1.3151789605365946e-06, + "loss": 0.7705, + "step": 48692 + }, + { + "epoch": 1.25, + "learning_rate": 1.3151527002626544e-06, + "loss": 0.7383, + "step": 48693 + }, + { + "epoch": 1.25, + "learning_rate": 1.315126439747416e-06, + "loss": 0.5715, + "step": 48694 + }, + { + "epoch": 1.25, + "learning_rate": 1.3151001789909e-06, + "loss": 0.8496, + "step": 48695 + }, + { + "epoch": 1.25, + "learning_rate": 1.3150739179931263e-06, + "loss": 0.4954, + "step": 48696 + }, + { + "epoch": 1.25, + "learning_rate": 1.3150476567541151e-06, + "loss": 0.623, + "step": 48697 + }, + { + "epoch": 1.25, + "learning_rate": 1.3150213952738863e-06, + "loss": 0.6206, + "step": 48698 + }, + { + "epoch": 1.25, + "learning_rate": 1.31499513355246e-06, + "loss": 0.5952, + "step": 48699 + }, + { + "epoch": 1.25, + "learning_rate": 1.3149688715898565e-06, + "loss": 0.6211, + "step": 48700 + }, + { + "epoch": 1.25, + "learning_rate": 1.3149426093860958e-06, + "loss": 0.6074, + "step": 48701 + }, + { + "epoch": 1.25, + "learning_rate": 1.3149163469411981e-06, + "loss": 0.566, + "step": 48702 + }, + { + "epoch": 1.25, + "learning_rate": 1.3148900842551834e-06, + "loss": 0.6865, + "step": 48703 + }, + { + "epoch": 1.25, + "learning_rate": 1.3148638213280716e-06, + "loss": 0.7217, + "step": 48704 + }, + { + "epoch": 1.25, + "learning_rate": 1.3148375581598834e-06, + "loss": 0.8154, + "step": 48705 + }, + { + "epoch": 1.25, + "learning_rate": 1.3148112947506383e-06, + "loss": 0.4521, + "step": 48706 + }, + { + "epoch": 1.25, + "learning_rate": 1.3147850311003572e-06, + "loss": 0.5483, + "step": 48707 + }, + { + "epoch": 1.25, + "learning_rate": 1.3147587672090593e-06, + "loss": 0.7236, + "step": 48708 + }, + { + "epoch": 1.25, + "learning_rate": 1.3147325030767648e-06, + "loss": 0.4595, + "step": 48709 + }, + { + "epoch": 1.25, + "learning_rate": 1.3147062387034944e-06, + "loss": 0.707, + "step": 48710 + }, + { + "epoch": 1.25, + "learning_rate": 1.3146799740892678e-06, + "loss": 0.6182, + "step": 48711 + }, + { + "epoch": 1.25, + "learning_rate": 1.3146537092341055e-06, + "loss": 0.5332, + "step": 48712 + }, + { + "epoch": 1.25, + "learning_rate": 1.3146274441380269e-06, + "loss": 0.603, + "step": 48713 + }, + { + "epoch": 1.25, + "learning_rate": 1.3146011788010527e-06, + "loss": 0.7656, + "step": 48714 + }, + { + "epoch": 1.25, + "learning_rate": 1.314574913223203e-06, + "loss": 0.645, + "step": 48715 + }, + { + "epoch": 1.25, + "learning_rate": 1.3145486474044972e-06, + "loss": 0.7871, + "step": 48716 + }, + { + "epoch": 1.25, + "learning_rate": 1.3145223813449568e-06, + "loss": 0.6416, + "step": 48717 + }, + { + "epoch": 1.25, + "learning_rate": 1.3144961150446006e-06, + "loss": 0.7178, + "step": 48718 + }, + { + "epoch": 1.25, + "learning_rate": 1.3144698485034492e-06, + "loss": 0.647, + "step": 48719 + }, + { + "epoch": 1.25, + "learning_rate": 1.3144435817215227e-06, + "loss": 0.5206, + "step": 48720 + }, + { + "epoch": 1.25, + "learning_rate": 1.3144173146988413e-06, + "loss": 0.5869, + "step": 48721 + }, + { + "epoch": 1.25, + "learning_rate": 1.314391047435425e-06, + "loss": 0.5557, + "step": 48722 + }, + { + "epoch": 1.25, + "learning_rate": 1.3143647799312938e-06, + "loss": 0.7041, + "step": 48723 + }, + { + "epoch": 1.25, + "learning_rate": 1.3143385121864682e-06, + "loss": 0.8066, + "step": 48724 + }, + { + "epoch": 1.25, + "learning_rate": 1.3143122442009677e-06, + "loss": 0.5337, + "step": 48725 + }, + { + "epoch": 1.25, + "learning_rate": 1.314285975974813e-06, + "loss": 0.5942, + "step": 48726 + }, + { + "epoch": 1.25, + "learning_rate": 1.314259707508024e-06, + "loss": 0.5349, + "step": 48727 + }, + { + "epoch": 1.25, + "learning_rate": 1.3142334388006208e-06, + "loss": 0.7188, + "step": 48728 + }, + { + "epoch": 1.25, + "learning_rate": 1.3142071698526233e-06, + "loss": 0.6406, + "step": 48729 + }, + { + "epoch": 1.25, + "learning_rate": 1.314180900664052e-06, + "loss": 0.4556, + "step": 48730 + }, + { + "epoch": 1.25, + "learning_rate": 1.3141546312349268e-06, + "loss": 0.6562, + "step": 48731 + }, + { + "epoch": 1.25, + "learning_rate": 1.314128361565268e-06, + "loss": 0.5859, + "step": 48732 + }, + { + "epoch": 1.25, + "learning_rate": 1.3141020916550954e-06, + "loss": 0.6519, + "step": 48733 + }, + { + "epoch": 1.25, + "learning_rate": 1.3140758215044292e-06, + "loss": 0.4675, + "step": 48734 + }, + { + "epoch": 1.25, + "learning_rate": 1.3140495511132895e-06, + "loss": 0.6611, + "step": 48735 + }, + { + "epoch": 1.25, + "learning_rate": 1.3140232804816966e-06, + "loss": 0.7217, + "step": 48736 + }, + { + "epoch": 1.25, + "learning_rate": 1.313997009609671e-06, + "loss": 0.6309, + "step": 48737 + }, + { + "epoch": 1.25, + "learning_rate": 1.3139707384972316e-06, + "loss": 0.6436, + "step": 48738 + }, + { + "epoch": 1.25, + "learning_rate": 1.3139444671443995e-06, + "loss": 0.7168, + "step": 48739 + }, + { + "epoch": 1.25, + "learning_rate": 1.3139181955511947e-06, + "loss": 0.6445, + "step": 48740 + }, + { + "epoch": 1.25, + "learning_rate": 1.3138919237176369e-06, + "loss": 0.5649, + "step": 48741 + }, + { + "epoch": 1.25, + "learning_rate": 1.3138656516437468e-06, + "loss": 0.6577, + "step": 48742 + }, + { + "epoch": 1.25, + "learning_rate": 1.313839379329544e-06, + "loss": 0.5864, + "step": 48743 + }, + { + "epoch": 1.25, + "learning_rate": 1.3138131067750486e-06, + "loss": 0.6743, + "step": 48744 + }, + { + "epoch": 1.25, + "learning_rate": 1.3137868339802814e-06, + "loss": 0.624, + "step": 48745 + }, + { + "epoch": 1.25, + "learning_rate": 1.313760560945262e-06, + "loss": 0.6025, + "step": 48746 + }, + { + "epoch": 1.25, + "learning_rate": 1.3137342876700105e-06, + "loss": 0.5688, + "step": 48747 + }, + { + "epoch": 1.25, + "learning_rate": 1.3137080141545467e-06, + "loss": 0.7949, + "step": 48748 + }, + { + "epoch": 1.25, + "learning_rate": 1.3136817403988916e-06, + "loss": 0.6445, + "step": 48749 + }, + { + "epoch": 1.25, + "learning_rate": 1.3136554664030643e-06, + "loss": 0.6323, + "step": 48750 + }, + { + "epoch": 1.25, + "learning_rate": 1.313629192167086e-06, + "loss": 0.6553, + "step": 48751 + }, + { + "epoch": 1.25, + "learning_rate": 1.313602917690976e-06, + "loss": 0.5918, + "step": 48752 + }, + { + "epoch": 1.25, + "learning_rate": 1.3135766429747545e-06, + "loss": 0.5181, + "step": 48753 + }, + { + "epoch": 1.25, + "learning_rate": 1.3135503680184418e-06, + "loss": 0.6191, + "step": 48754 + }, + { + "epoch": 1.25, + "learning_rate": 1.3135240928220583e-06, + "loss": 0.6689, + "step": 48755 + }, + { + "epoch": 1.25, + "learning_rate": 1.3134978173856234e-06, + "loss": 0.5649, + "step": 48756 + }, + { + "epoch": 1.25, + "learning_rate": 1.3134715417091584e-06, + "loss": 0.6096, + "step": 48757 + }, + { + "epoch": 1.25, + "learning_rate": 1.313445265792682e-06, + "loss": 0.6558, + "step": 48758 + }, + { + "epoch": 1.25, + "learning_rate": 1.313418989636215e-06, + "loss": 0.7275, + "step": 48759 + }, + { + "epoch": 1.25, + "learning_rate": 1.3133927132397778e-06, + "loss": 0.521, + "step": 48760 + }, + { + "epoch": 1.25, + "learning_rate": 1.3133664366033899e-06, + "loss": 0.6743, + "step": 48761 + }, + { + "epoch": 1.25, + "learning_rate": 1.313340159727072e-06, + "loss": 0.7012, + "step": 48762 + }, + { + "epoch": 1.25, + "learning_rate": 1.313313882610844e-06, + "loss": 0.4312, + "step": 48763 + }, + { + "epoch": 1.25, + "learning_rate": 1.3132876052547253e-06, + "loss": 0.6758, + "step": 48764 + }, + { + "epoch": 1.25, + "learning_rate": 1.3132613276587373e-06, + "loss": 0.6343, + "step": 48765 + }, + { + "epoch": 1.25, + "learning_rate": 1.3132350498228992e-06, + "loss": 0.7705, + "step": 48766 + }, + { + "epoch": 1.25, + "learning_rate": 1.3132087717472319e-06, + "loss": 0.7695, + "step": 48767 + }, + { + "epoch": 1.25, + "learning_rate": 1.3131824934317546e-06, + "loss": 0.6309, + "step": 48768 + }, + { + "epoch": 1.25, + "learning_rate": 1.3131562148764878e-06, + "loss": 0.6191, + "step": 48769 + }, + { + "epoch": 1.25, + "learning_rate": 1.3131299360814519e-06, + "loss": 0.5728, + "step": 48770 + }, + { + "epoch": 1.25, + "learning_rate": 1.3131036570466666e-06, + "loss": 0.8135, + "step": 48771 + }, + { + "epoch": 1.25, + "learning_rate": 1.3130773777721529e-06, + "loss": 0.4854, + "step": 48772 + }, + { + "epoch": 1.25, + "learning_rate": 1.3130510982579294e-06, + "loss": 0.6865, + "step": 48773 + }, + { + "epoch": 1.25, + "learning_rate": 1.3130248185040176e-06, + "loss": 0.5771, + "step": 48774 + }, + { + "epoch": 1.25, + "learning_rate": 1.3129985385104368e-06, + "loss": 0.3909, + "step": 48775 + }, + { + "epoch": 1.25, + "learning_rate": 1.3129722582772075e-06, + "loss": 0.7451, + "step": 48776 + }, + { + "epoch": 1.25, + "learning_rate": 1.3129459778043499e-06, + "loss": 0.5083, + "step": 48777 + }, + { + "epoch": 1.25, + "learning_rate": 1.312919697091884e-06, + "loss": 0.7988, + "step": 48778 + }, + { + "epoch": 1.25, + "learning_rate": 1.3128934161398295e-06, + "loss": 0.7646, + "step": 48779 + }, + { + "epoch": 1.25, + "learning_rate": 1.312867134948207e-06, + "loss": 0.7568, + "step": 48780 + }, + { + "epoch": 1.25, + "learning_rate": 1.3128408535170366e-06, + "loss": 0.6484, + "step": 48781 + }, + { + "epoch": 1.25, + "learning_rate": 1.3128145718463386e-06, + "loss": 0.7324, + "step": 48782 + }, + { + "epoch": 1.25, + "learning_rate": 1.3127882899361325e-06, + "loss": 0.6455, + "step": 48783 + }, + { + "epoch": 1.25, + "learning_rate": 1.312762007786439e-06, + "loss": 0.6162, + "step": 48784 + }, + { + "epoch": 1.25, + "learning_rate": 1.3127357253972778e-06, + "loss": 0.7031, + "step": 48785 + }, + { + "epoch": 1.25, + "learning_rate": 1.3127094427686694e-06, + "loss": 0.6416, + "step": 48786 + }, + { + "epoch": 1.25, + "learning_rate": 1.3126831599006338e-06, + "loss": 0.6401, + "step": 48787 + }, + { + "epoch": 1.25, + "learning_rate": 1.3126568767931907e-06, + "loss": 0.6836, + "step": 48788 + }, + { + "epoch": 1.25, + "learning_rate": 1.312630593446361e-06, + "loss": 0.5884, + "step": 48789 + }, + { + "epoch": 1.25, + "learning_rate": 1.3126043098601645e-06, + "loss": 0.6934, + "step": 48790 + }, + { + "epoch": 1.25, + "learning_rate": 1.3125780260346208e-06, + "loss": 0.6758, + "step": 48791 + }, + { + "epoch": 1.25, + "learning_rate": 1.312551741969751e-06, + "loss": 0.6118, + "step": 48792 + }, + { + "epoch": 1.25, + "learning_rate": 1.3125254576655744e-06, + "loss": 0.6509, + "step": 48793 + }, + { + "epoch": 1.25, + "learning_rate": 1.3124991731221112e-06, + "loss": 0.7666, + "step": 48794 + }, + { + "epoch": 1.25, + "learning_rate": 1.3124728883393822e-06, + "loss": 0.5217, + "step": 48795 + }, + { + "epoch": 1.25, + "learning_rate": 1.3124466033174068e-06, + "loss": 0.5742, + "step": 48796 + }, + { + "epoch": 1.25, + "learning_rate": 1.3124203180562059e-06, + "loss": 0.6719, + "step": 48797 + }, + { + "epoch": 1.25, + "learning_rate": 1.3123940325557987e-06, + "loss": 0.4382, + "step": 48798 + }, + { + "epoch": 1.25, + "learning_rate": 1.3123677468162058e-06, + "loss": 0.604, + "step": 48799 + }, + { + "epoch": 1.25, + "learning_rate": 1.3123414608374472e-06, + "loss": 0.7275, + "step": 48800 + }, + { + "epoch": 1.25, + "learning_rate": 1.312315174619543e-06, + "loss": 0.4717, + "step": 48801 + }, + { + "epoch": 1.25, + "learning_rate": 1.312288888162514e-06, + "loss": 0.5552, + "step": 48802 + }, + { + "epoch": 1.25, + "learning_rate": 1.3122626014663794e-06, + "loss": 0.569, + "step": 48803 + }, + { + "epoch": 1.25, + "learning_rate": 1.3122363145311595e-06, + "loss": 0.6538, + "step": 48804 + }, + { + "epoch": 1.25, + "learning_rate": 1.3122100273568748e-06, + "loss": 0.6531, + "step": 48805 + }, + { + "epoch": 1.25, + "learning_rate": 1.312183739943545e-06, + "loss": 0.4962, + "step": 48806 + }, + { + "epoch": 1.25, + "learning_rate": 1.3121574522911906e-06, + "loss": 0.5679, + "step": 48807 + }, + { + "epoch": 1.25, + "learning_rate": 1.3121311643998318e-06, + "loss": 0.7812, + "step": 48808 + }, + { + "epoch": 1.25, + "learning_rate": 1.3121048762694886e-06, + "loss": 0.6592, + "step": 48809 + }, + { + "epoch": 1.25, + "learning_rate": 1.3120785879001805e-06, + "loss": 0.4205, + "step": 48810 + }, + { + "epoch": 1.25, + "learning_rate": 1.3120522992919288e-06, + "loss": 0.5941, + "step": 48811 + }, + { + "epoch": 1.25, + "learning_rate": 1.3120260104447527e-06, + "loss": 0.8066, + "step": 48812 + }, + { + "epoch": 1.25, + "learning_rate": 1.3119997213586723e-06, + "loss": 0.6104, + "step": 48813 + }, + { + "epoch": 1.25, + "learning_rate": 1.3119734320337088e-06, + "loss": 0.708, + "step": 48814 + }, + { + "epoch": 1.25, + "learning_rate": 1.311947142469881e-06, + "loss": 0.7139, + "step": 48815 + }, + { + "epoch": 1.25, + "learning_rate": 1.31192085266721e-06, + "loss": 0.439, + "step": 48816 + }, + { + "epoch": 1.25, + "learning_rate": 1.3118945626257154e-06, + "loss": 0.6299, + "step": 48817 + }, + { + "epoch": 1.25, + "learning_rate": 1.3118682723454173e-06, + "loss": 0.5156, + "step": 48818 + }, + { + "epoch": 1.25, + "learning_rate": 1.311841981826336e-06, + "loss": 0.6147, + "step": 48819 + }, + { + "epoch": 1.25, + "learning_rate": 1.3118156910684919e-06, + "loss": 0.5679, + "step": 48820 + }, + { + "epoch": 1.25, + "learning_rate": 1.3117894000719046e-06, + "loss": 0.5327, + "step": 48821 + }, + { + "epoch": 1.25, + "learning_rate": 1.3117631088365948e-06, + "loss": 0.6924, + "step": 48822 + }, + { + "epoch": 1.25, + "learning_rate": 1.311736817362582e-06, + "loss": 0.6167, + "step": 48823 + }, + { + "epoch": 1.25, + "learning_rate": 1.311710525649887e-06, + "loss": 0.7764, + "step": 48824 + }, + { + "epoch": 1.25, + "learning_rate": 1.3116842336985292e-06, + "loss": 0.6035, + "step": 48825 + }, + { + "epoch": 1.25, + "learning_rate": 1.3116579415085294e-06, + "loss": 0.7603, + "step": 48826 + }, + { + "epoch": 1.25, + "learning_rate": 1.3116316490799074e-06, + "loss": 0.5654, + "step": 48827 + }, + { + "epoch": 1.25, + "learning_rate": 1.3116053564126834e-06, + "loss": 0.7578, + "step": 48828 + }, + { + "epoch": 1.25, + "learning_rate": 1.3115790635068773e-06, + "loss": 0.5459, + "step": 48829 + }, + { + "epoch": 1.25, + "learning_rate": 1.3115527703625096e-06, + "loss": 0.6475, + "step": 48830 + }, + { + "epoch": 1.25, + "learning_rate": 1.3115264769796e-06, + "loss": 0.7725, + "step": 48831 + }, + { + "epoch": 1.25, + "learning_rate": 1.3115001833581691e-06, + "loss": 0.5991, + "step": 48832 + }, + { + "epoch": 1.25, + "learning_rate": 1.3114738894982372e-06, + "loss": 0.6924, + "step": 48833 + }, + { + "epoch": 1.25, + "learning_rate": 1.3114475953998235e-06, + "loss": 0.4938, + "step": 48834 + }, + { + "epoch": 1.25, + "learning_rate": 1.3114213010629489e-06, + "loss": 0.6279, + "step": 48835 + }, + { + "epoch": 1.25, + "learning_rate": 1.3113950064876336e-06, + "loss": 0.6509, + "step": 48836 + }, + { + "epoch": 1.25, + "learning_rate": 1.3113687116738972e-06, + "loss": 0.6357, + "step": 48837 + }, + { + "epoch": 1.25, + "learning_rate": 1.3113424166217598e-06, + "loss": 0.7148, + "step": 48838 + }, + { + "epoch": 1.25, + "learning_rate": 1.3113161213312424e-06, + "loss": 0.7188, + "step": 48839 + }, + { + "epoch": 1.25, + "learning_rate": 1.3112898258023641e-06, + "loss": 0.7163, + "step": 48840 + }, + { + "epoch": 1.25, + "learning_rate": 1.3112635300351458e-06, + "loss": 0.7065, + "step": 48841 + }, + { + "epoch": 1.25, + "learning_rate": 1.3112372340296072e-06, + "loss": 0.5742, + "step": 48842 + }, + { + "epoch": 1.25, + "learning_rate": 1.3112109377857688e-06, + "loss": 0.6538, + "step": 48843 + }, + { + "epoch": 1.25, + "learning_rate": 1.31118464130365e-06, + "loss": 0.8057, + "step": 48844 + }, + { + "epoch": 1.25, + "learning_rate": 1.3111583445832719e-06, + "loss": 0.6709, + "step": 48845 + }, + { + "epoch": 1.25, + "learning_rate": 1.3111320476246537e-06, + "loss": 0.8223, + "step": 48846 + }, + { + "epoch": 1.25, + "learning_rate": 1.3111057504278166e-06, + "loss": 0.5249, + "step": 48847 + }, + { + "epoch": 1.25, + "learning_rate": 1.3110794529927796e-06, + "loss": 0.6787, + "step": 48848 + }, + { + "epoch": 1.25, + "learning_rate": 1.3110531553195635e-06, + "loss": 0.7158, + "step": 48849 + }, + { + "epoch": 1.25, + "learning_rate": 1.3110268574081885e-06, + "loss": 0.5566, + "step": 48850 + }, + { + "epoch": 1.25, + "learning_rate": 1.3110005592586744e-06, + "loss": 0.6431, + "step": 48851 + }, + { + "epoch": 1.25, + "learning_rate": 1.3109742608710415e-06, + "loss": 0.6831, + "step": 48852 + }, + { + "epoch": 1.25, + "learning_rate": 1.31094796224531e-06, + "loss": 0.6777, + "step": 48853 + }, + { + "epoch": 1.25, + "learning_rate": 1.3109216633814998e-06, + "loss": 0.6357, + "step": 48854 + }, + { + "epoch": 1.25, + "learning_rate": 1.3108953642796311e-06, + "loss": 0.7837, + "step": 48855 + }, + { + "epoch": 1.25, + "learning_rate": 1.310869064939724e-06, + "loss": 0.5615, + "step": 48856 + }, + { + "epoch": 1.25, + "learning_rate": 1.3108427653617991e-06, + "loss": 0.8135, + "step": 48857 + }, + { + "epoch": 1.25, + "learning_rate": 1.3108164655458762e-06, + "loss": 0.7666, + "step": 48858 + }, + { + "epoch": 1.25, + "learning_rate": 1.3107901654919752e-06, + "loss": 0.6328, + "step": 48859 + }, + { + "epoch": 1.25, + "learning_rate": 1.3107638652001165e-06, + "loss": 0.7246, + "step": 48860 + }, + { + "epoch": 1.25, + "learning_rate": 1.31073756467032e-06, + "loss": 0.8008, + "step": 48861 + }, + { + "epoch": 1.25, + "learning_rate": 1.3107112639026069e-06, + "loss": 0.5371, + "step": 48862 + }, + { + "epoch": 1.25, + "learning_rate": 1.3106849628969953e-06, + "loss": 0.6846, + "step": 48863 + }, + { + "epoch": 1.25, + "learning_rate": 1.3106586616535072e-06, + "loss": 0.7051, + "step": 48864 + }, + { + "epoch": 1.25, + "learning_rate": 1.3106323601721618e-06, + "loss": 0.7529, + "step": 48865 + }, + { + "epoch": 1.25, + "learning_rate": 1.3106060584529796e-06, + "loss": 0.4922, + "step": 48866 + }, + { + "epoch": 1.25, + "learning_rate": 1.3105797564959808e-06, + "loss": 0.5425, + "step": 48867 + }, + { + "epoch": 1.25, + "learning_rate": 1.3105534543011851e-06, + "loss": 0.7764, + "step": 48868 + }, + { + "epoch": 1.25, + "learning_rate": 1.310527151868613e-06, + "loss": 0.7334, + "step": 48869 + }, + { + "epoch": 1.25, + "learning_rate": 1.3105008491982845e-06, + "loss": 0.5664, + "step": 48870 + }, + { + "epoch": 1.25, + "learning_rate": 1.3104745462902195e-06, + "loss": 0.6177, + "step": 48871 + }, + { + "epoch": 1.25, + "learning_rate": 1.3104482431444392e-06, + "loss": 0.6348, + "step": 48872 + }, + { + "epoch": 1.25, + "learning_rate": 1.3104219397609622e-06, + "loss": 0.749, + "step": 48873 + }, + { + "epoch": 1.25, + "learning_rate": 1.3103956361398098e-06, + "loss": 0.7295, + "step": 48874 + }, + { + "epoch": 1.25, + "learning_rate": 1.3103693322810014e-06, + "loss": 0.7295, + "step": 48875 + }, + { + "epoch": 1.25, + "learning_rate": 1.3103430281845577e-06, + "loss": 0.5049, + "step": 48876 + }, + { + "epoch": 1.25, + "learning_rate": 1.3103167238504986e-06, + "loss": 0.6689, + "step": 48877 + }, + { + "epoch": 1.25, + "learning_rate": 1.3102904192788441e-06, + "loss": 0.6606, + "step": 48878 + }, + { + "epoch": 1.25, + "learning_rate": 1.3102641144696148e-06, + "loss": 0.5693, + "step": 48879 + }, + { + "epoch": 1.25, + "learning_rate": 1.3102378094228304e-06, + "loss": 0.4746, + "step": 48880 + }, + { + "epoch": 1.25, + "learning_rate": 1.310211504138511e-06, + "loss": 0.708, + "step": 48881 + }, + { + "epoch": 1.25, + "learning_rate": 1.3101851986166769e-06, + "loss": 0.6738, + "step": 48882 + }, + { + "epoch": 1.25, + "learning_rate": 1.3101588928573487e-06, + "loss": 0.6279, + "step": 48883 + }, + { + "epoch": 1.25, + "learning_rate": 1.3101325868605457e-06, + "loss": 0.7695, + "step": 48884 + }, + { + "epoch": 1.25, + "learning_rate": 1.3101062806262886e-06, + "loss": 0.6719, + "step": 48885 + }, + { + "epoch": 1.25, + "learning_rate": 1.3100799741545972e-06, + "loss": 0.7852, + "step": 48886 + }, + { + "epoch": 1.25, + "learning_rate": 1.310053667445492e-06, + "loss": 0.6504, + "step": 48887 + }, + { + "epoch": 1.25, + "learning_rate": 1.310027360498993e-06, + "loss": 0.4548, + "step": 48888 + }, + { + "epoch": 1.25, + "learning_rate": 1.31000105331512e-06, + "loss": 0.5161, + "step": 48889 + }, + { + "epoch": 1.25, + "learning_rate": 1.3099747458938937e-06, + "loss": 0.5354, + "step": 48890 + }, + { + "epoch": 1.25, + "learning_rate": 1.309948438235334e-06, + "loss": 0.6553, + "step": 48891 + }, + { + "epoch": 1.25, + "learning_rate": 1.309922130339461e-06, + "loss": 0.5371, + "step": 48892 + }, + { + "epoch": 1.25, + "learning_rate": 1.3098958222062951e-06, + "loss": 0.7378, + "step": 48893 + }, + { + "epoch": 1.25, + "learning_rate": 1.3098695138358555e-06, + "loss": 0.834, + "step": 48894 + }, + { + "epoch": 1.25, + "learning_rate": 1.3098432052281638e-06, + "loss": 0.5231, + "step": 48895 + }, + { + "epoch": 1.25, + "learning_rate": 1.309816896383239e-06, + "loss": 0.6914, + "step": 48896 + }, + { + "epoch": 1.25, + "learning_rate": 1.309790587301102e-06, + "loss": 0.8125, + "step": 48897 + }, + { + "epoch": 1.25, + "learning_rate": 1.3097642779817722e-06, + "loss": 0.7559, + "step": 48898 + }, + { + "epoch": 1.25, + "learning_rate": 1.3097379684252703e-06, + "loss": 0.5884, + "step": 48899 + }, + { + "epoch": 1.25, + "learning_rate": 1.3097116586316165e-06, + "loss": 0.7168, + "step": 48900 + }, + { + "epoch": 1.25, + "learning_rate": 1.3096853486008303e-06, + "loss": 0.4878, + "step": 48901 + }, + { + "epoch": 1.25, + "learning_rate": 1.3096590383329326e-06, + "loss": 0.8184, + "step": 48902 + }, + { + "epoch": 1.25, + "learning_rate": 1.3096327278279429e-06, + "loss": 0.6145, + "step": 48903 + }, + { + "epoch": 1.25, + "learning_rate": 1.309606417085882e-06, + "loss": 0.6523, + "step": 48904 + }, + { + "epoch": 1.25, + "learning_rate": 1.3095801061067695e-06, + "loss": 1.0234, + "step": 48905 + }, + { + "epoch": 1.25, + "learning_rate": 1.309553794890626e-06, + "loss": 0.4172, + "step": 48906 + }, + { + "epoch": 1.25, + "learning_rate": 1.3095274834374709e-06, + "loss": 0.4716, + "step": 48907 + }, + { + "epoch": 1.25, + "learning_rate": 1.3095011717473251e-06, + "loss": 0.6279, + "step": 48908 + }, + { + "epoch": 1.25, + "learning_rate": 1.3094748598202086e-06, + "loss": 0.5059, + "step": 48909 + }, + { + "epoch": 1.25, + "learning_rate": 1.3094485476561415e-06, + "loss": 0.5952, + "step": 48910 + }, + { + "epoch": 1.25, + "learning_rate": 1.3094222352551439e-06, + "loss": 0.603, + "step": 48911 + }, + { + "epoch": 1.25, + "learning_rate": 1.3093959226172358e-06, + "loss": 0.4216, + "step": 48912 + }, + { + "epoch": 1.25, + "learning_rate": 1.3093696097424372e-06, + "loss": 0.7412, + "step": 48913 + }, + { + "epoch": 1.25, + "learning_rate": 1.3093432966307687e-06, + "loss": 0.6133, + "step": 48914 + }, + { + "epoch": 1.25, + "learning_rate": 1.3093169832822502e-06, + "loss": 0.5854, + "step": 48915 + }, + { + "epoch": 1.25, + "learning_rate": 1.3092906696969021e-06, + "loss": 0.6133, + "step": 48916 + }, + { + "epoch": 1.25, + "learning_rate": 1.3092643558747444e-06, + "loss": 0.5535, + "step": 48917 + }, + { + "epoch": 1.25, + "learning_rate": 1.309238041815797e-06, + "loss": 0.6333, + "step": 48918 + }, + { + "epoch": 1.25, + "learning_rate": 1.3092117275200803e-06, + "loss": 0.5234, + "step": 48919 + }, + { + "epoch": 1.25, + "learning_rate": 1.3091854129876143e-06, + "loss": 0.5669, + "step": 48920 + }, + { + "epoch": 1.25, + "learning_rate": 1.3091590982184195e-06, + "loss": 0.8091, + "step": 48921 + }, + { + "epoch": 1.25, + "learning_rate": 1.3091327832125154e-06, + "loss": 0.6824, + "step": 48922 + }, + { + "epoch": 1.25, + "learning_rate": 1.3091064679699228e-06, + "loss": 0.6514, + "step": 48923 + }, + { + "epoch": 1.25, + "learning_rate": 1.3090801524906617e-06, + "loss": 0.5774, + "step": 48924 + }, + { + "epoch": 1.25, + "learning_rate": 1.309053836774752e-06, + "loss": 0.6504, + "step": 48925 + }, + { + "epoch": 1.25, + "learning_rate": 1.3090275208222142e-06, + "loss": 0.6265, + "step": 48926 + }, + { + "epoch": 1.25, + "learning_rate": 1.309001204633068e-06, + "loss": 0.668, + "step": 48927 + }, + { + "epoch": 1.25, + "learning_rate": 1.3089748882073338e-06, + "loss": 0.6968, + "step": 48928 + }, + { + "epoch": 1.25, + "learning_rate": 1.3089485715450316e-06, + "loss": 0.6841, + "step": 48929 + }, + { + "epoch": 1.25, + "learning_rate": 1.3089222546461819e-06, + "loss": 0.7744, + "step": 48930 + }, + { + "epoch": 1.25, + "learning_rate": 1.3088959375108045e-06, + "loss": 0.5298, + "step": 48931 + }, + { + "epoch": 1.25, + "learning_rate": 1.3088696201389197e-06, + "loss": 0.6763, + "step": 48932 + }, + { + "epoch": 1.25, + "learning_rate": 1.3088433025305478e-06, + "loss": 0.8066, + "step": 48933 + }, + { + "epoch": 1.25, + "learning_rate": 1.3088169846857086e-06, + "loss": 0.6646, + "step": 48934 + }, + { + "epoch": 1.25, + "learning_rate": 1.3087906666044227e-06, + "loss": 0.6123, + "step": 48935 + }, + { + "epoch": 1.25, + "learning_rate": 1.30876434828671e-06, + "loss": 0.6851, + "step": 48936 + }, + { + "epoch": 1.25, + "learning_rate": 1.3087380297325904e-06, + "loss": 0.5574, + "step": 48937 + }, + { + "epoch": 1.25, + "learning_rate": 1.3087117109420842e-06, + "loss": 0.7646, + "step": 48938 + }, + { + "epoch": 1.25, + "learning_rate": 1.3086853919152118e-06, + "loss": 0.7598, + "step": 48939 + }, + { + "epoch": 1.25, + "learning_rate": 1.308659072651993e-06, + "loss": 0.708, + "step": 48940 + }, + { + "epoch": 1.25, + "learning_rate": 1.3086327531524483e-06, + "loss": 0.6299, + "step": 48941 + }, + { + "epoch": 1.25, + "learning_rate": 1.308606433416598e-06, + "loss": 0.5396, + "step": 48942 + }, + { + "epoch": 1.25, + "learning_rate": 1.3085801134444615e-06, + "loss": 0.6655, + "step": 48943 + }, + { + "epoch": 1.25, + "learning_rate": 1.3085537932360592e-06, + "loss": 0.7432, + "step": 48944 + }, + { + "epoch": 1.25, + "learning_rate": 1.3085274727914119e-06, + "loss": 0.6396, + "step": 48945 + }, + { + "epoch": 1.25, + "learning_rate": 1.3085011521105393e-06, + "loss": 0.9316, + "step": 48946 + }, + { + "epoch": 1.25, + "learning_rate": 1.3084748311934614e-06, + "loss": 0.5493, + "step": 48947 + }, + { + "epoch": 1.25, + "learning_rate": 1.3084485100401987e-06, + "loss": 0.5723, + "step": 48948 + }, + { + "epoch": 1.25, + "learning_rate": 1.3084221886507706e-06, + "loss": 0.5859, + "step": 48949 + }, + { + "epoch": 1.25, + "learning_rate": 1.3083958670251984e-06, + "loss": 0.7725, + "step": 48950 + }, + { + "epoch": 1.25, + "learning_rate": 1.3083695451635015e-06, + "loss": 0.7676, + "step": 48951 + }, + { + "epoch": 1.25, + "learning_rate": 1.3083432230657003e-06, + "loss": 0.6079, + "step": 48952 + }, + { + "epoch": 1.25, + "learning_rate": 1.3083169007318146e-06, + "loss": 0.6108, + "step": 48953 + }, + { + "epoch": 1.25, + "learning_rate": 1.3082905781618652e-06, + "loss": 0.5938, + "step": 48954 + }, + { + "epoch": 1.25, + "learning_rate": 1.3082642553558714e-06, + "loss": 0.6689, + "step": 48955 + }, + { + "epoch": 1.25, + "learning_rate": 1.3082379323138543e-06, + "loss": 0.7178, + "step": 48956 + }, + { + "epoch": 1.25, + "learning_rate": 1.3082116090358332e-06, + "loss": 0.5535, + "step": 48957 + }, + { + "epoch": 1.25, + "learning_rate": 1.3081852855218292e-06, + "loss": 0.7393, + "step": 48958 + }, + { + "epoch": 1.25, + "learning_rate": 1.3081589617718614e-06, + "loss": 0.5488, + "step": 48959 + }, + { + "epoch": 1.25, + "learning_rate": 1.3081326377859506e-06, + "loss": 0.7773, + "step": 48960 + }, + { + "epoch": 1.25, + "learning_rate": 1.308106313564117e-06, + "loss": 0.8652, + "step": 48961 + }, + { + "epoch": 1.25, + "learning_rate": 1.3080799891063803e-06, + "loss": 0.6367, + "step": 48962 + }, + { + "epoch": 1.25, + "learning_rate": 1.308053664412761e-06, + "loss": 0.5012, + "step": 48963 + }, + { + "epoch": 1.25, + "learning_rate": 1.308027339483279e-06, + "loss": 0.5879, + "step": 48964 + }, + { + "epoch": 1.25, + "learning_rate": 1.3080010143179547e-06, + "loss": 0.6699, + "step": 48965 + }, + { + "epoch": 1.26, + "learning_rate": 1.3079746889168082e-06, + "loss": 0.7275, + "step": 48966 + }, + { + "epoch": 1.26, + "learning_rate": 1.30794836327986e-06, + "loss": 0.8213, + "step": 48967 + }, + { + "epoch": 1.26, + "learning_rate": 1.3079220374071294e-06, + "loss": 0.5771, + "step": 48968 + }, + { + "epoch": 1.26, + "learning_rate": 1.3078957112986371e-06, + "loss": 0.6074, + "step": 48969 + }, + { + "epoch": 1.26, + "learning_rate": 1.3078693849544034e-06, + "loss": 0.5801, + "step": 48970 + }, + { + "epoch": 1.26, + "learning_rate": 1.3078430583744484e-06, + "loss": 0.6611, + "step": 48971 + }, + { + "epoch": 1.26, + "learning_rate": 1.3078167315587919e-06, + "loss": 0.4805, + "step": 48972 + }, + { + "epoch": 1.26, + "learning_rate": 1.3077904045074544e-06, + "loss": 0.7056, + "step": 48973 + }, + { + "epoch": 1.26, + "learning_rate": 1.3077640772204556e-06, + "loss": 0.5977, + "step": 48974 + }, + { + "epoch": 1.26, + "learning_rate": 1.3077377496978167e-06, + "loss": 0.626, + "step": 48975 + }, + { + "epoch": 1.26, + "learning_rate": 1.3077114219395565e-06, + "loss": 0.8574, + "step": 48976 + }, + { + "epoch": 1.26, + "learning_rate": 1.3076850939456962e-06, + "loss": 0.6274, + "step": 48977 + }, + { + "epoch": 1.26, + "learning_rate": 1.3076587657162553e-06, + "loss": 0.5859, + "step": 48978 + }, + { + "epoch": 1.26, + "learning_rate": 1.3076324372512543e-06, + "loss": 0.6489, + "step": 48979 + }, + { + "epoch": 1.26, + "learning_rate": 1.3076061085507132e-06, + "loss": 0.7207, + "step": 48980 + }, + { + "epoch": 1.26, + "learning_rate": 1.3075797796146529e-06, + "loss": 0.8145, + "step": 48981 + }, + { + "epoch": 1.26, + "learning_rate": 1.3075534504430921e-06, + "loss": 0.6826, + "step": 48982 + }, + { + "epoch": 1.26, + "learning_rate": 1.307527121036052e-06, + "loss": 1.043, + "step": 48983 + }, + { + "epoch": 1.26, + "learning_rate": 1.3075007913935525e-06, + "loss": 0.6035, + "step": 48984 + }, + { + "epoch": 1.26, + "learning_rate": 1.307474461515614e-06, + "loss": 0.8184, + "step": 48985 + }, + { + "epoch": 1.26, + "learning_rate": 1.3074481314022563e-06, + "loss": 0.7646, + "step": 48986 + }, + { + "epoch": 1.26, + "learning_rate": 1.3074218010534996e-06, + "loss": 0.5103, + "step": 48987 + }, + { + "epoch": 1.26, + "learning_rate": 1.3073954704693643e-06, + "loss": 0.7427, + "step": 48988 + }, + { + "epoch": 1.26, + "learning_rate": 1.3073691396498705e-06, + "loss": 0.6177, + "step": 48989 + }, + { + "epoch": 1.26, + "learning_rate": 1.307342808595038e-06, + "loss": 0.6494, + "step": 48990 + }, + { + "epoch": 1.26, + "learning_rate": 1.3073164773048875e-06, + "loss": 0.5024, + "step": 48991 + }, + { + "epoch": 1.26, + "learning_rate": 1.307290145779439e-06, + "loss": 0.5342, + "step": 48992 + }, + { + "epoch": 1.26, + "learning_rate": 1.3072638140187122e-06, + "loss": 0.6104, + "step": 48993 + }, + { + "epoch": 1.26, + "learning_rate": 1.307237482022728e-06, + "loss": 0.6836, + "step": 48994 + }, + { + "epoch": 1.26, + "learning_rate": 1.3072111497915058e-06, + "loss": 0.7197, + "step": 48995 + }, + { + "epoch": 1.26, + "learning_rate": 1.3071848173250665e-06, + "loss": 0.6338, + "step": 48996 + }, + { + "epoch": 1.26, + "learning_rate": 1.3071584846234295e-06, + "loss": 0.6104, + "step": 48997 + }, + { + "epoch": 1.26, + "learning_rate": 1.307132151686616e-06, + "loss": 0.6772, + "step": 48998 + }, + { + "epoch": 1.26, + "learning_rate": 1.3071058185146448e-06, + "loss": 0.7017, + "step": 48999 + }, + { + "epoch": 1.26, + "learning_rate": 1.3070794851075374e-06, + "loss": 0.7676, + "step": 49000 + }, + { + "epoch": 1.26, + "learning_rate": 1.307053151465313e-06, + "loss": 0.71, + "step": 49001 + }, + { + "epoch": 1.26, + "learning_rate": 1.3070268175879924e-06, + "loss": 0.6519, + "step": 49002 + }, + { + "epoch": 1.26, + "learning_rate": 1.3070004834755951e-06, + "loss": 0.6768, + "step": 49003 + }, + { + "epoch": 1.26, + "learning_rate": 1.306974149128142e-06, + "loss": 0.6416, + "step": 49004 + }, + { + "epoch": 1.26, + "learning_rate": 1.3069478145456526e-06, + "loss": 0.8984, + "step": 49005 + }, + { + "epoch": 1.26, + "learning_rate": 1.3069214797281479e-06, + "loss": 0.8594, + "step": 49006 + }, + { + "epoch": 1.26, + "learning_rate": 1.3068951446756472e-06, + "loss": 0.6182, + "step": 49007 + }, + { + "epoch": 1.26, + "learning_rate": 1.3068688093881708e-06, + "loss": 0.5327, + "step": 49008 + }, + { + "epoch": 1.26, + "learning_rate": 1.3068424738657392e-06, + "loss": 0.7373, + "step": 49009 + }, + { + "epoch": 1.26, + "learning_rate": 1.3068161381083726e-06, + "loss": 0.5738, + "step": 49010 + }, + { + "epoch": 1.26, + "learning_rate": 1.306789802116091e-06, + "loss": 0.6582, + "step": 49011 + }, + { + "epoch": 1.26, + "learning_rate": 1.3067634658889141e-06, + "loss": 0.7373, + "step": 49012 + }, + { + "epoch": 1.26, + "learning_rate": 1.306737129426863e-06, + "loss": 0.582, + "step": 49013 + }, + { + "epoch": 1.26, + "learning_rate": 1.306710792729957e-06, + "loss": 0.5459, + "step": 49014 + }, + { + "epoch": 1.26, + "learning_rate": 1.3066844557982171e-06, + "loss": 0.5178, + "step": 49015 + }, + { + "epoch": 1.26, + "learning_rate": 1.3066581186316628e-06, + "loss": 0.6152, + "step": 49016 + }, + { + "epoch": 1.26, + "learning_rate": 1.3066317812303145e-06, + "loss": 0.6255, + "step": 49017 + }, + { + "epoch": 1.26, + "learning_rate": 1.3066054435941922e-06, + "loss": 0.7412, + "step": 49018 + }, + { + "epoch": 1.26, + "learning_rate": 1.3065791057233164e-06, + "loss": 0.6006, + "step": 49019 + }, + { + "epoch": 1.26, + "learning_rate": 1.3065527676177068e-06, + "loss": 0.4966, + "step": 49020 + }, + { + "epoch": 1.26, + "learning_rate": 1.3065264292773844e-06, + "loss": 0.4592, + "step": 49021 + }, + { + "epoch": 1.26, + "learning_rate": 1.3065000907023682e-06, + "loss": 0.7002, + "step": 49022 + }, + { + "epoch": 1.26, + "learning_rate": 1.3064737518926794e-06, + "loss": 0.584, + "step": 49023 + }, + { + "epoch": 1.26, + "learning_rate": 1.3064474128483373e-06, + "loss": 0.5449, + "step": 49024 + }, + { + "epoch": 1.26, + "learning_rate": 1.3064210735693628e-06, + "loss": 0.5728, + "step": 49025 + }, + { + "epoch": 1.26, + "learning_rate": 1.306394734055776e-06, + "loss": 0.5132, + "step": 49026 + }, + { + "epoch": 1.26, + "learning_rate": 1.3063683943075964e-06, + "loss": 0.6143, + "step": 49027 + }, + { + "epoch": 1.26, + "learning_rate": 1.306342054324845e-06, + "loss": 0.6768, + "step": 49028 + }, + { + "epoch": 1.26, + "learning_rate": 1.3063157141075411e-06, + "loss": 0.6318, + "step": 49029 + }, + { + "epoch": 1.26, + "learning_rate": 1.3062893736557056e-06, + "loss": 0.623, + "step": 49030 + }, + { + "epoch": 1.26, + "learning_rate": 1.3062630329693585e-06, + "loss": 0.7168, + "step": 49031 + }, + { + "epoch": 1.26, + "learning_rate": 1.30623669204852e-06, + "loss": 0.7373, + "step": 49032 + }, + { + "epoch": 1.26, + "learning_rate": 1.30621035089321e-06, + "loss": 1.0176, + "step": 49033 + }, + { + "epoch": 1.26, + "learning_rate": 1.3061840095034484e-06, + "loss": 0.5513, + "step": 49034 + }, + { + "epoch": 1.26, + "learning_rate": 1.3061576678792564e-06, + "loss": 0.6089, + "step": 49035 + }, + { + "epoch": 1.26, + "learning_rate": 1.3061313260206532e-06, + "loss": 0.7139, + "step": 49036 + }, + { + "epoch": 1.26, + "learning_rate": 1.3061049839276593e-06, + "loss": 0.6541, + "step": 49037 + }, + { + "epoch": 1.26, + "learning_rate": 1.3060786416002952e-06, + "loss": 0.709, + "step": 49038 + }, + { + "epoch": 1.26, + "learning_rate": 1.3060522990385802e-06, + "loss": 0.6973, + "step": 49039 + }, + { + "epoch": 1.26, + "learning_rate": 1.3060259562425356e-06, + "loss": 0.7129, + "step": 49040 + }, + { + "epoch": 1.26, + "learning_rate": 1.305999613212181e-06, + "loss": 0.6406, + "step": 49041 + }, + { + "epoch": 1.26, + "learning_rate": 1.3059732699475361e-06, + "loss": 0.7021, + "step": 49042 + }, + { + "epoch": 1.26, + "learning_rate": 1.3059469264486217e-06, + "loss": 0.6536, + "step": 49043 + }, + { + "epoch": 1.26, + "learning_rate": 1.305920582715458e-06, + "loss": 0.4204, + "step": 49044 + }, + { + "epoch": 1.26, + "learning_rate": 1.3058942387480647e-06, + "loss": 0.5911, + "step": 49045 + }, + { + "epoch": 1.26, + "learning_rate": 1.3058678945464627e-06, + "loss": 0.7598, + "step": 49046 + }, + { + "epoch": 1.26, + "learning_rate": 1.3058415501106712e-06, + "loss": 0.623, + "step": 49047 + }, + { + "epoch": 1.26, + "learning_rate": 1.3058152054407113e-06, + "loss": 0.5908, + "step": 49048 + }, + { + "epoch": 1.26, + "learning_rate": 1.3057888605366025e-06, + "loss": 0.7959, + "step": 49049 + }, + { + "epoch": 1.26, + "learning_rate": 1.3057625153983654e-06, + "loss": 0.7852, + "step": 49050 + }, + { + "epoch": 1.26, + "learning_rate": 1.30573617002602e-06, + "loss": 0.7349, + "step": 49051 + }, + { + "epoch": 1.26, + "learning_rate": 1.3057098244195864e-06, + "loss": 0.5991, + "step": 49052 + }, + { + "epoch": 1.26, + "learning_rate": 1.3056834785790845e-06, + "loss": 0.5908, + "step": 49053 + }, + { + "epoch": 1.26, + "learning_rate": 1.3056571325045354e-06, + "loss": 0.5037, + "step": 49054 + }, + { + "epoch": 1.26, + "learning_rate": 1.305630786195958e-06, + "loss": 0.6641, + "step": 49055 + }, + { + "epoch": 1.26, + "learning_rate": 1.3056044396533738e-06, + "loss": 0.6523, + "step": 49056 + }, + { + "epoch": 1.26, + "learning_rate": 1.3055780928768023e-06, + "loss": 0.6621, + "step": 49057 + }, + { + "epoch": 1.26, + "learning_rate": 1.3055517458662634e-06, + "loss": 0.791, + "step": 49058 + }, + { + "epoch": 1.26, + "learning_rate": 1.3055253986217775e-06, + "loss": 0.5498, + "step": 49059 + }, + { + "epoch": 1.26, + "learning_rate": 1.3054990511433653e-06, + "loss": 0.5801, + "step": 49060 + }, + { + "epoch": 1.26, + "learning_rate": 1.3054727034310464e-06, + "loss": 0.7246, + "step": 49061 + }, + { + "epoch": 1.26, + "learning_rate": 1.3054463554848408e-06, + "loss": 0.6393, + "step": 49062 + }, + { + "epoch": 1.26, + "learning_rate": 1.305420007304769e-06, + "loss": 0.6611, + "step": 49063 + }, + { + "epoch": 1.26, + "learning_rate": 1.3053936588908513e-06, + "loss": 0.6294, + "step": 49064 + }, + { + "epoch": 1.26, + "learning_rate": 1.3053673102431078e-06, + "loss": 0.7725, + "step": 49065 + }, + { + "epoch": 1.26, + "learning_rate": 1.3053409613615584e-06, + "loss": 0.5132, + "step": 49066 + }, + { + "epoch": 1.26, + "learning_rate": 1.3053146122462239e-06, + "loss": 0.6826, + "step": 49067 + }, + { + "epoch": 1.26, + "learning_rate": 1.3052882628971235e-06, + "loss": 0.6411, + "step": 49068 + }, + { + "epoch": 1.26, + "learning_rate": 1.305261913314278e-06, + "loss": 0.4893, + "step": 49069 + }, + { + "epoch": 1.26, + "learning_rate": 1.3052355634977076e-06, + "loss": 0.6196, + "step": 49070 + }, + { + "epoch": 1.26, + "learning_rate": 1.3052092134474325e-06, + "loss": 0.7246, + "step": 49071 + }, + { + "epoch": 1.26, + "learning_rate": 1.3051828631634727e-06, + "loss": 0.7695, + "step": 49072 + }, + { + "epoch": 1.26, + "learning_rate": 1.3051565126458485e-06, + "loss": 0.6206, + "step": 49073 + }, + { + "epoch": 1.26, + "learning_rate": 1.3051301618945795e-06, + "loss": 0.6846, + "step": 49074 + }, + { + "epoch": 1.26, + "learning_rate": 1.3051038109096868e-06, + "loss": 0.626, + "step": 49075 + }, + { + "epoch": 1.26, + "learning_rate": 1.3050774596911902e-06, + "loss": 0.707, + "step": 49076 + }, + { + "epoch": 1.26, + "learning_rate": 1.3050511082391095e-06, + "loss": 0.3888, + "step": 49077 + }, + { + "epoch": 1.26, + "learning_rate": 1.3050247565534653e-06, + "loss": 0.6421, + "step": 49078 + }, + { + "epoch": 1.26, + "learning_rate": 1.3049984046342777e-06, + "loss": 0.7354, + "step": 49079 + }, + { + "epoch": 1.26, + "learning_rate": 1.3049720524815669e-06, + "loss": 0.5632, + "step": 49080 + }, + { + "epoch": 1.26, + "learning_rate": 1.304945700095353e-06, + "loss": 0.7422, + "step": 49081 + }, + { + "epoch": 1.26, + "learning_rate": 1.3049193474756562e-06, + "loss": 0.6013, + "step": 49082 + }, + { + "epoch": 1.26, + "learning_rate": 1.3048929946224966e-06, + "loss": 0.748, + "step": 49083 + }, + { + "epoch": 1.26, + "learning_rate": 1.3048666415358945e-06, + "loss": 0.7129, + "step": 49084 + }, + { + "epoch": 1.26, + "learning_rate": 1.3048402882158698e-06, + "loss": 0.5762, + "step": 49085 + }, + { + "epoch": 1.26, + "learning_rate": 1.3048139346624434e-06, + "loss": 0.6934, + "step": 49086 + }, + { + "epoch": 1.26, + "learning_rate": 1.3047875808756345e-06, + "loss": 0.6553, + "step": 49087 + }, + { + "epoch": 1.26, + "learning_rate": 1.3047612268554643e-06, + "loss": 0.7793, + "step": 49088 + }, + { + "epoch": 1.26, + "learning_rate": 1.3047348726019519e-06, + "loss": 0.5293, + "step": 49089 + }, + { + "epoch": 1.26, + "learning_rate": 1.3047085181151183e-06, + "loss": 0.5693, + "step": 49090 + }, + { + "epoch": 1.26, + "learning_rate": 1.3046821633949833e-06, + "loss": 0.5615, + "step": 49091 + }, + { + "epoch": 1.26, + "learning_rate": 1.3046558084415674e-06, + "loss": 0.6538, + "step": 49092 + }, + { + "epoch": 1.26, + "learning_rate": 1.3046294532548902e-06, + "loss": 0.6758, + "step": 49093 + }, + { + "epoch": 1.26, + "learning_rate": 1.3046030978349726e-06, + "loss": 0.54, + "step": 49094 + }, + { + "epoch": 1.26, + "learning_rate": 1.3045767421818341e-06, + "loss": 0.522, + "step": 49095 + }, + { + "epoch": 1.26, + "learning_rate": 1.3045503862954955e-06, + "loss": 0.8721, + "step": 49096 + }, + { + "epoch": 1.26, + "learning_rate": 1.3045240301759763e-06, + "loss": 0.7012, + "step": 49097 + }, + { + "epoch": 1.26, + "learning_rate": 1.3044976738232973e-06, + "loss": 0.6611, + "step": 49098 + }, + { + "epoch": 1.26, + "learning_rate": 1.3044713172374784e-06, + "loss": 0.6729, + "step": 49099 + }, + { + "epoch": 1.26, + "learning_rate": 1.30444496041854e-06, + "loss": 0.7344, + "step": 49100 + }, + { + "epoch": 1.26, + "learning_rate": 1.3044186033665016e-06, + "loss": 0.5771, + "step": 49101 + }, + { + "epoch": 1.26, + "learning_rate": 1.3043922460813842e-06, + "loss": 0.5332, + "step": 49102 + }, + { + "epoch": 1.26, + "learning_rate": 1.3043658885632075e-06, + "loss": 0.8291, + "step": 49103 + }, + { + "epoch": 1.26, + "learning_rate": 1.304339530811992e-06, + "loss": 0.645, + "step": 49104 + }, + { + "epoch": 1.26, + "learning_rate": 1.3043131728277577e-06, + "loss": 0.7227, + "step": 49105 + }, + { + "epoch": 1.26, + "learning_rate": 1.3042868146105248e-06, + "loss": 0.7373, + "step": 49106 + }, + { + "epoch": 1.26, + "learning_rate": 1.3042604561603133e-06, + "loss": 0.6816, + "step": 49107 + }, + { + "epoch": 1.26, + "learning_rate": 1.3042340974771437e-06, + "loss": 0.7471, + "step": 49108 + }, + { + "epoch": 1.26, + "learning_rate": 1.3042077385610361e-06, + "loss": 0.4557, + "step": 49109 + }, + { + "epoch": 1.26, + "learning_rate": 1.3041813794120104e-06, + "loss": 0.6572, + "step": 49110 + }, + { + "epoch": 1.26, + "learning_rate": 1.3041550200300875e-06, + "loss": 0.5918, + "step": 49111 + }, + { + "epoch": 1.26, + "learning_rate": 1.3041286604152866e-06, + "loss": 0.6523, + "step": 49112 + }, + { + "epoch": 1.26, + "learning_rate": 1.3041023005676286e-06, + "loss": 0.5869, + "step": 49113 + }, + { + "epoch": 1.26, + "learning_rate": 1.304075940487133e-06, + "loss": 0.7031, + "step": 49114 + }, + { + "epoch": 1.26, + "learning_rate": 1.304049580173821e-06, + "loss": 0.8184, + "step": 49115 + }, + { + "epoch": 1.26, + "learning_rate": 1.3040232196277122e-06, + "loss": 0.9551, + "step": 49116 + }, + { + "epoch": 1.26, + "learning_rate": 1.303996858848827e-06, + "loss": 0.6685, + "step": 49117 + }, + { + "epoch": 1.26, + "learning_rate": 1.3039704978371847e-06, + "loss": 0.6289, + "step": 49118 + }, + { + "epoch": 1.26, + "learning_rate": 1.3039441365928063e-06, + "loss": 0.6675, + "step": 49119 + }, + { + "epoch": 1.26, + "learning_rate": 1.303917775115712e-06, + "loss": 0.6143, + "step": 49120 + }, + { + "epoch": 1.26, + "learning_rate": 1.3038914134059221e-06, + "loss": 0.4495, + "step": 49121 + }, + { + "epoch": 1.26, + "learning_rate": 1.303865051463456e-06, + "loss": 0.6401, + "step": 49122 + }, + { + "epoch": 1.26, + "learning_rate": 1.3038386892883348e-06, + "loss": 0.7529, + "step": 49123 + }, + { + "epoch": 1.26, + "learning_rate": 1.3038123268805781e-06, + "loss": 0.5856, + "step": 49124 + }, + { + "epoch": 1.26, + "learning_rate": 1.3037859642402063e-06, + "loss": 0.4905, + "step": 49125 + }, + { + "epoch": 1.26, + "learning_rate": 1.3037596013672398e-06, + "loss": 0.7021, + "step": 49126 + }, + { + "epoch": 1.26, + "learning_rate": 1.3037332382616982e-06, + "loss": 0.645, + "step": 49127 + }, + { + "epoch": 1.26, + "learning_rate": 1.3037068749236022e-06, + "loss": 0.5691, + "step": 49128 + }, + { + "epoch": 1.26, + "learning_rate": 1.3036805113529716e-06, + "loss": 0.6768, + "step": 49129 + }, + { + "epoch": 1.26, + "learning_rate": 1.303654147549827e-06, + "loss": 0.5083, + "step": 49130 + }, + { + "epoch": 1.26, + "learning_rate": 1.3036277835141884e-06, + "loss": 0.5393, + "step": 49131 + }, + { + "epoch": 1.26, + "learning_rate": 1.303601419246076e-06, + "loss": 0.5767, + "step": 49132 + }, + { + "epoch": 1.26, + "learning_rate": 1.3035750547455097e-06, + "loss": 0.527, + "step": 49133 + }, + { + "epoch": 1.26, + "learning_rate": 1.3035486900125104e-06, + "loss": 0.6543, + "step": 49134 + }, + { + "epoch": 1.26, + "learning_rate": 1.3035223250470972e-06, + "loss": 0.4976, + "step": 49135 + }, + { + "epoch": 1.26, + "learning_rate": 1.3034959598492913e-06, + "loss": 0.5813, + "step": 49136 + }, + { + "epoch": 1.26, + "learning_rate": 1.3034695944191125e-06, + "loss": 0.7178, + "step": 49137 + }, + { + "epoch": 1.26, + "learning_rate": 1.3034432287565808e-06, + "loss": 0.7168, + "step": 49138 + }, + { + "epoch": 1.26, + "learning_rate": 1.3034168628617167e-06, + "loss": 0.4937, + "step": 49139 + }, + { + "epoch": 1.26, + "learning_rate": 1.3033904967345403e-06, + "loss": 0.5552, + "step": 49140 + }, + { + "epoch": 1.26, + "learning_rate": 1.3033641303750717e-06, + "loss": 0.6348, + "step": 49141 + }, + { + "epoch": 1.26, + "learning_rate": 1.3033377637833314e-06, + "loss": 0.8076, + "step": 49142 + }, + { + "epoch": 1.26, + "learning_rate": 1.303311396959339e-06, + "loss": 0.6309, + "step": 49143 + }, + { + "epoch": 1.26, + "learning_rate": 1.303285029903115e-06, + "loss": 0.6934, + "step": 49144 + }, + { + "epoch": 1.26, + "learning_rate": 1.3032586626146796e-06, + "loss": 0.6252, + "step": 49145 + }, + { + "epoch": 1.26, + "learning_rate": 1.303232295094053e-06, + "loss": 0.8584, + "step": 49146 + }, + { + "epoch": 1.26, + "learning_rate": 1.3032059273412555e-06, + "loss": 0.666, + "step": 49147 + }, + { + "epoch": 1.26, + "learning_rate": 1.303179559356307e-06, + "loss": 0.665, + "step": 49148 + }, + { + "epoch": 1.26, + "learning_rate": 1.3031531911392279e-06, + "loss": 0.6465, + "step": 49149 + }, + { + "epoch": 1.26, + "learning_rate": 1.3031268226900385e-06, + "loss": 0.6064, + "step": 49150 + }, + { + "epoch": 1.26, + "learning_rate": 1.303100454008759e-06, + "loss": 0.7578, + "step": 49151 + }, + { + "epoch": 1.26, + "learning_rate": 1.303074085095409e-06, + "loss": 0.7852, + "step": 49152 + }, + { + "epoch": 1.26, + "learning_rate": 1.3030477159500093e-06, + "loss": 0.5923, + "step": 49153 + }, + { + "epoch": 1.26, + "learning_rate": 1.3030213465725797e-06, + "loss": 0.4659, + "step": 49154 + }, + { + "epoch": 1.26, + "learning_rate": 1.3029949769631405e-06, + "loss": 0.6768, + "step": 49155 + }, + { + "epoch": 1.26, + "learning_rate": 1.3029686071217123e-06, + "loss": 0.6436, + "step": 49156 + }, + { + "epoch": 1.26, + "learning_rate": 1.302942237048315e-06, + "loss": 0.7598, + "step": 49157 + }, + { + "epoch": 1.26, + "learning_rate": 1.3029158667429684e-06, + "loss": 0.6377, + "step": 49158 + }, + { + "epoch": 1.26, + "learning_rate": 1.3028894962056935e-06, + "loss": 0.6104, + "step": 49159 + }, + { + "epoch": 1.26, + "learning_rate": 1.3028631254365098e-06, + "loss": 0.585, + "step": 49160 + }, + { + "epoch": 1.26, + "learning_rate": 1.302836754435438e-06, + "loss": 0.7139, + "step": 49161 + }, + { + "epoch": 1.26, + "learning_rate": 1.3028103832024977e-06, + "loss": 0.5264, + "step": 49162 + }, + { + "epoch": 1.26, + "learning_rate": 1.3027840117377093e-06, + "loss": 0.7412, + "step": 49163 + }, + { + "epoch": 1.26, + "learning_rate": 1.3027576400410933e-06, + "loss": 0.7363, + "step": 49164 + }, + { + "epoch": 1.26, + "learning_rate": 1.30273126811267e-06, + "loss": 0.5425, + "step": 49165 + }, + { + "epoch": 1.26, + "learning_rate": 1.3027048959524586e-06, + "loss": 0.7725, + "step": 49166 + }, + { + "epoch": 1.26, + "learning_rate": 1.3026785235604804e-06, + "loss": 0.6367, + "step": 49167 + }, + { + "epoch": 1.26, + "learning_rate": 1.3026521509367552e-06, + "loss": 0.5938, + "step": 49168 + }, + { + "epoch": 1.26, + "learning_rate": 1.3026257780813032e-06, + "loss": 0.6362, + "step": 49169 + }, + { + "epoch": 1.26, + "learning_rate": 1.3025994049941441e-06, + "loss": 0.5361, + "step": 49170 + }, + { + "epoch": 1.26, + "learning_rate": 1.3025730316752993e-06, + "loss": 0.7285, + "step": 49171 + }, + { + "epoch": 1.26, + "learning_rate": 1.3025466581247877e-06, + "loss": 0.6826, + "step": 49172 + }, + { + "epoch": 1.26, + "learning_rate": 1.3025202843426302e-06, + "loss": 0.7109, + "step": 49173 + }, + { + "epoch": 1.26, + "learning_rate": 1.3024939103288467e-06, + "loss": 0.6934, + "step": 49174 + }, + { + "epoch": 1.26, + "learning_rate": 1.3024675360834575e-06, + "loss": 0.6416, + "step": 49175 + }, + { + "epoch": 1.26, + "learning_rate": 1.3024411616064831e-06, + "loss": 0.874, + "step": 49176 + }, + { + "epoch": 1.26, + "learning_rate": 1.3024147868979433e-06, + "loss": 0.6538, + "step": 49177 + }, + { + "epoch": 1.26, + "learning_rate": 1.3023884119578585e-06, + "loss": 0.6235, + "step": 49178 + }, + { + "epoch": 1.26, + "learning_rate": 1.3023620367862485e-06, + "loss": 0.5862, + "step": 49179 + }, + { + "epoch": 1.26, + "learning_rate": 1.302335661383134e-06, + "loss": 0.7231, + "step": 49180 + }, + { + "epoch": 1.26, + "learning_rate": 1.302309285748535e-06, + "loss": 0.666, + "step": 49181 + }, + { + "epoch": 1.26, + "learning_rate": 1.3022829098824717e-06, + "loss": 0.396, + "step": 49182 + }, + { + "epoch": 1.26, + "learning_rate": 1.302256533784964e-06, + "loss": 0.5596, + "step": 49183 + }, + { + "epoch": 1.26, + "learning_rate": 1.3022301574560326e-06, + "loss": 0.7832, + "step": 49184 + }, + { + "epoch": 1.26, + "learning_rate": 1.3022037808956975e-06, + "loss": 0.6104, + "step": 49185 + }, + { + "epoch": 1.26, + "learning_rate": 1.3021774041039788e-06, + "loss": 0.7686, + "step": 49186 + }, + { + "epoch": 1.26, + "learning_rate": 1.3021510270808966e-06, + "loss": 0.7285, + "step": 49187 + }, + { + "epoch": 1.26, + "learning_rate": 1.3021246498264716e-06, + "loss": 0.7705, + "step": 49188 + }, + { + "epoch": 1.26, + "learning_rate": 1.3020982723407233e-06, + "loss": 0.668, + "step": 49189 + }, + { + "epoch": 1.26, + "learning_rate": 1.3020718946236724e-06, + "loss": 0.5425, + "step": 49190 + }, + { + "epoch": 1.26, + "learning_rate": 1.302045516675339e-06, + "loss": 0.6504, + "step": 49191 + }, + { + "epoch": 1.26, + "learning_rate": 1.302019138495743e-06, + "loss": 0.6548, + "step": 49192 + }, + { + "epoch": 1.26, + "learning_rate": 1.301992760084905e-06, + "loss": 0.498, + "step": 49193 + }, + { + "epoch": 1.26, + "learning_rate": 1.301966381442845e-06, + "loss": 0.6729, + "step": 49194 + }, + { + "epoch": 1.26, + "learning_rate": 1.3019400025695835e-06, + "loss": 0.7197, + "step": 49195 + }, + { + "epoch": 1.26, + "learning_rate": 1.30191362346514e-06, + "loss": 0.561, + "step": 49196 + }, + { + "epoch": 1.26, + "learning_rate": 1.3018872441295353e-06, + "loss": 0.6309, + "step": 49197 + }, + { + "epoch": 1.26, + "learning_rate": 1.3018608645627893e-06, + "loss": 0.8154, + "step": 49198 + }, + { + "epoch": 1.26, + "learning_rate": 1.3018344847649225e-06, + "loss": 0.5786, + "step": 49199 + }, + { + "epoch": 1.26, + "learning_rate": 1.3018081047359549e-06, + "loss": 0.6084, + "step": 49200 + }, + { + "epoch": 1.26, + "learning_rate": 1.301781724475907e-06, + "loss": 0.7207, + "step": 49201 + }, + { + "epoch": 1.26, + "learning_rate": 1.3017553439847979e-06, + "loss": 0.7529, + "step": 49202 + }, + { + "epoch": 1.26, + "learning_rate": 1.3017289632626491e-06, + "loss": 0.5541, + "step": 49203 + }, + { + "epoch": 1.26, + "learning_rate": 1.3017025823094802e-06, + "loss": 0.7393, + "step": 49204 + }, + { + "epoch": 1.26, + "learning_rate": 1.3016762011253119e-06, + "loss": 0.7344, + "step": 49205 + }, + { + "epoch": 1.26, + "learning_rate": 1.3016498197101636e-06, + "loss": 0.6816, + "step": 49206 + }, + { + "epoch": 1.26, + "learning_rate": 1.301623438064056e-06, + "loss": 0.4802, + "step": 49207 + }, + { + "epoch": 1.26, + "learning_rate": 1.301597056187009e-06, + "loss": 0.6006, + "step": 49208 + }, + { + "epoch": 1.26, + "learning_rate": 1.3015706740790433e-06, + "loss": 0.6172, + "step": 49209 + }, + { + "epoch": 1.26, + "learning_rate": 1.3015442917401789e-06, + "loss": 0.5605, + "step": 49210 + }, + { + "epoch": 1.26, + "learning_rate": 1.3015179091704353e-06, + "loss": 0.6997, + "step": 49211 + }, + { + "epoch": 1.26, + "learning_rate": 1.3014915263698338e-06, + "loss": 0.4829, + "step": 49212 + }, + { + "epoch": 1.26, + "learning_rate": 1.3014651433383941e-06, + "loss": 0.7637, + "step": 49213 + }, + { + "epoch": 1.26, + "learning_rate": 1.3014387600761363e-06, + "loss": 0.6445, + "step": 49214 + }, + { + "epoch": 1.26, + "learning_rate": 1.3014123765830807e-06, + "loss": 0.6675, + "step": 49215 + }, + { + "epoch": 1.26, + "learning_rate": 1.3013859928592475e-06, + "loss": 0.751, + "step": 49216 + }, + { + "epoch": 1.26, + "learning_rate": 1.3013596089046568e-06, + "loss": 0.7734, + "step": 49217 + }, + { + "epoch": 1.26, + "learning_rate": 1.3013332247193291e-06, + "loss": 0.5808, + "step": 49218 + }, + { + "epoch": 1.26, + "learning_rate": 1.3013068403032841e-06, + "loss": 0.8223, + "step": 49219 + }, + { + "epoch": 1.26, + "learning_rate": 1.301280455656543e-06, + "loss": 0.7285, + "step": 49220 + }, + { + "epoch": 1.26, + "learning_rate": 1.3012540707791246e-06, + "loss": 0.6768, + "step": 49221 + }, + { + "epoch": 1.26, + "learning_rate": 1.30122768567105e-06, + "loss": 0.6211, + "step": 49222 + }, + { + "epoch": 1.26, + "learning_rate": 1.3012013003323393e-06, + "loss": 0.5146, + "step": 49223 + }, + { + "epoch": 1.26, + "learning_rate": 1.3011749147630123e-06, + "loss": 0.6377, + "step": 49224 + }, + { + "epoch": 1.26, + "learning_rate": 1.3011485289630902e-06, + "loss": 0.5137, + "step": 49225 + }, + { + "epoch": 1.26, + "learning_rate": 1.301122142932592e-06, + "loss": 0.428, + "step": 49226 + }, + { + "epoch": 1.26, + "learning_rate": 1.3010957566715383e-06, + "loss": 0.7441, + "step": 49227 + }, + { + "epoch": 1.26, + "learning_rate": 1.3010693701799498e-06, + "loss": 0.6416, + "step": 49228 + }, + { + "epoch": 1.26, + "learning_rate": 1.301042983457846e-06, + "loss": 0.7168, + "step": 49229 + }, + { + "epoch": 1.26, + "learning_rate": 1.3010165965052477e-06, + "loss": 0.7266, + "step": 49230 + }, + { + "epoch": 1.26, + "learning_rate": 1.300990209322175e-06, + "loss": 0.6846, + "step": 49231 + }, + { + "epoch": 1.26, + "learning_rate": 1.3009638219086477e-06, + "loss": 0.4612, + "step": 49232 + }, + { + "epoch": 1.26, + "learning_rate": 1.300937434264686e-06, + "loss": 0.6973, + "step": 49233 + }, + { + "epoch": 1.26, + "learning_rate": 1.3009110463903106e-06, + "loss": 0.7627, + "step": 49234 + }, + { + "epoch": 1.26, + "learning_rate": 1.3008846582855415e-06, + "loss": 0.6572, + "step": 49235 + }, + { + "epoch": 1.26, + "learning_rate": 1.3008582699503987e-06, + "loss": 0.6396, + "step": 49236 + }, + { + "epoch": 1.26, + "learning_rate": 1.3008318813849026e-06, + "loss": 0.7754, + "step": 49237 + }, + { + "epoch": 1.26, + "learning_rate": 1.3008054925890732e-06, + "loss": 0.7207, + "step": 49238 + }, + { + "epoch": 1.26, + "learning_rate": 1.3007791035629311e-06, + "loss": 0.7568, + "step": 49239 + }, + { + "epoch": 1.26, + "learning_rate": 1.3007527143064962e-06, + "loss": 0.7471, + "step": 49240 + }, + { + "epoch": 1.26, + "learning_rate": 1.300726324819789e-06, + "loss": 0.5903, + "step": 49241 + }, + { + "epoch": 1.26, + "learning_rate": 1.3006999351028291e-06, + "loss": 0.7051, + "step": 49242 + }, + { + "epoch": 1.26, + "learning_rate": 1.3006735451556374e-06, + "loss": 0.6719, + "step": 49243 + }, + { + "epoch": 1.26, + "learning_rate": 1.3006471549782333e-06, + "loss": 0.8047, + "step": 49244 + }, + { + "epoch": 1.26, + "learning_rate": 1.3006207645706383e-06, + "loss": 0.5334, + "step": 49245 + }, + { + "epoch": 1.26, + "learning_rate": 1.3005943739328712e-06, + "loss": 0.6582, + "step": 49246 + }, + { + "epoch": 1.26, + "learning_rate": 1.300567983064953e-06, + "loss": 0.6062, + "step": 49247 + }, + { + "epoch": 1.26, + "learning_rate": 1.3005415919669036e-06, + "loss": 0.7354, + "step": 49248 + }, + { + "epoch": 1.26, + "learning_rate": 1.3005152006387435e-06, + "loss": 0.6494, + "step": 49249 + }, + { + "epoch": 1.26, + "learning_rate": 1.3004888090804927e-06, + "loss": 0.5303, + "step": 49250 + }, + { + "epoch": 1.26, + "learning_rate": 1.3004624172921713e-06, + "loss": 0.5918, + "step": 49251 + }, + { + "epoch": 1.26, + "learning_rate": 1.3004360252737996e-06, + "loss": 0.668, + "step": 49252 + }, + { + "epoch": 1.26, + "learning_rate": 1.300409633025398e-06, + "loss": 0.5615, + "step": 49253 + }, + { + "epoch": 1.26, + "learning_rate": 1.3003832405469864e-06, + "loss": 0.6592, + "step": 49254 + }, + { + "epoch": 1.26, + "learning_rate": 1.3003568478385854e-06, + "loss": 0.6489, + "step": 49255 + }, + { + "epoch": 1.26, + "learning_rate": 1.300330454900215e-06, + "loss": 0.8018, + "step": 49256 + }, + { + "epoch": 1.26, + "learning_rate": 1.300304061731895e-06, + "loss": 0.6514, + "step": 49257 + }, + { + "epoch": 1.26, + "learning_rate": 1.3002776683336462e-06, + "loss": 0.6133, + "step": 49258 + }, + { + "epoch": 1.26, + "learning_rate": 1.3002512747054888e-06, + "loss": 0.6187, + "step": 49259 + }, + { + "epoch": 1.26, + "learning_rate": 1.3002248808474426e-06, + "loss": 0.564, + "step": 49260 + }, + { + "epoch": 1.26, + "learning_rate": 1.300198486759528e-06, + "loss": 0.6436, + "step": 49261 + }, + { + "epoch": 1.26, + "learning_rate": 1.3001720924417652e-06, + "loss": 0.6904, + "step": 49262 + }, + { + "epoch": 1.26, + "learning_rate": 1.3001456978941745e-06, + "loss": 0.6377, + "step": 49263 + }, + { + "epoch": 1.26, + "learning_rate": 1.300119303116776e-06, + "loss": 0.6802, + "step": 49264 + }, + { + "epoch": 1.26, + "learning_rate": 1.30009290810959e-06, + "loss": 0.7646, + "step": 49265 + }, + { + "epoch": 1.26, + "learning_rate": 1.3000665128726368e-06, + "loss": 0.5098, + "step": 49266 + }, + { + "epoch": 1.26, + "learning_rate": 1.300040117405936e-06, + "loss": 0.6245, + "step": 49267 + }, + { + "epoch": 1.26, + "learning_rate": 1.3000137217095088e-06, + "loss": 0.4888, + "step": 49268 + }, + { + "epoch": 1.26, + "learning_rate": 1.2999873257833745e-06, + "loss": 0.6611, + "step": 49269 + }, + { + "epoch": 1.26, + "learning_rate": 1.299960929627554e-06, + "loss": 0.6074, + "step": 49270 + }, + { + "epoch": 1.26, + "learning_rate": 1.299934533242067e-06, + "loss": 0.4646, + "step": 49271 + }, + { + "epoch": 1.26, + "learning_rate": 1.299908136626934e-06, + "loss": 0.437, + "step": 49272 + }, + { + "epoch": 1.26, + "learning_rate": 1.2998817397821752e-06, + "loss": 0.7705, + "step": 49273 + }, + { + "epoch": 1.26, + "learning_rate": 1.2998553427078104e-06, + "loss": 0.8574, + "step": 49274 + }, + { + "epoch": 1.26, + "learning_rate": 1.2998289454038608e-06, + "loss": 0.6904, + "step": 49275 + }, + { + "epoch": 1.26, + "learning_rate": 1.2998025478703457e-06, + "loss": 0.7354, + "step": 49276 + }, + { + "epoch": 1.26, + "learning_rate": 1.2997761501072853e-06, + "loss": 0.5972, + "step": 49277 + }, + { + "epoch": 1.26, + "learning_rate": 1.2997497521147e-06, + "loss": 0.5825, + "step": 49278 + }, + { + "epoch": 1.26, + "learning_rate": 1.2997233538926104e-06, + "loss": 0.4094, + "step": 49279 + }, + { + "epoch": 1.26, + "learning_rate": 1.2996969554410364e-06, + "loss": 0.7168, + "step": 49280 + }, + { + "epoch": 1.26, + "learning_rate": 1.2996705567599981e-06, + "loss": 0.668, + "step": 49281 + }, + { + "epoch": 1.26, + "learning_rate": 1.2996441578495158e-06, + "loss": 0.6782, + "step": 49282 + }, + { + "epoch": 1.26, + "learning_rate": 1.29961775870961e-06, + "loss": 0.5396, + "step": 49283 + }, + { + "epoch": 1.26, + "learning_rate": 1.2995913593403003e-06, + "loss": 0.6895, + "step": 49284 + }, + { + "epoch": 1.26, + "learning_rate": 1.299564959741608e-06, + "loss": 0.8135, + "step": 49285 + }, + { + "epoch": 1.26, + "learning_rate": 1.2995385599135517e-06, + "loss": 0.7031, + "step": 49286 + }, + { + "epoch": 1.26, + "learning_rate": 1.299512159856153e-06, + "loss": 0.6201, + "step": 49287 + }, + { + "epoch": 1.26, + "learning_rate": 1.2994857595694314e-06, + "loss": 0.6484, + "step": 49288 + }, + { + "epoch": 1.26, + "learning_rate": 1.2994593590534074e-06, + "loss": 0.6504, + "step": 49289 + }, + { + "epoch": 1.26, + "learning_rate": 1.2994329583081012e-06, + "loss": 0.575, + "step": 49290 + }, + { + "epoch": 1.26, + "learning_rate": 1.299406557333533e-06, + "loss": 0.8252, + "step": 49291 + }, + { + "epoch": 1.26, + "learning_rate": 1.2993801561297227e-06, + "loss": 0.6992, + "step": 49292 + }, + { + "epoch": 1.26, + "learning_rate": 1.299353754696691e-06, + "loss": 0.6226, + "step": 49293 + }, + { + "epoch": 1.26, + "learning_rate": 1.2993273530344577e-06, + "loss": 0.6655, + "step": 49294 + }, + { + "epoch": 1.26, + "learning_rate": 1.2993009511430435e-06, + "loss": 0.5718, + "step": 49295 + }, + { + "epoch": 1.26, + "learning_rate": 1.299274549022468e-06, + "loss": 0.6924, + "step": 49296 + }, + { + "epoch": 1.26, + "learning_rate": 1.299248146672752e-06, + "loss": 0.7007, + "step": 49297 + }, + { + "epoch": 1.26, + "learning_rate": 1.2992217440939153e-06, + "loss": 0.6455, + "step": 49298 + }, + { + "epoch": 1.26, + "learning_rate": 1.2991953412859784e-06, + "loss": 0.6777, + "step": 49299 + }, + { + "epoch": 1.26, + "learning_rate": 1.2991689382489614e-06, + "loss": 0.5281, + "step": 49300 + }, + { + "epoch": 1.26, + "learning_rate": 1.2991425349828842e-06, + "loss": 0.6689, + "step": 49301 + }, + { + "epoch": 1.26, + "learning_rate": 1.2991161314877677e-06, + "loss": 0.8564, + "step": 49302 + }, + { + "epoch": 1.26, + "learning_rate": 1.2990897277636314e-06, + "loss": 0.7168, + "step": 49303 + }, + { + "epoch": 1.26, + "learning_rate": 1.299063323810496e-06, + "loss": 0.6484, + "step": 49304 + }, + { + "epoch": 1.26, + "learning_rate": 1.2990369196283817e-06, + "loss": 0.5469, + "step": 49305 + }, + { + "epoch": 1.26, + "learning_rate": 1.2990105152173085e-06, + "loss": 0.6055, + "step": 49306 + }, + { + "epoch": 1.26, + "learning_rate": 1.2989841105772965e-06, + "loss": 0.6294, + "step": 49307 + }, + { + "epoch": 1.26, + "learning_rate": 1.2989577057083662e-06, + "loss": 0.6758, + "step": 49308 + }, + { + "epoch": 1.26, + "learning_rate": 1.2989313006105378e-06, + "loss": 0.6934, + "step": 49309 + }, + { + "epoch": 1.26, + "learning_rate": 1.2989048952838317e-06, + "loss": 0.5049, + "step": 49310 + }, + { + "epoch": 1.26, + "learning_rate": 1.2988784897282675e-06, + "loss": 0.5552, + "step": 49311 + }, + { + "epoch": 1.26, + "learning_rate": 1.2988520839438659e-06, + "loss": 0.8555, + "step": 49312 + }, + { + "epoch": 1.26, + "learning_rate": 1.2988256779306468e-06, + "loss": 0.7109, + "step": 49313 + }, + { + "epoch": 1.26, + "learning_rate": 1.298799271688631e-06, + "loss": 0.6279, + "step": 49314 + }, + { + "epoch": 1.26, + "learning_rate": 1.2987728652178383e-06, + "loss": 0.6973, + "step": 49315 + }, + { + "epoch": 1.26, + "learning_rate": 1.2987464585182888e-06, + "loss": 0.6104, + "step": 49316 + }, + { + "epoch": 1.26, + "learning_rate": 1.2987200515900027e-06, + "loss": 0.4702, + "step": 49317 + }, + { + "epoch": 1.26, + "learning_rate": 1.2986936444330005e-06, + "loss": 0.6006, + "step": 49318 + }, + { + "epoch": 1.26, + "learning_rate": 1.2986672370473023e-06, + "loss": 0.4835, + "step": 49319 + }, + { + "epoch": 1.26, + "learning_rate": 1.2986408294329284e-06, + "loss": 0.3215, + "step": 49320 + }, + { + "epoch": 1.26, + "learning_rate": 1.298614421589899e-06, + "loss": 0.5972, + "step": 49321 + }, + { + "epoch": 1.26, + "learning_rate": 1.2985880135182346e-06, + "loss": 0.833, + "step": 49322 + }, + { + "epoch": 1.26, + "learning_rate": 1.2985616052179544e-06, + "loss": 0.5291, + "step": 49323 + }, + { + "epoch": 1.26, + "learning_rate": 1.2985351966890796e-06, + "loss": 0.6055, + "step": 49324 + }, + { + "epoch": 1.26, + "learning_rate": 1.2985087879316303e-06, + "loss": 0.7832, + "step": 49325 + }, + { + "epoch": 1.26, + "learning_rate": 1.2984823789456263e-06, + "loss": 0.501, + "step": 49326 + }, + { + "epoch": 1.26, + "learning_rate": 1.298455969731088e-06, + "loss": 0.5913, + "step": 49327 + }, + { + "epoch": 1.26, + "learning_rate": 1.2984295602880359e-06, + "loss": 0.5083, + "step": 49328 + }, + { + "epoch": 1.26, + "learning_rate": 1.29840315061649e-06, + "loss": 0.6357, + "step": 49329 + }, + { + "epoch": 1.26, + "learning_rate": 1.2983767407164705e-06, + "loss": 0.7295, + "step": 49330 + }, + { + "epoch": 1.26, + "learning_rate": 1.2983503305879977e-06, + "loss": 0.5782, + "step": 49331 + }, + { + "epoch": 1.26, + "learning_rate": 1.2983239202310916e-06, + "loss": 0.8652, + "step": 49332 + }, + { + "epoch": 1.26, + "learning_rate": 1.298297509645773e-06, + "loss": 0.7461, + "step": 49333 + }, + { + "epoch": 1.26, + "learning_rate": 1.2982710988320611e-06, + "loss": 0.7266, + "step": 49334 + }, + { + "epoch": 1.26, + "learning_rate": 1.2982446877899774e-06, + "loss": 0.667, + "step": 49335 + }, + { + "epoch": 1.26, + "learning_rate": 1.298218276519541e-06, + "loss": 0.6782, + "step": 49336 + }, + { + "epoch": 1.26, + "learning_rate": 1.2981918650207726e-06, + "loss": 0.7534, + "step": 49337 + }, + { + "epoch": 1.26, + "learning_rate": 1.2981654532936922e-06, + "loss": 0.665, + "step": 49338 + }, + { + "epoch": 1.26, + "learning_rate": 1.2981390413383206e-06, + "loss": 0.5073, + "step": 49339 + }, + { + "epoch": 1.26, + "learning_rate": 1.2981126291546778e-06, + "loss": 0.647, + "step": 49340 + }, + { + "epoch": 1.26, + "learning_rate": 1.2980862167427836e-06, + "loss": 0.7886, + "step": 49341 + }, + { + "epoch": 1.26, + "learning_rate": 1.2980598041026585e-06, + "loss": 0.7578, + "step": 49342 + }, + { + "epoch": 1.26, + "learning_rate": 1.2980333912343226e-06, + "loss": 0.7461, + "step": 49343 + }, + { + "epoch": 1.26, + "learning_rate": 1.2980069781377962e-06, + "loss": 0.7676, + "step": 49344 + }, + { + "epoch": 1.26, + "learning_rate": 1.2979805648130997e-06, + "loss": 0.6621, + "step": 49345 + }, + { + "epoch": 1.26, + "learning_rate": 1.2979541512602533e-06, + "loss": 0.564, + "step": 49346 + }, + { + "epoch": 1.26, + "learning_rate": 1.2979277374792769e-06, + "loss": 0.7676, + "step": 49347 + }, + { + "epoch": 1.26, + "learning_rate": 1.2979013234701913e-06, + "loss": 0.7334, + "step": 49348 + }, + { + "epoch": 1.26, + "learning_rate": 1.297874909233016e-06, + "loss": 0.7363, + "step": 49349 + }, + { + "epoch": 1.26, + "learning_rate": 1.2978484947677717e-06, + "loss": 0.5068, + "step": 49350 + }, + { + "epoch": 1.26, + "learning_rate": 1.2978220800744783e-06, + "loss": 0.5142, + "step": 49351 + }, + { + "epoch": 1.26, + "learning_rate": 1.2977956651531566e-06, + "loss": 0.4229, + "step": 49352 + }, + { + "epoch": 1.26, + "learning_rate": 1.297769250003826e-06, + "loss": 0.5293, + "step": 49353 + }, + { + "epoch": 1.26, + "learning_rate": 1.2977428346265075e-06, + "loss": 0.7471, + "step": 49354 + }, + { + "epoch": 1.26, + "learning_rate": 1.2977164190212212e-06, + "loss": 0.7275, + "step": 49355 + }, + { + "epoch": 1.27, + "learning_rate": 1.2976900031879868e-06, + "loss": 0.7988, + "step": 49356 + }, + { + "epoch": 1.27, + "learning_rate": 1.2976635871268246e-06, + "loss": 0.6592, + "step": 49357 + }, + { + "epoch": 1.27, + "learning_rate": 1.2976371708377556e-06, + "loss": 0.4094, + "step": 49358 + }, + { + "epoch": 1.27, + "learning_rate": 1.297610754320799e-06, + "loss": 0.7241, + "step": 49359 + }, + { + "epoch": 1.27, + "learning_rate": 1.2975843375759762e-06, + "loss": 0.5532, + "step": 49360 + }, + { + "epoch": 1.27, + "learning_rate": 1.2975579206033063e-06, + "loss": 0.708, + "step": 49361 + }, + { + "epoch": 1.27, + "learning_rate": 1.29753150340281e-06, + "loss": 0.8125, + "step": 49362 + }, + { + "epoch": 1.27, + "learning_rate": 1.2975050859745076e-06, + "loss": 0.7607, + "step": 49363 + }, + { + "epoch": 1.27, + "learning_rate": 1.2974786683184191e-06, + "loss": 0.709, + "step": 49364 + }, + { + "epoch": 1.27, + "learning_rate": 1.297452250434565e-06, + "loss": 0.5603, + "step": 49365 + }, + { + "epoch": 1.27, + "learning_rate": 1.2974258323229656e-06, + "loss": 0.7104, + "step": 49366 + }, + { + "epoch": 1.27, + "learning_rate": 1.2973994139836405e-06, + "loss": 0.3921, + "step": 49367 + }, + { + "epoch": 1.27, + "learning_rate": 1.2973729954166107e-06, + "loss": 0.6846, + "step": 49368 + }, + { + "epoch": 1.27, + "learning_rate": 1.2973465766218956e-06, + "loss": 0.8145, + "step": 49369 + }, + { + "epoch": 1.27, + "learning_rate": 1.2973201575995164e-06, + "loss": 0.7402, + "step": 49370 + }, + { + "epoch": 1.27, + "learning_rate": 1.2972937383494924e-06, + "loss": 0.5532, + "step": 49371 + }, + { + "epoch": 1.27, + "learning_rate": 1.2972673188718443e-06, + "loss": 0.3977, + "step": 49372 + }, + { + "epoch": 1.27, + "learning_rate": 1.2972408991665926e-06, + "loss": 0.5698, + "step": 49373 + }, + { + "epoch": 1.27, + "learning_rate": 1.297214479233757e-06, + "loss": 0.4995, + "step": 49374 + }, + { + "epoch": 1.27, + "learning_rate": 1.2971880590733582e-06, + "loss": 0.6357, + "step": 49375 + }, + { + "epoch": 1.27, + "learning_rate": 1.297161638685416e-06, + "loss": 0.5918, + "step": 49376 + }, + { + "epoch": 1.27, + "learning_rate": 1.2971352180699506e-06, + "loss": 0.6484, + "step": 49377 + }, + { + "epoch": 1.27, + "learning_rate": 1.2971087972269825e-06, + "loss": 0.7812, + "step": 49378 + }, + { + "epoch": 1.27, + "learning_rate": 1.2970823761565322e-06, + "loss": 0.5962, + "step": 49379 + }, + { + "epoch": 1.27, + "learning_rate": 1.2970559548586192e-06, + "loss": 0.6914, + "step": 49380 + }, + { + "epoch": 1.27, + "learning_rate": 1.2970295333332644e-06, + "loss": 0.7822, + "step": 49381 + }, + { + "epoch": 1.27, + "learning_rate": 1.2970031115804873e-06, + "loss": 0.6543, + "step": 49382 + }, + { + "epoch": 1.27, + "learning_rate": 1.2969766896003088e-06, + "loss": 0.5508, + "step": 49383 + }, + { + "epoch": 1.27, + "learning_rate": 1.296950267392749e-06, + "loss": 0.7505, + "step": 49384 + }, + { + "epoch": 1.27, + "learning_rate": 1.2969238449578284e-06, + "loss": 0.5796, + "step": 49385 + }, + { + "epoch": 1.27, + "learning_rate": 1.2968974222955662e-06, + "loss": 0.7471, + "step": 49386 + }, + { + "epoch": 1.27, + "learning_rate": 1.2968709994059837e-06, + "loss": 0.6768, + "step": 49387 + }, + { + "epoch": 1.27, + "learning_rate": 1.2968445762891005e-06, + "loss": 0.424, + "step": 49388 + }, + { + "epoch": 1.27, + "learning_rate": 1.296818152944937e-06, + "loss": 0.6348, + "step": 49389 + }, + { + "epoch": 1.27, + "learning_rate": 1.2967917293735138e-06, + "loss": 0.543, + "step": 49390 + }, + { + "epoch": 1.27, + "learning_rate": 1.2967653055748504e-06, + "loss": 0.7163, + "step": 49391 + }, + { + "epoch": 1.27, + "learning_rate": 1.296738881548968e-06, + "loss": 0.7422, + "step": 49392 + }, + { + "epoch": 1.27, + "learning_rate": 1.2967124572958857e-06, + "loss": 0.6533, + "step": 49393 + }, + { + "epoch": 1.27, + "learning_rate": 1.2966860328156247e-06, + "loss": 0.6154, + "step": 49394 + }, + { + "epoch": 1.27, + "learning_rate": 1.2966596081082049e-06, + "loss": 0.6514, + "step": 49395 + }, + { + "epoch": 1.27, + "learning_rate": 1.2966331831736464e-06, + "loss": 0.603, + "step": 49396 + }, + { + "epoch": 1.27, + "learning_rate": 1.2966067580119694e-06, + "loss": 0.79, + "step": 49397 + }, + { + "epoch": 1.27, + "learning_rate": 1.2965803326231941e-06, + "loss": 0.6592, + "step": 49398 + }, + { + "epoch": 1.27, + "learning_rate": 1.296553907007341e-06, + "loss": 0.582, + "step": 49399 + }, + { + "epoch": 1.27, + "learning_rate": 1.2965274811644305e-06, + "loss": 0.749, + "step": 49400 + }, + { + "epoch": 1.27, + "learning_rate": 1.2965010550944822e-06, + "loss": 0.605, + "step": 49401 + }, + { + "epoch": 1.27, + "learning_rate": 1.2964746287975167e-06, + "loss": 0.5776, + "step": 49402 + }, + { + "epoch": 1.27, + "learning_rate": 1.2964482022735543e-06, + "loss": 0.5586, + "step": 49403 + }, + { + "epoch": 1.27, + "learning_rate": 1.2964217755226152e-06, + "loss": 0.6304, + "step": 49404 + }, + { + "epoch": 1.27, + "learning_rate": 1.2963953485447197e-06, + "loss": 0.5664, + "step": 49405 + }, + { + "epoch": 1.27, + "learning_rate": 1.2963689213398877e-06, + "loss": 0.7734, + "step": 49406 + }, + { + "epoch": 1.27, + "learning_rate": 1.2963424939081395e-06, + "loss": 0.7617, + "step": 49407 + }, + { + "epoch": 1.27, + "learning_rate": 1.2963160662494957e-06, + "loss": 0.5745, + "step": 49408 + }, + { + "epoch": 1.27, + "learning_rate": 1.296289638363976e-06, + "loss": 0.7617, + "step": 49409 + }, + { + "epoch": 1.27, + "learning_rate": 1.2962632102516013e-06, + "loss": 0.7686, + "step": 49410 + }, + { + "epoch": 1.27, + "learning_rate": 1.2962367819123916e-06, + "loss": 0.667, + "step": 49411 + }, + { + "epoch": 1.27, + "learning_rate": 1.296210353346367e-06, + "loss": 0.5186, + "step": 49412 + }, + { + "epoch": 1.27, + "learning_rate": 1.2961839245535471e-06, + "loss": 0.4419, + "step": 49413 + }, + { + "epoch": 1.27, + "learning_rate": 1.2961574955339533e-06, + "loss": 0.752, + "step": 49414 + }, + { + "epoch": 1.27, + "learning_rate": 1.2961310662876056e-06, + "loss": 0.748, + "step": 49415 + }, + { + "epoch": 1.27, + "learning_rate": 1.2961046368145235e-06, + "loss": 0.7192, + "step": 49416 + }, + { + "epoch": 1.27, + "learning_rate": 1.2960782071147279e-06, + "loss": 0.6167, + "step": 49417 + }, + { + "epoch": 1.27, + "learning_rate": 1.2960517771882385e-06, + "loss": 0.6504, + "step": 49418 + }, + { + "epoch": 1.27, + "learning_rate": 1.2960253470350762e-06, + "loss": 0.7725, + "step": 49419 + }, + { + "epoch": 1.27, + "learning_rate": 1.295998916655261e-06, + "loss": 0.533, + "step": 49420 + }, + { + "epoch": 1.27, + "learning_rate": 1.295972486048813e-06, + "loss": 0.6006, + "step": 49421 + }, + { + "epoch": 1.27, + "learning_rate": 1.295946055215752e-06, + "loss": 0.6631, + "step": 49422 + }, + { + "epoch": 1.27, + "learning_rate": 1.295919624156099e-06, + "loss": 0.5465, + "step": 49423 + }, + { + "epoch": 1.27, + "learning_rate": 1.295893192869874e-06, + "loss": 0.5757, + "step": 49424 + }, + { + "epoch": 1.27, + "learning_rate": 1.2958667613570974e-06, + "loss": 0.8027, + "step": 49425 + }, + { + "epoch": 1.27, + "learning_rate": 1.2958403296177888e-06, + "loss": 0.6816, + "step": 49426 + }, + { + "epoch": 1.27, + "learning_rate": 1.2958138976519692e-06, + "loss": 0.7231, + "step": 49427 + }, + { + "epoch": 1.27, + "learning_rate": 1.2957874654596584e-06, + "loss": 0.6445, + "step": 49428 + }, + { + "epoch": 1.27, + "learning_rate": 1.2957610330408765e-06, + "loss": 0.6475, + "step": 49429 + }, + { + "epoch": 1.27, + "learning_rate": 1.2957346003956445e-06, + "loss": 0.6621, + "step": 49430 + }, + { + "epoch": 1.27, + "learning_rate": 1.2957081675239818e-06, + "loss": 0.8262, + "step": 49431 + }, + { + "epoch": 1.27, + "learning_rate": 1.2956817344259089e-06, + "loss": 0.4218, + "step": 49432 + }, + { + "epoch": 1.27, + "learning_rate": 1.295655301101446e-06, + "loss": 0.5883, + "step": 49433 + }, + { + "epoch": 1.27, + "learning_rate": 1.2956288675506135e-06, + "loss": 0.7207, + "step": 49434 + }, + { + "epoch": 1.27, + "learning_rate": 1.2956024337734319e-06, + "loss": 0.6362, + "step": 49435 + }, + { + "epoch": 1.27, + "learning_rate": 1.295575999769921e-06, + "loss": 0.626, + "step": 49436 + }, + { + "epoch": 1.27, + "learning_rate": 1.2955495655401009e-06, + "loss": 0.6445, + "step": 49437 + }, + { + "epoch": 1.27, + "learning_rate": 1.295523131083992e-06, + "loss": 0.4246, + "step": 49438 + }, + { + "epoch": 1.27, + "learning_rate": 1.295496696401615e-06, + "loss": 0.5693, + "step": 49439 + }, + { + "epoch": 1.27, + "learning_rate": 1.2954702614929898e-06, + "loss": 0.7061, + "step": 49440 + }, + { + "epoch": 1.27, + "learning_rate": 1.2954438263581362e-06, + "loss": 0.6885, + "step": 49441 + }, + { + "epoch": 1.27, + "learning_rate": 1.2954173909970752e-06, + "loss": 0.7324, + "step": 49442 + }, + { + "epoch": 1.27, + "learning_rate": 1.2953909554098261e-06, + "loss": 0.5144, + "step": 49443 + }, + { + "epoch": 1.27, + "learning_rate": 1.2953645195964106e-06, + "loss": 0.5293, + "step": 49444 + }, + { + "epoch": 1.27, + "learning_rate": 1.2953380835568474e-06, + "loss": 0.6406, + "step": 49445 + }, + { + "epoch": 1.27, + "learning_rate": 1.2953116472911577e-06, + "loss": 0.6807, + "step": 49446 + }, + { + "epoch": 1.27, + "learning_rate": 1.2952852107993613e-06, + "loss": 0.4824, + "step": 49447 + }, + { + "epoch": 1.27, + "learning_rate": 1.2952587740814787e-06, + "loss": 0.5308, + "step": 49448 + }, + { + "epoch": 1.27, + "learning_rate": 1.2952323371375298e-06, + "loss": 0.4717, + "step": 49449 + }, + { + "epoch": 1.27, + "learning_rate": 1.2952058999675357e-06, + "loss": 0.6082, + "step": 49450 + }, + { + "epoch": 1.27, + "learning_rate": 1.2951794625715153e-06, + "loss": 0.8018, + "step": 49451 + }, + { + "epoch": 1.27, + "learning_rate": 1.29515302494949e-06, + "loss": 0.6143, + "step": 49452 + }, + { + "epoch": 1.27, + "learning_rate": 1.2951265871014793e-06, + "loss": 0.624, + "step": 49453 + }, + { + "epoch": 1.27, + "learning_rate": 1.2951001490275041e-06, + "loss": 0.626, + "step": 49454 + }, + { + "epoch": 1.27, + "learning_rate": 1.2950737107275842e-06, + "loss": 0.7598, + "step": 49455 + }, + { + "epoch": 1.27, + "learning_rate": 1.2950472722017398e-06, + "loss": 0.772, + "step": 49456 + }, + { + "epoch": 1.27, + "learning_rate": 1.2950208334499913e-06, + "loss": 0.7842, + "step": 49457 + }, + { + "epoch": 1.27, + "learning_rate": 1.294994394472359e-06, + "loss": 0.7783, + "step": 49458 + }, + { + "epoch": 1.27, + "learning_rate": 1.2949679552688627e-06, + "loss": 0.5583, + "step": 49459 + }, + { + "epoch": 1.27, + "learning_rate": 1.2949415158395232e-06, + "loss": 0.5422, + "step": 49460 + }, + { + "epoch": 1.27, + "learning_rate": 1.2949150761843609e-06, + "loss": 0.6704, + "step": 49461 + }, + { + "epoch": 1.27, + "learning_rate": 1.294888636303395e-06, + "loss": 0.647, + "step": 49462 + }, + { + "epoch": 1.27, + "learning_rate": 1.2948621961966471e-06, + "loss": 0.6548, + "step": 49463 + }, + { + "epoch": 1.27, + "learning_rate": 1.2948357558641363e-06, + "loss": 0.5269, + "step": 49464 + }, + { + "epoch": 1.27, + "learning_rate": 1.2948093153058836e-06, + "loss": 0.6982, + "step": 49465 + }, + { + "epoch": 1.27, + "learning_rate": 1.2947828745219089e-06, + "loss": 0.6299, + "step": 49466 + }, + { + "epoch": 1.27, + "learning_rate": 1.2947564335122325e-06, + "loss": 0.8164, + "step": 49467 + }, + { + "epoch": 1.27, + "learning_rate": 1.2947299922768746e-06, + "loss": 0.5, + "step": 49468 + }, + { + "epoch": 1.27, + "learning_rate": 1.2947035508158554e-06, + "loss": 0.6807, + "step": 49469 + }, + { + "epoch": 1.27, + "learning_rate": 1.2946771091291955e-06, + "loss": 0.6602, + "step": 49470 + }, + { + "epoch": 1.27, + "learning_rate": 1.294650667216915e-06, + "loss": 0.6377, + "step": 49471 + }, + { + "epoch": 1.27, + "learning_rate": 1.2946242250790336e-06, + "loss": 0.6016, + "step": 49472 + }, + { + "epoch": 1.27, + "learning_rate": 1.2945977827155722e-06, + "loss": 0.8271, + "step": 49473 + }, + { + "epoch": 1.27, + "learning_rate": 1.2945713401265506e-06, + "loss": 0.6816, + "step": 49474 + }, + { + "epoch": 1.27, + "learning_rate": 1.2945448973119897e-06, + "loss": 0.6602, + "step": 49475 + }, + { + "epoch": 1.27, + "learning_rate": 1.2945184542719089e-06, + "loss": 0.7588, + "step": 49476 + }, + { + "epoch": 1.27, + "learning_rate": 1.294492011006329e-06, + "loss": 0.665, + "step": 49477 + }, + { + "epoch": 1.27, + "learning_rate": 1.2944655675152702e-06, + "loss": 0.5972, + "step": 49478 + }, + { + "epoch": 1.27, + "learning_rate": 1.2944391237987527e-06, + "loss": 0.7056, + "step": 49479 + }, + { + "epoch": 1.27, + "learning_rate": 1.2944126798567967e-06, + "loss": 0.5708, + "step": 49480 + }, + { + "epoch": 1.27, + "learning_rate": 1.2943862356894221e-06, + "loss": 0.6074, + "step": 49481 + }, + { + "epoch": 1.27, + "learning_rate": 1.29435979129665e-06, + "loss": 0.4777, + "step": 49482 + }, + { + "epoch": 1.27, + "learning_rate": 1.2943333466784995e-06, + "loss": 0.5825, + "step": 49483 + }, + { + "epoch": 1.27, + "learning_rate": 1.2943069018349921e-06, + "loss": 0.7212, + "step": 49484 + }, + { + "epoch": 1.27, + "learning_rate": 1.294280456766147e-06, + "loss": 0.7412, + "step": 49485 + }, + { + "epoch": 1.27, + "learning_rate": 1.2942540114719856e-06, + "loss": 0.5298, + "step": 49486 + }, + { + "epoch": 1.27, + "learning_rate": 1.2942275659525268e-06, + "loss": 0.6162, + "step": 49487 + }, + { + "epoch": 1.27, + "learning_rate": 1.2942011202077917e-06, + "loss": 0.5215, + "step": 49488 + }, + { + "epoch": 1.27, + "learning_rate": 1.2941746742378001e-06, + "loss": 0.7451, + "step": 49489 + }, + { + "epoch": 1.27, + "learning_rate": 1.2941482280425728e-06, + "loss": 0.5647, + "step": 49490 + }, + { + "epoch": 1.27, + "learning_rate": 1.2941217816221296e-06, + "loss": 0.7979, + "step": 49491 + }, + { + "epoch": 1.27, + "learning_rate": 1.2940953349764908e-06, + "loss": 0.6865, + "step": 49492 + }, + { + "epoch": 1.27, + "learning_rate": 1.2940688881056765e-06, + "loss": 0.7686, + "step": 49493 + }, + { + "epoch": 1.27, + "learning_rate": 1.2940424410097078e-06, + "loss": 0.324, + "step": 49494 + }, + { + "epoch": 1.27, + "learning_rate": 1.2940159936886036e-06, + "loss": 0.6548, + "step": 49495 + }, + { + "epoch": 1.27, + "learning_rate": 1.2939895461423854e-06, + "loss": 0.5107, + "step": 49496 + }, + { + "epoch": 1.27, + "learning_rate": 1.2939630983710728e-06, + "loss": 0.6509, + "step": 49497 + }, + { + "epoch": 1.27, + "learning_rate": 1.293936650374686e-06, + "loss": 0.5732, + "step": 49498 + }, + { + "epoch": 1.27, + "learning_rate": 1.2939102021532456e-06, + "loss": 0.8467, + "step": 49499 + }, + { + "epoch": 1.27, + "learning_rate": 1.2938837537067715e-06, + "loss": 0.6182, + "step": 49500 + }, + { + "epoch": 1.27, + "learning_rate": 1.2938573050352843e-06, + "loss": 0.6353, + "step": 49501 + }, + { + "epoch": 1.27, + "learning_rate": 1.293830856138804e-06, + "loss": 0.6055, + "step": 49502 + }, + { + "epoch": 1.27, + "learning_rate": 1.293804407017351e-06, + "loss": 0.7742, + "step": 49503 + }, + { + "epoch": 1.27, + "learning_rate": 1.2937779576709456e-06, + "loss": 0.834, + "step": 49504 + }, + { + "epoch": 1.27, + "learning_rate": 1.2937515080996075e-06, + "loss": 0.7461, + "step": 49505 + }, + { + "epoch": 1.27, + "learning_rate": 1.2937250583033577e-06, + "loss": 0.7109, + "step": 49506 + }, + { + "epoch": 1.27, + "learning_rate": 1.2936986082822162e-06, + "loss": 0.7432, + "step": 49507 + }, + { + "epoch": 1.27, + "learning_rate": 1.2936721580362026e-06, + "loss": 0.4458, + "step": 49508 + }, + { + "epoch": 1.27, + "learning_rate": 1.2936457075653385e-06, + "loss": 0.5781, + "step": 49509 + }, + { + "epoch": 1.27, + "learning_rate": 1.293619256869643e-06, + "loss": 0.6196, + "step": 49510 + }, + { + "epoch": 1.27, + "learning_rate": 1.2935928059491369e-06, + "loss": 0.7021, + "step": 49511 + }, + { + "epoch": 1.27, + "learning_rate": 1.29356635480384e-06, + "loss": 0.5996, + "step": 49512 + }, + { + "epoch": 1.27, + "learning_rate": 1.293539903433773e-06, + "loss": 0.6812, + "step": 49513 + }, + { + "epoch": 1.27, + "learning_rate": 1.293513451838956e-06, + "loss": 0.625, + "step": 49514 + }, + { + "epoch": 1.27, + "learning_rate": 1.2934870000194094e-06, + "loss": 0.54, + "step": 49515 + }, + { + "epoch": 1.27, + "learning_rate": 1.293460547975153e-06, + "loss": 0.7051, + "step": 49516 + }, + { + "epoch": 1.27, + "learning_rate": 1.2934340957062075e-06, + "loss": 0.7246, + "step": 49517 + }, + { + "epoch": 1.27, + "learning_rate": 1.2934076432125928e-06, + "loss": 0.532, + "step": 49518 + }, + { + "epoch": 1.27, + "learning_rate": 1.2933811904943298e-06, + "loss": 0.8604, + "step": 49519 + }, + { + "epoch": 1.27, + "learning_rate": 1.293354737551438e-06, + "loss": 0.5762, + "step": 49520 + }, + { + "epoch": 1.27, + "learning_rate": 1.293328284383938e-06, + "loss": 0.8115, + "step": 49521 + }, + { + "epoch": 1.27, + "learning_rate": 1.29330183099185e-06, + "loss": 0.7861, + "step": 49522 + }, + { + "epoch": 1.27, + "learning_rate": 1.2932753773751946e-06, + "loss": 0.7695, + "step": 49523 + }, + { + "epoch": 1.27, + "learning_rate": 1.2932489235339915e-06, + "loss": 0.6074, + "step": 49524 + }, + { + "epoch": 1.27, + "learning_rate": 1.293222469468261e-06, + "loss": 0.5693, + "step": 49525 + }, + { + "epoch": 1.27, + "learning_rate": 1.2931960151780237e-06, + "loss": 0.8359, + "step": 49526 + }, + { + "epoch": 1.27, + "learning_rate": 1.2931695606632995e-06, + "loss": 0.667, + "step": 49527 + }, + { + "epoch": 1.27, + "learning_rate": 1.293143105924109e-06, + "loss": 0.4868, + "step": 49528 + }, + { + "epoch": 1.27, + "learning_rate": 1.2931166509604725e-06, + "loss": 0.7529, + "step": 49529 + }, + { + "epoch": 1.27, + "learning_rate": 1.29309019577241e-06, + "loss": 0.7363, + "step": 49530 + }, + { + "epoch": 1.27, + "learning_rate": 1.2930637403599415e-06, + "loss": 0.6306, + "step": 49531 + }, + { + "epoch": 1.27, + "learning_rate": 1.293037284723088e-06, + "loss": 0.7861, + "step": 49532 + }, + { + "epoch": 1.27, + "learning_rate": 1.2930108288618688e-06, + "loss": 0.5513, + "step": 49533 + }, + { + "epoch": 1.27, + "learning_rate": 1.2929843727763053e-06, + "loss": 0.7432, + "step": 49534 + }, + { + "epoch": 1.27, + "learning_rate": 1.2929579164664165e-06, + "loss": 0.623, + "step": 49535 + }, + { + "epoch": 1.27, + "learning_rate": 1.292931459932224e-06, + "loss": 0.6826, + "step": 49536 + }, + { + "epoch": 1.27, + "learning_rate": 1.2929050031737468e-06, + "loss": 0.6631, + "step": 49537 + }, + { + "epoch": 1.27, + "learning_rate": 1.2928785461910058e-06, + "loss": 0.5223, + "step": 49538 + }, + { + "epoch": 1.27, + "learning_rate": 1.2928520889840212e-06, + "loss": 0.6514, + "step": 49539 + }, + { + "epoch": 1.27, + "learning_rate": 1.2928256315528134e-06, + "loss": 0.3564, + "step": 49540 + }, + { + "epoch": 1.27, + "learning_rate": 1.2927991738974022e-06, + "loss": 0.6343, + "step": 49541 + }, + { + "epoch": 1.27, + "learning_rate": 1.2927727160178083e-06, + "loss": 0.4607, + "step": 49542 + }, + { + "epoch": 1.27, + "learning_rate": 1.2927462579140516e-06, + "loss": 0.625, + "step": 49543 + }, + { + "epoch": 1.27, + "learning_rate": 1.2927197995861528e-06, + "loss": 0.7939, + "step": 49544 + }, + { + "epoch": 1.27, + "learning_rate": 1.2926933410341318e-06, + "loss": 0.7422, + "step": 49545 + }, + { + "epoch": 1.27, + "learning_rate": 1.292666882258009e-06, + "loss": 0.5332, + "step": 49546 + }, + { + "epoch": 1.27, + "learning_rate": 1.2926404232578048e-06, + "loss": 0.585, + "step": 49547 + }, + { + "epoch": 1.27, + "learning_rate": 1.2926139640335389e-06, + "loss": 0.5479, + "step": 49548 + }, + { + "epoch": 1.27, + "learning_rate": 1.2925875045852323e-06, + "loss": 0.5505, + "step": 49549 + }, + { + "epoch": 1.27, + "learning_rate": 1.2925610449129044e-06, + "loss": 0.6768, + "step": 49550 + }, + { + "epoch": 1.27, + "learning_rate": 1.2925345850165765e-06, + "loss": 0.6665, + "step": 49551 + }, + { + "epoch": 1.27, + "learning_rate": 1.2925081248962682e-06, + "loss": 0.6553, + "step": 49552 + }, + { + "epoch": 1.27, + "learning_rate": 1.2924816645519996e-06, + "loss": 0.6304, + "step": 49553 + }, + { + "epoch": 1.27, + "learning_rate": 1.2924552039837914e-06, + "loss": 0.6631, + "step": 49554 + }, + { + "epoch": 1.27, + "learning_rate": 1.2924287431916642e-06, + "loss": 0.6895, + "step": 49555 + }, + { + "epoch": 1.27, + "learning_rate": 1.292402282175637e-06, + "loss": 0.5752, + "step": 49556 + }, + { + "epoch": 1.27, + "learning_rate": 1.2923758209357311e-06, + "loss": 0.6201, + "step": 49557 + }, + { + "epoch": 1.27, + "learning_rate": 1.2923493594719662e-06, + "loss": 0.625, + "step": 49558 + }, + { + "epoch": 1.27, + "learning_rate": 1.2923228977843636e-06, + "loss": 0.4032, + "step": 49559 + }, + { + "epoch": 1.27, + "learning_rate": 1.2922964358729422e-06, + "loss": 0.7588, + "step": 49560 + }, + { + "epoch": 1.27, + "learning_rate": 1.292269973737723e-06, + "loss": 0.6843, + "step": 49561 + }, + { + "epoch": 1.27, + "learning_rate": 1.292243511378726e-06, + "loss": 0.5923, + "step": 49562 + }, + { + "epoch": 1.27, + "learning_rate": 1.2922170487959716e-06, + "loss": 0.5894, + "step": 49563 + }, + { + "epoch": 1.27, + "learning_rate": 1.2921905859894803e-06, + "loss": 0.5356, + "step": 49564 + }, + { + "epoch": 1.27, + "learning_rate": 1.2921641229592722e-06, + "loss": 0.7754, + "step": 49565 + }, + { + "epoch": 1.27, + "learning_rate": 1.292137659705367e-06, + "loss": 0.6025, + "step": 49566 + }, + { + "epoch": 1.27, + "learning_rate": 1.2921111962277856e-06, + "loss": 0.4844, + "step": 49567 + }, + { + "epoch": 1.27, + "learning_rate": 1.2920847325265478e-06, + "loss": 0.5339, + "step": 49568 + }, + { + "epoch": 1.27, + "learning_rate": 1.2920582686016745e-06, + "loss": 0.6372, + "step": 49569 + }, + { + "epoch": 1.27, + "learning_rate": 1.292031804453186e-06, + "loss": 0.6387, + "step": 49570 + }, + { + "epoch": 1.27, + "learning_rate": 1.2920053400811015e-06, + "loss": 0.5137, + "step": 49571 + }, + { + "epoch": 1.27, + "learning_rate": 1.2919788754854422e-06, + "loss": 0.6787, + "step": 49572 + }, + { + "epoch": 1.27, + "learning_rate": 1.2919524106662279e-06, + "loss": 0.8047, + "step": 49573 + }, + { + "epoch": 1.27, + "learning_rate": 1.2919259456234794e-06, + "loss": 0.5825, + "step": 49574 + }, + { + "epoch": 1.27, + "learning_rate": 1.2918994803572165e-06, + "loss": 0.4768, + "step": 49575 + }, + { + "epoch": 1.27, + "learning_rate": 1.2918730148674594e-06, + "loss": 0.5962, + "step": 49576 + }, + { + "epoch": 1.27, + "learning_rate": 1.2918465491542287e-06, + "loss": 0.6772, + "step": 49577 + }, + { + "epoch": 1.27, + "learning_rate": 1.2918200832175447e-06, + "loss": 0.6309, + "step": 49578 + }, + { + "epoch": 1.27, + "learning_rate": 1.2917936170574275e-06, + "loss": 0.6211, + "step": 49579 + }, + { + "epoch": 1.27, + "learning_rate": 1.291767150673897e-06, + "loss": 0.6367, + "step": 49580 + }, + { + "epoch": 1.27, + "learning_rate": 1.291740684066974e-06, + "loss": 0.6562, + "step": 49581 + }, + { + "epoch": 1.27, + "learning_rate": 1.2917142172366786e-06, + "loss": 0.5259, + "step": 49582 + }, + { + "epoch": 1.27, + "learning_rate": 1.2916877501830308e-06, + "loss": 0.6968, + "step": 49583 + }, + { + "epoch": 1.27, + "learning_rate": 1.2916612829060517e-06, + "loss": 0.6802, + "step": 49584 + }, + { + "epoch": 1.27, + "learning_rate": 1.2916348154057604e-06, + "loss": 0.6572, + "step": 49585 + }, + { + "epoch": 1.27, + "learning_rate": 1.2916083476821778e-06, + "loss": 0.7061, + "step": 49586 + }, + { + "epoch": 1.27, + "learning_rate": 1.291581879735324e-06, + "loss": 0.5869, + "step": 49587 + }, + { + "epoch": 1.27, + "learning_rate": 1.2915554115652196e-06, + "loss": 0.8262, + "step": 49588 + }, + { + "epoch": 1.27, + "learning_rate": 1.2915289431718845e-06, + "loss": 0.6748, + "step": 49589 + }, + { + "epoch": 1.27, + "learning_rate": 1.291502474555339e-06, + "loss": 0.7871, + "step": 49590 + }, + { + "epoch": 1.27, + "learning_rate": 1.2914760057156039e-06, + "loss": 0.8096, + "step": 49591 + }, + { + "epoch": 1.27, + "learning_rate": 1.2914495366526988e-06, + "loss": 0.6184, + "step": 49592 + }, + { + "epoch": 1.27, + "learning_rate": 1.2914230673666439e-06, + "loss": 0.7666, + "step": 49593 + }, + { + "epoch": 1.27, + "learning_rate": 1.2913965978574602e-06, + "loss": 0.4758, + "step": 49594 + }, + { + "epoch": 1.27, + "learning_rate": 1.2913701281251674e-06, + "loss": 0.5889, + "step": 49595 + }, + { + "epoch": 1.27, + "learning_rate": 1.2913436581697856e-06, + "loss": 0.6904, + "step": 49596 + }, + { + "epoch": 1.27, + "learning_rate": 1.2913171879913356e-06, + "loss": 0.5649, + "step": 49597 + }, + { + "epoch": 1.27, + "learning_rate": 1.2912907175898372e-06, + "loss": 0.5459, + "step": 49598 + }, + { + "epoch": 1.27, + "learning_rate": 1.2912642469653115e-06, + "loss": 0.5215, + "step": 49599 + }, + { + "epoch": 1.27, + "learning_rate": 1.2912377761177774e-06, + "loss": 0.8408, + "step": 49600 + }, + { + "epoch": 1.27, + "learning_rate": 1.2912113050472564e-06, + "loss": 0.4722, + "step": 49601 + }, + { + "epoch": 1.27, + "learning_rate": 1.291184833753768e-06, + "loss": 0.686, + "step": 49602 + }, + { + "epoch": 1.27, + "learning_rate": 1.291158362237333e-06, + "loss": 0.5918, + "step": 49603 + }, + { + "epoch": 1.27, + "learning_rate": 1.2911318904979714e-06, + "loss": 0.7891, + "step": 49604 + }, + { + "epoch": 1.27, + "learning_rate": 1.2911054185357036e-06, + "loss": 0.6357, + "step": 49605 + }, + { + "epoch": 1.27, + "learning_rate": 1.2910789463505493e-06, + "loss": 0.5343, + "step": 49606 + }, + { + "epoch": 1.27, + "learning_rate": 1.2910524739425296e-06, + "loss": 0.6367, + "step": 49607 + }, + { + "epoch": 1.27, + "learning_rate": 1.2910260013116645e-06, + "loss": 0.5679, + "step": 49608 + }, + { + "epoch": 1.27, + "learning_rate": 1.2909995284579742e-06, + "loss": 0.6406, + "step": 49609 + }, + { + "epoch": 1.27, + "learning_rate": 1.2909730553814786e-06, + "loss": 0.603, + "step": 49610 + }, + { + "epoch": 1.27, + "learning_rate": 1.2909465820821986e-06, + "loss": 0.604, + "step": 49611 + }, + { + "epoch": 1.27, + "learning_rate": 1.290920108560154e-06, + "loss": 0.564, + "step": 49612 + }, + { + "epoch": 1.27, + "learning_rate": 1.2908936348153651e-06, + "loss": 0.7471, + "step": 49613 + }, + { + "epoch": 1.27, + "learning_rate": 1.2908671608478528e-06, + "loss": 0.543, + "step": 49614 + }, + { + "epoch": 1.27, + "learning_rate": 1.2908406866576364e-06, + "loss": 0.7344, + "step": 49615 + }, + { + "epoch": 1.27, + "learning_rate": 1.290814212244737e-06, + "loss": 0.6304, + "step": 49616 + }, + { + "epoch": 1.27, + "learning_rate": 1.2907877376091743e-06, + "loss": 0.665, + "step": 49617 + }, + { + "epoch": 1.27, + "learning_rate": 1.290761262750969e-06, + "loss": 0.5669, + "step": 49618 + }, + { + "epoch": 1.27, + "learning_rate": 1.2907347876701412e-06, + "loss": 0.7412, + "step": 49619 + }, + { + "epoch": 1.27, + "learning_rate": 1.290708312366711e-06, + "loss": 0.6699, + "step": 49620 + }, + { + "epoch": 1.27, + "learning_rate": 1.2906818368406986e-06, + "loss": 0.731, + "step": 49621 + }, + { + "epoch": 1.27, + "learning_rate": 1.2906553610921247e-06, + "loss": 0.6406, + "step": 49622 + }, + { + "epoch": 1.27, + "learning_rate": 1.2906288851210093e-06, + "loss": 0.5339, + "step": 49623 + }, + { + "epoch": 1.27, + "learning_rate": 1.290602408927373e-06, + "loss": 0.627, + "step": 49624 + }, + { + "epoch": 1.27, + "learning_rate": 1.2905759325112355e-06, + "loss": 0.5972, + "step": 49625 + }, + { + "epoch": 1.27, + "learning_rate": 1.2905494558726175e-06, + "loss": 0.7227, + "step": 49626 + }, + { + "epoch": 1.27, + "learning_rate": 1.2905229790115391e-06, + "loss": 0.5972, + "step": 49627 + }, + { + "epoch": 1.27, + "learning_rate": 1.2904965019280206e-06, + "loss": 0.6406, + "step": 49628 + }, + { + "epoch": 1.27, + "learning_rate": 1.2904700246220822e-06, + "loss": 0.7041, + "step": 49629 + }, + { + "epoch": 1.27, + "learning_rate": 1.2904435470937448e-06, + "loss": 0.7244, + "step": 49630 + }, + { + "epoch": 1.27, + "learning_rate": 1.2904170693430273e-06, + "loss": 0.7129, + "step": 49631 + }, + { + "epoch": 1.27, + "learning_rate": 1.2903905913699514e-06, + "loss": 0.6021, + "step": 49632 + }, + { + "epoch": 1.27, + "learning_rate": 1.2903641131745363e-06, + "loss": 0.8164, + "step": 49633 + }, + { + "epoch": 1.27, + "learning_rate": 1.290337634756803e-06, + "loss": 0.667, + "step": 49634 + }, + { + "epoch": 1.27, + "learning_rate": 1.290311156116772e-06, + "loss": 0.5796, + "step": 49635 + }, + { + "epoch": 1.27, + "learning_rate": 1.2902846772544622e-06, + "loss": 0.7119, + "step": 49636 + }, + { + "epoch": 1.27, + "learning_rate": 1.2902581981698953e-06, + "loss": 0.751, + "step": 49637 + }, + { + "epoch": 1.27, + "learning_rate": 1.2902317188630912e-06, + "loss": 0.5562, + "step": 49638 + }, + { + "epoch": 1.27, + "learning_rate": 1.2902052393340696e-06, + "loss": 0.6816, + "step": 49639 + }, + { + "epoch": 1.27, + "learning_rate": 1.2901787595828513e-06, + "loss": 0.5078, + "step": 49640 + }, + { + "epoch": 1.27, + "learning_rate": 1.2901522796094567e-06, + "loss": 0.5015, + "step": 49641 + }, + { + "epoch": 1.27, + "learning_rate": 1.2901257994139054e-06, + "loss": 0.6914, + "step": 49642 + }, + { + "epoch": 1.27, + "learning_rate": 1.2900993189962183e-06, + "loss": 0.5132, + "step": 49643 + }, + { + "epoch": 1.27, + "learning_rate": 1.2900728383564159e-06, + "loss": 0.5107, + "step": 49644 + }, + { + "epoch": 1.27, + "learning_rate": 1.2900463574945178e-06, + "loss": 0.6279, + "step": 49645 + }, + { + "epoch": 1.27, + "learning_rate": 1.2900198764105444e-06, + "loss": 0.7222, + "step": 49646 + }, + { + "epoch": 1.27, + "learning_rate": 1.289993395104516e-06, + "loss": 0.8701, + "step": 49647 + }, + { + "epoch": 1.27, + "learning_rate": 1.2899669135764532e-06, + "loss": 0.5366, + "step": 49648 + }, + { + "epoch": 1.27, + "learning_rate": 1.2899404318263765e-06, + "loss": 0.6172, + "step": 49649 + }, + { + "epoch": 1.27, + "learning_rate": 1.289913949854305e-06, + "loss": 0.7568, + "step": 49650 + }, + { + "epoch": 1.27, + "learning_rate": 1.28988746766026e-06, + "loss": 0.71, + "step": 49651 + }, + { + "epoch": 1.27, + "learning_rate": 1.2898609852442614e-06, + "loss": 0.6763, + "step": 49652 + }, + { + "epoch": 1.27, + "learning_rate": 1.2898345026063298e-06, + "loss": 0.447, + "step": 49653 + }, + { + "epoch": 1.27, + "learning_rate": 1.2898080197464854e-06, + "loss": 0.4778, + "step": 49654 + }, + { + "epoch": 1.27, + "learning_rate": 1.289781536664748e-06, + "loss": 0.7646, + "step": 49655 + }, + { + "epoch": 1.27, + "learning_rate": 1.289755053361138e-06, + "loss": 0.6582, + "step": 49656 + }, + { + "epoch": 1.27, + "learning_rate": 1.2897285698356765e-06, + "loss": 0.478, + "step": 49657 + }, + { + "epoch": 1.27, + "learning_rate": 1.2897020860883824e-06, + "loss": 0.5825, + "step": 49658 + }, + { + "epoch": 1.27, + "learning_rate": 1.2896756021192774e-06, + "loss": 0.4797, + "step": 49659 + }, + { + "epoch": 1.27, + "learning_rate": 1.2896491179283808e-06, + "loss": 0.6191, + "step": 49660 + }, + { + "epoch": 1.27, + "learning_rate": 1.2896226335157132e-06, + "loss": 0.3131, + "step": 49661 + }, + { + "epoch": 1.27, + "learning_rate": 1.2895961488812947e-06, + "loss": 0.6387, + "step": 49662 + }, + { + "epoch": 1.27, + "learning_rate": 1.289569664025146e-06, + "loss": 0.6787, + "step": 49663 + }, + { + "epoch": 1.27, + "learning_rate": 1.2895431789472872e-06, + "loss": 0.4617, + "step": 49664 + }, + { + "epoch": 1.27, + "learning_rate": 1.2895166936477384e-06, + "loss": 0.6035, + "step": 49665 + }, + { + "epoch": 1.27, + "learning_rate": 1.28949020812652e-06, + "loss": 0.7207, + "step": 49666 + }, + { + "epoch": 1.27, + "learning_rate": 1.289463722383652e-06, + "loss": 0.6028, + "step": 49667 + }, + { + "epoch": 1.27, + "learning_rate": 1.2894372364191552e-06, + "loss": 0.7812, + "step": 49668 + }, + { + "epoch": 1.27, + "learning_rate": 1.2894107502330496e-06, + "loss": 0.6807, + "step": 49669 + }, + { + "epoch": 1.27, + "learning_rate": 1.2893842638253555e-06, + "loss": 0.5029, + "step": 49670 + }, + { + "epoch": 1.27, + "learning_rate": 1.2893577771960931e-06, + "loss": 0.6938, + "step": 49671 + }, + { + "epoch": 1.27, + "learning_rate": 1.289331290345283e-06, + "loss": 0.3943, + "step": 49672 + }, + { + "epoch": 1.27, + "learning_rate": 1.2893048032729448e-06, + "loss": 0.6602, + "step": 49673 + }, + { + "epoch": 1.27, + "learning_rate": 1.2892783159790997e-06, + "loss": 0.6055, + "step": 49674 + }, + { + "epoch": 1.27, + "learning_rate": 1.289251828463767e-06, + "loss": 0.6738, + "step": 49675 + }, + { + "epoch": 1.27, + "learning_rate": 1.2892253407269678e-06, + "loss": 0.7314, + "step": 49676 + }, + { + "epoch": 1.27, + "learning_rate": 1.289198852768722e-06, + "loss": 0.4062, + "step": 49677 + }, + { + "epoch": 1.27, + "learning_rate": 1.2891723645890498e-06, + "loss": 0.6562, + "step": 49678 + }, + { + "epoch": 1.27, + "learning_rate": 1.289145876187972e-06, + "loss": 0.7383, + "step": 49679 + }, + { + "epoch": 1.27, + "learning_rate": 1.289119387565508e-06, + "loss": 0.7549, + "step": 49680 + }, + { + "epoch": 1.27, + "learning_rate": 1.2890928987216788e-06, + "loss": 0.6091, + "step": 49681 + }, + { + "epoch": 1.27, + "learning_rate": 1.2890664096565044e-06, + "loss": 0.6689, + "step": 49682 + }, + { + "epoch": 1.27, + "learning_rate": 1.289039920370005e-06, + "loss": 0.4302, + "step": 49683 + }, + { + "epoch": 1.27, + "learning_rate": 1.2890134308622015e-06, + "loss": 0.5381, + "step": 49684 + }, + { + "epoch": 1.27, + "learning_rate": 1.2889869411331134e-06, + "loss": 0.6157, + "step": 49685 + }, + { + "epoch": 1.27, + "learning_rate": 1.2889604511827612e-06, + "loss": 0.7178, + "step": 49686 + }, + { + "epoch": 1.27, + "learning_rate": 1.2889339610111653e-06, + "loss": 0.7969, + "step": 49687 + }, + { + "epoch": 1.27, + "learning_rate": 1.288907470618346e-06, + "loss": 0.7881, + "step": 49688 + }, + { + "epoch": 1.27, + "learning_rate": 1.2888809800043238e-06, + "loss": 0.5476, + "step": 49689 + }, + { + "epoch": 1.27, + "learning_rate": 1.2888544891691184e-06, + "loss": 0.6826, + "step": 49690 + }, + { + "epoch": 1.27, + "learning_rate": 1.2888279981127506e-06, + "loss": 0.708, + "step": 49691 + }, + { + "epoch": 1.27, + "learning_rate": 1.2888015068352404e-06, + "loss": 0.7373, + "step": 49692 + }, + { + "epoch": 1.27, + "learning_rate": 1.2887750153366079e-06, + "loss": 0.7646, + "step": 49693 + }, + { + "epoch": 1.27, + "learning_rate": 1.288748523616874e-06, + "loss": 0.6641, + "step": 49694 + }, + { + "epoch": 1.27, + "learning_rate": 1.2887220316760585e-06, + "loss": 0.7598, + "step": 49695 + }, + { + "epoch": 1.27, + "learning_rate": 1.2886955395141819e-06, + "loss": 0.6611, + "step": 49696 + }, + { + "epoch": 1.27, + "learning_rate": 1.2886690471312642e-06, + "loss": 0.6953, + "step": 49697 + }, + { + "epoch": 1.27, + "learning_rate": 1.2886425545273261e-06, + "loss": 0.5742, + "step": 49698 + }, + { + "epoch": 1.27, + "learning_rate": 1.2886160617023878e-06, + "loss": 0.7126, + "step": 49699 + }, + { + "epoch": 1.27, + "learning_rate": 1.2885895686564688e-06, + "loss": 0.7197, + "step": 49700 + }, + { + "epoch": 1.27, + "learning_rate": 1.288563075389591e-06, + "loss": 0.7607, + "step": 49701 + }, + { + "epoch": 1.27, + "learning_rate": 1.288536581901773e-06, + "loss": 0.7466, + "step": 49702 + }, + { + "epoch": 1.27, + "learning_rate": 1.288510088193036e-06, + "loss": 0.6616, + "step": 49703 + }, + { + "epoch": 1.27, + "learning_rate": 1.2884835942634e-06, + "loss": 0.6416, + "step": 49704 + }, + { + "epoch": 1.27, + "learning_rate": 1.2884571001128854e-06, + "loss": 0.5771, + "step": 49705 + }, + { + "epoch": 1.27, + "learning_rate": 1.2884306057415127e-06, + "loss": 0.7158, + "step": 49706 + }, + { + "epoch": 1.27, + "learning_rate": 1.2884041111493016e-06, + "loss": 0.7363, + "step": 49707 + }, + { + "epoch": 1.27, + "learning_rate": 1.2883776163362729e-06, + "loss": 0.8809, + "step": 49708 + }, + { + "epoch": 1.27, + "learning_rate": 1.2883511213024467e-06, + "loss": 0.6084, + "step": 49709 + }, + { + "epoch": 1.27, + "learning_rate": 1.2883246260478436e-06, + "loss": 0.5723, + "step": 49710 + }, + { + "epoch": 1.27, + "learning_rate": 1.2882981305724831e-06, + "loss": 0.793, + "step": 49711 + }, + { + "epoch": 1.27, + "learning_rate": 1.2882716348763863e-06, + "loss": 0.7373, + "step": 49712 + }, + { + "epoch": 1.27, + "learning_rate": 1.288245138959573e-06, + "loss": 0.6377, + "step": 49713 + }, + { + "epoch": 1.27, + "learning_rate": 1.2882186428220638e-06, + "loss": 0.5889, + "step": 49714 + }, + { + "epoch": 1.27, + "learning_rate": 1.2881921464638788e-06, + "loss": 0.7451, + "step": 49715 + }, + { + "epoch": 1.27, + "learning_rate": 1.2881656498850383e-06, + "loss": 0.6963, + "step": 49716 + }, + { + "epoch": 1.27, + "learning_rate": 1.2881391530855622e-06, + "loss": 0.6099, + "step": 49717 + }, + { + "epoch": 1.27, + "learning_rate": 1.2881126560654718e-06, + "loss": 0.7178, + "step": 49718 + }, + { + "epoch": 1.27, + "learning_rate": 1.2880861588247867e-06, + "loss": 0.6621, + "step": 49719 + }, + { + "epoch": 1.27, + "learning_rate": 1.2880596613635274e-06, + "loss": 0.6724, + "step": 49720 + }, + { + "epoch": 1.27, + "learning_rate": 1.2880331636817134e-06, + "loss": 0.5742, + "step": 49721 + }, + { + "epoch": 1.27, + "learning_rate": 1.2880066657793662e-06, + "loss": 0.6631, + "step": 49722 + }, + { + "epoch": 1.27, + "learning_rate": 1.2879801676565051e-06, + "loss": 0.7344, + "step": 49723 + }, + { + "epoch": 1.27, + "learning_rate": 1.2879536693131514e-06, + "loss": 0.6738, + "step": 49724 + }, + { + "epoch": 1.27, + "learning_rate": 1.2879271707493246e-06, + "loss": 0.593, + "step": 49725 + }, + { + "epoch": 1.27, + "learning_rate": 1.287900671965045e-06, + "loss": 0.7969, + "step": 49726 + }, + { + "epoch": 1.27, + "learning_rate": 1.2878741729603332e-06, + "loss": 0.792, + "step": 49727 + }, + { + "epoch": 1.27, + "learning_rate": 1.2878476737352096e-06, + "loss": 0.6572, + "step": 49728 + }, + { + "epoch": 1.27, + "learning_rate": 1.2878211742896943e-06, + "loss": 0.7041, + "step": 49729 + }, + { + "epoch": 1.27, + "learning_rate": 1.287794674623807e-06, + "loss": 0.6675, + "step": 49730 + }, + { + "epoch": 1.27, + "learning_rate": 1.2877681747375691e-06, + "loss": 0.7412, + "step": 49731 + }, + { + "epoch": 1.27, + "learning_rate": 1.2877416746309999e-06, + "loss": 0.5791, + "step": 49732 + }, + { + "epoch": 1.27, + "learning_rate": 1.2877151743041206e-06, + "loss": 0.5928, + "step": 49733 + }, + { + "epoch": 1.27, + "learning_rate": 1.2876886737569508e-06, + "loss": 0.7656, + "step": 49734 + }, + { + "epoch": 1.27, + "learning_rate": 1.2876621729895113e-06, + "loss": 0.7637, + "step": 49735 + }, + { + "epoch": 1.27, + "learning_rate": 1.2876356720018215e-06, + "loss": 0.6108, + "step": 49736 + }, + { + "epoch": 1.27, + "learning_rate": 1.2876091707939028e-06, + "loss": 0.8789, + "step": 49737 + }, + { + "epoch": 1.27, + "learning_rate": 1.2875826693657745e-06, + "loss": 0.707, + "step": 49738 + }, + { + "epoch": 1.27, + "learning_rate": 1.287556167717458e-06, + "loss": 0.4795, + "step": 49739 + }, + { + "epoch": 1.27, + "learning_rate": 1.2875296658489725e-06, + "loss": 0.7422, + "step": 49740 + }, + { + "epoch": 1.27, + "learning_rate": 1.2875031637603388e-06, + "loss": 0.6218, + "step": 49741 + }, + { + "epoch": 1.27, + "learning_rate": 1.2874766614515773e-06, + "loss": 0.5718, + "step": 49742 + }, + { + "epoch": 1.27, + "learning_rate": 1.287450158922708e-06, + "loss": 0.5576, + "step": 49743 + }, + { + "epoch": 1.27, + "learning_rate": 1.2874236561737514e-06, + "loss": 0.5449, + "step": 49744 + }, + { + "epoch": 1.27, + "learning_rate": 1.2873971532047278e-06, + "loss": 0.6826, + "step": 49745 + }, + { + "epoch": 1.28, + "learning_rate": 1.2873706500156574e-06, + "loss": 0.7773, + "step": 49746 + }, + { + "epoch": 1.28, + "learning_rate": 1.2873441466065605e-06, + "loss": 0.75, + "step": 49747 + }, + { + "epoch": 1.28, + "learning_rate": 1.2873176429774572e-06, + "loss": 0.6318, + "step": 49748 + }, + { + "epoch": 1.28, + "learning_rate": 1.2872911391283681e-06, + "loss": 0.7598, + "step": 49749 + }, + { + "epoch": 1.28, + "learning_rate": 1.2872646350593136e-06, + "loss": 0.5991, + "step": 49750 + }, + { + "epoch": 1.28, + "learning_rate": 1.2872381307703135e-06, + "loss": 0.4819, + "step": 49751 + }, + { + "epoch": 1.28, + "learning_rate": 1.2872116262613886e-06, + "loss": 0.5859, + "step": 49752 + }, + { + "epoch": 1.28, + "learning_rate": 1.2871851215325587e-06, + "loss": 0.7891, + "step": 49753 + }, + { + "epoch": 1.28, + "learning_rate": 1.2871586165838445e-06, + "loss": 0.666, + "step": 49754 + }, + { + "epoch": 1.28, + "learning_rate": 1.287132111415266e-06, + "loss": 0.6582, + "step": 49755 + }, + { + "epoch": 1.28, + "learning_rate": 1.2871056060268439e-06, + "loss": 0.6025, + "step": 49756 + }, + { + "epoch": 1.28, + "learning_rate": 1.287079100418598e-06, + "loss": 0.7744, + "step": 49757 + }, + { + "epoch": 1.28, + "learning_rate": 1.287052594590549e-06, + "loss": 0.5859, + "step": 49758 + }, + { + "epoch": 1.28, + "learning_rate": 1.2870260885427172e-06, + "loss": 0.6421, + "step": 49759 + }, + { + "epoch": 1.28, + "learning_rate": 1.2869995822751225e-06, + "loss": 0.8018, + "step": 49760 + }, + { + "epoch": 1.28, + "learning_rate": 1.2869730757877853e-06, + "loss": 0.6431, + "step": 49761 + }, + { + "epoch": 1.28, + "learning_rate": 1.2869465690807262e-06, + "loss": 0.75, + "step": 49762 + }, + { + "epoch": 1.28, + "learning_rate": 1.286920062153965e-06, + "loss": 0.7363, + "step": 49763 + }, + { + "epoch": 1.28, + "learning_rate": 1.286893555007523e-06, + "loss": 0.625, + "step": 49764 + }, + { + "epoch": 1.28, + "learning_rate": 1.2868670476414192e-06, + "loss": 0.6636, + "step": 49765 + }, + { + "epoch": 1.28, + "learning_rate": 1.2868405400556746e-06, + "loss": 0.7002, + "step": 49766 + }, + { + "epoch": 1.28, + "learning_rate": 1.2868140322503094e-06, + "loss": 0.5559, + "step": 49767 + }, + { + "epoch": 1.28, + "learning_rate": 1.286787524225344e-06, + "loss": 0.6738, + "step": 49768 + }, + { + "epoch": 1.28, + "learning_rate": 1.2867610159807986e-06, + "loss": 0.6934, + "step": 49769 + }, + { + "epoch": 1.28, + "learning_rate": 1.286734507516693e-06, + "loss": 0.54, + "step": 49770 + }, + { + "epoch": 1.28, + "learning_rate": 1.2867079988330485e-06, + "loss": 0.6631, + "step": 49771 + }, + { + "epoch": 1.28, + "learning_rate": 1.2866814899298848e-06, + "loss": 0.6289, + "step": 49772 + }, + { + "epoch": 1.28, + "learning_rate": 1.286654980807222e-06, + "loss": 0.5378, + "step": 49773 + }, + { + "epoch": 1.28, + "learning_rate": 1.2866284714650807e-06, + "loss": 0.5537, + "step": 49774 + }, + { + "epoch": 1.28, + "learning_rate": 1.2866019619034817e-06, + "loss": 0.8145, + "step": 49775 + }, + { + "epoch": 1.28, + "learning_rate": 1.286575452122444e-06, + "loss": 0.6689, + "step": 49776 + }, + { + "epoch": 1.28, + "learning_rate": 1.286548942121989e-06, + "loss": 0.6719, + "step": 49777 + }, + { + "epoch": 1.28, + "learning_rate": 1.2865224319021365e-06, + "loss": 0.4871, + "step": 49778 + }, + { + "epoch": 1.28, + "learning_rate": 1.2864959214629073e-06, + "loss": 0.6719, + "step": 49779 + }, + { + "epoch": 1.28, + "learning_rate": 1.286469410804321e-06, + "loss": 0.6685, + "step": 49780 + }, + { + "epoch": 1.28, + "learning_rate": 1.2864428999263988e-06, + "loss": 0.6738, + "step": 49781 + }, + { + "epoch": 1.28, + "learning_rate": 1.2864163888291597e-06, + "loss": 0.5723, + "step": 49782 + }, + { + "epoch": 1.28, + "learning_rate": 1.286389877512625e-06, + "loss": 0.5361, + "step": 49783 + }, + { + "epoch": 1.28, + "learning_rate": 1.2863633659768152e-06, + "loss": 0.4668, + "step": 49784 + }, + { + "epoch": 1.28, + "learning_rate": 1.2863368542217496e-06, + "loss": 0.5688, + "step": 49785 + }, + { + "epoch": 1.28, + "learning_rate": 1.2863103422474491e-06, + "loss": 0.8076, + "step": 49786 + }, + { + "epoch": 1.28, + "learning_rate": 1.286283830053934e-06, + "loss": 0.6357, + "step": 49787 + }, + { + "epoch": 1.28, + "learning_rate": 1.2862573176412248e-06, + "loss": 0.6621, + "step": 49788 + }, + { + "epoch": 1.28, + "learning_rate": 1.2862308050093414e-06, + "loss": 0.6963, + "step": 49789 + }, + { + "epoch": 1.28, + "learning_rate": 1.2862042921583039e-06, + "loss": 0.4126, + "step": 49790 + }, + { + "epoch": 1.28, + "learning_rate": 1.2861777790881332e-06, + "loss": 0.6396, + "step": 49791 + }, + { + "epoch": 1.28, + "learning_rate": 1.286151265798849e-06, + "loss": 0.5747, + "step": 49792 + }, + { + "epoch": 1.28, + "learning_rate": 1.2861247522904724e-06, + "loss": 0.4932, + "step": 49793 + }, + { + "epoch": 1.28, + "learning_rate": 1.286098238563023e-06, + "loss": 0.752, + "step": 49794 + }, + { + "epoch": 1.28, + "learning_rate": 1.2860717246165214e-06, + "loss": 0.7275, + "step": 49795 + }, + { + "epoch": 1.28, + "learning_rate": 1.2860452104509878e-06, + "loss": 0.6875, + "step": 49796 + }, + { + "epoch": 1.28, + "learning_rate": 1.2860186960664424e-06, + "loss": 0.6084, + "step": 49797 + }, + { + "epoch": 1.28, + "learning_rate": 1.2859921814629062e-06, + "loss": 0.6357, + "step": 49798 + }, + { + "epoch": 1.28, + "learning_rate": 1.2859656666403984e-06, + "loss": 0.6064, + "step": 49799 + }, + { + "epoch": 1.28, + "learning_rate": 1.28593915159894e-06, + "loss": 0.5889, + "step": 49800 + }, + { + "epoch": 1.28, + "learning_rate": 1.285912636338551e-06, + "loss": 0.7715, + "step": 49801 + }, + { + "epoch": 1.28, + "learning_rate": 1.285886120859252e-06, + "loss": 0.5679, + "step": 49802 + }, + { + "epoch": 1.28, + "learning_rate": 1.2858596051610633e-06, + "loss": 0.7705, + "step": 49803 + }, + { + "epoch": 1.28, + "learning_rate": 1.2858330892440049e-06, + "loss": 0.6284, + "step": 49804 + }, + { + "epoch": 1.28, + "learning_rate": 1.285806573108097e-06, + "loss": 0.8154, + "step": 49805 + }, + { + "epoch": 1.28, + "learning_rate": 1.2857800567533603e-06, + "loss": 0.5837, + "step": 49806 + }, + { + "epoch": 1.28, + "learning_rate": 1.2857535401798148e-06, + "loss": 0.6807, + "step": 49807 + }, + { + "epoch": 1.28, + "learning_rate": 1.2857270233874815e-06, + "loss": 0.4802, + "step": 49808 + }, + { + "epoch": 1.28, + "learning_rate": 1.2857005063763797e-06, + "loss": 0.6543, + "step": 49809 + }, + { + "epoch": 1.28, + "learning_rate": 1.2856739891465302e-06, + "loss": 0.7222, + "step": 49810 + }, + { + "epoch": 1.28, + "learning_rate": 1.2856474716979532e-06, + "loss": 0.6914, + "step": 49811 + }, + { + "epoch": 1.28, + "learning_rate": 1.2856209540306694e-06, + "loss": 0.7461, + "step": 49812 + }, + { + "epoch": 1.28, + "learning_rate": 1.2855944361446984e-06, + "loss": 0.6636, + "step": 49813 + }, + { + "epoch": 1.28, + "learning_rate": 1.285567918040061e-06, + "loss": 0.6221, + "step": 49814 + }, + { + "epoch": 1.28, + "learning_rate": 1.2855413997167774e-06, + "loss": 0.4624, + "step": 49815 + }, + { + "epoch": 1.28, + "learning_rate": 1.2855148811748677e-06, + "loss": 0.5581, + "step": 49816 + }, + { + "epoch": 1.28, + "learning_rate": 1.2854883624143526e-06, + "loss": 0.6094, + "step": 49817 + }, + { + "epoch": 1.28, + "learning_rate": 1.2854618434352525e-06, + "loss": 0.7402, + "step": 49818 + }, + { + "epoch": 1.28, + "learning_rate": 1.285435324237587e-06, + "loss": 0.6216, + "step": 49819 + }, + { + "epoch": 1.28, + "learning_rate": 1.2854088048213767e-06, + "loss": 0.6816, + "step": 49820 + }, + { + "epoch": 1.28, + "learning_rate": 1.285382285186642e-06, + "loss": 0.5857, + "step": 49821 + }, + { + "epoch": 1.28, + "learning_rate": 1.2853557653334033e-06, + "loss": 0.6709, + "step": 49822 + }, + { + "epoch": 1.28, + "learning_rate": 1.285329245261681e-06, + "loss": 0.6147, + "step": 49823 + }, + { + "epoch": 1.28, + "learning_rate": 1.2853027249714953e-06, + "loss": 0.4081, + "step": 49824 + }, + { + "epoch": 1.28, + "learning_rate": 1.2852762044628663e-06, + "loss": 0.5205, + "step": 49825 + }, + { + "epoch": 1.28, + "learning_rate": 1.285249683735814e-06, + "loss": 0.7876, + "step": 49826 + }, + { + "epoch": 1.28, + "learning_rate": 1.2852231627903596e-06, + "loss": 0.7324, + "step": 49827 + }, + { + "epoch": 1.28, + "learning_rate": 1.2851966416265227e-06, + "loss": 0.4612, + "step": 49828 + }, + { + "epoch": 1.28, + "learning_rate": 1.2851701202443241e-06, + "loss": 0.3921, + "step": 49829 + }, + { + "epoch": 1.28, + "learning_rate": 1.2851435986437835e-06, + "loss": 0.7734, + "step": 49830 + }, + { + "epoch": 1.28, + "learning_rate": 1.2851170768249219e-06, + "loss": 0.5693, + "step": 49831 + }, + { + "epoch": 1.28, + "learning_rate": 1.2850905547877589e-06, + "loss": 0.6699, + "step": 49832 + }, + { + "epoch": 1.28, + "learning_rate": 1.2850640325323155e-06, + "loss": 0.394, + "step": 49833 + }, + { + "epoch": 1.28, + "learning_rate": 1.2850375100586118e-06, + "loss": 0.5972, + "step": 49834 + }, + { + "epoch": 1.28, + "learning_rate": 1.2850109873666678e-06, + "loss": 0.5542, + "step": 49835 + }, + { + "epoch": 1.28, + "learning_rate": 1.2849844644565035e-06, + "loss": 0.6157, + "step": 49836 + }, + { + "epoch": 1.28, + "learning_rate": 1.2849579413281403e-06, + "loss": 0.6855, + "step": 49837 + }, + { + "epoch": 1.28, + "learning_rate": 1.284931417981598e-06, + "loss": 0.6787, + "step": 49838 + }, + { + "epoch": 1.28, + "learning_rate": 1.2849048944168962e-06, + "loss": 0.6121, + "step": 49839 + }, + { + "epoch": 1.28, + "learning_rate": 1.2848783706340563e-06, + "loss": 0.5029, + "step": 49840 + }, + { + "epoch": 1.28, + "learning_rate": 1.284851846633098e-06, + "loss": 0.6777, + "step": 49841 + }, + { + "epoch": 1.28, + "learning_rate": 1.2848253224140417e-06, + "loss": 0.5457, + "step": 49842 + }, + { + "epoch": 1.28, + "learning_rate": 1.284798797976908e-06, + "loss": 0.6792, + "step": 49843 + }, + { + "epoch": 1.28, + "learning_rate": 1.2847722733217167e-06, + "loss": 0.6387, + "step": 49844 + }, + { + "epoch": 1.28, + "learning_rate": 1.2847457484484882e-06, + "loss": 0.7607, + "step": 49845 + }, + { + "epoch": 1.28, + "learning_rate": 1.2847192233572433e-06, + "loss": 0.666, + "step": 49846 + }, + { + "epoch": 1.28, + "learning_rate": 1.2846926980480017e-06, + "loss": 0.6318, + "step": 49847 + }, + { + "epoch": 1.28, + "learning_rate": 1.2846661725207845e-06, + "loss": 0.7119, + "step": 49848 + }, + { + "epoch": 1.28, + "learning_rate": 1.2846396467756111e-06, + "loss": 0.5203, + "step": 49849 + }, + { + "epoch": 1.28, + "learning_rate": 1.2846131208125025e-06, + "loss": 0.5244, + "step": 49850 + }, + { + "epoch": 1.28, + "learning_rate": 1.2845865946314783e-06, + "loss": 0.5896, + "step": 49851 + }, + { + "epoch": 1.28, + "learning_rate": 1.2845600682325594e-06, + "loss": 0.6904, + "step": 49852 + }, + { + "epoch": 1.28, + "learning_rate": 1.284533541615766e-06, + "loss": 0.5938, + "step": 49853 + }, + { + "epoch": 1.28, + "learning_rate": 1.2845070147811185e-06, + "loss": 0.6582, + "step": 49854 + }, + { + "epoch": 1.28, + "learning_rate": 1.2844804877286368e-06, + "loss": 0.5713, + "step": 49855 + }, + { + "epoch": 1.28, + "learning_rate": 1.2844539604583416e-06, + "loss": 0.5635, + "step": 49856 + }, + { + "epoch": 1.28, + "learning_rate": 1.2844274329702529e-06, + "loss": 0.7539, + "step": 49857 + }, + { + "epoch": 1.28, + "learning_rate": 1.2844009052643913e-06, + "loss": 0.7617, + "step": 49858 + }, + { + "epoch": 1.28, + "learning_rate": 1.284374377340777e-06, + "loss": 0.5737, + "step": 49859 + }, + { + "epoch": 1.28, + "learning_rate": 1.2843478491994305e-06, + "loss": 0.6855, + "step": 49860 + }, + { + "epoch": 1.28, + "learning_rate": 1.2843213208403716e-06, + "loss": 0.6768, + "step": 49861 + }, + { + "epoch": 1.28, + "learning_rate": 1.2842947922636213e-06, + "loss": 0.8887, + "step": 49862 + }, + { + "epoch": 1.28, + "learning_rate": 1.2842682634691992e-06, + "loss": 0.5845, + "step": 49863 + }, + { + "epoch": 1.28, + "learning_rate": 1.2842417344571262e-06, + "loss": 0.5557, + "step": 49864 + }, + { + "epoch": 1.28, + "learning_rate": 1.2842152052274221e-06, + "loss": 0.7861, + "step": 49865 + }, + { + "epoch": 1.28, + "learning_rate": 1.2841886757801076e-06, + "loss": 0.4514, + "step": 49866 + }, + { + "epoch": 1.28, + "learning_rate": 1.2841621461152033e-06, + "loss": 0.4895, + "step": 49867 + }, + { + "epoch": 1.28, + "learning_rate": 1.2841356162327288e-06, + "loss": 0.7759, + "step": 49868 + }, + { + "epoch": 1.28, + "learning_rate": 1.284109086132705e-06, + "loss": 0.627, + "step": 49869 + }, + { + "epoch": 1.28, + "learning_rate": 1.2840825558151513e-06, + "loss": 0.7148, + "step": 49870 + }, + { + "epoch": 1.28, + "learning_rate": 1.2840560252800892e-06, + "loss": 0.7725, + "step": 49871 + }, + { + "epoch": 1.28, + "learning_rate": 1.284029494527538e-06, + "loss": 0.5452, + "step": 49872 + }, + { + "epoch": 1.28, + "learning_rate": 1.2840029635575192e-06, + "loss": 0.8066, + "step": 49873 + }, + { + "epoch": 1.28, + "learning_rate": 1.2839764323700517e-06, + "loss": 0.7764, + "step": 49874 + }, + { + "epoch": 1.28, + "learning_rate": 1.2839499009651566e-06, + "loss": 0.6753, + "step": 49875 + }, + { + "epoch": 1.28, + "learning_rate": 1.2839233693428542e-06, + "loss": 0.5427, + "step": 49876 + }, + { + "epoch": 1.28, + "learning_rate": 1.2838968375031649e-06, + "loss": 0.7754, + "step": 49877 + }, + { + "epoch": 1.28, + "learning_rate": 1.2838703054461086e-06, + "loss": 0.5815, + "step": 49878 + }, + { + "epoch": 1.28, + "learning_rate": 1.2838437731717062e-06, + "loss": 0.5015, + "step": 49879 + }, + { + "epoch": 1.28, + "learning_rate": 1.2838172406799773e-06, + "loss": 0.47, + "step": 49880 + }, + { + "epoch": 1.28, + "learning_rate": 1.2837907079709428e-06, + "loss": 0.4756, + "step": 49881 + }, + { + "epoch": 1.28, + "learning_rate": 1.2837641750446226e-06, + "loss": 0.6943, + "step": 49882 + }, + { + "epoch": 1.28, + "learning_rate": 1.2837376419010376e-06, + "loss": 0.5991, + "step": 49883 + }, + { + "epoch": 1.28, + "learning_rate": 1.2837111085402075e-06, + "loss": 0.6172, + "step": 49884 + }, + { + "epoch": 1.28, + "learning_rate": 1.2836845749621528e-06, + "loss": 0.8359, + "step": 49885 + }, + { + "epoch": 1.28, + "learning_rate": 1.283658041166894e-06, + "loss": 0.5288, + "step": 49886 + }, + { + "epoch": 1.28, + "learning_rate": 1.283631507154451e-06, + "loss": 0.6914, + "step": 49887 + }, + { + "epoch": 1.28, + "learning_rate": 1.283604972924845e-06, + "loss": 0.6387, + "step": 49888 + }, + { + "epoch": 1.28, + "learning_rate": 1.283578438478095e-06, + "loss": 0.5308, + "step": 49889 + }, + { + "epoch": 1.28, + "learning_rate": 1.2835519038142225e-06, + "loss": 0.6431, + "step": 49890 + }, + { + "epoch": 1.28, + "learning_rate": 1.2835253689332471e-06, + "loss": 0.6768, + "step": 49891 + }, + { + "epoch": 1.28, + "learning_rate": 1.2834988338351895e-06, + "loss": 0.6968, + "step": 49892 + }, + { + "epoch": 1.28, + "learning_rate": 1.28347229852007e-06, + "loss": 0.6943, + "step": 49893 + }, + { + "epoch": 1.28, + "learning_rate": 1.2834457629879086e-06, + "loss": 0.7607, + "step": 49894 + }, + { + "epoch": 1.28, + "learning_rate": 1.2834192272387257e-06, + "loss": 0.7256, + "step": 49895 + }, + { + "epoch": 1.28, + "learning_rate": 1.2833926912725419e-06, + "loss": 0.5615, + "step": 49896 + }, + { + "epoch": 1.28, + "learning_rate": 1.283366155089377e-06, + "loss": 0.6772, + "step": 49897 + }, + { + "epoch": 1.28, + "learning_rate": 1.2833396186892525e-06, + "loss": 0.6592, + "step": 49898 + }, + { + "epoch": 1.28, + "learning_rate": 1.2833130820721872e-06, + "loss": 0.5435, + "step": 49899 + }, + { + "epoch": 1.28, + "learning_rate": 1.2832865452382022e-06, + "loss": 0.7461, + "step": 49900 + }, + { + "epoch": 1.28, + "learning_rate": 1.2832600081873178e-06, + "loss": 0.6357, + "step": 49901 + }, + { + "epoch": 1.28, + "learning_rate": 1.2832334709195541e-06, + "loss": 0.7031, + "step": 49902 + }, + { + "epoch": 1.28, + "learning_rate": 1.2832069334349318e-06, + "loss": 0.7686, + "step": 49903 + }, + { + "epoch": 1.28, + "learning_rate": 1.2831803957334706e-06, + "loss": 0.5229, + "step": 49904 + }, + { + "epoch": 1.28, + "learning_rate": 1.2831538578151918e-06, + "loss": 0.6611, + "step": 49905 + }, + { + "epoch": 1.28, + "learning_rate": 1.2831273196801145e-06, + "loss": 0.5488, + "step": 49906 + }, + { + "epoch": 1.28, + "learning_rate": 1.28310078132826e-06, + "loss": 0.6577, + "step": 49907 + }, + { + "epoch": 1.28, + "learning_rate": 1.283074242759648e-06, + "loss": 0.5508, + "step": 49908 + }, + { + "epoch": 1.28, + "learning_rate": 1.2830477039742992e-06, + "loss": 0.8721, + "step": 49909 + }, + { + "epoch": 1.28, + "learning_rate": 1.2830211649722337e-06, + "loss": 0.6919, + "step": 49910 + }, + { + "epoch": 1.28, + "learning_rate": 1.2829946257534721e-06, + "loss": 0.8428, + "step": 49911 + }, + { + "epoch": 1.28, + "learning_rate": 1.2829680863180343e-06, + "loss": 0.5513, + "step": 49912 + }, + { + "epoch": 1.28, + "learning_rate": 1.2829415466659413e-06, + "loss": 0.6396, + "step": 49913 + }, + { + "epoch": 1.28, + "learning_rate": 1.2829150067972124e-06, + "loss": 0.5923, + "step": 49914 + }, + { + "epoch": 1.28, + "learning_rate": 1.2828884667118688e-06, + "loss": 0.6934, + "step": 49915 + }, + { + "epoch": 1.28, + "learning_rate": 1.2828619264099303e-06, + "loss": 0.5366, + "step": 49916 + }, + { + "epoch": 1.28, + "learning_rate": 1.2828353858914176e-06, + "loss": 0.455, + "step": 49917 + }, + { + "epoch": 1.28, + "learning_rate": 1.2828088451563509e-06, + "loss": 0.623, + "step": 49918 + }, + { + "epoch": 1.28, + "learning_rate": 1.2827823042047503e-06, + "loss": 0.71, + "step": 49919 + }, + { + "epoch": 1.28, + "learning_rate": 1.2827557630366363e-06, + "loss": 0.7852, + "step": 49920 + }, + { + "epoch": 1.28, + "learning_rate": 1.2827292216520293e-06, + "loss": 0.6753, + "step": 49921 + }, + { + "epoch": 1.28, + "learning_rate": 1.2827026800509495e-06, + "loss": 0.7461, + "step": 49922 + }, + { + "epoch": 1.28, + "learning_rate": 1.2826761382334171e-06, + "loss": 0.6675, + "step": 49923 + }, + { + "epoch": 1.28, + "learning_rate": 1.282649596199453e-06, + "loss": 0.748, + "step": 49924 + }, + { + "epoch": 1.28, + "learning_rate": 1.282623053949077e-06, + "loss": 0.5815, + "step": 49925 + }, + { + "epoch": 1.28, + "learning_rate": 1.2825965114823092e-06, + "loss": 0.708, + "step": 49926 + }, + { + "epoch": 1.28, + "learning_rate": 1.2825699687991704e-06, + "loss": 0.5786, + "step": 49927 + }, + { + "epoch": 1.28, + "learning_rate": 1.282543425899681e-06, + "loss": 0.4429, + "step": 49928 + }, + { + "epoch": 1.28, + "learning_rate": 1.2825168827838609e-06, + "loss": 0.7998, + "step": 49929 + }, + { + "epoch": 1.28, + "learning_rate": 1.2824903394517303e-06, + "loss": 0.8447, + "step": 49930 + }, + { + "epoch": 1.28, + "learning_rate": 1.2824637959033103e-06, + "loss": 0.5669, + "step": 49931 + }, + { + "epoch": 1.28, + "learning_rate": 1.2824372521386204e-06, + "loss": 0.5723, + "step": 49932 + }, + { + "epoch": 1.28, + "learning_rate": 1.2824107081576816e-06, + "loss": 0.8623, + "step": 49933 + }, + { + "epoch": 1.28, + "learning_rate": 1.282384163960514e-06, + "loss": 0.7285, + "step": 49934 + }, + { + "epoch": 1.28, + "learning_rate": 1.2823576195471372e-06, + "loss": 0.4231, + "step": 49935 + }, + { + "epoch": 1.28, + "learning_rate": 1.2823310749175728e-06, + "loss": 0.6484, + "step": 49936 + }, + { + "epoch": 1.28, + "learning_rate": 1.28230453007184e-06, + "loss": 0.5164, + "step": 49937 + }, + { + "epoch": 1.28, + "learning_rate": 1.2822779850099603e-06, + "loss": 0.6992, + "step": 49938 + }, + { + "epoch": 1.28, + "learning_rate": 1.2822514397319526e-06, + "loss": 0.7793, + "step": 49939 + }, + { + "epoch": 1.28, + "learning_rate": 1.2822248942378385e-06, + "loss": 0.4881, + "step": 49940 + }, + { + "epoch": 1.28, + "learning_rate": 1.282198348527637e-06, + "loss": 0.5269, + "step": 49941 + }, + { + "epoch": 1.28, + "learning_rate": 1.2821718026013699e-06, + "loss": 0.6719, + "step": 49942 + }, + { + "epoch": 1.28, + "learning_rate": 1.2821452564590567e-06, + "loss": 0.6318, + "step": 49943 + }, + { + "epoch": 1.28, + "learning_rate": 1.2821187101007178e-06, + "loss": 0.7061, + "step": 49944 + }, + { + "epoch": 1.28, + "learning_rate": 1.2820921635263734e-06, + "loss": 0.6992, + "step": 49945 + }, + { + "epoch": 1.28, + "learning_rate": 1.2820656167360445e-06, + "loss": 0.6565, + "step": 49946 + }, + { + "epoch": 1.28, + "learning_rate": 1.2820390697297504e-06, + "loss": 0.6592, + "step": 49947 + }, + { + "epoch": 1.28, + "learning_rate": 1.282012522507512e-06, + "loss": 0.6597, + "step": 49948 + }, + { + "epoch": 1.28, + "learning_rate": 1.2819859750693498e-06, + "loss": 0.6982, + "step": 49949 + }, + { + "epoch": 1.28, + "learning_rate": 1.2819594274152836e-06, + "loss": 0.645, + "step": 49950 + }, + { + "epoch": 1.28, + "learning_rate": 1.2819328795453345e-06, + "loss": 0.7402, + "step": 49951 + }, + { + "epoch": 1.28, + "learning_rate": 1.2819063314595223e-06, + "loss": 0.8701, + "step": 49952 + }, + { + "epoch": 1.28, + "learning_rate": 1.2818797831578672e-06, + "loss": 0.6465, + "step": 49953 + }, + { + "epoch": 1.28, + "learning_rate": 1.2818532346403895e-06, + "loss": 0.5757, + "step": 49954 + }, + { + "epoch": 1.28, + "learning_rate": 1.28182668590711e-06, + "loss": 0.6147, + "step": 49955 + }, + { + "epoch": 1.28, + "learning_rate": 1.2818001369580485e-06, + "loss": 0.8213, + "step": 49956 + }, + { + "epoch": 1.28, + "learning_rate": 1.2817735877932258e-06, + "loss": 0.8105, + "step": 49957 + }, + { + "epoch": 1.28, + "learning_rate": 1.281747038412662e-06, + "loss": 0.605, + "step": 49958 + }, + { + "epoch": 1.28, + "learning_rate": 1.2817204888163777e-06, + "loss": 0.6611, + "step": 49959 + }, + { + "epoch": 1.28, + "learning_rate": 1.2816939390043926e-06, + "loss": 0.7173, + "step": 49960 + }, + { + "epoch": 1.28, + "learning_rate": 1.2816673889767275e-06, + "loss": 0.8154, + "step": 49961 + }, + { + "epoch": 1.28, + "learning_rate": 1.2816408387334025e-06, + "loss": 0.7832, + "step": 49962 + }, + { + "epoch": 1.28, + "learning_rate": 1.2816142882744388e-06, + "loss": 0.5881, + "step": 49963 + }, + { + "epoch": 1.28, + "learning_rate": 1.2815877375998552e-06, + "loss": 0.7051, + "step": 49964 + }, + { + "epoch": 1.28, + "learning_rate": 1.281561186709673e-06, + "loss": 0.8047, + "step": 49965 + }, + { + "epoch": 1.28, + "learning_rate": 1.2815346356039124e-06, + "loss": 0.6016, + "step": 49966 + }, + { + "epoch": 1.28, + "learning_rate": 1.2815080842825935e-06, + "loss": 0.7529, + "step": 49967 + }, + { + "epoch": 1.28, + "learning_rate": 1.2814815327457372e-06, + "loss": 0.7275, + "step": 49968 + }, + { + "epoch": 1.28, + "learning_rate": 1.2814549809933633e-06, + "loss": 0.4721, + "step": 49969 + }, + { + "epoch": 1.28, + "learning_rate": 1.281428429025492e-06, + "loss": 0.7812, + "step": 49970 + }, + { + "epoch": 1.28, + "learning_rate": 1.281401876842144e-06, + "loss": 0.6235, + "step": 49971 + }, + { + "epoch": 1.28, + "learning_rate": 1.2813753244433394e-06, + "loss": 0.8057, + "step": 49972 + }, + { + "epoch": 1.28, + "learning_rate": 1.281348771829099e-06, + "loss": 0.5473, + "step": 49973 + }, + { + "epoch": 1.28, + "learning_rate": 1.2813222189994426e-06, + "loss": 0.5754, + "step": 49974 + }, + { + "epoch": 1.28, + "learning_rate": 1.2812956659543905e-06, + "loss": 0.4833, + "step": 49975 + }, + { + "epoch": 1.28, + "learning_rate": 1.2812691126939636e-06, + "loss": 0.6782, + "step": 49976 + }, + { + "epoch": 1.28, + "learning_rate": 1.2812425592181817e-06, + "loss": 0.6738, + "step": 49977 + }, + { + "epoch": 1.28, + "learning_rate": 1.2812160055270655e-06, + "loss": 0.5659, + "step": 49978 + }, + { + "epoch": 1.28, + "learning_rate": 1.2811894516206349e-06, + "loss": 0.623, + "step": 49979 + }, + { + "epoch": 1.28, + "learning_rate": 1.2811628974989106e-06, + "loss": 0.8408, + "step": 49980 + }, + { + "epoch": 1.28, + "learning_rate": 1.2811363431619126e-06, + "loss": 0.8096, + "step": 49981 + }, + { + "epoch": 1.28, + "learning_rate": 1.2811097886096617e-06, + "loss": 0.8076, + "step": 49982 + }, + { + "epoch": 1.28, + "learning_rate": 1.2810832338421777e-06, + "loss": 0.6675, + "step": 49983 + }, + { + "epoch": 1.28, + "learning_rate": 1.2810566788594815e-06, + "loss": 0.543, + "step": 49984 + }, + { + "epoch": 1.28, + "learning_rate": 1.2810301236615929e-06, + "loss": 0.8611, + "step": 49985 + }, + { + "epoch": 1.28, + "learning_rate": 1.2810035682485325e-06, + "loss": 0.7012, + "step": 49986 + }, + { + "epoch": 1.28, + "learning_rate": 1.2809770126203205e-06, + "loss": 0.6611, + "step": 49987 + }, + { + "epoch": 1.28, + "learning_rate": 1.2809504567769778e-06, + "loss": 0.6826, + "step": 49988 + }, + { + "epoch": 1.28, + "learning_rate": 1.2809239007185236e-06, + "loss": 0.7729, + "step": 49989 + }, + { + "epoch": 1.28, + "learning_rate": 1.280897344444979e-06, + "loss": 0.7529, + "step": 49990 + }, + { + "epoch": 1.28, + "learning_rate": 1.2808707879563645e-06, + "loss": 0.6372, + "step": 49991 + }, + { + "epoch": 1.28, + "learning_rate": 1.2808442312527001e-06, + "loss": 0.5225, + "step": 49992 + }, + { + "epoch": 1.28, + "learning_rate": 1.2808176743340063e-06, + "loss": 0.7949, + "step": 49993 + }, + { + "epoch": 1.28, + "learning_rate": 1.2807911172003027e-06, + "loss": 0.7002, + "step": 49994 + }, + { + "epoch": 1.28, + "learning_rate": 1.280764559851611e-06, + "loss": 0.5776, + "step": 49995 + }, + { + "epoch": 1.28, + "learning_rate": 1.2807380022879502e-06, + "loss": 0.8691, + "step": 49996 + }, + { + "epoch": 1.28, + "learning_rate": 1.2807114445093413e-06, + "loss": 0.6455, + "step": 49997 + }, + { + "epoch": 1.28, + "learning_rate": 1.280684886515805e-06, + "loss": 0.6733, + "step": 49998 + }, + { + "epoch": 1.28, + "learning_rate": 1.280658328307361e-06, + "loss": 0.6438, + "step": 49999 + }, + { + "epoch": 1.28, + "learning_rate": 1.2806317698840297e-06, + "loss": 0.4318, + "step": 50000 + }, + { + "epoch": 1.28, + "learning_rate": 1.2806052112458316e-06, + "loss": 0.6055, + "step": 50001 + }, + { + "epoch": 1.28, + "learning_rate": 1.2805786523927869e-06, + "loss": 0.6123, + "step": 50002 + }, + { + "epoch": 1.28, + "learning_rate": 1.2805520933249164e-06, + "loss": 0.5898, + "step": 50003 + }, + { + "epoch": 1.28, + "learning_rate": 1.2805255340422396e-06, + "loss": 0.5688, + "step": 50004 + }, + { + "epoch": 1.28, + "learning_rate": 1.2804989745447777e-06, + "loss": 0.7178, + "step": 50005 + }, + { + "epoch": 1.28, + "learning_rate": 1.2804724148325503e-06, + "loss": 0.6289, + "step": 50006 + }, + { + "epoch": 1.28, + "learning_rate": 1.2804458549055781e-06, + "loss": 0.564, + "step": 50007 + }, + { + "epoch": 1.28, + "learning_rate": 1.2804192947638816e-06, + "loss": 0.5579, + "step": 50008 + }, + { + "epoch": 1.28, + "learning_rate": 1.280392734407481e-06, + "loss": 0.6895, + "step": 50009 + }, + { + "epoch": 1.28, + "learning_rate": 1.2803661738363962e-06, + "loss": 0.6567, + "step": 50010 + }, + { + "epoch": 1.28, + "learning_rate": 1.2803396130506484e-06, + "loss": 0.7397, + "step": 50011 + }, + { + "epoch": 1.28, + "learning_rate": 1.280313052050257e-06, + "loss": 0.6379, + "step": 50012 + }, + { + "epoch": 1.28, + "learning_rate": 1.2802864908352428e-06, + "loss": 0.7109, + "step": 50013 + }, + { + "epoch": 1.28, + "learning_rate": 1.2802599294056264e-06, + "loss": 0.7236, + "step": 50014 + }, + { + "epoch": 1.28, + "learning_rate": 1.2802333677614278e-06, + "loss": 0.4922, + "step": 50015 + }, + { + "epoch": 1.28, + "learning_rate": 1.2802068059026674e-06, + "loss": 0.7051, + "step": 50016 + }, + { + "epoch": 1.28, + "learning_rate": 1.2801802438293654e-06, + "loss": 0.7998, + "step": 50017 + }, + { + "epoch": 1.28, + "learning_rate": 1.2801536815415423e-06, + "loss": 0.6426, + "step": 50018 + }, + { + "epoch": 1.28, + "learning_rate": 1.2801271190392185e-06, + "loss": 0.5845, + "step": 50019 + }, + { + "epoch": 1.28, + "learning_rate": 1.2801005563224141e-06, + "loss": 0.7568, + "step": 50020 + }, + { + "epoch": 1.28, + "learning_rate": 1.2800739933911495e-06, + "loss": 0.6973, + "step": 50021 + }, + { + "epoch": 1.28, + "learning_rate": 1.2800474302454455e-06, + "loss": 0.7236, + "step": 50022 + }, + { + "epoch": 1.28, + "learning_rate": 1.280020866885322e-06, + "loss": 0.8506, + "step": 50023 + }, + { + "epoch": 1.28, + "learning_rate": 1.2799943033107993e-06, + "loss": 0.8008, + "step": 50024 + }, + { + "epoch": 1.28, + "learning_rate": 1.2799677395218974e-06, + "loss": 0.603, + "step": 50025 + }, + { + "epoch": 1.28, + "learning_rate": 1.2799411755186378e-06, + "loss": 0.6621, + "step": 50026 + }, + { + "epoch": 1.28, + "learning_rate": 1.2799146113010395e-06, + "loss": 0.6377, + "step": 50027 + }, + { + "epoch": 1.28, + "learning_rate": 1.279888046869124e-06, + "loss": 0.6543, + "step": 50028 + }, + { + "epoch": 1.28, + "learning_rate": 1.2798614822229108e-06, + "loss": 0.5801, + "step": 50029 + }, + { + "epoch": 1.28, + "learning_rate": 1.2798349173624206e-06, + "loss": 0.5425, + "step": 50030 + }, + { + "epoch": 1.28, + "learning_rate": 1.2798083522876734e-06, + "loss": 0.709, + "step": 50031 + }, + { + "epoch": 1.28, + "learning_rate": 1.2797817869986902e-06, + "loss": 0.4893, + "step": 50032 + }, + { + "epoch": 1.28, + "learning_rate": 1.2797552214954907e-06, + "loss": 0.6509, + "step": 50033 + }, + { + "epoch": 1.28, + "learning_rate": 1.2797286557780958e-06, + "loss": 0.7119, + "step": 50034 + }, + { + "epoch": 1.28, + "learning_rate": 1.2797020898465252e-06, + "loss": 0.583, + "step": 50035 + }, + { + "epoch": 1.28, + "learning_rate": 1.2796755237007997e-06, + "loss": 0.708, + "step": 50036 + }, + { + "epoch": 1.28, + "learning_rate": 1.2796489573409393e-06, + "loss": 0.6382, + "step": 50037 + }, + { + "epoch": 1.28, + "learning_rate": 1.2796223907669647e-06, + "loss": 0.6763, + "step": 50038 + }, + { + "epoch": 1.28, + "learning_rate": 1.2795958239788965e-06, + "loss": 0.5918, + "step": 50039 + }, + { + "epoch": 1.28, + "learning_rate": 1.279569256976754e-06, + "loss": 0.7559, + "step": 50040 + }, + { + "epoch": 1.28, + "learning_rate": 1.2795426897605587e-06, + "loss": 0.5422, + "step": 50041 + }, + { + "epoch": 1.28, + "learning_rate": 1.27951612233033e-06, + "loss": 0.6523, + "step": 50042 + }, + { + "epoch": 1.28, + "learning_rate": 1.2794895546860889e-06, + "loss": 0.6226, + "step": 50043 + }, + { + "epoch": 1.28, + "learning_rate": 1.2794629868278553e-06, + "loss": 0.7617, + "step": 50044 + }, + { + "epoch": 1.28, + "learning_rate": 1.27943641875565e-06, + "loss": 0.6875, + "step": 50045 + }, + { + "epoch": 1.28, + "learning_rate": 1.2794098504694927e-06, + "loss": 0.79, + "step": 50046 + }, + { + "epoch": 1.28, + "learning_rate": 1.2793832819694044e-06, + "loss": 0.7734, + "step": 50047 + }, + { + "epoch": 1.28, + "learning_rate": 1.2793567132554052e-06, + "loss": 0.7744, + "step": 50048 + }, + { + "epoch": 1.28, + "learning_rate": 1.2793301443275155e-06, + "loss": 0.4707, + "step": 50049 + }, + { + "epoch": 1.28, + "learning_rate": 1.2793035751857553e-06, + "loss": 0.7441, + "step": 50050 + }, + { + "epoch": 1.28, + "learning_rate": 1.2792770058301451e-06, + "loss": 0.7266, + "step": 50051 + }, + { + "epoch": 1.28, + "learning_rate": 1.2792504362607055e-06, + "loss": 0.7637, + "step": 50052 + }, + { + "epoch": 1.28, + "learning_rate": 1.2792238664774572e-06, + "loss": 0.4741, + "step": 50053 + }, + { + "epoch": 1.28, + "learning_rate": 1.2791972964804192e-06, + "loss": 0.792, + "step": 50054 + }, + { + "epoch": 1.28, + "learning_rate": 1.2791707262696132e-06, + "loss": 0.7295, + "step": 50055 + }, + { + "epoch": 1.28, + "learning_rate": 1.2791441558450587e-06, + "loss": 0.6138, + "step": 50056 + }, + { + "epoch": 1.28, + "learning_rate": 1.2791175852067765e-06, + "loss": 0.7197, + "step": 50057 + }, + { + "epoch": 1.28, + "learning_rate": 1.279091014354787e-06, + "loss": 0.5908, + "step": 50058 + }, + { + "epoch": 1.28, + "learning_rate": 1.2790644432891098e-06, + "loss": 0.6147, + "step": 50059 + }, + { + "epoch": 1.28, + "learning_rate": 1.2790378720097662e-06, + "loss": 0.7842, + "step": 50060 + }, + { + "epoch": 1.28, + "learning_rate": 1.279011300516776e-06, + "loss": 0.6582, + "step": 50061 + }, + { + "epoch": 1.28, + "learning_rate": 1.2789847288101595e-06, + "loss": 0.7891, + "step": 50062 + }, + { + "epoch": 1.28, + "learning_rate": 1.2789581568899377e-06, + "loss": 0.5898, + "step": 50063 + }, + { + "epoch": 1.28, + "learning_rate": 1.2789315847561302e-06, + "loss": 0.7461, + "step": 50064 + }, + { + "epoch": 1.28, + "learning_rate": 1.2789050124087575e-06, + "loss": 0.6641, + "step": 50065 + }, + { + "epoch": 1.28, + "learning_rate": 1.2788784398478404e-06, + "loss": 0.498, + "step": 50066 + }, + { + "epoch": 1.28, + "learning_rate": 1.2788518670733983e-06, + "loss": 0.7939, + "step": 50067 + }, + { + "epoch": 1.28, + "learning_rate": 1.2788252940854527e-06, + "loss": 0.7988, + "step": 50068 + }, + { + "epoch": 1.28, + "learning_rate": 1.2787987208840233e-06, + "loss": 0.4325, + "step": 50069 + }, + { + "epoch": 1.28, + "learning_rate": 1.2787721474691305e-06, + "loss": 0.7939, + "step": 50070 + }, + { + "epoch": 1.28, + "learning_rate": 1.2787455738407943e-06, + "loss": 0.8105, + "step": 50071 + }, + { + "epoch": 1.28, + "learning_rate": 1.278718999999036e-06, + "loss": 0.6348, + "step": 50072 + }, + { + "epoch": 1.28, + "learning_rate": 1.2786924259438752e-06, + "loss": 0.7617, + "step": 50073 + }, + { + "epoch": 1.28, + "learning_rate": 1.2786658516753324e-06, + "loss": 0.7773, + "step": 50074 + }, + { + "epoch": 1.28, + "learning_rate": 1.2786392771934278e-06, + "loss": 0.7295, + "step": 50075 + }, + { + "epoch": 1.28, + "learning_rate": 1.278612702498182e-06, + "loss": 0.8125, + "step": 50076 + }, + { + "epoch": 1.28, + "learning_rate": 1.2785861275896153e-06, + "loss": 0.6606, + "step": 50077 + }, + { + "epoch": 1.28, + "learning_rate": 1.2785595524677485e-06, + "loss": 0.8027, + "step": 50078 + }, + { + "epoch": 1.28, + "learning_rate": 1.2785329771326005e-06, + "loss": 0.7734, + "step": 50079 + }, + { + "epoch": 1.28, + "learning_rate": 1.2785064015841933e-06, + "loss": 0.7319, + "step": 50080 + }, + { + "epoch": 1.28, + "learning_rate": 1.2784798258225462e-06, + "loss": 0.6514, + "step": 50081 + }, + { + "epoch": 1.28, + "learning_rate": 1.2784532498476801e-06, + "loss": 0.4204, + "step": 50082 + }, + { + "epoch": 1.28, + "learning_rate": 1.2784266736596153e-06, + "loss": 0.752, + "step": 50083 + }, + { + "epoch": 1.28, + "learning_rate": 1.2784000972583715e-06, + "loss": 0.549, + "step": 50084 + }, + { + "epoch": 1.28, + "learning_rate": 1.27837352064397e-06, + "loss": 0.5698, + "step": 50085 + }, + { + "epoch": 1.28, + "learning_rate": 1.2783469438164303e-06, + "loss": 0.6758, + "step": 50086 + }, + { + "epoch": 1.28, + "learning_rate": 1.2783203667757736e-06, + "loss": 0.5828, + "step": 50087 + }, + { + "epoch": 1.28, + "learning_rate": 1.2782937895220193e-06, + "loss": 0.7695, + "step": 50088 + }, + { + "epoch": 1.28, + "learning_rate": 1.2782672120551888e-06, + "loss": 0.6943, + "step": 50089 + }, + { + "epoch": 1.28, + "learning_rate": 1.2782406343753014e-06, + "loss": 0.5405, + "step": 50090 + }, + { + "epoch": 1.28, + "learning_rate": 1.2782140564823783e-06, + "loss": 0.5186, + "step": 50091 + }, + { + "epoch": 1.28, + "learning_rate": 1.2781874783764394e-06, + "loss": 0.6074, + "step": 50092 + }, + { + "epoch": 1.28, + "learning_rate": 1.278160900057505e-06, + "loss": 0.4954, + "step": 50093 + }, + { + "epoch": 1.28, + "learning_rate": 1.2781343215255958e-06, + "loss": 0.7197, + "step": 50094 + }, + { + "epoch": 1.28, + "learning_rate": 1.2781077427807319e-06, + "loss": 0.6704, + "step": 50095 + }, + { + "epoch": 1.28, + "learning_rate": 1.2780811638229332e-06, + "loss": 0.6201, + "step": 50096 + }, + { + "epoch": 1.28, + "learning_rate": 1.2780545846522212e-06, + "loss": 0.6602, + "step": 50097 + }, + { + "epoch": 1.28, + "learning_rate": 1.2780280052686152e-06, + "loss": 0.6426, + "step": 50098 + }, + { + "epoch": 1.28, + "learning_rate": 1.2780014256721364e-06, + "loss": 0.7034, + "step": 50099 + }, + { + "epoch": 1.28, + "learning_rate": 1.277974845862804e-06, + "loss": 0.6387, + "step": 50100 + }, + { + "epoch": 1.28, + "learning_rate": 1.2779482658406395e-06, + "loss": 0.6216, + "step": 50101 + }, + { + "epoch": 1.28, + "learning_rate": 1.2779216856056627e-06, + "loss": 0.7217, + "step": 50102 + }, + { + "epoch": 1.28, + "learning_rate": 1.277895105157894e-06, + "loss": 0.6807, + "step": 50103 + }, + { + "epoch": 1.28, + "learning_rate": 1.2778685244973539e-06, + "loss": 0.7227, + "step": 50104 + }, + { + "epoch": 1.28, + "learning_rate": 1.2778419436240626e-06, + "loss": 0.6191, + "step": 50105 + }, + { + "epoch": 1.28, + "learning_rate": 1.2778153625380403e-06, + "loss": 0.7598, + "step": 50106 + }, + { + "epoch": 1.28, + "learning_rate": 1.277788781239308e-06, + "loss": 0.7578, + "step": 50107 + }, + { + "epoch": 1.28, + "learning_rate": 1.2777621997278853e-06, + "loss": 0.5713, + "step": 50108 + }, + { + "epoch": 1.28, + "learning_rate": 1.277735618003793e-06, + "loss": 0.5518, + "step": 50109 + }, + { + "epoch": 1.28, + "learning_rate": 1.2777090360670511e-06, + "loss": 0.7539, + "step": 50110 + }, + { + "epoch": 1.28, + "learning_rate": 1.27768245391768e-06, + "loss": 0.8125, + "step": 50111 + }, + { + "epoch": 1.28, + "learning_rate": 1.2776558715557006e-06, + "loss": 0.6304, + "step": 50112 + }, + { + "epoch": 1.28, + "learning_rate": 1.2776292889811329e-06, + "loss": 0.7949, + "step": 50113 + }, + { + "epoch": 1.28, + "learning_rate": 1.277602706193997e-06, + "loss": 0.7241, + "step": 50114 + }, + { + "epoch": 1.28, + "learning_rate": 1.2775761231943133e-06, + "loss": 0.5693, + "step": 50115 + }, + { + "epoch": 1.28, + "learning_rate": 1.2775495399821026e-06, + "loss": 0.5967, + "step": 50116 + }, + { + "epoch": 1.28, + "learning_rate": 1.277522956557385e-06, + "loss": 0.7822, + "step": 50117 + }, + { + "epoch": 1.28, + "learning_rate": 1.2774963729201808e-06, + "loss": 0.5371, + "step": 50118 + }, + { + "epoch": 1.28, + "learning_rate": 1.2774697890705105e-06, + "loss": 0.7236, + "step": 50119 + }, + { + "epoch": 1.28, + "learning_rate": 1.277443205008394e-06, + "loss": 0.561, + "step": 50120 + }, + { + "epoch": 1.28, + "learning_rate": 1.2774166207338522e-06, + "loss": 0.6504, + "step": 50121 + }, + { + "epoch": 1.28, + "learning_rate": 1.2773900362469053e-06, + "loss": 0.6826, + "step": 50122 + }, + { + "epoch": 1.28, + "learning_rate": 1.2773634515475735e-06, + "loss": 0.5867, + "step": 50123 + }, + { + "epoch": 1.28, + "learning_rate": 1.2773368666358775e-06, + "loss": 0.6113, + "step": 50124 + }, + { + "epoch": 1.28, + "learning_rate": 1.277310281511837e-06, + "loss": 0.7539, + "step": 50125 + }, + { + "epoch": 1.28, + "learning_rate": 1.277283696175473e-06, + "loss": 0.6289, + "step": 50126 + }, + { + "epoch": 1.28, + "learning_rate": 1.2772571106268057e-06, + "loss": 0.5815, + "step": 50127 + }, + { + "epoch": 1.28, + "learning_rate": 1.2772305248658553e-06, + "loss": 0.6099, + "step": 50128 + }, + { + "epoch": 1.28, + "learning_rate": 1.2772039388926422e-06, + "loss": 0.5891, + "step": 50129 + }, + { + "epoch": 1.28, + "learning_rate": 1.2771773527071866e-06, + "loss": 0.7188, + "step": 50130 + }, + { + "epoch": 1.28, + "learning_rate": 1.2771507663095094e-06, + "loss": 0.6128, + "step": 50131 + }, + { + "epoch": 1.28, + "learning_rate": 1.2771241796996303e-06, + "loss": 0.6304, + "step": 50132 + }, + { + "epoch": 1.28, + "learning_rate": 1.2770975928775704e-06, + "loss": 0.6904, + "step": 50133 + }, + { + "epoch": 1.28, + "learning_rate": 1.2770710058433492e-06, + "loss": 0.7842, + "step": 50134 + }, + { + "epoch": 1.28, + "learning_rate": 1.2770444185969878e-06, + "loss": 0.7861, + "step": 50135 + }, + { + "epoch": 1.29, + "learning_rate": 1.2770178311385058e-06, + "loss": 0.7988, + "step": 50136 + }, + { + "epoch": 1.29, + "learning_rate": 1.2769912434679244e-06, + "loss": 0.8018, + "step": 50137 + }, + { + "epoch": 1.29, + "learning_rate": 1.2769646555852634e-06, + "loss": 0.7393, + "step": 50138 + }, + { + "epoch": 1.29, + "learning_rate": 1.2769380674905432e-06, + "loss": 0.5547, + "step": 50139 + }, + { + "epoch": 1.29, + "learning_rate": 1.2769114791837842e-06, + "loss": 0.7412, + "step": 50140 + }, + { + "epoch": 1.29, + "learning_rate": 1.2768848906650069e-06, + "loss": 0.6223, + "step": 50141 + }, + { + "epoch": 1.29, + "learning_rate": 1.2768583019342316e-06, + "loss": 0.5791, + "step": 50142 + }, + { + "epoch": 1.29, + "learning_rate": 1.2768317129914788e-06, + "loss": 0.6196, + "step": 50143 + }, + { + "epoch": 1.29, + "learning_rate": 1.2768051238367682e-06, + "loss": 0.7148, + "step": 50144 + }, + { + "epoch": 1.29, + "learning_rate": 1.2767785344701211e-06, + "loss": 0.627, + "step": 50145 + }, + { + "epoch": 1.29, + "learning_rate": 1.2767519448915572e-06, + "loss": 0.6008, + "step": 50146 + }, + { + "epoch": 1.29, + "learning_rate": 1.2767253551010972e-06, + "loss": 0.7031, + "step": 50147 + }, + { + "epoch": 1.29, + "learning_rate": 1.2766987650987614e-06, + "loss": 0.5928, + "step": 50148 + }, + { + "epoch": 1.29, + "learning_rate": 1.2766721748845697e-06, + "loss": 0.8047, + "step": 50149 + }, + { + "epoch": 1.29, + "learning_rate": 1.2766455844585431e-06, + "loss": 0.8359, + "step": 50150 + }, + { + "epoch": 1.29, + "learning_rate": 1.2766189938207016e-06, + "loss": 0.8164, + "step": 50151 + }, + { + "epoch": 1.29, + "learning_rate": 1.2765924029710658e-06, + "loss": 0.665, + "step": 50152 + }, + { + "epoch": 1.29, + "learning_rate": 1.2765658119096555e-06, + "loss": 0.707, + "step": 50153 + }, + { + "epoch": 1.29, + "learning_rate": 1.2765392206364923e-06, + "loss": 0.606, + "step": 50154 + }, + { + "epoch": 1.29, + "learning_rate": 1.276512629151595e-06, + "loss": 0.438, + "step": 50155 + }, + { + "epoch": 1.29, + "learning_rate": 1.2764860374549848e-06, + "loss": 0.7949, + "step": 50156 + }, + { + "epoch": 1.29, + "learning_rate": 1.2764594455466822e-06, + "loss": 0.6123, + "step": 50157 + }, + { + "epoch": 1.29, + "learning_rate": 1.2764328534267073e-06, + "loss": 0.7568, + "step": 50158 + }, + { + "epoch": 1.29, + "learning_rate": 1.2764062610950802e-06, + "loss": 0.6143, + "step": 50159 + }, + { + "epoch": 1.29, + "learning_rate": 1.2763796685518218e-06, + "loss": 0.6641, + "step": 50160 + }, + { + "epoch": 1.29, + "learning_rate": 1.276353075796952e-06, + "loss": 0.8994, + "step": 50161 + }, + { + "epoch": 1.29, + "learning_rate": 1.2763264828304915e-06, + "loss": 0.6277, + "step": 50162 + }, + { + "epoch": 1.29, + "learning_rate": 1.2762998896524605e-06, + "loss": 0.6616, + "step": 50163 + }, + { + "epoch": 1.29, + "learning_rate": 1.2762732962628795e-06, + "loss": 0.7451, + "step": 50164 + }, + { + "epoch": 1.29, + "learning_rate": 1.2762467026617682e-06, + "loss": 0.4626, + "step": 50165 + }, + { + "epoch": 1.29, + "learning_rate": 1.2762201088491483e-06, + "loss": 0.4655, + "step": 50166 + }, + { + "epoch": 1.29, + "learning_rate": 1.2761935148250388e-06, + "loss": 0.7285, + "step": 50167 + }, + { + "epoch": 1.29, + "learning_rate": 1.276166920589461e-06, + "loss": 0.4392, + "step": 50168 + }, + { + "epoch": 1.29, + "learning_rate": 1.2761403261424344e-06, + "loss": 0.7871, + "step": 50169 + }, + { + "epoch": 1.29, + "learning_rate": 1.2761137314839803e-06, + "loss": 0.6079, + "step": 50170 + }, + { + "epoch": 1.29, + "learning_rate": 1.2760871366141182e-06, + "loss": 0.8057, + "step": 50171 + }, + { + "epoch": 1.29, + "learning_rate": 1.2760605415328691e-06, + "loss": 0.5923, + "step": 50172 + }, + { + "epoch": 1.29, + "learning_rate": 1.276033946240253e-06, + "loss": 0.8232, + "step": 50173 + }, + { + "epoch": 1.29, + "learning_rate": 1.2760073507362907e-06, + "loss": 0.7383, + "step": 50174 + }, + { + "epoch": 1.29, + "learning_rate": 1.2759807550210023e-06, + "loss": 0.7285, + "step": 50175 + }, + { + "epoch": 1.29, + "learning_rate": 1.2759541590944075e-06, + "loss": 0.7734, + "step": 50176 + }, + { + "epoch": 1.29, + "learning_rate": 1.2759275629565282e-06, + "loss": 0.7158, + "step": 50177 + }, + { + "epoch": 1.29, + "learning_rate": 1.2759009666073832e-06, + "loss": 0.5654, + "step": 50178 + }, + { + "epoch": 1.29, + "learning_rate": 1.2758743700469937e-06, + "loss": 0.5413, + "step": 50179 + }, + { + "epoch": 1.29, + "learning_rate": 1.2758477732753798e-06, + "loss": 0.6724, + "step": 50180 + }, + { + "epoch": 1.29, + "learning_rate": 1.275821176292562e-06, + "loss": 0.6484, + "step": 50181 + }, + { + "epoch": 1.29, + "learning_rate": 1.2757945790985606e-06, + "loss": 0.8008, + "step": 50182 + }, + { + "epoch": 1.29, + "learning_rate": 1.2757679816933961e-06, + "loss": 0.6543, + "step": 50183 + }, + { + "epoch": 1.29, + "learning_rate": 1.2757413840770886e-06, + "loss": 0.75, + "step": 50184 + }, + { + "epoch": 1.29, + "learning_rate": 1.2757147862496587e-06, + "loss": 0.6025, + "step": 50185 + }, + { + "epoch": 1.29, + "learning_rate": 1.2756881882111264e-06, + "loss": 0.7979, + "step": 50186 + }, + { + "epoch": 1.29, + "learning_rate": 1.2756615899615129e-06, + "loss": 0.8086, + "step": 50187 + }, + { + "epoch": 1.29, + "learning_rate": 1.2756349915008376e-06, + "loss": 0.7832, + "step": 50188 + }, + { + "epoch": 1.29, + "learning_rate": 1.2756083928291212e-06, + "loss": 0.6226, + "step": 50189 + }, + { + "epoch": 1.29, + "learning_rate": 1.275581793946384e-06, + "loss": 0.5832, + "step": 50190 + }, + { + "epoch": 1.29, + "learning_rate": 1.2755551948526469e-06, + "loss": 0.5776, + "step": 50191 + }, + { + "epoch": 1.29, + "learning_rate": 1.2755285955479295e-06, + "loss": 0.6484, + "step": 50192 + }, + { + "epoch": 1.29, + "learning_rate": 1.2755019960322528e-06, + "loss": 0.644, + "step": 50193 + }, + { + "epoch": 1.29, + "learning_rate": 1.2754753963056368e-06, + "loss": 0.7744, + "step": 50194 + }, + { + "epoch": 1.29, + "learning_rate": 1.275448796368102e-06, + "loss": 0.6396, + "step": 50195 + }, + { + "epoch": 1.29, + "learning_rate": 1.2754221962196684e-06, + "loss": 0.6523, + "step": 50196 + }, + { + "epoch": 1.29, + "learning_rate": 1.275395595860357e-06, + "loss": 0.668, + "step": 50197 + }, + { + "epoch": 1.29, + "learning_rate": 1.2753689952901877e-06, + "loss": 0.6143, + "step": 50198 + }, + { + "epoch": 1.29, + "learning_rate": 1.2753423945091813e-06, + "loss": 0.7588, + "step": 50199 + }, + { + "epoch": 1.29, + "learning_rate": 1.2753157935173577e-06, + "loss": 0.5815, + "step": 50200 + }, + { + "epoch": 1.29, + "learning_rate": 1.2752891923147374e-06, + "loss": 0.6211, + "step": 50201 + }, + { + "epoch": 1.29, + "learning_rate": 1.275262590901341e-06, + "loss": 0.7393, + "step": 50202 + }, + { + "epoch": 1.29, + "learning_rate": 1.2752359892771884e-06, + "loss": 0.6074, + "step": 50203 + }, + { + "epoch": 1.29, + "learning_rate": 1.2752093874423006e-06, + "loss": 0.793, + "step": 50204 + }, + { + "epoch": 1.29, + "learning_rate": 1.2751827853966975e-06, + "loss": 0.5811, + "step": 50205 + }, + { + "epoch": 1.29, + "learning_rate": 1.2751561831403994e-06, + "loss": 0.7285, + "step": 50206 + }, + { + "epoch": 1.29, + "learning_rate": 1.2751295806734272e-06, + "loss": 0.6748, + "step": 50207 + }, + { + "epoch": 1.29, + "learning_rate": 1.2751029779958007e-06, + "loss": 0.5376, + "step": 50208 + }, + { + "epoch": 1.29, + "learning_rate": 1.2750763751075404e-06, + "loss": 0.6631, + "step": 50209 + }, + { + "epoch": 1.29, + "learning_rate": 1.275049772008667e-06, + "loss": 0.7559, + "step": 50210 + }, + { + "epoch": 1.29, + "learning_rate": 1.2750231686992003e-06, + "loss": 0.7109, + "step": 50211 + }, + { + "epoch": 1.29, + "learning_rate": 1.2749965651791617e-06, + "loss": 0.6816, + "step": 50212 + }, + { + "epoch": 1.29, + "learning_rate": 1.2749699614485703e-06, + "loss": 0.4856, + "step": 50213 + }, + { + "epoch": 1.29, + "learning_rate": 1.2749433575074474e-06, + "loss": 0.5747, + "step": 50214 + }, + { + "epoch": 1.29, + "learning_rate": 1.2749167533558125e-06, + "loss": 0.5449, + "step": 50215 + }, + { + "epoch": 1.29, + "learning_rate": 1.2748901489936867e-06, + "loss": 0.6548, + "step": 50216 + }, + { + "epoch": 1.29, + "learning_rate": 1.2748635444210905e-06, + "loss": 0.7617, + "step": 50217 + }, + { + "epoch": 1.29, + "learning_rate": 1.2748369396380434e-06, + "loss": 0.6963, + "step": 50218 + }, + { + "epoch": 1.29, + "learning_rate": 1.2748103346445667e-06, + "loss": 0.7412, + "step": 50219 + }, + { + "epoch": 1.29, + "learning_rate": 1.2747837294406801e-06, + "loss": 0.6528, + "step": 50220 + }, + { + "epoch": 1.29, + "learning_rate": 1.2747571240264043e-06, + "loss": 0.603, + "step": 50221 + }, + { + "epoch": 1.29, + "learning_rate": 1.2747305184017598e-06, + "loss": 0.6704, + "step": 50222 + }, + { + "epoch": 1.29, + "learning_rate": 1.2747039125667667e-06, + "loss": 0.5771, + "step": 50223 + }, + { + "epoch": 1.29, + "learning_rate": 1.274677306521445e-06, + "loss": 0.7627, + "step": 50224 + }, + { + "epoch": 1.29, + "learning_rate": 1.2746507002658162e-06, + "loss": 0.7588, + "step": 50225 + }, + { + "epoch": 1.29, + "learning_rate": 1.2746240937998995e-06, + "loss": 0.647, + "step": 50226 + }, + { + "epoch": 1.29, + "learning_rate": 1.274597487123716e-06, + "loss": 0.6602, + "step": 50227 + }, + { + "epoch": 1.29, + "learning_rate": 1.2745708802372858e-06, + "loss": 0.5898, + "step": 50228 + }, + { + "epoch": 1.29, + "learning_rate": 1.2745442731406293e-06, + "loss": 0.6807, + "step": 50229 + }, + { + "epoch": 1.29, + "learning_rate": 1.2745176658337666e-06, + "loss": 0.8564, + "step": 50230 + }, + { + "epoch": 1.29, + "learning_rate": 1.2744910583167187e-06, + "loss": 0.6777, + "step": 50231 + }, + { + "epoch": 1.29, + "learning_rate": 1.2744644505895057e-06, + "loss": 0.8066, + "step": 50232 + }, + { + "epoch": 1.29, + "learning_rate": 1.2744378426521477e-06, + "loss": 0.425, + "step": 50233 + }, + { + "epoch": 1.29, + "learning_rate": 1.2744112345046651e-06, + "loss": 0.749, + "step": 50234 + }, + { + "epoch": 1.29, + "learning_rate": 1.2743846261470785e-06, + "loss": 0.467, + "step": 50235 + }, + { + "epoch": 1.29, + "learning_rate": 1.2743580175794081e-06, + "loss": 0.6533, + "step": 50236 + }, + { + "epoch": 1.29, + "learning_rate": 1.2743314088016748e-06, + "loss": 0.5273, + "step": 50237 + }, + { + "epoch": 1.29, + "learning_rate": 1.2743047998138985e-06, + "loss": 0.2727, + "step": 50238 + }, + { + "epoch": 1.29, + "learning_rate": 1.274278190616099e-06, + "loss": 0.5203, + "step": 50239 + }, + { + "epoch": 1.29, + "learning_rate": 1.2742515812082981e-06, + "loss": 0.7844, + "step": 50240 + }, + { + "epoch": 1.29, + "learning_rate": 1.274224971590515e-06, + "loss": 0.7002, + "step": 50241 + }, + { + "epoch": 1.29, + "learning_rate": 1.2741983617627704e-06, + "loss": 0.8262, + "step": 50242 + }, + { + "epoch": 1.29, + "learning_rate": 1.2741717517250847e-06, + "loss": 0.6978, + "step": 50243 + }, + { + "epoch": 1.29, + "learning_rate": 1.2741451414774786e-06, + "loss": 0.5404, + "step": 50244 + }, + { + "epoch": 1.29, + "learning_rate": 1.2741185310199718e-06, + "loss": 0.6904, + "step": 50245 + }, + { + "epoch": 1.29, + "learning_rate": 1.2740919203525852e-06, + "loss": 0.689, + "step": 50246 + }, + { + "epoch": 1.29, + "learning_rate": 1.2740653094753393e-06, + "loss": 0.7598, + "step": 50247 + }, + { + "epoch": 1.29, + "learning_rate": 1.2740386983882538e-06, + "loss": 0.8125, + "step": 50248 + }, + { + "epoch": 1.29, + "learning_rate": 1.2740120870913497e-06, + "loss": 0.708, + "step": 50249 + }, + { + "epoch": 1.29, + "learning_rate": 1.273985475584647e-06, + "loss": 0.6338, + "step": 50250 + }, + { + "epoch": 1.29, + "learning_rate": 1.2739588638681662e-06, + "loss": 0.5239, + "step": 50251 + }, + { + "epoch": 1.29, + "learning_rate": 1.273932251941928e-06, + "loss": 0.5146, + "step": 50252 + }, + { + "epoch": 1.29, + "learning_rate": 1.273905639805952e-06, + "loss": 0.4871, + "step": 50253 + }, + { + "epoch": 1.29, + "learning_rate": 1.2738790274602593e-06, + "loss": 0.748, + "step": 50254 + }, + { + "epoch": 1.29, + "learning_rate": 1.27385241490487e-06, + "loss": 0.5288, + "step": 50255 + }, + { + "epoch": 1.29, + "learning_rate": 1.2738258021398045e-06, + "loss": 0.5288, + "step": 50256 + }, + { + "epoch": 1.29, + "learning_rate": 1.2737991891650832e-06, + "loss": 0.6641, + "step": 50257 + }, + { + "epoch": 1.29, + "learning_rate": 1.2737725759807264e-06, + "loss": 0.644, + "step": 50258 + }, + { + "epoch": 1.29, + "learning_rate": 1.2737459625867546e-06, + "loss": 0.7871, + "step": 50259 + }, + { + "epoch": 1.29, + "learning_rate": 1.273719348983188e-06, + "loss": 0.709, + "step": 50260 + }, + { + "epoch": 1.29, + "learning_rate": 1.2736927351700471e-06, + "loss": 0.5037, + "step": 50261 + }, + { + "epoch": 1.29, + "learning_rate": 1.2736661211473522e-06, + "loss": 0.6592, + "step": 50262 + }, + { + "epoch": 1.29, + "learning_rate": 1.273639506915124e-06, + "loss": 0.4792, + "step": 50263 + }, + { + "epoch": 1.29, + "learning_rate": 1.2736128924733823e-06, + "loss": 0.6113, + "step": 50264 + }, + { + "epoch": 1.29, + "learning_rate": 1.273586277822148e-06, + "loss": 0.5505, + "step": 50265 + }, + { + "epoch": 1.29, + "learning_rate": 1.2735596629614408e-06, + "loss": 0.6406, + "step": 50266 + }, + { + "epoch": 1.29, + "learning_rate": 1.2735330478912825e-06, + "loss": 0.9561, + "step": 50267 + }, + { + "epoch": 1.29, + "learning_rate": 1.2735064326116918e-06, + "loss": 0.6631, + "step": 50268 + }, + { + "epoch": 1.29, + "learning_rate": 1.2734798171226899e-06, + "loss": 0.6074, + "step": 50269 + }, + { + "epoch": 1.29, + "learning_rate": 1.2734532014242971e-06, + "loss": 0.9258, + "step": 50270 + }, + { + "epoch": 1.29, + "learning_rate": 1.2734265855165338e-06, + "loss": 0.521, + "step": 50271 + }, + { + "epoch": 1.29, + "learning_rate": 1.2733999693994205e-06, + "loss": 0.5356, + "step": 50272 + }, + { + "epoch": 1.29, + "learning_rate": 1.2733733530729774e-06, + "loss": 0.5977, + "step": 50273 + }, + { + "epoch": 1.29, + "learning_rate": 1.2733467365372246e-06, + "loss": 0.541, + "step": 50274 + }, + { + "epoch": 1.29, + "learning_rate": 1.2733201197921829e-06, + "loss": 0.6543, + "step": 50275 + }, + { + "epoch": 1.29, + "learning_rate": 1.2732935028378724e-06, + "loss": 0.7158, + "step": 50276 + }, + { + "epoch": 1.29, + "learning_rate": 1.273266885674314e-06, + "loss": 0.501, + "step": 50277 + }, + { + "epoch": 1.29, + "learning_rate": 1.2732402683015273e-06, + "loss": 0.5537, + "step": 50278 + }, + { + "epoch": 1.29, + "learning_rate": 1.2732136507195334e-06, + "loss": 0.7241, + "step": 50279 + }, + { + "epoch": 1.29, + "learning_rate": 1.273187032928352e-06, + "loss": 0.7402, + "step": 50280 + }, + { + "epoch": 1.29, + "learning_rate": 1.2731604149280043e-06, + "loss": 0.5576, + "step": 50281 + }, + { + "epoch": 1.29, + "learning_rate": 1.2731337967185102e-06, + "loss": 0.7261, + "step": 50282 + }, + { + "epoch": 1.29, + "learning_rate": 1.2731071782998898e-06, + "loss": 0.6523, + "step": 50283 + }, + { + "epoch": 1.29, + "learning_rate": 1.2730805596721639e-06, + "loss": 0.6685, + "step": 50284 + }, + { + "epoch": 1.29, + "learning_rate": 1.2730539408353531e-06, + "loss": 0.4866, + "step": 50285 + }, + { + "epoch": 1.29, + "learning_rate": 1.2730273217894769e-06, + "loss": 0.6211, + "step": 50286 + }, + { + "epoch": 1.29, + "learning_rate": 1.2730007025345567e-06, + "loss": 0.6094, + "step": 50287 + }, + { + "epoch": 1.29, + "learning_rate": 1.272974083070612e-06, + "loss": 0.4849, + "step": 50288 + }, + { + "epoch": 1.29, + "learning_rate": 1.2729474633976638e-06, + "loss": 0.5723, + "step": 50289 + }, + { + "epoch": 1.29, + "learning_rate": 1.2729208435157323e-06, + "loss": 0.5791, + "step": 50290 + }, + { + "epoch": 1.29, + "learning_rate": 1.2728942234248379e-06, + "loss": 0.6064, + "step": 50291 + }, + { + "epoch": 1.29, + "learning_rate": 1.2728676031250011e-06, + "loss": 0.7139, + "step": 50292 + }, + { + "epoch": 1.29, + "learning_rate": 1.2728409826162418e-06, + "loss": 0.6675, + "step": 50293 + }, + { + "epoch": 1.29, + "learning_rate": 1.2728143618985808e-06, + "loss": 0.5735, + "step": 50294 + }, + { + "epoch": 1.29, + "learning_rate": 1.2727877409720384e-06, + "loss": 0.5576, + "step": 50295 + }, + { + "epoch": 1.29, + "learning_rate": 1.272761119836635e-06, + "loss": 0.7393, + "step": 50296 + }, + { + "epoch": 1.29, + "learning_rate": 1.2727344984923912e-06, + "loss": 0.729, + "step": 50297 + }, + { + "epoch": 1.29, + "learning_rate": 1.2727078769393266e-06, + "loss": 0.5591, + "step": 50298 + }, + { + "epoch": 1.29, + "learning_rate": 1.2726812551774625e-06, + "loss": 0.7017, + "step": 50299 + }, + { + "epoch": 1.29, + "learning_rate": 1.2726546332068187e-06, + "loss": 0.549, + "step": 50300 + }, + { + "epoch": 1.29, + "learning_rate": 1.2726280110274159e-06, + "loss": 0.6377, + "step": 50301 + }, + { + "epoch": 1.29, + "learning_rate": 1.2726013886392747e-06, + "loss": 0.5862, + "step": 50302 + }, + { + "epoch": 1.29, + "learning_rate": 1.2725747660424144e-06, + "loss": 0.7246, + "step": 50303 + }, + { + "epoch": 1.29, + "learning_rate": 1.2725481432368566e-06, + "loss": 0.6294, + "step": 50304 + }, + { + "epoch": 1.29, + "learning_rate": 1.2725215202226212e-06, + "loss": 0.5479, + "step": 50305 + }, + { + "epoch": 1.29, + "learning_rate": 1.2724948969997284e-06, + "loss": 0.7051, + "step": 50306 + }, + { + "epoch": 1.29, + "learning_rate": 1.2724682735681991e-06, + "loss": 0.6567, + "step": 50307 + }, + { + "epoch": 1.29, + "learning_rate": 1.272441649928053e-06, + "loss": 0.6758, + "step": 50308 + }, + { + "epoch": 1.29, + "learning_rate": 1.2724150260793113e-06, + "loss": 0.6484, + "step": 50309 + }, + { + "epoch": 1.29, + "learning_rate": 1.2723884020219936e-06, + "loss": 0.75, + "step": 50310 + }, + { + "epoch": 1.29, + "learning_rate": 1.2723617777561207e-06, + "loss": 0.6011, + "step": 50311 + }, + { + "epoch": 1.29, + "learning_rate": 1.272335153281713e-06, + "loss": 0.7168, + "step": 50312 + }, + { + "epoch": 1.29, + "learning_rate": 1.2723085285987908e-06, + "loss": 0.6963, + "step": 50313 + }, + { + "epoch": 1.29, + "learning_rate": 1.2722819037073741e-06, + "loss": 0.8184, + "step": 50314 + }, + { + "epoch": 1.29, + "learning_rate": 1.272255278607484e-06, + "loss": 0.6748, + "step": 50315 + }, + { + "epoch": 1.29, + "learning_rate": 1.2722286532991406e-06, + "loss": 0.488, + "step": 50316 + }, + { + "epoch": 1.29, + "learning_rate": 1.2722020277823644e-06, + "loss": 0.5146, + "step": 50317 + }, + { + "epoch": 1.29, + "learning_rate": 1.2721754020571754e-06, + "loss": 0.8145, + "step": 50318 + }, + { + "epoch": 1.29, + "learning_rate": 1.2721487761235944e-06, + "loss": 0.71, + "step": 50319 + }, + { + "epoch": 1.29, + "learning_rate": 1.272122149981641e-06, + "loss": 0.7407, + "step": 50320 + }, + { + "epoch": 1.29, + "learning_rate": 1.2720955236313367e-06, + "loss": 0.7139, + "step": 50321 + }, + { + "epoch": 1.29, + "learning_rate": 1.2720688970727015e-06, + "loss": 0.6748, + "step": 50322 + }, + { + "epoch": 1.29, + "learning_rate": 1.2720422703057553e-06, + "loss": 0.5571, + "step": 50323 + }, + { + "epoch": 1.29, + "learning_rate": 1.2720156433305188e-06, + "loss": 0.6006, + "step": 50324 + }, + { + "epoch": 1.29, + "learning_rate": 1.2719890161470125e-06, + "loss": 0.6592, + "step": 50325 + }, + { + "epoch": 1.29, + "learning_rate": 1.2719623887552567e-06, + "loss": 0.6091, + "step": 50326 + }, + { + "epoch": 1.29, + "learning_rate": 1.2719357611552722e-06, + "loss": 0.6099, + "step": 50327 + }, + { + "epoch": 1.29, + "learning_rate": 1.2719091333470786e-06, + "loss": 0.6963, + "step": 50328 + }, + { + "epoch": 1.29, + "learning_rate": 1.2718825053306965e-06, + "loss": 0.6172, + "step": 50329 + }, + { + "epoch": 1.29, + "learning_rate": 1.271855877106147e-06, + "loss": 0.6162, + "step": 50330 + }, + { + "epoch": 1.29, + "learning_rate": 1.2718292486734497e-06, + "loss": 0.4771, + "step": 50331 + }, + { + "epoch": 1.29, + "learning_rate": 1.2718026200326252e-06, + "loss": 0.6484, + "step": 50332 + }, + { + "epoch": 1.29, + "learning_rate": 1.271775991183694e-06, + "loss": 0.5708, + "step": 50333 + }, + { + "epoch": 1.29, + "learning_rate": 1.2717493621266765e-06, + "loss": 0.5317, + "step": 50334 + }, + { + "epoch": 1.29, + "learning_rate": 1.2717227328615927e-06, + "loss": 0.7061, + "step": 50335 + }, + { + "epoch": 1.29, + "learning_rate": 1.2716961033884635e-06, + "loss": 0.7227, + "step": 50336 + }, + { + "epoch": 1.29, + "learning_rate": 1.271669473707309e-06, + "loss": 0.7012, + "step": 50337 + }, + { + "epoch": 1.29, + "learning_rate": 1.2716428438181499e-06, + "loss": 0.5513, + "step": 50338 + }, + { + "epoch": 1.29, + "learning_rate": 1.271616213721006e-06, + "loss": 0.4846, + "step": 50339 + }, + { + "epoch": 1.29, + "learning_rate": 1.2715895834158985e-06, + "loss": 0.6299, + "step": 50340 + }, + { + "epoch": 1.29, + "learning_rate": 1.271562952902847e-06, + "loss": 0.668, + "step": 50341 + }, + { + "epoch": 1.29, + "learning_rate": 1.2715363221818727e-06, + "loss": 0.6558, + "step": 50342 + }, + { + "epoch": 1.29, + "learning_rate": 1.2715096912529951e-06, + "loss": 0.6304, + "step": 50343 + }, + { + "epoch": 1.29, + "learning_rate": 1.271483060116235e-06, + "loss": 0.5044, + "step": 50344 + }, + { + "epoch": 1.29, + "learning_rate": 1.2714564287716126e-06, + "loss": 0.7422, + "step": 50345 + }, + { + "epoch": 1.29, + "learning_rate": 1.271429797219149e-06, + "loss": 0.6357, + "step": 50346 + }, + { + "epoch": 1.29, + "learning_rate": 1.271403165458864e-06, + "loss": 0.6602, + "step": 50347 + }, + { + "epoch": 1.29, + "learning_rate": 1.271376533490778e-06, + "loss": 0.6309, + "step": 50348 + }, + { + "epoch": 1.29, + "learning_rate": 1.2713499013149115e-06, + "loss": 0.8652, + "step": 50349 + }, + { + "epoch": 1.29, + "learning_rate": 1.2713232689312845e-06, + "loss": 0.8281, + "step": 50350 + }, + { + "epoch": 1.29, + "learning_rate": 1.271296636339918e-06, + "loss": 0.4961, + "step": 50351 + }, + { + "epoch": 1.29, + "learning_rate": 1.2712700035408322e-06, + "loss": 0.6875, + "step": 50352 + }, + { + "epoch": 1.29, + "learning_rate": 1.2712433705340475e-06, + "loss": 0.6836, + "step": 50353 + }, + { + "epoch": 1.29, + "learning_rate": 1.2712167373195839e-06, + "loss": 0.6953, + "step": 50354 + }, + { + "epoch": 1.29, + "learning_rate": 1.2711901038974623e-06, + "loss": 0.7227, + "step": 50355 + }, + { + "epoch": 1.29, + "learning_rate": 1.271163470267703e-06, + "loss": 0.4905, + "step": 50356 + }, + { + "epoch": 1.29, + "learning_rate": 1.2711368364303266e-06, + "loss": 0.7676, + "step": 50357 + }, + { + "epoch": 1.29, + "learning_rate": 1.2711102023853525e-06, + "loss": 0.7134, + "step": 50358 + }, + { + "epoch": 1.29, + "learning_rate": 1.2710835681328022e-06, + "loss": 0.5762, + "step": 50359 + }, + { + "epoch": 1.29, + "learning_rate": 1.2710569336726955e-06, + "loss": 0.6899, + "step": 50360 + }, + { + "epoch": 1.29, + "learning_rate": 1.2710302990050533e-06, + "loss": 0.4231, + "step": 50361 + }, + { + "epoch": 1.29, + "learning_rate": 1.2710036641298954e-06, + "loss": 0.6895, + "step": 50362 + }, + { + "epoch": 1.29, + "learning_rate": 1.2709770290472426e-06, + "loss": 0.7725, + "step": 50363 + }, + { + "epoch": 1.29, + "learning_rate": 1.2709503937571146e-06, + "loss": 0.7656, + "step": 50364 + }, + { + "epoch": 1.29, + "learning_rate": 1.270923758259533e-06, + "loss": 0.5115, + "step": 50365 + }, + { + "epoch": 1.29, + "learning_rate": 1.270897122554517e-06, + "loss": 0.6685, + "step": 50366 + }, + { + "epoch": 1.29, + "learning_rate": 1.2708704866420883e-06, + "loss": 0.6689, + "step": 50367 + }, + { + "epoch": 1.29, + "learning_rate": 1.270843850522266e-06, + "loss": 0.4001, + "step": 50368 + }, + { + "epoch": 1.29, + "learning_rate": 1.270817214195071e-06, + "loss": 0.6978, + "step": 50369 + }, + { + "epoch": 1.29, + "learning_rate": 1.2707905776605237e-06, + "loss": 0.7207, + "step": 50370 + }, + { + "epoch": 1.29, + "learning_rate": 1.2707639409186445e-06, + "loss": 0.553, + "step": 50371 + }, + { + "epoch": 1.29, + "learning_rate": 1.270737303969454e-06, + "loss": 0.5249, + "step": 50372 + }, + { + "epoch": 1.29, + "learning_rate": 1.2707106668129722e-06, + "loss": 0.5806, + "step": 50373 + }, + { + "epoch": 1.29, + "learning_rate": 1.2706840294492198e-06, + "loss": 0.623, + "step": 50374 + }, + { + "epoch": 1.29, + "learning_rate": 1.2706573918782174e-06, + "loss": 0.6138, + "step": 50375 + }, + { + "epoch": 1.29, + "learning_rate": 1.2706307540999845e-06, + "loss": 0.7109, + "step": 50376 + }, + { + "epoch": 1.29, + "learning_rate": 1.2706041161145422e-06, + "loss": 0.8008, + "step": 50377 + }, + { + "epoch": 1.29, + "learning_rate": 1.2705774779219112e-06, + "loss": 0.5798, + "step": 50378 + }, + { + "epoch": 1.29, + "learning_rate": 1.270550839522111e-06, + "loss": 0.7646, + "step": 50379 + }, + { + "epoch": 1.29, + "learning_rate": 1.2705242009151626e-06, + "loss": 0.6523, + "step": 50380 + }, + { + "epoch": 1.29, + "learning_rate": 1.2704975621010862e-06, + "loss": 0.6475, + "step": 50381 + }, + { + "epoch": 1.29, + "learning_rate": 1.2704709230799023e-06, + "loss": 0.7061, + "step": 50382 + }, + { + "epoch": 1.29, + "learning_rate": 1.2704442838516314e-06, + "loss": 0.7705, + "step": 50383 + }, + { + "epoch": 1.29, + "learning_rate": 1.2704176444162938e-06, + "loss": 0.7368, + "step": 50384 + }, + { + "epoch": 1.29, + "learning_rate": 1.2703910047739094e-06, + "loss": 0.7715, + "step": 50385 + }, + { + "epoch": 1.29, + "learning_rate": 1.2703643649244995e-06, + "loss": 0.5881, + "step": 50386 + }, + { + "epoch": 1.29, + "learning_rate": 1.2703377248680838e-06, + "loss": 0.6338, + "step": 50387 + }, + { + "epoch": 1.29, + "learning_rate": 1.2703110846046832e-06, + "loss": 0.5913, + "step": 50388 + }, + { + "epoch": 1.29, + "learning_rate": 1.2702844441343172e-06, + "loss": 0.6562, + "step": 50389 + }, + { + "epoch": 1.29, + "learning_rate": 1.2702578034570076e-06, + "loss": 0.6123, + "step": 50390 + }, + { + "epoch": 1.29, + "learning_rate": 1.2702311625727735e-06, + "loss": 0.5123, + "step": 50391 + }, + { + "epoch": 1.29, + "learning_rate": 1.270204521481636e-06, + "loss": 0.5513, + "step": 50392 + }, + { + "epoch": 1.29, + "learning_rate": 1.2701778801836153e-06, + "loss": 0.5552, + "step": 50393 + }, + { + "epoch": 1.29, + "learning_rate": 1.2701512386787318e-06, + "loss": 0.4775, + "step": 50394 + }, + { + "epoch": 1.29, + "learning_rate": 1.270124596967006e-06, + "loss": 0.5536, + "step": 50395 + }, + { + "epoch": 1.29, + "learning_rate": 1.2700979550484583e-06, + "loss": 0.6445, + "step": 50396 + }, + { + "epoch": 1.29, + "learning_rate": 1.2700713129231088e-06, + "loss": 0.7598, + "step": 50397 + }, + { + "epoch": 1.29, + "learning_rate": 1.2700446705909782e-06, + "loss": 0.6099, + "step": 50398 + }, + { + "epoch": 1.29, + "learning_rate": 1.2700180280520867e-06, + "loss": 0.7256, + "step": 50399 + }, + { + "epoch": 1.29, + "learning_rate": 1.2699913853064547e-06, + "loss": 0.6919, + "step": 50400 + }, + { + "epoch": 1.29, + "learning_rate": 1.2699647423541033e-06, + "loss": 0.7024, + "step": 50401 + }, + { + "epoch": 1.29, + "learning_rate": 1.269938099195052e-06, + "loss": 0.6904, + "step": 50402 + }, + { + "epoch": 1.29, + "learning_rate": 1.2699114558293213e-06, + "loss": 0.6714, + "step": 50403 + }, + { + "epoch": 1.29, + "learning_rate": 1.269884812256932e-06, + "loss": 0.7119, + "step": 50404 + }, + { + "epoch": 1.29, + "learning_rate": 1.2698581684779044e-06, + "loss": 0.6611, + "step": 50405 + }, + { + "epoch": 1.29, + "learning_rate": 1.2698315244922586e-06, + "loss": 0.6216, + "step": 50406 + }, + { + "epoch": 1.29, + "learning_rate": 1.2698048803000155e-06, + "loss": 0.7988, + "step": 50407 + }, + { + "epoch": 1.29, + "learning_rate": 1.2697782359011948e-06, + "loss": 0.6475, + "step": 50408 + }, + { + "epoch": 1.29, + "learning_rate": 1.2697515912958177e-06, + "loss": 0.5466, + "step": 50409 + }, + { + "epoch": 1.29, + "learning_rate": 1.2697249464839037e-06, + "loss": 0.6455, + "step": 50410 + }, + { + "epoch": 1.29, + "learning_rate": 1.2696983014654742e-06, + "loss": 0.6797, + "step": 50411 + }, + { + "epoch": 1.29, + "learning_rate": 1.2696716562405489e-06, + "loss": 0.7764, + "step": 50412 + }, + { + "epoch": 1.29, + "learning_rate": 1.2696450108091484e-06, + "loss": 0.6494, + "step": 50413 + }, + { + "epoch": 1.29, + "learning_rate": 1.2696183651712933e-06, + "loss": 0.5178, + "step": 50414 + }, + { + "epoch": 1.29, + "learning_rate": 1.2695917193270039e-06, + "loss": 0.6738, + "step": 50415 + }, + { + "epoch": 1.29, + "learning_rate": 1.2695650732763002e-06, + "loss": 0.6074, + "step": 50416 + }, + { + "epoch": 1.29, + "learning_rate": 1.269538427019203e-06, + "loss": 0.6519, + "step": 50417 + }, + { + "epoch": 1.29, + "learning_rate": 1.2695117805557324e-06, + "loss": 0.7354, + "step": 50418 + }, + { + "epoch": 1.29, + "learning_rate": 1.2694851338859095e-06, + "loss": 0.4683, + "step": 50419 + }, + { + "epoch": 1.29, + "learning_rate": 1.269458487009754e-06, + "loss": 0.708, + "step": 50420 + }, + { + "epoch": 1.29, + "learning_rate": 1.2694318399272866e-06, + "loss": 0.7686, + "step": 50421 + }, + { + "epoch": 1.29, + "learning_rate": 1.2694051926385274e-06, + "loss": 0.7266, + "step": 50422 + }, + { + "epoch": 1.29, + "learning_rate": 1.269378545143497e-06, + "loss": 0.7666, + "step": 50423 + }, + { + "epoch": 1.29, + "learning_rate": 1.2693518974422162e-06, + "loss": 0.6621, + "step": 50424 + }, + { + "epoch": 1.29, + "learning_rate": 1.2693252495347047e-06, + "loss": 0.4697, + "step": 50425 + }, + { + "epoch": 1.29, + "learning_rate": 1.2692986014209836e-06, + "loss": 0.8301, + "step": 50426 + }, + { + "epoch": 1.29, + "learning_rate": 1.2692719531010727e-06, + "loss": 0.5586, + "step": 50427 + }, + { + "epoch": 1.29, + "learning_rate": 1.2692453045749927e-06, + "loss": 0.6865, + "step": 50428 + }, + { + "epoch": 1.29, + "learning_rate": 1.2692186558427638e-06, + "loss": 0.813, + "step": 50429 + }, + { + "epoch": 1.29, + "learning_rate": 1.2691920069044066e-06, + "loss": 0.7617, + "step": 50430 + }, + { + "epoch": 1.29, + "learning_rate": 1.2691653577599417e-06, + "loss": 0.7217, + "step": 50431 + }, + { + "epoch": 1.29, + "learning_rate": 1.269138708409389e-06, + "loss": 0.583, + "step": 50432 + }, + { + "epoch": 1.29, + "learning_rate": 1.2691120588527692e-06, + "loss": 0.5945, + "step": 50433 + }, + { + "epoch": 1.29, + "learning_rate": 1.269085409090103e-06, + "loss": 0.5693, + "step": 50434 + }, + { + "epoch": 1.29, + "learning_rate": 1.26905875912141e-06, + "loss": 0.5391, + "step": 50435 + }, + { + "epoch": 1.29, + "learning_rate": 1.2690321089467114e-06, + "loss": 0.7441, + "step": 50436 + }, + { + "epoch": 1.29, + "learning_rate": 1.2690054585660272e-06, + "loss": 0.6572, + "step": 50437 + }, + { + "epoch": 1.29, + "learning_rate": 1.268978807979378e-06, + "loss": 0.4841, + "step": 50438 + }, + { + "epoch": 1.29, + "learning_rate": 1.268952157186784e-06, + "loss": 0.7178, + "step": 50439 + }, + { + "epoch": 1.29, + "learning_rate": 1.2689255061882656e-06, + "loss": 0.611, + "step": 50440 + }, + { + "epoch": 1.29, + "learning_rate": 1.2688988549838433e-06, + "loss": 0.6768, + "step": 50441 + }, + { + "epoch": 1.29, + "learning_rate": 1.2688722035735376e-06, + "loss": 0.563, + "step": 50442 + }, + { + "epoch": 1.29, + "learning_rate": 1.268845551957369e-06, + "loss": 0.6445, + "step": 50443 + }, + { + "epoch": 1.29, + "learning_rate": 1.2688189001353571e-06, + "loss": 0.7061, + "step": 50444 + }, + { + "epoch": 1.29, + "learning_rate": 1.2687922481075235e-06, + "loss": 0.6445, + "step": 50445 + }, + { + "epoch": 1.29, + "learning_rate": 1.268765595873888e-06, + "loss": 0.6343, + "step": 50446 + }, + { + "epoch": 1.29, + "learning_rate": 1.2687389434344709e-06, + "loss": 0.6387, + "step": 50447 + }, + { + "epoch": 1.29, + "learning_rate": 1.2687122907892928e-06, + "loss": 0.626, + "step": 50448 + }, + { + "epoch": 1.29, + "learning_rate": 1.268685637938374e-06, + "loss": 0.5562, + "step": 50449 + }, + { + "epoch": 1.29, + "learning_rate": 1.268658984881735e-06, + "loss": 0.6357, + "step": 50450 + }, + { + "epoch": 1.29, + "learning_rate": 1.2686323316193963e-06, + "loss": 0.5608, + "step": 50451 + }, + { + "epoch": 1.29, + "learning_rate": 1.2686056781513778e-06, + "loss": 0.6572, + "step": 50452 + }, + { + "epoch": 1.29, + "learning_rate": 1.2685790244777007e-06, + "loss": 0.6545, + "step": 50453 + }, + { + "epoch": 1.29, + "learning_rate": 1.2685523705983846e-06, + "loss": 0.5879, + "step": 50454 + }, + { + "epoch": 1.29, + "learning_rate": 1.2685257165134507e-06, + "loss": 0.4255, + "step": 50455 + }, + { + "epoch": 1.29, + "learning_rate": 1.2684990622229187e-06, + "loss": 0.5488, + "step": 50456 + }, + { + "epoch": 1.29, + "learning_rate": 1.2684724077268097e-06, + "loss": 0.7637, + "step": 50457 + }, + { + "epoch": 1.29, + "learning_rate": 1.2684457530251432e-06, + "loss": 0.613, + "step": 50458 + }, + { + "epoch": 1.29, + "learning_rate": 1.2684190981179403e-06, + "loss": 0.7715, + "step": 50459 + }, + { + "epoch": 1.29, + "learning_rate": 1.2683924430052213e-06, + "loss": 0.5693, + "step": 50460 + }, + { + "epoch": 1.29, + "learning_rate": 1.2683657876870067e-06, + "loss": 0.6897, + "step": 50461 + }, + { + "epoch": 1.29, + "learning_rate": 1.2683391321633165e-06, + "loss": 0.5952, + "step": 50462 + }, + { + "epoch": 1.29, + "learning_rate": 1.2683124764341714e-06, + "loss": 0.5889, + "step": 50463 + }, + { + "epoch": 1.29, + "learning_rate": 1.268285820499592e-06, + "loss": 0.7266, + "step": 50464 + }, + { + "epoch": 1.29, + "learning_rate": 1.2682591643595984e-06, + "loss": 0.5304, + "step": 50465 + }, + { + "epoch": 1.29, + "learning_rate": 1.268232508014211e-06, + "loss": 0.6416, + "step": 50466 + }, + { + "epoch": 1.29, + "learning_rate": 1.2682058514634504e-06, + "loss": 0.8398, + "step": 50467 + }, + { + "epoch": 1.29, + "learning_rate": 1.2681791947073368e-06, + "loss": 0.5999, + "step": 50468 + }, + { + "epoch": 1.29, + "learning_rate": 1.2681525377458905e-06, + "loss": 0.7275, + "step": 50469 + }, + { + "epoch": 1.29, + "learning_rate": 1.2681258805791326e-06, + "loss": 0.5732, + "step": 50470 + }, + { + "epoch": 1.29, + "learning_rate": 1.2680992232070828e-06, + "loss": 0.8291, + "step": 50471 + }, + { + "epoch": 1.29, + "learning_rate": 1.2680725656297619e-06, + "loss": 0.4656, + "step": 50472 + }, + { + "epoch": 1.29, + "learning_rate": 1.26804590784719e-06, + "loss": 0.6724, + "step": 50473 + }, + { + "epoch": 1.29, + "learning_rate": 1.2680192498593878e-06, + "loss": 0.543, + "step": 50474 + }, + { + "epoch": 1.29, + "learning_rate": 1.2679925916663753e-06, + "loss": 0.6133, + "step": 50475 + }, + { + "epoch": 1.29, + "learning_rate": 1.2679659332681738e-06, + "loss": 0.6353, + "step": 50476 + }, + { + "epoch": 1.29, + "learning_rate": 1.2679392746648026e-06, + "loss": 0.5774, + "step": 50477 + }, + { + "epoch": 1.29, + "learning_rate": 1.2679126158562826e-06, + "loss": 0.4004, + "step": 50478 + }, + { + "epoch": 1.29, + "learning_rate": 1.2678859568426344e-06, + "loss": 0.5854, + "step": 50479 + }, + { + "epoch": 1.29, + "learning_rate": 1.2678592976238783e-06, + "loss": 0.6924, + "step": 50480 + }, + { + "epoch": 1.29, + "learning_rate": 1.2678326382000346e-06, + "loss": 0.6494, + "step": 50481 + }, + { + "epoch": 1.29, + "learning_rate": 1.2678059785711237e-06, + "loss": 0.6128, + "step": 50482 + }, + { + "epoch": 1.29, + "learning_rate": 1.267779318737166e-06, + "loss": 0.5361, + "step": 50483 + }, + { + "epoch": 1.29, + "learning_rate": 1.2677526586981821e-06, + "loss": 0.6777, + "step": 50484 + }, + { + "epoch": 1.29, + "learning_rate": 1.2677259984541922e-06, + "loss": 0.7295, + "step": 50485 + }, + { + "epoch": 1.29, + "learning_rate": 1.267699338005217e-06, + "loss": 0.6387, + "step": 50486 + }, + { + "epoch": 1.29, + "learning_rate": 1.2676726773512767e-06, + "loss": 0.7129, + "step": 50487 + }, + { + "epoch": 1.29, + "learning_rate": 1.2676460164923915e-06, + "loss": 0.8672, + "step": 50488 + }, + { + "epoch": 1.29, + "learning_rate": 1.2676193554285823e-06, + "loss": 0.6484, + "step": 50489 + }, + { + "epoch": 1.29, + "learning_rate": 1.2675926941598691e-06, + "loss": 0.6982, + "step": 50490 + }, + { + "epoch": 1.29, + "learning_rate": 1.2675660326862726e-06, + "loss": 0.6152, + "step": 50491 + }, + { + "epoch": 1.29, + "learning_rate": 1.267539371007813e-06, + "loss": 0.7144, + "step": 50492 + }, + { + "epoch": 1.29, + "learning_rate": 1.267512709124511e-06, + "loss": 0.6748, + "step": 50493 + }, + { + "epoch": 1.29, + "learning_rate": 1.2674860470363867e-06, + "loss": 0.4336, + "step": 50494 + }, + { + "epoch": 1.29, + "learning_rate": 1.2674593847434607e-06, + "loss": 0.7725, + "step": 50495 + }, + { + "epoch": 1.29, + "learning_rate": 1.2674327222457533e-06, + "loss": 0.7998, + "step": 50496 + }, + { + "epoch": 1.29, + "learning_rate": 1.267406059543285e-06, + "loss": 0.6738, + "step": 50497 + }, + { + "epoch": 1.29, + "learning_rate": 1.267379396636076e-06, + "loss": 0.5049, + "step": 50498 + }, + { + "epoch": 1.29, + "learning_rate": 1.267352733524147e-06, + "loss": 0.7754, + "step": 50499 + }, + { + "epoch": 1.29, + "learning_rate": 1.267326070207518e-06, + "loss": 0.645, + "step": 50500 + }, + { + "epoch": 1.29, + "learning_rate": 1.2672994066862103e-06, + "loss": 0.584, + "step": 50501 + }, + { + "epoch": 1.29, + "learning_rate": 1.2672727429602435e-06, + "loss": 0.5985, + "step": 50502 + }, + { + "epoch": 1.29, + "learning_rate": 1.2672460790296382e-06, + "loss": 0.645, + "step": 50503 + }, + { + "epoch": 1.29, + "learning_rate": 1.2672194148944147e-06, + "loss": 0.8408, + "step": 50504 + }, + { + "epoch": 1.29, + "learning_rate": 1.2671927505545938e-06, + "loss": 0.6001, + "step": 50505 + }, + { + "epoch": 1.29, + "learning_rate": 1.2671660860101959e-06, + "loss": 0.5146, + "step": 50506 + }, + { + "epoch": 1.29, + "learning_rate": 1.2671394212612407e-06, + "loss": 0.5103, + "step": 50507 + }, + { + "epoch": 1.29, + "learning_rate": 1.2671127563077493e-06, + "loss": 0.7236, + "step": 50508 + }, + { + "epoch": 1.29, + "learning_rate": 1.2670860911497418e-06, + "loss": 0.7783, + "step": 50509 + }, + { + "epoch": 1.29, + "learning_rate": 1.2670594257872394e-06, + "loss": 0.5986, + "step": 50510 + }, + { + "epoch": 1.29, + "learning_rate": 1.2670327602202613e-06, + "loss": 0.6245, + "step": 50511 + }, + { + "epoch": 1.29, + "learning_rate": 1.2670060944488288e-06, + "loss": 0.5947, + "step": 50512 + }, + { + "epoch": 1.29, + "learning_rate": 1.2669794284729616e-06, + "loss": 0.7363, + "step": 50513 + }, + { + "epoch": 1.29, + "learning_rate": 1.266952762292681e-06, + "loss": 0.7266, + "step": 50514 + }, + { + "epoch": 1.29, + "learning_rate": 1.2669260959080066e-06, + "loss": 0.7725, + "step": 50515 + }, + { + "epoch": 1.29, + "learning_rate": 1.2668994293189594e-06, + "loss": 0.7549, + "step": 50516 + }, + { + "epoch": 1.29, + "learning_rate": 1.2668727625255596e-06, + "loss": 0.4727, + "step": 50517 + }, + { + "epoch": 1.29, + "learning_rate": 1.2668460955278274e-06, + "loss": 0.7236, + "step": 50518 + }, + { + "epoch": 1.29, + "learning_rate": 1.2668194283257833e-06, + "loss": 0.792, + "step": 50519 + }, + { + "epoch": 1.29, + "learning_rate": 1.2667927609194482e-06, + "loss": 0.7363, + "step": 50520 + }, + { + "epoch": 1.29, + "learning_rate": 1.266766093308842e-06, + "loss": 0.5232, + "step": 50521 + }, + { + "epoch": 1.29, + "learning_rate": 1.2667394254939854e-06, + "loss": 0.4951, + "step": 50522 + }, + { + "epoch": 1.29, + "learning_rate": 1.2667127574748984e-06, + "loss": 0.6201, + "step": 50523 + }, + { + "epoch": 1.29, + "learning_rate": 1.2666860892516017e-06, + "loss": 0.7017, + "step": 50524 + }, + { + "epoch": 1.29, + "learning_rate": 1.2666594208241159e-06, + "loss": 0.7891, + "step": 50525 + }, + { + "epoch": 1.3, + "learning_rate": 1.2666327521924612e-06, + "loss": 0.751, + "step": 50526 + }, + { + "epoch": 1.3, + "learning_rate": 1.2666060833566583e-06, + "loss": 0.6255, + "step": 50527 + }, + { + "epoch": 1.3, + "learning_rate": 1.2665794143167272e-06, + "loss": 0.6895, + "step": 50528 + }, + { + "epoch": 1.3, + "learning_rate": 1.2665527450726882e-06, + "loss": 0.5703, + "step": 50529 + }, + { + "epoch": 1.3, + "learning_rate": 1.2665260756245624e-06, + "loss": 0.6729, + "step": 50530 + }, + { + "epoch": 1.3, + "learning_rate": 1.2664994059723696e-06, + "loss": 0.4368, + "step": 50531 + }, + { + "epoch": 1.3, + "learning_rate": 1.2664727361161304e-06, + "loss": 0.7285, + "step": 50532 + }, + { + "epoch": 1.3, + "learning_rate": 1.2664460660558657e-06, + "loss": 0.624, + "step": 50533 + }, + { + "epoch": 1.3, + "learning_rate": 1.2664193957915949e-06, + "loss": 0.668, + "step": 50534 + }, + { + "epoch": 1.3, + "learning_rate": 1.2663927253233398e-06, + "loss": 0.5796, + "step": 50535 + }, + { + "epoch": 1.3, + "learning_rate": 1.2663660546511195e-06, + "loss": 0.6318, + "step": 50536 + }, + { + "epoch": 1.3, + "learning_rate": 1.2663393837749552e-06, + "loss": 0.6768, + "step": 50537 + }, + { + "epoch": 1.3, + "learning_rate": 1.2663127126948667e-06, + "loss": 0.3779, + "step": 50538 + }, + { + "epoch": 1.3, + "learning_rate": 1.266286041410875e-06, + "loss": 0.6992, + "step": 50539 + }, + { + "epoch": 1.3, + "learning_rate": 1.2662593699230005e-06, + "loss": 0.6855, + "step": 50540 + }, + { + "epoch": 1.3, + "learning_rate": 1.2662326982312634e-06, + "loss": 0.5371, + "step": 50541 + }, + { + "epoch": 1.3, + "learning_rate": 1.266206026335684e-06, + "loss": 0.5234, + "step": 50542 + }, + { + "epoch": 1.3, + "learning_rate": 1.2661793542362831e-06, + "loss": 0.6814, + "step": 50543 + }, + { + "epoch": 1.3, + "learning_rate": 1.2661526819330805e-06, + "loss": 0.7637, + "step": 50544 + }, + { + "epoch": 1.3, + "learning_rate": 1.2661260094260974e-06, + "loss": 0.6348, + "step": 50545 + }, + { + "epoch": 1.3, + "learning_rate": 1.2660993367153538e-06, + "loss": 0.5022, + "step": 50546 + }, + { + "epoch": 1.3, + "learning_rate": 1.2660726638008702e-06, + "loss": 0.4722, + "step": 50547 + }, + { + "epoch": 1.3, + "learning_rate": 1.2660459906826668e-06, + "loss": 0.7324, + "step": 50548 + }, + { + "epoch": 1.3, + "learning_rate": 1.2660193173607644e-06, + "loss": 0.6797, + "step": 50549 + }, + { + "epoch": 1.3, + "learning_rate": 1.265992643835183e-06, + "loss": 0.8184, + "step": 50550 + }, + { + "epoch": 1.3, + "learning_rate": 1.2659659701059435e-06, + "loss": 0.6025, + "step": 50551 + }, + { + "epoch": 1.3, + "learning_rate": 1.2659392961730663e-06, + "loss": 0.4937, + "step": 50552 + }, + { + "epoch": 1.3, + "learning_rate": 1.265912622036571e-06, + "loss": 0.4854, + "step": 50553 + }, + { + "epoch": 1.3, + "learning_rate": 1.265885947696479e-06, + "loss": 0.7588, + "step": 50554 + }, + { + "epoch": 1.3, + "learning_rate": 1.2658592731528102e-06, + "loss": 0.7354, + "step": 50555 + }, + { + "epoch": 1.3, + "learning_rate": 1.2658325984055855e-06, + "loss": 0.7129, + "step": 50556 + }, + { + "epoch": 1.3, + "learning_rate": 1.265805923454825e-06, + "loss": 0.7383, + "step": 50557 + }, + { + "epoch": 1.3, + "learning_rate": 1.2657792483005488e-06, + "loss": 0.6274, + "step": 50558 + }, + { + "epoch": 1.3, + "learning_rate": 1.2657525729427777e-06, + "loss": 0.6807, + "step": 50559 + }, + { + "epoch": 1.3, + "learning_rate": 1.265725897381532e-06, + "loss": 0.751, + "step": 50560 + }, + { + "epoch": 1.3, + "learning_rate": 1.2656992216168325e-06, + "loss": 0.6416, + "step": 50561 + }, + { + "epoch": 1.3, + "learning_rate": 1.2656725456486994e-06, + "loss": 0.5779, + "step": 50562 + }, + { + "epoch": 1.3, + "learning_rate": 1.2656458694771526e-06, + "loss": 0.5469, + "step": 50563 + }, + { + "epoch": 1.3, + "learning_rate": 1.2656191931022132e-06, + "loss": 0.5129, + "step": 50564 + }, + { + "epoch": 1.3, + "learning_rate": 1.2655925165239013e-06, + "loss": 0.7441, + "step": 50565 + }, + { + "epoch": 1.3, + "learning_rate": 1.2655658397422377e-06, + "loss": 0.8076, + "step": 50566 + }, + { + "epoch": 1.3, + "learning_rate": 1.2655391627572423e-06, + "loss": 0.6074, + "step": 50567 + }, + { + "epoch": 1.3, + "learning_rate": 1.2655124855689358e-06, + "loss": 0.6665, + "step": 50568 + }, + { + "epoch": 1.3, + "learning_rate": 1.2654858081773388e-06, + "loss": 0.5918, + "step": 50569 + }, + { + "epoch": 1.3, + "learning_rate": 1.2654591305824713e-06, + "loss": 0.6177, + "step": 50570 + }, + { + "epoch": 1.3, + "learning_rate": 1.265432452784354e-06, + "loss": 0.5288, + "step": 50571 + }, + { + "epoch": 1.3, + "learning_rate": 1.2654057747830072e-06, + "loss": 0.7119, + "step": 50572 + }, + { + "epoch": 1.3, + "learning_rate": 1.2653790965784517e-06, + "loss": 0.3145, + "step": 50573 + }, + { + "epoch": 1.3, + "learning_rate": 1.2653524181707074e-06, + "loss": 0.5366, + "step": 50574 + }, + { + "epoch": 1.3, + "learning_rate": 1.2653257395597946e-06, + "loss": 0.7266, + "step": 50575 + }, + { + "epoch": 1.3, + "learning_rate": 1.2652990607457348e-06, + "loss": 0.6514, + "step": 50576 + }, + { + "epoch": 1.3, + "learning_rate": 1.2652723817285473e-06, + "loss": 0.5879, + "step": 50577 + }, + { + "epoch": 1.3, + "learning_rate": 1.2652457025082528e-06, + "loss": 0.6499, + "step": 50578 + }, + { + "epoch": 1.3, + "learning_rate": 1.2652190230848723e-06, + "loss": 0.7676, + "step": 50579 + }, + { + "epoch": 1.3, + "learning_rate": 1.2651923434584253e-06, + "loss": 0.5728, + "step": 50580 + }, + { + "epoch": 1.3, + "learning_rate": 1.2651656636289332e-06, + "loss": 0.626, + "step": 50581 + }, + { + "epoch": 1.3, + "learning_rate": 1.2651389835964156e-06, + "loss": 0.5157, + "step": 50582 + }, + { + "epoch": 1.3, + "learning_rate": 1.2651123033608934e-06, + "loss": 0.6157, + "step": 50583 + }, + { + "epoch": 1.3, + "learning_rate": 1.2650856229223868e-06, + "loss": 0.6768, + "step": 50584 + }, + { + "epoch": 1.3, + "learning_rate": 1.2650589422809165e-06, + "loss": 0.5918, + "step": 50585 + }, + { + "epoch": 1.3, + "learning_rate": 1.2650322614365027e-06, + "loss": 0.8799, + "step": 50586 + }, + { + "epoch": 1.3, + "learning_rate": 1.265005580389166e-06, + "loss": 0.6777, + "step": 50587 + }, + { + "epoch": 1.3, + "learning_rate": 1.2649788991389263e-06, + "loss": 0.5126, + "step": 50588 + }, + { + "epoch": 1.3, + "learning_rate": 1.2649522176858048e-06, + "loss": 0.6493, + "step": 50589 + }, + { + "epoch": 1.3, + "learning_rate": 1.2649255360298213e-06, + "loss": 0.5625, + "step": 50590 + }, + { + "epoch": 1.3, + "learning_rate": 1.2648988541709971e-06, + "loss": 0.6514, + "step": 50591 + }, + { + "epoch": 1.3, + "learning_rate": 1.2648721721093511e-06, + "loss": 0.4382, + "step": 50592 + }, + { + "epoch": 1.3, + "learning_rate": 1.2648454898449055e-06, + "loss": 0.594, + "step": 50593 + }, + { + "epoch": 1.3, + "learning_rate": 1.2648188073776794e-06, + "loss": 0.7158, + "step": 50594 + }, + { + "epoch": 1.3, + "learning_rate": 1.2647921247076939e-06, + "loss": 0.5151, + "step": 50595 + }, + { + "epoch": 1.3, + "learning_rate": 1.2647654418349691e-06, + "loss": 0.6602, + "step": 50596 + }, + { + "epoch": 1.3, + "learning_rate": 1.2647387587595257e-06, + "loss": 0.7109, + "step": 50597 + }, + { + "epoch": 1.3, + "learning_rate": 1.264712075481384e-06, + "loss": 0.6543, + "step": 50598 + }, + { + "epoch": 1.3, + "learning_rate": 1.2646853920005642e-06, + "loss": 0.748, + "step": 50599 + }, + { + "epoch": 1.3, + "learning_rate": 1.2646587083170875e-06, + "loss": 0.6875, + "step": 50600 + }, + { + "epoch": 1.3, + "learning_rate": 1.2646320244309734e-06, + "loss": 0.6105, + "step": 50601 + }, + { + "epoch": 1.3, + "learning_rate": 1.2646053403422428e-06, + "loss": 0.7217, + "step": 50602 + }, + { + "epoch": 1.3, + "learning_rate": 1.264578656050916e-06, + "loss": 0.5803, + "step": 50603 + }, + { + "epoch": 1.3, + "learning_rate": 1.2645519715570134e-06, + "loss": 0.5093, + "step": 50604 + }, + { + "epoch": 1.3, + "learning_rate": 1.2645252868605556e-06, + "loss": 0.7344, + "step": 50605 + }, + { + "epoch": 1.3, + "learning_rate": 1.2644986019615633e-06, + "loss": 0.7109, + "step": 50606 + }, + { + "epoch": 1.3, + "learning_rate": 1.2644719168600562e-06, + "loss": 0.6484, + "step": 50607 + }, + { + "epoch": 1.3, + "learning_rate": 1.2644452315560555e-06, + "loss": 0.8389, + "step": 50608 + }, + { + "epoch": 1.3, + "learning_rate": 1.2644185460495807e-06, + "loss": 0.6934, + "step": 50609 + }, + { + "epoch": 1.3, + "learning_rate": 1.2643918603406532e-06, + "loss": 0.5457, + "step": 50610 + }, + { + "epoch": 1.3, + "learning_rate": 1.2643651744292928e-06, + "loss": 0.7871, + "step": 50611 + }, + { + "epoch": 1.3, + "learning_rate": 1.2643384883155204e-06, + "loss": 0.6758, + "step": 50612 + }, + { + "epoch": 1.3, + "learning_rate": 1.2643118019993558e-06, + "loss": 0.7314, + "step": 50613 + }, + { + "epoch": 1.3, + "learning_rate": 1.2642851154808197e-06, + "loss": 0.6162, + "step": 50614 + }, + { + "epoch": 1.3, + "learning_rate": 1.2642584287599328e-06, + "loss": 0.7344, + "step": 50615 + }, + { + "epoch": 1.3, + "learning_rate": 1.2642317418367156e-06, + "loss": 0.6602, + "step": 50616 + }, + { + "epoch": 1.3, + "learning_rate": 1.2642050547111884e-06, + "loss": 0.7998, + "step": 50617 + }, + { + "epoch": 1.3, + "learning_rate": 1.2641783673833714e-06, + "loss": 0.4782, + "step": 50618 + }, + { + "epoch": 1.3, + "learning_rate": 1.264151679853285e-06, + "loss": 0.6108, + "step": 50619 + }, + { + "epoch": 1.3, + "learning_rate": 1.26412499212095e-06, + "loss": 0.7979, + "step": 50620 + }, + { + "epoch": 1.3, + "learning_rate": 1.2640983041863865e-06, + "loss": 0.8135, + "step": 50621 + }, + { + "epoch": 1.3, + "learning_rate": 1.264071616049615e-06, + "loss": 0.618, + "step": 50622 + }, + { + "epoch": 1.3, + "learning_rate": 1.264044927710656e-06, + "loss": 0.6055, + "step": 50623 + }, + { + "epoch": 1.3, + "learning_rate": 1.26401823916953e-06, + "loss": 0.7188, + "step": 50624 + }, + { + "epoch": 1.3, + "learning_rate": 1.2639915504262576e-06, + "loss": 0.531, + "step": 50625 + }, + { + "epoch": 1.3, + "learning_rate": 1.263964861480859e-06, + "loss": 0.707, + "step": 50626 + }, + { + "epoch": 1.3, + "learning_rate": 1.2639381723333543e-06, + "loss": 0.4424, + "step": 50627 + }, + { + "epoch": 1.3, + "learning_rate": 1.2639114829837644e-06, + "loss": 0.5132, + "step": 50628 + }, + { + "epoch": 1.3, + "learning_rate": 1.2638847934321097e-06, + "loss": 0.6523, + "step": 50629 + }, + { + "epoch": 1.3, + "learning_rate": 1.2638581036784105e-06, + "loss": 0.6904, + "step": 50630 + }, + { + "epoch": 1.3, + "learning_rate": 1.2638314137226877e-06, + "loss": 0.5146, + "step": 50631 + }, + { + "epoch": 1.3, + "learning_rate": 1.2638047235649608e-06, + "loss": 0.6836, + "step": 50632 + }, + { + "epoch": 1.3, + "learning_rate": 1.2637780332052508e-06, + "loss": 0.9482, + "step": 50633 + }, + { + "epoch": 1.3, + "learning_rate": 1.263751342643578e-06, + "loss": 0.79, + "step": 50634 + }, + { + "epoch": 1.3, + "learning_rate": 1.263724651879963e-06, + "loss": 0.7544, + "step": 50635 + }, + { + "epoch": 1.3, + "learning_rate": 1.2636979609144266e-06, + "loss": 0.6826, + "step": 50636 + }, + { + "epoch": 1.3, + "learning_rate": 1.2636712697469885e-06, + "loss": 0.6611, + "step": 50637 + }, + { + "epoch": 1.3, + "learning_rate": 1.2636445783776693e-06, + "loss": 0.4753, + "step": 50638 + }, + { + "epoch": 1.3, + "learning_rate": 1.2636178868064894e-06, + "loss": 0.8496, + "step": 50639 + }, + { + "epoch": 1.3, + "learning_rate": 1.2635911950334697e-06, + "loss": 0.6953, + "step": 50640 + }, + { + "epoch": 1.3, + "learning_rate": 1.2635645030586303e-06, + "loss": 0.7598, + "step": 50641 + }, + { + "epoch": 1.3, + "learning_rate": 1.263537810881992e-06, + "loss": 0.834, + "step": 50642 + }, + { + "epoch": 1.3, + "learning_rate": 1.2635111185035744e-06, + "loss": 0.8252, + "step": 50643 + }, + { + "epoch": 1.3, + "learning_rate": 1.2634844259233985e-06, + "loss": 0.8496, + "step": 50644 + }, + { + "epoch": 1.3, + "learning_rate": 1.263457733141485e-06, + "loss": 0.623, + "step": 50645 + }, + { + "epoch": 1.3, + "learning_rate": 1.2634310401578541e-06, + "loss": 0.7749, + "step": 50646 + }, + { + "epoch": 1.3, + "learning_rate": 1.2634043469725257e-06, + "loss": 0.5986, + "step": 50647 + }, + { + "epoch": 1.3, + "learning_rate": 1.263377653585521e-06, + "loss": 0.6387, + "step": 50648 + }, + { + "epoch": 1.3, + "learning_rate": 1.2633509599968599e-06, + "loss": 0.6104, + "step": 50649 + }, + { + "epoch": 1.3, + "learning_rate": 1.2633242662065634e-06, + "loss": 0.6602, + "step": 50650 + }, + { + "epoch": 1.3, + "learning_rate": 1.2632975722146514e-06, + "loss": 0.6475, + "step": 50651 + }, + { + "epoch": 1.3, + "learning_rate": 1.2632708780211448e-06, + "loss": 0.6963, + "step": 50652 + }, + { + "epoch": 1.3, + "learning_rate": 1.2632441836260633e-06, + "loss": 0.7383, + "step": 50653 + }, + { + "epoch": 1.3, + "learning_rate": 1.2632174890294283e-06, + "loss": 0.6733, + "step": 50654 + }, + { + "epoch": 1.3, + "learning_rate": 1.2631907942312596e-06, + "loss": 0.7461, + "step": 50655 + }, + { + "epoch": 1.3, + "learning_rate": 1.2631640992315779e-06, + "loss": 0.5879, + "step": 50656 + }, + { + "epoch": 1.3, + "learning_rate": 1.2631374040304034e-06, + "loss": 0.7119, + "step": 50657 + }, + { + "epoch": 1.3, + "learning_rate": 1.2631107086277568e-06, + "loss": 0.8174, + "step": 50658 + }, + { + "epoch": 1.3, + "learning_rate": 1.2630840130236584e-06, + "loss": 0.5454, + "step": 50659 + }, + { + "epoch": 1.3, + "learning_rate": 1.2630573172181287e-06, + "loss": 0.6055, + "step": 50660 + }, + { + "epoch": 1.3, + "learning_rate": 1.263030621211188e-06, + "loss": 0.6826, + "step": 50661 + }, + { + "epoch": 1.3, + "learning_rate": 1.2630039250028568e-06, + "loss": 0.6909, + "step": 50662 + }, + { + "epoch": 1.3, + "learning_rate": 1.262977228593156e-06, + "loss": 0.5112, + "step": 50663 + }, + { + "epoch": 1.3, + "learning_rate": 1.2629505319821055e-06, + "loss": 0.7285, + "step": 50664 + }, + { + "epoch": 1.3, + "learning_rate": 1.2629238351697253e-06, + "loss": 0.8047, + "step": 50665 + }, + { + "epoch": 1.3, + "learning_rate": 1.262897138156037e-06, + "loss": 0.7744, + "step": 50666 + }, + { + "epoch": 1.3, + "learning_rate": 1.2628704409410605e-06, + "loss": 0.6729, + "step": 50667 + }, + { + "epoch": 1.3, + "learning_rate": 1.2628437435248157e-06, + "loss": 0.7256, + "step": 50668 + }, + { + "epoch": 1.3, + "learning_rate": 1.2628170459073238e-06, + "loss": 0.666, + "step": 50669 + }, + { + "epoch": 1.3, + "learning_rate": 1.2627903480886049e-06, + "loss": 0.7754, + "step": 50670 + }, + { + "epoch": 1.3, + "learning_rate": 1.2627636500686798e-06, + "loss": 0.603, + "step": 50671 + }, + { + "epoch": 1.3, + "learning_rate": 1.2627369518475682e-06, + "loss": 0.6016, + "step": 50672 + }, + { + "epoch": 1.3, + "learning_rate": 1.2627102534252915e-06, + "loss": 0.5757, + "step": 50673 + }, + { + "epoch": 1.3, + "learning_rate": 1.262683554801869e-06, + "loss": 0.6216, + "step": 50674 + }, + { + "epoch": 1.3, + "learning_rate": 1.2626568559773226e-06, + "loss": 0.5913, + "step": 50675 + }, + { + "epoch": 1.3, + "learning_rate": 1.2626301569516713e-06, + "loss": 0.6553, + "step": 50676 + }, + { + "epoch": 1.3, + "learning_rate": 1.2626034577249365e-06, + "loss": 0.7041, + "step": 50677 + }, + { + "epoch": 1.3, + "learning_rate": 1.2625767582971378e-06, + "loss": 0.6436, + "step": 50678 + }, + { + "epoch": 1.3, + "learning_rate": 1.2625500586682966e-06, + "loss": 0.6592, + "step": 50679 + }, + { + "epoch": 1.3, + "learning_rate": 1.262523358838433e-06, + "loss": 0.5879, + "step": 50680 + }, + { + "epoch": 1.3, + "learning_rate": 1.262496658807567e-06, + "loss": 0.7104, + "step": 50681 + }, + { + "epoch": 1.3, + "learning_rate": 1.2624699585757195e-06, + "loss": 0.8682, + "step": 50682 + }, + { + "epoch": 1.3, + "learning_rate": 1.2624432581429107e-06, + "loss": 0.6226, + "step": 50683 + }, + { + "epoch": 1.3, + "learning_rate": 1.2624165575091612e-06, + "loss": 0.7764, + "step": 50684 + }, + { + "epoch": 1.3, + "learning_rate": 1.2623898566744915e-06, + "loss": 0.7383, + "step": 50685 + }, + { + "epoch": 1.3, + "learning_rate": 1.262363155638922e-06, + "loss": 0.7627, + "step": 50686 + }, + { + "epoch": 1.3, + "learning_rate": 1.262336454402473e-06, + "loss": 0.6826, + "step": 50687 + }, + { + "epoch": 1.3, + "learning_rate": 1.2623097529651652e-06, + "loss": 0.7271, + "step": 50688 + }, + { + "epoch": 1.3, + "learning_rate": 1.2622830513270187e-06, + "loss": 0.8447, + "step": 50689 + }, + { + "epoch": 1.3, + "learning_rate": 1.2622563494880542e-06, + "loss": 0.4371, + "step": 50690 + }, + { + "epoch": 1.3, + "learning_rate": 1.262229647448292e-06, + "loss": 0.397, + "step": 50691 + }, + { + "epoch": 1.3, + "learning_rate": 1.2622029452077528e-06, + "loss": 0.5619, + "step": 50692 + }, + { + "epoch": 1.3, + "learning_rate": 1.2621762427664566e-06, + "loss": 0.7373, + "step": 50693 + }, + { + "epoch": 1.3, + "learning_rate": 1.2621495401244244e-06, + "loss": 0.6138, + "step": 50694 + }, + { + "epoch": 1.3, + "learning_rate": 1.262122837281676e-06, + "loss": 0.6392, + "step": 50695 + }, + { + "epoch": 1.3, + "learning_rate": 1.2620961342382326e-06, + "loss": 0.7676, + "step": 50696 + }, + { + "epoch": 1.3, + "learning_rate": 1.262069430994114e-06, + "loss": 0.4292, + "step": 50697 + }, + { + "epoch": 1.3, + "learning_rate": 1.262042727549341e-06, + "loss": 0.5288, + "step": 50698 + }, + { + "epoch": 1.3, + "learning_rate": 1.2620160239039336e-06, + "loss": 0.5557, + "step": 50699 + }, + { + "epoch": 1.3, + "learning_rate": 1.2619893200579133e-06, + "loss": 0.7023, + "step": 50700 + }, + { + "epoch": 1.3, + "learning_rate": 1.261962616011299e-06, + "loss": 0.5977, + "step": 50701 + }, + { + "epoch": 1.3, + "learning_rate": 1.2619359117641123e-06, + "loss": 0.5684, + "step": 50702 + }, + { + "epoch": 1.3, + "learning_rate": 1.2619092073163736e-06, + "loss": 0.6768, + "step": 50703 + }, + { + "epoch": 1.3, + "learning_rate": 1.2618825026681025e-06, + "loss": 0.7949, + "step": 50704 + }, + { + "epoch": 1.3, + "learning_rate": 1.2618557978193206e-06, + "loss": 0.4624, + "step": 50705 + }, + { + "epoch": 1.3, + "learning_rate": 1.2618290927700472e-06, + "loss": 0.5527, + "step": 50706 + }, + { + "epoch": 1.3, + "learning_rate": 1.2618023875203036e-06, + "loss": 0.7363, + "step": 50707 + }, + { + "epoch": 1.3, + "learning_rate": 1.2617756820701102e-06, + "loss": 0.5586, + "step": 50708 + }, + { + "epoch": 1.3, + "learning_rate": 1.2617489764194868e-06, + "loss": 0.6758, + "step": 50709 + }, + { + "epoch": 1.3, + "learning_rate": 1.2617222705684544e-06, + "loss": 0.667, + "step": 50710 + }, + { + "epoch": 1.3, + "learning_rate": 1.2616955645170333e-06, + "loss": 0.7422, + "step": 50711 + }, + { + "epoch": 1.3, + "learning_rate": 1.2616688582652437e-06, + "loss": 0.6987, + "step": 50712 + }, + { + "epoch": 1.3, + "learning_rate": 1.2616421518131066e-06, + "loss": 0.7148, + "step": 50713 + }, + { + "epoch": 1.3, + "learning_rate": 1.261615445160642e-06, + "loss": 0.5798, + "step": 50714 + }, + { + "epoch": 1.3, + "learning_rate": 1.2615887383078708e-06, + "loss": 0.5874, + "step": 50715 + }, + { + "epoch": 1.3, + "learning_rate": 1.2615620312548124e-06, + "loss": 0.5767, + "step": 50716 + }, + { + "epoch": 1.3, + "learning_rate": 1.2615353240014886e-06, + "loss": 0.8008, + "step": 50717 + }, + { + "epoch": 1.3, + "learning_rate": 1.261508616547919e-06, + "loss": 0.5562, + "step": 50718 + }, + { + "epoch": 1.3, + "learning_rate": 1.2614819088941243e-06, + "loss": 0.5288, + "step": 50719 + }, + { + "epoch": 1.3, + "learning_rate": 1.2614552010401251e-06, + "loss": 0.7024, + "step": 50720 + }, + { + "epoch": 1.3, + "learning_rate": 1.2614284929859416e-06, + "loss": 0.6206, + "step": 50721 + }, + { + "epoch": 1.3, + "learning_rate": 1.261401784731594e-06, + "loss": 0.6357, + "step": 50722 + }, + { + "epoch": 1.3, + "learning_rate": 1.2613750762771033e-06, + "loss": 0.6577, + "step": 50723 + }, + { + "epoch": 1.3, + "learning_rate": 1.2613483676224897e-06, + "loss": 0.8184, + "step": 50724 + }, + { + "epoch": 1.3, + "learning_rate": 1.2613216587677736e-06, + "loss": 0.5674, + "step": 50725 + }, + { + "epoch": 1.3, + "learning_rate": 1.261294949712976e-06, + "loss": 0.6567, + "step": 50726 + }, + { + "epoch": 1.3, + "learning_rate": 1.2612682404581166e-06, + "loss": 0.8291, + "step": 50727 + }, + { + "epoch": 1.3, + "learning_rate": 1.2612415310032156e-06, + "loss": 0.592, + "step": 50728 + }, + { + "epoch": 1.3, + "learning_rate": 1.2612148213482944e-06, + "loss": 0.8555, + "step": 50729 + }, + { + "epoch": 1.3, + "learning_rate": 1.2611881114933732e-06, + "loss": 0.5913, + "step": 50730 + }, + { + "epoch": 1.3, + "learning_rate": 1.261161401438472e-06, + "loss": 0.6279, + "step": 50731 + }, + { + "epoch": 1.3, + "learning_rate": 1.2611346911836118e-06, + "loss": 0.5986, + "step": 50732 + }, + { + "epoch": 1.3, + "learning_rate": 1.2611079807288124e-06, + "loss": 0.6748, + "step": 50733 + }, + { + "epoch": 1.3, + "learning_rate": 1.261081270074095e-06, + "loss": 0.5793, + "step": 50734 + }, + { + "epoch": 1.3, + "learning_rate": 1.2610545592194795e-06, + "loss": 0.7949, + "step": 50735 + }, + { + "epoch": 1.3, + "learning_rate": 1.2610278481649864e-06, + "loss": 0.5864, + "step": 50736 + }, + { + "epoch": 1.3, + "learning_rate": 1.2610011369106364e-06, + "loss": 0.8076, + "step": 50737 + }, + { + "epoch": 1.3, + "learning_rate": 1.26097442545645e-06, + "loss": 0.6689, + "step": 50738 + }, + { + "epoch": 1.3, + "learning_rate": 1.260947713802447e-06, + "loss": 0.7109, + "step": 50739 + }, + { + "epoch": 1.3, + "learning_rate": 1.2609210019486489e-06, + "loss": 0.5571, + "step": 50740 + }, + { + "epoch": 1.3, + "learning_rate": 1.2608942898950752e-06, + "loss": 0.6855, + "step": 50741 + }, + { + "epoch": 1.3, + "learning_rate": 1.260867577641747e-06, + "loss": 0.5916, + "step": 50742 + }, + { + "epoch": 1.3, + "learning_rate": 1.2608408651886842e-06, + "loss": 0.8525, + "step": 50743 + }, + { + "epoch": 1.3, + "learning_rate": 1.2608141525359077e-06, + "loss": 0.4844, + "step": 50744 + }, + { + "epoch": 1.3, + "learning_rate": 1.260787439683438e-06, + "loss": 0.5688, + "step": 50745 + }, + { + "epoch": 1.3, + "learning_rate": 1.2607607266312953e-06, + "loss": 0.5139, + "step": 50746 + }, + { + "epoch": 1.3, + "learning_rate": 1.2607340133794997e-06, + "loss": 0.4103, + "step": 50747 + }, + { + "epoch": 1.3, + "learning_rate": 1.2607072999280724e-06, + "loss": 0.7007, + "step": 50748 + }, + { + "epoch": 1.3, + "learning_rate": 1.2606805862770333e-06, + "loss": 0.6138, + "step": 50749 + }, + { + "epoch": 1.3, + "learning_rate": 1.2606538724264032e-06, + "loss": 0.5413, + "step": 50750 + }, + { + "epoch": 1.3, + "learning_rate": 1.2606271583762026e-06, + "loss": 0.6099, + "step": 50751 + }, + { + "epoch": 1.3, + "learning_rate": 1.2606004441264512e-06, + "loss": 0.7031, + "step": 50752 + }, + { + "epoch": 1.3, + "learning_rate": 1.2605737296771706e-06, + "loss": 0.7173, + "step": 50753 + }, + { + "epoch": 1.3, + "learning_rate": 1.2605470150283805e-06, + "loss": 0.6016, + "step": 50754 + }, + { + "epoch": 1.3, + "learning_rate": 1.2605203001801014e-06, + "loss": 0.7461, + "step": 50755 + }, + { + "epoch": 1.3, + "learning_rate": 1.260493585132354e-06, + "loss": 0.6436, + "step": 50756 + }, + { + "epoch": 1.3, + "learning_rate": 1.2604668698851586e-06, + "loss": 0.6807, + "step": 50757 + }, + { + "epoch": 1.3, + "learning_rate": 1.2604401544385356e-06, + "loss": 0.5488, + "step": 50758 + }, + { + "epoch": 1.3, + "learning_rate": 1.2604134387925057e-06, + "loss": 0.6709, + "step": 50759 + }, + { + "epoch": 1.3, + "learning_rate": 1.2603867229470893e-06, + "loss": 0.6372, + "step": 50760 + }, + { + "epoch": 1.3, + "learning_rate": 1.2603600069023065e-06, + "loss": 0.5532, + "step": 50761 + }, + { + "epoch": 1.3, + "learning_rate": 1.2603332906581781e-06, + "loss": 0.5591, + "step": 50762 + }, + { + "epoch": 1.3, + "learning_rate": 1.2603065742147245e-06, + "loss": 0.5884, + "step": 50763 + }, + { + "epoch": 1.3, + "learning_rate": 1.260279857571966e-06, + "loss": 0.6914, + "step": 50764 + }, + { + "epoch": 1.3, + "learning_rate": 1.2602531407299237e-06, + "loss": 0.5601, + "step": 50765 + }, + { + "epoch": 1.3, + "learning_rate": 1.2602264236886169e-06, + "loss": 0.6807, + "step": 50766 + }, + { + "epoch": 1.3, + "learning_rate": 1.260199706448067e-06, + "loss": 0.6895, + "step": 50767 + }, + { + "epoch": 1.3, + "learning_rate": 1.2601729890082941e-06, + "loss": 0.7773, + "step": 50768 + }, + { + "epoch": 1.3, + "learning_rate": 1.2601462713693187e-06, + "loss": 0.4268, + "step": 50769 + }, + { + "epoch": 1.3, + "learning_rate": 1.2601195535311613e-06, + "loss": 0.6587, + "step": 50770 + }, + { + "epoch": 1.3, + "learning_rate": 1.2600928354938422e-06, + "loss": 0.583, + "step": 50771 + }, + { + "epoch": 1.3, + "learning_rate": 1.260066117257382e-06, + "loss": 0.6123, + "step": 50772 + }, + { + "epoch": 1.3, + "learning_rate": 1.2600393988218013e-06, + "loss": 0.6831, + "step": 50773 + }, + { + "epoch": 1.3, + "learning_rate": 1.26001268018712e-06, + "loss": 0.7031, + "step": 50774 + }, + { + "epoch": 1.3, + "learning_rate": 1.2599859613533595e-06, + "loss": 0.6626, + "step": 50775 + }, + { + "epoch": 1.3, + "learning_rate": 1.2599592423205395e-06, + "loss": 0.635, + "step": 50776 + }, + { + "epoch": 1.3, + "learning_rate": 1.2599325230886805e-06, + "loss": 0.5278, + "step": 50777 + }, + { + "epoch": 1.3, + "learning_rate": 1.2599058036578032e-06, + "loss": 0.6255, + "step": 50778 + }, + { + "epoch": 1.3, + "learning_rate": 1.2598790840279279e-06, + "loss": 0.5347, + "step": 50779 + }, + { + "epoch": 1.3, + "learning_rate": 1.2598523641990752e-06, + "loss": 0.5168, + "step": 50780 + }, + { + "epoch": 1.3, + "learning_rate": 1.2598256441712657e-06, + "loss": 0.748, + "step": 50781 + }, + { + "epoch": 1.3, + "learning_rate": 1.2597989239445195e-06, + "loss": 0.6533, + "step": 50782 + }, + { + "epoch": 1.3, + "learning_rate": 1.2597722035188569e-06, + "loss": 0.6572, + "step": 50783 + }, + { + "epoch": 1.3, + "learning_rate": 1.259745482894299e-06, + "loss": 0.6572, + "step": 50784 + }, + { + "epoch": 1.3, + "learning_rate": 1.259718762070866e-06, + "loss": 0.7422, + "step": 50785 + }, + { + "epoch": 1.3, + "learning_rate": 1.259692041048578e-06, + "loss": 0.6211, + "step": 50786 + }, + { + "epoch": 1.3, + "learning_rate": 1.259665319827456e-06, + "loss": 0.6182, + "step": 50787 + }, + { + "epoch": 1.3, + "learning_rate": 1.2596385984075203e-06, + "loss": 0.585, + "step": 50788 + }, + { + "epoch": 1.3, + "learning_rate": 1.2596118767887906e-06, + "loss": 0.7344, + "step": 50789 + }, + { + "epoch": 1.3, + "learning_rate": 1.259585154971289e-06, + "loss": 0.6099, + "step": 50790 + }, + { + "epoch": 1.3, + "learning_rate": 1.2595584329550343e-06, + "loss": 0.7412, + "step": 50791 + }, + { + "epoch": 1.3, + "learning_rate": 1.2595317107400478e-06, + "loss": 0.5796, + "step": 50792 + }, + { + "epoch": 1.3, + "learning_rate": 1.2595049883263498e-06, + "loss": 0.5483, + "step": 50793 + }, + { + "epoch": 1.3, + "learning_rate": 1.2594782657139607e-06, + "loss": 0.751, + "step": 50794 + }, + { + "epoch": 1.3, + "learning_rate": 1.259451542902901e-06, + "loss": 0.6187, + "step": 50795 + }, + { + "epoch": 1.3, + "learning_rate": 1.2594248198931915e-06, + "loss": 0.4541, + "step": 50796 + }, + { + "epoch": 1.3, + "learning_rate": 1.259398096684852e-06, + "loss": 0.7139, + "step": 50797 + }, + { + "epoch": 1.3, + "learning_rate": 1.2593713732779034e-06, + "loss": 0.6421, + "step": 50798 + }, + { + "epoch": 1.3, + "learning_rate": 1.259344649672366e-06, + "loss": 0.6777, + "step": 50799 + }, + { + "epoch": 1.3, + "learning_rate": 1.2593179258682605e-06, + "loss": 0.7129, + "step": 50800 + }, + { + "epoch": 1.3, + "learning_rate": 1.2592912018656072e-06, + "loss": 0.5869, + "step": 50801 + }, + { + "epoch": 1.3, + "learning_rate": 1.2592644776644264e-06, + "loss": 0.6709, + "step": 50802 + }, + { + "epoch": 1.3, + "learning_rate": 1.2592377532647389e-06, + "loss": 0.6074, + "step": 50803 + }, + { + "epoch": 1.3, + "learning_rate": 1.2592110286665647e-06, + "loss": 0.7588, + "step": 50804 + }, + { + "epoch": 1.3, + "learning_rate": 1.259184303869925e-06, + "loss": 0.5977, + "step": 50805 + }, + { + "epoch": 1.3, + "learning_rate": 1.2591575788748391e-06, + "loss": 0.4714, + "step": 50806 + }, + { + "epoch": 1.3, + "learning_rate": 1.2591308536813287e-06, + "loss": 0.5967, + "step": 50807 + }, + { + "epoch": 1.3, + "learning_rate": 1.2591041282894135e-06, + "loss": 0.5371, + "step": 50808 + }, + { + "epoch": 1.3, + "learning_rate": 1.2590774026991142e-06, + "loss": 0.6558, + "step": 50809 + }, + { + "epoch": 1.3, + "learning_rate": 1.2590506769104513e-06, + "loss": 0.7705, + "step": 50810 + }, + { + "epoch": 1.3, + "learning_rate": 1.2590239509234453e-06, + "loss": 0.5308, + "step": 50811 + }, + { + "epoch": 1.3, + "learning_rate": 1.2589972247381164e-06, + "loss": 0.6361, + "step": 50812 + }, + { + "epoch": 1.3, + "learning_rate": 1.2589704983544853e-06, + "loss": 0.71, + "step": 50813 + }, + { + "epoch": 1.3, + "learning_rate": 1.2589437717725724e-06, + "loss": 0.6675, + "step": 50814 + }, + { + "epoch": 1.3, + "learning_rate": 1.2589170449923981e-06, + "loss": 0.5933, + "step": 50815 + }, + { + "epoch": 1.3, + "learning_rate": 1.2588903180139832e-06, + "loss": 0.7666, + "step": 50816 + }, + { + "epoch": 1.3, + "learning_rate": 1.2588635908373477e-06, + "loss": 0.6553, + "step": 50817 + }, + { + "epoch": 1.3, + "learning_rate": 1.2588368634625119e-06, + "loss": 0.5845, + "step": 50818 + }, + { + "epoch": 1.3, + "learning_rate": 1.2588101358894972e-06, + "loss": 0.5825, + "step": 50819 + }, + { + "epoch": 1.3, + "learning_rate": 1.2587834081183234e-06, + "loss": 0.6885, + "step": 50820 + }, + { + "epoch": 1.3, + "learning_rate": 1.2587566801490104e-06, + "loss": 0.7646, + "step": 50821 + }, + { + "epoch": 1.3, + "learning_rate": 1.25872995198158e-06, + "loss": 0.6914, + "step": 50822 + }, + { + "epoch": 1.3, + "learning_rate": 1.2587032236160516e-06, + "loss": 0.6758, + "step": 50823 + }, + { + "epoch": 1.3, + "learning_rate": 1.2586764950524463e-06, + "loss": 0.5283, + "step": 50824 + }, + { + "epoch": 1.3, + "learning_rate": 1.2586497662907843e-06, + "loss": 0.7314, + "step": 50825 + }, + { + "epoch": 1.3, + "learning_rate": 1.2586230373310858e-06, + "loss": 0.7812, + "step": 50826 + }, + { + "epoch": 1.3, + "learning_rate": 1.2585963081733714e-06, + "loss": 0.6143, + "step": 50827 + }, + { + "epoch": 1.3, + "learning_rate": 1.2585695788176622e-06, + "loss": 0.6626, + "step": 50828 + }, + { + "epoch": 1.3, + "learning_rate": 1.2585428492639778e-06, + "loss": 0.5752, + "step": 50829 + }, + { + "epoch": 1.3, + "learning_rate": 1.2585161195123396e-06, + "loss": 0.6064, + "step": 50830 + }, + { + "epoch": 1.3, + "learning_rate": 1.2584893895627668e-06, + "loss": 0.6484, + "step": 50831 + }, + { + "epoch": 1.3, + "learning_rate": 1.2584626594152806e-06, + "loss": 0.6284, + "step": 50832 + }, + { + "epoch": 1.3, + "learning_rate": 1.258435929069902e-06, + "loss": 0.707, + "step": 50833 + }, + { + "epoch": 1.3, + "learning_rate": 1.2584091985266504e-06, + "loss": 0.7451, + "step": 50834 + }, + { + "epoch": 1.3, + "learning_rate": 1.2583824677855467e-06, + "loss": 0.8379, + "step": 50835 + }, + { + "epoch": 1.3, + "learning_rate": 1.258355736846612e-06, + "loss": 0.5146, + "step": 50836 + }, + { + "epoch": 1.3, + "learning_rate": 1.2583290057098657e-06, + "loss": 0.71, + "step": 50837 + }, + { + "epoch": 1.3, + "learning_rate": 1.2583022743753289e-06, + "loss": 0.5288, + "step": 50838 + }, + { + "epoch": 1.3, + "learning_rate": 1.2582755428430217e-06, + "loss": 0.6465, + "step": 50839 + }, + { + "epoch": 1.3, + "learning_rate": 1.258248811112965e-06, + "loss": 0.54, + "step": 50840 + }, + { + "epoch": 1.3, + "learning_rate": 1.2582220791851792e-06, + "loss": 0.5947, + "step": 50841 + }, + { + "epoch": 1.3, + "learning_rate": 1.2581953470596843e-06, + "loss": 0.7144, + "step": 50842 + }, + { + "epoch": 1.3, + "learning_rate": 1.2581686147365014e-06, + "loss": 0.667, + "step": 50843 + }, + { + "epoch": 1.3, + "learning_rate": 1.2581418822156505e-06, + "loss": 0.7295, + "step": 50844 + }, + { + "epoch": 1.3, + "learning_rate": 1.2581151494971525e-06, + "loss": 0.7344, + "step": 50845 + }, + { + "epoch": 1.3, + "learning_rate": 1.258088416581027e-06, + "loss": 0.627, + "step": 50846 + }, + { + "epoch": 1.3, + "learning_rate": 1.2580616834672957e-06, + "loss": 0.6943, + "step": 50847 + }, + { + "epoch": 1.3, + "learning_rate": 1.258034950155978e-06, + "loss": 0.8076, + "step": 50848 + }, + { + "epoch": 1.3, + "learning_rate": 1.2580082166470949e-06, + "loss": 0.6602, + "step": 50849 + }, + { + "epoch": 1.3, + "learning_rate": 1.257981482940667e-06, + "loss": 0.5625, + "step": 50850 + }, + { + "epoch": 1.3, + "learning_rate": 1.2579547490367144e-06, + "loss": 0.8555, + "step": 50851 + }, + { + "epoch": 1.3, + "learning_rate": 1.2579280149352576e-06, + "loss": 0.5483, + "step": 50852 + }, + { + "epoch": 1.3, + "learning_rate": 1.2579012806363172e-06, + "loss": 0.8086, + "step": 50853 + }, + { + "epoch": 1.3, + "learning_rate": 1.2578745461399136e-06, + "loss": 0.5698, + "step": 50854 + }, + { + "epoch": 1.3, + "learning_rate": 1.2578478114460678e-06, + "loss": 0.7725, + "step": 50855 + }, + { + "epoch": 1.3, + "learning_rate": 1.2578210765547992e-06, + "loss": 0.533, + "step": 50856 + }, + { + "epoch": 1.3, + "learning_rate": 1.2577943414661292e-06, + "loss": 0.5801, + "step": 50857 + }, + { + "epoch": 1.3, + "learning_rate": 1.2577676061800778e-06, + "loss": 0.8379, + "step": 50858 + }, + { + "epoch": 1.3, + "learning_rate": 1.2577408706966654e-06, + "loss": 0.6133, + "step": 50859 + }, + { + "epoch": 1.3, + "learning_rate": 1.257714135015913e-06, + "loss": 0.6978, + "step": 50860 + }, + { + "epoch": 1.3, + "learning_rate": 1.2576873991378408e-06, + "loss": 0.7607, + "step": 50861 + }, + { + "epoch": 1.3, + "learning_rate": 1.2576606630624689e-06, + "loss": 0.5496, + "step": 50862 + }, + { + "epoch": 1.3, + "learning_rate": 1.257633926789818e-06, + "loss": 0.5898, + "step": 50863 + }, + { + "epoch": 1.3, + "learning_rate": 1.2576071903199087e-06, + "loss": 0.6486, + "step": 50864 + }, + { + "epoch": 1.3, + "learning_rate": 1.2575804536527619e-06, + "loss": 0.6768, + "step": 50865 + }, + { + "epoch": 1.3, + "learning_rate": 1.2575537167883972e-06, + "loss": 0.6382, + "step": 50866 + }, + { + "epoch": 1.3, + "learning_rate": 1.2575269797268353e-06, + "loss": 0.6201, + "step": 50867 + }, + { + "epoch": 1.3, + "learning_rate": 1.2575002424680971e-06, + "loss": 0.6797, + "step": 50868 + }, + { + "epoch": 1.3, + "learning_rate": 1.2574735050122027e-06, + "loss": 0.5925, + "step": 50869 + }, + { + "epoch": 1.3, + "learning_rate": 1.2574467673591728e-06, + "loss": 0.543, + "step": 50870 + }, + { + "epoch": 1.3, + "learning_rate": 1.2574200295090278e-06, + "loss": 0.6631, + "step": 50871 + }, + { + "epoch": 1.3, + "learning_rate": 1.257393291461788e-06, + "loss": 0.6665, + "step": 50872 + }, + { + "epoch": 1.3, + "learning_rate": 1.2573665532174737e-06, + "loss": 0.5552, + "step": 50873 + }, + { + "epoch": 1.3, + "learning_rate": 1.257339814776106e-06, + "loss": 0.5508, + "step": 50874 + }, + { + "epoch": 1.3, + "learning_rate": 1.2573130761377053e-06, + "loss": 0.7363, + "step": 50875 + }, + { + "epoch": 1.3, + "learning_rate": 1.2572863373022916e-06, + "loss": 0.8516, + "step": 50876 + }, + { + "epoch": 1.3, + "learning_rate": 1.2572595982698852e-06, + "loss": 0.7427, + "step": 50877 + }, + { + "epoch": 1.3, + "learning_rate": 1.2572328590405073e-06, + "loss": 0.6553, + "step": 50878 + }, + { + "epoch": 1.3, + "learning_rate": 1.2572061196141777e-06, + "loss": 0.5015, + "step": 50879 + }, + { + "epoch": 1.3, + "learning_rate": 1.2571793799909179e-06, + "loss": 0.6001, + "step": 50880 + }, + { + "epoch": 1.3, + "learning_rate": 1.257152640170747e-06, + "loss": 0.5664, + "step": 50881 + }, + { + "epoch": 1.3, + "learning_rate": 1.2571259001536864e-06, + "loss": 0.4287, + "step": 50882 + }, + { + "epoch": 1.3, + "learning_rate": 1.2570991599397562e-06, + "loss": 0.5984, + "step": 50883 + }, + { + "epoch": 1.3, + "learning_rate": 1.2570724195289772e-06, + "loss": 0.5229, + "step": 50884 + }, + { + "epoch": 1.3, + "learning_rate": 1.2570456789213697e-06, + "loss": 0.584, + "step": 50885 + }, + { + "epoch": 1.3, + "learning_rate": 1.2570189381169537e-06, + "loss": 0.6909, + "step": 50886 + }, + { + "epoch": 1.3, + "learning_rate": 1.2569921971157506e-06, + "loss": 0.708, + "step": 50887 + }, + { + "epoch": 1.3, + "learning_rate": 1.25696545591778e-06, + "loss": 0.6929, + "step": 50888 + }, + { + "epoch": 1.3, + "learning_rate": 1.2569387145230632e-06, + "loss": 0.6694, + "step": 50889 + }, + { + "epoch": 1.3, + "learning_rate": 1.25691197293162e-06, + "loss": 0.4186, + "step": 50890 + }, + { + "epoch": 1.3, + "learning_rate": 1.2568852311434712e-06, + "loss": 0.4822, + "step": 50891 + }, + { + "epoch": 1.3, + "learning_rate": 1.2568584891586368e-06, + "loss": 0.6602, + "step": 50892 + }, + { + "epoch": 1.3, + "learning_rate": 1.2568317469771384e-06, + "loss": 0.644, + "step": 50893 + }, + { + "epoch": 1.3, + "learning_rate": 1.2568050045989951e-06, + "loss": 0.5615, + "step": 50894 + }, + { + "epoch": 1.3, + "learning_rate": 1.2567782620242284e-06, + "loss": 0.915, + "step": 50895 + }, + { + "epoch": 1.3, + "learning_rate": 1.2567515192528582e-06, + "loss": 0.564, + "step": 50896 + }, + { + "epoch": 1.3, + "learning_rate": 1.2567247762849053e-06, + "loss": 0.4686, + "step": 50897 + }, + { + "epoch": 1.3, + "learning_rate": 1.2566980331203898e-06, + "loss": 0.7988, + "step": 50898 + }, + { + "epoch": 1.3, + "learning_rate": 1.2566712897593325e-06, + "loss": 0.6318, + "step": 50899 + }, + { + "epoch": 1.3, + "learning_rate": 1.2566445462017541e-06, + "loss": 0.365, + "step": 50900 + }, + { + "epoch": 1.3, + "learning_rate": 1.2566178024476747e-06, + "loss": 0.6777, + "step": 50901 + }, + { + "epoch": 1.3, + "learning_rate": 1.2565910584971145e-06, + "loss": 0.6465, + "step": 50902 + }, + { + "epoch": 1.3, + "learning_rate": 1.2565643143500945e-06, + "loss": 0.7568, + "step": 50903 + }, + { + "epoch": 1.3, + "learning_rate": 1.2565375700066349e-06, + "loss": 0.5383, + "step": 50904 + }, + { + "epoch": 1.3, + "learning_rate": 1.2565108254667564e-06, + "loss": 0.5977, + "step": 50905 + }, + { + "epoch": 1.3, + "learning_rate": 1.2564840807304795e-06, + "loss": 0.6587, + "step": 50906 + }, + { + "epoch": 1.3, + "learning_rate": 1.2564573357978242e-06, + "loss": 0.6943, + "step": 50907 + }, + { + "epoch": 1.3, + "learning_rate": 1.2564305906688114e-06, + "loss": 0.6333, + "step": 50908 + }, + { + "epoch": 1.3, + "learning_rate": 1.2564038453434617e-06, + "loss": 0.7012, + "step": 50909 + }, + { + "epoch": 1.3, + "learning_rate": 1.2563770998217954e-06, + "loss": 0.7017, + "step": 50910 + }, + { + "epoch": 1.3, + "learning_rate": 1.2563503541038328e-06, + "loss": 0.6152, + "step": 50911 + }, + { + "epoch": 1.3, + "learning_rate": 1.2563236081895946e-06, + "loss": 0.7222, + "step": 50912 + }, + { + "epoch": 1.3, + "learning_rate": 1.2562968620791008e-06, + "loss": 0.6626, + "step": 50913 + }, + { + "epoch": 1.3, + "learning_rate": 1.2562701157723728e-06, + "loss": 0.6201, + "step": 50914 + }, + { + "epoch": 1.3, + "learning_rate": 1.2562433692694304e-06, + "loss": 0.7363, + "step": 50915 + }, + { + "epoch": 1.31, + "learning_rate": 1.2562166225702942e-06, + "loss": 0.5227, + "step": 50916 + }, + { + "epoch": 1.31, + "learning_rate": 1.2561898756749844e-06, + "loss": 0.6072, + "step": 50917 + }, + { + "epoch": 1.31, + "learning_rate": 1.2561631285835223e-06, + "loss": 0.4697, + "step": 50918 + }, + { + "epoch": 1.31, + "learning_rate": 1.2561363812959273e-06, + "loss": 0.6455, + "step": 50919 + }, + { + "epoch": 1.31, + "learning_rate": 1.2561096338122212e-06, + "loss": 0.6533, + "step": 50920 + }, + { + "epoch": 1.31, + "learning_rate": 1.2560828861324231e-06, + "loss": 0.6797, + "step": 50921 + }, + { + "epoch": 1.31, + "learning_rate": 1.2560561382565547e-06, + "loss": 0.7061, + "step": 50922 + }, + { + "epoch": 1.31, + "learning_rate": 1.2560293901846352e-06, + "loss": 0.7695, + "step": 50923 + }, + { + "epoch": 1.31, + "learning_rate": 1.2560026419166862e-06, + "loss": 0.5615, + "step": 50924 + }, + { + "epoch": 1.31, + "learning_rate": 1.2559758934527275e-06, + "loss": 0.6553, + "step": 50925 + }, + { + "epoch": 1.31, + "learning_rate": 1.2559491447927802e-06, + "loss": 0.4731, + "step": 50926 + }, + { + "epoch": 1.31, + "learning_rate": 1.2559223959368641e-06, + "loss": 0.6387, + "step": 50927 + }, + { + "epoch": 1.31, + "learning_rate": 1.2558956468850001e-06, + "loss": 0.6382, + "step": 50928 + }, + { + "epoch": 1.31, + "learning_rate": 1.2558688976372085e-06, + "loss": 0.6631, + "step": 50929 + }, + { + "epoch": 1.31, + "learning_rate": 1.2558421481935099e-06, + "loss": 0.7695, + "step": 50930 + }, + { + "epoch": 1.31, + "learning_rate": 1.2558153985539249e-06, + "loss": 0.6826, + "step": 50931 + }, + { + "epoch": 1.31, + "learning_rate": 1.2557886487184735e-06, + "loss": 0.6582, + "step": 50932 + }, + { + "epoch": 1.31, + "learning_rate": 1.2557618986871766e-06, + "loss": 0.6284, + "step": 50933 + }, + { + "epoch": 1.31, + "learning_rate": 1.2557351484600546e-06, + "loss": 0.4844, + "step": 50934 + }, + { + "epoch": 1.31, + "learning_rate": 1.255708398037128e-06, + "loss": 0.538, + "step": 50935 + }, + { + "epoch": 1.31, + "learning_rate": 1.255681647418417e-06, + "loss": 0.6992, + "step": 50936 + }, + { + "epoch": 1.31, + "learning_rate": 1.255654896603943e-06, + "loss": 0.5034, + "step": 50937 + }, + { + "epoch": 1.31, + "learning_rate": 1.255628145593725e-06, + "loss": 0.7598, + "step": 50938 + }, + { + "epoch": 1.31, + "learning_rate": 1.2556013943877845e-06, + "loss": 0.7139, + "step": 50939 + }, + { + "epoch": 1.31, + "learning_rate": 1.255574642986142e-06, + "loss": 0.5381, + "step": 50940 + }, + { + "epoch": 1.31, + "learning_rate": 1.2555478913888178e-06, + "loss": 0.6567, + "step": 50941 + }, + { + "epoch": 1.31, + "learning_rate": 1.2555211395958318e-06, + "loss": 0.7012, + "step": 50942 + }, + { + "epoch": 1.31, + "learning_rate": 1.2554943876072055e-06, + "loss": 0.7266, + "step": 50943 + }, + { + "epoch": 1.31, + "learning_rate": 1.2554676354229586e-06, + "loss": 0.5962, + "step": 50944 + }, + { + "epoch": 1.31, + "learning_rate": 1.2554408830431125e-06, + "loss": 0.5359, + "step": 50945 + }, + { + "epoch": 1.31, + "learning_rate": 1.2554141304676864e-06, + "loss": 0.5752, + "step": 50946 + }, + { + "epoch": 1.31, + "learning_rate": 1.2553873776967017e-06, + "loss": 0.5901, + "step": 50947 + }, + { + "epoch": 1.31, + "learning_rate": 1.2553606247301782e-06, + "loss": 0.7139, + "step": 50948 + }, + { + "epoch": 1.31, + "learning_rate": 1.2553338715681374e-06, + "loss": 0.5391, + "step": 50949 + }, + { + "epoch": 1.31, + "learning_rate": 1.255307118210599e-06, + "loss": 0.6685, + "step": 50950 + }, + { + "epoch": 1.31, + "learning_rate": 1.2552803646575839e-06, + "loss": 0.4702, + "step": 50951 + }, + { + "epoch": 1.31, + "learning_rate": 1.255253610909112e-06, + "loss": 0.6104, + "step": 50952 + }, + { + "epoch": 1.31, + "learning_rate": 1.255226856965204e-06, + "loss": 0.4739, + "step": 50953 + }, + { + "epoch": 1.31, + "learning_rate": 1.2552001028258806e-06, + "loss": 0.708, + "step": 50954 + }, + { + "epoch": 1.31, + "learning_rate": 1.2551733484911626e-06, + "loss": 0.7373, + "step": 50955 + }, + { + "epoch": 1.31, + "learning_rate": 1.2551465939610698e-06, + "loss": 0.6641, + "step": 50956 + }, + { + "epoch": 1.31, + "learning_rate": 1.2551198392356233e-06, + "loss": 0.6304, + "step": 50957 + }, + { + "epoch": 1.31, + "learning_rate": 1.2550930843148432e-06, + "loss": 0.6904, + "step": 50958 + }, + { + "epoch": 1.31, + "learning_rate": 1.2550663291987495e-06, + "loss": 0.7383, + "step": 50959 + }, + { + "epoch": 1.31, + "learning_rate": 1.2550395738873641e-06, + "loss": 0.6963, + "step": 50960 + }, + { + "epoch": 1.31, + "learning_rate": 1.2550128183807061e-06, + "loss": 0.6123, + "step": 50961 + }, + { + "epoch": 1.31, + "learning_rate": 1.2549860626787964e-06, + "loss": 0.6777, + "step": 50962 + }, + { + "epoch": 1.31, + "learning_rate": 1.2549593067816558e-06, + "loss": 0.7676, + "step": 50963 + }, + { + "epoch": 1.31, + "learning_rate": 1.2549325506893046e-06, + "loss": 0.8955, + "step": 50964 + }, + { + "epoch": 1.31, + "learning_rate": 1.2549057944017633e-06, + "loss": 0.6348, + "step": 50965 + }, + { + "epoch": 1.31, + "learning_rate": 1.2548790379190523e-06, + "loss": 0.6357, + "step": 50966 + }, + { + "epoch": 1.31, + "learning_rate": 1.254852281241192e-06, + "loss": 0.668, + "step": 50967 + }, + { + "epoch": 1.31, + "learning_rate": 1.2548255243682034e-06, + "loss": 0.6328, + "step": 50968 + }, + { + "epoch": 1.31, + "learning_rate": 1.2547987673001064e-06, + "loss": 0.604, + "step": 50969 + }, + { + "epoch": 1.31, + "learning_rate": 1.2547720100369217e-06, + "loss": 0.6689, + "step": 50970 + }, + { + "epoch": 1.31, + "learning_rate": 1.2547452525786697e-06, + "loss": 0.7412, + "step": 50971 + }, + { + "epoch": 1.31, + "learning_rate": 1.254718494925371e-06, + "loss": 0.665, + "step": 50972 + }, + { + "epoch": 1.31, + "learning_rate": 1.254691737077046e-06, + "loss": 0.8184, + "step": 50973 + }, + { + "epoch": 1.31, + "learning_rate": 1.2546649790337155e-06, + "loss": 0.8271, + "step": 50974 + }, + { + "epoch": 1.31, + "learning_rate": 1.2546382207953997e-06, + "loss": 0.5869, + "step": 50975 + }, + { + "epoch": 1.31, + "learning_rate": 1.2546114623621188e-06, + "loss": 0.5996, + "step": 50976 + }, + { + "epoch": 1.31, + "learning_rate": 1.2545847037338936e-06, + "loss": 0.7007, + "step": 50977 + }, + { + "epoch": 1.31, + "learning_rate": 1.2545579449107448e-06, + "loss": 0.583, + "step": 50978 + }, + { + "epoch": 1.31, + "learning_rate": 1.254531185892693e-06, + "loss": 0.7461, + "step": 50979 + }, + { + "epoch": 1.31, + "learning_rate": 1.254504426679758e-06, + "loss": 0.7754, + "step": 50980 + }, + { + "epoch": 1.31, + "learning_rate": 1.2544776672719609e-06, + "loss": 0.8428, + "step": 50981 + }, + { + "epoch": 1.31, + "learning_rate": 1.2544509076693215e-06, + "loss": 0.7568, + "step": 50982 + }, + { + "epoch": 1.31, + "learning_rate": 1.2544241478718612e-06, + "loss": 0.7402, + "step": 50983 + }, + { + "epoch": 1.31, + "learning_rate": 1.2543973878795996e-06, + "loss": 0.5547, + "step": 50984 + }, + { + "epoch": 1.31, + "learning_rate": 1.2543706276925581e-06, + "loss": 0.7295, + "step": 50985 + }, + { + "epoch": 1.31, + "learning_rate": 1.2543438673107565e-06, + "loss": 0.7979, + "step": 50986 + }, + { + "epoch": 1.31, + "learning_rate": 1.2543171067342154e-06, + "loss": 0.646, + "step": 50987 + }, + { + "epoch": 1.31, + "learning_rate": 1.2542903459629551e-06, + "loss": 0.7539, + "step": 50988 + }, + { + "epoch": 1.31, + "learning_rate": 1.2542635849969972e-06, + "loss": 0.6257, + "step": 50989 + }, + { + "epoch": 1.31, + "learning_rate": 1.2542368238363608e-06, + "loss": 0.8135, + "step": 50990 + }, + { + "epoch": 1.31, + "learning_rate": 1.254210062481067e-06, + "loss": 0.6729, + "step": 50991 + }, + { + "epoch": 1.31, + "learning_rate": 1.2541833009311363e-06, + "loss": 0.6943, + "step": 50992 + }, + { + "epoch": 1.31, + "learning_rate": 1.254156539186589e-06, + "loss": 0.7646, + "step": 50993 + }, + { + "epoch": 1.31, + "learning_rate": 1.2541297772474462e-06, + "loss": 0.6641, + "step": 50994 + }, + { + "epoch": 1.31, + "learning_rate": 1.2541030151137273e-06, + "loss": 0.5991, + "step": 50995 + }, + { + "epoch": 1.31, + "learning_rate": 1.2540762527854539e-06, + "loss": 0.5466, + "step": 50996 + }, + { + "epoch": 1.31, + "learning_rate": 1.2540494902626458e-06, + "loss": 0.6289, + "step": 50997 + }, + { + "epoch": 1.31, + "learning_rate": 1.2540227275453234e-06, + "loss": 0.6592, + "step": 50998 + }, + { + "epoch": 1.31, + "learning_rate": 1.253995964633508e-06, + "loss": 0.7275, + "step": 50999 + }, + { + "epoch": 1.31, + "learning_rate": 1.253969201527219e-06, + "loss": 0.4639, + "step": 51000 + }, + { + "epoch": 1.31, + "learning_rate": 1.2539424382264777e-06, + "loss": 0.7148, + "step": 51001 + }, + { + "epoch": 1.31, + "learning_rate": 1.2539156747313046e-06, + "loss": 0.6873, + "step": 51002 + }, + { + "epoch": 1.31, + "learning_rate": 1.2538889110417196e-06, + "loss": 0.5999, + "step": 51003 + }, + { + "epoch": 1.31, + "learning_rate": 1.253862147157744e-06, + "loss": 0.5867, + "step": 51004 + }, + { + "epoch": 1.31, + "learning_rate": 1.2538353830793974e-06, + "loss": 0.6572, + "step": 51005 + }, + { + "epoch": 1.31, + "learning_rate": 1.2538086188067007e-06, + "loss": 0.709, + "step": 51006 + }, + { + "epoch": 1.31, + "learning_rate": 1.2537818543396746e-06, + "loss": 0.7598, + "step": 51007 + }, + { + "epoch": 1.31, + "learning_rate": 1.2537550896783393e-06, + "loss": 0.6016, + "step": 51008 + }, + { + "epoch": 1.31, + "learning_rate": 1.2537283248227155e-06, + "loss": 0.7676, + "step": 51009 + }, + { + "epoch": 1.31, + "learning_rate": 1.2537015597728238e-06, + "loss": 0.5947, + "step": 51010 + }, + { + "epoch": 1.31, + "learning_rate": 1.2536747945286839e-06, + "loss": 0.4133, + "step": 51011 + }, + { + "epoch": 1.31, + "learning_rate": 1.2536480290903172e-06, + "loss": 0.605, + "step": 51012 + }, + { + "epoch": 1.31, + "learning_rate": 1.253621263457744e-06, + "loss": 0.7246, + "step": 51013 + }, + { + "epoch": 1.31, + "learning_rate": 1.2535944976309847e-06, + "loss": 0.5793, + "step": 51014 + }, + { + "epoch": 1.31, + "learning_rate": 1.2535677316100595e-06, + "loss": 0.6592, + "step": 51015 + }, + { + "epoch": 1.31, + "learning_rate": 1.2535409653949892e-06, + "loss": 0.752, + "step": 51016 + }, + { + "epoch": 1.31, + "learning_rate": 1.253514198985794e-06, + "loss": 0.3582, + "step": 51017 + }, + { + "epoch": 1.31, + "learning_rate": 1.2534874323824952e-06, + "loss": 0.6396, + "step": 51018 + }, + { + "epoch": 1.31, + "learning_rate": 1.2534606655851122e-06, + "loss": 0.6934, + "step": 51019 + }, + { + "epoch": 1.31, + "learning_rate": 1.2534338985936664e-06, + "loss": 0.5317, + "step": 51020 + }, + { + "epoch": 1.31, + "learning_rate": 1.2534071314081778e-06, + "loss": 0.6157, + "step": 51021 + }, + { + "epoch": 1.31, + "learning_rate": 1.2533803640286666e-06, + "loss": 0.6689, + "step": 51022 + }, + { + "epoch": 1.31, + "learning_rate": 1.2533535964551542e-06, + "loss": 0.52, + "step": 51023 + }, + { + "epoch": 1.31, + "learning_rate": 1.2533268286876606e-06, + "loss": 0.7039, + "step": 51024 + }, + { + "epoch": 1.31, + "learning_rate": 1.2533000607262064e-06, + "loss": 0.8018, + "step": 51025 + }, + { + "epoch": 1.31, + "learning_rate": 1.2532732925708115e-06, + "loss": 0.7324, + "step": 51026 + }, + { + "epoch": 1.31, + "learning_rate": 1.2532465242214971e-06, + "loss": 0.5781, + "step": 51027 + }, + { + "epoch": 1.31, + "learning_rate": 1.2532197556782836e-06, + "loss": 0.8125, + "step": 51028 + }, + { + "epoch": 1.31, + "learning_rate": 1.2531929869411916e-06, + "loss": 0.7891, + "step": 51029 + }, + { + "epoch": 1.31, + "learning_rate": 1.2531662180102408e-06, + "loss": 0.7861, + "step": 51030 + }, + { + "epoch": 1.31, + "learning_rate": 1.2531394488854527e-06, + "loss": 0.5791, + "step": 51031 + }, + { + "epoch": 1.31, + "learning_rate": 1.253112679566847e-06, + "loss": 0.6709, + "step": 51032 + }, + { + "epoch": 1.31, + "learning_rate": 1.2530859100544448e-06, + "loss": 0.6182, + "step": 51033 + }, + { + "epoch": 1.31, + "learning_rate": 1.2530591403482666e-06, + "loss": 0.6211, + "step": 51034 + }, + { + "epoch": 1.31, + "learning_rate": 1.2530323704483322e-06, + "loss": 0.6367, + "step": 51035 + }, + { + "epoch": 1.31, + "learning_rate": 1.2530056003546627e-06, + "loss": 0.4634, + "step": 51036 + }, + { + "epoch": 1.31, + "learning_rate": 1.2529788300672785e-06, + "loss": 0.8945, + "step": 51037 + }, + { + "epoch": 1.31, + "learning_rate": 1.2529520595862e-06, + "loss": 0.6631, + "step": 51038 + }, + { + "epoch": 1.31, + "learning_rate": 1.2529252889114478e-06, + "loss": 0.5938, + "step": 51039 + }, + { + "epoch": 1.31, + "learning_rate": 1.2528985180430422e-06, + "loss": 0.7292, + "step": 51040 + }, + { + "epoch": 1.31, + "learning_rate": 1.2528717469810042e-06, + "loss": 0.5214, + "step": 51041 + }, + { + "epoch": 1.31, + "learning_rate": 1.2528449757253534e-06, + "loss": 0.7686, + "step": 51042 + }, + { + "epoch": 1.31, + "learning_rate": 1.2528182042761112e-06, + "loss": 0.6431, + "step": 51043 + }, + { + "epoch": 1.31, + "learning_rate": 1.2527914326332979e-06, + "loss": 0.4917, + "step": 51044 + }, + { + "epoch": 1.31, + "learning_rate": 1.252764660796933e-06, + "loss": 0.605, + "step": 51045 + }, + { + "epoch": 1.31, + "learning_rate": 1.2527378887670388e-06, + "loss": 0.6763, + "step": 51046 + }, + { + "epoch": 1.31, + "learning_rate": 1.2527111165436342e-06, + "loss": 0.4868, + "step": 51047 + }, + { + "epoch": 1.31, + "learning_rate": 1.2526843441267405e-06, + "loss": 0.34, + "step": 51048 + }, + { + "epoch": 1.31, + "learning_rate": 1.252657571516378e-06, + "loss": 0.5769, + "step": 51049 + }, + { + "epoch": 1.31, + "learning_rate": 1.2526307987125673e-06, + "loss": 0.7207, + "step": 51050 + }, + { + "epoch": 1.31, + "learning_rate": 1.2526040257153288e-06, + "loss": 0.6357, + "step": 51051 + }, + { + "epoch": 1.31, + "learning_rate": 1.2525772525246829e-06, + "loss": 0.7148, + "step": 51052 + }, + { + "epoch": 1.31, + "learning_rate": 1.25255047914065e-06, + "loss": 0.8545, + "step": 51053 + }, + { + "epoch": 1.31, + "learning_rate": 1.2525237055632513e-06, + "loss": 0.6406, + "step": 51054 + }, + { + "epoch": 1.31, + "learning_rate": 1.2524969317925065e-06, + "loss": 0.5552, + "step": 51055 + }, + { + "epoch": 1.31, + "learning_rate": 1.2524701578284367e-06, + "loss": 0.6592, + "step": 51056 + }, + { + "epoch": 1.31, + "learning_rate": 1.2524433836710616e-06, + "loss": 0.6982, + "step": 51057 + }, + { + "epoch": 1.31, + "learning_rate": 1.2524166093204028e-06, + "loss": 0.6826, + "step": 51058 + }, + { + "epoch": 1.31, + "learning_rate": 1.2523898347764798e-06, + "loss": 0.79, + "step": 51059 + }, + { + "epoch": 1.31, + "learning_rate": 1.2523630600393139e-06, + "loss": 0.6182, + "step": 51060 + }, + { + "epoch": 1.31, + "learning_rate": 1.2523362851089247e-06, + "loss": 0.6431, + "step": 51061 + }, + { + "epoch": 1.31, + "learning_rate": 1.2523095099853337e-06, + "loss": 0.7002, + "step": 51062 + }, + { + "epoch": 1.31, + "learning_rate": 1.2522827346685603e-06, + "loss": 0.626, + "step": 51063 + }, + { + "epoch": 1.31, + "learning_rate": 1.252255959158626e-06, + "loss": 0.3822, + "step": 51064 + }, + { + "epoch": 1.31, + "learning_rate": 1.252229183455551e-06, + "loss": 0.6431, + "step": 51065 + }, + { + "epoch": 1.31, + "learning_rate": 1.2522024075593556e-06, + "loss": 0.6338, + "step": 51066 + }, + { + "epoch": 1.31, + "learning_rate": 1.2521756314700604e-06, + "loss": 0.6104, + "step": 51067 + }, + { + "epoch": 1.31, + "learning_rate": 1.2521488551876857e-06, + "loss": 0.7539, + "step": 51068 + }, + { + "epoch": 1.31, + "learning_rate": 1.2521220787122525e-06, + "loss": 0.6665, + "step": 51069 + }, + { + "epoch": 1.31, + "learning_rate": 1.252095302043781e-06, + "loss": 0.7036, + "step": 51070 + }, + { + "epoch": 1.31, + "learning_rate": 1.2520685251822918e-06, + "loss": 0.5215, + "step": 51071 + }, + { + "epoch": 1.31, + "learning_rate": 1.252041748127805e-06, + "loss": 0.5435, + "step": 51072 + }, + { + "epoch": 1.31, + "learning_rate": 1.2520149708803418e-06, + "loss": 0.8154, + "step": 51073 + }, + { + "epoch": 1.31, + "learning_rate": 1.2519881934399221e-06, + "loss": 0.6904, + "step": 51074 + }, + { + "epoch": 1.31, + "learning_rate": 1.2519614158065667e-06, + "loss": 0.562, + "step": 51075 + }, + { + "epoch": 1.31, + "learning_rate": 1.251934637980296e-06, + "loss": 0.7246, + "step": 51076 + }, + { + "epoch": 1.31, + "learning_rate": 1.2519078599611307e-06, + "loss": 0.3274, + "step": 51077 + }, + { + "epoch": 1.31, + "learning_rate": 1.2518810817490906e-06, + "loss": 0.7217, + "step": 51078 + }, + { + "epoch": 1.31, + "learning_rate": 1.2518543033441975e-06, + "loss": 0.7539, + "step": 51079 + }, + { + "epoch": 1.31, + "learning_rate": 1.2518275247464704e-06, + "loss": 0.5037, + "step": 51080 + }, + { + "epoch": 1.31, + "learning_rate": 1.251800745955931e-06, + "loss": 0.5776, + "step": 51081 + }, + { + "epoch": 1.31, + "learning_rate": 1.2517739669725993e-06, + "loss": 0.6001, + "step": 51082 + }, + { + "epoch": 1.31, + "learning_rate": 1.2517471877964956e-06, + "loss": 0.623, + "step": 51083 + }, + { + "epoch": 1.31, + "learning_rate": 1.2517204084276412e-06, + "loss": 0.748, + "step": 51084 + }, + { + "epoch": 1.31, + "learning_rate": 1.2516936288660554e-06, + "loss": 0.6992, + "step": 51085 + }, + { + "epoch": 1.31, + "learning_rate": 1.2516668491117596e-06, + "loss": 0.5522, + "step": 51086 + }, + { + "epoch": 1.31, + "learning_rate": 1.2516400691647744e-06, + "loss": 0.5835, + "step": 51087 + }, + { + "epoch": 1.31, + "learning_rate": 1.2516132890251194e-06, + "loss": 0.6411, + "step": 51088 + }, + { + "epoch": 1.31, + "learning_rate": 1.2515865086928162e-06, + "loss": 0.626, + "step": 51089 + }, + { + "epoch": 1.31, + "learning_rate": 1.2515597281678845e-06, + "loss": 0.6699, + "step": 51090 + }, + { + "epoch": 1.31, + "learning_rate": 1.251532947450345e-06, + "loss": 0.7012, + "step": 51091 + }, + { + "epoch": 1.31, + "learning_rate": 1.2515061665402185e-06, + "loss": 0.7793, + "step": 51092 + }, + { + "epoch": 1.31, + "learning_rate": 1.251479385437525e-06, + "loss": 0.6514, + "step": 51093 + }, + { + "epoch": 1.31, + "learning_rate": 1.2514526041422859e-06, + "loss": 0.7441, + "step": 51094 + }, + { + "epoch": 1.31, + "learning_rate": 1.2514258226545204e-06, + "loss": 0.7017, + "step": 51095 + }, + { + "epoch": 1.31, + "learning_rate": 1.25139904097425e-06, + "loss": 0.7617, + "step": 51096 + }, + { + "epoch": 1.31, + "learning_rate": 1.2513722591014947e-06, + "loss": 0.6494, + "step": 51097 + }, + { + "epoch": 1.31, + "learning_rate": 1.2513454770362758e-06, + "loss": 0.7085, + "step": 51098 + }, + { + "epoch": 1.31, + "learning_rate": 1.251318694778613e-06, + "loss": 0.5645, + "step": 51099 + }, + { + "epoch": 1.31, + "learning_rate": 1.251291912328527e-06, + "loss": 0.4541, + "step": 51100 + }, + { + "epoch": 1.31, + "learning_rate": 1.2512651296860378e-06, + "loss": 0.7285, + "step": 51101 + }, + { + "epoch": 1.31, + "learning_rate": 1.251238346851167e-06, + "loss": 0.521, + "step": 51102 + }, + { + "epoch": 1.31, + "learning_rate": 1.2512115638239345e-06, + "loss": 0.6123, + "step": 51103 + }, + { + "epoch": 1.31, + "learning_rate": 1.251184780604361e-06, + "loss": 0.625, + "step": 51104 + }, + { + "epoch": 1.31, + "learning_rate": 1.2511579971924664e-06, + "loss": 0.6797, + "step": 51105 + }, + { + "epoch": 1.31, + "learning_rate": 1.251131213588272e-06, + "loss": 0.7061, + "step": 51106 + }, + { + "epoch": 1.31, + "learning_rate": 1.2511044297917978e-06, + "loss": 0.6885, + "step": 51107 + }, + { + "epoch": 1.31, + "learning_rate": 1.2510776458030648e-06, + "loss": 0.6875, + "step": 51108 + }, + { + "epoch": 1.31, + "learning_rate": 1.2510508616220929e-06, + "loss": 0.6211, + "step": 51109 + }, + { + "epoch": 1.31, + "learning_rate": 1.251024077248903e-06, + "loss": 0.6431, + "step": 51110 + }, + { + "epoch": 1.31, + "learning_rate": 1.2509972926835154e-06, + "loss": 0.668, + "step": 51111 + }, + { + "epoch": 1.31, + "learning_rate": 1.2509705079259508e-06, + "loss": 0.5649, + "step": 51112 + }, + { + "epoch": 1.31, + "learning_rate": 1.2509437229762296e-06, + "loss": 0.603, + "step": 51113 + }, + { + "epoch": 1.31, + "learning_rate": 1.2509169378343724e-06, + "loss": 0.7529, + "step": 51114 + }, + { + "epoch": 1.31, + "learning_rate": 1.2508901525003996e-06, + "loss": 0.6914, + "step": 51115 + }, + { + "epoch": 1.31, + "learning_rate": 1.2508633669743317e-06, + "loss": 0.6982, + "step": 51116 + }, + { + "epoch": 1.31, + "learning_rate": 1.2508365812561893e-06, + "loss": 0.6719, + "step": 51117 + }, + { + "epoch": 1.31, + "learning_rate": 1.2508097953459929e-06, + "loss": 0.6042, + "step": 51118 + }, + { + "epoch": 1.31, + "learning_rate": 1.250783009243763e-06, + "loss": 0.5728, + "step": 51119 + }, + { + "epoch": 1.31, + "learning_rate": 1.2507562229495199e-06, + "loss": 0.6904, + "step": 51120 + }, + { + "epoch": 1.31, + "learning_rate": 1.2507294364632845e-06, + "loss": 0.6992, + "step": 51121 + }, + { + "epoch": 1.31, + "learning_rate": 1.2507026497850769e-06, + "loss": 0.7217, + "step": 51122 + }, + { + "epoch": 1.31, + "learning_rate": 1.2506758629149178e-06, + "loss": 0.6323, + "step": 51123 + }, + { + "epoch": 1.31, + "learning_rate": 1.2506490758528281e-06, + "loss": 0.6729, + "step": 51124 + }, + { + "epoch": 1.31, + "learning_rate": 1.2506222885988278e-06, + "loss": 0.7832, + "step": 51125 + }, + { + "epoch": 1.31, + "learning_rate": 1.250595501152937e-06, + "loss": 0.5483, + "step": 51126 + }, + { + "epoch": 1.31, + "learning_rate": 1.2505687135151771e-06, + "loss": 0.4705, + "step": 51127 + }, + { + "epoch": 1.31, + "learning_rate": 1.2505419256855682e-06, + "loss": 0.7793, + "step": 51128 + }, + { + "epoch": 1.31, + "learning_rate": 1.250515137664131e-06, + "loss": 0.7217, + "step": 51129 + }, + { + "epoch": 1.31, + "learning_rate": 1.2504883494508861e-06, + "loss": 0.5432, + "step": 51130 + }, + { + "epoch": 1.31, + "learning_rate": 1.2504615610458536e-06, + "loss": 0.6895, + "step": 51131 + }, + { + "epoch": 1.31, + "learning_rate": 1.250434772449054e-06, + "loss": 0.6843, + "step": 51132 + }, + { + "epoch": 1.31, + "learning_rate": 1.2504079836605082e-06, + "loss": 0.7705, + "step": 51133 + }, + { + "epoch": 1.31, + "learning_rate": 1.2503811946802366e-06, + "loss": 0.7568, + "step": 51134 + }, + { + "epoch": 1.31, + "learning_rate": 1.2503544055082594e-06, + "loss": 0.7168, + "step": 51135 + }, + { + "epoch": 1.31, + "learning_rate": 1.2503276161445976e-06, + "loss": 0.6001, + "step": 51136 + }, + { + "epoch": 1.31, + "learning_rate": 1.250300826589271e-06, + "loss": 0.5425, + "step": 51137 + }, + { + "epoch": 1.31, + "learning_rate": 1.2502740368423007e-06, + "loss": 0.4839, + "step": 51138 + }, + { + "epoch": 1.31, + "learning_rate": 1.2502472469037075e-06, + "loss": 0.7278, + "step": 51139 + }, + { + "epoch": 1.31, + "learning_rate": 1.2502204567735113e-06, + "loss": 0.7622, + "step": 51140 + }, + { + "epoch": 1.31, + "learning_rate": 1.2501936664517324e-06, + "loss": 0.3378, + "step": 51141 + }, + { + "epoch": 1.31, + "learning_rate": 1.2501668759383924e-06, + "loss": 0.832, + "step": 51142 + }, + { + "epoch": 1.31, + "learning_rate": 1.2501400852335104e-06, + "loss": 0.5518, + "step": 51143 + }, + { + "epoch": 1.31, + "learning_rate": 1.2501132943371082e-06, + "loss": 0.626, + "step": 51144 + }, + { + "epoch": 1.31, + "learning_rate": 1.2500865032492055e-06, + "loss": 0.6895, + "step": 51145 + }, + { + "epoch": 1.31, + "learning_rate": 1.2500597119698233e-06, + "loss": 0.5996, + "step": 51146 + }, + { + "epoch": 1.31, + "learning_rate": 1.2500329204989815e-06, + "loss": 0.425, + "step": 51147 + }, + { + "epoch": 1.31, + "learning_rate": 1.2500061288367011e-06, + "loss": 0.7715, + "step": 51148 + }, + { + "epoch": 1.31, + "learning_rate": 1.2499793369830028e-06, + "loss": 0.624, + "step": 51149 + }, + { + "epoch": 1.31, + "learning_rate": 1.2499525449379068e-06, + "loss": 0.686, + "step": 51150 + }, + { + "epoch": 1.31, + "learning_rate": 1.249925752701433e-06, + "loss": 0.6372, + "step": 51151 + }, + { + "epoch": 1.31, + "learning_rate": 1.2498989602736032e-06, + "loss": 0.6377, + "step": 51152 + }, + { + "epoch": 1.31, + "learning_rate": 1.2498721676544367e-06, + "loss": 0.668, + "step": 51153 + }, + { + "epoch": 1.31, + "learning_rate": 1.2498453748439552e-06, + "loss": 0.7822, + "step": 51154 + }, + { + "epoch": 1.31, + "learning_rate": 1.2498185818421782e-06, + "loss": 0.4944, + "step": 51155 + }, + { + "epoch": 1.31, + "learning_rate": 1.2497917886491266e-06, + "loss": 0.645, + "step": 51156 + }, + { + "epoch": 1.31, + "learning_rate": 1.249764995264821e-06, + "loss": 0.5229, + "step": 51157 + }, + { + "epoch": 1.31, + "learning_rate": 1.2497382016892818e-06, + "loss": 0.7632, + "step": 51158 + }, + { + "epoch": 1.31, + "learning_rate": 1.24971140792253e-06, + "loss": 0.4893, + "step": 51159 + }, + { + "epoch": 1.31, + "learning_rate": 1.2496846139645849e-06, + "loss": 0.6191, + "step": 51160 + }, + { + "epoch": 1.31, + "learning_rate": 1.2496578198154681e-06, + "loss": 0.4551, + "step": 51161 + }, + { + "epoch": 1.31, + "learning_rate": 1.2496310254751997e-06, + "loss": 0.7959, + "step": 51162 + }, + { + "epoch": 1.31, + "learning_rate": 1.2496042309438007e-06, + "loss": 0.6592, + "step": 51163 + }, + { + "epoch": 1.31, + "learning_rate": 1.2495774362212907e-06, + "loss": 0.7539, + "step": 51164 + }, + { + "epoch": 1.31, + "learning_rate": 1.2495506413076911e-06, + "loss": 0.3979, + "step": 51165 + }, + { + "epoch": 1.31, + "learning_rate": 1.2495238462030217e-06, + "loss": 0.5103, + "step": 51166 + }, + { + "epoch": 1.31, + "learning_rate": 1.2494970509073037e-06, + "loss": 0.4592, + "step": 51167 + }, + { + "epoch": 1.31, + "learning_rate": 1.249470255420557e-06, + "loss": 0.8022, + "step": 51168 + }, + { + "epoch": 1.31, + "learning_rate": 1.2494434597428028e-06, + "loss": 0.6277, + "step": 51169 + }, + { + "epoch": 1.31, + "learning_rate": 1.249416663874061e-06, + "loss": 0.5474, + "step": 51170 + }, + { + "epoch": 1.31, + "learning_rate": 1.2493898678143521e-06, + "loss": 0.6611, + "step": 51171 + }, + { + "epoch": 1.31, + "learning_rate": 1.2493630715636969e-06, + "loss": 0.6074, + "step": 51172 + }, + { + "epoch": 1.31, + "learning_rate": 1.2493362751221161e-06, + "loss": 0.4633, + "step": 51173 + }, + { + "epoch": 1.31, + "learning_rate": 1.2493094784896299e-06, + "loss": 0.6152, + "step": 51174 + }, + { + "epoch": 1.31, + "learning_rate": 1.2492826816662588e-06, + "loss": 0.5752, + "step": 51175 + }, + { + "epoch": 1.31, + "learning_rate": 1.2492558846520234e-06, + "loss": 0.4756, + "step": 51176 + }, + { + "epoch": 1.31, + "learning_rate": 1.2492290874469443e-06, + "loss": 0.6045, + "step": 51177 + }, + { + "epoch": 1.31, + "learning_rate": 1.2492022900510419e-06, + "loss": 0.5752, + "step": 51178 + }, + { + "epoch": 1.31, + "learning_rate": 1.249175492464337e-06, + "loss": 0.266, + "step": 51179 + }, + { + "epoch": 1.31, + "learning_rate": 1.2491486946868498e-06, + "loss": 0.7666, + "step": 51180 + }, + { + "epoch": 1.31, + "learning_rate": 1.2491218967186004e-06, + "loss": 0.7314, + "step": 51181 + }, + { + "epoch": 1.31, + "learning_rate": 1.2490950985596104e-06, + "loss": 0.5315, + "step": 51182 + }, + { + "epoch": 1.31, + "learning_rate": 1.2490683002098995e-06, + "loss": 0.7754, + "step": 51183 + }, + { + "epoch": 1.31, + "learning_rate": 1.2490415016694886e-06, + "loss": 0.8027, + "step": 51184 + }, + { + "epoch": 1.31, + "learning_rate": 1.249014702938398e-06, + "loss": 0.6279, + "step": 51185 + }, + { + "epoch": 1.31, + "learning_rate": 1.2489879040166482e-06, + "loss": 0.6084, + "step": 51186 + }, + { + "epoch": 1.31, + "learning_rate": 1.2489611049042597e-06, + "loss": 0.7607, + "step": 51187 + }, + { + "epoch": 1.31, + "learning_rate": 1.2489343056012533e-06, + "loss": 0.7078, + "step": 51188 + }, + { + "epoch": 1.31, + "learning_rate": 1.2489075061076496e-06, + "loss": 0.6724, + "step": 51189 + }, + { + "epoch": 1.31, + "learning_rate": 1.2488807064234685e-06, + "loss": 0.3514, + "step": 51190 + }, + { + "epoch": 1.31, + "learning_rate": 1.248853906548731e-06, + "loss": 0.7705, + "step": 51191 + }, + { + "epoch": 1.31, + "learning_rate": 1.2488271064834575e-06, + "loss": 0.7451, + "step": 51192 + }, + { + "epoch": 1.31, + "learning_rate": 1.2488003062276683e-06, + "loss": 0.5742, + "step": 51193 + }, + { + "epoch": 1.31, + "learning_rate": 1.2487735057813849e-06, + "loss": 0.6592, + "step": 51194 + }, + { + "epoch": 1.31, + "learning_rate": 1.2487467051446263e-06, + "loss": 0.7593, + "step": 51195 + }, + { + "epoch": 1.31, + "learning_rate": 1.2487199043174142e-06, + "loss": 0.5234, + "step": 51196 + }, + { + "epoch": 1.31, + "learning_rate": 1.2486931032997682e-06, + "loss": 0.7051, + "step": 51197 + }, + { + "epoch": 1.31, + "learning_rate": 1.24866630209171e-06, + "loss": 0.7148, + "step": 51198 + }, + { + "epoch": 1.31, + "learning_rate": 1.2486395006932591e-06, + "loss": 0.6113, + "step": 51199 + }, + { + "epoch": 1.31, + "learning_rate": 1.2486126991044362e-06, + "loss": 0.5952, + "step": 51200 + }, + { + "epoch": 1.31, + "learning_rate": 1.2485858973252623e-06, + "loss": 0.7373, + "step": 51201 + }, + { + "epoch": 1.31, + "learning_rate": 1.2485590953557572e-06, + "loss": 0.6914, + "step": 51202 + }, + { + "epoch": 1.31, + "learning_rate": 1.2485322931959424e-06, + "loss": 0.7217, + "step": 51203 + }, + { + "epoch": 1.31, + "learning_rate": 1.2485054908458374e-06, + "loss": 0.6826, + "step": 51204 + }, + { + "epoch": 1.31, + "learning_rate": 1.2484786883054633e-06, + "loss": 0.5371, + "step": 51205 + }, + { + "epoch": 1.31, + "learning_rate": 1.2484518855748407e-06, + "loss": 0.6465, + "step": 51206 + }, + { + "epoch": 1.31, + "learning_rate": 1.2484250826539898e-06, + "loss": 0.6592, + "step": 51207 + }, + { + "epoch": 1.31, + "learning_rate": 1.248398279542931e-06, + "loss": 0.584, + "step": 51208 + }, + { + "epoch": 1.31, + "learning_rate": 1.2483714762416855e-06, + "loss": 0.7861, + "step": 51209 + }, + { + "epoch": 1.31, + "learning_rate": 1.2483446727502728e-06, + "loss": 0.644, + "step": 51210 + }, + { + "epoch": 1.31, + "learning_rate": 1.2483178690687146e-06, + "loss": 0.6016, + "step": 51211 + }, + { + "epoch": 1.31, + "learning_rate": 1.2482910651970305e-06, + "loss": 0.6943, + "step": 51212 + }, + { + "epoch": 1.31, + "learning_rate": 1.2482642611352411e-06, + "loss": 0.5315, + "step": 51213 + }, + { + "epoch": 1.31, + "learning_rate": 1.2482374568833678e-06, + "loss": 0.6205, + "step": 51214 + }, + { + "epoch": 1.31, + "learning_rate": 1.2482106524414302e-06, + "loss": 0.6765, + "step": 51215 + }, + { + "epoch": 1.31, + "learning_rate": 1.2481838478094487e-06, + "loss": 0.4043, + "step": 51216 + }, + { + "epoch": 1.31, + "learning_rate": 1.2481570429874447e-06, + "loss": 0.5939, + "step": 51217 + }, + { + "epoch": 1.31, + "learning_rate": 1.2481302379754381e-06, + "loss": 0.6436, + "step": 51218 + }, + { + "epoch": 1.31, + "learning_rate": 1.2481034327734498e-06, + "loss": 0.7832, + "step": 51219 + }, + { + "epoch": 1.31, + "learning_rate": 1.2480766273815002e-06, + "loss": 0.5859, + "step": 51220 + }, + { + "epoch": 1.31, + "learning_rate": 1.2480498217996096e-06, + "loss": 0.75, + "step": 51221 + }, + { + "epoch": 1.31, + "learning_rate": 1.2480230160277981e-06, + "loss": 0.5251, + "step": 51222 + }, + { + "epoch": 1.31, + "learning_rate": 1.2479962100660874e-06, + "loss": 0.4683, + "step": 51223 + }, + { + "epoch": 1.31, + "learning_rate": 1.2479694039144975e-06, + "loss": 0.6572, + "step": 51224 + }, + { + "epoch": 1.31, + "learning_rate": 1.2479425975730485e-06, + "loss": 0.6299, + "step": 51225 + }, + { + "epoch": 1.31, + "learning_rate": 1.2479157910417612e-06, + "loss": 0.7788, + "step": 51226 + }, + { + "epoch": 1.31, + "learning_rate": 1.2478889843206562e-06, + "loss": 0.752, + "step": 51227 + }, + { + "epoch": 1.31, + "learning_rate": 1.2478621774097542e-06, + "loss": 0.4456, + "step": 51228 + }, + { + "epoch": 1.31, + "learning_rate": 1.2478353703090757e-06, + "loss": 0.7559, + "step": 51229 + }, + { + "epoch": 1.31, + "learning_rate": 1.2478085630186408e-06, + "loss": 0.5879, + "step": 51230 + }, + { + "epoch": 1.31, + "learning_rate": 1.24778175553847e-06, + "loss": 0.5234, + "step": 51231 + }, + { + "epoch": 1.31, + "learning_rate": 1.2477549478685845e-06, + "loss": 0.7979, + "step": 51232 + }, + { + "epoch": 1.31, + "learning_rate": 1.2477281400090043e-06, + "loss": 0.7305, + "step": 51233 + }, + { + "epoch": 1.31, + "learning_rate": 1.2477013319597502e-06, + "loss": 0.5022, + "step": 51234 + }, + { + "epoch": 1.31, + "learning_rate": 1.2476745237208423e-06, + "loss": 0.6064, + "step": 51235 + }, + { + "epoch": 1.31, + "learning_rate": 1.2476477152923014e-06, + "loss": 0.5781, + "step": 51236 + }, + { + "epoch": 1.31, + "learning_rate": 1.2476209066741484e-06, + "loss": 0.5308, + "step": 51237 + }, + { + "epoch": 1.31, + "learning_rate": 1.2475940978664033e-06, + "loss": 0.4844, + "step": 51238 + }, + { + "epoch": 1.31, + "learning_rate": 1.2475672888690868e-06, + "loss": 0.5132, + "step": 51239 + }, + { + "epoch": 1.31, + "learning_rate": 1.2475404796822193e-06, + "loss": 0.5605, + "step": 51240 + }, + { + "epoch": 1.31, + "learning_rate": 1.2475136703058214e-06, + "loss": 0.668, + "step": 51241 + }, + { + "epoch": 1.31, + "learning_rate": 1.2474868607399137e-06, + "loss": 0.6123, + "step": 51242 + }, + { + "epoch": 1.31, + "learning_rate": 1.2474600509845166e-06, + "loss": 0.5571, + "step": 51243 + }, + { + "epoch": 1.31, + "learning_rate": 1.2474332410396508e-06, + "loss": 0.6439, + "step": 51244 + }, + { + "epoch": 1.31, + "learning_rate": 1.247406430905337e-06, + "loss": 0.6675, + "step": 51245 + }, + { + "epoch": 1.31, + "learning_rate": 1.247379620581595e-06, + "loss": 0.6699, + "step": 51246 + }, + { + "epoch": 1.31, + "learning_rate": 1.247352810068446e-06, + "loss": 0.624, + "step": 51247 + }, + { + "epoch": 1.31, + "learning_rate": 1.2473259993659105e-06, + "loss": 0.5854, + "step": 51248 + }, + { + "epoch": 1.31, + "learning_rate": 1.2472991884740089e-06, + "loss": 0.5913, + "step": 51249 + }, + { + "epoch": 1.31, + "learning_rate": 1.2472723773927613e-06, + "loss": 0.6577, + "step": 51250 + }, + { + "epoch": 1.31, + "learning_rate": 1.247245566122189e-06, + "loss": 0.6196, + "step": 51251 + }, + { + "epoch": 1.31, + "learning_rate": 1.247218754662312e-06, + "loss": 0.6797, + "step": 51252 + }, + { + "epoch": 1.31, + "learning_rate": 1.2471919430131508e-06, + "loss": 0.6152, + "step": 51253 + }, + { + "epoch": 1.31, + "learning_rate": 1.2471651311747263e-06, + "loss": 0.7363, + "step": 51254 + }, + { + "epoch": 1.31, + "learning_rate": 1.2471383191470588e-06, + "loss": 0.6196, + "step": 51255 + }, + { + "epoch": 1.31, + "learning_rate": 1.2471115069301687e-06, + "loss": 0.6289, + "step": 51256 + }, + { + "epoch": 1.31, + "learning_rate": 1.247084694524077e-06, + "loss": 0.5747, + "step": 51257 + }, + { + "epoch": 1.31, + "learning_rate": 1.2470578819288033e-06, + "loss": 0.5942, + "step": 51258 + }, + { + "epoch": 1.31, + "learning_rate": 1.2470310691443696e-06, + "loss": 0.6514, + "step": 51259 + }, + { + "epoch": 1.31, + "learning_rate": 1.247004256170795e-06, + "loss": 0.6494, + "step": 51260 + }, + { + "epoch": 1.31, + "learning_rate": 1.2469774430081005e-06, + "loss": 0.6689, + "step": 51261 + }, + { + "epoch": 1.31, + "learning_rate": 1.246950629656307e-06, + "loss": 0.7197, + "step": 51262 + }, + { + "epoch": 1.31, + "learning_rate": 1.2469238161154348e-06, + "loss": 0.8047, + "step": 51263 + }, + { + "epoch": 1.31, + "learning_rate": 1.2468970023855044e-06, + "loss": 0.7627, + "step": 51264 + }, + { + "epoch": 1.31, + "learning_rate": 1.246870188466536e-06, + "loss": 0.6519, + "step": 51265 + }, + { + "epoch": 1.31, + "learning_rate": 1.2468433743585506e-06, + "loss": 0.4253, + "step": 51266 + }, + { + "epoch": 1.31, + "learning_rate": 1.2468165600615687e-06, + "loss": 0.6831, + "step": 51267 + }, + { + "epoch": 1.31, + "learning_rate": 1.2467897455756106e-06, + "loss": 0.6025, + "step": 51268 + }, + { + "epoch": 1.31, + "learning_rate": 1.2467629309006968e-06, + "loss": 0.4841, + "step": 51269 + }, + { + "epoch": 1.31, + "learning_rate": 1.2467361160368483e-06, + "loss": 0.7612, + "step": 51270 + }, + { + "epoch": 1.31, + "learning_rate": 1.246709300984085e-06, + "loss": 0.5791, + "step": 51271 + }, + { + "epoch": 1.31, + "learning_rate": 1.2466824857424281e-06, + "loss": 0.6709, + "step": 51272 + }, + { + "epoch": 1.31, + "learning_rate": 1.2466556703118976e-06, + "loss": 0.7305, + "step": 51273 + }, + { + "epoch": 1.31, + "learning_rate": 1.2466288546925141e-06, + "loss": 0.6514, + "step": 51274 + }, + { + "epoch": 1.31, + "learning_rate": 1.2466020388842982e-06, + "loss": 0.6914, + "step": 51275 + }, + { + "epoch": 1.31, + "learning_rate": 1.2465752228872706e-06, + "loss": 0.5811, + "step": 51276 + }, + { + "epoch": 1.31, + "learning_rate": 1.2465484067014514e-06, + "loss": 0.5259, + "step": 51277 + }, + { + "epoch": 1.31, + "learning_rate": 1.246521590326862e-06, + "loss": 0.7783, + "step": 51278 + }, + { + "epoch": 1.31, + "learning_rate": 1.2464947737635219e-06, + "loss": 0.6416, + "step": 51279 + }, + { + "epoch": 1.31, + "learning_rate": 1.246467957011452e-06, + "loss": 0.7559, + "step": 51280 + }, + { + "epoch": 1.31, + "learning_rate": 1.2464411400706732e-06, + "loss": 0.4675, + "step": 51281 + }, + { + "epoch": 1.31, + "learning_rate": 1.2464143229412053e-06, + "loss": 0.4624, + "step": 51282 + }, + { + "epoch": 1.31, + "learning_rate": 1.24638750562307e-06, + "loss": 0.6431, + "step": 51283 + }, + { + "epoch": 1.31, + "learning_rate": 1.2463606881162868e-06, + "loss": 0.8027, + "step": 51284 + }, + { + "epoch": 1.31, + "learning_rate": 1.2463338704208764e-06, + "loss": 0.6289, + "step": 51285 + }, + { + "epoch": 1.31, + "learning_rate": 1.2463070525368594e-06, + "loss": 0.7046, + "step": 51286 + }, + { + "epoch": 1.31, + "learning_rate": 1.2462802344642566e-06, + "loss": 0.752, + "step": 51287 + }, + { + "epoch": 1.31, + "learning_rate": 1.2462534162030885e-06, + "loss": 0.5752, + "step": 51288 + }, + { + "epoch": 1.31, + "learning_rate": 1.2462265977533753e-06, + "loss": 0.8662, + "step": 51289 + }, + { + "epoch": 1.31, + "learning_rate": 1.2461997791151376e-06, + "loss": 0.7246, + "step": 51290 + }, + { + "epoch": 1.31, + "learning_rate": 1.246172960288396e-06, + "loss": 0.7148, + "step": 51291 + }, + { + "epoch": 1.31, + "learning_rate": 1.2461461412731713e-06, + "loss": 0.7871, + "step": 51292 + }, + { + "epoch": 1.31, + "learning_rate": 1.246119322069484e-06, + "loss": 0.7354, + "step": 51293 + }, + { + "epoch": 1.31, + "learning_rate": 1.2460925026773542e-06, + "loss": 0.6904, + "step": 51294 + }, + { + "epoch": 1.31, + "learning_rate": 1.2460656830968029e-06, + "loss": 0.625, + "step": 51295 + }, + { + "epoch": 1.31, + "learning_rate": 1.24603886332785e-06, + "loss": 0.5781, + "step": 51296 + }, + { + "epoch": 1.31, + "learning_rate": 1.2460120433705167e-06, + "loss": 0.6172, + "step": 51297 + }, + { + "epoch": 1.31, + "learning_rate": 1.2459852232248234e-06, + "loss": 0.5444, + "step": 51298 + }, + { + "epoch": 1.31, + "learning_rate": 1.2459584028907903e-06, + "loss": 0.7139, + "step": 51299 + }, + { + "epoch": 1.31, + "learning_rate": 1.2459315823684382e-06, + "loss": 0.6143, + "step": 51300 + }, + { + "epoch": 1.31, + "learning_rate": 1.2459047616577878e-06, + "loss": 0.6309, + "step": 51301 + }, + { + "epoch": 1.31, + "learning_rate": 1.2458779407588592e-06, + "loss": 0.5161, + "step": 51302 + }, + { + "epoch": 1.31, + "learning_rate": 1.2458511196716734e-06, + "loss": 0.446, + "step": 51303 + }, + { + "epoch": 1.31, + "learning_rate": 1.2458242983962505e-06, + "loss": 0.5433, + "step": 51304 + }, + { + "epoch": 1.31, + "learning_rate": 1.2457974769326114e-06, + "loss": 0.7578, + "step": 51305 + }, + { + "epoch": 1.31, + "learning_rate": 1.2457706552807763e-06, + "loss": 0.5645, + "step": 51306 + }, + { + "epoch": 1.32, + "learning_rate": 1.245743833440766e-06, + "loss": 0.707, + "step": 51307 + }, + { + "epoch": 1.32, + "learning_rate": 1.245717011412601e-06, + "loss": 0.5664, + "step": 51308 + }, + { + "epoch": 1.32, + "learning_rate": 1.2456901891963017e-06, + "loss": 0.6875, + "step": 51309 + }, + { + "epoch": 1.32, + "learning_rate": 1.2456633667918889e-06, + "loss": 0.7212, + "step": 51310 + }, + { + "epoch": 1.32, + "learning_rate": 1.2456365441993826e-06, + "loss": 0.4624, + "step": 51311 + }, + { + "epoch": 1.32, + "learning_rate": 1.2456097214188038e-06, + "loss": 0.6958, + "step": 51312 + }, + { + "epoch": 1.32, + "learning_rate": 1.245582898450173e-06, + "loss": 0.7119, + "step": 51313 + }, + { + "epoch": 1.32, + "learning_rate": 1.2455560752935109e-06, + "loss": 0.6733, + "step": 51314 + }, + { + "epoch": 1.32, + "learning_rate": 1.2455292519488373e-06, + "loss": 0.6313, + "step": 51315 + }, + { + "epoch": 1.32, + "learning_rate": 1.2455024284161736e-06, + "loss": 0.5364, + "step": 51316 + }, + { + "epoch": 1.32, + "learning_rate": 1.2454756046955398e-06, + "loss": 0.7578, + "step": 51317 + }, + { + "epoch": 1.32, + "learning_rate": 1.2454487807869572e-06, + "loss": 0.6338, + "step": 51318 + }, + { + "epoch": 1.32, + "learning_rate": 1.245421956690445e-06, + "loss": 0.709, + "step": 51319 + }, + { + "epoch": 1.32, + "learning_rate": 1.2453951324060247e-06, + "loss": 0.7197, + "step": 51320 + }, + { + "epoch": 1.32, + "learning_rate": 1.2453683079337167e-06, + "loss": 0.5542, + "step": 51321 + }, + { + "epoch": 1.32, + "learning_rate": 1.2453414832735417e-06, + "loss": 0.6689, + "step": 51322 + }, + { + "epoch": 1.32, + "learning_rate": 1.2453146584255197e-06, + "loss": 0.6362, + "step": 51323 + }, + { + "epoch": 1.32, + "learning_rate": 1.2452878333896718e-06, + "loss": 0.5752, + "step": 51324 + }, + { + "epoch": 1.32, + "learning_rate": 1.2452610081660178e-06, + "loss": 0.7051, + "step": 51325 + }, + { + "epoch": 1.32, + "learning_rate": 1.2452341827545792e-06, + "loss": 0.7012, + "step": 51326 + }, + { + "epoch": 1.32, + "learning_rate": 1.2452073571553756e-06, + "loss": 0.563, + "step": 51327 + }, + { + "epoch": 1.32, + "learning_rate": 1.2451805313684286e-06, + "loss": 0.7036, + "step": 51328 + }, + { + "epoch": 1.32, + "learning_rate": 1.2451537053937577e-06, + "loss": 0.6943, + "step": 51329 + }, + { + "epoch": 1.32, + "learning_rate": 1.2451268792313843e-06, + "loss": 0.6846, + "step": 51330 + }, + { + "epoch": 1.32, + "learning_rate": 1.245100052881328e-06, + "loss": 0.7446, + "step": 51331 + }, + { + "epoch": 1.32, + "learning_rate": 1.2450732263436102e-06, + "loss": 0.6116, + "step": 51332 + }, + { + "epoch": 1.32, + "learning_rate": 1.245046399618251e-06, + "loss": 0.7432, + "step": 51333 + }, + { + "epoch": 1.32, + "learning_rate": 1.2450195727052708e-06, + "loss": 0.6338, + "step": 51334 + }, + { + "epoch": 1.32, + "learning_rate": 1.2449927456046907e-06, + "loss": 0.606, + "step": 51335 + }, + { + "epoch": 1.32, + "learning_rate": 1.2449659183165309e-06, + "loss": 0.748, + "step": 51336 + }, + { + "epoch": 1.32, + "learning_rate": 1.2449390908408118e-06, + "loss": 0.5378, + "step": 51337 + }, + { + "epoch": 1.32, + "learning_rate": 1.2449122631775545e-06, + "loss": 0.5757, + "step": 51338 + }, + { + "epoch": 1.32, + "learning_rate": 1.2448854353267789e-06, + "loss": 0.606, + "step": 51339 + }, + { + "epoch": 1.32, + "learning_rate": 1.2448586072885054e-06, + "loss": 0.7373, + "step": 51340 + }, + { + "epoch": 1.32, + "learning_rate": 1.2448317790627553e-06, + "loss": 0.5503, + "step": 51341 + }, + { + "epoch": 1.32, + "learning_rate": 1.2448049506495486e-06, + "loss": 0.7656, + "step": 51342 + }, + { + "epoch": 1.32, + "learning_rate": 1.2447781220489064e-06, + "loss": 0.6992, + "step": 51343 + }, + { + "epoch": 1.32, + "learning_rate": 1.2447512932608484e-06, + "loss": 0.7012, + "step": 51344 + }, + { + "epoch": 1.32, + "learning_rate": 1.2447244642853958e-06, + "loss": 0.668, + "step": 51345 + }, + { + "epoch": 1.32, + "learning_rate": 1.2446976351225685e-06, + "loss": 0.7339, + "step": 51346 + }, + { + "epoch": 1.32, + "learning_rate": 1.2446708057723882e-06, + "loss": 0.5015, + "step": 51347 + }, + { + "epoch": 1.32, + "learning_rate": 1.2446439762348744e-06, + "loss": 0.6016, + "step": 51348 + }, + { + "epoch": 1.32, + "learning_rate": 1.244617146510048e-06, + "loss": 0.4619, + "step": 51349 + }, + { + "epoch": 1.32, + "learning_rate": 1.2445903165979292e-06, + "loss": 0.6123, + "step": 51350 + }, + { + "epoch": 1.32, + "learning_rate": 1.2445634864985393e-06, + "loss": 0.6763, + "step": 51351 + }, + { + "epoch": 1.32, + "learning_rate": 1.2445366562118979e-06, + "loss": 0.582, + "step": 51352 + }, + { + "epoch": 1.32, + "learning_rate": 1.2445098257380264e-06, + "loss": 0.6724, + "step": 51353 + }, + { + "epoch": 1.32, + "learning_rate": 1.2444829950769448e-06, + "loss": 0.79, + "step": 51354 + }, + { + "epoch": 1.32, + "learning_rate": 1.2444561642286738e-06, + "loss": 0.4578, + "step": 51355 + }, + { + "epoch": 1.32, + "learning_rate": 1.2444293331932342e-06, + "loss": 0.6973, + "step": 51356 + }, + { + "epoch": 1.32, + "learning_rate": 1.2444025019706461e-06, + "loss": 0.8447, + "step": 51357 + }, + { + "epoch": 1.32, + "learning_rate": 1.2443756705609304e-06, + "loss": 0.3235, + "step": 51358 + }, + { + "epoch": 1.32, + "learning_rate": 1.244348838964107e-06, + "loss": 0.5938, + "step": 51359 + }, + { + "epoch": 1.32, + "learning_rate": 1.2443220071801974e-06, + "loss": 0.5444, + "step": 51360 + }, + { + "epoch": 1.32, + "learning_rate": 1.2442951752092214e-06, + "loss": 0.5522, + "step": 51361 + }, + { + "epoch": 1.32, + "learning_rate": 1.2442683430512e-06, + "loss": 0.6367, + "step": 51362 + }, + { + "epoch": 1.32, + "learning_rate": 1.2442415107061537e-06, + "loss": 0.7754, + "step": 51363 + }, + { + "epoch": 1.32, + "learning_rate": 1.2442146781741027e-06, + "loss": 0.6543, + "step": 51364 + }, + { + "epoch": 1.32, + "learning_rate": 1.2441878454550675e-06, + "loss": 0.4639, + "step": 51365 + }, + { + "epoch": 1.32, + "learning_rate": 1.2441610125490693e-06, + "loss": 0.5352, + "step": 51366 + }, + { + "epoch": 1.32, + "learning_rate": 1.244134179456128e-06, + "loss": 0.7422, + "step": 51367 + }, + { + "epoch": 1.32, + "learning_rate": 1.2441073461762649e-06, + "loss": 0.6406, + "step": 51368 + }, + { + "epoch": 1.32, + "learning_rate": 1.2440805127094993e-06, + "loss": 0.5933, + "step": 51369 + }, + { + "epoch": 1.32, + "learning_rate": 1.2440536790558528e-06, + "loss": 0.5627, + "step": 51370 + }, + { + "epoch": 1.32, + "learning_rate": 1.2440268452153456e-06, + "loss": 0.6289, + "step": 51371 + }, + { + "epoch": 1.32, + "learning_rate": 1.2440000111879983e-06, + "loss": 0.6172, + "step": 51372 + }, + { + "epoch": 1.32, + "learning_rate": 1.2439731769738316e-06, + "loss": 0.6797, + "step": 51373 + }, + { + "epoch": 1.32, + "learning_rate": 1.2439463425728656e-06, + "loss": 0.5037, + "step": 51374 + }, + { + "epoch": 1.32, + "learning_rate": 1.2439195079851211e-06, + "loss": 0.5479, + "step": 51375 + }, + { + "epoch": 1.32, + "learning_rate": 1.2438926732106188e-06, + "loss": 0.4956, + "step": 51376 + }, + { + "epoch": 1.32, + "learning_rate": 1.2438658382493788e-06, + "loss": 0.573, + "step": 51377 + }, + { + "epoch": 1.32, + "learning_rate": 1.243839003101422e-06, + "loss": 0.6855, + "step": 51378 + }, + { + "epoch": 1.32, + "learning_rate": 1.2438121677667692e-06, + "loss": 0.7383, + "step": 51379 + }, + { + "epoch": 1.32, + "learning_rate": 1.2437853322454403e-06, + "loss": 0.7832, + "step": 51380 + }, + { + "epoch": 1.32, + "learning_rate": 1.2437584965374567e-06, + "loss": 0.5247, + "step": 51381 + }, + { + "epoch": 1.32, + "learning_rate": 1.2437316606428376e-06, + "loss": 0.688, + "step": 51382 + }, + { + "epoch": 1.32, + "learning_rate": 1.2437048245616053e-06, + "loss": 0.6104, + "step": 51383 + }, + { + "epoch": 1.32, + "learning_rate": 1.2436779882937786e-06, + "loss": 0.6631, + "step": 51384 + }, + { + "epoch": 1.32, + "learning_rate": 1.2436511518393796e-06, + "loss": 0.5151, + "step": 51385 + }, + { + "epoch": 1.32, + "learning_rate": 1.2436243151984275e-06, + "loss": 0.3661, + "step": 51386 + }, + { + "epoch": 1.32, + "learning_rate": 1.2435974783709437e-06, + "loss": 0.7695, + "step": 51387 + }, + { + "epoch": 1.32, + "learning_rate": 1.2435706413569487e-06, + "loss": 0.6392, + "step": 51388 + }, + { + "epoch": 1.32, + "learning_rate": 1.2435438041564628e-06, + "loss": 0.7119, + "step": 51389 + }, + { + "epoch": 1.32, + "learning_rate": 1.2435169667695063e-06, + "loss": 0.416, + "step": 51390 + }, + { + "epoch": 1.32, + "learning_rate": 1.2434901291961001e-06, + "loss": 0.667, + "step": 51391 + }, + { + "epoch": 1.32, + "learning_rate": 1.243463291436265e-06, + "loss": 0.7871, + "step": 51392 + }, + { + "epoch": 1.32, + "learning_rate": 1.2434364534900213e-06, + "loss": 0.4519, + "step": 51393 + }, + { + "epoch": 1.32, + "learning_rate": 1.2434096153573891e-06, + "loss": 0.6797, + "step": 51394 + }, + { + "epoch": 1.32, + "learning_rate": 1.2433827770383896e-06, + "loss": 0.6499, + "step": 51395 + }, + { + "epoch": 1.32, + "learning_rate": 1.243355938533043e-06, + "loss": 0.6143, + "step": 51396 + }, + { + "epoch": 1.32, + "learning_rate": 1.24332909984137e-06, + "loss": 0.6104, + "step": 51397 + }, + { + "epoch": 1.32, + "learning_rate": 1.243302260963391e-06, + "loss": 0.814, + "step": 51398 + }, + { + "epoch": 1.32, + "learning_rate": 1.2432754218991269e-06, + "loss": 0.6475, + "step": 51399 + }, + { + "epoch": 1.32, + "learning_rate": 1.2432485826485978e-06, + "loss": 0.7529, + "step": 51400 + }, + { + "epoch": 1.32, + "learning_rate": 1.2432217432118243e-06, + "loss": 0.5707, + "step": 51401 + }, + { + "epoch": 1.32, + "learning_rate": 1.2431949035888273e-06, + "loss": 0.7246, + "step": 51402 + }, + { + "epoch": 1.32, + "learning_rate": 1.2431680637796272e-06, + "loss": 0.7803, + "step": 51403 + }, + { + "epoch": 1.32, + "learning_rate": 1.2431412237842444e-06, + "loss": 0.6958, + "step": 51404 + }, + { + "epoch": 1.32, + "learning_rate": 1.2431143836026995e-06, + "loss": 0.8662, + "step": 51405 + }, + { + "epoch": 1.32, + "learning_rate": 1.2430875432350131e-06, + "loss": 0.71, + "step": 51406 + }, + { + "epoch": 1.32, + "learning_rate": 1.2430607026812059e-06, + "loss": 0.7832, + "step": 51407 + }, + { + "epoch": 1.32, + "learning_rate": 1.2430338619412983e-06, + "loss": 0.6699, + "step": 51408 + }, + { + "epoch": 1.32, + "learning_rate": 1.2430070210153107e-06, + "loss": 0.7236, + "step": 51409 + }, + { + "epoch": 1.32, + "learning_rate": 1.242980179903264e-06, + "loss": 0.5288, + "step": 51410 + }, + { + "epoch": 1.32, + "learning_rate": 1.2429533386051783e-06, + "loss": 0.563, + "step": 51411 + }, + { + "epoch": 1.32, + "learning_rate": 1.2429264971210745e-06, + "loss": 0.5854, + "step": 51412 + }, + { + "epoch": 1.32, + "learning_rate": 1.242899655450973e-06, + "loss": 0.7168, + "step": 51413 + }, + { + "epoch": 1.32, + "learning_rate": 1.2428728135948945e-06, + "loss": 0.637, + "step": 51414 + }, + { + "epoch": 1.32, + "learning_rate": 1.2428459715528594e-06, + "loss": 0.6082, + "step": 51415 + }, + { + "epoch": 1.32, + "learning_rate": 1.2428191293248884e-06, + "loss": 0.7002, + "step": 51416 + }, + { + "epoch": 1.32, + "learning_rate": 1.2427922869110017e-06, + "loss": 0.6899, + "step": 51417 + }, + { + "epoch": 1.32, + "learning_rate": 1.2427654443112202e-06, + "loss": 0.7529, + "step": 51418 + }, + { + "epoch": 1.32, + "learning_rate": 1.2427386015255646e-06, + "loss": 0.7744, + "step": 51419 + }, + { + "epoch": 1.32, + "learning_rate": 1.2427117585540551e-06, + "loss": 0.5957, + "step": 51420 + }, + { + "epoch": 1.32, + "learning_rate": 1.2426849153967123e-06, + "loss": 0.6348, + "step": 51421 + }, + { + "epoch": 1.32, + "learning_rate": 1.242658072053557e-06, + "loss": 0.7402, + "step": 51422 + }, + { + "epoch": 1.32, + "learning_rate": 1.2426312285246092e-06, + "loss": 0.8174, + "step": 51423 + }, + { + "epoch": 1.32, + "learning_rate": 1.24260438480989e-06, + "loss": 0.5542, + "step": 51424 + }, + { + "epoch": 1.32, + "learning_rate": 1.24257754090942e-06, + "loss": 0.7334, + "step": 51425 + }, + { + "epoch": 1.32, + "learning_rate": 1.242550696823219e-06, + "loss": 0.4849, + "step": 51426 + }, + { + "epoch": 1.32, + "learning_rate": 1.2425238525513084e-06, + "loss": 0.6104, + "step": 51427 + }, + { + "epoch": 1.32, + "learning_rate": 1.2424970080937086e-06, + "loss": 0.6562, + "step": 51428 + }, + { + "epoch": 1.32, + "learning_rate": 1.2424701634504399e-06, + "loss": 0.6279, + "step": 51429 + }, + { + "epoch": 1.32, + "learning_rate": 1.2424433186215229e-06, + "loss": 0.502, + "step": 51430 + }, + { + "epoch": 1.32, + "learning_rate": 1.2424164736069782e-06, + "loss": 0.6074, + "step": 51431 + }, + { + "epoch": 1.32, + "learning_rate": 1.2423896284068263e-06, + "loss": 0.668, + "step": 51432 + }, + { + "epoch": 1.32, + "learning_rate": 1.242362783021088e-06, + "loss": 0.6191, + "step": 51433 + }, + { + "epoch": 1.32, + "learning_rate": 1.2423359374497836e-06, + "loss": 0.6514, + "step": 51434 + }, + { + "epoch": 1.32, + "learning_rate": 1.2423090916929335e-06, + "loss": 0.5923, + "step": 51435 + }, + { + "epoch": 1.32, + "learning_rate": 1.2422822457505585e-06, + "loss": 0.7246, + "step": 51436 + }, + { + "epoch": 1.32, + "learning_rate": 1.2422553996226792e-06, + "loss": 0.5557, + "step": 51437 + }, + { + "epoch": 1.32, + "learning_rate": 1.2422285533093162e-06, + "loss": 0.5356, + "step": 51438 + }, + { + "epoch": 1.32, + "learning_rate": 1.24220170681049e-06, + "loss": 0.6108, + "step": 51439 + }, + { + "epoch": 1.32, + "learning_rate": 1.2421748601262208e-06, + "loss": 0.593, + "step": 51440 + }, + { + "epoch": 1.32, + "learning_rate": 1.2421480132565296e-06, + "loss": 0.5503, + "step": 51441 + }, + { + "epoch": 1.32, + "learning_rate": 1.2421211662014366e-06, + "loss": 0.9531, + "step": 51442 + }, + { + "epoch": 1.32, + "learning_rate": 1.242094318960963e-06, + "loss": 0.7471, + "step": 51443 + }, + { + "epoch": 1.32, + "learning_rate": 1.2420674715351287e-06, + "loss": 0.7534, + "step": 51444 + }, + { + "epoch": 1.32, + "learning_rate": 1.2420406239239541e-06, + "loss": 0.6111, + "step": 51445 + }, + { + "epoch": 1.32, + "learning_rate": 1.2420137761274606e-06, + "loss": 0.5789, + "step": 51446 + }, + { + "epoch": 1.32, + "learning_rate": 1.241986928145668e-06, + "loss": 0.5347, + "step": 51447 + }, + { + "epoch": 1.32, + "learning_rate": 1.2419600799785973e-06, + "loss": 0.6924, + "step": 51448 + }, + { + "epoch": 1.32, + "learning_rate": 1.241933231626269e-06, + "loss": 0.6201, + "step": 51449 + }, + { + "epoch": 1.32, + "learning_rate": 1.2419063830887033e-06, + "loss": 0.6992, + "step": 51450 + }, + { + "epoch": 1.32, + "learning_rate": 1.241879534365921e-06, + "loss": 0.75, + "step": 51451 + }, + { + "epoch": 1.32, + "learning_rate": 1.2418526854579428e-06, + "loss": 0.793, + "step": 51452 + }, + { + "epoch": 1.32, + "learning_rate": 1.2418258363647892e-06, + "loss": 0.793, + "step": 51453 + }, + { + "epoch": 1.32, + "learning_rate": 1.2417989870864807e-06, + "loss": 0.5591, + "step": 51454 + }, + { + "epoch": 1.32, + "learning_rate": 1.2417721376230374e-06, + "loss": 0.7275, + "step": 51455 + }, + { + "epoch": 1.32, + "learning_rate": 1.2417452879744807e-06, + "loss": 0.4626, + "step": 51456 + }, + { + "epoch": 1.32, + "learning_rate": 1.2417184381408305e-06, + "loss": 0.7427, + "step": 51457 + }, + { + "epoch": 1.32, + "learning_rate": 1.241691588122108e-06, + "loss": 0.6055, + "step": 51458 + }, + { + "epoch": 1.32, + "learning_rate": 1.241664737918333e-06, + "loss": 0.6382, + "step": 51459 + }, + { + "epoch": 1.32, + "learning_rate": 1.2416378875295267e-06, + "loss": 0.7075, + "step": 51460 + }, + { + "epoch": 1.32, + "learning_rate": 1.2416110369557089e-06, + "loss": 0.7744, + "step": 51461 + }, + { + "epoch": 1.32, + "learning_rate": 1.241584186196901e-06, + "loss": 0.7217, + "step": 51462 + }, + { + "epoch": 1.32, + "learning_rate": 1.2415573352531233e-06, + "loss": 0.5659, + "step": 51463 + }, + { + "epoch": 1.32, + "learning_rate": 1.241530484124396e-06, + "loss": 0.7822, + "step": 51464 + }, + { + "epoch": 1.32, + "learning_rate": 1.24150363281074e-06, + "loss": 0.7529, + "step": 51465 + }, + { + "epoch": 1.32, + "learning_rate": 1.2414767813121757e-06, + "loss": 0.7939, + "step": 51466 + }, + { + "epoch": 1.32, + "learning_rate": 1.2414499296287238e-06, + "loss": 0.4503, + "step": 51467 + }, + { + "epoch": 1.32, + "learning_rate": 1.2414230777604048e-06, + "loss": 0.6123, + "step": 51468 + }, + { + "epoch": 1.32, + "learning_rate": 1.2413962257072395e-06, + "loss": 0.6006, + "step": 51469 + }, + { + "epoch": 1.32, + "learning_rate": 1.2413693734692476e-06, + "loss": 0.5166, + "step": 51470 + }, + { + "epoch": 1.32, + "learning_rate": 1.2413425210464507e-06, + "loss": 0.6372, + "step": 51471 + }, + { + "epoch": 1.32, + "learning_rate": 1.241315668438869e-06, + "loss": 0.7197, + "step": 51472 + }, + { + "epoch": 1.32, + "learning_rate": 1.2412888156465232e-06, + "loss": 0.4402, + "step": 51473 + }, + { + "epoch": 1.32, + "learning_rate": 1.241261962669433e-06, + "loss": 0.6255, + "step": 51474 + }, + { + "epoch": 1.32, + "learning_rate": 1.24123510950762e-06, + "loss": 0.5332, + "step": 51475 + }, + { + "epoch": 1.32, + "learning_rate": 1.2412082561611041e-06, + "loss": 0.6553, + "step": 51476 + }, + { + "epoch": 1.32, + "learning_rate": 1.2411814026299064e-06, + "loss": 0.6343, + "step": 51477 + }, + { + "epoch": 1.32, + "learning_rate": 1.2411545489140472e-06, + "loss": 0.5964, + "step": 51478 + }, + { + "epoch": 1.32, + "learning_rate": 1.241127695013547e-06, + "loss": 0.4475, + "step": 51479 + }, + { + "epoch": 1.32, + "learning_rate": 1.2411008409284262e-06, + "loss": 0.8018, + "step": 51480 + }, + { + "epoch": 1.32, + "learning_rate": 1.241073986658706e-06, + "loss": 0.6494, + "step": 51481 + }, + { + "epoch": 1.32, + "learning_rate": 1.241047132204406e-06, + "loss": 0.6533, + "step": 51482 + }, + { + "epoch": 1.32, + "learning_rate": 1.2410202775655478e-06, + "loss": 0.6626, + "step": 51483 + }, + { + "epoch": 1.32, + "learning_rate": 1.240993422742151e-06, + "loss": 0.573, + "step": 51484 + }, + { + "epoch": 1.32, + "learning_rate": 1.240966567734237e-06, + "loss": 0.6714, + "step": 51485 + }, + { + "epoch": 1.32, + "learning_rate": 1.2409397125418255e-06, + "loss": 0.6431, + "step": 51486 + }, + { + "epoch": 1.32, + "learning_rate": 1.240912857164938e-06, + "loss": 0.792, + "step": 51487 + }, + { + "epoch": 1.32, + "learning_rate": 1.2408860016035944e-06, + "loss": 0.6768, + "step": 51488 + }, + { + "epoch": 1.32, + "learning_rate": 1.2408591458578154e-06, + "loss": 0.4924, + "step": 51489 + }, + { + "epoch": 1.32, + "learning_rate": 1.240832289927622e-06, + "loss": 0.7832, + "step": 51490 + }, + { + "epoch": 1.32, + "learning_rate": 1.240805433813034e-06, + "loss": 0.7173, + "step": 51491 + }, + { + "epoch": 1.32, + "learning_rate": 1.2407785775140725e-06, + "loss": 0.6309, + "step": 51492 + }, + { + "epoch": 1.32, + "learning_rate": 1.240751721030758e-06, + "loss": 0.6953, + "step": 51493 + }, + { + "epoch": 1.32, + "learning_rate": 1.240724864363111e-06, + "loss": 0.6836, + "step": 51494 + }, + { + "epoch": 1.32, + "learning_rate": 1.2406980075111517e-06, + "loss": 0.4932, + "step": 51495 + }, + { + "epoch": 1.32, + "learning_rate": 1.2406711504749013e-06, + "loss": 0.7119, + "step": 51496 + }, + { + "epoch": 1.32, + "learning_rate": 1.24064429325438e-06, + "loss": 0.6875, + "step": 51497 + }, + { + "epoch": 1.32, + "learning_rate": 1.2406174358496086e-06, + "loss": 0.4922, + "step": 51498 + }, + { + "epoch": 1.32, + "learning_rate": 1.2405905782606072e-06, + "loss": 0.8066, + "step": 51499 + }, + { + "epoch": 1.32, + "learning_rate": 1.2405637204873967e-06, + "loss": 0.4535, + "step": 51500 + }, + { + "epoch": 1.32, + "learning_rate": 1.2405368625299977e-06, + "loss": 0.667, + "step": 51501 + }, + { + "epoch": 1.32, + "learning_rate": 1.2405100043884308e-06, + "loss": 0.5518, + "step": 51502 + }, + { + "epoch": 1.32, + "learning_rate": 1.2404831460627163e-06, + "loss": 0.6465, + "step": 51503 + }, + { + "epoch": 1.32, + "learning_rate": 1.240456287552875e-06, + "loss": 0.6377, + "step": 51504 + }, + { + "epoch": 1.32, + "learning_rate": 1.2404294288589272e-06, + "loss": 0.5913, + "step": 51505 + }, + { + "epoch": 1.32, + "learning_rate": 1.2404025699808937e-06, + "loss": 0.6699, + "step": 51506 + }, + { + "epoch": 1.32, + "learning_rate": 1.2403757109187948e-06, + "loss": 0.7402, + "step": 51507 + }, + { + "epoch": 1.32, + "learning_rate": 1.2403488516726518e-06, + "loss": 0.5615, + "step": 51508 + }, + { + "epoch": 1.32, + "learning_rate": 1.2403219922424845e-06, + "loss": 0.6406, + "step": 51509 + }, + { + "epoch": 1.32, + "learning_rate": 1.2402951326283137e-06, + "loss": 0.623, + "step": 51510 + }, + { + "epoch": 1.32, + "learning_rate": 1.24026827283016e-06, + "loss": 0.5122, + "step": 51511 + }, + { + "epoch": 1.32, + "learning_rate": 1.2402414128480438e-06, + "loss": 0.6985, + "step": 51512 + }, + { + "epoch": 1.32, + "learning_rate": 1.2402145526819859e-06, + "loss": 0.8213, + "step": 51513 + }, + { + "epoch": 1.32, + "learning_rate": 1.2401876923320067e-06, + "loss": 0.6572, + "step": 51514 + }, + { + "epoch": 1.32, + "learning_rate": 1.2401608317981269e-06, + "loss": 0.5596, + "step": 51515 + }, + { + "epoch": 1.32, + "learning_rate": 1.2401339710803666e-06, + "loss": 0.6216, + "step": 51516 + }, + { + "epoch": 1.32, + "learning_rate": 1.2401071101787472e-06, + "loss": 0.458, + "step": 51517 + }, + { + "epoch": 1.32, + "learning_rate": 1.2400802490932888e-06, + "loss": 0.2642, + "step": 51518 + }, + { + "epoch": 1.32, + "learning_rate": 1.240053387824012e-06, + "loss": 0.8389, + "step": 51519 + }, + { + "epoch": 1.32, + "learning_rate": 1.2400265263709374e-06, + "loss": 0.5579, + "step": 51520 + }, + { + "epoch": 1.32, + "learning_rate": 1.2399996647340854e-06, + "loss": 0.6973, + "step": 51521 + }, + { + "epoch": 1.32, + "learning_rate": 1.2399728029134765e-06, + "loss": 0.5464, + "step": 51522 + }, + { + "epoch": 1.32, + "learning_rate": 1.2399459409091319e-06, + "loss": 0.6934, + "step": 51523 + }, + { + "epoch": 1.32, + "learning_rate": 1.2399190787210715e-06, + "loss": 0.8115, + "step": 51524 + }, + { + "epoch": 1.32, + "learning_rate": 1.2398922163493159e-06, + "loss": 0.7295, + "step": 51525 + }, + { + "epoch": 1.32, + "learning_rate": 1.239865353793886e-06, + "loss": 0.7451, + "step": 51526 + }, + { + "epoch": 1.32, + "learning_rate": 1.2398384910548023e-06, + "loss": 0.6367, + "step": 51527 + }, + { + "epoch": 1.32, + "learning_rate": 1.2398116281320855e-06, + "loss": 0.7871, + "step": 51528 + }, + { + "epoch": 1.32, + "learning_rate": 1.2397847650257558e-06, + "loss": 0.6384, + "step": 51529 + }, + { + "epoch": 1.32, + "learning_rate": 1.2397579017358337e-06, + "loss": 0.4697, + "step": 51530 + }, + { + "epoch": 1.32, + "learning_rate": 1.2397310382623402e-06, + "loss": 0.6479, + "step": 51531 + }, + { + "epoch": 1.32, + "learning_rate": 1.2397041746052953e-06, + "loss": 0.5708, + "step": 51532 + }, + { + "epoch": 1.32, + "learning_rate": 1.2396773107647204e-06, + "loss": 0.5825, + "step": 51533 + }, + { + "epoch": 1.32, + "learning_rate": 1.2396504467406356e-06, + "loss": 0.6213, + "step": 51534 + }, + { + "epoch": 1.32, + "learning_rate": 1.2396235825330613e-06, + "loss": 0.7998, + "step": 51535 + }, + { + "epoch": 1.32, + "learning_rate": 1.2395967181420183e-06, + "loss": 0.7422, + "step": 51536 + }, + { + "epoch": 1.32, + "learning_rate": 1.2395698535675273e-06, + "loss": 0.5571, + "step": 51537 + }, + { + "epoch": 1.32, + "learning_rate": 1.2395429888096083e-06, + "loss": 0.8027, + "step": 51538 + }, + { + "epoch": 1.32, + "learning_rate": 1.2395161238682823e-06, + "loss": 0.5688, + "step": 51539 + }, + { + "epoch": 1.32, + "learning_rate": 1.2394892587435701e-06, + "loss": 0.6436, + "step": 51540 + }, + { + "epoch": 1.32, + "learning_rate": 1.2394623934354918e-06, + "loss": 0.5181, + "step": 51541 + }, + { + "epoch": 1.32, + "learning_rate": 1.239435527944068e-06, + "loss": 0.5088, + "step": 51542 + }, + { + "epoch": 1.32, + "learning_rate": 1.2394086622693199e-06, + "loss": 0.5093, + "step": 51543 + }, + { + "epoch": 1.32, + "learning_rate": 1.239381796411267e-06, + "loss": 0.6309, + "step": 51544 + }, + { + "epoch": 1.32, + "learning_rate": 1.239354930369931e-06, + "loss": 0.5581, + "step": 51545 + }, + { + "epoch": 1.32, + "learning_rate": 1.2393280641453317e-06, + "loss": 0.6875, + "step": 51546 + }, + { + "epoch": 1.32, + "learning_rate": 1.2393011977374897e-06, + "loss": 0.7207, + "step": 51547 + }, + { + "epoch": 1.32, + "learning_rate": 1.2392743311464263e-06, + "loss": 0.791, + "step": 51548 + }, + { + "epoch": 1.32, + "learning_rate": 1.239247464372161e-06, + "loss": 0.6514, + "step": 51549 + }, + { + "epoch": 1.32, + "learning_rate": 1.2392205974147152e-06, + "loss": 0.4048, + "step": 51550 + }, + { + "epoch": 1.32, + "learning_rate": 1.2391937302741088e-06, + "loss": 0.6353, + "step": 51551 + }, + { + "epoch": 1.32, + "learning_rate": 1.2391668629503633e-06, + "loss": 0.6133, + "step": 51552 + }, + { + "epoch": 1.32, + "learning_rate": 1.2391399954434987e-06, + "loss": 0.6465, + "step": 51553 + }, + { + "epoch": 1.32, + "learning_rate": 1.2391131277535353e-06, + "loss": 0.5796, + "step": 51554 + }, + { + "epoch": 1.32, + "learning_rate": 1.239086259880494e-06, + "loss": 0.7139, + "step": 51555 + }, + { + "epoch": 1.32, + "learning_rate": 1.2390593918243957e-06, + "loss": 0.7285, + "step": 51556 + }, + { + "epoch": 1.32, + "learning_rate": 1.2390325235852602e-06, + "loss": 0.7471, + "step": 51557 + }, + { + "epoch": 1.32, + "learning_rate": 1.2390056551631087e-06, + "loss": 0.7666, + "step": 51558 + }, + { + "epoch": 1.32, + "learning_rate": 1.2389787865579616e-06, + "loss": 0.6689, + "step": 51559 + }, + { + "epoch": 1.32, + "learning_rate": 1.2389519177698391e-06, + "loss": 0.6484, + "step": 51560 + }, + { + "epoch": 1.32, + "learning_rate": 1.2389250487987624e-06, + "loss": 0.6406, + "step": 51561 + }, + { + "epoch": 1.32, + "learning_rate": 1.2388981796447517e-06, + "loss": 0.8379, + "step": 51562 + }, + { + "epoch": 1.32, + "learning_rate": 1.2388713103078279e-06, + "loss": 0.7061, + "step": 51563 + }, + { + "epoch": 1.32, + "learning_rate": 1.2388444407880108e-06, + "loss": 0.6116, + "step": 51564 + }, + { + "epoch": 1.32, + "learning_rate": 1.2388175710853218e-06, + "loss": 0.7593, + "step": 51565 + }, + { + "epoch": 1.32, + "learning_rate": 1.2387907011997811e-06, + "loss": 0.5311, + "step": 51566 + }, + { + "epoch": 1.32, + "learning_rate": 1.2387638311314096e-06, + "loss": 0.8506, + "step": 51567 + }, + { + "epoch": 1.32, + "learning_rate": 1.2387369608802275e-06, + "loss": 0.7031, + "step": 51568 + }, + { + "epoch": 1.32, + "learning_rate": 1.2387100904462554e-06, + "loss": 0.7207, + "step": 51569 + }, + { + "epoch": 1.32, + "learning_rate": 1.2386832198295137e-06, + "loss": 0.708, + "step": 51570 + }, + { + "epoch": 1.32, + "learning_rate": 1.2386563490300238e-06, + "loss": 0.7129, + "step": 51571 + }, + { + "epoch": 1.32, + "learning_rate": 1.2386294780478054e-06, + "loss": 0.708, + "step": 51572 + }, + { + "epoch": 1.32, + "learning_rate": 1.2386026068828792e-06, + "loss": 0.6709, + "step": 51573 + }, + { + "epoch": 1.32, + "learning_rate": 1.238575735535266e-06, + "loss": 0.6758, + "step": 51574 + }, + { + "epoch": 1.32, + "learning_rate": 1.2385488640049866e-06, + "loss": 0.7266, + "step": 51575 + }, + { + "epoch": 1.32, + "learning_rate": 1.2385219922920608e-06, + "loss": 0.7505, + "step": 51576 + }, + { + "epoch": 1.32, + "learning_rate": 1.2384951203965105e-06, + "loss": 0.7393, + "step": 51577 + }, + { + "epoch": 1.32, + "learning_rate": 1.2384682483183549e-06, + "loss": 0.6294, + "step": 51578 + }, + { + "epoch": 1.32, + "learning_rate": 1.2384413760576152e-06, + "loss": 0.6738, + "step": 51579 + }, + { + "epoch": 1.32, + "learning_rate": 1.238414503614312e-06, + "loss": 0.5791, + "step": 51580 + }, + { + "epoch": 1.32, + "learning_rate": 1.2383876309884653e-06, + "loss": 0.6855, + "step": 51581 + }, + { + "epoch": 1.32, + "learning_rate": 1.238360758180097e-06, + "loss": 0.8916, + "step": 51582 + }, + { + "epoch": 1.32, + "learning_rate": 1.2383338851892262e-06, + "loss": 0.5635, + "step": 51583 + }, + { + "epoch": 1.32, + "learning_rate": 1.2383070120158743e-06, + "loss": 0.7207, + "step": 51584 + }, + { + "epoch": 1.32, + "learning_rate": 1.2382801386600615e-06, + "loss": 0.5361, + "step": 51585 + }, + { + "epoch": 1.32, + "learning_rate": 1.2382532651218087e-06, + "loss": 0.7332, + "step": 51586 + }, + { + "epoch": 1.32, + "learning_rate": 1.2382263914011364e-06, + "loss": 0.5366, + "step": 51587 + }, + { + "epoch": 1.32, + "learning_rate": 1.238199517498065e-06, + "loss": 0.7485, + "step": 51588 + }, + { + "epoch": 1.32, + "learning_rate": 1.2381726434126152e-06, + "loss": 0.6377, + "step": 51589 + }, + { + "epoch": 1.32, + "learning_rate": 1.2381457691448077e-06, + "loss": 0.6343, + "step": 51590 + }, + { + "epoch": 1.32, + "learning_rate": 1.2381188946946627e-06, + "loss": 0.6211, + "step": 51591 + }, + { + "epoch": 1.32, + "learning_rate": 1.2380920200622013e-06, + "loss": 0.4485, + "step": 51592 + }, + { + "epoch": 1.32, + "learning_rate": 1.2380651452474435e-06, + "loss": 0.7393, + "step": 51593 + }, + { + "epoch": 1.32, + "learning_rate": 1.2380382702504104e-06, + "loss": 0.4858, + "step": 51594 + }, + { + "epoch": 1.32, + "learning_rate": 1.2380113950711222e-06, + "loss": 0.5029, + "step": 51595 + }, + { + "epoch": 1.32, + "learning_rate": 1.2379845197095996e-06, + "loss": 0.4689, + "step": 51596 + }, + { + "epoch": 1.32, + "learning_rate": 1.2379576441658634e-06, + "loss": 0.5076, + "step": 51597 + }, + { + "epoch": 1.32, + "learning_rate": 1.2379307684399335e-06, + "loss": 0.7891, + "step": 51598 + }, + { + "epoch": 1.32, + "learning_rate": 1.2379038925318314e-06, + "loss": 0.4154, + "step": 51599 + }, + { + "epoch": 1.32, + "learning_rate": 1.2378770164415772e-06, + "loss": 0.7896, + "step": 51600 + }, + { + "epoch": 1.32, + "learning_rate": 1.2378501401691912e-06, + "loss": 0.6514, + "step": 51601 + }, + { + "epoch": 1.32, + "learning_rate": 1.2378232637146947e-06, + "loss": 0.7559, + "step": 51602 + }, + { + "epoch": 1.32, + "learning_rate": 1.2377963870781076e-06, + "loss": 0.6367, + "step": 51603 + }, + { + "epoch": 1.32, + "learning_rate": 1.2377695102594508e-06, + "loss": 0.6455, + "step": 51604 + }, + { + "epoch": 1.32, + "learning_rate": 1.2377426332587448e-06, + "loss": 0.8008, + "step": 51605 + }, + { + "epoch": 1.32, + "learning_rate": 1.23771575607601e-06, + "loss": 0.7178, + "step": 51606 + }, + { + "epoch": 1.32, + "learning_rate": 1.2376888787112677e-06, + "loss": 0.6768, + "step": 51607 + }, + { + "epoch": 1.32, + "learning_rate": 1.2376620011645376e-06, + "loss": 0.7549, + "step": 51608 + }, + { + "epoch": 1.32, + "learning_rate": 1.2376351234358406e-06, + "loss": 0.5552, + "step": 51609 + }, + { + "epoch": 1.32, + "learning_rate": 1.2376082455251972e-06, + "loss": 0.6294, + "step": 51610 + }, + { + "epoch": 1.32, + "learning_rate": 1.2375813674326283e-06, + "loss": 0.5825, + "step": 51611 + }, + { + "epoch": 1.32, + "learning_rate": 1.2375544891581544e-06, + "loss": 0.7012, + "step": 51612 + }, + { + "epoch": 1.32, + "learning_rate": 1.2375276107017958e-06, + "loss": 0.5776, + "step": 51613 + }, + { + "epoch": 1.32, + "learning_rate": 1.2375007320635731e-06, + "loss": 0.5349, + "step": 51614 + }, + { + "epoch": 1.32, + "learning_rate": 1.237473853243507e-06, + "loss": 0.6357, + "step": 51615 + }, + { + "epoch": 1.32, + "learning_rate": 1.2374469742416182e-06, + "loss": 0.729, + "step": 51616 + }, + { + "epoch": 1.32, + "learning_rate": 1.2374200950579277e-06, + "loss": 0.6626, + "step": 51617 + }, + { + "epoch": 1.32, + "learning_rate": 1.237393215692455e-06, + "loss": 0.6826, + "step": 51618 + }, + { + "epoch": 1.32, + "learning_rate": 1.2373663361452211e-06, + "loss": 0.6365, + "step": 51619 + }, + { + "epoch": 1.32, + "learning_rate": 1.237339456416247e-06, + "loss": 0.6172, + "step": 51620 + }, + { + "epoch": 1.32, + "learning_rate": 1.2373125765055528e-06, + "loss": 0.6021, + "step": 51621 + }, + { + "epoch": 1.32, + "learning_rate": 1.2372856964131596e-06, + "loss": 0.791, + "step": 51622 + }, + { + "epoch": 1.32, + "learning_rate": 1.2372588161390871e-06, + "loss": 0.8066, + "step": 51623 + }, + { + "epoch": 1.32, + "learning_rate": 1.2372319356833566e-06, + "loss": 0.6562, + "step": 51624 + }, + { + "epoch": 1.32, + "learning_rate": 1.2372050550459888e-06, + "loss": 0.5859, + "step": 51625 + }, + { + "epoch": 1.32, + "learning_rate": 1.2371781742270038e-06, + "loss": 0.6553, + "step": 51626 + }, + { + "epoch": 1.32, + "learning_rate": 1.2371512932264225e-06, + "loss": 0.7021, + "step": 51627 + }, + { + "epoch": 1.32, + "learning_rate": 1.2371244120442653e-06, + "loss": 0.6865, + "step": 51628 + }, + { + "epoch": 1.32, + "learning_rate": 1.2370975306805528e-06, + "loss": 0.5908, + "step": 51629 + }, + { + "epoch": 1.32, + "learning_rate": 1.2370706491353056e-06, + "loss": 0.6582, + "step": 51630 + }, + { + "epoch": 1.32, + "learning_rate": 1.2370437674085443e-06, + "loss": 0.6963, + "step": 51631 + }, + { + "epoch": 1.32, + "learning_rate": 1.2370168855002898e-06, + "loss": 0.697, + "step": 51632 + }, + { + "epoch": 1.32, + "learning_rate": 1.236990003410562e-06, + "loss": 0.5049, + "step": 51633 + }, + { + "epoch": 1.32, + "learning_rate": 1.2369631211393822e-06, + "loss": 0.645, + "step": 51634 + }, + { + "epoch": 1.32, + "learning_rate": 1.2369362386867702e-06, + "loss": 0.5796, + "step": 51635 + }, + { + "epoch": 1.32, + "learning_rate": 1.236909356052747e-06, + "loss": 0.4384, + "step": 51636 + }, + { + "epoch": 1.32, + "learning_rate": 1.2368824732373336e-06, + "loss": 0.6826, + "step": 51637 + }, + { + "epoch": 1.32, + "learning_rate": 1.23685559024055e-06, + "loss": 0.498, + "step": 51638 + }, + { + "epoch": 1.32, + "learning_rate": 1.2368287070624168e-06, + "loss": 0.446, + "step": 51639 + }, + { + "epoch": 1.32, + "learning_rate": 1.2368018237029549e-06, + "loss": 0.6353, + "step": 51640 + }, + { + "epoch": 1.32, + "learning_rate": 1.2367749401621847e-06, + "loss": 0.708, + "step": 51641 + }, + { + "epoch": 1.32, + "learning_rate": 1.236748056440127e-06, + "loss": 0.5427, + "step": 51642 + }, + { + "epoch": 1.32, + "learning_rate": 1.2367211725368021e-06, + "loss": 0.4436, + "step": 51643 + }, + { + "epoch": 1.32, + "learning_rate": 1.2366942884522304e-06, + "loss": 0.71, + "step": 51644 + }, + { + "epoch": 1.32, + "learning_rate": 1.236667404186433e-06, + "loss": 0.493, + "step": 51645 + }, + { + "epoch": 1.32, + "learning_rate": 1.2366405197394306e-06, + "loss": 0.6553, + "step": 51646 + }, + { + "epoch": 1.32, + "learning_rate": 1.2366136351112431e-06, + "loss": 0.6909, + "step": 51647 + }, + { + "epoch": 1.32, + "learning_rate": 1.2365867503018912e-06, + "loss": 0.6631, + "step": 51648 + }, + { + "epoch": 1.32, + "learning_rate": 1.236559865311396e-06, + "loss": 0.6299, + "step": 51649 + }, + { + "epoch": 1.32, + "learning_rate": 1.2365329801397775e-06, + "loss": 0.7471, + "step": 51650 + }, + { + "epoch": 1.32, + "learning_rate": 1.2365060947870569e-06, + "loss": 0.5723, + "step": 51651 + }, + { + "epoch": 1.32, + "learning_rate": 1.2364792092532544e-06, + "loss": 0.5605, + "step": 51652 + }, + { + "epoch": 1.32, + "learning_rate": 1.2364523235383905e-06, + "loss": 0.436, + "step": 51653 + }, + { + "epoch": 1.32, + "learning_rate": 1.2364254376424861e-06, + "loss": 0.6675, + "step": 51654 + }, + { + "epoch": 1.32, + "learning_rate": 1.2363985515655614e-06, + "loss": 0.7842, + "step": 51655 + }, + { + "epoch": 1.32, + "learning_rate": 1.2363716653076372e-06, + "loss": 0.5801, + "step": 51656 + }, + { + "epoch": 1.32, + "learning_rate": 1.2363447788687347e-06, + "loss": 0.6836, + "step": 51657 + }, + { + "epoch": 1.32, + "learning_rate": 1.2363178922488731e-06, + "loss": 0.708, + "step": 51658 + }, + { + "epoch": 1.32, + "learning_rate": 1.2362910054480739e-06, + "loss": 0.7339, + "step": 51659 + }, + { + "epoch": 1.32, + "learning_rate": 1.236264118466358e-06, + "loss": 0.6309, + "step": 51660 + }, + { + "epoch": 1.32, + "learning_rate": 1.236237231303745e-06, + "loss": 0.6587, + "step": 51661 + }, + { + "epoch": 1.32, + "learning_rate": 1.2362103439602563e-06, + "loss": 0.7236, + "step": 51662 + }, + { + "epoch": 1.32, + "learning_rate": 1.2361834564359122e-06, + "loss": 0.6035, + "step": 51663 + }, + { + "epoch": 1.32, + "learning_rate": 1.236156568730733e-06, + "loss": 0.6035, + "step": 51664 + }, + { + "epoch": 1.32, + "learning_rate": 1.2361296808447398e-06, + "loss": 0.5635, + "step": 51665 + }, + { + "epoch": 1.32, + "learning_rate": 1.2361027927779528e-06, + "loss": 0.7725, + "step": 51666 + }, + { + "epoch": 1.32, + "learning_rate": 1.236075904530393e-06, + "loss": 0.5823, + "step": 51667 + }, + { + "epoch": 1.32, + "learning_rate": 1.2360490161020806e-06, + "loss": 0.623, + "step": 51668 + }, + { + "epoch": 1.32, + "learning_rate": 1.2360221274930363e-06, + "loss": 0.6025, + "step": 51669 + }, + { + "epoch": 1.32, + "learning_rate": 1.2359952387032809e-06, + "loss": 0.4585, + "step": 51670 + }, + { + "epoch": 1.32, + "learning_rate": 1.2359683497328344e-06, + "loss": 0.7695, + "step": 51671 + }, + { + "epoch": 1.32, + "learning_rate": 1.2359414605817182e-06, + "loss": 0.6196, + "step": 51672 + }, + { + "epoch": 1.32, + "learning_rate": 1.2359145712499523e-06, + "loss": 0.7129, + "step": 51673 + }, + { + "epoch": 1.32, + "learning_rate": 1.2358876817375573e-06, + "loss": 0.6611, + "step": 51674 + }, + { + "epoch": 1.32, + "learning_rate": 1.2358607920445541e-06, + "loss": 0.4663, + "step": 51675 + }, + { + "epoch": 1.32, + "learning_rate": 1.2358339021709633e-06, + "loss": 0.7021, + "step": 51676 + }, + { + "epoch": 1.32, + "learning_rate": 1.2358070121168051e-06, + "loss": 0.6035, + "step": 51677 + }, + { + "epoch": 1.32, + "learning_rate": 1.2357801218821006e-06, + "loss": 0.6182, + "step": 51678 + }, + { + "epoch": 1.32, + "learning_rate": 1.2357532314668697e-06, + "loss": 0.7549, + "step": 51679 + }, + { + "epoch": 1.32, + "learning_rate": 1.2357263408711335e-06, + "loss": 0.5908, + "step": 51680 + }, + { + "epoch": 1.32, + "learning_rate": 1.2356994500949128e-06, + "loss": 0.7241, + "step": 51681 + }, + { + "epoch": 1.32, + "learning_rate": 1.2356725591382277e-06, + "loss": 0.5874, + "step": 51682 + }, + { + "epoch": 1.32, + "learning_rate": 1.2356456680010987e-06, + "loss": 0.5684, + "step": 51683 + }, + { + "epoch": 1.32, + "learning_rate": 1.235618776683547e-06, + "loss": 0.6504, + "step": 51684 + }, + { + "epoch": 1.32, + "learning_rate": 1.2355918851855925e-06, + "loss": 0.8232, + "step": 51685 + }, + { + "epoch": 1.32, + "learning_rate": 1.2355649935072563e-06, + "loss": 0.7822, + "step": 51686 + }, + { + "epoch": 1.32, + "learning_rate": 1.2355381016485588e-06, + "loss": 0.7188, + "step": 51687 + }, + { + "epoch": 1.32, + "learning_rate": 1.2355112096095206e-06, + "loss": 0.7705, + "step": 51688 + }, + { + "epoch": 1.32, + "learning_rate": 1.2354843173901623e-06, + "loss": 0.7139, + "step": 51689 + }, + { + "epoch": 1.32, + "learning_rate": 1.2354574249905047e-06, + "loss": 0.5459, + "step": 51690 + }, + { + "epoch": 1.32, + "learning_rate": 1.2354305324105677e-06, + "loss": 0.7969, + "step": 51691 + }, + { + "epoch": 1.32, + "learning_rate": 1.2354036396503729e-06, + "loss": 0.603, + "step": 51692 + }, + { + "epoch": 1.32, + "learning_rate": 1.23537674670994e-06, + "loss": 0.6294, + "step": 51693 + }, + { + "epoch": 1.32, + "learning_rate": 1.23534985358929e-06, + "loss": 0.625, + "step": 51694 + }, + { + "epoch": 1.32, + "learning_rate": 1.2353229602884436e-06, + "loss": 0.7349, + "step": 51695 + }, + { + "epoch": 1.32, + "learning_rate": 1.235296066807421e-06, + "loss": 0.8477, + "step": 51696 + }, + { + "epoch": 1.33, + "learning_rate": 1.2352691731462436e-06, + "loss": 0.6729, + "step": 51697 + }, + { + "epoch": 1.33, + "learning_rate": 1.2352422793049306e-06, + "loss": 0.7739, + "step": 51698 + }, + { + "epoch": 1.33, + "learning_rate": 1.2352153852835039e-06, + "loss": 0.6396, + "step": 51699 + }, + { + "epoch": 1.33, + "learning_rate": 1.2351884910819832e-06, + "loss": 0.6724, + "step": 51700 + }, + { + "epoch": 1.33, + "learning_rate": 1.2351615967003898e-06, + "loss": 0.7783, + "step": 51701 + }, + { + "epoch": 1.33, + "learning_rate": 1.235134702138744e-06, + "loss": 0.7832, + "step": 51702 + }, + { + "epoch": 1.33, + "learning_rate": 1.2351078073970665e-06, + "loss": 0.6543, + "step": 51703 + }, + { + "epoch": 1.33, + "learning_rate": 1.2350809124753774e-06, + "loss": 0.8154, + "step": 51704 + }, + { + "epoch": 1.33, + "learning_rate": 1.2350540173736978e-06, + "loss": 0.7754, + "step": 51705 + }, + { + "epoch": 1.33, + "learning_rate": 1.235027122092048e-06, + "loss": 0.6436, + "step": 51706 + }, + { + "epoch": 1.33, + "learning_rate": 1.2350002266304492e-06, + "loss": 0.8145, + "step": 51707 + }, + { + "epoch": 1.33, + "learning_rate": 1.234973330988921e-06, + "loss": 0.6416, + "step": 51708 + }, + { + "epoch": 1.33, + "learning_rate": 1.2349464351674847e-06, + "loss": 0.7451, + "step": 51709 + }, + { + "epoch": 1.33, + "learning_rate": 1.2349195391661606e-06, + "loss": 0.6052, + "step": 51710 + }, + { + "epoch": 1.33, + "learning_rate": 1.2348926429849697e-06, + "loss": 0.6953, + "step": 51711 + }, + { + "epoch": 1.33, + "learning_rate": 1.2348657466239324e-06, + "loss": 0.7734, + "step": 51712 + }, + { + "epoch": 1.33, + "learning_rate": 1.2348388500830689e-06, + "loss": 0.5371, + "step": 51713 + }, + { + "epoch": 1.33, + "learning_rate": 1.2348119533624002e-06, + "loss": 0.5444, + "step": 51714 + }, + { + "epoch": 1.33, + "learning_rate": 1.2347850564619466e-06, + "loss": 0.6963, + "step": 51715 + }, + { + "epoch": 1.33, + "learning_rate": 1.2347581593817291e-06, + "loss": 0.6797, + "step": 51716 + }, + { + "epoch": 1.33, + "learning_rate": 1.234731262121768e-06, + "loss": 0.6006, + "step": 51717 + }, + { + "epoch": 1.33, + "learning_rate": 1.234704364682084e-06, + "loss": 0.6216, + "step": 51718 + }, + { + "epoch": 1.33, + "learning_rate": 1.2346774670626975e-06, + "loss": 0.6525, + "step": 51719 + }, + { + "epoch": 1.33, + "learning_rate": 1.2346505692636296e-06, + "loss": 0.7539, + "step": 51720 + }, + { + "epoch": 1.33, + "learning_rate": 1.2346236712849002e-06, + "loss": 0.4746, + "step": 51721 + }, + { + "epoch": 1.33, + "learning_rate": 1.2345967731265305e-06, + "loss": 0.5469, + "step": 51722 + }, + { + "epoch": 1.33, + "learning_rate": 1.2345698747885407e-06, + "loss": 0.625, + "step": 51723 + }, + { + "epoch": 1.33, + "learning_rate": 1.2345429762709515e-06, + "loss": 0.6025, + "step": 51724 + }, + { + "epoch": 1.33, + "learning_rate": 1.2345160775737835e-06, + "loss": 0.707, + "step": 51725 + }, + { + "epoch": 1.33, + "learning_rate": 1.2344891786970574e-06, + "loss": 0.5791, + "step": 51726 + }, + { + "epoch": 1.33, + "learning_rate": 1.2344622796407938e-06, + "loss": 0.7959, + "step": 51727 + }, + { + "epoch": 1.33, + "learning_rate": 1.2344353804050133e-06, + "loss": 0.6807, + "step": 51728 + }, + { + "epoch": 1.33, + "learning_rate": 1.234408480989736e-06, + "loss": 0.6943, + "step": 51729 + }, + { + "epoch": 1.33, + "learning_rate": 1.234381581394983e-06, + "loss": 0.6426, + "step": 51730 + }, + { + "epoch": 1.33, + "learning_rate": 1.234354681620775e-06, + "loss": 0.6758, + "step": 51731 + }, + { + "epoch": 1.33, + "learning_rate": 1.2343277816671323e-06, + "loss": 0.5957, + "step": 51732 + }, + { + "epoch": 1.33, + "learning_rate": 1.2343008815340756e-06, + "loss": 0.6035, + "step": 51733 + }, + { + "epoch": 1.33, + "learning_rate": 1.2342739812216257e-06, + "loss": 0.7568, + "step": 51734 + }, + { + "epoch": 1.33, + "learning_rate": 1.2342470807298026e-06, + "loss": 0.5935, + "step": 51735 + }, + { + "epoch": 1.33, + "learning_rate": 1.2342201800586275e-06, + "loss": 0.646, + "step": 51736 + }, + { + "epoch": 1.33, + "learning_rate": 1.234193279208121e-06, + "loss": 0.6699, + "step": 51737 + }, + { + "epoch": 1.33, + "learning_rate": 1.2341663781783032e-06, + "loss": 0.5527, + "step": 51738 + }, + { + "epoch": 1.33, + "learning_rate": 1.2341394769691948e-06, + "loss": 0.6572, + "step": 51739 + }, + { + "epoch": 1.33, + "learning_rate": 1.2341125755808168e-06, + "loss": 0.7002, + "step": 51740 + }, + { + "epoch": 1.33, + "learning_rate": 1.2340856740131895e-06, + "loss": 0.4956, + "step": 51741 + }, + { + "epoch": 1.33, + "learning_rate": 1.2340587722663338e-06, + "loss": 0.5908, + "step": 51742 + }, + { + "epoch": 1.33, + "learning_rate": 1.2340318703402698e-06, + "loss": 0.748, + "step": 51743 + }, + { + "epoch": 1.33, + "learning_rate": 1.2340049682350184e-06, + "loss": 0.6738, + "step": 51744 + }, + { + "epoch": 1.33, + "learning_rate": 1.2339780659506002e-06, + "loss": 0.6543, + "step": 51745 + }, + { + "epoch": 1.33, + "learning_rate": 1.2339511634870356e-06, + "loss": 0.6479, + "step": 51746 + }, + { + "epoch": 1.33, + "learning_rate": 1.2339242608443456e-06, + "loss": 0.6406, + "step": 51747 + }, + { + "epoch": 1.33, + "learning_rate": 1.2338973580225505e-06, + "loss": 0.5459, + "step": 51748 + }, + { + "epoch": 1.33, + "learning_rate": 1.233870455021671e-06, + "loss": 0.606, + "step": 51749 + }, + { + "epoch": 1.33, + "learning_rate": 1.2338435518417272e-06, + "loss": 0.5908, + "step": 51750 + }, + { + "epoch": 1.33, + "learning_rate": 1.2338166484827406e-06, + "loss": 0.7285, + "step": 51751 + }, + { + "epoch": 1.33, + "learning_rate": 1.2337897449447314e-06, + "loss": 0.8574, + "step": 51752 + }, + { + "epoch": 1.33, + "learning_rate": 1.2337628412277199e-06, + "loss": 0.8032, + "step": 51753 + }, + { + "epoch": 1.33, + "learning_rate": 1.2337359373317269e-06, + "loss": 0.7139, + "step": 51754 + }, + { + "epoch": 1.33, + "learning_rate": 1.2337090332567732e-06, + "loss": 0.5596, + "step": 51755 + }, + { + "epoch": 1.33, + "learning_rate": 1.2336821290028789e-06, + "loss": 0.6484, + "step": 51756 + }, + { + "epoch": 1.33, + "learning_rate": 1.2336552245700654e-06, + "loss": 0.6309, + "step": 51757 + }, + { + "epoch": 1.33, + "learning_rate": 1.2336283199583528e-06, + "loss": 0.7432, + "step": 51758 + }, + { + "epoch": 1.33, + "learning_rate": 1.2336014151677613e-06, + "loss": 0.5942, + "step": 51759 + }, + { + "epoch": 1.33, + "learning_rate": 1.2335745101983124e-06, + "loss": 0.7291, + "step": 51760 + }, + { + "epoch": 1.33, + "learning_rate": 1.233547605050026e-06, + "loss": 0.5896, + "step": 51761 + }, + { + "epoch": 1.33, + "learning_rate": 1.2335206997229233e-06, + "loss": 0.7236, + "step": 51762 + }, + { + "epoch": 1.33, + "learning_rate": 1.233493794217024e-06, + "loss": 0.6113, + "step": 51763 + }, + { + "epoch": 1.33, + "learning_rate": 1.2334668885323495e-06, + "loss": 0.5737, + "step": 51764 + }, + { + "epoch": 1.33, + "learning_rate": 1.2334399826689202e-06, + "loss": 0.6396, + "step": 51765 + }, + { + "epoch": 1.33, + "learning_rate": 1.2334130766267564e-06, + "loss": 0.5444, + "step": 51766 + }, + { + "epoch": 1.33, + "learning_rate": 1.2333861704058793e-06, + "loss": 0.6982, + "step": 51767 + }, + { + "epoch": 1.33, + "learning_rate": 1.2333592640063089e-06, + "loss": 0.4624, + "step": 51768 + }, + { + "epoch": 1.33, + "learning_rate": 1.2333323574280662e-06, + "loss": 0.708, + "step": 51769 + }, + { + "epoch": 1.33, + "learning_rate": 1.2333054506711713e-06, + "loss": 0.7822, + "step": 51770 + }, + { + "epoch": 1.33, + "learning_rate": 1.2332785437356453e-06, + "loss": 0.6895, + "step": 51771 + }, + { + "epoch": 1.33, + "learning_rate": 1.233251636621509e-06, + "loss": 0.6289, + "step": 51772 + }, + { + "epoch": 1.33, + "learning_rate": 1.2332247293287821e-06, + "loss": 0.6362, + "step": 51773 + }, + { + "epoch": 1.33, + "learning_rate": 1.2331978218574861e-06, + "loss": 0.6982, + "step": 51774 + }, + { + "epoch": 1.33, + "learning_rate": 1.2331709142076409e-06, + "loss": 0.708, + "step": 51775 + }, + { + "epoch": 1.33, + "learning_rate": 1.233144006379268e-06, + "loss": 0.6484, + "step": 51776 + }, + { + "epoch": 1.33, + "learning_rate": 1.233117098372387e-06, + "loss": 0.7188, + "step": 51777 + }, + { + "epoch": 1.33, + "learning_rate": 1.2330901901870193e-06, + "loss": 0.7041, + "step": 51778 + }, + { + "epoch": 1.33, + "learning_rate": 1.233063281823185e-06, + "loss": 0.6963, + "step": 51779 + }, + { + "epoch": 1.33, + "learning_rate": 1.2330363732809047e-06, + "loss": 0.4473, + "step": 51780 + }, + { + "epoch": 1.33, + "learning_rate": 1.2330094645601993e-06, + "loss": 0.626, + "step": 51781 + }, + { + "epoch": 1.33, + "learning_rate": 1.2329825556610893e-06, + "loss": 0.8105, + "step": 51782 + }, + { + "epoch": 1.33, + "learning_rate": 1.2329556465835953e-06, + "loss": 0.5928, + "step": 51783 + }, + { + "epoch": 1.33, + "learning_rate": 1.2329287373277376e-06, + "loss": 0.7773, + "step": 51784 + }, + { + "epoch": 1.33, + "learning_rate": 1.2329018278935374e-06, + "loss": 0.6494, + "step": 51785 + }, + { + "epoch": 1.33, + "learning_rate": 1.2328749182810148e-06, + "loss": 0.4871, + "step": 51786 + }, + { + "epoch": 1.33, + "learning_rate": 1.2328480084901908e-06, + "loss": 0.6284, + "step": 51787 + }, + { + "epoch": 1.33, + "learning_rate": 1.2328210985210855e-06, + "loss": 0.6504, + "step": 51788 + }, + { + "epoch": 1.33, + "learning_rate": 1.2327941883737202e-06, + "loss": 0.5479, + "step": 51789 + }, + { + "epoch": 1.33, + "learning_rate": 1.2327672780481146e-06, + "loss": 0.7402, + "step": 51790 + }, + { + "epoch": 1.33, + "learning_rate": 1.2327403675442903e-06, + "loss": 0.8652, + "step": 51791 + }, + { + "epoch": 1.33, + "learning_rate": 1.232713456862267e-06, + "loss": 0.6196, + "step": 51792 + }, + { + "epoch": 1.33, + "learning_rate": 1.2326865460020659e-06, + "loss": 0.7305, + "step": 51793 + }, + { + "epoch": 1.33, + "learning_rate": 1.2326596349637073e-06, + "loss": 0.7715, + "step": 51794 + }, + { + "epoch": 1.33, + "learning_rate": 1.232632723747212e-06, + "loss": 0.6934, + "step": 51795 + }, + { + "epoch": 1.33, + "learning_rate": 1.2326058123526005e-06, + "loss": 0.7217, + "step": 51796 + }, + { + "epoch": 1.33, + "learning_rate": 1.2325789007798935e-06, + "loss": 0.6533, + "step": 51797 + }, + { + "epoch": 1.33, + "learning_rate": 1.2325519890291113e-06, + "loss": 0.392, + "step": 51798 + }, + { + "epoch": 1.33, + "learning_rate": 1.2325250771002748e-06, + "loss": 0.7051, + "step": 51799 + }, + { + "epoch": 1.33, + "learning_rate": 1.2324981649934044e-06, + "loss": 0.5073, + "step": 51800 + }, + { + "epoch": 1.33, + "learning_rate": 1.2324712527085212e-06, + "loss": 0.9043, + "step": 51801 + }, + { + "epoch": 1.33, + "learning_rate": 1.2324443402456454e-06, + "loss": 0.5459, + "step": 51802 + }, + { + "epoch": 1.33, + "learning_rate": 1.2324174276047977e-06, + "loss": 0.5664, + "step": 51803 + }, + { + "epoch": 1.33, + "learning_rate": 1.2323905147859982e-06, + "loss": 0.5703, + "step": 51804 + }, + { + "epoch": 1.33, + "learning_rate": 1.2323636017892685e-06, + "loss": 0.6919, + "step": 51805 + }, + { + "epoch": 1.33, + "learning_rate": 1.2323366886146284e-06, + "loss": 0.52, + "step": 51806 + }, + { + "epoch": 1.33, + "learning_rate": 1.232309775262099e-06, + "loss": 0.46, + "step": 51807 + }, + { + "epoch": 1.33, + "learning_rate": 1.2322828617317005e-06, + "loss": 0.6406, + "step": 51808 + }, + { + "epoch": 1.33, + "learning_rate": 1.2322559480234536e-06, + "loss": 0.6289, + "step": 51809 + }, + { + "epoch": 1.33, + "learning_rate": 1.2322290341373793e-06, + "loss": 0.7275, + "step": 51810 + }, + { + "epoch": 1.33, + "learning_rate": 1.2322021200734976e-06, + "loss": 0.6943, + "step": 51811 + }, + { + "epoch": 1.33, + "learning_rate": 1.2321752058318297e-06, + "loss": 0.4422, + "step": 51812 + }, + { + "epoch": 1.33, + "learning_rate": 1.2321482914123958e-06, + "loss": 0.5732, + "step": 51813 + }, + { + "epoch": 1.33, + "learning_rate": 1.2321213768152165e-06, + "loss": 0.6865, + "step": 51814 + }, + { + "epoch": 1.33, + "learning_rate": 1.2320944620403127e-06, + "loss": 0.623, + "step": 51815 + }, + { + "epoch": 1.33, + "learning_rate": 1.2320675470877047e-06, + "loss": 0.6934, + "step": 51816 + }, + { + "epoch": 1.33, + "learning_rate": 1.2320406319574135e-06, + "loss": 0.6514, + "step": 51817 + }, + { + "epoch": 1.33, + "learning_rate": 1.2320137166494593e-06, + "loss": 0.461, + "step": 51818 + }, + { + "epoch": 1.33, + "learning_rate": 1.2319868011638629e-06, + "loss": 0.6082, + "step": 51819 + }, + { + "epoch": 1.33, + "learning_rate": 1.2319598855006446e-06, + "loss": 0.748, + "step": 51820 + }, + { + "epoch": 1.33, + "learning_rate": 1.2319329696598254e-06, + "loss": 0.7549, + "step": 51821 + }, + { + "epoch": 1.33, + "learning_rate": 1.231906053641426e-06, + "loss": 0.5791, + "step": 51822 + }, + { + "epoch": 1.33, + "learning_rate": 1.2318791374454667e-06, + "loss": 0.4188, + "step": 51823 + }, + { + "epoch": 1.33, + "learning_rate": 1.2318522210719682e-06, + "loss": 0.7402, + "step": 51824 + }, + { + "epoch": 1.33, + "learning_rate": 1.231825304520951e-06, + "loss": 0.7324, + "step": 51825 + }, + { + "epoch": 1.33, + "learning_rate": 1.2317983877924361e-06, + "loss": 0.5757, + "step": 51826 + }, + { + "epoch": 1.33, + "learning_rate": 1.2317714708864438e-06, + "loss": 0.6143, + "step": 51827 + }, + { + "epoch": 1.33, + "learning_rate": 1.2317445538029944e-06, + "loss": 0.6211, + "step": 51828 + }, + { + "epoch": 1.33, + "learning_rate": 1.2317176365421092e-06, + "loss": 0.7734, + "step": 51829 + }, + { + "epoch": 1.33, + "learning_rate": 1.2316907191038082e-06, + "loss": 0.5811, + "step": 51830 + }, + { + "epoch": 1.33, + "learning_rate": 1.2316638014881123e-06, + "loss": 0.4929, + "step": 51831 + }, + { + "epoch": 1.33, + "learning_rate": 1.2316368836950425e-06, + "loss": 0.6782, + "step": 51832 + }, + { + "epoch": 1.33, + "learning_rate": 1.2316099657246187e-06, + "loss": 0.5217, + "step": 51833 + }, + { + "epoch": 1.33, + "learning_rate": 1.2315830475768614e-06, + "loss": 0.7441, + "step": 51834 + }, + { + "epoch": 1.33, + "learning_rate": 1.2315561292517922e-06, + "loss": 0.4978, + "step": 51835 + }, + { + "epoch": 1.33, + "learning_rate": 1.2315292107494307e-06, + "loss": 0.7139, + "step": 51836 + }, + { + "epoch": 1.33, + "learning_rate": 1.2315022920697983e-06, + "loss": 0.6694, + "step": 51837 + }, + { + "epoch": 1.33, + "learning_rate": 1.231475373212915e-06, + "loss": 0.624, + "step": 51838 + }, + { + "epoch": 1.33, + "learning_rate": 1.2314484541788016e-06, + "loss": 0.5735, + "step": 51839 + }, + { + "epoch": 1.33, + "learning_rate": 1.2314215349674789e-06, + "loss": 0.7031, + "step": 51840 + }, + { + "epoch": 1.33, + "learning_rate": 1.2313946155789674e-06, + "loss": 0.748, + "step": 51841 + }, + { + "epoch": 1.33, + "learning_rate": 1.2313676960132877e-06, + "loss": 0.623, + "step": 51842 + }, + { + "epoch": 1.33, + "learning_rate": 1.2313407762704604e-06, + "loss": 0.6123, + "step": 51843 + }, + { + "epoch": 1.33, + "learning_rate": 1.2313138563505059e-06, + "loss": 0.5737, + "step": 51844 + }, + { + "epoch": 1.33, + "learning_rate": 1.2312869362534452e-06, + "loss": 0.5469, + "step": 51845 + }, + { + "epoch": 1.33, + "learning_rate": 1.2312600159792985e-06, + "loss": 0.5504, + "step": 51846 + }, + { + "epoch": 1.33, + "learning_rate": 1.2312330955280868e-06, + "loss": 0.5244, + "step": 51847 + }, + { + "epoch": 1.33, + "learning_rate": 1.2312061748998308e-06, + "loss": 0.4705, + "step": 51848 + }, + { + "epoch": 1.33, + "learning_rate": 1.2311792540945504e-06, + "loss": 0.7041, + "step": 51849 + }, + { + "epoch": 1.33, + "learning_rate": 1.2311523331122668e-06, + "loss": 0.6875, + "step": 51850 + }, + { + "epoch": 1.33, + "learning_rate": 1.2311254119530005e-06, + "loss": 0.5675, + "step": 51851 + }, + { + "epoch": 1.33, + "learning_rate": 1.2310984906167725e-06, + "loss": 0.6333, + "step": 51852 + }, + { + "epoch": 1.33, + "learning_rate": 1.2310715691036026e-06, + "loss": 0.5999, + "step": 51853 + }, + { + "epoch": 1.33, + "learning_rate": 1.231044647413512e-06, + "loss": 0.7363, + "step": 51854 + }, + { + "epoch": 1.33, + "learning_rate": 1.2310177255465209e-06, + "loss": 0.8066, + "step": 51855 + }, + { + "epoch": 1.33, + "learning_rate": 1.2309908035026507e-06, + "loss": 0.6943, + "step": 51856 + }, + { + "epoch": 1.33, + "learning_rate": 1.2309638812819208e-06, + "loss": 0.6943, + "step": 51857 + }, + { + "epoch": 1.33, + "learning_rate": 1.2309369588843528e-06, + "loss": 0.6548, + "step": 51858 + }, + { + "epoch": 1.33, + "learning_rate": 1.2309100363099668e-06, + "loss": 0.5151, + "step": 51859 + }, + { + "epoch": 1.33, + "learning_rate": 1.2308831135587838e-06, + "loss": 0.6743, + "step": 51860 + }, + { + "epoch": 1.33, + "learning_rate": 1.2308561906308242e-06, + "loss": 0.665, + "step": 51861 + }, + { + "epoch": 1.33, + "learning_rate": 1.2308292675261088e-06, + "loss": 0.6504, + "step": 51862 + }, + { + "epoch": 1.33, + "learning_rate": 1.2308023442446576e-06, + "loss": 0.6714, + "step": 51863 + }, + { + "epoch": 1.33, + "learning_rate": 1.230775420786492e-06, + "loss": 0.7285, + "step": 51864 + }, + { + "epoch": 1.33, + "learning_rate": 1.230748497151632e-06, + "loss": 0.5532, + "step": 51865 + }, + { + "epoch": 1.33, + "learning_rate": 1.2307215733400987e-06, + "loss": 0.709, + "step": 51866 + }, + { + "epoch": 1.33, + "learning_rate": 1.2306946493519124e-06, + "loss": 0.7109, + "step": 51867 + }, + { + "epoch": 1.33, + "learning_rate": 1.2306677251870937e-06, + "loss": 0.4124, + "step": 51868 + }, + { + "epoch": 1.33, + "learning_rate": 1.2306408008456636e-06, + "loss": 0.3708, + "step": 51869 + }, + { + "epoch": 1.33, + "learning_rate": 1.2306138763276424e-06, + "loss": 0.6733, + "step": 51870 + }, + { + "epoch": 1.33, + "learning_rate": 1.2305869516330507e-06, + "loss": 0.7051, + "step": 51871 + }, + { + "epoch": 1.33, + "learning_rate": 1.2305600267619093e-06, + "loss": 0.791, + "step": 51872 + }, + { + "epoch": 1.33, + "learning_rate": 1.2305331017142383e-06, + "loss": 0.5637, + "step": 51873 + }, + { + "epoch": 1.33, + "learning_rate": 1.230506176490059e-06, + "loss": 0.5371, + "step": 51874 + }, + { + "epoch": 1.33, + "learning_rate": 1.2304792510893918e-06, + "loss": 0.9038, + "step": 51875 + }, + { + "epoch": 1.33, + "learning_rate": 1.230452325512257e-06, + "loss": 0.6929, + "step": 51876 + }, + { + "epoch": 1.33, + "learning_rate": 1.2304253997586758e-06, + "loss": 0.4978, + "step": 51877 + }, + { + "epoch": 1.33, + "learning_rate": 1.230398473828668e-06, + "loss": 0.6865, + "step": 51878 + }, + { + "epoch": 1.33, + "learning_rate": 1.230371547722255e-06, + "loss": 0.6875, + "step": 51879 + }, + { + "epoch": 1.33, + "learning_rate": 1.2303446214394569e-06, + "loss": 0.6094, + "step": 51880 + }, + { + "epoch": 1.33, + "learning_rate": 1.2303176949802949e-06, + "loss": 0.8096, + "step": 51881 + }, + { + "epoch": 1.33, + "learning_rate": 1.2302907683447886e-06, + "loss": 0.4673, + "step": 51882 + }, + { + "epoch": 1.33, + "learning_rate": 1.2302638415329598e-06, + "loss": 0.6748, + "step": 51883 + }, + { + "epoch": 1.33, + "learning_rate": 1.230236914544828e-06, + "loss": 0.6992, + "step": 51884 + }, + { + "epoch": 1.33, + "learning_rate": 1.230209987380415e-06, + "loss": 0.7148, + "step": 51885 + }, + { + "epoch": 1.33, + "learning_rate": 1.2301830600397407e-06, + "loss": 0.4826, + "step": 51886 + }, + { + "epoch": 1.33, + "learning_rate": 1.2301561325228258e-06, + "loss": 0.5703, + "step": 51887 + }, + { + "epoch": 1.33, + "learning_rate": 1.2301292048296905e-06, + "loss": 0.7451, + "step": 51888 + }, + { + "epoch": 1.33, + "learning_rate": 1.230102276960356e-06, + "loss": 0.4819, + "step": 51889 + }, + { + "epoch": 1.33, + "learning_rate": 1.230075348914843e-06, + "loss": 0.6072, + "step": 51890 + }, + { + "epoch": 1.33, + "learning_rate": 1.230048420693172e-06, + "loss": 0.4675, + "step": 51891 + }, + { + "epoch": 1.33, + "learning_rate": 1.2300214922953633e-06, + "loss": 0.6206, + "step": 51892 + }, + { + "epoch": 1.33, + "learning_rate": 1.2299945637214376e-06, + "loss": 0.7544, + "step": 51893 + }, + { + "epoch": 1.33, + "learning_rate": 1.2299676349714157e-06, + "loss": 0.7451, + "step": 51894 + }, + { + "epoch": 1.33, + "learning_rate": 1.229940706045318e-06, + "loss": 0.5957, + "step": 51895 + }, + { + "epoch": 1.33, + "learning_rate": 1.229913776943166e-06, + "loss": 0.5493, + "step": 51896 + }, + { + "epoch": 1.33, + "learning_rate": 1.2298868476649788e-06, + "loss": 0.626, + "step": 51897 + }, + { + "epoch": 1.33, + "learning_rate": 1.2298599182107784e-06, + "loss": 0.5977, + "step": 51898 + }, + { + "epoch": 1.33, + "learning_rate": 1.229832988580584e-06, + "loss": 0.5874, + "step": 51899 + }, + { + "epoch": 1.33, + "learning_rate": 1.2298060587744177e-06, + "loss": 0.4788, + "step": 51900 + }, + { + "epoch": 1.33, + "learning_rate": 1.2297791287922995e-06, + "loss": 0.7822, + "step": 51901 + }, + { + "epoch": 1.33, + "learning_rate": 1.22975219863425e-06, + "loss": 0.5991, + "step": 51902 + }, + { + "epoch": 1.33, + "learning_rate": 1.2297252683002895e-06, + "loss": 0.6069, + "step": 51903 + }, + { + "epoch": 1.33, + "learning_rate": 1.2296983377904391e-06, + "loss": 0.8447, + "step": 51904 + }, + { + "epoch": 1.33, + "learning_rate": 1.2296714071047189e-06, + "loss": 0.7734, + "step": 51905 + }, + { + "epoch": 1.33, + "learning_rate": 1.2296444762431506e-06, + "loss": 0.8398, + "step": 51906 + }, + { + "epoch": 1.33, + "learning_rate": 1.2296175452057533e-06, + "loss": 0.5698, + "step": 51907 + }, + { + "epoch": 1.33, + "learning_rate": 1.229590613992549e-06, + "loss": 0.7109, + "step": 51908 + }, + { + "epoch": 1.33, + "learning_rate": 1.2295636826035574e-06, + "loss": 0.5703, + "step": 51909 + }, + { + "epoch": 1.33, + "learning_rate": 1.2295367510387995e-06, + "loss": 0.7539, + "step": 51910 + }, + { + "epoch": 1.33, + "learning_rate": 1.229509819298296e-06, + "loss": 0.5859, + "step": 51911 + }, + { + "epoch": 1.33, + "learning_rate": 1.229482887382067e-06, + "loss": 0.7334, + "step": 51912 + }, + { + "epoch": 1.33, + "learning_rate": 1.2294559552901338e-06, + "loss": 0.3345, + "step": 51913 + }, + { + "epoch": 1.33, + "learning_rate": 1.2294290230225166e-06, + "loss": 0.7529, + "step": 51914 + }, + { + "epoch": 1.33, + "learning_rate": 1.2294020905792365e-06, + "loss": 0.6042, + "step": 51915 + }, + { + "epoch": 1.33, + "learning_rate": 1.2293751579603133e-06, + "loss": 0.7432, + "step": 51916 + }, + { + "epoch": 1.33, + "learning_rate": 1.2293482251657685e-06, + "loss": 0.6362, + "step": 51917 + }, + { + "epoch": 1.33, + "learning_rate": 1.229321292195622e-06, + "loss": 0.7656, + "step": 51918 + }, + { + "epoch": 1.33, + "learning_rate": 1.2292943590498947e-06, + "loss": 0.7363, + "step": 51919 + }, + { + "epoch": 1.33, + "learning_rate": 1.2292674257286073e-06, + "loss": 0.5181, + "step": 51920 + }, + { + "epoch": 1.33, + "learning_rate": 1.229240492231781e-06, + "loss": 0.6025, + "step": 51921 + }, + { + "epoch": 1.33, + "learning_rate": 1.229213558559435e-06, + "loss": 0.5656, + "step": 51922 + }, + { + "epoch": 1.33, + "learning_rate": 1.2291866247115909e-06, + "loss": 0.7432, + "step": 51923 + }, + { + "epoch": 1.33, + "learning_rate": 1.229159690688269e-06, + "loss": 0.6528, + "step": 51924 + }, + { + "epoch": 1.33, + "learning_rate": 1.2291327564894904e-06, + "loss": 0.8027, + "step": 51925 + }, + { + "epoch": 1.33, + "learning_rate": 1.2291058221152754e-06, + "loss": 0.6694, + "step": 51926 + }, + { + "epoch": 1.33, + "learning_rate": 1.2290788875656446e-06, + "loss": 0.7129, + "step": 51927 + }, + { + "epoch": 1.33, + "learning_rate": 1.2290519528406184e-06, + "loss": 0.6587, + "step": 51928 + }, + { + "epoch": 1.33, + "learning_rate": 1.2290250179402178e-06, + "loss": 0.7163, + "step": 51929 + }, + { + "epoch": 1.33, + "learning_rate": 1.228998082864463e-06, + "loss": 0.8184, + "step": 51930 + }, + { + "epoch": 1.33, + "learning_rate": 1.2289711476133754e-06, + "loss": 0.6602, + "step": 51931 + }, + { + "epoch": 1.33, + "learning_rate": 1.2289442121869748e-06, + "loss": 0.6826, + "step": 51932 + }, + { + "epoch": 1.33, + "learning_rate": 1.2289172765852822e-06, + "loss": 0.6406, + "step": 51933 + }, + { + "epoch": 1.33, + "learning_rate": 1.228890340808318e-06, + "loss": 0.7822, + "step": 51934 + }, + { + "epoch": 1.33, + "learning_rate": 1.2288634048561032e-06, + "loss": 0.4639, + "step": 51935 + }, + { + "epoch": 1.33, + "learning_rate": 1.2288364687286583e-06, + "loss": 0.7314, + "step": 51936 + }, + { + "epoch": 1.33, + "learning_rate": 1.2288095324260034e-06, + "loss": 0.7324, + "step": 51937 + }, + { + "epoch": 1.33, + "learning_rate": 1.22878259594816e-06, + "loss": 0.6636, + "step": 51938 + }, + { + "epoch": 1.33, + "learning_rate": 1.228755659295148e-06, + "loss": 0.7676, + "step": 51939 + }, + { + "epoch": 1.33, + "learning_rate": 1.2287287224669887e-06, + "loss": 0.6289, + "step": 51940 + }, + { + "epoch": 1.33, + "learning_rate": 1.228701785463702e-06, + "loss": 0.7842, + "step": 51941 + }, + { + "epoch": 1.33, + "learning_rate": 1.228674848285309e-06, + "loss": 0.7617, + "step": 51942 + }, + { + "epoch": 1.33, + "learning_rate": 1.22864791093183e-06, + "loss": 0.6294, + "step": 51943 + }, + { + "epoch": 1.33, + "learning_rate": 1.2286209734032863e-06, + "loss": 0.3983, + "step": 51944 + }, + { + "epoch": 1.33, + "learning_rate": 1.2285940356996973e-06, + "loss": 0.6572, + "step": 51945 + }, + { + "epoch": 1.33, + "learning_rate": 1.2285670978210849e-06, + "loss": 0.7725, + "step": 51946 + }, + { + "epoch": 1.33, + "learning_rate": 1.2285401597674689e-06, + "loss": 0.4485, + "step": 51947 + }, + { + "epoch": 1.33, + "learning_rate": 1.2285132215388705e-06, + "loss": 0.6562, + "step": 51948 + }, + { + "epoch": 1.33, + "learning_rate": 1.2284862831353098e-06, + "loss": 0.5981, + "step": 51949 + }, + { + "epoch": 1.33, + "learning_rate": 1.2284593445568076e-06, + "loss": 0.5347, + "step": 51950 + }, + { + "epoch": 1.33, + "learning_rate": 1.2284324058033848e-06, + "loss": 0.6841, + "step": 51951 + }, + { + "epoch": 1.33, + "learning_rate": 1.2284054668750618e-06, + "loss": 0.5258, + "step": 51952 + }, + { + "epoch": 1.33, + "learning_rate": 1.228378527771859e-06, + "loss": 0.75, + "step": 51953 + }, + { + "epoch": 1.33, + "learning_rate": 1.2283515884937977e-06, + "loss": 0.436, + "step": 51954 + }, + { + "epoch": 1.33, + "learning_rate": 1.2283246490408976e-06, + "loss": 0.7402, + "step": 51955 + }, + { + "epoch": 1.33, + "learning_rate": 1.22829770941318e-06, + "loss": 0.7725, + "step": 51956 + }, + { + "epoch": 1.33, + "learning_rate": 1.2282707696106653e-06, + "loss": 0.8018, + "step": 51957 + }, + { + "epoch": 1.33, + "learning_rate": 1.2282438296333742e-06, + "loss": 0.7441, + "step": 51958 + }, + { + "epoch": 1.33, + "learning_rate": 1.2282168894813274e-06, + "loss": 0.5083, + "step": 51959 + }, + { + "epoch": 1.33, + "learning_rate": 1.2281899491545454e-06, + "loss": 0.5947, + "step": 51960 + }, + { + "epoch": 1.33, + "learning_rate": 1.2281630086530489e-06, + "loss": 0.666, + "step": 51961 + }, + { + "epoch": 1.33, + "learning_rate": 1.2281360679768581e-06, + "loss": 0.6387, + "step": 51962 + }, + { + "epoch": 1.33, + "learning_rate": 1.2281091271259944e-06, + "loss": 0.7871, + "step": 51963 + }, + { + "epoch": 1.33, + "learning_rate": 1.2280821861004777e-06, + "loss": 0.7881, + "step": 51964 + }, + { + "epoch": 1.33, + "learning_rate": 1.2280552449003291e-06, + "loss": 0.6606, + "step": 51965 + }, + { + "epoch": 1.33, + "learning_rate": 1.2280283035255693e-06, + "loss": 0.5974, + "step": 51966 + }, + { + "epoch": 1.33, + "learning_rate": 1.2280013619762187e-06, + "loss": 0.7275, + "step": 51967 + }, + { + "epoch": 1.33, + "learning_rate": 1.2279744202522978e-06, + "loss": 0.9072, + "step": 51968 + }, + { + "epoch": 1.33, + "learning_rate": 1.2279474783538273e-06, + "loss": 0.6826, + "step": 51969 + }, + { + "epoch": 1.33, + "learning_rate": 1.2279205362808277e-06, + "loss": 0.6543, + "step": 51970 + }, + { + "epoch": 1.33, + "learning_rate": 1.2278935940333204e-06, + "loss": 0.7295, + "step": 51971 + }, + { + "epoch": 1.33, + "learning_rate": 1.227866651611325e-06, + "loss": 0.5308, + "step": 51972 + }, + { + "epoch": 1.33, + "learning_rate": 1.227839709014863e-06, + "loss": 0.5264, + "step": 51973 + }, + { + "epoch": 1.33, + "learning_rate": 1.2278127662439542e-06, + "loss": 0.7871, + "step": 51974 + }, + { + "epoch": 1.33, + "learning_rate": 1.2277858232986198e-06, + "loss": 0.6523, + "step": 51975 + }, + { + "epoch": 1.33, + "learning_rate": 1.22775888017888e-06, + "loss": 0.6245, + "step": 51976 + }, + { + "epoch": 1.33, + "learning_rate": 1.2277319368847561e-06, + "loss": 0.5828, + "step": 51977 + }, + { + "epoch": 1.33, + "learning_rate": 1.2277049934162681e-06, + "loss": 0.707, + "step": 51978 + }, + { + "epoch": 1.33, + "learning_rate": 1.227678049773437e-06, + "loss": 0.5806, + "step": 51979 + }, + { + "epoch": 1.33, + "learning_rate": 1.2276511059562831e-06, + "loss": 0.7285, + "step": 51980 + }, + { + "epoch": 1.33, + "learning_rate": 1.2276241619648273e-06, + "loss": 0.7969, + "step": 51981 + }, + { + "epoch": 1.33, + "learning_rate": 1.2275972177990903e-06, + "loss": 0.6294, + "step": 51982 + }, + { + "epoch": 1.33, + "learning_rate": 1.2275702734590922e-06, + "loss": 0.4729, + "step": 51983 + }, + { + "epoch": 1.33, + "learning_rate": 1.2275433289448544e-06, + "loss": 0.7656, + "step": 51984 + }, + { + "epoch": 1.33, + "learning_rate": 1.227516384256397e-06, + "loss": 0.573, + "step": 51985 + }, + { + "epoch": 1.33, + "learning_rate": 1.227489439393741e-06, + "loss": 0.7461, + "step": 51986 + }, + { + "epoch": 1.33, + "learning_rate": 1.2274624943569062e-06, + "loss": 0.6206, + "step": 51987 + }, + { + "epoch": 1.33, + "learning_rate": 1.2274355491459143e-06, + "loss": 0.7793, + "step": 51988 + }, + { + "epoch": 1.33, + "learning_rate": 1.2274086037607854e-06, + "loss": 0.585, + "step": 51989 + }, + { + "epoch": 1.33, + "learning_rate": 1.2273816582015401e-06, + "loss": 0.7725, + "step": 51990 + }, + { + "epoch": 1.33, + "learning_rate": 1.227354712468199e-06, + "loss": 0.7871, + "step": 51991 + }, + { + "epoch": 1.33, + "learning_rate": 1.2273277665607833e-06, + "loss": 0.7822, + "step": 51992 + }, + { + "epoch": 1.33, + "learning_rate": 1.2273008204793128e-06, + "loss": 0.6895, + "step": 51993 + }, + { + "epoch": 1.33, + "learning_rate": 1.2272738742238085e-06, + "loss": 0.7285, + "step": 51994 + }, + { + "epoch": 1.33, + "learning_rate": 1.227246927794291e-06, + "loss": 0.6782, + "step": 51995 + }, + { + "epoch": 1.33, + "learning_rate": 1.2272199811907813e-06, + "loss": 0.6851, + "step": 51996 + }, + { + "epoch": 1.33, + "learning_rate": 1.2271930344132994e-06, + "loss": 0.7578, + "step": 51997 + }, + { + "epoch": 1.33, + "learning_rate": 1.2271660874618665e-06, + "loss": 0.6079, + "step": 51998 + }, + { + "epoch": 1.33, + "learning_rate": 1.2271391403365029e-06, + "loss": 0.5635, + "step": 51999 + }, + { + "epoch": 1.33, + "learning_rate": 1.227112193037229e-06, + "loss": 0.7236, + "step": 52000 + }, + { + "epoch": 1.33, + "learning_rate": 1.2270852455640662e-06, + "loss": 0.6504, + "step": 52001 + }, + { + "epoch": 1.33, + "learning_rate": 1.2270582979170344e-06, + "loss": 0.5835, + "step": 52002 + }, + { + "epoch": 1.33, + "learning_rate": 1.2270313500961544e-06, + "loss": 0.792, + "step": 52003 + }, + { + "epoch": 1.33, + "learning_rate": 1.227004402101447e-06, + "loss": 0.5269, + "step": 52004 + }, + { + "epoch": 1.33, + "learning_rate": 1.226977453932933e-06, + "loss": 0.5938, + "step": 52005 + }, + { + "epoch": 1.33, + "learning_rate": 1.2269505055906327e-06, + "loss": 0.6191, + "step": 52006 + }, + { + "epoch": 1.33, + "learning_rate": 1.226923557074567e-06, + "loss": 0.7051, + "step": 52007 + }, + { + "epoch": 1.33, + "learning_rate": 1.2268966083847559e-06, + "loss": 0.522, + "step": 52008 + }, + { + "epoch": 1.33, + "learning_rate": 1.2268696595212207e-06, + "loss": 0.7998, + "step": 52009 + }, + { + "epoch": 1.33, + "learning_rate": 1.226842710483982e-06, + "loss": 0.7451, + "step": 52010 + }, + { + "epoch": 1.33, + "learning_rate": 1.22681576127306e-06, + "loss": 0.5908, + "step": 52011 + }, + { + "epoch": 1.33, + "learning_rate": 1.2267888118884757e-06, + "loss": 0.6758, + "step": 52012 + }, + { + "epoch": 1.33, + "learning_rate": 1.2267618623302499e-06, + "loss": 0.6777, + "step": 52013 + }, + { + "epoch": 1.33, + "learning_rate": 1.2267349125984026e-06, + "loss": 0.6562, + "step": 52014 + }, + { + "epoch": 1.33, + "learning_rate": 1.2267079626929548e-06, + "loss": 0.5693, + "step": 52015 + }, + { + "epoch": 1.33, + "learning_rate": 1.2266810126139276e-06, + "loss": 0.4524, + "step": 52016 + }, + { + "epoch": 1.33, + "learning_rate": 1.226654062361341e-06, + "loss": 0.7617, + "step": 52017 + }, + { + "epoch": 1.33, + "learning_rate": 1.2266271119352155e-06, + "loss": 0.5396, + "step": 52018 + }, + { + "epoch": 1.33, + "learning_rate": 1.226600161335572e-06, + "loss": 0.5625, + "step": 52019 + }, + { + "epoch": 1.33, + "learning_rate": 1.2265732105624314e-06, + "loss": 0.8691, + "step": 52020 + }, + { + "epoch": 1.33, + "learning_rate": 1.226546259615814e-06, + "loss": 0.7744, + "step": 52021 + }, + { + "epoch": 1.33, + "learning_rate": 1.2265193084957408e-06, + "loss": 0.6592, + "step": 52022 + }, + { + "epoch": 1.33, + "learning_rate": 1.226492357202232e-06, + "loss": 0.6914, + "step": 52023 + }, + { + "epoch": 1.33, + "learning_rate": 1.2264654057353085e-06, + "loss": 0.4208, + "step": 52024 + }, + { + "epoch": 1.33, + "learning_rate": 1.226438454094991e-06, + "loss": 0.4604, + "step": 52025 + }, + { + "epoch": 1.33, + "learning_rate": 1.2264115022812997e-06, + "loss": 0.6318, + "step": 52026 + }, + { + "epoch": 1.33, + "learning_rate": 1.2263845502942553e-06, + "loss": 0.7461, + "step": 52027 + }, + { + "epoch": 1.33, + "learning_rate": 1.2263575981338792e-06, + "loss": 0.7705, + "step": 52028 + }, + { + "epoch": 1.33, + "learning_rate": 1.2263306458001909e-06, + "loss": 0.7773, + "step": 52029 + }, + { + "epoch": 1.33, + "learning_rate": 1.2263036932932123e-06, + "loss": 0.5903, + "step": 52030 + }, + { + "epoch": 1.33, + "learning_rate": 1.2262767406129631e-06, + "loss": 0.7061, + "step": 52031 + }, + { + "epoch": 1.33, + "learning_rate": 1.2262497877594642e-06, + "loss": 0.5767, + "step": 52032 + }, + { + "epoch": 1.33, + "learning_rate": 1.2262228347327358e-06, + "loss": 0.6982, + "step": 52033 + }, + { + "epoch": 1.33, + "learning_rate": 1.2261958815327998e-06, + "loss": 0.6812, + "step": 52034 + }, + { + "epoch": 1.33, + "learning_rate": 1.2261689281596752e-06, + "loss": 0.6172, + "step": 52035 + }, + { + "epoch": 1.33, + "learning_rate": 1.2261419746133842e-06, + "loss": 0.605, + "step": 52036 + }, + { + "epoch": 1.33, + "learning_rate": 1.2261150208939461e-06, + "loss": 0.5776, + "step": 52037 + }, + { + "epoch": 1.33, + "learning_rate": 1.2260880670013824e-06, + "loss": 0.6167, + "step": 52038 + }, + { + "epoch": 1.33, + "learning_rate": 1.2260611129357135e-06, + "loss": 0.6592, + "step": 52039 + }, + { + "epoch": 1.33, + "learning_rate": 1.22603415869696e-06, + "loss": 0.6943, + "step": 52040 + }, + { + "epoch": 1.33, + "learning_rate": 1.2260072042851423e-06, + "loss": 0.5617, + "step": 52041 + }, + { + "epoch": 1.33, + "learning_rate": 1.2259802497002816e-06, + "loss": 0.7285, + "step": 52042 + }, + { + "epoch": 1.33, + "learning_rate": 1.2259532949423978e-06, + "loss": 0.7783, + "step": 52043 + }, + { + "epoch": 1.33, + "learning_rate": 1.2259263400115125e-06, + "loss": 0.7871, + "step": 52044 + }, + { + "epoch": 1.33, + "learning_rate": 1.2258993849076452e-06, + "loss": 0.6594, + "step": 52045 + }, + { + "epoch": 1.33, + "learning_rate": 1.2258724296308177e-06, + "loss": 0.5889, + "step": 52046 + }, + { + "epoch": 1.33, + "learning_rate": 1.2258454741810499e-06, + "loss": 0.7715, + "step": 52047 + }, + { + "epoch": 1.33, + "learning_rate": 1.225818518558362e-06, + "loss": 0.5569, + "step": 52048 + }, + { + "epoch": 1.33, + "learning_rate": 1.225791562762776e-06, + "loss": 0.6367, + "step": 52049 + }, + { + "epoch": 1.33, + "learning_rate": 1.2257646067943114e-06, + "loss": 0.5774, + "step": 52050 + }, + { + "epoch": 1.33, + "learning_rate": 1.2257376506529895e-06, + "loss": 0.6592, + "step": 52051 + }, + { + "epoch": 1.33, + "learning_rate": 1.2257106943388306e-06, + "loss": 0.6885, + "step": 52052 + }, + { + "epoch": 1.33, + "learning_rate": 1.2256837378518553e-06, + "loss": 0.6514, + "step": 52053 + }, + { + "epoch": 1.33, + "learning_rate": 1.2256567811920842e-06, + "loss": 0.7285, + "step": 52054 + }, + { + "epoch": 1.33, + "learning_rate": 1.2256298243595381e-06, + "loss": 0.6396, + "step": 52055 + }, + { + "epoch": 1.33, + "learning_rate": 1.2256028673542377e-06, + "loss": 0.7168, + "step": 52056 + }, + { + "epoch": 1.33, + "learning_rate": 1.2255759101762039e-06, + "loss": 0.3921, + "step": 52057 + }, + { + "epoch": 1.33, + "learning_rate": 1.2255489528254566e-06, + "loss": 0.583, + "step": 52058 + }, + { + "epoch": 1.33, + "learning_rate": 1.2255219953020168e-06, + "loss": 0.6953, + "step": 52059 + }, + { + "epoch": 1.33, + "learning_rate": 1.2254950376059052e-06, + "loss": 0.5688, + "step": 52060 + }, + { + "epoch": 1.33, + "learning_rate": 1.2254680797371428e-06, + "loss": 0.6725, + "step": 52061 + }, + { + "epoch": 1.33, + "learning_rate": 1.2254411216957494e-06, + "loss": 0.5503, + "step": 52062 + }, + { + "epoch": 1.33, + "learning_rate": 1.2254141634817464e-06, + "loss": 0.4736, + "step": 52063 + }, + { + "epoch": 1.33, + "learning_rate": 1.225387205095154e-06, + "loss": 0.5679, + "step": 52064 + }, + { + "epoch": 1.33, + "learning_rate": 1.2253602465359929e-06, + "loss": 0.8252, + "step": 52065 + }, + { + "epoch": 1.33, + "learning_rate": 1.2253332878042841e-06, + "loss": 0.5625, + "step": 52066 + }, + { + "epoch": 1.33, + "learning_rate": 1.2253063289000475e-06, + "loss": 0.554, + "step": 52067 + }, + { + "epoch": 1.33, + "learning_rate": 1.2252793698233045e-06, + "loss": 0.7168, + "step": 52068 + }, + { + "epoch": 1.33, + "learning_rate": 1.2252524105740756e-06, + "loss": 0.5684, + "step": 52069 + }, + { + "epoch": 1.33, + "learning_rate": 1.225225451152381e-06, + "loss": 0.6968, + "step": 52070 + }, + { + "epoch": 1.33, + "learning_rate": 1.2251984915582418e-06, + "loss": 0.668, + "step": 52071 + }, + { + "epoch": 1.33, + "learning_rate": 1.2251715317916786e-06, + "loss": 0.541, + "step": 52072 + }, + { + "epoch": 1.33, + "learning_rate": 1.2251445718527116e-06, + "loss": 0.6514, + "step": 52073 + }, + { + "epoch": 1.33, + "learning_rate": 1.225117611741362e-06, + "loss": 0.6631, + "step": 52074 + }, + { + "epoch": 1.33, + "learning_rate": 1.2250906514576498e-06, + "loss": 0.7295, + "step": 52075 + }, + { + "epoch": 1.33, + "learning_rate": 1.2250636910015965e-06, + "loss": 0.6934, + "step": 52076 + }, + { + "epoch": 1.33, + "learning_rate": 1.2250367303732222e-06, + "loss": 0.7178, + "step": 52077 + }, + { + "epoch": 1.33, + "learning_rate": 1.2250097695725474e-06, + "loss": 0.7803, + "step": 52078 + }, + { + "epoch": 1.33, + "learning_rate": 1.224982808599593e-06, + "loss": 0.7666, + "step": 52079 + }, + { + "epoch": 1.33, + "learning_rate": 1.2249558474543798e-06, + "loss": 0.627, + "step": 52080 + }, + { + "epoch": 1.33, + "learning_rate": 1.2249288861369283e-06, + "loss": 0.7822, + "step": 52081 + }, + { + "epoch": 1.33, + "learning_rate": 1.2249019246472589e-06, + "loss": 0.7646, + "step": 52082 + }, + { + "epoch": 1.33, + "learning_rate": 1.2248749629853923e-06, + "loss": 0.7285, + "step": 52083 + }, + { + "epoch": 1.33, + "learning_rate": 1.2248480011513496e-06, + "loss": 0.624, + "step": 52084 + }, + { + "epoch": 1.33, + "learning_rate": 1.2248210391451508e-06, + "loss": 0.481, + "step": 52085 + }, + { + "epoch": 1.33, + "learning_rate": 1.2247940769668174e-06, + "loss": 0.7983, + "step": 52086 + }, + { + "epoch": 1.34, + "learning_rate": 1.224767114616369e-06, + "loss": 0.6255, + "step": 52087 + }, + { + "epoch": 1.34, + "learning_rate": 1.224740152093827e-06, + "loss": 0.7852, + "step": 52088 + }, + { + "epoch": 1.34, + "learning_rate": 1.2247131893992115e-06, + "loss": 0.606, + "step": 52089 + }, + { + "epoch": 1.34, + "learning_rate": 1.2246862265325437e-06, + "loss": 0.5791, + "step": 52090 + }, + { + "epoch": 1.34, + "learning_rate": 1.2246592634938442e-06, + "loss": 0.5605, + "step": 52091 + }, + { + "epoch": 1.34, + "learning_rate": 1.224632300283133e-06, + "loss": 0.6255, + "step": 52092 + }, + { + "epoch": 1.34, + "learning_rate": 1.2246053369004314e-06, + "loss": 0.604, + "step": 52093 + }, + { + "epoch": 1.34, + "learning_rate": 1.2245783733457596e-06, + "loss": 0.792, + "step": 52094 + }, + { + "epoch": 1.34, + "learning_rate": 1.2245514096191386e-06, + "loss": 0.7334, + "step": 52095 + }, + { + "epoch": 1.34, + "learning_rate": 1.2245244457205893e-06, + "loss": 0.668, + "step": 52096 + }, + { + "epoch": 1.34, + "learning_rate": 1.2244974816501314e-06, + "loss": 0.4081, + "step": 52097 + }, + { + "epoch": 1.34, + "learning_rate": 1.2244705174077862e-06, + "loss": 0.6494, + "step": 52098 + }, + { + "epoch": 1.34, + "learning_rate": 1.2244435529935746e-06, + "loss": 0.7773, + "step": 52099 + }, + { + "epoch": 1.34, + "learning_rate": 1.2244165884075164e-06, + "loss": 0.7773, + "step": 52100 + }, + { + "epoch": 1.34, + "learning_rate": 1.2243896236496334e-06, + "loss": 0.8467, + "step": 52101 + }, + { + "epoch": 1.34, + "learning_rate": 1.224362658719945e-06, + "loss": 0.6978, + "step": 52102 + }, + { + "epoch": 1.34, + "learning_rate": 1.2243356936184726e-06, + "loss": 0.5728, + "step": 52103 + }, + { + "epoch": 1.34, + "learning_rate": 1.2243087283452364e-06, + "loss": 0.625, + "step": 52104 + }, + { + "epoch": 1.34, + "learning_rate": 1.2242817629002577e-06, + "loss": 0.5156, + "step": 52105 + }, + { + "epoch": 1.34, + "learning_rate": 1.2242547972835569e-06, + "loss": 0.6069, + "step": 52106 + }, + { + "epoch": 1.34, + "learning_rate": 1.2242278314951542e-06, + "loss": 0.7529, + "step": 52107 + }, + { + "epoch": 1.34, + "learning_rate": 1.2242008655350706e-06, + "loss": 0.7412, + "step": 52108 + }, + { + "epoch": 1.34, + "learning_rate": 1.2241738994033267e-06, + "loss": 0.6934, + "step": 52109 + }, + { + "epoch": 1.34, + "learning_rate": 1.2241469330999433e-06, + "loss": 0.5872, + "step": 52110 + }, + { + "epoch": 1.34, + "learning_rate": 1.2241199666249408e-06, + "loss": 0.6572, + "step": 52111 + }, + { + "epoch": 1.34, + "learning_rate": 1.2240929999783398e-06, + "loss": 0.3173, + "step": 52112 + }, + { + "epoch": 1.34, + "learning_rate": 1.2240660331601614e-06, + "loss": 0.5632, + "step": 52113 + }, + { + "epoch": 1.34, + "learning_rate": 1.2240390661704257e-06, + "loss": 0.4365, + "step": 52114 + }, + { + "epoch": 1.34, + "learning_rate": 1.2240120990091537e-06, + "loss": 0.5957, + "step": 52115 + }, + { + "epoch": 1.34, + "learning_rate": 1.2239851316763658e-06, + "loss": 0.5698, + "step": 52116 + }, + { + "epoch": 1.34, + "learning_rate": 1.223958164172083e-06, + "loss": 0.6406, + "step": 52117 + }, + { + "epoch": 1.34, + "learning_rate": 1.2239311964963254e-06, + "loss": 0.6523, + "step": 52118 + }, + { + "epoch": 1.34, + "learning_rate": 1.223904228649114e-06, + "loss": 0.7139, + "step": 52119 + }, + { + "epoch": 1.34, + "learning_rate": 1.2238772606304698e-06, + "loss": 0.6279, + "step": 52120 + }, + { + "epoch": 1.34, + "learning_rate": 1.223850292440413e-06, + "loss": 0.7236, + "step": 52121 + }, + { + "epoch": 1.34, + "learning_rate": 1.2238233240789644e-06, + "loss": 0.6738, + "step": 52122 + }, + { + "epoch": 1.34, + "learning_rate": 1.223796355546144e-06, + "loss": 0.7051, + "step": 52123 + }, + { + "epoch": 1.34, + "learning_rate": 1.2237693868419738e-06, + "loss": 0.6289, + "step": 52124 + }, + { + "epoch": 1.34, + "learning_rate": 1.2237424179664731e-06, + "loss": 0.6675, + "step": 52125 + }, + { + "epoch": 1.34, + "learning_rate": 1.2237154489196634e-06, + "loss": 0.6338, + "step": 52126 + }, + { + "epoch": 1.34, + "learning_rate": 1.223688479701565e-06, + "loss": 0.6313, + "step": 52127 + }, + { + "epoch": 1.34, + "learning_rate": 1.2236615103121985e-06, + "loss": 0.6111, + "step": 52128 + }, + { + "epoch": 1.34, + "learning_rate": 1.2236345407515846e-06, + "loss": 0.606, + "step": 52129 + }, + { + "epoch": 1.34, + "learning_rate": 1.2236075710197444e-06, + "loss": 0.6509, + "step": 52130 + }, + { + "epoch": 1.34, + "learning_rate": 1.2235806011166981e-06, + "loss": 0.5195, + "step": 52131 + }, + { + "epoch": 1.34, + "learning_rate": 1.223553631042466e-06, + "loss": 0.5151, + "step": 52132 + }, + { + "epoch": 1.34, + "learning_rate": 1.2235266607970696e-06, + "loss": 0.6875, + "step": 52133 + }, + { + "epoch": 1.34, + "learning_rate": 1.2234996903805289e-06, + "loss": 0.6992, + "step": 52134 + }, + { + "epoch": 1.34, + "learning_rate": 1.2234727197928646e-06, + "loss": 0.585, + "step": 52135 + }, + { + "epoch": 1.34, + "learning_rate": 1.2234457490340978e-06, + "loss": 0.6787, + "step": 52136 + }, + { + "epoch": 1.34, + "learning_rate": 1.223418778104249e-06, + "loss": 0.5825, + "step": 52137 + }, + { + "epoch": 1.34, + "learning_rate": 1.2233918070033382e-06, + "loss": 0.5085, + "step": 52138 + }, + { + "epoch": 1.34, + "learning_rate": 1.2233648357313867e-06, + "loss": 0.6138, + "step": 52139 + }, + { + "epoch": 1.34, + "learning_rate": 1.223337864288415e-06, + "loss": 0.7441, + "step": 52140 + }, + { + "epoch": 1.34, + "learning_rate": 1.2233108926744444e-06, + "loss": 0.7524, + "step": 52141 + }, + { + "epoch": 1.34, + "learning_rate": 1.2232839208894942e-06, + "loss": 0.6279, + "step": 52142 + }, + { + "epoch": 1.34, + "learning_rate": 1.2232569489335863e-06, + "loss": 0.7725, + "step": 52143 + }, + { + "epoch": 1.34, + "learning_rate": 1.2232299768067403e-06, + "loss": 0.8242, + "step": 52144 + }, + { + "epoch": 1.34, + "learning_rate": 1.2232030045089775e-06, + "loss": 0.6777, + "step": 52145 + }, + { + "epoch": 1.34, + "learning_rate": 1.2231760320403189e-06, + "loss": 0.4377, + "step": 52146 + }, + { + "epoch": 1.34, + "learning_rate": 1.2231490594007842e-06, + "loss": 0.4834, + "step": 52147 + }, + { + "epoch": 1.34, + "learning_rate": 1.2231220865903945e-06, + "loss": 0.7471, + "step": 52148 + }, + { + "epoch": 1.34, + "learning_rate": 1.2230951136091708e-06, + "loss": 0.7817, + "step": 52149 + }, + { + "epoch": 1.34, + "learning_rate": 1.2230681404571333e-06, + "loss": 0.5791, + "step": 52150 + }, + { + "epoch": 1.34, + "learning_rate": 1.223041167134303e-06, + "loss": 0.6543, + "step": 52151 + }, + { + "epoch": 1.34, + "learning_rate": 1.2230141936406996e-06, + "loss": 0.6216, + "step": 52152 + }, + { + "epoch": 1.34, + "learning_rate": 1.2229872199763451e-06, + "loss": 0.6797, + "step": 52153 + }, + { + "epoch": 1.34, + "learning_rate": 1.2229602461412592e-06, + "loss": 0.6021, + "step": 52154 + }, + { + "epoch": 1.34, + "learning_rate": 1.222933272135463e-06, + "loss": 0.6099, + "step": 52155 + }, + { + "epoch": 1.34, + "learning_rate": 1.2229062979589773e-06, + "loss": 0.4802, + "step": 52156 + }, + { + "epoch": 1.34, + "learning_rate": 1.2228793236118223e-06, + "loss": 0.667, + "step": 52157 + }, + { + "epoch": 1.34, + "learning_rate": 1.2228523490940188e-06, + "loss": 0.7295, + "step": 52158 + }, + { + "epoch": 1.34, + "learning_rate": 1.2228253744055876e-06, + "loss": 0.5552, + "step": 52159 + }, + { + "epoch": 1.34, + "learning_rate": 1.2227983995465495e-06, + "loss": 0.7197, + "step": 52160 + }, + { + "epoch": 1.34, + "learning_rate": 1.2227714245169244e-06, + "loss": 0.7539, + "step": 52161 + }, + { + "epoch": 1.34, + "learning_rate": 1.2227444493167335e-06, + "loss": 0.8057, + "step": 52162 + }, + { + "epoch": 1.34, + "learning_rate": 1.2227174739459979e-06, + "loss": 0.6063, + "step": 52163 + }, + { + "epoch": 1.34, + "learning_rate": 1.2226904984047373e-06, + "loss": 0.5376, + "step": 52164 + }, + { + "epoch": 1.34, + "learning_rate": 1.222663522692973e-06, + "loss": 0.6445, + "step": 52165 + }, + { + "epoch": 1.34, + "learning_rate": 1.2226365468107257e-06, + "loss": 0.6602, + "step": 52166 + }, + { + "epoch": 1.34, + "learning_rate": 1.2226095707580154e-06, + "loss": 0.6436, + "step": 52167 + }, + { + "epoch": 1.34, + "learning_rate": 1.2225825945348635e-06, + "loss": 0.7285, + "step": 52168 + }, + { + "epoch": 1.34, + "learning_rate": 1.22255561814129e-06, + "loss": 0.5247, + "step": 52169 + }, + { + "epoch": 1.34, + "learning_rate": 1.2225286415773167e-06, + "loss": 0.427, + "step": 52170 + }, + { + "epoch": 1.34, + "learning_rate": 1.2225016648429628e-06, + "loss": 0.7871, + "step": 52171 + }, + { + "epoch": 1.34, + "learning_rate": 1.2224746879382494e-06, + "loss": 0.5757, + "step": 52172 + }, + { + "epoch": 1.34, + "learning_rate": 1.2224477108631977e-06, + "loss": 0.5671, + "step": 52173 + }, + { + "epoch": 1.34, + "learning_rate": 1.222420733617828e-06, + "loss": 0.5088, + "step": 52174 + }, + { + "epoch": 1.34, + "learning_rate": 1.222393756202161e-06, + "loss": 0.605, + "step": 52175 + }, + { + "epoch": 1.34, + "learning_rate": 1.2223667786162174e-06, + "loss": 0.7998, + "step": 52176 + }, + { + "epoch": 1.34, + "learning_rate": 1.2223398008600176e-06, + "loss": 0.5728, + "step": 52177 + }, + { + "epoch": 1.34, + "learning_rate": 1.2223128229335826e-06, + "loss": 0.626, + "step": 52178 + }, + { + "epoch": 1.34, + "learning_rate": 1.2222858448369327e-06, + "loss": 0.7295, + "step": 52179 + }, + { + "epoch": 1.34, + "learning_rate": 1.2222588665700888e-06, + "loss": 0.7002, + "step": 52180 + }, + { + "epoch": 1.34, + "learning_rate": 1.2222318881330716e-06, + "loss": 0.3877, + "step": 52181 + }, + { + "epoch": 1.34, + "learning_rate": 1.2222049095259014e-06, + "loss": 0.5464, + "step": 52182 + }, + { + "epoch": 1.34, + "learning_rate": 1.2221779307485996e-06, + "loss": 0.7676, + "step": 52183 + }, + { + "epoch": 1.34, + "learning_rate": 1.2221509518011858e-06, + "loss": 0.6738, + "step": 52184 + }, + { + "epoch": 1.34, + "learning_rate": 1.2221239726836818e-06, + "loss": 0.7124, + "step": 52185 + }, + { + "epoch": 1.34, + "learning_rate": 1.2220969933961075e-06, + "loss": 0.6406, + "step": 52186 + }, + { + "epoch": 1.34, + "learning_rate": 1.2220700139384836e-06, + "loss": 0.6997, + "step": 52187 + }, + { + "epoch": 1.34, + "learning_rate": 1.2220430343108308e-06, + "loss": 0.6328, + "step": 52188 + }, + { + "epoch": 1.34, + "learning_rate": 1.2220160545131702e-06, + "loss": 0.7222, + "step": 52189 + }, + { + "epoch": 1.34, + "learning_rate": 1.221989074545522e-06, + "loss": 0.751, + "step": 52190 + }, + { + "epoch": 1.34, + "learning_rate": 1.221962094407907e-06, + "loss": 0.6782, + "step": 52191 + }, + { + "epoch": 1.34, + "learning_rate": 1.2219351141003455e-06, + "loss": 0.7832, + "step": 52192 + }, + { + "epoch": 1.34, + "learning_rate": 1.2219081336228588e-06, + "loss": 0.5928, + "step": 52193 + }, + { + "epoch": 1.34, + "learning_rate": 1.2218811529754672e-06, + "loss": 0.6294, + "step": 52194 + }, + { + "epoch": 1.34, + "learning_rate": 1.2218541721581913e-06, + "loss": 0.6758, + "step": 52195 + }, + { + "epoch": 1.34, + "learning_rate": 1.2218271911710521e-06, + "loss": 0.5713, + "step": 52196 + }, + { + "epoch": 1.34, + "learning_rate": 1.2218002100140699e-06, + "loss": 0.5928, + "step": 52197 + }, + { + "epoch": 1.34, + "learning_rate": 1.2217732286872654e-06, + "loss": 0.7285, + "step": 52198 + }, + { + "epoch": 1.34, + "learning_rate": 1.2217462471906593e-06, + "loss": 0.4734, + "step": 52199 + }, + { + "epoch": 1.34, + "learning_rate": 1.2217192655242725e-06, + "loss": 0.3972, + "step": 52200 + }, + { + "epoch": 1.34, + "learning_rate": 1.221692283688125e-06, + "loss": 0.5317, + "step": 52201 + }, + { + "epoch": 1.34, + "learning_rate": 1.2216653016822386e-06, + "loss": 0.5051, + "step": 52202 + }, + { + "epoch": 1.34, + "learning_rate": 1.221638319506633e-06, + "loss": 0.7725, + "step": 52203 + }, + { + "epoch": 1.34, + "learning_rate": 1.2216113371613289e-06, + "loss": 0.6436, + "step": 52204 + }, + { + "epoch": 1.34, + "learning_rate": 1.2215843546463472e-06, + "loss": 0.793, + "step": 52205 + }, + { + "epoch": 1.34, + "learning_rate": 1.2215573719617086e-06, + "loss": 0.6577, + "step": 52206 + }, + { + "epoch": 1.34, + "learning_rate": 1.2215303891074337e-06, + "loss": 0.6372, + "step": 52207 + }, + { + "epoch": 1.34, + "learning_rate": 1.2215034060835434e-06, + "loss": 0.7578, + "step": 52208 + }, + { + "epoch": 1.34, + "learning_rate": 1.2214764228900579e-06, + "loss": 0.5449, + "step": 52209 + }, + { + "epoch": 1.34, + "learning_rate": 1.2214494395269982e-06, + "loss": 0.6055, + "step": 52210 + }, + { + "epoch": 1.34, + "learning_rate": 1.2214224559943848e-06, + "loss": 0.481, + "step": 52211 + }, + { + "epoch": 1.34, + "learning_rate": 1.2213954722922386e-06, + "loss": 0.6201, + "step": 52212 + }, + { + "epoch": 1.34, + "learning_rate": 1.2213684884205797e-06, + "loss": 0.6846, + "step": 52213 + }, + { + "epoch": 1.34, + "learning_rate": 1.2213415043794293e-06, + "loss": 0.7051, + "step": 52214 + }, + { + "epoch": 1.34, + "learning_rate": 1.221314520168808e-06, + "loss": 0.6851, + "step": 52215 + }, + { + "epoch": 1.34, + "learning_rate": 1.2212875357887362e-06, + "loss": 0.666, + "step": 52216 + }, + { + "epoch": 1.34, + "learning_rate": 1.2212605512392347e-06, + "loss": 0.7959, + "step": 52217 + }, + { + "epoch": 1.34, + "learning_rate": 1.2212335665203243e-06, + "loss": 0.6064, + "step": 52218 + }, + { + "epoch": 1.34, + "learning_rate": 1.2212065816320254e-06, + "loss": 0.606, + "step": 52219 + }, + { + "epoch": 1.34, + "learning_rate": 1.221179596574359e-06, + "loss": 0.5181, + "step": 52220 + }, + { + "epoch": 1.34, + "learning_rate": 1.2211526113473453e-06, + "loss": 0.668, + "step": 52221 + }, + { + "epoch": 1.34, + "learning_rate": 1.2211256259510053e-06, + "loss": 0.6621, + "step": 52222 + }, + { + "epoch": 1.34, + "learning_rate": 1.2210986403853595e-06, + "loss": 0.5796, + "step": 52223 + }, + { + "epoch": 1.34, + "learning_rate": 1.221071654650429e-06, + "loss": 0.3679, + "step": 52224 + }, + { + "epoch": 1.34, + "learning_rate": 1.221044668746234e-06, + "loss": 0.5488, + "step": 52225 + }, + { + "epoch": 1.34, + "learning_rate": 1.2210176826727947e-06, + "loss": 0.6504, + "step": 52226 + }, + { + "epoch": 1.34, + "learning_rate": 1.2209906964301328e-06, + "loss": 0.7021, + "step": 52227 + }, + { + "epoch": 1.34, + "learning_rate": 1.2209637100182683e-06, + "loss": 0.6826, + "step": 52228 + }, + { + "epoch": 1.34, + "learning_rate": 1.220936723437222e-06, + "loss": 0.7383, + "step": 52229 + }, + { + "epoch": 1.34, + "learning_rate": 1.220909736687015e-06, + "loss": 0.7114, + "step": 52230 + }, + { + "epoch": 1.34, + "learning_rate": 1.2208827497676675e-06, + "loss": 0.7363, + "step": 52231 + }, + { + "epoch": 1.34, + "learning_rate": 1.2208557626791998e-06, + "loss": 0.5483, + "step": 52232 + }, + { + "epoch": 1.34, + "learning_rate": 1.2208287754216332e-06, + "loss": 0.5337, + "step": 52233 + }, + { + "epoch": 1.34, + "learning_rate": 1.2208017879949883e-06, + "loss": 0.7275, + "step": 52234 + }, + { + "epoch": 1.34, + "learning_rate": 1.2207748003992857e-06, + "loss": 0.7415, + "step": 52235 + }, + { + "epoch": 1.34, + "learning_rate": 1.2207478126345459e-06, + "loss": 0.6377, + "step": 52236 + }, + { + "epoch": 1.34, + "learning_rate": 1.2207208247007895e-06, + "loss": 0.5918, + "step": 52237 + }, + { + "epoch": 1.34, + "learning_rate": 1.2206938365980373e-06, + "loss": 0.5579, + "step": 52238 + }, + { + "epoch": 1.34, + "learning_rate": 1.2206668483263102e-06, + "loss": 0.6187, + "step": 52239 + }, + { + "epoch": 1.34, + "learning_rate": 1.2206398598856285e-06, + "loss": 0.564, + "step": 52240 + }, + { + "epoch": 1.34, + "learning_rate": 1.220612871276013e-06, + "loss": 0.6633, + "step": 52241 + }, + { + "epoch": 1.34, + "learning_rate": 1.2205858824974843e-06, + "loss": 0.5962, + "step": 52242 + }, + { + "epoch": 1.34, + "learning_rate": 1.2205588935500633e-06, + "loss": 0.6621, + "step": 52243 + }, + { + "epoch": 1.34, + "learning_rate": 1.2205319044337703e-06, + "loss": 0.55, + "step": 52244 + }, + { + "epoch": 1.34, + "learning_rate": 1.2205049151486265e-06, + "loss": 0.791, + "step": 52245 + }, + { + "epoch": 1.34, + "learning_rate": 1.2204779256946518e-06, + "loss": 0.5737, + "step": 52246 + }, + { + "epoch": 1.34, + "learning_rate": 1.2204509360718675e-06, + "loss": 0.626, + "step": 52247 + }, + { + "epoch": 1.34, + "learning_rate": 1.220423946280294e-06, + "loss": 0.5234, + "step": 52248 + }, + { + "epoch": 1.34, + "learning_rate": 1.220396956319952e-06, + "loss": 0.5986, + "step": 52249 + }, + { + "epoch": 1.34, + "learning_rate": 1.2203699661908627e-06, + "loss": 0.561, + "step": 52250 + }, + { + "epoch": 1.34, + "learning_rate": 1.2203429758930454e-06, + "loss": 0.7412, + "step": 52251 + }, + { + "epoch": 1.34, + "learning_rate": 1.2203159854265222e-06, + "loss": 0.7598, + "step": 52252 + }, + { + "epoch": 1.34, + "learning_rate": 1.2202889947913129e-06, + "loss": 0.7451, + "step": 52253 + }, + { + "epoch": 1.34, + "learning_rate": 1.2202620039874385e-06, + "loss": 0.3427, + "step": 52254 + }, + { + "epoch": 1.34, + "learning_rate": 1.2202350130149197e-06, + "loss": 0.6035, + "step": 52255 + }, + { + "epoch": 1.34, + "learning_rate": 1.2202080218737771e-06, + "loss": 0.7568, + "step": 52256 + }, + { + "epoch": 1.34, + "learning_rate": 1.2201810305640312e-06, + "loss": 0.7266, + "step": 52257 + }, + { + "epoch": 1.34, + "learning_rate": 1.220154039085703e-06, + "loss": 0.5464, + "step": 52258 + }, + { + "epoch": 1.34, + "learning_rate": 1.2201270474388126e-06, + "loss": 0.8105, + "step": 52259 + }, + { + "epoch": 1.34, + "learning_rate": 1.2201000556233816e-06, + "loss": 0.6265, + "step": 52260 + }, + { + "epoch": 1.34, + "learning_rate": 1.2200730636394296e-06, + "loss": 0.5537, + "step": 52261 + }, + { + "epoch": 1.34, + "learning_rate": 1.2200460714869782e-06, + "loss": 0.6147, + "step": 52262 + }, + { + "epoch": 1.34, + "learning_rate": 1.220019079166047e-06, + "loss": 0.8047, + "step": 52263 + }, + { + "epoch": 1.34, + "learning_rate": 1.219992086676658e-06, + "loss": 0.7471, + "step": 52264 + }, + { + "epoch": 1.34, + "learning_rate": 1.219965094018831e-06, + "loss": 0.5015, + "step": 52265 + }, + { + "epoch": 1.34, + "learning_rate": 1.219938101192587e-06, + "loss": 0.5278, + "step": 52266 + }, + { + "epoch": 1.34, + "learning_rate": 1.219911108197946e-06, + "loss": 0.4126, + "step": 52267 + }, + { + "epoch": 1.34, + "learning_rate": 1.2198841150349296e-06, + "loss": 0.7344, + "step": 52268 + }, + { + "epoch": 1.34, + "learning_rate": 1.2198571217035576e-06, + "loss": 0.707, + "step": 52269 + }, + { + "epoch": 1.34, + "learning_rate": 1.2198301282038514e-06, + "loss": 0.6274, + "step": 52270 + }, + { + "epoch": 1.34, + "learning_rate": 1.2198031345358314e-06, + "loss": 0.6406, + "step": 52271 + }, + { + "epoch": 1.34, + "learning_rate": 1.2197761406995181e-06, + "loss": 0.4661, + "step": 52272 + }, + { + "epoch": 1.34, + "learning_rate": 1.2197491466949326e-06, + "loss": 0.668, + "step": 52273 + }, + { + "epoch": 1.34, + "learning_rate": 1.2197221525220948e-06, + "loss": 0.7129, + "step": 52274 + }, + { + "epoch": 1.34, + "learning_rate": 1.2196951581810266e-06, + "loss": 0.6992, + "step": 52275 + }, + { + "epoch": 1.34, + "learning_rate": 1.2196681636717475e-06, + "loss": 0.6816, + "step": 52276 + }, + { + "epoch": 1.34, + "learning_rate": 1.2196411689942786e-06, + "loss": 0.605, + "step": 52277 + }, + { + "epoch": 1.34, + "learning_rate": 1.2196141741486404e-06, + "loss": 0.5787, + "step": 52278 + }, + { + "epoch": 1.34, + "learning_rate": 1.2195871791348537e-06, + "loss": 0.751, + "step": 52279 + }, + { + "epoch": 1.34, + "learning_rate": 1.2195601839529394e-06, + "loss": 0.5942, + "step": 52280 + }, + { + "epoch": 1.34, + "learning_rate": 1.219533188602918e-06, + "loss": 0.6572, + "step": 52281 + }, + { + "epoch": 1.34, + "learning_rate": 1.2195061930848099e-06, + "loss": 0.6021, + "step": 52282 + }, + { + "epoch": 1.34, + "learning_rate": 1.2194791973986363e-06, + "loss": 0.4277, + "step": 52283 + }, + { + "epoch": 1.34, + "learning_rate": 1.2194522015444174e-06, + "loss": 0.6235, + "step": 52284 + }, + { + "epoch": 1.34, + "learning_rate": 1.2194252055221742e-06, + "loss": 0.6699, + "step": 52285 + }, + { + "epoch": 1.34, + "learning_rate": 1.219398209331927e-06, + "loss": 0.668, + "step": 52286 + }, + { + "epoch": 1.34, + "learning_rate": 1.2193712129736967e-06, + "loss": 0.5601, + "step": 52287 + }, + { + "epoch": 1.34, + "learning_rate": 1.2193442164475038e-06, + "loss": 0.6758, + "step": 52288 + }, + { + "epoch": 1.34, + "learning_rate": 1.2193172197533693e-06, + "loss": 0.7446, + "step": 52289 + }, + { + "epoch": 1.34, + "learning_rate": 1.2192902228913137e-06, + "loss": 0.7412, + "step": 52290 + }, + { + "epoch": 1.34, + "learning_rate": 1.2192632258613578e-06, + "loss": 0.4156, + "step": 52291 + }, + { + "epoch": 1.34, + "learning_rate": 1.2192362286635218e-06, + "loss": 0.6851, + "step": 52292 + }, + { + "epoch": 1.34, + "learning_rate": 1.219209231297827e-06, + "loss": 0.4758, + "step": 52293 + }, + { + "epoch": 1.34, + "learning_rate": 1.2191822337642936e-06, + "loss": 0.7168, + "step": 52294 + }, + { + "epoch": 1.34, + "learning_rate": 1.2191552360629427e-06, + "loss": 0.6177, + "step": 52295 + }, + { + "epoch": 1.34, + "learning_rate": 1.2191282381937944e-06, + "loss": 0.6655, + "step": 52296 + }, + { + "epoch": 1.34, + "learning_rate": 1.2191012401568696e-06, + "loss": 0.7007, + "step": 52297 + }, + { + "epoch": 1.34, + "learning_rate": 1.2190742419521893e-06, + "loss": 0.5493, + "step": 52298 + }, + { + "epoch": 1.34, + "learning_rate": 1.2190472435797738e-06, + "loss": 0.8281, + "step": 52299 + }, + { + "epoch": 1.34, + "learning_rate": 1.2190202450396443e-06, + "loss": 0.6743, + "step": 52300 + }, + { + "epoch": 1.34, + "learning_rate": 1.2189932463318207e-06, + "loss": 0.6758, + "step": 52301 + }, + { + "epoch": 1.34, + "learning_rate": 1.2189662474563241e-06, + "loss": 0.6797, + "step": 52302 + }, + { + "epoch": 1.34, + "learning_rate": 1.2189392484131748e-06, + "loss": 0.7578, + "step": 52303 + }, + { + "epoch": 1.34, + "learning_rate": 1.2189122492023942e-06, + "loss": 0.6738, + "step": 52304 + }, + { + "epoch": 1.34, + "learning_rate": 1.2188852498240026e-06, + "loss": 0.6895, + "step": 52305 + }, + { + "epoch": 1.34, + "learning_rate": 1.2188582502780204e-06, + "loss": 0.7939, + "step": 52306 + }, + { + "epoch": 1.34, + "learning_rate": 1.2188312505644684e-06, + "loss": 0.8149, + "step": 52307 + }, + { + "epoch": 1.34, + "learning_rate": 1.2188042506833678e-06, + "loss": 0.7612, + "step": 52308 + }, + { + "epoch": 1.34, + "learning_rate": 1.2187772506347385e-06, + "loss": 0.7432, + "step": 52309 + }, + { + "epoch": 1.34, + "learning_rate": 1.2187502504186016e-06, + "loss": 0.6499, + "step": 52310 + }, + { + "epoch": 1.34, + "learning_rate": 1.2187232500349777e-06, + "loss": 0.6206, + "step": 52311 + }, + { + "epoch": 1.34, + "learning_rate": 1.2186962494838878e-06, + "loss": 0.4639, + "step": 52312 + }, + { + "epoch": 1.34, + "learning_rate": 1.2186692487653516e-06, + "loss": 0.7246, + "step": 52313 + }, + { + "epoch": 1.34, + "learning_rate": 1.2186422478793908e-06, + "loss": 0.7383, + "step": 52314 + }, + { + "epoch": 1.34, + "learning_rate": 1.2186152468260256e-06, + "loss": 0.4672, + "step": 52315 + }, + { + "epoch": 1.34, + "learning_rate": 1.2185882456052765e-06, + "loss": 0.5693, + "step": 52316 + }, + { + "epoch": 1.34, + "learning_rate": 1.218561244217165e-06, + "loss": 0.7622, + "step": 52317 + }, + { + "epoch": 1.34, + "learning_rate": 1.2185342426617106e-06, + "loss": 0.4612, + "step": 52318 + }, + { + "epoch": 1.34, + "learning_rate": 1.218507240938935e-06, + "loss": 0.7539, + "step": 52319 + }, + { + "epoch": 1.34, + "learning_rate": 1.2184802390488584e-06, + "loss": 0.7793, + "step": 52320 + }, + { + "epoch": 1.34, + "learning_rate": 1.2184532369915015e-06, + "loss": 0.6709, + "step": 52321 + }, + { + "epoch": 1.34, + "learning_rate": 1.2184262347668847e-06, + "loss": 0.4741, + "step": 52322 + }, + { + "epoch": 1.34, + "learning_rate": 1.2183992323750294e-06, + "loss": 0.8066, + "step": 52323 + }, + { + "epoch": 1.34, + "learning_rate": 1.2183722298159555e-06, + "loss": 0.6182, + "step": 52324 + }, + { + "epoch": 1.34, + "learning_rate": 1.2183452270896846e-06, + "loss": 0.667, + "step": 52325 + }, + { + "epoch": 1.34, + "learning_rate": 1.2183182241962362e-06, + "loss": 0.5845, + "step": 52326 + }, + { + "epoch": 1.34, + "learning_rate": 1.2182912211356319e-06, + "loss": 0.7363, + "step": 52327 + }, + { + "epoch": 1.34, + "learning_rate": 1.2182642179078918e-06, + "loss": 0.6411, + "step": 52328 + }, + { + "epoch": 1.34, + "learning_rate": 1.2182372145130368e-06, + "loss": 0.6846, + "step": 52329 + }, + { + "epoch": 1.34, + "learning_rate": 1.2182102109510878e-06, + "loss": 0.4487, + "step": 52330 + }, + { + "epoch": 1.34, + "learning_rate": 1.2181832072220654e-06, + "loss": 0.626, + "step": 52331 + }, + { + "epoch": 1.34, + "learning_rate": 1.2181562033259898e-06, + "loss": 0.5757, + "step": 52332 + }, + { + "epoch": 1.34, + "learning_rate": 1.2181291992628824e-06, + "loss": 0.6396, + "step": 52333 + }, + { + "epoch": 1.34, + "learning_rate": 1.218102195032763e-06, + "loss": 0.7471, + "step": 52334 + }, + { + "epoch": 1.34, + "learning_rate": 1.2180751906356532e-06, + "loss": 0.5513, + "step": 52335 + }, + { + "epoch": 1.34, + "learning_rate": 1.2180481860715731e-06, + "loss": 0.6641, + "step": 52336 + }, + { + "epoch": 1.34, + "learning_rate": 1.2180211813405433e-06, + "loss": 0.7344, + "step": 52337 + }, + { + "epoch": 1.34, + "learning_rate": 1.2179941764425852e-06, + "loss": 0.752, + "step": 52338 + }, + { + "epoch": 1.34, + "learning_rate": 1.217967171377719e-06, + "loss": 0.7871, + "step": 52339 + }, + { + "epoch": 1.34, + "learning_rate": 1.217940166145965e-06, + "loss": 0.7256, + "step": 52340 + }, + { + "epoch": 1.34, + "learning_rate": 1.2179131607473443e-06, + "loss": 0.7656, + "step": 52341 + }, + { + "epoch": 1.34, + "learning_rate": 1.2178861551818775e-06, + "loss": 0.6055, + "step": 52342 + }, + { + "epoch": 1.34, + "learning_rate": 1.2178591494495854e-06, + "loss": 0.6167, + "step": 52343 + }, + { + "epoch": 1.34, + "learning_rate": 1.2178321435504887e-06, + "loss": 0.7383, + "step": 52344 + }, + { + "epoch": 1.34, + "learning_rate": 1.2178051374846076e-06, + "loss": 0.6836, + "step": 52345 + }, + { + "epoch": 1.34, + "learning_rate": 1.2177781312519635e-06, + "loss": 0.5974, + "step": 52346 + }, + { + "epoch": 1.34, + "learning_rate": 1.2177511248525763e-06, + "loss": 0.6416, + "step": 52347 + }, + { + "epoch": 1.34, + "learning_rate": 1.2177241182864672e-06, + "loss": 0.4988, + "step": 52348 + }, + { + "epoch": 1.34, + "learning_rate": 1.2176971115536567e-06, + "loss": 0.6611, + "step": 52349 + }, + { + "epoch": 1.34, + "learning_rate": 1.217670104654166e-06, + "loss": 0.4407, + "step": 52350 + }, + { + "epoch": 1.34, + "learning_rate": 1.2176430975880147e-06, + "loss": 0.7676, + "step": 52351 + }, + { + "epoch": 1.34, + "learning_rate": 1.2176160903552244e-06, + "loss": 0.5033, + "step": 52352 + }, + { + "epoch": 1.34, + "learning_rate": 1.2175890829558153e-06, + "loss": 0.8174, + "step": 52353 + }, + { + "epoch": 1.34, + "learning_rate": 1.2175620753898083e-06, + "loss": 0.7168, + "step": 52354 + }, + { + "epoch": 1.34, + "learning_rate": 1.2175350676572243e-06, + "loss": 0.6484, + "step": 52355 + }, + { + "epoch": 1.34, + "learning_rate": 1.2175080597580836e-06, + "loss": 0.7529, + "step": 52356 + }, + { + "epoch": 1.34, + "learning_rate": 1.2174810516924066e-06, + "loss": 0.5842, + "step": 52357 + }, + { + "epoch": 1.34, + "learning_rate": 1.2174540434602146e-06, + "loss": 0.4377, + "step": 52358 + }, + { + "epoch": 1.34, + "learning_rate": 1.2174270350615282e-06, + "loss": 0.6865, + "step": 52359 + }, + { + "epoch": 1.34, + "learning_rate": 1.2174000264963677e-06, + "loss": 0.6924, + "step": 52360 + }, + { + "epoch": 1.34, + "learning_rate": 1.2173730177647541e-06, + "loss": 0.3939, + "step": 52361 + }, + { + "epoch": 1.34, + "learning_rate": 1.2173460088667078e-06, + "loss": 0.5503, + "step": 52362 + }, + { + "epoch": 1.34, + "learning_rate": 1.2173189998022499e-06, + "loss": 0.5215, + "step": 52363 + }, + { + "epoch": 1.34, + "learning_rate": 1.2172919905714005e-06, + "loss": 0.4844, + "step": 52364 + }, + { + "epoch": 1.34, + "learning_rate": 1.217264981174181e-06, + "loss": 0.5737, + "step": 52365 + }, + { + "epoch": 1.34, + "learning_rate": 1.2172379716106116e-06, + "loss": 0.521, + "step": 52366 + }, + { + "epoch": 1.34, + "learning_rate": 1.217210961880713e-06, + "loss": 0.4507, + "step": 52367 + }, + { + "epoch": 1.34, + "learning_rate": 1.2171839519845056e-06, + "loss": 0.5227, + "step": 52368 + }, + { + "epoch": 1.34, + "learning_rate": 1.2171569419220112e-06, + "loss": 0.6309, + "step": 52369 + }, + { + "epoch": 1.34, + "learning_rate": 1.2171299316932493e-06, + "loss": 0.6274, + "step": 52370 + }, + { + "epoch": 1.34, + "learning_rate": 1.217102921298241e-06, + "loss": 0.7588, + "step": 52371 + }, + { + "epoch": 1.34, + "learning_rate": 1.217075910737007e-06, + "loss": 0.5532, + "step": 52372 + }, + { + "epoch": 1.34, + "learning_rate": 1.2170489000095678e-06, + "loss": 0.6816, + "step": 52373 + }, + { + "epoch": 1.34, + "learning_rate": 1.2170218891159443e-06, + "loss": 0.4741, + "step": 52374 + }, + { + "epoch": 1.34, + "learning_rate": 1.2169948780561577e-06, + "loss": 0.7578, + "step": 52375 + }, + { + "epoch": 1.34, + "learning_rate": 1.2169678668302272e-06, + "loss": 0.6582, + "step": 52376 + }, + { + "epoch": 1.34, + "learning_rate": 1.216940855438175e-06, + "loss": 0.6982, + "step": 52377 + }, + { + "epoch": 1.34, + "learning_rate": 1.2169138438800207e-06, + "loss": 0.6094, + "step": 52378 + }, + { + "epoch": 1.34, + "learning_rate": 1.2168868321557857e-06, + "loss": 0.6221, + "step": 52379 + }, + { + "epoch": 1.34, + "learning_rate": 1.2168598202654905e-06, + "loss": 0.5449, + "step": 52380 + }, + { + "epoch": 1.34, + "learning_rate": 1.2168328082091555e-06, + "loss": 0.6953, + "step": 52381 + }, + { + "epoch": 1.34, + "learning_rate": 1.216805795986802e-06, + "loss": 0.6958, + "step": 52382 + }, + { + "epoch": 1.34, + "learning_rate": 1.2167787835984497e-06, + "loss": 0.6553, + "step": 52383 + }, + { + "epoch": 1.34, + "learning_rate": 1.2167517710441203e-06, + "loss": 0.5728, + "step": 52384 + }, + { + "epoch": 1.34, + "learning_rate": 1.2167247583238338e-06, + "loss": 0.5972, + "step": 52385 + }, + { + "epoch": 1.34, + "learning_rate": 1.2166977454376112e-06, + "loss": 0.4932, + "step": 52386 + }, + { + "epoch": 1.34, + "learning_rate": 1.2166707323854731e-06, + "loss": 0.5112, + "step": 52387 + }, + { + "epoch": 1.34, + "learning_rate": 1.2166437191674402e-06, + "loss": 0.4392, + "step": 52388 + }, + { + "epoch": 1.34, + "learning_rate": 1.2166167057835329e-06, + "loss": 0.5708, + "step": 52389 + }, + { + "epoch": 1.34, + "learning_rate": 1.2165896922337726e-06, + "loss": 0.6265, + "step": 52390 + }, + { + "epoch": 1.34, + "learning_rate": 1.2165626785181792e-06, + "loss": 0.7314, + "step": 52391 + }, + { + "epoch": 1.34, + "learning_rate": 1.2165356646367739e-06, + "loss": 0.6948, + "step": 52392 + }, + { + "epoch": 1.34, + "learning_rate": 1.216508650589577e-06, + "loss": 0.6123, + "step": 52393 + }, + { + "epoch": 1.34, + "learning_rate": 1.2164816363766095e-06, + "loss": 0.6484, + "step": 52394 + }, + { + "epoch": 1.34, + "learning_rate": 1.2164546219978922e-06, + "loss": 0.3704, + "step": 52395 + }, + { + "epoch": 1.34, + "learning_rate": 1.2164276074534451e-06, + "loss": 0.7168, + "step": 52396 + }, + { + "epoch": 1.34, + "learning_rate": 1.2164005927432896e-06, + "loss": 0.6528, + "step": 52397 + }, + { + "epoch": 1.34, + "learning_rate": 1.2163735778674461e-06, + "loss": 0.7754, + "step": 52398 + }, + { + "epoch": 1.34, + "learning_rate": 1.216346562825935e-06, + "loss": 0.7412, + "step": 52399 + }, + { + "epoch": 1.34, + "learning_rate": 1.2163195476187777e-06, + "loss": 0.7202, + "step": 52400 + }, + { + "epoch": 1.34, + "learning_rate": 1.2162925322459946e-06, + "loss": 0.7129, + "step": 52401 + }, + { + "epoch": 1.34, + "learning_rate": 1.216265516707606e-06, + "loss": 0.6445, + "step": 52402 + }, + { + "epoch": 1.34, + "learning_rate": 1.2162385010036324e-06, + "loss": 0.6875, + "step": 52403 + }, + { + "epoch": 1.34, + "learning_rate": 1.2162114851340956e-06, + "loss": 0.6201, + "step": 52404 + }, + { + "epoch": 1.34, + "learning_rate": 1.2161844690990154e-06, + "loss": 0.7383, + "step": 52405 + }, + { + "epoch": 1.34, + "learning_rate": 1.2161574528984124e-06, + "loss": 0.6392, + "step": 52406 + }, + { + "epoch": 1.34, + "learning_rate": 1.2161304365323079e-06, + "loss": 0.793, + "step": 52407 + }, + { + "epoch": 1.34, + "learning_rate": 1.216103420000722e-06, + "loss": 0.585, + "step": 52408 + }, + { + "epoch": 1.34, + "learning_rate": 1.2160764033036759e-06, + "loss": 0.6416, + "step": 52409 + }, + { + "epoch": 1.34, + "learning_rate": 1.2160493864411901e-06, + "loss": 0.521, + "step": 52410 + }, + { + "epoch": 1.34, + "learning_rate": 1.2160223694132852e-06, + "loss": 0.625, + "step": 52411 + }, + { + "epoch": 1.34, + "learning_rate": 1.2159953522199814e-06, + "loss": 0.5977, + "step": 52412 + }, + { + "epoch": 1.34, + "learning_rate": 1.2159683348613006e-06, + "loss": 0.5684, + "step": 52413 + }, + { + "epoch": 1.34, + "learning_rate": 1.2159413173372624e-06, + "loss": 0.6499, + "step": 52414 + }, + { + "epoch": 1.34, + "learning_rate": 1.2159142996478878e-06, + "loss": 0.6084, + "step": 52415 + }, + { + "epoch": 1.34, + "learning_rate": 1.2158872817931979e-06, + "loss": 0.6421, + "step": 52416 + }, + { + "epoch": 1.34, + "learning_rate": 1.2158602637732128e-06, + "loss": 0.667, + "step": 52417 + }, + { + "epoch": 1.34, + "learning_rate": 1.2158332455879532e-06, + "loss": 0.7217, + "step": 52418 + }, + { + "epoch": 1.34, + "learning_rate": 1.2158062272374404e-06, + "loss": 0.7515, + "step": 52419 + }, + { + "epoch": 1.34, + "learning_rate": 1.2157792087216946e-06, + "loss": 0.5613, + "step": 52420 + }, + { + "epoch": 1.34, + "learning_rate": 1.2157521900407366e-06, + "loss": 0.6113, + "step": 52421 + }, + { + "epoch": 1.34, + "learning_rate": 1.2157251711945866e-06, + "loss": 0.6826, + "step": 52422 + }, + { + "epoch": 1.34, + "learning_rate": 1.2156981521832663e-06, + "loss": 0.5391, + "step": 52423 + }, + { + "epoch": 1.34, + "learning_rate": 1.2156711330067954e-06, + "loss": 0.6133, + "step": 52424 + }, + { + "epoch": 1.34, + "learning_rate": 1.2156441136651956e-06, + "loss": 0.5591, + "step": 52425 + }, + { + "epoch": 1.34, + "learning_rate": 1.2156170941584867e-06, + "loss": 0.7212, + "step": 52426 + }, + { + "epoch": 1.34, + "learning_rate": 1.2155900744866895e-06, + "loss": 0.6094, + "step": 52427 + }, + { + "epoch": 1.34, + "learning_rate": 1.2155630546498251e-06, + "loss": 0.6548, + "step": 52428 + }, + { + "epoch": 1.34, + "learning_rate": 1.2155360346479142e-06, + "loss": 0.7422, + "step": 52429 + }, + { + "epoch": 1.34, + "learning_rate": 1.2155090144809772e-06, + "loss": 0.6343, + "step": 52430 + }, + { + "epoch": 1.34, + "learning_rate": 1.2154819941490346e-06, + "loss": 0.75, + "step": 52431 + }, + { + "epoch": 1.34, + "learning_rate": 1.2154549736521075e-06, + "loss": 0.7295, + "step": 52432 + }, + { + "epoch": 1.34, + "learning_rate": 1.2154279529902163e-06, + "loss": 0.7363, + "step": 52433 + }, + { + "epoch": 1.34, + "learning_rate": 1.2154009321633819e-06, + "loss": 0.7158, + "step": 52434 + }, + { + "epoch": 1.34, + "learning_rate": 1.215373911171625e-06, + "loss": 0.7295, + "step": 52435 + }, + { + "epoch": 1.34, + "learning_rate": 1.215346890014966e-06, + "loss": 0.5154, + "step": 52436 + }, + { + "epoch": 1.34, + "learning_rate": 1.215319868693426e-06, + "loss": 0.5552, + "step": 52437 + }, + { + "epoch": 1.34, + "learning_rate": 1.2152928472070255e-06, + "loss": 0.6851, + "step": 52438 + }, + { + "epoch": 1.34, + "learning_rate": 1.2152658255557847e-06, + "loss": 0.7349, + "step": 52439 + }, + { + "epoch": 1.34, + "learning_rate": 1.2152388037397256e-06, + "loss": 0.6021, + "step": 52440 + }, + { + "epoch": 1.34, + "learning_rate": 1.2152117817588675e-06, + "loss": 0.6699, + "step": 52441 + }, + { + "epoch": 1.34, + "learning_rate": 1.2151847596132316e-06, + "loss": 0.6562, + "step": 52442 + }, + { + "epoch": 1.34, + "learning_rate": 1.2151577373028386e-06, + "loss": 0.6177, + "step": 52443 + }, + { + "epoch": 1.34, + "learning_rate": 1.2151307148277094e-06, + "loss": 0.8857, + "step": 52444 + }, + { + "epoch": 1.34, + "learning_rate": 1.2151036921878646e-06, + "loss": 0.5781, + "step": 52445 + }, + { + "epoch": 1.34, + "learning_rate": 1.2150766693833247e-06, + "loss": 0.6709, + "step": 52446 + }, + { + "epoch": 1.34, + "learning_rate": 1.2150496464141103e-06, + "loss": 0.647, + "step": 52447 + }, + { + "epoch": 1.34, + "learning_rate": 1.2150226232802424e-06, + "loss": 0.751, + "step": 52448 + }, + { + "epoch": 1.34, + "learning_rate": 1.2149955999817417e-06, + "loss": 0.5489, + "step": 52449 + }, + { + "epoch": 1.34, + "learning_rate": 1.2149685765186285e-06, + "loss": 0.6279, + "step": 52450 + }, + { + "epoch": 1.34, + "learning_rate": 1.2149415528909236e-06, + "loss": 0.7959, + "step": 52451 + }, + { + "epoch": 1.34, + "learning_rate": 1.2149145290986483e-06, + "loss": 0.6597, + "step": 52452 + }, + { + "epoch": 1.34, + "learning_rate": 1.2148875051418226e-06, + "loss": 0.4551, + "step": 52453 + }, + { + "epoch": 1.34, + "learning_rate": 1.2148604810204674e-06, + "loss": 0.7656, + "step": 52454 + }, + { + "epoch": 1.34, + "learning_rate": 1.2148334567346035e-06, + "loss": 0.6558, + "step": 52455 + }, + { + "epoch": 1.34, + "learning_rate": 1.2148064322842514e-06, + "loss": 0.7227, + "step": 52456 + }, + { + "epoch": 1.34, + "learning_rate": 1.2147794076694319e-06, + "loss": 0.7861, + "step": 52457 + }, + { + "epoch": 1.34, + "learning_rate": 1.2147523828901656e-06, + "loss": 0.5322, + "step": 52458 + }, + { + "epoch": 1.34, + "learning_rate": 1.2147253579464737e-06, + "loss": 0.6943, + "step": 52459 + }, + { + "epoch": 1.34, + "learning_rate": 1.2146983328383761e-06, + "loss": 0.5083, + "step": 52460 + }, + { + "epoch": 1.34, + "learning_rate": 1.214671307565894e-06, + "loss": 0.7578, + "step": 52461 + }, + { + "epoch": 1.34, + "learning_rate": 1.2146442821290477e-06, + "loss": 0.7075, + "step": 52462 + }, + { + "epoch": 1.34, + "learning_rate": 1.2146172565278586e-06, + "loss": 0.4963, + "step": 52463 + }, + { + "epoch": 1.34, + "learning_rate": 1.2145902307623465e-06, + "loss": 0.7002, + "step": 52464 + }, + { + "epoch": 1.34, + "learning_rate": 1.2145632048325327e-06, + "loss": 0.6934, + "step": 52465 + }, + { + "epoch": 1.34, + "learning_rate": 1.2145361787384375e-06, + "loss": 0.6519, + "step": 52466 + }, + { + "epoch": 1.34, + "learning_rate": 1.2145091524800821e-06, + "loss": 0.665, + "step": 52467 + }, + { + "epoch": 1.34, + "learning_rate": 1.2144821260574866e-06, + "loss": 0.5032, + "step": 52468 + }, + { + "epoch": 1.34, + "learning_rate": 1.2144550994706723e-06, + "loss": 0.5811, + "step": 52469 + }, + { + "epoch": 1.34, + "learning_rate": 1.2144280727196599e-06, + "loss": 0.6982, + "step": 52470 + }, + { + "epoch": 1.34, + "learning_rate": 1.2144010458044692e-06, + "loss": 0.4561, + "step": 52471 + }, + { + "epoch": 1.34, + "learning_rate": 1.2143740187251218e-06, + "loss": 0.6406, + "step": 52472 + }, + { + "epoch": 1.34, + "learning_rate": 1.2143469914816376e-06, + "loss": 0.5088, + "step": 52473 + }, + { + "epoch": 1.34, + "learning_rate": 1.2143199640740385e-06, + "loss": 0.6064, + "step": 52474 + }, + { + "epoch": 1.34, + "learning_rate": 1.2142929365023439e-06, + "loss": 0.7002, + "step": 52475 + }, + { + "epoch": 1.34, + "learning_rate": 1.2142659087665752e-06, + "loss": 0.6973, + "step": 52476 + }, + { + "epoch": 1.35, + "learning_rate": 1.2142388808667527e-06, + "loss": 0.7251, + "step": 52477 + }, + { + "epoch": 1.35, + "learning_rate": 1.2142118528028978e-06, + "loss": 0.6239, + "step": 52478 + }, + { + "epoch": 1.35, + "learning_rate": 1.2141848245750305e-06, + "loss": 0.5638, + "step": 52479 + }, + { + "epoch": 1.35, + "learning_rate": 1.2141577961831719e-06, + "loss": 0.6426, + "step": 52480 + }, + { + "epoch": 1.35, + "learning_rate": 1.2141307676273423e-06, + "loss": 0.5417, + "step": 52481 + }, + { + "epoch": 1.35, + "learning_rate": 1.2141037389075627e-06, + "loss": 0.6455, + "step": 52482 + }, + { + "epoch": 1.35, + "learning_rate": 1.2140767100238537e-06, + "loss": 0.5771, + "step": 52483 + }, + { + "epoch": 1.35, + "learning_rate": 1.2140496809762361e-06, + "loss": 0.5182, + "step": 52484 + }, + { + "epoch": 1.35, + "learning_rate": 1.2140226517647304e-06, + "loss": 0.7549, + "step": 52485 + }, + { + "epoch": 1.35, + "learning_rate": 1.2139956223893575e-06, + "loss": 0.7178, + "step": 52486 + }, + { + "epoch": 1.35, + "learning_rate": 1.2139685928501377e-06, + "loss": 0.6343, + "step": 52487 + }, + { + "epoch": 1.35, + "learning_rate": 1.2139415631470924e-06, + "loss": 0.6338, + "step": 52488 + }, + { + "epoch": 1.35, + "learning_rate": 1.2139145332802417e-06, + "loss": 0.6841, + "step": 52489 + }, + { + "epoch": 1.35, + "learning_rate": 1.2138875032496062e-06, + "loss": 0.5713, + "step": 52490 + }, + { + "epoch": 1.35, + "learning_rate": 1.2138604730552073e-06, + "loss": 0.5991, + "step": 52491 + }, + { + "epoch": 1.35, + "learning_rate": 1.213833442697065e-06, + "loss": 0.7046, + "step": 52492 + }, + { + "epoch": 1.35, + "learning_rate": 1.2138064121752004e-06, + "loss": 0.5713, + "step": 52493 + }, + { + "epoch": 1.35, + "learning_rate": 1.213779381489634e-06, + "loss": 0.8574, + "step": 52494 + }, + { + "epoch": 1.35, + "learning_rate": 1.2137523506403868e-06, + "loss": 0.7979, + "step": 52495 + }, + { + "epoch": 1.35, + "learning_rate": 1.2137253196274788e-06, + "loss": 0.7383, + "step": 52496 + }, + { + "epoch": 1.35, + "learning_rate": 1.2136982884509314e-06, + "loss": 0.5266, + "step": 52497 + }, + { + "epoch": 1.35, + "learning_rate": 1.213671257110765e-06, + "loss": 0.71, + "step": 52498 + }, + { + "epoch": 1.35, + "learning_rate": 1.2136442256070005e-06, + "loss": 0.647, + "step": 52499 + }, + { + "epoch": 1.35, + "learning_rate": 1.2136171939396582e-06, + "loss": 0.6919, + "step": 52500 + }, + { + "epoch": 1.35, + "learning_rate": 1.2135901621087595e-06, + "loss": 0.3462, + "step": 52501 + }, + { + "epoch": 1.35, + "learning_rate": 1.2135631301143238e-06, + "loss": 0.6367, + "step": 52502 + }, + { + "epoch": 1.35, + "learning_rate": 1.2135360979563733e-06, + "loss": 0.5938, + "step": 52503 + }, + { + "epoch": 1.35, + "learning_rate": 1.2135090656349281e-06, + "loss": 0.5248, + "step": 52504 + }, + { + "epoch": 1.35, + "learning_rate": 1.2134820331500085e-06, + "loss": 0.7559, + "step": 52505 + }, + { + "epoch": 1.35, + "learning_rate": 1.2134550005016355e-06, + "loss": 0.708, + "step": 52506 + }, + { + "epoch": 1.35, + "learning_rate": 1.21342796768983e-06, + "loss": 0.5938, + "step": 52507 + }, + { + "epoch": 1.35, + "learning_rate": 1.2134009347146124e-06, + "loss": 0.7598, + "step": 52508 + }, + { + "epoch": 1.35, + "learning_rate": 1.2133739015760038e-06, + "loss": 0.5767, + "step": 52509 + }, + { + "epoch": 1.35, + "learning_rate": 1.2133468682740241e-06, + "loss": 0.4258, + "step": 52510 + }, + { + "epoch": 1.35, + "learning_rate": 1.2133198348086948e-06, + "loss": 0.5483, + "step": 52511 + }, + { + "epoch": 1.35, + "learning_rate": 1.2132928011800364e-06, + "loss": 0.6455, + "step": 52512 + }, + { + "epoch": 1.35, + "learning_rate": 1.2132657673880693e-06, + "loss": 0.4917, + "step": 52513 + }, + { + "epoch": 1.35, + "learning_rate": 1.2132387334328147e-06, + "loss": 0.71, + "step": 52514 + }, + { + "epoch": 1.35, + "learning_rate": 1.2132116993142925e-06, + "loss": 0.7051, + "step": 52515 + }, + { + "epoch": 1.35, + "learning_rate": 1.2131846650325244e-06, + "loss": 0.7148, + "step": 52516 + }, + { + "epoch": 1.35, + "learning_rate": 1.2131576305875301e-06, + "loss": 0.5408, + "step": 52517 + }, + { + "epoch": 1.35, + "learning_rate": 1.2131305959793314e-06, + "loss": 0.627, + "step": 52518 + }, + { + "epoch": 1.35, + "learning_rate": 1.213103561207948e-06, + "loss": 0.8662, + "step": 52519 + }, + { + "epoch": 1.35, + "learning_rate": 1.2130765262734013e-06, + "loss": 0.6777, + "step": 52520 + }, + { + "epoch": 1.35, + "learning_rate": 1.2130494911757114e-06, + "loss": 0.6127, + "step": 52521 + }, + { + "epoch": 1.35, + "learning_rate": 1.2130224559148997e-06, + "loss": 0.4995, + "step": 52522 + }, + { + "epoch": 1.35, + "learning_rate": 1.212995420490986e-06, + "loss": 0.6221, + "step": 52523 + }, + { + "epoch": 1.35, + "learning_rate": 1.212968384903992e-06, + "loss": 0.6519, + "step": 52524 + }, + { + "epoch": 1.35, + "learning_rate": 1.2129413491539375e-06, + "loss": 0.6846, + "step": 52525 + }, + { + "epoch": 1.35, + "learning_rate": 1.2129143132408439e-06, + "loss": 0.6729, + "step": 52526 + }, + { + "epoch": 1.35, + "learning_rate": 1.2128872771647312e-06, + "loss": 0.7803, + "step": 52527 + }, + { + "epoch": 1.35, + "learning_rate": 1.2128602409256207e-06, + "loss": 0.6191, + "step": 52528 + }, + { + "epoch": 1.35, + "learning_rate": 1.2128332045235333e-06, + "loss": 0.6846, + "step": 52529 + }, + { + "epoch": 1.35, + "learning_rate": 1.2128061679584888e-06, + "loss": 0.7119, + "step": 52530 + }, + { + "epoch": 1.35, + "learning_rate": 1.2127791312305084e-06, + "loss": 0.5791, + "step": 52531 + }, + { + "epoch": 1.35, + "learning_rate": 1.212752094339613e-06, + "loss": 0.5249, + "step": 52532 + }, + { + "epoch": 1.35, + "learning_rate": 1.212725057285823e-06, + "loss": 0.6592, + "step": 52533 + }, + { + "epoch": 1.35, + "learning_rate": 1.2126980200691593e-06, + "loss": 0.6768, + "step": 52534 + }, + { + "epoch": 1.35, + "learning_rate": 1.2126709826896426e-06, + "loss": 0.689, + "step": 52535 + }, + { + "epoch": 1.35, + "learning_rate": 1.2126439451472934e-06, + "loss": 0.7646, + "step": 52536 + }, + { + "epoch": 1.35, + "learning_rate": 1.2126169074421324e-06, + "loss": 0.7168, + "step": 52537 + }, + { + "epoch": 1.35, + "learning_rate": 1.2125898695741806e-06, + "loss": 0.6299, + "step": 52538 + }, + { + "epoch": 1.35, + "learning_rate": 1.2125628315434585e-06, + "loss": 0.5493, + "step": 52539 + }, + { + "epoch": 1.35, + "learning_rate": 1.2125357933499864e-06, + "loss": 0.5576, + "step": 52540 + }, + { + "epoch": 1.35, + "learning_rate": 1.2125087549937859e-06, + "loss": 0.5405, + "step": 52541 + }, + { + "epoch": 1.35, + "learning_rate": 1.212481716474877e-06, + "loss": 0.7588, + "step": 52542 + }, + { + "epoch": 1.35, + "learning_rate": 1.2124546777932805e-06, + "loss": 0.5908, + "step": 52543 + }, + { + "epoch": 1.35, + "learning_rate": 1.2124276389490175e-06, + "loss": 0.8638, + "step": 52544 + }, + { + "epoch": 1.35, + "learning_rate": 1.2124005999421086e-06, + "loss": 0.5994, + "step": 52545 + }, + { + "epoch": 1.35, + "learning_rate": 1.2123735607725737e-06, + "loss": 0.2734, + "step": 52546 + }, + { + "epoch": 1.35, + "learning_rate": 1.2123465214404344e-06, + "loss": 0.7148, + "step": 52547 + }, + { + "epoch": 1.35, + "learning_rate": 1.2123194819457113e-06, + "loss": 0.7041, + "step": 52548 + }, + { + "epoch": 1.35, + "learning_rate": 1.212292442288425e-06, + "loss": 0.7061, + "step": 52549 + }, + { + "epoch": 1.35, + "learning_rate": 1.2122654024685959e-06, + "loss": 0.7139, + "step": 52550 + }, + { + "epoch": 1.35, + "learning_rate": 1.212238362486245e-06, + "loss": 0.6768, + "step": 52551 + }, + { + "epoch": 1.35, + "learning_rate": 1.212211322341393e-06, + "loss": 0.5469, + "step": 52552 + }, + { + "epoch": 1.35, + "learning_rate": 1.2121842820340604e-06, + "loss": 0.6172, + "step": 52553 + }, + { + "epoch": 1.35, + "learning_rate": 1.2121572415642682e-06, + "loss": 0.792, + "step": 52554 + }, + { + "epoch": 1.35, + "learning_rate": 1.212130200932037e-06, + "loss": 0.7412, + "step": 52555 + }, + { + "epoch": 1.35, + "learning_rate": 1.2121031601373873e-06, + "loss": 0.5048, + "step": 52556 + }, + { + "epoch": 1.35, + "learning_rate": 1.2120761191803402e-06, + "loss": 0.5547, + "step": 52557 + }, + { + "epoch": 1.35, + "learning_rate": 1.2120490780609158e-06, + "loss": 0.6104, + "step": 52558 + }, + { + "epoch": 1.35, + "learning_rate": 1.2120220367791353e-06, + "loss": 0.6577, + "step": 52559 + }, + { + "epoch": 1.35, + "learning_rate": 1.2119949953350197e-06, + "loss": 0.6543, + "step": 52560 + }, + { + "epoch": 1.35, + "learning_rate": 1.2119679537285886e-06, + "loss": 0.5464, + "step": 52561 + }, + { + "epoch": 1.35, + "learning_rate": 1.2119409119598637e-06, + "loss": 0.4226, + "step": 52562 + }, + { + "epoch": 1.35, + "learning_rate": 1.2119138700288653e-06, + "loss": 0.7803, + "step": 52563 + }, + { + "epoch": 1.35, + "learning_rate": 1.2118868279356148e-06, + "loss": 0.5566, + "step": 52564 + }, + { + "epoch": 1.35, + "learning_rate": 1.2118597856801316e-06, + "loss": 0.4297, + "step": 52565 + }, + { + "epoch": 1.35, + "learning_rate": 1.2118327432624373e-06, + "loss": 0.5272, + "step": 52566 + }, + { + "epoch": 1.35, + "learning_rate": 1.2118057006825524e-06, + "loss": 0.5483, + "step": 52567 + }, + { + "epoch": 1.35, + "learning_rate": 1.2117786579404977e-06, + "loss": 0.7236, + "step": 52568 + }, + { + "epoch": 1.35, + "learning_rate": 1.2117516150362938e-06, + "loss": 0.6555, + "step": 52569 + }, + { + "epoch": 1.35, + "learning_rate": 1.2117245719699614e-06, + "loss": 0.8018, + "step": 52570 + }, + { + "epoch": 1.35, + "learning_rate": 1.2116975287415211e-06, + "loss": 0.7471, + "step": 52571 + }, + { + "epoch": 1.35, + "learning_rate": 1.2116704853509939e-06, + "loss": 0.7285, + "step": 52572 + }, + { + "epoch": 1.35, + "learning_rate": 1.2116434417984e-06, + "loss": 0.6699, + "step": 52573 + }, + { + "epoch": 1.35, + "learning_rate": 1.2116163980837613e-06, + "loss": 0.8066, + "step": 52574 + }, + { + "epoch": 1.35, + "learning_rate": 1.2115893542070967e-06, + "loss": 0.4863, + "step": 52575 + }, + { + "epoch": 1.35, + "learning_rate": 1.2115623101684285e-06, + "loss": 0.626, + "step": 52576 + }, + { + "epoch": 1.35, + "learning_rate": 1.2115352659677763e-06, + "loss": 0.5344, + "step": 52577 + }, + { + "epoch": 1.35, + "learning_rate": 1.2115082216051615e-06, + "loss": 0.6355, + "step": 52578 + }, + { + "epoch": 1.35, + "learning_rate": 1.2114811770806047e-06, + "loss": 0.7236, + "step": 52579 + }, + { + "epoch": 1.35, + "learning_rate": 1.2114541323941261e-06, + "loss": 0.6423, + "step": 52580 + }, + { + "epoch": 1.35, + "learning_rate": 1.211427087545747e-06, + "loss": 0.7168, + "step": 52581 + }, + { + "epoch": 1.35, + "learning_rate": 1.2114000425354882e-06, + "loss": 0.6709, + "step": 52582 + }, + { + "epoch": 1.35, + "learning_rate": 1.2113729973633697e-06, + "loss": 0.6074, + "step": 52583 + }, + { + "epoch": 1.35, + "learning_rate": 1.211345952029413e-06, + "loss": 0.6436, + "step": 52584 + }, + { + "epoch": 1.35, + "learning_rate": 1.2113189065336383e-06, + "loss": 0.625, + "step": 52585 + }, + { + "epoch": 1.35, + "learning_rate": 1.2112918608760661e-06, + "loss": 0.6572, + "step": 52586 + }, + { + "epoch": 1.35, + "learning_rate": 1.2112648150567176e-06, + "loss": 0.6621, + "step": 52587 + }, + { + "epoch": 1.35, + "learning_rate": 1.2112377690756132e-06, + "loss": 0.6748, + "step": 52588 + }, + { + "epoch": 1.35, + "learning_rate": 1.2112107229327744e-06, + "loss": 0.4443, + "step": 52589 + }, + { + "epoch": 1.35, + "learning_rate": 1.2111836766282206e-06, + "loss": 0.5156, + "step": 52590 + }, + { + "epoch": 1.35, + "learning_rate": 1.2111566301619736e-06, + "loss": 0.6709, + "step": 52591 + }, + { + "epoch": 1.35, + "learning_rate": 1.2111295835340532e-06, + "loss": 0.6748, + "step": 52592 + }, + { + "epoch": 1.35, + "learning_rate": 1.211102536744481e-06, + "loss": 0.6694, + "step": 52593 + }, + { + "epoch": 1.35, + "learning_rate": 1.2110754897932771e-06, + "loss": 0.6802, + "step": 52594 + }, + { + "epoch": 1.35, + "learning_rate": 1.2110484426804625e-06, + "loss": 0.5137, + "step": 52595 + }, + { + "epoch": 1.35, + "learning_rate": 1.2110213954060578e-06, + "loss": 0.5669, + "step": 52596 + }, + { + "epoch": 1.35, + "learning_rate": 1.2109943479700836e-06, + "loss": 0.7178, + "step": 52597 + }, + { + "epoch": 1.35, + "learning_rate": 1.2109673003725608e-06, + "loss": 0.8369, + "step": 52598 + }, + { + "epoch": 1.35, + "learning_rate": 1.2109402526135102e-06, + "loss": 0.4404, + "step": 52599 + }, + { + "epoch": 1.35, + "learning_rate": 1.210913204692952e-06, + "loss": 0.6523, + "step": 52600 + }, + { + "epoch": 1.35, + "learning_rate": 1.2108861566109076e-06, + "loss": 0.5713, + "step": 52601 + }, + { + "epoch": 1.35, + "learning_rate": 1.2108591083673972e-06, + "loss": 0.6753, + "step": 52602 + }, + { + "epoch": 1.35, + "learning_rate": 1.2108320599624417e-06, + "loss": 0.7173, + "step": 52603 + }, + { + "epoch": 1.35, + "learning_rate": 1.210805011396062e-06, + "loss": 0.6318, + "step": 52604 + }, + { + "epoch": 1.35, + "learning_rate": 1.210777962668278e-06, + "loss": 0.6426, + "step": 52605 + }, + { + "epoch": 1.35, + "learning_rate": 1.2107509137791113e-06, + "loss": 0.8105, + "step": 52606 + }, + { + "epoch": 1.35, + "learning_rate": 1.2107238647285824e-06, + "loss": 0.6191, + "step": 52607 + }, + { + "epoch": 1.35, + "learning_rate": 1.210696815516712e-06, + "loss": 0.6982, + "step": 52608 + }, + { + "epoch": 1.35, + "learning_rate": 1.2106697661435208e-06, + "loss": 0.365, + "step": 52609 + }, + { + "epoch": 1.35, + "learning_rate": 1.2106427166090294e-06, + "loss": 0.6309, + "step": 52610 + }, + { + "epoch": 1.35, + "learning_rate": 1.2106156669132584e-06, + "loss": 0.7031, + "step": 52611 + }, + { + "epoch": 1.35, + "learning_rate": 1.2105886170562288e-06, + "loss": 0.665, + "step": 52612 + }, + { + "epoch": 1.35, + "learning_rate": 1.210561567037961e-06, + "loss": 0.6416, + "step": 52613 + }, + { + "epoch": 1.35, + "learning_rate": 1.210534516858476e-06, + "loss": 0.4758, + "step": 52614 + }, + { + "epoch": 1.35, + "learning_rate": 1.2105074665177945e-06, + "loss": 0.5767, + "step": 52615 + }, + { + "epoch": 1.35, + "learning_rate": 1.210480416015937e-06, + "loss": 0.6851, + "step": 52616 + }, + { + "epoch": 1.35, + "learning_rate": 1.2104533653529243e-06, + "loss": 0.8125, + "step": 52617 + }, + { + "epoch": 1.35, + "learning_rate": 1.210426314528777e-06, + "loss": 0.6787, + "step": 52618 + }, + { + "epoch": 1.35, + "learning_rate": 1.2103992635435165e-06, + "loss": 0.6519, + "step": 52619 + }, + { + "epoch": 1.35, + "learning_rate": 1.2103722123971624e-06, + "loss": 0.6338, + "step": 52620 + }, + { + "epoch": 1.35, + "learning_rate": 1.2103451610897363e-06, + "loss": 0.7783, + "step": 52621 + }, + { + "epoch": 1.35, + "learning_rate": 1.2103181096212585e-06, + "loss": 0.6299, + "step": 52622 + }, + { + "epoch": 1.35, + "learning_rate": 1.2102910579917493e-06, + "loss": 0.7168, + "step": 52623 + }, + { + "epoch": 1.35, + "learning_rate": 1.2102640062012306e-06, + "loss": 0.4712, + "step": 52624 + }, + { + "epoch": 1.35, + "learning_rate": 1.2102369542497221e-06, + "loss": 0.6689, + "step": 52625 + }, + { + "epoch": 1.35, + "learning_rate": 1.2102099021372452e-06, + "loss": 0.6318, + "step": 52626 + }, + { + "epoch": 1.35, + "learning_rate": 1.2101828498638197e-06, + "loss": 0.4614, + "step": 52627 + }, + { + "epoch": 1.35, + "learning_rate": 1.2101557974294672e-06, + "loss": 0.3591, + "step": 52628 + }, + { + "epoch": 1.35, + "learning_rate": 1.210128744834208e-06, + "loss": 0.6138, + "step": 52629 + }, + { + "epoch": 1.35, + "learning_rate": 1.2101016920780626e-06, + "loss": 0.6318, + "step": 52630 + }, + { + "epoch": 1.35, + "learning_rate": 1.2100746391610524e-06, + "loss": 0.5215, + "step": 52631 + }, + { + "epoch": 1.35, + "learning_rate": 1.2100475860831974e-06, + "loss": 0.626, + "step": 52632 + }, + { + "epoch": 1.35, + "learning_rate": 1.2100205328445187e-06, + "loss": 0.5759, + "step": 52633 + }, + { + "epoch": 1.35, + "learning_rate": 1.209993479445037e-06, + "loss": 0.6484, + "step": 52634 + }, + { + "epoch": 1.35, + "learning_rate": 1.2099664258847733e-06, + "loss": 0.6992, + "step": 52635 + }, + { + "epoch": 1.35, + "learning_rate": 1.2099393721637473e-06, + "loss": 0.9102, + "step": 52636 + }, + { + "epoch": 1.35, + "learning_rate": 1.2099123182819807e-06, + "loss": 0.6855, + "step": 52637 + }, + { + "epoch": 1.35, + "learning_rate": 1.2098852642394939e-06, + "loss": 0.5356, + "step": 52638 + }, + { + "epoch": 1.35, + "learning_rate": 1.2098582100363077e-06, + "loss": 0.6094, + "step": 52639 + }, + { + "epoch": 1.35, + "learning_rate": 1.2098311556724426e-06, + "loss": 0.6396, + "step": 52640 + }, + { + "epoch": 1.35, + "learning_rate": 1.2098041011479195e-06, + "loss": 0.8057, + "step": 52641 + }, + { + "epoch": 1.35, + "learning_rate": 1.2097770464627589e-06, + "loss": 0.8545, + "step": 52642 + }, + { + "epoch": 1.35, + "learning_rate": 1.2097499916169818e-06, + "loss": 0.5979, + "step": 52643 + }, + { + "epoch": 1.35, + "learning_rate": 1.2097229366106087e-06, + "loss": 0.6611, + "step": 52644 + }, + { + "epoch": 1.35, + "learning_rate": 1.2096958814436604e-06, + "loss": 0.5608, + "step": 52645 + }, + { + "epoch": 1.35, + "learning_rate": 1.2096688261161575e-06, + "loss": 0.4512, + "step": 52646 + }, + { + "epoch": 1.35, + "learning_rate": 1.209641770628121e-06, + "loss": 0.5425, + "step": 52647 + }, + { + "epoch": 1.35, + "learning_rate": 1.2096147149795712e-06, + "loss": 0.6523, + "step": 52648 + }, + { + "epoch": 1.35, + "learning_rate": 1.2095876591705292e-06, + "loss": 0.6187, + "step": 52649 + }, + { + "epoch": 1.35, + "learning_rate": 1.2095606032010157e-06, + "loss": 0.6143, + "step": 52650 + }, + { + "epoch": 1.35, + "learning_rate": 1.209533547071051e-06, + "loss": 0.7324, + "step": 52651 + }, + { + "epoch": 1.35, + "learning_rate": 1.2095064907806565e-06, + "loss": 0.6089, + "step": 52652 + }, + { + "epoch": 1.35, + "learning_rate": 1.209479434329852e-06, + "loss": 0.645, + "step": 52653 + }, + { + "epoch": 1.35, + "learning_rate": 1.2094523777186593e-06, + "loss": 0.7324, + "step": 52654 + }, + { + "epoch": 1.35, + "learning_rate": 1.2094253209470982e-06, + "loss": 0.5, + "step": 52655 + }, + { + "epoch": 1.35, + "learning_rate": 1.20939826401519e-06, + "loss": 0.6602, + "step": 52656 + }, + { + "epoch": 1.35, + "learning_rate": 1.2093712069229546e-06, + "loss": 0.4984, + "step": 52657 + }, + { + "epoch": 1.35, + "learning_rate": 1.2093441496704138e-06, + "loss": 0.7119, + "step": 52658 + }, + { + "epoch": 1.35, + "learning_rate": 1.2093170922575878e-06, + "loss": 0.8335, + "step": 52659 + }, + { + "epoch": 1.35, + "learning_rate": 1.2092900346844971e-06, + "loss": 0.5879, + "step": 52660 + }, + { + "epoch": 1.35, + "learning_rate": 1.209262976951163e-06, + "loss": 0.627, + "step": 52661 + }, + { + "epoch": 1.35, + "learning_rate": 1.2092359190576056e-06, + "loss": 0.7227, + "step": 52662 + }, + { + "epoch": 1.35, + "learning_rate": 1.2092088610038456e-06, + "loss": 0.5483, + "step": 52663 + }, + { + "epoch": 1.35, + "learning_rate": 1.2091818027899047e-06, + "loss": 0.6606, + "step": 52664 + }, + { + "epoch": 1.35, + "learning_rate": 1.2091547444158023e-06, + "loss": 0.542, + "step": 52665 + }, + { + "epoch": 1.35, + "learning_rate": 1.20912768588156e-06, + "loss": 0.5527, + "step": 52666 + }, + { + "epoch": 1.35, + "learning_rate": 1.209100627187198e-06, + "loss": 0.5742, + "step": 52667 + }, + { + "epoch": 1.35, + "learning_rate": 1.2090735683327375e-06, + "loss": 0.7334, + "step": 52668 + }, + { + "epoch": 1.35, + "learning_rate": 1.209046509318199e-06, + "loss": 1.0098, + "step": 52669 + }, + { + "epoch": 1.35, + "learning_rate": 1.209019450143603e-06, + "loss": 0.6216, + "step": 52670 + }, + { + "epoch": 1.35, + "learning_rate": 1.2089923908089708e-06, + "loss": 0.6807, + "step": 52671 + }, + { + "epoch": 1.35, + "learning_rate": 1.2089653313143224e-06, + "loss": 0.5388, + "step": 52672 + }, + { + "epoch": 1.35, + "learning_rate": 1.2089382716596788e-06, + "loss": 0.7656, + "step": 52673 + }, + { + "epoch": 1.35, + "learning_rate": 1.2089112118450611e-06, + "loss": 0.6152, + "step": 52674 + }, + { + "epoch": 1.35, + "learning_rate": 1.2088841518704896e-06, + "loss": 0.6846, + "step": 52675 + }, + { + "epoch": 1.35, + "learning_rate": 1.2088570917359849e-06, + "loss": 0.6213, + "step": 52676 + }, + { + "epoch": 1.35, + "learning_rate": 1.208830031441568e-06, + "loss": 0.6357, + "step": 52677 + }, + { + "epoch": 1.35, + "learning_rate": 1.2088029709872594e-06, + "loss": 0.6885, + "step": 52678 + }, + { + "epoch": 1.35, + "learning_rate": 1.2087759103730806e-06, + "loss": 0.6582, + "step": 52679 + }, + { + "epoch": 1.35, + "learning_rate": 1.208748849599051e-06, + "loss": 0.5359, + "step": 52680 + }, + { + "epoch": 1.35, + "learning_rate": 1.2087217886651924e-06, + "loss": 0.6538, + "step": 52681 + }, + { + "epoch": 1.35, + "learning_rate": 1.2086947275715247e-06, + "loss": 0.5889, + "step": 52682 + }, + { + "epoch": 1.35, + "learning_rate": 1.2086676663180695e-06, + "loss": 0.4463, + "step": 52683 + }, + { + "epoch": 1.35, + "learning_rate": 1.2086406049048468e-06, + "loss": 0.5859, + "step": 52684 + }, + { + "epoch": 1.35, + "learning_rate": 1.2086135433318777e-06, + "loss": 0.6934, + "step": 52685 + }, + { + "epoch": 1.35, + "learning_rate": 1.2085864815991826e-06, + "loss": 0.5199, + "step": 52686 + }, + { + "epoch": 1.35, + "learning_rate": 1.2085594197067827e-06, + "loss": 0.3151, + "step": 52687 + }, + { + "epoch": 1.35, + "learning_rate": 1.2085323576546981e-06, + "loss": 0.7773, + "step": 52688 + }, + { + "epoch": 1.35, + "learning_rate": 1.2085052954429504e-06, + "loss": 0.6953, + "step": 52689 + }, + { + "epoch": 1.35, + "learning_rate": 1.2084782330715595e-06, + "loss": 0.6406, + "step": 52690 + }, + { + "epoch": 1.35, + "learning_rate": 1.2084511705405462e-06, + "loss": 0.6826, + "step": 52691 + }, + { + "epoch": 1.35, + "learning_rate": 1.2084241078499315e-06, + "loss": 0.7002, + "step": 52692 + }, + { + "epoch": 1.35, + "learning_rate": 1.2083970449997363e-06, + "loss": 0.6592, + "step": 52693 + }, + { + "epoch": 1.35, + "learning_rate": 1.208369981989981e-06, + "loss": 0.5149, + "step": 52694 + }, + { + "epoch": 1.35, + "learning_rate": 1.2083429188206862e-06, + "loss": 0.6069, + "step": 52695 + }, + { + "epoch": 1.35, + "learning_rate": 1.2083158554918728e-06, + "loss": 0.6978, + "step": 52696 + }, + { + "epoch": 1.35, + "learning_rate": 1.2082887920035615e-06, + "loss": 0.8301, + "step": 52697 + }, + { + "epoch": 1.35, + "learning_rate": 1.2082617283557731e-06, + "loss": 0.6138, + "step": 52698 + }, + { + "epoch": 1.35, + "learning_rate": 1.2082346645485287e-06, + "loss": 0.6338, + "step": 52699 + }, + { + "epoch": 1.35, + "learning_rate": 1.2082076005818483e-06, + "loss": 0.5593, + "step": 52700 + }, + { + "epoch": 1.35, + "learning_rate": 1.2081805364557527e-06, + "loss": 0.5198, + "step": 52701 + }, + { + "epoch": 1.35, + "learning_rate": 1.208153472170263e-06, + "loss": 0.5259, + "step": 52702 + }, + { + "epoch": 1.35, + "learning_rate": 1.2081264077253995e-06, + "loss": 0.5933, + "step": 52703 + }, + { + "epoch": 1.35, + "learning_rate": 1.208099343121184e-06, + "loss": 0.5572, + "step": 52704 + }, + { + "epoch": 1.35, + "learning_rate": 1.2080722783576357e-06, + "loss": 0.6494, + "step": 52705 + }, + { + "epoch": 1.35, + "learning_rate": 1.208045213434776e-06, + "loss": 0.6245, + "step": 52706 + }, + { + "epoch": 1.35, + "learning_rate": 1.2080181483526256e-06, + "loss": 0.6558, + "step": 52707 + }, + { + "epoch": 1.35, + "learning_rate": 1.2079910831112058e-06, + "loss": 0.7808, + "step": 52708 + }, + { + "epoch": 1.35, + "learning_rate": 1.2079640177105363e-06, + "loss": 0.6562, + "step": 52709 + }, + { + "epoch": 1.35, + "learning_rate": 1.2079369521506386e-06, + "loss": 0.5542, + "step": 52710 + }, + { + "epoch": 1.35, + "learning_rate": 1.207909886431533e-06, + "loss": 0.7588, + "step": 52711 + }, + { + "epoch": 1.35, + "learning_rate": 1.2078828205532403e-06, + "loss": 0.605, + "step": 52712 + }, + { + "epoch": 1.35, + "learning_rate": 1.2078557545157814e-06, + "loss": 0.7402, + "step": 52713 + }, + { + "epoch": 1.35, + "learning_rate": 1.2078286883191768e-06, + "loss": 0.6748, + "step": 52714 + }, + { + "epoch": 1.35, + "learning_rate": 1.2078016219634474e-06, + "loss": 0.6396, + "step": 52715 + }, + { + "epoch": 1.35, + "learning_rate": 1.2077745554486139e-06, + "loss": 0.6514, + "step": 52716 + }, + { + "epoch": 1.35, + "learning_rate": 1.2077474887746967e-06, + "loss": 0.6816, + "step": 52717 + }, + { + "epoch": 1.35, + "learning_rate": 1.2077204219417172e-06, + "loss": 0.6348, + "step": 52718 + }, + { + "epoch": 1.35, + "learning_rate": 1.2076933549496958e-06, + "loss": 0.5283, + "step": 52719 + }, + { + "epoch": 1.35, + "learning_rate": 1.2076662877986526e-06, + "loss": 0.6548, + "step": 52720 + }, + { + "epoch": 1.35, + "learning_rate": 1.2076392204886093e-06, + "loss": 0.7061, + "step": 52721 + }, + { + "epoch": 1.35, + "learning_rate": 1.2076121530195858e-06, + "loss": 0.5352, + "step": 52722 + }, + { + "epoch": 1.35, + "learning_rate": 1.2075850853916033e-06, + "loss": 0.7998, + "step": 52723 + }, + { + "epoch": 1.35, + "learning_rate": 1.207558017604683e-06, + "loss": 0.7397, + "step": 52724 + }, + { + "epoch": 1.35, + "learning_rate": 1.2075309496588447e-06, + "loss": 0.5942, + "step": 52725 + }, + { + "epoch": 1.35, + "learning_rate": 1.2075038815541091e-06, + "loss": 0.5024, + "step": 52726 + }, + { + "epoch": 1.35, + "learning_rate": 1.207476813290498e-06, + "loss": 0.6211, + "step": 52727 + }, + { + "epoch": 1.35, + "learning_rate": 1.207449744868031e-06, + "loss": 0.792, + "step": 52728 + }, + { + "epoch": 1.35, + "learning_rate": 1.2074226762867297e-06, + "loss": 0.4819, + "step": 52729 + }, + { + "epoch": 1.35, + "learning_rate": 1.207395607546614e-06, + "loss": 0.7295, + "step": 52730 + }, + { + "epoch": 1.35, + "learning_rate": 1.2073685386477052e-06, + "loss": 0.5566, + "step": 52731 + }, + { + "epoch": 1.35, + "learning_rate": 1.2073414695900237e-06, + "loss": 0.8271, + "step": 52732 + }, + { + "epoch": 1.35, + "learning_rate": 1.2073144003735904e-06, + "loss": 0.5581, + "step": 52733 + }, + { + "epoch": 1.35, + "learning_rate": 1.2072873309984262e-06, + "loss": 0.6309, + "step": 52734 + }, + { + "epoch": 1.35, + "learning_rate": 1.2072602614645514e-06, + "loss": 0.4832, + "step": 52735 + }, + { + "epoch": 1.35, + "learning_rate": 1.207233191771987e-06, + "loss": 0.5791, + "step": 52736 + }, + { + "epoch": 1.35, + "learning_rate": 1.2072061219207538e-06, + "loss": 0.4927, + "step": 52737 + }, + { + "epoch": 1.35, + "learning_rate": 1.207179051910872e-06, + "loss": 0.5142, + "step": 52738 + }, + { + "epoch": 1.35, + "learning_rate": 1.2071519817423632e-06, + "loss": 0.5059, + "step": 52739 + }, + { + "epoch": 1.35, + "learning_rate": 1.2071249114152476e-06, + "loss": 0.5869, + "step": 52740 + }, + { + "epoch": 1.35, + "learning_rate": 1.2070978409295457e-06, + "loss": 0.4834, + "step": 52741 + }, + { + "epoch": 1.35, + "learning_rate": 1.2070707702852787e-06, + "loss": 0.5093, + "step": 52742 + }, + { + "epoch": 1.35, + "learning_rate": 1.207043699482467e-06, + "loss": 0.666, + "step": 52743 + }, + { + "epoch": 1.35, + "learning_rate": 1.2070166285211315e-06, + "loss": 0.8164, + "step": 52744 + }, + { + "epoch": 1.35, + "learning_rate": 1.2069895574012928e-06, + "loss": 0.7148, + "step": 52745 + }, + { + "epoch": 1.35, + "learning_rate": 1.2069624861229722e-06, + "loss": 0.5708, + "step": 52746 + }, + { + "epoch": 1.35, + "learning_rate": 1.2069354146861894e-06, + "loss": 0.583, + "step": 52747 + }, + { + "epoch": 1.35, + "learning_rate": 1.2069083430909662e-06, + "loss": 0.7949, + "step": 52748 + }, + { + "epoch": 1.35, + "learning_rate": 1.2068812713373222e-06, + "loss": 0.6436, + "step": 52749 + }, + { + "epoch": 1.35, + "learning_rate": 1.206854199425279e-06, + "loss": 0.7734, + "step": 52750 + }, + { + "epoch": 1.35, + "learning_rate": 1.206827127354857e-06, + "loss": 0.6274, + "step": 52751 + }, + { + "epoch": 1.35, + "learning_rate": 1.2068000551260772e-06, + "loss": 0.6729, + "step": 52752 + }, + { + "epoch": 1.35, + "learning_rate": 1.2067729827389599e-06, + "loss": 0.624, + "step": 52753 + }, + { + "epoch": 1.35, + "learning_rate": 1.206745910193526e-06, + "loss": 0.583, + "step": 52754 + }, + { + "epoch": 1.35, + "learning_rate": 1.206718837489796e-06, + "loss": 0.6738, + "step": 52755 + }, + { + "epoch": 1.35, + "learning_rate": 1.2066917646277914e-06, + "loss": 0.7109, + "step": 52756 + }, + { + "epoch": 1.35, + "learning_rate": 1.206664691607532e-06, + "loss": 0.6357, + "step": 52757 + }, + { + "epoch": 1.35, + "learning_rate": 1.2066376184290392e-06, + "loss": 0.7412, + "step": 52758 + }, + { + "epoch": 1.35, + "learning_rate": 1.2066105450923336e-06, + "loss": 0.6777, + "step": 52759 + }, + { + "epoch": 1.35, + "learning_rate": 1.2065834715974355e-06, + "loss": 0.7979, + "step": 52760 + }, + { + "epoch": 1.35, + "learning_rate": 1.2065563979443663e-06, + "loss": 0.8174, + "step": 52761 + }, + { + "epoch": 1.35, + "learning_rate": 1.2065293241331462e-06, + "loss": 0.6396, + "step": 52762 + }, + { + "epoch": 1.35, + "learning_rate": 1.206502250163796e-06, + "loss": 0.6084, + "step": 52763 + }, + { + "epoch": 1.35, + "learning_rate": 1.2064751760363366e-06, + "loss": 0.5874, + "step": 52764 + }, + { + "epoch": 1.35, + "learning_rate": 1.2064481017507885e-06, + "loss": 0.6416, + "step": 52765 + }, + { + "epoch": 1.35, + "learning_rate": 1.2064210273071726e-06, + "loss": 0.6094, + "step": 52766 + }, + { + "epoch": 1.35, + "learning_rate": 1.2063939527055097e-06, + "loss": 0.5996, + "step": 52767 + }, + { + "epoch": 1.35, + "learning_rate": 1.2063668779458205e-06, + "loss": 0.6279, + "step": 52768 + }, + { + "epoch": 1.35, + "learning_rate": 1.2063398030281258e-06, + "loss": 0.6924, + "step": 52769 + }, + { + "epoch": 1.35, + "learning_rate": 1.2063127279524459e-06, + "loss": 0.5068, + "step": 52770 + }, + { + "epoch": 1.35, + "learning_rate": 1.206285652718802e-06, + "loss": 0.6836, + "step": 52771 + }, + { + "epoch": 1.35, + "learning_rate": 1.2062585773272145e-06, + "loss": 0.5615, + "step": 52772 + }, + { + "epoch": 1.35, + "learning_rate": 1.2062315017777046e-06, + "loss": 0.7432, + "step": 52773 + }, + { + "epoch": 1.35, + "learning_rate": 1.2062044260702925e-06, + "loss": 0.7388, + "step": 52774 + }, + { + "epoch": 1.35, + "learning_rate": 1.2061773502049993e-06, + "loss": 0.7373, + "step": 52775 + }, + { + "epoch": 1.35, + "learning_rate": 1.2061502741818453e-06, + "loss": 0.6719, + "step": 52776 + }, + { + "epoch": 1.35, + "learning_rate": 1.2061231980008515e-06, + "loss": 0.5889, + "step": 52777 + }, + { + "epoch": 1.35, + "learning_rate": 1.2060961216620388e-06, + "loss": 0.5063, + "step": 52778 + }, + { + "epoch": 1.35, + "learning_rate": 1.206069045165428e-06, + "loss": 0.6694, + "step": 52779 + }, + { + "epoch": 1.35, + "learning_rate": 1.2060419685110393e-06, + "loss": 0.5234, + "step": 52780 + }, + { + "epoch": 1.35, + "learning_rate": 1.206014891698894e-06, + "loss": 0.7246, + "step": 52781 + }, + { + "epoch": 1.35, + "learning_rate": 1.205987814729012e-06, + "loss": 0.79, + "step": 52782 + }, + { + "epoch": 1.35, + "learning_rate": 1.2059607376014152e-06, + "loss": 0.5396, + "step": 52783 + }, + { + "epoch": 1.35, + "learning_rate": 1.2059336603161236e-06, + "loss": 0.7061, + "step": 52784 + }, + { + "epoch": 1.35, + "learning_rate": 1.205906582873158e-06, + "loss": 0.6226, + "step": 52785 + }, + { + "epoch": 1.35, + "learning_rate": 1.2058795052725393e-06, + "loss": 0.5557, + "step": 52786 + }, + { + "epoch": 1.35, + "learning_rate": 1.2058524275142878e-06, + "loss": 0.6348, + "step": 52787 + }, + { + "epoch": 1.35, + "learning_rate": 1.2058253495984253e-06, + "loss": 0.5742, + "step": 52788 + }, + { + "epoch": 1.35, + "learning_rate": 1.205798271524971e-06, + "loss": 0.6045, + "step": 52789 + }, + { + "epoch": 1.35, + "learning_rate": 1.2057711932939467e-06, + "loss": 0.6196, + "step": 52790 + }, + { + "epoch": 1.35, + "learning_rate": 1.2057441149053729e-06, + "loss": 0.5493, + "step": 52791 + }, + { + "epoch": 1.35, + "learning_rate": 1.2057170363592702e-06, + "loss": 0.7539, + "step": 52792 + }, + { + "epoch": 1.35, + "learning_rate": 1.2056899576556597e-06, + "loss": 0.5085, + "step": 52793 + }, + { + "epoch": 1.35, + "learning_rate": 1.2056628787945618e-06, + "loss": 0.7012, + "step": 52794 + }, + { + "epoch": 1.35, + "learning_rate": 1.2056357997759968e-06, + "loss": 0.5505, + "step": 52795 + }, + { + "epoch": 1.35, + "learning_rate": 1.2056087205999863e-06, + "loss": 0.6572, + "step": 52796 + }, + { + "epoch": 1.35, + "learning_rate": 1.2055816412665504e-06, + "loss": 0.7764, + "step": 52797 + }, + { + "epoch": 1.35, + "learning_rate": 1.2055545617757108e-06, + "loss": 0.6733, + "step": 52798 + }, + { + "epoch": 1.35, + "learning_rate": 1.2055274821274868e-06, + "loss": 0.7832, + "step": 52799 + }, + { + "epoch": 1.35, + "learning_rate": 1.2055004023219002e-06, + "loss": 0.4985, + "step": 52800 + }, + { + "epoch": 1.35, + "learning_rate": 1.205473322358971e-06, + "loss": 0.3915, + "step": 52801 + }, + { + "epoch": 1.35, + "learning_rate": 1.2054462422387207e-06, + "loss": 0.5244, + "step": 52802 + }, + { + "epoch": 1.35, + "learning_rate": 1.2054191619611699e-06, + "loss": 0.6377, + "step": 52803 + }, + { + "epoch": 1.35, + "learning_rate": 1.2053920815263385e-06, + "loss": 0.7837, + "step": 52804 + }, + { + "epoch": 1.35, + "learning_rate": 1.2053650009342481e-06, + "loss": 0.6982, + "step": 52805 + }, + { + "epoch": 1.35, + "learning_rate": 1.2053379201849192e-06, + "loss": 0.8516, + "step": 52806 + }, + { + "epoch": 1.35, + "learning_rate": 1.2053108392783725e-06, + "loss": 0.709, + "step": 52807 + }, + { + "epoch": 1.35, + "learning_rate": 1.2052837582146287e-06, + "loss": 0.5088, + "step": 52808 + }, + { + "epoch": 1.35, + "learning_rate": 1.2052566769937084e-06, + "loss": 0.666, + "step": 52809 + }, + { + "epoch": 1.35, + "learning_rate": 1.2052295956156327e-06, + "loss": 0.6377, + "step": 52810 + }, + { + "epoch": 1.35, + "learning_rate": 1.205202514080422e-06, + "loss": 0.5959, + "step": 52811 + }, + { + "epoch": 1.35, + "learning_rate": 1.205175432388097e-06, + "loss": 0.6787, + "step": 52812 + }, + { + "epoch": 1.35, + "learning_rate": 1.2051483505386792e-06, + "loss": 0.7188, + "step": 52813 + }, + { + "epoch": 1.35, + "learning_rate": 1.2051212685321882e-06, + "loss": 0.6738, + "step": 52814 + }, + { + "epoch": 1.35, + "learning_rate": 1.2050941863686457e-06, + "loss": 0.6294, + "step": 52815 + }, + { + "epoch": 1.35, + "learning_rate": 1.2050671040480715e-06, + "loss": 0.4299, + "step": 52816 + }, + { + "epoch": 1.35, + "learning_rate": 1.2050400215704874e-06, + "loss": 0.6357, + "step": 52817 + }, + { + "epoch": 1.35, + "learning_rate": 1.2050129389359134e-06, + "loss": 0.6504, + "step": 52818 + }, + { + "epoch": 1.35, + "learning_rate": 1.2049858561443705e-06, + "loss": 0.5239, + "step": 52819 + }, + { + "epoch": 1.35, + "learning_rate": 1.2049587731958789e-06, + "loss": 0.5789, + "step": 52820 + }, + { + "epoch": 1.35, + "learning_rate": 1.2049316900904602e-06, + "loss": 0.9365, + "step": 52821 + }, + { + "epoch": 1.35, + "learning_rate": 1.2049046068281342e-06, + "loss": 0.6431, + "step": 52822 + }, + { + "epoch": 1.35, + "learning_rate": 1.2048775234089227e-06, + "loss": 0.7109, + "step": 52823 + }, + { + "epoch": 1.35, + "learning_rate": 1.204850439832846e-06, + "loss": 0.564, + "step": 52824 + }, + { + "epoch": 1.35, + "learning_rate": 1.2048233560999246e-06, + "loss": 0.5605, + "step": 52825 + }, + { + "epoch": 1.35, + "learning_rate": 1.2047962722101793e-06, + "loss": 0.4993, + "step": 52826 + }, + { + "epoch": 1.35, + "learning_rate": 1.2047691881636308e-06, + "loss": 0.6274, + "step": 52827 + }, + { + "epoch": 1.35, + "learning_rate": 1.2047421039603001e-06, + "loss": 0.6846, + "step": 52828 + }, + { + "epoch": 1.35, + "learning_rate": 1.2047150196002076e-06, + "loss": 0.7124, + "step": 52829 + }, + { + "epoch": 1.35, + "learning_rate": 1.2046879350833746e-06, + "loss": 0.6357, + "step": 52830 + }, + { + "epoch": 1.35, + "learning_rate": 1.2046608504098207e-06, + "loss": 0.7373, + "step": 52831 + }, + { + "epoch": 1.35, + "learning_rate": 1.2046337655795682e-06, + "loss": 0.8271, + "step": 52832 + }, + { + "epoch": 1.35, + "learning_rate": 1.204606680592637e-06, + "loss": 0.5295, + "step": 52833 + }, + { + "epoch": 1.35, + "learning_rate": 1.2045795954490474e-06, + "loss": 0.7266, + "step": 52834 + }, + { + "epoch": 1.35, + "learning_rate": 1.2045525101488207e-06, + "loss": 0.5879, + "step": 52835 + }, + { + "epoch": 1.35, + "learning_rate": 1.2045254246919778e-06, + "loss": 0.6709, + "step": 52836 + }, + { + "epoch": 1.35, + "learning_rate": 1.204498339078539e-06, + "loss": 0.6201, + "step": 52837 + }, + { + "epoch": 1.35, + "learning_rate": 1.2044712533085255e-06, + "loss": 0.7393, + "step": 52838 + }, + { + "epoch": 1.35, + "learning_rate": 1.2044441673819575e-06, + "loss": 0.6562, + "step": 52839 + }, + { + "epoch": 1.35, + "learning_rate": 1.2044170812988562e-06, + "loss": 0.6758, + "step": 52840 + }, + { + "epoch": 1.35, + "learning_rate": 1.2043899950592418e-06, + "loss": 0.6364, + "step": 52841 + }, + { + "epoch": 1.35, + "learning_rate": 1.2043629086631355e-06, + "loss": 0.585, + "step": 52842 + }, + { + "epoch": 1.35, + "learning_rate": 1.2043358221105581e-06, + "loss": 0.5249, + "step": 52843 + }, + { + "epoch": 1.35, + "learning_rate": 1.2043087354015301e-06, + "loss": 0.5386, + "step": 52844 + }, + { + "epoch": 1.35, + "learning_rate": 1.204281648536072e-06, + "loss": 0.5745, + "step": 52845 + }, + { + "epoch": 1.35, + "learning_rate": 1.2042545615142052e-06, + "loss": 0.6738, + "step": 52846 + }, + { + "epoch": 1.35, + "learning_rate": 1.20422747433595e-06, + "loss": 0.7461, + "step": 52847 + }, + { + "epoch": 1.35, + "learning_rate": 1.2042003870013272e-06, + "loss": 0.5771, + "step": 52848 + }, + { + "epoch": 1.35, + "learning_rate": 1.2041732995103575e-06, + "loss": 0.6191, + "step": 52849 + }, + { + "epoch": 1.35, + "learning_rate": 1.2041462118630616e-06, + "loss": 0.6304, + "step": 52850 + }, + { + "epoch": 1.35, + "learning_rate": 1.2041191240594606e-06, + "loss": 0.7354, + "step": 52851 + }, + { + "epoch": 1.35, + "learning_rate": 1.2040920360995748e-06, + "loss": 0.4292, + "step": 52852 + }, + { + "epoch": 1.35, + "learning_rate": 1.2040649479834252e-06, + "loss": 0.6113, + "step": 52853 + }, + { + "epoch": 1.35, + "learning_rate": 1.2040378597110323e-06, + "loss": 0.7119, + "step": 52854 + }, + { + "epoch": 1.35, + "learning_rate": 1.204010771282417e-06, + "loss": 0.7285, + "step": 52855 + }, + { + "epoch": 1.35, + "learning_rate": 1.2039836826976e-06, + "loss": 0.5723, + "step": 52856 + }, + { + "epoch": 1.35, + "learning_rate": 1.2039565939566024e-06, + "loss": 0.8125, + "step": 52857 + }, + { + "epoch": 1.35, + "learning_rate": 1.2039295050594444e-06, + "loss": 0.4546, + "step": 52858 + }, + { + "epoch": 1.35, + "learning_rate": 1.203902416006147e-06, + "loss": 0.5669, + "step": 52859 + }, + { + "epoch": 1.35, + "learning_rate": 1.2038753267967307e-06, + "loss": 0.6289, + "step": 52860 + }, + { + "epoch": 1.35, + "learning_rate": 1.2038482374312166e-06, + "loss": 0.5566, + "step": 52861 + }, + { + "epoch": 1.35, + "learning_rate": 1.2038211479096253e-06, + "loss": 0.7939, + "step": 52862 + }, + { + "epoch": 1.35, + "learning_rate": 1.2037940582319776e-06, + "loss": 0.4897, + "step": 52863 + }, + { + "epoch": 1.35, + "learning_rate": 1.2037669683982938e-06, + "loss": 0.4961, + "step": 52864 + }, + { + "epoch": 1.35, + "learning_rate": 1.2037398784085954e-06, + "loss": 0.5129, + "step": 52865 + }, + { + "epoch": 1.35, + "learning_rate": 1.2037127882629025e-06, + "loss": 0.5444, + "step": 52866 + }, + { + "epoch": 1.36, + "learning_rate": 1.2036856979612362e-06, + "loss": 0.5889, + "step": 52867 + }, + { + "epoch": 1.36, + "learning_rate": 1.2036586075036173e-06, + "loss": 0.3687, + "step": 52868 + }, + { + "epoch": 1.36, + "learning_rate": 1.2036315168900662e-06, + "loss": 0.8867, + "step": 52869 + }, + { + "epoch": 1.36, + "learning_rate": 1.2036044261206035e-06, + "loss": 0.5645, + "step": 52870 + }, + { + "epoch": 1.36, + "learning_rate": 1.2035773351952507e-06, + "loss": 0.7129, + "step": 52871 + }, + { + "epoch": 1.36, + "learning_rate": 1.2035502441140277e-06, + "loss": 0.6738, + "step": 52872 + }, + { + "epoch": 1.36, + "learning_rate": 1.203523152876956e-06, + "loss": 0.6299, + "step": 52873 + }, + { + "epoch": 1.36, + "learning_rate": 1.2034960614840558e-06, + "loss": 0.6689, + "step": 52874 + }, + { + "epoch": 1.36, + "learning_rate": 1.203468969935348e-06, + "loss": 0.6963, + "step": 52875 + }, + { + "epoch": 1.36, + "learning_rate": 1.2034418782308536e-06, + "loss": 0.5596, + "step": 52876 + }, + { + "epoch": 1.36, + "learning_rate": 1.2034147863705928e-06, + "loss": 0.4956, + "step": 52877 + }, + { + "epoch": 1.36, + "learning_rate": 1.2033876943545869e-06, + "loss": 0.6416, + "step": 52878 + }, + { + "epoch": 1.36, + "learning_rate": 1.2033606021828562e-06, + "loss": 0.6665, + "step": 52879 + }, + { + "epoch": 1.36, + "learning_rate": 1.2033335098554218e-06, + "loss": 0.6328, + "step": 52880 + }, + { + "epoch": 1.36, + "learning_rate": 1.203306417372304e-06, + "loss": 0.6616, + "step": 52881 + }, + { + "epoch": 1.36, + "learning_rate": 1.2032793247335241e-06, + "loss": 0.7168, + "step": 52882 + }, + { + "epoch": 1.36, + "learning_rate": 1.2032522319391025e-06, + "loss": 0.7041, + "step": 52883 + }, + { + "epoch": 1.36, + "learning_rate": 1.2032251389890601e-06, + "loss": 0.8604, + "step": 52884 + }, + { + "epoch": 1.36, + "learning_rate": 1.2031980458834174e-06, + "loss": 0.7305, + "step": 52885 + }, + { + "epoch": 1.36, + "learning_rate": 1.2031709526221953e-06, + "loss": 0.4582, + "step": 52886 + }, + { + "epoch": 1.36, + "learning_rate": 1.2031438592054145e-06, + "loss": 0.6626, + "step": 52887 + }, + { + "epoch": 1.36, + "learning_rate": 1.2031167656330963e-06, + "loss": 0.7041, + "step": 52888 + }, + { + "epoch": 1.36, + "learning_rate": 1.2030896719052604e-06, + "loss": 0.5801, + "step": 52889 + }, + { + "epoch": 1.36, + "learning_rate": 1.2030625780219284e-06, + "loss": 0.6133, + "step": 52890 + }, + { + "epoch": 1.36, + "learning_rate": 1.2030354839831203e-06, + "loss": 0.7432, + "step": 52891 + }, + { + "epoch": 1.36, + "learning_rate": 1.2030083897888575e-06, + "loss": 0.5537, + "step": 52892 + }, + { + "epoch": 1.36, + "learning_rate": 1.2029812954391605e-06, + "loss": 0.6992, + "step": 52893 + }, + { + "epoch": 1.36, + "learning_rate": 1.20295420093405e-06, + "loss": 0.5601, + "step": 52894 + }, + { + "epoch": 1.36, + "learning_rate": 1.2029271062735468e-06, + "loss": 0.4568, + "step": 52895 + }, + { + "epoch": 1.36, + "learning_rate": 1.2029000114576717e-06, + "loss": 0.6006, + "step": 52896 + }, + { + "epoch": 1.36, + "learning_rate": 1.2028729164864455e-06, + "loss": 0.5034, + "step": 52897 + }, + { + "epoch": 1.36, + "learning_rate": 1.2028458213598887e-06, + "loss": 0.5647, + "step": 52898 + }, + { + "epoch": 1.36, + "learning_rate": 1.2028187260780222e-06, + "loss": 0.5508, + "step": 52899 + }, + { + "epoch": 1.36, + "learning_rate": 1.2027916306408667e-06, + "loss": 0.7197, + "step": 52900 + }, + { + "epoch": 1.36, + "learning_rate": 1.202764535048443e-06, + "loss": 0.8926, + "step": 52901 + }, + { + "epoch": 1.36, + "learning_rate": 1.2027374393007716e-06, + "loss": 0.5474, + "step": 52902 + }, + { + "epoch": 1.36, + "learning_rate": 1.2027103433978743e-06, + "loss": 0.7734, + "step": 52903 + }, + { + "epoch": 1.36, + "learning_rate": 1.2026832473397702e-06, + "loss": 0.666, + "step": 52904 + }, + { + "epoch": 1.36, + "learning_rate": 1.202656151126481e-06, + "loss": 0.5503, + "step": 52905 + }, + { + "epoch": 1.36, + "learning_rate": 1.2026290547580274e-06, + "loss": 0.5315, + "step": 52906 + }, + { + "epoch": 1.36, + "learning_rate": 1.20260195823443e-06, + "loss": 0.6904, + "step": 52907 + }, + { + "epoch": 1.36, + "learning_rate": 1.2025748615557096e-06, + "loss": 0.5586, + "step": 52908 + }, + { + "epoch": 1.36, + "learning_rate": 1.2025477647218872e-06, + "loss": 0.6128, + "step": 52909 + }, + { + "epoch": 1.36, + "learning_rate": 1.202520667732983e-06, + "loss": 0.6338, + "step": 52910 + }, + { + "epoch": 1.36, + "learning_rate": 1.2024935705890177e-06, + "loss": 0.7178, + "step": 52911 + }, + { + "epoch": 1.36, + "learning_rate": 1.2024664732900128e-06, + "loss": 0.8662, + "step": 52912 + }, + { + "epoch": 1.36, + "learning_rate": 1.2024393758359888e-06, + "loss": 0.6323, + "step": 52913 + }, + { + "epoch": 1.36, + "learning_rate": 1.202412278226966e-06, + "loss": 0.708, + "step": 52914 + }, + { + "epoch": 1.36, + "learning_rate": 1.2023851804629657e-06, + "loss": 0.5972, + "step": 52915 + }, + { + "epoch": 1.36, + "learning_rate": 1.2023580825440079e-06, + "loss": 0.5542, + "step": 52916 + }, + { + "epoch": 1.36, + "learning_rate": 1.2023309844701142e-06, + "loss": 0.5938, + "step": 52917 + }, + { + "epoch": 1.36, + "learning_rate": 1.2023038862413049e-06, + "loss": 0.6523, + "step": 52918 + }, + { + "epoch": 1.36, + "learning_rate": 1.2022767878576008e-06, + "loss": 0.7227, + "step": 52919 + }, + { + "epoch": 1.36, + "learning_rate": 1.2022496893190225e-06, + "loss": 0.6777, + "step": 52920 + }, + { + "epoch": 1.36, + "learning_rate": 1.202222590625591e-06, + "loss": 0.748, + "step": 52921 + }, + { + "epoch": 1.36, + "learning_rate": 1.2021954917773272e-06, + "loss": 0.5986, + "step": 52922 + }, + { + "epoch": 1.36, + "learning_rate": 1.2021683927742514e-06, + "loss": 0.646, + "step": 52923 + }, + { + "epoch": 1.36, + "learning_rate": 1.2021412936163847e-06, + "loss": 0.7734, + "step": 52924 + }, + { + "epoch": 1.36, + "learning_rate": 1.2021141943037474e-06, + "loss": 0.6234, + "step": 52925 + }, + { + "epoch": 1.36, + "learning_rate": 1.2020870948363608e-06, + "loss": 0.5388, + "step": 52926 + }, + { + "epoch": 1.36, + "learning_rate": 1.2020599952142453e-06, + "loss": 0.6045, + "step": 52927 + }, + { + "epoch": 1.36, + "learning_rate": 1.2020328954374219e-06, + "loss": 0.6836, + "step": 52928 + }, + { + "epoch": 1.36, + "learning_rate": 1.202005795505911e-06, + "loss": 0.8174, + "step": 52929 + }, + { + "epoch": 1.36, + "learning_rate": 1.2019786954197338e-06, + "loss": 0.7456, + "step": 52930 + }, + { + "epoch": 1.36, + "learning_rate": 1.2019515951789105e-06, + "loss": 0.6831, + "step": 52931 + }, + { + "epoch": 1.36, + "learning_rate": 1.2019244947834623e-06, + "loss": 0.7852, + "step": 52932 + }, + { + "epoch": 1.36, + "learning_rate": 1.20189739423341e-06, + "loss": 0.6196, + "step": 52933 + }, + { + "epoch": 1.36, + "learning_rate": 1.2018702935287739e-06, + "loss": 0.707, + "step": 52934 + }, + { + "epoch": 1.36, + "learning_rate": 1.201843192669575e-06, + "loss": 0.7559, + "step": 52935 + }, + { + "epoch": 1.36, + "learning_rate": 1.2018160916558342e-06, + "loss": 0.3564, + "step": 52936 + }, + { + "epoch": 1.36, + "learning_rate": 1.2017889904875718e-06, + "loss": 0.6475, + "step": 52937 + }, + { + "epoch": 1.36, + "learning_rate": 1.2017618891648091e-06, + "loss": 0.6528, + "step": 52938 + }, + { + "epoch": 1.36, + "learning_rate": 1.2017347876875667e-06, + "loss": 0.709, + "step": 52939 + }, + { + "epoch": 1.36, + "learning_rate": 1.2017076860558648e-06, + "loss": 0.7266, + "step": 52940 + }, + { + "epoch": 1.36, + "learning_rate": 1.201680584269725e-06, + "loss": 0.708, + "step": 52941 + }, + { + "epoch": 1.36, + "learning_rate": 1.2016534823291677e-06, + "loss": 0.6621, + "step": 52942 + }, + { + "epoch": 1.36, + "learning_rate": 1.2016263802342135e-06, + "loss": 0.5044, + "step": 52943 + }, + { + "epoch": 1.36, + "learning_rate": 1.201599277984883e-06, + "loss": 0.7344, + "step": 52944 + }, + { + "epoch": 1.36, + "learning_rate": 1.2015721755811976e-06, + "loss": 0.6035, + "step": 52945 + }, + { + "epoch": 1.36, + "learning_rate": 1.2015450730231773e-06, + "loss": 0.6816, + "step": 52946 + }, + { + "epoch": 1.36, + "learning_rate": 1.2015179703108433e-06, + "loss": 0.5898, + "step": 52947 + }, + { + "epoch": 1.36, + "learning_rate": 1.2014908674442163e-06, + "loss": 0.7178, + "step": 52948 + }, + { + "epoch": 1.36, + "learning_rate": 1.2014637644233171e-06, + "loss": 0.7334, + "step": 52949 + }, + { + "epoch": 1.36, + "learning_rate": 1.2014366612481664e-06, + "loss": 0.6309, + "step": 52950 + }, + { + "epoch": 1.36, + "learning_rate": 1.2014095579187848e-06, + "loss": 0.7383, + "step": 52951 + }, + { + "epoch": 1.36, + "learning_rate": 1.201382454435193e-06, + "loss": 0.5447, + "step": 52952 + }, + { + "epoch": 1.36, + "learning_rate": 1.2013553507974124e-06, + "loss": 0.918, + "step": 52953 + }, + { + "epoch": 1.36, + "learning_rate": 1.2013282470054626e-06, + "loss": 0.7344, + "step": 52954 + }, + { + "epoch": 1.36, + "learning_rate": 1.2013011430593656e-06, + "loss": 0.5684, + "step": 52955 + }, + { + "epoch": 1.36, + "learning_rate": 1.2012740389591412e-06, + "loss": 0.8545, + "step": 52956 + }, + { + "epoch": 1.36, + "learning_rate": 1.2012469347048106e-06, + "loss": 0.791, + "step": 52957 + }, + { + "epoch": 1.36, + "learning_rate": 1.2012198302963946e-06, + "loss": 0.585, + "step": 52958 + }, + { + "epoch": 1.36, + "learning_rate": 1.2011927257339138e-06, + "loss": 0.7153, + "step": 52959 + }, + { + "epoch": 1.36, + "learning_rate": 1.201165621017389e-06, + "loss": 0.7002, + "step": 52960 + }, + { + "epoch": 1.36, + "learning_rate": 1.2011385161468408e-06, + "loss": 0.5879, + "step": 52961 + }, + { + "epoch": 1.36, + "learning_rate": 1.20111141112229e-06, + "loss": 0.7363, + "step": 52962 + }, + { + "epoch": 1.36, + "learning_rate": 1.2010843059437577e-06, + "loss": 0.6445, + "step": 52963 + }, + { + "epoch": 1.36, + "learning_rate": 1.2010572006112643e-06, + "loss": 0.6406, + "step": 52964 + }, + { + "epoch": 1.36, + "learning_rate": 1.2010300951248305e-06, + "loss": 0.5591, + "step": 52965 + }, + { + "epoch": 1.36, + "learning_rate": 1.2010029894844774e-06, + "loss": 0.7441, + "step": 52966 + }, + { + "epoch": 1.36, + "learning_rate": 1.2009758836902252e-06, + "loss": 0.7646, + "step": 52967 + }, + { + "epoch": 1.36, + "learning_rate": 1.2009487777420958e-06, + "loss": 0.5776, + "step": 52968 + }, + { + "epoch": 1.36, + "learning_rate": 1.2009216716401085e-06, + "loss": 0.7773, + "step": 52969 + }, + { + "epoch": 1.36, + "learning_rate": 1.2008945653842848e-06, + "loss": 0.5776, + "step": 52970 + }, + { + "epoch": 1.36, + "learning_rate": 1.2008674589746452e-06, + "loss": 0.7227, + "step": 52971 + }, + { + "epoch": 1.36, + "learning_rate": 1.200840352411211e-06, + "loss": 0.8301, + "step": 52972 + }, + { + "epoch": 1.36, + "learning_rate": 1.2008132456940026e-06, + "loss": 0.3735, + "step": 52973 + }, + { + "epoch": 1.36, + "learning_rate": 1.2007861388230404e-06, + "loss": 0.7246, + "step": 52974 + }, + { + "epoch": 1.36, + "learning_rate": 1.2007590317983456e-06, + "loss": 0.751, + "step": 52975 + }, + { + "epoch": 1.36, + "learning_rate": 1.200731924619939e-06, + "loss": 0.6436, + "step": 52976 + }, + { + "epoch": 1.36, + "learning_rate": 1.2007048172878409e-06, + "loss": 0.5481, + "step": 52977 + }, + { + "epoch": 1.36, + "learning_rate": 1.2006777098020728e-06, + "loss": 0.8057, + "step": 52978 + }, + { + "epoch": 1.36, + "learning_rate": 1.2006506021626548e-06, + "loss": 0.8311, + "step": 52979 + }, + { + "epoch": 1.36, + "learning_rate": 1.2006234943696078e-06, + "loss": 0.6108, + "step": 52980 + }, + { + "epoch": 1.36, + "learning_rate": 1.2005963864229526e-06, + "loss": 0.6143, + "step": 52981 + }, + { + "epoch": 1.36, + "learning_rate": 1.20056927832271e-06, + "loss": 0.6978, + "step": 52982 + }, + { + "epoch": 1.36, + "learning_rate": 1.2005421700689007e-06, + "loss": 0.6719, + "step": 52983 + }, + { + "epoch": 1.36, + "learning_rate": 1.2005150616615453e-06, + "loss": 0.5957, + "step": 52984 + }, + { + "epoch": 1.36, + "learning_rate": 1.200487953100665e-06, + "loss": 0.6067, + "step": 52985 + }, + { + "epoch": 1.36, + "learning_rate": 1.20046084438628e-06, + "loss": 0.6211, + "step": 52986 + }, + { + "epoch": 1.36, + "learning_rate": 1.2004337355184118e-06, + "loss": 0.5889, + "step": 52987 + }, + { + "epoch": 1.36, + "learning_rate": 1.2004066264970805e-06, + "loss": 0.7842, + "step": 52988 + }, + { + "epoch": 1.36, + "learning_rate": 1.2003795173223072e-06, + "loss": 0.6182, + "step": 52989 + }, + { + "epoch": 1.36, + "learning_rate": 1.2003524079941124e-06, + "loss": 0.5646, + "step": 52990 + }, + { + "epoch": 1.36, + "learning_rate": 1.2003252985125168e-06, + "loss": 0.7178, + "step": 52991 + }, + { + "epoch": 1.36, + "learning_rate": 1.2002981888775411e-06, + "loss": 0.5605, + "step": 52992 + }, + { + "epoch": 1.36, + "learning_rate": 1.2002710790892072e-06, + "loss": 0.7646, + "step": 52993 + }, + { + "epoch": 1.36, + "learning_rate": 1.2002439691475342e-06, + "loss": 0.6982, + "step": 52994 + }, + { + "epoch": 1.36, + "learning_rate": 1.2002168590525438e-06, + "loss": 0.707, + "step": 52995 + }, + { + "epoch": 1.36, + "learning_rate": 1.2001897488042566e-06, + "loss": 0.7217, + "step": 52996 + }, + { + "epoch": 1.36, + "learning_rate": 1.2001626384026932e-06, + "loss": 0.6333, + "step": 52997 + }, + { + "epoch": 1.36, + "learning_rate": 1.2001355278478747e-06, + "loss": 0.4363, + "step": 52998 + }, + { + "epoch": 1.36, + "learning_rate": 1.2001084171398215e-06, + "loss": 0.7334, + "step": 52999 + }, + { + "epoch": 1.36, + "learning_rate": 1.200081306278554e-06, + "loss": 0.7031, + "step": 53000 + }, + { + "epoch": 1.36, + "learning_rate": 1.2000541952640942e-06, + "loss": 0.5781, + "step": 53001 + }, + { + "epoch": 1.36, + "learning_rate": 1.2000270840964617e-06, + "loss": 0.6768, + "step": 53002 + }, + { + "epoch": 1.36, + "learning_rate": 1.1999999727756777e-06, + "loss": 0.7734, + "step": 53003 + }, + { + "epoch": 1.36, + "learning_rate": 1.1999728613017632e-06, + "loss": 0.7168, + "step": 53004 + }, + { + "epoch": 1.36, + "learning_rate": 1.1999457496747386e-06, + "loss": 0.6699, + "step": 53005 + }, + { + "epoch": 1.36, + "learning_rate": 1.1999186378946242e-06, + "loss": 0.5391, + "step": 53006 + }, + { + "epoch": 1.36, + "learning_rate": 1.199891525961442e-06, + "loss": 0.6187, + "step": 53007 + }, + { + "epoch": 1.36, + "learning_rate": 1.1998644138752117e-06, + "loss": 0.5884, + "step": 53008 + }, + { + "epoch": 1.36, + "learning_rate": 1.1998373016359543e-06, + "loss": 0.6885, + "step": 53009 + }, + { + "epoch": 1.36, + "learning_rate": 1.1998101892436907e-06, + "loss": 0.6602, + "step": 53010 + }, + { + "epoch": 1.36, + "learning_rate": 1.1997830766984415e-06, + "loss": 0.7031, + "step": 53011 + }, + { + "epoch": 1.36, + "learning_rate": 1.1997559640002281e-06, + "loss": 0.626, + "step": 53012 + }, + { + "epoch": 1.36, + "learning_rate": 1.1997288511490705e-06, + "loss": 0.6006, + "step": 53013 + }, + { + "epoch": 1.36, + "learning_rate": 1.1997017381449897e-06, + "loss": 0.7295, + "step": 53014 + }, + { + "epoch": 1.36, + "learning_rate": 1.1996746249880063e-06, + "loss": 0.6965, + "step": 53015 + }, + { + "epoch": 1.36, + "learning_rate": 1.1996475116781414e-06, + "loss": 0.6167, + "step": 53016 + }, + { + "epoch": 1.36, + "learning_rate": 1.1996203982154153e-06, + "loss": 0.5044, + "step": 53017 + }, + { + "epoch": 1.36, + "learning_rate": 1.1995932845998496e-06, + "loss": 0.626, + "step": 53018 + }, + { + "epoch": 1.36, + "learning_rate": 1.1995661708314639e-06, + "loss": 0.4576, + "step": 53019 + }, + { + "epoch": 1.36, + "learning_rate": 1.19953905691028e-06, + "loss": 0.647, + "step": 53020 + }, + { + "epoch": 1.36, + "learning_rate": 1.1995119428363178e-06, + "loss": 0.583, + "step": 53021 + }, + { + "epoch": 1.36, + "learning_rate": 1.199484828609599e-06, + "loss": 0.5718, + "step": 53022 + }, + { + "epoch": 1.36, + "learning_rate": 1.1994577142301433e-06, + "loss": 0.688, + "step": 53023 + }, + { + "epoch": 1.36, + "learning_rate": 1.1994305996979726e-06, + "loss": 0.6885, + "step": 53024 + }, + { + "epoch": 1.36, + "learning_rate": 1.1994034850131065e-06, + "loss": 0.5513, + "step": 53025 + }, + { + "epoch": 1.36, + "learning_rate": 1.1993763701755666e-06, + "loss": 0.5674, + "step": 53026 + }, + { + "epoch": 1.36, + "learning_rate": 1.1993492551853733e-06, + "loss": 0.5171, + "step": 53027 + }, + { + "epoch": 1.36, + "learning_rate": 1.1993221400425473e-06, + "loss": 0.5986, + "step": 53028 + }, + { + "epoch": 1.36, + "learning_rate": 1.1992950247471098e-06, + "loss": 0.5118, + "step": 53029 + }, + { + "epoch": 1.36, + "learning_rate": 1.199267909299081e-06, + "loss": 0.8975, + "step": 53030 + }, + { + "epoch": 1.36, + "learning_rate": 1.1992407936984822e-06, + "loss": 0.7842, + "step": 53031 + }, + { + "epoch": 1.36, + "learning_rate": 1.1992136779453337e-06, + "loss": 0.5962, + "step": 53032 + }, + { + "epoch": 1.36, + "learning_rate": 1.1991865620396567e-06, + "loss": 0.604, + "step": 53033 + }, + { + "epoch": 1.36, + "learning_rate": 1.199159445981471e-06, + "loss": 0.7373, + "step": 53034 + }, + { + "epoch": 1.36, + "learning_rate": 1.1991323297707987e-06, + "loss": 0.6504, + "step": 53035 + }, + { + "epoch": 1.36, + "learning_rate": 1.1991052134076599e-06, + "loss": 0.6196, + "step": 53036 + }, + { + "epoch": 1.36, + "learning_rate": 1.1990780968920754e-06, + "loss": 0.7178, + "step": 53037 + }, + { + "epoch": 1.36, + "learning_rate": 1.1990509802240658e-06, + "loss": 0.5977, + "step": 53038 + }, + { + "epoch": 1.36, + "learning_rate": 1.199023863403652e-06, + "loss": 0.7021, + "step": 53039 + }, + { + "epoch": 1.36, + "learning_rate": 1.1989967464308549e-06, + "loss": 0.7305, + "step": 53040 + }, + { + "epoch": 1.36, + "learning_rate": 1.198969629305695e-06, + "loss": 0.5879, + "step": 53041 + }, + { + "epoch": 1.36, + "learning_rate": 1.1989425120281932e-06, + "loss": 0.9111, + "step": 53042 + }, + { + "epoch": 1.36, + "learning_rate": 1.1989153945983706e-06, + "loss": 0.5662, + "step": 53043 + }, + { + "epoch": 1.36, + "learning_rate": 1.1988882770162472e-06, + "loss": 0.6738, + "step": 53044 + }, + { + "epoch": 1.36, + "learning_rate": 1.1988611592818446e-06, + "loss": 0.6895, + "step": 53045 + }, + { + "epoch": 1.36, + "learning_rate": 1.1988340413951826e-06, + "loss": 0.6133, + "step": 53046 + }, + { + "epoch": 1.36, + "learning_rate": 1.198806923356283e-06, + "loss": 0.3467, + "step": 53047 + }, + { + "epoch": 1.36, + "learning_rate": 1.1987798051651659e-06, + "loss": 0.791, + "step": 53048 + }, + { + "epoch": 1.36, + "learning_rate": 1.1987526868218523e-06, + "loss": 0.7119, + "step": 53049 + }, + { + "epoch": 1.36, + "learning_rate": 1.1987255683263627e-06, + "loss": 0.8555, + "step": 53050 + }, + { + "epoch": 1.36, + "learning_rate": 1.1986984496787182e-06, + "loss": 0.707, + "step": 53051 + }, + { + "epoch": 1.36, + "learning_rate": 1.1986713308789397e-06, + "loss": 0.7656, + "step": 53052 + }, + { + "epoch": 1.36, + "learning_rate": 1.1986442119270473e-06, + "loss": 0.5557, + "step": 53053 + }, + { + "epoch": 1.36, + "learning_rate": 1.1986170928230623e-06, + "loss": 0.6001, + "step": 53054 + }, + { + "epoch": 1.36, + "learning_rate": 1.1985899735670053e-06, + "loss": 0.709, + "step": 53055 + }, + { + "epoch": 1.36, + "learning_rate": 1.1985628541588972e-06, + "loss": 0.6172, + "step": 53056 + }, + { + "epoch": 1.36, + "learning_rate": 1.1985357345987588e-06, + "loss": 0.6111, + "step": 53057 + }, + { + "epoch": 1.36, + "learning_rate": 1.1985086148866103e-06, + "loss": 0.6348, + "step": 53058 + }, + { + "epoch": 1.36, + "learning_rate": 1.198481495022473e-06, + "loss": 0.7979, + "step": 53059 + }, + { + "epoch": 1.36, + "learning_rate": 1.1984543750063678e-06, + "loss": 0.5322, + "step": 53060 + }, + { + "epoch": 1.36, + "learning_rate": 1.1984272548383149e-06, + "loss": 0.5063, + "step": 53061 + }, + { + "epoch": 1.36, + "learning_rate": 1.198400134518336e-06, + "loss": 0.4961, + "step": 53062 + }, + { + "epoch": 1.36, + "learning_rate": 1.1983730140464502e-06, + "loss": 0.7344, + "step": 53063 + }, + { + "epoch": 1.36, + "learning_rate": 1.1983458934226802e-06, + "loss": 0.5815, + "step": 53064 + }, + { + "epoch": 1.36, + "learning_rate": 1.1983187726470454e-06, + "loss": 0.8223, + "step": 53065 + }, + { + "epoch": 1.36, + "learning_rate": 1.1982916517195671e-06, + "loss": 0.5825, + "step": 53066 + }, + { + "epoch": 1.36, + "learning_rate": 1.1982645306402664e-06, + "loss": 0.5166, + "step": 53067 + }, + { + "epoch": 1.36, + "learning_rate": 1.1982374094091632e-06, + "loss": 0.7529, + "step": 53068 + }, + { + "epoch": 1.36, + "learning_rate": 1.1982102880262788e-06, + "loss": 0.6299, + "step": 53069 + }, + { + "epoch": 1.36, + "learning_rate": 1.198183166491634e-06, + "loss": 0.4932, + "step": 53070 + }, + { + "epoch": 1.36, + "learning_rate": 1.1981560448052493e-06, + "loss": 0.7666, + "step": 53071 + }, + { + "epoch": 1.36, + "learning_rate": 1.198128922967146e-06, + "loss": 0.4243, + "step": 53072 + }, + { + "epoch": 1.36, + "learning_rate": 1.198101800977344e-06, + "loss": 0.7305, + "step": 53073 + }, + { + "epoch": 1.36, + "learning_rate": 1.1980746788358649e-06, + "loss": 0.6074, + "step": 53074 + }, + { + "epoch": 1.36, + "learning_rate": 1.198047556542729e-06, + "loss": 0.5547, + "step": 53075 + }, + { + "epoch": 1.36, + "learning_rate": 1.1980204340979573e-06, + "loss": 0.4724, + "step": 53076 + }, + { + "epoch": 1.36, + "learning_rate": 1.1979933115015703e-06, + "loss": 0.812, + "step": 53077 + }, + { + "epoch": 1.36, + "learning_rate": 1.197966188753589e-06, + "loss": 0.8213, + "step": 53078 + }, + { + "epoch": 1.36, + "learning_rate": 1.1979390658540342e-06, + "loss": 0.5547, + "step": 53079 + }, + { + "epoch": 1.36, + "learning_rate": 1.1979119428029264e-06, + "loss": 0.5439, + "step": 53080 + }, + { + "epoch": 1.36, + "learning_rate": 1.1978848196002864e-06, + "loss": 0.7139, + "step": 53081 + }, + { + "epoch": 1.36, + "learning_rate": 1.1978576962461356e-06, + "loss": 0.6924, + "step": 53082 + }, + { + "epoch": 1.36, + "learning_rate": 1.197830572740494e-06, + "loss": 0.7686, + "step": 53083 + }, + { + "epoch": 1.36, + "learning_rate": 1.1978034490833825e-06, + "loss": 0.7031, + "step": 53084 + }, + { + "epoch": 1.36, + "learning_rate": 1.197776325274822e-06, + "loss": 0.5586, + "step": 53085 + }, + { + "epoch": 1.36, + "learning_rate": 1.197749201314833e-06, + "loss": 0.584, + "step": 53086 + }, + { + "epoch": 1.36, + "learning_rate": 1.1977220772034373e-06, + "loss": 0.7935, + "step": 53087 + }, + { + "epoch": 1.36, + "learning_rate": 1.1976949529406541e-06, + "loss": 0.7002, + "step": 53088 + }, + { + "epoch": 1.36, + "learning_rate": 1.1976678285265057e-06, + "loss": 0.4824, + "step": 53089 + }, + { + "epoch": 1.36, + "learning_rate": 1.1976407039610115e-06, + "loss": 0.7656, + "step": 53090 + }, + { + "epoch": 1.36, + "learning_rate": 1.197613579244193e-06, + "loss": 0.75, + "step": 53091 + }, + { + "epoch": 1.36, + "learning_rate": 1.1975864543760712e-06, + "loss": 0.7588, + "step": 53092 + }, + { + "epoch": 1.36, + "learning_rate": 1.1975593293566664e-06, + "loss": 0.5659, + "step": 53093 + }, + { + "epoch": 1.36, + "learning_rate": 1.1975322041859994e-06, + "loss": 0.5076, + "step": 53094 + }, + { + "epoch": 1.36, + "learning_rate": 1.1975050788640913e-06, + "loss": 0.7012, + "step": 53095 + }, + { + "epoch": 1.36, + "learning_rate": 1.1974779533909622e-06, + "loss": 0.5815, + "step": 53096 + }, + { + "epoch": 1.36, + "learning_rate": 1.1974508277666339e-06, + "loss": 0.7451, + "step": 53097 + }, + { + "epoch": 1.36, + "learning_rate": 1.1974237019911262e-06, + "loss": 0.6958, + "step": 53098 + }, + { + "epoch": 1.36, + "learning_rate": 1.19739657606446e-06, + "loss": 0.4722, + "step": 53099 + }, + { + "epoch": 1.36, + "learning_rate": 1.1973694499866566e-06, + "loss": 0.6172, + "step": 53100 + }, + { + "epoch": 1.36, + "learning_rate": 1.1973423237577365e-06, + "loss": 0.5879, + "step": 53101 + }, + { + "epoch": 1.36, + "learning_rate": 1.197315197377721e-06, + "loss": 0.708, + "step": 53102 + }, + { + "epoch": 1.36, + "learning_rate": 1.1972880708466294e-06, + "loss": 0.5034, + "step": 53103 + }, + { + "epoch": 1.36, + "learning_rate": 1.1972609441644838e-06, + "loss": 0.5271, + "step": 53104 + }, + { + "epoch": 1.36, + "learning_rate": 1.1972338173313046e-06, + "loss": 0.5708, + "step": 53105 + }, + { + "epoch": 1.36, + "learning_rate": 1.1972066903471125e-06, + "loss": 0.7139, + "step": 53106 + }, + { + "epoch": 1.36, + "learning_rate": 1.1971795632119283e-06, + "loss": 0.7764, + "step": 53107 + }, + { + "epoch": 1.36, + "learning_rate": 1.197152435925773e-06, + "loss": 0.6274, + "step": 53108 + }, + { + "epoch": 1.36, + "learning_rate": 1.1971253084886667e-06, + "loss": 0.5254, + "step": 53109 + }, + { + "epoch": 1.36, + "learning_rate": 1.1970981809006308e-06, + "loss": 0.4862, + "step": 53110 + }, + { + "epoch": 1.36, + "learning_rate": 1.197071053161686e-06, + "loss": 0.7363, + "step": 53111 + }, + { + "epoch": 1.36, + "learning_rate": 1.1970439252718532e-06, + "loss": 0.7979, + "step": 53112 + }, + { + "epoch": 1.36, + "learning_rate": 1.1970167972311523e-06, + "loss": 0.7295, + "step": 53113 + }, + { + "epoch": 1.36, + "learning_rate": 1.196989669039605e-06, + "loss": 0.6602, + "step": 53114 + }, + { + "epoch": 1.36, + "learning_rate": 1.1969625406972318e-06, + "loss": 0.7617, + "step": 53115 + }, + { + "epoch": 1.36, + "learning_rate": 1.1969354122040533e-06, + "loss": 0.5861, + "step": 53116 + }, + { + "epoch": 1.36, + "learning_rate": 1.1969082835600908e-06, + "loss": 0.7461, + "step": 53117 + }, + { + "epoch": 1.36, + "learning_rate": 1.1968811547653641e-06, + "loss": 0.6689, + "step": 53118 + }, + { + "epoch": 1.36, + "learning_rate": 1.1968540258198952e-06, + "loss": 0.5601, + "step": 53119 + }, + { + "epoch": 1.36, + "learning_rate": 1.1968268967237035e-06, + "loss": 0.7021, + "step": 53120 + }, + { + "epoch": 1.36, + "learning_rate": 1.1967997674768112e-06, + "loss": 0.4207, + "step": 53121 + }, + { + "epoch": 1.36, + "learning_rate": 1.196772638079238e-06, + "loss": 0.6826, + "step": 53122 + }, + { + "epoch": 1.36, + "learning_rate": 1.1967455085310052e-06, + "loss": 0.6274, + "step": 53123 + }, + { + "epoch": 1.36, + "learning_rate": 1.196718378832133e-06, + "loss": 0.6099, + "step": 53124 + }, + { + "epoch": 1.36, + "learning_rate": 1.196691248982643e-06, + "loss": 0.6899, + "step": 53125 + }, + { + "epoch": 1.36, + "learning_rate": 1.1966641189825552e-06, + "loss": 0.666, + "step": 53126 + }, + { + "epoch": 1.36, + "learning_rate": 1.1966369888318912e-06, + "loss": 0.793, + "step": 53127 + }, + { + "epoch": 1.36, + "learning_rate": 1.1966098585306709e-06, + "loss": 0.8486, + "step": 53128 + }, + { + "epoch": 1.36, + "learning_rate": 1.1965827280789159e-06, + "loss": 0.6284, + "step": 53129 + }, + { + "epoch": 1.36, + "learning_rate": 1.196555597476646e-06, + "loss": 0.8975, + "step": 53130 + }, + { + "epoch": 1.36, + "learning_rate": 1.1965284667238829e-06, + "loss": 0.6943, + "step": 53131 + }, + { + "epoch": 1.36, + "learning_rate": 1.196501335820647e-06, + "loss": 0.5811, + "step": 53132 + }, + { + "epoch": 1.36, + "learning_rate": 1.196474204766959e-06, + "loss": 0.6904, + "step": 53133 + }, + { + "epoch": 1.36, + "learning_rate": 1.1964470735628395e-06, + "loss": 0.5835, + "step": 53134 + }, + { + "epoch": 1.36, + "learning_rate": 1.1964199422083096e-06, + "loss": 0.561, + "step": 53135 + }, + { + "epoch": 1.36, + "learning_rate": 1.19639281070339e-06, + "loss": 0.5415, + "step": 53136 + }, + { + "epoch": 1.36, + "learning_rate": 1.1963656790481015e-06, + "loss": 0.667, + "step": 53137 + }, + { + "epoch": 1.36, + "learning_rate": 1.1963385472424651e-06, + "loss": 0.5693, + "step": 53138 + }, + { + "epoch": 1.36, + "learning_rate": 1.196311415286501e-06, + "loss": 0.5659, + "step": 53139 + }, + { + "epoch": 1.36, + "learning_rate": 1.1962842831802301e-06, + "loss": 0.6211, + "step": 53140 + }, + { + "epoch": 1.36, + "learning_rate": 1.1962571509236738e-06, + "loss": 0.7188, + "step": 53141 + }, + { + "epoch": 1.36, + "learning_rate": 1.1962300185168524e-06, + "loss": 0.6904, + "step": 53142 + }, + { + "epoch": 1.36, + "learning_rate": 1.1962028859597864e-06, + "loss": 0.6992, + "step": 53143 + }, + { + "epoch": 1.36, + "learning_rate": 1.196175753252497e-06, + "loss": 0.6631, + "step": 53144 + }, + { + "epoch": 1.36, + "learning_rate": 1.1961486203950045e-06, + "loss": 0.5298, + "step": 53145 + }, + { + "epoch": 1.36, + "learning_rate": 1.1961214873873304e-06, + "loss": 0.6768, + "step": 53146 + }, + { + "epoch": 1.36, + "learning_rate": 1.1960943542294952e-06, + "loss": 0.6377, + "step": 53147 + }, + { + "epoch": 1.36, + "learning_rate": 1.1960672209215195e-06, + "loss": 0.7256, + "step": 53148 + }, + { + "epoch": 1.36, + "learning_rate": 1.196040087463424e-06, + "loss": 0.7188, + "step": 53149 + }, + { + "epoch": 1.36, + "learning_rate": 1.1960129538552296e-06, + "loss": 0.6943, + "step": 53150 + }, + { + "epoch": 1.36, + "learning_rate": 1.195985820096957e-06, + "loss": 0.6665, + "step": 53151 + }, + { + "epoch": 1.36, + "learning_rate": 1.1959586861886276e-06, + "loss": 0.7266, + "step": 53152 + }, + { + "epoch": 1.36, + "learning_rate": 1.1959315521302611e-06, + "loss": 0.7061, + "step": 53153 + }, + { + "epoch": 1.36, + "learning_rate": 1.1959044179218792e-06, + "loss": 0.7598, + "step": 53154 + }, + { + "epoch": 1.36, + "learning_rate": 1.1958772835635017e-06, + "loss": 0.6816, + "step": 53155 + }, + { + "epoch": 1.36, + "learning_rate": 1.1958501490551505e-06, + "loss": 0.5848, + "step": 53156 + }, + { + "epoch": 1.36, + "learning_rate": 1.1958230143968458e-06, + "loss": 0.6973, + "step": 53157 + }, + { + "epoch": 1.36, + "learning_rate": 1.1957958795886085e-06, + "loss": 0.9038, + "step": 53158 + }, + { + "epoch": 1.36, + "learning_rate": 1.1957687446304589e-06, + "loss": 0.5923, + "step": 53159 + }, + { + "epoch": 1.36, + "learning_rate": 1.1957416095224185e-06, + "loss": 0.7295, + "step": 53160 + }, + { + "epoch": 1.36, + "learning_rate": 1.1957144742645075e-06, + "loss": 0.6738, + "step": 53161 + }, + { + "epoch": 1.36, + "learning_rate": 1.1956873388567472e-06, + "loss": 0.6992, + "step": 53162 + }, + { + "epoch": 1.36, + "learning_rate": 1.195660203299158e-06, + "loss": 0.5942, + "step": 53163 + }, + { + "epoch": 1.36, + "learning_rate": 1.1956330675917605e-06, + "loss": 0.5771, + "step": 53164 + }, + { + "epoch": 1.36, + "learning_rate": 1.195605931734576e-06, + "loss": 0.7314, + "step": 53165 + }, + { + "epoch": 1.36, + "learning_rate": 1.1955787957276251e-06, + "loss": 0.7373, + "step": 53166 + }, + { + "epoch": 1.36, + "learning_rate": 1.1955516595709287e-06, + "loss": 0.5996, + "step": 53167 + }, + { + "epoch": 1.36, + "learning_rate": 1.195524523264507e-06, + "loss": 0.6313, + "step": 53168 + }, + { + "epoch": 1.36, + "learning_rate": 1.1954973868083812e-06, + "loss": 0.5063, + "step": 53169 + }, + { + "epoch": 1.36, + "learning_rate": 1.1954702502025723e-06, + "loss": 0.7671, + "step": 53170 + }, + { + "epoch": 1.36, + "learning_rate": 1.1954431134471007e-06, + "loss": 0.5225, + "step": 53171 + }, + { + "epoch": 1.36, + "learning_rate": 1.1954159765419873e-06, + "loss": 0.6885, + "step": 53172 + }, + { + "epoch": 1.36, + "learning_rate": 1.1953888394872528e-06, + "loss": 0.6641, + "step": 53173 + }, + { + "epoch": 1.36, + "learning_rate": 1.1953617022829181e-06, + "loss": 0.3948, + "step": 53174 + }, + { + "epoch": 1.36, + "learning_rate": 1.195334564929004e-06, + "loss": 0.7246, + "step": 53175 + }, + { + "epoch": 1.36, + "learning_rate": 1.1953074274255309e-06, + "loss": 0.4675, + "step": 53176 + }, + { + "epoch": 1.36, + "learning_rate": 1.1952802897725203e-06, + "loss": 0.4858, + "step": 53177 + }, + { + "epoch": 1.36, + "learning_rate": 1.1952531519699923e-06, + "loss": 0.7358, + "step": 53178 + }, + { + "epoch": 1.36, + "learning_rate": 1.195226014017968e-06, + "loss": 0.7563, + "step": 53179 + }, + { + "epoch": 1.36, + "learning_rate": 1.195198875916468e-06, + "loss": 0.6201, + "step": 53180 + }, + { + "epoch": 1.36, + "learning_rate": 1.1951717376655132e-06, + "loss": 0.6494, + "step": 53181 + }, + { + "epoch": 1.36, + "learning_rate": 1.1951445992651248e-06, + "loss": 0.708, + "step": 53182 + }, + { + "epoch": 1.36, + "learning_rate": 1.1951174607153227e-06, + "loss": 0.6602, + "step": 53183 + }, + { + "epoch": 1.36, + "learning_rate": 1.1950903220161284e-06, + "loss": 0.5996, + "step": 53184 + }, + { + "epoch": 1.36, + "learning_rate": 1.1950631831675621e-06, + "loss": 0.5674, + "step": 53185 + }, + { + "epoch": 1.36, + "learning_rate": 1.195036044169645e-06, + "loss": 0.7412, + "step": 53186 + }, + { + "epoch": 1.36, + "learning_rate": 1.1950089050223979e-06, + "loss": 0.6277, + "step": 53187 + }, + { + "epoch": 1.36, + "learning_rate": 1.1949817657258416e-06, + "loss": 0.6377, + "step": 53188 + }, + { + "epoch": 1.36, + "learning_rate": 1.1949546262799964e-06, + "loss": 0.5037, + "step": 53189 + }, + { + "epoch": 1.36, + "learning_rate": 1.1949274866848835e-06, + "loss": 0.6533, + "step": 53190 + }, + { + "epoch": 1.36, + "learning_rate": 1.1949003469405235e-06, + "loss": 0.7773, + "step": 53191 + }, + { + "epoch": 1.36, + "learning_rate": 1.1948732070469376e-06, + "loss": 0.5015, + "step": 53192 + }, + { + "epoch": 1.36, + "learning_rate": 1.1948460670041457e-06, + "loss": 0.6533, + "step": 53193 + }, + { + "epoch": 1.36, + "learning_rate": 1.1948189268121697e-06, + "loss": 0.6089, + "step": 53194 + }, + { + "epoch": 1.36, + "learning_rate": 1.1947917864710296e-06, + "loss": 0.5381, + "step": 53195 + }, + { + "epoch": 1.36, + "learning_rate": 1.1947646459807464e-06, + "loss": 0.7314, + "step": 53196 + }, + { + "epoch": 1.36, + "learning_rate": 1.1947375053413407e-06, + "loss": 0.7192, + "step": 53197 + }, + { + "epoch": 1.36, + "learning_rate": 1.1947103645528335e-06, + "loss": 0.5615, + "step": 53198 + }, + { + "epoch": 1.36, + "learning_rate": 1.1946832236152456e-06, + "loss": 0.6221, + "step": 53199 + }, + { + "epoch": 1.36, + "learning_rate": 1.1946560825285976e-06, + "loss": 0.4744, + "step": 53200 + }, + { + "epoch": 1.36, + "learning_rate": 1.1946289412929106e-06, + "loss": 0.6709, + "step": 53201 + }, + { + "epoch": 1.36, + "learning_rate": 1.1946017999082053e-06, + "loss": 0.5996, + "step": 53202 + }, + { + "epoch": 1.36, + "learning_rate": 1.1945746583745018e-06, + "loss": 0.4644, + "step": 53203 + }, + { + "epoch": 1.36, + "learning_rate": 1.1945475166918217e-06, + "loss": 0.5981, + "step": 53204 + }, + { + "epoch": 1.36, + "learning_rate": 1.1945203748601856e-06, + "loss": 0.7217, + "step": 53205 + }, + { + "epoch": 1.36, + "learning_rate": 1.194493232879614e-06, + "loss": 0.5337, + "step": 53206 + }, + { + "epoch": 1.36, + "learning_rate": 1.1944660907501281e-06, + "loss": 0.9414, + "step": 53207 + }, + { + "epoch": 1.36, + "learning_rate": 1.1944389484717482e-06, + "loss": 0.5117, + "step": 53208 + }, + { + "epoch": 1.36, + "learning_rate": 1.1944118060444957e-06, + "loss": 0.5406, + "step": 53209 + }, + { + "epoch": 1.36, + "learning_rate": 1.1943846634683907e-06, + "loss": 0.6943, + "step": 53210 + }, + { + "epoch": 1.36, + "learning_rate": 1.1943575207434544e-06, + "loss": 0.6826, + "step": 53211 + }, + { + "epoch": 1.36, + "learning_rate": 1.1943303778697075e-06, + "loss": 0.5552, + "step": 53212 + }, + { + "epoch": 1.36, + "learning_rate": 1.1943032348471708e-06, + "loss": 0.6943, + "step": 53213 + }, + { + "epoch": 1.36, + "learning_rate": 1.1942760916758649e-06, + "loss": 0.6699, + "step": 53214 + }, + { + "epoch": 1.36, + "learning_rate": 1.1942489483558108e-06, + "loss": 0.7607, + "step": 53215 + }, + { + "epoch": 1.36, + "learning_rate": 1.1942218048870295e-06, + "loss": 0.7412, + "step": 53216 + }, + { + "epoch": 1.36, + "learning_rate": 1.1941946612695413e-06, + "loss": 0.5664, + "step": 53217 + }, + { + "epoch": 1.36, + "learning_rate": 1.194167517503367e-06, + "loss": 0.6758, + "step": 53218 + }, + { + "epoch": 1.36, + "learning_rate": 1.1941403735885278e-06, + "loss": 0.4351, + "step": 53219 + }, + { + "epoch": 1.36, + "learning_rate": 1.194113229525044e-06, + "loss": 0.4722, + "step": 53220 + }, + { + "epoch": 1.36, + "learning_rate": 1.194086085312937e-06, + "loss": 0.6252, + "step": 53221 + }, + { + "epoch": 1.36, + "learning_rate": 1.1940589409522269e-06, + "loss": 0.6572, + "step": 53222 + }, + { + "epoch": 1.36, + "learning_rate": 1.194031796442935e-06, + "loss": 0.7656, + "step": 53223 + }, + { + "epoch": 1.36, + "learning_rate": 1.1940046517850815e-06, + "loss": 0.5815, + "step": 53224 + }, + { + "epoch": 1.36, + "learning_rate": 1.1939775069786878e-06, + "loss": 0.707, + "step": 53225 + }, + { + "epoch": 1.36, + "learning_rate": 1.1939503620237744e-06, + "loss": 0.6841, + "step": 53226 + }, + { + "epoch": 1.36, + "learning_rate": 1.1939232169203621e-06, + "loss": 0.7773, + "step": 53227 + }, + { + "epoch": 1.36, + "learning_rate": 1.1938960716684718e-06, + "loss": 0.6772, + "step": 53228 + }, + { + "epoch": 1.36, + "learning_rate": 1.193868926268124e-06, + "loss": 0.6543, + "step": 53229 + }, + { + "epoch": 1.36, + "learning_rate": 1.19384178071934e-06, + "loss": 0.6538, + "step": 53230 + }, + { + "epoch": 1.36, + "learning_rate": 1.1938146350221401e-06, + "loss": 0.7305, + "step": 53231 + }, + { + "epoch": 1.36, + "learning_rate": 1.1937874891765453e-06, + "loss": 0.6855, + "step": 53232 + }, + { + "epoch": 1.36, + "learning_rate": 1.1937603431825762e-06, + "loss": 0.5825, + "step": 53233 + }, + { + "epoch": 1.36, + "learning_rate": 1.1937331970402537e-06, + "loss": 0.6211, + "step": 53234 + }, + { + "epoch": 1.36, + "learning_rate": 1.1937060507495986e-06, + "loss": 0.6826, + "step": 53235 + }, + { + "epoch": 1.36, + "learning_rate": 1.193678904310632e-06, + "loss": 0.7959, + "step": 53236 + }, + { + "epoch": 1.36, + "learning_rate": 1.1936517577233743e-06, + "loss": 0.7632, + "step": 53237 + }, + { + "epoch": 1.36, + "learning_rate": 1.193624610987846e-06, + "loss": 0.6826, + "step": 53238 + }, + { + "epoch": 1.36, + "learning_rate": 1.1935974641040684e-06, + "loss": 0.5571, + "step": 53239 + }, + { + "epoch": 1.36, + "learning_rate": 1.1935703170720623e-06, + "loss": 0.4951, + "step": 53240 + }, + { + "epoch": 1.36, + "learning_rate": 1.1935431698918479e-06, + "loss": 0.7461, + "step": 53241 + }, + { + "epoch": 1.36, + "learning_rate": 1.1935160225634471e-06, + "loss": 0.6152, + "step": 53242 + }, + { + "epoch": 1.36, + "learning_rate": 1.1934888750868792e-06, + "loss": 0.6548, + "step": 53243 + }, + { + "epoch": 1.36, + "learning_rate": 1.1934617274621664e-06, + "loss": 0.6904, + "step": 53244 + }, + { + "epoch": 1.36, + "learning_rate": 1.1934345796893284e-06, + "loss": 0.6162, + "step": 53245 + }, + { + "epoch": 1.36, + "learning_rate": 1.1934074317683866e-06, + "loss": 0.5151, + "step": 53246 + }, + { + "epoch": 1.36, + "learning_rate": 1.1933802836993617e-06, + "loss": 0.6084, + "step": 53247 + }, + { + "epoch": 1.36, + "learning_rate": 1.1933531354822743e-06, + "loss": 0.5518, + "step": 53248 + }, + { + "epoch": 1.36, + "learning_rate": 1.1933259871171453e-06, + "loss": 0.7607, + "step": 53249 + }, + { + "epoch": 1.36, + "learning_rate": 1.1932988386039956e-06, + "loss": 0.4438, + "step": 53250 + }, + { + "epoch": 1.36, + "learning_rate": 1.1932716899428455e-06, + "loss": 0.4241, + "step": 53251 + }, + { + "epoch": 1.36, + "learning_rate": 1.1932445411337164e-06, + "loss": 0.5088, + "step": 53252 + }, + { + "epoch": 1.36, + "learning_rate": 1.193217392176629e-06, + "loss": 0.9141, + "step": 53253 + }, + { + "epoch": 1.36, + "learning_rate": 1.1931902430716037e-06, + "loss": 0.6943, + "step": 53254 + }, + { + "epoch": 1.36, + "learning_rate": 1.1931630938186617e-06, + "loss": 0.7109, + "step": 53255 + }, + { + "epoch": 1.36, + "learning_rate": 1.1931359444178234e-06, + "loss": 0.5718, + "step": 53256 + }, + { + "epoch": 1.37, + "learning_rate": 1.19310879486911e-06, + "loss": 0.7998, + "step": 53257 + }, + { + "epoch": 1.37, + "learning_rate": 1.1930816451725417e-06, + "loss": 0.5977, + "step": 53258 + }, + { + "epoch": 1.37, + "learning_rate": 1.1930544953281402e-06, + "loss": 0.7725, + "step": 53259 + }, + { + "epoch": 1.37, + "learning_rate": 1.1930273453359255e-06, + "loss": 0.5359, + "step": 53260 + }, + { + "epoch": 1.37, + "learning_rate": 1.1930001951959185e-06, + "loss": 0.4628, + "step": 53261 + }, + { + "epoch": 1.37, + "learning_rate": 1.1929730449081403e-06, + "loss": 0.4663, + "step": 53262 + }, + { + "epoch": 1.37, + "learning_rate": 1.1929458944726116e-06, + "loss": 0.6816, + "step": 53263 + }, + { + "epoch": 1.37, + "learning_rate": 1.1929187438893528e-06, + "loss": 0.6492, + "step": 53264 + }, + { + "epoch": 1.37, + "learning_rate": 1.1928915931583851e-06, + "loss": 0.6426, + "step": 53265 + }, + { + "epoch": 1.37, + "learning_rate": 1.192864442279729e-06, + "loss": 0.6323, + "step": 53266 + }, + { + "epoch": 1.37, + "learning_rate": 1.192837291253406e-06, + "loss": 0.7749, + "step": 53267 + }, + { + "epoch": 1.37, + "learning_rate": 1.1928101400794362e-06, + "loss": 0.752, + "step": 53268 + }, + { + "epoch": 1.37, + "learning_rate": 1.1927829887578403e-06, + "loss": 0.5405, + "step": 53269 + }, + { + "epoch": 1.37, + "learning_rate": 1.1927558372886392e-06, + "loss": 0.7607, + "step": 53270 + }, + { + "epoch": 1.37, + "learning_rate": 1.192728685671854e-06, + "loss": 0.7227, + "step": 53271 + }, + { + "epoch": 1.37, + "learning_rate": 1.1927015339075056e-06, + "loss": 0.6895, + "step": 53272 + }, + { + "epoch": 1.37, + "learning_rate": 1.192674381995614e-06, + "loss": 0.5159, + "step": 53273 + }, + { + "epoch": 1.37, + "learning_rate": 1.1926472299362009e-06, + "loss": 0.7324, + "step": 53274 + }, + { + "epoch": 1.37, + "learning_rate": 1.1926200777292866e-06, + "loss": 0.5671, + "step": 53275 + }, + { + "epoch": 1.37, + "learning_rate": 1.1925929253748916e-06, + "loss": 0.6626, + "step": 53276 + }, + { + "epoch": 1.37, + "learning_rate": 1.1925657728730374e-06, + "loss": 0.4912, + "step": 53277 + }, + { + "epoch": 1.37, + "learning_rate": 1.1925386202237443e-06, + "loss": 0.5244, + "step": 53278 + }, + { + "epoch": 1.37, + "learning_rate": 1.1925114674270331e-06, + "loss": 0.7729, + "step": 53279 + }, + { + "epoch": 1.37, + "learning_rate": 1.1924843144829251e-06, + "loss": 0.6543, + "step": 53280 + }, + { + "epoch": 1.37, + "learning_rate": 1.1924571613914403e-06, + "loss": 0.6885, + "step": 53281 + }, + { + "epoch": 1.37, + "learning_rate": 1.1924300081526004e-06, + "loss": 0.4902, + "step": 53282 + }, + { + "epoch": 1.37, + "learning_rate": 1.1924028547664253e-06, + "loss": 0.3378, + "step": 53283 + }, + { + "epoch": 1.37, + "learning_rate": 1.1923757012329362e-06, + "loss": 0.7354, + "step": 53284 + }, + { + "epoch": 1.37, + "learning_rate": 1.192348547552154e-06, + "loss": 0.8594, + "step": 53285 + }, + { + "epoch": 1.37, + "learning_rate": 1.1923213937240995e-06, + "loss": 0.5061, + "step": 53286 + }, + { + "epoch": 1.37, + "learning_rate": 1.1922942397487932e-06, + "loss": 0.5928, + "step": 53287 + }, + { + "epoch": 1.37, + "learning_rate": 1.192267085626256e-06, + "loss": 0.6157, + "step": 53288 + }, + { + "epoch": 1.37, + "learning_rate": 1.1922399313565087e-06, + "loss": 0.6411, + "step": 53289 + }, + { + "epoch": 1.37, + "learning_rate": 1.1922127769395723e-06, + "loss": 0.7285, + "step": 53290 + }, + { + "epoch": 1.37, + "learning_rate": 1.192185622375467e-06, + "loss": 0.8135, + "step": 53291 + }, + { + "epoch": 1.37, + "learning_rate": 1.1921584676642144e-06, + "loss": 0.4991, + "step": 53292 + }, + { + "epoch": 1.37, + "learning_rate": 1.1921313128058348e-06, + "loss": 0.7314, + "step": 53293 + }, + { + "epoch": 1.37, + "learning_rate": 1.1921041578003493e-06, + "loss": 0.5481, + "step": 53294 + }, + { + "epoch": 1.37, + "learning_rate": 1.192077002647778e-06, + "loss": 0.6992, + "step": 53295 + }, + { + "epoch": 1.37, + "learning_rate": 1.1920498473481425e-06, + "loss": 0.5115, + "step": 53296 + }, + { + "epoch": 1.37, + "learning_rate": 1.1920226919014633e-06, + "loss": 0.7979, + "step": 53297 + }, + { + "epoch": 1.37, + "learning_rate": 1.1919955363077608e-06, + "loss": 0.5957, + "step": 53298 + }, + { + "epoch": 1.37, + "learning_rate": 1.1919683805670566e-06, + "loss": 0.8184, + "step": 53299 + }, + { + "epoch": 1.37, + "learning_rate": 1.1919412246793706e-06, + "loss": 0.6562, + "step": 53300 + }, + { + "epoch": 1.37, + "learning_rate": 1.1919140686447242e-06, + "loss": 0.6211, + "step": 53301 + }, + { + "epoch": 1.37, + "learning_rate": 1.1918869124631383e-06, + "loss": 0.8662, + "step": 53302 + }, + { + "epoch": 1.37, + "learning_rate": 1.1918597561346332e-06, + "loss": 0.7695, + "step": 53303 + }, + { + "epoch": 1.37, + "learning_rate": 1.1918325996592298e-06, + "loss": 0.791, + "step": 53304 + }, + { + "epoch": 1.37, + "learning_rate": 1.1918054430369492e-06, + "loss": 0.6416, + "step": 53305 + }, + { + "epoch": 1.37, + "learning_rate": 1.1917782862678117e-06, + "loss": 0.5977, + "step": 53306 + }, + { + "epoch": 1.37, + "learning_rate": 1.1917511293518389e-06, + "loss": 0.5016, + "step": 53307 + }, + { + "epoch": 1.37, + "learning_rate": 1.1917239722890507e-06, + "loss": 0.7861, + "step": 53308 + }, + { + "epoch": 1.37, + "learning_rate": 1.1916968150794682e-06, + "loss": 0.7188, + "step": 53309 + }, + { + "epoch": 1.37, + "learning_rate": 1.1916696577231121e-06, + "loss": 0.8291, + "step": 53310 + }, + { + "epoch": 1.37, + "learning_rate": 1.1916425002200038e-06, + "loss": 0.6084, + "step": 53311 + }, + { + "epoch": 1.37, + "learning_rate": 1.1916153425701636e-06, + "loss": 0.7588, + "step": 53312 + }, + { + "epoch": 1.37, + "learning_rate": 1.1915881847736124e-06, + "loss": 0.6875, + "step": 53313 + }, + { + "epoch": 1.37, + "learning_rate": 1.1915610268303706e-06, + "loss": 0.6221, + "step": 53314 + }, + { + "epoch": 1.37, + "learning_rate": 1.1915338687404597e-06, + "loss": 0.5605, + "step": 53315 + }, + { + "epoch": 1.37, + "learning_rate": 1.1915067105038996e-06, + "loss": 0.7109, + "step": 53316 + }, + { + "epoch": 1.37, + "learning_rate": 1.191479552120712e-06, + "loss": 0.5363, + "step": 53317 + }, + { + "epoch": 1.37, + "learning_rate": 1.1914523935909172e-06, + "loss": 0.5724, + "step": 53318 + }, + { + "epoch": 1.37, + "learning_rate": 1.1914252349145362e-06, + "loss": 0.6631, + "step": 53319 + }, + { + "epoch": 1.37, + "learning_rate": 1.1913980760915898e-06, + "loss": 0.665, + "step": 53320 + }, + { + "epoch": 1.37, + "learning_rate": 1.1913709171220985e-06, + "loss": 0.6533, + "step": 53321 + }, + { + "epoch": 1.37, + "learning_rate": 1.1913437580060834e-06, + "loss": 0.5752, + "step": 53322 + }, + { + "epoch": 1.37, + "learning_rate": 1.191316598743565e-06, + "loss": 0.4548, + "step": 53323 + }, + { + "epoch": 1.37, + "learning_rate": 1.1912894393345645e-06, + "loss": 0.4397, + "step": 53324 + }, + { + "epoch": 1.37, + "learning_rate": 1.1912622797791024e-06, + "loss": 0.6812, + "step": 53325 + }, + { + "epoch": 1.37, + "learning_rate": 1.1912351200771995e-06, + "loss": 0.7725, + "step": 53326 + }, + { + "epoch": 1.37, + "learning_rate": 1.1912079602288768e-06, + "loss": 0.6733, + "step": 53327 + }, + { + "epoch": 1.37, + "learning_rate": 1.1911808002341548e-06, + "loss": 0.6826, + "step": 53328 + }, + { + "epoch": 1.37, + "learning_rate": 1.1911536400930545e-06, + "loss": 0.5249, + "step": 53329 + }, + { + "epoch": 1.37, + "learning_rate": 1.1911264798055967e-06, + "loss": 0.6455, + "step": 53330 + }, + { + "epoch": 1.37, + "learning_rate": 1.191099319371802e-06, + "loss": 0.6174, + "step": 53331 + }, + { + "epoch": 1.37, + "learning_rate": 1.1910721587916916e-06, + "loss": 0.6555, + "step": 53332 + }, + { + "epoch": 1.37, + "learning_rate": 1.1910449980652858e-06, + "loss": 0.5996, + "step": 53333 + }, + { + "epoch": 1.37, + "learning_rate": 1.1910178371926059e-06, + "loss": 0.6914, + "step": 53334 + }, + { + "epoch": 1.37, + "learning_rate": 1.1909906761736718e-06, + "loss": 0.4974, + "step": 53335 + }, + { + "epoch": 1.37, + "learning_rate": 1.1909635150085055e-06, + "loss": 0.7676, + "step": 53336 + }, + { + "epoch": 1.37, + "learning_rate": 1.1909363536971271e-06, + "loss": 0.5776, + "step": 53337 + }, + { + "epoch": 1.37, + "learning_rate": 1.1909091922395576e-06, + "loss": 0.7446, + "step": 53338 + }, + { + "epoch": 1.37, + "learning_rate": 1.1908820306358174e-06, + "loss": 0.5693, + "step": 53339 + }, + { + "epoch": 1.37, + "learning_rate": 1.190854868885928e-06, + "loss": 0.6616, + "step": 53340 + }, + { + "epoch": 1.37, + "learning_rate": 1.1908277069899094e-06, + "loss": 0.5298, + "step": 53341 + }, + { + "epoch": 1.37, + "learning_rate": 1.1908005449477832e-06, + "loss": 0.5352, + "step": 53342 + }, + { + "epoch": 1.37, + "learning_rate": 1.1907733827595695e-06, + "loss": 0.7842, + "step": 53343 + }, + { + "epoch": 1.37, + "learning_rate": 1.1907462204252894e-06, + "loss": 0.665, + "step": 53344 + }, + { + "epoch": 1.37, + "learning_rate": 1.1907190579449638e-06, + "loss": 0.6328, + "step": 53345 + }, + { + "epoch": 1.37, + "learning_rate": 1.1906918953186134e-06, + "loss": 0.5237, + "step": 53346 + }, + { + "epoch": 1.37, + "learning_rate": 1.190664732546259e-06, + "loss": 0.5065, + "step": 53347 + }, + { + "epoch": 1.37, + "learning_rate": 1.190637569627921e-06, + "loss": 0.6523, + "step": 53348 + }, + { + "epoch": 1.37, + "learning_rate": 1.1906104065636212e-06, + "loss": 0.6426, + "step": 53349 + }, + { + "epoch": 1.37, + "learning_rate": 1.1905832433533794e-06, + "loss": 0.8516, + "step": 53350 + }, + { + "epoch": 1.37, + "learning_rate": 1.1905560799972173e-06, + "loss": 0.6914, + "step": 53351 + }, + { + "epoch": 1.37, + "learning_rate": 1.1905289164951544e-06, + "loss": 0.4146, + "step": 53352 + }, + { + "epoch": 1.37, + "learning_rate": 1.1905017528472126e-06, + "loss": 0.6782, + "step": 53353 + }, + { + "epoch": 1.37, + "learning_rate": 1.1904745890534123e-06, + "loss": 0.8125, + "step": 53354 + }, + { + "epoch": 1.37, + "learning_rate": 1.1904474251137744e-06, + "loss": 0.6299, + "step": 53355 + }, + { + "epoch": 1.37, + "learning_rate": 1.1904202610283199e-06, + "loss": 0.6602, + "step": 53356 + }, + { + "epoch": 1.37, + "learning_rate": 1.1903930967970692e-06, + "loss": 0.6548, + "step": 53357 + }, + { + "epoch": 1.37, + "learning_rate": 1.190365932420043e-06, + "loss": 0.8623, + "step": 53358 + }, + { + "epoch": 1.37, + "learning_rate": 1.1903387678972628e-06, + "loss": 0.7891, + "step": 53359 + }, + { + "epoch": 1.37, + "learning_rate": 1.1903116032287484e-06, + "loss": 0.6973, + "step": 53360 + }, + { + "epoch": 1.37, + "learning_rate": 1.1902844384145216e-06, + "loss": 0.6188, + "step": 53361 + }, + { + "epoch": 1.37, + "learning_rate": 1.1902572734546028e-06, + "loss": 0.6758, + "step": 53362 + }, + { + "epoch": 1.37, + "learning_rate": 1.1902301083490123e-06, + "loss": 0.6416, + "step": 53363 + }, + { + "epoch": 1.37, + "learning_rate": 1.1902029430977718e-06, + "loss": 0.6631, + "step": 53364 + }, + { + "epoch": 1.37, + "learning_rate": 1.1901757777009015e-06, + "loss": 0.7734, + "step": 53365 + }, + { + "epoch": 1.37, + "learning_rate": 1.1901486121584225e-06, + "loss": 0.688, + "step": 53366 + }, + { + "epoch": 1.37, + "learning_rate": 1.190121446470355e-06, + "loss": 0.6904, + "step": 53367 + }, + { + "epoch": 1.37, + "learning_rate": 1.1900942806367206e-06, + "loss": 0.605, + "step": 53368 + }, + { + "epoch": 1.37, + "learning_rate": 1.1900671146575396e-06, + "loss": 0.6143, + "step": 53369 + }, + { + "epoch": 1.37, + "learning_rate": 1.1900399485328332e-06, + "loss": 0.5825, + "step": 53370 + }, + { + "epoch": 1.37, + "learning_rate": 1.190012782262622e-06, + "loss": 0.5605, + "step": 53371 + }, + { + "epoch": 1.37, + "learning_rate": 1.1899856158469265e-06, + "loss": 0.8369, + "step": 53372 + }, + { + "epoch": 1.37, + "learning_rate": 1.1899584492857677e-06, + "loss": 0.7158, + "step": 53373 + }, + { + "epoch": 1.37, + "learning_rate": 1.1899312825791666e-06, + "loss": 0.6541, + "step": 53374 + }, + { + "epoch": 1.37, + "learning_rate": 1.1899041157271437e-06, + "loss": 0.7188, + "step": 53375 + }, + { + "epoch": 1.37, + "learning_rate": 1.1898769487297202e-06, + "loss": 0.6743, + "step": 53376 + }, + { + "epoch": 1.37, + "learning_rate": 1.1898497815869164e-06, + "loss": 0.6519, + "step": 53377 + }, + { + "epoch": 1.37, + "learning_rate": 1.1898226142987535e-06, + "loss": 0.6426, + "step": 53378 + }, + { + "epoch": 1.37, + "learning_rate": 1.189795446865252e-06, + "loss": 0.7227, + "step": 53379 + }, + { + "epoch": 1.37, + "learning_rate": 1.1897682792864331e-06, + "loss": 0.6211, + "step": 53380 + }, + { + "epoch": 1.37, + "learning_rate": 1.1897411115623172e-06, + "loss": 0.6421, + "step": 53381 + }, + { + "epoch": 1.37, + "learning_rate": 1.1897139436929253e-06, + "loss": 0.7998, + "step": 53382 + }, + { + "epoch": 1.37, + "learning_rate": 1.189686775678278e-06, + "loss": 0.7715, + "step": 53383 + }, + { + "epoch": 1.37, + "learning_rate": 1.1896596075183966e-06, + "loss": 0.6204, + "step": 53384 + }, + { + "epoch": 1.37, + "learning_rate": 1.1896324392133012e-06, + "loss": 0.6125, + "step": 53385 + }, + { + "epoch": 1.37, + "learning_rate": 1.189605270763013e-06, + "loss": 0.4751, + "step": 53386 + }, + { + "epoch": 1.37, + "learning_rate": 1.189578102167553e-06, + "loss": 0.584, + "step": 53387 + }, + { + "epoch": 1.37, + "learning_rate": 1.1895509334269417e-06, + "loss": 0.5186, + "step": 53388 + }, + { + "epoch": 1.37, + "learning_rate": 1.1895237645411999e-06, + "loss": 0.488, + "step": 53389 + }, + { + "epoch": 1.37, + "learning_rate": 1.1894965955103482e-06, + "loss": 0.6299, + "step": 53390 + }, + { + "epoch": 1.37, + "learning_rate": 1.1894694263344082e-06, + "loss": 0.5371, + "step": 53391 + }, + { + "epoch": 1.37, + "learning_rate": 1.1894422570134e-06, + "loss": 0.655, + "step": 53392 + }, + { + "epoch": 1.37, + "learning_rate": 1.1894150875473444e-06, + "loss": 0.6943, + "step": 53393 + }, + { + "epoch": 1.37, + "learning_rate": 1.1893879179362623e-06, + "loss": 0.5054, + "step": 53394 + }, + { + "epoch": 1.37, + "learning_rate": 1.1893607481801748e-06, + "loss": 0.5991, + "step": 53395 + }, + { + "epoch": 1.37, + "learning_rate": 1.1893335782791025e-06, + "loss": 0.729, + "step": 53396 + }, + { + "epoch": 1.37, + "learning_rate": 1.1893064082330661e-06, + "loss": 0.7368, + "step": 53397 + }, + { + "epoch": 1.37, + "learning_rate": 1.1892792380420864e-06, + "loss": 0.5798, + "step": 53398 + }, + { + "epoch": 1.37, + "learning_rate": 1.1892520677061846e-06, + "loss": 0.5894, + "step": 53399 + }, + { + "epoch": 1.37, + "learning_rate": 1.1892248972253808e-06, + "loss": 0.4562, + "step": 53400 + }, + { + "epoch": 1.37, + "learning_rate": 1.1891977265996966e-06, + "loss": 0.4027, + "step": 53401 + }, + { + "epoch": 1.37, + "learning_rate": 1.189170555829152e-06, + "loss": 0.5854, + "step": 53402 + }, + { + "epoch": 1.37, + "learning_rate": 1.1891433849137684e-06, + "loss": 0.5479, + "step": 53403 + }, + { + "epoch": 1.37, + "learning_rate": 1.1891162138535663e-06, + "loss": 0.6367, + "step": 53404 + }, + { + "epoch": 1.37, + "learning_rate": 1.1890890426485668e-06, + "loss": 0.7285, + "step": 53405 + }, + { + "epoch": 1.37, + "learning_rate": 1.1890618712987905e-06, + "loss": 0.6689, + "step": 53406 + }, + { + "epoch": 1.37, + "learning_rate": 1.189034699804258e-06, + "loss": 0.6602, + "step": 53407 + }, + { + "epoch": 1.37, + "learning_rate": 1.1890075281649905e-06, + "loss": 0.4929, + "step": 53408 + }, + { + "epoch": 1.37, + "learning_rate": 1.1889803563810086e-06, + "loss": 0.6406, + "step": 53409 + }, + { + "epoch": 1.37, + "learning_rate": 1.1889531844523331e-06, + "loss": 0.5864, + "step": 53410 + }, + { + "epoch": 1.37, + "learning_rate": 1.1889260123789849e-06, + "loss": 0.7549, + "step": 53411 + }, + { + "epoch": 1.37, + "learning_rate": 1.1888988401609847e-06, + "loss": 0.7065, + "step": 53412 + }, + { + "epoch": 1.37, + "learning_rate": 1.1888716677983533e-06, + "loss": 0.6914, + "step": 53413 + }, + { + "epoch": 1.37, + "learning_rate": 1.1888444952911116e-06, + "loss": 0.7456, + "step": 53414 + }, + { + "epoch": 1.37, + "learning_rate": 1.1888173226392802e-06, + "loss": 0.7197, + "step": 53415 + }, + { + "epoch": 1.37, + "learning_rate": 1.1887901498428805e-06, + "loss": 0.6416, + "step": 53416 + }, + { + "epoch": 1.37, + "learning_rate": 1.1887629769019322e-06, + "loss": 0.728, + "step": 53417 + }, + { + "epoch": 1.37, + "learning_rate": 1.1887358038164573e-06, + "loss": 0.7402, + "step": 53418 + }, + { + "epoch": 1.37, + "learning_rate": 1.1887086305864758e-06, + "loss": 0.5264, + "step": 53419 + }, + { + "epoch": 1.37, + "learning_rate": 1.1886814572120089e-06, + "loss": 0.6926, + "step": 53420 + }, + { + "epoch": 1.37, + "learning_rate": 1.1886542836930773e-06, + "loss": 0.7734, + "step": 53421 + }, + { + "epoch": 1.37, + "learning_rate": 1.1886271100297019e-06, + "loss": 0.6318, + "step": 53422 + }, + { + "epoch": 1.37, + "learning_rate": 1.188599936221903e-06, + "loss": 0.5325, + "step": 53423 + }, + { + "epoch": 1.37, + "learning_rate": 1.188572762269702e-06, + "loss": 0.6172, + "step": 53424 + }, + { + "epoch": 1.37, + "learning_rate": 1.1885455881731197e-06, + "loss": 0.7339, + "step": 53425 + }, + { + "epoch": 1.37, + "learning_rate": 1.1885184139321764e-06, + "loss": 0.7207, + "step": 53426 + }, + { + "epoch": 1.37, + "learning_rate": 1.1884912395468936e-06, + "loss": 0.8271, + "step": 53427 + }, + { + "epoch": 1.37, + "learning_rate": 1.1884640650172915e-06, + "loss": 0.7109, + "step": 53428 + }, + { + "epoch": 1.37, + "learning_rate": 1.188436890343391e-06, + "loss": 0.7119, + "step": 53429 + }, + { + "epoch": 1.37, + "learning_rate": 1.1884097155252133e-06, + "loss": 0.6816, + "step": 53430 + }, + { + "epoch": 1.37, + "learning_rate": 1.188382540562779e-06, + "loss": 0.5928, + "step": 53431 + }, + { + "epoch": 1.37, + "learning_rate": 1.1883553654561085e-06, + "loss": 0.6846, + "step": 53432 + }, + { + "epoch": 1.37, + "learning_rate": 1.188328190205223e-06, + "loss": 0.5356, + "step": 53433 + }, + { + "epoch": 1.37, + "learning_rate": 1.1883010148101434e-06, + "loss": 0.5117, + "step": 53434 + }, + { + "epoch": 1.37, + "learning_rate": 1.1882738392708904e-06, + "loss": 0.6382, + "step": 53435 + }, + { + "epoch": 1.37, + "learning_rate": 1.1882466635874848e-06, + "loss": 0.7344, + "step": 53436 + }, + { + "epoch": 1.37, + "learning_rate": 1.1882194877599473e-06, + "loss": 0.7314, + "step": 53437 + }, + { + "epoch": 1.37, + "learning_rate": 1.188192311788299e-06, + "loss": 0.5762, + "step": 53438 + }, + { + "epoch": 1.37, + "learning_rate": 1.1881651356725602e-06, + "loss": 0.7446, + "step": 53439 + }, + { + "epoch": 1.37, + "learning_rate": 1.1881379594127518e-06, + "loss": 0.5381, + "step": 53440 + }, + { + "epoch": 1.37, + "learning_rate": 1.1881107830088957e-06, + "loss": 0.7051, + "step": 53441 + }, + { + "epoch": 1.37, + "learning_rate": 1.188083606461011e-06, + "loss": 0.6313, + "step": 53442 + }, + { + "epoch": 1.37, + "learning_rate": 1.1880564297691196e-06, + "loss": 0.7939, + "step": 53443 + }, + { + "epoch": 1.37, + "learning_rate": 1.1880292529332422e-06, + "loss": 0.7041, + "step": 53444 + }, + { + "epoch": 1.37, + "learning_rate": 1.188002075953399e-06, + "loss": 0.752, + "step": 53445 + }, + { + "epoch": 1.37, + "learning_rate": 1.1879748988296117e-06, + "loss": 0.4944, + "step": 53446 + }, + { + "epoch": 1.37, + "learning_rate": 1.1879477215619008e-06, + "loss": 0.4282, + "step": 53447 + }, + { + "epoch": 1.37, + "learning_rate": 1.1879205441502862e-06, + "loss": 0.752, + "step": 53448 + }, + { + "epoch": 1.37, + "learning_rate": 1.18789336659479e-06, + "loss": 0.6094, + "step": 53449 + }, + { + "epoch": 1.37, + "learning_rate": 1.1878661888954325e-06, + "loss": 0.6099, + "step": 53450 + }, + { + "epoch": 1.37, + "learning_rate": 1.1878390110522344e-06, + "loss": 0.6335, + "step": 53451 + }, + { + "epoch": 1.37, + "learning_rate": 1.1878118330652168e-06, + "loss": 0.6313, + "step": 53452 + }, + { + "epoch": 1.37, + "learning_rate": 1.1877846549343998e-06, + "loss": 0.603, + "step": 53453 + }, + { + "epoch": 1.37, + "learning_rate": 1.1877574766598052e-06, + "loss": 0.8076, + "step": 53454 + }, + { + "epoch": 1.37, + "learning_rate": 1.1877302982414534e-06, + "loss": 0.6875, + "step": 53455 + }, + { + "epoch": 1.37, + "learning_rate": 1.187703119679365e-06, + "loss": 0.627, + "step": 53456 + }, + { + "epoch": 1.37, + "learning_rate": 1.1876759409735609e-06, + "loss": 0.8369, + "step": 53457 + }, + { + "epoch": 1.37, + "learning_rate": 1.1876487621240619e-06, + "loss": 0.5645, + "step": 53458 + }, + { + "epoch": 1.37, + "learning_rate": 1.187621583130889e-06, + "loss": 0.7598, + "step": 53459 + }, + { + "epoch": 1.37, + "learning_rate": 1.1875944039940628e-06, + "loss": 0.7188, + "step": 53460 + }, + { + "epoch": 1.37, + "learning_rate": 1.187567224713604e-06, + "loss": 0.7622, + "step": 53461 + }, + { + "epoch": 1.37, + "learning_rate": 1.187540045289534e-06, + "loss": 0.6953, + "step": 53462 + }, + { + "epoch": 1.37, + "learning_rate": 1.1875128657218729e-06, + "loss": 0.7764, + "step": 53463 + }, + { + "epoch": 1.37, + "learning_rate": 1.1874856860106421e-06, + "loss": 0.6516, + "step": 53464 + }, + { + "epoch": 1.37, + "learning_rate": 1.187458506155862e-06, + "loss": 0.5728, + "step": 53465 + }, + { + "epoch": 1.37, + "learning_rate": 1.1874313261575536e-06, + "loss": 0.4644, + "step": 53466 + }, + { + "epoch": 1.37, + "learning_rate": 1.1874041460157375e-06, + "loss": 0.6875, + "step": 53467 + }, + { + "epoch": 1.37, + "learning_rate": 1.1873769657304349e-06, + "loss": 0.6592, + "step": 53468 + }, + { + "epoch": 1.37, + "learning_rate": 1.187349785301666e-06, + "loss": 0.7812, + "step": 53469 + }, + { + "epoch": 1.37, + "learning_rate": 1.1873226047294522e-06, + "loss": 0.6357, + "step": 53470 + }, + { + "epoch": 1.37, + "learning_rate": 1.1872954240138142e-06, + "loss": 0.7197, + "step": 53471 + }, + { + "epoch": 1.37, + "learning_rate": 1.1872682431547728e-06, + "loss": 0.4937, + "step": 53472 + }, + { + "epoch": 1.37, + "learning_rate": 1.1872410621523483e-06, + "loss": 0.627, + "step": 53473 + }, + { + "epoch": 1.37, + "learning_rate": 1.187213881006562e-06, + "loss": 0.7051, + "step": 53474 + }, + { + "epoch": 1.37, + "learning_rate": 1.1871866997174348e-06, + "loss": 0.7676, + "step": 53475 + }, + { + "epoch": 1.37, + "learning_rate": 1.1871595182849874e-06, + "loss": 0.7124, + "step": 53476 + }, + { + "epoch": 1.37, + "learning_rate": 1.1871323367092406e-06, + "loss": 0.645, + "step": 53477 + }, + { + "epoch": 1.37, + "learning_rate": 1.1871051549902149e-06, + "loss": 0.6826, + "step": 53478 + }, + { + "epoch": 1.37, + "learning_rate": 1.1870779731279317e-06, + "loss": 0.5151, + "step": 53479 + }, + { + "epoch": 1.37, + "learning_rate": 1.187050791122411e-06, + "loss": 0.6279, + "step": 53480 + }, + { + "epoch": 1.37, + "learning_rate": 1.1870236089736749e-06, + "loss": 0.5801, + "step": 53481 + }, + { + "epoch": 1.37, + "learning_rate": 1.1869964266817427e-06, + "loss": 0.5334, + "step": 53482 + }, + { + "epoch": 1.37, + "learning_rate": 1.1869692442466364e-06, + "loss": 0.6367, + "step": 53483 + }, + { + "epoch": 1.37, + "learning_rate": 1.1869420616683761e-06, + "loss": 0.6152, + "step": 53484 + }, + { + "epoch": 1.37, + "learning_rate": 1.186914878946983e-06, + "loss": 0.677, + "step": 53485 + }, + { + "epoch": 1.37, + "learning_rate": 1.1868876960824776e-06, + "loss": 0.6011, + "step": 53486 + }, + { + "epoch": 1.37, + "learning_rate": 1.186860513074881e-06, + "loss": 0.5103, + "step": 53487 + }, + { + "epoch": 1.37, + "learning_rate": 1.1868333299242138e-06, + "loss": 0.6553, + "step": 53488 + }, + { + "epoch": 1.37, + "learning_rate": 1.186806146630497e-06, + "loss": 0.5991, + "step": 53489 + }, + { + "epoch": 1.37, + "learning_rate": 1.1867789631937512e-06, + "loss": 0.5139, + "step": 53490 + }, + { + "epoch": 1.37, + "learning_rate": 1.1867517796139978e-06, + "loss": 0.6294, + "step": 53491 + }, + { + "epoch": 1.37, + "learning_rate": 1.1867245958912567e-06, + "loss": 0.6938, + "step": 53492 + }, + { + "epoch": 1.37, + "learning_rate": 1.1866974120255492e-06, + "loss": 0.623, + "step": 53493 + }, + { + "epoch": 1.37, + "learning_rate": 1.1866702280168962e-06, + "loss": 0.6621, + "step": 53494 + }, + { + "epoch": 1.37, + "learning_rate": 1.1866430438653182e-06, + "loss": 0.6616, + "step": 53495 + }, + { + "epoch": 1.37, + "learning_rate": 1.1866158595708365e-06, + "loss": 0.6514, + "step": 53496 + }, + { + "epoch": 1.37, + "learning_rate": 1.1865886751334713e-06, + "loss": 0.5767, + "step": 53497 + }, + { + "epoch": 1.37, + "learning_rate": 1.1865614905532439e-06, + "loss": 0.6963, + "step": 53498 + }, + { + "epoch": 1.37, + "learning_rate": 1.186534305830175e-06, + "loss": 0.6604, + "step": 53499 + }, + { + "epoch": 1.37, + "learning_rate": 1.1865071209642852e-06, + "loss": 0.7012, + "step": 53500 + }, + { + "epoch": 1.37, + "learning_rate": 1.1864799359555954e-06, + "loss": 0.4697, + "step": 53501 + }, + { + "epoch": 1.37, + "learning_rate": 1.1864527508041268e-06, + "loss": 0.7607, + "step": 53502 + }, + { + "epoch": 1.37, + "learning_rate": 1.1864255655098995e-06, + "loss": 0.5383, + "step": 53503 + }, + { + "epoch": 1.37, + "learning_rate": 1.186398380072935e-06, + "loss": 0.585, + "step": 53504 + }, + { + "epoch": 1.37, + "learning_rate": 1.1863711944932536e-06, + "loss": 0.7104, + "step": 53505 + }, + { + "epoch": 1.37, + "learning_rate": 1.1863440087708772e-06, + "loss": 0.8164, + "step": 53506 + }, + { + "epoch": 1.37, + "learning_rate": 1.1863168229058249e-06, + "loss": 0.6133, + "step": 53507 + }, + { + "epoch": 1.37, + "learning_rate": 1.1862896368981186e-06, + "loss": 0.6787, + "step": 53508 + }, + { + "epoch": 1.37, + "learning_rate": 1.1862624507477788e-06, + "loss": 0.5513, + "step": 53509 + }, + { + "epoch": 1.37, + "learning_rate": 1.1862352644548264e-06, + "loss": 0.5527, + "step": 53510 + }, + { + "epoch": 1.37, + "learning_rate": 1.1862080780192825e-06, + "loss": 0.6167, + "step": 53511 + }, + { + "epoch": 1.37, + "learning_rate": 1.1861808914411674e-06, + "loss": 0.6709, + "step": 53512 + }, + { + "epoch": 1.37, + "learning_rate": 1.1861537047205018e-06, + "loss": 0.7217, + "step": 53513 + }, + { + "epoch": 1.37, + "learning_rate": 1.1861265178573074e-06, + "loss": 0.7139, + "step": 53514 + }, + { + "epoch": 1.37, + "learning_rate": 1.1860993308516042e-06, + "loss": 0.5151, + "step": 53515 + }, + { + "epoch": 1.37, + "learning_rate": 1.1860721437034137e-06, + "loss": 0.7568, + "step": 53516 + }, + { + "epoch": 1.37, + "learning_rate": 1.186044956412756e-06, + "loss": 0.6299, + "step": 53517 + }, + { + "epoch": 1.37, + "learning_rate": 1.1860177689796525e-06, + "loss": 0.5132, + "step": 53518 + }, + { + "epoch": 1.37, + "learning_rate": 1.1859905814041234e-06, + "loss": 0.5706, + "step": 53519 + }, + { + "epoch": 1.37, + "learning_rate": 1.18596339368619e-06, + "loss": 0.4561, + "step": 53520 + }, + { + "epoch": 1.37, + "learning_rate": 1.185936205825873e-06, + "loss": 0.6709, + "step": 53521 + }, + { + "epoch": 1.37, + "learning_rate": 1.185909017823193e-06, + "loss": 0.6133, + "step": 53522 + }, + { + "epoch": 1.37, + "learning_rate": 1.1858818296781712e-06, + "loss": 0.6265, + "step": 53523 + }, + { + "epoch": 1.37, + "learning_rate": 1.185854641390828e-06, + "loss": 0.5303, + "step": 53524 + }, + { + "epoch": 1.37, + "learning_rate": 1.1858274529611848e-06, + "loss": 0.697, + "step": 53525 + }, + { + "epoch": 1.37, + "learning_rate": 1.1858002643892619e-06, + "loss": 0.6211, + "step": 53526 + }, + { + "epoch": 1.37, + "learning_rate": 1.1857730756750806e-06, + "loss": 0.5532, + "step": 53527 + }, + { + "epoch": 1.37, + "learning_rate": 1.1857458868186609e-06, + "loss": 0.6973, + "step": 53528 + }, + { + "epoch": 1.37, + "learning_rate": 1.1857186978200243e-06, + "loss": 0.6411, + "step": 53529 + }, + { + "epoch": 1.37, + "learning_rate": 1.1856915086791915e-06, + "loss": 0.7578, + "step": 53530 + }, + { + "epoch": 1.37, + "learning_rate": 1.1856643193961833e-06, + "loss": 0.6016, + "step": 53531 + }, + { + "epoch": 1.37, + "learning_rate": 1.1856371299710202e-06, + "loss": 0.5649, + "step": 53532 + }, + { + "epoch": 1.37, + "learning_rate": 1.1856099404037236e-06, + "loss": 0.6816, + "step": 53533 + }, + { + "epoch": 1.37, + "learning_rate": 1.1855827506943138e-06, + "loss": 0.4543, + "step": 53534 + }, + { + "epoch": 1.37, + "learning_rate": 1.1855555608428118e-06, + "loss": 0.7812, + "step": 53535 + }, + { + "epoch": 1.37, + "learning_rate": 1.1855283708492385e-06, + "loss": 0.6729, + "step": 53536 + }, + { + "epoch": 1.37, + "learning_rate": 1.1855011807136148e-06, + "loss": 0.689, + "step": 53537 + }, + { + "epoch": 1.37, + "learning_rate": 1.185473990435961e-06, + "loss": 0.7642, + "step": 53538 + }, + { + "epoch": 1.37, + "learning_rate": 1.1854468000162987e-06, + "loss": 0.5266, + "step": 53539 + }, + { + "epoch": 1.37, + "learning_rate": 1.185419609454648e-06, + "loss": 0.7031, + "step": 53540 + }, + { + "epoch": 1.37, + "learning_rate": 1.1853924187510302e-06, + "loss": 0.7144, + "step": 53541 + }, + { + "epoch": 1.37, + "learning_rate": 1.1853652279054662e-06, + "loss": 0.4802, + "step": 53542 + }, + { + "epoch": 1.37, + "learning_rate": 1.1853380369179762e-06, + "loss": 0.7324, + "step": 53543 + }, + { + "epoch": 1.37, + "learning_rate": 1.1853108457885815e-06, + "loss": 0.4045, + "step": 53544 + }, + { + "epoch": 1.37, + "learning_rate": 1.1852836545173028e-06, + "loss": 0.4648, + "step": 53545 + }, + { + "epoch": 1.37, + "learning_rate": 1.185256463104161e-06, + "loss": 0.5435, + "step": 53546 + }, + { + "epoch": 1.37, + "learning_rate": 1.1852292715491767e-06, + "loss": 0.5502, + "step": 53547 + }, + { + "epoch": 1.37, + "learning_rate": 1.185202079852371e-06, + "loss": 0.6289, + "step": 53548 + }, + { + "epoch": 1.37, + "learning_rate": 1.1851748880137641e-06, + "loss": 0.6826, + "step": 53549 + }, + { + "epoch": 1.37, + "learning_rate": 1.1851476960333779e-06, + "loss": 0.6094, + "step": 53550 + }, + { + "epoch": 1.37, + "learning_rate": 1.1851205039112326e-06, + "loss": 0.5132, + "step": 53551 + }, + { + "epoch": 1.37, + "learning_rate": 1.185093311647349e-06, + "loss": 0.6475, + "step": 53552 + }, + { + "epoch": 1.37, + "learning_rate": 1.1850661192417478e-06, + "loss": 0.6855, + "step": 53553 + }, + { + "epoch": 1.37, + "learning_rate": 1.18503892669445e-06, + "loss": 0.6328, + "step": 53554 + }, + { + "epoch": 1.37, + "learning_rate": 1.1850117340054762e-06, + "loss": 0.3855, + "step": 53555 + }, + { + "epoch": 1.37, + "learning_rate": 1.184984541174848e-06, + "loss": 0.6196, + "step": 53556 + }, + { + "epoch": 1.37, + "learning_rate": 1.1849573482025852e-06, + "loss": 0.5139, + "step": 53557 + }, + { + "epoch": 1.37, + "learning_rate": 1.1849301550887092e-06, + "loss": 0.6216, + "step": 53558 + }, + { + "epoch": 1.37, + "learning_rate": 1.1849029618332404e-06, + "loss": 0.6455, + "step": 53559 + }, + { + "epoch": 1.37, + "learning_rate": 1.1848757684362002e-06, + "loss": 0.7241, + "step": 53560 + }, + { + "epoch": 1.37, + "learning_rate": 1.1848485748976092e-06, + "loss": 0.7178, + "step": 53561 + }, + { + "epoch": 1.37, + "learning_rate": 1.1848213812174878e-06, + "loss": 0.7207, + "step": 53562 + }, + { + "epoch": 1.37, + "learning_rate": 1.1847941873958575e-06, + "loss": 0.6084, + "step": 53563 + }, + { + "epoch": 1.37, + "learning_rate": 1.1847669934327386e-06, + "loss": 0.7441, + "step": 53564 + }, + { + "epoch": 1.37, + "learning_rate": 1.1847397993281521e-06, + "loss": 0.6855, + "step": 53565 + }, + { + "epoch": 1.37, + "learning_rate": 1.184712605082119e-06, + "loss": 0.4775, + "step": 53566 + }, + { + "epoch": 1.37, + "learning_rate": 1.18468541069466e-06, + "loss": 0.7153, + "step": 53567 + }, + { + "epoch": 1.37, + "learning_rate": 1.1846582161657956e-06, + "loss": 0.6699, + "step": 53568 + }, + { + "epoch": 1.37, + "learning_rate": 1.1846310214955471e-06, + "loss": 0.5635, + "step": 53569 + }, + { + "epoch": 1.37, + "learning_rate": 1.1846038266839348e-06, + "loss": 0.5303, + "step": 53570 + }, + { + "epoch": 1.37, + "learning_rate": 1.1845766317309804e-06, + "loss": 0.6641, + "step": 53571 + }, + { + "epoch": 1.37, + "learning_rate": 1.1845494366367037e-06, + "loss": 0.6533, + "step": 53572 + }, + { + "epoch": 1.37, + "learning_rate": 1.1845222414011262e-06, + "loss": 0.5366, + "step": 53573 + }, + { + "epoch": 1.37, + "learning_rate": 1.1844950460242682e-06, + "loss": 0.668, + "step": 53574 + }, + { + "epoch": 1.37, + "learning_rate": 1.1844678505061512e-06, + "loss": 0.6753, + "step": 53575 + }, + { + "epoch": 1.37, + "learning_rate": 1.1844406548467955e-06, + "loss": 0.6758, + "step": 53576 + }, + { + "epoch": 1.37, + "learning_rate": 1.1844134590462222e-06, + "loss": 0.5273, + "step": 53577 + }, + { + "epoch": 1.37, + "learning_rate": 1.1843862631044517e-06, + "loss": 0.6519, + "step": 53578 + }, + { + "epoch": 1.37, + "learning_rate": 1.1843590670215054e-06, + "loss": 0.6802, + "step": 53579 + }, + { + "epoch": 1.37, + "learning_rate": 1.1843318707974036e-06, + "loss": 0.6582, + "step": 53580 + }, + { + "epoch": 1.37, + "learning_rate": 1.184304674432168e-06, + "loss": 0.5564, + "step": 53581 + }, + { + "epoch": 1.37, + "learning_rate": 1.1842774779258178e-06, + "loss": 0.5625, + "step": 53582 + }, + { + "epoch": 1.37, + "learning_rate": 1.1842502812783755e-06, + "loss": 0.6768, + "step": 53583 + }, + { + "epoch": 1.37, + "learning_rate": 1.1842230844898609e-06, + "loss": 0.47, + "step": 53584 + }, + { + "epoch": 1.37, + "learning_rate": 1.1841958875602954e-06, + "loss": 0.5928, + "step": 53585 + }, + { + "epoch": 1.37, + "learning_rate": 1.1841686904896993e-06, + "loss": 0.6514, + "step": 53586 + }, + { + "epoch": 1.37, + "learning_rate": 1.1841414932780937e-06, + "loss": 0.4919, + "step": 53587 + }, + { + "epoch": 1.37, + "learning_rate": 1.1841142959254996e-06, + "loss": 0.7529, + "step": 53588 + }, + { + "epoch": 1.37, + "learning_rate": 1.1840870984319375e-06, + "loss": 0.8643, + "step": 53589 + }, + { + "epoch": 1.37, + "learning_rate": 1.1840599007974286e-06, + "loss": 0.5981, + "step": 53590 + }, + { + "epoch": 1.37, + "learning_rate": 1.1840327030219934e-06, + "loss": 0.6924, + "step": 53591 + }, + { + "epoch": 1.37, + "learning_rate": 1.184005505105653e-06, + "loss": 0.5728, + "step": 53592 + }, + { + "epoch": 1.37, + "learning_rate": 1.1839783070484276e-06, + "loss": 0.6914, + "step": 53593 + }, + { + "epoch": 1.37, + "learning_rate": 1.1839511088503388e-06, + "loss": 0.7246, + "step": 53594 + }, + { + "epoch": 1.37, + "learning_rate": 1.1839239105114069e-06, + "loss": 0.7139, + "step": 53595 + }, + { + "epoch": 1.37, + "learning_rate": 1.1838967120316533e-06, + "loss": 0.6162, + "step": 53596 + }, + { + "epoch": 1.37, + "learning_rate": 1.1838695134110982e-06, + "loss": 0.8418, + "step": 53597 + }, + { + "epoch": 1.37, + "learning_rate": 1.1838423146497628e-06, + "loss": 0.6304, + "step": 53598 + }, + { + "epoch": 1.37, + "learning_rate": 1.1838151157476674e-06, + "loss": 0.7959, + "step": 53599 + }, + { + "epoch": 1.37, + "learning_rate": 1.1837879167048335e-06, + "loss": 0.6562, + "step": 53600 + }, + { + "epoch": 1.37, + "learning_rate": 1.1837607175212818e-06, + "loss": 0.6807, + "step": 53601 + }, + { + "epoch": 1.37, + "learning_rate": 1.1837335181970328e-06, + "loss": 0.6729, + "step": 53602 + }, + { + "epoch": 1.37, + "learning_rate": 1.1837063187321073e-06, + "loss": 0.665, + "step": 53603 + }, + { + "epoch": 1.37, + "learning_rate": 1.1836791191265266e-06, + "loss": 0.6416, + "step": 53604 + }, + { + "epoch": 1.37, + "learning_rate": 1.183651919380311e-06, + "loss": 0.6465, + "step": 53605 + }, + { + "epoch": 1.37, + "learning_rate": 1.1836247194934816e-06, + "loss": 0.4937, + "step": 53606 + }, + { + "epoch": 1.37, + "learning_rate": 1.1835975194660595e-06, + "loss": 0.6113, + "step": 53607 + }, + { + "epoch": 1.37, + "learning_rate": 1.183570319298065e-06, + "loss": 0.6465, + "step": 53608 + }, + { + "epoch": 1.37, + "learning_rate": 1.183543118989519e-06, + "loss": 0.7715, + "step": 53609 + }, + { + "epoch": 1.37, + "learning_rate": 1.183515918540443e-06, + "loss": 0.7471, + "step": 53610 + }, + { + "epoch": 1.37, + "learning_rate": 1.1834887179508568e-06, + "loss": 0.5879, + "step": 53611 + }, + { + "epoch": 1.37, + "learning_rate": 1.1834615172207817e-06, + "loss": 0.7441, + "step": 53612 + }, + { + "epoch": 1.37, + "learning_rate": 1.1834343163502387e-06, + "loss": 0.7412, + "step": 53613 + }, + { + "epoch": 1.37, + "learning_rate": 1.1834071153392484e-06, + "loss": 0.6577, + "step": 53614 + }, + { + "epoch": 1.37, + "learning_rate": 1.183379914187832e-06, + "loss": 0.7754, + "step": 53615 + }, + { + "epoch": 1.37, + "learning_rate": 1.1833527128960098e-06, + "loss": 0.6816, + "step": 53616 + }, + { + "epoch": 1.37, + "learning_rate": 1.183325511463803e-06, + "loss": 0.6816, + "step": 53617 + }, + { + "epoch": 1.37, + "learning_rate": 1.1832983098912318e-06, + "loss": 0.8027, + "step": 53618 + }, + { + "epoch": 1.37, + "learning_rate": 1.1832711081783182e-06, + "loss": 0.6841, + "step": 53619 + }, + { + "epoch": 1.37, + "learning_rate": 1.183243906325082e-06, + "loss": 0.4758, + "step": 53620 + }, + { + "epoch": 1.37, + "learning_rate": 1.1832167043315446e-06, + "loss": 0.3127, + "step": 53621 + }, + { + "epoch": 1.37, + "learning_rate": 1.1831895021977263e-06, + "loss": 0.7861, + "step": 53622 + }, + { + "epoch": 1.37, + "learning_rate": 1.1831622999236484e-06, + "loss": 0.6626, + "step": 53623 + }, + { + "epoch": 1.37, + "learning_rate": 1.1831350975093312e-06, + "loss": 0.5879, + "step": 53624 + }, + { + "epoch": 1.37, + "learning_rate": 1.183107894954796e-06, + "loss": 0.6807, + "step": 53625 + }, + { + "epoch": 1.37, + "learning_rate": 1.1830806922600639e-06, + "loss": 0.467, + "step": 53626 + }, + { + "epoch": 1.37, + "learning_rate": 1.1830534894251552e-06, + "loss": 0.5059, + "step": 53627 + }, + { + "epoch": 1.37, + "learning_rate": 1.1830262864500907e-06, + "loss": 0.6816, + "step": 53628 + }, + { + "epoch": 1.37, + "learning_rate": 1.1829990833348913e-06, + "loss": 0.6116, + "step": 53629 + }, + { + "epoch": 1.37, + "learning_rate": 1.1829718800795781e-06, + "loss": 0.6543, + "step": 53630 + }, + { + "epoch": 1.37, + "learning_rate": 1.1829446766841716e-06, + "loss": 0.6387, + "step": 53631 + }, + { + "epoch": 1.37, + "learning_rate": 1.182917473148693e-06, + "loss": 0.6387, + "step": 53632 + }, + { + "epoch": 1.37, + "learning_rate": 1.1828902694731624e-06, + "loss": 0.5732, + "step": 53633 + }, + { + "epoch": 1.37, + "learning_rate": 1.1828630656576018e-06, + "loss": 0.6748, + "step": 53634 + }, + { + "epoch": 1.37, + "learning_rate": 1.182835861702031e-06, + "loss": 0.73, + "step": 53635 + }, + { + "epoch": 1.37, + "learning_rate": 1.1828086576064712e-06, + "loss": 0.6504, + "step": 53636 + }, + { + "epoch": 1.37, + "learning_rate": 1.1827814533709433e-06, + "loss": 0.6162, + "step": 53637 + }, + { + "epoch": 1.37, + "learning_rate": 1.182754248995468e-06, + "loss": 0.7607, + "step": 53638 + }, + { + "epoch": 1.37, + "learning_rate": 1.182727044480066e-06, + "loss": 0.749, + "step": 53639 + }, + { + "epoch": 1.37, + "learning_rate": 1.1826998398247588e-06, + "loss": 0.6924, + "step": 53640 + }, + { + "epoch": 1.37, + "learning_rate": 1.1826726350295662e-06, + "loss": 0.7207, + "step": 53641 + }, + { + "epoch": 1.37, + "learning_rate": 1.18264543009451e-06, + "loss": 0.5645, + "step": 53642 + }, + { + "epoch": 1.37, + "learning_rate": 1.1826182250196101e-06, + "loss": 0.7363, + "step": 53643 + }, + { + "epoch": 1.37, + "learning_rate": 1.182591019804888e-06, + "loss": 0.7119, + "step": 53644 + }, + { + "epoch": 1.37, + "learning_rate": 1.1825638144503646e-06, + "loss": 0.8232, + "step": 53645 + }, + { + "epoch": 1.37, + "learning_rate": 1.1825366089560604e-06, + "loss": 0.6543, + "step": 53646 + }, + { + "epoch": 1.38, + "learning_rate": 1.1825094033219962e-06, + "loss": 0.5869, + "step": 53647 + }, + { + "epoch": 1.38, + "learning_rate": 1.182482197548193e-06, + "loss": 0.6548, + "step": 53648 + }, + { + "epoch": 1.38, + "learning_rate": 1.1824549916346714e-06, + "loss": 0.6621, + "step": 53649 + }, + { + "epoch": 1.38, + "learning_rate": 1.1824277855814525e-06, + "loss": 0.4805, + "step": 53650 + }, + { + "epoch": 1.38, + "learning_rate": 1.1824005793885573e-06, + "loss": 0.7129, + "step": 53651 + }, + { + "epoch": 1.38, + "learning_rate": 1.182373373056006e-06, + "loss": 0.5029, + "step": 53652 + }, + { + "epoch": 1.38, + "learning_rate": 1.1823461665838199e-06, + "loss": 0.6602, + "step": 53653 + }, + { + "epoch": 1.38, + "learning_rate": 1.1823189599720198e-06, + "loss": 0.6787, + "step": 53654 + }, + { + "epoch": 1.38, + "learning_rate": 1.1822917532206264e-06, + "loss": 0.4357, + "step": 53655 + }, + { + "epoch": 1.38, + "learning_rate": 1.1822645463296606e-06, + "loss": 0.5317, + "step": 53656 + }, + { + "epoch": 1.38, + "learning_rate": 1.1822373392991434e-06, + "loss": 0.5923, + "step": 53657 + }, + { + "epoch": 1.38, + "learning_rate": 1.1822101321290952e-06, + "loss": 0.5654, + "step": 53658 + }, + { + "epoch": 1.38, + "learning_rate": 1.182182924819537e-06, + "loss": 0.563, + "step": 53659 + }, + { + "epoch": 1.38, + "learning_rate": 1.18215571737049e-06, + "loss": 0.6025, + "step": 53660 + }, + { + "epoch": 1.38, + "learning_rate": 1.1821285097819747e-06, + "loss": 0.5225, + "step": 53661 + }, + { + "epoch": 1.38, + "learning_rate": 1.1821013020540118e-06, + "loss": 0.4792, + "step": 53662 + }, + { + "epoch": 1.38, + "learning_rate": 1.1820740941866222e-06, + "loss": 0.5775, + "step": 53663 + }, + { + "epoch": 1.38, + "learning_rate": 1.182046886179827e-06, + "loss": 0.686, + "step": 53664 + }, + { + "epoch": 1.38, + "learning_rate": 1.1820196780336474e-06, + "loss": 0.5542, + "step": 53665 + }, + { + "epoch": 1.38, + "learning_rate": 1.1819924697481029e-06, + "loss": 0.6562, + "step": 53666 + }, + { + "epoch": 1.38, + "learning_rate": 1.1819652613232154e-06, + "loss": 0.7031, + "step": 53667 + }, + { + "epoch": 1.38, + "learning_rate": 1.1819380527590055e-06, + "loss": 0.958, + "step": 53668 + }, + { + "epoch": 1.38, + "learning_rate": 1.1819108440554938e-06, + "loss": 0.4774, + "step": 53669 + }, + { + "epoch": 1.38, + "learning_rate": 1.1818836352127017e-06, + "loss": 0.6836, + "step": 53670 + }, + { + "epoch": 1.38, + "learning_rate": 1.1818564262306496e-06, + "loss": 0.6416, + "step": 53671 + }, + { + "epoch": 1.38, + "learning_rate": 1.1818292171093582e-06, + "loss": 0.6436, + "step": 53672 + }, + { + "epoch": 1.38, + "learning_rate": 1.1818020078488486e-06, + "loss": 0.6211, + "step": 53673 + }, + { + "epoch": 1.38, + "learning_rate": 1.1817747984491415e-06, + "loss": 0.4407, + "step": 53674 + }, + { + "epoch": 1.38, + "learning_rate": 1.181747588910258e-06, + "loss": 0.4749, + "step": 53675 + }, + { + "epoch": 1.38, + "learning_rate": 1.1817203792322185e-06, + "loss": 0.7549, + "step": 53676 + }, + { + "epoch": 1.38, + "learning_rate": 1.1816931694150442e-06, + "loss": 0.6484, + "step": 53677 + }, + { + "epoch": 1.38, + "learning_rate": 1.1816659594587557e-06, + "loss": 0.4785, + "step": 53678 + }, + { + "epoch": 1.38, + "learning_rate": 1.1816387493633739e-06, + "loss": 0.625, + "step": 53679 + }, + { + "epoch": 1.38, + "learning_rate": 1.1816115391289202e-06, + "loss": 0.7461, + "step": 53680 + }, + { + "epoch": 1.38, + "learning_rate": 1.1815843287554142e-06, + "loss": 0.708, + "step": 53681 + }, + { + "epoch": 1.38, + "learning_rate": 1.1815571182428777e-06, + "loss": 0.6875, + "step": 53682 + }, + { + "epoch": 1.38, + "learning_rate": 1.181529907591331e-06, + "loss": 0.6367, + "step": 53683 + }, + { + "epoch": 1.38, + "learning_rate": 1.1815026968007954e-06, + "loss": 0.626, + "step": 53684 + }, + { + "epoch": 1.38, + "learning_rate": 1.181475485871292e-06, + "loss": 0.6113, + "step": 53685 + }, + { + "epoch": 1.38, + "learning_rate": 1.1814482748028405e-06, + "loss": 0.7666, + "step": 53686 + }, + { + "epoch": 1.38, + "learning_rate": 1.1814210635954628e-06, + "loss": 0.6797, + "step": 53687 + }, + { + "epoch": 1.38, + "learning_rate": 1.181393852249179e-06, + "loss": 0.616, + "step": 53688 + }, + { + "epoch": 1.38, + "learning_rate": 1.1813666407640103e-06, + "loss": 0.7324, + "step": 53689 + }, + { + "epoch": 1.38, + "learning_rate": 1.181339429139978e-06, + "loss": 0.8545, + "step": 53690 + }, + { + "epoch": 1.38, + "learning_rate": 1.1813122173771018e-06, + "loss": 0.6904, + "step": 53691 + }, + { + "epoch": 1.38, + "learning_rate": 1.1812850054754035e-06, + "loss": 0.5864, + "step": 53692 + }, + { + "epoch": 1.38, + "learning_rate": 1.1812577934349035e-06, + "loss": 0.6523, + "step": 53693 + }, + { + "epoch": 1.38, + "learning_rate": 1.181230581255623e-06, + "loss": 0.752, + "step": 53694 + }, + { + "epoch": 1.38, + "learning_rate": 1.1812033689375822e-06, + "loss": 0.7441, + "step": 53695 + }, + { + "epoch": 1.38, + "learning_rate": 1.1811761564808023e-06, + "loss": 0.6587, + "step": 53696 + }, + { + "epoch": 1.38, + "learning_rate": 1.1811489438853044e-06, + "loss": 0.5879, + "step": 53697 + }, + { + "epoch": 1.38, + "learning_rate": 1.1811217311511092e-06, + "loss": 0.6621, + "step": 53698 + }, + { + "epoch": 1.38, + "learning_rate": 1.181094518278237e-06, + "loss": 0.7061, + "step": 53699 + }, + { + "epoch": 1.38, + "learning_rate": 1.1810673052667094e-06, + "loss": 0.5662, + "step": 53700 + }, + { + "epoch": 1.38, + "learning_rate": 1.1810400921165468e-06, + "loss": 0.7119, + "step": 53701 + }, + { + "epoch": 1.38, + "learning_rate": 1.18101287882777e-06, + "loss": 0.8184, + "step": 53702 + }, + { + "epoch": 1.38, + "learning_rate": 1.1809856654004003e-06, + "loss": 0.4626, + "step": 53703 + }, + { + "epoch": 1.38, + "learning_rate": 1.1809584518344574e-06, + "loss": 0.6763, + "step": 53704 + }, + { + "epoch": 1.38, + "learning_rate": 1.180931238129964e-06, + "loss": 0.4454, + "step": 53705 + }, + { + "epoch": 1.38, + "learning_rate": 1.1809040242869392e-06, + "loss": 0.7334, + "step": 53706 + }, + { + "epoch": 1.38, + "learning_rate": 1.1808768103054047e-06, + "loss": 0.5903, + "step": 53707 + }, + { + "epoch": 1.38, + "learning_rate": 1.1808495961853811e-06, + "loss": 0.5859, + "step": 53708 + }, + { + "epoch": 1.38, + "learning_rate": 1.1808223819268893e-06, + "loss": 0.6724, + "step": 53709 + }, + { + "epoch": 1.38, + "learning_rate": 1.1807951675299501e-06, + "loss": 0.6191, + "step": 53710 + }, + { + "epoch": 1.38, + "learning_rate": 1.1807679529945844e-06, + "loss": 0.7715, + "step": 53711 + }, + { + "epoch": 1.38, + "learning_rate": 1.180740738320813e-06, + "loss": 0.7266, + "step": 53712 + }, + { + "epoch": 1.38, + "learning_rate": 1.1807135235086566e-06, + "loss": 0.4241, + "step": 53713 + }, + { + "epoch": 1.38, + "learning_rate": 1.1806863085581361e-06, + "loss": 0.707, + "step": 53714 + }, + { + "epoch": 1.38, + "learning_rate": 1.180659093469273e-06, + "loss": 0.4907, + "step": 53715 + }, + { + "epoch": 1.38, + "learning_rate": 1.1806318782420867e-06, + "loss": 0.7266, + "step": 53716 + }, + { + "epoch": 1.38, + "learning_rate": 1.1806046628765996e-06, + "loss": 0.4781, + "step": 53717 + }, + { + "epoch": 1.38, + "learning_rate": 1.180577447372831e-06, + "loss": 0.7842, + "step": 53718 + }, + { + "epoch": 1.38, + "learning_rate": 1.1805502317308035e-06, + "loss": 0.6519, + "step": 53719 + }, + { + "epoch": 1.38, + "learning_rate": 1.1805230159505365e-06, + "loss": 0.603, + "step": 53720 + }, + { + "epoch": 1.38, + "learning_rate": 1.180495800032051e-06, + "loss": 0.5337, + "step": 53721 + }, + { + "epoch": 1.38, + "learning_rate": 1.1804685839753688e-06, + "loss": 0.6455, + "step": 53722 + }, + { + "epoch": 1.38, + "learning_rate": 1.1804413677805097e-06, + "loss": 0.5385, + "step": 53723 + }, + { + "epoch": 1.38, + "learning_rate": 1.180414151447495e-06, + "loss": 0.5439, + "step": 53724 + }, + { + "epoch": 1.38, + "learning_rate": 1.1803869349763456e-06, + "loss": 0.7559, + "step": 53725 + }, + { + "epoch": 1.38, + "learning_rate": 1.1803597183670822e-06, + "loss": 0.6553, + "step": 53726 + }, + { + "epoch": 1.38, + "learning_rate": 1.1803325016197255e-06, + "loss": 0.5923, + "step": 53727 + }, + { + "epoch": 1.38, + "learning_rate": 1.1803052847342967e-06, + "loss": 0.6248, + "step": 53728 + }, + { + "epoch": 1.38, + "learning_rate": 1.1802780677108162e-06, + "loss": 0.5596, + "step": 53729 + }, + { + "epoch": 1.38, + "learning_rate": 1.1802508505493055e-06, + "loss": 0.752, + "step": 53730 + }, + { + "epoch": 1.38, + "learning_rate": 1.1802236332497843e-06, + "loss": 0.6924, + "step": 53731 + }, + { + "epoch": 1.38, + "learning_rate": 1.180196415812275e-06, + "loss": 0.7554, + "step": 53732 + }, + { + "epoch": 1.38, + "learning_rate": 1.180169198236797e-06, + "loss": 0.7197, + "step": 53733 + }, + { + "epoch": 1.38, + "learning_rate": 1.1801419805233719e-06, + "loss": 0.791, + "step": 53734 + }, + { + "epoch": 1.38, + "learning_rate": 1.1801147626720202e-06, + "loss": 0.6201, + "step": 53735 + }, + { + "epoch": 1.38, + "learning_rate": 1.1800875446827633e-06, + "loss": 0.6104, + "step": 53736 + }, + { + "epoch": 1.38, + "learning_rate": 1.1800603265556212e-06, + "loss": 0.6963, + "step": 53737 + }, + { + "epoch": 1.38, + "learning_rate": 1.1800331082906155e-06, + "loss": 0.5679, + "step": 53738 + }, + { + "epoch": 1.38, + "learning_rate": 1.1800058898877666e-06, + "loss": 0.8389, + "step": 53739 + }, + { + "epoch": 1.38, + "learning_rate": 1.1799786713470954e-06, + "loss": 0.5587, + "step": 53740 + }, + { + "epoch": 1.38, + "learning_rate": 1.179951452668623e-06, + "loss": 0.6875, + "step": 53741 + }, + { + "epoch": 1.38, + "learning_rate": 1.1799242338523697e-06, + "loss": 0.3728, + "step": 53742 + }, + { + "epoch": 1.38, + "learning_rate": 1.179897014898357e-06, + "loss": 0.5115, + "step": 53743 + }, + { + "epoch": 1.38, + "learning_rate": 1.1798697958066055e-06, + "loss": 0.5967, + "step": 53744 + }, + { + "epoch": 1.38, + "learning_rate": 1.179842576577136e-06, + "loss": 0.5273, + "step": 53745 + }, + { + "epoch": 1.38, + "learning_rate": 1.179815357209969e-06, + "loss": 0.5099, + "step": 53746 + }, + { + "epoch": 1.38, + "learning_rate": 1.1797881377051259e-06, + "loss": 0.6084, + "step": 53747 + }, + { + "epoch": 1.38, + "learning_rate": 1.179760918062627e-06, + "loss": 0.7256, + "step": 53748 + }, + { + "epoch": 1.38, + "learning_rate": 1.1797336982824937e-06, + "loss": 0.5952, + "step": 53749 + }, + { + "epoch": 1.38, + "learning_rate": 1.1797064783647465e-06, + "loss": 0.6646, + "step": 53750 + }, + { + "epoch": 1.38, + "learning_rate": 1.1796792583094064e-06, + "loss": 0.6699, + "step": 53751 + }, + { + "epoch": 1.38, + "learning_rate": 1.1796520381164941e-06, + "loss": 0.4773, + "step": 53752 + }, + { + "epoch": 1.38, + "learning_rate": 1.1796248177860303e-06, + "loss": 0.75, + "step": 53753 + }, + { + "epoch": 1.38, + "learning_rate": 1.179597597318036e-06, + "loss": 0.5942, + "step": 53754 + }, + { + "epoch": 1.38, + "learning_rate": 1.1795703767125326e-06, + "loss": 0.6128, + "step": 53755 + }, + { + "epoch": 1.38, + "learning_rate": 1.1795431559695402e-06, + "loss": 0.6274, + "step": 53756 + }, + { + "epoch": 1.38, + "learning_rate": 1.1795159350890795e-06, + "loss": 0.6455, + "step": 53757 + }, + { + "epoch": 1.38, + "learning_rate": 1.179488714071172e-06, + "loss": 0.7168, + "step": 53758 + }, + { + "epoch": 1.38, + "learning_rate": 1.1794614929158382e-06, + "loss": 0.6826, + "step": 53759 + }, + { + "epoch": 1.38, + "learning_rate": 1.179434271623099e-06, + "loss": 0.5723, + "step": 53760 + }, + { + "epoch": 1.38, + "learning_rate": 1.1794070501929753e-06, + "loss": 0.5254, + "step": 53761 + }, + { + "epoch": 1.38, + "learning_rate": 1.1793798286254876e-06, + "loss": 0.6904, + "step": 53762 + }, + { + "epoch": 1.38, + "learning_rate": 1.1793526069206574e-06, + "loss": 0.6494, + "step": 53763 + }, + { + "epoch": 1.38, + "learning_rate": 1.1793253850785049e-06, + "loss": 0.6387, + "step": 53764 + }, + { + "epoch": 1.38, + "learning_rate": 1.179298163099051e-06, + "loss": 0.6981, + "step": 53765 + }, + { + "epoch": 1.38, + "learning_rate": 1.1792709409823172e-06, + "loss": 0.7734, + "step": 53766 + }, + { + "epoch": 1.38, + "learning_rate": 1.1792437187283235e-06, + "loss": 0.6152, + "step": 53767 + }, + { + "epoch": 1.38, + "learning_rate": 1.1792164963370914e-06, + "loss": 0.7344, + "step": 53768 + }, + { + "epoch": 1.38, + "learning_rate": 1.179189273808641e-06, + "loss": 0.8438, + "step": 53769 + }, + { + "epoch": 1.38, + "learning_rate": 1.1791620511429946e-06, + "loss": 0.6914, + "step": 53770 + }, + { + "epoch": 1.38, + "learning_rate": 1.1791348283401712e-06, + "loss": 0.5027, + "step": 53771 + }, + { + "epoch": 1.38, + "learning_rate": 1.1791076054001928e-06, + "loss": 0.707, + "step": 53772 + }, + { + "epoch": 1.38, + "learning_rate": 1.1790803823230798e-06, + "loss": 0.7539, + "step": 53773 + }, + { + "epoch": 1.38, + "learning_rate": 1.1790531591088534e-06, + "loss": 0.876, + "step": 53774 + }, + { + "epoch": 1.38, + "learning_rate": 1.1790259357575338e-06, + "loss": 0.6738, + "step": 53775 + }, + { + "epoch": 1.38, + "learning_rate": 1.1789987122691426e-06, + "loss": 0.7061, + "step": 53776 + }, + { + "epoch": 1.38, + "learning_rate": 1.1789714886437003e-06, + "loss": 0.7803, + "step": 53777 + }, + { + "epoch": 1.38, + "learning_rate": 1.1789442648812278e-06, + "loss": 0.7607, + "step": 53778 + }, + { + "epoch": 1.38, + "learning_rate": 1.1789170409817457e-06, + "loss": 0.562, + "step": 53779 + }, + { + "epoch": 1.38, + "learning_rate": 1.1788898169452754e-06, + "loss": 0.6865, + "step": 53780 + }, + { + "epoch": 1.38, + "learning_rate": 1.1788625927718373e-06, + "loss": 0.584, + "step": 53781 + }, + { + "epoch": 1.38, + "learning_rate": 1.1788353684614521e-06, + "loss": 0.5649, + "step": 53782 + }, + { + "epoch": 1.38, + "learning_rate": 1.178808144014141e-06, + "loss": 0.7119, + "step": 53783 + }, + { + "epoch": 1.38, + "learning_rate": 1.1787809194299247e-06, + "loss": 0.6445, + "step": 53784 + }, + { + "epoch": 1.38, + "learning_rate": 1.178753694708824e-06, + "loss": 0.7266, + "step": 53785 + }, + { + "epoch": 1.38, + "learning_rate": 1.1787264698508599e-06, + "loss": 0.6289, + "step": 53786 + }, + { + "epoch": 1.38, + "learning_rate": 1.1786992448560533e-06, + "loss": 0.6855, + "step": 53787 + }, + { + "epoch": 1.38, + "learning_rate": 1.1786720197244248e-06, + "loss": 0.6919, + "step": 53788 + }, + { + "epoch": 1.38, + "learning_rate": 1.1786447944559952e-06, + "loss": 0.4189, + "step": 53789 + }, + { + "epoch": 1.38, + "learning_rate": 1.1786175690507855e-06, + "loss": 0.6184, + "step": 53790 + }, + { + "epoch": 1.38, + "learning_rate": 1.178590343508817e-06, + "loss": 0.5757, + "step": 53791 + }, + { + "epoch": 1.38, + "learning_rate": 1.1785631178301096e-06, + "loss": 0.6434, + "step": 53792 + }, + { + "epoch": 1.38, + "learning_rate": 1.1785358920146848e-06, + "loss": 0.645, + "step": 53793 + }, + { + "epoch": 1.38, + "learning_rate": 1.1785086660625632e-06, + "loss": 0.7207, + "step": 53794 + }, + { + "epoch": 1.38, + "learning_rate": 1.178481439973766e-06, + "loss": 0.5784, + "step": 53795 + }, + { + "epoch": 1.38, + "learning_rate": 1.1784542137483134e-06, + "loss": 0.4985, + "step": 53796 + }, + { + "epoch": 1.38, + "learning_rate": 1.1784269873862267e-06, + "loss": 0.644, + "step": 53797 + }, + { + "epoch": 1.38, + "learning_rate": 1.1783997608875266e-06, + "loss": 0.668, + "step": 53798 + }, + { + "epoch": 1.38, + "learning_rate": 1.1783725342522345e-06, + "loss": 0.5288, + "step": 53799 + }, + { + "epoch": 1.38, + "learning_rate": 1.17834530748037e-06, + "loss": 0.6763, + "step": 53800 + }, + { + "epoch": 1.38, + "learning_rate": 1.1783180805719553e-06, + "loss": 0.8047, + "step": 53801 + }, + { + "epoch": 1.38, + "learning_rate": 1.1782908535270103e-06, + "loss": 0.5503, + "step": 53802 + }, + { + "epoch": 1.38, + "learning_rate": 1.1782636263455566e-06, + "loss": 0.6514, + "step": 53803 + }, + { + "epoch": 1.38, + "learning_rate": 1.1782363990276141e-06, + "loss": 0.5859, + "step": 53804 + }, + { + "epoch": 1.38, + "learning_rate": 1.1782091715732047e-06, + "loss": 0.6689, + "step": 53805 + }, + { + "epoch": 1.38, + "learning_rate": 1.1781819439823484e-06, + "loss": 0.6553, + "step": 53806 + }, + { + "epoch": 1.38, + "learning_rate": 1.1781547162550665e-06, + "loss": 0.5757, + "step": 53807 + }, + { + "epoch": 1.38, + "learning_rate": 1.1781274883913794e-06, + "loss": 0.6226, + "step": 53808 + }, + { + "epoch": 1.38, + "learning_rate": 1.1781002603913086e-06, + "loss": 0.8848, + "step": 53809 + }, + { + "epoch": 1.38, + "learning_rate": 1.1780730322548745e-06, + "loss": 0.5232, + "step": 53810 + }, + { + "epoch": 1.38, + "learning_rate": 1.178045803982098e-06, + "loss": 0.4868, + "step": 53811 + }, + { + "epoch": 1.38, + "learning_rate": 1.1780185755730003e-06, + "loss": 0.668, + "step": 53812 + }, + { + "epoch": 1.38, + "learning_rate": 1.1779913470276017e-06, + "loss": 0.6816, + "step": 53813 + }, + { + "epoch": 1.38, + "learning_rate": 1.1779641183459234e-06, + "loss": 0.7544, + "step": 53814 + }, + { + "epoch": 1.38, + "learning_rate": 1.1779368895279864e-06, + "loss": 0.6709, + "step": 53815 + }, + { + "epoch": 1.38, + "learning_rate": 1.1779096605738113e-06, + "loss": 0.6475, + "step": 53816 + }, + { + "epoch": 1.38, + "learning_rate": 1.1778824314834185e-06, + "loss": 0.8711, + "step": 53817 + }, + { + "epoch": 1.38, + "learning_rate": 1.1778552022568296e-06, + "loss": 0.7744, + "step": 53818 + }, + { + "epoch": 1.38, + "learning_rate": 1.177827972894065e-06, + "loss": 0.7686, + "step": 53819 + }, + { + "epoch": 1.38, + "learning_rate": 1.177800743395146e-06, + "loss": 0.6396, + "step": 53820 + }, + { + "epoch": 1.38, + "learning_rate": 1.1777735137600928e-06, + "loss": 0.7188, + "step": 53821 + }, + { + "epoch": 1.38, + "learning_rate": 1.1777462839889267e-06, + "loss": 0.6914, + "step": 53822 + }, + { + "epoch": 1.38, + "learning_rate": 1.1777190540816684e-06, + "loss": 0.6943, + "step": 53823 + }, + { + "epoch": 1.38, + "learning_rate": 1.177691824038339e-06, + "loss": 0.3308, + "step": 53824 + }, + { + "epoch": 1.38, + "learning_rate": 1.1776645938589591e-06, + "loss": 0.6025, + "step": 53825 + }, + { + "epoch": 1.38, + "learning_rate": 1.1776373635435494e-06, + "loss": 0.6182, + "step": 53826 + }, + { + "epoch": 1.38, + "learning_rate": 1.1776101330921311e-06, + "loss": 0.77, + "step": 53827 + }, + { + "epoch": 1.38, + "learning_rate": 1.1775829025047249e-06, + "loss": 0.709, + "step": 53828 + }, + { + "epoch": 1.38, + "learning_rate": 1.1775556717813512e-06, + "loss": 0.6816, + "step": 53829 + }, + { + "epoch": 1.38, + "learning_rate": 1.1775284409220318e-06, + "loss": 0.646, + "step": 53830 + }, + { + "epoch": 1.38, + "learning_rate": 1.177501209926787e-06, + "loss": 0.5459, + "step": 53831 + }, + { + "epoch": 1.38, + "learning_rate": 1.1774739787956373e-06, + "loss": 0.7847, + "step": 53832 + }, + { + "epoch": 1.38, + "learning_rate": 1.1774467475286043e-06, + "loss": 0.6963, + "step": 53833 + }, + { + "epoch": 1.38, + "learning_rate": 1.1774195161257086e-06, + "loss": 0.6279, + "step": 53834 + }, + { + "epoch": 1.38, + "learning_rate": 1.1773922845869707e-06, + "loss": 0.6318, + "step": 53835 + }, + { + "epoch": 1.38, + "learning_rate": 1.1773650529124114e-06, + "loss": 0.5503, + "step": 53836 + }, + { + "epoch": 1.38, + "learning_rate": 1.1773378211020525e-06, + "loss": 0.7275, + "step": 53837 + }, + { + "epoch": 1.38, + "learning_rate": 1.1773105891559137e-06, + "loss": 0.4917, + "step": 53838 + }, + { + "epoch": 1.38, + "learning_rate": 1.1772833570740163e-06, + "loss": 0.6953, + "step": 53839 + }, + { + "epoch": 1.38, + "learning_rate": 1.1772561248563815e-06, + "loss": 0.5109, + "step": 53840 + }, + { + "epoch": 1.38, + "learning_rate": 1.1772288925030295e-06, + "loss": 0.6367, + "step": 53841 + }, + { + "epoch": 1.38, + "learning_rate": 1.1772016600139818e-06, + "loss": 0.7617, + "step": 53842 + }, + { + "epoch": 1.38, + "learning_rate": 1.1771744273892587e-06, + "loss": 0.7471, + "step": 53843 + }, + { + "epoch": 1.38, + "learning_rate": 1.1771471946288813e-06, + "loss": 0.584, + "step": 53844 + }, + { + "epoch": 1.38, + "learning_rate": 1.177119961732871e-06, + "loss": 0.7207, + "step": 53845 + }, + { + "epoch": 1.38, + "learning_rate": 1.1770927287012474e-06, + "loss": 0.7705, + "step": 53846 + }, + { + "epoch": 1.38, + "learning_rate": 1.1770654955340323e-06, + "loss": 0.7686, + "step": 53847 + }, + { + "epoch": 1.38, + "learning_rate": 1.177038262231246e-06, + "loss": 0.625, + "step": 53848 + }, + { + "epoch": 1.38, + "learning_rate": 1.17701102879291e-06, + "loss": 0.7383, + "step": 53849 + }, + { + "epoch": 1.38, + "learning_rate": 1.1769837952190447e-06, + "loss": 0.5864, + "step": 53850 + }, + { + "epoch": 1.38, + "learning_rate": 1.1769565615096714e-06, + "loss": 0.4856, + "step": 53851 + }, + { + "epoch": 1.38, + "learning_rate": 1.1769293276648098e-06, + "loss": 0.5825, + "step": 53852 + }, + { + "epoch": 1.38, + "learning_rate": 1.176902093684482e-06, + "loss": 0.752, + "step": 53853 + }, + { + "epoch": 1.38, + "learning_rate": 1.1768748595687084e-06, + "loss": 0.7754, + "step": 53854 + }, + { + "epoch": 1.38, + "learning_rate": 1.1768476253175098e-06, + "loss": 0.6389, + "step": 53855 + }, + { + "epoch": 1.38, + "learning_rate": 1.1768203909309074e-06, + "loss": 0.6318, + "step": 53856 + }, + { + "epoch": 1.38, + "learning_rate": 1.1767931564089213e-06, + "loss": 0.5461, + "step": 53857 + }, + { + "epoch": 1.38, + "learning_rate": 1.176765921751573e-06, + "loss": 0.7666, + "step": 53858 + }, + { + "epoch": 1.38, + "learning_rate": 1.1767386869588828e-06, + "loss": 0.6118, + "step": 53859 + }, + { + "epoch": 1.38, + "learning_rate": 1.1767114520308728e-06, + "loss": 0.7158, + "step": 53860 + }, + { + "epoch": 1.38, + "learning_rate": 1.1766842169675624e-06, + "loss": 0.3524, + "step": 53861 + }, + { + "epoch": 1.38, + "learning_rate": 1.1766569817689732e-06, + "loss": 0.5938, + "step": 53862 + }, + { + "epoch": 1.38, + "learning_rate": 1.1766297464351253e-06, + "loss": 0.5107, + "step": 53863 + }, + { + "epoch": 1.38, + "learning_rate": 1.1766025109660407e-06, + "loss": 0.5176, + "step": 53864 + }, + { + "epoch": 1.38, + "learning_rate": 1.1765752753617397e-06, + "loss": 0.6748, + "step": 53865 + }, + { + "epoch": 1.38, + "learning_rate": 1.1765480396222429e-06, + "loss": 0.6924, + "step": 53866 + }, + { + "epoch": 1.38, + "learning_rate": 1.1765208037475714e-06, + "loss": 0.5923, + "step": 53867 + }, + { + "epoch": 1.38, + "learning_rate": 1.1764935677377462e-06, + "loss": 0.6626, + "step": 53868 + }, + { + "epoch": 1.38, + "learning_rate": 1.1764663315927876e-06, + "loss": 0.749, + "step": 53869 + }, + { + "epoch": 1.38, + "learning_rate": 1.1764390953127175e-06, + "loss": 0.5757, + "step": 53870 + }, + { + "epoch": 1.38, + "learning_rate": 1.1764118588975556e-06, + "loss": 0.5278, + "step": 53871 + }, + { + "epoch": 1.38, + "learning_rate": 1.1763846223473235e-06, + "loss": 0.7607, + "step": 53872 + }, + { + "epoch": 1.38, + "learning_rate": 1.1763573856620416e-06, + "loss": 0.8105, + "step": 53873 + }, + { + "epoch": 1.38, + "learning_rate": 1.176330148841731e-06, + "loss": 0.4636, + "step": 53874 + }, + { + "epoch": 1.38, + "learning_rate": 1.1763029118864127e-06, + "loss": 0.5596, + "step": 53875 + }, + { + "epoch": 1.38, + "learning_rate": 1.176275674796107e-06, + "loss": 0.7163, + "step": 53876 + }, + { + "epoch": 1.38, + "learning_rate": 1.1762484375708355e-06, + "loss": 0.5588, + "step": 53877 + }, + { + "epoch": 1.38, + "learning_rate": 1.1762212002106184e-06, + "loss": 0.6807, + "step": 53878 + }, + { + "epoch": 1.38, + "learning_rate": 1.1761939627154768e-06, + "loss": 0.6016, + "step": 53879 + }, + { + "epoch": 1.38, + "learning_rate": 1.176166725085432e-06, + "loss": 0.6885, + "step": 53880 + }, + { + "epoch": 1.38, + "learning_rate": 1.1761394873205042e-06, + "loss": 0.5732, + "step": 53881 + }, + { + "epoch": 1.38, + "learning_rate": 1.1761122494207144e-06, + "loss": 0.5923, + "step": 53882 + }, + { + "epoch": 1.38, + "learning_rate": 1.1760850113860835e-06, + "loss": 0.6577, + "step": 53883 + }, + { + "epoch": 1.38, + "learning_rate": 1.1760577732166324e-06, + "loss": 0.6455, + "step": 53884 + }, + { + "epoch": 1.38, + "learning_rate": 1.1760305349123822e-06, + "loss": 0.71, + "step": 53885 + }, + { + "epoch": 1.38, + "learning_rate": 1.1760032964733535e-06, + "loss": 0.7998, + "step": 53886 + }, + { + "epoch": 1.38, + "learning_rate": 1.175976057899567e-06, + "loss": 0.4808, + "step": 53887 + }, + { + "epoch": 1.38, + "learning_rate": 1.1759488191910436e-06, + "loss": 0.5879, + "step": 53888 + }, + { + "epoch": 1.38, + "learning_rate": 1.1759215803478046e-06, + "loss": 0.5889, + "step": 53889 + }, + { + "epoch": 1.38, + "learning_rate": 1.1758943413698704e-06, + "loss": 0.6372, + "step": 53890 + }, + { + "epoch": 1.38, + "learning_rate": 1.1758671022572623e-06, + "loss": 0.6787, + "step": 53891 + }, + { + "epoch": 1.38, + "learning_rate": 1.1758398630100002e-06, + "loss": 0.7168, + "step": 53892 + }, + { + "epoch": 1.38, + "learning_rate": 1.175812623628106e-06, + "loss": 0.9678, + "step": 53893 + }, + { + "epoch": 1.38, + "learning_rate": 1.1757853841116e-06, + "loss": 0.7148, + "step": 53894 + }, + { + "epoch": 1.38, + "learning_rate": 1.1757581444605037e-06, + "loss": 0.6177, + "step": 53895 + }, + { + "epoch": 1.38, + "learning_rate": 1.1757309046748368e-06, + "loss": 0.6963, + "step": 53896 + }, + { + "epoch": 1.38, + "learning_rate": 1.1757036647546212e-06, + "loss": 0.6431, + "step": 53897 + }, + { + "epoch": 1.38, + "learning_rate": 1.1756764246998771e-06, + "loss": 0.6689, + "step": 53898 + }, + { + "epoch": 1.38, + "learning_rate": 1.1756491845106257e-06, + "loss": 0.567, + "step": 53899 + }, + { + "epoch": 1.38, + "learning_rate": 1.1756219441868883e-06, + "loss": 0.6304, + "step": 53900 + }, + { + "epoch": 1.38, + "learning_rate": 1.1755947037286846e-06, + "loss": 0.5781, + "step": 53901 + }, + { + "epoch": 1.38, + "learning_rate": 1.1755674631360363e-06, + "loss": 0.5332, + "step": 53902 + }, + { + "epoch": 1.38, + "learning_rate": 1.175540222408964e-06, + "loss": 0.4915, + "step": 53903 + }, + { + "epoch": 1.38, + "learning_rate": 1.1755129815474888e-06, + "loss": 0.6396, + "step": 53904 + }, + { + "epoch": 1.38, + "learning_rate": 1.1754857405516316e-06, + "loss": 0.4846, + "step": 53905 + }, + { + "epoch": 1.38, + "learning_rate": 1.175458499421413e-06, + "loss": 0.5564, + "step": 53906 + }, + { + "epoch": 1.38, + "learning_rate": 1.1754312581568535e-06, + "loss": 0.7236, + "step": 53907 + }, + { + "epoch": 1.38, + "learning_rate": 1.1754040167579746e-06, + "loss": 0.6768, + "step": 53908 + }, + { + "epoch": 1.38, + "learning_rate": 1.1753767752247968e-06, + "loss": 0.7915, + "step": 53909 + }, + { + "epoch": 1.38, + "learning_rate": 1.1753495335573413e-06, + "loss": 0.7271, + "step": 53910 + }, + { + "epoch": 1.38, + "learning_rate": 1.1753222917556284e-06, + "loss": 0.6929, + "step": 53911 + }, + { + "epoch": 1.38, + "learning_rate": 1.1752950498196794e-06, + "loss": 0.7412, + "step": 53912 + }, + { + "epoch": 1.38, + "learning_rate": 1.175267807749515e-06, + "loss": 0.6543, + "step": 53913 + }, + { + "epoch": 1.38, + "learning_rate": 1.1752405655451562e-06, + "loss": 0.6279, + "step": 53914 + }, + { + "epoch": 1.38, + "learning_rate": 1.1752133232066237e-06, + "loss": 0.7285, + "step": 53915 + }, + { + "epoch": 1.38, + "learning_rate": 1.1751860807339387e-06, + "loss": 0.5645, + "step": 53916 + }, + { + "epoch": 1.38, + "learning_rate": 1.1751588381271212e-06, + "loss": 0.5728, + "step": 53917 + }, + { + "epoch": 1.38, + "learning_rate": 1.1751315953861932e-06, + "loss": 0.4258, + "step": 53918 + }, + { + "epoch": 1.38, + "learning_rate": 1.1751043525111743e-06, + "loss": 0.751, + "step": 53919 + }, + { + "epoch": 1.38, + "learning_rate": 1.1750771095020867e-06, + "loss": 0.6089, + "step": 53920 + }, + { + "epoch": 1.38, + "learning_rate": 1.1750498663589506e-06, + "loss": 0.7051, + "step": 53921 + }, + { + "epoch": 1.38, + "learning_rate": 1.1750226230817863e-06, + "loss": 0.708, + "step": 53922 + }, + { + "epoch": 1.38, + "learning_rate": 1.1749953796706157e-06, + "loss": 0.4186, + "step": 53923 + }, + { + "epoch": 1.38, + "learning_rate": 1.1749681361254591e-06, + "loss": 0.6211, + "step": 53924 + }, + { + "epoch": 1.38, + "learning_rate": 1.1749408924463375e-06, + "loss": 0.5498, + "step": 53925 + }, + { + "epoch": 1.38, + "learning_rate": 1.1749136486332716e-06, + "loss": 0.4297, + "step": 53926 + }, + { + "epoch": 1.38, + "learning_rate": 1.1748864046862824e-06, + "loss": 0.4937, + "step": 53927 + }, + { + "epoch": 1.38, + "learning_rate": 1.1748591606053904e-06, + "loss": 0.6899, + "step": 53928 + }, + { + "epoch": 1.38, + "learning_rate": 1.1748319163906172e-06, + "loss": 0.8223, + "step": 53929 + }, + { + "epoch": 1.38, + "learning_rate": 1.1748046720419832e-06, + "loss": 0.7051, + "step": 53930 + }, + { + "epoch": 1.38, + "learning_rate": 1.1747774275595092e-06, + "loss": 0.688, + "step": 53931 + }, + { + "epoch": 1.38, + "learning_rate": 1.174750182943216e-06, + "loss": 0.7778, + "step": 53932 + }, + { + "epoch": 1.38, + "learning_rate": 1.174722938193125e-06, + "loss": 0.5784, + "step": 53933 + }, + { + "epoch": 1.38, + "learning_rate": 1.1746956933092565e-06, + "loss": 0.6855, + "step": 53934 + }, + { + "epoch": 1.38, + "learning_rate": 1.1746684482916316e-06, + "loss": 0.8135, + "step": 53935 + }, + { + "epoch": 1.38, + "learning_rate": 1.1746412031402708e-06, + "loss": 0.3057, + "step": 53936 + }, + { + "epoch": 1.38, + "learning_rate": 1.1746139578551954e-06, + "loss": 0.6455, + "step": 53937 + }, + { + "epoch": 1.38, + "learning_rate": 1.1745867124364261e-06, + "loss": 0.6367, + "step": 53938 + }, + { + "epoch": 1.38, + "learning_rate": 1.174559466883984e-06, + "loss": 0.5803, + "step": 53939 + }, + { + "epoch": 1.38, + "learning_rate": 1.1745322211978898e-06, + "loss": 0.814, + "step": 53940 + }, + { + "epoch": 1.38, + "learning_rate": 1.174504975378164e-06, + "loss": 0.6509, + "step": 53941 + }, + { + "epoch": 1.38, + "learning_rate": 1.1744777294248278e-06, + "loss": 0.5732, + "step": 53942 + }, + { + "epoch": 1.38, + "learning_rate": 1.1744504833379024e-06, + "loss": 0.6709, + "step": 53943 + }, + { + "epoch": 1.38, + "learning_rate": 1.174423237117408e-06, + "loss": 0.7441, + "step": 53944 + }, + { + "epoch": 1.38, + "learning_rate": 1.1743959907633656e-06, + "loss": 0.7676, + "step": 53945 + }, + { + "epoch": 1.38, + "learning_rate": 1.1743687442757963e-06, + "loss": 0.6567, + "step": 53946 + }, + { + "epoch": 1.38, + "learning_rate": 1.1743414976547209e-06, + "loss": 0.6504, + "step": 53947 + }, + { + "epoch": 1.38, + "learning_rate": 1.1743142509001603e-06, + "loss": 0.5996, + "step": 53948 + }, + { + "epoch": 1.38, + "learning_rate": 1.1742870040121352e-06, + "loss": 0.7021, + "step": 53949 + }, + { + "epoch": 1.38, + "learning_rate": 1.1742597569906667e-06, + "loss": 0.3569, + "step": 53950 + }, + { + "epoch": 1.38, + "learning_rate": 1.1742325098357752e-06, + "loss": 0.833, + "step": 53951 + }, + { + "epoch": 1.38, + "learning_rate": 1.1742052625474822e-06, + "loss": 0.5952, + "step": 53952 + }, + { + "epoch": 1.38, + "learning_rate": 1.174178015125808e-06, + "loss": 0.6387, + "step": 53953 + }, + { + "epoch": 1.38, + "learning_rate": 1.1741507675707741e-06, + "loss": 0.7188, + "step": 53954 + }, + { + "epoch": 1.38, + "learning_rate": 1.1741235198824006e-06, + "loss": 0.6978, + "step": 53955 + }, + { + "epoch": 1.38, + "learning_rate": 1.1740962720607091e-06, + "loss": 0.5825, + "step": 53956 + }, + { + "epoch": 1.38, + "learning_rate": 1.1740690241057196e-06, + "loss": 0.6787, + "step": 53957 + }, + { + "epoch": 1.38, + "learning_rate": 1.1740417760174538e-06, + "loss": 0.5693, + "step": 53958 + }, + { + "epoch": 1.38, + "learning_rate": 1.174014527795932e-06, + "loss": 0.4382, + "step": 53959 + }, + { + "epoch": 1.38, + "learning_rate": 1.1739872794411757e-06, + "loss": 0.6597, + "step": 53960 + }, + { + "epoch": 1.38, + "learning_rate": 1.1739600309532047e-06, + "loss": 0.6875, + "step": 53961 + }, + { + "epoch": 1.38, + "learning_rate": 1.173932782332041e-06, + "loss": 0.5527, + "step": 53962 + }, + { + "epoch": 1.38, + "learning_rate": 1.1739055335777046e-06, + "loss": 0.7627, + "step": 53963 + }, + { + "epoch": 1.38, + "learning_rate": 1.173878284690217e-06, + "loss": 0.5908, + "step": 53964 + }, + { + "epoch": 1.38, + "learning_rate": 1.1738510356695989e-06, + "loss": 0.667, + "step": 53965 + }, + { + "epoch": 1.38, + "learning_rate": 1.1738237865158706e-06, + "loss": 0.6162, + "step": 53966 + }, + { + "epoch": 1.38, + "learning_rate": 1.1737965372290537e-06, + "loss": 0.5259, + "step": 53967 + }, + { + "epoch": 1.38, + "learning_rate": 1.173769287809169e-06, + "loss": 0.5386, + "step": 53968 + }, + { + "epoch": 1.38, + "learning_rate": 1.173742038256237e-06, + "loss": 0.7363, + "step": 53969 + }, + { + "epoch": 1.38, + "learning_rate": 1.1737147885702782e-06, + "loss": 0.5498, + "step": 53970 + }, + { + "epoch": 1.38, + "learning_rate": 1.1736875387513146e-06, + "loss": 0.627, + "step": 53971 + }, + { + "epoch": 1.38, + "learning_rate": 1.173660288799366e-06, + "loss": 0.5293, + "step": 53972 + }, + { + "epoch": 1.38, + "learning_rate": 1.173633038714454e-06, + "loss": 0.6582, + "step": 53973 + }, + { + "epoch": 1.38, + "learning_rate": 1.1736057884965992e-06, + "loss": 0.5596, + "step": 53974 + }, + { + "epoch": 1.38, + "learning_rate": 1.1735785381458224e-06, + "loss": 0.7402, + "step": 53975 + }, + { + "epoch": 1.38, + "learning_rate": 1.1735512876621444e-06, + "loss": 0.8125, + "step": 53976 + }, + { + "epoch": 1.38, + "learning_rate": 1.1735240370455862e-06, + "loss": 0.625, + "step": 53977 + }, + { + "epoch": 1.38, + "learning_rate": 1.1734967862961685e-06, + "loss": 0.6709, + "step": 53978 + }, + { + "epoch": 1.38, + "learning_rate": 1.1734695354139126e-06, + "loss": 0.7559, + "step": 53979 + }, + { + "epoch": 1.38, + "learning_rate": 1.1734422843988387e-06, + "loss": 0.6123, + "step": 53980 + }, + { + "epoch": 1.38, + "learning_rate": 1.1734150332509683e-06, + "loss": 0.5859, + "step": 53981 + }, + { + "epoch": 1.38, + "learning_rate": 1.1733877819703214e-06, + "loss": 0.6914, + "step": 53982 + }, + { + "epoch": 1.38, + "learning_rate": 1.1733605305569202e-06, + "loss": 0.7471, + "step": 53983 + }, + { + "epoch": 1.38, + "learning_rate": 1.1733332790107846e-06, + "loss": 0.6079, + "step": 53984 + }, + { + "epoch": 1.38, + "learning_rate": 1.1733060273319355e-06, + "loss": 0.7559, + "step": 53985 + }, + { + "epoch": 1.38, + "learning_rate": 1.1732787755203938e-06, + "loss": 0.4907, + "step": 53986 + }, + { + "epoch": 1.38, + "learning_rate": 1.1732515235761811e-06, + "loss": 0.7163, + "step": 53987 + }, + { + "epoch": 1.38, + "learning_rate": 1.173224271499317e-06, + "loss": 0.4446, + "step": 53988 + }, + { + "epoch": 1.38, + "learning_rate": 1.1731970192898235e-06, + "loss": 0.8242, + "step": 53989 + }, + { + "epoch": 1.38, + "learning_rate": 1.1731697669477209e-06, + "loss": 0.5898, + "step": 53990 + }, + { + "epoch": 1.38, + "learning_rate": 1.17314251447303e-06, + "loss": 0.6528, + "step": 53991 + }, + { + "epoch": 1.38, + "learning_rate": 1.173115261865772e-06, + "loss": 0.7832, + "step": 53992 + }, + { + "epoch": 1.38, + "learning_rate": 1.1730880091259674e-06, + "loss": 0.6001, + "step": 53993 + }, + { + "epoch": 1.38, + "learning_rate": 1.1730607562536379e-06, + "loss": 0.6953, + "step": 53994 + }, + { + "epoch": 1.38, + "learning_rate": 1.173033503248803e-06, + "loss": 0.6382, + "step": 53995 + }, + { + "epoch": 1.38, + "learning_rate": 1.1730062501114848e-06, + "loss": 0.7017, + "step": 53996 + }, + { + "epoch": 1.38, + "learning_rate": 1.1729789968417033e-06, + "loss": 0.5112, + "step": 53997 + }, + { + "epoch": 1.38, + "learning_rate": 1.1729517434394799e-06, + "loss": 0.6108, + "step": 53998 + }, + { + "epoch": 1.38, + "learning_rate": 1.1729244899048354e-06, + "loss": 0.6426, + "step": 53999 + }, + { + "epoch": 1.38, + "learning_rate": 1.1728972362377905e-06, + "loss": 0.6748, + "step": 54000 + }, + { + "epoch": 1.38, + "learning_rate": 1.1728699824383658e-06, + "loss": 0.4592, + "step": 54001 + }, + { + "epoch": 1.38, + "learning_rate": 1.1728427285065829e-06, + "loss": 0.873, + "step": 54002 + }, + { + "epoch": 1.38, + "learning_rate": 1.172815474442462e-06, + "loss": 0.8398, + "step": 54003 + }, + { + "epoch": 1.38, + "learning_rate": 1.1727882202460248e-06, + "loss": 0.5227, + "step": 54004 + }, + { + "epoch": 1.38, + "learning_rate": 1.172760965917291e-06, + "loss": 0.7178, + "step": 54005 + }, + { + "epoch": 1.38, + "learning_rate": 1.1727337114562825e-06, + "loss": 0.6094, + "step": 54006 + }, + { + "epoch": 1.38, + "learning_rate": 1.1727064568630193e-06, + "loss": 0.6816, + "step": 54007 + }, + { + "epoch": 1.38, + "learning_rate": 1.1726792021375232e-06, + "loss": 0.5684, + "step": 54008 + }, + { + "epoch": 1.38, + "learning_rate": 1.1726519472798142e-06, + "loss": 0.542, + "step": 54009 + }, + { + "epoch": 1.38, + "learning_rate": 1.1726246922899135e-06, + "loss": 0.6792, + "step": 54010 + }, + { + "epoch": 1.38, + "learning_rate": 1.1725974371678423e-06, + "loss": 0.6367, + "step": 54011 + }, + { + "epoch": 1.38, + "learning_rate": 1.172570181913621e-06, + "loss": 0.6001, + "step": 54012 + }, + { + "epoch": 1.38, + "learning_rate": 1.1725429265272707e-06, + "loss": 0.5757, + "step": 54013 + }, + { + "epoch": 1.38, + "learning_rate": 1.1725156710088123e-06, + "loss": 0.6123, + "step": 54014 + }, + { + "epoch": 1.38, + "learning_rate": 1.1724884153582664e-06, + "loss": 0.7656, + "step": 54015 + }, + { + "epoch": 1.38, + "learning_rate": 1.172461159575654e-06, + "loss": 0.2573, + "step": 54016 + }, + { + "epoch": 1.38, + "learning_rate": 1.1724339036609962e-06, + "loss": 0.6113, + "step": 54017 + }, + { + "epoch": 1.38, + "learning_rate": 1.1724066476143135e-06, + "loss": 0.6001, + "step": 54018 + }, + { + "epoch": 1.38, + "learning_rate": 1.1723793914356274e-06, + "loss": 0.6863, + "step": 54019 + }, + { + "epoch": 1.38, + "learning_rate": 1.1723521351249578e-06, + "loss": 0.5208, + "step": 54020 + }, + { + "epoch": 1.38, + "learning_rate": 1.1723248786823266e-06, + "loss": 0.7402, + "step": 54021 + }, + { + "epoch": 1.38, + "learning_rate": 1.1722976221077536e-06, + "loss": 0.5244, + "step": 54022 + }, + { + "epoch": 1.38, + "learning_rate": 1.1722703654012606e-06, + "loss": 0.6729, + "step": 54023 + }, + { + "epoch": 1.38, + "learning_rate": 1.172243108562868e-06, + "loss": 0.6558, + "step": 54024 + }, + { + "epoch": 1.38, + "learning_rate": 1.1722158515925971e-06, + "loss": 0.5122, + "step": 54025 + }, + { + "epoch": 1.38, + "learning_rate": 1.172188594490468e-06, + "loss": 0.6455, + "step": 54026 + }, + { + "epoch": 1.38, + "learning_rate": 1.172161337256502e-06, + "loss": 0.4795, + "step": 54027 + }, + { + "epoch": 1.38, + "learning_rate": 1.17213407989072e-06, + "loss": 0.7402, + "step": 54028 + }, + { + "epoch": 1.38, + "learning_rate": 1.172106822393143e-06, + "loss": 0.6685, + "step": 54029 + }, + { + "epoch": 1.38, + "learning_rate": 1.172079564763792e-06, + "loss": 0.7842, + "step": 54030 + }, + { + "epoch": 1.38, + "learning_rate": 1.1720523070026873e-06, + "loss": 0.6211, + "step": 54031 + }, + { + "epoch": 1.38, + "learning_rate": 1.1720250491098499e-06, + "loss": 0.6543, + "step": 54032 + }, + { + "epoch": 1.38, + "learning_rate": 1.171997791085301e-06, + "loss": 0.7842, + "step": 54033 + }, + { + "epoch": 1.38, + "learning_rate": 1.1719705329290613e-06, + "loss": 0.4955, + "step": 54034 + }, + { + "epoch": 1.38, + "learning_rate": 1.1719432746411514e-06, + "loss": 0.5674, + "step": 54035 + }, + { + "epoch": 1.38, + "learning_rate": 1.171916016221593e-06, + "loss": 0.6255, + "step": 54036 + }, + { + "epoch": 1.38, + "learning_rate": 1.171888757670406e-06, + "loss": 0.562, + "step": 54037 + }, + { + "epoch": 1.39, + "learning_rate": 1.1718614989876117e-06, + "loss": 0.7617, + "step": 54038 + }, + { + "epoch": 1.39, + "learning_rate": 1.171834240173231e-06, + "loss": 0.7695, + "step": 54039 + }, + { + "epoch": 1.39, + "learning_rate": 1.1718069812272847e-06, + "loss": 0.6963, + "step": 54040 + }, + { + "epoch": 1.39, + "learning_rate": 1.1717797221497938e-06, + "loss": 0.7451, + "step": 54041 + }, + { + "epoch": 1.39, + "learning_rate": 1.171752462940779e-06, + "loss": 0.7432, + "step": 54042 + }, + { + "epoch": 1.39, + "learning_rate": 1.1717252036002611e-06, + "loss": 0.6108, + "step": 54043 + }, + { + "epoch": 1.39, + "learning_rate": 1.1716979441282616e-06, + "loss": 0.6265, + "step": 54044 + }, + { + "epoch": 1.39, + "learning_rate": 1.1716706845248005e-06, + "loss": 0.6462, + "step": 54045 + }, + { + "epoch": 1.39, + "learning_rate": 1.1716434247898992e-06, + "loss": 0.6094, + "step": 54046 + }, + { + "epoch": 1.39, + "learning_rate": 1.1716161649235782e-06, + "loss": 0.6523, + "step": 54047 + }, + { + "epoch": 1.39, + "learning_rate": 1.1715889049258588e-06, + "loss": 0.5645, + "step": 54048 + }, + { + "epoch": 1.39, + "learning_rate": 1.1715616447967615e-06, + "loss": 0.5864, + "step": 54049 + }, + { + "epoch": 1.39, + "learning_rate": 1.1715343845363075e-06, + "loss": 0.7227, + "step": 54050 + }, + { + "epoch": 1.39, + "learning_rate": 1.1715071241445173e-06, + "loss": 0.7051, + "step": 54051 + }, + { + "epoch": 1.39, + "learning_rate": 1.1714798636214122e-06, + "loss": 0.4463, + "step": 54052 + }, + { + "epoch": 1.39, + "learning_rate": 1.1714526029670126e-06, + "loss": 0.8057, + "step": 54053 + }, + { + "epoch": 1.39, + "learning_rate": 1.1714253421813397e-06, + "loss": 0.7393, + "step": 54054 + }, + { + "epoch": 1.39, + "learning_rate": 1.1713980812644147e-06, + "loss": 0.5239, + "step": 54055 + }, + { + "epoch": 1.39, + "learning_rate": 1.1713708202162576e-06, + "loss": 0.7549, + "step": 54056 + }, + { + "epoch": 1.39, + "learning_rate": 1.1713435590368898e-06, + "loss": 0.6221, + "step": 54057 + }, + { + "epoch": 1.39, + "learning_rate": 1.1713162977263323e-06, + "loss": 0.4668, + "step": 54058 + }, + { + "epoch": 1.39, + "learning_rate": 1.1712890362846058e-06, + "loss": 0.7598, + "step": 54059 + }, + { + "epoch": 1.39, + "learning_rate": 1.1712617747117308e-06, + "loss": 0.7793, + "step": 54060 + }, + { + "epoch": 1.39, + "learning_rate": 1.1712345130077288e-06, + "loss": 0.7705, + "step": 54061 + }, + { + "epoch": 1.39, + "learning_rate": 1.1712072511726203e-06, + "loss": 0.7002, + "step": 54062 + }, + { + "epoch": 1.39, + "learning_rate": 1.1711799892064264e-06, + "loss": 0.4927, + "step": 54063 + }, + { + "epoch": 1.39, + "learning_rate": 1.171152727109168e-06, + "loss": 0.5703, + "step": 54064 + }, + { + "epoch": 1.39, + "learning_rate": 1.1711254648808657e-06, + "loss": 0.6128, + "step": 54065 + }, + { + "epoch": 1.39, + "learning_rate": 1.1710982025215404e-06, + "loss": 0.7451, + "step": 54066 + }, + { + "epoch": 1.39, + "learning_rate": 1.171070940031213e-06, + "loss": 0.7036, + "step": 54067 + }, + { + "epoch": 1.39, + "learning_rate": 1.1710436774099047e-06, + "loss": 0.6465, + "step": 54068 + }, + { + "epoch": 1.39, + "learning_rate": 1.1710164146576363e-06, + "loss": 0.749, + "step": 54069 + }, + { + "epoch": 1.39, + "learning_rate": 1.1709891517744278e-06, + "loss": 0.6636, + "step": 54070 + }, + { + "epoch": 1.39, + "learning_rate": 1.1709618887603011e-06, + "loss": 0.8389, + "step": 54071 + }, + { + "epoch": 1.39, + "learning_rate": 1.1709346256152767e-06, + "loss": 0.4331, + "step": 54072 + }, + { + "epoch": 1.39, + "learning_rate": 1.170907362339376e-06, + "loss": 0.5381, + "step": 54073 + }, + { + "epoch": 1.39, + "learning_rate": 1.170880098932619e-06, + "loss": 0.5391, + "step": 54074 + }, + { + "epoch": 1.39, + "learning_rate": 1.170852835395027e-06, + "loss": 0.6802, + "step": 54075 + }, + { + "epoch": 1.39, + "learning_rate": 1.1708255717266206e-06, + "loss": 0.4626, + "step": 54076 + }, + { + "epoch": 1.39, + "learning_rate": 1.1707983079274212e-06, + "loss": 0.7974, + "step": 54077 + }, + { + "epoch": 1.39, + "learning_rate": 1.1707710439974492e-06, + "loss": 0.5278, + "step": 54078 + }, + { + "epoch": 1.39, + "learning_rate": 1.1707437799367259e-06, + "loss": 0.7178, + "step": 54079 + }, + { + "epoch": 1.39, + "learning_rate": 1.1707165157452718e-06, + "loss": 0.6169, + "step": 54080 + }, + { + "epoch": 1.39, + "learning_rate": 1.170689251423108e-06, + "loss": 0.6953, + "step": 54081 + }, + { + "epoch": 1.39, + "learning_rate": 1.170661986970255e-06, + "loss": 0.5938, + "step": 54082 + }, + { + "epoch": 1.39, + "learning_rate": 1.170634722386734e-06, + "loss": 0.6162, + "step": 54083 + }, + { + "epoch": 1.39, + "learning_rate": 1.1706074576725665e-06, + "loss": 0.5684, + "step": 54084 + }, + { + "epoch": 1.39, + "learning_rate": 1.170580192827772e-06, + "loss": 0.647, + "step": 54085 + }, + { + "epoch": 1.39, + "learning_rate": 1.1705529278523725e-06, + "loss": 0.4531, + "step": 54086 + }, + { + "epoch": 1.39, + "learning_rate": 1.1705256627463883e-06, + "loss": 0.8623, + "step": 54087 + }, + { + "epoch": 1.39, + "learning_rate": 1.1704983975098404e-06, + "loss": 0.7061, + "step": 54088 + }, + { + "epoch": 1.39, + "learning_rate": 1.1704711321427498e-06, + "loss": 0.5388, + "step": 54089 + }, + { + "epoch": 1.39, + "learning_rate": 1.1704438666451373e-06, + "loss": 0.6318, + "step": 54090 + }, + { + "epoch": 1.39, + "learning_rate": 1.1704166010170235e-06, + "loss": 0.5752, + "step": 54091 + }, + { + "epoch": 1.39, + "learning_rate": 1.17038933525843e-06, + "loss": 0.6465, + "step": 54092 + }, + { + "epoch": 1.39, + "learning_rate": 1.1703620693693767e-06, + "loss": 0.489, + "step": 54093 + }, + { + "epoch": 1.39, + "learning_rate": 1.1703348033498856e-06, + "loss": 0.7236, + "step": 54094 + }, + { + "epoch": 1.39, + "learning_rate": 1.1703075371999764e-06, + "loss": 0.5575, + "step": 54095 + }, + { + "epoch": 1.39, + "learning_rate": 1.1702802709196712e-06, + "loss": 0.7266, + "step": 54096 + }, + { + "epoch": 1.39, + "learning_rate": 1.1702530045089895e-06, + "loss": 0.8398, + "step": 54097 + }, + { + "epoch": 1.39, + "learning_rate": 1.1702257379679532e-06, + "loss": 0.582, + "step": 54098 + }, + { + "epoch": 1.39, + "learning_rate": 1.1701984712965832e-06, + "loss": 0.7305, + "step": 54099 + }, + { + "epoch": 1.39, + "learning_rate": 1.1701712044948995e-06, + "loss": 0.6064, + "step": 54100 + }, + { + "epoch": 1.39, + "learning_rate": 1.1701439375629238e-06, + "loss": 0.7808, + "step": 54101 + }, + { + "epoch": 1.39, + "learning_rate": 1.1701166705006767e-06, + "loss": 0.7373, + "step": 54102 + }, + { + "epoch": 1.39, + "learning_rate": 1.1700894033081792e-06, + "loss": 0.6074, + "step": 54103 + }, + { + "epoch": 1.39, + "learning_rate": 1.1700621359854519e-06, + "loss": 0.6284, + "step": 54104 + }, + { + "epoch": 1.39, + "learning_rate": 1.170034868532516e-06, + "loss": 0.6953, + "step": 54105 + }, + { + "epoch": 1.39, + "learning_rate": 1.170007600949392e-06, + "loss": 0.7891, + "step": 54106 + }, + { + "epoch": 1.39, + "learning_rate": 1.169980333236101e-06, + "loss": 0.5806, + "step": 54107 + }, + { + "epoch": 1.39, + "learning_rate": 1.1699530653926638e-06, + "loss": 0.6724, + "step": 54108 + }, + { + "epoch": 1.39, + "learning_rate": 1.169925797419102e-06, + "loss": 0.6855, + "step": 54109 + }, + { + "epoch": 1.39, + "learning_rate": 1.1698985293154354e-06, + "loss": 0.6807, + "step": 54110 + }, + { + "epoch": 1.39, + "learning_rate": 1.1698712610816852e-06, + "loss": 0.6807, + "step": 54111 + }, + { + "epoch": 1.39, + "learning_rate": 1.1698439927178722e-06, + "loss": 0.6353, + "step": 54112 + }, + { + "epoch": 1.39, + "learning_rate": 1.169816724224018e-06, + "loss": 0.521, + "step": 54113 + }, + { + "epoch": 1.39, + "learning_rate": 1.1697894556001427e-06, + "loss": 0.6943, + "step": 54114 + }, + { + "epoch": 1.39, + "learning_rate": 1.1697621868462675e-06, + "loss": 0.7261, + "step": 54115 + }, + { + "epoch": 1.39, + "learning_rate": 1.169734917962413e-06, + "loss": 0.6533, + "step": 54116 + }, + { + "epoch": 1.39, + "learning_rate": 1.1697076489486005e-06, + "loss": 0.5078, + "step": 54117 + }, + { + "epoch": 1.39, + "learning_rate": 1.1696803798048502e-06, + "loss": 0.876, + "step": 54118 + }, + { + "epoch": 1.39, + "learning_rate": 1.169653110531184e-06, + "loss": 0.6401, + "step": 54119 + }, + { + "epoch": 1.39, + "learning_rate": 1.169625841127622e-06, + "loss": 0.5454, + "step": 54120 + }, + { + "epoch": 1.39, + "learning_rate": 1.1695985715941853e-06, + "loss": 0.5581, + "step": 54121 + }, + { + "epoch": 1.39, + "learning_rate": 1.1695713019308947e-06, + "loss": 0.8018, + "step": 54122 + }, + { + "epoch": 1.39, + "learning_rate": 1.1695440321377712e-06, + "loss": 0.5439, + "step": 54123 + }, + { + "epoch": 1.39, + "learning_rate": 1.1695167622148357e-06, + "loss": 0.5242, + "step": 54124 + }, + { + "epoch": 1.39, + "learning_rate": 1.1694894921621087e-06, + "loss": 0.7295, + "step": 54125 + }, + { + "epoch": 1.39, + "learning_rate": 1.1694622219796117e-06, + "loss": 0.6426, + "step": 54126 + }, + { + "epoch": 1.39, + "learning_rate": 1.1694349516673652e-06, + "loss": 0.438, + "step": 54127 + }, + { + "epoch": 1.39, + "learning_rate": 1.1694076812253902e-06, + "loss": 0.5947, + "step": 54128 + }, + { + "epoch": 1.39, + "learning_rate": 1.1693804106537075e-06, + "loss": 0.4265, + "step": 54129 + }, + { + "epoch": 1.39, + "learning_rate": 1.169353139952338e-06, + "loss": 0.667, + "step": 54130 + }, + { + "epoch": 1.39, + "learning_rate": 1.1693258691213026e-06, + "loss": 0.7412, + "step": 54131 + }, + { + "epoch": 1.39, + "learning_rate": 1.169298598160622e-06, + "loss": 0.6523, + "step": 54132 + }, + { + "epoch": 1.39, + "learning_rate": 1.1692713270703173e-06, + "loss": 0.7363, + "step": 54133 + }, + { + "epoch": 1.39, + "learning_rate": 1.1692440558504099e-06, + "loss": 0.4717, + "step": 54134 + }, + { + "epoch": 1.39, + "learning_rate": 1.1692167845009193e-06, + "loss": 0.7129, + "step": 54135 + }, + { + "epoch": 1.39, + "learning_rate": 1.1691895130218676e-06, + "loss": 0.6006, + "step": 54136 + }, + { + "epoch": 1.39, + "learning_rate": 1.169162241413275e-06, + "loss": 0.4907, + "step": 54137 + }, + { + "epoch": 1.39, + "learning_rate": 1.1691349696751628e-06, + "loss": 0.6963, + "step": 54138 + }, + { + "epoch": 1.39, + "learning_rate": 1.1691076978075521e-06, + "loss": 0.6455, + "step": 54139 + }, + { + "epoch": 1.39, + "learning_rate": 1.169080425810463e-06, + "loss": 0.6211, + "step": 54140 + }, + { + "epoch": 1.39, + "learning_rate": 1.1690531536839168e-06, + "loss": 0.4861, + "step": 54141 + }, + { + "epoch": 1.39, + "learning_rate": 1.1690258814279345e-06, + "loss": 0.6719, + "step": 54142 + }, + { + "epoch": 1.39, + "learning_rate": 1.1689986090425366e-06, + "loss": 0.7334, + "step": 54143 + }, + { + "epoch": 1.39, + "learning_rate": 1.1689713365277445e-06, + "loss": 0.5059, + "step": 54144 + }, + { + "epoch": 1.39, + "learning_rate": 1.1689440638835788e-06, + "loss": 0.7148, + "step": 54145 + }, + { + "epoch": 1.39, + "learning_rate": 1.16891679111006e-06, + "loss": 0.4995, + "step": 54146 + }, + { + "epoch": 1.39, + "learning_rate": 1.1688895182072101e-06, + "loss": 0.6602, + "step": 54147 + }, + { + "epoch": 1.39, + "learning_rate": 1.1688622451750488e-06, + "loss": 0.5859, + "step": 54148 + }, + { + "epoch": 1.39, + "learning_rate": 1.1688349720135978e-06, + "loss": 0.6978, + "step": 54149 + }, + { + "epoch": 1.39, + "learning_rate": 1.168807698722877e-06, + "loss": 0.6665, + "step": 54150 + }, + { + "epoch": 1.39, + "learning_rate": 1.1687804253029083e-06, + "loss": 0.5537, + "step": 54151 + }, + { + "epoch": 1.39, + "learning_rate": 1.168753151753712e-06, + "loss": 0.5413, + "step": 54152 + }, + { + "epoch": 1.39, + "learning_rate": 1.1687258780753095e-06, + "loss": 0.448, + "step": 54153 + }, + { + "epoch": 1.39, + "learning_rate": 1.1686986042677212e-06, + "loss": 0.5625, + "step": 54154 + }, + { + "epoch": 1.39, + "learning_rate": 1.1686713303309683e-06, + "loss": 0.6807, + "step": 54155 + }, + { + "epoch": 1.39, + "learning_rate": 1.1686440562650712e-06, + "loss": 0.6479, + "step": 54156 + }, + { + "epoch": 1.39, + "learning_rate": 1.1686167820700511e-06, + "loss": 0.4851, + "step": 54157 + }, + { + "epoch": 1.39, + "learning_rate": 1.168589507745929e-06, + "loss": 0.6973, + "step": 54158 + }, + { + "epoch": 1.39, + "learning_rate": 1.1685622332927261e-06, + "loss": 0.6406, + "step": 54159 + }, + { + "epoch": 1.39, + "learning_rate": 1.1685349587104623e-06, + "loss": 0.4972, + "step": 54160 + }, + { + "epoch": 1.39, + "learning_rate": 1.168507683999159e-06, + "loss": 0.6895, + "step": 54161 + }, + { + "epoch": 1.39, + "learning_rate": 1.1684804091588372e-06, + "loss": 0.707, + "step": 54162 + }, + { + "epoch": 1.39, + "learning_rate": 1.1684531341895178e-06, + "loss": 0.7339, + "step": 54163 + }, + { + "epoch": 1.39, + "learning_rate": 1.1684258590912216e-06, + "loss": 0.7861, + "step": 54164 + }, + { + "epoch": 1.39, + "learning_rate": 1.1683985838639693e-06, + "loss": 0.8301, + "step": 54165 + }, + { + "epoch": 1.39, + "learning_rate": 1.1683713085077823e-06, + "loss": 0.5928, + "step": 54166 + }, + { + "epoch": 1.39, + "learning_rate": 1.1683440330226809e-06, + "loss": 0.7627, + "step": 54167 + }, + { + "epoch": 1.39, + "learning_rate": 1.168316757408686e-06, + "loss": 0.542, + "step": 54168 + }, + { + "epoch": 1.39, + "learning_rate": 1.168289481665819e-06, + "loss": 0.7207, + "step": 54169 + }, + { + "epoch": 1.39, + "learning_rate": 1.1682622057941005e-06, + "loss": 0.6577, + "step": 54170 + }, + { + "epoch": 1.39, + "learning_rate": 1.168234929793551e-06, + "loss": 0.6118, + "step": 54171 + }, + { + "epoch": 1.39, + "learning_rate": 1.1682076536641922e-06, + "loss": 0.6094, + "step": 54172 + }, + { + "epoch": 1.39, + "learning_rate": 1.168180377406044e-06, + "loss": 0.6274, + "step": 54173 + }, + { + "epoch": 1.39, + "learning_rate": 1.1681531010191287e-06, + "loss": 0.75, + "step": 54174 + }, + { + "epoch": 1.39, + "learning_rate": 1.1681258245034655e-06, + "loss": 0.7393, + "step": 54175 + }, + { + "epoch": 1.39, + "learning_rate": 1.1680985478590763e-06, + "loss": 0.4712, + "step": 54176 + }, + { + "epoch": 1.39, + "learning_rate": 1.1680712710859818e-06, + "loss": 0.6299, + "step": 54177 + }, + { + "epoch": 1.39, + "learning_rate": 1.1680439941842028e-06, + "loss": 0.4067, + "step": 54178 + }, + { + "epoch": 1.39, + "learning_rate": 1.1680167171537605e-06, + "loss": 0.6465, + "step": 54179 + }, + { + "epoch": 1.39, + "learning_rate": 1.1679894399946754e-06, + "loss": 0.623, + "step": 54180 + }, + { + "epoch": 1.39, + "learning_rate": 1.1679621627069685e-06, + "loss": 0.551, + "step": 54181 + }, + { + "epoch": 1.39, + "learning_rate": 1.1679348852906605e-06, + "loss": 0.6201, + "step": 54182 + }, + { + "epoch": 1.39, + "learning_rate": 1.1679076077457725e-06, + "loss": 0.8164, + "step": 54183 + }, + { + "epoch": 1.39, + "learning_rate": 1.167880330072326e-06, + "loss": 0.4707, + "step": 54184 + }, + { + "epoch": 1.39, + "learning_rate": 1.1678530522703405e-06, + "loss": 0.6047, + "step": 54185 + }, + { + "epoch": 1.39, + "learning_rate": 1.1678257743398378e-06, + "loss": 0.6426, + "step": 54186 + }, + { + "epoch": 1.39, + "learning_rate": 1.1677984962808388e-06, + "loss": 0.6797, + "step": 54187 + }, + { + "epoch": 1.39, + "learning_rate": 1.167771218093364e-06, + "loss": 0.5615, + "step": 54188 + }, + { + "epoch": 1.39, + "learning_rate": 1.1677439397774347e-06, + "loss": 0.8057, + "step": 54189 + }, + { + "epoch": 1.39, + "learning_rate": 1.1677166613330714e-06, + "loss": 0.6353, + "step": 54190 + }, + { + "epoch": 1.39, + "learning_rate": 1.1676893827602952e-06, + "loss": 0.6182, + "step": 54191 + }, + { + "epoch": 1.39, + "learning_rate": 1.1676621040591267e-06, + "loss": 0.7109, + "step": 54192 + }, + { + "epoch": 1.39, + "learning_rate": 1.1676348252295875e-06, + "loss": 0.8506, + "step": 54193 + }, + { + "epoch": 1.39, + "learning_rate": 1.1676075462716978e-06, + "loss": 0.5935, + "step": 54194 + }, + { + "epoch": 1.39, + "learning_rate": 1.167580267185479e-06, + "loss": 0.5745, + "step": 54195 + }, + { + "epoch": 1.39, + "learning_rate": 1.1675529879709514e-06, + "loss": 0.5083, + "step": 54196 + }, + { + "epoch": 1.39, + "learning_rate": 1.1675257086281363e-06, + "loss": 0.6431, + "step": 54197 + }, + { + "epoch": 1.39, + "learning_rate": 1.1674984291570543e-06, + "loss": 0.5903, + "step": 54198 + }, + { + "epoch": 1.39, + "learning_rate": 1.1674711495577268e-06, + "loss": 0.6826, + "step": 54199 + }, + { + "epoch": 1.39, + "learning_rate": 1.1674438698301739e-06, + "loss": 0.5811, + "step": 54200 + }, + { + "epoch": 1.39, + "learning_rate": 1.1674165899744174e-06, + "loss": 0.5977, + "step": 54201 + }, + { + "epoch": 1.39, + "learning_rate": 1.167389309990477e-06, + "loss": 0.7041, + "step": 54202 + }, + { + "epoch": 1.39, + "learning_rate": 1.167362029878375e-06, + "loss": 0.7793, + "step": 54203 + }, + { + "epoch": 1.39, + "learning_rate": 1.1673347496381313e-06, + "loss": 0.7373, + "step": 54204 + }, + { + "epoch": 1.39, + "learning_rate": 1.167307469269767e-06, + "loss": 0.5859, + "step": 54205 + }, + { + "epoch": 1.39, + "learning_rate": 1.1672801887733033e-06, + "loss": 0.7432, + "step": 54206 + }, + { + "epoch": 1.39, + "learning_rate": 1.1672529081487607e-06, + "loss": 0.5303, + "step": 54207 + }, + { + "epoch": 1.39, + "learning_rate": 1.16722562739616e-06, + "loss": 0.6411, + "step": 54208 + }, + { + "epoch": 1.39, + "learning_rate": 1.1671983465155228e-06, + "loss": 0.6816, + "step": 54209 + }, + { + "epoch": 1.39, + "learning_rate": 1.1671710655068694e-06, + "loss": 0.5269, + "step": 54210 + }, + { + "epoch": 1.39, + "learning_rate": 1.1671437843702208e-06, + "loss": 0.3887, + "step": 54211 + }, + { + "epoch": 1.39, + "learning_rate": 1.1671165031055975e-06, + "loss": 0.7773, + "step": 54212 + }, + { + "epoch": 1.39, + "learning_rate": 1.1670892217130213e-06, + "loss": 0.8208, + "step": 54213 + }, + { + "epoch": 1.39, + "learning_rate": 1.1670619401925124e-06, + "loss": 0.8203, + "step": 54214 + }, + { + "epoch": 1.39, + "learning_rate": 1.1670346585440916e-06, + "loss": 0.5161, + "step": 54215 + }, + { + "epoch": 1.39, + "learning_rate": 1.1670073767677804e-06, + "loss": 0.7168, + "step": 54216 + }, + { + "epoch": 1.39, + "learning_rate": 1.1669800948635988e-06, + "loss": 0.8213, + "step": 54217 + }, + { + "epoch": 1.39, + "learning_rate": 1.1669528128315688e-06, + "loss": 0.625, + "step": 54218 + }, + { + "epoch": 1.39, + "learning_rate": 1.1669255306717105e-06, + "loss": 0.6353, + "step": 54219 + }, + { + "epoch": 1.39, + "learning_rate": 1.166898248384045e-06, + "loss": 0.6709, + "step": 54220 + }, + { + "epoch": 1.39, + "learning_rate": 1.1668709659685932e-06, + "loss": 0.6958, + "step": 54221 + }, + { + "epoch": 1.39, + "learning_rate": 1.1668436834253759e-06, + "loss": 0.7256, + "step": 54222 + }, + { + "epoch": 1.39, + "learning_rate": 1.1668164007544143e-06, + "loss": 0.6904, + "step": 54223 + }, + { + "epoch": 1.39, + "learning_rate": 1.1667891179557289e-06, + "loss": 0.5703, + "step": 54224 + }, + { + "epoch": 1.39, + "learning_rate": 1.1667618350293405e-06, + "loss": 0.7314, + "step": 54225 + }, + { + "epoch": 1.39, + "learning_rate": 1.1667345519752704e-06, + "loss": 0.5371, + "step": 54226 + }, + { + "epoch": 1.39, + "learning_rate": 1.1667072687935393e-06, + "loss": 0.7715, + "step": 54227 + }, + { + "epoch": 1.39, + "learning_rate": 1.1666799854841684e-06, + "loss": 0.6465, + "step": 54228 + }, + { + "epoch": 1.39, + "learning_rate": 1.1666527020471782e-06, + "loss": 0.709, + "step": 54229 + }, + { + "epoch": 1.39, + "learning_rate": 1.1666254184825895e-06, + "loss": 0.7832, + "step": 54230 + }, + { + "epoch": 1.39, + "learning_rate": 1.1665981347904232e-06, + "loss": 0.6489, + "step": 54231 + }, + { + "epoch": 1.39, + "learning_rate": 1.1665708509707007e-06, + "loss": 0.627, + "step": 54232 + }, + { + "epoch": 1.39, + "learning_rate": 1.1665435670234426e-06, + "loss": 0.6641, + "step": 54233 + }, + { + "epoch": 1.39, + "learning_rate": 1.1665162829486694e-06, + "loss": 0.6304, + "step": 54234 + }, + { + "epoch": 1.39, + "learning_rate": 1.1664889987464026e-06, + "loss": 0.7148, + "step": 54235 + }, + { + "epoch": 1.39, + "learning_rate": 1.1664617144166627e-06, + "loss": 0.752, + "step": 54236 + }, + { + "epoch": 1.39, + "learning_rate": 1.1664344299594709e-06, + "loss": 0.4512, + "step": 54237 + }, + { + "epoch": 1.39, + "learning_rate": 1.1664071453748478e-06, + "loss": 0.4971, + "step": 54238 + }, + { + "epoch": 1.39, + "learning_rate": 1.1663798606628147e-06, + "loss": 0.5913, + "step": 54239 + }, + { + "epoch": 1.39, + "learning_rate": 1.1663525758233916e-06, + "loss": 0.5085, + "step": 54240 + }, + { + "epoch": 1.39, + "learning_rate": 1.1663252908566004e-06, + "loss": 0.5979, + "step": 54241 + }, + { + "epoch": 1.39, + "learning_rate": 1.1662980057624612e-06, + "loss": 0.5822, + "step": 54242 + }, + { + "epoch": 1.39, + "learning_rate": 1.1662707205409958e-06, + "loss": 0.6953, + "step": 54243 + }, + { + "epoch": 1.39, + "learning_rate": 1.166243435192224e-06, + "loss": 0.6836, + "step": 54244 + }, + { + "epoch": 1.39, + "learning_rate": 1.1662161497161678e-06, + "loss": 0.5139, + "step": 54245 + }, + { + "epoch": 1.39, + "learning_rate": 1.166188864112847e-06, + "loss": 0.4673, + "step": 54246 + }, + { + "epoch": 1.39, + "learning_rate": 1.1661615783822835e-06, + "loss": 0.7129, + "step": 54247 + }, + { + "epoch": 1.39, + "learning_rate": 1.1661342925244974e-06, + "loss": 0.7607, + "step": 54248 + }, + { + "epoch": 1.39, + "learning_rate": 1.1661070065395102e-06, + "loss": 0.5684, + "step": 54249 + }, + { + "epoch": 1.39, + "learning_rate": 1.166079720427342e-06, + "loss": 0.6875, + "step": 54250 + }, + { + "epoch": 1.39, + "learning_rate": 1.1660524341880146e-06, + "loss": 0.8057, + "step": 54251 + }, + { + "epoch": 1.39, + "learning_rate": 1.1660251478215485e-06, + "loss": 0.5336, + "step": 54252 + }, + { + "epoch": 1.39, + "learning_rate": 1.1659978613279645e-06, + "loss": 0.8193, + "step": 54253 + }, + { + "epoch": 1.39, + "learning_rate": 1.1659705747072837e-06, + "loss": 0.6177, + "step": 54254 + }, + { + "epoch": 1.39, + "learning_rate": 1.1659432879595263e-06, + "loss": 0.4197, + "step": 54255 + }, + { + "epoch": 1.39, + "learning_rate": 1.1659160010847144e-06, + "loss": 0.6729, + "step": 54256 + }, + { + "epoch": 1.39, + "learning_rate": 1.165888714082868e-06, + "loss": 0.6135, + "step": 54257 + }, + { + "epoch": 1.39, + "learning_rate": 1.1658614269540083e-06, + "loss": 0.6294, + "step": 54258 + }, + { + "epoch": 1.39, + "learning_rate": 1.1658341396981559e-06, + "loss": 0.7422, + "step": 54259 + }, + { + "epoch": 1.39, + "learning_rate": 1.1658068523153324e-06, + "loss": 0.6035, + "step": 54260 + }, + { + "epoch": 1.39, + "learning_rate": 1.1657795648055577e-06, + "loss": 0.7666, + "step": 54261 + }, + { + "epoch": 1.39, + "learning_rate": 1.1657522771688534e-06, + "loss": 0.7158, + "step": 54262 + }, + { + "epoch": 1.39, + "learning_rate": 1.1657249894052403e-06, + "loss": 0.8389, + "step": 54263 + }, + { + "epoch": 1.39, + "learning_rate": 1.1656977015147393e-06, + "loss": 0.5908, + "step": 54264 + }, + { + "epoch": 1.39, + "learning_rate": 1.165670413497371e-06, + "loss": 0.4788, + "step": 54265 + }, + { + "epoch": 1.39, + "learning_rate": 1.1656431253531564e-06, + "loss": 0.7998, + "step": 54266 + }, + { + "epoch": 1.39, + "learning_rate": 1.1656158370821165e-06, + "loss": 0.5981, + "step": 54267 + }, + { + "epoch": 1.39, + "learning_rate": 1.1655885486842725e-06, + "loss": 0.7031, + "step": 54268 + }, + { + "epoch": 1.39, + "learning_rate": 1.1655612601596445e-06, + "loss": 0.7363, + "step": 54269 + }, + { + "epoch": 1.39, + "learning_rate": 1.165533971508254e-06, + "loss": 0.4259, + "step": 54270 + }, + { + "epoch": 1.39, + "learning_rate": 1.1655066827301219e-06, + "loss": 0.584, + "step": 54271 + }, + { + "epoch": 1.39, + "learning_rate": 1.1654793938252689e-06, + "loss": 0.7031, + "step": 54272 + }, + { + "epoch": 1.39, + "learning_rate": 1.165452104793716e-06, + "loss": 0.7705, + "step": 54273 + }, + { + "epoch": 1.39, + "learning_rate": 1.165424815635484e-06, + "loss": 0.582, + "step": 54274 + }, + { + "epoch": 1.39, + "learning_rate": 1.1653975263505935e-06, + "loss": 0.6855, + "step": 54275 + }, + { + "epoch": 1.39, + "learning_rate": 1.1653702369390662e-06, + "loss": 0.5244, + "step": 54276 + }, + { + "epoch": 1.39, + "learning_rate": 1.165342947400922e-06, + "loss": 0.7334, + "step": 54277 + }, + { + "epoch": 1.39, + "learning_rate": 1.1653156577361826e-06, + "loss": 0.6646, + "step": 54278 + }, + { + "epoch": 1.39, + "learning_rate": 1.1652883679448688e-06, + "loss": 0.5815, + "step": 54279 + }, + { + "epoch": 1.39, + "learning_rate": 1.165261078027001e-06, + "loss": 0.6333, + "step": 54280 + }, + { + "epoch": 1.39, + "learning_rate": 1.1652337879826005e-06, + "loss": 0.6187, + "step": 54281 + }, + { + "epoch": 1.39, + "learning_rate": 1.1652064978116878e-06, + "loss": 0.5874, + "step": 54282 + }, + { + "epoch": 1.39, + "learning_rate": 1.1651792075142847e-06, + "loss": 0.79, + "step": 54283 + }, + { + "epoch": 1.39, + "learning_rate": 1.1651519170904109e-06, + "loss": 0.5264, + "step": 54284 + }, + { + "epoch": 1.39, + "learning_rate": 1.1651246265400882e-06, + "loss": 0.6641, + "step": 54285 + }, + { + "epoch": 1.39, + "learning_rate": 1.1650973358633369e-06, + "loss": 0.6616, + "step": 54286 + }, + { + "epoch": 1.39, + "learning_rate": 1.1650700450601785e-06, + "loss": 0.7021, + "step": 54287 + }, + { + "epoch": 1.39, + "learning_rate": 1.1650427541306336e-06, + "loss": 0.7314, + "step": 54288 + }, + { + "epoch": 1.39, + "learning_rate": 1.1650154630747229e-06, + "loss": 0.4194, + "step": 54289 + }, + { + "epoch": 1.39, + "learning_rate": 1.164988171892467e-06, + "loss": 0.71, + "step": 54290 + }, + { + "epoch": 1.39, + "learning_rate": 1.1649608805838878e-06, + "loss": 0.7578, + "step": 54291 + }, + { + "epoch": 1.39, + "learning_rate": 1.1649335891490052e-06, + "loss": 0.5239, + "step": 54292 + }, + { + "epoch": 1.39, + "learning_rate": 1.1649062975878412e-06, + "loss": 0.4751, + "step": 54293 + }, + { + "epoch": 1.39, + "learning_rate": 1.1648790059004155e-06, + "loss": 0.79, + "step": 54294 + }, + { + "epoch": 1.39, + "learning_rate": 1.1648517140867498e-06, + "loss": 0.8242, + "step": 54295 + }, + { + "epoch": 1.39, + "learning_rate": 1.1648244221468644e-06, + "loss": 0.5959, + "step": 54296 + }, + { + "epoch": 1.39, + "learning_rate": 1.1647971300807807e-06, + "loss": 0.4927, + "step": 54297 + }, + { + "epoch": 1.39, + "learning_rate": 1.1647698378885196e-06, + "loss": 0.5635, + "step": 54298 + }, + { + "epoch": 1.39, + "learning_rate": 1.1647425455701014e-06, + "loss": 0.708, + "step": 54299 + }, + { + "epoch": 1.39, + "learning_rate": 1.1647152531255476e-06, + "loss": 0.5947, + "step": 54300 + }, + { + "epoch": 1.39, + "learning_rate": 1.164687960554879e-06, + "loss": 0.6704, + "step": 54301 + }, + { + "epoch": 1.39, + "learning_rate": 1.1646606678581164e-06, + "loss": 0.7529, + "step": 54302 + }, + { + "epoch": 1.39, + "learning_rate": 1.1646333750352805e-06, + "loss": 0.5659, + "step": 54303 + }, + { + "epoch": 1.39, + "learning_rate": 1.1646060820863928e-06, + "loss": 0.481, + "step": 54304 + }, + { + "epoch": 1.39, + "learning_rate": 1.1645787890114733e-06, + "loss": 0.5164, + "step": 54305 + }, + { + "epoch": 1.39, + "learning_rate": 1.1645514958105436e-06, + "loss": 0.4172, + "step": 54306 + }, + { + "epoch": 1.39, + "learning_rate": 1.1645242024836242e-06, + "loss": 0.6504, + "step": 54307 + }, + { + "epoch": 1.39, + "learning_rate": 1.1644969090307369e-06, + "loss": 0.5659, + "step": 54308 + }, + { + "epoch": 1.39, + "learning_rate": 1.164469615451901e-06, + "loss": 0.6484, + "step": 54309 + }, + { + "epoch": 1.39, + "learning_rate": 1.1644423217471389e-06, + "loss": 0.7041, + "step": 54310 + }, + { + "epoch": 1.39, + "learning_rate": 1.1644150279164704e-06, + "loss": 0.5352, + "step": 54311 + }, + { + "epoch": 1.39, + "learning_rate": 1.1643877339599171e-06, + "loss": 0.5498, + "step": 54312 + }, + { + "epoch": 1.39, + "learning_rate": 1.1643604398774999e-06, + "loss": 0.623, + "step": 54313 + }, + { + "epoch": 1.39, + "learning_rate": 1.1643331456692391e-06, + "loss": 0.6211, + "step": 54314 + }, + { + "epoch": 1.39, + "learning_rate": 1.164305851335156e-06, + "loss": 0.625, + "step": 54315 + }, + { + "epoch": 1.39, + "learning_rate": 1.1642785568752715e-06, + "loss": 0.7339, + "step": 54316 + }, + { + "epoch": 1.39, + "learning_rate": 1.1642512622896063e-06, + "loss": 0.6587, + "step": 54317 + }, + { + "epoch": 1.39, + "learning_rate": 1.164223967578182e-06, + "loss": 0.6709, + "step": 54318 + }, + { + "epoch": 1.39, + "learning_rate": 1.1641966727410185e-06, + "loss": 0.6226, + "step": 54319 + }, + { + "epoch": 1.39, + "learning_rate": 1.1641693777781374e-06, + "loss": 0.7197, + "step": 54320 + }, + { + "epoch": 1.39, + "learning_rate": 1.1641420826895591e-06, + "loss": 0.8027, + "step": 54321 + }, + { + "epoch": 1.39, + "learning_rate": 1.164114787475305e-06, + "loss": 0.75, + "step": 54322 + }, + { + "epoch": 1.39, + "learning_rate": 1.1640874921353958e-06, + "loss": 0.6416, + "step": 54323 + }, + { + "epoch": 1.39, + "learning_rate": 1.164060196669852e-06, + "loss": 0.8311, + "step": 54324 + }, + { + "epoch": 1.39, + "learning_rate": 1.164032901078695e-06, + "loss": 0.7256, + "step": 54325 + }, + { + "epoch": 1.39, + "learning_rate": 1.1640056053619455e-06, + "loss": 0.6934, + "step": 54326 + }, + { + "epoch": 1.39, + "learning_rate": 1.1639783095196246e-06, + "loss": 0.7744, + "step": 54327 + }, + { + "epoch": 1.39, + "learning_rate": 1.1639510135517533e-06, + "loss": 0.5576, + "step": 54328 + }, + { + "epoch": 1.39, + "learning_rate": 1.1639237174583521e-06, + "loss": 0.4854, + "step": 54329 + }, + { + "epoch": 1.39, + "learning_rate": 1.1638964212394418e-06, + "loss": 0.6704, + "step": 54330 + }, + { + "epoch": 1.39, + "learning_rate": 1.1638691248950436e-06, + "loss": 0.5845, + "step": 54331 + }, + { + "epoch": 1.39, + "learning_rate": 1.1638418284251782e-06, + "loss": 0.6182, + "step": 54332 + }, + { + "epoch": 1.39, + "learning_rate": 1.163814531829867e-06, + "loss": 0.4802, + "step": 54333 + }, + { + "epoch": 1.39, + "learning_rate": 1.1637872351091304e-06, + "loss": 0.7266, + "step": 54334 + }, + { + "epoch": 1.39, + "learning_rate": 1.1637599382629895e-06, + "loss": 0.6748, + "step": 54335 + }, + { + "epoch": 1.39, + "learning_rate": 1.163732641291465e-06, + "loss": 0.6816, + "step": 54336 + }, + { + "epoch": 1.39, + "learning_rate": 1.1637053441945782e-06, + "loss": 0.5, + "step": 54337 + }, + { + "epoch": 1.39, + "learning_rate": 1.1636780469723495e-06, + "loss": 0.6357, + "step": 54338 + }, + { + "epoch": 1.39, + "learning_rate": 1.1636507496248002e-06, + "loss": 0.6953, + "step": 54339 + }, + { + "epoch": 1.39, + "learning_rate": 1.1636234521519508e-06, + "loss": 0.6816, + "step": 54340 + }, + { + "epoch": 1.39, + "learning_rate": 1.1635961545538227e-06, + "loss": 0.5708, + "step": 54341 + }, + { + "epoch": 1.39, + "learning_rate": 1.1635688568304363e-06, + "loss": 0.6255, + "step": 54342 + }, + { + "epoch": 1.39, + "learning_rate": 1.163541558981813e-06, + "loss": 0.6416, + "step": 54343 + }, + { + "epoch": 1.39, + "learning_rate": 1.1635142610079732e-06, + "loss": 0.6172, + "step": 54344 + }, + { + "epoch": 1.39, + "learning_rate": 1.1634869629089382e-06, + "loss": 0.7007, + "step": 54345 + }, + { + "epoch": 1.39, + "learning_rate": 1.1634596646847287e-06, + "loss": 0.5889, + "step": 54346 + }, + { + "epoch": 1.39, + "learning_rate": 1.163432366335366e-06, + "loss": 0.5129, + "step": 54347 + }, + { + "epoch": 1.39, + "learning_rate": 1.1634050678608705e-06, + "loss": 0.6592, + "step": 54348 + }, + { + "epoch": 1.39, + "learning_rate": 1.1633777692612627e-06, + "loss": 0.4365, + "step": 54349 + }, + { + "epoch": 1.39, + "learning_rate": 1.1633504705365647e-06, + "loss": 0.5776, + "step": 54350 + }, + { + "epoch": 1.39, + "learning_rate": 1.1633231716867964e-06, + "loss": 0.6357, + "step": 54351 + }, + { + "epoch": 1.39, + "learning_rate": 1.1632958727119793e-06, + "loss": 0.7119, + "step": 54352 + }, + { + "epoch": 1.39, + "learning_rate": 1.163268573612134e-06, + "loss": 0.5693, + "step": 54353 + }, + { + "epoch": 1.39, + "learning_rate": 1.1632412743872812e-06, + "loss": 0.5986, + "step": 54354 + }, + { + "epoch": 1.39, + "learning_rate": 1.1632139750374422e-06, + "loss": 0.7207, + "step": 54355 + }, + { + "epoch": 1.39, + "learning_rate": 1.1631866755626378e-06, + "loss": 0.5784, + "step": 54356 + }, + { + "epoch": 1.39, + "learning_rate": 1.163159375962889e-06, + "loss": 0.5615, + "step": 54357 + }, + { + "epoch": 1.39, + "learning_rate": 1.1631320762382166e-06, + "loss": 0.7246, + "step": 54358 + }, + { + "epoch": 1.39, + "learning_rate": 1.1631047763886413e-06, + "loss": 0.4436, + "step": 54359 + }, + { + "epoch": 1.39, + "learning_rate": 1.1630774764141842e-06, + "loss": 0.7334, + "step": 54360 + }, + { + "epoch": 1.39, + "learning_rate": 1.163050176314866e-06, + "loss": 0.6777, + "step": 54361 + }, + { + "epoch": 1.39, + "learning_rate": 1.163022876090708e-06, + "loss": 0.7256, + "step": 54362 + }, + { + "epoch": 1.39, + "learning_rate": 1.162995575741731e-06, + "loss": 0.5957, + "step": 54363 + }, + { + "epoch": 1.39, + "learning_rate": 1.1629682752679554e-06, + "loss": 0.72, + "step": 54364 + }, + { + "epoch": 1.39, + "learning_rate": 1.1629409746694028e-06, + "loss": 0.7451, + "step": 54365 + }, + { + "epoch": 1.39, + "learning_rate": 1.1629136739460937e-06, + "loss": 0.6592, + "step": 54366 + }, + { + "epoch": 1.39, + "learning_rate": 1.1628863730980489e-06, + "loss": 0.5796, + "step": 54367 + }, + { + "epoch": 1.39, + "learning_rate": 1.1628590721252898e-06, + "loss": 0.731, + "step": 54368 + }, + { + "epoch": 1.39, + "learning_rate": 1.1628317710278367e-06, + "loss": 0.6973, + "step": 54369 + }, + { + "epoch": 1.39, + "learning_rate": 1.162804469805711e-06, + "loss": 0.8115, + "step": 54370 + }, + { + "epoch": 1.39, + "learning_rate": 1.1627771684589333e-06, + "loss": 0.5835, + "step": 54371 + }, + { + "epoch": 1.39, + "learning_rate": 1.1627498669875247e-06, + "loss": 0.6587, + "step": 54372 + }, + { + "epoch": 1.39, + "learning_rate": 1.1627225653915062e-06, + "loss": 0.6641, + "step": 54373 + }, + { + "epoch": 1.39, + "learning_rate": 1.1626952636708981e-06, + "loss": 0.4263, + "step": 54374 + }, + { + "epoch": 1.39, + "learning_rate": 1.162667961825722e-06, + "loss": 0.7207, + "step": 54375 + }, + { + "epoch": 1.39, + "learning_rate": 1.1626406598559983e-06, + "loss": 0.7524, + "step": 54376 + }, + { + "epoch": 1.39, + "learning_rate": 1.1626133577617485e-06, + "loss": 0.6104, + "step": 54377 + }, + { + "epoch": 1.39, + "learning_rate": 1.162586055542993e-06, + "loss": 0.6992, + "step": 54378 + }, + { + "epoch": 1.39, + "learning_rate": 1.1625587531997527e-06, + "loss": 0.6777, + "step": 54379 + }, + { + "epoch": 1.39, + "learning_rate": 1.1625314507320485e-06, + "loss": 0.7295, + "step": 54380 + }, + { + "epoch": 1.39, + "learning_rate": 1.1625041481399016e-06, + "loss": 0.7549, + "step": 54381 + }, + { + "epoch": 1.39, + "learning_rate": 1.1624768454233327e-06, + "loss": 0.5996, + "step": 54382 + }, + { + "epoch": 1.39, + "learning_rate": 1.1624495425823631e-06, + "loss": 0.6289, + "step": 54383 + }, + { + "epoch": 1.39, + "learning_rate": 1.1624222396170129e-06, + "loss": 0.6772, + "step": 54384 + }, + { + "epoch": 1.39, + "learning_rate": 1.1623949365273036e-06, + "loss": 0.5981, + "step": 54385 + }, + { + "epoch": 1.39, + "learning_rate": 1.162367633313256e-06, + "loss": 0.6646, + "step": 54386 + }, + { + "epoch": 1.39, + "learning_rate": 1.1623403299748908e-06, + "loss": 0.5308, + "step": 54387 + }, + { + "epoch": 1.39, + "learning_rate": 1.1623130265122293e-06, + "loss": 0.5757, + "step": 54388 + }, + { + "epoch": 1.39, + "learning_rate": 1.162285722925292e-06, + "loss": 0.5415, + "step": 54389 + }, + { + "epoch": 1.39, + "learning_rate": 1.1622584192141002e-06, + "loss": 0.5547, + "step": 54390 + }, + { + "epoch": 1.39, + "learning_rate": 1.1622311153786745e-06, + "loss": 0.7422, + "step": 54391 + }, + { + "epoch": 1.39, + "learning_rate": 1.1622038114190357e-06, + "loss": 0.4966, + "step": 54392 + }, + { + "epoch": 1.39, + "learning_rate": 1.1621765073352053e-06, + "loss": 0.4707, + "step": 54393 + }, + { + "epoch": 1.39, + "learning_rate": 1.1621492031272035e-06, + "loss": 0.7139, + "step": 54394 + }, + { + "epoch": 1.39, + "learning_rate": 1.1621218987950515e-06, + "loss": 0.583, + "step": 54395 + }, + { + "epoch": 1.39, + "learning_rate": 1.1620945943387703e-06, + "loss": 0.4612, + "step": 54396 + }, + { + "epoch": 1.39, + "learning_rate": 1.1620672897583805e-06, + "loss": 0.6309, + "step": 54397 + }, + { + "epoch": 1.39, + "learning_rate": 1.1620399850539038e-06, + "loss": 0.6831, + "step": 54398 + }, + { + "epoch": 1.39, + "learning_rate": 1.16201268022536e-06, + "loss": 0.6251, + "step": 54399 + }, + { + "epoch": 1.39, + "learning_rate": 1.161985375272771e-06, + "loss": 0.4927, + "step": 54400 + }, + { + "epoch": 1.39, + "learning_rate": 1.1619580701961567e-06, + "loss": 0.7178, + "step": 54401 + }, + { + "epoch": 1.39, + "learning_rate": 1.161930764995539e-06, + "loss": 0.8809, + "step": 54402 + }, + { + "epoch": 1.39, + "learning_rate": 1.1619034596709382e-06, + "loss": 0.6523, + "step": 54403 + }, + { + "epoch": 1.39, + "learning_rate": 1.1618761542223753e-06, + "loss": 0.5854, + "step": 54404 + }, + { + "epoch": 1.39, + "learning_rate": 1.1618488486498712e-06, + "loss": 0.6367, + "step": 54405 + }, + { + "epoch": 1.39, + "learning_rate": 1.1618215429534472e-06, + "loss": 0.583, + "step": 54406 + }, + { + "epoch": 1.39, + "learning_rate": 1.1617942371331235e-06, + "loss": 0.5659, + "step": 54407 + }, + { + "epoch": 1.39, + "learning_rate": 1.1617669311889216e-06, + "loss": 0.7109, + "step": 54408 + }, + { + "epoch": 1.39, + "learning_rate": 1.1617396251208622e-06, + "loss": 0.5024, + "step": 54409 + }, + { + "epoch": 1.39, + "learning_rate": 1.1617123189289663e-06, + "loss": 0.625, + "step": 54410 + }, + { + "epoch": 1.39, + "learning_rate": 1.1616850126132545e-06, + "loss": 0.7344, + "step": 54411 + }, + { + "epoch": 1.39, + "learning_rate": 1.161657706173748e-06, + "loss": 0.5684, + "step": 54412 + }, + { + "epoch": 1.39, + "learning_rate": 1.1616303996104677e-06, + "loss": 0.5674, + "step": 54413 + }, + { + "epoch": 1.39, + "learning_rate": 1.1616030929234345e-06, + "loss": 0.6812, + "step": 54414 + }, + { + "epoch": 1.39, + "learning_rate": 1.161575786112669e-06, + "loss": 0.9375, + "step": 54415 + }, + { + "epoch": 1.39, + "learning_rate": 1.1615484791781924e-06, + "loss": 0.6416, + "step": 54416 + }, + { + "epoch": 1.39, + "learning_rate": 1.1615211721200258e-06, + "loss": 0.5459, + "step": 54417 + }, + { + "epoch": 1.39, + "learning_rate": 1.1614938649381896e-06, + "loss": 0.6885, + "step": 54418 + }, + { + "epoch": 1.39, + "learning_rate": 1.1614665576327052e-06, + "loss": 0.5649, + "step": 54419 + }, + { + "epoch": 1.39, + "learning_rate": 1.161439250203593e-06, + "loss": 0.8291, + "step": 54420 + }, + { + "epoch": 1.39, + "learning_rate": 1.1614119426508744e-06, + "loss": 0.7666, + "step": 54421 + }, + { + "epoch": 1.39, + "learning_rate": 1.16138463497457e-06, + "loss": 0.7617, + "step": 54422 + }, + { + "epoch": 1.39, + "learning_rate": 1.161357327174701e-06, + "loss": 0.6021, + "step": 54423 + }, + { + "epoch": 1.39, + "learning_rate": 1.1613300192512877e-06, + "loss": 0.6055, + "step": 54424 + }, + { + "epoch": 1.39, + "learning_rate": 1.1613027112043518e-06, + "loss": 0.6558, + "step": 54425 + }, + { + "epoch": 1.39, + "learning_rate": 1.1612754030339135e-06, + "loss": 0.751, + "step": 54426 + }, + { + "epoch": 1.39, + "learning_rate": 1.1612480947399944e-06, + "loss": 0.7246, + "step": 54427 + }, + { + "epoch": 1.4, + "learning_rate": 1.1612207863226152e-06, + "loss": 0.5942, + "step": 54428 + }, + { + "epoch": 1.4, + "learning_rate": 1.1611934777817963e-06, + "loss": 0.5, + "step": 54429 + }, + { + "epoch": 1.4, + "learning_rate": 1.1611661691175586e-06, + "loss": 0.655, + "step": 54430 + }, + { + "epoch": 1.4, + "learning_rate": 1.1611388603299241e-06, + "loss": 0.5366, + "step": 54431 + }, + { + "epoch": 1.4, + "learning_rate": 1.1611115514189125e-06, + "loss": 0.6719, + "step": 54432 + }, + { + "epoch": 1.4, + "learning_rate": 1.1610842423845455e-06, + "loss": 0.7451, + "step": 54433 + }, + { + "epoch": 1.4, + "learning_rate": 1.1610569332268436e-06, + "loss": 0.6704, + "step": 54434 + }, + { + "epoch": 1.4, + "learning_rate": 1.1610296239458277e-06, + "loss": 0.6533, + "step": 54435 + }, + { + "epoch": 1.4, + "learning_rate": 1.1610023145415189e-06, + "loss": 0.6582, + "step": 54436 + }, + { + "epoch": 1.4, + "learning_rate": 1.1609750050139382e-06, + "loss": 0.4041, + "step": 54437 + }, + { + "epoch": 1.4, + "learning_rate": 1.1609476953631062e-06, + "loss": 0.7642, + "step": 54438 + }, + { + "epoch": 1.4, + "learning_rate": 1.1609203855890438e-06, + "loss": 0.7637, + "step": 54439 + }, + { + "epoch": 1.4, + "learning_rate": 1.1608930756917722e-06, + "loss": 0.6179, + "step": 54440 + }, + { + "epoch": 1.4, + "learning_rate": 1.1608657656713121e-06, + "loss": 0.6738, + "step": 54441 + }, + { + "epoch": 1.4, + "learning_rate": 1.1608384555276844e-06, + "loss": 0.6318, + "step": 54442 + }, + { + "epoch": 1.4, + "learning_rate": 1.1608111452609103e-06, + "loss": 0.7412, + "step": 54443 + }, + { + "epoch": 1.4, + "learning_rate": 1.1607838348710105e-06, + "loss": 0.6201, + "step": 54444 + }, + { + "epoch": 1.4, + "learning_rate": 1.1607565243580057e-06, + "loss": 0.6367, + "step": 54445 + }, + { + "epoch": 1.4, + "learning_rate": 1.1607292137219174e-06, + "loss": 0.5874, + "step": 54446 + }, + { + "epoch": 1.4, + "learning_rate": 1.1607019029627659e-06, + "loss": 0.564, + "step": 54447 + }, + { + "epoch": 1.4, + "learning_rate": 1.1606745920805724e-06, + "loss": 0.6953, + "step": 54448 + }, + { + "epoch": 1.4, + "learning_rate": 1.1606472810753576e-06, + "loss": 0.625, + "step": 54449 + }, + { + "epoch": 1.4, + "learning_rate": 1.1606199699471426e-06, + "loss": 0.7842, + "step": 54450 + }, + { + "epoch": 1.4, + "learning_rate": 1.1605926586959483e-06, + "loss": 0.7822, + "step": 54451 + }, + { + "epoch": 1.4, + "learning_rate": 1.1605653473217956e-06, + "loss": 0.6406, + "step": 54452 + }, + { + "epoch": 1.4, + "learning_rate": 1.1605380358247055e-06, + "loss": 0.6465, + "step": 54453 + }, + { + "epoch": 1.4, + "learning_rate": 1.1605107242046987e-06, + "loss": 0.5845, + "step": 54454 + }, + { + "epoch": 1.4, + "learning_rate": 1.1604834124617961e-06, + "loss": 0.6504, + "step": 54455 + }, + { + "epoch": 1.4, + "learning_rate": 1.160456100596019e-06, + "loss": 0.5469, + "step": 54456 + }, + { + "epoch": 1.4, + "learning_rate": 1.1604287886073878e-06, + "loss": 0.6621, + "step": 54457 + }, + { + "epoch": 1.4, + "learning_rate": 1.1604014764959238e-06, + "loss": 0.4147, + "step": 54458 + }, + { + "epoch": 1.4, + "learning_rate": 1.1603741642616479e-06, + "loss": 0.5884, + "step": 54459 + }, + { + "epoch": 1.4, + "learning_rate": 1.1603468519045805e-06, + "loss": 0.7559, + "step": 54460 + }, + { + "epoch": 1.4, + "learning_rate": 1.1603195394247432e-06, + "loss": 0.5667, + "step": 54461 + }, + { + "epoch": 1.4, + "learning_rate": 1.1602922268221561e-06, + "loss": 0.5925, + "step": 54462 + }, + { + "epoch": 1.4, + "learning_rate": 1.1602649140968414e-06, + "loss": 0.793, + "step": 54463 + }, + { + "epoch": 1.4, + "learning_rate": 1.160237601248819e-06, + "loss": 0.5239, + "step": 54464 + }, + { + "epoch": 1.4, + "learning_rate": 1.1602102882781097e-06, + "loss": 0.7363, + "step": 54465 + }, + { + "epoch": 1.4, + "learning_rate": 1.1601829751847348e-06, + "loss": 0.666, + "step": 54466 + }, + { + "epoch": 1.4, + "learning_rate": 1.1601556619687155e-06, + "loss": 0.5366, + "step": 54467 + }, + { + "epoch": 1.4, + "learning_rate": 1.160128348630072e-06, + "loss": 0.7007, + "step": 54468 + }, + { + "epoch": 1.4, + "learning_rate": 1.160101035168826e-06, + "loss": 0.5095, + "step": 54469 + }, + { + "epoch": 1.4, + "learning_rate": 1.1600737215849974e-06, + "loss": 0.6533, + "step": 54470 + }, + { + "epoch": 1.4, + "learning_rate": 1.160046407878608e-06, + "loss": 0.7471, + "step": 54471 + }, + { + "epoch": 1.4, + "learning_rate": 1.1600190940496784e-06, + "loss": 0.4827, + "step": 54472 + }, + { + "epoch": 1.4, + "learning_rate": 1.15999178009823e-06, + "loss": 0.6709, + "step": 54473 + }, + { + "epoch": 1.4, + "learning_rate": 1.1599644660242827e-06, + "loss": 0.6914, + "step": 54474 + }, + { + "epoch": 1.4, + "learning_rate": 1.1599371518278583e-06, + "loss": 0.7227, + "step": 54475 + }, + { + "epoch": 1.4, + "learning_rate": 1.159909837508977e-06, + "loss": 0.5742, + "step": 54476 + }, + { + "epoch": 1.4, + "learning_rate": 1.1598825230676603e-06, + "loss": 0.6851, + "step": 54477 + }, + { + "epoch": 1.4, + "learning_rate": 1.159855208503929e-06, + "loss": 0.5938, + "step": 54478 + }, + { + "epoch": 1.4, + "learning_rate": 1.1598278938178037e-06, + "loss": 0.547, + "step": 54479 + }, + { + "epoch": 1.4, + "learning_rate": 1.1598005790093055e-06, + "loss": 0.7256, + "step": 54480 + }, + { + "epoch": 1.4, + "learning_rate": 1.1597732640784555e-06, + "loss": 0.5303, + "step": 54481 + }, + { + "epoch": 1.4, + "learning_rate": 1.1597459490252746e-06, + "loss": 0.6855, + "step": 54482 + }, + { + "epoch": 1.4, + "learning_rate": 1.1597186338497833e-06, + "loss": 0.7754, + "step": 54483 + }, + { + "epoch": 1.4, + "learning_rate": 1.159691318552003e-06, + "loss": 0.5132, + "step": 54484 + }, + { + "epoch": 1.4, + "learning_rate": 1.1596640031319542e-06, + "loss": 0.6338, + "step": 54485 + }, + { + "epoch": 1.4, + "learning_rate": 1.1596366875896583e-06, + "loss": 0.6025, + "step": 54486 + }, + { + "epoch": 1.4, + "learning_rate": 1.1596093719251354e-06, + "loss": 0.8008, + "step": 54487 + }, + { + "epoch": 1.4, + "learning_rate": 1.1595820561384075e-06, + "loss": 0.748, + "step": 54488 + }, + { + "epoch": 1.4, + "learning_rate": 1.1595547402294947e-06, + "loss": 0.7051, + "step": 54489 + }, + { + "epoch": 1.4, + "learning_rate": 1.1595274241984183e-06, + "loss": 0.7793, + "step": 54490 + }, + { + "epoch": 1.4, + "learning_rate": 1.159500108045199e-06, + "loss": 0.5654, + "step": 54491 + }, + { + "epoch": 1.4, + "learning_rate": 1.1594727917698576e-06, + "loss": 0.668, + "step": 54492 + }, + { + "epoch": 1.4, + "learning_rate": 1.1594454753724156e-06, + "loss": 0.6543, + "step": 54493 + }, + { + "epoch": 1.4, + "learning_rate": 1.1594181588528934e-06, + "loss": 0.6641, + "step": 54494 + }, + { + "epoch": 1.4, + "learning_rate": 1.159390842211312e-06, + "loss": 0.5938, + "step": 54495 + }, + { + "epoch": 1.4, + "learning_rate": 1.1593635254476923e-06, + "loss": 0.5151, + "step": 54496 + }, + { + "epoch": 1.4, + "learning_rate": 1.1593362085620552e-06, + "loss": 0.7412, + "step": 54497 + }, + { + "epoch": 1.4, + "learning_rate": 1.159308891554422e-06, + "loss": 0.699, + "step": 54498 + }, + { + "epoch": 1.4, + "learning_rate": 1.1592815744248132e-06, + "loss": 0.6362, + "step": 54499 + }, + { + "epoch": 1.4, + "learning_rate": 1.1592542571732498e-06, + "loss": 0.7002, + "step": 54500 + }, + { + "epoch": 1.4, + "learning_rate": 1.1592269397997525e-06, + "loss": 0.6699, + "step": 54501 + }, + { + "epoch": 1.4, + "learning_rate": 1.1591996223043427e-06, + "loss": 0.6602, + "step": 54502 + }, + { + "epoch": 1.4, + "learning_rate": 1.159172304687041e-06, + "loss": 0.7725, + "step": 54503 + }, + { + "epoch": 1.4, + "learning_rate": 1.1591449869478684e-06, + "loss": 0.5747, + "step": 54504 + }, + { + "epoch": 1.4, + "learning_rate": 1.1591176690868457e-06, + "loss": 0.5411, + "step": 54505 + }, + { + "epoch": 1.4, + "learning_rate": 1.159090351103994e-06, + "loss": 0.5371, + "step": 54506 + }, + { + "epoch": 1.4, + "learning_rate": 1.1590630329993343e-06, + "loss": 0.7031, + "step": 54507 + }, + { + "epoch": 1.4, + "learning_rate": 1.1590357147728873e-06, + "loss": 0.8174, + "step": 54508 + }, + { + "epoch": 1.4, + "learning_rate": 1.159008396424674e-06, + "loss": 0.6157, + "step": 54509 + }, + { + "epoch": 1.4, + "learning_rate": 1.1589810779547149e-06, + "loss": 0.7134, + "step": 54510 + }, + { + "epoch": 1.4, + "learning_rate": 1.1589537593630317e-06, + "loss": 0.6504, + "step": 54511 + }, + { + "epoch": 1.4, + "learning_rate": 1.1589264406496446e-06, + "loss": 0.5708, + "step": 54512 + }, + { + "epoch": 1.4, + "learning_rate": 1.1588991218145752e-06, + "loss": 0.5818, + "step": 54513 + }, + { + "epoch": 1.4, + "learning_rate": 1.1588718028578437e-06, + "loss": 0.7017, + "step": 54514 + }, + { + "epoch": 1.4, + "learning_rate": 1.1588444837794716e-06, + "loss": 0.7218, + "step": 54515 + }, + { + "epoch": 1.4, + "learning_rate": 1.1588171645794794e-06, + "loss": 0.7314, + "step": 54516 + }, + { + "epoch": 1.4, + "learning_rate": 1.1587898452578886e-06, + "loss": 0.5693, + "step": 54517 + }, + { + "epoch": 1.4, + "learning_rate": 1.1587625258147192e-06, + "loss": 0.54, + "step": 54518 + }, + { + "epoch": 1.4, + "learning_rate": 1.158735206249993e-06, + "loss": 0.5806, + "step": 54519 + }, + { + "epoch": 1.4, + "learning_rate": 1.1587078865637301e-06, + "loss": 0.5645, + "step": 54520 + }, + { + "epoch": 1.4, + "learning_rate": 1.1586805667559522e-06, + "loss": 0.7188, + "step": 54521 + }, + { + "epoch": 1.4, + "learning_rate": 1.15865324682668e-06, + "loss": 0.6738, + "step": 54522 + }, + { + "epoch": 1.4, + "learning_rate": 1.1586259267759339e-06, + "loss": 0.6904, + "step": 54523 + }, + { + "epoch": 1.4, + "learning_rate": 1.1585986066037357e-06, + "loss": 0.5469, + "step": 54524 + }, + { + "epoch": 1.4, + "learning_rate": 1.1585712863101054e-06, + "loss": 1.1729, + "step": 54525 + }, + { + "epoch": 1.4, + "learning_rate": 1.1585439658950647e-06, + "loss": 0.5781, + "step": 54526 + }, + { + "epoch": 1.4, + "learning_rate": 1.158516645358634e-06, + "loss": 0.6392, + "step": 54527 + }, + { + "epoch": 1.4, + "learning_rate": 1.1584893247008347e-06, + "loss": 0.54, + "step": 54528 + }, + { + "epoch": 1.4, + "learning_rate": 1.158462003921687e-06, + "loss": 0.7461, + "step": 54529 + }, + { + "epoch": 1.4, + "learning_rate": 1.1584346830212124e-06, + "loss": 0.7354, + "step": 54530 + }, + { + "epoch": 1.4, + "learning_rate": 1.1584073619994314e-06, + "loss": 0.5825, + "step": 54531 + }, + { + "epoch": 1.4, + "learning_rate": 1.1583800408563658e-06, + "loss": 0.5679, + "step": 54532 + }, + { + "epoch": 1.4, + "learning_rate": 1.1583527195920353e-06, + "loss": 0.7012, + "step": 54533 + }, + { + "epoch": 1.4, + "learning_rate": 1.1583253982064615e-06, + "loss": 0.7305, + "step": 54534 + }, + { + "epoch": 1.4, + "learning_rate": 1.1582980766996653e-06, + "loss": 0.791, + "step": 54535 + }, + { + "epoch": 1.4, + "learning_rate": 1.1582707550716678e-06, + "loss": 0.5657, + "step": 54536 + }, + { + "epoch": 1.4, + "learning_rate": 1.1582434333224893e-06, + "loss": 0.5525, + "step": 54537 + }, + { + "epoch": 1.4, + "learning_rate": 1.1582161114521514e-06, + "loss": 0.79, + "step": 54538 + }, + { + "epoch": 1.4, + "learning_rate": 1.1581887894606744e-06, + "loss": 0.668, + "step": 54539 + }, + { + "epoch": 1.4, + "learning_rate": 1.1581614673480796e-06, + "loss": 0.6338, + "step": 54540 + }, + { + "epoch": 1.4, + "learning_rate": 1.1581341451143876e-06, + "loss": 0.6323, + "step": 54541 + }, + { + "epoch": 1.4, + "learning_rate": 1.15810682275962e-06, + "loss": 0.6565, + "step": 54542 + }, + { + "epoch": 1.4, + "learning_rate": 1.158079500283797e-06, + "loss": 0.5239, + "step": 54543 + }, + { + "epoch": 1.4, + "learning_rate": 1.1580521776869402e-06, + "loss": 0.5439, + "step": 54544 + }, + { + "epoch": 1.4, + "learning_rate": 1.1580248549690693e-06, + "loss": 0.6436, + "step": 54545 + }, + { + "epoch": 1.4, + "learning_rate": 1.1579975321302067e-06, + "loss": 0.5444, + "step": 54546 + }, + { + "epoch": 1.4, + "learning_rate": 1.1579702091703726e-06, + "loss": 0.6077, + "step": 54547 + }, + { + "epoch": 1.4, + "learning_rate": 1.1579428860895876e-06, + "loss": 0.7236, + "step": 54548 + }, + { + "epoch": 1.4, + "learning_rate": 1.1579155628878734e-06, + "loss": 0.7227, + "step": 54549 + }, + { + "epoch": 1.4, + "learning_rate": 1.1578882395652503e-06, + "loss": 0.7017, + "step": 54550 + }, + { + "epoch": 1.4, + "learning_rate": 1.1578609161217394e-06, + "loss": 0.5986, + "step": 54551 + }, + { + "epoch": 1.4, + "learning_rate": 1.157833592557362e-06, + "loss": 0.7031, + "step": 54552 + }, + { + "epoch": 1.4, + "learning_rate": 1.1578062688721384e-06, + "loss": 0.7256, + "step": 54553 + }, + { + "epoch": 1.4, + "learning_rate": 1.1577789450660897e-06, + "loss": 0.6353, + "step": 54554 + }, + { + "epoch": 1.4, + "learning_rate": 1.157751621139237e-06, + "loss": 0.6338, + "step": 54555 + }, + { + "epoch": 1.4, + "learning_rate": 1.157724297091601e-06, + "loss": 0.5566, + "step": 54556 + }, + { + "epoch": 1.4, + "learning_rate": 1.1576969729232034e-06, + "loss": 0.6646, + "step": 54557 + }, + { + "epoch": 1.4, + "learning_rate": 1.1576696486340638e-06, + "loss": 0.7197, + "step": 54558 + }, + { + "epoch": 1.4, + "learning_rate": 1.157642324224204e-06, + "loss": 0.5008, + "step": 54559 + }, + { + "epoch": 1.4, + "learning_rate": 1.1576149996936446e-06, + "loss": 0.7607, + "step": 54560 + }, + { + "epoch": 1.4, + "learning_rate": 1.157587675042407e-06, + "loss": 0.6562, + "step": 54561 + }, + { + "epoch": 1.4, + "learning_rate": 1.1575603502705115e-06, + "loss": 0.5532, + "step": 54562 + }, + { + "epoch": 1.4, + "learning_rate": 1.1575330253779793e-06, + "loss": 0.5884, + "step": 54563 + }, + { + "epoch": 1.4, + "learning_rate": 1.1575057003648313e-06, + "loss": 0.9023, + "step": 54564 + }, + { + "epoch": 1.4, + "learning_rate": 1.1574783752310885e-06, + "loss": 0.625, + "step": 54565 + }, + { + "epoch": 1.4, + "learning_rate": 1.1574510499767716e-06, + "loss": 0.8223, + "step": 54566 + }, + { + "epoch": 1.4, + "learning_rate": 1.1574237246019018e-06, + "loss": 0.6006, + "step": 54567 + }, + { + "epoch": 1.4, + "learning_rate": 1.1573963991065e-06, + "loss": 0.6611, + "step": 54568 + }, + { + "epoch": 1.4, + "learning_rate": 1.1573690734905867e-06, + "loss": 0.7988, + "step": 54569 + }, + { + "epoch": 1.4, + "learning_rate": 1.1573417477541834e-06, + "loss": 0.6069, + "step": 54570 + }, + { + "epoch": 1.4, + "learning_rate": 1.1573144218973105e-06, + "loss": 0.5728, + "step": 54571 + }, + { + "epoch": 1.4, + "learning_rate": 1.1572870959199896e-06, + "loss": 0.6357, + "step": 54572 + }, + { + "epoch": 1.4, + "learning_rate": 1.157259769822241e-06, + "loss": 0.7344, + "step": 54573 + }, + { + "epoch": 1.4, + "learning_rate": 1.1572324436040859e-06, + "loss": 0.6367, + "step": 54574 + }, + { + "epoch": 1.4, + "learning_rate": 1.1572051172655448e-06, + "loss": 0.4639, + "step": 54575 + }, + { + "epoch": 1.4, + "learning_rate": 1.1571777908066394e-06, + "loss": 0.438, + "step": 54576 + }, + { + "epoch": 1.4, + "learning_rate": 1.15715046422739e-06, + "loss": 0.7754, + "step": 54577 + }, + { + "epoch": 1.4, + "learning_rate": 1.1571231375278176e-06, + "loss": 0.834, + "step": 54578 + }, + { + "epoch": 1.4, + "learning_rate": 1.1570958107079433e-06, + "loss": 0.5767, + "step": 54579 + }, + { + "epoch": 1.4, + "learning_rate": 1.1570684837677882e-06, + "loss": 0.7617, + "step": 54580 + }, + { + "epoch": 1.4, + "learning_rate": 1.1570411567073726e-06, + "loss": 0.5691, + "step": 54581 + }, + { + "epoch": 1.4, + "learning_rate": 1.1570138295267183e-06, + "loss": 0.5762, + "step": 54582 + }, + { + "epoch": 1.4, + "learning_rate": 1.156986502225845e-06, + "loss": 0.645, + "step": 54583 + }, + { + "epoch": 1.4, + "learning_rate": 1.1569591748047751e-06, + "loss": 0.7432, + "step": 54584 + }, + { + "epoch": 1.4, + "learning_rate": 1.1569318472635284e-06, + "loss": 0.7197, + "step": 54585 + }, + { + "epoch": 1.4, + "learning_rate": 1.1569045196021264e-06, + "loss": 0.8115, + "step": 54586 + }, + { + "epoch": 1.4, + "learning_rate": 1.1568771918205897e-06, + "loss": 0.5576, + "step": 54587 + }, + { + "epoch": 1.4, + "learning_rate": 1.1568498639189393e-06, + "loss": 0.7197, + "step": 54588 + }, + { + "epoch": 1.4, + "learning_rate": 1.1568225358971961e-06, + "loss": 0.7227, + "step": 54589 + }, + { + "epoch": 1.4, + "learning_rate": 1.1567952077553814e-06, + "loss": 0.6621, + "step": 54590 + }, + { + "epoch": 1.4, + "learning_rate": 1.1567678794935154e-06, + "loss": 0.5806, + "step": 54591 + }, + { + "epoch": 1.4, + "learning_rate": 1.1567405511116198e-06, + "loss": 0.6914, + "step": 54592 + }, + { + "epoch": 1.4, + "learning_rate": 1.1567132226097148e-06, + "loss": 0.5903, + "step": 54593 + }, + { + "epoch": 1.4, + "learning_rate": 1.156685893987822e-06, + "loss": 0.6992, + "step": 54594 + }, + { + "epoch": 1.4, + "learning_rate": 1.1566585652459619e-06, + "loss": 0.6875, + "step": 54595 + }, + { + "epoch": 1.4, + "learning_rate": 1.1566312363841556e-06, + "loss": 0.7158, + "step": 54596 + }, + { + "epoch": 1.4, + "learning_rate": 1.156603907402424e-06, + "loss": 0.6768, + "step": 54597 + }, + { + "epoch": 1.4, + "learning_rate": 1.156576578300788e-06, + "loss": 0.7393, + "step": 54598 + }, + { + "epoch": 1.4, + "learning_rate": 1.1565492490792686e-06, + "loss": 0.7979, + "step": 54599 + }, + { + "epoch": 1.4, + "learning_rate": 1.1565219197378862e-06, + "loss": 0.5815, + "step": 54600 + }, + { + "epoch": 1.4, + "learning_rate": 1.1564945902766625e-06, + "loss": 0.6851, + "step": 54601 + }, + { + "epoch": 1.4, + "learning_rate": 1.156467260695618e-06, + "loss": 0.5771, + "step": 54602 + }, + { + "epoch": 1.4, + "learning_rate": 1.156439930994774e-06, + "loss": 0.6592, + "step": 54603 + }, + { + "epoch": 1.4, + "learning_rate": 1.1564126011741505e-06, + "loss": 0.7773, + "step": 54604 + }, + { + "epoch": 1.4, + "learning_rate": 1.1563852712337698e-06, + "loss": 0.5796, + "step": 54605 + }, + { + "epoch": 1.4, + "learning_rate": 1.1563579411736516e-06, + "loss": 0.4402, + "step": 54606 + }, + { + "epoch": 1.4, + "learning_rate": 1.1563306109938177e-06, + "loss": 0.5747, + "step": 54607 + }, + { + "epoch": 1.4, + "learning_rate": 1.1563032806942882e-06, + "loss": 0.6543, + "step": 54608 + }, + { + "epoch": 1.4, + "learning_rate": 1.1562759502750848e-06, + "loss": 0.499, + "step": 54609 + }, + { + "epoch": 1.4, + "learning_rate": 1.1562486197362278e-06, + "loss": 0.6982, + "step": 54610 + }, + { + "epoch": 1.4, + "learning_rate": 1.1562212890777384e-06, + "loss": 0.6021, + "step": 54611 + }, + { + "epoch": 1.4, + "learning_rate": 1.156193958299638e-06, + "loss": 0.6733, + "step": 54612 + }, + { + "epoch": 1.4, + "learning_rate": 1.1561666274019466e-06, + "loss": 0.6528, + "step": 54613 + }, + { + "epoch": 1.4, + "learning_rate": 1.1561392963846858e-06, + "loss": 0.5588, + "step": 54614 + }, + { + "epoch": 1.4, + "learning_rate": 1.156111965247876e-06, + "loss": 0.5718, + "step": 54615 + }, + { + "epoch": 1.4, + "learning_rate": 1.1560846339915392e-06, + "loss": 0.5012, + "step": 54616 + }, + { + "epoch": 1.4, + "learning_rate": 1.156057302615695e-06, + "loss": 0.7051, + "step": 54617 + }, + { + "epoch": 1.4, + "learning_rate": 1.156029971120365e-06, + "loss": 0.6265, + "step": 54618 + }, + { + "epoch": 1.4, + "learning_rate": 1.15600263950557e-06, + "loss": 0.6143, + "step": 54619 + }, + { + "epoch": 1.4, + "learning_rate": 1.155975307771331e-06, + "loss": 0.9043, + "step": 54620 + }, + { + "epoch": 1.4, + "learning_rate": 1.1559479759176686e-06, + "loss": 0.877, + "step": 54621 + }, + { + "epoch": 1.4, + "learning_rate": 1.1559206439446048e-06, + "loss": 0.75, + "step": 54622 + }, + { + "epoch": 1.4, + "learning_rate": 1.155893311852159e-06, + "loss": 0.7178, + "step": 54623 + }, + { + "epoch": 1.4, + "learning_rate": 1.155865979640353e-06, + "loss": 0.7236, + "step": 54624 + }, + { + "epoch": 1.4, + "learning_rate": 1.1558386473092076e-06, + "loss": 0.6377, + "step": 54625 + }, + { + "epoch": 1.4, + "learning_rate": 1.1558113148587438e-06, + "loss": 0.4927, + "step": 54626 + }, + { + "epoch": 1.4, + "learning_rate": 1.1557839822889826e-06, + "loss": 0.6748, + "step": 54627 + }, + { + "epoch": 1.4, + "learning_rate": 1.1557566495999445e-06, + "loss": 0.7021, + "step": 54628 + }, + { + "epoch": 1.4, + "learning_rate": 1.1557293167916506e-06, + "loss": 0.7422, + "step": 54629 + }, + { + "epoch": 1.4, + "learning_rate": 1.1557019838641222e-06, + "loss": 0.7227, + "step": 54630 + }, + { + "epoch": 1.4, + "learning_rate": 1.1556746508173798e-06, + "loss": 0.5632, + "step": 54631 + }, + { + "epoch": 1.4, + "learning_rate": 1.1556473176514446e-06, + "loss": 0.521, + "step": 54632 + }, + { + "epoch": 1.4, + "learning_rate": 1.1556199843663372e-06, + "loss": 0.7148, + "step": 54633 + }, + { + "epoch": 1.4, + "learning_rate": 1.155592650962079e-06, + "loss": 0.6914, + "step": 54634 + }, + { + "epoch": 1.4, + "learning_rate": 1.1555653174386903e-06, + "loss": 0.7637, + "step": 54635 + }, + { + "epoch": 1.4, + "learning_rate": 1.1555379837961928e-06, + "loss": 0.7109, + "step": 54636 + }, + { + "epoch": 1.4, + "learning_rate": 1.1555106500346069e-06, + "loss": 0.5127, + "step": 54637 + }, + { + "epoch": 1.4, + "learning_rate": 1.1554833161539534e-06, + "loss": 0.6914, + "step": 54638 + }, + { + "epoch": 1.4, + "learning_rate": 1.1554559821542538e-06, + "loss": 0.6709, + "step": 54639 + }, + { + "epoch": 1.4, + "learning_rate": 1.1554286480355285e-06, + "loss": 0.6777, + "step": 54640 + }, + { + "epoch": 1.4, + "learning_rate": 1.1554013137977985e-06, + "loss": 0.5352, + "step": 54641 + }, + { + "epoch": 1.4, + "learning_rate": 1.1553739794410851e-06, + "loss": 0.6812, + "step": 54642 + }, + { + "epoch": 1.4, + "learning_rate": 1.155346644965409e-06, + "loss": 0.6426, + "step": 54643 + }, + { + "epoch": 1.4, + "learning_rate": 1.155319310370791e-06, + "loss": 0.6572, + "step": 54644 + }, + { + "epoch": 1.4, + "learning_rate": 1.1552919756572522e-06, + "loss": 0.5776, + "step": 54645 + }, + { + "epoch": 1.4, + "learning_rate": 1.1552646408248134e-06, + "loss": 0.5441, + "step": 54646 + }, + { + "epoch": 1.4, + "learning_rate": 1.1552373058734958e-06, + "loss": 0.5737, + "step": 54647 + }, + { + "epoch": 1.4, + "learning_rate": 1.15520997080332e-06, + "loss": 0.7715, + "step": 54648 + }, + { + "epoch": 1.4, + "learning_rate": 1.155182635614307e-06, + "loss": 0.689, + "step": 54649 + }, + { + "epoch": 1.4, + "learning_rate": 1.1551553003064777e-06, + "loss": 0.6836, + "step": 54650 + }, + { + "epoch": 1.4, + "learning_rate": 1.1551279648798535e-06, + "loss": 0.5947, + "step": 54651 + }, + { + "epoch": 1.4, + "learning_rate": 1.1551006293344548e-06, + "loss": 0.4717, + "step": 54652 + }, + { + "epoch": 1.4, + "learning_rate": 1.1550732936703027e-06, + "loss": 0.4756, + "step": 54653 + }, + { + "epoch": 1.4, + "learning_rate": 1.1550459578874177e-06, + "loss": 0.6338, + "step": 54654 + }, + { + "epoch": 1.4, + "learning_rate": 1.1550186219858215e-06, + "loss": 0.6328, + "step": 54655 + }, + { + "epoch": 1.4, + "learning_rate": 1.1549912859655345e-06, + "loss": 0.5396, + "step": 54656 + }, + { + "epoch": 1.4, + "learning_rate": 1.154963949826578e-06, + "loss": 0.562, + "step": 54657 + }, + { + "epoch": 1.4, + "learning_rate": 1.1549366135689729e-06, + "loss": 0.8027, + "step": 54658 + }, + { + "epoch": 1.4, + "learning_rate": 1.1549092771927394e-06, + "loss": 0.7061, + "step": 54659 + }, + { + "epoch": 1.4, + "learning_rate": 1.1548819406978993e-06, + "loss": 0.833, + "step": 54660 + }, + { + "epoch": 1.4, + "learning_rate": 1.1548546040844733e-06, + "loss": 0.5366, + "step": 54661 + }, + { + "epoch": 1.4, + "learning_rate": 1.1548272673524824e-06, + "loss": 0.8701, + "step": 54662 + }, + { + "epoch": 1.4, + "learning_rate": 1.154799930501947e-06, + "loss": 0.6147, + "step": 54663 + }, + { + "epoch": 1.4, + "learning_rate": 1.1547725935328887e-06, + "loss": 0.709, + "step": 54664 + }, + { + "epoch": 1.4, + "learning_rate": 1.1547452564453278e-06, + "loss": 0.5566, + "step": 54665 + }, + { + "epoch": 1.4, + "learning_rate": 1.1547179192392858e-06, + "loss": 0.6227, + "step": 54666 + }, + { + "epoch": 1.4, + "learning_rate": 1.1546905819147835e-06, + "loss": 0.4922, + "step": 54667 + }, + { + "epoch": 1.4, + "learning_rate": 1.1546632444718416e-06, + "loss": 0.6274, + "step": 54668 + }, + { + "epoch": 1.4, + "learning_rate": 1.1546359069104812e-06, + "loss": 0.7578, + "step": 54669 + }, + { + "epoch": 1.4, + "learning_rate": 1.154608569230723e-06, + "loss": 0.7656, + "step": 54670 + }, + { + "epoch": 1.4, + "learning_rate": 1.1545812314325883e-06, + "loss": 0.6289, + "step": 54671 + }, + { + "epoch": 1.4, + "learning_rate": 1.154553893516098e-06, + "loss": 0.5332, + "step": 54672 + }, + { + "epoch": 1.4, + "learning_rate": 1.1545265554812727e-06, + "loss": 0.7134, + "step": 54673 + }, + { + "epoch": 1.4, + "learning_rate": 1.1544992173281335e-06, + "loss": 0.5081, + "step": 54674 + }, + { + "epoch": 1.4, + "learning_rate": 1.1544718790567013e-06, + "loss": 0.4851, + "step": 54675 + }, + { + "epoch": 1.4, + "learning_rate": 1.1544445406669973e-06, + "loss": 0.7705, + "step": 54676 + }, + { + "epoch": 1.4, + "learning_rate": 1.1544172021590423e-06, + "loss": 0.623, + "step": 54677 + }, + { + "epoch": 1.4, + "learning_rate": 1.1543898635328569e-06, + "loss": 0.4204, + "step": 54678 + }, + { + "epoch": 1.4, + "learning_rate": 1.1543625247884622e-06, + "loss": 0.7178, + "step": 54679 + }, + { + "epoch": 1.4, + "learning_rate": 1.1543351859258796e-06, + "loss": 0.6167, + "step": 54680 + }, + { + "epoch": 1.4, + "learning_rate": 1.1543078469451293e-06, + "loss": 0.5337, + "step": 54681 + }, + { + "epoch": 1.4, + "learning_rate": 1.1542805078462327e-06, + "loss": 0.7119, + "step": 54682 + }, + { + "epoch": 1.4, + "learning_rate": 1.1542531686292106e-06, + "loss": 0.5403, + "step": 54683 + }, + { + "epoch": 1.4, + "learning_rate": 1.1542258292940838e-06, + "loss": 0.7314, + "step": 54684 + }, + { + "epoch": 1.4, + "learning_rate": 1.1541984898408736e-06, + "loss": 0.5241, + "step": 54685 + }, + { + "epoch": 1.4, + "learning_rate": 1.1541711502696005e-06, + "loss": 0.7461, + "step": 54686 + }, + { + "epoch": 1.4, + "learning_rate": 1.1541438105802862e-06, + "loss": 0.5996, + "step": 54687 + }, + { + "epoch": 1.4, + "learning_rate": 1.1541164707729505e-06, + "loss": 0.8984, + "step": 54688 + }, + { + "epoch": 1.4, + "learning_rate": 1.1540891308476151e-06, + "loss": 0.4963, + "step": 54689 + }, + { + "epoch": 1.4, + "learning_rate": 1.1540617908043005e-06, + "loss": 0.4175, + "step": 54690 + }, + { + "epoch": 1.4, + "learning_rate": 1.1540344506430281e-06, + "loss": 0.6484, + "step": 54691 + }, + { + "epoch": 1.4, + "learning_rate": 1.1540071103638187e-06, + "loss": 0.5913, + "step": 54692 + }, + { + "epoch": 1.4, + "learning_rate": 1.153979769966693e-06, + "loss": 0.8516, + "step": 54693 + }, + { + "epoch": 1.4, + "learning_rate": 1.1539524294516719e-06, + "loss": 0.5054, + "step": 54694 + }, + { + "epoch": 1.4, + "learning_rate": 1.1539250888187768e-06, + "loss": 1.1191, + "step": 54695 + }, + { + "epoch": 1.4, + "learning_rate": 1.1538977480680281e-06, + "loss": 0.6538, + "step": 54696 + }, + { + "epoch": 1.4, + "learning_rate": 1.1538704071994472e-06, + "loss": 0.5625, + "step": 54697 + }, + { + "epoch": 1.4, + "learning_rate": 1.1538430662130544e-06, + "loss": 0.875, + "step": 54698 + }, + { + "epoch": 1.4, + "learning_rate": 1.1538157251088715e-06, + "loss": 0.5718, + "step": 54699 + }, + { + "epoch": 1.4, + "learning_rate": 1.1537883838869186e-06, + "loss": 0.8564, + "step": 54700 + }, + { + "epoch": 1.4, + "learning_rate": 1.1537610425472174e-06, + "loss": 0.6113, + "step": 54701 + }, + { + "epoch": 1.4, + "learning_rate": 1.1537337010897883e-06, + "loss": 0.6509, + "step": 54702 + }, + { + "epoch": 1.4, + "learning_rate": 1.153706359514652e-06, + "loss": 0.4712, + "step": 54703 + }, + { + "epoch": 1.4, + "learning_rate": 1.1536790178218304e-06, + "loss": 0.4368, + "step": 54704 + }, + { + "epoch": 1.4, + "learning_rate": 1.1536516760113434e-06, + "loss": 0.709, + "step": 54705 + }, + { + "epoch": 1.4, + "learning_rate": 1.1536243340832125e-06, + "loss": 0.5908, + "step": 54706 + }, + { + "epoch": 1.4, + "learning_rate": 1.1535969920374587e-06, + "loss": 0.668, + "step": 54707 + }, + { + "epoch": 1.4, + "learning_rate": 1.1535696498741026e-06, + "loss": 0.5947, + "step": 54708 + }, + { + "epoch": 1.4, + "learning_rate": 1.1535423075931652e-06, + "loss": 0.7131, + "step": 54709 + }, + { + "epoch": 1.4, + "learning_rate": 1.1535149651946677e-06, + "loss": 0.6079, + "step": 54710 + }, + { + "epoch": 1.4, + "learning_rate": 1.1534876226786306e-06, + "loss": 0.6465, + "step": 54711 + }, + { + "epoch": 1.4, + "learning_rate": 1.1534602800450755e-06, + "loss": 0.5239, + "step": 54712 + }, + { + "epoch": 1.4, + "learning_rate": 1.1534329372940223e-06, + "loss": 0.6885, + "step": 54713 + }, + { + "epoch": 1.4, + "learning_rate": 1.153405594425493e-06, + "loss": 0.6143, + "step": 54714 + }, + { + "epoch": 1.4, + "learning_rate": 1.1533782514395079e-06, + "loss": 0.9043, + "step": 54715 + }, + { + "epoch": 1.4, + "learning_rate": 1.1533509083360881e-06, + "loss": 0.627, + "step": 54716 + }, + { + "epoch": 1.4, + "learning_rate": 1.1533235651152548e-06, + "loss": 0.5859, + "step": 54717 + }, + { + "epoch": 1.4, + "learning_rate": 1.1532962217770288e-06, + "loss": 0.3745, + "step": 54718 + }, + { + "epoch": 1.4, + "learning_rate": 1.1532688783214304e-06, + "loss": 0.8076, + "step": 54719 + }, + { + "epoch": 1.4, + "learning_rate": 1.1532415347484814e-06, + "loss": 0.8926, + "step": 54720 + }, + { + "epoch": 1.4, + "learning_rate": 1.1532141910582023e-06, + "loss": 0.54, + "step": 54721 + }, + { + "epoch": 1.4, + "learning_rate": 1.1531868472506142e-06, + "loss": 0.6606, + "step": 54722 + }, + { + "epoch": 1.4, + "learning_rate": 1.1531595033257381e-06, + "loss": 0.4712, + "step": 54723 + }, + { + "epoch": 1.4, + "learning_rate": 1.1531321592835948e-06, + "loss": 0.491, + "step": 54724 + }, + { + "epoch": 1.4, + "learning_rate": 1.153104815124205e-06, + "loss": 0.603, + "step": 54725 + }, + { + "epoch": 1.4, + "learning_rate": 1.1530774708475901e-06, + "loss": 0.792, + "step": 54726 + }, + { + "epoch": 1.4, + "learning_rate": 1.153050126453771e-06, + "loss": 0.6255, + "step": 54727 + }, + { + "epoch": 1.4, + "learning_rate": 1.1530227819427677e-06, + "loss": 0.4858, + "step": 54728 + }, + { + "epoch": 1.4, + "learning_rate": 1.1529954373146027e-06, + "loss": 0.6299, + "step": 54729 + }, + { + "epoch": 1.4, + "learning_rate": 1.1529680925692956e-06, + "loss": 0.6641, + "step": 54730 + }, + { + "epoch": 1.4, + "learning_rate": 1.1529407477068682e-06, + "loss": 0.5713, + "step": 54731 + }, + { + "epoch": 1.4, + "learning_rate": 1.152913402727341e-06, + "loss": 0.498, + "step": 54732 + }, + { + "epoch": 1.4, + "learning_rate": 1.1528860576307352e-06, + "loss": 0.7744, + "step": 54733 + }, + { + "epoch": 1.4, + "learning_rate": 1.1528587124170711e-06, + "loss": 0.6963, + "step": 54734 + }, + { + "epoch": 1.4, + "learning_rate": 1.1528313670863704e-06, + "loss": 0.792, + "step": 54735 + }, + { + "epoch": 1.4, + "learning_rate": 1.1528040216386536e-06, + "loss": 0.6274, + "step": 54736 + }, + { + "epoch": 1.4, + "learning_rate": 1.1527766760739423e-06, + "loss": 0.5718, + "step": 54737 + }, + { + "epoch": 1.4, + "learning_rate": 1.1527493303922565e-06, + "loss": 0.7393, + "step": 54738 + }, + { + "epoch": 1.4, + "learning_rate": 1.1527219845936177e-06, + "loss": 0.6541, + "step": 54739 + }, + { + "epoch": 1.4, + "learning_rate": 1.1526946386780465e-06, + "loss": 0.7266, + "step": 54740 + }, + { + "epoch": 1.4, + "learning_rate": 1.1526672926455642e-06, + "loss": 0.6982, + "step": 54741 + }, + { + "epoch": 1.4, + "learning_rate": 1.1526399464961915e-06, + "loss": 0.552, + "step": 54742 + }, + { + "epoch": 1.4, + "learning_rate": 1.1526126002299497e-06, + "loss": 0.6587, + "step": 54743 + }, + { + "epoch": 1.4, + "learning_rate": 1.152585253846859e-06, + "loss": 0.645, + "step": 54744 + }, + { + "epoch": 1.4, + "learning_rate": 1.1525579073469412e-06, + "loss": 0.8662, + "step": 54745 + }, + { + "epoch": 1.4, + "learning_rate": 1.1525305607302162e-06, + "loss": 0.6328, + "step": 54746 + }, + { + "epoch": 1.4, + "learning_rate": 1.152503213996706e-06, + "loss": 0.6689, + "step": 54747 + }, + { + "epoch": 1.4, + "learning_rate": 1.1524758671464315e-06, + "loss": 0.5483, + "step": 54748 + }, + { + "epoch": 1.4, + "learning_rate": 1.1524485201794126e-06, + "loss": 0.6538, + "step": 54749 + }, + { + "epoch": 1.4, + "learning_rate": 1.152421173095671e-06, + "loss": 0.7314, + "step": 54750 + }, + { + "epoch": 1.4, + "learning_rate": 1.1523938258952275e-06, + "loss": 0.6709, + "step": 54751 + }, + { + "epoch": 1.4, + "learning_rate": 1.1523664785781035e-06, + "loss": 0.6318, + "step": 54752 + }, + { + "epoch": 1.4, + "learning_rate": 1.1523391311443189e-06, + "loss": 0.6992, + "step": 54753 + }, + { + "epoch": 1.4, + "learning_rate": 1.1523117835938955e-06, + "loss": 0.7236, + "step": 54754 + }, + { + "epoch": 1.4, + "learning_rate": 1.1522844359268539e-06, + "loss": 0.6943, + "step": 54755 + }, + { + "epoch": 1.4, + "learning_rate": 1.1522570881432154e-06, + "loss": 0.5054, + "step": 54756 + }, + { + "epoch": 1.4, + "learning_rate": 1.1522297402430003e-06, + "loss": 0.8594, + "step": 54757 + }, + { + "epoch": 1.4, + "learning_rate": 1.1522023922262304e-06, + "loss": 0.6084, + "step": 54758 + }, + { + "epoch": 1.4, + "learning_rate": 1.1521750440929255e-06, + "loss": 0.6543, + "step": 54759 + }, + { + "epoch": 1.4, + "learning_rate": 1.1521476958431074e-06, + "loss": 0.6553, + "step": 54760 + }, + { + "epoch": 1.4, + "learning_rate": 1.1521203474767967e-06, + "loss": 0.7188, + "step": 54761 + }, + { + "epoch": 1.4, + "learning_rate": 1.1520929989940147e-06, + "loss": 0.6484, + "step": 54762 + }, + { + "epoch": 1.4, + "learning_rate": 1.1520656503947818e-06, + "loss": 0.7227, + "step": 54763 + }, + { + "epoch": 1.4, + "learning_rate": 1.1520383016791195e-06, + "loss": 0.6431, + "step": 54764 + }, + { + "epoch": 1.4, + "learning_rate": 1.152010952847048e-06, + "loss": 0.7061, + "step": 54765 + }, + { + "epoch": 1.4, + "learning_rate": 1.1519836038985894e-06, + "loss": 0.6978, + "step": 54766 + }, + { + "epoch": 1.4, + "learning_rate": 1.1519562548337636e-06, + "loss": 0.6553, + "step": 54767 + }, + { + "epoch": 1.4, + "learning_rate": 1.1519289056525915e-06, + "loss": 0.7324, + "step": 54768 + }, + { + "epoch": 1.4, + "learning_rate": 1.151901556355095e-06, + "loss": 0.5464, + "step": 54769 + }, + { + "epoch": 1.4, + "learning_rate": 1.1518742069412943e-06, + "loss": 0.6343, + "step": 54770 + }, + { + "epoch": 1.4, + "learning_rate": 1.1518468574112103e-06, + "loss": 0.6387, + "step": 54771 + }, + { + "epoch": 1.4, + "learning_rate": 1.1518195077648645e-06, + "loss": 0.6416, + "step": 54772 + }, + { + "epoch": 1.4, + "learning_rate": 1.151792158002277e-06, + "loss": 0.5864, + "step": 54773 + }, + { + "epoch": 1.4, + "learning_rate": 1.1517648081234694e-06, + "loss": 0.708, + "step": 54774 + }, + { + "epoch": 1.4, + "learning_rate": 1.1517374581284628e-06, + "loss": 0.8291, + "step": 54775 + }, + { + "epoch": 1.4, + "learning_rate": 1.1517101080172773e-06, + "loss": 0.7773, + "step": 54776 + }, + { + "epoch": 1.4, + "learning_rate": 1.151682757789935e-06, + "loss": 0.4812, + "step": 54777 + }, + { + "epoch": 1.4, + "learning_rate": 1.1516554074464554e-06, + "loss": 0.5999, + "step": 54778 + }, + { + "epoch": 1.4, + "learning_rate": 1.1516280569868608e-06, + "loss": 0.7153, + "step": 54779 + }, + { + "epoch": 1.4, + "learning_rate": 1.1516007064111715e-06, + "loss": 0.6787, + "step": 54780 + }, + { + "epoch": 1.4, + "learning_rate": 1.1515733557194083e-06, + "loss": 0.5908, + "step": 54781 + }, + { + "epoch": 1.4, + "learning_rate": 1.1515460049115927e-06, + "loss": 0.4066, + "step": 54782 + }, + { + "epoch": 1.4, + "learning_rate": 1.1515186539877451e-06, + "loss": 0.5205, + "step": 54783 + }, + { + "epoch": 1.4, + "learning_rate": 1.1514913029478863e-06, + "loss": 0.7148, + "step": 54784 + }, + { + "epoch": 1.4, + "learning_rate": 1.151463951792038e-06, + "loss": 0.5479, + "step": 54785 + }, + { + "epoch": 1.4, + "learning_rate": 1.1514366005202202e-06, + "loss": 0.7188, + "step": 54786 + }, + { + "epoch": 1.4, + "learning_rate": 1.151409249132455e-06, + "loss": 0.6738, + "step": 54787 + }, + { + "epoch": 1.4, + "learning_rate": 1.1513818976287625e-06, + "loss": 0.7041, + "step": 54788 + }, + { + "epoch": 1.4, + "learning_rate": 1.1513545460091638e-06, + "loss": 0.7871, + "step": 54789 + }, + { + "epoch": 1.4, + "learning_rate": 1.1513271942736798e-06, + "loss": 0.7773, + "step": 54790 + }, + { + "epoch": 1.4, + "learning_rate": 1.1512998424223316e-06, + "loss": 0.5632, + "step": 54791 + }, + { + "epoch": 1.4, + "learning_rate": 1.15127249045514e-06, + "loss": 0.5037, + "step": 54792 + }, + { + "epoch": 1.4, + "learning_rate": 1.151245138372126e-06, + "loss": 0.4626, + "step": 54793 + }, + { + "epoch": 1.4, + "learning_rate": 1.1512177861733108e-06, + "loss": 0.6396, + "step": 54794 + }, + { + "epoch": 1.4, + "learning_rate": 1.1511904338587146e-06, + "loss": 0.5957, + "step": 54795 + }, + { + "epoch": 1.4, + "learning_rate": 1.1511630814283593e-06, + "loss": 0.3574, + "step": 54796 + }, + { + "epoch": 1.4, + "learning_rate": 1.1511357288822652e-06, + "loss": 0.856, + "step": 54797 + }, + { + "epoch": 1.4, + "learning_rate": 1.1511083762204536e-06, + "loss": 0.8135, + "step": 54798 + }, + { + "epoch": 1.4, + "learning_rate": 1.1510810234429448e-06, + "loss": 0.6963, + "step": 54799 + }, + { + "epoch": 1.4, + "learning_rate": 1.1510536705497608e-06, + "loss": 0.5713, + "step": 54800 + }, + { + "epoch": 1.4, + "learning_rate": 1.1510263175409213e-06, + "loss": 0.7441, + "step": 54801 + }, + { + "epoch": 1.4, + "learning_rate": 1.1509989644164485e-06, + "loss": 0.7158, + "step": 54802 + }, + { + "epoch": 1.4, + "learning_rate": 1.1509716111763625e-06, + "loss": 0.5957, + "step": 54803 + }, + { + "epoch": 1.4, + "learning_rate": 1.1509442578206845e-06, + "loss": 0.7393, + "step": 54804 + }, + { + "epoch": 1.4, + "learning_rate": 1.1509169043494354e-06, + "loss": 0.5752, + "step": 54805 + }, + { + "epoch": 1.4, + "learning_rate": 1.1508895507626361e-06, + "loss": 0.6899, + "step": 54806 + }, + { + "epoch": 1.4, + "learning_rate": 1.150862197060308e-06, + "loss": 0.5771, + "step": 54807 + }, + { + "epoch": 1.4, + "learning_rate": 1.150834843242471e-06, + "loss": 0.6572, + "step": 54808 + }, + { + "epoch": 1.4, + "learning_rate": 1.1508074893091471e-06, + "loss": 0.5312, + "step": 54809 + }, + { + "epoch": 1.4, + "learning_rate": 1.1507801352603569e-06, + "loss": 0.7158, + "step": 54810 + }, + { + "epoch": 1.4, + "learning_rate": 1.150752781096121e-06, + "loss": 0.7607, + "step": 54811 + }, + { + "epoch": 1.4, + "learning_rate": 1.1507254268164607e-06, + "loss": 0.6436, + "step": 54812 + }, + { + "epoch": 1.4, + "learning_rate": 1.150698072421397e-06, + "loss": 0.6484, + "step": 54813 + }, + { + "epoch": 1.4, + "learning_rate": 1.1506707179109505e-06, + "loss": 0.6309, + "step": 54814 + }, + { + "epoch": 1.4, + "learning_rate": 1.1506433632851427e-06, + "loss": 0.4707, + "step": 54815 + }, + { + "epoch": 1.4, + "learning_rate": 1.150616008543994e-06, + "loss": 0.71, + "step": 54816 + }, + { + "epoch": 1.4, + "learning_rate": 1.1505886536875255e-06, + "loss": 0.6736, + "step": 54817 + }, + { + "epoch": 1.41, + "learning_rate": 1.1505612987157583e-06, + "loss": 0.6553, + "step": 54818 + }, + { + "epoch": 1.41, + "learning_rate": 1.1505339436287132e-06, + "loss": 0.7617, + "step": 54819 + }, + { + "epoch": 1.41, + "learning_rate": 1.1505065884264112e-06, + "loss": 0.7324, + "step": 54820 + }, + { + "epoch": 1.41, + "learning_rate": 1.1504792331088734e-06, + "loss": 0.7725, + "step": 54821 + }, + { + "epoch": 1.41, + "learning_rate": 1.15045187767612e-06, + "loss": 0.7393, + "step": 54822 + }, + { + "epoch": 1.41, + "learning_rate": 1.1504245221281733e-06, + "loss": 0.832, + "step": 54823 + }, + { + "epoch": 1.41, + "learning_rate": 1.1503971664650528e-06, + "loss": 0.6304, + "step": 54824 + }, + { + "epoch": 1.41, + "learning_rate": 1.1503698106867802e-06, + "loss": 0.6191, + "step": 54825 + }, + { + "epoch": 1.41, + "learning_rate": 1.1503424547933767e-06, + "loss": 0.7842, + "step": 54826 + }, + { + "epoch": 1.41, + "learning_rate": 1.1503150987848626e-06, + "loss": 0.8457, + "step": 54827 + }, + { + "epoch": 1.41, + "learning_rate": 1.1502877426612592e-06, + "loss": 0.6533, + "step": 54828 + }, + { + "epoch": 1.41, + "learning_rate": 1.1502603864225874e-06, + "loss": 0.6318, + "step": 54829 + }, + { + "epoch": 1.41, + "learning_rate": 1.150233030068868e-06, + "loss": 0.8037, + "step": 54830 + }, + { + "epoch": 1.41, + "learning_rate": 1.1502056736001224e-06, + "loss": 0.6875, + "step": 54831 + }, + { + "epoch": 1.41, + "learning_rate": 1.1501783170163713e-06, + "loss": 0.5459, + "step": 54832 + }, + { + "epoch": 1.41, + "learning_rate": 1.1501509603176352e-06, + "loss": 0.521, + "step": 54833 + }, + { + "epoch": 1.41, + "learning_rate": 1.1501236035039354e-06, + "loss": 0.6206, + "step": 54834 + }, + { + "epoch": 1.41, + "learning_rate": 1.150096246575293e-06, + "loss": 0.522, + "step": 54835 + }, + { + "epoch": 1.41, + "learning_rate": 1.150068889531729e-06, + "loss": 0.5581, + "step": 54836 + }, + { + "epoch": 1.41, + "learning_rate": 1.1500415323732638e-06, + "loss": 0.6899, + "step": 54837 + }, + { + "epoch": 1.41, + "learning_rate": 1.1500141750999188e-06, + "loss": 0.7539, + "step": 54838 + }, + { + "epoch": 1.41, + "learning_rate": 1.149986817711715e-06, + "loss": 0.4944, + "step": 54839 + }, + { + "epoch": 1.41, + "learning_rate": 1.149959460208673e-06, + "loss": 0.6777, + "step": 54840 + }, + { + "epoch": 1.41, + "learning_rate": 1.1499321025908141e-06, + "loss": 0.6455, + "step": 54841 + }, + { + "epoch": 1.41, + "learning_rate": 1.1499047448581592e-06, + "loss": 0.5981, + "step": 54842 + }, + { + "epoch": 1.41, + "learning_rate": 1.1498773870107288e-06, + "loss": 0.5989, + "step": 54843 + }, + { + "epoch": 1.41, + "learning_rate": 1.1498500290485442e-06, + "loss": 0.6846, + "step": 54844 + }, + { + "epoch": 1.41, + "learning_rate": 1.1498226709716263e-06, + "loss": 0.917, + "step": 54845 + }, + { + "epoch": 1.41, + "learning_rate": 1.1497953127799966e-06, + "loss": 0.5132, + "step": 54846 + }, + { + "epoch": 1.41, + "learning_rate": 1.149767954473675e-06, + "loss": 0.5503, + "step": 54847 + }, + { + "epoch": 1.41, + "learning_rate": 1.1497405960526832e-06, + "loss": 0.4716, + "step": 54848 + }, + { + "epoch": 1.41, + "learning_rate": 1.1497132375170414e-06, + "loss": 0.73, + "step": 54849 + }, + { + "epoch": 1.41, + "learning_rate": 1.1496858788667716e-06, + "loss": 0.7246, + "step": 54850 + }, + { + "epoch": 1.41, + "learning_rate": 1.1496585201018943e-06, + "loss": 0.6411, + "step": 54851 + }, + { + "epoch": 1.41, + "learning_rate": 1.14963116122243e-06, + "loss": 0.748, + "step": 54852 + }, + { + "epoch": 1.41, + "learning_rate": 1.1496038022284e-06, + "loss": 0.6846, + "step": 54853 + }, + { + "epoch": 1.41, + "learning_rate": 1.1495764431198255e-06, + "loss": 0.604, + "step": 54854 + }, + { + "epoch": 1.41, + "learning_rate": 1.1495490838967267e-06, + "loss": 0.7168, + "step": 54855 + }, + { + "epoch": 1.41, + "learning_rate": 1.1495217245591256e-06, + "loss": 0.5864, + "step": 54856 + }, + { + "epoch": 1.41, + "learning_rate": 1.1494943651070425e-06, + "loss": 0.7725, + "step": 54857 + }, + { + "epoch": 1.41, + "learning_rate": 1.1494670055404983e-06, + "loss": 0.6621, + "step": 54858 + }, + { + "epoch": 1.41, + "learning_rate": 1.1494396458595139e-06, + "loss": 0.6611, + "step": 54859 + }, + { + "epoch": 1.41, + "learning_rate": 1.149412286064111e-06, + "loss": 0.7715, + "step": 54860 + }, + { + "epoch": 1.41, + "learning_rate": 1.1493849261543096e-06, + "loss": 0.5679, + "step": 54861 + }, + { + "epoch": 1.41, + "learning_rate": 1.149357566130131e-06, + "loss": 0.584, + "step": 54862 + }, + { + "epoch": 1.41, + "learning_rate": 1.1493302059915962e-06, + "loss": 0.6846, + "step": 54863 + }, + { + "epoch": 1.41, + "learning_rate": 1.149302845738726e-06, + "loss": 0.6108, + "step": 54864 + }, + { + "epoch": 1.41, + "learning_rate": 1.1492754853715415e-06, + "loss": 0.6133, + "step": 54865 + }, + { + "epoch": 1.41, + "learning_rate": 1.1492481248900641e-06, + "loss": 0.7852, + "step": 54866 + }, + { + "epoch": 1.41, + "learning_rate": 1.149220764294314e-06, + "loss": 0.6104, + "step": 54867 + }, + { + "epoch": 1.41, + "learning_rate": 1.149193403584312e-06, + "loss": 0.6299, + "step": 54868 + }, + { + "epoch": 1.41, + "learning_rate": 1.14916604276008e-06, + "loss": 0.6514, + "step": 54869 + }, + { + "epoch": 1.41, + "learning_rate": 1.1491386818216382e-06, + "loss": 0.6763, + "step": 54870 + }, + { + "epoch": 1.41, + "learning_rate": 1.1491113207690082e-06, + "loss": 0.7441, + "step": 54871 + }, + { + "epoch": 1.41, + "learning_rate": 1.14908395960221e-06, + "loss": 0.4758, + "step": 54872 + }, + { + "epoch": 1.41, + "learning_rate": 1.1490565983212652e-06, + "loss": 0.8379, + "step": 54873 + }, + { + "epoch": 1.41, + "learning_rate": 1.1490292369261944e-06, + "loss": 0.71, + "step": 54874 + }, + { + "epoch": 1.41, + "learning_rate": 1.1490018754170192e-06, + "loss": 0.6445, + "step": 54875 + }, + { + "epoch": 1.41, + "learning_rate": 1.1489745137937598e-06, + "loss": 0.7061, + "step": 54876 + }, + { + "epoch": 1.41, + "learning_rate": 1.1489471520564379e-06, + "loss": 0.5398, + "step": 54877 + }, + { + "epoch": 1.41, + "learning_rate": 1.1489197902050734e-06, + "loss": 0.7637, + "step": 54878 + }, + { + "epoch": 1.41, + "learning_rate": 1.148892428239688e-06, + "loss": 0.6807, + "step": 54879 + }, + { + "epoch": 1.41, + "learning_rate": 1.1488650661603027e-06, + "loss": 0.6621, + "step": 54880 + }, + { + "epoch": 1.41, + "learning_rate": 1.1488377039669383e-06, + "loss": 0.707, + "step": 54881 + }, + { + "epoch": 1.41, + "learning_rate": 1.1488103416596157e-06, + "loss": 0.6611, + "step": 54882 + }, + { + "epoch": 1.41, + "learning_rate": 1.1487829792383556e-06, + "loss": 0.7266, + "step": 54883 + }, + { + "epoch": 1.41, + "learning_rate": 1.1487556167031795e-06, + "loss": 0.7129, + "step": 54884 + }, + { + "epoch": 1.41, + "learning_rate": 1.148728254054108e-06, + "loss": 0.6035, + "step": 54885 + }, + { + "epoch": 1.41, + "learning_rate": 1.1487008912911621e-06, + "loss": 0.6904, + "step": 54886 + }, + { + "epoch": 1.41, + "learning_rate": 1.1486735284143628e-06, + "loss": 0.8057, + "step": 54887 + }, + { + "epoch": 1.41, + "learning_rate": 1.148646165423731e-06, + "loss": 0.8213, + "step": 54888 + }, + { + "epoch": 1.41, + "learning_rate": 1.1486188023192875e-06, + "loss": 0.7207, + "step": 54889 + }, + { + "epoch": 1.41, + "learning_rate": 1.1485914391010536e-06, + "loss": 0.5474, + "step": 54890 + }, + { + "epoch": 1.41, + "learning_rate": 1.1485640757690501e-06, + "loss": 0.5312, + "step": 54891 + }, + { + "epoch": 1.41, + "learning_rate": 1.1485367123232982e-06, + "loss": 0.6387, + "step": 54892 + }, + { + "epoch": 1.41, + "learning_rate": 1.1485093487638178e-06, + "loss": 0.6406, + "step": 54893 + }, + { + "epoch": 1.41, + "learning_rate": 1.1484819850906311e-06, + "loss": 0.6602, + "step": 54894 + }, + { + "epoch": 1.41, + "learning_rate": 1.1484546213037584e-06, + "loss": 0.6416, + "step": 54895 + }, + { + "epoch": 1.41, + "learning_rate": 1.1484272574032213e-06, + "loss": 0.4658, + "step": 54896 + }, + { + "epoch": 1.41, + "learning_rate": 1.1483998933890397e-06, + "loss": 0.6108, + "step": 54897 + }, + { + "epoch": 1.41, + "learning_rate": 1.1483725292612354e-06, + "loss": 0.6514, + "step": 54898 + }, + { + "epoch": 1.41, + "learning_rate": 1.1483451650198287e-06, + "loss": 0.6987, + "step": 54899 + }, + { + "epoch": 1.41, + "learning_rate": 1.1483178006648415e-06, + "loss": 0.5349, + "step": 54900 + }, + { + "epoch": 1.41, + "learning_rate": 1.1482904361962939e-06, + "loss": 0.6396, + "step": 54901 + }, + { + "epoch": 1.41, + "learning_rate": 1.148263071614207e-06, + "loss": 0.6699, + "step": 54902 + }, + { + "epoch": 1.41, + "learning_rate": 1.1482357069186022e-06, + "loss": 0.5143, + "step": 54903 + }, + { + "epoch": 1.41, + "learning_rate": 1.1482083421094996e-06, + "loss": 0.5679, + "step": 54904 + }, + { + "epoch": 1.41, + "learning_rate": 1.1481809771869213e-06, + "loss": 0.6787, + "step": 54905 + }, + { + "epoch": 1.41, + "learning_rate": 1.1481536121508874e-06, + "loss": 0.7627, + "step": 54906 + }, + { + "epoch": 1.41, + "learning_rate": 1.1481262470014193e-06, + "loss": 0.7119, + "step": 54907 + }, + { + "epoch": 1.41, + "learning_rate": 1.1480988817385373e-06, + "loss": 0.5898, + "step": 54908 + }, + { + "epoch": 1.41, + "learning_rate": 1.1480715163622632e-06, + "loss": 0.8926, + "step": 54909 + }, + { + "epoch": 1.41, + "learning_rate": 1.148044150872617e-06, + "loss": 0.6133, + "step": 54910 + }, + { + "epoch": 1.41, + "learning_rate": 1.148016785269621e-06, + "loss": 0.6514, + "step": 54911 + }, + { + "epoch": 1.41, + "learning_rate": 1.1479894195532947e-06, + "loss": 0.6626, + "step": 54912 + }, + { + "epoch": 1.41, + "learning_rate": 1.14796205372366e-06, + "loss": 0.5708, + "step": 54913 + }, + { + "epoch": 1.41, + "learning_rate": 1.1479346877807374e-06, + "loss": 0.4532, + "step": 54914 + }, + { + "epoch": 1.41, + "learning_rate": 1.1479073217245482e-06, + "loss": 0.6211, + "step": 54915 + }, + { + "epoch": 1.41, + "learning_rate": 1.147879955555113e-06, + "loss": 0.3706, + "step": 54916 + }, + { + "epoch": 1.41, + "learning_rate": 1.1478525892724531e-06, + "loss": 0.7305, + "step": 54917 + }, + { + "epoch": 1.41, + "learning_rate": 1.147825222876589e-06, + "loss": 0.75, + "step": 54918 + }, + { + "epoch": 1.41, + "learning_rate": 1.1477978563675423e-06, + "loss": 0.5298, + "step": 54919 + }, + { + "epoch": 1.41, + "learning_rate": 1.1477704897453331e-06, + "loss": 0.5413, + "step": 54920 + }, + { + "epoch": 1.41, + "learning_rate": 1.1477431230099832e-06, + "loss": 0.6914, + "step": 54921 + }, + { + "epoch": 1.41, + "learning_rate": 1.1477157561615131e-06, + "loss": 0.6401, + "step": 54922 + }, + { + "epoch": 1.41, + "learning_rate": 1.1476883891999438e-06, + "loss": 0.5723, + "step": 54923 + }, + { + "epoch": 1.41, + "learning_rate": 1.1476610221252962e-06, + "loss": 0.6338, + "step": 54924 + }, + { + "epoch": 1.41, + "learning_rate": 1.1476336549375915e-06, + "loss": 0.7578, + "step": 54925 + }, + { + "epoch": 1.41, + "learning_rate": 1.1476062876368507e-06, + "loss": 0.6494, + "step": 54926 + }, + { + "epoch": 1.41, + "learning_rate": 1.147578920223094e-06, + "loss": 0.8271, + "step": 54927 + }, + { + "epoch": 1.41, + "learning_rate": 1.1475515526963433e-06, + "loss": 0.7119, + "step": 54928 + }, + { + "epoch": 1.41, + "learning_rate": 1.1475241850566188e-06, + "loss": 0.5513, + "step": 54929 + }, + { + "epoch": 1.41, + "learning_rate": 1.1474968173039423e-06, + "loss": 0.6299, + "step": 54930 + }, + { + "epoch": 1.41, + "learning_rate": 1.147469449438334e-06, + "loss": 0.5833, + "step": 54931 + }, + { + "epoch": 1.41, + "learning_rate": 1.1474420814598153e-06, + "loss": 0.8447, + "step": 54932 + }, + { + "epoch": 1.41, + "learning_rate": 1.1474147133684067e-06, + "loss": 0.5244, + "step": 54933 + }, + { + "epoch": 1.41, + "learning_rate": 1.1473873451641297e-06, + "loss": 0.7441, + "step": 54934 + }, + { + "epoch": 1.41, + "learning_rate": 1.1473599768470049e-06, + "loss": 0.5374, + "step": 54935 + }, + { + "epoch": 1.41, + "learning_rate": 1.1473326084170533e-06, + "loss": 0.7041, + "step": 54936 + }, + { + "epoch": 1.41, + "learning_rate": 1.147305239874296e-06, + "loss": 0.6709, + "step": 54937 + }, + { + "epoch": 1.41, + "learning_rate": 1.1472778712187536e-06, + "loss": 0.8096, + "step": 54938 + }, + { + "epoch": 1.41, + "learning_rate": 1.1472505024504475e-06, + "loss": 0.752, + "step": 54939 + }, + { + "epoch": 1.41, + "learning_rate": 1.1472231335693986e-06, + "loss": 0.791, + "step": 54940 + }, + { + "epoch": 1.41, + "learning_rate": 1.1471957645756274e-06, + "loss": 0.6951, + "step": 54941 + }, + { + "epoch": 1.41, + "learning_rate": 1.1471683954691553e-06, + "loss": 0.7734, + "step": 54942 + }, + { + "epoch": 1.41, + "learning_rate": 1.1471410262500032e-06, + "loss": 0.5239, + "step": 54943 + }, + { + "epoch": 1.41, + "learning_rate": 1.1471136569181917e-06, + "loss": 0.5645, + "step": 54944 + }, + { + "epoch": 1.41, + "learning_rate": 1.1470862874737423e-06, + "loss": 0.7266, + "step": 54945 + }, + { + "epoch": 1.41, + "learning_rate": 1.147058917916676e-06, + "loss": 0.6421, + "step": 54946 + }, + { + "epoch": 1.41, + "learning_rate": 1.1470315482470129e-06, + "loss": 0.7861, + "step": 54947 + }, + { + "epoch": 1.41, + "learning_rate": 1.1470041784647745e-06, + "loss": 0.7051, + "step": 54948 + }, + { + "epoch": 1.41, + "learning_rate": 1.146976808569982e-06, + "loss": 0.541, + "step": 54949 + }, + { + "epoch": 1.41, + "learning_rate": 1.1469494385626562e-06, + "loss": 0.5962, + "step": 54950 + }, + { + "epoch": 1.41, + "learning_rate": 1.146922068442818e-06, + "loss": 0.625, + "step": 54951 + }, + { + "epoch": 1.41, + "learning_rate": 1.1468946982104881e-06, + "loss": 0.5459, + "step": 54952 + }, + { + "epoch": 1.41, + "learning_rate": 1.1468673278656877e-06, + "loss": 0.7637, + "step": 54953 + }, + { + "epoch": 1.41, + "learning_rate": 1.1468399574084378e-06, + "loss": 0.5486, + "step": 54954 + }, + { + "epoch": 1.41, + "learning_rate": 1.1468125868387592e-06, + "loss": 0.6123, + "step": 54955 + }, + { + "epoch": 1.41, + "learning_rate": 1.146785216156673e-06, + "loss": 0.665, + "step": 54956 + }, + { + "epoch": 1.41, + "learning_rate": 1.1467578453622004e-06, + "loss": 0.4861, + "step": 54957 + }, + { + "epoch": 1.41, + "learning_rate": 1.1467304744553617e-06, + "loss": 0.5083, + "step": 54958 + }, + { + "epoch": 1.41, + "learning_rate": 1.1467031034361784e-06, + "loss": 0.6426, + "step": 54959 + }, + { + "epoch": 1.41, + "learning_rate": 1.1466757323046712e-06, + "loss": 0.4635, + "step": 54960 + }, + { + "epoch": 1.41, + "learning_rate": 1.1466483610608612e-06, + "loss": 0.7002, + "step": 54961 + }, + { + "epoch": 1.41, + "learning_rate": 1.146620989704769e-06, + "loss": 0.7139, + "step": 54962 + }, + { + "epoch": 1.41, + "learning_rate": 1.1465936182364165e-06, + "loss": 0.4458, + "step": 54963 + }, + { + "epoch": 1.41, + "learning_rate": 1.1465662466558234e-06, + "loss": 0.7705, + "step": 54964 + }, + { + "epoch": 1.41, + "learning_rate": 1.1465388749630116e-06, + "loss": 0.6299, + "step": 54965 + }, + { + "epoch": 1.41, + "learning_rate": 1.1465115031580018e-06, + "loss": 0.5928, + "step": 54966 + }, + { + "epoch": 1.41, + "learning_rate": 1.1464841312408147e-06, + "loss": 0.6162, + "step": 54967 + }, + { + "epoch": 1.41, + "learning_rate": 1.1464567592114712e-06, + "loss": 0.5659, + "step": 54968 + }, + { + "epoch": 1.41, + "learning_rate": 1.1464293870699928e-06, + "loss": 0.7822, + "step": 54969 + }, + { + "epoch": 1.41, + "learning_rate": 1.1464020148163998e-06, + "loss": 0.3828, + "step": 54970 + }, + { + "epoch": 1.41, + "learning_rate": 1.146374642450714e-06, + "loss": 0.6411, + "step": 54971 + }, + { + "epoch": 1.41, + "learning_rate": 1.1463472699729556e-06, + "loss": 0.6006, + "step": 54972 + }, + { + "epoch": 1.41, + "learning_rate": 1.1463198973831456e-06, + "loss": 0.7285, + "step": 54973 + }, + { + "epoch": 1.41, + "learning_rate": 1.1462925246813056e-06, + "loss": 0.4812, + "step": 54974 + }, + { + "epoch": 1.41, + "learning_rate": 1.146265151867456e-06, + "loss": 0.6982, + "step": 54975 + }, + { + "epoch": 1.41, + "learning_rate": 1.146237778941618e-06, + "loss": 0.7461, + "step": 54976 + }, + { + "epoch": 1.41, + "learning_rate": 1.1462104059038122e-06, + "loss": 0.8926, + "step": 54977 + }, + { + "epoch": 1.41, + "learning_rate": 1.14618303275406e-06, + "loss": 0.5854, + "step": 54978 + }, + { + "epoch": 1.41, + "learning_rate": 1.146155659492382e-06, + "loss": 0.5299, + "step": 54979 + }, + { + "epoch": 1.41, + "learning_rate": 1.1461282861187996e-06, + "loss": 0.5864, + "step": 54980 + }, + { + "epoch": 1.41, + "learning_rate": 1.1461009126333334e-06, + "loss": 0.6211, + "step": 54981 + }, + { + "epoch": 1.41, + "learning_rate": 1.1460735390360046e-06, + "loss": 0.6426, + "step": 54982 + }, + { + "epoch": 1.41, + "learning_rate": 1.1460461653268336e-06, + "loss": 0.6733, + "step": 54983 + }, + { + "epoch": 1.41, + "learning_rate": 1.146018791505842e-06, + "loss": 0.6982, + "step": 54984 + }, + { + "epoch": 1.41, + "learning_rate": 1.1459914175730502e-06, + "loss": 0.6445, + "step": 54985 + }, + { + "epoch": 1.41, + "learning_rate": 1.1459640435284802e-06, + "loss": 0.7568, + "step": 54986 + }, + { + "epoch": 1.41, + "learning_rate": 1.1459366693721518e-06, + "loss": 0.6107, + "step": 54987 + }, + { + "epoch": 1.41, + "learning_rate": 1.1459092951040864e-06, + "loss": 0.4104, + "step": 54988 + }, + { + "epoch": 1.41, + "learning_rate": 1.1458819207243048e-06, + "loss": 0.7207, + "step": 54989 + }, + { + "epoch": 1.41, + "learning_rate": 1.1458545462328284e-06, + "loss": 0.4985, + "step": 54990 + }, + { + "epoch": 1.41, + "learning_rate": 1.1458271716296778e-06, + "loss": 0.6963, + "step": 54991 + }, + { + "epoch": 1.41, + "learning_rate": 1.1457997969148741e-06, + "loss": 0.4436, + "step": 54992 + }, + { + "epoch": 1.41, + "learning_rate": 1.145772422088438e-06, + "loss": 0.834, + "step": 54993 + }, + { + "epoch": 1.41, + "learning_rate": 1.1457450471503906e-06, + "loss": 0.7441, + "step": 54994 + }, + { + "epoch": 1.41, + "learning_rate": 1.1457176721007533e-06, + "loss": 0.668, + "step": 54995 + }, + { + "epoch": 1.41, + "learning_rate": 1.1456902969395466e-06, + "loss": 0.5833, + "step": 54996 + }, + { + "epoch": 1.41, + "learning_rate": 1.1456629216667915e-06, + "loss": 0.6206, + "step": 54997 + }, + { + "epoch": 1.41, + "learning_rate": 1.1456355462825086e-06, + "loss": 0.5967, + "step": 54998 + }, + { + "epoch": 1.41, + "learning_rate": 1.1456081707867198e-06, + "loss": 0.5664, + "step": 54999 + }, + { + "epoch": 1.41, + "learning_rate": 1.1455807951794452e-06, + "loss": 0.4116, + "step": 55000 + }, + { + "epoch": 1.41, + "learning_rate": 1.1455534194607063e-06, + "loss": 0.6611, + "step": 55001 + }, + { + "epoch": 1.41, + "learning_rate": 1.1455260436305237e-06, + "loss": 0.6943, + "step": 55002 + }, + { + "epoch": 1.41, + "learning_rate": 1.1454986676889186e-06, + "loss": 0.5419, + "step": 55003 + }, + { + "epoch": 1.41, + "learning_rate": 1.1454712916359117e-06, + "loss": 0.646, + "step": 55004 + }, + { + "epoch": 1.41, + "learning_rate": 1.1454439154715242e-06, + "loss": 0.668, + "step": 55005 + }, + { + "epoch": 1.41, + "learning_rate": 1.145416539195777e-06, + "loss": 0.6963, + "step": 55006 + }, + { + "epoch": 1.41, + "learning_rate": 1.145389162808691e-06, + "loss": 0.7812, + "step": 55007 + }, + { + "epoch": 1.41, + "learning_rate": 1.1453617863102874e-06, + "loss": 0.6758, + "step": 55008 + }, + { + "epoch": 1.41, + "learning_rate": 1.1453344097005867e-06, + "loss": 0.6904, + "step": 55009 + }, + { + "epoch": 1.41, + "learning_rate": 1.14530703297961e-06, + "loss": 0.7041, + "step": 55010 + }, + { + "epoch": 1.41, + "learning_rate": 1.1452796561473788e-06, + "loss": 0.8125, + "step": 55011 + }, + { + "epoch": 1.41, + "learning_rate": 1.1452522792039135e-06, + "loss": 0.8535, + "step": 55012 + }, + { + "epoch": 1.41, + "learning_rate": 1.1452249021492353e-06, + "loss": 0.6162, + "step": 55013 + }, + { + "epoch": 1.41, + "learning_rate": 1.1451975249833648e-06, + "loss": 0.5413, + "step": 55014 + }, + { + "epoch": 1.41, + "learning_rate": 1.1451701477063233e-06, + "loss": 0.5547, + "step": 55015 + }, + { + "epoch": 1.41, + "learning_rate": 1.145142770318132e-06, + "loss": 0.6069, + "step": 55016 + }, + { + "epoch": 1.41, + "learning_rate": 1.145115392818811e-06, + "loss": 0.519, + "step": 55017 + }, + { + "epoch": 1.41, + "learning_rate": 1.1450880152083825e-06, + "loss": 0.6758, + "step": 55018 + }, + { + "epoch": 1.41, + "learning_rate": 1.1450606374868662e-06, + "loss": 0.5522, + "step": 55019 + }, + { + "epoch": 1.41, + "learning_rate": 1.1450332596542837e-06, + "loss": 0.6055, + "step": 55020 + }, + { + "epoch": 1.41, + "learning_rate": 1.1450058817106563e-06, + "loss": 0.5278, + "step": 55021 + }, + { + "epoch": 1.41, + "learning_rate": 1.1449785036560042e-06, + "loss": 0.6006, + "step": 55022 + }, + { + "epoch": 1.41, + "learning_rate": 1.1449511254903487e-06, + "loss": 0.793, + "step": 55023 + }, + { + "epoch": 1.41, + "learning_rate": 1.144923747213711e-06, + "loss": 0.7251, + "step": 55024 + }, + { + "epoch": 1.41, + "learning_rate": 1.1448963688261117e-06, + "loss": 0.5249, + "step": 55025 + }, + { + "epoch": 1.41, + "learning_rate": 1.1448689903275724e-06, + "loss": 0.6416, + "step": 55026 + }, + { + "epoch": 1.41, + "learning_rate": 1.144841611718113e-06, + "loss": 0.7656, + "step": 55027 + }, + { + "epoch": 1.41, + "learning_rate": 1.144814232997755e-06, + "loss": 0.6997, + "step": 55028 + }, + { + "epoch": 1.41, + "learning_rate": 1.1447868541665195e-06, + "loss": 0.6733, + "step": 55029 + }, + { + "epoch": 1.41, + "learning_rate": 1.1447594752244276e-06, + "loss": 0.8545, + "step": 55030 + }, + { + "epoch": 1.41, + "learning_rate": 1.1447320961714998e-06, + "loss": 0.7266, + "step": 55031 + }, + { + "epoch": 1.41, + "learning_rate": 1.1447047170077576e-06, + "loss": 0.666, + "step": 55032 + }, + { + "epoch": 1.41, + "learning_rate": 1.1446773377332212e-06, + "loss": 0.771, + "step": 55033 + }, + { + "epoch": 1.41, + "learning_rate": 1.1446499583479126e-06, + "loss": 0.7842, + "step": 55034 + }, + { + "epoch": 1.41, + "learning_rate": 1.1446225788518515e-06, + "loss": 0.8262, + "step": 55035 + }, + { + "epoch": 1.41, + "learning_rate": 1.14459519924506e-06, + "loss": 0.6704, + "step": 55036 + }, + { + "epoch": 1.41, + "learning_rate": 1.1445678195275584e-06, + "loss": 0.6548, + "step": 55037 + }, + { + "epoch": 1.41, + "learning_rate": 1.1445404396993678e-06, + "loss": 0.6301, + "step": 55038 + }, + { + "epoch": 1.41, + "learning_rate": 1.1445130597605094e-06, + "loss": 0.614, + "step": 55039 + }, + { + "epoch": 1.41, + "learning_rate": 1.1444856797110044e-06, + "loss": 0.7178, + "step": 55040 + }, + { + "epoch": 1.41, + "learning_rate": 1.144458299550873e-06, + "loss": 0.5215, + "step": 55041 + }, + { + "epoch": 1.41, + "learning_rate": 1.1444309192801363e-06, + "loss": 0.5903, + "step": 55042 + }, + { + "epoch": 1.41, + "learning_rate": 1.1444035388988156e-06, + "loss": 0.6816, + "step": 55043 + }, + { + "epoch": 1.41, + "learning_rate": 1.1443761584069315e-06, + "loss": 0.6553, + "step": 55044 + }, + { + "epoch": 1.41, + "learning_rate": 1.1443487778045056e-06, + "loss": 0.5659, + "step": 55045 + }, + { + "epoch": 1.41, + "learning_rate": 1.1443213970915583e-06, + "loss": 0.7002, + "step": 55046 + }, + { + "epoch": 1.41, + "learning_rate": 1.1442940162681112e-06, + "loss": 0.6387, + "step": 55047 + }, + { + "epoch": 1.41, + "learning_rate": 1.1442666353341841e-06, + "loss": 0.7783, + "step": 55048 + }, + { + "epoch": 1.41, + "learning_rate": 1.1442392542897993e-06, + "loss": 0.6445, + "step": 55049 + }, + { + "epoch": 1.41, + "learning_rate": 1.1442118731349766e-06, + "loss": 0.647, + "step": 55050 + }, + { + "epoch": 1.41, + "learning_rate": 1.1441844918697378e-06, + "loss": 0.752, + "step": 55051 + }, + { + "epoch": 1.41, + "learning_rate": 1.1441571104941034e-06, + "loss": 0.6865, + "step": 55052 + }, + { + "epoch": 1.41, + "learning_rate": 1.1441297290080946e-06, + "loss": 0.667, + "step": 55053 + }, + { + "epoch": 1.41, + "learning_rate": 1.1441023474117325e-06, + "loss": 0.688, + "step": 55054 + }, + { + "epoch": 1.41, + "learning_rate": 1.1440749657050377e-06, + "loss": 0.7246, + "step": 55055 + }, + { + "epoch": 1.41, + "learning_rate": 1.1440475838880311e-06, + "loss": 0.6704, + "step": 55056 + }, + { + "epoch": 1.41, + "learning_rate": 1.1440202019607343e-06, + "loss": 0.7627, + "step": 55057 + }, + { + "epoch": 1.41, + "learning_rate": 1.1439928199231675e-06, + "loss": 0.8533, + "step": 55058 + }, + { + "epoch": 1.41, + "learning_rate": 1.1439654377753522e-06, + "loss": 0.6494, + "step": 55059 + }, + { + "epoch": 1.41, + "learning_rate": 1.1439380555173091e-06, + "loss": 0.6777, + "step": 55060 + }, + { + "epoch": 1.41, + "learning_rate": 1.1439106731490594e-06, + "loss": 0.6284, + "step": 55061 + }, + { + "epoch": 1.41, + "learning_rate": 1.1438832906706236e-06, + "loss": 0.6538, + "step": 55062 + }, + { + "epoch": 1.41, + "learning_rate": 1.1438559080820232e-06, + "loss": 0.6797, + "step": 55063 + }, + { + "epoch": 1.41, + "learning_rate": 1.1438285253832792e-06, + "loss": 0.8135, + "step": 55064 + }, + { + "epoch": 1.41, + "learning_rate": 1.1438011425744119e-06, + "loss": 0.6812, + "step": 55065 + }, + { + "epoch": 1.41, + "learning_rate": 1.143773759655443e-06, + "loss": 0.6567, + "step": 55066 + }, + { + "epoch": 1.41, + "learning_rate": 1.1437463766263928e-06, + "loss": 0.4688, + "step": 55067 + }, + { + "epoch": 1.41, + "learning_rate": 1.143718993487283e-06, + "loss": 0.751, + "step": 55068 + }, + { + "epoch": 1.41, + "learning_rate": 1.1436916102381338e-06, + "loss": 0.6506, + "step": 55069 + }, + { + "epoch": 1.41, + "learning_rate": 1.1436642268789667e-06, + "loss": 0.6992, + "step": 55070 + }, + { + "epoch": 1.41, + "learning_rate": 1.1436368434098025e-06, + "loss": 0.6924, + "step": 55071 + }, + { + "epoch": 1.41, + "learning_rate": 1.1436094598306622e-06, + "loss": 0.5957, + "step": 55072 + }, + { + "epoch": 1.41, + "learning_rate": 1.1435820761415667e-06, + "loss": 0.6758, + "step": 55073 + }, + { + "epoch": 1.41, + "learning_rate": 1.143554692342537e-06, + "loss": 0.8691, + "step": 55074 + }, + { + "epoch": 1.41, + "learning_rate": 1.143527308433594e-06, + "loss": 0.6455, + "step": 55075 + }, + { + "epoch": 1.41, + "learning_rate": 1.143499924414759e-06, + "loss": 0.585, + "step": 55076 + }, + { + "epoch": 1.41, + "learning_rate": 1.1434725402860526e-06, + "loss": 0.5159, + "step": 55077 + }, + { + "epoch": 1.41, + "learning_rate": 1.1434451560474957e-06, + "loss": 0.6802, + "step": 55078 + }, + { + "epoch": 1.41, + "learning_rate": 1.1434177716991094e-06, + "loss": 0.9199, + "step": 55079 + }, + { + "epoch": 1.41, + "learning_rate": 1.143390387240915e-06, + "loss": 0.541, + "step": 55080 + }, + { + "epoch": 1.41, + "learning_rate": 1.1433630026729331e-06, + "loss": 0.6528, + "step": 55081 + }, + { + "epoch": 1.41, + "learning_rate": 1.1433356179951846e-06, + "loss": 0.6758, + "step": 55082 + }, + { + "epoch": 1.41, + "learning_rate": 1.1433082332076906e-06, + "loss": 0.5312, + "step": 55083 + }, + { + "epoch": 1.41, + "learning_rate": 1.1432808483104722e-06, + "loss": 0.6846, + "step": 55084 + }, + { + "epoch": 1.41, + "learning_rate": 1.1432534633035501e-06, + "loss": 0.7266, + "step": 55085 + }, + { + "epoch": 1.41, + "learning_rate": 1.1432260781869455e-06, + "loss": 0.8135, + "step": 55086 + }, + { + "epoch": 1.41, + "learning_rate": 1.1431986929606794e-06, + "loss": 0.5584, + "step": 55087 + }, + { + "epoch": 1.41, + "learning_rate": 1.1431713076247725e-06, + "loss": 0.7217, + "step": 55088 + }, + { + "epoch": 1.41, + "learning_rate": 1.1431439221792461e-06, + "loss": 0.6782, + "step": 55089 + }, + { + "epoch": 1.41, + "learning_rate": 1.1431165366241207e-06, + "loss": 0.6842, + "step": 55090 + }, + { + "epoch": 1.41, + "learning_rate": 1.1430891509594178e-06, + "loss": 0.6865, + "step": 55091 + }, + { + "epoch": 1.41, + "learning_rate": 1.143061765185158e-06, + "loss": 0.624, + "step": 55092 + }, + { + "epoch": 1.41, + "learning_rate": 1.1430343793013625e-06, + "loss": 0.6255, + "step": 55093 + }, + { + "epoch": 1.41, + "learning_rate": 1.1430069933080517e-06, + "loss": 0.8008, + "step": 55094 + }, + { + "epoch": 1.41, + "learning_rate": 1.1429796072052472e-06, + "loss": 0.7666, + "step": 55095 + }, + { + "epoch": 1.41, + "learning_rate": 1.1429522209929704e-06, + "loss": 0.6533, + "step": 55096 + }, + { + "epoch": 1.41, + "learning_rate": 1.1429248346712412e-06, + "loss": 0.584, + "step": 55097 + }, + { + "epoch": 1.41, + "learning_rate": 1.1428974482400809e-06, + "loss": 0.7227, + "step": 55098 + }, + { + "epoch": 1.41, + "learning_rate": 1.1428700616995105e-06, + "loss": 0.627, + "step": 55099 + }, + { + "epoch": 1.41, + "learning_rate": 1.1428426750495512e-06, + "loss": 0.7354, + "step": 55100 + }, + { + "epoch": 1.41, + "learning_rate": 1.1428152882902243e-06, + "loss": 0.585, + "step": 55101 + }, + { + "epoch": 1.41, + "learning_rate": 1.1427879014215498e-06, + "loss": 0.5728, + "step": 55102 + }, + { + "epoch": 1.41, + "learning_rate": 1.1427605144435492e-06, + "loss": 0.645, + "step": 55103 + }, + { + "epoch": 1.41, + "learning_rate": 1.1427331273562435e-06, + "loss": 0.6001, + "step": 55104 + }, + { + "epoch": 1.41, + "learning_rate": 1.1427057401596538e-06, + "loss": 0.665, + "step": 55105 + }, + { + "epoch": 1.41, + "learning_rate": 1.1426783528538007e-06, + "loss": 0.6016, + "step": 55106 + }, + { + "epoch": 1.41, + "learning_rate": 1.142650965438705e-06, + "loss": 0.6001, + "step": 55107 + }, + { + "epoch": 1.41, + "learning_rate": 1.1426235779143887e-06, + "loss": 0.5732, + "step": 55108 + }, + { + "epoch": 1.41, + "learning_rate": 1.1425961902808717e-06, + "loss": 0.4312, + "step": 55109 + }, + { + "epoch": 1.41, + "learning_rate": 1.1425688025381755e-06, + "loss": 0.6711, + "step": 55110 + }, + { + "epoch": 1.41, + "learning_rate": 1.1425414146863209e-06, + "loss": 0.3315, + "step": 55111 + }, + { + "epoch": 1.41, + "learning_rate": 1.1425140267253288e-06, + "loss": 0.3545, + "step": 55112 + }, + { + "epoch": 1.41, + "learning_rate": 1.14248663865522e-06, + "loss": 0.6123, + "step": 55113 + }, + { + "epoch": 1.41, + "learning_rate": 1.142459250476016e-06, + "loss": 0.5322, + "step": 55114 + }, + { + "epoch": 1.41, + "learning_rate": 1.1424318621877379e-06, + "loss": 0.5625, + "step": 55115 + }, + { + "epoch": 1.41, + "learning_rate": 1.1424044737904057e-06, + "loss": 0.6387, + "step": 55116 + }, + { + "epoch": 1.41, + "learning_rate": 1.1423770852840411e-06, + "loss": 0.7324, + "step": 55117 + }, + { + "epoch": 1.41, + "learning_rate": 1.142349696668665e-06, + "loss": 0.6904, + "step": 55118 + }, + { + "epoch": 1.41, + "learning_rate": 1.1423223079442981e-06, + "loss": 0.6562, + "step": 55119 + }, + { + "epoch": 1.41, + "learning_rate": 1.142294919110962e-06, + "loss": 0.7061, + "step": 55120 + }, + { + "epoch": 1.41, + "learning_rate": 1.1422675301686767e-06, + "loss": 0.6611, + "step": 55121 + }, + { + "epoch": 1.41, + "learning_rate": 1.142240141117464e-06, + "loss": 0.6953, + "step": 55122 + }, + { + "epoch": 1.41, + "learning_rate": 1.1422127519573444e-06, + "loss": 0.6519, + "step": 55123 + }, + { + "epoch": 1.41, + "learning_rate": 1.142185362688339e-06, + "loss": 0.6875, + "step": 55124 + }, + { + "epoch": 1.41, + "learning_rate": 1.1421579733104689e-06, + "loss": 0.6543, + "step": 55125 + }, + { + "epoch": 1.41, + "learning_rate": 1.142130583823755e-06, + "loss": 0.6577, + "step": 55126 + }, + { + "epoch": 1.41, + "learning_rate": 1.1421031942282182e-06, + "loss": 0.6519, + "step": 55127 + }, + { + "epoch": 1.41, + "learning_rate": 1.1420758045238794e-06, + "loss": 0.4346, + "step": 55128 + }, + { + "epoch": 1.41, + "learning_rate": 1.1420484147107599e-06, + "loss": 0.7349, + "step": 55129 + }, + { + "epoch": 1.41, + "learning_rate": 1.1420210247888804e-06, + "loss": 0.4702, + "step": 55130 + }, + { + "epoch": 1.41, + "learning_rate": 1.1419936347582622e-06, + "loss": 0.4873, + "step": 55131 + }, + { + "epoch": 1.41, + "learning_rate": 1.1419662446189255e-06, + "loss": 0.644, + "step": 55132 + }, + { + "epoch": 1.41, + "learning_rate": 1.1419388543708922e-06, + "loss": 0.501, + "step": 55133 + }, + { + "epoch": 1.41, + "learning_rate": 1.1419114640141822e-06, + "loss": 0.6572, + "step": 55134 + }, + { + "epoch": 1.41, + "learning_rate": 1.141884073548818e-06, + "loss": 0.6978, + "step": 55135 + }, + { + "epoch": 1.41, + "learning_rate": 1.1418566829748191e-06, + "loss": 0.8799, + "step": 55136 + }, + { + "epoch": 1.41, + "learning_rate": 1.1418292922922073e-06, + "loss": 0.6631, + "step": 55137 + }, + { + "epoch": 1.41, + "learning_rate": 1.1418019015010033e-06, + "loss": 0.7393, + "step": 55138 + }, + { + "epoch": 1.41, + "learning_rate": 1.1417745106012279e-06, + "loss": 0.7939, + "step": 55139 + }, + { + "epoch": 1.41, + "learning_rate": 1.1417471195929025e-06, + "loss": 0.5237, + "step": 55140 + }, + { + "epoch": 1.41, + "learning_rate": 1.1417197284760478e-06, + "loss": 0.7529, + "step": 55141 + }, + { + "epoch": 1.41, + "learning_rate": 1.1416923372506845e-06, + "loss": 0.7246, + "step": 55142 + }, + { + "epoch": 1.41, + "learning_rate": 1.1416649459168344e-06, + "loss": 0.5234, + "step": 55143 + }, + { + "epoch": 1.41, + "learning_rate": 1.1416375544745177e-06, + "loss": 0.6318, + "step": 55144 + }, + { + "epoch": 1.41, + "learning_rate": 1.1416101629237557e-06, + "loss": 0.7676, + "step": 55145 + }, + { + "epoch": 1.41, + "learning_rate": 1.1415827712645693e-06, + "loss": 0.6177, + "step": 55146 + }, + { + "epoch": 1.41, + "learning_rate": 1.1415553794969795e-06, + "loss": 0.606, + "step": 55147 + }, + { + "epoch": 1.41, + "learning_rate": 1.1415279876210073e-06, + "loss": 0.4443, + "step": 55148 + }, + { + "epoch": 1.41, + "learning_rate": 1.1415005956366737e-06, + "loss": 0.4619, + "step": 55149 + }, + { + "epoch": 1.41, + "learning_rate": 1.1414732035439994e-06, + "loss": 0.7393, + "step": 55150 + }, + { + "epoch": 1.41, + "learning_rate": 1.1414458113430054e-06, + "loss": 0.5732, + "step": 55151 + }, + { + "epoch": 1.41, + "learning_rate": 1.1414184190337132e-06, + "loss": 0.6699, + "step": 55152 + }, + { + "epoch": 1.41, + "learning_rate": 1.1413910266161432e-06, + "loss": 0.4863, + "step": 55153 + }, + { + "epoch": 1.41, + "learning_rate": 1.1413636340903168e-06, + "loss": 0.5259, + "step": 55154 + }, + { + "epoch": 1.41, + "learning_rate": 1.1413362414562548e-06, + "loss": 0.7646, + "step": 55155 + }, + { + "epoch": 1.41, + "learning_rate": 1.141308848713978e-06, + "loss": 0.7393, + "step": 55156 + }, + { + "epoch": 1.41, + "learning_rate": 1.1412814558635073e-06, + "loss": 0.6396, + "step": 55157 + }, + { + "epoch": 1.41, + "learning_rate": 1.1412540629048641e-06, + "loss": 0.7207, + "step": 55158 + }, + { + "epoch": 1.41, + "learning_rate": 1.141226669838069e-06, + "loss": 0.7852, + "step": 55159 + }, + { + "epoch": 1.41, + "learning_rate": 1.1411992766631437e-06, + "loss": 0.6772, + "step": 55160 + }, + { + "epoch": 1.41, + "learning_rate": 1.141171883380108e-06, + "loss": 0.5605, + "step": 55161 + }, + { + "epoch": 1.41, + "learning_rate": 1.1411444899889837e-06, + "loss": 0.6304, + "step": 55162 + }, + { + "epoch": 1.41, + "learning_rate": 1.1411170964897917e-06, + "loss": 0.8525, + "step": 55163 + }, + { + "epoch": 1.41, + "learning_rate": 1.1410897028825525e-06, + "loss": 0.7188, + "step": 55164 + }, + { + "epoch": 1.41, + "learning_rate": 1.1410623091672877e-06, + "loss": 0.7236, + "step": 55165 + }, + { + "epoch": 1.41, + "learning_rate": 1.141034915344018e-06, + "loss": 0.7402, + "step": 55166 + }, + { + "epoch": 1.41, + "learning_rate": 1.1410075214127638e-06, + "loss": 0.7026, + "step": 55167 + }, + { + "epoch": 1.41, + "learning_rate": 1.140980127373547e-06, + "loss": 0.6016, + "step": 55168 + }, + { + "epoch": 1.41, + "learning_rate": 1.1409527332263881e-06, + "loss": 0.4503, + "step": 55169 + }, + { + "epoch": 1.41, + "learning_rate": 1.1409253389713085e-06, + "loss": 0.353, + "step": 55170 + }, + { + "epoch": 1.41, + "learning_rate": 1.1408979446083286e-06, + "loss": 0.6431, + "step": 55171 + }, + { + "epoch": 1.41, + "learning_rate": 1.1408705501374695e-06, + "loss": 0.7959, + "step": 55172 + }, + { + "epoch": 1.41, + "learning_rate": 1.1408431555587526e-06, + "loss": 0.75, + "step": 55173 + }, + { + "epoch": 1.41, + "learning_rate": 1.1408157608721982e-06, + "loss": 0.5132, + "step": 55174 + }, + { + "epoch": 1.41, + "learning_rate": 1.1407883660778284e-06, + "loss": 0.5132, + "step": 55175 + }, + { + "epoch": 1.41, + "learning_rate": 1.1407609711756627e-06, + "loss": 0.6201, + "step": 55176 + }, + { + "epoch": 1.41, + "learning_rate": 1.140733576165723e-06, + "loss": 0.4622, + "step": 55177 + }, + { + "epoch": 1.41, + "learning_rate": 1.1407061810480298e-06, + "loss": 0.7026, + "step": 55178 + }, + { + "epoch": 1.41, + "learning_rate": 1.140678785822605e-06, + "loss": 0.6196, + "step": 55179 + }, + { + "epoch": 1.41, + "learning_rate": 1.1406513904894684e-06, + "loss": 0.7939, + "step": 55180 + }, + { + "epoch": 1.41, + "learning_rate": 1.1406239950486415e-06, + "loss": 0.5317, + "step": 55181 + }, + { + "epoch": 1.41, + "learning_rate": 1.1405965995001454e-06, + "loss": 0.7246, + "step": 55182 + }, + { + "epoch": 1.41, + "learning_rate": 1.1405692038440011e-06, + "loss": 0.6484, + "step": 55183 + }, + { + "epoch": 1.41, + "learning_rate": 1.1405418080802292e-06, + "loss": 0.564, + "step": 55184 + }, + { + "epoch": 1.41, + "learning_rate": 1.1405144122088511e-06, + "loss": 0.5211, + "step": 55185 + }, + { + "epoch": 1.41, + "learning_rate": 1.1404870162298873e-06, + "loss": 0.71, + "step": 55186 + }, + { + "epoch": 1.41, + "learning_rate": 1.1404596201433595e-06, + "loss": 0.6987, + "step": 55187 + }, + { + "epoch": 1.41, + "learning_rate": 1.1404322239492876e-06, + "loss": 0.834, + "step": 55188 + }, + { + "epoch": 1.41, + "learning_rate": 1.1404048276476937e-06, + "loss": 0.7031, + "step": 55189 + }, + { + "epoch": 1.41, + "learning_rate": 1.140377431238598e-06, + "loss": 0.5894, + "step": 55190 + }, + { + "epoch": 1.41, + "learning_rate": 1.1403500347220218e-06, + "loss": 0.5405, + "step": 55191 + }, + { + "epoch": 1.41, + "learning_rate": 1.1403226380979863e-06, + "loss": 0.6689, + "step": 55192 + }, + { + "epoch": 1.41, + "learning_rate": 1.140295241366512e-06, + "loss": 0.7695, + "step": 55193 + }, + { + "epoch": 1.41, + "learning_rate": 1.14026784452762e-06, + "loss": 0.6313, + "step": 55194 + }, + { + "epoch": 1.41, + "learning_rate": 1.1402404475813314e-06, + "loss": 0.4775, + "step": 55195 + }, + { + "epoch": 1.41, + "learning_rate": 1.1402130505276672e-06, + "loss": 0.7246, + "step": 55196 + }, + { + "epoch": 1.41, + "learning_rate": 1.1401856533666482e-06, + "loss": 0.4802, + "step": 55197 + }, + { + "epoch": 1.41, + "learning_rate": 1.1401582560982957e-06, + "loss": 0.7144, + "step": 55198 + }, + { + "epoch": 1.41, + "learning_rate": 1.14013085872263e-06, + "loss": 0.8066, + "step": 55199 + }, + { + "epoch": 1.41, + "learning_rate": 1.1401034612396733e-06, + "loss": 0.6943, + "step": 55200 + }, + { + "epoch": 1.41, + "learning_rate": 1.1400760636494453e-06, + "loss": 0.6055, + "step": 55201 + }, + { + "epoch": 1.41, + "learning_rate": 1.1400486659519678e-06, + "loss": 0.5898, + "step": 55202 + }, + { + "epoch": 1.41, + "learning_rate": 1.140021268147261e-06, + "loss": 0.7676, + "step": 55203 + }, + { + "epoch": 1.41, + "learning_rate": 1.139993870235347e-06, + "loss": 0.6431, + "step": 55204 + }, + { + "epoch": 1.41, + "learning_rate": 1.1399664722162456e-06, + "loss": 0.4868, + "step": 55205 + }, + { + "epoch": 1.41, + "learning_rate": 1.1399390740899786e-06, + "loss": 0.7119, + "step": 55206 + }, + { + "epoch": 1.41, + "learning_rate": 1.1399116758565665e-06, + "loss": 0.6016, + "step": 55207 + }, + { + "epoch": 1.42, + "learning_rate": 1.1398842775160306e-06, + "loss": 0.689, + "step": 55208 + }, + { + "epoch": 1.42, + "learning_rate": 1.1398568790683916e-06, + "loss": 0.5813, + "step": 55209 + }, + { + "epoch": 1.42, + "learning_rate": 1.139829480513671e-06, + "loss": 0.7871, + "step": 55210 + }, + { + "epoch": 1.42, + "learning_rate": 1.1398020818518889e-06, + "loss": 0.7266, + "step": 55211 + }, + { + "epoch": 1.42, + "learning_rate": 1.139774683083067e-06, + "loss": 0.5682, + "step": 55212 + }, + { + "epoch": 1.42, + "learning_rate": 1.139747284207226e-06, + "loss": 0.7166, + "step": 55213 + }, + { + "epoch": 1.42, + "learning_rate": 1.139719885224387e-06, + "loss": 0.6177, + "step": 55214 + }, + { + "epoch": 1.42, + "learning_rate": 1.139692486134571e-06, + "loss": 0.8633, + "step": 55215 + }, + { + "epoch": 1.42, + "learning_rate": 1.1396650869377985e-06, + "loss": 0.5269, + "step": 55216 + }, + { + "epoch": 1.42, + "learning_rate": 1.1396376876340913e-06, + "loss": 0.6396, + "step": 55217 + }, + { + "epoch": 1.42, + "learning_rate": 1.1396102882234694e-06, + "loss": 0.6626, + "step": 55218 + }, + { + "epoch": 1.42, + "learning_rate": 1.1395828887059548e-06, + "loss": 0.6953, + "step": 55219 + }, + { + "epoch": 1.42, + "learning_rate": 1.1395554890815679e-06, + "loss": 0.7402, + "step": 55220 + }, + { + "epoch": 1.42, + "learning_rate": 1.1395280893503299e-06, + "loss": 0.571, + "step": 55221 + }, + { + "epoch": 1.42, + "learning_rate": 1.1395006895122615e-06, + "loss": 0.6914, + "step": 55222 + }, + { + "epoch": 1.42, + "learning_rate": 1.1394732895673838e-06, + "loss": 0.6328, + "step": 55223 + }, + { + "epoch": 1.42, + "learning_rate": 1.1394458895157177e-06, + "loss": 0.5762, + "step": 55224 + }, + { + "epoch": 1.42, + "learning_rate": 1.139418489357285e-06, + "loss": 0.8047, + "step": 55225 + }, + { + "epoch": 1.42, + "learning_rate": 1.1393910890921051e-06, + "loss": 0.6382, + "step": 55226 + }, + { + "epoch": 1.42, + "learning_rate": 1.1393636887202002e-06, + "loss": 0.6953, + "step": 55227 + }, + { + "epoch": 1.42, + "learning_rate": 1.139336288241591e-06, + "loss": 0.7129, + "step": 55228 + }, + { + "epoch": 1.42, + "learning_rate": 1.1393088876562983e-06, + "loss": 0.6855, + "step": 55229 + }, + { + "epoch": 1.42, + "learning_rate": 1.1392814869643432e-06, + "loss": 0.584, + "step": 55230 + }, + { + "epoch": 1.42, + "learning_rate": 1.1392540861657467e-06, + "loss": 0.7412, + "step": 55231 + }, + { + "epoch": 1.42, + "learning_rate": 1.1392266852605297e-06, + "loss": 0.6205, + "step": 55232 + }, + { + "epoch": 1.42, + "learning_rate": 1.1391992842487132e-06, + "loss": 0.7139, + "step": 55233 + }, + { + "epoch": 1.42, + "learning_rate": 1.1391718831303184e-06, + "loss": 0.5625, + "step": 55234 + }, + { + "epoch": 1.42, + "learning_rate": 1.139144481905366e-06, + "loss": 0.5859, + "step": 55235 + }, + { + "epoch": 1.42, + "learning_rate": 1.139117080573877e-06, + "loss": 0.6582, + "step": 55236 + }, + { + "epoch": 1.42, + "learning_rate": 1.1390896791358723e-06, + "loss": 0.6045, + "step": 55237 + }, + { + "epoch": 1.42, + "learning_rate": 1.1390622775913735e-06, + "loss": 0.6128, + "step": 55238 + }, + { + "epoch": 1.42, + "learning_rate": 1.1390348759404008e-06, + "loss": 0.7471, + "step": 55239 + }, + { + "epoch": 1.42, + "learning_rate": 1.1390074741829757e-06, + "loss": 0.5439, + "step": 55240 + }, + { + "epoch": 1.42, + "learning_rate": 1.1389800723191185e-06, + "loss": 0.7358, + "step": 55241 + }, + { + "epoch": 1.42, + "learning_rate": 1.138952670348851e-06, + "loss": 0.6182, + "step": 55242 + }, + { + "epoch": 1.42, + "learning_rate": 1.1389252682721934e-06, + "loss": 0.7568, + "step": 55243 + }, + { + "epoch": 1.42, + "learning_rate": 1.1388978660891677e-06, + "loss": 0.6357, + "step": 55244 + }, + { + "epoch": 1.42, + "learning_rate": 1.138870463799794e-06, + "loss": 0.7822, + "step": 55245 + }, + { + "epoch": 1.42, + "learning_rate": 1.1388430614040938e-06, + "loss": 0.7773, + "step": 55246 + }, + { + "epoch": 1.42, + "learning_rate": 1.1388156589020876e-06, + "loss": 0.6494, + "step": 55247 + }, + { + "epoch": 1.42, + "learning_rate": 1.1387882562937967e-06, + "loss": 0.6855, + "step": 55248 + }, + { + "epoch": 1.42, + "learning_rate": 1.138760853579242e-06, + "loss": 0.8262, + "step": 55249 + }, + { + "epoch": 1.42, + "learning_rate": 1.1387334507584447e-06, + "loss": 0.7266, + "step": 55250 + }, + { + "epoch": 1.42, + "learning_rate": 1.1387060478314251e-06, + "loss": 0.6382, + "step": 55251 + }, + { + "epoch": 1.42, + "learning_rate": 1.1386786447982053e-06, + "loss": 0.5728, + "step": 55252 + }, + { + "epoch": 1.42, + "learning_rate": 1.138651241658805e-06, + "loss": 0.665, + "step": 55253 + }, + { + "epoch": 1.42, + "learning_rate": 1.1386238384132463e-06, + "loss": 0.625, + "step": 55254 + }, + { + "epoch": 1.42, + "learning_rate": 1.1385964350615495e-06, + "loss": 0.6616, + "step": 55255 + }, + { + "epoch": 1.42, + "learning_rate": 1.138569031603736e-06, + "loss": 0.5361, + "step": 55256 + }, + { + "epoch": 1.42, + "learning_rate": 1.1385416280398262e-06, + "loss": 0.7227, + "step": 55257 + }, + { + "epoch": 1.42, + "learning_rate": 1.1385142243698416e-06, + "loss": 0.8789, + "step": 55258 + }, + { + "epoch": 1.42, + "learning_rate": 1.138486820593803e-06, + "loss": 0.6377, + "step": 55259 + }, + { + "epoch": 1.42, + "learning_rate": 1.1384594167117314e-06, + "loss": 0.5669, + "step": 55260 + }, + { + "epoch": 1.42, + "learning_rate": 1.138432012723648e-06, + "loss": 0.5771, + "step": 55261 + }, + { + "epoch": 1.42, + "learning_rate": 1.138404608629573e-06, + "loss": 0.9062, + "step": 55262 + }, + { + "epoch": 1.42, + "learning_rate": 1.1383772044295286e-06, + "loss": 0.6543, + "step": 55263 + }, + { + "epoch": 1.42, + "learning_rate": 1.1383498001235347e-06, + "loss": 0.6782, + "step": 55264 + }, + { + "epoch": 1.42, + "learning_rate": 1.1383223957116133e-06, + "loss": 0.6567, + "step": 55265 + }, + { + "epoch": 1.42, + "learning_rate": 1.1382949911937843e-06, + "loss": 0.6543, + "step": 55266 + }, + { + "epoch": 1.42, + "learning_rate": 1.1382675865700692e-06, + "loss": 0.6201, + "step": 55267 + }, + { + "epoch": 1.42, + "learning_rate": 1.138240181840489e-06, + "loss": 0.7275, + "step": 55268 + }, + { + "epoch": 1.42, + "learning_rate": 1.1382127770050649e-06, + "loss": 0.6802, + "step": 55269 + }, + { + "epoch": 1.42, + "learning_rate": 1.1381853720638174e-06, + "loss": 0.7334, + "step": 55270 + }, + { + "epoch": 1.42, + "learning_rate": 1.1381579670167677e-06, + "loss": 0.627, + "step": 55271 + }, + { + "epoch": 1.42, + "learning_rate": 1.138130561863937e-06, + "loss": 0.4626, + "step": 55272 + }, + { + "epoch": 1.42, + "learning_rate": 1.1381031566053458e-06, + "loss": 0.6143, + "step": 55273 + }, + { + "epoch": 1.42, + "learning_rate": 1.1380757512410156e-06, + "loss": 0.5205, + "step": 55274 + }, + { + "epoch": 1.42, + "learning_rate": 1.1380483457709674e-06, + "loss": 0.5388, + "step": 55275 + }, + { + "epoch": 1.42, + "learning_rate": 1.1380209401952213e-06, + "loss": 0.5803, + "step": 55276 + }, + { + "epoch": 1.42, + "learning_rate": 1.1379935345137992e-06, + "loss": 0.4988, + "step": 55277 + }, + { + "epoch": 1.42, + "learning_rate": 1.1379661287267218e-06, + "loss": 0.6257, + "step": 55278 + }, + { + "epoch": 1.42, + "learning_rate": 1.13793872283401e-06, + "loss": 0.6816, + "step": 55279 + }, + { + "epoch": 1.42, + "learning_rate": 1.1379113168356852e-06, + "loss": 0.679, + "step": 55280 + }, + { + "epoch": 1.42, + "learning_rate": 1.1378839107317675e-06, + "loss": 0.6499, + "step": 55281 + }, + { + "epoch": 1.42, + "learning_rate": 1.1378565045222787e-06, + "loss": 0.6162, + "step": 55282 + }, + { + "epoch": 1.42, + "learning_rate": 1.1378290982072396e-06, + "loss": 0.6787, + "step": 55283 + }, + { + "epoch": 1.42, + "learning_rate": 1.1378016917866709e-06, + "loss": 0.6172, + "step": 55284 + }, + { + "epoch": 1.42, + "learning_rate": 1.137774285260594e-06, + "loss": 0.542, + "step": 55285 + }, + { + "epoch": 1.42, + "learning_rate": 1.1377468786290297e-06, + "loss": 0.709, + "step": 55286 + }, + { + "epoch": 1.42, + "learning_rate": 1.1377194718919985e-06, + "loss": 0.7012, + "step": 55287 + }, + { + "epoch": 1.42, + "learning_rate": 1.1376920650495222e-06, + "loss": 0.4895, + "step": 55288 + }, + { + "epoch": 1.42, + "learning_rate": 1.1376646581016213e-06, + "loss": 0.7246, + "step": 55289 + }, + { + "epoch": 1.42, + "learning_rate": 1.1376372510483171e-06, + "loss": 0.9531, + "step": 55290 + }, + { + "epoch": 1.42, + "learning_rate": 1.1376098438896302e-06, + "loss": 0.5972, + "step": 55291 + }, + { + "epoch": 1.42, + "learning_rate": 1.137582436625582e-06, + "loss": 0.7861, + "step": 55292 + }, + { + "epoch": 1.42, + "learning_rate": 1.1375550292561929e-06, + "loss": 0.6738, + "step": 55293 + }, + { + "epoch": 1.42, + "learning_rate": 1.1375276217814845e-06, + "loss": 0.6406, + "step": 55294 + }, + { + "epoch": 1.42, + "learning_rate": 1.1375002142014776e-06, + "loss": 0.6023, + "step": 55295 + }, + { + "epoch": 1.42, + "learning_rate": 1.1374728065161928e-06, + "loss": 0.5544, + "step": 55296 + }, + { + "epoch": 1.42, + "learning_rate": 1.1374453987256517e-06, + "loss": 0.6602, + "step": 55297 + }, + { + "epoch": 1.42, + "learning_rate": 1.1374179908298748e-06, + "loss": 0.6836, + "step": 55298 + }, + { + "epoch": 1.42, + "learning_rate": 1.137390582828883e-06, + "loss": 0.6943, + "step": 55299 + }, + { + "epoch": 1.42, + "learning_rate": 1.1373631747226982e-06, + "loss": 0.6064, + "step": 55300 + }, + { + "epoch": 1.42, + "learning_rate": 1.13733576651134e-06, + "loss": 0.6836, + "step": 55301 + }, + { + "epoch": 1.42, + "learning_rate": 1.1373083581948306e-06, + "loss": 0.5132, + "step": 55302 + }, + { + "epoch": 1.42, + "learning_rate": 1.1372809497731902e-06, + "loss": 0.5343, + "step": 55303 + }, + { + "epoch": 1.42, + "learning_rate": 1.1372535412464407e-06, + "loss": 0.6934, + "step": 55304 + }, + { + "epoch": 1.42, + "learning_rate": 1.137226132614602e-06, + "loss": 0.4474, + "step": 55305 + }, + { + "epoch": 1.42, + "learning_rate": 1.1371987238776953e-06, + "loss": 0.7012, + "step": 55306 + }, + { + "epoch": 1.42, + "learning_rate": 1.1371713150357422e-06, + "loss": 0.7744, + "step": 55307 + }, + { + "epoch": 1.42, + "learning_rate": 1.1371439060887632e-06, + "loss": 0.7529, + "step": 55308 + }, + { + "epoch": 1.42, + "learning_rate": 1.1371164970367798e-06, + "loss": 0.5142, + "step": 55309 + }, + { + "epoch": 1.42, + "learning_rate": 1.1370890878798123e-06, + "loss": 0.7705, + "step": 55310 + }, + { + "epoch": 1.42, + "learning_rate": 1.137061678617882e-06, + "loss": 0.6836, + "step": 55311 + }, + { + "epoch": 1.42, + "learning_rate": 1.1370342692510097e-06, + "loss": 0.6338, + "step": 55312 + }, + { + "epoch": 1.42, + "learning_rate": 1.1370068597792168e-06, + "loss": 0.7213, + "step": 55313 + }, + { + "epoch": 1.42, + "learning_rate": 1.1369794502025237e-06, + "loss": 0.6445, + "step": 55314 + }, + { + "epoch": 1.42, + "learning_rate": 1.1369520405209525e-06, + "loss": 0.6069, + "step": 55315 + }, + { + "epoch": 1.42, + "learning_rate": 1.1369246307345227e-06, + "loss": 0.6846, + "step": 55316 + }, + { + "epoch": 1.42, + "learning_rate": 1.1368972208432564e-06, + "loss": 0.793, + "step": 55317 + }, + { + "epoch": 1.42, + "learning_rate": 1.1368698108471738e-06, + "loss": 0.8145, + "step": 55318 + }, + { + "epoch": 1.42, + "learning_rate": 1.1368424007462967e-06, + "loss": 0.5603, + "step": 55319 + }, + { + "epoch": 1.42, + "learning_rate": 1.1368149905406455e-06, + "loss": 0.6924, + "step": 55320 + }, + { + "epoch": 1.42, + "learning_rate": 1.1367875802302413e-06, + "loss": 0.5765, + "step": 55321 + }, + { + "epoch": 1.42, + "learning_rate": 1.136760169815105e-06, + "loss": 0.6454, + "step": 55322 + }, + { + "epoch": 1.42, + "learning_rate": 1.136732759295258e-06, + "loss": 0.5938, + "step": 55323 + }, + { + "epoch": 1.42, + "learning_rate": 1.1367053486707207e-06, + "loss": 0.6621, + "step": 55324 + }, + { + "epoch": 1.42, + "learning_rate": 1.1366779379415148e-06, + "loss": 0.6895, + "step": 55325 + }, + { + "epoch": 1.42, + "learning_rate": 1.1366505271076607e-06, + "loss": 0.5234, + "step": 55326 + }, + { + "epoch": 1.42, + "learning_rate": 1.1366231161691794e-06, + "loss": 0.6174, + "step": 55327 + }, + { + "epoch": 1.42, + "learning_rate": 1.1365957051260923e-06, + "loss": 0.6277, + "step": 55328 + }, + { + "epoch": 1.42, + "learning_rate": 1.1365682939784202e-06, + "loss": 0.7539, + "step": 55329 + }, + { + "epoch": 1.42, + "learning_rate": 1.136540882726184e-06, + "loss": 0.5649, + "step": 55330 + }, + { + "epoch": 1.42, + "learning_rate": 1.1365134713694045e-06, + "loss": 0.4976, + "step": 55331 + }, + { + "epoch": 1.42, + "learning_rate": 1.136486059908103e-06, + "loss": 0.751, + "step": 55332 + }, + { + "epoch": 1.42, + "learning_rate": 1.1364586483423004e-06, + "loss": 0.7266, + "step": 55333 + }, + { + "epoch": 1.42, + "learning_rate": 1.136431236672018e-06, + "loss": 0.6499, + "step": 55334 + }, + { + "epoch": 1.42, + "learning_rate": 1.1364038248972761e-06, + "loss": 0.6113, + "step": 55335 + }, + { + "epoch": 1.42, + "learning_rate": 1.1363764130180961e-06, + "loss": 0.624, + "step": 55336 + }, + { + "epoch": 1.42, + "learning_rate": 1.1363490010344992e-06, + "loss": 0.6011, + "step": 55337 + }, + { + "epoch": 1.42, + "learning_rate": 1.136321588946506e-06, + "loss": 0.6167, + "step": 55338 + }, + { + "epoch": 1.42, + "learning_rate": 1.1362941767541374e-06, + "loss": 0.6973, + "step": 55339 + }, + { + "epoch": 1.42, + "learning_rate": 1.1362667644574151e-06, + "loss": 0.4526, + "step": 55340 + }, + { + "epoch": 1.42, + "learning_rate": 1.136239352056359e-06, + "loss": 0.7129, + "step": 55341 + }, + { + "epoch": 1.42, + "learning_rate": 1.1362119395509914e-06, + "loss": 0.5728, + "step": 55342 + }, + { + "epoch": 1.42, + "learning_rate": 1.1361845269413319e-06, + "loss": 0.6484, + "step": 55343 + }, + { + "epoch": 1.42, + "learning_rate": 1.1361571142274024e-06, + "loss": 0.6924, + "step": 55344 + }, + { + "epoch": 1.42, + "learning_rate": 1.136129701409224e-06, + "loss": 0.6534, + "step": 55345 + }, + { + "epoch": 1.42, + "learning_rate": 1.136102288486817e-06, + "loss": 0.6206, + "step": 55346 + }, + { + "epoch": 1.42, + "learning_rate": 1.1360748754602028e-06, + "loss": 0.6963, + "step": 55347 + }, + { + "epoch": 1.42, + "learning_rate": 1.1360474623294022e-06, + "loss": 0.7607, + "step": 55348 + }, + { + "epoch": 1.42, + "learning_rate": 1.1360200490944363e-06, + "loss": 0.6638, + "step": 55349 + }, + { + "epoch": 1.42, + "learning_rate": 1.1359926357553265e-06, + "loss": 0.6865, + "step": 55350 + }, + { + "epoch": 1.42, + "learning_rate": 1.135965222312093e-06, + "loss": 0.7266, + "step": 55351 + }, + { + "epoch": 1.42, + "learning_rate": 1.1359378087647574e-06, + "loss": 0.7373, + "step": 55352 + }, + { + "epoch": 1.42, + "learning_rate": 1.1359103951133401e-06, + "loss": 0.6514, + "step": 55353 + }, + { + "epoch": 1.42, + "learning_rate": 1.1358829813578627e-06, + "loss": 0.7046, + "step": 55354 + }, + { + "epoch": 1.42, + "learning_rate": 1.1358555674983464e-06, + "loss": 0.6055, + "step": 55355 + }, + { + "epoch": 1.42, + "learning_rate": 1.135828153534811e-06, + "loss": 0.7119, + "step": 55356 + }, + { + "epoch": 1.42, + "learning_rate": 1.1358007394672789e-06, + "loss": 0.5156, + "step": 55357 + }, + { + "epoch": 1.42, + "learning_rate": 1.1357733252957698e-06, + "loss": 0.8184, + "step": 55358 + }, + { + "epoch": 1.42, + "learning_rate": 1.135745911020306e-06, + "loss": 0.7393, + "step": 55359 + }, + { + "epoch": 1.42, + "learning_rate": 1.1357184966409072e-06, + "loss": 0.6353, + "step": 55360 + }, + { + "epoch": 1.42, + "learning_rate": 1.1356910821575952e-06, + "loss": 0.605, + "step": 55361 + }, + { + "epoch": 1.42, + "learning_rate": 1.1356636675703905e-06, + "loss": 0.6528, + "step": 55362 + }, + { + "epoch": 1.42, + "learning_rate": 1.1356362528793148e-06, + "loss": 0.5413, + "step": 55363 + }, + { + "epoch": 1.42, + "learning_rate": 1.1356088380843885e-06, + "loss": 0.7041, + "step": 55364 + }, + { + "epoch": 1.42, + "learning_rate": 1.1355814231856328e-06, + "loss": 0.645, + "step": 55365 + }, + { + "epoch": 1.42, + "learning_rate": 1.1355540081830686e-06, + "loss": 0.5488, + "step": 55366 + }, + { + "epoch": 1.42, + "learning_rate": 1.1355265930767168e-06, + "loss": 0.7324, + "step": 55367 + }, + { + "epoch": 1.42, + "learning_rate": 1.1354991778665986e-06, + "loss": 0.6382, + "step": 55368 + }, + { + "epoch": 1.42, + "learning_rate": 1.135471762552735e-06, + "loss": 0.6719, + "step": 55369 + }, + { + "epoch": 1.42, + "learning_rate": 1.1354443471351469e-06, + "loss": 0.6855, + "step": 55370 + }, + { + "epoch": 1.42, + "learning_rate": 1.1354169316138548e-06, + "loss": 0.5791, + "step": 55371 + }, + { + "epoch": 1.42, + "learning_rate": 1.1353895159888808e-06, + "loss": 0.6826, + "step": 55372 + }, + { + "epoch": 1.42, + "learning_rate": 1.135362100260245e-06, + "loss": 0.4307, + "step": 55373 + }, + { + "epoch": 1.42, + "learning_rate": 1.1353346844279687e-06, + "loss": 0.6719, + "step": 55374 + }, + { + "epoch": 1.42, + "learning_rate": 1.135307268492073e-06, + "loss": 0.4353, + "step": 55375 + }, + { + "epoch": 1.42, + "learning_rate": 1.135279852452579e-06, + "loss": 0.6572, + "step": 55376 + }, + { + "epoch": 1.42, + "learning_rate": 1.1352524363095067e-06, + "loss": 0.749, + "step": 55377 + }, + { + "epoch": 1.42, + "learning_rate": 1.135225020062878e-06, + "loss": 0.5444, + "step": 55378 + }, + { + "epoch": 1.42, + "learning_rate": 1.135197603712714e-06, + "loss": 0.6133, + "step": 55379 + }, + { + "epoch": 1.42, + "learning_rate": 1.1351701872590355e-06, + "loss": 0.6554, + "step": 55380 + }, + { + "epoch": 1.42, + "learning_rate": 1.1351427707018632e-06, + "loss": 0.7881, + "step": 55381 + }, + { + "epoch": 1.42, + "learning_rate": 1.1351153540412185e-06, + "loss": 0.6553, + "step": 55382 + }, + { + "epoch": 1.42, + "learning_rate": 1.1350879372771218e-06, + "loss": 0.8213, + "step": 55383 + }, + { + "epoch": 1.42, + "learning_rate": 1.1350605204095947e-06, + "loss": 0.7217, + "step": 55384 + }, + { + "epoch": 1.42, + "learning_rate": 1.135033103438658e-06, + "loss": 0.6, + "step": 55385 + }, + { + "epoch": 1.42, + "learning_rate": 1.1350056863643326e-06, + "loss": 0.4761, + "step": 55386 + }, + { + "epoch": 1.42, + "learning_rate": 1.1349782691866397e-06, + "loss": 0.5151, + "step": 55387 + }, + { + "epoch": 1.42, + "learning_rate": 1.1349508519055998e-06, + "loss": 0.4888, + "step": 55388 + }, + { + "epoch": 1.42, + "learning_rate": 1.1349234345212347e-06, + "loss": 0.5691, + "step": 55389 + }, + { + "epoch": 1.42, + "learning_rate": 1.134896017033565e-06, + "loss": 0.583, + "step": 55390 + }, + { + "epoch": 1.42, + "learning_rate": 1.134868599442611e-06, + "loss": 0.6685, + "step": 55391 + }, + { + "epoch": 1.42, + "learning_rate": 1.1348411817483948e-06, + "loss": 0.7275, + "step": 55392 + }, + { + "epoch": 1.42, + "learning_rate": 1.1348137639509365e-06, + "loss": 0.6162, + "step": 55393 + }, + { + "epoch": 1.42, + "learning_rate": 1.1347863460502578e-06, + "loss": 0.6602, + "step": 55394 + }, + { + "epoch": 1.42, + "learning_rate": 1.1347589280463795e-06, + "loss": 0.7559, + "step": 55395 + }, + { + "epoch": 1.42, + "learning_rate": 1.134731509939322e-06, + "loss": 0.7432, + "step": 55396 + }, + { + "epoch": 1.42, + "learning_rate": 1.1347040917291071e-06, + "loss": 0.7686, + "step": 55397 + }, + { + "epoch": 1.42, + "learning_rate": 1.1346766734157554e-06, + "loss": 0.8584, + "step": 55398 + }, + { + "epoch": 1.42, + "learning_rate": 1.134649254999288e-06, + "loss": 0.5938, + "step": 55399 + }, + { + "epoch": 1.42, + "learning_rate": 1.134621836479726e-06, + "loss": 0.7471, + "step": 55400 + }, + { + "epoch": 1.42, + "learning_rate": 1.1345944178570903e-06, + "loss": 0.7412, + "step": 55401 + }, + { + "epoch": 1.42, + "learning_rate": 1.1345669991314014e-06, + "loss": 0.6406, + "step": 55402 + }, + { + "epoch": 1.42, + "learning_rate": 1.1345395803026812e-06, + "loss": 0.7139, + "step": 55403 + }, + { + "epoch": 1.42, + "learning_rate": 1.13451216137095e-06, + "loss": 0.7783, + "step": 55404 + }, + { + "epoch": 1.42, + "learning_rate": 1.1344847423362291e-06, + "loss": 0.6582, + "step": 55405 + }, + { + "epoch": 1.42, + "learning_rate": 1.1344573231985392e-06, + "loss": 0.6128, + "step": 55406 + }, + { + "epoch": 1.42, + "learning_rate": 1.134429903957902e-06, + "loss": 0.5232, + "step": 55407 + }, + { + "epoch": 1.42, + "learning_rate": 1.1344024846143373e-06, + "loss": 0.6626, + "step": 55408 + }, + { + "epoch": 1.42, + "learning_rate": 1.1343750651678677e-06, + "loss": 0.5762, + "step": 55409 + }, + { + "epoch": 1.42, + "learning_rate": 1.1343476456185126e-06, + "loss": 0.6738, + "step": 55410 + }, + { + "epoch": 1.42, + "learning_rate": 1.1343202259662938e-06, + "loss": 0.6768, + "step": 55411 + }, + { + "epoch": 1.42, + "learning_rate": 1.1342928062112323e-06, + "loss": 0.6201, + "step": 55412 + }, + { + "epoch": 1.42, + "learning_rate": 1.134265386353349e-06, + "loss": 0.5245, + "step": 55413 + }, + { + "epoch": 1.42, + "learning_rate": 1.134237966392665e-06, + "loss": 0.6108, + "step": 55414 + }, + { + "epoch": 1.42, + "learning_rate": 1.1342105463292006e-06, + "loss": 0.8262, + "step": 55415 + }, + { + "epoch": 1.42, + "learning_rate": 1.1341831261629777e-06, + "loss": 0.6082, + "step": 55416 + }, + { + "epoch": 1.42, + "learning_rate": 1.134155705894017e-06, + "loss": 0.6636, + "step": 55417 + }, + { + "epoch": 1.42, + "learning_rate": 1.1341282855223393e-06, + "loss": 0.6631, + "step": 55418 + }, + { + "epoch": 1.42, + "learning_rate": 1.134100865047966e-06, + "loss": 0.603, + "step": 55419 + }, + { + "epoch": 1.42, + "learning_rate": 1.1340734444709176e-06, + "loss": 0.6199, + "step": 55420 + }, + { + "epoch": 1.42, + "learning_rate": 1.1340460237912154e-06, + "loss": 0.6294, + "step": 55421 + }, + { + "epoch": 1.42, + "learning_rate": 1.1340186030088804e-06, + "loss": 0.6255, + "step": 55422 + }, + { + "epoch": 1.42, + "learning_rate": 1.1339911821239333e-06, + "loss": 0.626, + "step": 55423 + }, + { + "epoch": 1.42, + "learning_rate": 1.1339637611363956e-06, + "loss": 0.6782, + "step": 55424 + }, + { + "epoch": 1.42, + "learning_rate": 1.1339363400462878e-06, + "loss": 0.7979, + "step": 55425 + }, + { + "epoch": 1.42, + "learning_rate": 1.1339089188536313e-06, + "loss": 0.7334, + "step": 55426 + }, + { + "epoch": 1.42, + "learning_rate": 1.1338814975584465e-06, + "loss": 0.7236, + "step": 55427 + }, + { + "epoch": 1.42, + "learning_rate": 1.1338540761607553e-06, + "loss": 0.7686, + "step": 55428 + }, + { + "epoch": 1.42, + "learning_rate": 1.1338266546605779e-06, + "loss": 0.6807, + "step": 55429 + }, + { + "epoch": 1.42, + "learning_rate": 1.1337992330579357e-06, + "loss": 0.626, + "step": 55430 + }, + { + "epoch": 1.42, + "learning_rate": 1.1337718113528493e-06, + "loss": 0.835, + "step": 55431 + }, + { + "epoch": 1.42, + "learning_rate": 1.1337443895453404e-06, + "loss": 0.583, + "step": 55432 + }, + { + "epoch": 1.42, + "learning_rate": 1.1337169676354292e-06, + "loss": 0.7695, + "step": 55433 + }, + { + "epoch": 1.42, + "learning_rate": 1.1336895456231373e-06, + "loss": 0.4667, + "step": 55434 + }, + { + "epoch": 1.42, + "learning_rate": 1.1336621235084855e-06, + "loss": 0.5947, + "step": 55435 + }, + { + "epoch": 1.42, + "learning_rate": 1.1336347012914946e-06, + "loss": 0.7656, + "step": 55436 + }, + { + "epoch": 1.42, + "learning_rate": 1.1336072789721858e-06, + "loss": 0.5679, + "step": 55437 + }, + { + "epoch": 1.42, + "learning_rate": 1.1335798565505801e-06, + "loss": 0.7158, + "step": 55438 + }, + { + "epoch": 1.42, + "learning_rate": 1.1335524340266983e-06, + "loss": 0.6865, + "step": 55439 + }, + { + "epoch": 1.42, + "learning_rate": 1.1335250114005617e-06, + "loss": 0.6406, + "step": 55440 + }, + { + "epoch": 1.42, + "learning_rate": 1.1334975886721911e-06, + "loss": 0.8467, + "step": 55441 + }, + { + "epoch": 1.42, + "learning_rate": 1.1334701658416072e-06, + "loss": 0.6772, + "step": 55442 + }, + { + "epoch": 1.42, + "learning_rate": 1.133442742908832e-06, + "loss": 0.9326, + "step": 55443 + }, + { + "epoch": 1.42, + "learning_rate": 1.1334153198738854e-06, + "loss": 0.385, + "step": 55444 + }, + { + "epoch": 1.42, + "learning_rate": 1.133387896736789e-06, + "loss": 0.3667, + "step": 55445 + }, + { + "epoch": 1.42, + "learning_rate": 1.1333604734975634e-06, + "loss": 0.8838, + "step": 55446 + }, + { + "epoch": 1.42, + "learning_rate": 1.13333305015623e-06, + "loss": 0.6807, + "step": 55447 + }, + { + "epoch": 1.42, + "learning_rate": 1.1333056267128094e-06, + "loss": 0.8477, + "step": 55448 + }, + { + "epoch": 1.42, + "learning_rate": 1.1332782031673231e-06, + "loss": 0.6514, + "step": 55449 + }, + { + "epoch": 1.42, + "learning_rate": 1.1332507795197916e-06, + "loss": 0.6035, + "step": 55450 + }, + { + "epoch": 1.42, + "learning_rate": 1.1332233557702362e-06, + "loss": 0.7549, + "step": 55451 + }, + { + "epoch": 1.42, + "learning_rate": 1.1331959319186777e-06, + "loss": 0.5557, + "step": 55452 + }, + { + "epoch": 1.42, + "learning_rate": 1.1331685079651373e-06, + "loss": 0.6885, + "step": 55453 + }, + { + "epoch": 1.42, + "learning_rate": 1.1331410839096357e-06, + "loss": 0.6582, + "step": 55454 + }, + { + "epoch": 1.42, + "learning_rate": 1.1331136597521946e-06, + "loss": 0.5869, + "step": 55455 + }, + { + "epoch": 1.42, + "learning_rate": 1.133086235492834e-06, + "loss": 0.5449, + "step": 55456 + }, + { + "epoch": 1.42, + "learning_rate": 1.1330588111315755e-06, + "loss": 0.5659, + "step": 55457 + }, + { + "epoch": 1.42, + "learning_rate": 1.13303138666844e-06, + "loss": 0.4731, + "step": 55458 + }, + { + "epoch": 1.42, + "learning_rate": 1.1330039621034485e-06, + "loss": 0.7811, + "step": 55459 + }, + { + "epoch": 1.42, + "learning_rate": 1.132976537436622e-06, + "loss": 0.5986, + "step": 55460 + }, + { + "epoch": 1.42, + "learning_rate": 1.1329491126679815e-06, + "loss": 0.6079, + "step": 55461 + }, + { + "epoch": 1.42, + "learning_rate": 1.132921687797548e-06, + "loss": 0.6816, + "step": 55462 + }, + { + "epoch": 1.42, + "learning_rate": 1.1328942628253425e-06, + "loss": 0.5293, + "step": 55463 + }, + { + "epoch": 1.42, + "learning_rate": 1.1328668377513858e-06, + "loss": 0.6665, + "step": 55464 + }, + { + "epoch": 1.42, + "learning_rate": 1.1328394125756993e-06, + "loss": 0.5503, + "step": 55465 + }, + { + "epoch": 1.42, + "learning_rate": 1.1328119872983036e-06, + "loss": 0.6855, + "step": 55466 + }, + { + "epoch": 1.42, + "learning_rate": 1.1327845619192198e-06, + "loss": 0.7471, + "step": 55467 + }, + { + "epoch": 1.42, + "learning_rate": 1.132757136438469e-06, + "loss": 0.7119, + "step": 55468 + }, + { + "epoch": 1.42, + "learning_rate": 1.1327297108560724e-06, + "loss": 0.583, + "step": 55469 + }, + { + "epoch": 1.42, + "learning_rate": 1.1327022851720507e-06, + "loss": 0.5781, + "step": 55470 + }, + { + "epoch": 1.42, + "learning_rate": 1.1326748593864248e-06, + "loss": 0.5244, + "step": 55471 + }, + { + "epoch": 1.42, + "learning_rate": 1.132647433499216e-06, + "loss": 0.6758, + "step": 55472 + }, + { + "epoch": 1.42, + "learning_rate": 1.132620007510445e-06, + "loss": 0.6094, + "step": 55473 + }, + { + "epoch": 1.42, + "learning_rate": 1.132592581420133e-06, + "loss": 0.6748, + "step": 55474 + }, + { + "epoch": 1.42, + "learning_rate": 1.132565155228301e-06, + "loss": 0.6909, + "step": 55475 + }, + { + "epoch": 1.42, + "learning_rate": 1.13253772893497e-06, + "loss": 0.8008, + "step": 55476 + }, + { + "epoch": 1.42, + "learning_rate": 1.1325103025401608e-06, + "loss": 0.7095, + "step": 55477 + }, + { + "epoch": 1.42, + "learning_rate": 1.1324828760438946e-06, + "loss": 0.7373, + "step": 55478 + }, + { + "epoch": 1.42, + "learning_rate": 1.1324554494461926e-06, + "loss": 0.6265, + "step": 55479 + }, + { + "epoch": 1.42, + "learning_rate": 1.1324280227470754e-06, + "loss": 0.7236, + "step": 55480 + }, + { + "epoch": 1.42, + "learning_rate": 1.132400595946564e-06, + "loss": 0.6885, + "step": 55481 + }, + { + "epoch": 1.42, + "learning_rate": 1.1323731690446799e-06, + "loss": 0.6533, + "step": 55482 + }, + { + "epoch": 1.42, + "learning_rate": 1.1323457420414433e-06, + "loss": 0.6763, + "step": 55483 + }, + { + "epoch": 1.42, + "learning_rate": 1.132318314936876e-06, + "loss": 0.6992, + "step": 55484 + }, + { + "epoch": 1.42, + "learning_rate": 1.1322908877309988e-06, + "loss": 0.7744, + "step": 55485 + }, + { + "epoch": 1.42, + "learning_rate": 1.132263460423832e-06, + "loss": 0.708, + "step": 55486 + }, + { + "epoch": 1.42, + "learning_rate": 1.1322360330153975e-06, + "loss": 0.8301, + "step": 55487 + }, + { + "epoch": 1.42, + "learning_rate": 1.1322086055057156e-06, + "loss": 0.7275, + "step": 55488 + }, + { + "epoch": 1.42, + "learning_rate": 1.1321811778948083e-06, + "loss": 0.7109, + "step": 55489 + }, + { + "epoch": 1.42, + "learning_rate": 1.1321537501826954e-06, + "loss": 0.707, + "step": 55490 + }, + { + "epoch": 1.42, + "learning_rate": 1.1321263223693986e-06, + "loss": 0.6851, + "step": 55491 + }, + { + "epoch": 1.42, + "learning_rate": 1.1320988944549388e-06, + "loss": 0.7051, + "step": 55492 + }, + { + "epoch": 1.42, + "learning_rate": 1.132071466439337e-06, + "loss": 0.5786, + "step": 55493 + }, + { + "epoch": 1.42, + "learning_rate": 1.132044038322614e-06, + "loss": 0.5562, + "step": 55494 + }, + { + "epoch": 1.42, + "learning_rate": 1.1320166101047911e-06, + "loss": 0.6895, + "step": 55495 + }, + { + "epoch": 1.42, + "learning_rate": 1.1319891817858892e-06, + "loss": 0.5784, + "step": 55496 + }, + { + "epoch": 1.42, + "learning_rate": 1.1319617533659292e-06, + "loss": 0.7363, + "step": 55497 + }, + { + "epoch": 1.42, + "learning_rate": 1.1319343248449318e-06, + "loss": 0.6807, + "step": 55498 + }, + { + "epoch": 1.42, + "learning_rate": 1.131906896222919e-06, + "loss": 0.6013, + "step": 55499 + }, + { + "epoch": 1.42, + "learning_rate": 1.1318794674999107e-06, + "loss": 0.5708, + "step": 55500 + }, + { + "epoch": 1.42, + "learning_rate": 1.1318520386759285e-06, + "loss": 0.7246, + "step": 55501 + }, + { + "epoch": 1.42, + "learning_rate": 1.131824609750993e-06, + "loss": 0.604, + "step": 55502 + }, + { + "epoch": 1.42, + "learning_rate": 1.131797180725126e-06, + "loss": 0.54, + "step": 55503 + }, + { + "epoch": 1.42, + "learning_rate": 1.1317697515983474e-06, + "loss": 0.6206, + "step": 55504 + }, + { + "epoch": 1.42, + "learning_rate": 1.131742322370679e-06, + "loss": 0.5947, + "step": 55505 + }, + { + "epoch": 1.42, + "learning_rate": 1.1317148930421416e-06, + "loss": 0.6885, + "step": 55506 + }, + { + "epoch": 1.42, + "learning_rate": 1.131687463612756e-06, + "loss": 0.7178, + "step": 55507 + }, + { + "epoch": 1.42, + "learning_rate": 1.1316600340825435e-06, + "loss": 0.7979, + "step": 55508 + }, + { + "epoch": 1.42, + "learning_rate": 1.1316326044515249e-06, + "loss": 0.531, + "step": 55509 + }, + { + "epoch": 1.42, + "learning_rate": 1.1316051747197216e-06, + "loss": 0.605, + "step": 55510 + }, + { + "epoch": 1.42, + "learning_rate": 1.1315777448871538e-06, + "loss": 0.6924, + "step": 55511 + }, + { + "epoch": 1.42, + "learning_rate": 1.1315503149538432e-06, + "loss": 0.7139, + "step": 55512 + }, + { + "epoch": 1.42, + "learning_rate": 1.1315228849198103e-06, + "loss": 0.4918, + "step": 55513 + }, + { + "epoch": 1.42, + "learning_rate": 1.1314954547850768e-06, + "loss": 0.4121, + "step": 55514 + }, + { + "epoch": 1.42, + "learning_rate": 1.1314680245496631e-06, + "loss": 0.6289, + "step": 55515 + }, + { + "epoch": 1.42, + "learning_rate": 1.1314405942135903e-06, + "loss": 0.6621, + "step": 55516 + }, + { + "epoch": 1.42, + "learning_rate": 1.1314131637768794e-06, + "loss": 0.791, + "step": 55517 + }, + { + "epoch": 1.42, + "learning_rate": 1.1313857332395518e-06, + "loss": 0.6836, + "step": 55518 + }, + { + "epoch": 1.42, + "learning_rate": 1.131358302601628e-06, + "loss": 0.439, + "step": 55519 + }, + { + "epoch": 1.42, + "learning_rate": 1.1313308718631293e-06, + "loss": 0.7236, + "step": 55520 + }, + { + "epoch": 1.42, + "learning_rate": 1.1313034410240762e-06, + "loss": 0.7275, + "step": 55521 + }, + { + "epoch": 1.42, + "learning_rate": 1.1312760100844906e-06, + "loss": 0.5898, + "step": 55522 + }, + { + "epoch": 1.42, + "learning_rate": 1.1312485790443926e-06, + "loss": 0.7588, + "step": 55523 + }, + { + "epoch": 1.42, + "learning_rate": 1.1312211479038039e-06, + "loss": 0.7549, + "step": 55524 + }, + { + "epoch": 1.42, + "learning_rate": 1.131193716662745e-06, + "loss": 0.3342, + "step": 55525 + }, + { + "epoch": 1.42, + "learning_rate": 1.1311662853212373e-06, + "loss": 0.7344, + "step": 55526 + }, + { + "epoch": 1.42, + "learning_rate": 1.1311388538793014e-06, + "loss": 0.6787, + "step": 55527 + }, + { + "epoch": 1.42, + "learning_rate": 1.1311114223369586e-06, + "loss": 0.5896, + "step": 55528 + }, + { + "epoch": 1.42, + "learning_rate": 1.13108399069423e-06, + "loss": 0.6611, + "step": 55529 + }, + { + "epoch": 1.42, + "learning_rate": 1.131056558951136e-06, + "loss": 0.5566, + "step": 55530 + }, + { + "epoch": 1.42, + "learning_rate": 1.131029127107698e-06, + "loss": 0.6826, + "step": 55531 + }, + { + "epoch": 1.42, + "learning_rate": 1.1310016951639375e-06, + "loss": 0.5249, + "step": 55532 + }, + { + "epoch": 1.42, + "learning_rate": 1.1309742631198746e-06, + "loss": 0.5437, + "step": 55533 + }, + { + "epoch": 1.42, + "learning_rate": 1.130946830975531e-06, + "loss": 0.4716, + "step": 55534 + }, + { + "epoch": 1.42, + "learning_rate": 1.1309193987309275e-06, + "loss": 0.5601, + "step": 55535 + }, + { + "epoch": 1.42, + "learning_rate": 1.1308919663860847e-06, + "loss": 0.709, + "step": 55536 + }, + { + "epoch": 1.42, + "learning_rate": 1.1308645339410244e-06, + "loss": 0.6582, + "step": 55537 + }, + { + "epoch": 1.42, + "learning_rate": 1.1308371013957665e-06, + "loss": 0.5955, + "step": 55538 + }, + { + "epoch": 1.42, + "learning_rate": 1.1308096687503335e-06, + "loss": 0.6992, + "step": 55539 + }, + { + "epoch": 1.42, + "learning_rate": 1.1307822360047448e-06, + "loss": 0.5205, + "step": 55540 + }, + { + "epoch": 1.42, + "learning_rate": 1.1307548031590225e-06, + "loss": 0.7715, + "step": 55541 + }, + { + "epoch": 1.42, + "learning_rate": 1.130727370213187e-06, + "loss": 0.7568, + "step": 55542 + }, + { + "epoch": 1.42, + "learning_rate": 1.13069993716726e-06, + "loss": 0.5444, + "step": 55543 + }, + { + "epoch": 1.42, + "learning_rate": 1.1306725040212616e-06, + "loss": 0.8564, + "step": 55544 + }, + { + "epoch": 1.42, + "learning_rate": 1.1306450707752135e-06, + "loss": 0.7266, + "step": 55545 + }, + { + "epoch": 1.42, + "learning_rate": 1.1306176374291365e-06, + "loss": 0.4856, + "step": 55546 + }, + { + "epoch": 1.42, + "learning_rate": 1.1305902039830516e-06, + "loss": 0.709, + "step": 55547 + }, + { + "epoch": 1.42, + "learning_rate": 1.1305627704369795e-06, + "loss": 0.6885, + "step": 55548 + }, + { + "epoch": 1.42, + "learning_rate": 1.1305353367909419e-06, + "loss": 0.5811, + "step": 55549 + }, + { + "epoch": 1.42, + "learning_rate": 1.1305079030449594e-06, + "loss": 0.5513, + "step": 55550 + }, + { + "epoch": 1.42, + "learning_rate": 1.1304804691990523e-06, + "loss": 0.6777, + "step": 55551 + }, + { + "epoch": 1.42, + "learning_rate": 1.1304530352532432e-06, + "loss": 0.8369, + "step": 55552 + }, + { + "epoch": 1.42, + "learning_rate": 1.1304256012075517e-06, + "loss": 0.6982, + "step": 55553 + }, + { + "epoch": 1.42, + "learning_rate": 1.1303981670619995e-06, + "loss": 0.6714, + "step": 55554 + }, + { + "epoch": 1.42, + "learning_rate": 1.1303707328166072e-06, + "loss": 0.6201, + "step": 55555 + }, + { + "epoch": 1.42, + "learning_rate": 1.1303432984713962e-06, + "loss": 0.5425, + "step": 55556 + }, + { + "epoch": 1.42, + "learning_rate": 1.1303158640263871e-06, + "loss": 0.5679, + "step": 55557 + }, + { + "epoch": 1.42, + "learning_rate": 1.1302884294816016e-06, + "loss": 0.5952, + "step": 55558 + }, + { + "epoch": 1.42, + "learning_rate": 1.1302609948370602e-06, + "loss": 0.728, + "step": 55559 + }, + { + "epoch": 1.42, + "learning_rate": 1.1302335600927838e-06, + "loss": 0.5269, + "step": 55560 + }, + { + "epoch": 1.42, + "learning_rate": 1.1302061252487934e-06, + "loss": 0.7275, + "step": 55561 + }, + { + "epoch": 1.42, + "learning_rate": 1.1301786903051104e-06, + "loss": 0.5591, + "step": 55562 + }, + { + "epoch": 1.42, + "learning_rate": 1.1301512552617549e-06, + "loss": 0.4902, + "step": 55563 + }, + { + "epoch": 1.42, + "learning_rate": 1.1301238201187496e-06, + "loss": 0.6553, + "step": 55564 + }, + { + "epoch": 1.42, + "learning_rate": 1.1300963848761135e-06, + "loss": 0.5068, + "step": 55565 + }, + { + "epoch": 1.42, + "learning_rate": 1.1300689495338693e-06, + "loss": 0.4978, + "step": 55566 + }, + { + "epoch": 1.42, + "learning_rate": 1.1300415140920367e-06, + "loss": 0.5459, + "step": 55567 + }, + { + "epoch": 1.42, + "learning_rate": 1.1300140785506377e-06, + "loss": 0.5332, + "step": 55568 + }, + { + "epoch": 1.42, + "learning_rate": 1.1299866429096929e-06, + "loss": 0.6348, + "step": 55569 + }, + { + "epoch": 1.42, + "learning_rate": 1.1299592071692231e-06, + "loss": 0.6841, + "step": 55570 + }, + { + "epoch": 1.42, + "learning_rate": 1.1299317713292497e-06, + "loss": 0.5483, + "step": 55571 + }, + { + "epoch": 1.42, + "learning_rate": 1.1299043353897935e-06, + "loss": 0.6338, + "step": 55572 + }, + { + "epoch": 1.42, + "learning_rate": 1.1298768993508753e-06, + "loss": 0.6621, + "step": 55573 + }, + { + "epoch": 1.42, + "learning_rate": 1.1298494632125167e-06, + "loss": 0.5867, + "step": 55574 + }, + { + "epoch": 1.42, + "learning_rate": 1.129822026974738e-06, + "loss": 0.7178, + "step": 55575 + }, + { + "epoch": 1.42, + "learning_rate": 1.1297945906375605e-06, + "loss": 0.7178, + "step": 55576 + }, + { + "epoch": 1.42, + "learning_rate": 1.1297671542010056e-06, + "loss": 0.6167, + "step": 55577 + }, + { + "epoch": 1.42, + "learning_rate": 1.1297397176650936e-06, + "loss": 0.6924, + "step": 55578 + }, + { + "epoch": 1.42, + "learning_rate": 1.1297122810298464e-06, + "loss": 0.7275, + "step": 55579 + }, + { + "epoch": 1.42, + "learning_rate": 1.129684844295284e-06, + "loss": 0.4966, + "step": 55580 + }, + { + "epoch": 1.42, + "learning_rate": 1.1296574074614281e-06, + "loss": 0.752, + "step": 55581 + }, + { + "epoch": 1.42, + "learning_rate": 1.129629970528299e-06, + "loss": 0.7207, + "step": 55582 + }, + { + "epoch": 1.42, + "learning_rate": 1.1296025334959187e-06, + "loss": 0.6768, + "step": 55583 + }, + { + "epoch": 1.42, + "learning_rate": 1.1295750963643076e-06, + "loss": 0.6357, + "step": 55584 + }, + { + "epoch": 1.42, + "learning_rate": 1.129547659133487e-06, + "loss": 0.5234, + "step": 55585 + }, + { + "epoch": 1.42, + "learning_rate": 1.1295202218034772e-06, + "loss": 0.7412, + "step": 55586 + }, + { + "epoch": 1.42, + "learning_rate": 1.1294927843743e-06, + "loss": 0.4834, + "step": 55587 + }, + { + "epoch": 1.42, + "learning_rate": 1.129465346845976e-06, + "loss": 0.7637, + "step": 55588 + }, + { + "epoch": 1.42, + "learning_rate": 1.1294379092185268e-06, + "loss": 0.6592, + "step": 55589 + }, + { + "epoch": 1.42, + "learning_rate": 1.1294104714919725e-06, + "loss": 0.5864, + "step": 55590 + }, + { + "epoch": 1.42, + "learning_rate": 1.1293830336663349e-06, + "loss": 0.7715, + "step": 55591 + }, + { + "epoch": 1.42, + "learning_rate": 1.1293555957416342e-06, + "loss": 0.7207, + "step": 55592 + }, + { + "epoch": 1.42, + "learning_rate": 1.129328157717892e-06, + "loss": 0.7104, + "step": 55593 + }, + { + "epoch": 1.42, + "learning_rate": 1.1293007195951295e-06, + "loss": 0.5537, + "step": 55594 + }, + { + "epoch": 1.42, + "learning_rate": 1.129273281373367e-06, + "loss": 0.5415, + "step": 55595 + }, + { + "epoch": 1.42, + "learning_rate": 1.1292458430526262e-06, + "loss": 0.4839, + "step": 55596 + }, + { + "epoch": 1.42, + "learning_rate": 1.1292184046329273e-06, + "loss": 0.7002, + "step": 55597 + }, + { + "epoch": 1.43, + "learning_rate": 1.1291909661142925e-06, + "loss": 0.6289, + "step": 55598 + }, + { + "epoch": 1.43, + "learning_rate": 1.1291635274967417e-06, + "loss": 0.6504, + "step": 55599 + }, + { + "epoch": 1.43, + "learning_rate": 1.1291360887802964e-06, + "loss": 0.5933, + "step": 55600 + }, + { + "epoch": 1.43, + "learning_rate": 1.1291086499649775e-06, + "loss": 0.6865, + "step": 55601 + }, + { + "epoch": 1.43, + "learning_rate": 1.1290812110508061e-06, + "loss": 0.6714, + "step": 55602 + }, + { + "epoch": 1.43, + "learning_rate": 1.129053772037803e-06, + "loss": 0.6309, + "step": 55603 + }, + { + "epoch": 1.43, + "learning_rate": 1.1290263329259899e-06, + "loss": 0.5342, + "step": 55604 + }, + { + "epoch": 1.43, + "learning_rate": 1.1289988937153867e-06, + "loss": 0.5181, + "step": 55605 + }, + { + "epoch": 1.43, + "learning_rate": 1.1289714544060152e-06, + "loss": 0.6277, + "step": 55606 + }, + { + "epoch": 1.43, + "learning_rate": 1.128944014997896e-06, + "loss": 0.6924, + "step": 55607 + }, + { + "epoch": 1.43, + "learning_rate": 1.1289165754910506e-06, + "loss": 0.6445, + "step": 55608 + }, + { + "epoch": 1.43, + "learning_rate": 1.1288891358854994e-06, + "loss": 0.4623, + "step": 55609 + }, + { + "epoch": 1.43, + "learning_rate": 1.128861696181264e-06, + "loss": 0.6191, + "step": 55610 + }, + { + "epoch": 1.43, + "learning_rate": 1.1288342563783648e-06, + "loss": 0.6538, + "step": 55611 + }, + { + "epoch": 1.43, + "learning_rate": 1.1288068164768235e-06, + "loss": 0.5762, + "step": 55612 + }, + { + "epoch": 1.43, + "learning_rate": 1.1287793764766602e-06, + "loss": 0.6313, + "step": 55613 + }, + { + "epoch": 1.43, + "learning_rate": 1.128751936377897e-06, + "loss": 0.667, + "step": 55614 + }, + { + "epoch": 1.43, + "learning_rate": 1.1287244961805542e-06, + "loss": 0.6743, + "step": 55615 + }, + { + "epoch": 1.43, + "learning_rate": 1.1286970558846532e-06, + "loss": 0.4663, + "step": 55616 + }, + { + "epoch": 1.43, + "learning_rate": 1.1286696154902143e-06, + "loss": 0.5977, + "step": 55617 + }, + { + "epoch": 1.43, + "learning_rate": 1.1286421749972593e-06, + "loss": 0.606, + "step": 55618 + }, + { + "epoch": 1.43, + "learning_rate": 1.1286147344058088e-06, + "loss": 0.7065, + "step": 55619 + }, + { + "epoch": 1.43, + "learning_rate": 1.1285872937158837e-06, + "loss": 0.7949, + "step": 55620 + }, + { + "epoch": 1.43, + "learning_rate": 1.1285598529275055e-06, + "loss": 0.5986, + "step": 55621 + }, + { + "epoch": 1.43, + "learning_rate": 1.1285324120406948e-06, + "loss": 0.6953, + "step": 55622 + }, + { + "epoch": 1.43, + "learning_rate": 1.1285049710554728e-06, + "loss": 0.7607, + "step": 55623 + }, + { + "epoch": 1.43, + "learning_rate": 1.1284775299718608e-06, + "loss": 0.7168, + "step": 55624 + }, + { + "epoch": 1.43, + "learning_rate": 1.128450088789879e-06, + "loss": 0.7471, + "step": 55625 + }, + { + "epoch": 1.43, + "learning_rate": 1.128422647509549e-06, + "loss": 0.5615, + "step": 55626 + }, + { + "epoch": 1.43, + "learning_rate": 1.1283952061308916e-06, + "loss": 0.4561, + "step": 55627 + }, + { + "epoch": 1.43, + "learning_rate": 1.128367764653928e-06, + "loss": 0.488, + "step": 55628 + }, + { + "epoch": 1.43, + "learning_rate": 1.1283403230786795e-06, + "loss": 0.667, + "step": 55629 + }, + { + "epoch": 1.43, + "learning_rate": 1.1283128814051658e-06, + "loss": 0.5903, + "step": 55630 + }, + { + "epoch": 1.43, + "learning_rate": 1.1282854396334096e-06, + "loss": 0.5796, + "step": 55631 + }, + { + "epoch": 1.43, + "learning_rate": 1.1282579977634309e-06, + "loss": 0.7227, + "step": 55632 + }, + { + "epoch": 1.43, + "learning_rate": 1.128230555795251e-06, + "loss": 0.666, + "step": 55633 + }, + { + "epoch": 1.43, + "learning_rate": 1.1282031137288907e-06, + "loss": 0.5571, + "step": 55634 + }, + { + "epoch": 1.43, + "learning_rate": 1.1281756715643713e-06, + "loss": 0.6904, + "step": 55635 + }, + { + "epoch": 1.43, + "learning_rate": 1.1281482293017135e-06, + "loss": 0.5771, + "step": 55636 + }, + { + "epoch": 1.43, + "learning_rate": 1.1281207869409387e-06, + "loss": 0.4575, + "step": 55637 + }, + { + "epoch": 1.43, + "learning_rate": 1.1280933444820675e-06, + "loss": 0.6855, + "step": 55638 + }, + { + "epoch": 1.43, + "learning_rate": 1.1280659019251213e-06, + "loss": 0.5747, + "step": 55639 + }, + { + "epoch": 1.43, + "learning_rate": 1.1280384592701208e-06, + "loss": 0.5615, + "step": 55640 + }, + { + "epoch": 1.43, + "learning_rate": 1.1280110165170873e-06, + "loss": 0.748, + "step": 55641 + }, + { + "epoch": 1.43, + "learning_rate": 1.1279835736660416e-06, + "loss": 0.5134, + "step": 55642 + }, + { + "epoch": 1.43, + "learning_rate": 1.1279561307170046e-06, + "loss": 0.6494, + "step": 55643 + }, + { + "epoch": 1.43, + "learning_rate": 1.1279286876699978e-06, + "loss": 0.6816, + "step": 55644 + }, + { + "epoch": 1.43, + "learning_rate": 1.1279012445250415e-06, + "loss": 0.5527, + "step": 55645 + }, + { + "epoch": 1.43, + "learning_rate": 1.1278738012821574e-06, + "loss": 0.6597, + "step": 55646 + }, + { + "epoch": 1.43, + "learning_rate": 1.1278463579413659e-06, + "loss": 0.8828, + "step": 55647 + }, + { + "epoch": 1.43, + "learning_rate": 1.1278189145026887e-06, + "loss": 0.4614, + "step": 55648 + }, + { + "epoch": 1.43, + "learning_rate": 1.1277914709661463e-06, + "loss": 0.7227, + "step": 55649 + }, + { + "epoch": 1.43, + "learning_rate": 1.1277640273317598e-06, + "loss": 0.613, + "step": 55650 + }, + { + "epoch": 1.43, + "learning_rate": 1.1277365835995503e-06, + "loss": 0.6338, + "step": 55651 + }, + { + "epoch": 1.43, + "learning_rate": 1.1277091397695386e-06, + "loss": 0.8506, + "step": 55652 + }, + { + "epoch": 1.43, + "learning_rate": 1.127681695841746e-06, + "loss": 0.6729, + "step": 55653 + }, + { + "epoch": 1.43, + "learning_rate": 1.1276542518161937e-06, + "loss": 0.5112, + "step": 55654 + }, + { + "epoch": 1.43, + "learning_rate": 1.127626807692902e-06, + "loss": 0.4298, + "step": 55655 + }, + { + "epoch": 1.43, + "learning_rate": 1.1275993634718926e-06, + "loss": 0.5593, + "step": 55656 + }, + { + "epoch": 1.43, + "learning_rate": 1.1275719191531858e-06, + "loss": 0.6335, + "step": 55657 + }, + { + "epoch": 1.43, + "learning_rate": 1.1275444747368034e-06, + "loss": 0.791, + "step": 55658 + }, + { + "epoch": 1.43, + "learning_rate": 1.1275170302227662e-06, + "loss": 0.6401, + "step": 55659 + }, + { + "epoch": 1.43, + "learning_rate": 1.1274895856110947e-06, + "loss": 0.79, + "step": 55660 + }, + { + "epoch": 1.43, + "learning_rate": 1.1274621409018105e-06, + "loss": 0.6294, + "step": 55661 + }, + { + "epoch": 1.43, + "learning_rate": 1.1274346960949343e-06, + "loss": 0.5293, + "step": 55662 + }, + { + "epoch": 1.43, + "learning_rate": 1.127407251190487e-06, + "loss": 0.7114, + "step": 55663 + }, + { + "epoch": 1.43, + "learning_rate": 1.1273798061884903e-06, + "loss": 0.5195, + "step": 55664 + }, + { + "epoch": 1.43, + "learning_rate": 1.1273523610889646e-06, + "loss": 0.605, + "step": 55665 + }, + { + "epoch": 1.43, + "learning_rate": 1.1273249158919306e-06, + "loss": 0.7529, + "step": 55666 + }, + { + "epoch": 1.43, + "learning_rate": 1.1272974705974103e-06, + "loss": 0.6172, + "step": 55667 + }, + { + "epoch": 1.43, + "learning_rate": 1.127270025205424e-06, + "loss": 0.6436, + "step": 55668 + }, + { + "epoch": 1.43, + "learning_rate": 1.1272425797159933e-06, + "loss": 0.6064, + "step": 55669 + }, + { + "epoch": 1.43, + "learning_rate": 1.127215134129138e-06, + "loss": 0.4329, + "step": 55670 + }, + { + "epoch": 1.43, + "learning_rate": 1.1271876884448806e-06, + "loss": 0.7432, + "step": 55671 + }, + { + "epoch": 1.43, + "learning_rate": 1.127160242663241e-06, + "loss": 0.5687, + "step": 55672 + }, + { + "epoch": 1.43, + "learning_rate": 1.1271327967842408e-06, + "loss": 0.6021, + "step": 55673 + }, + { + "epoch": 1.43, + "learning_rate": 1.1271053508079012e-06, + "loss": 0.6069, + "step": 55674 + }, + { + "epoch": 1.43, + "learning_rate": 1.1270779047342425e-06, + "loss": 0.7842, + "step": 55675 + }, + { + "epoch": 1.43, + "learning_rate": 1.127050458563286e-06, + "loss": 0.627, + "step": 55676 + }, + { + "epoch": 1.43, + "learning_rate": 1.1270230122950531e-06, + "loss": 0.7417, + "step": 55677 + }, + { + "epoch": 1.43, + "learning_rate": 1.1269955659295643e-06, + "loss": 0.5859, + "step": 55678 + }, + { + "epoch": 1.43, + "learning_rate": 1.126968119466841e-06, + "loss": 0.5269, + "step": 55679 + }, + { + "epoch": 1.43, + "learning_rate": 1.1269406729069039e-06, + "loss": 0.7227, + "step": 55680 + }, + { + "epoch": 1.43, + "learning_rate": 1.1269132262497742e-06, + "loss": 0.4767, + "step": 55681 + }, + { + "epoch": 1.43, + "learning_rate": 1.126885779495473e-06, + "loss": 0.52, + "step": 55682 + }, + { + "epoch": 1.43, + "learning_rate": 1.1268583326440212e-06, + "loss": 0.5405, + "step": 55683 + }, + { + "epoch": 1.43, + "learning_rate": 1.1268308856954395e-06, + "loss": 0.7793, + "step": 55684 + }, + { + "epoch": 1.43, + "learning_rate": 1.1268034386497496e-06, + "loss": 0.6523, + "step": 55685 + }, + { + "epoch": 1.43, + "learning_rate": 1.1267759915069719e-06, + "loss": 0.5664, + "step": 55686 + }, + { + "epoch": 1.43, + "learning_rate": 1.1267485442671276e-06, + "loss": 0.8311, + "step": 55687 + }, + { + "epoch": 1.43, + "learning_rate": 1.1267210969302379e-06, + "loss": 0.6016, + "step": 55688 + }, + { + "epoch": 1.43, + "learning_rate": 1.1266936494963237e-06, + "loss": 0.6855, + "step": 55689 + }, + { + "epoch": 1.43, + "learning_rate": 1.126666201965406e-06, + "loss": 0.7007, + "step": 55690 + }, + { + "epoch": 1.43, + "learning_rate": 1.1266387543375057e-06, + "loss": 0.7549, + "step": 55691 + }, + { + "epoch": 1.43, + "learning_rate": 1.1266113066126442e-06, + "loss": 0.7109, + "step": 55692 + }, + { + "epoch": 1.43, + "learning_rate": 1.1265838587908419e-06, + "loss": 0.519, + "step": 55693 + }, + { + "epoch": 1.43, + "learning_rate": 1.1265564108721206e-06, + "loss": 0.6636, + "step": 55694 + }, + { + "epoch": 1.43, + "learning_rate": 1.1265289628565004e-06, + "loss": 0.6592, + "step": 55695 + }, + { + "epoch": 1.43, + "learning_rate": 1.1265015147440032e-06, + "loss": 0.6855, + "step": 55696 + }, + { + "epoch": 1.43, + "learning_rate": 1.1264740665346492e-06, + "loss": 0.614, + "step": 55697 + }, + { + "epoch": 1.43, + "learning_rate": 1.1264466182284603e-06, + "loss": 0.5137, + "step": 55698 + }, + { + "epoch": 1.43, + "learning_rate": 1.1264191698254566e-06, + "loss": 0.6108, + "step": 55699 + }, + { + "epoch": 1.43, + "learning_rate": 1.1263917213256597e-06, + "loss": 0.5527, + "step": 55700 + }, + { + "epoch": 1.43, + "learning_rate": 1.1263642727290905e-06, + "loss": 0.7373, + "step": 55701 + }, + { + "epoch": 1.43, + "learning_rate": 1.12633682403577e-06, + "loss": 0.626, + "step": 55702 + }, + { + "epoch": 1.43, + "learning_rate": 1.1263093752457191e-06, + "loss": 0.5898, + "step": 55703 + }, + { + "epoch": 1.43, + "learning_rate": 1.126281926358959e-06, + "loss": 0.6201, + "step": 55704 + }, + { + "epoch": 1.43, + "learning_rate": 1.1262544773755107e-06, + "loss": 0.6797, + "step": 55705 + }, + { + "epoch": 1.43, + "learning_rate": 1.126227028295395e-06, + "loss": 0.6113, + "step": 55706 + }, + { + "epoch": 1.43, + "learning_rate": 1.126199579118633e-06, + "loss": 0.5559, + "step": 55707 + }, + { + "epoch": 1.43, + "learning_rate": 1.126172129845246e-06, + "loss": 0.5425, + "step": 55708 + }, + { + "epoch": 1.43, + "learning_rate": 1.1261446804752547e-06, + "loss": 0.5476, + "step": 55709 + }, + { + "epoch": 1.43, + "learning_rate": 1.1261172310086804e-06, + "loss": 0.7998, + "step": 55710 + }, + { + "epoch": 1.43, + "learning_rate": 1.1260897814455438e-06, + "loss": 0.7881, + "step": 55711 + }, + { + "epoch": 1.43, + "learning_rate": 1.1260623317858659e-06, + "loss": 0.4966, + "step": 55712 + }, + { + "epoch": 1.43, + "learning_rate": 1.1260348820296682e-06, + "loss": 0.7734, + "step": 55713 + }, + { + "epoch": 1.43, + "learning_rate": 1.126007432176971e-06, + "loss": 0.7334, + "step": 55714 + }, + { + "epoch": 1.43, + "learning_rate": 1.125979982227796e-06, + "loss": 0.71, + "step": 55715 + }, + { + "epoch": 1.43, + "learning_rate": 1.1259525321821636e-06, + "loss": 0.6572, + "step": 55716 + }, + { + "epoch": 1.43, + "learning_rate": 1.1259250820400956e-06, + "loss": 0.5112, + "step": 55717 + }, + { + "epoch": 1.43, + "learning_rate": 1.1258976318016124e-06, + "loss": 0.7773, + "step": 55718 + }, + { + "epoch": 1.43, + "learning_rate": 1.125870181466735e-06, + "loss": 0.8203, + "step": 55719 + }, + { + "epoch": 1.43, + "learning_rate": 1.1258427310354845e-06, + "loss": 0.7812, + "step": 55720 + }, + { + "epoch": 1.43, + "learning_rate": 1.1258152805078825e-06, + "loss": 0.7363, + "step": 55721 + }, + { + "epoch": 1.43, + "learning_rate": 1.1257878298839489e-06, + "loss": 0.646, + "step": 55722 + }, + { + "epoch": 1.43, + "learning_rate": 1.125760379163706e-06, + "loss": 0.5737, + "step": 55723 + }, + { + "epoch": 1.43, + "learning_rate": 1.1257329283471737e-06, + "loss": 0.6758, + "step": 55724 + }, + { + "epoch": 1.43, + "learning_rate": 1.1257054774343735e-06, + "loss": 0.5664, + "step": 55725 + }, + { + "epoch": 1.43, + "learning_rate": 1.1256780264253266e-06, + "loss": 0.5938, + "step": 55726 + }, + { + "epoch": 1.43, + "learning_rate": 1.1256505753200536e-06, + "loss": 0.5664, + "step": 55727 + }, + { + "epoch": 1.43, + "learning_rate": 1.1256231241185758e-06, + "loss": 0.6055, + "step": 55728 + }, + { + "epoch": 1.43, + "learning_rate": 1.125595672820914e-06, + "loss": 0.8506, + "step": 55729 + }, + { + "epoch": 1.43, + "learning_rate": 1.1255682214270896e-06, + "loss": 0.6538, + "step": 55730 + }, + { + "epoch": 1.43, + "learning_rate": 1.1255407699371234e-06, + "loss": 0.5957, + "step": 55731 + }, + { + "epoch": 1.43, + "learning_rate": 1.1255133183510364e-06, + "loss": 0.6147, + "step": 55732 + }, + { + "epoch": 1.43, + "learning_rate": 1.1254858666688497e-06, + "loss": 0.71, + "step": 55733 + }, + { + "epoch": 1.43, + "learning_rate": 1.1254584148905842e-06, + "loss": 0.4722, + "step": 55734 + }, + { + "epoch": 1.43, + "learning_rate": 1.1254309630162605e-06, + "loss": 0.8311, + "step": 55735 + }, + { + "epoch": 1.43, + "learning_rate": 1.1254035110459005e-06, + "loss": 0.6719, + "step": 55736 + }, + { + "epoch": 1.43, + "learning_rate": 1.1253760589795246e-06, + "loss": 0.4453, + "step": 55737 + }, + { + "epoch": 1.43, + "learning_rate": 1.1253486068171545e-06, + "loss": 0.8535, + "step": 55738 + }, + { + "epoch": 1.43, + "learning_rate": 1.1253211545588102e-06, + "loss": 0.5166, + "step": 55739 + }, + { + "epoch": 1.43, + "learning_rate": 1.1252937022045134e-06, + "loss": 0.6553, + "step": 55740 + }, + { + "epoch": 1.43, + "learning_rate": 1.125266249754285e-06, + "loss": 0.5466, + "step": 55741 + }, + { + "epoch": 1.43, + "learning_rate": 1.1252387972081461e-06, + "loss": 0.6631, + "step": 55742 + }, + { + "epoch": 1.43, + "learning_rate": 1.1252113445661175e-06, + "loss": 0.7754, + "step": 55743 + }, + { + "epoch": 1.43, + "learning_rate": 1.1251838918282205e-06, + "loss": 0.6016, + "step": 55744 + }, + { + "epoch": 1.43, + "learning_rate": 1.1251564389944758e-06, + "loss": 0.7344, + "step": 55745 + }, + { + "epoch": 1.43, + "learning_rate": 1.1251289860649045e-06, + "loss": 0.5347, + "step": 55746 + }, + { + "epoch": 1.43, + "learning_rate": 1.1251015330395276e-06, + "loss": 0.6062, + "step": 55747 + }, + { + "epoch": 1.43, + "learning_rate": 1.1250740799183664e-06, + "loss": 0.481, + "step": 55748 + }, + { + "epoch": 1.43, + "learning_rate": 1.1250466267014417e-06, + "loss": 0.6719, + "step": 55749 + }, + { + "epoch": 1.43, + "learning_rate": 1.1250191733887746e-06, + "loss": 0.6709, + "step": 55750 + }, + { + "epoch": 1.43, + "learning_rate": 1.124991719980386e-06, + "loss": 0.6187, + "step": 55751 + }, + { + "epoch": 1.43, + "learning_rate": 1.124964266476297e-06, + "loss": 0.564, + "step": 55752 + }, + { + "epoch": 1.43, + "learning_rate": 1.124936812876529e-06, + "loss": 0.8242, + "step": 55753 + }, + { + "epoch": 1.43, + "learning_rate": 1.1249093591811018e-06, + "loss": 0.5298, + "step": 55754 + }, + { + "epoch": 1.43, + "learning_rate": 1.1248819053900378e-06, + "loss": 0.6157, + "step": 55755 + }, + { + "epoch": 1.43, + "learning_rate": 1.1248544515033572e-06, + "loss": 0.6392, + "step": 55756 + }, + { + "epoch": 1.43, + "learning_rate": 1.1248269975210815e-06, + "loss": 0.6597, + "step": 55757 + }, + { + "epoch": 1.43, + "learning_rate": 1.1247995434432315e-06, + "loss": 0.7383, + "step": 55758 + }, + { + "epoch": 1.43, + "learning_rate": 1.1247720892698282e-06, + "loss": 0.7021, + "step": 55759 + }, + { + "epoch": 1.43, + "learning_rate": 1.1247446350008926e-06, + "loss": 0.6768, + "step": 55760 + }, + { + "epoch": 1.43, + "learning_rate": 1.124717180636446e-06, + "loss": 0.6196, + "step": 55761 + }, + { + "epoch": 1.43, + "learning_rate": 1.1246897261765088e-06, + "loss": 0.748, + "step": 55762 + }, + { + "epoch": 1.43, + "learning_rate": 1.1246622716211026e-06, + "loss": 0.7559, + "step": 55763 + }, + { + "epoch": 1.43, + "learning_rate": 1.1246348169702482e-06, + "loss": 0.5234, + "step": 55764 + }, + { + "epoch": 1.43, + "learning_rate": 1.124607362223967e-06, + "loss": 0.5455, + "step": 55765 + }, + { + "epoch": 1.43, + "learning_rate": 1.124579907382279e-06, + "loss": 0.752, + "step": 55766 + }, + { + "epoch": 1.43, + "learning_rate": 1.1245524524452063e-06, + "loss": 0.6309, + "step": 55767 + }, + { + "epoch": 1.43, + "learning_rate": 1.1245249974127695e-06, + "loss": 0.5298, + "step": 55768 + }, + { + "epoch": 1.43, + "learning_rate": 1.1244975422849897e-06, + "loss": 0.6138, + "step": 55769 + }, + { + "epoch": 1.43, + "learning_rate": 1.1244700870618874e-06, + "loss": 0.6289, + "step": 55770 + }, + { + "epoch": 1.43, + "learning_rate": 1.1244426317434848e-06, + "loss": 0.6689, + "step": 55771 + }, + { + "epoch": 1.43, + "learning_rate": 1.1244151763298016e-06, + "loss": 0.5908, + "step": 55772 + }, + { + "epoch": 1.43, + "learning_rate": 1.1243877208208595e-06, + "loss": 0.8096, + "step": 55773 + }, + { + "epoch": 1.43, + "learning_rate": 1.1243602652166799e-06, + "loss": 0.6143, + "step": 55774 + }, + { + "epoch": 1.43, + "learning_rate": 1.124332809517283e-06, + "loss": 0.6689, + "step": 55775 + }, + { + "epoch": 1.43, + "learning_rate": 1.12430535372269e-06, + "loss": 0.5566, + "step": 55776 + }, + { + "epoch": 1.43, + "learning_rate": 1.1242778978329224e-06, + "loss": 0.6777, + "step": 55777 + }, + { + "epoch": 1.43, + "learning_rate": 1.124250441848001e-06, + "loss": 0.8096, + "step": 55778 + }, + { + "epoch": 1.43, + "learning_rate": 1.1242229857679466e-06, + "loss": 0.7007, + "step": 55779 + }, + { + "epoch": 1.43, + "learning_rate": 1.1241955295927805e-06, + "loss": 0.5464, + "step": 55780 + }, + { + "epoch": 1.43, + "learning_rate": 1.1241680733225231e-06, + "loss": 0.5771, + "step": 55781 + }, + { + "epoch": 1.43, + "learning_rate": 1.1241406169571965e-06, + "loss": 0.3837, + "step": 55782 + }, + { + "epoch": 1.43, + "learning_rate": 1.124113160496821e-06, + "loss": 0.5505, + "step": 55783 + }, + { + "epoch": 1.43, + "learning_rate": 1.1240857039414177e-06, + "loss": 0.8262, + "step": 55784 + }, + { + "epoch": 1.43, + "learning_rate": 1.1240582472910077e-06, + "loss": 0.5759, + "step": 55785 + }, + { + "epoch": 1.43, + "learning_rate": 1.1240307905456119e-06, + "loss": 0.6191, + "step": 55786 + }, + { + "epoch": 1.43, + "learning_rate": 1.1240033337052516e-06, + "loss": 0.5869, + "step": 55787 + }, + { + "epoch": 1.43, + "learning_rate": 1.1239758767699476e-06, + "loss": 0.8682, + "step": 55788 + }, + { + "epoch": 1.43, + "learning_rate": 1.1239484197397208e-06, + "loss": 0.6641, + "step": 55789 + }, + { + "epoch": 1.43, + "learning_rate": 1.1239209626145927e-06, + "loss": 0.7266, + "step": 55790 + }, + { + "epoch": 1.43, + "learning_rate": 1.1238935053945837e-06, + "loss": 0.6787, + "step": 55791 + }, + { + "epoch": 1.43, + "learning_rate": 1.1238660480797154e-06, + "loss": 0.7549, + "step": 55792 + }, + { + "epoch": 1.43, + "learning_rate": 1.1238385906700085e-06, + "loss": 0.7031, + "step": 55793 + }, + { + "epoch": 1.43, + "learning_rate": 1.1238111331654838e-06, + "loss": 0.646, + "step": 55794 + }, + { + "epoch": 1.43, + "learning_rate": 1.1237836755661629e-06, + "loss": 0.8057, + "step": 55795 + }, + { + "epoch": 1.43, + "learning_rate": 1.1237562178720666e-06, + "loss": 0.6172, + "step": 55796 + }, + { + "epoch": 1.43, + "learning_rate": 1.1237287600832156e-06, + "loss": 0.603, + "step": 55797 + }, + { + "epoch": 1.43, + "learning_rate": 1.1237013021996313e-06, + "loss": 0.6611, + "step": 55798 + }, + { + "epoch": 1.43, + "learning_rate": 1.1236738442213347e-06, + "loss": 0.6592, + "step": 55799 + }, + { + "epoch": 1.43, + "learning_rate": 1.1236463861483464e-06, + "loss": 0.7129, + "step": 55800 + }, + { + "epoch": 1.43, + "learning_rate": 1.123618927980688e-06, + "loss": 0.6025, + "step": 55801 + }, + { + "epoch": 1.43, + "learning_rate": 1.12359146971838e-06, + "loss": 0.7119, + "step": 55802 + }, + { + "epoch": 1.43, + "learning_rate": 1.1235640113614443e-06, + "loss": 0.6875, + "step": 55803 + }, + { + "epoch": 1.43, + "learning_rate": 1.123536552909901e-06, + "loss": 0.7344, + "step": 55804 + }, + { + "epoch": 1.43, + "learning_rate": 1.1235090943637713e-06, + "loss": 0.7119, + "step": 55805 + }, + { + "epoch": 1.43, + "learning_rate": 1.1234816357230763e-06, + "loss": 0.748, + "step": 55806 + }, + { + "epoch": 1.43, + "learning_rate": 1.1234541769878375e-06, + "loss": 0.6553, + "step": 55807 + }, + { + "epoch": 1.43, + "learning_rate": 1.1234267181580752e-06, + "loss": 0.6543, + "step": 55808 + }, + { + "epoch": 1.43, + "learning_rate": 1.1233992592338108e-06, + "loss": 0.6953, + "step": 55809 + }, + { + "epoch": 1.43, + "learning_rate": 1.1233718002150652e-06, + "loss": 0.5737, + "step": 55810 + }, + { + "epoch": 1.43, + "learning_rate": 1.1233443411018597e-06, + "loss": 0.5786, + "step": 55811 + }, + { + "epoch": 1.43, + "learning_rate": 1.1233168818942146e-06, + "loss": 0.5649, + "step": 55812 + }, + { + "epoch": 1.43, + "learning_rate": 1.1232894225921523e-06, + "loss": 0.6553, + "step": 55813 + }, + { + "epoch": 1.43, + "learning_rate": 1.1232619631956922e-06, + "loss": 0.6777, + "step": 55814 + }, + { + "epoch": 1.43, + "learning_rate": 1.1232345037048566e-06, + "loss": 0.5396, + "step": 55815 + }, + { + "epoch": 1.43, + "learning_rate": 1.1232070441196655e-06, + "loss": 0.6348, + "step": 55816 + }, + { + "epoch": 1.43, + "learning_rate": 1.1231795844401405e-06, + "loss": 0.8955, + "step": 55817 + }, + { + "epoch": 1.43, + "learning_rate": 1.1231521246663029e-06, + "loss": 0.709, + "step": 55818 + }, + { + "epoch": 1.43, + "learning_rate": 1.1231246647981731e-06, + "loss": 0.5864, + "step": 55819 + }, + { + "epoch": 1.43, + "learning_rate": 1.1230972048357728e-06, + "loss": 0.6875, + "step": 55820 + }, + { + "epoch": 1.43, + "learning_rate": 1.123069744779122e-06, + "loss": 0.627, + "step": 55821 + }, + { + "epoch": 1.43, + "learning_rate": 1.1230422846282428e-06, + "loss": 0.6328, + "step": 55822 + }, + { + "epoch": 1.43, + "learning_rate": 1.1230148243831559e-06, + "loss": 0.6528, + "step": 55823 + }, + { + "epoch": 1.43, + "learning_rate": 1.1229873640438818e-06, + "loss": 0.6777, + "step": 55824 + }, + { + "epoch": 1.43, + "learning_rate": 1.122959903610442e-06, + "loss": 0.5488, + "step": 55825 + }, + { + "epoch": 1.43, + "learning_rate": 1.1229324430828577e-06, + "loss": 0.8604, + "step": 55826 + }, + { + "epoch": 1.43, + "learning_rate": 1.1229049824611495e-06, + "loss": 0.6421, + "step": 55827 + }, + { + "epoch": 1.43, + "learning_rate": 1.1228775217453388e-06, + "loss": 0.5972, + "step": 55828 + }, + { + "epoch": 1.43, + "learning_rate": 1.1228500609354462e-06, + "loss": 0.5122, + "step": 55829 + }, + { + "epoch": 1.43, + "learning_rate": 1.122822600031493e-06, + "loss": 0.6602, + "step": 55830 + }, + { + "epoch": 1.43, + "learning_rate": 1.1227951390335003e-06, + "loss": 0.7559, + "step": 55831 + }, + { + "epoch": 1.43, + "learning_rate": 1.122767677941489e-06, + "loss": 0.7344, + "step": 55832 + }, + { + "epoch": 1.43, + "learning_rate": 1.12274021675548e-06, + "loss": 0.6812, + "step": 55833 + }, + { + "epoch": 1.43, + "learning_rate": 1.1227127554754947e-06, + "loss": 0.79, + "step": 55834 + }, + { + "epoch": 1.43, + "learning_rate": 1.1226852941015534e-06, + "loss": 0.5752, + "step": 55835 + }, + { + "epoch": 1.43, + "learning_rate": 1.1226578326336783e-06, + "loss": 0.6062, + "step": 55836 + }, + { + "epoch": 1.43, + "learning_rate": 1.1226303710718892e-06, + "loss": 0.5791, + "step": 55837 + }, + { + "epoch": 1.43, + "learning_rate": 1.1226029094162078e-06, + "loss": 0.4514, + "step": 55838 + }, + { + "epoch": 1.43, + "learning_rate": 1.1225754476666552e-06, + "loss": 0.5801, + "step": 55839 + }, + { + "epoch": 1.43, + "learning_rate": 1.1225479858232518e-06, + "loss": 0.71, + "step": 55840 + }, + { + "epoch": 1.43, + "learning_rate": 1.1225205238860194e-06, + "loss": 0.7031, + "step": 55841 + }, + { + "epoch": 1.43, + "learning_rate": 1.1224930618549785e-06, + "loss": 0.6143, + "step": 55842 + }, + { + "epoch": 1.43, + "learning_rate": 1.1224655997301503e-06, + "loss": 0.7803, + "step": 55843 + }, + { + "epoch": 1.43, + "learning_rate": 1.1224381375115558e-06, + "loss": 0.75, + "step": 55844 + }, + { + "epoch": 1.43, + "learning_rate": 1.1224106751992161e-06, + "loss": 1.0029, + "step": 55845 + }, + { + "epoch": 1.43, + "learning_rate": 1.122383212793152e-06, + "loss": 0.4937, + "step": 55846 + }, + { + "epoch": 1.43, + "learning_rate": 1.1223557502933851e-06, + "loss": 0.6362, + "step": 55847 + }, + { + "epoch": 1.43, + "learning_rate": 1.1223282876999358e-06, + "loss": 0.6323, + "step": 55848 + }, + { + "epoch": 1.43, + "learning_rate": 1.1223008250128257e-06, + "loss": 0.79, + "step": 55849 + }, + { + "epoch": 1.43, + "learning_rate": 1.1222733622320747e-06, + "loss": 0.7783, + "step": 55850 + }, + { + "epoch": 1.43, + "learning_rate": 1.1222458993577054e-06, + "loss": 0.6426, + "step": 55851 + }, + { + "epoch": 1.43, + "learning_rate": 1.1222184363897374e-06, + "loss": 0.751, + "step": 55852 + }, + { + "epoch": 1.43, + "learning_rate": 1.1221909733281929e-06, + "loss": 0.6167, + "step": 55853 + }, + { + "epoch": 1.43, + "learning_rate": 1.1221635101730923e-06, + "loss": 0.6133, + "step": 55854 + }, + { + "epoch": 1.43, + "learning_rate": 1.1221360469244565e-06, + "loss": 0.3987, + "step": 55855 + }, + { + "epoch": 1.43, + "learning_rate": 1.1221085835823065e-06, + "loss": 0.7695, + "step": 55856 + }, + { + "epoch": 1.43, + "learning_rate": 1.1220811201466641e-06, + "loss": 0.709, + "step": 55857 + }, + { + "epoch": 1.43, + "learning_rate": 1.1220536566175495e-06, + "loss": 0.583, + "step": 55858 + }, + { + "epoch": 1.43, + "learning_rate": 1.1220261929949844e-06, + "loss": 0.7227, + "step": 55859 + }, + { + "epoch": 1.43, + "learning_rate": 1.1219987292789889e-06, + "loss": 0.5146, + "step": 55860 + }, + { + "epoch": 1.43, + "learning_rate": 1.121971265469585e-06, + "loss": 0.4863, + "step": 55861 + }, + { + "epoch": 1.43, + "learning_rate": 1.1219438015667931e-06, + "loss": 0.4697, + "step": 55862 + }, + { + "epoch": 1.43, + "learning_rate": 1.1219163375706343e-06, + "loss": 0.5918, + "step": 55863 + }, + { + "epoch": 1.43, + "learning_rate": 1.1218888734811302e-06, + "loss": 0.8486, + "step": 55864 + }, + { + "epoch": 1.43, + "learning_rate": 1.121861409298301e-06, + "loss": 0.6533, + "step": 55865 + }, + { + "epoch": 1.43, + "learning_rate": 1.1218339450221683e-06, + "loss": 0.6582, + "step": 55866 + }, + { + "epoch": 1.43, + "learning_rate": 1.1218064806527528e-06, + "loss": 0.7451, + "step": 55867 + }, + { + "epoch": 1.43, + "learning_rate": 1.121779016190076e-06, + "loss": 0.5742, + "step": 55868 + }, + { + "epoch": 1.43, + "learning_rate": 1.1217515516341584e-06, + "loss": 0.665, + "step": 55869 + }, + { + "epoch": 1.43, + "learning_rate": 1.1217240869850213e-06, + "loss": 0.6226, + "step": 55870 + }, + { + "epoch": 1.43, + "learning_rate": 1.1216966222426853e-06, + "loss": 0.7725, + "step": 55871 + }, + { + "epoch": 1.43, + "learning_rate": 1.1216691574071724e-06, + "loss": 0.7432, + "step": 55872 + }, + { + "epoch": 1.43, + "learning_rate": 1.121641692478503e-06, + "loss": 0.5178, + "step": 55873 + }, + { + "epoch": 1.43, + "learning_rate": 1.1216142274566977e-06, + "loss": 0.5618, + "step": 55874 + }, + { + "epoch": 1.43, + "learning_rate": 1.121586762341778e-06, + "loss": 0.7803, + "step": 55875 + }, + { + "epoch": 1.43, + "learning_rate": 1.1215592971337652e-06, + "loss": 0.5386, + "step": 55876 + }, + { + "epoch": 1.43, + "learning_rate": 1.1215318318326797e-06, + "loss": 0.4722, + "step": 55877 + }, + { + "epoch": 1.43, + "learning_rate": 1.1215043664385432e-06, + "loss": 0.6021, + "step": 55878 + }, + { + "epoch": 1.43, + "learning_rate": 1.1214769009513762e-06, + "loss": 0.624, + "step": 55879 + }, + { + "epoch": 1.43, + "learning_rate": 1.1214494353712002e-06, + "loss": 0.7051, + "step": 55880 + }, + { + "epoch": 1.43, + "learning_rate": 1.1214219696980353e-06, + "loss": 0.7705, + "step": 55881 + }, + { + "epoch": 1.43, + "learning_rate": 1.121394503931904e-06, + "loss": 0.5771, + "step": 55882 + }, + { + "epoch": 1.43, + "learning_rate": 1.121367038072826e-06, + "loss": 0.6504, + "step": 55883 + }, + { + "epoch": 1.43, + "learning_rate": 1.1213395721208228e-06, + "loss": 0.8398, + "step": 55884 + }, + { + "epoch": 1.43, + "learning_rate": 1.1213121060759156e-06, + "loss": 0.592, + "step": 55885 + }, + { + "epoch": 1.43, + "learning_rate": 1.1212846399381255e-06, + "loss": 0.6914, + "step": 55886 + }, + { + "epoch": 1.43, + "learning_rate": 1.121257173707473e-06, + "loss": 0.7422, + "step": 55887 + }, + { + "epoch": 1.43, + "learning_rate": 1.1212297073839798e-06, + "loss": 0.791, + "step": 55888 + }, + { + "epoch": 1.43, + "learning_rate": 1.1212022409676666e-06, + "loss": 0.353, + "step": 55889 + }, + { + "epoch": 1.43, + "learning_rate": 1.1211747744585537e-06, + "loss": 0.7949, + "step": 55890 + }, + { + "epoch": 1.43, + "learning_rate": 1.1211473078566636e-06, + "loss": 0.6279, + "step": 55891 + }, + { + "epoch": 1.43, + "learning_rate": 1.1211198411620163e-06, + "loss": 0.5073, + "step": 55892 + }, + { + "epoch": 1.43, + "learning_rate": 1.1210923743746334e-06, + "loss": 0.5906, + "step": 55893 + }, + { + "epoch": 1.43, + "learning_rate": 1.1210649074945351e-06, + "loss": 0.7432, + "step": 55894 + }, + { + "epoch": 1.43, + "learning_rate": 1.1210374405217433e-06, + "loss": 0.6758, + "step": 55895 + }, + { + "epoch": 1.43, + "learning_rate": 1.1210099734562787e-06, + "loss": 0.4965, + "step": 55896 + }, + { + "epoch": 1.43, + "learning_rate": 1.1209825062981622e-06, + "loss": 0.793, + "step": 55897 + }, + { + "epoch": 1.43, + "learning_rate": 1.1209550390474152e-06, + "loss": 0.7637, + "step": 55898 + }, + { + "epoch": 1.43, + "learning_rate": 1.1209275717040583e-06, + "loss": 0.627, + "step": 55899 + }, + { + "epoch": 1.43, + "learning_rate": 1.1209001042681125e-06, + "loss": 0.6084, + "step": 55900 + }, + { + "epoch": 1.43, + "learning_rate": 1.1208726367395995e-06, + "loss": 0.6816, + "step": 55901 + }, + { + "epoch": 1.43, + "learning_rate": 1.1208451691185395e-06, + "loss": 0.8516, + "step": 55902 + }, + { + "epoch": 1.43, + "learning_rate": 1.1208177014049542e-06, + "loss": 0.7285, + "step": 55903 + }, + { + "epoch": 1.43, + "learning_rate": 1.1207902335988643e-06, + "loss": 0.6045, + "step": 55904 + }, + { + "epoch": 1.43, + "learning_rate": 1.120762765700291e-06, + "loss": 0.4946, + "step": 55905 + }, + { + "epoch": 1.43, + "learning_rate": 1.1207352977092547e-06, + "loss": 0.5864, + "step": 55906 + }, + { + "epoch": 1.43, + "learning_rate": 1.1207078296257772e-06, + "loss": 0.4766, + "step": 55907 + }, + { + "epoch": 1.43, + "learning_rate": 1.1206803614498795e-06, + "loss": 0.6572, + "step": 55908 + }, + { + "epoch": 1.43, + "learning_rate": 1.1206528931815819e-06, + "loss": 0.5911, + "step": 55909 + }, + { + "epoch": 1.43, + "learning_rate": 1.1206254248209064e-06, + "loss": 0.6631, + "step": 55910 + }, + { + "epoch": 1.43, + "learning_rate": 1.1205979563678733e-06, + "loss": 0.6348, + "step": 55911 + }, + { + "epoch": 1.43, + "learning_rate": 1.120570487822504e-06, + "loss": 0.7256, + "step": 55912 + }, + { + "epoch": 1.43, + "learning_rate": 1.1205430191848196e-06, + "loss": 0.6826, + "step": 55913 + }, + { + "epoch": 1.43, + "learning_rate": 1.1205155504548408e-06, + "loss": 0.6865, + "step": 55914 + }, + { + "epoch": 1.43, + "learning_rate": 1.1204880816325885e-06, + "loss": 0.6992, + "step": 55915 + }, + { + "epoch": 1.43, + "learning_rate": 1.1204606127180842e-06, + "loss": 0.6836, + "step": 55916 + }, + { + "epoch": 1.43, + "learning_rate": 1.1204331437113488e-06, + "loss": 0.6758, + "step": 55917 + }, + { + "epoch": 1.43, + "learning_rate": 1.1204056746124035e-06, + "loss": 0.7471, + "step": 55918 + }, + { + "epoch": 1.43, + "learning_rate": 1.1203782054212688e-06, + "loss": 0.7915, + "step": 55919 + }, + { + "epoch": 1.43, + "learning_rate": 1.1203507361379661e-06, + "loss": 0.6472, + "step": 55920 + }, + { + "epoch": 1.43, + "learning_rate": 1.1203232667625162e-06, + "loss": 0.6279, + "step": 55921 + }, + { + "epoch": 1.43, + "learning_rate": 1.1202957972949407e-06, + "loss": 0.8564, + "step": 55922 + }, + { + "epoch": 1.43, + "learning_rate": 1.12026832773526e-06, + "loss": 0.8359, + "step": 55923 + }, + { + "epoch": 1.43, + "learning_rate": 1.1202408580834957e-06, + "loss": 0.834, + "step": 55924 + }, + { + "epoch": 1.43, + "learning_rate": 1.120213388339668e-06, + "loss": 0.7402, + "step": 55925 + }, + { + "epoch": 1.43, + "learning_rate": 1.1201859185037987e-06, + "loss": 0.5566, + "step": 55926 + }, + { + "epoch": 1.43, + "learning_rate": 1.1201584485759084e-06, + "loss": 0.8027, + "step": 55927 + }, + { + "epoch": 1.43, + "learning_rate": 1.1201309785560185e-06, + "loss": 0.6768, + "step": 55928 + }, + { + "epoch": 1.43, + "learning_rate": 1.1201035084441497e-06, + "loss": 0.4767, + "step": 55929 + }, + { + "epoch": 1.43, + "learning_rate": 1.1200760382403231e-06, + "loss": 0.749, + "step": 55930 + }, + { + "epoch": 1.43, + "learning_rate": 1.12004856794456e-06, + "loss": 0.6357, + "step": 55931 + }, + { + "epoch": 1.43, + "learning_rate": 1.1200210975568814e-06, + "loss": 0.9248, + "step": 55932 + }, + { + "epoch": 1.43, + "learning_rate": 1.1199936270773078e-06, + "loss": 0.8086, + "step": 55933 + }, + { + "epoch": 1.43, + "learning_rate": 1.1199661565058607e-06, + "loss": 0.7554, + "step": 55934 + }, + { + "epoch": 1.43, + "learning_rate": 1.119938685842561e-06, + "loss": 0.5239, + "step": 55935 + }, + { + "epoch": 1.43, + "learning_rate": 1.1199112150874297e-06, + "loss": 0.6943, + "step": 55936 + }, + { + "epoch": 1.43, + "learning_rate": 1.119883744240488e-06, + "loss": 0.6885, + "step": 55937 + }, + { + "epoch": 1.43, + "learning_rate": 1.1198562733017571e-06, + "loss": 0.5996, + "step": 55938 + }, + { + "epoch": 1.43, + "learning_rate": 1.1198288022712574e-06, + "loss": 0.7207, + "step": 55939 + }, + { + "epoch": 1.43, + "learning_rate": 1.1198013311490104e-06, + "loss": 0.6812, + "step": 55940 + }, + { + "epoch": 1.43, + "learning_rate": 1.1197738599350371e-06, + "loss": 0.8584, + "step": 55941 + }, + { + "epoch": 1.43, + "learning_rate": 1.1197463886293582e-06, + "loss": 0.8711, + "step": 55942 + }, + { + "epoch": 1.43, + "learning_rate": 1.1197189172319955e-06, + "loss": 0.438, + "step": 55943 + }, + { + "epoch": 1.43, + "learning_rate": 1.119691445742969e-06, + "loss": 0.6465, + "step": 55944 + }, + { + "epoch": 1.43, + "learning_rate": 1.1196639741623006e-06, + "loss": 0.6738, + "step": 55945 + }, + { + "epoch": 1.43, + "learning_rate": 1.1196365024900108e-06, + "loss": 0.6641, + "step": 55946 + }, + { + "epoch": 1.43, + "learning_rate": 1.119609030726121e-06, + "loss": 0.6016, + "step": 55947 + }, + { + "epoch": 1.43, + "learning_rate": 1.119581558870652e-06, + "loss": 0.7158, + "step": 55948 + }, + { + "epoch": 1.43, + "learning_rate": 1.1195540869236248e-06, + "loss": 0.6426, + "step": 55949 + }, + { + "epoch": 1.43, + "learning_rate": 1.1195266148850605e-06, + "loss": 0.7217, + "step": 55950 + }, + { + "epoch": 1.43, + "learning_rate": 1.1194991427549805e-06, + "loss": 0.645, + "step": 55951 + }, + { + "epoch": 1.43, + "learning_rate": 1.119471670533405e-06, + "loss": 0.604, + "step": 55952 + }, + { + "epoch": 1.43, + "learning_rate": 1.1194441982203559e-06, + "loss": 0.5798, + "step": 55953 + }, + { + "epoch": 1.43, + "learning_rate": 1.1194167258158537e-06, + "loss": 0.5151, + "step": 55954 + }, + { + "epoch": 1.43, + "learning_rate": 1.1193892533199196e-06, + "loss": 0.6943, + "step": 55955 + }, + { + "epoch": 1.43, + "learning_rate": 1.1193617807325747e-06, + "loss": 0.4072, + "step": 55956 + }, + { + "epoch": 1.43, + "learning_rate": 1.11933430805384e-06, + "loss": 0.7451, + "step": 55957 + }, + { + "epoch": 1.43, + "learning_rate": 1.119306835283737e-06, + "loss": 0.6631, + "step": 55958 + }, + { + "epoch": 1.43, + "learning_rate": 1.1192793624222854e-06, + "loss": 0.665, + "step": 55959 + }, + { + "epoch": 1.43, + "learning_rate": 1.1192518894695075e-06, + "loss": 0.6826, + "step": 55960 + }, + { + "epoch": 1.43, + "learning_rate": 1.1192244164254236e-06, + "loss": 0.7256, + "step": 55961 + }, + { + "epoch": 1.43, + "learning_rate": 1.1191969432900555e-06, + "loss": 0.6953, + "step": 55962 + }, + { + "epoch": 1.43, + "learning_rate": 1.1191694700634235e-06, + "loss": 0.6899, + "step": 55963 + }, + { + "epoch": 1.43, + "learning_rate": 1.1191419967455492e-06, + "loss": 0.8076, + "step": 55964 + }, + { + "epoch": 1.43, + "learning_rate": 1.119114523336453e-06, + "loss": 0.6953, + "step": 55965 + }, + { + "epoch": 1.43, + "learning_rate": 1.1190870498361563e-06, + "loss": 0.5691, + "step": 55966 + }, + { + "epoch": 1.43, + "learning_rate": 1.1190595762446802e-06, + "loss": 0.6973, + "step": 55967 + }, + { + "epoch": 1.43, + "learning_rate": 1.119032102562046e-06, + "loss": 0.4985, + "step": 55968 + }, + { + "epoch": 1.43, + "learning_rate": 1.119004628788274e-06, + "loss": 0.6406, + "step": 55969 + }, + { + "epoch": 1.43, + "learning_rate": 1.1189771549233857e-06, + "loss": 0.6328, + "step": 55970 + }, + { + "epoch": 1.43, + "learning_rate": 1.118949680967402e-06, + "loss": 0.4556, + "step": 55971 + }, + { + "epoch": 1.43, + "learning_rate": 1.1189222069203442e-06, + "loss": 0.7354, + "step": 55972 + }, + { + "epoch": 1.43, + "learning_rate": 1.118894732782233e-06, + "loss": 0.5737, + "step": 55973 + }, + { + "epoch": 1.43, + "learning_rate": 1.1188672585530895e-06, + "loss": 0.6411, + "step": 55974 + }, + { + "epoch": 1.43, + "learning_rate": 1.118839784232935e-06, + "loss": 0.6104, + "step": 55975 + }, + { + "epoch": 1.43, + "learning_rate": 1.1188123098217902e-06, + "loss": 0.7007, + "step": 55976 + }, + { + "epoch": 1.43, + "learning_rate": 1.118784835319676e-06, + "loss": 0.6104, + "step": 55977 + }, + { + "epoch": 1.43, + "learning_rate": 1.1187573607266144e-06, + "loss": 0.6562, + "step": 55978 + }, + { + "epoch": 1.43, + "learning_rate": 1.1187298860426252e-06, + "loss": 0.4512, + "step": 55979 + }, + { + "epoch": 1.43, + "learning_rate": 1.1187024112677301e-06, + "loss": 0.7246, + "step": 55980 + }, + { + "epoch": 1.43, + "learning_rate": 1.11867493640195e-06, + "loss": 0.7168, + "step": 55981 + }, + { + "epoch": 1.43, + "learning_rate": 1.118647461445306e-06, + "loss": 0.4673, + "step": 55982 + }, + { + "epoch": 1.43, + "learning_rate": 1.1186199863978194e-06, + "loss": 0.6411, + "step": 55983 + }, + { + "epoch": 1.43, + "learning_rate": 1.1185925112595106e-06, + "loss": 0.6396, + "step": 55984 + }, + { + "epoch": 1.43, + "learning_rate": 1.118565036030401e-06, + "loss": 0.522, + "step": 55985 + }, + { + "epoch": 1.43, + "learning_rate": 1.1185375607105114e-06, + "loss": 0.791, + "step": 55986 + }, + { + "epoch": 1.43, + "learning_rate": 1.1185100852998634e-06, + "loss": 0.5977, + "step": 55987 + }, + { + "epoch": 1.44, + "learning_rate": 1.1184826097984777e-06, + "loss": 0.709, + "step": 55988 + }, + { + "epoch": 1.44, + "learning_rate": 1.1184551342063752e-06, + "loss": 0.5334, + "step": 55989 + }, + { + "epoch": 1.44, + "learning_rate": 1.1184276585235768e-06, + "loss": 0.6128, + "step": 55990 + }, + { + "epoch": 1.44, + "learning_rate": 1.1184001827501042e-06, + "loss": 0.6284, + "step": 55991 + }, + { + "epoch": 1.44, + "learning_rate": 1.1183727068859777e-06, + "loss": 0.6272, + "step": 55992 + }, + { + "epoch": 1.44, + "learning_rate": 1.1183452309312186e-06, + "loss": 0.5781, + "step": 55993 + }, + { + "epoch": 1.44, + "learning_rate": 1.1183177548858484e-06, + "loss": 0.7861, + "step": 55994 + }, + { + "epoch": 1.44, + "learning_rate": 1.1182902787498876e-06, + "loss": 0.6426, + "step": 55995 + }, + { + "epoch": 1.44, + "learning_rate": 1.1182628025233572e-06, + "loss": 0.6426, + "step": 55996 + }, + { + "epoch": 1.44, + "learning_rate": 1.1182353262062785e-06, + "loss": 0.6748, + "step": 55997 + }, + { + "epoch": 1.44, + "learning_rate": 1.1182078497986724e-06, + "loss": 0.5938, + "step": 55998 + }, + { + "epoch": 1.44, + "learning_rate": 1.11818037330056e-06, + "loss": 0.7334, + "step": 55999 + }, + { + "epoch": 1.44, + "learning_rate": 1.1181528967119625e-06, + "loss": 0.4976, + "step": 56000 + }, + { + "epoch": 1.44, + "learning_rate": 1.1181254200329005e-06, + "loss": 0.5425, + "step": 56001 + }, + { + "epoch": 1.44, + "learning_rate": 1.1180979432633955e-06, + "loss": 0.4893, + "step": 56002 + }, + { + "epoch": 1.44, + "learning_rate": 1.1180704664034682e-06, + "loss": 0.6411, + "step": 56003 + }, + { + "epoch": 1.44, + "learning_rate": 1.1180429894531399e-06, + "loss": 0.4149, + "step": 56004 + }, + { + "epoch": 1.44, + "learning_rate": 1.1180155124124312e-06, + "loss": 0.5498, + "step": 56005 + }, + { + "epoch": 1.44, + "learning_rate": 1.1179880352813638e-06, + "loss": 0.7744, + "step": 56006 + }, + { + "epoch": 1.44, + "learning_rate": 1.1179605580599583e-06, + "loss": 0.5923, + "step": 56007 + }, + { + "epoch": 1.44, + "learning_rate": 1.117933080748236e-06, + "loss": 0.7021, + "step": 56008 + }, + { + "epoch": 1.44, + "learning_rate": 1.1179056033462173e-06, + "loss": 0.6997, + "step": 56009 + }, + { + "epoch": 1.44, + "learning_rate": 1.117878125853924e-06, + "loss": 0.7939, + "step": 56010 + }, + { + "epoch": 1.44, + "learning_rate": 1.1178506482713767e-06, + "loss": 0.5752, + "step": 56011 + }, + { + "epoch": 1.44, + "learning_rate": 1.117823170598597e-06, + "loss": 0.5635, + "step": 56012 + }, + { + "epoch": 1.44, + "learning_rate": 1.117795692835605e-06, + "loss": 0.5347, + "step": 56013 + }, + { + "epoch": 1.44, + "learning_rate": 1.1177682149824223e-06, + "loss": 0.6738, + "step": 56014 + }, + { + "epoch": 1.44, + "learning_rate": 1.1177407370390702e-06, + "loss": 0.5967, + "step": 56015 + }, + { + "epoch": 1.44, + "learning_rate": 1.117713259005569e-06, + "loss": 0.6946, + "step": 56016 + }, + { + "epoch": 1.44, + "learning_rate": 1.1176857808819406e-06, + "loss": 0.7422, + "step": 56017 + }, + { + "epoch": 1.44, + "learning_rate": 1.1176583026682053e-06, + "loss": 0.5417, + "step": 56018 + }, + { + "epoch": 1.44, + "learning_rate": 1.1176308243643848e-06, + "loss": 0.6157, + "step": 56019 + }, + { + "epoch": 1.44, + "learning_rate": 1.1176033459704995e-06, + "loss": 0.417, + "step": 56020 + }, + { + "epoch": 1.44, + "learning_rate": 1.1175758674865708e-06, + "loss": 0.455, + "step": 56021 + }, + { + "epoch": 1.44, + "learning_rate": 1.1175483889126196e-06, + "loss": 0.6812, + "step": 56022 + }, + { + "epoch": 1.44, + "learning_rate": 1.1175209102486674e-06, + "loss": 0.7627, + "step": 56023 + }, + { + "epoch": 1.44, + "learning_rate": 1.1174934314947343e-06, + "loss": 0.5425, + "step": 56024 + }, + { + "epoch": 1.44, + "learning_rate": 1.1174659526508422e-06, + "loss": 0.6216, + "step": 56025 + }, + { + "epoch": 1.44, + "learning_rate": 1.1174384737170115e-06, + "loss": 0.5267, + "step": 56026 + }, + { + "epoch": 1.44, + "learning_rate": 1.117410994693264e-06, + "loss": 0.647, + "step": 56027 + }, + { + "epoch": 1.44, + "learning_rate": 1.1173835155796199e-06, + "loss": 0.7607, + "step": 56028 + }, + { + "epoch": 1.44, + "learning_rate": 1.117356036376101e-06, + "loss": 0.6738, + "step": 56029 + }, + { + "epoch": 1.44, + "learning_rate": 1.1173285570827276e-06, + "loss": 0.4844, + "step": 56030 + }, + { + "epoch": 1.44, + "learning_rate": 1.1173010776995214e-06, + "loss": 0.6758, + "step": 56031 + }, + { + "epoch": 1.44, + "learning_rate": 1.1172735982265032e-06, + "loss": 0.7168, + "step": 56032 + }, + { + "epoch": 1.44, + "learning_rate": 1.1172461186636938e-06, + "loss": 0.5859, + "step": 56033 + }, + { + "epoch": 1.44, + "learning_rate": 1.1172186390111144e-06, + "loss": 0.6494, + "step": 56034 + }, + { + "epoch": 1.44, + "learning_rate": 1.117191159268786e-06, + "loss": 0.667, + "step": 56035 + }, + { + "epoch": 1.44, + "learning_rate": 1.1171636794367301e-06, + "loss": 0.4904, + "step": 56036 + }, + { + "epoch": 1.44, + "learning_rate": 1.117136199514967e-06, + "loss": 0.7852, + "step": 56037 + }, + { + "epoch": 1.44, + "learning_rate": 1.1171087195035186e-06, + "loss": 0.749, + "step": 56038 + }, + { + "epoch": 1.44, + "learning_rate": 1.1170812394024051e-06, + "loss": 0.5969, + "step": 56039 + }, + { + "epoch": 1.44, + "learning_rate": 1.1170537592116478e-06, + "loss": 0.4333, + "step": 56040 + }, + { + "epoch": 1.44, + "learning_rate": 1.117026278931268e-06, + "loss": 0.7275, + "step": 56041 + }, + { + "epoch": 1.44, + "learning_rate": 1.1169987985612863e-06, + "loss": 0.5454, + "step": 56042 + }, + { + "epoch": 1.44, + "learning_rate": 1.1169713181017242e-06, + "loss": 0.6826, + "step": 56043 + }, + { + "epoch": 1.44, + "learning_rate": 1.1169438375526025e-06, + "loss": 0.5879, + "step": 56044 + }, + { + "epoch": 1.44, + "learning_rate": 1.116916356913942e-06, + "loss": 0.6096, + "step": 56045 + }, + { + "epoch": 1.44, + "learning_rate": 1.1168888761857644e-06, + "loss": 0.793, + "step": 56046 + }, + { + "epoch": 1.44, + "learning_rate": 1.1168613953680903e-06, + "loss": 0.7324, + "step": 56047 + }, + { + "epoch": 1.44, + "learning_rate": 1.116833914460941e-06, + "loss": 0.7734, + "step": 56048 + }, + { + "epoch": 1.44, + "learning_rate": 1.116806433464337e-06, + "loss": 0.5811, + "step": 56049 + }, + { + "epoch": 1.44, + "learning_rate": 1.1167789523782999e-06, + "loss": 0.6543, + "step": 56050 + }, + { + "epoch": 1.44, + "learning_rate": 1.11675147120285e-06, + "loss": 0.6514, + "step": 56051 + }, + { + "epoch": 1.44, + "learning_rate": 1.1167239899380097e-06, + "loss": 0.6069, + "step": 56052 + }, + { + "epoch": 1.44, + "learning_rate": 1.1166965085837987e-06, + "loss": 0.9902, + "step": 56053 + }, + { + "epoch": 1.44, + "learning_rate": 1.1166690271402386e-06, + "loss": 0.5962, + "step": 56054 + }, + { + "epoch": 1.44, + "learning_rate": 1.1166415456073504e-06, + "loss": 0.488, + "step": 56055 + }, + { + "epoch": 1.44, + "learning_rate": 1.1166140639851551e-06, + "loss": 0.5186, + "step": 56056 + }, + { + "epoch": 1.44, + "learning_rate": 1.1165865822736739e-06, + "loss": 0.7314, + "step": 56057 + }, + { + "epoch": 1.44, + "learning_rate": 1.1165591004729278e-06, + "loss": 0.5776, + "step": 56058 + }, + { + "epoch": 1.44, + "learning_rate": 1.1165316185829373e-06, + "loss": 0.5889, + "step": 56059 + }, + { + "epoch": 1.44, + "learning_rate": 1.1165041366037244e-06, + "loss": 0.5526, + "step": 56060 + }, + { + "epoch": 1.44, + "learning_rate": 1.1164766545353094e-06, + "loss": 0.8545, + "step": 56061 + }, + { + "epoch": 1.44, + "learning_rate": 1.1164491723777137e-06, + "loss": 0.7227, + "step": 56062 + }, + { + "epoch": 1.44, + "learning_rate": 1.1164216901309582e-06, + "loss": 0.6294, + "step": 56063 + }, + { + "epoch": 1.44, + "learning_rate": 1.116394207795064e-06, + "loss": 0.5259, + "step": 56064 + }, + { + "epoch": 1.44, + "learning_rate": 1.1163667253700519e-06, + "loss": 0.5293, + "step": 56065 + }, + { + "epoch": 1.44, + "learning_rate": 1.1163392428559432e-06, + "loss": 0.5957, + "step": 56066 + }, + { + "epoch": 1.44, + "learning_rate": 1.1163117602527592e-06, + "loss": 0.6104, + "step": 56067 + }, + { + "epoch": 1.44, + "learning_rate": 1.11628427756052e-06, + "loss": 0.6846, + "step": 56068 + }, + { + "epoch": 1.44, + "learning_rate": 1.116256794779248e-06, + "loss": 0.6113, + "step": 56069 + }, + { + "epoch": 1.44, + "learning_rate": 1.116229311908963e-06, + "loss": 0.5088, + "step": 56070 + }, + { + "epoch": 1.44, + "learning_rate": 1.1162018289496868e-06, + "loss": 0.7163, + "step": 56071 + }, + { + "epoch": 1.44, + "learning_rate": 1.1161743459014404e-06, + "loss": 0.7725, + "step": 56072 + }, + { + "epoch": 1.44, + "learning_rate": 1.1161468627642443e-06, + "loss": 0.5996, + "step": 56073 + }, + { + "epoch": 1.44, + "learning_rate": 1.11611937953812e-06, + "loss": 0.5226, + "step": 56074 + }, + { + "epoch": 1.44, + "learning_rate": 1.1160918962230884e-06, + "loss": 0.4551, + "step": 56075 + }, + { + "epoch": 1.44, + "learning_rate": 1.1160644128191703e-06, + "loss": 0.5898, + "step": 56076 + }, + { + "epoch": 1.44, + "learning_rate": 1.1160369293263876e-06, + "loss": 0.7627, + "step": 56077 + }, + { + "epoch": 1.44, + "learning_rate": 1.1160094457447603e-06, + "loss": 0.7373, + "step": 56078 + }, + { + "epoch": 1.44, + "learning_rate": 1.1159819620743102e-06, + "loss": 0.7515, + "step": 56079 + }, + { + "epoch": 1.44, + "learning_rate": 1.1159544783150577e-06, + "loss": 0.6685, + "step": 56080 + }, + { + "epoch": 1.44, + "learning_rate": 1.1159269944670246e-06, + "loss": 0.6045, + "step": 56081 + }, + { + "epoch": 1.44, + "learning_rate": 1.1158995105302313e-06, + "loss": 0.5063, + "step": 56082 + }, + { + "epoch": 1.44, + "learning_rate": 1.115872026504699e-06, + "loss": 0.7148, + "step": 56083 + }, + { + "epoch": 1.44, + "learning_rate": 1.115844542390449e-06, + "loss": 0.5073, + "step": 56084 + }, + { + "epoch": 1.44, + "learning_rate": 1.1158170581875022e-06, + "loss": 0.6045, + "step": 56085 + }, + { + "epoch": 1.44, + "learning_rate": 1.1157895738958794e-06, + "loss": 0.7607, + "step": 56086 + }, + { + "epoch": 1.44, + "learning_rate": 1.1157620895156019e-06, + "loss": 0.6196, + "step": 56087 + }, + { + "epoch": 1.44, + "learning_rate": 1.1157346050466906e-06, + "loss": 0.6348, + "step": 56088 + }, + { + "epoch": 1.44, + "learning_rate": 1.1157071204891668e-06, + "loss": 0.5947, + "step": 56089 + }, + { + "epoch": 1.44, + "learning_rate": 1.1156796358430514e-06, + "loss": 0.7456, + "step": 56090 + }, + { + "epoch": 1.44, + "learning_rate": 1.115652151108365e-06, + "loss": 0.7026, + "step": 56091 + }, + { + "epoch": 1.44, + "learning_rate": 1.1156246662851298e-06, + "loss": 0.4658, + "step": 56092 + }, + { + "epoch": 1.44, + "learning_rate": 1.1155971813733658e-06, + "loss": 0.7168, + "step": 56093 + }, + { + "epoch": 1.44, + "learning_rate": 1.1155696963730942e-06, + "loss": 0.6035, + "step": 56094 + }, + { + "epoch": 1.44, + "learning_rate": 1.1155422112843363e-06, + "loss": 0.7227, + "step": 56095 + }, + { + "epoch": 1.44, + "learning_rate": 1.115514726107113e-06, + "loss": 0.5825, + "step": 56096 + }, + { + "epoch": 1.44, + "learning_rate": 1.1154872408414455e-06, + "loss": 0.6699, + "step": 56097 + }, + { + "epoch": 1.44, + "learning_rate": 1.1154597554873548e-06, + "loss": 0.6895, + "step": 56098 + }, + { + "epoch": 1.44, + "learning_rate": 1.1154322700448615e-06, + "loss": 0.6533, + "step": 56099 + }, + { + "epoch": 1.44, + "learning_rate": 1.1154047845139874e-06, + "loss": 0.7549, + "step": 56100 + }, + { + "epoch": 1.44, + "learning_rate": 1.1153772988947528e-06, + "loss": 0.5684, + "step": 56101 + }, + { + "epoch": 1.44, + "learning_rate": 1.1153498131871796e-06, + "loss": 0.6665, + "step": 56102 + }, + { + "epoch": 1.44, + "learning_rate": 1.1153223273912876e-06, + "loss": 0.6592, + "step": 56103 + }, + { + "epoch": 1.44, + "learning_rate": 1.1152948415070993e-06, + "loss": 0.71, + "step": 56104 + }, + { + "epoch": 1.44, + "learning_rate": 1.1152673555346347e-06, + "loss": 0.7021, + "step": 56105 + }, + { + "epoch": 1.44, + "learning_rate": 1.1152398694739154e-06, + "loss": 0.4054, + "step": 56106 + }, + { + "epoch": 1.44, + "learning_rate": 1.1152123833249623e-06, + "loss": 0.4995, + "step": 56107 + }, + { + "epoch": 1.44, + "learning_rate": 1.115184897087796e-06, + "loss": 0.7715, + "step": 56108 + }, + { + "epoch": 1.44, + "learning_rate": 1.115157410762438e-06, + "loss": 0.3291, + "step": 56109 + }, + { + "epoch": 1.44, + "learning_rate": 1.1151299243489094e-06, + "loss": 0.7812, + "step": 56110 + }, + { + "epoch": 1.44, + "learning_rate": 1.1151024378472311e-06, + "loss": 0.5278, + "step": 56111 + }, + { + "epoch": 1.44, + "learning_rate": 1.1150749512574243e-06, + "loss": 0.5847, + "step": 56112 + }, + { + "epoch": 1.44, + "learning_rate": 1.1150474645795096e-06, + "loss": 0.6235, + "step": 56113 + }, + { + "epoch": 1.44, + "learning_rate": 1.1150199778135085e-06, + "loss": 0.7744, + "step": 56114 + }, + { + "epoch": 1.44, + "learning_rate": 1.1149924909594418e-06, + "loss": 0.6006, + "step": 56115 + }, + { + "epoch": 1.44, + "learning_rate": 1.1149650040173305e-06, + "loss": 0.5485, + "step": 56116 + }, + { + "epoch": 1.44, + "learning_rate": 1.1149375169871964e-06, + "loss": 0.689, + "step": 56117 + }, + { + "epoch": 1.44, + "learning_rate": 1.1149100298690594e-06, + "loss": 0.6013, + "step": 56118 + }, + { + "epoch": 1.44, + "learning_rate": 1.1148825426629415e-06, + "loss": 0.5591, + "step": 56119 + }, + { + "epoch": 1.44, + "learning_rate": 1.1148550553688628e-06, + "loss": 0.7812, + "step": 56120 + }, + { + "epoch": 1.44, + "learning_rate": 1.114827567986845e-06, + "loss": 0.6475, + "step": 56121 + }, + { + "epoch": 1.44, + "learning_rate": 1.114800080516909e-06, + "loss": 0.4561, + "step": 56122 + }, + { + "epoch": 1.44, + "learning_rate": 1.1147725929590763e-06, + "loss": 0.6025, + "step": 56123 + }, + { + "epoch": 1.44, + "learning_rate": 1.114745105313367e-06, + "loss": 0.5347, + "step": 56124 + }, + { + "epoch": 1.44, + "learning_rate": 1.1147176175798027e-06, + "loss": 0.5701, + "step": 56125 + }, + { + "epoch": 1.44, + "learning_rate": 1.1146901297584045e-06, + "loss": 0.5947, + "step": 56126 + }, + { + "epoch": 1.44, + "learning_rate": 1.1146626418491933e-06, + "loss": 0.6953, + "step": 56127 + }, + { + "epoch": 1.44, + "learning_rate": 1.1146351538521903e-06, + "loss": 0.5425, + "step": 56128 + }, + { + "epoch": 1.44, + "learning_rate": 1.1146076657674166e-06, + "loss": 0.7544, + "step": 56129 + }, + { + "epoch": 1.44, + "learning_rate": 1.1145801775948927e-06, + "loss": 0.6777, + "step": 56130 + }, + { + "epoch": 1.44, + "learning_rate": 1.1145526893346402e-06, + "loss": 0.7354, + "step": 56131 + }, + { + "epoch": 1.44, + "learning_rate": 1.11452520098668e-06, + "loss": 0.6182, + "step": 56132 + }, + { + "epoch": 1.44, + "learning_rate": 1.1144977125510329e-06, + "loss": 0.6196, + "step": 56133 + }, + { + "epoch": 1.44, + "learning_rate": 1.1144702240277205e-06, + "loss": 0.645, + "step": 56134 + }, + { + "epoch": 1.44, + "learning_rate": 1.114442735416763e-06, + "loss": 0.8311, + "step": 56135 + }, + { + "epoch": 1.44, + "learning_rate": 1.1144152467181824e-06, + "loss": 0.7324, + "step": 56136 + }, + { + "epoch": 1.44, + "learning_rate": 1.1143877579319993e-06, + "loss": 0.5928, + "step": 56137 + }, + { + "epoch": 1.44, + "learning_rate": 1.1143602690582348e-06, + "loss": 0.8369, + "step": 56138 + }, + { + "epoch": 1.44, + "learning_rate": 1.1143327800969096e-06, + "loss": 0.6377, + "step": 56139 + }, + { + "epoch": 1.44, + "learning_rate": 1.1143052910480453e-06, + "loss": 0.6016, + "step": 56140 + }, + { + "epoch": 1.44, + "learning_rate": 1.1142778019116623e-06, + "loss": 0.6846, + "step": 56141 + }, + { + "epoch": 1.44, + "learning_rate": 1.1142503126877827e-06, + "loss": 0.5918, + "step": 56142 + }, + { + "epoch": 1.44, + "learning_rate": 1.1142228233764263e-06, + "loss": 0.6714, + "step": 56143 + }, + { + "epoch": 1.44, + "learning_rate": 1.1141953339776151e-06, + "loss": 0.5918, + "step": 56144 + }, + { + "epoch": 1.44, + "learning_rate": 1.1141678444913696e-06, + "loss": 0.6426, + "step": 56145 + }, + { + "epoch": 1.44, + "learning_rate": 1.114140354917711e-06, + "loss": 0.7427, + "step": 56146 + }, + { + "epoch": 1.44, + "learning_rate": 1.1141128652566608e-06, + "loss": 0.6875, + "step": 56147 + }, + { + "epoch": 1.44, + "learning_rate": 1.1140853755082393e-06, + "loss": 0.5864, + "step": 56148 + }, + { + "epoch": 1.44, + "learning_rate": 1.1140578856724676e-06, + "loss": 0.6306, + "step": 56149 + }, + { + "epoch": 1.44, + "learning_rate": 1.1140303957493676e-06, + "loss": 0.4751, + "step": 56150 + }, + { + "epoch": 1.44, + "learning_rate": 1.114002905738959e-06, + "loss": 0.6072, + "step": 56151 + }, + { + "epoch": 1.44, + "learning_rate": 1.1139754156412642e-06, + "loss": 0.7783, + "step": 56152 + }, + { + "epoch": 1.44, + "learning_rate": 1.1139479254563036e-06, + "loss": 0.5911, + "step": 56153 + }, + { + "epoch": 1.44, + "learning_rate": 1.1139204351840983e-06, + "loss": 0.7124, + "step": 56154 + }, + { + "epoch": 1.44, + "learning_rate": 1.1138929448246692e-06, + "loss": 0.5645, + "step": 56155 + }, + { + "epoch": 1.44, + "learning_rate": 1.1138654543780375e-06, + "loss": 0.7168, + "step": 56156 + }, + { + "epoch": 1.44, + "learning_rate": 1.1138379638442248e-06, + "loss": 0.8301, + "step": 56157 + }, + { + "epoch": 1.44, + "learning_rate": 1.113810473223251e-06, + "loss": 0.6812, + "step": 56158 + }, + { + "epoch": 1.44, + "learning_rate": 1.1137829825151378e-06, + "loss": 0.626, + "step": 56159 + }, + { + "epoch": 1.44, + "learning_rate": 1.1137554917199063e-06, + "loss": 0.7812, + "step": 56160 + }, + { + "epoch": 1.44, + "learning_rate": 1.1137280008375775e-06, + "loss": 0.7217, + "step": 56161 + }, + { + "epoch": 1.44, + "learning_rate": 1.1137005098681726e-06, + "loss": 0.5591, + "step": 56162 + }, + { + "epoch": 1.44, + "learning_rate": 1.1136730188117123e-06, + "loss": 0.6294, + "step": 56163 + }, + { + "epoch": 1.44, + "learning_rate": 1.1136455276682174e-06, + "loss": 0.5186, + "step": 56164 + }, + { + "epoch": 1.44, + "learning_rate": 1.11361803643771e-06, + "loss": 0.5942, + "step": 56165 + }, + { + "epoch": 1.44, + "learning_rate": 1.11359054512021e-06, + "loss": 0.8398, + "step": 56166 + }, + { + "epoch": 1.44, + "learning_rate": 1.1135630537157392e-06, + "loss": 0.5264, + "step": 56167 + }, + { + "epoch": 1.44, + "learning_rate": 1.1135355622243183e-06, + "loss": 0.8037, + "step": 56168 + }, + { + "epoch": 1.44, + "learning_rate": 1.1135080706459686e-06, + "loss": 0.7002, + "step": 56169 + }, + { + "epoch": 1.44, + "learning_rate": 1.1134805789807107e-06, + "loss": 0.5952, + "step": 56170 + }, + { + "epoch": 1.44, + "learning_rate": 1.1134530872285661e-06, + "loss": 0.7715, + "step": 56171 + }, + { + "epoch": 1.44, + "learning_rate": 1.1134255953895557e-06, + "loss": 0.6807, + "step": 56172 + }, + { + "epoch": 1.44, + "learning_rate": 1.1133981034637004e-06, + "loss": 0.5659, + "step": 56173 + }, + { + "epoch": 1.44, + "learning_rate": 1.1133706114510216e-06, + "loss": 0.5739, + "step": 56174 + }, + { + "epoch": 1.44, + "learning_rate": 1.1133431193515399e-06, + "loss": 0.6187, + "step": 56175 + }, + { + "epoch": 1.44, + "learning_rate": 1.1133156271652767e-06, + "loss": 0.625, + "step": 56176 + }, + { + "epoch": 1.44, + "learning_rate": 1.113288134892253e-06, + "loss": 0.4863, + "step": 56177 + }, + { + "epoch": 1.44, + "learning_rate": 1.1132606425324898e-06, + "loss": 0.625, + "step": 56178 + }, + { + "epoch": 1.44, + "learning_rate": 1.113233150086008e-06, + "loss": 0.6797, + "step": 56179 + }, + { + "epoch": 1.44, + "learning_rate": 1.1132056575528288e-06, + "loss": 0.6064, + "step": 56180 + }, + { + "epoch": 1.44, + "learning_rate": 1.113178164932973e-06, + "loss": 0.6558, + "step": 56181 + }, + { + "epoch": 1.44, + "learning_rate": 1.1131506722264625e-06, + "loss": 0.5703, + "step": 56182 + }, + { + "epoch": 1.44, + "learning_rate": 1.1131231794333174e-06, + "loss": 0.5815, + "step": 56183 + }, + { + "epoch": 1.44, + "learning_rate": 1.1130956865535591e-06, + "loss": 0.6104, + "step": 56184 + }, + { + "epoch": 1.44, + "learning_rate": 1.1130681935872085e-06, + "loss": 0.7725, + "step": 56185 + }, + { + "epoch": 1.44, + "learning_rate": 1.1130407005342868e-06, + "loss": 0.7295, + "step": 56186 + }, + { + "epoch": 1.44, + "learning_rate": 1.1130132073948153e-06, + "loss": 0.6636, + "step": 56187 + }, + { + "epoch": 1.44, + "learning_rate": 1.1129857141688145e-06, + "loss": 0.7168, + "step": 56188 + }, + { + "epoch": 1.44, + "learning_rate": 1.1129582208563057e-06, + "loss": 0.6992, + "step": 56189 + }, + { + "epoch": 1.44, + "learning_rate": 1.1129307274573103e-06, + "loss": 0.584, + "step": 56190 + }, + { + "epoch": 1.44, + "learning_rate": 1.1129032339718487e-06, + "loss": 0.667, + "step": 56191 + }, + { + "epoch": 1.44, + "learning_rate": 1.1128757403999428e-06, + "loss": 0.7139, + "step": 56192 + }, + { + "epoch": 1.44, + "learning_rate": 1.1128482467416128e-06, + "loss": 0.7275, + "step": 56193 + }, + { + "epoch": 1.44, + "learning_rate": 1.1128207529968801e-06, + "loss": 0.7568, + "step": 56194 + }, + { + "epoch": 1.44, + "learning_rate": 1.1127932591657654e-06, + "loss": 0.9424, + "step": 56195 + }, + { + "epoch": 1.44, + "learning_rate": 1.1127657652482905e-06, + "loss": 0.6626, + "step": 56196 + }, + { + "epoch": 1.44, + "learning_rate": 1.112738271244476e-06, + "loss": 0.5125, + "step": 56197 + }, + { + "epoch": 1.44, + "learning_rate": 1.1127107771543427e-06, + "loss": 0.6304, + "step": 56198 + }, + { + "epoch": 1.44, + "learning_rate": 1.1126832829779123e-06, + "loss": 0.55, + "step": 56199 + }, + { + "epoch": 1.44, + "learning_rate": 1.1126557887152053e-06, + "loss": 0.5474, + "step": 56200 + }, + { + "epoch": 1.44, + "learning_rate": 1.1126282943662432e-06, + "loss": 0.7305, + "step": 56201 + }, + { + "epoch": 1.44, + "learning_rate": 1.1126007999310465e-06, + "loss": 0.5562, + "step": 56202 + }, + { + "epoch": 1.44, + "learning_rate": 1.1125733054096368e-06, + "loss": 0.4964, + "step": 56203 + }, + { + "epoch": 1.44, + "learning_rate": 1.1125458108020344e-06, + "loss": 0.5952, + "step": 56204 + }, + { + "epoch": 1.44, + "learning_rate": 1.1125183161082613e-06, + "loss": 0.7676, + "step": 56205 + }, + { + "epoch": 1.44, + "learning_rate": 1.1124908213283377e-06, + "loss": 0.4214, + "step": 56206 + }, + { + "epoch": 1.44, + "learning_rate": 1.112463326462286e-06, + "loss": 0.6299, + "step": 56207 + }, + { + "epoch": 1.44, + "learning_rate": 1.1124358315101252e-06, + "loss": 0.6885, + "step": 56208 + }, + { + "epoch": 1.44, + "learning_rate": 1.112408336471878e-06, + "loss": 0.6553, + "step": 56209 + }, + { + "epoch": 1.44, + "learning_rate": 1.1123808413475645e-06, + "loss": 0.7197, + "step": 56210 + }, + { + "epoch": 1.44, + "learning_rate": 1.1123533461372065e-06, + "loss": 0.6167, + "step": 56211 + }, + { + "epoch": 1.44, + "learning_rate": 1.112325850840825e-06, + "loss": 0.7695, + "step": 56212 + }, + { + "epoch": 1.44, + "learning_rate": 1.1122983554584405e-06, + "loss": 0.6416, + "step": 56213 + }, + { + "epoch": 1.44, + "learning_rate": 1.112270859990074e-06, + "loss": 0.751, + "step": 56214 + }, + { + "epoch": 1.44, + "learning_rate": 1.112243364435747e-06, + "loss": 0.7578, + "step": 56215 + }, + { + "epoch": 1.44, + "learning_rate": 1.1122158687954803e-06, + "loss": 0.6855, + "step": 56216 + }, + { + "epoch": 1.44, + "learning_rate": 1.1121883730692955e-06, + "loss": 0.6284, + "step": 56217 + }, + { + "epoch": 1.44, + "learning_rate": 1.1121608772572132e-06, + "loss": 0.7568, + "step": 56218 + }, + { + "epoch": 1.44, + "learning_rate": 1.1121333813592542e-06, + "loss": 0.6021, + "step": 56219 + }, + { + "epoch": 1.44, + "learning_rate": 1.1121058853754397e-06, + "loss": 0.4985, + "step": 56220 + }, + { + "epoch": 1.44, + "learning_rate": 1.1120783893057911e-06, + "loss": 0.6072, + "step": 56221 + }, + { + "epoch": 1.44, + "learning_rate": 1.1120508931503295e-06, + "loss": 0.6846, + "step": 56222 + }, + { + "epoch": 1.44, + "learning_rate": 1.112023396909075e-06, + "loss": 0.7461, + "step": 56223 + }, + { + "epoch": 1.44, + "learning_rate": 1.11199590058205e-06, + "loss": 0.6367, + "step": 56224 + }, + { + "epoch": 1.44, + "learning_rate": 1.1119684041692745e-06, + "loss": 0.605, + "step": 56225 + }, + { + "epoch": 1.44, + "learning_rate": 1.11194090767077e-06, + "loss": 0.55, + "step": 56226 + }, + { + "epoch": 1.44, + "learning_rate": 1.1119134110865576e-06, + "loss": 0.4449, + "step": 56227 + }, + { + "epoch": 1.44, + "learning_rate": 1.1118859144166583e-06, + "loss": 0.6157, + "step": 56228 + }, + { + "epoch": 1.44, + "learning_rate": 1.111858417661093e-06, + "loss": 0.7402, + "step": 56229 + }, + { + "epoch": 1.44, + "learning_rate": 1.1118309208198828e-06, + "loss": 0.8242, + "step": 56230 + }, + { + "epoch": 1.44, + "learning_rate": 1.1118034238930488e-06, + "loss": 0.7559, + "step": 56231 + }, + { + "epoch": 1.44, + "learning_rate": 1.1117759268806123e-06, + "loss": 0.6514, + "step": 56232 + }, + { + "epoch": 1.44, + "learning_rate": 1.111748429782594e-06, + "loss": 0.7012, + "step": 56233 + }, + { + "epoch": 1.44, + "learning_rate": 1.111720932599015e-06, + "loss": 0.5139, + "step": 56234 + }, + { + "epoch": 1.44, + "learning_rate": 1.1116934353298961e-06, + "loss": 0.708, + "step": 56235 + }, + { + "epoch": 1.44, + "learning_rate": 1.111665937975259e-06, + "loss": 0.5293, + "step": 56236 + }, + { + "epoch": 1.44, + "learning_rate": 1.1116384405351247e-06, + "loss": 0.7295, + "step": 56237 + }, + { + "epoch": 1.44, + "learning_rate": 1.1116109430095137e-06, + "loss": 0.7212, + "step": 56238 + }, + { + "epoch": 1.44, + "learning_rate": 1.1115834453984471e-06, + "loss": 0.8047, + "step": 56239 + }, + { + "epoch": 1.44, + "learning_rate": 1.1115559477019464e-06, + "loss": 0.5708, + "step": 56240 + }, + { + "epoch": 1.44, + "learning_rate": 1.1115284499200324e-06, + "loss": 0.6548, + "step": 56241 + }, + { + "epoch": 1.44, + "learning_rate": 1.1115009520527262e-06, + "loss": 0.7363, + "step": 56242 + }, + { + "epoch": 1.44, + "learning_rate": 1.1114734541000491e-06, + "loss": 0.5742, + "step": 56243 + }, + { + "epoch": 1.44, + "learning_rate": 1.1114459560620216e-06, + "loss": 0.4998, + "step": 56244 + }, + { + "epoch": 1.44, + "learning_rate": 1.1114184579386652e-06, + "loss": 0.7236, + "step": 56245 + }, + { + "epoch": 1.44, + "learning_rate": 1.1113909597300007e-06, + "loss": 0.5808, + "step": 56246 + }, + { + "epoch": 1.44, + "learning_rate": 1.1113634614360496e-06, + "loss": 0.6262, + "step": 56247 + }, + { + "epoch": 1.44, + "learning_rate": 1.1113359630568323e-06, + "loss": 0.6899, + "step": 56248 + }, + { + "epoch": 1.44, + "learning_rate": 1.11130846459237e-06, + "loss": 0.6479, + "step": 56249 + }, + { + "epoch": 1.44, + "learning_rate": 1.1112809660426842e-06, + "loss": 0.522, + "step": 56250 + }, + { + "epoch": 1.44, + "learning_rate": 1.1112534674077957e-06, + "loss": 0.7188, + "step": 56251 + }, + { + "epoch": 1.44, + "learning_rate": 1.1112259686877255e-06, + "loss": 0.6997, + "step": 56252 + }, + { + "epoch": 1.44, + "learning_rate": 1.1111984698824947e-06, + "loss": 0.6248, + "step": 56253 + }, + { + "epoch": 1.44, + "learning_rate": 1.1111709709921242e-06, + "loss": 0.8174, + "step": 56254 + }, + { + "epoch": 1.44, + "learning_rate": 1.1111434720166353e-06, + "loss": 0.646, + "step": 56255 + }, + { + "epoch": 1.44, + "learning_rate": 1.1111159729560488e-06, + "loss": 0.7075, + "step": 56256 + }, + { + "epoch": 1.44, + "learning_rate": 1.1110884738103863e-06, + "loss": 0.6392, + "step": 56257 + }, + { + "epoch": 1.44, + "learning_rate": 1.1110609745796682e-06, + "loss": 0.7383, + "step": 56258 + }, + { + "epoch": 1.44, + "learning_rate": 1.1110334752639158e-06, + "loss": 0.5527, + "step": 56259 + }, + { + "epoch": 1.44, + "learning_rate": 1.11100597586315e-06, + "loss": 0.7061, + "step": 56260 + }, + { + "epoch": 1.44, + "learning_rate": 1.1109784763773924e-06, + "loss": 0.7324, + "step": 56261 + }, + { + "epoch": 1.44, + "learning_rate": 1.1109509768066636e-06, + "loss": 0.8184, + "step": 56262 + }, + { + "epoch": 1.44, + "learning_rate": 1.1109234771509846e-06, + "loss": 0.6719, + "step": 56263 + }, + { + "epoch": 1.44, + "learning_rate": 1.1108959774103768e-06, + "loss": 0.623, + "step": 56264 + }, + { + "epoch": 1.44, + "learning_rate": 1.110868477584861e-06, + "loss": 0.7734, + "step": 56265 + }, + { + "epoch": 1.44, + "learning_rate": 1.110840977674458e-06, + "loss": 0.623, + "step": 56266 + }, + { + "epoch": 1.44, + "learning_rate": 1.1108134776791892e-06, + "loss": 0.7168, + "step": 56267 + }, + { + "epoch": 1.44, + "learning_rate": 1.110785977599076e-06, + "loss": 0.4246, + "step": 56268 + }, + { + "epoch": 1.44, + "learning_rate": 1.1107584774341388e-06, + "loss": 0.6787, + "step": 56269 + }, + { + "epoch": 1.44, + "learning_rate": 1.110730977184399e-06, + "loss": 0.5225, + "step": 56270 + }, + { + "epoch": 1.44, + "learning_rate": 1.1107034768498774e-06, + "loss": 0.7051, + "step": 56271 + }, + { + "epoch": 1.44, + "learning_rate": 1.1106759764305957e-06, + "loss": 0.5703, + "step": 56272 + }, + { + "epoch": 1.44, + "learning_rate": 1.110648475926574e-06, + "loss": 0.5923, + "step": 56273 + }, + { + "epoch": 1.44, + "learning_rate": 1.1106209753378342e-06, + "loss": 0.6182, + "step": 56274 + }, + { + "epoch": 1.44, + "learning_rate": 1.1105934746643968e-06, + "loss": 0.6816, + "step": 56275 + }, + { + "epoch": 1.44, + "learning_rate": 1.1105659739062832e-06, + "loss": 0.4753, + "step": 56276 + }, + { + "epoch": 1.44, + "learning_rate": 1.110538473063514e-06, + "loss": 0.6772, + "step": 56277 + }, + { + "epoch": 1.44, + "learning_rate": 1.110510972136111e-06, + "loss": 0.75, + "step": 56278 + }, + { + "epoch": 1.44, + "learning_rate": 1.1104834711240944e-06, + "loss": 0.4956, + "step": 56279 + }, + { + "epoch": 1.44, + "learning_rate": 1.1104559700274862e-06, + "loss": 0.5151, + "step": 56280 + }, + { + "epoch": 1.44, + "learning_rate": 1.1104284688463063e-06, + "loss": 0.6826, + "step": 56281 + }, + { + "epoch": 1.44, + "learning_rate": 1.1104009675805771e-06, + "loss": 0.7178, + "step": 56282 + }, + { + "epoch": 1.44, + "learning_rate": 1.1103734662303185e-06, + "loss": 0.7144, + "step": 56283 + }, + { + "epoch": 1.44, + "learning_rate": 1.1103459647955525e-06, + "loss": 0.6943, + "step": 56284 + }, + { + "epoch": 1.44, + "learning_rate": 1.110318463276299e-06, + "loss": 0.5605, + "step": 56285 + }, + { + "epoch": 1.44, + "learning_rate": 1.1102909616725803e-06, + "loss": 0.6787, + "step": 56286 + }, + { + "epoch": 1.44, + "learning_rate": 1.1102634599844165e-06, + "loss": 0.6406, + "step": 56287 + }, + { + "epoch": 1.44, + "learning_rate": 1.110235958211829e-06, + "loss": 0.52, + "step": 56288 + }, + { + "epoch": 1.44, + "learning_rate": 1.110208456354839e-06, + "loss": 0.5923, + "step": 56289 + }, + { + "epoch": 1.44, + "learning_rate": 1.1101809544134674e-06, + "loss": 0.6514, + "step": 56290 + }, + { + "epoch": 1.44, + "learning_rate": 1.1101534523877356e-06, + "loss": 0.6924, + "step": 56291 + }, + { + "epoch": 1.44, + "learning_rate": 1.110125950277664e-06, + "loss": 0.5315, + "step": 56292 + }, + { + "epoch": 1.44, + "learning_rate": 1.1100984480832744e-06, + "loss": 0.7354, + "step": 56293 + }, + { + "epoch": 1.44, + "learning_rate": 1.1100709458045872e-06, + "loss": 0.5557, + "step": 56294 + }, + { + "epoch": 1.44, + "learning_rate": 1.110043443441624e-06, + "loss": 0.4961, + "step": 56295 + }, + { + "epoch": 1.44, + "learning_rate": 1.1100159409944052e-06, + "loss": 0.8467, + "step": 56296 + }, + { + "epoch": 1.44, + "learning_rate": 1.1099884384629526e-06, + "loss": 0.7793, + "step": 56297 + }, + { + "epoch": 1.44, + "learning_rate": 1.1099609358472869e-06, + "loss": 0.5791, + "step": 56298 + }, + { + "epoch": 1.44, + "learning_rate": 1.1099334331474288e-06, + "loss": 0.623, + "step": 56299 + }, + { + "epoch": 1.44, + "learning_rate": 1.1099059303633999e-06, + "loss": 0.7744, + "step": 56300 + }, + { + "epoch": 1.44, + "learning_rate": 1.1098784274952216e-06, + "loss": 0.7256, + "step": 56301 + }, + { + "epoch": 1.44, + "learning_rate": 1.1098509245429138e-06, + "loss": 0.6189, + "step": 56302 + }, + { + "epoch": 1.44, + "learning_rate": 1.1098234215064983e-06, + "loss": 0.5659, + "step": 56303 + }, + { + "epoch": 1.44, + "learning_rate": 1.109795918385996e-06, + "loss": 0.6904, + "step": 56304 + }, + { + "epoch": 1.44, + "learning_rate": 1.1097684151814281e-06, + "loss": 0.6465, + "step": 56305 + }, + { + "epoch": 1.44, + "learning_rate": 1.1097409118928157e-06, + "loss": 0.4412, + "step": 56306 + }, + { + "epoch": 1.44, + "learning_rate": 1.1097134085201795e-06, + "loss": 0.7998, + "step": 56307 + }, + { + "epoch": 1.44, + "learning_rate": 1.1096859050635412e-06, + "loss": 0.7002, + "step": 56308 + }, + { + "epoch": 1.44, + "learning_rate": 1.1096584015229214e-06, + "loss": 0.542, + "step": 56309 + }, + { + "epoch": 1.44, + "learning_rate": 1.1096308978983406e-06, + "loss": 0.6914, + "step": 56310 + }, + { + "epoch": 1.44, + "learning_rate": 1.109603394189821e-06, + "loss": 0.7559, + "step": 56311 + }, + { + "epoch": 1.44, + "learning_rate": 1.109575890397383e-06, + "loss": 0.6787, + "step": 56312 + }, + { + "epoch": 1.44, + "learning_rate": 1.1095483865210478e-06, + "loss": 0.75, + "step": 56313 + }, + { + "epoch": 1.44, + "learning_rate": 1.1095208825608365e-06, + "loss": 0.7959, + "step": 56314 + }, + { + "epoch": 1.44, + "learning_rate": 1.1094933785167698e-06, + "loss": 0.8008, + "step": 56315 + }, + { + "epoch": 1.44, + "learning_rate": 1.1094658743888694e-06, + "loss": 0.749, + "step": 56316 + }, + { + "epoch": 1.44, + "learning_rate": 1.1094383701771556e-06, + "loss": 0.5176, + "step": 56317 + }, + { + "epoch": 1.44, + "learning_rate": 1.1094108658816504e-06, + "loss": 0.5708, + "step": 56318 + }, + { + "epoch": 1.44, + "learning_rate": 1.109383361502374e-06, + "loss": 0.6504, + "step": 56319 + }, + { + "epoch": 1.44, + "learning_rate": 1.1093558570393478e-06, + "loss": 0.6553, + "step": 56320 + }, + { + "epoch": 1.44, + "learning_rate": 1.109328352492593e-06, + "loss": 0.6279, + "step": 56321 + }, + { + "epoch": 1.44, + "learning_rate": 1.1093008478621304e-06, + "loss": 0.7393, + "step": 56322 + }, + { + "epoch": 1.44, + "learning_rate": 1.109273343147981e-06, + "loss": 0.5605, + "step": 56323 + }, + { + "epoch": 1.44, + "learning_rate": 1.1092458383501663e-06, + "loss": 0.541, + "step": 56324 + }, + { + "epoch": 1.44, + "learning_rate": 1.1092183334687068e-06, + "loss": 0.623, + "step": 56325 + }, + { + "epoch": 1.44, + "learning_rate": 1.1091908285036243e-06, + "loss": 0.5776, + "step": 56326 + }, + { + "epoch": 1.44, + "learning_rate": 1.1091633234549392e-06, + "loss": 0.5137, + "step": 56327 + }, + { + "epoch": 1.44, + "learning_rate": 1.1091358183226728e-06, + "loss": 0.6768, + "step": 56328 + }, + { + "epoch": 1.44, + "learning_rate": 1.1091083131068457e-06, + "loss": 0.6855, + "step": 56329 + }, + { + "epoch": 1.44, + "learning_rate": 1.1090808078074797e-06, + "loss": 0.5562, + "step": 56330 + }, + { + "epoch": 1.44, + "learning_rate": 1.109053302424596e-06, + "loss": 0.5269, + "step": 56331 + }, + { + "epoch": 1.44, + "learning_rate": 1.1090257969582144e-06, + "loss": 0.5513, + "step": 56332 + }, + { + "epoch": 1.44, + "learning_rate": 1.108998291408357e-06, + "loss": 0.6992, + "step": 56333 + }, + { + "epoch": 1.44, + "learning_rate": 1.1089707857750448e-06, + "loss": 0.6943, + "step": 56334 + }, + { + "epoch": 1.44, + "learning_rate": 1.1089432800582985e-06, + "loss": 0.4468, + "step": 56335 + }, + { + "epoch": 1.44, + "learning_rate": 1.1089157742581396e-06, + "loss": 0.8467, + "step": 56336 + }, + { + "epoch": 1.44, + "learning_rate": 1.1088882683745888e-06, + "loss": 0.4954, + "step": 56337 + }, + { + "epoch": 1.44, + "learning_rate": 1.108860762407667e-06, + "loss": 0.5854, + "step": 56338 + }, + { + "epoch": 1.44, + "learning_rate": 1.1088332563573958e-06, + "loss": 0.7012, + "step": 56339 + }, + { + "epoch": 1.44, + "learning_rate": 1.1088057502237958e-06, + "loss": 0.6221, + "step": 56340 + }, + { + "epoch": 1.44, + "learning_rate": 1.1087782440068886e-06, + "loss": 0.5713, + "step": 56341 + }, + { + "epoch": 1.44, + "learning_rate": 1.1087507377066944e-06, + "loss": 0.6562, + "step": 56342 + }, + { + "epoch": 1.44, + "learning_rate": 1.1087232313232351e-06, + "loss": 0.6064, + "step": 56343 + }, + { + "epoch": 1.44, + "learning_rate": 1.1086957248565312e-06, + "loss": 0.7764, + "step": 56344 + }, + { + "epoch": 1.44, + "learning_rate": 1.1086682183066043e-06, + "loss": 0.4702, + "step": 56345 + }, + { + "epoch": 1.44, + "learning_rate": 1.108640711673475e-06, + "loss": 0.543, + "step": 56346 + }, + { + "epoch": 1.44, + "learning_rate": 1.1086132049571645e-06, + "loss": 0.6382, + "step": 56347 + }, + { + "epoch": 1.44, + "learning_rate": 1.1085856981576935e-06, + "loss": 0.8457, + "step": 56348 + }, + { + "epoch": 1.44, + "learning_rate": 1.1085581912750838e-06, + "loss": 0.7754, + "step": 56349 + }, + { + "epoch": 1.44, + "learning_rate": 1.1085306843093561e-06, + "loss": 0.6768, + "step": 56350 + }, + { + "epoch": 1.44, + "learning_rate": 1.1085031772605313e-06, + "loss": 0.7783, + "step": 56351 + }, + { + "epoch": 1.44, + "learning_rate": 1.108475670128631e-06, + "loss": 0.5879, + "step": 56352 + }, + { + "epoch": 1.44, + "learning_rate": 1.1084481629136752e-06, + "loss": 0.5151, + "step": 56353 + }, + { + "epoch": 1.44, + "learning_rate": 1.1084206556156861e-06, + "loss": 0.5261, + "step": 56354 + }, + { + "epoch": 1.44, + "learning_rate": 1.1083931482346842e-06, + "loss": 0.3376, + "step": 56355 + }, + { + "epoch": 1.44, + "learning_rate": 1.1083656407706906e-06, + "loss": 0.5752, + "step": 56356 + }, + { + "epoch": 1.44, + "learning_rate": 1.1083381332237262e-06, + "loss": 0.6621, + "step": 56357 + }, + { + "epoch": 1.44, + "learning_rate": 1.1083106255938126e-06, + "loss": 0.6328, + "step": 56358 + }, + { + "epoch": 1.44, + "learning_rate": 1.1082831178809705e-06, + "loss": 0.6274, + "step": 56359 + }, + { + "epoch": 1.44, + "learning_rate": 1.108255610085221e-06, + "loss": 0.7412, + "step": 56360 + }, + { + "epoch": 1.44, + "learning_rate": 1.1082281022065849e-06, + "loss": 0.6602, + "step": 56361 + }, + { + "epoch": 1.44, + "learning_rate": 1.1082005942450838e-06, + "loss": 0.5127, + "step": 56362 + }, + { + "epoch": 1.44, + "learning_rate": 1.1081730862007384e-06, + "loss": 0.5073, + "step": 56363 + }, + { + "epoch": 1.44, + "learning_rate": 1.1081455780735699e-06, + "loss": 0.5725, + "step": 56364 + }, + { + "epoch": 1.44, + "learning_rate": 1.108118069863599e-06, + "loss": 0.6663, + "step": 56365 + }, + { + "epoch": 1.44, + "learning_rate": 1.1080905615708475e-06, + "loss": 0.876, + "step": 56366 + }, + { + "epoch": 1.44, + "learning_rate": 1.1080630531953357e-06, + "loss": 0.7949, + "step": 56367 + }, + { + "epoch": 1.44, + "learning_rate": 1.1080355447370853e-06, + "loss": 0.6421, + "step": 56368 + }, + { + "epoch": 1.44, + "learning_rate": 1.1080080361961167e-06, + "loss": 0.5767, + "step": 56369 + }, + { + "epoch": 1.44, + "learning_rate": 1.1079805275724513e-06, + "loss": 0.6582, + "step": 56370 + }, + { + "epoch": 1.44, + "learning_rate": 1.1079530188661105e-06, + "loss": 0.4937, + "step": 56371 + }, + { + "epoch": 1.44, + "learning_rate": 1.107925510077115e-06, + "loss": 0.5122, + "step": 56372 + }, + { + "epoch": 1.44, + "learning_rate": 1.1078980012054858e-06, + "loss": 0.6206, + "step": 56373 + }, + { + "epoch": 1.44, + "learning_rate": 1.1078704922512439e-06, + "loss": 0.6416, + "step": 56374 + }, + { + "epoch": 1.44, + "learning_rate": 1.1078429832144105e-06, + "loss": 0.6274, + "step": 56375 + }, + { + "epoch": 1.44, + "learning_rate": 1.107815474095007e-06, + "loss": 0.396, + "step": 56376 + }, + { + "epoch": 1.44, + "learning_rate": 1.1077879648930541e-06, + "loss": 0.55, + "step": 56377 + }, + { + "epoch": 1.44, + "learning_rate": 1.1077604556085727e-06, + "loss": 0.7539, + "step": 56378 + }, + { + "epoch": 1.45, + "learning_rate": 1.1077329462415843e-06, + "loss": 0.6768, + "step": 56379 + }, + { + "epoch": 1.45, + "learning_rate": 1.1077054367921094e-06, + "loss": 0.6792, + "step": 56380 + }, + { + "epoch": 1.45, + "learning_rate": 1.1076779272601698e-06, + "loss": 0.4214, + "step": 56381 + }, + { + "epoch": 1.45, + "learning_rate": 1.107650417645786e-06, + "loss": 0.4958, + "step": 56382 + }, + { + "epoch": 1.45, + "learning_rate": 1.1076229079489793e-06, + "loss": 0.5068, + "step": 56383 + }, + { + "epoch": 1.45, + "learning_rate": 1.1075953981697704e-06, + "loss": 0.8047, + "step": 56384 + }, + { + "epoch": 1.45, + "learning_rate": 1.1075678883081808e-06, + "loss": 0.5239, + "step": 56385 + }, + { + "epoch": 1.45, + "learning_rate": 1.1075403783642317e-06, + "loss": 0.6343, + "step": 56386 + }, + { + "epoch": 1.45, + "learning_rate": 1.1075128683379436e-06, + "loss": 0.5698, + "step": 56387 + }, + { + "epoch": 1.45, + "learning_rate": 1.1074853582293378e-06, + "loss": 0.7754, + "step": 56388 + }, + { + "epoch": 1.45, + "learning_rate": 1.1074578480384356e-06, + "loss": 0.6689, + "step": 56389 + }, + { + "epoch": 1.45, + "learning_rate": 1.1074303377652576e-06, + "loss": 0.6948, + "step": 56390 + }, + { + "epoch": 1.45, + "learning_rate": 1.1074028274098254e-06, + "loss": 0.5737, + "step": 56391 + }, + { + "epoch": 1.45, + "learning_rate": 1.1073753169721596e-06, + "loss": 0.7168, + "step": 56392 + }, + { + "epoch": 1.45, + "learning_rate": 1.1073478064522817e-06, + "loss": 0.439, + "step": 56393 + }, + { + "epoch": 1.45, + "learning_rate": 1.107320295850212e-06, + "loss": 0.7207, + "step": 56394 + }, + { + "epoch": 1.45, + "learning_rate": 1.1072927851659727e-06, + "loss": 0.7285, + "step": 56395 + }, + { + "epoch": 1.45, + "learning_rate": 1.107265274399584e-06, + "loss": 0.4409, + "step": 56396 + }, + { + "epoch": 1.45, + "learning_rate": 1.107237763551067e-06, + "loss": 0.5796, + "step": 56397 + }, + { + "epoch": 1.45, + "learning_rate": 1.1072102526204433e-06, + "loss": 0.5122, + "step": 56398 + }, + { + "epoch": 1.45, + "learning_rate": 1.1071827416077334e-06, + "loss": 0.6602, + "step": 56399 + }, + { + "epoch": 1.45, + "learning_rate": 1.1071552305129587e-06, + "loss": 0.5249, + "step": 56400 + }, + { + "epoch": 1.45, + "learning_rate": 1.1071277193361404e-06, + "loss": 0.5356, + "step": 56401 + }, + { + "epoch": 1.45, + "learning_rate": 1.107100208077299e-06, + "loss": 0.668, + "step": 56402 + }, + { + "epoch": 1.45, + "learning_rate": 1.1070726967364558e-06, + "loss": 0.7998, + "step": 56403 + }, + { + "epoch": 1.45, + "learning_rate": 1.1070451853136324e-06, + "loss": 0.6387, + "step": 56404 + }, + { + "epoch": 1.45, + "learning_rate": 1.1070176738088491e-06, + "loss": 0.4573, + "step": 56405 + }, + { + "epoch": 1.45, + "learning_rate": 1.1069901622221277e-06, + "loss": 0.6602, + "step": 56406 + }, + { + "epoch": 1.45, + "learning_rate": 1.1069626505534884e-06, + "loss": 0.6387, + "step": 56407 + }, + { + "epoch": 1.45, + "learning_rate": 1.1069351388029529e-06, + "loss": 0.707, + "step": 56408 + }, + { + "epoch": 1.45, + "learning_rate": 1.1069076269705416e-06, + "loss": 0.6396, + "step": 56409 + }, + { + "epoch": 1.45, + "learning_rate": 1.1068801150562768e-06, + "loss": 0.6543, + "step": 56410 + }, + { + "epoch": 1.45, + "learning_rate": 1.1068526030601786e-06, + "loss": 0.6377, + "step": 56411 + }, + { + "epoch": 1.45, + "learning_rate": 1.106825090982268e-06, + "loss": 0.5571, + "step": 56412 + }, + { + "epoch": 1.45, + "learning_rate": 1.1067975788225664e-06, + "loss": 0.708, + "step": 56413 + }, + { + "epoch": 1.45, + "learning_rate": 1.106770066581095e-06, + "loss": 0.6528, + "step": 56414 + }, + { + "epoch": 1.45, + "learning_rate": 1.1067425542578747e-06, + "loss": 0.5525, + "step": 56415 + }, + { + "epoch": 1.45, + "learning_rate": 1.1067150418529263e-06, + "loss": 0.7188, + "step": 56416 + }, + { + "epoch": 1.45, + "learning_rate": 1.1066875293662711e-06, + "loss": 0.646, + "step": 56417 + }, + { + "epoch": 1.45, + "learning_rate": 1.1066600167979306e-06, + "loss": 0.5967, + "step": 56418 + }, + { + "epoch": 1.45, + "learning_rate": 1.1066325041479247e-06, + "loss": 0.5171, + "step": 56419 + }, + { + "epoch": 1.45, + "learning_rate": 1.1066049914162757e-06, + "loss": 0.7012, + "step": 56420 + }, + { + "epoch": 1.45, + "learning_rate": 1.1065774786030042e-06, + "loss": 0.6699, + "step": 56421 + }, + { + "epoch": 1.45, + "learning_rate": 1.106549965708131e-06, + "loss": 0.7427, + "step": 56422 + }, + { + "epoch": 1.45, + "learning_rate": 1.1065224527316775e-06, + "loss": 0.665, + "step": 56423 + }, + { + "epoch": 1.45, + "learning_rate": 1.1064949396736644e-06, + "loss": 0.7812, + "step": 56424 + }, + { + "epoch": 1.45, + "learning_rate": 1.1064674265341135e-06, + "loss": 0.791, + "step": 56425 + }, + { + "epoch": 1.45, + "learning_rate": 1.1064399133130451e-06, + "loss": 0.6885, + "step": 56426 + }, + { + "epoch": 1.45, + "learning_rate": 1.1064124000104805e-06, + "loss": 0.6421, + "step": 56427 + }, + { + "epoch": 1.45, + "learning_rate": 1.106384886626441e-06, + "loss": 0.6074, + "step": 56428 + }, + { + "epoch": 1.45, + "learning_rate": 1.1063573731609474e-06, + "loss": 0.6631, + "step": 56429 + }, + { + "epoch": 1.45, + "learning_rate": 1.1063298596140206e-06, + "loss": 0.7188, + "step": 56430 + }, + { + "epoch": 1.45, + "learning_rate": 1.1063023459856825e-06, + "loss": 0.6631, + "step": 56431 + }, + { + "epoch": 1.45, + "learning_rate": 1.1062748322759532e-06, + "loss": 0.6045, + "step": 56432 + }, + { + "epoch": 1.45, + "learning_rate": 1.1062473184848542e-06, + "loss": 0.6421, + "step": 56433 + }, + { + "epoch": 1.45, + "learning_rate": 1.1062198046124062e-06, + "loss": 0.5811, + "step": 56434 + }, + { + "epoch": 1.45, + "learning_rate": 1.106192290658631e-06, + "loss": 0.6694, + "step": 56435 + }, + { + "epoch": 1.45, + "learning_rate": 1.1061647766235492e-06, + "loss": 0.6523, + "step": 56436 + }, + { + "epoch": 1.45, + "learning_rate": 1.106137262507182e-06, + "loss": 0.6421, + "step": 56437 + }, + { + "epoch": 1.45, + "learning_rate": 1.10610974830955e-06, + "loss": 0.665, + "step": 56438 + }, + { + "epoch": 1.45, + "learning_rate": 1.106082234030675e-06, + "loss": 0.6768, + "step": 56439 + }, + { + "epoch": 1.45, + "learning_rate": 1.1060547196705774e-06, + "loss": 0.6299, + "step": 56440 + }, + { + "epoch": 1.45, + "learning_rate": 1.1060272052292789e-06, + "loss": 0.54, + "step": 56441 + }, + { + "epoch": 1.45, + "learning_rate": 1.1059996907068e-06, + "loss": 0.667, + "step": 56442 + }, + { + "epoch": 1.45, + "learning_rate": 1.1059721761031622e-06, + "loss": 0.4976, + "step": 56443 + }, + { + "epoch": 1.45, + "learning_rate": 1.1059446614183862e-06, + "loss": 0.4941, + "step": 56444 + }, + { + "epoch": 1.45, + "learning_rate": 1.1059171466524934e-06, + "loss": 0.627, + "step": 56445 + }, + { + "epoch": 1.45, + "learning_rate": 1.1058896318055047e-06, + "loss": 0.7412, + "step": 56446 + }, + { + "epoch": 1.45, + "learning_rate": 1.105862116877441e-06, + "loss": 0.7568, + "step": 56447 + }, + { + "epoch": 1.45, + "learning_rate": 1.1058346018683239e-06, + "loss": 0.4224, + "step": 56448 + }, + { + "epoch": 1.45, + "learning_rate": 1.1058070867781736e-06, + "loss": 0.5396, + "step": 56449 + }, + { + "epoch": 1.45, + "learning_rate": 1.105779571607012e-06, + "loss": 0.6636, + "step": 56450 + }, + { + "epoch": 1.45, + "learning_rate": 1.10575205635486e-06, + "loss": 0.5659, + "step": 56451 + }, + { + "epoch": 1.45, + "learning_rate": 1.105724541021738e-06, + "loss": 0.7783, + "step": 56452 + }, + { + "epoch": 1.45, + "learning_rate": 1.1056970256076682e-06, + "loss": 0.6167, + "step": 56453 + }, + { + "epoch": 1.45, + "learning_rate": 1.1056695101126704e-06, + "loss": 0.6367, + "step": 56454 + }, + { + "epoch": 1.45, + "learning_rate": 1.1056419945367668e-06, + "loss": 0.6982, + "step": 56455 + }, + { + "epoch": 1.45, + "learning_rate": 1.105614478879978e-06, + "loss": 0.3494, + "step": 56456 + }, + { + "epoch": 1.45, + "learning_rate": 1.1055869631423247e-06, + "loss": 0.7383, + "step": 56457 + }, + { + "epoch": 1.45, + "learning_rate": 1.1055594473238285e-06, + "loss": 0.7461, + "step": 56458 + }, + { + "epoch": 1.45, + "learning_rate": 1.1055319314245104e-06, + "loss": 0.6602, + "step": 56459 + }, + { + "epoch": 1.45, + "learning_rate": 1.105504415444391e-06, + "loss": 0.79, + "step": 56460 + }, + { + "epoch": 1.45, + "learning_rate": 1.1054768993834923e-06, + "loss": 0.6338, + "step": 56461 + }, + { + "epoch": 1.45, + "learning_rate": 1.1054493832418344e-06, + "loss": 0.624, + "step": 56462 + }, + { + "epoch": 1.45, + "learning_rate": 1.1054218670194386e-06, + "loss": 0.6167, + "step": 56463 + }, + { + "epoch": 1.45, + "learning_rate": 1.1053943507163265e-06, + "loss": 0.7227, + "step": 56464 + }, + { + "epoch": 1.45, + "learning_rate": 1.1053668343325185e-06, + "loss": 0.6294, + "step": 56465 + }, + { + "epoch": 1.45, + "learning_rate": 1.1053393178680362e-06, + "loss": 0.6362, + "step": 56466 + }, + { + "epoch": 1.45, + "learning_rate": 1.1053118013229004e-06, + "loss": 0.7896, + "step": 56467 + }, + { + "epoch": 1.45, + "learning_rate": 1.105284284697132e-06, + "loss": 0.614, + "step": 56468 + }, + { + "epoch": 1.45, + "learning_rate": 1.1052567679907522e-06, + "loss": 0.4172, + "step": 56469 + }, + { + "epoch": 1.45, + "learning_rate": 1.105229251203782e-06, + "loss": 0.4801, + "step": 56470 + }, + { + "epoch": 1.45, + "learning_rate": 1.1052017343362435e-06, + "loss": 0.543, + "step": 56471 + }, + { + "epoch": 1.45, + "learning_rate": 1.1051742173881562e-06, + "loss": 0.8379, + "step": 56472 + }, + { + "epoch": 1.45, + "learning_rate": 1.1051467003595418e-06, + "loss": 0.7559, + "step": 56473 + }, + { + "epoch": 1.45, + "learning_rate": 1.1051191832504215e-06, + "loss": 0.5366, + "step": 56474 + }, + { + "epoch": 1.45, + "learning_rate": 1.1050916660608162e-06, + "loss": 0.708, + "step": 56475 + }, + { + "epoch": 1.45, + "learning_rate": 1.1050641487907474e-06, + "loss": 0.6836, + "step": 56476 + }, + { + "epoch": 1.45, + "learning_rate": 1.1050366314402354e-06, + "loss": 0.7637, + "step": 56477 + }, + { + "epoch": 1.45, + "learning_rate": 1.105009114009302e-06, + "loss": 0.6006, + "step": 56478 + }, + { + "epoch": 1.45, + "learning_rate": 1.1049815964979677e-06, + "loss": 0.668, + "step": 56479 + }, + { + "epoch": 1.45, + "learning_rate": 1.1049540789062538e-06, + "loss": 0.4856, + "step": 56480 + }, + { + "epoch": 1.45, + "learning_rate": 1.1049265612341816e-06, + "loss": 0.665, + "step": 56481 + }, + { + "epoch": 1.45, + "learning_rate": 1.1048990434817718e-06, + "loss": 0.5898, + "step": 56482 + }, + { + "epoch": 1.45, + "learning_rate": 1.1048715256490457e-06, + "loss": 0.5728, + "step": 56483 + }, + { + "epoch": 1.45, + "learning_rate": 1.104844007736024e-06, + "loss": 0.645, + "step": 56484 + }, + { + "epoch": 1.45, + "learning_rate": 1.1048164897427287e-06, + "loss": 0.6846, + "step": 56485 + }, + { + "epoch": 1.45, + "learning_rate": 1.1047889716691799e-06, + "loss": 0.6699, + "step": 56486 + }, + { + "epoch": 1.45, + "learning_rate": 1.1047614535153986e-06, + "loss": 0.7446, + "step": 56487 + }, + { + "epoch": 1.45, + "learning_rate": 1.1047339352814067e-06, + "loss": 0.645, + "step": 56488 + }, + { + "epoch": 1.45, + "learning_rate": 1.1047064169672246e-06, + "loss": 0.8428, + "step": 56489 + }, + { + "epoch": 1.45, + "learning_rate": 1.1046788985728739e-06, + "loss": 0.6172, + "step": 56490 + }, + { + "epoch": 1.45, + "learning_rate": 1.1046513800983755e-06, + "loss": 0.5469, + "step": 56491 + }, + { + "epoch": 1.45, + "learning_rate": 1.10462386154375e-06, + "loss": 0.6511, + "step": 56492 + }, + { + "epoch": 1.45, + "learning_rate": 1.1045963429090189e-06, + "loss": 0.8008, + "step": 56493 + }, + { + "epoch": 1.45, + "learning_rate": 1.1045688241942032e-06, + "loss": 0.667, + "step": 56494 + }, + { + "epoch": 1.45, + "learning_rate": 1.1045413053993237e-06, + "loss": 0.6187, + "step": 56495 + }, + { + "epoch": 1.45, + "learning_rate": 1.1045137865244025e-06, + "loss": 0.7109, + "step": 56496 + }, + { + "epoch": 1.45, + "learning_rate": 1.1044862675694592e-06, + "loss": 0.6216, + "step": 56497 + }, + { + "epoch": 1.45, + "learning_rate": 1.1044587485345157e-06, + "loss": 0.6528, + "step": 56498 + }, + { + "epoch": 1.45, + "learning_rate": 1.104431229419593e-06, + "loss": 0.5991, + "step": 56499 + }, + { + "epoch": 1.45, + "learning_rate": 1.1044037102247124e-06, + "loss": 0.7646, + "step": 56500 + }, + { + "epoch": 1.45, + "learning_rate": 1.1043761909498943e-06, + "loss": 0.6465, + "step": 56501 + }, + { + "epoch": 1.45, + "learning_rate": 1.1043486715951605e-06, + "loss": 0.5569, + "step": 56502 + }, + { + "epoch": 1.45, + "learning_rate": 1.1043211521605314e-06, + "loss": 0.6479, + "step": 56503 + }, + { + "epoch": 1.45, + "learning_rate": 1.1042936326460284e-06, + "loss": 0.7061, + "step": 56504 + }, + { + "epoch": 1.45, + "learning_rate": 1.1042661130516724e-06, + "loss": 0.626, + "step": 56505 + }, + { + "epoch": 1.45, + "learning_rate": 1.104238593377485e-06, + "loss": 0.5887, + "step": 56506 + }, + { + "epoch": 1.45, + "learning_rate": 1.104211073623487e-06, + "loss": 0.665, + "step": 56507 + }, + { + "epoch": 1.45, + "learning_rate": 1.104183553789699e-06, + "loss": 0.5913, + "step": 56508 + }, + { + "epoch": 1.45, + "learning_rate": 1.1041560338761425e-06, + "loss": 0.603, + "step": 56509 + }, + { + "epoch": 1.45, + "learning_rate": 1.1041285138828387e-06, + "loss": 0.6504, + "step": 56510 + }, + { + "epoch": 1.45, + "learning_rate": 1.1041009938098084e-06, + "loss": 0.7207, + "step": 56511 + }, + { + "epoch": 1.45, + "learning_rate": 1.1040734736570726e-06, + "loss": 0.5156, + "step": 56512 + }, + { + "epoch": 1.45, + "learning_rate": 1.1040459534246526e-06, + "loss": 0.7041, + "step": 56513 + }, + { + "epoch": 1.45, + "learning_rate": 1.1040184331125694e-06, + "loss": 0.7168, + "step": 56514 + }, + { + "epoch": 1.45, + "learning_rate": 1.1039909127208443e-06, + "loss": 0.6016, + "step": 56515 + }, + { + "epoch": 1.45, + "learning_rate": 1.103963392249498e-06, + "loss": 0.7021, + "step": 56516 + }, + { + "epoch": 1.45, + "learning_rate": 1.1039358716985518e-06, + "loss": 0.5471, + "step": 56517 + }, + { + "epoch": 1.45, + "learning_rate": 1.1039083510680263e-06, + "loss": 0.6567, + "step": 56518 + }, + { + "epoch": 1.45, + "learning_rate": 1.1038808303579435e-06, + "loss": 0.7568, + "step": 56519 + }, + { + "epoch": 1.45, + "learning_rate": 1.1038533095683234e-06, + "loss": 0.8018, + "step": 56520 + }, + { + "epoch": 1.45, + "learning_rate": 1.103825788699188e-06, + "loss": 0.4438, + "step": 56521 + }, + { + "epoch": 1.45, + "learning_rate": 1.1037982677505577e-06, + "loss": 0.6138, + "step": 56522 + }, + { + "epoch": 1.45, + "learning_rate": 1.103770746722454e-06, + "loss": 0.6147, + "step": 56523 + }, + { + "epoch": 1.45, + "learning_rate": 1.1037432256148978e-06, + "loss": 0.604, + "step": 56524 + }, + { + "epoch": 1.45, + "learning_rate": 1.10371570442791e-06, + "loss": 0.7559, + "step": 56525 + }, + { + "epoch": 1.45, + "learning_rate": 1.1036881831615122e-06, + "loss": 0.6504, + "step": 56526 + }, + { + "epoch": 1.45, + "learning_rate": 1.103660661815725e-06, + "loss": 0.6074, + "step": 56527 + }, + { + "epoch": 1.45, + "learning_rate": 1.1036331403905693e-06, + "loss": 0.7148, + "step": 56528 + }, + { + "epoch": 1.45, + "learning_rate": 1.1036056188860667e-06, + "loss": 0.6362, + "step": 56529 + }, + { + "epoch": 1.45, + "learning_rate": 1.1035780973022378e-06, + "loss": 0.6865, + "step": 56530 + }, + { + "epoch": 1.45, + "learning_rate": 1.1035505756391044e-06, + "loss": 0.5837, + "step": 56531 + }, + { + "epoch": 1.45, + "learning_rate": 1.1035230538966868e-06, + "loss": 0.7344, + "step": 56532 + }, + { + "epoch": 1.45, + "learning_rate": 1.1034955320750062e-06, + "loss": 0.71, + "step": 56533 + }, + { + "epoch": 1.45, + "learning_rate": 1.103468010174084e-06, + "loss": 0.4575, + "step": 56534 + }, + { + "epoch": 1.45, + "learning_rate": 1.1034404881939413e-06, + "loss": 0.5784, + "step": 56535 + }, + { + "epoch": 1.45, + "learning_rate": 1.103412966134599e-06, + "loss": 0.6333, + "step": 56536 + }, + { + "epoch": 1.45, + "learning_rate": 1.1033854439960776e-06, + "loss": 0.832, + "step": 56537 + }, + { + "epoch": 1.45, + "learning_rate": 1.1033579217783992e-06, + "loss": 0.5659, + "step": 56538 + }, + { + "epoch": 1.45, + "learning_rate": 1.1033303994815841e-06, + "loss": 0.7041, + "step": 56539 + }, + { + "epoch": 1.45, + "learning_rate": 1.1033028771056539e-06, + "loss": 0.6006, + "step": 56540 + }, + { + "epoch": 1.45, + "learning_rate": 1.1032753546506296e-06, + "loss": 0.5479, + "step": 56541 + }, + { + "epoch": 1.45, + "learning_rate": 1.1032478321165318e-06, + "loss": 0.7539, + "step": 56542 + }, + { + "epoch": 1.45, + "learning_rate": 1.103220309503382e-06, + "loss": 0.6562, + "step": 56543 + }, + { + "epoch": 1.45, + "learning_rate": 1.103192786811201e-06, + "loss": 0.6602, + "step": 56544 + }, + { + "epoch": 1.45, + "learning_rate": 1.1031652640400099e-06, + "loss": 0.4248, + "step": 56545 + }, + { + "epoch": 1.45, + "learning_rate": 1.1031377411898303e-06, + "loss": 0.6362, + "step": 56546 + }, + { + "epoch": 1.45, + "learning_rate": 1.1031102182606825e-06, + "loss": 0.7539, + "step": 56547 + }, + { + "epoch": 1.45, + "learning_rate": 1.1030826952525885e-06, + "loss": 0.8184, + "step": 56548 + }, + { + "epoch": 1.45, + "learning_rate": 1.1030551721655684e-06, + "loss": 0.6245, + "step": 56549 + }, + { + "epoch": 1.45, + "learning_rate": 1.1030276489996437e-06, + "loss": 0.6348, + "step": 56550 + }, + { + "epoch": 1.45, + "learning_rate": 1.1030001257548355e-06, + "loss": 0.5728, + "step": 56551 + }, + { + "epoch": 1.45, + "learning_rate": 1.102972602431165e-06, + "loss": 0.6831, + "step": 56552 + }, + { + "epoch": 1.45, + "learning_rate": 1.1029450790286528e-06, + "loss": 0.6719, + "step": 56553 + }, + { + "epoch": 1.45, + "learning_rate": 1.1029175555473204e-06, + "loss": 0.6768, + "step": 56554 + }, + { + "epoch": 1.45, + "learning_rate": 1.1028900319871887e-06, + "loss": 0.7285, + "step": 56555 + }, + { + "epoch": 1.45, + "learning_rate": 1.1028625083482792e-06, + "loss": 0.6777, + "step": 56556 + }, + { + "epoch": 1.45, + "learning_rate": 1.1028349846306123e-06, + "loss": 0.6387, + "step": 56557 + }, + { + "epoch": 1.45, + "learning_rate": 1.1028074608342093e-06, + "loss": 0.6328, + "step": 56558 + }, + { + "epoch": 1.45, + "learning_rate": 1.1027799369590915e-06, + "loss": 0.5278, + "step": 56559 + }, + { + "epoch": 1.45, + "learning_rate": 1.1027524130052799e-06, + "loss": 0.5601, + "step": 56560 + }, + { + "epoch": 1.45, + "learning_rate": 1.1027248889727956e-06, + "loss": 0.6846, + "step": 56561 + }, + { + "epoch": 1.45, + "learning_rate": 1.1026973648616593e-06, + "loss": 0.6277, + "step": 56562 + }, + { + "epoch": 1.45, + "learning_rate": 1.1026698406718927e-06, + "loss": 0.4536, + "step": 56563 + }, + { + "epoch": 1.45, + "learning_rate": 1.102642316403516e-06, + "loss": 0.5352, + "step": 56564 + }, + { + "epoch": 1.45, + "learning_rate": 1.1026147920565512e-06, + "loss": 0.8076, + "step": 56565 + }, + { + "epoch": 1.45, + "learning_rate": 1.102587267631019e-06, + "loss": 0.5332, + "step": 56566 + }, + { + "epoch": 1.45, + "learning_rate": 1.1025597431269402e-06, + "loss": 0.6172, + "step": 56567 + }, + { + "epoch": 1.45, + "learning_rate": 1.1025322185443362e-06, + "loss": 0.5342, + "step": 56568 + }, + { + "epoch": 1.45, + "learning_rate": 1.1025046938832282e-06, + "loss": 0.6729, + "step": 56569 + }, + { + "epoch": 1.45, + "learning_rate": 1.1024771691436366e-06, + "loss": 0.6685, + "step": 56570 + }, + { + "epoch": 1.45, + "learning_rate": 1.1024496443255835e-06, + "loss": 0.6455, + "step": 56571 + }, + { + "epoch": 1.45, + "learning_rate": 1.102422119429089e-06, + "loss": 0.458, + "step": 56572 + }, + { + "epoch": 1.45, + "learning_rate": 1.1023945944541747e-06, + "loss": 0.4507, + "step": 56573 + }, + { + "epoch": 1.45, + "learning_rate": 1.1023670694008616e-06, + "loss": 0.5264, + "step": 56574 + }, + { + "epoch": 1.45, + "learning_rate": 1.1023395442691707e-06, + "loss": 0.6709, + "step": 56575 + }, + { + "epoch": 1.45, + "learning_rate": 1.1023120190591232e-06, + "loss": 0.7988, + "step": 56576 + }, + { + "epoch": 1.45, + "learning_rate": 1.10228449377074e-06, + "loss": 0.6143, + "step": 56577 + }, + { + "epoch": 1.45, + "learning_rate": 1.1022569684040423e-06, + "loss": 0.6001, + "step": 56578 + }, + { + "epoch": 1.45, + "learning_rate": 1.102229442959051e-06, + "loss": 0.6233, + "step": 56579 + }, + { + "epoch": 1.45, + "learning_rate": 1.1022019174357877e-06, + "loss": 0.6689, + "step": 56580 + }, + { + "epoch": 1.45, + "learning_rate": 1.102174391834273e-06, + "loss": 0.3196, + "step": 56581 + }, + { + "epoch": 1.45, + "learning_rate": 1.102146866154528e-06, + "loss": 0.6592, + "step": 56582 + }, + { + "epoch": 1.45, + "learning_rate": 1.1021193403965737e-06, + "loss": 0.6851, + "step": 56583 + }, + { + "epoch": 1.45, + "learning_rate": 1.1020918145604313e-06, + "loss": 0.5137, + "step": 56584 + }, + { + "epoch": 1.45, + "learning_rate": 1.102064288646122e-06, + "loss": 0.6709, + "step": 56585 + }, + { + "epoch": 1.45, + "learning_rate": 1.102036762653667e-06, + "loss": 0.7402, + "step": 56586 + }, + { + "epoch": 1.45, + "learning_rate": 1.1020092365830867e-06, + "loss": 0.5933, + "step": 56587 + }, + { + "epoch": 1.45, + "learning_rate": 1.1019817104344027e-06, + "loss": 0.5391, + "step": 56588 + }, + { + "epoch": 1.45, + "learning_rate": 1.1019541842076362e-06, + "loss": 0.6177, + "step": 56589 + }, + { + "epoch": 1.45, + "learning_rate": 1.1019266579028082e-06, + "loss": 0.6763, + "step": 56590 + }, + { + "epoch": 1.45, + "learning_rate": 1.1018991315199392e-06, + "loss": 0.6611, + "step": 56591 + }, + { + "epoch": 1.45, + "learning_rate": 1.1018716050590511e-06, + "loss": 0.6963, + "step": 56592 + }, + { + "epoch": 1.45, + "learning_rate": 1.1018440785201642e-06, + "loss": 0.6162, + "step": 56593 + }, + { + "epoch": 1.45, + "learning_rate": 1.1018165519033003e-06, + "loss": 0.7451, + "step": 56594 + }, + { + "epoch": 1.45, + "learning_rate": 1.10178902520848e-06, + "loss": 0.6963, + "step": 56595 + }, + { + "epoch": 1.45, + "learning_rate": 1.1017614984357246e-06, + "loss": 0.483, + "step": 56596 + }, + { + "epoch": 1.45, + "learning_rate": 1.101733971585055e-06, + "loss": 0.6191, + "step": 56597 + }, + { + "epoch": 1.45, + "learning_rate": 1.1017064446564925e-06, + "loss": 0.6934, + "step": 56598 + }, + { + "epoch": 1.45, + "learning_rate": 1.101678917650058e-06, + "loss": 0.6914, + "step": 56599 + }, + { + "epoch": 1.45, + "learning_rate": 1.1016513905657727e-06, + "loss": 0.5852, + "step": 56600 + }, + { + "epoch": 1.45, + "learning_rate": 1.1016238634036576e-06, + "loss": 0.7051, + "step": 56601 + }, + { + "epoch": 1.45, + "learning_rate": 1.1015963361637334e-06, + "loss": 0.5098, + "step": 56602 + }, + { + "epoch": 1.45, + "learning_rate": 1.1015688088460221e-06, + "loss": 0.4705, + "step": 56603 + }, + { + "epoch": 1.45, + "learning_rate": 1.101541281450544e-06, + "loss": 0.4229, + "step": 56604 + }, + { + "epoch": 1.45, + "learning_rate": 1.1015137539773208e-06, + "loss": 0.666, + "step": 56605 + }, + { + "epoch": 1.45, + "learning_rate": 1.1014862264263724e-06, + "loss": 0.6196, + "step": 56606 + }, + { + "epoch": 1.45, + "learning_rate": 1.1014586987977213e-06, + "loss": 0.7593, + "step": 56607 + }, + { + "epoch": 1.45, + "learning_rate": 1.1014311710913875e-06, + "loss": 0.6187, + "step": 56608 + }, + { + "epoch": 1.45, + "learning_rate": 1.1014036433073928e-06, + "loss": 0.5039, + "step": 56609 + }, + { + "epoch": 1.45, + "learning_rate": 1.1013761154457579e-06, + "loss": 0.7217, + "step": 56610 + }, + { + "epoch": 1.45, + "learning_rate": 1.101348587506504e-06, + "loss": 0.748, + "step": 56611 + }, + { + "epoch": 1.45, + "learning_rate": 1.101321059489652e-06, + "loss": 0.6333, + "step": 56612 + }, + { + "epoch": 1.45, + "learning_rate": 1.1012935313952233e-06, + "loss": 0.6177, + "step": 56613 + }, + { + "epoch": 1.45, + "learning_rate": 1.1012660032232389e-06, + "loss": 0.7764, + "step": 56614 + }, + { + "epoch": 1.45, + "learning_rate": 1.1012384749737198e-06, + "loss": 0.561, + "step": 56615 + }, + { + "epoch": 1.45, + "learning_rate": 1.1012109466466868e-06, + "loss": 0.7354, + "step": 56616 + }, + { + "epoch": 1.45, + "learning_rate": 1.1011834182421613e-06, + "loss": 0.7598, + "step": 56617 + }, + { + "epoch": 1.45, + "learning_rate": 1.1011558897601643e-06, + "loss": 0.8389, + "step": 56618 + }, + { + "epoch": 1.45, + "learning_rate": 1.101128361200717e-06, + "loss": 0.8037, + "step": 56619 + }, + { + "epoch": 1.45, + "learning_rate": 1.1011008325638402e-06, + "loss": 0.5759, + "step": 56620 + }, + { + "epoch": 1.45, + "learning_rate": 1.1010733038495552e-06, + "loss": 0.6973, + "step": 56621 + }, + { + "epoch": 1.45, + "learning_rate": 1.101045775057883e-06, + "loss": 0.6167, + "step": 56622 + }, + { + "epoch": 1.45, + "learning_rate": 1.1010182461888446e-06, + "loss": 0.6406, + "step": 56623 + }, + { + "epoch": 1.45, + "learning_rate": 1.1009907172424615e-06, + "loss": 0.4915, + "step": 56624 + }, + { + "epoch": 1.45, + "learning_rate": 1.1009631882187543e-06, + "loss": 0.5762, + "step": 56625 + }, + { + "epoch": 1.45, + "learning_rate": 1.1009356591177441e-06, + "loss": 0.708, + "step": 56626 + }, + { + "epoch": 1.45, + "learning_rate": 1.1009081299394524e-06, + "loss": 0.4434, + "step": 56627 + }, + { + "epoch": 1.45, + "learning_rate": 1.1008806006838995e-06, + "loss": 0.6699, + "step": 56628 + }, + { + "epoch": 1.45, + "learning_rate": 1.1008530713511073e-06, + "loss": 0.5122, + "step": 56629 + }, + { + "epoch": 1.45, + "learning_rate": 1.1008255419410967e-06, + "loss": 0.6191, + "step": 56630 + }, + { + "epoch": 1.45, + "learning_rate": 1.1007980124538882e-06, + "loss": 0.5195, + "step": 56631 + }, + { + "epoch": 1.45, + "learning_rate": 1.1007704828895038e-06, + "loss": 0.6558, + "step": 56632 + }, + { + "epoch": 1.45, + "learning_rate": 1.1007429532479636e-06, + "loss": 0.4116, + "step": 56633 + }, + { + "epoch": 1.45, + "learning_rate": 1.1007154235292893e-06, + "loss": 0.5103, + "step": 56634 + }, + { + "epoch": 1.45, + "learning_rate": 1.100687893733502e-06, + "loss": 0.7344, + "step": 56635 + }, + { + "epoch": 1.45, + "learning_rate": 1.1006603638606225e-06, + "loss": 0.7012, + "step": 56636 + }, + { + "epoch": 1.45, + "learning_rate": 1.1006328339106719e-06, + "loss": 0.6414, + "step": 56637 + }, + { + "epoch": 1.45, + "learning_rate": 1.1006053038836713e-06, + "loss": 0.5527, + "step": 56638 + }, + { + "epoch": 1.45, + "learning_rate": 1.100577773779642e-06, + "loss": 0.7227, + "step": 56639 + }, + { + "epoch": 1.45, + "learning_rate": 1.1005502435986049e-06, + "loss": 0.4365, + "step": 56640 + }, + { + "epoch": 1.45, + "learning_rate": 1.1005227133405812e-06, + "loss": 0.6777, + "step": 56641 + }, + { + "epoch": 1.45, + "learning_rate": 1.1004951830055918e-06, + "loss": 0.6782, + "step": 56642 + }, + { + "epoch": 1.45, + "learning_rate": 1.1004676525936575e-06, + "loss": 0.2974, + "step": 56643 + }, + { + "epoch": 1.45, + "learning_rate": 1.1004401221048004e-06, + "loss": 0.5361, + "step": 56644 + }, + { + "epoch": 1.45, + "learning_rate": 1.1004125915390405e-06, + "loss": 0.5715, + "step": 56645 + }, + { + "epoch": 1.45, + "learning_rate": 1.1003850608963994e-06, + "loss": 0.752, + "step": 56646 + }, + { + "epoch": 1.45, + "learning_rate": 1.1003575301768981e-06, + "loss": 0.7012, + "step": 56647 + }, + { + "epoch": 1.45, + "learning_rate": 1.1003299993805575e-06, + "loss": 0.6572, + "step": 56648 + }, + { + "epoch": 1.45, + "learning_rate": 1.100302468507399e-06, + "loss": 0.5986, + "step": 56649 + }, + { + "epoch": 1.45, + "learning_rate": 1.1002749375574433e-06, + "loss": 0.707, + "step": 56650 + }, + { + "epoch": 1.45, + "learning_rate": 1.1002474065307122e-06, + "loss": 0.5713, + "step": 56651 + }, + { + "epoch": 1.45, + "learning_rate": 1.1002198754272257e-06, + "loss": 0.595, + "step": 56652 + }, + { + "epoch": 1.45, + "learning_rate": 1.1001923442470059e-06, + "loss": 0.6543, + "step": 56653 + }, + { + "epoch": 1.45, + "learning_rate": 1.100164812990073e-06, + "loss": 0.54, + "step": 56654 + }, + { + "epoch": 1.45, + "learning_rate": 1.100137281656449e-06, + "loss": 0.6484, + "step": 56655 + }, + { + "epoch": 1.45, + "learning_rate": 1.100109750246154e-06, + "loss": 0.5527, + "step": 56656 + }, + { + "epoch": 1.45, + "learning_rate": 1.1000822187592098e-06, + "loss": 0.7207, + "step": 56657 + }, + { + "epoch": 1.45, + "learning_rate": 1.1000546871956372e-06, + "loss": 0.7158, + "step": 56658 + }, + { + "epoch": 1.45, + "learning_rate": 1.1000271555554573e-06, + "loss": 0.7422, + "step": 56659 + }, + { + "epoch": 1.45, + "learning_rate": 1.0999996238386912e-06, + "loss": 0.6997, + "step": 56660 + }, + { + "epoch": 1.45, + "learning_rate": 1.0999720920453601e-06, + "loss": 0.6924, + "step": 56661 + }, + { + "epoch": 1.45, + "learning_rate": 1.0999445601754848e-06, + "loss": 0.5986, + "step": 56662 + }, + { + "epoch": 1.45, + "learning_rate": 1.0999170282290868e-06, + "loss": 0.6523, + "step": 56663 + }, + { + "epoch": 1.45, + "learning_rate": 1.0998894962061867e-06, + "loss": 0.6035, + "step": 56664 + }, + { + "epoch": 1.45, + "learning_rate": 1.099861964106806e-06, + "loss": 0.4531, + "step": 56665 + }, + { + "epoch": 1.45, + "learning_rate": 1.0998344319309653e-06, + "loss": 0.5991, + "step": 56666 + }, + { + "epoch": 1.45, + "learning_rate": 1.099806899678686e-06, + "loss": 0.6914, + "step": 56667 + }, + { + "epoch": 1.45, + "learning_rate": 1.0997793673499894e-06, + "loss": 0.3951, + "step": 56668 + }, + { + "epoch": 1.45, + "learning_rate": 1.099751834944896e-06, + "loss": 0.6123, + "step": 56669 + }, + { + "epoch": 1.45, + "learning_rate": 1.0997243024634277e-06, + "loss": 0.5977, + "step": 56670 + }, + { + "epoch": 1.45, + "learning_rate": 1.0996967699056045e-06, + "loss": 0.6592, + "step": 56671 + }, + { + "epoch": 1.45, + "learning_rate": 1.0996692372714486e-06, + "loss": 0.6436, + "step": 56672 + }, + { + "epoch": 1.45, + "learning_rate": 1.09964170456098e-06, + "loss": 0.7129, + "step": 56673 + }, + { + "epoch": 1.45, + "learning_rate": 1.0996141717742208e-06, + "loss": 0.7407, + "step": 56674 + }, + { + "epoch": 1.45, + "learning_rate": 1.0995866389111917e-06, + "loss": 0.6309, + "step": 56675 + }, + { + "epoch": 1.45, + "learning_rate": 1.0995591059719134e-06, + "loss": 0.5547, + "step": 56676 + }, + { + "epoch": 1.45, + "learning_rate": 1.0995315729564071e-06, + "loss": 0.6196, + "step": 56677 + }, + { + "epoch": 1.45, + "learning_rate": 1.0995040398646944e-06, + "loss": 0.7012, + "step": 56678 + }, + { + "epoch": 1.45, + "learning_rate": 1.0994765066967957e-06, + "loss": 0.6104, + "step": 56679 + }, + { + "epoch": 1.45, + "learning_rate": 1.0994489734527329e-06, + "loss": 0.5745, + "step": 56680 + }, + { + "epoch": 1.45, + "learning_rate": 1.0994214401325262e-06, + "loss": 0.5231, + "step": 56681 + }, + { + "epoch": 1.45, + "learning_rate": 1.0993939067361973e-06, + "loss": 0.5986, + "step": 56682 + }, + { + "epoch": 1.45, + "learning_rate": 1.0993663732637666e-06, + "loss": 0.5654, + "step": 56683 + }, + { + "epoch": 1.45, + "learning_rate": 1.0993388397152562e-06, + "loss": 0.6284, + "step": 56684 + }, + { + "epoch": 1.45, + "learning_rate": 1.0993113060906865e-06, + "loss": 0.7295, + "step": 56685 + }, + { + "epoch": 1.45, + "learning_rate": 1.0992837723900784e-06, + "loss": 0.6416, + "step": 56686 + }, + { + "epoch": 1.45, + "learning_rate": 1.0992562386134533e-06, + "loss": 0.8086, + "step": 56687 + }, + { + "epoch": 1.45, + "learning_rate": 1.0992287047608327e-06, + "loss": 0.6133, + "step": 56688 + }, + { + "epoch": 1.45, + "learning_rate": 1.0992011708322366e-06, + "loss": 0.8076, + "step": 56689 + }, + { + "epoch": 1.45, + "learning_rate": 1.0991736368276874e-06, + "loss": 0.6313, + "step": 56690 + }, + { + "epoch": 1.45, + "learning_rate": 1.0991461027472052e-06, + "loss": 0.6992, + "step": 56691 + }, + { + "epoch": 1.45, + "learning_rate": 1.099118568590811e-06, + "loss": 0.6836, + "step": 56692 + }, + { + "epoch": 1.45, + "learning_rate": 1.0990910343585269e-06, + "loss": 0.6104, + "step": 56693 + }, + { + "epoch": 1.45, + "learning_rate": 1.099063500050373e-06, + "loss": 0.6245, + "step": 56694 + }, + { + "epoch": 1.45, + "learning_rate": 1.099035965666371e-06, + "loss": 0.6108, + "step": 56695 + }, + { + "epoch": 1.45, + "learning_rate": 1.0990084312065415e-06, + "loss": 0.5784, + "step": 56696 + }, + { + "epoch": 1.45, + "learning_rate": 1.098980896670906e-06, + "loss": 0.6504, + "step": 56697 + }, + { + "epoch": 1.45, + "learning_rate": 1.098953362059485e-06, + "loss": 0.6094, + "step": 56698 + }, + { + "epoch": 1.45, + "learning_rate": 1.0989258273723004e-06, + "loss": 0.5684, + "step": 56699 + }, + { + "epoch": 1.45, + "learning_rate": 1.0988982926093726e-06, + "loss": 0.7168, + "step": 56700 + }, + { + "epoch": 1.45, + "learning_rate": 1.098870757770723e-06, + "loss": 0.5254, + "step": 56701 + }, + { + "epoch": 1.45, + "learning_rate": 1.0988432228563724e-06, + "loss": 0.7627, + "step": 56702 + }, + { + "epoch": 1.45, + "learning_rate": 1.0988156878663423e-06, + "loss": 0.5981, + "step": 56703 + }, + { + "epoch": 1.45, + "learning_rate": 1.0987881528006534e-06, + "loss": 0.6602, + "step": 56704 + }, + { + "epoch": 1.45, + "learning_rate": 1.0987606176593274e-06, + "loss": 0.7236, + "step": 56705 + }, + { + "epoch": 1.45, + "learning_rate": 1.0987330824423847e-06, + "loss": 0.8428, + "step": 56706 + }, + { + "epoch": 1.45, + "learning_rate": 1.0987055471498463e-06, + "loss": 0.4424, + "step": 56707 + }, + { + "epoch": 1.45, + "learning_rate": 1.0986780117817338e-06, + "loss": 0.8184, + "step": 56708 + }, + { + "epoch": 1.45, + "learning_rate": 1.098650476338068e-06, + "loss": 0.6484, + "step": 56709 + }, + { + "epoch": 1.45, + "learning_rate": 1.0986229408188705e-06, + "loss": 0.4733, + "step": 56710 + }, + { + "epoch": 1.45, + "learning_rate": 1.0985954052241615e-06, + "loss": 0.6626, + "step": 56711 + }, + { + "epoch": 1.45, + "learning_rate": 1.0985678695539627e-06, + "loss": 0.6514, + "step": 56712 + }, + { + "epoch": 1.45, + "learning_rate": 1.0985403338082948e-06, + "loss": 0.7246, + "step": 56713 + }, + { + "epoch": 1.45, + "learning_rate": 1.0985127979871793e-06, + "loss": 0.5447, + "step": 56714 + }, + { + "epoch": 1.45, + "learning_rate": 1.0984852620906372e-06, + "loss": 0.5869, + "step": 56715 + }, + { + "epoch": 1.45, + "learning_rate": 1.0984577261186893e-06, + "loss": 0.7363, + "step": 56716 + }, + { + "epoch": 1.45, + "learning_rate": 1.0984301900713568e-06, + "loss": 0.4236, + "step": 56717 + }, + { + "epoch": 1.45, + "learning_rate": 1.0984026539486612e-06, + "loss": 0.7334, + "step": 56718 + }, + { + "epoch": 1.45, + "learning_rate": 1.0983751177506224e-06, + "loss": 0.7065, + "step": 56719 + }, + { + "epoch": 1.45, + "learning_rate": 1.098347581477263e-06, + "loss": 0.6074, + "step": 56720 + }, + { + "epoch": 1.45, + "learning_rate": 1.0983200451286032e-06, + "loss": 0.605, + "step": 56721 + }, + { + "epoch": 1.45, + "learning_rate": 1.0982925087046644e-06, + "loss": 0.5889, + "step": 56722 + }, + { + "epoch": 1.45, + "learning_rate": 1.0982649722054672e-06, + "loss": 0.7549, + "step": 56723 + }, + { + "epoch": 1.45, + "learning_rate": 1.0982374356310333e-06, + "loss": 0.7979, + "step": 56724 + }, + { + "epoch": 1.45, + "learning_rate": 1.0982098989813834e-06, + "loss": 0.6592, + "step": 56725 + }, + { + "epoch": 1.45, + "learning_rate": 1.0981823622565389e-06, + "loss": 0.6992, + "step": 56726 + }, + { + "epoch": 1.45, + "learning_rate": 1.0981548254565205e-06, + "loss": 0.8091, + "step": 56727 + }, + { + "epoch": 1.45, + "learning_rate": 1.0981272885813494e-06, + "loss": 0.5894, + "step": 56728 + }, + { + "epoch": 1.45, + "learning_rate": 1.0980997516310467e-06, + "loss": 0.7158, + "step": 56729 + }, + { + "epoch": 1.45, + "learning_rate": 1.0980722146056338e-06, + "loss": 0.7471, + "step": 56730 + }, + { + "epoch": 1.45, + "learning_rate": 1.0980446775051314e-06, + "loss": 0.5647, + "step": 56731 + }, + { + "epoch": 1.45, + "learning_rate": 1.0980171403295609e-06, + "loss": 0.6719, + "step": 56732 + }, + { + "epoch": 1.45, + "learning_rate": 1.0979896030789426e-06, + "loss": 0.5535, + "step": 56733 + }, + { + "epoch": 1.45, + "learning_rate": 1.0979620657532986e-06, + "loss": 0.5576, + "step": 56734 + }, + { + "epoch": 1.45, + "learning_rate": 1.0979345283526495e-06, + "loss": 0.5015, + "step": 56735 + }, + { + "epoch": 1.45, + "learning_rate": 1.0979069908770163e-06, + "loss": 0.6304, + "step": 56736 + }, + { + "epoch": 1.45, + "learning_rate": 1.0978794533264205e-06, + "loss": 0.6019, + "step": 56737 + }, + { + "epoch": 1.45, + "learning_rate": 1.0978519157008826e-06, + "loss": 0.4805, + "step": 56738 + }, + { + "epoch": 1.45, + "learning_rate": 1.097824378000424e-06, + "loss": 0.6025, + "step": 56739 + }, + { + "epoch": 1.45, + "learning_rate": 1.0977968402250658e-06, + "loss": 0.7637, + "step": 56740 + }, + { + "epoch": 1.45, + "learning_rate": 1.0977693023748294e-06, + "loss": 0.8003, + "step": 56741 + }, + { + "epoch": 1.45, + "learning_rate": 1.097741764449735e-06, + "loss": 0.8115, + "step": 56742 + }, + { + "epoch": 1.45, + "learning_rate": 1.0977142264498048e-06, + "loss": 0.7285, + "step": 56743 + }, + { + "epoch": 1.45, + "learning_rate": 1.0976866883750589e-06, + "loss": 0.749, + "step": 56744 + }, + { + "epoch": 1.45, + "learning_rate": 1.097659150225519e-06, + "loss": 0.8984, + "step": 56745 + }, + { + "epoch": 1.45, + "learning_rate": 1.097631612001206e-06, + "loss": 0.5142, + "step": 56746 + }, + { + "epoch": 1.45, + "learning_rate": 1.097604073702141e-06, + "loss": 0.6216, + "step": 56747 + }, + { + "epoch": 1.45, + "learning_rate": 1.0975765353283447e-06, + "loss": 0.5035, + "step": 56748 + }, + { + "epoch": 1.45, + "learning_rate": 1.0975489968798387e-06, + "loss": 0.6621, + "step": 56749 + }, + { + "epoch": 1.45, + "learning_rate": 1.0975214583566438e-06, + "loss": 0.5767, + "step": 56750 + }, + { + "epoch": 1.45, + "learning_rate": 1.0974939197587816e-06, + "loss": 0.6211, + "step": 56751 + }, + { + "epoch": 1.45, + "learning_rate": 1.0974663810862724e-06, + "loss": 0.6016, + "step": 56752 + }, + { + "epoch": 1.45, + "learning_rate": 1.097438842339138e-06, + "loss": 0.5576, + "step": 56753 + }, + { + "epoch": 1.45, + "learning_rate": 1.0974113035173987e-06, + "loss": 0.5081, + "step": 56754 + }, + { + "epoch": 1.45, + "learning_rate": 1.0973837646210764e-06, + "loss": 0.4861, + "step": 56755 + }, + { + "epoch": 1.45, + "learning_rate": 1.0973562256501918e-06, + "loss": 0.6514, + "step": 56756 + }, + { + "epoch": 1.45, + "learning_rate": 1.0973286866047658e-06, + "loss": 0.5967, + "step": 56757 + }, + { + "epoch": 1.45, + "learning_rate": 1.09730114748482e-06, + "loss": 0.5308, + "step": 56758 + }, + { + "epoch": 1.45, + "learning_rate": 1.0972736082903748e-06, + "loss": 0.6289, + "step": 56759 + }, + { + "epoch": 1.45, + "learning_rate": 1.0972460690214522e-06, + "loss": 0.751, + "step": 56760 + }, + { + "epoch": 1.45, + "learning_rate": 1.0972185296780724e-06, + "loss": 0.665, + "step": 56761 + }, + { + "epoch": 1.45, + "learning_rate": 1.097190990260257e-06, + "loss": 0.7583, + "step": 56762 + }, + { + "epoch": 1.45, + "learning_rate": 1.0971634507680268e-06, + "loss": 0.6885, + "step": 56763 + }, + { + "epoch": 1.45, + "learning_rate": 1.0971359112014028e-06, + "loss": 0.5957, + "step": 56764 + }, + { + "epoch": 1.45, + "learning_rate": 1.0971083715604068e-06, + "loss": 0.6855, + "step": 56765 + }, + { + "epoch": 1.45, + "learning_rate": 1.0970808318450592e-06, + "loss": 0.9736, + "step": 56766 + }, + { + "epoch": 1.45, + "learning_rate": 1.0970532920553812e-06, + "loss": 0.6663, + "step": 56767 + }, + { + "epoch": 1.45, + "learning_rate": 1.097025752191394e-06, + "loss": 0.7373, + "step": 56768 + }, + { + "epoch": 1.46, + "learning_rate": 1.0969982122531186e-06, + "loss": 0.7295, + "step": 56769 + }, + { + "epoch": 1.46, + "learning_rate": 1.0969706722405762e-06, + "loss": 0.6836, + "step": 56770 + }, + { + "epoch": 1.46, + "learning_rate": 1.0969431321537877e-06, + "loss": 0.7231, + "step": 56771 + }, + { + "epoch": 1.46, + "learning_rate": 1.0969155919927744e-06, + "loss": 0.5112, + "step": 56772 + }, + { + "epoch": 1.46, + "learning_rate": 1.0968880517575573e-06, + "loss": 0.6279, + "step": 56773 + }, + { + "epoch": 1.46, + "learning_rate": 1.0968605114481573e-06, + "loss": 0.6284, + "step": 56774 + }, + { + "epoch": 1.46, + "learning_rate": 1.0968329710645959e-06, + "loss": 0.5999, + "step": 56775 + }, + { + "epoch": 1.46, + "learning_rate": 1.0968054306068936e-06, + "loss": 0.6533, + "step": 56776 + }, + { + "epoch": 1.46, + "learning_rate": 1.0967778900750722e-06, + "loss": 0.665, + "step": 56777 + }, + { + "epoch": 1.46, + "learning_rate": 1.0967503494691523e-06, + "loss": 0.7852, + "step": 56778 + }, + { + "epoch": 1.46, + "learning_rate": 1.096722808789155e-06, + "loss": 0.543, + "step": 56779 + }, + { + "epoch": 1.46, + "learning_rate": 1.0966952680351017e-06, + "loss": 0.583, + "step": 56780 + }, + { + "epoch": 1.46, + "learning_rate": 1.096667727207013e-06, + "loss": 0.7451, + "step": 56781 + }, + { + "epoch": 1.46, + "learning_rate": 1.0966401863049104e-06, + "loss": 0.6592, + "step": 56782 + }, + { + "epoch": 1.46, + "learning_rate": 1.0966126453288148e-06, + "loss": 0.4889, + "step": 56783 + }, + { + "epoch": 1.46, + "learning_rate": 1.0965851042787475e-06, + "loss": 0.5464, + "step": 56784 + }, + { + "epoch": 1.46, + "learning_rate": 1.0965575631547298e-06, + "loss": 0.6841, + "step": 56785 + }, + { + "epoch": 1.46, + "learning_rate": 1.0965300219567817e-06, + "loss": 0.4351, + "step": 56786 + }, + { + "epoch": 1.46, + "learning_rate": 1.0965024806849251e-06, + "loss": 0.644, + "step": 56787 + }, + { + "epoch": 1.46, + "learning_rate": 1.0964749393391813e-06, + "loss": 0.7676, + "step": 56788 + }, + { + "epoch": 1.46, + "learning_rate": 1.0964473979195708e-06, + "loss": 0.6128, + "step": 56789 + }, + { + "epoch": 1.46, + "learning_rate": 1.0964198564261152e-06, + "loss": 0.6831, + "step": 56790 + }, + { + "epoch": 1.46, + "learning_rate": 1.0963923148588351e-06, + "loss": 0.6558, + "step": 56791 + }, + { + "epoch": 1.46, + "learning_rate": 1.096364773217752e-06, + "loss": 0.626, + "step": 56792 + }, + { + "epoch": 1.46, + "learning_rate": 1.096337231502887e-06, + "loss": 0.7285, + "step": 56793 + }, + { + "epoch": 1.46, + "learning_rate": 1.0963096897142606e-06, + "loss": 0.6313, + "step": 56794 + }, + { + "epoch": 1.46, + "learning_rate": 1.0962821478518946e-06, + "loss": 0.511, + "step": 56795 + }, + { + "epoch": 1.46, + "learning_rate": 1.0962546059158097e-06, + "loss": 0.7656, + "step": 56796 + }, + { + "epoch": 1.46, + "learning_rate": 1.096227063906027e-06, + "loss": 0.6699, + "step": 56797 + }, + { + "epoch": 1.46, + "learning_rate": 1.0961995218225677e-06, + "loss": 0.6885, + "step": 56798 + }, + { + "epoch": 1.46, + "learning_rate": 1.0961719796654529e-06, + "loss": 0.5815, + "step": 56799 + }, + { + "epoch": 1.46, + "learning_rate": 1.0961444374347038e-06, + "loss": 0.626, + "step": 56800 + }, + { + "epoch": 1.46, + "learning_rate": 1.096116895130341e-06, + "loss": 0.5811, + "step": 56801 + }, + { + "epoch": 1.46, + "learning_rate": 1.096089352752386e-06, + "loss": 0.4661, + "step": 56802 + }, + { + "epoch": 1.46, + "learning_rate": 1.0960618103008599e-06, + "loss": 0.707, + "step": 56803 + }, + { + "epoch": 1.46, + "learning_rate": 1.0960342677757836e-06, + "loss": 0.6045, + "step": 56804 + }, + { + "epoch": 1.46, + "learning_rate": 1.0960067251771782e-06, + "loss": 0.8018, + "step": 56805 + }, + { + "epoch": 1.46, + "learning_rate": 1.0959791825050653e-06, + "loss": 0.5312, + "step": 56806 + }, + { + "epoch": 1.46, + "learning_rate": 1.095951639759465e-06, + "loss": 0.5903, + "step": 56807 + }, + { + "epoch": 1.46, + "learning_rate": 1.0959240969403994e-06, + "loss": 0.5641, + "step": 56808 + }, + { + "epoch": 1.46, + "learning_rate": 1.0958965540478887e-06, + "loss": 0.6401, + "step": 56809 + }, + { + "epoch": 1.46, + "learning_rate": 1.0958690110819548e-06, + "loss": 0.6313, + "step": 56810 + }, + { + "epoch": 1.46, + "learning_rate": 1.0958414680426183e-06, + "loss": 0.709, + "step": 56811 + }, + { + "epoch": 1.46, + "learning_rate": 1.0958139249299004e-06, + "loss": 0.5229, + "step": 56812 + }, + { + "epoch": 1.46, + "learning_rate": 1.0957863817438218e-06, + "loss": 0.6099, + "step": 56813 + }, + { + "epoch": 1.46, + "learning_rate": 1.0957588384844043e-06, + "loss": 0.7412, + "step": 56814 + }, + { + "epoch": 1.46, + "learning_rate": 1.095731295151669e-06, + "loss": 0.4451, + "step": 56815 + }, + { + "epoch": 1.46, + "learning_rate": 1.0957037517456362e-06, + "loss": 0.7109, + "step": 56816 + }, + { + "epoch": 1.46, + "learning_rate": 1.0956762082663273e-06, + "loss": 0.4841, + "step": 56817 + }, + { + "epoch": 1.46, + "learning_rate": 1.095648664713764e-06, + "loss": 0.6768, + "step": 56818 + }, + { + "epoch": 1.46, + "learning_rate": 1.0956211210879665e-06, + "loss": 0.5889, + "step": 56819 + }, + { + "epoch": 1.46, + "learning_rate": 1.0955935773889565e-06, + "loss": 0.7236, + "step": 56820 + }, + { + "epoch": 1.46, + "learning_rate": 1.0955660336167548e-06, + "loss": 0.6562, + "step": 56821 + }, + { + "epoch": 1.46, + "learning_rate": 1.0955384897713826e-06, + "loss": 0.7305, + "step": 56822 + }, + { + "epoch": 1.46, + "learning_rate": 1.095510945852861e-06, + "loss": 0.4229, + "step": 56823 + }, + { + "epoch": 1.46, + "learning_rate": 1.0954834018612112e-06, + "loss": 0.5901, + "step": 56824 + }, + { + "epoch": 1.46, + "learning_rate": 1.095455857796454e-06, + "loss": 0.708, + "step": 56825 + }, + { + "epoch": 1.46, + "learning_rate": 1.0954283136586107e-06, + "loss": 0.6211, + "step": 56826 + }, + { + "epoch": 1.46, + "learning_rate": 1.0954007694477023e-06, + "loss": 0.5664, + "step": 56827 + }, + { + "epoch": 1.46, + "learning_rate": 1.0953732251637498e-06, + "loss": 0.5469, + "step": 56828 + }, + { + "epoch": 1.46, + "learning_rate": 1.0953456808067748e-06, + "loss": 0.6465, + "step": 56829 + }, + { + "epoch": 1.46, + "learning_rate": 1.0953181363767976e-06, + "loss": 0.6187, + "step": 56830 + }, + { + "epoch": 1.46, + "learning_rate": 1.09529059187384e-06, + "loss": 0.6455, + "step": 56831 + }, + { + "epoch": 1.46, + "learning_rate": 1.0952630472979223e-06, + "loss": 0.7529, + "step": 56832 + }, + { + "epoch": 1.46, + "learning_rate": 1.0952355026490665e-06, + "loss": 0.6929, + "step": 56833 + }, + { + "epoch": 1.46, + "learning_rate": 1.0952079579272928e-06, + "loss": 0.6699, + "step": 56834 + }, + { + "epoch": 1.46, + "learning_rate": 1.0951804131326234e-06, + "loss": 0.48, + "step": 56835 + }, + { + "epoch": 1.46, + "learning_rate": 1.0951528682650784e-06, + "loss": 0.6992, + "step": 56836 + }, + { + "epoch": 1.46, + "learning_rate": 1.0951253233246791e-06, + "loss": 0.7231, + "step": 56837 + }, + { + "epoch": 1.46, + "learning_rate": 1.0950977783114467e-06, + "loss": 0.5801, + "step": 56838 + }, + { + "epoch": 1.46, + "learning_rate": 1.0950702332254025e-06, + "loss": 0.5168, + "step": 56839 + }, + { + "epoch": 1.46, + "learning_rate": 1.0950426880665672e-06, + "loss": 0.6104, + "step": 56840 + }, + { + "epoch": 1.46, + "learning_rate": 1.0950151428349625e-06, + "loss": 0.667, + "step": 56841 + }, + { + "epoch": 1.46, + "learning_rate": 1.0949875975306087e-06, + "loss": 0.4958, + "step": 56842 + }, + { + "epoch": 1.46, + "learning_rate": 1.0949600521535273e-06, + "loss": 0.3528, + "step": 56843 + }, + { + "epoch": 1.46, + "learning_rate": 1.0949325067037392e-06, + "loss": 0.6294, + "step": 56844 + }, + { + "epoch": 1.46, + "learning_rate": 1.0949049611812659e-06, + "loss": 0.6289, + "step": 56845 + }, + { + "epoch": 1.46, + "learning_rate": 1.0948774155861282e-06, + "loss": 0.4341, + "step": 56846 + }, + { + "epoch": 1.46, + "learning_rate": 1.0948498699183472e-06, + "loss": 0.6816, + "step": 56847 + }, + { + "epoch": 1.46, + "learning_rate": 1.094822324177944e-06, + "loss": 0.9326, + "step": 56848 + }, + { + "epoch": 1.46, + "learning_rate": 1.0947947783649397e-06, + "loss": 0.6523, + "step": 56849 + }, + { + "epoch": 1.46, + "learning_rate": 1.0947672324793554e-06, + "loss": 0.6465, + "step": 56850 + }, + { + "epoch": 1.46, + "learning_rate": 1.0947396865212125e-06, + "loss": 0.7236, + "step": 56851 + }, + { + "epoch": 1.46, + "learning_rate": 1.0947121404905313e-06, + "loss": 0.6719, + "step": 56852 + }, + { + "epoch": 1.46, + "learning_rate": 1.0946845943873334e-06, + "loss": 0.6396, + "step": 56853 + }, + { + "epoch": 1.46, + "learning_rate": 1.0946570482116402e-06, + "loss": 0.6831, + "step": 56854 + }, + { + "epoch": 1.46, + "learning_rate": 1.0946295019634723e-06, + "loss": 0.6821, + "step": 56855 + }, + { + "epoch": 1.46, + "learning_rate": 1.0946019556428509e-06, + "loss": 0.7197, + "step": 56856 + }, + { + "epoch": 1.46, + "learning_rate": 1.094574409249797e-06, + "loss": 0.6436, + "step": 56857 + }, + { + "epoch": 1.46, + "learning_rate": 1.0945468627843322e-06, + "loss": 0.8809, + "step": 56858 + }, + { + "epoch": 1.46, + "learning_rate": 1.0945193162464767e-06, + "loss": 0.5054, + "step": 56859 + }, + { + "epoch": 1.46, + "learning_rate": 1.0944917696362528e-06, + "loss": 0.6616, + "step": 56860 + }, + { + "epoch": 1.46, + "learning_rate": 1.0944642229536802e-06, + "loss": 0.4873, + "step": 56861 + }, + { + "epoch": 1.46, + "learning_rate": 1.0944366761987812e-06, + "loss": 0.7012, + "step": 56862 + }, + { + "epoch": 1.46, + "learning_rate": 1.0944091293715758e-06, + "loss": 0.6079, + "step": 56863 + }, + { + "epoch": 1.46, + "learning_rate": 1.0943815824720861e-06, + "loss": 0.6855, + "step": 56864 + }, + { + "epoch": 1.46, + "learning_rate": 1.094354035500333e-06, + "loss": 0.6758, + "step": 56865 + }, + { + "epoch": 1.46, + "learning_rate": 1.0943264884563367e-06, + "loss": 0.4119, + "step": 56866 + }, + { + "epoch": 1.46, + "learning_rate": 1.0942989413401194e-06, + "loss": 0.5295, + "step": 56867 + }, + { + "epoch": 1.46, + "learning_rate": 1.0942713941517017e-06, + "loss": 0.6846, + "step": 56868 + }, + { + "epoch": 1.46, + "learning_rate": 1.0942438468911043e-06, + "loss": 0.6387, + "step": 56869 + }, + { + "epoch": 1.46, + "learning_rate": 1.0942162995583493e-06, + "loss": 0.5229, + "step": 56870 + }, + { + "epoch": 1.46, + "learning_rate": 1.0941887521534569e-06, + "loss": 0.7119, + "step": 56871 + }, + { + "epoch": 1.46, + "learning_rate": 1.0941612046764485e-06, + "loss": 0.6504, + "step": 56872 + }, + { + "epoch": 1.46, + "learning_rate": 1.0941336571273453e-06, + "loss": 0.3577, + "step": 56873 + }, + { + "epoch": 1.46, + "learning_rate": 1.0941061095061681e-06, + "loss": 0.5127, + "step": 56874 + }, + { + "epoch": 1.46, + "learning_rate": 1.0940785618129387e-06, + "loss": 0.7275, + "step": 56875 + }, + { + "epoch": 1.46, + "learning_rate": 1.0940510140476772e-06, + "loss": 0.6113, + "step": 56876 + }, + { + "epoch": 1.46, + "learning_rate": 1.0940234662104053e-06, + "loss": 0.624, + "step": 56877 + }, + { + "epoch": 1.46, + "learning_rate": 1.0939959183011438e-06, + "loss": 0.4521, + "step": 56878 + }, + { + "epoch": 1.46, + "learning_rate": 1.093968370319914e-06, + "loss": 0.5913, + "step": 56879 + }, + { + "epoch": 1.46, + "learning_rate": 1.0939408222667373e-06, + "loss": 0.5835, + "step": 56880 + }, + { + "epoch": 1.46, + "learning_rate": 1.0939132741416342e-06, + "loss": 0.6245, + "step": 56881 + }, + { + "epoch": 1.46, + "learning_rate": 1.0938857259446258e-06, + "loss": 0.4857, + "step": 56882 + }, + { + "epoch": 1.46, + "learning_rate": 1.0938581776757337e-06, + "loss": 0.5073, + "step": 56883 + }, + { + "epoch": 1.46, + "learning_rate": 1.0938306293349785e-06, + "loss": 0.5234, + "step": 56884 + }, + { + "epoch": 1.46, + "learning_rate": 1.0938030809223818e-06, + "loss": 0.7324, + "step": 56885 + }, + { + "epoch": 1.46, + "learning_rate": 1.093775532437964e-06, + "loss": 0.752, + "step": 56886 + }, + { + "epoch": 1.46, + "learning_rate": 1.093747983881747e-06, + "loss": 0.6111, + "step": 56887 + }, + { + "epoch": 1.46, + "learning_rate": 1.093720435253751e-06, + "loss": 0.6846, + "step": 56888 + }, + { + "epoch": 1.46, + "learning_rate": 1.093692886553998e-06, + "loss": 0.5632, + "step": 56889 + }, + { + "epoch": 1.46, + "learning_rate": 1.0936653377825085e-06, + "loss": 0.7227, + "step": 56890 + }, + { + "epoch": 1.46, + "learning_rate": 1.0936377889393035e-06, + "loss": 0.6533, + "step": 56891 + }, + { + "epoch": 1.46, + "learning_rate": 1.0936102400244048e-06, + "loss": 0.5403, + "step": 56892 + }, + { + "epoch": 1.46, + "learning_rate": 1.0935826910378325e-06, + "loss": 0.5364, + "step": 56893 + }, + { + "epoch": 1.46, + "learning_rate": 1.0935551419796089e-06, + "loss": 0.7041, + "step": 56894 + }, + { + "epoch": 1.46, + "learning_rate": 1.093527592849754e-06, + "loss": 0.4595, + "step": 56895 + }, + { + "epoch": 1.46, + "learning_rate": 1.0935000436482894e-06, + "loss": 0.5249, + "step": 56896 + }, + { + "epoch": 1.46, + "learning_rate": 1.0934724943752362e-06, + "loss": 0.6069, + "step": 56897 + }, + { + "epoch": 1.46, + "learning_rate": 1.0934449450306154e-06, + "loss": 0.4019, + "step": 56898 + }, + { + "epoch": 1.46, + "learning_rate": 1.0934173956144482e-06, + "loss": 0.7041, + "step": 56899 + }, + { + "epoch": 1.46, + "learning_rate": 1.0933898461267555e-06, + "loss": 0.5117, + "step": 56900 + }, + { + "epoch": 1.46, + "learning_rate": 1.0933622965675582e-06, + "loss": 0.7222, + "step": 56901 + }, + { + "epoch": 1.46, + "learning_rate": 1.0933347469368782e-06, + "loss": 0.7471, + "step": 56902 + }, + { + "epoch": 1.46, + "learning_rate": 1.0933071972347354e-06, + "loss": 0.7368, + "step": 56903 + }, + { + "epoch": 1.46, + "learning_rate": 1.0932796474611522e-06, + "loss": 0.6733, + "step": 56904 + }, + { + "epoch": 1.46, + "learning_rate": 1.0932520976161489e-06, + "loss": 0.502, + "step": 56905 + }, + { + "epoch": 1.46, + "learning_rate": 1.0932245476997468e-06, + "loss": 0.6807, + "step": 56906 + }, + { + "epoch": 1.46, + "learning_rate": 1.0931969977119665e-06, + "loss": 0.5605, + "step": 56907 + }, + { + "epoch": 1.46, + "learning_rate": 1.09316944765283e-06, + "loss": 0.6445, + "step": 56908 + }, + { + "epoch": 1.46, + "learning_rate": 1.093141897522358e-06, + "loss": 0.7324, + "step": 56909 + }, + { + "epoch": 1.46, + "learning_rate": 1.0931143473205713e-06, + "loss": 0.5645, + "step": 56910 + }, + { + "epoch": 1.46, + "learning_rate": 1.0930867970474913e-06, + "loss": 0.8154, + "step": 56911 + }, + { + "epoch": 1.46, + "learning_rate": 1.0930592467031387e-06, + "loss": 0.6323, + "step": 56912 + }, + { + "epoch": 1.46, + "learning_rate": 1.0930316962875354e-06, + "loss": 0.5229, + "step": 56913 + }, + { + "epoch": 1.46, + "learning_rate": 1.093004145800702e-06, + "loss": 0.5498, + "step": 56914 + }, + { + "epoch": 1.46, + "learning_rate": 1.0929765952426596e-06, + "loss": 0.3368, + "step": 56915 + }, + { + "epoch": 1.46, + "learning_rate": 1.0929490446134289e-06, + "loss": 0.6172, + "step": 56916 + }, + { + "epoch": 1.46, + "learning_rate": 1.0929214939130315e-06, + "loss": 0.7734, + "step": 56917 + }, + { + "epoch": 1.46, + "learning_rate": 1.0928939431414885e-06, + "loss": 0.6707, + "step": 56918 + }, + { + "epoch": 1.46, + "learning_rate": 1.092866392298821e-06, + "loss": 0.6577, + "step": 56919 + }, + { + "epoch": 1.46, + "learning_rate": 1.0928388413850499e-06, + "loss": 0.6611, + "step": 56920 + }, + { + "epoch": 1.46, + "learning_rate": 1.0928112904001962e-06, + "loss": 0.5918, + "step": 56921 + }, + { + "epoch": 1.46, + "learning_rate": 1.0927837393442811e-06, + "loss": 0.7812, + "step": 56922 + }, + { + "epoch": 1.46, + "learning_rate": 1.0927561882173262e-06, + "loss": 0.7461, + "step": 56923 + }, + { + "epoch": 1.46, + "learning_rate": 1.0927286370193521e-06, + "loss": 0.7314, + "step": 56924 + }, + { + "epoch": 1.46, + "learning_rate": 1.0927010857503797e-06, + "loss": 0.6174, + "step": 56925 + }, + { + "epoch": 1.46, + "learning_rate": 1.09267353441043e-06, + "loss": 0.6221, + "step": 56926 + }, + { + "epoch": 1.46, + "learning_rate": 1.0926459829995252e-06, + "loss": 0.8174, + "step": 56927 + }, + { + "epoch": 1.46, + "learning_rate": 1.092618431517685e-06, + "loss": 0.7607, + "step": 56928 + }, + { + "epoch": 1.46, + "learning_rate": 1.0925908799649314e-06, + "loss": 0.6069, + "step": 56929 + }, + { + "epoch": 1.46, + "learning_rate": 1.0925633283412851e-06, + "loss": 0.6968, + "step": 56930 + }, + { + "epoch": 1.46, + "learning_rate": 1.0925357766467676e-06, + "loss": 0.7554, + "step": 56931 + }, + { + "epoch": 1.46, + "learning_rate": 1.0925082248813995e-06, + "loss": 0.8115, + "step": 56932 + }, + { + "epoch": 1.46, + "learning_rate": 1.0924806730452021e-06, + "loss": 0.5391, + "step": 56933 + }, + { + "epoch": 1.46, + "learning_rate": 1.0924531211381966e-06, + "loss": 0.6924, + "step": 56934 + }, + { + "epoch": 1.46, + "learning_rate": 1.092425569160404e-06, + "loss": 0.667, + "step": 56935 + }, + { + "epoch": 1.46, + "learning_rate": 1.0923980171118452e-06, + "loss": 0.6748, + "step": 56936 + }, + { + "epoch": 1.46, + "learning_rate": 1.0923704649925415e-06, + "loss": 0.707, + "step": 56937 + }, + { + "epoch": 1.46, + "learning_rate": 1.092342912802514e-06, + "loss": 0.8252, + "step": 56938 + }, + { + "epoch": 1.46, + "learning_rate": 1.092315360541784e-06, + "loss": 0.6963, + "step": 56939 + }, + { + "epoch": 1.46, + "learning_rate": 1.0922878082103724e-06, + "loss": 0.5947, + "step": 56940 + }, + { + "epoch": 1.46, + "learning_rate": 1.0922602558082999e-06, + "loss": 0.6792, + "step": 56941 + }, + { + "epoch": 1.46, + "learning_rate": 1.0922327033355884e-06, + "loss": 0.5603, + "step": 56942 + }, + { + "epoch": 1.46, + "learning_rate": 1.092205150792258e-06, + "loss": 0.5981, + "step": 56943 + }, + { + "epoch": 1.46, + "learning_rate": 1.092177598178331e-06, + "loss": 0.708, + "step": 56944 + }, + { + "epoch": 1.46, + "learning_rate": 1.0921500454938272e-06, + "loss": 0.4836, + "step": 56945 + }, + { + "epoch": 1.46, + "learning_rate": 1.092122492738769e-06, + "loss": 0.6846, + "step": 56946 + }, + { + "epoch": 1.46, + "learning_rate": 1.0920949399131763e-06, + "loss": 0.4636, + "step": 56947 + }, + { + "epoch": 1.46, + "learning_rate": 1.092067387017071e-06, + "loss": 0.5264, + "step": 56948 + }, + { + "epoch": 1.46, + "learning_rate": 1.092039834050474e-06, + "loss": 0.457, + "step": 56949 + }, + { + "epoch": 1.46, + "learning_rate": 1.0920122810134063e-06, + "loss": 0.4454, + "step": 56950 + }, + { + "epoch": 1.46, + "learning_rate": 1.0919847279058887e-06, + "loss": 0.8047, + "step": 56951 + }, + { + "epoch": 1.46, + "learning_rate": 1.091957174727943e-06, + "loss": 0.4622, + "step": 56952 + }, + { + "epoch": 1.46, + "learning_rate": 1.0919296214795897e-06, + "loss": 0.7002, + "step": 56953 + }, + { + "epoch": 1.46, + "learning_rate": 1.0919020681608505e-06, + "loss": 0.3604, + "step": 56954 + }, + { + "epoch": 1.46, + "learning_rate": 1.0918745147717457e-06, + "loss": 0.625, + "step": 56955 + }, + { + "epoch": 1.46, + "learning_rate": 1.0918469613122967e-06, + "loss": 0.6426, + "step": 56956 + }, + { + "epoch": 1.46, + "learning_rate": 1.091819407782525e-06, + "loss": 0.5688, + "step": 56957 + }, + { + "epoch": 1.46, + "learning_rate": 1.0917918541824515e-06, + "loss": 0.6504, + "step": 56958 + }, + { + "epoch": 1.46, + "learning_rate": 1.091764300512097e-06, + "loss": 0.7129, + "step": 56959 + }, + { + "epoch": 1.46, + "learning_rate": 1.0917367467714829e-06, + "loss": 0.5048, + "step": 56960 + }, + { + "epoch": 1.46, + "learning_rate": 1.0917091929606302e-06, + "loss": 0.8037, + "step": 56961 + }, + { + "epoch": 1.46, + "learning_rate": 1.0916816390795597e-06, + "loss": 0.7236, + "step": 56962 + }, + { + "epoch": 1.46, + "learning_rate": 1.091654085128293e-06, + "loss": 0.6133, + "step": 56963 + }, + { + "epoch": 1.46, + "learning_rate": 1.0916265311068511e-06, + "loss": 0.7153, + "step": 56964 + }, + { + "epoch": 1.46, + "learning_rate": 1.091598977015255e-06, + "loss": 0.7295, + "step": 56965 + }, + { + "epoch": 1.46, + "learning_rate": 1.0915714228535254e-06, + "loss": 0.6172, + "step": 56966 + }, + { + "epoch": 1.46, + "learning_rate": 1.091543868621684e-06, + "loss": 0.709, + "step": 56967 + }, + { + "epoch": 1.46, + "learning_rate": 1.0915163143197517e-06, + "loss": 0.5054, + "step": 56968 + }, + { + "epoch": 1.46, + "learning_rate": 1.0914887599477499e-06, + "loss": 0.7432, + "step": 56969 + }, + { + "epoch": 1.46, + "learning_rate": 1.0914612055056986e-06, + "loss": 0.7021, + "step": 56970 + }, + { + "epoch": 1.46, + "learning_rate": 1.0914336509936202e-06, + "loss": 0.5845, + "step": 56971 + }, + { + "epoch": 1.46, + "learning_rate": 1.0914060964115351e-06, + "loss": 0.6296, + "step": 56972 + }, + { + "epoch": 1.46, + "learning_rate": 1.0913785417594646e-06, + "loss": 0.7295, + "step": 56973 + }, + { + "epoch": 1.46, + "learning_rate": 1.0913509870374298e-06, + "loss": 0.6191, + "step": 56974 + }, + { + "epoch": 1.46, + "learning_rate": 1.0913234322454516e-06, + "loss": 0.623, + "step": 56975 + }, + { + "epoch": 1.46, + "learning_rate": 1.0912958773835511e-06, + "loss": 0.6963, + "step": 56976 + }, + { + "epoch": 1.46, + "learning_rate": 1.09126832245175e-06, + "loss": 0.7812, + "step": 56977 + }, + { + "epoch": 1.46, + "learning_rate": 1.0912407674500686e-06, + "loss": 0.561, + "step": 56978 + }, + { + "epoch": 1.46, + "learning_rate": 1.0912132123785285e-06, + "loss": 0.7383, + "step": 56979 + }, + { + "epoch": 1.46, + "learning_rate": 1.0911856572371508e-06, + "loss": 0.594, + "step": 56980 + }, + { + "epoch": 1.46, + "learning_rate": 1.091158102025956e-06, + "loss": 0.6836, + "step": 56981 + }, + { + "epoch": 1.46, + "learning_rate": 1.0911305467449658e-06, + "loss": 0.4771, + "step": 56982 + }, + { + "epoch": 1.46, + "learning_rate": 1.091102991394201e-06, + "loss": 0.8076, + "step": 56983 + }, + { + "epoch": 1.46, + "learning_rate": 1.0910754359736836e-06, + "loss": 0.5361, + "step": 56984 + }, + { + "epoch": 1.46, + "learning_rate": 1.091047880483433e-06, + "loss": 0.6069, + "step": 56985 + }, + { + "epoch": 1.46, + "learning_rate": 1.0910203249234718e-06, + "loss": 0.5374, + "step": 56986 + }, + { + "epoch": 1.46, + "learning_rate": 1.0909927692938202e-06, + "loss": 0.7256, + "step": 56987 + }, + { + "epoch": 1.46, + "learning_rate": 1.0909652135944995e-06, + "loss": 0.7207, + "step": 56988 + }, + { + "epoch": 1.46, + "learning_rate": 1.0909376578255314e-06, + "loss": 0.564, + "step": 56989 + }, + { + "epoch": 1.46, + "learning_rate": 1.0909101019869362e-06, + "loss": 0.6875, + "step": 56990 + }, + { + "epoch": 1.46, + "learning_rate": 1.0908825460787351e-06, + "loss": 0.6221, + "step": 56991 + }, + { + "epoch": 1.46, + "learning_rate": 1.0908549901009498e-06, + "loss": 0.6572, + "step": 56992 + }, + { + "epoch": 1.46, + "learning_rate": 1.0908274340536009e-06, + "loss": 0.6824, + "step": 56993 + }, + { + "epoch": 1.46, + "learning_rate": 1.0907998779367099e-06, + "loss": 0.8145, + "step": 56994 + }, + { + "epoch": 1.46, + "learning_rate": 1.0907723217502972e-06, + "loss": 0.6777, + "step": 56995 + }, + { + "epoch": 1.46, + "learning_rate": 1.0907447654943844e-06, + "loss": 0.6191, + "step": 56996 + }, + { + "epoch": 1.46, + "learning_rate": 1.0907172091689924e-06, + "loss": 0.5586, + "step": 56997 + }, + { + "epoch": 1.46, + "learning_rate": 1.0906896527741425e-06, + "loss": 0.5991, + "step": 56998 + }, + { + "epoch": 1.46, + "learning_rate": 1.0906620963098558e-06, + "loss": 0.6821, + "step": 56999 + }, + { + "epoch": 1.46, + "learning_rate": 1.0906345397761533e-06, + "loss": 0.5967, + "step": 57000 + }, + { + "epoch": 1.46, + "learning_rate": 1.090606983173056e-06, + "loss": 0.6709, + "step": 57001 + }, + { + "epoch": 1.46, + "learning_rate": 1.090579426500585e-06, + "loss": 0.6846, + "step": 57002 + }, + { + "epoch": 1.46, + "learning_rate": 1.0905518697587617e-06, + "loss": 0.4976, + "step": 57003 + }, + { + "epoch": 1.46, + "learning_rate": 1.090524312947607e-06, + "loss": 0.5015, + "step": 57004 + }, + { + "epoch": 1.46, + "learning_rate": 1.0904967560671418e-06, + "loss": 0.6787, + "step": 57005 + }, + { + "epoch": 1.46, + "learning_rate": 1.0904691991173875e-06, + "loss": 0.562, + "step": 57006 + }, + { + "epoch": 1.46, + "learning_rate": 1.0904416420983651e-06, + "loss": 0.6582, + "step": 57007 + }, + { + "epoch": 1.46, + "learning_rate": 1.0904140850100955e-06, + "loss": 0.7168, + "step": 57008 + }, + { + "epoch": 1.46, + "learning_rate": 1.0903865278526006e-06, + "loss": 0.5601, + "step": 57009 + }, + { + "epoch": 1.46, + "learning_rate": 1.0903589706259002e-06, + "loss": 0.6064, + "step": 57010 + }, + { + "epoch": 1.46, + "learning_rate": 1.0903314133300166e-06, + "loss": 0.7266, + "step": 57011 + }, + { + "epoch": 1.46, + "learning_rate": 1.09030385596497e-06, + "loss": 0.6543, + "step": 57012 + }, + { + "epoch": 1.46, + "learning_rate": 1.0902762985307821e-06, + "loss": 0.7285, + "step": 57013 + }, + { + "epoch": 1.46, + "learning_rate": 1.090248741027474e-06, + "loss": 0.5049, + "step": 57014 + }, + { + "epoch": 1.46, + "learning_rate": 1.0902211834550664e-06, + "loss": 0.9189, + "step": 57015 + }, + { + "epoch": 1.46, + "learning_rate": 1.0901936258135802e-06, + "loss": 0.5674, + "step": 57016 + }, + { + "epoch": 1.46, + "learning_rate": 1.0901660681030374e-06, + "loss": 0.7041, + "step": 57017 + }, + { + "epoch": 1.46, + "learning_rate": 1.0901385103234583e-06, + "loss": 0.6172, + "step": 57018 + }, + { + "epoch": 1.46, + "learning_rate": 1.0901109524748643e-06, + "loss": 0.6982, + "step": 57019 + }, + { + "epoch": 1.46, + "learning_rate": 1.0900833945572768e-06, + "loss": 0.8213, + "step": 57020 + }, + { + "epoch": 1.46, + "learning_rate": 1.0900558365707162e-06, + "loss": 0.4783, + "step": 57021 + }, + { + "epoch": 1.46, + "learning_rate": 1.090028278515204e-06, + "loss": 0.7314, + "step": 57022 + }, + { + "epoch": 1.46, + "learning_rate": 1.0900007203907615e-06, + "loss": 0.6084, + "step": 57023 + }, + { + "epoch": 1.46, + "learning_rate": 1.0899731621974097e-06, + "loss": 0.6372, + "step": 57024 + }, + { + "epoch": 1.46, + "learning_rate": 1.0899456039351691e-06, + "loss": 0.7573, + "step": 57025 + }, + { + "epoch": 1.46, + "learning_rate": 1.0899180456040618e-06, + "loss": 0.8203, + "step": 57026 + }, + { + "epoch": 1.46, + "learning_rate": 1.0898904872041079e-06, + "loss": 0.5903, + "step": 57027 + }, + { + "epoch": 1.46, + "learning_rate": 1.0898629287353293e-06, + "loss": 0.7822, + "step": 57028 + }, + { + "epoch": 1.46, + "learning_rate": 1.089835370197747e-06, + "loss": 0.562, + "step": 57029 + }, + { + "epoch": 1.46, + "learning_rate": 1.0898078115913817e-06, + "loss": 0.6079, + "step": 57030 + }, + { + "epoch": 1.46, + "learning_rate": 1.0897802529162545e-06, + "loss": 0.5884, + "step": 57031 + }, + { + "epoch": 1.46, + "learning_rate": 1.089752694172387e-06, + "loss": 0.7256, + "step": 57032 + }, + { + "epoch": 1.46, + "learning_rate": 1.0897251353597996e-06, + "loss": 0.7373, + "step": 57033 + }, + { + "epoch": 1.46, + "learning_rate": 1.0896975764785141e-06, + "loss": 0.7559, + "step": 57034 + }, + { + "epoch": 1.46, + "learning_rate": 1.0896700175285512e-06, + "loss": 0.647, + "step": 57035 + }, + { + "epoch": 1.46, + "learning_rate": 1.0896424585099322e-06, + "loss": 0.5938, + "step": 57036 + }, + { + "epoch": 1.46, + "learning_rate": 1.0896148994226778e-06, + "loss": 0.4333, + "step": 57037 + }, + { + "epoch": 1.46, + "learning_rate": 1.0895873402668096e-06, + "loss": 0.6992, + "step": 57038 + }, + { + "epoch": 1.46, + "learning_rate": 1.0895597810423485e-06, + "loss": 0.8135, + "step": 57039 + }, + { + "epoch": 1.46, + "learning_rate": 1.0895322217493156e-06, + "loss": 0.5771, + "step": 57040 + }, + { + "epoch": 1.46, + "learning_rate": 1.0895046623877317e-06, + "loss": 0.7051, + "step": 57041 + }, + { + "epoch": 1.46, + "learning_rate": 1.0894771029576187e-06, + "loss": 0.8242, + "step": 57042 + }, + { + "epoch": 1.46, + "learning_rate": 1.0894495434589967e-06, + "loss": 0.6875, + "step": 57043 + }, + { + "epoch": 1.46, + "learning_rate": 1.0894219838918877e-06, + "loss": 0.6313, + "step": 57044 + }, + { + "epoch": 1.46, + "learning_rate": 1.0893944242563122e-06, + "loss": 0.6499, + "step": 57045 + }, + { + "epoch": 1.46, + "learning_rate": 1.0893668645522913e-06, + "loss": 0.8184, + "step": 57046 + }, + { + "epoch": 1.46, + "learning_rate": 1.0893393047798467e-06, + "loss": 0.5708, + "step": 57047 + }, + { + "epoch": 1.46, + "learning_rate": 1.089311744938999e-06, + "loss": 0.7363, + "step": 57048 + }, + { + "epoch": 1.46, + "learning_rate": 1.0892841850297694e-06, + "loss": 0.7666, + "step": 57049 + }, + { + "epoch": 1.46, + "learning_rate": 1.089256625052179e-06, + "loss": 0.6929, + "step": 57050 + }, + { + "epoch": 1.46, + "learning_rate": 1.0892290650062487e-06, + "loss": 0.6414, + "step": 57051 + }, + { + "epoch": 1.46, + "learning_rate": 1.0892015048919999e-06, + "loss": 0.7476, + "step": 57052 + }, + { + "epoch": 1.46, + "learning_rate": 1.0891739447094536e-06, + "loss": 0.6069, + "step": 57053 + }, + { + "epoch": 1.46, + "learning_rate": 1.089146384458631e-06, + "loss": 0.7324, + "step": 57054 + }, + { + "epoch": 1.46, + "learning_rate": 1.0891188241395533e-06, + "loss": 0.8867, + "step": 57055 + }, + { + "epoch": 1.46, + "learning_rate": 1.0890912637522411e-06, + "loss": 0.6904, + "step": 57056 + }, + { + "epoch": 1.46, + "learning_rate": 1.089063703296716e-06, + "loss": 0.6963, + "step": 57057 + }, + { + "epoch": 1.46, + "learning_rate": 1.0890361427729986e-06, + "loss": 0.7461, + "step": 57058 + }, + { + "epoch": 1.46, + "learning_rate": 1.0890085821811108e-06, + "loss": 0.5735, + "step": 57059 + }, + { + "epoch": 1.46, + "learning_rate": 1.0889810215210728e-06, + "loss": 0.5161, + "step": 57060 + }, + { + "epoch": 1.46, + "learning_rate": 1.0889534607929065e-06, + "loss": 0.6777, + "step": 57061 + }, + { + "epoch": 1.46, + "learning_rate": 1.0889258999966322e-06, + "loss": 0.7139, + "step": 57062 + }, + { + "epoch": 1.46, + "learning_rate": 1.0888983391322717e-06, + "loss": 0.5424, + "step": 57063 + }, + { + "epoch": 1.46, + "learning_rate": 1.088870778199846e-06, + "loss": 0.8076, + "step": 57064 + }, + { + "epoch": 1.46, + "learning_rate": 1.0888432171993757e-06, + "loss": 0.7344, + "step": 57065 + }, + { + "epoch": 1.46, + "learning_rate": 1.0888156561308824e-06, + "loss": 0.6396, + "step": 57066 + }, + { + "epoch": 1.46, + "learning_rate": 1.088788094994387e-06, + "loss": 0.7021, + "step": 57067 + }, + { + "epoch": 1.46, + "learning_rate": 1.0887605337899105e-06, + "loss": 0.7246, + "step": 57068 + }, + { + "epoch": 1.46, + "learning_rate": 1.0887329725174743e-06, + "loss": 0.7168, + "step": 57069 + }, + { + "epoch": 1.46, + "learning_rate": 1.0887054111770994e-06, + "loss": 0.623, + "step": 57070 + }, + { + "epoch": 1.46, + "learning_rate": 1.0886778497688066e-06, + "loss": 0.8057, + "step": 57071 + }, + { + "epoch": 1.46, + "learning_rate": 1.0886502882926174e-06, + "loss": 0.709, + "step": 57072 + }, + { + "epoch": 1.46, + "learning_rate": 1.0886227267485526e-06, + "loss": 0.6982, + "step": 57073 + }, + { + "epoch": 1.46, + "learning_rate": 1.0885951651366338e-06, + "loss": 0.6279, + "step": 57074 + }, + { + "epoch": 1.46, + "learning_rate": 1.0885676034568817e-06, + "loss": 0.6353, + "step": 57075 + }, + { + "epoch": 1.46, + "learning_rate": 1.0885400417093174e-06, + "loss": 0.6514, + "step": 57076 + }, + { + "epoch": 1.46, + "learning_rate": 1.0885124798939618e-06, + "loss": 0.5371, + "step": 57077 + }, + { + "epoch": 1.46, + "learning_rate": 1.0884849180108365e-06, + "loss": 0.6543, + "step": 57078 + }, + { + "epoch": 1.46, + "learning_rate": 1.0884573560599625e-06, + "loss": 0.5718, + "step": 57079 + }, + { + "epoch": 1.46, + "learning_rate": 1.0884297940413605e-06, + "loss": 0.6602, + "step": 57080 + }, + { + "epoch": 1.46, + "learning_rate": 1.0884022319550516e-06, + "loss": 0.5908, + "step": 57081 + }, + { + "epoch": 1.46, + "learning_rate": 1.0883746698010576e-06, + "loss": 0.7803, + "step": 57082 + }, + { + "epoch": 1.46, + "learning_rate": 1.088347107579399e-06, + "loss": 0.8027, + "step": 57083 + }, + { + "epoch": 1.46, + "learning_rate": 1.0883195452900974e-06, + "loss": 0.4956, + "step": 57084 + }, + { + "epoch": 1.46, + "learning_rate": 1.0882919829331734e-06, + "loss": 0.7793, + "step": 57085 + }, + { + "epoch": 1.46, + "learning_rate": 1.0882644205086485e-06, + "loss": 0.6973, + "step": 57086 + }, + { + "epoch": 1.46, + "learning_rate": 1.088236858016543e-06, + "loss": 0.6899, + "step": 57087 + }, + { + "epoch": 1.46, + "learning_rate": 1.0882092954568792e-06, + "loss": 0.5956, + "step": 57088 + }, + { + "epoch": 1.46, + "learning_rate": 1.0881817328296775e-06, + "loss": 0.4443, + "step": 57089 + }, + { + "epoch": 1.46, + "learning_rate": 1.0881541701349586e-06, + "loss": 0.667, + "step": 57090 + }, + { + "epoch": 1.46, + "learning_rate": 1.0881266073727443e-06, + "loss": 0.5605, + "step": 57091 + }, + { + "epoch": 1.46, + "learning_rate": 1.0880990445430558e-06, + "loss": 0.6826, + "step": 57092 + }, + { + "epoch": 1.46, + "learning_rate": 1.0880714816459139e-06, + "loss": 0.5101, + "step": 57093 + }, + { + "epoch": 1.46, + "learning_rate": 1.0880439186813394e-06, + "loss": 0.5197, + "step": 57094 + }, + { + "epoch": 1.46, + "learning_rate": 1.088016355649354e-06, + "loss": 0.8662, + "step": 57095 + }, + { + "epoch": 1.46, + "learning_rate": 1.0879887925499785e-06, + "loss": 0.6616, + "step": 57096 + }, + { + "epoch": 1.46, + "learning_rate": 1.0879612293832338e-06, + "loss": 0.623, + "step": 57097 + }, + { + "epoch": 1.46, + "learning_rate": 1.0879336661491415e-06, + "loss": 0.8652, + "step": 57098 + }, + { + "epoch": 1.46, + "learning_rate": 1.0879061028477225e-06, + "loss": 0.6577, + "step": 57099 + }, + { + "epoch": 1.46, + "learning_rate": 1.0878785394789975e-06, + "loss": 0.7979, + "step": 57100 + }, + { + "epoch": 1.46, + "learning_rate": 1.0878509760429882e-06, + "loss": 0.9111, + "step": 57101 + }, + { + "epoch": 1.46, + "learning_rate": 1.0878234125397152e-06, + "loss": 0.625, + "step": 57102 + }, + { + "epoch": 1.46, + "learning_rate": 1.0877958489692e-06, + "loss": 0.6484, + "step": 57103 + }, + { + "epoch": 1.46, + "learning_rate": 1.0877682853314637e-06, + "loss": 0.7197, + "step": 57104 + }, + { + "epoch": 1.46, + "learning_rate": 1.0877407216265274e-06, + "loss": 0.6572, + "step": 57105 + }, + { + "epoch": 1.46, + "learning_rate": 1.0877131578544114e-06, + "loss": 0.8301, + "step": 57106 + }, + { + "epoch": 1.46, + "learning_rate": 1.087685594015138e-06, + "loss": 0.8311, + "step": 57107 + }, + { + "epoch": 1.46, + "learning_rate": 1.0876580301087275e-06, + "loss": 0.6606, + "step": 57108 + }, + { + "epoch": 1.46, + "learning_rate": 1.0876304661352014e-06, + "loss": 0.5508, + "step": 57109 + }, + { + "epoch": 1.46, + "learning_rate": 1.0876029020945809e-06, + "loss": 0.6025, + "step": 57110 + }, + { + "epoch": 1.46, + "learning_rate": 1.0875753379868865e-06, + "loss": 0.626, + "step": 57111 + }, + { + "epoch": 1.46, + "learning_rate": 1.08754777381214e-06, + "loss": 0.8164, + "step": 57112 + }, + { + "epoch": 1.46, + "learning_rate": 1.087520209570362e-06, + "loss": 0.6826, + "step": 57113 + }, + { + "epoch": 1.46, + "learning_rate": 1.087492645261574e-06, + "loss": 0.6451, + "step": 57114 + }, + { + "epoch": 1.46, + "learning_rate": 1.0874650808857965e-06, + "loss": 0.4966, + "step": 57115 + }, + { + "epoch": 1.46, + "learning_rate": 1.0874375164430513e-06, + "loss": 0.563, + "step": 57116 + }, + { + "epoch": 1.46, + "learning_rate": 1.0874099519333593e-06, + "loss": 0.6572, + "step": 57117 + }, + { + "epoch": 1.46, + "learning_rate": 1.0873823873567414e-06, + "loss": 0.5884, + "step": 57118 + }, + { + "epoch": 1.46, + "learning_rate": 1.0873548227132189e-06, + "loss": 0.6216, + "step": 57119 + }, + { + "epoch": 1.46, + "learning_rate": 1.0873272580028127e-06, + "loss": 0.4543, + "step": 57120 + }, + { + "epoch": 1.46, + "learning_rate": 1.0872996932255441e-06, + "loss": 0.582, + "step": 57121 + }, + { + "epoch": 1.46, + "learning_rate": 1.087272128381434e-06, + "loss": 0.7236, + "step": 57122 + }, + { + "epoch": 1.46, + "learning_rate": 1.0872445634705038e-06, + "loss": 0.7168, + "step": 57123 + }, + { + "epoch": 1.46, + "learning_rate": 1.0872169984927745e-06, + "loss": 0.5996, + "step": 57124 + }, + { + "epoch": 1.46, + "learning_rate": 1.0871894334482672e-06, + "loss": 0.604, + "step": 57125 + }, + { + "epoch": 1.46, + "learning_rate": 1.0871618683370028e-06, + "loss": 0.7461, + "step": 57126 + }, + { + "epoch": 1.46, + "learning_rate": 1.0871343031590027e-06, + "loss": 0.7627, + "step": 57127 + }, + { + "epoch": 1.46, + "learning_rate": 1.0871067379142877e-06, + "loss": 0.6958, + "step": 57128 + }, + { + "epoch": 1.46, + "learning_rate": 1.0870791726028793e-06, + "loss": 0.7256, + "step": 57129 + }, + { + "epoch": 1.46, + "learning_rate": 1.0870516072247981e-06, + "loss": 0.647, + "step": 57130 + }, + { + "epoch": 1.46, + "learning_rate": 1.0870240417800657e-06, + "loss": 0.7656, + "step": 57131 + }, + { + "epoch": 1.46, + "learning_rate": 1.0869964762687028e-06, + "loss": 0.6387, + "step": 57132 + }, + { + "epoch": 1.46, + "learning_rate": 1.0869689106907306e-06, + "loss": 0.7773, + "step": 57133 + }, + { + "epoch": 1.46, + "learning_rate": 1.0869413450461706e-06, + "loss": 0.7158, + "step": 57134 + }, + { + "epoch": 1.46, + "learning_rate": 1.0869137793350435e-06, + "loss": 0.75, + "step": 57135 + }, + { + "epoch": 1.46, + "learning_rate": 1.0868862135573707e-06, + "loss": 0.6709, + "step": 57136 + }, + { + "epoch": 1.46, + "learning_rate": 1.0868586477131729e-06, + "loss": 0.564, + "step": 57137 + }, + { + "epoch": 1.46, + "learning_rate": 1.0868310818024715e-06, + "loss": 0.6201, + "step": 57138 + }, + { + "epoch": 1.46, + "learning_rate": 1.0868035158252878e-06, + "loss": 0.708, + "step": 57139 + }, + { + "epoch": 1.46, + "learning_rate": 1.086775949781642e-06, + "loss": 0.6973, + "step": 57140 + }, + { + "epoch": 1.46, + "learning_rate": 1.0867483836715563e-06, + "loss": 0.5906, + "step": 57141 + }, + { + "epoch": 1.46, + "learning_rate": 1.0867208174950513e-06, + "loss": 0.6904, + "step": 57142 + }, + { + "epoch": 1.46, + "learning_rate": 1.086693251252148e-06, + "loss": 0.707, + "step": 57143 + }, + { + "epoch": 1.46, + "learning_rate": 1.0866656849428679e-06, + "loss": 0.5498, + "step": 57144 + }, + { + "epoch": 1.46, + "learning_rate": 1.0866381185672318e-06, + "loss": 0.6084, + "step": 57145 + }, + { + "epoch": 1.46, + "learning_rate": 1.0866105521252606e-06, + "loss": 0.5007, + "step": 57146 + }, + { + "epoch": 1.46, + "learning_rate": 1.0865829856169762e-06, + "loss": 0.6982, + "step": 57147 + }, + { + "epoch": 1.46, + "learning_rate": 1.0865554190423987e-06, + "loss": 0.6494, + "step": 57148 + }, + { + "epoch": 1.46, + "learning_rate": 1.0865278524015503e-06, + "loss": 0.6785, + "step": 57149 + }, + { + "epoch": 1.46, + "learning_rate": 1.0865002856944507e-06, + "loss": 0.5522, + "step": 57150 + }, + { + "epoch": 1.46, + "learning_rate": 1.0864727189211225e-06, + "loss": 0.7036, + "step": 57151 + }, + { + "epoch": 1.46, + "learning_rate": 1.0864451520815856e-06, + "loss": 0.6321, + "step": 57152 + }, + { + "epoch": 1.46, + "learning_rate": 1.0864175851758619e-06, + "loss": 0.4064, + "step": 57153 + }, + { + "epoch": 1.46, + "learning_rate": 1.0863900182039722e-06, + "loss": 0.6963, + "step": 57154 + }, + { + "epoch": 1.46, + "learning_rate": 1.0863624511659375e-06, + "loss": 0.5669, + "step": 57155 + }, + { + "epoch": 1.46, + "learning_rate": 1.0863348840617792e-06, + "loss": 0.6963, + "step": 57156 + }, + { + "epoch": 1.46, + "learning_rate": 1.0863073168915182e-06, + "loss": 0.7305, + "step": 57157 + }, + { + "epoch": 1.46, + "learning_rate": 1.0862797496551757e-06, + "loss": 0.603, + "step": 57158 + }, + { + "epoch": 1.47, + "learning_rate": 1.0862521823527725e-06, + "loss": 0.6309, + "step": 57159 + }, + { + "epoch": 1.47, + "learning_rate": 1.0862246149843304e-06, + "loss": 0.5933, + "step": 57160 + }, + { + "epoch": 1.47, + "learning_rate": 1.0861970475498697e-06, + "loss": 0.6431, + "step": 57161 + }, + { + "epoch": 1.47, + "learning_rate": 1.0861694800494122e-06, + "loss": 0.499, + "step": 57162 + }, + { + "epoch": 1.47, + "learning_rate": 1.0861419124829783e-06, + "loss": 0.6924, + "step": 57163 + }, + { + "epoch": 1.47, + "learning_rate": 1.08611434485059e-06, + "loss": 0.5635, + "step": 57164 + }, + { + "epoch": 1.47, + "learning_rate": 1.0860867771522676e-06, + "loss": 0.6211, + "step": 57165 + }, + { + "epoch": 1.47, + "learning_rate": 1.0860592093880326e-06, + "loss": 0.6582, + "step": 57166 + }, + { + "epoch": 1.47, + "learning_rate": 1.0860316415579058e-06, + "loss": 0.6729, + "step": 57167 + }, + { + "epoch": 1.47, + "learning_rate": 1.0860040736619087e-06, + "loss": 0.6543, + "step": 57168 + }, + { + "epoch": 1.47, + "learning_rate": 1.0859765057000624e-06, + "loss": 0.6777, + "step": 57169 + }, + { + "epoch": 1.47, + "learning_rate": 1.085948937672388e-06, + "loss": 0.5201, + "step": 57170 + }, + { + "epoch": 1.47, + "learning_rate": 1.0859213695789057e-06, + "loss": 0.6343, + "step": 57171 + }, + { + "epoch": 1.47, + "learning_rate": 1.085893801419638e-06, + "loss": 0.5688, + "step": 57172 + }, + { + "epoch": 1.47, + "learning_rate": 1.0858662331946048e-06, + "loss": 0.4475, + "step": 57173 + }, + { + "epoch": 1.47, + "learning_rate": 1.0858386649038285e-06, + "loss": 0.6392, + "step": 57174 + }, + { + "epoch": 1.47, + "learning_rate": 1.085811096547329e-06, + "loss": 0.8359, + "step": 57175 + }, + { + "epoch": 1.47, + "learning_rate": 1.0857835281251282e-06, + "loss": 0.7324, + "step": 57176 + }, + { + "epoch": 1.47, + "learning_rate": 1.0857559596372465e-06, + "loss": 0.585, + "step": 57177 + }, + { + "epoch": 1.47, + "learning_rate": 1.0857283910837057e-06, + "loss": 0.708, + "step": 57178 + }, + { + "epoch": 1.47, + "learning_rate": 1.0857008224645265e-06, + "loss": 0.7529, + "step": 57179 + }, + { + "epoch": 1.47, + "learning_rate": 1.08567325377973e-06, + "loss": 0.6895, + "step": 57180 + }, + { + "epoch": 1.47, + "learning_rate": 1.0856456850293377e-06, + "loss": 0.5962, + "step": 57181 + }, + { + "epoch": 1.47, + "learning_rate": 1.0856181162133702e-06, + "loss": 0.7324, + "step": 57182 + }, + { + "epoch": 1.47, + "learning_rate": 1.0855905473318492e-06, + "loss": 0.5724, + "step": 57183 + }, + { + "epoch": 1.47, + "learning_rate": 1.085562978384795e-06, + "loss": 0.6934, + "step": 57184 + }, + { + "epoch": 1.47, + "learning_rate": 1.0855354093722295e-06, + "loss": 0.7617, + "step": 57185 + }, + { + "epoch": 1.47, + "learning_rate": 1.0855078402941731e-06, + "loss": 0.8369, + "step": 57186 + }, + { + "epoch": 1.47, + "learning_rate": 1.0854802711506477e-06, + "loss": 0.7334, + "step": 57187 + }, + { + "epoch": 1.47, + "learning_rate": 1.0854527019416737e-06, + "loss": 0.6973, + "step": 57188 + }, + { + "epoch": 1.47, + "learning_rate": 1.0854251326672728e-06, + "loss": 0.6658, + "step": 57189 + }, + { + "epoch": 1.47, + "learning_rate": 1.0853975633274654e-06, + "loss": 0.4663, + "step": 57190 + }, + { + "epoch": 1.47, + "learning_rate": 1.0853699939222733e-06, + "loss": 0.7109, + "step": 57191 + }, + { + "epoch": 1.47, + "learning_rate": 1.0853424244517171e-06, + "loss": 0.6113, + "step": 57192 + }, + { + "epoch": 1.47, + "learning_rate": 1.0853148549158185e-06, + "loss": 0.625, + "step": 57193 + }, + { + "epoch": 1.47, + "learning_rate": 1.0852872853145977e-06, + "loss": 0.7559, + "step": 57194 + }, + { + "epoch": 1.47, + "learning_rate": 1.0852597156480769e-06, + "loss": 0.6777, + "step": 57195 + }, + { + "epoch": 1.47, + "learning_rate": 1.0852321459162762e-06, + "loss": 0.749, + "step": 57196 + }, + { + "epoch": 1.47, + "learning_rate": 1.0852045761192174e-06, + "loss": 0.5835, + "step": 57197 + }, + { + "epoch": 1.47, + "learning_rate": 1.0851770062569214e-06, + "loss": 0.5341, + "step": 57198 + }, + { + "epoch": 1.47, + "learning_rate": 1.0851494363294092e-06, + "loss": 0.6172, + "step": 57199 + }, + { + "epoch": 1.47, + "learning_rate": 1.085121866336702e-06, + "loss": 0.5371, + "step": 57200 + }, + { + "epoch": 1.47, + "learning_rate": 1.085094296278821e-06, + "loss": 0.491, + "step": 57201 + }, + { + "epoch": 1.47, + "learning_rate": 1.0850667261557871e-06, + "loss": 0.6943, + "step": 57202 + }, + { + "epoch": 1.47, + "learning_rate": 1.0850391559676215e-06, + "loss": 0.707, + "step": 57203 + }, + { + "epoch": 1.47, + "learning_rate": 1.0850115857143456e-06, + "loss": 0.52, + "step": 57204 + }, + { + "epoch": 1.47, + "learning_rate": 1.0849840153959798e-06, + "loss": 0.7012, + "step": 57205 + }, + { + "epoch": 1.47, + "learning_rate": 1.084956445012546e-06, + "loss": 0.6221, + "step": 57206 + }, + { + "epoch": 1.47, + "learning_rate": 1.0849288745640646e-06, + "loss": 0.6445, + "step": 57207 + }, + { + "epoch": 1.47, + "learning_rate": 1.0849013040505575e-06, + "loss": 0.7715, + "step": 57208 + }, + { + "epoch": 1.47, + "learning_rate": 1.084873733472045e-06, + "loss": 0.6992, + "step": 57209 + }, + { + "epoch": 1.47, + "learning_rate": 1.0848461628285487e-06, + "loss": 0.6636, + "step": 57210 + }, + { + "epoch": 1.47, + "learning_rate": 1.0848185921200897e-06, + "loss": 0.6465, + "step": 57211 + }, + { + "epoch": 1.47, + "learning_rate": 1.0847910213466888e-06, + "loss": 0.7002, + "step": 57212 + }, + { + "epoch": 1.47, + "learning_rate": 1.0847634505083675e-06, + "loss": 0.6191, + "step": 57213 + }, + { + "epoch": 1.47, + "learning_rate": 1.0847358796051468e-06, + "loss": 0.5308, + "step": 57214 + }, + { + "epoch": 1.47, + "learning_rate": 1.0847083086370476e-06, + "loss": 0.7705, + "step": 57215 + }, + { + "epoch": 1.47, + "learning_rate": 1.0846807376040913e-06, + "loss": 0.6514, + "step": 57216 + }, + { + "epoch": 1.47, + "learning_rate": 1.0846531665062986e-06, + "loss": 0.7236, + "step": 57217 + }, + { + "epoch": 1.47, + "learning_rate": 1.0846255953436912e-06, + "loss": 0.623, + "step": 57218 + }, + { + "epoch": 1.47, + "learning_rate": 1.0845980241162896e-06, + "loss": 0.665, + "step": 57219 + }, + { + "epoch": 1.47, + "learning_rate": 1.0845704528241151e-06, + "loss": 0.5986, + "step": 57220 + }, + { + "epoch": 1.47, + "learning_rate": 1.0845428814671888e-06, + "loss": 0.665, + "step": 57221 + }, + { + "epoch": 1.47, + "learning_rate": 1.0845153100455323e-06, + "loss": 0.5535, + "step": 57222 + }, + { + "epoch": 1.47, + "learning_rate": 1.0844877385591662e-06, + "loss": 0.6309, + "step": 57223 + }, + { + "epoch": 1.47, + "learning_rate": 1.0844601670081116e-06, + "loss": 0.6685, + "step": 57224 + }, + { + "epoch": 1.47, + "learning_rate": 1.0844325953923898e-06, + "loss": 0.6475, + "step": 57225 + }, + { + "epoch": 1.47, + "learning_rate": 1.0844050237120217e-06, + "loss": 0.48, + "step": 57226 + }, + { + "epoch": 1.47, + "learning_rate": 1.0843774519670287e-06, + "loss": 0.7256, + "step": 57227 + }, + { + "epoch": 1.47, + "learning_rate": 1.0843498801574317e-06, + "loss": 0.7402, + "step": 57228 + }, + { + "epoch": 1.47, + "learning_rate": 1.0843223082832522e-06, + "loss": 0.7061, + "step": 57229 + }, + { + "epoch": 1.47, + "learning_rate": 1.0842947363445104e-06, + "loss": 0.6812, + "step": 57230 + }, + { + "epoch": 1.47, + "learning_rate": 1.0842671643412285e-06, + "loss": 0.6157, + "step": 57231 + }, + { + "epoch": 1.47, + "learning_rate": 1.0842395922734269e-06, + "loss": 0.6113, + "step": 57232 + }, + { + "epoch": 1.47, + "learning_rate": 1.084212020141127e-06, + "loss": 0.5544, + "step": 57233 + }, + { + "epoch": 1.47, + "learning_rate": 1.0841844479443498e-06, + "loss": 0.688, + "step": 57234 + }, + { + "epoch": 1.47, + "learning_rate": 1.0841568756831163e-06, + "loss": 0.6035, + "step": 57235 + }, + { + "epoch": 1.47, + "learning_rate": 1.084129303357448e-06, + "loss": 0.6948, + "step": 57236 + }, + { + "epoch": 1.47, + "learning_rate": 1.0841017309673655e-06, + "loss": 0.7529, + "step": 57237 + }, + { + "epoch": 1.47, + "learning_rate": 1.0840741585128903e-06, + "loss": 0.4619, + "step": 57238 + }, + { + "epoch": 1.47, + "learning_rate": 1.0840465859940436e-06, + "loss": 0.6816, + "step": 57239 + }, + { + "epoch": 1.47, + "learning_rate": 1.0840190134108459e-06, + "loss": 0.5615, + "step": 57240 + }, + { + "epoch": 1.47, + "learning_rate": 1.0839914407633188e-06, + "loss": 0.6299, + "step": 57241 + }, + { + "epoch": 1.47, + "learning_rate": 1.0839638680514832e-06, + "loss": 0.6162, + "step": 57242 + }, + { + "epoch": 1.47, + "learning_rate": 1.0839362952753608e-06, + "loss": 0.6494, + "step": 57243 + }, + { + "epoch": 1.47, + "learning_rate": 1.083908722434972e-06, + "loss": 0.6982, + "step": 57244 + }, + { + "epoch": 1.47, + "learning_rate": 1.083881149530338e-06, + "loss": 0.8506, + "step": 57245 + }, + { + "epoch": 1.47, + "learning_rate": 1.08385357656148e-06, + "loss": 0.6787, + "step": 57246 + }, + { + "epoch": 1.47, + "learning_rate": 1.0838260035284195e-06, + "loss": 0.7222, + "step": 57247 + }, + { + "epoch": 1.47, + "learning_rate": 1.0837984304311772e-06, + "loss": 0.6567, + "step": 57248 + }, + { + "epoch": 1.47, + "learning_rate": 1.0837708572697742e-06, + "loss": 0.7427, + "step": 57249 + }, + { + "epoch": 1.47, + "learning_rate": 1.0837432840442316e-06, + "loss": 0.5601, + "step": 57250 + }, + { + "epoch": 1.47, + "learning_rate": 1.0837157107545707e-06, + "loss": 0.6924, + "step": 57251 + }, + { + "epoch": 1.47, + "learning_rate": 1.0836881374008128e-06, + "loss": 0.5874, + "step": 57252 + }, + { + "epoch": 1.47, + "learning_rate": 1.0836605639829784e-06, + "loss": 0.662, + "step": 57253 + }, + { + "epoch": 1.47, + "learning_rate": 1.083632990501089e-06, + "loss": 0.7637, + "step": 57254 + }, + { + "epoch": 1.47, + "learning_rate": 1.0836054169551656e-06, + "loss": 0.7285, + "step": 57255 + }, + { + "epoch": 1.47, + "learning_rate": 1.0835778433452295e-06, + "loss": 0.5786, + "step": 57256 + }, + { + "epoch": 1.47, + "learning_rate": 1.0835502696713018e-06, + "loss": 0.6631, + "step": 57257 + }, + { + "epoch": 1.47, + "learning_rate": 1.0835226959334036e-06, + "loss": 0.5586, + "step": 57258 + }, + { + "epoch": 1.47, + "learning_rate": 1.0834951221315556e-06, + "loss": 0.7148, + "step": 57259 + }, + { + "epoch": 1.47, + "learning_rate": 1.0834675482657794e-06, + "loss": 0.6885, + "step": 57260 + }, + { + "epoch": 1.47, + "learning_rate": 1.0834399743360955e-06, + "loss": 0.5076, + "step": 57261 + }, + { + "epoch": 1.47, + "learning_rate": 1.083412400342526e-06, + "loss": 0.6748, + "step": 57262 + }, + { + "epoch": 1.47, + "learning_rate": 1.0833848262850913e-06, + "loss": 0.7812, + "step": 57263 + }, + { + "epoch": 1.47, + "learning_rate": 1.0833572521638128e-06, + "loss": 0.7432, + "step": 57264 + }, + { + "epoch": 1.47, + "learning_rate": 1.083329677978711e-06, + "loss": 0.5398, + "step": 57265 + }, + { + "epoch": 1.47, + "learning_rate": 1.083302103729808e-06, + "loss": 0.5869, + "step": 57266 + }, + { + "epoch": 1.47, + "learning_rate": 1.0832745294171242e-06, + "loss": 0.6533, + "step": 57267 + }, + { + "epoch": 1.47, + "learning_rate": 1.083246955040681e-06, + "loss": 0.6416, + "step": 57268 + }, + { + "epoch": 1.47, + "learning_rate": 1.0832193806004994e-06, + "loss": 0.6289, + "step": 57269 + }, + { + "epoch": 1.47, + "learning_rate": 1.0831918060966003e-06, + "loss": 0.7002, + "step": 57270 + }, + { + "epoch": 1.47, + "learning_rate": 1.0831642315290055e-06, + "loss": 0.7881, + "step": 57271 + }, + { + "epoch": 1.47, + "learning_rate": 1.0831366568977353e-06, + "loss": 0.5811, + "step": 57272 + }, + { + "epoch": 1.47, + "learning_rate": 1.0831090822028116e-06, + "loss": 0.6821, + "step": 57273 + }, + { + "epoch": 1.47, + "learning_rate": 1.0830815074442548e-06, + "loss": 0.6846, + "step": 57274 + }, + { + "epoch": 1.47, + "learning_rate": 1.0830539326220864e-06, + "loss": 0.6733, + "step": 57275 + }, + { + "epoch": 1.47, + "learning_rate": 1.0830263577363273e-06, + "loss": 0.5613, + "step": 57276 + }, + { + "epoch": 1.47, + "learning_rate": 1.082998782786999e-06, + "loss": 0.5942, + "step": 57277 + }, + { + "epoch": 1.47, + "learning_rate": 1.082971207774122e-06, + "loss": 0.5935, + "step": 57278 + }, + { + "epoch": 1.47, + "learning_rate": 1.082943632697718e-06, + "loss": 0.6104, + "step": 57279 + }, + { + "epoch": 1.47, + "learning_rate": 1.0829160575578078e-06, + "loss": 0.6064, + "step": 57280 + }, + { + "epoch": 1.47, + "learning_rate": 1.0828884823544125e-06, + "loss": 0.6577, + "step": 57281 + }, + { + "epoch": 1.47, + "learning_rate": 1.0828609070875531e-06, + "loss": 0.7344, + "step": 57282 + }, + { + "epoch": 1.47, + "learning_rate": 1.0828333317572518e-06, + "loss": 0.6631, + "step": 57283 + }, + { + "epoch": 1.47, + "learning_rate": 1.082805756363528e-06, + "loss": 0.5762, + "step": 57284 + }, + { + "epoch": 1.47, + "learning_rate": 1.082778180906404e-06, + "loss": 0.7178, + "step": 57285 + }, + { + "epoch": 1.47, + "learning_rate": 1.0827506053859e-06, + "loss": 0.6904, + "step": 57286 + }, + { + "epoch": 1.47, + "learning_rate": 1.0827230298020384e-06, + "loss": 0.6338, + "step": 57287 + }, + { + "epoch": 1.47, + "learning_rate": 1.0826954541548392e-06, + "loss": 0.7202, + "step": 57288 + }, + { + "epoch": 1.47, + "learning_rate": 1.082667878444324e-06, + "loss": 0.4659, + "step": 57289 + }, + { + "epoch": 1.47, + "learning_rate": 1.0826403026705137e-06, + "loss": 0.6216, + "step": 57290 + }, + { + "epoch": 1.47, + "learning_rate": 1.0826127268334298e-06, + "loss": 0.7305, + "step": 57291 + }, + { + "epoch": 1.47, + "learning_rate": 1.0825851509330927e-06, + "loss": 0.7119, + "step": 57292 + }, + { + "epoch": 1.47, + "learning_rate": 1.0825575749695241e-06, + "loss": 0.4788, + "step": 57293 + }, + { + "epoch": 1.47, + "learning_rate": 1.0825299989427451e-06, + "loss": 0.5712, + "step": 57294 + }, + { + "epoch": 1.47, + "learning_rate": 1.0825024228527766e-06, + "loss": 0.709, + "step": 57295 + }, + { + "epoch": 1.47, + "learning_rate": 1.08247484669964e-06, + "loss": 0.6934, + "step": 57296 + }, + { + "epoch": 1.47, + "learning_rate": 1.082447270483356e-06, + "loss": 0.5928, + "step": 57297 + }, + { + "epoch": 1.47, + "learning_rate": 1.082419694203946e-06, + "loss": 0.7354, + "step": 57298 + }, + { + "epoch": 1.47, + "learning_rate": 1.0823921178614307e-06, + "loss": 0.5464, + "step": 57299 + }, + { + "epoch": 1.47, + "learning_rate": 1.0823645414558319e-06, + "loss": 0.5312, + "step": 57300 + }, + { + "epoch": 1.47, + "learning_rate": 1.0823369649871701e-06, + "loss": 0.6025, + "step": 57301 + }, + { + "epoch": 1.47, + "learning_rate": 1.0823093884554667e-06, + "loss": 0.7441, + "step": 57302 + }, + { + "epoch": 1.47, + "learning_rate": 1.082281811860743e-06, + "loss": 0.5332, + "step": 57303 + }, + { + "epoch": 1.47, + "learning_rate": 1.08225423520302e-06, + "loss": 0.457, + "step": 57304 + }, + { + "epoch": 1.47, + "learning_rate": 1.0822266584823183e-06, + "loss": 0.4556, + "step": 57305 + }, + { + "epoch": 1.47, + "learning_rate": 1.0821990816986596e-06, + "loss": 0.7041, + "step": 57306 + }, + { + "epoch": 1.47, + "learning_rate": 1.082171504852065e-06, + "loss": 0.7383, + "step": 57307 + }, + { + "epoch": 1.47, + "learning_rate": 1.0821439279425556e-06, + "loss": 0.5154, + "step": 57308 + }, + { + "epoch": 1.47, + "learning_rate": 1.082116350970152e-06, + "loss": 0.6221, + "step": 57309 + }, + { + "epoch": 1.47, + "learning_rate": 1.0820887739348758e-06, + "loss": 0.7158, + "step": 57310 + }, + { + "epoch": 1.47, + "learning_rate": 1.0820611968367479e-06, + "loss": 0.7129, + "step": 57311 + }, + { + "epoch": 1.47, + "learning_rate": 1.0820336196757898e-06, + "loss": 0.5879, + "step": 57312 + }, + { + "epoch": 1.47, + "learning_rate": 1.0820060424520222e-06, + "loss": 0.4717, + "step": 57313 + }, + { + "epoch": 1.47, + "learning_rate": 1.081978465165466e-06, + "loss": 0.7178, + "step": 57314 + }, + { + "epoch": 1.47, + "learning_rate": 1.081950887816143e-06, + "loss": 0.7861, + "step": 57315 + }, + { + "epoch": 1.47, + "learning_rate": 1.0819233104040737e-06, + "loss": 0.7422, + "step": 57316 + }, + { + "epoch": 1.47, + "learning_rate": 1.08189573292928e-06, + "loss": 0.5625, + "step": 57317 + }, + { + "epoch": 1.47, + "learning_rate": 1.0818681553917821e-06, + "loss": 0.7725, + "step": 57318 + }, + { + "epoch": 1.47, + "learning_rate": 1.0818405777916017e-06, + "loss": 0.7578, + "step": 57319 + }, + { + "epoch": 1.47, + "learning_rate": 1.0818130001287595e-06, + "loss": 0.5549, + "step": 57320 + }, + { + "epoch": 1.47, + "learning_rate": 1.0817854224032773e-06, + "loss": 0.6279, + "step": 57321 + }, + { + "epoch": 1.47, + "learning_rate": 1.0817578446151752e-06, + "loss": 0.6987, + "step": 57322 + }, + { + "epoch": 1.47, + "learning_rate": 1.0817302667644754e-06, + "loss": 0.7842, + "step": 57323 + }, + { + "epoch": 1.47, + "learning_rate": 1.0817026888511982e-06, + "loss": 0.7236, + "step": 57324 + }, + { + "epoch": 1.47, + "learning_rate": 1.081675110875365e-06, + "loss": 0.6602, + "step": 57325 + }, + { + "epoch": 1.47, + "learning_rate": 1.0816475328369969e-06, + "loss": 0.7061, + "step": 57326 + }, + { + "epoch": 1.47, + "learning_rate": 1.0816199547361152e-06, + "loss": 0.6406, + "step": 57327 + }, + { + "epoch": 1.47, + "learning_rate": 1.0815923765727408e-06, + "loss": 0.6064, + "step": 57328 + }, + { + "epoch": 1.47, + "learning_rate": 1.0815647983468949e-06, + "loss": 0.6125, + "step": 57329 + }, + { + "epoch": 1.47, + "learning_rate": 1.0815372200585984e-06, + "loss": 0.6816, + "step": 57330 + }, + { + "epoch": 1.47, + "learning_rate": 1.081509641707873e-06, + "loss": 0.7256, + "step": 57331 + }, + { + "epoch": 1.47, + "learning_rate": 1.0814820632947389e-06, + "loss": 0.4702, + "step": 57332 + }, + { + "epoch": 1.47, + "learning_rate": 1.0814544848192179e-06, + "loss": 0.5996, + "step": 57333 + }, + { + "epoch": 1.47, + "learning_rate": 1.081426906281331e-06, + "loss": 0.6211, + "step": 57334 + }, + { + "epoch": 1.47, + "learning_rate": 1.0813993276810993e-06, + "loss": 0.6924, + "step": 57335 + }, + { + "epoch": 1.47, + "learning_rate": 1.081371749018544e-06, + "loss": 0.7109, + "step": 57336 + }, + { + "epoch": 1.47, + "learning_rate": 1.0813441702936859e-06, + "loss": 0.7344, + "step": 57337 + }, + { + "epoch": 1.47, + "learning_rate": 1.0813165915065465e-06, + "loss": 0.7539, + "step": 57338 + }, + { + "epoch": 1.47, + "learning_rate": 1.0812890126571462e-06, + "loss": 0.3594, + "step": 57339 + }, + { + "epoch": 1.47, + "learning_rate": 1.0812614337455073e-06, + "loss": 0.4241, + "step": 57340 + }, + { + "epoch": 1.47, + "learning_rate": 1.0812338547716497e-06, + "loss": 0.5972, + "step": 57341 + }, + { + "epoch": 1.47, + "learning_rate": 1.0812062757355955e-06, + "loss": 0.4285, + "step": 57342 + }, + { + "epoch": 1.47, + "learning_rate": 1.0811786966373653e-06, + "loss": 0.5061, + "step": 57343 + }, + { + "epoch": 1.47, + "learning_rate": 1.0811511174769803e-06, + "loss": 0.5491, + "step": 57344 + }, + { + "epoch": 1.47, + "learning_rate": 1.0811235382544614e-06, + "loss": 0.6504, + "step": 57345 + }, + { + "epoch": 1.47, + "learning_rate": 1.0810959589698303e-06, + "loss": 0.6123, + "step": 57346 + }, + { + "epoch": 1.47, + "learning_rate": 1.0810683796231072e-06, + "loss": 0.624, + "step": 57347 + }, + { + "epoch": 1.47, + "learning_rate": 1.0810408002143145e-06, + "loss": 0.6973, + "step": 57348 + }, + { + "epoch": 1.47, + "learning_rate": 1.0810132207434722e-06, + "loss": 0.7344, + "step": 57349 + }, + { + "epoch": 1.47, + "learning_rate": 1.0809856412106018e-06, + "loss": 0.4521, + "step": 57350 + }, + { + "epoch": 1.47, + "learning_rate": 1.0809580616157243e-06, + "loss": 0.6748, + "step": 57351 + }, + { + "epoch": 1.47, + "learning_rate": 1.0809304819588612e-06, + "loss": 0.5186, + "step": 57352 + }, + { + "epoch": 1.47, + "learning_rate": 1.080902902240033e-06, + "loss": 0.6519, + "step": 57353 + }, + { + "epoch": 1.47, + "learning_rate": 1.0808753224592616e-06, + "loss": 0.8145, + "step": 57354 + }, + { + "epoch": 1.47, + "learning_rate": 1.0808477426165674e-06, + "loss": 0.6279, + "step": 57355 + }, + { + "epoch": 1.47, + "learning_rate": 1.080820162711972e-06, + "loss": 0.7354, + "step": 57356 + }, + { + "epoch": 1.47, + "learning_rate": 1.080792582745496e-06, + "loss": 0.3844, + "step": 57357 + }, + { + "epoch": 1.47, + "learning_rate": 1.0807650027171612e-06, + "loss": 0.7168, + "step": 57358 + }, + { + "epoch": 1.47, + "learning_rate": 1.080737422626988e-06, + "loss": 0.6943, + "step": 57359 + }, + { + "epoch": 1.47, + "learning_rate": 1.080709842474998e-06, + "loss": 0.5991, + "step": 57360 + }, + { + "epoch": 1.47, + "learning_rate": 1.0806822622612124e-06, + "loss": 0.5752, + "step": 57361 + }, + { + "epoch": 1.47, + "learning_rate": 1.0806546819856517e-06, + "loss": 0.6328, + "step": 57362 + }, + { + "epoch": 1.47, + "learning_rate": 1.0806271016483379e-06, + "loss": 0.6411, + "step": 57363 + }, + { + "epoch": 1.47, + "learning_rate": 1.0805995212492913e-06, + "loss": 0.7256, + "step": 57364 + }, + { + "epoch": 1.47, + "learning_rate": 1.0805719407885334e-06, + "loss": 0.5715, + "step": 57365 + }, + { + "epoch": 1.47, + "learning_rate": 1.080544360266085e-06, + "loss": 0.6152, + "step": 57366 + }, + { + "epoch": 1.47, + "learning_rate": 1.080516779681968e-06, + "loss": 0.7021, + "step": 57367 + }, + { + "epoch": 1.47, + "learning_rate": 1.0804891990362028e-06, + "loss": 0.4789, + "step": 57368 + }, + { + "epoch": 1.47, + "learning_rate": 1.080461618328811e-06, + "loss": 0.5278, + "step": 57369 + }, + { + "epoch": 1.47, + "learning_rate": 1.080434037559813e-06, + "loss": 0.5635, + "step": 57370 + }, + { + "epoch": 1.47, + "learning_rate": 1.0804064567292305e-06, + "loss": 0.4868, + "step": 57371 + }, + { + "epoch": 1.47, + "learning_rate": 1.0803788758370843e-06, + "loss": 0.666, + "step": 57372 + }, + { + "epoch": 1.47, + "learning_rate": 1.080351294883396e-06, + "loss": 0.6631, + "step": 57373 + }, + { + "epoch": 1.47, + "learning_rate": 1.0803237138681865e-06, + "loss": 0.7109, + "step": 57374 + }, + { + "epoch": 1.47, + "learning_rate": 1.0802961327914765e-06, + "loss": 0.625, + "step": 57375 + }, + { + "epoch": 1.47, + "learning_rate": 1.0802685516532875e-06, + "loss": 0.4843, + "step": 57376 + }, + { + "epoch": 1.47, + "learning_rate": 1.0802409704536406e-06, + "loss": 0.7275, + "step": 57377 + }, + { + "epoch": 1.47, + "learning_rate": 1.0802133891925569e-06, + "loss": 0.7656, + "step": 57378 + }, + { + "epoch": 1.47, + "learning_rate": 1.0801858078700573e-06, + "loss": 0.8008, + "step": 57379 + }, + { + "epoch": 1.47, + "learning_rate": 1.0801582264861636e-06, + "loss": 0.7812, + "step": 57380 + }, + { + "epoch": 1.47, + "learning_rate": 1.080130645040896e-06, + "loss": 0.5483, + "step": 57381 + }, + { + "epoch": 1.47, + "learning_rate": 1.080103063534276e-06, + "loss": 0.5073, + "step": 57382 + }, + { + "epoch": 1.47, + "learning_rate": 1.0800754819663252e-06, + "loss": 0.6646, + "step": 57383 + }, + { + "epoch": 1.47, + "learning_rate": 1.080047900337064e-06, + "loss": 0.6709, + "step": 57384 + }, + { + "epoch": 1.47, + "learning_rate": 1.0800203186465138e-06, + "loss": 0.605, + "step": 57385 + }, + { + "epoch": 1.47, + "learning_rate": 1.0799927368946956e-06, + "loss": 0.5767, + "step": 57386 + }, + { + "epoch": 1.47, + "learning_rate": 1.0799651550816308e-06, + "loss": 0.5322, + "step": 57387 + }, + { + "epoch": 1.47, + "learning_rate": 1.0799375732073406e-06, + "loss": 0.6577, + "step": 57388 + }, + { + "epoch": 1.47, + "learning_rate": 1.0799099912718456e-06, + "loss": 0.6807, + "step": 57389 + }, + { + "epoch": 1.47, + "learning_rate": 1.0798824092751672e-06, + "loss": 0.542, + "step": 57390 + }, + { + "epoch": 1.47, + "learning_rate": 1.0798548272173264e-06, + "loss": 0.7412, + "step": 57391 + }, + { + "epoch": 1.47, + "learning_rate": 1.0798272450983448e-06, + "loss": 0.748, + "step": 57392 + }, + { + "epoch": 1.47, + "learning_rate": 1.0797996629182429e-06, + "loss": 0.6289, + "step": 57393 + }, + { + "epoch": 1.47, + "learning_rate": 1.079772080677042e-06, + "loss": 0.6836, + "step": 57394 + }, + { + "epoch": 1.47, + "learning_rate": 1.0797444983747634e-06, + "loss": 0.5425, + "step": 57395 + }, + { + "epoch": 1.47, + "learning_rate": 1.0797169160114281e-06, + "loss": 0.6494, + "step": 57396 + }, + { + "epoch": 1.47, + "learning_rate": 1.0796893335870571e-06, + "loss": 0.7422, + "step": 57397 + }, + { + "epoch": 1.47, + "learning_rate": 1.079661751101672e-06, + "loss": 0.6846, + "step": 57398 + }, + { + "epoch": 1.47, + "learning_rate": 1.0796341685552933e-06, + "loss": 0.6057, + "step": 57399 + }, + { + "epoch": 1.47, + "learning_rate": 1.0796065859479424e-06, + "loss": 0.5972, + "step": 57400 + }, + { + "epoch": 1.47, + "learning_rate": 1.07957900327964e-06, + "loss": 0.665, + "step": 57401 + }, + { + "epoch": 1.47, + "learning_rate": 1.0795514205504081e-06, + "loss": 0.8848, + "step": 57402 + }, + { + "epoch": 1.47, + "learning_rate": 1.0795238377602673e-06, + "loss": 0.748, + "step": 57403 + }, + { + "epoch": 1.47, + "learning_rate": 1.0794962549092386e-06, + "loss": 0.6743, + "step": 57404 + }, + { + "epoch": 1.47, + "learning_rate": 1.0794686719973434e-06, + "loss": 0.687, + "step": 57405 + }, + { + "epoch": 1.47, + "learning_rate": 1.0794410890246026e-06, + "loss": 0.6611, + "step": 57406 + }, + { + "epoch": 1.47, + "learning_rate": 1.0794135059910374e-06, + "loss": 0.4016, + "step": 57407 + }, + { + "epoch": 1.47, + "learning_rate": 1.079385922896669e-06, + "loss": 0.707, + "step": 57408 + }, + { + "epoch": 1.47, + "learning_rate": 1.0793583397415186e-06, + "loss": 0.7705, + "step": 57409 + }, + { + "epoch": 1.47, + "learning_rate": 1.079330756525607e-06, + "loss": 0.5522, + "step": 57410 + }, + { + "epoch": 1.47, + "learning_rate": 1.0793031732489554e-06, + "loss": 0.6904, + "step": 57411 + }, + { + "epoch": 1.47, + "learning_rate": 1.0792755899115852e-06, + "loss": 0.6836, + "step": 57412 + }, + { + "epoch": 1.47, + "learning_rate": 1.0792480065135174e-06, + "loss": 0.6191, + "step": 57413 + }, + { + "epoch": 1.47, + "learning_rate": 1.0792204230547728e-06, + "loss": 0.6411, + "step": 57414 + }, + { + "epoch": 1.47, + "learning_rate": 1.0791928395353728e-06, + "loss": 0.5955, + "step": 57415 + }, + { + "epoch": 1.47, + "learning_rate": 1.0791652559553384e-06, + "loss": 0.5413, + "step": 57416 + }, + { + "epoch": 1.47, + "learning_rate": 1.079137672314691e-06, + "loss": 0.6958, + "step": 57417 + }, + { + "epoch": 1.47, + "learning_rate": 1.0791100886134515e-06, + "loss": 0.7109, + "step": 57418 + }, + { + "epoch": 1.47, + "learning_rate": 1.079082504851641e-06, + "loss": 0.5621, + "step": 57419 + }, + { + "epoch": 1.47, + "learning_rate": 1.0790549210292805e-06, + "loss": 0.6274, + "step": 57420 + }, + { + "epoch": 1.47, + "learning_rate": 1.0790273371463916e-06, + "loss": 0.6147, + "step": 57421 + }, + { + "epoch": 1.47, + "learning_rate": 1.0789997532029946e-06, + "loss": 0.7441, + "step": 57422 + }, + { + "epoch": 1.47, + "learning_rate": 1.0789721691991115e-06, + "loss": 0.6089, + "step": 57423 + }, + { + "epoch": 1.47, + "learning_rate": 1.0789445851347632e-06, + "loss": 0.7715, + "step": 57424 + }, + { + "epoch": 1.47, + "learning_rate": 1.0789170010099703e-06, + "loss": 0.6357, + "step": 57425 + }, + { + "epoch": 1.47, + "learning_rate": 1.0788894168247546e-06, + "loss": 0.5488, + "step": 57426 + }, + { + "epoch": 1.47, + "learning_rate": 1.0788618325791367e-06, + "loss": 0.7612, + "step": 57427 + }, + { + "epoch": 1.47, + "learning_rate": 1.0788342482731381e-06, + "loss": 0.5828, + "step": 57428 + }, + { + "epoch": 1.47, + "learning_rate": 1.0788066639067793e-06, + "loss": 0.6021, + "step": 57429 + }, + { + "epoch": 1.47, + "learning_rate": 1.0787790794800824e-06, + "loss": 0.6221, + "step": 57430 + }, + { + "epoch": 1.47, + "learning_rate": 1.0787514949930675e-06, + "loss": 0.7549, + "step": 57431 + }, + { + "epoch": 1.47, + "learning_rate": 1.0787239104457567e-06, + "loss": 0.5454, + "step": 57432 + }, + { + "epoch": 1.47, + "learning_rate": 1.0786963258381703e-06, + "loss": 0.637, + "step": 57433 + }, + { + "epoch": 1.47, + "learning_rate": 1.07866874117033e-06, + "loss": 0.4211, + "step": 57434 + }, + { + "epoch": 1.47, + "learning_rate": 1.0786411564422562e-06, + "loss": 0.6138, + "step": 57435 + }, + { + "epoch": 1.47, + "learning_rate": 1.0786135716539708e-06, + "loss": 0.7485, + "step": 57436 + }, + { + "epoch": 1.47, + "learning_rate": 1.0785859868054946e-06, + "loss": 0.7305, + "step": 57437 + }, + { + "epoch": 1.47, + "learning_rate": 1.0785584018968488e-06, + "loss": 0.623, + "step": 57438 + }, + { + "epoch": 1.47, + "learning_rate": 1.0785308169280543e-06, + "loss": 0.752, + "step": 57439 + }, + { + "epoch": 1.47, + "learning_rate": 1.0785032318991326e-06, + "loss": 0.6616, + "step": 57440 + }, + { + "epoch": 1.47, + "learning_rate": 1.0784756468101039e-06, + "loss": 0.3821, + "step": 57441 + }, + { + "epoch": 1.47, + "learning_rate": 1.0784480616609907e-06, + "loss": 0.7549, + "step": 57442 + }, + { + "epoch": 1.47, + "learning_rate": 1.0784204764518132e-06, + "loss": 0.6309, + "step": 57443 + }, + { + "epoch": 1.47, + "learning_rate": 1.078392891182593e-06, + "loss": 0.4417, + "step": 57444 + }, + { + "epoch": 1.47, + "learning_rate": 1.0783653058533505e-06, + "loss": 0.668, + "step": 57445 + }, + { + "epoch": 1.47, + "learning_rate": 1.0783377204641075e-06, + "loss": 0.5693, + "step": 57446 + }, + { + "epoch": 1.47, + "learning_rate": 1.0783101350148848e-06, + "loss": 0.7427, + "step": 57447 + }, + { + "epoch": 1.47, + "learning_rate": 1.0782825495057037e-06, + "loss": 0.4513, + "step": 57448 + }, + { + "epoch": 1.47, + "learning_rate": 1.0782549639365854e-06, + "loss": 0.7236, + "step": 57449 + }, + { + "epoch": 1.47, + "learning_rate": 1.0782273783075508e-06, + "loss": 0.6045, + "step": 57450 + }, + { + "epoch": 1.47, + "learning_rate": 1.078199792618621e-06, + "loss": 0.708, + "step": 57451 + }, + { + "epoch": 1.47, + "learning_rate": 1.0781722068698172e-06, + "loss": 0.4653, + "step": 57452 + }, + { + "epoch": 1.47, + "learning_rate": 1.078144621061161e-06, + "loss": 0.5991, + "step": 57453 + }, + { + "epoch": 1.47, + "learning_rate": 1.0781170351926724e-06, + "loss": 0.7666, + "step": 57454 + }, + { + "epoch": 1.47, + "learning_rate": 1.0780894492643734e-06, + "loss": 0.6621, + "step": 57455 + }, + { + "epoch": 1.47, + "learning_rate": 1.078061863276285e-06, + "loss": 0.8193, + "step": 57456 + }, + { + "epoch": 1.47, + "learning_rate": 1.0780342772284283e-06, + "loss": 0.6113, + "step": 57457 + }, + { + "epoch": 1.47, + "learning_rate": 1.0780066911208243e-06, + "loss": 0.7432, + "step": 57458 + }, + { + "epoch": 1.47, + "learning_rate": 1.077979104953494e-06, + "loss": 0.7002, + "step": 57459 + }, + { + "epoch": 1.47, + "learning_rate": 1.0779515187264586e-06, + "loss": 0.7881, + "step": 57460 + }, + { + "epoch": 1.47, + "learning_rate": 1.0779239324397396e-06, + "loss": 0.5537, + "step": 57461 + }, + { + "epoch": 1.47, + "learning_rate": 1.0778963460933576e-06, + "loss": 0.6348, + "step": 57462 + }, + { + "epoch": 1.47, + "learning_rate": 1.0778687596873344e-06, + "loss": 0.5161, + "step": 57463 + }, + { + "epoch": 1.47, + "learning_rate": 1.0778411732216902e-06, + "loss": 0.5378, + "step": 57464 + }, + { + "epoch": 1.47, + "learning_rate": 1.0778135866964466e-06, + "loss": 0.4395, + "step": 57465 + }, + { + "epoch": 1.47, + "learning_rate": 1.0777860001116249e-06, + "loss": 0.7495, + "step": 57466 + }, + { + "epoch": 1.47, + "learning_rate": 1.077758413467246e-06, + "loss": 0.439, + "step": 57467 + }, + { + "epoch": 1.47, + "learning_rate": 1.077730826763331e-06, + "loss": 0.6045, + "step": 57468 + }, + { + "epoch": 1.47, + "learning_rate": 1.0777032399999009e-06, + "loss": 0.5093, + "step": 57469 + }, + { + "epoch": 1.47, + "learning_rate": 1.0776756531769773e-06, + "loss": 0.5771, + "step": 57470 + }, + { + "epoch": 1.47, + "learning_rate": 1.077648066294581e-06, + "loss": 0.5264, + "step": 57471 + }, + { + "epoch": 1.47, + "learning_rate": 1.077620479352733e-06, + "loss": 0.7148, + "step": 57472 + }, + { + "epoch": 1.47, + "learning_rate": 1.0775928923514546e-06, + "loss": 0.5596, + "step": 57473 + }, + { + "epoch": 1.47, + "learning_rate": 1.077565305290767e-06, + "loss": 0.5957, + "step": 57474 + }, + { + "epoch": 1.47, + "learning_rate": 1.077537718170691e-06, + "loss": 0.7949, + "step": 57475 + }, + { + "epoch": 1.47, + "learning_rate": 1.0775101309912483e-06, + "loss": 0.5317, + "step": 57476 + }, + { + "epoch": 1.47, + "learning_rate": 1.0774825437524593e-06, + "loss": 0.6562, + "step": 57477 + }, + { + "epoch": 1.47, + "learning_rate": 1.0774549564543459e-06, + "loss": 0.5879, + "step": 57478 + }, + { + "epoch": 1.47, + "learning_rate": 1.0774273690969282e-06, + "loss": 0.6091, + "step": 57479 + }, + { + "epoch": 1.47, + "learning_rate": 1.0773997816802282e-06, + "loss": 0.5933, + "step": 57480 + }, + { + "epoch": 1.47, + "learning_rate": 1.0773721942042668e-06, + "loss": 0.7383, + "step": 57481 + }, + { + "epoch": 1.47, + "learning_rate": 1.0773446066690653e-06, + "loss": 0.7285, + "step": 57482 + }, + { + "epoch": 1.47, + "learning_rate": 1.0773170190746444e-06, + "loss": 0.6265, + "step": 57483 + }, + { + "epoch": 1.47, + "learning_rate": 1.0772894314210253e-06, + "loss": 0.4624, + "step": 57484 + }, + { + "epoch": 1.47, + "learning_rate": 1.077261843708229e-06, + "loss": 0.6392, + "step": 57485 + }, + { + "epoch": 1.47, + "learning_rate": 1.0772342559362773e-06, + "loss": 0.5742, + "step": 57486 + }, + { + "epoch": 1.47, + "learning_rate": 1.0772066681051908e-06, + "loss": 0.667, + "step": 57487 + }, + { + "epoch": 1.47, + "learning_rate": 1.0771790802149905e-06, + "loss": 0.5693, + "step": 57488 + }, + { + "epoch": 1.47, + "learning_rate": 1.077151492265698e-06, + "loss": 0.5913, + "step": 57489 + }, + { + "epoch": 1.47, + "learning_rate": 1.077123904257334e-06, + "loss": 0.7227, + "step": 57490 + }, + { + "epoch": 1.47, + "learning_rate": 1.0770963161899196e-06, + "loss": 0.7969, + "step": 57491 + }, + { + "epoch": 1.47, + "learning_rate": 1.0770687280634765e-06, + "loss": 0.5381, + "step": 57492 + }, + { + "epoch": 1.47, + "learning_rate": 1.0770411398780253e-06, + "loss": 0.52, + "step": 57493 + }, + { + "epoch": 1.47, + "learning_rate": 1.077013551633587e-06, + "loss": 0.708, + "step": 57494 + }, + { + "epoch": 1.47, + "learning_rate": 1.0769859633301832e-06, + "loss": 0.6514, + "step": 57495 + }, + { + "epoch": 1.47, + "learning_rate": 1.0769583749678345e-06, + "loss": 0.7148, + "step": 57496 + }, + { + "epoch": 1.47, + "learning_rate": 1.0769307865465627e-06, + "loss": 0.6514, + "step": 57497 + }, + { + "epoch": 1.47, + "learning_rate": 1.0769031980663883e-06, + "loss": 0.7666, + "step": 57498 + }, + { + "epoch": 1.47, + "learning_rate": 1.0768756095273328e-06, + "loss": 0.7578, + "step": 57499 + }, + { + "epoch": 1.47, + "learning_rate": 1.0768480209294168e-06, + "loss": 0.7236, + "step": 57500 + }, + { + "epoch": 1.47, + "learning_rate": 1.0768204322726622e-06, + "loss": 0.6729, + "step": 57501 + }, + { + "epoch": 1.47, + "learning_rate": 1.0767928435570897e-06, + "loss": 0.645, + "step": 57502 + }, + { + "epoch": 1.47, + "learning_rate": 1.0767652547827205e-06, + "loss": 0.6494, + "step": 57503 + }, + { + "epoch": 1.47, + "learning_rate": 1.0767376659495753e-06, + "loss": 0.541, + "step": 57504 + }, + { + "epoch": 1.47, + "learning_rate": 1.076710077057676e-06, + "loss": 0.5427, + "step": 57505 + }, + { + "epoch": 1.47, + "learning_rate": 1.076682488107043e-06, + "loss": 0.5806, + "step": 57506 + }, + { + "epoch": 1.47, + "learning_rate": 1.076654899097698e-06, + "loss": 0.666, + "step": 57507 + }, + { + "epoch": 1.47, + "learning_rate": 1.0766273100296616e-06, + "loss": 0.6001, + "step": 57508 + }, + { + "epoch": 1.47, + "learning_rate": 1.0765997209029556e-06, + "loss": 0.8369, + "step": 57509 + }, + { + "epoch": 1.47, + "learning_rate": 1.0765721317176002e-06, + "loss": 0.7246, + "step": 57510 + }, + { + "epoch": 1.47, + "learning_rate": 1.0765445424736174e-06, + "loss": 0.4216, + "step": 57511 + }, + { + "epoch": 1.47, + "learning_rate": 1.076516953171028e-06, + "loss": 0.4208, + "step": 57512 + }, + { + "epoch": 1.47, + "learning_rate": 1.076489363809853e-06, + "loss": 0.8428, + "step": 57513 + }, + { + "epoch": 1.47, + "learning_rate": 1.0764617743901133e-06, + "loss": 0.5283, + "step": 57514 + }, + { + "epoch": 1.47, + "learning_rate": 1.0764341849118306e-06, + "loss": 0.5918, + "step": 57515 + }, + { + "epoch": 1.47, + "learning_rate": 1.0764065953750258e-06, + "loss": 0.7471, + "step": 57516 + }, + { + "epoch": 1.47, + "learning_rate": 1.0763790057797202e-06, + "loss": 0.5713, + "step": 57517 + }, + { + "epoch": 1.47, + "learning_rate": 1.0763514161259345e-06, + "loss": 0.6689, + "step": 57518 + }, + { + "epoch": 1.47, + "learning_rate": 1.0763238264136898e-06, + "loss": 0.7061, + "step": 57519 + }, + { + "epoch": 1.47, + "learning_rate": 1.0762962366430078e-06, + "loss": 0.7178, + "step": 57520 + }, + { + "epoch": 1.47, + "learning_rate": 1.0762686468139088e-06, + "loss": 0.6318, + "step": 57521 + }, + { + "epoch": 1.47, + "learning_rate": 1.076241056926415e-06, + "loss": 0.7773, + "step": 57522 + }, + { + "epoch": 1.47, + "learning_rate": 1.0762134669805466e-06, + "loss": 0.6641, + "step": 57523 + }, + { + "epoch": 1.47, + "learning_rate": 1.0761858769763253e-06, + "loss": 0.7148, + "step": 57524 + }, + { + "epoch": 1.47, + "learning_rate": 1.0761582869137716e-06, + "loss": 0.5684, + "step": 57525 + }, + { + "epoch": 1.47, + "learning_rate": 1.0761306967929075e-06, + "loss": 0.7363, + "step": 57526 + }, + { + "epoch": 1.47, + "learning_rate": 1.076103106613753e-06, + "loss": 0.6421, + "step": 57527 + }, + { + "epoch": 1.47, + "learning_rate": 1.0760755163763305e-06, + "loss": 0.6914, + "step": 57528 + }, + { + "epoch": 1.47, + "learning_rate": 1.07604792608066e-06, + "loss": 0.6575, + "step": 57529 + }, + { + "epoch": 1.47, + "learning_rate": 1.0760203357267633e-06, + "loss": 0.5669, + "step": 57530 + }, + { + "epoch": 1.47, + "learning_rate": 1.075992745314661e-06, + "loss": 0.6152, + "step": 57531 + }, + { + "epoch": 1.47, + "learning_rate": 1.075965154844375e-06, + "loss": 0.6328, + "step": 57532 + }, + { + "epoch": 1.47, + "learning_rate": 1.0759375643159258e-06, + "loss": 0.7412, + "step": 57533 + }, + { + "epoch": 1.47, + "learning_rate": 1.0759099737293348e-06, + "loss": 0.748, + "step": 57534 + }, + { + "epoch": 1.47, + "learning_rate": 1.0758823830846227e-06, + "loss": 0.7019, + "step": 57535 + }, + { + "epoch": 1.47, + "learning_rate": 1.0758547923818114e-06, + "loss": 0.6172, + "step": 57536 + }, + { + "epoch": 1.47, + "learning_rate": 1.0758272016209213e-06, + "loss": 0.71, + "step": 57537 + }, + { + "epoch": 1.47, + "learning_rate": 1.0757996108019735e-06, + "loss": 0.5566, + "step": 57538 + }, + { + "epoch": 1.47, + "learning_rate": 1.07577201992499e-06, + "loss": 0.6934, + "step": 57539 + }, + { + "epoch": 1.47, + "learning_rate": 1.0757444289899909e-06, + "loss": 0.6396, + "step": 57540 + }, + { + "epoch": 1.47, + "learning_rate": 1.0757168379969981e-06, + "loss": 0.7061, + "step": 57541 + }, + { + "epoch": 1.47, + "learning_rate": 1.0756892469460323e-06, + "loss": 0.7041, + "step": 57542 + }, + { + "epoch": 1.47, + "learning_rate": 1.0756616558371147e-06, + "loss": 0.6714, + "step": 57543 + }, + { + "epoch": 1.47, + "learning_rate": 1.0756340646702663e-06, + "loss": 0.6001, + "step": 57544 + }, + { + "epoch": 1.47, + "learning_rate": 1.0756064734455086e-06, + "loss": 0.5388, + "step": 57545 + }, + { + "epoch": 1.47, + "learning_rate": 1.0755788821628624e-06, + "loss": 0.4956, + "step": 57546 + }, + { + "epoch": 1.47, + "learning_rate": 1.0755512908223492e-06, + "loss": 0.6069, + "step": 57547 + }, + { + "epoch": 1.47, + "learning_rate": 1.0755236994239896e-06, + "loss": 0.6123, + "step": 57548 + }, + { + "epoch": 1.48, + "learning_rate": 1.0754961079678049e-06, + "loss": 0.709, + "step": 57549 + }, + { + "epoch": 1.48, + "learning_rate": 1.0754685164538162e-06, + "loss": 0.4456, + "step": 57550 + }, + { + "epoch": 1.48, + "learning_rate": 1.0754409248820452e-06, + "loss": 0.6987, + "step": 57551 + }, + { + "epoch": 1.48, + "learning_rate": 1.0754133332525123e-06, + "loss": 0.6934, + "step": 57552 + }, + { + "epoch": 1.48, + "learning_rate": 1.0753857415652388e-06, + "loss": 0.624, + "step": 57553 + }, + { + "epoch": 1.48, + "learning_rate": 1.0753581498202458e-06, + "loss": 0.8232, + "step": 57554 + }, + { + "epoch": 1.48, + "learning_rate": 1.0753305580175548e-06, + "loss": 0.6289, + "step": 57555 + }, + { + "epoch": 1.48, + "learning_rate": 1.075302966157186e-06, + "loss": 0.6152, + "step": 57556 + }, + { + "epoch": 1.48, + "learning_rate": 1.075275374239162e-06, + "loss": 0.7627, + "step": 57557 + }, + { + "epoch": 1.48, + "learning_rate": 1.0752477822635028e-06, + "loss": 0.7017, + "step": 57558 + }, + { + "epoch": 1.48, + "learning_rate": 1.0752201902302298e-06, + "loss": 0.7354, + "step": 57559 + }, + { + "epoch": 1.48, + "learning_rate": 1.0751925981393644e-06, + "loss": 0.542, + "step": 57560 + }, + { + "epoch": 1.48, + "learning_rate": 1.0751650059909272e-06, + "loss": 0.6641, + "step": 57561 + }, + { + "epoch": 1.48, + "learning_rate": 1.0751374137849399e-06, + "loss": 0.6875, + "step": 57562 + }, + { + "epoch": 1.48, + "learning_rate": 1.075109821521423e-06, + "loss": 0.5796, + "step": 57563 + }, + { + "epoch": 1.48, + "learning_rate": 1.075082229200398e-06, + "loss": 0.5439, + "step": 57564 + }, + { + "epoch": 1.48, + "learning_rate": 1.075054636821886e-06, + "loss": 0.6113, + "step": 57565 + }, + { + "epoch": 1.48, + "learning_rate": 1.0750270443859084e-06, + "loss": 0.8682, + "step": 57566 + }, + { + "epoch": 1.48, + "learning_rate": 1.074999451892486e-06, + "loss": 0.6855, + "step": 57567 + }, + { + "epoch": 1.48, + "learning_rate": 1.0749718593416397e-06, + "loss": 0.6592, + "step": 57568 + }, + { + "epoch": 1.48, + "learning_rate": 1.074944266733391e-06, + "loss": 0.6172, + "step": 57569 + }, + { + "epoch": 1.48, + "learning_rate": 1.074916674067761e-06, + "loss": 0.5035, + "step": 57570 + }, + { + "epoch": 1.48, + "learning_rate": 1.0748890813447703e-06, + "loss": 0.6865, + "step": 57571 + }, + { + "epoch": 1.48, + "learning_rate": 1.0748614885644413e-06, + "loss": 0.4342, + "step": 57572 + }, + { + "epoch": 1.48, + "learning_rate": 1.0748338957267938e-06, + "loss": 0.6548, + "step": 57573 + }, + { + "epoch": 1.48, + "learning_rate": 1.0748063028318495e-06, + "loss": 0.7354, + "step": 57574 + }, + { + "epoch": 1.48, + "learning_rate": 1.0747787098796293e-06, + "loss": 0.7109, + "step": 57575 + }, + { + "epoch": 1.48, + "learning_rate": 1.0747511168701546e-06, + "loss": 0.5962, + "step": 57576 + }, + { + "epoch": 1.48, + "learning_rate": 1.0747235238034467e-06, + "loss": 0.6016, + "step": 57577 + }, + { + "epoch": 1.48, + "learning_rate": 1.0746959306795257e-06, + "loss": 0.6245, + "step": 57578 + }, + { + "epoch": 1.48, + "learning_rate": 1.0746683374984142e-06, + "loss": 0.6147, + "step": 57579 + }, + { + "epoch": 1.48, + "learning_rate": 1.0746407442601323e-06, + "loss": 0.5513, + "step": 57580 + }, + { + "epoch": 1.48, + "learning_rate": 1.0746131509647014e-06, + "loss": 0.6548, + "step": 57581 + }, + { + "epoch": 1.48, + "learning_rate": 1.0745855576121425e-06, + "loss": 0.4275, + "step": 57582 + }, + { + "epoch": 1.48, + "learning_rate": 1.0745579642024773e-06, + "loss": 0.749, + "step": 57583 + }, + { + "epoch": 1.48, + "learning_rate": 1.0745303707357261e-06, + "loss": 0.6416, + "step": 57584 + }, + { + "epoch": 1.48, + "learning_rate": 1.0745027772119106e-06, + "loss": 0.7217, + "step": 57585 + }, + { + "epoch": 1.48, + "learning_rate": 1.0744751836310515e-06, + "loss": 0.7188, + "step": 57586 + }, + { + "epoch": 1.48, + "learning_rate": 1.0744475899931707e-06, + "loss": 0.6372, + "step": 57587 + }, + { + "epoch": 1.48, + "learning_rate": 1.0744199962982883e-06, + "loss": 0.7158, + "step": 57588 + }, + { + "epoch": 1.48, + "learning_rate": 1.0743924025464263e-06, + "loss": 0.6455, + "step": 57589 + }, + { + "epoch": 1.48, + "learning_rate": 1.0743648087376048e-06, + "loss": 0.7139, + "step": 57590 + }, + { + "epoch": 1.48, + "learning_rate": 1.0743372148718463e-06, + "loss": 0.4658, + "step": 57591 + }, + { + "epoch": 1.48, + "learning_rate": 1.0743096209491711e-06, + "loss": 0.5859, + "step": 57592 + }, + { + "epoch": 1.48, + "learning_rate": 1.0742820269696001e-06, + "loss": 0.6797, + "step": 57593 + }, + { + "epoch": 1.48, + "learning_rate": 1.0742544329331551e-06, + "loss": 0.5222, + "step": 57594 + }, + { + "epoch": 1.48, + "learning_rate": 1.0742268388398569e-06, + "loss": 0.7041, + "step": 57595 + }, + { + "epoch": 1.48, + "learning_rate": 1.074199244689726e-06, + "loss": 0.7373, + "step": 57596 + }, + { + "epoch": 1.48, + "learning_rate": 1.0741716504827852e-06, + "loss": 0.5562, + "step": 57597 + }, + { + "epoch": 1.48, + "learning_rate": 1.074144056219054e-06, + "loss": 0.6265, + "step": 57598 + }, + { + "epoch": 1.48, + "learning_rate": 1.074116461898554e-06, + "loss": 0.7217, + "step": 57599 + }, + { + "epoch": 1.48, + "learning_rate": 1.0740888675213064e-06, + "loss": 0.6709, + "step": 57600 + }, + { + "epoch": 1.48, + "learning_rate": 1.0740612730873327e-06, + "loss": 0.7412, + "step": 57601 + }, + { + "epoch": 1.48, + "learning_rate": 1.0740336785966536e-06, + "loss": 0.5303, + "step": 57602 + }, + { + "epoch": 1.48, + "learning_rate": 1.07400608404929e-06, + "loss": 0.709, + "step": 57603 + }, + { + "epoch": 1.48, + "learning_rate": 1.0739784894452634e-06, + "loss": 0.7842, + "step": 57604 + }, + { + "epoch": 1.48, + "learning_rate": 1.073950894784595e-06, + "loss": 0.5151, + "step": 57605 + }, + { + "epoch": 1.48, + "learning_rate": 1.0739233000673061e-06, + "loss": 0.5928, + "step": 57606 + }, + { + "epoch": 1.48, + "learning_rate": 1.0738957052934173e-06, + "loss": 0.4004, + "step": 57607 + }, + { + "epoch": 1.48, + "learning_rate": 1.0738681104629498e-06, + "loss": 0.4071, + "step": 57608 + }, + { + "epoch": 1.48, + "learning_rate": 1.073840515575925e-06, + "loss": 0.4524, + "step": 57609 + }, + { + "epoch": 1.48, + "learning_rate": 1.073812920632364e-06, + "loss": 0.6362, + "step": 57610 + }, + { + "epoch": 1.48, + "learning_rate": 1.0737853256322875e-06, + "loss": 0.6162, + "step": 57611 + }, + { + "epoch": 1.48, + "learning_rate": 1.0737577305757175e-06, + "loss": 0.6875, + "step": 57612 + }, + { + "epoch": 1.48, + "learning_rate": 1.0737301354626743e-06, + "loss": 0.6274, + "step": 57613 + }, + { + "epoch": 1.48, + "learning_rate": 1.0737025402931794e-06, + "loss": 0.6426, + "step": 57614 + }, + { + "epoch": 1.48, + "learning_rate": 1.0736749450672536e-06, + "loss": 0.6304, + "step": 57615 + }, + { + "epoch": 1.48, + "learning_rate": 1.0736473497849186e-06, + "loss": 0.7607, + "step": 57616 + }, + { + "epoch": 1.48, + "learning_rate": 1.0736197544461952e-06, + "loss": 0.6172, + "step": 57617 + }, + { + "epoch": 1.48, + "learning_rate": 1.0735921590511043e-06, + "loss": 0.5383, + "step": 57618 + }, + { + "epoch": 1.48, + "learning_rate": 1.0735645635996674e-06, + "loss": 0.7939, + "step": 57619 + }, + { + "epoch": 1.48, + "learning_rate": 1.0735369680919054e-06, + "loss": 0.7393, + "step": 57620 + }, + { + "epoch": 1.48, + "learning_rate": 1.0735093725278397e-06, + "loss": 0.6338, + "step": 57621 + }, + { + "epoch": 1.48, + "learning_rate": 1.0734817769074913e-06, + "loss": 0.5708, + "step": 57622 + }, + { + "epoch": 1.48, + "learning_rate": 1.073454181230881e-06, + "loss": 0.4712, + "step": 57623 + }, + { + "epoch": 1.48, + "learning_rate": 1.0734265854980308e-06, + "loss": 0.7744, + "step": 57624 + }, + { + "epoch": 1.48, + "learning_rate": 1.0733989897089604e-06, + "loss": 0.8018, + "step": 57625 + }, + { + "epoch": 1.48, + "learning_rate": 1.0733713938636925e-06, + "loss": 0.6006, + "step": 57626 + }, + { + "epoch": 1.48, + "learning_rate": 1.0733437979622471e-06, + "loss": 0.7012, + "step": 57627 + }, + { + "epoch": 1.48, + "learning_rate": 1.0733162020046456e-06, + "loss": 0.6592, + "step": 57628 + }, + { + "epoch": 1.48, + "learning_rate": 1.0732886059909093e-06, + "loss": 0.6543, + "step": 57629 + }, + { + "epoch": 1.48, + "learning_rate": 1.0732610099210595e-06, + "loss": 0.6328, + "step": 57630 + }, + { + "epoch": 1.48, + "learning_rate": 1.0732334137951172e-06, + "loss": 0.5303, + "step": 57631 + }, + { + "epoch": 1.48, + "learning_rate": 1.0732058176131034e-06, + "loss": 0.6514, + "step": 57632 + }, + { + "epoch": 1.48, + "learning_rate": 1.0731782213750391e-06, + "loss": 0.6875, + "step": 57633 + }, + { + "epoch": 1.48, + "learning_rate": 1.0731506250809457e-06, + "loss": 0.7031, + "step": 57634 + }, + { + "epoch": 1.48, + "learning_rate": 1.0731230287308442e-06, + "loss": 0.6592, + "step": 57635 + }, + { + "epoch": 1.48, + "learning_rate": 1.0730954323247557e-06, + "loss": 0.7031, + "step": 57636 + }, + { + "epoch": 1.48, + "learning_rate": 1.0730678358627016e-06, + "loss": 0.9004, + "step": 57637 + }, + { + "epoch": 1.48, + "learning_rate": 1.0730402393447025e-06, + "loss": 0.6836, + "step": 57638 + }, + { + "epoch": 1.48, + "learning_rate": 1.0730126427707801e-06, + "loss": 0.6948, + "step": 57639 + }, + { + "epoch": 1.48, + "learning_rate": 1.072985046140955e-06, + "loss": 0.7383, + "step": 57640 + }, + { + "epoch": 1.48, + "learning_rate": 1.072957449455249e-06, + "loss": 0.6719, + "step": 57641 + }, + { + "epoch": 1.48, + "learning_rate": 1.0729298527136824e-06, + "loss": 0.6211, + "step": 57642 + }, + { + "epoch": 1.48, + "learning_rate": 1.0729022559162772e-06, + "loss": 0.5249, + "step": 57643 + }, + { + "epoch": 1.48, + "learning_rate": 1.0728746590630538e-06, + "loss": 0.6162, + "step": 57644 + }, + { + "epoch": 1.48, + "learning_rate": 1.0728470621540337e-06, + "loss": 0.7588, + "step": 57645 + }, + { + "epoch": 1.48, + "learning_rate": 1.0728194651892379e-06, + "loss": 0.5952, + "step": 57646 + }, + { + "epoch": 1.48, + "learning_rate": 1.0727918681686877e-06, + "loss": 0.574, + "step": 57647 + }, + { + "epoch": 1.48, + "learning_rate": 1.0727642710924043e-06, + "loss": 0.4351, + "step": 57648 + }, + { + "epoch": 1.48, + "learning_rate": 1.0727366739604082e-06, + "loss": 0.6011, + "step": 57649 + }, + { + "epoch": 1.48, + "learning_rate": 1.072709076772721e-06, + "loss": 0.8701, + "step": 57650 + }, + { + "epoch": 1.48, + "learning_rate": 1.0726814795293642e-06, + "loss": 0.5469, + "step": 57651 + }, + { + "epoch": 1.48, + "learning_rate": 1.0726538822303586e-06, + "loss": 0.6387, + "step": 57652 + }, + { + "epoch": 1.48, + "learning_rate": 1.0726262848757249e-06, + "loss": 0.6982, + "step": 57653 + }, + { + "epoch": 1.48, + "learning_rate": 1.0725986874654847e-06, + "loss": 0.7354, + "step": 57654 + }, + { + "epoch": 1.48, + "learning_rate": 1.0725710899996587e-06, + "loss": 0.3763, + "step": 57655 + }, + { + "epoch": 1.48, + "learning_rate": 1.0725434924782688e-06, + "loss": 0.7686, + "step": 57656 + }, + { + "epoch": 1.48, + "learning_rate": 1.0725158949013355e-06, + "loss": 0.5005, + "step": 57657 + }, + { + "epoch": 1.48, + "learning_rate": 1.0724882972688801e-06, + "loss": 0.6685, + "step": 57658 + }, + { + "epoch": 1.48, + "learning_rate": 1.0724606995809237e-06, + "loss": 0.6523, + "step": 57659 + }, + { + "epoch": 1.48, + "learning_rate": 1.0724331018374877e-06, + "loss": 0.5781, + "step": 57660 + }, + { + "epoch": 1.48, + "learning_rate": 1.0724055040385929e-06, + "loss": 0.7646, + "step": 57661 + }, + { + "epoch": 1.48, + "learning_rate": 1.0723779061842606e-06, + "loss": 0.6475, + "step": 57662 + }, + { + "epoch": 1.48, + "learning_rate": 1.0723503082745118e-06, + "loss": 0.6279, + "step": 57663 + }, + { + "epoch": 1.48, + "learning_rate": 1.0723227103093677e-06, + "loss": 0.6641, + "step": 57664 + }, + { + "epoch": 1.48, + "learning_rate": 1.0722951122888492e-06, + "loss": 0.7744, + "step": 57665 + }, + { + "epoch": 1.48, + "learning_rate": 1.072267514212978e-06, + "loss": 0.7158, + "step": 57666 + }, + { + "epoch": 1.48, + "learning_rate": 1.0722399160817747e-06, + "loss": 0.7529, + "step": 57667 + }, + { + "epoch": 1.48, + "learning_rate": 1.0722123178952604e-06, + "loss": 0.5962, + "step": 57668 + }, + { + "epoch": 1.48, + "learning_rate": 1.072184719653457e-06, + "loss": 0.5615, + "step": 57669 + }, + { + "epoch": 1.48, + "learning_rate": 1.0721571213563847e-06, + "loss": 0.5195, + "step": 57670 + }, + { + "epoch": 1.48, + "learning_rate": 1.072129523004065e-06, + "loss": 0.748, + "step": 57671 + }, + { + "epoch": 1.48, + "learning_rate": 1.0721019245965192e-06, + "loss": 0.7725, + "step": 57672 + }, + { + "epoch": 1.48, + "learning_rate": 1.0720743261337684e-06, + "loss": 0.5869, + "step": 57673 + }, + { + "epoch": 1.48, + "learning_rate": 1.0720467276158332e-06, + "loss": 0.6504, + "step": 57674 + }, + { + "epoch": 1.48, + "learning_rate": 1.0720191290427355e-06, + "loss": 0.7266, + "step": 57675 + }, + { + "epoch": 1.48, + "learning_rate": 1.0719915304144958e-06, + "loss": 0.6348, + "step": 57676 + }, + { + "epoch": 1.48, + "learning_rate": 1.0719639317311357e-06, + "loss": 0.6416, + "step": 57677 + }, + { + "epoch": 1.48, + "learning_rate": 1.0719363329926757e-06, + "loss": 0.6548, + "step": 57678 + }, + { + "epoch": 1.48, + "learning_rate": 1.071908734199138e-06, + "loss": 0.8008, + "step": 57679 + }, + { + "epoch": 1.48, + "learning_rate": 1.0718811353505426e-06, + "loss": 0.8145, + "step": 57680 + }, + { + "epoch": 1.48, + "learning_rate": 1.0718535364469114e-06, + "loss": 0.5562, + "step": 57681 + }, + { + "epoch": 1.48, + "learning_rate": 1.0718259374882652e-06, + "loss": 0.688, + "step": 57682 + }, + { + "epoch": 1.48, + "learning_rate": 1.0717983384746251e-06, + "loss": 0.6289, + "step": 57683 + }, + { + "epoch": 1.48, + "learning_rate": 1.0717707394060122e-06, + "loss": 0.5811, + "step": 57684 + }, + { + "epoch": 1.48, + "learning_rate": 1.0717431402824478e-06, + "loss": 0.584, + "step": 57685 + }, + { + "epoch": 1.48, + "learning_rate": 1.0717155411039532e-06, + "loss": 0.5508, + "step": 57686 + }, + { + "epoch": 1.48, + "learning_rate": 1.0716879418705494e-06, + "loss": 0.4966, + "step": 57687 + }, + { + "epoch": 1.48, + "learning_rate": 1.071660342582257e-06, + "loss": 0.7383, + "step": 57688 + }, + { + "epoch": 1.48, + "learning_rate": 1.0716327432390978e-06, + "loss": 0.6055, + "step": 57689 + }, + { + "epoch": 1.48, + "learning_rate": 1.0716051438410927e-06, + "loss": 0.5752, + "step": 57690 + }, + { + "epoch": 1.48, + "learning_rate": 1.0715775443882629e-06, + "loss": 0.6982, + "step": 57691 + }, + { + "epoch": 1.48, + "learning_rate": 1.0715499448806294e-06, + "loss": 0.5444, + "step": 57692 + }, + { + "epoch": 1.48, + "learning_rate": 1.0715223453182132e-06, + "loss": 0.5908, + "step": 57693 + }, + { + "epoch": 1.48, + "learning_rate": 1.071494745701036e-06, + "loss": 0.4692, + "step": 57694 + }, + { + "epoch": 1.48, + "learning_rate": 1.0714671460291183e-06, + "loss": 0.6665, + "step": 57695 + }, + { + "epoch": 1.48, + "learning_rate": 1.0714395463024815e-06, + "loss": 0.5205, + "step": 57696 + }, + { + "epoch": 1.48, + "learning_rate": 1.071411946521147e-06, + "loss": 0.6123, + "step": 57697 + }, + { + "epoch": 1.48, + "learning_rate": 1.0713843466851353e-06, + "loss": 0.7256, + "step": 57698 + }, + { + "epoch": 1.48, + "learning_rate": 1.071356746794468e-06, + "loss": 0.6421, + "step": 57699 + }, + { + "epoch": 1.48, + "learning_rate": 1.071329146849166e-06, + "loss": 0.5376, + "step": 57700 + }, + { + "epoch": 1.48, + "learning_rate": 1.0713015468492508e-06, + "loss": 0.6836, + "step": 57701 + }, + { + "epoch": 1.48, + "learning_rate": 1.0712739467947434e-06, + "loss": 0.8467, + "step": 57702 + }, + { + "epoch": 1.48, + "learning_rate": 1.0712463466856645e-06, + "loss": 0.6001, + "step": 57703 + }, + { + "epoch": 1.48, + "learning_rate": 1.0712187465220358e-06, + "loss": 0.7051, + "step": 57704 + }, + { + "epoch": 1.48, + "learning_rate": 1.0711911463038778e-06, + "loss": 0.5762, + "step": 57705 + }, + { + "epoch": 1.48, + "learning_rate": 1.0711635460312122e-06, + "loss": 0.5273, + "step": 57706 + }, + { + "epoch": 1.48, + "learning_rate": 1.07113594570406e-06, + "loss": 0.6279, + "step": 57707 + }, + { + "epoch": 1.48, + "learning_rate": 1.0711083453224425e-06, + "loss": 0.7197, + "step": 57708 + }, + { + "epoch": 1.48, + "learning_rate": 1.0710807448863804e-06, + "loss": 0.7861, + "step": 57709 + }, + { + "epoch": 1.48, + "learning_rate": 1.071053144395895e-06, + "loss": 0.5137, + "step": 57710 + }, + { + "epoch": 1.48, + "learning_rate": 1.0710255438510072e-06, + "loss": 0.5232, + "step": 57711 + }, + { + "epoch": 1.48, + "learning_rate": 1.0709979432517389e-06, + "loss": 0.5996, + "step": 57712 + }, + { + "epoch": 1.48, + "learning_rate": 1.0709703425981105e-06, + "loss": 0.6211, + "step": 57713 + }, + { + "epoch": 1.48, + "learning_rate": 1.0709427418901435e-06, + "loss": 0.6267, + "step": 57714 + }, + { + "epoch": 1.48, + "learning_rate": 1.0709151411278587e-06, + "loss": 0.7773, + "step": 57715 + }, + { + "epoch": 1.48, + "learning_rate": 1.0708875403112775e-06, + "loss": 0.6982, + "step": 57716 + }, + { + "epoch": 1.48, + "learning_rate": 1.0708599394404212e-06, + "loss": 0.6685, + "step": 57717 + }, + { + "epoch": 1.48, + "learning_rate": 1.0708323385153105e-06, + "loss": 0.7012, + "step": 57718 + }, + { + "epoch": 1.48, + "learning_rate": 1.0708047375359668e-06, + "loss": 0.5679, + "step": 57719 + }, + { + "epoch": 1.48, + "learning_rate": 1.0707771365024109e-06, + "loss": 0.5083, + "step": 57720 + }, + { + "epoch": 1.48, + "learning_rate": 1.0707495354146645e-06, + "loss": 0.543, + "step": 57721 + }, + { + "epoch": 1.48, + "learning_rate": 1.0707219342727485e-06, + "loss": 0.71, + "step": 57722 + }, + { + "epoch": 1.48, + "learning_rate": 1.0706943330766839e-06, + "loss": 0.7549, + "step": 57723 + }, + { + "epoch": 1.48, + "learning_rate": 1.0706667318264916e-06, + "loss": 0.7539, + "step": 57724 + }, + { + "epoch": 1.48, + "learning_rate": 1.0706391305221933e-06, + "loss": 0.3938, + "step": 57725 + }, + { + "epoch": 1.48, + "learning_rate": 1.0706115291638098e-06, + "loss": 0.752, + "step": 57726 + }, + { + "epoch": 1.48, + "learning_rate": 1.0705839277513627e-06, + "loss": 0.5554, + "step": 57727 + }, + { + "epoch": 1.48, + "learning_rate": 1.070556326284872e-06, + "loss": 0.8242, + "step": 57728 + }, + { + "epoch": 1.48, + "learning_rate": 1.0705287247643602e-06, + "loss": 0.6772, + "step": 57729 + }, + { + "epoch": 1.48, + "learning_rate": 1.0705011231898473e-06, + "loss": 0.5645, + "step": 57730 + }, + { + "epoch": 1.48, + "learning_rate": 1.0704735215613551e-06, + "loss": 0.5688, + "step": 57731 + }, + { + "epoch": 1.48, + "learning_rate": 1.0704459198789049e-06, + "loss": 0.5879, + "step": 57732 + }, + { + "epoch": 1.48, + "learning_rate": 1.0704183181425172e-06, + "loss": 0.707, + "step": 57733 + }, + { + "epoch": 1.48, + "learning_rate": 1.0703907163522132e-06, + "loss": 0.7266, + "step": 57734 + }, + { + "epoch": 1.48, + "learning_rate": 1.0703631145080148e-06, + "loss": 0.6387, + "step": 57735 + }, + { + "epoch": 1.48, + "learning_rate": 1.070335512609942e-06, + "loss": 0.4852, + "step": 57736 + }, + { + "epoch": 1.48, + "learning_rate": 1.0703079106580172e-06, + "loss": 0.6504, + "step": 57737 + }, + { + "epoch": 1.48, + "learning_rate": 1.0702803086522603e-06, + "loss": 0.7539, + "step": 57738 + }, + { + "epoch": 1.48, + "learning_rate": 1.0702527065926932e-06, + "loss": 0.7793, + "step": 57739 + }, + { + "epoch": 1.48, + "learning_rate": 1.070225104479337e-06, + "loss": 0.4559, + "step": 57740 + }, + { + "epoch": 1.48, + "learning_rate": 1.070197502312212e-06, + "loss": 0.709, + "step": 57741 + }, + { + "epoch": 1.48, + "learning_rate": 1.0701699000913409e-06, + "loss": 0.511, + "step": 57742 + }, + { + "epoch": 1.48, + "learning_rate": 1.0701422978167434e-06, + "loss": 0.686, + "step": 57743 + }, + { + "epoch": 1.48, + "learning_rate": 1.0701146954884415e-06, + "loss": 0.7305, + "step": 57744 + }, + { + "epoch": 1.48, + "learning_rate": 1.0700870931064555e-06, + "loss": 0.5894, + "step": 57745 + }, + { + "epoch": 1.48, + "learning_rate": 1.0700594906708077e-06, + "loss": 0.7168, + "step": 57746 + }, + { + "epoch": 1.48, + "learning_rate": 1.0700318881815183e-06, + "loss": 0.7441, + "step": 57747 + }, + { + "epoch": 1.48, + "learning_rate": 1.0700042856386085e-06, + "loss": 0.708, + "step": 57748 + }, + { + "epoch": 1.48, + "learning_rate": 1.0699766830420998e-06, + "loss": 0.7402, + "step": 57749 + }, + { + "epoch": 1.48, + "learning_rate": 1.069949080392013e-06, + "loss": 0.5923, + "step": 57750 + }, + { + "epoch": 1.48, + "learning_rate": 1.0699214776883693e-06, + "loss": 0.6396, + "step": 57751 + }, + { + "epoch": 1.48, + "learning_rate": 1.0698938749311905e-06, + "loss": 0.7412, + "step": 57752 + }, + { + "epoch": 1.48, + "learning_rate": 1.0698662721204967e-06, + "loss": 0.6172, + "step": 57753 + }, + { + "epoch": 1.48, + "learning_rate": 1.06983866925631e-06, + "loss": 0.5315, + "step": 57754 + }, + { + "epoch": 1.48, + "learning_rate": 1.0698110663386504e-06, + "loss": 0.665, + "step": 57755 + }, + { + "epoch": 1.48, + "learning_rate": 1.06978346336754e-06, + "loss": 0.7314, + "step": 57756 + }, + { + "epoch": 1.48, + "learning_rate": 1.0697558603429997e-06, + "loss": 0.6426, + "step": 57757 + }, + { + "epoch": 1.48, + "learning_rate": 1.0697282572650504e-06, + "loss": 0.6357, + "step": 57758 + }, + { + "epoch": 1.48, + "learning_rate": 1.0697006541337134e-06, + "loss": 0.7236, + "step": 57759 + }, + { + "epoch": 1.48, + "learning_rate": 1.06967305094901e-06, + "loss": 0.4971, + "step": 57760 + }, + { + "epoch": 1.48, + "learning_rate": 1.0696454477109606e-06, + "loss": 0.8311, + "step": 57761 + }, + { + "epoch": 1.48, + "learning_rate": 1.0696178444195873e-06, + "loss": 0.5381, + "step": 57762 + }, + { + "epoch": 1.48, + "learning_rate": 1.069590241074911e-06, + "loss": 0.7129, + "step": 57763 + }, + { + "epoch": 1.48, + "learning_rate": 1.0695626376769521e-06, + "loss": 0.5903, + "step": 57764 + }, + { + "epoch": 1.48, + "learning_rate": 1.0695350342257327e-06, + "loss": 0.5967, + "step": 57765 + }, + { + "epoch": 1.48, + "learning_rate": 1.0695074307212735e-06, + "loss": 0.8252, + "step": 57766 + }, + { + "epoch": 1.48, + "learning_rate": 1.0694798271635958e-06, + "loss": 0.6006, + "step": 57767 + }, + { + "epoch": 1.48, + "learning_rate": 1.0694522235527204e-06, + "loss": 0.6001, + "step": 57768 + }, + { + "epoch": 1.48, + "learning_rate": 1.0694246198886686e-06, + "loss": 0.7705, + "step": 57769 + }, + { + "epoch": 1.48, + "learning_rate": 1.0693970161714613e-06, + "loss": 0.7627, + "step": 57770 + }, + { + "epoch": 1.48, + "learning_rate": 1.0693694124011206e-06, + "loss": 0.7915, + "step": 57771 + }, + { + "epoch": 1.48, + "learning_rate": 1.0693418085776662e-06, + "loss": 0.6982, + "step": 57772 + }, + { + "epoch": 1.48, + "learning_rate": 1.0693142047011202e-06, + "loss": 0.4844, + "step": 57773 + }, + { + "epoch": 1.48, + "learning_rate": 1.0692866007715036e-06, + "loss": 0.5938, + "step": 57774 + }, + { + "epoch": 1.48, + "learning_rate": 1.0692589967888375e-06, + "loss": 0.7422, + "step": 57775 + }, + { + "epoch": 1.48, + "learning_rate": 1.069231392753143e-06, + "loss": 0.7627, + "step": 57776 + }, + { + "epoch": 1.48, + "learning_rate": 1.069203788664441e-06, + "loss": 0.575, + "step": 57777 + }, + { + "epoch": 1.48, + "learning_rate": 1.069176184522753e-06, + "loss": 0.7695, + "step": 57778 + }, + { + "epoch": 1.48, + "learning_rate": 1.0691485803280998e-06, + "loss": 0.7798, + "step": 57779 + }, + { + "epoch": 1.48, + "learning_rate": 1.0691209760805026e-06, + "loss": 0.4749, + "step": 57780 + }, + { + "epoch": 1.48, + "learning_rate": 1.0690933717799831e-06, + "loss": 0.5996, + "step": 57781 + }, + { + "epoch": 1.48, + "learning_rate": 1.0690657674265616e-06, + "loss": 0.6853, + "step": 57782 + }, + { + "epoch": 1.48, + "learning_rate": 1.0690381630202597e-06, + "loss": 0.5874, + "step": 57783 + }, + { + "epoch": 1.48, + "learning_rate": 1.0690105585610986e-06, + "loss": 0.6465, + "step": 57784 + }, + { + "epoch": 1.48, + "learning_rate": 1.0689829540490992e-06, + "loss": 0.6982, + "step": 57785 + }, + { + "epoch": 1.48, + "learning_rate": 1.0689553494842828e-06, + "loss": 0.5459, + "step": 57786 + }, + { + "epoch": 1.48, + "learning_rate": 1.0689277448666702e-06, + "loss": 0.6641, + "step": 57787 + }, + { + "epoch": 1.48, + "learning_rate": 1.068900140196283e-06, + "loss": 0.5303, + "step": 57788 + }, + { + "epoch": 1.48, + "learning_rate": 1.068872535473142e-06, + "loss": 0.5319, + "step": 57789 + }, + { + "epoch": 1.48, + "learning_rate": 1.0688449306972686e-06, + "loss": 0.7275, + "step": 57790 + }, + { + "epoch": 1.48, + "learning_rate": 1.0688173258686838e-06, + "loss": 0.6709, + "step": 57791 + }, + { + "epoch": 1.48, + "learning_rate": 1.068789720987409e-06, + "loss": 0.6377, + "step": 57792 + }, + { + "epoch": 1.48, + "learning_rate": 1.0687621160534646e-06, + "loss": 0.752, + "step": 57793 + }, + { + "epoch": 1.48, + "learning_rate": 1.0687345110668724e-06, + "loss": 0.6997, + "step": 57794 + }, + { + "epoch": 1.48, + "learning_rate": 1.0687069060276532e-06, + "loss": 0.7432, + "step": 57795 + }, + { + "epoch": 1.48, + "learning_rate": 1.0686793009358288e-06, + "loss": 0.6816, + "step": 57796 + }, + { + "epoch": 1.48, + "learning_rate": 1.0686516957914191e-06, + "loss": 0.71, + "step": 57797 + }, + { + "epoch": 1.48, + "learning_rate": 1.0686240905944466e-06, + "loss": 0.8066, + "step": 57798 + }, + { + "epoch": 1.48, + "learning_rate": 1.0685964853449312e-06, + "loss": 0.7559, + "step": 57799 + }, + { + "epoch": 1.48, + "learning_rate": 1.0685688800428948e-06, + "loss": 0.646, + "step": 57800 + }, + { + "epoch": 1.48, + "learning_rate": 1.0685412746883587e-06, + "loss": 0.4226, + "step": 57801 + }, + { + "epoch": 1.48, + "learning_rate": 1.0685136692813434e-06, + "loss": 0.4697, + "step": 57802 + }, + { + "epoch": 1.48, + "learning_rate": 1.0684860638218705e-06, + "loss": 0.7578, + "step": 57803 + }, + { + "epoch": 1.48, + "learning_rate": 1.0684584583099608e-06, + "loss": 0.7949, + "step": 57804 + }, + { + "epoch": 1.48, + "learning_rate": 1.0684308527456356e-06, + "loss": 0.7217, + "step": 57805 + }, + { + "epoch": 1.48, + "learning_rate": 1.0684032471289161e-06, + "loss": 0.667, + "step": 57806 + }, + { + "epoch": 1.48, + "learning_rate": 1.0683756414598235e-06, + "loss": 0.6992, + "step": 57807 + }, + { + "epoch": 1.48, + "learning_rate": 1.0683480357383786e-06, + "loss": 0.6123, + "step": 57808 + }, + { + "epoch": 1.48, + "learning_rate": 1.068320429964603e-06, + "loss": 0.6592, + "step": 57809 + }, + { + "epoch": 1.48, + "learning_rate": 1.0682928241385172e-06, + "loss": 0.6675, + "step": 57810 + }, + { + "epoch": 1.48, + "learning_rate": 1.0682652182601433e-06, + "loss": 0.5908, + "step": 57811 + }, + { + "epoch": 1.48, + "learning_rate": 1.0682376123295014e-06, + "loss": 0.6855, + "step": 57812 + }, + { + "epoch": 1.48, + "learning_rate": 1.0682100063466134e-06, + "loss": 0.6309, + "step": 57813 + }, + { + "epoch": 1.48, + "learning_rate": 1.0681824003114996e-06, + "loss": 0.6826, + "step": 57814 + }, + { + "epoch": 1.48, + "learning_rate": 1.0681547942241822e-06, + "loss": 0.5664, + "step": 57815 + }, + { + "epoch": 1.48, + "learning_rate": 1.0681271880846818e-06, + "loss": 0.7285, + "step": 57816 + }, + { + "epoch": 1.48, + "learning_rate": 1.0680995818930195e-06, + "loss": 0.624, + "step": 57817 + }, + { + "epoch": 1.48, + "learning_rate": 1.068071975649216e-06, + "loss": 0.6387, + "step": 57818 + }, + { + "epoch": 1.48, + "learning_rate": 1.0680443693532935e-06, + "loss": 0.6094, + "step": 57819 + }, + { + "epoch": 1.48, + "learning_rate": 1.068016763005272e-06, + "loss": 0.6807, + "step": 57820 + }, + { + "epoch": 1.48, + "learning_rate": 1.0679891566051737e-06, + "loss": 0.5024, + "step": 57821 + }, + { + "epoch": 1.48, + "learning_rate": 1.0679615501530193e-06, + "loss": 0.531, + "step": 57822 + }, + { + "epoch": 1.48, + "learning_rate": 1.0679339436488297e-06, + "loss": 0.6826, + "step": 57823 + }, + { + "epoch": 1.48, + "learning_rate": 1.067906337092626e-06, + "loss": 0.8779, + "step": 57824 + }, + { + "epoch": 1.48, + "learning_rate": 1.0678787304844297e-06, + "loss": 0.5688, + "step": 57825 + }, + { + "epoch": 1.48, + "learning_rate": 1.0678511238242618e-06, + "loss": 0.6914, + "step": 57826 + }, + { + "epoch": 1.48, + "learning_rate": 1.0678235171121432e-06, + "loss": 0.6001, + "step": 57827 + }, + { + "epoch": 1.48, + "learning_rate": 1.0677959103480956e-06, + "loss": 0.6536, + "step": 57828 + }, + { + "epoch": 1.48, + "learning_rate": 1.0677683035321394e-06, + "loss": 0.4469, + "step": 57829 + }, + { + "epoch": 1.48, + "learning_rate": 1.0677406966642964e-06, + "loss": 0.5908, + "step": 57830 + }, + { + "epoch": 1.48, + "learning_rate": 1.0677130897445874e-06, + "loss": 0.5073, + "step": 57831 + }, + { + "epoch": 1.48, + "learning_rate": 1.0676854827730336e-06, + "loss": 0.511, + "step": 57832 + }, + { + "epoch": 1.48, + "learning_rate": 1.067657875749656e-06, + "loss": 0.6104, + "step": 57833 + }, + { + "epoch": 1.48, + "learning_rate": 1.0676302686744763e-06, + "loss": 0.6738, + "step": 57834 + }, + { + "epoch": 1.48, + "learning_rate": 1.0676026615475147e-06, + "loss": 0.5466, + "step": 57835 + }, + { + "epoch": 1.48, + "learning_rate": 1.0675750543687934e-06, + "loss": 0.6282, + "step": 57836 + }, + { + "epoch": 1.48, + "learning_rate": 1.0675474471383326e-06, + "loss": 0.7285, + "step": 57837 + }, + { + "epoch": 1.48, + "learning_rate": 1.0675198398561538e-06, + "loss": 0.7598, + "step": 57838 + }, + { + "epoch": 1.48, + "learning_rate": 1.0674922325222781e-06, + "loss": 0.48, + "step": 57839 + }, + { + "epoch": 1.48, + "learning_rate": 1.067464625136727e-06, + "loss": 0.6875, + "step": 57840 + }, + { + "epoch": 1.48, + "learning_rate": 1.0674370176995214e-06, + "loss": 0.5786, + "step": 57841 + }, + { + "epoch": 1.48, + "learning_rate": 1.067409410210682e-06, + "loss": 0.4648, + "step": 57842 + }, + { + "epoch": 1.48, + "learning_rate": 1.0673818026702303e-06, + "loss": 0.5413, + "step": 57843 + }, + { + "epoch": 1.48, + "learning_rate": 1.0673541950781876e-06, + "loss": 0.5347, + "step": 57844 + }, + { + "epoch": 1.48, + "learning_rate": 1.0673265874345748e-06, + "loss": 0.7529, + "step": 57845 + }, + { + "epoch": 1.48, + "learning_rate": 1.0672989797394133e-06, + "loss": 0.6333, + "step": 57846 + }, + { + "epoch": 1.48, + "learning_rate": 1.0672713719927243e-06, + "loss": 0.7607, + "step": 57847 + }, + { + "epoch": 1.48, + "learning_rate": 1.0672437641945282e-06, + "loss": 0.5957, + "step": 57848 + }, + { + "epoch": 1.48, + "learning_rate": 1.0672161563448469e-06, + "loss": 0.7539, + "step": 57849 + }, + { + "epoch": 1.48, + "learning_rate": 1.0671885484437014e-06, + "loss": 0.7422, + "step": 57850 + }, + { + "epoch": 1.48, + "learning_rate": 1.0671609404911126e-06, + "loss": 0.5068, + "step": 57851 + }, + { + "epoch": 1.48, + "learning_rate": 1.0671333324871017e-06, + "loss": 0.7212, + "step": 57852 + }, + { + "epoch": 1.48, + "learning_rate": 1.0671057244316898e-06, + "loss": 0.4622, + "step": 57853 + }, + { + "epoch": 1.48, + "learning_rate": 1.0670781163248983e-06, + "loss": 0.542, + "step": 57854 + }, + { + "epoch": 1.48, + "learning_rate": 1.067050508166748e-06, + "loss": 0.5679, + "step": 57855 + }, + { + "epoch": 1.48, + "learning_rate": 1.0670228999572606e-06, + "loss": 0.5894, + "step": 57856 + }, + { + "epoch": 1.48, + "learning_rate": 1.0669952916964566e-06, + "loss": 0.5796, + "step": 57857 + }, + { + "epoch": 1.48, + "learning_rate": 1.066967683384357e-06, + "loss": 0.7158, + "step": 57858 + }, + { + "epoch": 1.48, + "learning_rate": 1.0669400750209839e-06, + "loss": 0.6436, + "step": 57859 + }, + { + "epoch": 1.48, + "learning_rate": 1.0669124666063577e-06, + "loss": 0.7109, + "step": 57860 + }, + { + "epoch": 1.48, + "learning_rate": 1.0668848581404997e-06, + "loss": 0.6377, + "step": 57861 + }, + { + "epoch": 1.48, + "learning_rate": 1.066857249623431e-06, + "loss": 0.7188, + "step": 57862 + }, + { + "epoch": 1.48, + "learning_rate": 1.0668296410551727e-06, + "loss": 0.5879, + "step": 57863 + }, + { + "epoch": 1.48, + "learning_rate": 1.0668020324357458e-06, + "loss": 0.6475, + "step": 57864 + }, + { + "epoch": 1.48, + "learning_rate": 1.066774423765172e-06, + "loss": 0.4983, + "step": 57865 + }, + { + "epoch": 1.48, + "learning_rate": 1.0667468150434723e-06, + "loss": 0.6143, + "step": 57866 + }, + { + "epoch": 1.48, + "learning_rate": 1.0667192062706674e-06, + "loss": 0.7334, + "step": 57867 + }, + { + "epoch": 1.48, + "learning_rate": 1.0666915974467785e-06, + "loss": 0.6265, + "step": 57868 + }, + { + "epoch": 1.48, + "learning_rate": 1.0666639885718272e-06, + "loss": 0.6904, + "step": 57869 + }, + { + "epoch": 1.48, + "learning_rate": 1.066636379645834e-06, + "loss": 0.6982, + "step": 57870 + }, + { + "epoch": 1.48, + "learning_rate": 1.0666087706688205e-06, + "loss": 0.6335, + "step": 57871 + }, + { + "epoch": 1.48, + "learning_rate": 1.066581161640808e-06, + "loss": 0.5435, + "step": 57872 + }, + { + "epoch": 1.48, + "learning_rate": 1.066553552561817e-06, + "loss": 0.6396, + "step": 57873 + }, + { + "epoch": 1.48, + "learning_rate": 1.0665259434318691e-06, + "loss": 0.5439, + "step": 57874 + }, + { + "epoch": 1.48, + "learning_rate": 1.0664983342509854e-06, + "loss": 0.6338, + "step": 57875 + }, + { + "epoch": 1.48, + "learning_rate": 1.0664707250191873e-06, + "loss": 0.6548, + "step": 57876 + }, + { + "epoch": 1.48, + "learning_rate": 1.0664431157364952e-06, + "loss": 0.61, + "step": 57877 + }, + { + "epoch": 1.48, + "learning_rate": 1.0664155064029308e-06, + "loss": 0.748, + "step": 57878 + }, + { + "epoch": 1.48, + "learning_rate": 1.066387897018515e-06, + "loss": 0.8008, + "step": 57879 + }, + { + "epoch": 1.48, + "learning_rate": 1.0663602875832691e-06, + "loss": 0.7412, + "step": 57880 + }, + { + "epoch": 1.48, + "learning_rate": 1.0663326780972144e-06, + "loss": 0.4973, + "step": 57881 + }, + { + "epoch": 1.48, + "learning_rate": 1.0663050685603716e-06, + "loss": 0.6167, + "step": 57882 + }, + { + "epoch": 1.48, + "learning_rate": 1.0662774589727619e-06, + "loss": 0.6484, + "step": 57883 + }, + { + "epoch": 1.48, + "learning_rate": 1.066249849334407e-06, + "loss": 0.5474, + "step": 57884 + }, + { + "epoch": 1.48, + "learning_rate": 1.0662222396453272e-06, + "loss": 0.8496, + "step": 57885 + }, + { + "epoch": 1.48, + "learning_rate": 1.0661946299055447e-06, + "loss": 0.584, + "step": 57886 + }, + { + "epoch": 1.48, + "learning_rate": 1.0661670201150794e-06, + "loss": 0.5291, + "step": 57887 + }, + { + "epoch": 1.48, + "learning_rate": 1.0661394102739534e-06, + "loss": 0.8438, + "step": 57888 + }, + { + "epoch": 1.48, + "learning_rate": 1.0661118003821873e-06, + "loss": 0.7764, + "step": 57889 + }, + { + "epoch": 1.48, + "learning_rate": 1.0660841904398023e-06, + "loss": 0.541, + "step": 57890 + }, + { + "epoch": 1.48, + "learning_rate": 1.06605658044682e-06, + "loss": 0.6465, + "step": 57891 + }, + { + "epoch": 1.48, + "learning_rate": 1.066028970403261e-06, + "loss": 0.6758, + "step": 57892 + }, + { + "epoch": 1.48, + "learning_rate": 1.0660013603091468e-06, + "loss": 1.0078, + "step": 57893 + }, + { + "epoch": 1.48, + "learning_rate": 1.0659737501644984e-06, + "loss": 0.6123, + "step": 57894 + }, + { + "epoch": 1.48, + "learning_rate": 1.0659461399693369e-06, + "loss": 0.6284, + "step": 57895 + }, + { + "epoch": 1.48, + "learning_rate": 1.0659185297236832e-06, + "loss": 0.4224, + "step": 57896 + }, + { + "epoch": 1.48, + "learning_rate": 1.0658909194275592e-06, + "loss": 0.5137, + "step": 57897 + }, + { + "epoch": 1.48, + "learning_rate": 1.065863309080985e-06, + "loss": 0.8096, + "step": 57898 + }, + { + "epoch": 1.48, + "learning_rate": 1.0658356986839826e-06, + "loss": 0.748, + "step": 57899 + }, + { + "epoch": 1.48, + "learning_rate": 1.0658080882365728e-06, + "loss": 0.5376, + "step": 57900 + }, + { + "epoch": 1.48, + "learning_rate": 1.065780477738777e-06, + "loss": 0.5518, + "step": 57901 + }, + { + "epoch": 1.48, + "learning_rate": 1.065752867190616e-06, + "loss": 0.5166, + "step": 57902 + }, + { + "epoch": 1.48, + "learning_rate": 1.065725256592111e-06, + "loss": 0.6089, + "step": 57903 + }, + { + "epoch": 1.48, + "learning_rate": 1.0656976459432828e-06, + "loss": 0.7178, + "step": 57904 + }, + { + "epoch": 1.48, + "learning_rate": 1.0656700352441535e-06, + "loss": 0.3619, + "step": 57905 + }, + { + "epoch": 1.48, + "learning_rate": 1.0656424244947434e-06, + "loss": 0.7046, + "step": 57906 + }, + { + "epoch": 1.48, + "learning_rate": 1.0656148136950742e-06, + "loss": 0.5942, + "step": 57907 + }, + { + "epoch": 1.48, + "learning_rate": 1.0655872028451665e-06, + "loss": 0.7178, + "step": 57908 + }, + { + "epoch": 1.48, + "learning_rate": 1.0655595919450417e-06, + "loss": 0.6953, + "step": 57909 + }, + { + "epoch": 1.48, + "learning_rate": 1.0655319809947207e-06, + "loss": 0.604, + "step": 57910 + }, + { + "epoch": 1.48, + "learning_rate": 1.0655043699942251e-06, + "loss": 0.5732, + "step": 57911 + }, + { + "epoch": 1.48, + "learning_rate": 1.065476758943576e-06, + "loss": 0.4907, + "step": 57912 + }, + { + "epoch": 1.48, + "learning_rate": 1.0654491478427945e-06, + "loss": 0.5684, + "step": 57913 + }, + { + "epoch": 1.48, + "learning_rate": 1.065421536691901e-06, + "loss": 0.7305, + "step": 57914 + }, + { + "epoch": 1.48, + "learning_rate": 1.0653939254909177e-06, + "loss": 0.5587, + "step": 57915 + }, + { + "epoch": 1.48, + "learning_rate": 1.0653663142398653e-06, + "loss": 0.6016, + "step": 57916 + }, + { + "epoch": 1.48, + "learning_rate": 1.0653387029387643e-06, + "loss": 0.5518, + "step": 57917 + }, + { + "epoch": 1.48, + "learning_rate": 1.065311091587637e-06, + "loss": 0.6948, + "step": 57918 + }, + { + "epoch": 1.48, + "learning_rate": 1.0652834801865037e-06, + "loss": 0.5488, + "step": 57919 + }, + { + "epoch": 1.48, + "learning_rate": 1.0652558687353864e-06, + "loss": 0.585, + "step": 57920 + }, + { + "epoch": 1.48, + "learning_rate": 1.0652282572343053e-06, + "loss": 0.5889, + "step": 57921 + }, + { + "epoch": 1.48, + "learning_rate": 1.065200645683282e-06, + "loss": 0.7051, + "step": 57922 + }, + { + "epoch": 1.48, + "learning_rate": 1.0651730340823373e-06, + "loss": 0.8379, + "step": 57923 + }, + { + "epoch": 1.48, + "learning_rate": 1.065145422431493e-06, + "loss": 0.6086, + "step": 57924 + }, + { + "epoch": 1.48, + "learning_rate": 1.0651178107307694e-06, + "loss": 0.6738, + "step": 57925 + }, + { + "epoch": 1.48, + "learning_rate": 1.0650901989801888e-06, + "loss": 0.5543, + "step": 57926 + }, + { + "epoch": 1.48, + "learning_rate": 1.065062587179771e-06, + "loss": 0.5913, + "step": 57927 + }, + { + "epoch": 1.48, + "learning_rate": 1.065034975329538e-06, + "loss": 0.6079, + "step": 57928 + }, + { + "epoch": 1.48, + "learning_rate": 1.0650073634295104e-06, + "loss": 0.6035, + "step": 57929 + }, + { + "epoch": 1.48, + "learning_rate": 1.06497975147971e-06, + "loss": 0.5464, + "step": 57930 + }, + { + "epoch": 1.48, + "learning_rate": 1.0649521394801575e-06, + "loss": 0.5308, + "step": 57931 + }, + { + "epoch": 1.48, + "learning_rate": 1.0649245274308743e-06, + "loss": 0.6353, + "step": 57932 + }, + { + "epoch": 1.48, + "learning_rate": 1.064896915331881e-06, + "loss": 0.6689, + "step": 57933 + }, + { + "epoch": 1.48, + "learning_rate": 1.0648693031831993e-06, + "loss": 0.5012, + "step": 57934 + }, + { + "epoch": 1.48, + "learning_rate": 1.06484169098485e-06, + "loss": 0.752, + "step": 57935 + }, + { + "epoch": 1.48, + "learning_rate": 1.064814078736855e-06, + "loss": 0.5503, + "step": 57936 + }, + { + "epoch": 1.48, + "learning_rate": 1.0647864664392342e-06, + "loss": 0.5479, + "step": 57937 + }, + { + "epoch": 1.48, + "learning_rate": 1.0647588540920096e-06, + "loss": 0.7021, + "step": 57938 + }, + { + "epoch": 1.49, + "learning_rate": 1.0647312416952022e-06, + "loss": 0.5664, + "step": 57939 + }, + { + "epoch": 1.49, + "learning_rate": 1.064703629248833e-06, + "loss": 0.5638, + "step": 57940 + }, + { + "epoch": 1.49, + "learning_rate": 1.0646760167529233e-06, + "loss": 0.6143, + "step": 57941 + }, + { + "epoch": 1.49, + "learning_rate": 1.0646484042074938e-06, + "loss": 0.7051, + "step": 57942 + }, + { + "epoch": 1.49, + "learning_rate": 1.0646207916125665e-06, + "loss": 0.7676, + "step": 57943 + }, + { + "epoch": 1.49, + "learning_rate": 1.0645931789681614e-06, + "loss": 0.7466, + "step": 57944 + }, + { + "epoch": 1.49, + "learning_rate": 1.0645655662743008e-06, + "loss": 0.5552, + "step": 57945 + }, + { + "epoch": 1.49, + "learning_rate": 1.0645379535310052e-06, + "loss": 0.4966, + "step": 57946 + }, + { + "epoch": 1.49, + "learning_rate": 1.064510340738296e-06, + "loss": 0.835, + "step": 57947 + }, + { + "epoch": 1.49, + "learning_rate": 1.064482727896194e-06, + "loss": 0.751, + "step": 57948 + }, + { + "epoch": 1.49, + "learning_rate": 1.0644551150047204e-06, + "loss": 0.729, + "step": 57949 + }, + { + "epoch": 1.49, + "learning_rate": 1.0644275020638965e-06, + "loss": 0.5242, + "step": 57950 + }, + { + "epoch": 1.49, + "learning_rate": 1.0643998890737438e-06, + "loss": 0.6104, + "step": 57951 + }, + { + "epoch": 1.49, + "learning_rate": 1.0643722760342825e-06, + "loss": 0.7114, + "step": 57952 + }, + { + "epoch": 1.49, + "learning_rate": 1.0643446629455348e-06, + "loss": 0.8223, + "step": 57953 + }, + { + "epoch": 1.49, + "learning_rate": 1.0643170498075212e-06, + "loss": 0.6978, + "step": 57954 + }, + { + "epoch": 1.49, + "learning_rate": 1.0642894366202629e-06, + "loss": 0.645, + "step": 57955 + }, + { + "epoch": 1.49, + "learning_rate": 1.0642618233837813e-06, + "loss": 0.6719, + "step": 57956 + }, + { + "epoch": 1.49, + "learning_rate": 1.0642342100980973e-06, + "loss": 0.6763, + "step": 57957 + }, + { + "epoch": 1.49, + "learning_rate": 1.064206596763232e-06, + "loss": 0.6074, + "step": 57958 + }, + { + "epoch": 1.49, + "learning_rate": 1.0641789833792067e-06, + "loss": 0.5012, + "step": 57959 + }, + { + "epoch": 1.49, + "learning_rate": 1.0641513699460424e-06, + "loss": 0.6904, + "step": 57960 + }, + { + "epoch": 1.49, + "learning_rate": 1.0641237564637606e-06, + "loss": 0.6113, + "step": 57961 + }, + { + "epoch": 1.49, + "learning_rate": 1.0640961429323822e-06, + "loss": 0.6494, + "step": 57962 + }, + { + "epoch": 1.49, + "learning_rate": 1.0640685293519282e-06, + "loss": 0.5293, + "step": 57963 + }, + { + "epoch": 1.49, + "learning_rate": 1.06404091572242e-06, + "loss": 0.4924, + "step": 57964 + }, + { + "epoch": 1.49, + "learning_rate": 1.0640133020438785e-06, + "loss": 0.8525, + "step": 57965 + }, + { + "epoch": 1.49, + "learning_rate": 1.063985688316325e-06, + "loss": 0.6523, + "step": 57966 + }, + { + "epoch": 1.49, + "learning_rate": 1.0639580745397805e-06, + "loss": 0.6162, + "step": 57967 + }, + { + "epoch": 1.49, + "learning_rate": 1.0639304607142663e-06, + "loss": 0.5034, + "step": 57968 + }, + { + "epoch": 1.49, + "learning_rate": 1.0639028468398036e-06, + "loss": 0.6406, + "step": 57969 + }, + { + "epoch": 1.49, + "learning_rate": 1.063875232916413e-06, + "loss": 0.6025, + "step": 57970 + }, + { + "epoch": 1.49, + "learning_rate": 1.0638476189441167e-06, + "loss": 0.573, + "step": 57971 + }, + { + "epoch": 1.49, + "learning_rate": 1.0638200049229352e-06, + "loss": 0.7002, + "step": 57972 + }, + { + "epoch": 1.49, + "learning_rate": 1.063792390852889e-06, + "loss": 0.6113, + "step": 57973 + }, + { + "epoch": 1.49, + "learning_rate": 1.0637647767340004e-06, + "loss": 0.6777, + "step": 57974 + }, + { + "epoch": 1.49, + "learning_rate": 1.0637371625662896e-06, + "loss": 0.6362, + "step": 57975 + }, + { + "epoch": 1.49, + "learning_rate": 1.0637095483497789e-06, + "loss": 0.5562, + "step": 57976 + }, + { + "epoch": 1.49, + "learning_rate": 1.0636819340844883e-06, + "loss": 0.7637, + "step": 57977 + }, + { + "epoch": 1.49, + "learning_rate": 1.0636543197704392e-06, + "loss": 0.5486, + "step": 57978 + }, + { + "epoch": 1.49, + "learning_rate": 1.063626705407653e-06, + "loss": 0.5166, + "step": 57979 + }, + { + "epoch": 1.49, + "learning_rate": 1.063599090996151e-06, + "loss": 0.7344, + "step": 57980 + }, + { + "epoch": 1.49, + "learning_rate": 1.0635714765359541e-06, + "loss": 0.5337, + "step": 57981 + }, + { + "epoch": 1.49, + "learning_rate": 1.0635438620270832e-06, + "loss": 0.709, + "step": 57982 + }, + { + "epoch": 1.49, + "learning_rate": 1.0635162474695597e-06, + "loss": 0.7598, + "step": 57983 + }, + { + "epoch": 1.49, + "learning_rate": 1.0634886328634047e-06, + "loss": 0.5859, + "step": 57984 + }, + { + "epoch": 1.49, + "learning_rate": 1.0634610182086396e-06, + "loss": 0.6021, + "step": 57985 + }, + { + "epoch": 1.49, + "learning_rate": 1.0634334035052854e-06, + "loss": 0.6504, + "step": 57986 + }, + { + "epoch": 1.49, + "learning_rate": 1.0634057887533633e-06, + "loss": 0.8164, + "step": 57987 + }, + { + "epoch": 1.49, + "learning_rate": 1.0633781739528936e-06, + "loss": 0.6797, + "step": 57988 + }, + { + "epoch": 1.49, + "learning_rate": 1.0633505591038987e-06, + "loss": 0.5479, + "step": 57989 + }, + { + "epoch": 1.49, + "learning_rate": 1.0633229442063987e-06, + "loss": 0.7988, + "step": 57990 + }, + { + "epoch": 1.49, + "learning_rate": 1.0632953292604158e-06, + "loss": 0.6162, + "step": 57991 + }, + { + "epoch": 1.49, + "learning_rate": 1.0632677142659703e-06, + "loss": 0.6582, + "step": 57992 + }, + { + "epoch": 1.49, + "learning_rate": 1.0632400992230836e-06, + "loss": 0.7334, + "step": 57993 + }, + { + "epoch": 1.49, + "learning_rate": 1.063212484131777e-06, + "loss": 0.6387, + "step": 57994 + }, + { + "epoch": 1.49, + "learning_rate": 1.0631848689920715e-06, + "loss": 0.5518, + "step": 57995 + }, + { + "epoch": 1.49, + "learning_rate": 1.063157253803988e-06, + "loss": 0.7031, + "step": 57996 + }, + { + "epoch": 1.49, + "learning_rate": 1.0631296385675483e-06, + "loss": 0.6182, + "step": 57997 + }, + { + "epoch": 1.49, + "learning_rate": 1.0631020232827727e-06, + "loss": 0.6445, + "step": 57998 + }, + { + "epoch": 1.49, + "learning_rate": 1.0630744079496832e-06, + "loss": 0.4954, + "step": 57999 + }, + { + "epoch": 1.49, + "learning_rate": 1.0630467925683e-06, + "loss": 0.5391, + "step": 58000 + }, + { + "epoch": 1.49, + "learning_rate": 1.0630191771386451e-06, + "loss": 0.606, + "step": 58001 + }, + { + "epoch": 1.49, + "learning_rate": 1.0629915616607395e-06, + "loss": 0.7881, + "step": 58002 + }, + { + "epoch": 1.49, + "learning_rate": 1.062963946134604e-06, + "loss": 0.7715, + "step": 58003 + }, + { + "epoch": 1.49, + "learning_rate": 1.0629363305602597e-06, + "loss": 0.8105, + "step": 58004 + }, + { + "epoch": 1.49, + "learning_rate": 1.0629087149377282e-06, + "loss": 0.4823, + "step": 58005 + }, + { + "epoch": 1.49, + "learning_rate": 1.0628810992670303e-06, + "loss": 0.5054, + "step": 58006 + }, + { + "epoch": 1.49, + "learning_rate": 1.062853483548187e-06, + "loss": 0.8369, + "step": 58007 + }, + { + "epoch": 1.49, + "learning_rate": 1.0628258677812201e-06, + "loss": 0.729, + "step": 58008 + }, + { + "epoch": 1.49, + "learning_rate": 1.06279825196615e-06, + "loss": 0.6846, + "step": 58009 + }, + { + "epoch": 1.49, + "learning_rate": 1.0627706361029984e-06, + "loss": 0.7188, + "step": 58010 + }, + { + "epoch": 1.49, + "learning_rate": 1.0627430201917863e-06, + "loss": 0.7715, + "step": 58011 + }, + { + "epoch": 1.49, + "learning_rate": 1.0627154042325345e-06, + "loss": 0.7002, + "step": 58012 + }, + { + "epoch": 1.49, + "learning_rate": 1.0626877882252644e-06, + "loss": 0.6963, + "step": 58013 + }, + { + "epoch": 1.49, + "learning_rate": 1.0626601721699971e-06, + "loss": 0.6611, + "step": 58014 + }, + { + "epoch": 1.49, + "learning_rate": 1.0626325560667538e-06, + "loss": 0.7324, + "step": 58015 + }, + { + "epoch": 1.49, + "learning_rate": 1.0626049399155558e-06, + "loss": 0.458, + "step": 58016 + }, + { + "epoch": 1.49, + "learning_rate": 1.0625773237164239e-06, + "loss": 0.6924, + "step": 58017 + }, + { + "epoch": 1.49, + "learning_rate": 1.0625497074693797e-06, + "loss": 0.6543, + "step": 58018 + }, + { + "epoch": 1.49, + "learning_rate": 1.0625220911744437e-06, + "loss": 0.5732, + "step": 58019 + }, + { + "epoch": 1.49, + "learning_rate": 1.0624944748316378e-06, + "loss": 0.8242, + "step": 58020 + }, + { + "epoch": 1.49, + "learning_rate": 1.0624668584409826e-06, + "loss": 0.3826, + "step": 58021 + }, + { + "epoch": 1.49, + "learning_rate": 1.0624392420024992e-06, + "loss": 0.7939, + "step": 58022 + }, + { + "epoch": 1.49, + "learning_rate": 1.062411625516209e-06, + "loss": 0.5111, + "step": 58023 + }, + { + "epoch": 1.49, + "learning_rate": 1.0623840089821334e-06, + "loss": 0.7451, + "step": 58024 + }, + { + "epoch": 1.49, + "learning_rate": 1.0623563924002927e-06, + "loss": 0.5903, + "step": 58025 + }, + { + "epoch": 1.49, + "learning_rate": 1.0623287757707092e-06, + "loss": 0.7812, + "step": 58026 + }, + { + "epoch": 1.49, + "learning_rate": 1.062301159093403e-06, + "loss": 0.5969, + "step": 58027 + }, + { + "epoch": 1.49, + "learning_rate": 1.0622735423683957e-06, + "loss": 0.6748, + "step": 58028 + }, + { + "epoch": 1.49, + "learning_rate": 1.0622459255957085e-06, + "loss": 0.5039, + "step": 58029 + }, + { + "epoch": 1.49, + "learning_rate": 1.0622183087753624e-06, + "loss": 0.8594, + "step": 58030 + }, + { + "epoch": 1.49, + "learning_rate": 1.062190691907379e-06, + "loss": 0.4807, + "step": 58031 + }, + { + "epoch": 1.49, + "learning_rate": 1.0621630749917782e-06, + "loss": 0.5413, + "step": 58032 + }, + { + "epoch": 1.49, + "learning_rate": 1.0621354580285825e-06, + "loss": 0.4648, + "step": 58033 + }, + { + "epoch": 1.49, + "learning_rate": 1.0621078410178126e-06, + "loss": 0.6323, + "step": 58034 + }, + { + "epoch": 1.49, + "learning_rate": 1.0620802239594894e-06, + "loss": 0.6582, + "step": 58035 + }, + { + "epoch": 1.49, + "learning_rate": 1.0620526068536347e-06, + "loss": 0.6611, + "step": 58036 + }, + { + "epoch": 1.49, + "learning_rate": 1.0620249897002687e-06, + "loss": 0.6982, + "step": 58037 + }, + { + "epoch": 1.49, + "learning_rate": 1.061997372499413e-06, + "loss": 0.6023, + "step": 58038 + }, + { + "epoch": 1.49, + "learning_rate": 1.061969755251089e-06, + "loss": 0.4709, + "step": 58039 + }, + { + "epoch": 1.49, + "learning_rate": 1.0619421379553172e-06, + "loss": 0.261, + "step": 58040 + }, + { + "epoch": 1.49, + "learning_rate": 1.06191452061212e-06, + "loss": 0.6553, + "step": 58041 + }, + { + "epoch": 1.49, + "learning_rate": 1.0618869032215167e-06, + "loss": 0.6396, + "step": 58042 + }, + { + "epoch": 1.49, + "learning_rate": 1.06185928578353e-06, + "loss": 0.7051, + "step": 58043 + }, + { + "epoch": 1.49, + "learning_rate": 1.0618316682981802e-06, + "loss": 0.8613, + "step": 58044 + }, + { + "epoch": 1.49, + "learning_rate": 1.061804050765489e-06, + "loss": 0.6372, + "step": 58045 + }, + { + "epoch": 1.49, + "learning_rate": 1.0617764331854772e-06, + "loss": 0.4725, + "step": 58046 + }, + { + "epoch": 1.49, + "learning_rate": 1.0617488155581662e-06, + "loss": 0.5691, + "step": 58047 + }, + { + "epoch": 1.49, + "learning_rate": 1.0617211978835768e-06, + "loss": 0.6519, + "step": 58048 + }, + { + "epoch": 1.49, + "learning_rate": 1.06169358016173e-06, + "loss": 0.5732, + "step": 58049 + }, + { + "epoch": 1.49, + "learning_rate": 1.0616659623926475e-06, + "loss": 0.6538, + "step": 58050 + }, + { + "epoch": 1.49, + "learning_rate": 1.0616383445763505e-06, + "loss": 0.5447, + "step": 58051 + }, + { + "epoch": 1.49, + "learning_rate": 1.0616107267128598e-06, + "loss": 0.6748, + "step": 58052 + }, + { + "epoch": 1.49, + "learning_rate": 1.0615831088021962e-06, + "loss": 0.6279, + "step": 58053 + }, + { + "epoch": 1.49, + "learning_rate": 1.0615554908443816e-06, + "loss": 0.5972, + "step": 58054 + }, + { + "epoch": 1.49, + "learning_rate": 1.0615278728394363e-06, + "loss": 0.6611, + "step": 58055 + }, + { + "epoch": 1.49, + "learning_rate": 1.0615002547873828e-06, + "loss": 0.5981, + "step": 58056 + }, + { + "epoch": 1.49, + "learning_rate": 1.0614726366882407e-06, + "loss": 0.554, + "step": 58057 + }, + { + "epoch": 1.49, + "learning_rate": 1.061445018542032e-06, + "loss": 0.7559, + "step": 58058 + }, + { + "epoch": 1.49, + "learning_rate": 1.0614174003487774e-06, + "loss": 0.7988, + "step": 58059 + }, + { + "epoch": 1.49, + "learning_rate": 1.0613897821084989e-06, + "loss": 0.5579, + "step": 58060 + }, + { + "epoch": 1.49, + "learning_rate": 1.0613621638212166e-06, + "loss": 0.5349, + "step": 58061 + }, + { + "epoch": 1.49, + "learning_rate": 1.0613345454869524e-06, + "loss": 0.6074, + "step": 58062 + }, + { + "epoch": 1.49, + "learning_rate": 1.061306927105727e-06, + "loss": 0.5996, + "step": 58063 + }, + { + "epoch": 1.49, + "learning_rate": 1.0612793086775618e-06, + "loss": 0.6104, + "step": 58064 + }, + { + "epoch": 1.49, + "learning_rate": 1.061251690202478e-06, + "loss": 0.4724, + "step": 58065 + }, + { + "epoch": 1.49, + "learning_rate": 1.0612240716804964e-06, + "loss": 0.542, + "step": 58066 + }, + { + "epoch": 1.49, + "learning_rate": 1.0611964531116381e-06, + "loss": 0.7646, + "step": 58067 + }, + { + "epoch": 1.49, + "learning_rate": 1.0611688344959248e-06, + "loss": 0.606, + "step": 58068 + }, + { + "epoch": 1.49, + "learning_rate": 1.0611412158333773e-06, + "loss": 0.5383, + "step": 58069 + }, + { + "epoch": 1.49, + "learning_rate": 1.0611135971240168e-06, + "loss": 0.5752, + "step": 58070 + }, + { + "epoch": 1.49, + "learning_rate": 1.0610859783678643e-06, + "loss": 0.6816, + "step": 58071 + }, + { + "epoch": 1.49, + "learning_rate": 1.0610583595649413e-06, + "loss": 0.7812, + "step": 58072 + }, + { + "epoch": 1.49, + "learning_rate": 1.0610307407152683e-06, + "loss": 0.543, + "step": 58073 + }, + { + "epoch": 1.49, + "learning_rate": 1.061003121818867e-06, + "loss": 0.6846, + "step": 58074 + }, + { + "epoch": 1.49, + "learning_rate": 1.060975502875759e-06, + "loss": 0.6362, + "step": 58075 + }, + { + "epoch": 1.49, + "learning_rate": 1.0609478838859643e-06, + "loss": 0.7822, + "step": 58076 + }, + { + "epoch": 1.49, + "learning_rate": 1.060920264849505e-06, + "loss": 0.6807, + "step": 58077 + }, + { + "epoch": 1.49, + "learning_rate": 1.0608926457664011e-06, + "loss": 0.7314, + "step": 58078 + }, + { + "epoch": 1.49, + "learning_rate": 1.0608650266366751e-06, + "loss": 0.5508, + "step": 58079 + }, + { + "epoch": 1.49, + "learning_rate": 1.0608374074603475e-06, + "loss": 0.7168, + "step": 58080 + }, + { + "epoch": 1.49, + "learning_rate": 1.0608097882374396e-06, + "loss": 0.7041, + "step": 58081 + }, + { + "epoch": 1.49, + "learning_rate": 1.060782168967972e-06, + "loss": 0.6704, + "step": 58082 + }, + { + "epoch": 1.49, + "learning_rate": 1.0607545496519668e-06, + "loss": 0.7393, + "step": 58083 + }, + { + "epoch": 1.49, + "learning_rate": 1.0607269302894442e-06, + "loss": 0.689, + "step": 58084 + }, + { + "epoch": 1.49, + "learning_rate": 1.060699310880426e-06, + "loss": 0.6885, + "step": 58085 + }, + { + "epoch": 1.49, + "learning_rate": 1.0606716914249331e-06, + "loss": 0.7305, + "step": 58086 + }, + { + "epoch": 1.49, + "learning_rate": 1.0606440719229868e-06, + "loss": 0.5732, + "step": 58087 + }, + { + "epoch": 1.49, + "learning_rate": 1.0606164523746078e-06, + "loss": 0.7119, + "step": 58088 + }, + { + "epoch": 1.49, + "learning_rate": 1.060588832779818e-06, + "loss": 0.7148, + "step": 58089 + }, + { + "epoch": 1.49, + "learning_rate": 1.060561213138638e-06, + "loss": 0.5051, + "step": 58090 + }, + { + "epoch": 1.49, + "learning_rate": 1.0605335934510887e-06, + "loss": 0.6494, + "step": 58091 + }, + { + "epoch": 1.49, + "learning_rate": 1.0605059737171917e-06, + "loss": 0.502, + "step": 58092 + }, + { + "epoch": 1.49, + "learning_rate": 1.0604783539369683e-06, + "loss": 0.709, + "step": 58093 + }, + { + "epoch": 1.49, + "learning_rate": 1.0604507341104392e-06, + "loss": 0.8369, + "step": 58094 + }, + { + "epoch": 1.49, + "learning_rate": 1.060423114237626e-06, + "loss": 0.7002, + "step": 58095 + }, + { + "epoch": 1.49, + "learning_rate": 1.0603954943185496e-06, + "loss": 0.6172, + "step": 58096 + }, + { + "epoch": 1.49, + "learning_rate": 1.060367874353231e-06, + "loss": 0.6211, + "step": 58097 + }, + { + "epoch": 1.49, + "learning_rate": 1.0603402543416916e-06, + "loss": 0.5898, + "step": 58098 + }, + { + "epoch": 1.49, + "learning_rate": 1.060312634283952e-06, + "loss": 0.6846, + "step": 58099 + }, + { + "epoch": 1.49, + "learning_rate": 1.0602850141800344e-06, + "loss": 0.6548, + "step": 58100 + }, + { + "epoch": 1.49, + "learning_rate": 1.060257394029959e-06, + "loss": 0.521, + "step": 58101 + }, + { + "epoch": 1.49, + "learning_rate": 1.0602297738337474e-06, + "loss": 0.5654, + "step": 58102 + }, + { + "epoch": 1.49, + "learning_rate": 1.0602021535914205e-06, + "loss": 0.6455, + "step": 58103 + }, + { + "epoch": 1.49, + "learning_rate": 1.0601745333029996e-06, + "loss": 0.457, + "step": 58104 + }, + { + "epoch": 1.49, + "learning_rate": 1.060146912968506e-06, + "loss": 0.6436, + "step": 58105 + }, + { + "epoch": 1.49, + "learning_rate": 1.0601192925879606e-06, + "loss": 0.6709, + "step": 58106 + }, + { + "epoch": 1.49, + "learning_rate": 1.0600916721613846e-06, + "loss": 0.6943, + "step": 58107 + }, + { + "epoch": 1.49, + "learning_rate": 1.0600640516887993e-06, + "loss": 0.5928, + "step": 58108 + }, + { + "epoch": 1.49, + "learning_rate": 1.0600364311702254e-06, + "loss": 0.6221, + "step": 58109 + }, + { + "epoch": 1.49, + "learning_rate": 1.0600088106056849e-06, + "loss": 0.748, + "step": 58110 + }, + { + "epoch": 1.49, + "learning_rate": 1.0599811899951977e-06, + "loss": 0.5771, + "step": 58111 + }, + { + "epoch": 1.49, + "learning_rate": 1.0599535693387861e-06, + "loss": 0.6387, + "step": 58112 + }, + { + "epoch": 1.49, + "learning_rate": 1.0599259486364706e-06, + "loss": 0.7598, + "step": 58113 + }, + { + "epoch": 1.49, + "learning_rate": 1.0598983278882728e-06, + "loss": 0.6128, + "step": 58114 + }, + { + "epoch": 1.49, + "learning_rate": 1.0598707070942137e-06, + "loss": 0.6221, + "step": 58115 + }, + { + "epoch": 1.49, + "learning_rate": 1.059843086254314e-06, + "loss": 0.5803, + "step": 58116 + }, + { + "epoch": 1.49, + "learning_rate": 1.0598154653685954e-06, + "loss": 0.6798, + "step": 58117 + }, + { + "epoch": 1.49, + "learning_rate": 1.0597878444370787e-06, + "loss": 0.6919, + "step": 58118 + }, + { + "epoch": 1.49, + "learning_rate": 1.0597602234597854e-06, + "loss": 0.5869, + "step": 58119 + }, + { + "epoch": 1.49, + "learning_rate": 1.0597326024367364e-06, + "loss": 0.7627, + "step": 58120 + }, + { + "epoch": 1.49, + "learning_rate": 1.0597049813679528e-06, + "loss": 0.7441, + "step": 58121 + }, + { + "epoch": 1.49, + "learning_rate": 1.0596773602534556e-06, + "loss": 0.5972, + "step": 58122 + }, + { + "epoch": 1.49, + "learning_rate": 1.0596497390932667e-06, + "loss": 0.7783, + "step": 58123 + }, + { + "epoch": 1.49, + "learning_rate": 1.0596221178874062e-06, + "loss": 0.5428, + "step": 58124 + }, + { + "epoch": 1.49, + "learning_rate": 1.0595944966358966e-06, + "loss": 0.8584, + "step": 58125 + }, + { + "epoch": 1.49, + "learning_rate": 1.0595668753387575e-06, + "loss": 0.6978, + "step": 58126 + }, + { + "epoch": 1.49, + "learning_rate": 1.059539253996011e-06, + "loss": 0.6934, + "step": 58127 + }, + { + "epoch": 1.49, + "learning_rate": 1.0595116326076778e-06, + "loss": 0.7344, + "step": 58128 + }, + { + "epoch": 1.49, + "learning_rate": 1.0594840111737797e-06, + "loss": 0.709, + "step": 58129 + }, + { + "epoch": 1.49, + "learning_rate": 1.0594563896943373e-06, + "loss": 0.8003, + "step": 58130 + }, + { + "epoch": 1.49, + "learning_rate": 1.0594287681693718e-06, + "loss": 0.6631, + "step": 58131 + }, + { + "epoch": 1.49, + "learning_rate": 1.0594011465989043e-06, + "loss": 0.5277, + "step": 58132 + }, + { + "epoch": 1.49, + "learning_rate": 1.0593735249829564e-06, + "loss": 0.5554, + "step": 58133 + }, + { + "epoch": 1.49, + "learning_rate": 1.0593459033215487e-06, + "loss": 0.6953, + "step": 58134 + }, + { + "epoch": 1.49, + "learning_rate": 1.0593182816147025e-06, + "loss": 0.584, + "step": 58135 + }, + { + "epoch": 1.49, + "learning_rate": 1.059290659862439e-06, + "loss": 0.749, + "step": 58136 + }, + { + "epoch": 1.49, + "learning_rate": 1.0592630380647797e-06, + "loss": 0.5386, + "step": 58137 + }, + { + "epoch": 1.49, + "learning_rate": 1.059235416221745e-06, + "loss": 0.5209, + "step": 58138 + }, + { + "epoch": 1.49, + "learning_rate": 1.0592077943333569e-06, + "loss": 0.563, + "step": 58139 + }, + { + "epoch": 1.49, + "learning_rate": 1.059180172399636e-06, + "loss": 0.7725, + "step": 58140 + }, + { + "epoch": 1.49, + "learning_rate": 1.0591525504206033e-06, + "loss": 0.7773, + "step": 58141 + }, + { + "epoch": 1.49, + "learning_rate": 1.0591249283962805e-06, + "loss": 0.6562, + "step": 58142 + }, + { + "epoch": 1.49, + "learning_rate": 1.0590973063266882e-06, + "loss": 0.6162, + "step": 58143 + }, + { + "epoch": 1.49, + "learning_rate": 1.059069684211848e-06, + "loss": 0.708, + "step": 58144 + }, + { + "epoch": 1.49, + "learning_rate": 1.0590420620517809e-06, + "loss": 0.6655, + "step": 58145 + }, + { + "epoch": 1.49, + "learning_rate": 1.059014439846508e-06, + "loss": 0.7754, + "step": 58146 + }, + { + "epoch": 1.49, + "learning_rate": 1.0589868175960502e-06, + "loss": 0.6069, + "step": 58147 + }, + { + "epoch": 1.49, + "learning_rate": 1.058959195300429e-06, + "loss": 0.6992, + "step": 58148 + }, + { + "epoch": 1.49, + "learning_rate": 1.0589315729596654e-06, + "loss": 0.6294, + "step": 58149 + }, + { + "epoch": 1.49, + "learning_rate": 1.0589039505737808e-06, + "loss": 0.609, + "step": 58150 + }, + { + "epoch": 1.49, + "learning_rate": 1.0588763281427962e-06, + "loss": 0.5664, + "step": 58151 + }, + { + "epoch": 1.49, + "learning_rate": 1.0588487056667326e-06, + "loss": 0.7832, + "step": 58152 + }, + { + "epoch": 1.49, + "learning_rate": 1.058821083145611e-06, + "loss": 0.7549, + "step": 58153 + }, + { + "epoch": 1.49, + "learning_rate": 1.0587934605794533e-06, + "loss": 0.6377, + "step": 58154 + }, + { + "epoch": 1.49, + "learning_rate": 1.0587658379682798e-06, + "loss": 0.8076, + "step": 58155 + }, + { + "epoch": 1.49, + "learning_rate": 1.0587382153121123e-06, + "loss": 0.446, + "step": 58156 + }, + { + "epoch": 1.49, + "learning_rate": 1.0587105926109712e-06, + "loss": 0.7617, + "step": 58157 + }, + { + "epoch": 1.49, + "learning_rate": 1.0586829698648785e-06, + "loss": 0.5039, + "step": 58158 + }, + { + "epoch": 1.49, + "learning_rate": 1.0586553470738545e-06, + "loss": 0.6016, + "step": 58159 + }, + { + "epoch": 1.49, + "learning_rate": 1.058627724237921e-06, + "loss": 0.7119, + "step": 58160 + }, + { + "epoch": 1.49, + "learning_rate": 1.0586001013570993e-06, + "loss": 0.6748, + "step": 58161 + }, + { + "epoch": 1.49, + "learning_rate": 1.0585724784314098e-06, + "loss": 0.625, + "step": 58162 + }, + { + "epoch": 1.49, + "learning_rate": 1.0585448554608743e-06, + "loss": 0.5459, + "step": 58163 + }, + { + "epoch": 1.49, + "learning_rate": 1.0585172324455134e-06, + "loss": 0.791, + "step": 58164 + }, + { + "epoch": 1.49, + "learning_rate": 1.058489609385349e-06, + "loss": 0.5205, + "step": 58165 + }, + { + "epoch": 1.49, + "learning_rate": 1.0584619862804014e-06, + "loss": 0.7998, + "step": 58166 + }, + { + "epoch": 1.49, + "learning_rate": 1.0584343631306922e-06, + "loss": 0.6865, + "step": 58167 + }, + { + "epoch": 1.49, + "learning_rate": 1.0584067399362423e-06, + "loss": 0.6543, + "step": 58168 + }, + { + "epoch": 1.49, + "learning_rate": 1.0583791166970735e-06, + "loss": 0.771, + "step": 58169 + }, + { + "epoch": 1.49, + "learning_rate": 1.0583514934132062e-06, + "loss": 0.7197, + "step": 58170 + }, + { + "epoch": 1.49, + "learning_rate": 1.058323870084662e-06, + "loss": 0.647, + "step": 58171 + }, + { + "epoch": 1.49, + "learning_rate": 1.0582962467114618e-06, + "loss": 0.5942, + "step": 58172 + }, + { + "epoch": 1.49, + "learning_rate": 1.0582686232936268e-06, + "loss": 0.6523, + "step": 58173 + }, + { + "epoch": 1.49, + "learning_rate": 1.0582409998311782e-06, + "loss": 0.5836, + "step": 58174 + }, + { + "epoch": 1.49, + "learning_rate": 1.0582133763241376e-06, + "loss": 0.4434, + "step": 58175 + }, + { + "epoch": 1.49, + "learning_rate": 1.058185752772525e-06, + "loss": 0.5903, + "step": 58176 + }, + { + "epoch": 1.49, + "learning_rate": 1.0581581291763628e-06, + "loss": 0.5986, + "step": 58177 + }, + { + "epoch": 1.49, + "learning_rate": 1.0581305055356711e-06, + "loss": 0.5933, + "step": 58178 + }, + { + "epoch": 1.49, + "learning_rate": 1.058102881850472e-06, + "loss": 0.6445, + "step": 58179 + }, + { + "epoch": 1.49, + "learning_rate": 1.058075258120786e-06, + "loss": 0.7559, + "step": 58180 + }, + { + "epoch": 1.49, + "learning_rate": 1.0580476343466343e-06, + "loss": 0.7251, + "step": 58181 + }, + { + "epoch": 1.49, + "learning_rate": 1.0580200105280383e-06, + "loss": 0.6865, + "step": 58182 + }, + { + "epoch": 1.49, + "learning_rate": 1.057992386665019e-06, + "loss": 0.623, + "step": 58183 + }, + { + "epoch": 1.49, + "learning_rate": 1.0579647627575979e-06, + "loss": 0.7988, + "step": 58184 + }, + { + "epoch": 1.49, + "learning_rate": 1.0579371388057957e-06, + "loss": 0.5908, + "step": 58185 + }, + { + "epoch": 1.49, + "learning_rate": 1.0579095148096335e-06, + "loss": 0.7129, + "step": 58186 + }, + { + "epoch": 1.49, + "learning_rate": 1.0578818907691326e-06, + "loss": 0.7676, + "step": 58187 + }, + { + "epoch": 1.49, + "learning_rate": 1.0578542666843145e-06, + "loss": 0.5232, + "step": 58188 + }, + { + "epoch": 1.49, + "learning_rate": 1.0578266425551995e-06, + "loss": 0.6567, + "step": 58189 + }, + { + "epoch": 1.49, + "learning_rate": 1.0577990183818102e-06, + "loss": 0.5382, + "step": 58190 + }, + { + "epoch": 1.49, + "learning_rate": 1.0577713941641663e-06, + "loss": 0.584, + "step": 58191 + }, + { + "epoch": 1.49, + "learning_rate": 1.0577437699022895e-06, + "loss": 0.75, + "step": 58192 + }, + { + "epoch": 1.49, + "learning_rate": 1.057716145596201e-06, + "loss": 0.5786, + "step": 58193 + }, + { + "epoch": 1.49, + "learning_rate": 1.0576885212459219e-06, + "loss": 0.5837, + "step": 58194 + }, + { + "epoch": 1.49, + "learning_rate": 1.0576608968514734e-06, + "loss": 0.4268, + "step": 58195 + }, + { + "epoch": 1.49, + "learning_rate": 1.0576332724128767e-06, + "loss": 0.6758, + "step": 58196 + }, + { + "epoch": 1.49, + "learning_rate": 1.0576056479301526e-06, + "loss": 0.6074, + "step": 58197 + }, + { + "epoch": 1.49, + "learning_rate": 1.0575780234033224e-06, + "loss": 0.6953, + "step": 58198 + }, + { + "epoch": 1.49, + "learning_rate": 1.0575503988324076e-06, + "loss": 0.7119, + "step": 58199 + }, + { + "epoch": 1.49, + "learning_rate": 1.0575227742174294e-06, + "loss": 0.6367, + "step": 58200 + }, + { + "epoch": 1.49, + "learning_rate": 1.057495149558408e-06, + "loss": 0.7334, + "step": 58201 + }, + { + "epoch": 1.49, + "learning_rate": 1.0574675248553658e-06, + "loss": 0.485, + "step": 58202 + }, + { + "epoch": 1.49, + "learning_rate": 1.057439900108323e-06, + "loss": 0.4888, + "step": 58203 + }, + { + "epoch": 1.49, + "learning_rate": 1.057412275317301e-06, + "loss": 0.4397, + "step": 58204 + }, + { + "epoch": 1.49, + "learning_rate": 1.0573846504823216e-06, + "loss": 0.7412, + "step": 58205 + }, + { + "epoch": 1.49, + "learning_rate": 1.0573570256034048e-06, + "loss": 0.5068, + "step": 58206 + }, + { + "epoch": 1.49, + "learning_rate": 1.057329400680573e-06, + "loss": 0.709, + "step": 58207 + }, + { + "epoch": 1.49, + "learning_rate": 1.0573017757138461e-06, + "loss": 0.5859, + "step": 58208 + }, + { + "epoch": 1.49, + "learning_rate": 1.0572741507032462e-06, + "loss": 0.7588, + "step": 58209 + }, + { + "epoch": 1.49, + "learning_rate": 1.057246525648794e-06, + "loss": 0.707, + "step": 58210 + }, + { + "epoch": 1.49, + "learning_rate": 1.0572189005505108e-06, + "loss": 0.4924, + "step": 58211 + }, + { + "epoch": 1.49, + "learning_rate": 1.0571912754084175e-06, + "loss": 0.6816, + "step": 58212 + }, + { + "epoch": 1.49, + "learning_rate": 1.0571636502225358e-06, + "loss": 0.6299, + "step": 58213 + }, + { + "epoch": 1.49, + "learning_rate": 1.0571360249928865e-06, + "loss": 0.4675, + "step": 58214 + }, + { + "epoch": 1.49, + "learning_rate": 1.057108399719491e-06, + "loss": 0.6685, + "step": 58215 + }, + { + "epoch": 1.49, + "learning_rate": 1.0570807744023696e-06, + "loss": 0.5898, + "step": 58216 + }, + { + "epoch": 1.49, + "learning_rate": 1.0570531490415444e-06, + "loss": 0.4187, + "step": 58217 + }, + { + "epoch": 1.49, + "learning_rate": 1.0570255236370363e-06, + "loss": 0.71, + "step": 58218 + }, + { + "epoch": 1.49, + "learning_rate": 1.0569978981888663e-06, + "loss": 0.562, + "step": 58219 + }, + { + "epoch": 1.49, + "learning_rate": 1.0569702726970555e-06, + "loss": 0.6953, + "step": 58220 + }, + { + "epoch": 1.49, + "learning_rate": 1.0569426471616253e-06, + "loss": 0.7031, + "step": 58221 + }, + { + "epoch": 1.49, + "learning_rate": 1.0569150215825968e-06, + "loss": 0.7074, + "step": 58222 + }, + { + "epoch": 1.49, + "learning_rate": 1.056887395959991e-06, + "loss": 0.6631, + "step": 58223 + }, + { + "epoch": 1.49, + "learning_rate": 1.0568597702938291e-06, + "loss": 0.6904, + "step": 58224 + }, + { + "epoch": 1.49, + "learning_rate": 1.0568321445841325e-06, + "loss": 0.5918, + "step": 58225 + }, + { + "epoch": 1.49, + "learning_rate": 1.056804518830922e-06, + "loss": 0.6826, + "step": 58226 + }, + { + "epoch": 1.49, + "learning_rate": 1.056776893034219e-06, + "loss": 0.4463, + "step": 58227 + }, + { + "epoch": 1.49, + "learning_rate": 1.056749267194044e-06, + "loss": 0.7339, + "step": 58228 + }, + { + "epoch": 1.49, + "learning_rate": 1.0567216413104194e-06, + "loss": 0.6143, + "step": 58229 + }, + { + "epoch": 1.49, + "learning_rate": 1.0566940153833654e-06, + "loss": 0.5266, + "step": 58230 + }, + { + "epoch": 1.49, + "learning_rate": 1.0566663894129033e-06, + "loss": 0.645, + "step": 58231 + }, + { + "epoch": 1.49, + "learning_rate": 1.0566387633990545e-06, + "loss": 0.7129, + "step": 58232 + }, + { + "epoch": 1.49, + "learning_rate": 1.0566111373418399e-06, + "loss": 0.7285, + "step": 58233 + }, + { + "epoch": 1.49, + "learning_rate": 1.0565835112412807e-06, + "loss": 0.5386, + "step": 58234 + }, + { + "epoch": 1.49, + "learning_rate": 1.0565558850973983e-06, + "loss": 0.708, + "step": 58235 + }, + { + "epoch": 1.49, + "learning_rate": 1.0565282589102135e-06, + "loss": 0.9082, + "step": 58236 + }, + { + "epoch": 1.49, + "learning_rate": 1.0565006326797477e-06, + "loss": 0.5706, + "step": 58237 + }, + { + "epoch": 1.49, + "learning_rate": 1.056473006406022e-06, + "loss": 0.6719, + "step": 58238 + }, + { + "epoch": 1.49, + "learning_rate": 1.056445380089057e-06, + "loss": 0.6797, + "step": 58239 + }, + { + "epoch": 1.49, + "learning_rate": 1.0564177537288751e-06, + "loss": 0.6616, + "step": 58240 + }, + { + "epoch": 1.49, + "learning_rate": 1.0563901273254966e-06, + "loss": 0.7139, + "step": 58241 + }, + { + "epoch": 1.49, + "learning_rate": 1.0563625008789425e-06, + "loss": 0.8149, + "step": 58242 + }, + { + "epoch": 1.49, + "learning_rate": 1.0563348743892341e-06, + "loss": 0.7969, + "step": 58243 + }, + { + "epoch": 1.49, + "learning_rate": 1.056307247856393e-06, + "loss": 0.6279, + "step": 58244 + }, + { + "epoch": 1.49, + "learning_rate": 1.0562796212804401e-06, + "loss": 0.7754, + "step": 58245 + }, + { + "epoch": 1.49, + "learning_rate": 1.0562519946613964e-06, + "loss": 0.6475, + "step": 58246 + }, + { + "epoch": 1.49, + "learning_rate": 1.0562243679992828e-06, + "loss": 0.624, + "step": 58247 + }, + { + "epoch": 1.49, + "learning_rate": 1.056196741294121e-06, + "loss": 0.7363, + "step": 58248 + }, + { + "epoch": 1.49, + "learning_rate": 1.056169114545932e-06, + "loss": 0.9355, + "step": 58249 + }, + { + "epoch": 1.49, + "learning_rate": 1.0561414877547368e-06, + "loss": 0.4019, + "step": 58250 + }, + { + "epoch": 1.49, + "learning_rate": 1.056113860920557e-06, + "loss": 0.792, + "step": 58251 + }, + { + "epoch": 1.49, + "learning_rate": 1.0560862340434127e-06, + "loss": 0.7158, + "step": 58252 + }, + { + "epoch": 1.49, + "learning_rate": 1.0560586071233263e-06, + "loss": 0.7578, + "step": 58253 + }, + { + "epoch": 1.49, + "learning_rate": 1.0560309801603182e-06, + "loss": 0.645, + "step": 58254 + }, + { + "epoch": 1.49, + "learning_rate": 1.0560033531544102e-06, + "loss": 0.7188, + "step": 58255 + }, + { + "epoch": 1.49, + "learning_rate": 1.0559757261056224e-06, + "loss": 0.6533, + "step": 58256 + }, + { + "epoch": 1.49, + "learning_rate": 1.055948099013977e-06, + "loss": 0.6089, + "step": 58257 + }, + { + "epoch": 1.49, + "learning_rate": 1.0559204718794942e-06, + "loss": 0.6748, + "step": 58258 + }, + { + "epoch": 1.49, + "learning_rate": 1.055892844702196e-06, + "loss": 0.749, + "step": 58259 + }, + { + "epoch": 1.49, + "learning_rate": 1.0558652174821033e-06, + "loss": 0.7656, + "step": 58260 + }, + { + "epoch": 1.49, + "learning_rate": 1.055837590219237e-06, + "loss": 0.5234, + "step": 58261 + }, + { + "epoch": 1.49, + "learning_rate": 1.0558099629136183e-06, + "loss": 0.6016, + "step": 58262 + }, + { + "epoch": 1.49, + "learning_rate": 1.0557823355652686e-06, + "loss": 0.6201, + "step": 58263 + }, + { + "epoch": 1.49, + "learning_rate": 1.0557547081742088e-06, + "loss": 0.6597, + "step": 58264 + }, + { + "epoch": 1.49, + "learning_rate": 1.0557270807404608e-06, + "loss": 0.5327, + "step": 58265 + }, + { + "epoch": 1.49, + "learning_rate": 1.0556994532640447e-06, + "loss": 0.5654, + "step": 58266 + }, + { + "epoch": 1.49, + "learning_rate": 1.0556718257449819e-06, + "loss": 0.4829, + "step": 58267 + }, + { + "epoch": 1.49, + "learning_rate": 1.055644198183294e-06, + "loss": 0.6851, + "step": 58268 + }, + { + "epoch": 1.49, + "learning_rate": 1.055616570579002e-06, + "loss": 0.8701, + "step": 58269 + }, + { + "epoch": 1.49, + "learning_rate": 1.0555889429321267e-06, + "loss": 0.5017, + "step": 58270 + }, + { + "epoch": 1.49, + "learning_rate": 1.0555613152426894e-06, + "loss": 0.479, + "step": 58271 + }, + { + "epoch": 1.49, + "learning_rate": 1.0555336875107115e-06, + "loss": 0.8398, + "step": 58272 + }, + { + "epoch": 1.49, + "learning_rate": 1.0555060597362143e-06, + "loss": 0.6182, + "step": 58273 + }, + { + "epoch": 1.49, + "learning_rate": 1.0554784319192183e-06, + "loss": 0.8008, + "step": 58274 + }, + { + "epoch": 1.49, + "learning_rate": 1.055450804059745e-06, + "loss": 0.6279, + "step": 58275 + }, + { + "epoch": 1.49, + "learning_rate": 1.0554231761578159e-06, + "loss": 0.4871, + "step": 58276 + }, + { + "epoch": 1.49, + "learning_rate": 1.0553955482134513e-06, + "loss": 0.7476, + "step": 58277 + }, + { + "epoch": 1.49, + "learning_rate": 1.0553679202266734e-06, + "loss": 0.7451, + "step": 58278 + }, + { + "epoch": 1.49, + "learning_rate": 1.0553402921975024e-06, + "loss": 0.665, + "step": 58279 + }, + { + "epoch": 1.49, + "learning_rate": 1.0553126641259604e-06, + "loss": 0.6069, + "step": 58280 + }, + { + "epoch": 1.49, + "learning_rate": 1.0552850360120675e-06, + "loss": 0.6782, + "step": 58281 + }, + { + "epoch": 1.49, + "learning_rate": 1.0552574078558457e-06, + "loss": 0.3735, + "step": 58282 + }, + { + "epoch": 1.49, + "learning_rate": 1.0552297796573158e-06, + "loss": 0.709, + "step": 58283 + }, + { + "epoch": 1.49, + "learning_rate": 1.055202151416499e-06, + "loss": 0.6494, + "step": 58284 + }, + { + "epoch": 1.49, + "learning_rate": 1.0551745231334165e-06, + "loss": 0.5156, + "step": 58285 + }, + { + "epoch": 1.49, + "learning_rate": 1.0551468948080893e-06, + "loss": 0.5635, + "step": 58286 + }, + { + "epoch": 1.49, + "learning_rate": 1.0551192664405385e-06, + "loss": 0.6831, + "step": 58287 + }, + { + "epoch": 1.49, + "learning_rate": 1.0550916380307856e-06, + "loss": 0.5298, + "step": 58288 + }, + { + "epoch": 1.49, + "learning_rate": 1.0550640095788516e-06, + "loss": 0.7158, + "step": 58289 + }, + { + "epoch": 1.49, + "learning_rate": 1.0550363810847577e-06, + "loss": 0.7559, + "step": 58290 + }, + { + "epoch": 1.49, + "learning_rate": 1.055008752548525e-06, + "loss": 0.665, + "step": 58291 + }, + { + "epoch": 1.49, + "learning_rate": 1.0549811239701745e-06, + "loss": 0.6416, + "step": 58292 + }, + { + "epoch": 1.49, + "learning_rate": 1.0549534953497272e-06, + "loss": 0.6016, + "step": 58293 + }, + { + "epoch": 1.49, + "learning_rate": 1.0549258666872049e-06, + "loss": 0.7432, + "step": 58294 + }, + { + "epoch": 1.49, + "learning_rate": 1.0548982379826284e-06, + "loss": 0.5854, + "step": 58295 + }, + { + "epoch": 1.49, + "learning_rate": 1.0548706092360184e-06, + "loss": 0.5308, + "step": 58296 + }, + { + "epoch": 1.49, + "learning_rate": 1.054842980447397e-06, + "loss": 0.4374, + "step": 58297 + }, + { + "epoch": 1.49, + "learning_rate": 1.0548153516167846e-06, + "loss": 0.5562, + "step": 58298 + }, + { + "epoch": 1.49, + "learning_rate": 1.0547877227442027e-06, + "loss": 0.4853, + "step": 58299 + }, + { + "epoch": 1.49, + "learning_rate": 1.0547600938296724e-06, + "loss": 0.8037, + "step": 58300 + }, + { + "epoch": 1.49, + "learning_rate": 1.054732464873215e-06, + "loss": 0.6055, + "step": 58301 + }, + { + "epoch": 1.49, + "learning_rate": 1.0547048358748509e-06, + "loss": 0.6455, + "step": 58302 + }, + { + "epoch": 1.49, + "learning_rate": 1.0546772068346025e-06, + "loss": 0.479, + "step": 58303 + }, + { + "epoch": 1.49, + "learning_rate": 1.0546495777524894e-06, + "loss": 0.5101, + "step": 58304 + }, + { + "epoch": 1.49, + "learning_rate": 1.0546219486285347e-06, + "loss": 0.749, + "step": 58305 + }, + { + "epoch": 1.49, + "learning_rate": 1.0545943194627579e-06, + "loss": 0.6709, + "step": 58306 + }, + { + "epoch": 1.49, + "learning_rate": 1.0545666902551806e-06, + "loss": 0.6973, + "step": 58307 + }, + { + "epoch": 1.49, + "learning_rate": 1.0545390610058241e-06, + "loss": 0.6108, + "step": 58308 + }, + { + "epoch": 1.49, + "learning_rate": 1.05451143171471e-06, + "loss": 0.6055, + "step": 58309 + }, + { + "epoch": 1.49, + "learning_rate": 1.0544838023818587e-06, + "loss": 0.6406, + "step": 58310 + }, + { + "epoch": 1.49, + "learning_rate": 1.0544561730072919e-06, + "loss": 0.7979, + "step": 58311 + }, + { + "epoch": 1.49, + "learning_rate": 1.05442854359103e-06, + "loss": 0.5227, + "step": 58312 + }, + { + "epoch": 1.49, + "learning_rate": 1.054400914133095e-06, + "loss": 0.531, + "step": 58313 + }, + { + "epoch": 1.49, + "learning_rate": 1.0543732846335077e-06, + "loss": 0.7109, + "step": 58314 + }, + { + "epoch": 1.49, + "learning_rate": 1.0543456550922892e-06, + "loss": 0.6606, + "step": 58315 + }, + { + "epoch": 1.49, + "learning_rate": 1.0543180255094607e-06, + "loss": 0.6846, + "step": 58316 + }, + { + "epoch": 1.49, + "learning_rate": 1.0542903958850438e-06, + "loss": 0.4963, + "step": 58317 + }, + { + "epoch": 1.49, + "learning_rate": 1.0542627662190589e-06, + "loss": 0.7451, + "step": 58318 + }, + { + "epoch": 1.49, + "learning_rate": 1.0542351365115274e-06, + "loss": 0.6392, + "step": 58319 + }, + { + "epoch": 1.49, + "learning_rate": 1.0542075067624708e-06, + "loss": 0.5283, + "step": 58320 + }, + { + "epoch": 1.49, + "learning_rate": 1.0541798769719096e-06, + "loss": 0.4907, + "step": 58321 + }, + { + "epoch": 1.49, + "learning_rate": 1.0541522471398658e-06, + "loss": 0.6709, + "step": 58322 + }, + { + "epoch": 1.49, + "learning_rate": 1.0541246172663597e-06, + "loss": 0.6426, + "step": 58323 + }, + { + "epoch": 1.49, + "learning_rate": 1.0540969873514134e-06, + "loss": 0.5371, + "step": 58324 + }, + { + "epoch": 1.49, + "learning_rate": 1.0540693573950472e-06, + "loss": 0.6685, + "step": 58325 + }, + { + "epoch": 1.49, + "learning_rate": 1.0540417273972826e-06, + "loss": 0.6201, + "step": 58326 + }, + { + "epoch": 1.49, + "learning_rate": 1.0540140973581406e-06, + "loss": 0.5547, + "step": 58327 + }, + { + "epoch": 1.49, + "learning_rate": 1.053986467277643e-06, + "loss": 0.7168, + "step": 58328 + }, + { + "epoch": 1.5, + "learning_rate": 1.0539588371558097e-06, + "loss": 0.606, + "step": 58329 + }, + { + "epoch": 1.5, + "learning_rate": 1.0539312069926634e-06, + "loss": 0.3275, + "step": 58330 + }, + { + "epoch": 1.5, + "learning_rate": 1.053903576788224e-06, + "loss": 0.8062, + "step": 58331 + }, + { + "epoch": 1.5, + "learning_rate": 1.0538759465425131e-06, + "loss": 0.5244, + "step": 58332 + }, + { + "epoch": 1.5, + "learning_rate": 1.0538483162555516e-06, + "loss": 0.7559, + "step": 58333 + }, + { + "epoch": 1.5, + "learning_rate": 1.0538206859273615e-06, + "loss": 0.4357, + "step": 58334 + }, + { + "epoch": 1.5, + "learning_rate": 1.0537930555579631e-06, + "loss": 0.5488, + "step": 58335 + }, + { + "epoch": 1.5, + "learning_rate": 1.053765425147378e-06, + "loss": 0.6025, + "step": 58336 + }, + { + "epoch": 1.5, + "learning_rate": 1.0537377946956267e-06, + "loss": 0.5386, + "step": 58337 + }, + { + "epoch": 1.5, + "learning_rate": 1.0537101642027312e-06, + "loss": 0.7031, + "step": 58338 + }, + { + "epoch": 1.5, + "learning_rate": 1.0536825336687122e-06, + "loss": 0.5957, + "step": 58339 + }, + { + "epoch": 1.5, + "learning_rate": 1.053654903093591e-06, + "loss": 0.53, + "step": 58340 + }, + { + "epoch": 1.5, + "learning_rate": 1.0536272724773888e-06, + "loss": 0.6128, + "step": 58341 + }, + { + "epoch": 1.5, + "learning_rate": 1.0535996418201266e-06, + "loss": 0.7031, + "step": 58342 + }, + { + "epoch": 1.5, + "learning_rate": 1.0535720111218255e-06, + "loss": 0.6494, + "step": 58343 + }, + { + "epoch": 1.5, + "learning_rate": 1.0535443803825067e-06, + "loss": 0.6904, + "step": 58344 + }, + { + "epoch": 1.5, + "learning_rate": 1.0535167496021922e-06, + "loss": 0.6084, + "step": 58345 + }, + { + "epoch": 1.5, + "learning_rate": 1.0534891187809016e-06, + "loss": 0.8672, + "step": 58346 + }, + { + "epoch": 1.5, + "learning_rate": 1.0534614879186569e-06, + "loss": 0.6631, + "step": 58347 + }, + { + "epoch": 1.5, + "learning_rate": 1.0534338570154794e-06, + "loss": 0.6406, + "step": 58348 + }, + { + "epoch": 1.5, + "learning_rate": 1.0534062260713901e-06, + "loss": 0.5269, + "step": 58349 + }, + { + "epoch": 1.5, + "learning_rate": 1.05337859508641e-06, + "loss": 0.502, + "step": 58350 + }, + { + "epoch": 1.5, + "learning_rate": 1.0533509640605605e-06, + "loss": 0.668, + "step": 58351 + }, + { + "epoch": 1.5, + "learning_rate": 1.0533233329938622e-06, + "loss": 0.8418, + "step": 58352 + }, + { + "epoch": 1.5, + "learning_rate": 1.053295701886337e-06, + "loss": 0.5957, + "step": 58353 + }, + { + "epoch": 1.5, + "learning_rate": 1.0532680707380058e-06, + "loss": 0.7471, + "step": 58354 + }, + { + "epoch": 1.5, + "learning_rate": 1.0532404395488896e-06, + "loss": 0.7188, + "step": 58355 + }, + { + "epoch": 1.5, + "learning_rate": 1.0532128083190096e-06, + "loss": 0.6108, + "step": 58356 + }, + { + "epoch": 1.5, + "learning_rate": 1.053185177048387e-06, + "loss": 0.5371, + "step": 58357 + }, + { + "epoch": 1.5, + "learning_rate": 1.053157545737043e-06, + "loss": 0.6167, + "step": 58358 + }, + { + "epoch": 1.5, + "learning_rate": 1.0531299143849985e-06, + "loss": 0.7061, + "step": 58359 + }, + { + "epoch": 1.5, + "learning_rate": 1.0531022829922753e-06, + "loss": 0.5898, + "step": 58360 + }, + { + "epoch": 1.5, + "learning_rate": 1.0530746515588937e-06, + "loss": 0.7451, + "step": 58361 + }, + { + "epoch": 1.5, + "learning_rate": 1.0530470200848755e-06, + "loss": 0.7266, + "step": 58362 + }, + { + "epoch": 1.5, + "learning_rate": 1.0530193885702416e-06, + "loss": 0.6211, + "step": 58363 + }, + { + "epoch": 1.5, + "learning_rate": 1.0529917570150132e-06, + "loss": 0.6328, + "step": 58364 + }, + { + "epoch": 1.5, + "learning_rate": 1.0529641254192113e-06, + "loss": 0.71, + "step": 58365 + }, + { + "epoch": 1.5, + "learning_rate": 1.0529364937828575e-06, + "loss": 0.5649, + "step": 58366 + }, + { + "epoch": 1.5, + "learning_rate": 1.0529088621059724e-06, + "loss": 0.7007, + "step": 58367 + }, + { + "epoch": 1.5, + "learning_rate": 1.0528812303885776e-06, + "loss": 0.6582, + "step": 58368 + }, + { + "epoch": 1.5, + "learning_rate": 1.052853598630694e-06, + "loss": 0.5229, + "step": 58369 + }, + { + "epoch": 1.5, + "learning_rate": 1.052825966832343e-06, + "loss": 0.5342, + "step": 58370 + }, + { + "epoch": 1.5, + "learning_rate": 1.0527983349935453e-06, + "loss": 0.5176, + "step": 58371 + }, + { + "epoch": 1.5, + "learning_rate": 1.0527707031143224e-06, + "loss": 0.6494, + "step": 58372 + }, + { + "epoch": 1.5, + "learning_rate": 1.0527430711946954e-06, + "loss": 0.7686, + "step": 58373 + }, + { + "epoch": 1.5, + "learning_rate": 1.0527154392346858e-06, + "loss": 0.79, + "step": 58374 + }, + { + "epoch": 1.5, + "learning_rate": 1.052687807234314e-06, + "loss": 0.5869, + "step": 58375 + }, + { + "epoch": 1.5, + "learning_rate": 1.0526601751936018e-06, + "loss": 0.6963, + "step": 58376 + }, + { + "epoch": 1.5, + "learning_rate": 1.0526325431125697e-06, + "loss": 0.6631, + "step": 58377 + }, + { + "epoch": 1.5, + "learning_rate": 1.0526049109912396e-06, + "loss": 0.6562, + "step": 58378 + }, + { + "epoch": 1.5, + "learning_rate": 1.0525772788296326e-06, + "loss": 0.5176, + "step": 58379 + }, + { + "epoch": 1.5, + "learning_rate": 1.0525496466277693e-06, + "loss": 0.6836, + "step": 58380 + }, + { + "epoch": 1.5, + "learning_rate": 1.052522014385671e-06, + "loss": 0.6465, + "step": 58381 + }, + { + "epoch": 1.5, + "learning_rate": 1.0524943821033592e-06, + "loss": 0.3567, + "step": 58382 + }, + { + "epoch": 1.5, + "learning_rate": 1.0524667497808548e-06, + "loss": 0.7266, + "step": 58383 + }, + { + "epoch": 1.5, + "learning_rate": 1.052439117418179e-06, + "loss": 0.7344, + "step": 58384 + }, + { + "epoch": 1.5, + "learning_rate": 1.0524114850153532e-06, + "loss": 0.6719, + "step": 58385 + }, + { + "epoch": 1.5, + "learning_rate": 1.0523838525723981e-06, + "loss": 0.5991, + "step": 58386 + }, + { + "epoch": 1.5, + "learning_rate": 1.0523562200893352e-06, + "loss": 0.6299, + "step": 58387 + }, + { + "epoch": 1.5, + "learning_rate": 1.0523285875661853e-06, + "loss": 0.5327, + "step": 58388 + }, + { + "epoch": 1.5, + "learning_rate": 1.0523009550029704e-06, + "loss": 0.6558, + "step": 58389 + }, + { + "epoch": 1.5, + "learning_rate": 1.0522733223997105e-06, + "loss": 0.6025, + "step": 58390 + }, + { + "epoch": 1.5, + "learning_rate": 1.0522456897564276e-06, + "loss": 0.7576, + "step": 58391 + }, + { + "epoch": 1.5, + "learning_rate": 1.0522180570731424e-06, + "loss": 0.6602, + "step": 58392 + }, + { + "epoch": 1.5, + "learning_rate": 1.0521904243498765e-06, + "loss": 0.7266, + "step": 58393 + }, + { + "epoch": 1.5, + "learning_rate": 1.0521627915866507e-06, + "loss": 0.4976, + "step": 58394 + }, + { + "epoch": 1.5, + "learning_rate": 1.0521351587834861e-06, + "loss": 0.5437, + "step": 58395 + }, + { + "epoch": 1.5, + "learning_rate": 1.052107525940404e-06, + "loss": 0.6641, + "step": 58396 + }, + { + "epoch": 1.5, + "learning_rate": 1.0520798930574257e-06, + "loss": 0.7031, + "step": 58397 + }, + { + "epoch": 1.5, + "learning_rate": 1.052052260134572e-06, + "loss": 0.542, + "step": 58398 + }, + { + "epoch": 1.5, + "learning_rate": 1.0520246271718646e-06, + "loss": 0.6348, + "step": 58399 + }, + { + "epoch": 1.5, + "learning_rate": 1.0519969941693242e-06, + "loss": 0.6953, + "step": 58400 + }, + { + "epoch": 1.5, + "learning_rate": 1.0519693611269721e-06, + "loss": 0.5923, + "step": 58401 + }, + { + "epoch": 1.5, + "learning_rate": 1.0519417280448292e-06, + "loss": 0.7402, + "step": 58402 + }, + { + "epoch": 1.5, + "learning_rate": 1.0519140949229173e-06, + "loss": 0.6699, + "step": 58403 + }, + { + "epoch": 1.5, + "learning_rate": 1.051886461761257e-06, + "loss": 0.7725, + "step": 58404 + }, + { + "epoch": 1.5, + "learning_rate": 1.0518588285598695e-06, + "loss": 0.5859, + "step": 58405 + }, + { + "epoch": 1.5, + "learning_rate": 1.0518311953187762e-06, + "loss": 0.6069, + "step": 58406 + }, + { + "epoch": 1.5, + "learning_rate": 1.0518035620379981e-06, + "loss": 0.6616, + "step": 58407 + }, + { + "epoch": 1.5, + "learning_rate": 1.0517759287175565e-06, + "loss": 0.4846, + "step": 58408 + }, + { + "epoch": 1.5, + "learning_rate": 1.0517482953574722e-06, + "loss": 0.4429, + "step": 58409 + }, + { + "epoch": 1.5, + "learning_rate": 1.051720661957767e-06, + "loss": 0.7173, + "step": 58410 + }, + { + "epoch": 1.5, + "learning_rate": 1.0516930285184614e-06, + "loss": 0.5498, + "step": 58411 + }, + { + "epoch": 1.5, + "learning_rate": 1.051665395039577e-06, + "loss": 0.5005, + "step": 58412 + }, + { + "epoch": 1.5, + "learning_rate": 1.0516377615211346e-06, + "loss": 0.7881, + "step": 58413 + }, + { + "epoch": 1.5, + "learning_rate": 1.0516101279631557e-06, + "loss": 0.5669, + "step": 58414 + }, + { + "epoch": 1.5, + "learning_rate": 1.051582494365661e-06, + "loss": 0.8184, + "step": 58415 + }, + { + "epoch": 1.5, + "learning_rate": 1.0515548607286723e-06, + "loss": 0.481, + "step": 58416 + }, + { + "epoch": 1.5, + "learning_rate": 1.0515272270522103e-06, + "loss": 0.6465, + "step": 58417 + }, + { + "epoch": 1.5, + "learning_rate": 1.0514995933362961e-06, + "loss": 0.5596, + "step": 58418 + }, + { + "epoch": 1.5, + "learning_rate": 1.0514719595809514e-06, + "loss": 0.4922, + "step": 58419 + }, + { + "epoch": 1.5, + "learning_rate": 1.0514443257861967e-06, + "loss": 0.5581, + "step": 58420 + }, + { + "epoch": 1.5, + "learning_rate": 1.0514166919520533e-06, + "loss": 0.6582, + "step": 58421 + }, + { + "epoch": 1.5, + "learning_rate": 1.051389058078543e-06, + "loss": 0.6973, + "step": 58422 + }, + { + "epoch": 1.5, + "learning_rate": 1.0513614241656858e-06, + "loss": 0.7744, + "step": 58423 + }, + { + "epoch": 1.5, + "learning_rate": 1.051333790213504e-06, + "loss": 0.7041, + "step": 58424 + }, + { + "epoch": 1.5, + "learning_rate": 1.0513061562220182e-06, + "loss": 0.5425, + "step": 58425 + }, + { + "epoch": 1.5, + "learning_rate": 1.0512785221912497e-06, + "loss": 0.7051, + "step": 58426 + }, + { + "epoch": 1.5, + "learning_rate": 1.0512508881212195e-06, + "loss": 0.625, + "step": 58427 + }, + { + "epoch": 1.5, + "learning_rate": 1.0512232540119487e-06, + "loss": 0.5669, + "step": 58428 + }, + { + "epoch": 1.5, + "learning_rate": 1.051195619863459e-06, + "loss": 0.8115, + "step": 58429 + }, + { + "epoch": 1.5, + "learning_rate": 1.0511679856757707e-06, + "loss": 0.709, + "step": 58430 + }, + { + "epoch": 1.5, + "learning_rate": 1.0511403514489056e-06, + "loss": 0.7324, + "step": 58431 + }, + { + "epoch": 1.5, + "learning_rate": 1.0511127171828846e-06, + "loss": 0.752, + "step": 58432 + }, + { + "epoch": 1.5, + "learning_rate": 1.051085082877729e-06, + "loss": 0.5711, + "step": 58433 + }, + { + "epoch": 1.5, + "learning_rate": 1.0510574485334603e-06, + "loss": 0.4685, + "step": 58434 + }, + { + "epoch": 1.5, + "learning_rate": 1.051029814150099e-06, + "loss": 0.5928, + "step": 58435 + }, + { + "epoch": 1.5, + "learning_rate": 1.0510021797276662e-06, + "loss": 0.4385, + "step": 58436 + }, + { + "epoch": 1.5, + "learning_rate": 1.0509745452661838e-06, + "loss": 0.5908, + "step": 58437 + }, + { + "epoch": 1.5, + "learning_rate": 1.0509469107656721e-06, + "loss": 0.7393, + "step": 58438 + }, + { + "epoch": 1.5, + "learning_rate": 1.0509192762261534e-06, + "loss": 0.7256, + "step": 58439 + }, + { + "epoch": 1.5, + "learning_rate": 1.0508916416476474e-06, + "loss": 0.563, + "step": 58440 + }, + { + "epoch": 1.5, + "learning_rate": 1.0508640070301763e-06, + "loss": 0.5493, + "step": 58441 + }, + { + "epoch": 1.5, + "learning_rate": 1.050836372373761e-06, + "loss": 0.7881, + "step": 58442 + }, + { + "epoch": 1.5, + "learning_rate": 1.0508087376784228e-06, + "loss": 0.5332, + "step": 58443 + }, + { + "epoch": 1.5, + "learning_rate": 1.0507811029441823e-06, + "loss": 0.5649, + "step": 58444 + }, + { + "epoch": 1.5, + "learning_rate": 1.0507534681710614e-06, + "loss": 0.7373, + "step": 58445 + }, + { + "epoch": 1.5, + "learning_rate": 1.0507258333590807e-06, + "loss": 0.6641, + "step": 58446 + }, + { + "epoch": 1.5, + "learning_rate": 1.0506981985082617e-06, + "loss": 0.668, + "step": 58447 + }, + { + "epoch": 1.5, + "learning_rate": 1.0506705636186252e-06, + "loss": 0.8242, + "step": 58448 + }, + { + "epoch": 1.5, + "learning_rate": 1.0506429286901928e-06, + "loss": 0.7422, + "step": 58449 + }, + { + "epoch": 1.5, + "learning_rate": 1.0506152937229852e-06, + "loss": 0.4829, + "step": 58450 + }, + { + "epoch": 1.5, + "learning_rate": 1.0505876587170238e-06, + "loss": 0.6865, + "step": 58451 + }, + { + "epoch": 1.5, + "learning_rate": 1.0505600236723302e-06, + "loss": 0.4529, + "step": 58452 + }, + { + "epoch": 1.5, + "learning_rate": 1.0505323885889248e-06, + "loss": 0.6343, + "step": 58453 + }, + { + "epoch": 1.5, + "learning_rate": 1.0505047534668292e-06, + "loss": 0.6841, + "step": 58454 + }, + { + "epoch": 1.5, + "learning_rate": 1.050477118306064e-06, + "loss": 0.6855, + "step": 58455 + }, + { + "epoch": 1.5, + "learning_rate": 1.0504494831066514e-06, + "loss": 0.7075, + "step": 58456 + }, + { + "epoch": 1.5, + "learning_rate": 1.0504218478686116e-06, + "loss": 0.4905, + "step": 58457 + }, + { + "epoch": 1.5, + "learning_rate": 1.050394212591966e-06, + "loss": 0.7246, + "step": 58458 + }, + { + "epoch": 1.5, + "learning_rate": 1.0503665772767362e-06, + "loss": 0.7607, + "step": 58459 + }, + { + "epoch": 1.5, + "learning_rate": 1.050338941922943e-06, + "loss": 0.6377, + "step": 58460 + }, + { + "epoch": 1.5, + "learning_rate": 1.0503113065306073e-06, + "loss": 0.7266, + "step": 58461 + }, + { + "epoch": 1.5, + "learning_rate": 1.0502836710997507e-06, + "loss": 0.6348, + "step": 58462 + }, + { + "epoch": 1.5, + "learning_rate": 1.0502560356303939e-06, + "loss": 0.7598, + "step": 58463 + }, + { + "epoch": 1.5, + "learning_rate": 1.0502284001225591e-06, + "loss": 0.6421, + "step": 58464 + }, + { + "epoch": 1.5, + "learning_rate": 1.0502007645762663e-06, + "loss": 0.5757, + "step": 58465 + }, + { + "epoch": 1.5, + "learning_rate": 1.050173128991537e-06, + "loss": 0.752, + "step": 58466 + }, + { + "epoch": 1.5, + "learning_rate": 1.0501454933683925e-06, + "loss": 0.7529, + "step": 58467 + }, + { + "epoch": 1.5, + "learning_rate": 1.0501178577068539e-06, + "loss": 0.6558, + "step": 58468 + }, + { + "epoch": 1.5, + "learning_rate": 1.0500902220069425e-06, + "loss": 0.5107, + "step": 58469 + }, + { + "epoch": 1.5, + "learning_rate": 1.0500625862686792e-06, + "loss": 0.7188, + "step": 58470 + }, + { + "epoch": 1.5, + "learning_rate": 1.0500349504920851e-06, + "loss": 0.563, + "step": 58471 + }, + { + "epoch": 1.5, + "learning_rate": 1.050007314677182e-06, + "loss": 0.6797, + "step": 58472 + }, + { + "epoch": 1.5, + "learning_rate": 1.0499796788239901e-06, + "loss": 0.665, + "step": 58473 + }, + { + "epoch": 1.5, + "learning_rate": 1.0499520429325312e-06, + "loss": 0.5664, + "step": 58474 + }, + { + "epoch": 1.5, + "learning_rate": 1.0499244070028266e-06, + "loss": 0.7046, + "step": 58475 + }, + { + "epoch": 1.5, + "learning_rate": 1.0498967710348966e-06, + "loss": 0.7495, + "step": 58476 + }, + { + "epoch": 1.5, + "learning_rate": 1.0498691350287636e-06, + "loss": 0.7468, + "step": 58477 + }, + { + "epoch": 1.5, + "learning_rate": 1.0498414989844476e-06, + "loss": 0.5112, + "step": 58478 + }, + { + "epoch": 1.5, + "learning_rate": 1.0498138629019709e-06, + "loss": 0.6641, + "step": 58479 + }, + { + "epoch": 1.5, + "learning_rate": 1.0497862267813533e-06, + "loss": 0.748, + "step": 58480 + }, + { + "epoch": 1.5, + "learning_rate": 1.0497585906226169e-06, + "loss": 0.5366, + "step": 58481 + }, + { + "epoch": 1.5, + "learning_rate": 1.0497309544257826e-06, + "loss": 0.4563, + "step": 58482 + }, + { + "epoch": 1.5, + "learning_rate": 1.049703318190872e-06, + "loss": 0.6519, + "step": 58483 + }, + { + "epoch": 1.5, + "learning_rate": 1.0496756819179053e-06, + "loss": 0.7637, + "step": 58484 + }, + { + "epoch": 1.5, + "learning_rate": 1.0496480456069046e-06, + "loss": 0.6484, + "step": 58485 + }, + { + "epoch": 1.5, + "learning_rate": 1.0496204092578905e-06, + "loss": 0.6177, + "step": 58486 + }, + { + "epoch": 1.5, + "learning_rate": 1.0495927728708845e-06, + "loss": 0.6758, + "step": 58487 + }, + { + "epoch": 1.5, + "learning_rate": 1.049565136445907e-06, + "loss": 0.4912, + "step": 58488 + }, + { + "epoch": 1.5, + "learning_rate": 1.0495374999829807e-06, + "loss": 0.5452, + "step": 58489 + }, + { + "epoch": 1.5, + "learning_rate": 1.0495098634821252e-06, + "loss": 0.5887, + "step": 58490 + }, + { + "epoch": 1.5, + "learning_rate": 1.0494822269433624e-06, + "loss": 0.5928, + "step": 58491 + }, + { + "epoch": 1.5, + "learning_rate": 1.049454590366713e-06, + "loss": 0.7236, + "step": 58492 + }, + { + "epoch": 1.5, + "learning_rate": 1.049426953752199e-06, + "loss": 0.6738, + "step": 58493 + }, + { + "epoch": 1.5, + "learning_rate": 1.049399317099841e-06, + "loss": 0.4467, + "step": 58494 + }, + { + "epoch": 1.5, + "learning_rate": 1.04937168040966e-06, + "loss": 0.5649, + "step": 58495 + }, + { + "epoch": 1.5, + "learning_rate": 1.0493440436816773e-06, + "loss": 0.4194, + "step": 58496 + }, + { + "epoch": 1.5, + "learning_rate": 1.0493164069159144e-06, + "loss": 0.6748, + "step": 58497 + }, + { + "epoch": 1.5, + "learning_rate": 1.049288770112392e-06, + "loss": 0.5095, + "step": 58498 + }, + { + "epoch": 1.5, + "learning_rate": 1.0492611332711319e-06, + "loss": 0.748, + "step": 58499 + }, + { + "epoch": 1.5, + "learning_rate": 1.0492334963921542e-06, + "loss": 0.7246, + "step": 58500 + }, + { + "epoch": 1.5, + "learning_rate": 1.049205859475481e-06, + "loss": 0.6831, + "step": 58501 + }, + { + "epoch": 1.5, + "learning_rate": 1.0491782225211332e-06, + "loss": 0.5317, + "step": 58502 + }, + { + "epoch": 1.5, + "learning_rate": 1.0491505855291316e-06, + "loss": 0.7314, + "step": 58503 + }, + { + "epoch": 1.5, + "learning_rate": 1.0491229484994981e-06, + "loss": 0.6484, + "step": 58504 + }, + { + "epoch": 1.5, + "learning_rate": 1.0490953114322529e-06, + "loss": 0.7314, + "step": 58505 + }, + { + "epoch": 1.5, + "learning_rate": 1.0490676743274181e-06, + "loss": 0.8418, + "step": 58506 + }, + { + "epoch": 1.5, + "learning_rate": 1.0490400371850141e-06, + "loss": 0.666, + "step": 58507 + }, + { + "epoch": 1.5, + "learning_rate": 1.0490124000050626e-06, + "loss": 0.452, + "step": 58508 + }, + { + "epoch": 1.5, + "learning_rate": 1.0489847627875846e-06, + "loss": 0.6348, + "step": 58509 + }, + { + "epoch": 1.5, + "learning_rate": 1.0489571255326012e-06, + "loss": 0.6235, + "step": 58510 + }, + { + "epoch": 1.5, + "learning_rate": 1.0489294882401335e-06, + "loss": 0.5095, + "step": 58511 + }, + { + "epoch": 1.5, + "learning_rate": 1.0489018509102027e-06, + "loss": 0.6445, + "step": 58512 + }, + { + "epoch": 1.5, + "learning_rate": 1.04887421354283e-06, + "loss": 0.5103, + "step": 58513 + }, + { + "epoch": 1.5, + "learning_rate": 1.0488465761380367e-06, + "loss": 0.6973, + "step": 58514 + }, + { + "epoch": 1.5, + "learning_rate": 1.0488189386958436e-06, + "loss": 0.708, + "step": 58515 + }, + { + "epoch": 1.5, + "learning_rate": 1.0487913012162726e-06, + "loss": 0.6338, + "step": 58516 + }, + { + "epoch": 1.5, + "learning_rate": 1.0487636636993437e-06, + "loss": 0.6152, + "step": 58517 + }, + { + "epoch": 1.5, + "learning_rate": 1.048736026145079e-06, + "loss": 0.4949, + "step": 58518 + }, + { + "epoch": 1.5, + "learning_rate": 1.0487083885534996e-06, + "loss": 0.4866, + "step": 58519 + }, + { + "epoch": 1.5, + "learning_rate": 1.0486807509246259e-06, + "loss": 0.5415, + "step": 58520 + }, + { + "epoch": 1.5, + "learning_rate": 1.04865311325848e-06, + "loss": 0.6895, + "step": 58521 + }, + { + "epoch": 1.5, + "learning_rate": 1.0486254755550823e-06, + "loss": 0.5312, + "step": 58522 + }, + { + "epoch": 1.5, + "learning_rate": 1.0485978378144547e-06, + "loss": 0.7021, + "step": 58523 + }, + { + "epoch": 1.5, + "learning_rate": 1.0485702000366178e-06, + "loss": 0.5151, + "step": 58524 + }, + { + "epoch": 1.5, + "learning_rate": 1.048542562221593e-06, + "loss": 0.5029, + "step": 58525 + }, + { + "epoch": 1.5, + "learning_rate": 1.0485149243694012e-06, + "loss": 0.5942, + "step": 58526 + }, + { + "epoch": 1.5, + "learning_rate": 1.0484872864800638e-06, + "loss": 0.5752, + "step": 58527 + }, + { + "epoch": 1.5, + "learning_rate": 1.0484596485536018e-06, + "loss": 0.5535, + "step": 58528 + }, + { + "epoch": 1.5, + "learning_rate": 1.048432010590037e-06, + "loss": 0.6758, + "step": 58529 + }, + { + "epoch": 1.5, + "learning_rate": 1.0484043725893896e-06, + "loss": 0.6392, + "step": 58530 + }, + { + "epoch": 1.5, + "learning_rate": 1.0483767345516813e-06, + "loss": 0.7549, + "step": 58531 + }, + { + "epoch": 1.5, + "learning_rate": 1.0483490964769331e-06, + "loss": 0.6555, + "step": 58532 + }, + { + "epoch": 1.5, + "learning_rate": 1.0483214583651662e-06, + "loss": 0.6724, + "step": 58533 + }, + { + "epoch": 1.5, + "learning_rate": 1.0482938202164021e-06, + "loss": 0.5034, + "step": 58534 + }, + { + "epoch": 1.5, + "learning_rate": 1.0482661820306612e-06, + "loss": 0.6235, + "step": 58535 + }, + { + "epoch": 1.5, + "learning_rate": 1.0482385438079654e-06, + "loss": 0.6943, + "step": 58536 + }, + { + "epoch": 1.5, + "learning_rate": 1.0482109055483355e-06, + "loss": 0.6572, + "step": 58537 + }, + { + "epoch": 1.5, + "learning_rate": 1.0481832672517926e-06, + "loss": 0.5591, + "step": 58538 + }, + { + "epoch": 1.5, + "learning_rate": 1.048155628918358e-06, + "loss": 0.6704, + "step": 58539 + }, + { + "epoch": 1.5, + "learning_rate": 1.0481279905480528e-06, + "loss": 0.6299, + "step": 58540 + }, + { + "epoch": 1.5, + "learning_rate": 1.0481003521408984e-06, + "loss": 0.6289, + "step": 58541 + }, + { + "epoch": 1.5, + "learning_rate": 1.0480727136969156e-06, + "loss": 0.4922, + "step": 58542 + }, + { + "epoch": 1.5, + "learning_rate": 1.048045075216126e-06, + "loss": 0.5938, + "step": 58543 + }, + { + "epoch": 1.5, + "learning_rate": 1.0480174366985503e-06, + "loss": 0.5967, + "step": 58544 + }, + { + "epoch": 1.5, + "learning_rate": 1.04798979814421e-06, + "loss": 0.6548, + "step": 58545 + }, + { + "epoch": 1.5, + "learning_rate": 1.047962159553126e-06, + "loss": 0.5098, + "step": 58546 + }, + { + "epoch": 1.5, + "learning_rate": 1.0479345209253194e-06, + "loss": 0.7256, + "step": 58547 + }, + { + "epoch": 1.5, + "learning_rate": 1.047906882260812e-06, + "loss": 0.6855, + "step": 58548 + }, + { + "epoch": 1.5, + "learning_rate": 1.0478792435596242e-06, + "loss": 0.6299, + "step": 58549 + }, + { + "epoch": 1.5, + "learning_rate": 1.0478516048217775e-06, + "loss": 0.7217, + "step": 58550 + }, + { + "epoch": 1.5, + "learning_rate": 1.0478239660472929e-06, + "loss": 0.6904, + "step": 58551 + }, + { + "epoch": 1.5, + "learning_rate": 1.0477963272361918e-06, + "loss": 0.5503, + "step": 58552 + }, + { + "epoch": 1.5, + "learning_rate": 1.0477686883884951e-06, + "loss": 0.6113, + "step": 58553 + }, + { + "epoch": 1.5, + "learning_rate": 1.0477410495042246e-06, + "loss": 0.5396, + "step": 58554 + }, + { + "epoch": 1.5, + "learning_rate": 1.0477134105834004e-06, + "loss": 0.6748, + "step": 58555 + }, + { + "epoch": 1.5, + "learning_rate": 1.0476857716260447e-06, + "loss": 0.6758, + "step": 58556 + }, + { + "epoch": 1.5, + "learning_rate": 1.0476581326321779e-06, + "loss": 0.605, + "step": 58557 + }, + { + "epoch": 1.5, + "learning_rate": 1.0476304936018215e-06, + "loss": 0.6587, + "step": 58558 + }, + { + "epoch": 1.5, + "learning_rate": 1.047602854534997e-06, + "loss": 0.6025, + "step": 58559 + }, + { + "epoch": 1.5, + "learning_rate": 1.0475752154317248e-06, + "loss": 0.5339, + "step": 58560 + }, + { + "epoch": 1.5, + "learning_rate": 1.0475475762920262e-06, + "loss": 0.6143, + "step": 58561 + }, + { + "epoch": 1.5, + "learning_rate": 1.047519937115923e-06, + "loss": 0.8467, + "step": 58562 + }, + { + "epoch": 1.5, + "learning_rate": 1.0474922979034356e-06, + "loss": 0.6562, + "step": 58563 + }, + { + "epoch": 1.5, + "learning_rate": 1.0474646586545858e-06, + "loss": 0.4539, + "step": 58564 + }, + { + "epoch": 1.5, + "learning_rate": 1.0474370193693947e-06, + "loss": 0.625, + "step": 58565 + }, + { + "epoch": 1.5, + "learning_rate": 1.0474093800478828e-06, + "loss": 0.4083, + "step": 58566 + }, + { + "epoch": 1.5, + "learning_rate": 1.0473817406900722e-06, + "loss": 0.6465, + "step": 58567 + }, + { + "epoch": 1.5, + "learning_rate": 1.0473541012959831e-06, + "loss": 0.6035, + "step": 58568 + }, + { + "epoch": 1.5, + "learning_rate": 1.0473264618656377e-06, + "loss": 0.8369, + "step": 58569 + }, + { + "epoch": 1.5, + "learning_rate": 1.0472988223990562e-06, + "loss": 0.7686, + "step": 58570 + }, + { + "epoch": 1.5, + "learning_rate": 1.0472711828962604e-06, + "loss": 0.7598, + "step": 58571 + }, + { + "epoch": 1.5, + "learning_rate": 1.0472435433572709e-06, + "loss": 0.7588, + "step": 58572 + }, + { + "epoch": 1.5, + "learning_rate": 1.0472159037821092e-06, + "loss": 0.5759, + "step": 58573 + }, + { + "epoch": 1.5, + "learning_rate": 1.0471882641707969e-06, + "loss": 0.5776, + "step": 58574 + }, + { + "epoch": 1.5, + "learning_rate": 1.0471606245233546e-06, + "loss": 0.5869, + "step": 58575 + }, + { + "epoch": 1.5, + "learning_rate": 1.0471329848398032e-06, + "loss": 0.5088, + "step": 58576 + }, + { + "epoch": 1.5, + "learning_rate": 1.0471053451201647e-06, + "loss": 0.6152, + "step": 58577 + }, + { + "epoch": 1.5, + "learning_rate": 1.0470777053644592e-06, + "loss": 0.7422, + "step": 58578 + }, + { + "epoch": 1.5, + "learning_rate": 1.0470500655727092e-06, + "loss": 0.6768, + "step": 58579 + }, + { + "epoch": 1.5, + "learning_rate": 1.0470224257449346e-06, + "loss": 0.6431, + "step": 58580 + }, + { + "epoch": 1.5, + "learning_rate": 1.0469947858811575e-06, + "loss": 0.4226, + "step": 58581 + }, + { + "epoch": 1.5, + "learning_rate": 1.046967145981398e-06, + "loss": 0.6553, + "step": 58582 + }, + { + "epoch": 1.5, + "learning_rate": 1.0469395060456784e-06, + "loss": 0.5879, + "step": 58583 + }, + { + "epoch": 1.5, + "learning_rate": 1.0469118660740194e-06, + "loss": 0.5923, + "step": 58584 + }, + { + "epoch": 1.5, + "learning_rate": 1.046884226066442e-06, + "loss": 0.6768, + "step": 58585 + }, + { + "epoch": 1.5, + "learning_rate": 1.0468565860229675e-06, + "loss": 0.6377, + "step": 58586 + }, + { + "epoch": 1.5, + "learning_rate": 1.046828945943617e-06, + "loss": 0.6074, + "step": 58587 + }, + { + "epoch": 1.5, + "learning_rate": 1.046801305828412e-06, + "loss": 0.5229, + "step": 58588 + }, + { + "epoch": 1.5, + "learning_rate": 1.046773665677373e-06, + "loss": 0.6621, + "step": 58589 + }, + { + "epoch": 1.5, + "learning_rate": 1.0467460254905221e-06, + "loss": 0.7012, + "step": 58590 + }, + { + "epoch": 1.5, + "learning_rate": 1.0467183852678794e-06, + "loss": 0.6479, + "step": 58591 + }, + { + "epoch": 1.5, + "learning_rate": 1.046690745009467e-06, + "loss": 0.7725, + "step": 58592 + }, + { + "epoch": 1.5, + "learning_rate": 1.0466631047153052e-06, + "loss": 0.4902, + "step": 58593 + }, + { + "epoch": 1.5, + "learning_rate": 1.046635464385416e-06, + "loss": 0.6245, + "step": 58594 + }, + { + "epoch": 1.5, + "learning_rate": 1.04660782401982e-06, + "loss": 0.6846, + "step": 58595 + }, + { + "epoch": 1.5, + "learning_rate": 1.0465801836185387e-06, + "loss": 0.7529, + "step": 58596 + }, + { + "epoch": 1.5, + "learning_rate": 1.0465525431815926e-06, + "loss": 0.6401, + "step": 58597 + }, + { + "epoch": 1.5, + "learning_rate": 1.0465249027090038e-06, + "loss": 0.5767, + "step": 58598 + }, + { + "epoch": 1.5, + "learning_rate": 1.046497262200793e-06, + "loss": 0.4673, + "step": 58599 + }, + { + "epoch": 1.5, + "learning_rate": 1.0464696216569813e-06, + "loss": 0.752, + "step": 58600 + }, + { + "epoch": 1.5, + "learning_rate": 1.0464419810775899e-06, + "loss": 0.6152, + "step": 58601 + }, + { + "epoch": 1.5, + "learning_rate": 1.04641434046264e-06, + "loss": 0.605, + "step": 58602 + }, + { + "epoch": 1.5, + "learning_rate": 1.0463866998121527e-06, + "loss": 0.5776, + "step": 58603 + }, + { + "epoch": 1.5, + "learning_rate": 1.0463590591261496e-06, + "loss": 0.5586, + "step": 58604 + }, + { + "epoch": 1.5, + "learning_rate": 1.0463314184046512e-06, + "loss": 0.4041, + "step": 58605 + }, + { + "epoch": 1.5, + "learning_rate": 1.0463037776476792e-06, + "loss": 0.7783, + "step": 58606 + }, + { + "epoch": 1.5, + "learning_rate": 1.0462761368552541e-06, + "loss": 0.6953, + "step": 58607 + }, + { + "epoch": 1.5, + "learning_rate": 1.046248496027398e-06, + "loss": 0.7861, + "step": 58608 + }, + { + "epoch": 1.5, + "learning_rate": 1.0462208551641313e-06, + "loss": 0.6387, + "step": 58609 + }, + { + "epoch": 1.5, + "learning_rate": 1.0461932142654751e-06, + "loss": 0.6382, + "step": 58610 + }, + { + "epoch": 1.5, + "learning_rate": 1.0461655733314514e-06, + "loss": 0.5511, + "step": 58611 + }, + { + "epoch": 1.5, + "learning_rate": 1.0461379323620805e-06, + "loss": 0.4585, + "step": 58612 + }, + { + "epoch": 1.5, + "learning_rate": 1.0461102913573841e-06, + "loss": 0.5942, + "step": 58613 + }, + { + "epoch": 1.5, + "learning_rate": 1.0460826503173832e-06, + "loss": 0.6455, + "step": 58614 + }, + { + "epoch": 1.5, + "learning_rate": 1.046055009242099e-06, + "loss": 0.4969, + "step": 58615 + }, + { + "epoch": 1.5, + "learning_rate": 1.046027368131552e-06, + "loss": 0.7148, + "step": 58616 + }, + { + "epoch": 1.5, + "learning_rate": 1.0459997269857645e-06, + "loss": 0.7793, + "step": 58617 + }, + { + "epoch": 1.5, + "learning_rate": 1.045972085804757e-06, + "loss": 0.7383, + "step": 58618 + }, + { + "epoch": 1.5, + "learning_rate": 1.0459444445885512e-06, + "loss": 0.8477, + "step": 58619 + }, + { + "epoch": 1.5, + "learning_rate": 1.0459168033371673e-06, + "loss": 0.6484, + "step": 58620 + }, + { + "epoch": 1.5, + "learning_rate": 1.0458891620506272e-06, + "loss": 0.542, + "step": 58621 + }, + { + "epoch": 1.5, + "learning_rate": 1.0458615207289519e-06, + "loss": 0.6753, + "step": 58622 + }, + { + "epoch": 1.5, + "learning_rate": 1.0458338793721623e-06, + "loss": 0.5867, + "step": 58623 + }, + { + "epoch": 1.5, + "learning_rate": 1.0458062379802802e-06, + "loss": 0.6304, + "step": 58624 + }, + { + "epoch": 1.5, + "learning_rate": 1.0457785965533263e-06, + "loss": 0.6479, + "step": 58625 + }, + { + "epoch": 1.5, + "learning_rate": 1.0457509550913215e-06, + "loss": 0.6113, + "step": 58626 + }, + { + "epoch": 1.5, + "learning_rate": 1.0457233135942876e-06, + "loss": 0.4907, + "step": 58627 + }, + { + "epoch": 1.5, + "learning_rate": 1.0456956720622452e-06, + "loss": 0.6377, + "step": 58628 + }, + { + "epoch": 1.5, + "learning_rate": 1.045668030495216e-06, + "loss": 0.644, + "step": 58629 + }, + { + "epoch": 1.5, + "learning_rate": 1.0456403888932208e-06, + "loss": 0.6152, + "step": 58630 + }, + { + "epoch": 1.5, + "learning_rate": 1.0456127472562808e-06, + "loss": 0.5205, + "step": 58631 + }, + { + "epoch": 1.5, + "learning_rate": 1.0455851055844174e-06, + "loss": 0.6992, + "step": 58632 + }, + { + "epoch": 1.5, + "learning_rate": 1.0455574638776514e-06, + "loss": 0.7256, + "step": 58633 + }, + { + "epoch": 1.5, + "learning_rate": 1.0455298221360042e-06, + "loss": 0.8281, + "step": 58634 + }, + { + "epoch": 1.5, + "learning_rate": 1.0455021803594967e-06, + "loss": 0.6875, + "step": 58635 + }, + { + "epoch": 1.5, + "learning_rate": 1.0454745385481508e-06, + "loss": 0.6885, + "step": 58636 + }, + { + "epoch": 1.5, + "learning_rate": 1.0454468967019864e-06, + "loss": 0.5, + "step": 58637 + }, + { + "epoch": 1.5, + "learning_rate": 1.0454192548210258e-06, + "loss": 0.6284, + "step": 58638 + }, + { + "epoch": 1.5, + "learning_rate": 1.04539161290529e-06, + "loss": 0.5679, + "step": 58639 + }, + { + "epoch": 1.5, + "learning_rate": 1.0453639709547996e-06, + "loss": 0.748, + "step": 58640 + }, + { + "epoch": 1.5, + "learning_rate": 1.0453363289695762e-06, + "loss": 0.6392, + "step": 58641 + }, + { + "epoch": 1.5, + "learning_rate": 1.0453086869496408e-06, + "loss": 0.6943, + "step": 58642 + }, + { + "epoch": 1.5, + "learning_rate": 1.0452810448950146e-06, + "loss": 0.5957, + "step": 58643 + }, + { + "epoch": 1.5, + "learning_rate": 1.0452534028057193e-06, + "loss": 0.7393, + "step": 58644 + }, + { + "epoch": 1.5, + "learning_rate": 1.045225760681775e-06, + "loss": 0.4663, + "step": 58645 + }, + { + "epoch": 1.5, + "learning_rate": 1.0451981185232035e-06, + "loss": 0.6797, + "step": 58646 + }, + { + "epoch": 1.5, + "learning_rate": 1.0451704763300256e-06, + "loss": 0.7051, + "step": 58647 + }, + { + "epoch": 1.5, + "learning_rate": 1.0451428341022633e-06, + "loss": 0.8662, + "step": 58648 + }, + { + "epoch": 1.5, + "learning_rate": 1.0451151918399368e-06, + "loss": 0.7617, + "step": 58649 + }, + { + "epoch": 1.5, + "learning_rate": 1.045087549543068e-06, + "loss": 0.6284, + "step": 58650 + }, + { + "epoch": 1.5, + "learning_rate": 1.0450599072116774e-06, + "loss": 0.8438, + "step": 58651 + }, + { + "epoch": 1.5, + "learning_rate": 1.0450322648457868e-06, + "loss": 0.4927, + "step": 58652 + }, + { + "epoch": 1.5, + "learning_rate": 1.0450046224454167e-06, + "loss": 0.7959, + "step": 58653 + }, + { + "epoch": 1.5, + "learning_rate": 1.044976980010589e-06, + "loss": 0.5374, + "step": 58654 + }, + { + "epoch": 1.5, + "learning_rate": 1.0449493375413242e-06, + "loss": 0.4966, + "step": 58655 + }, + { + "epoch": 1.5, + "learning_rate": 1.0449216950376438e-06, + "loss": 0.6406, + "step": 58656 + }, + { + "epoch": 1.5, + "learning_rate": 1.0448940524995692e-06, + "loss": 0.6553, + "step": 58657 + }, + { + "epoch": 1.5, + "learning_rate": 1.0448664099271211e-06, + "loss": 0.6963, + "step": 58658 + }, + { + "epoch": 1.5, + "learning_rate": 1.044838767320321e-06, + "loss": 0.7666, + "step": 58659 + }, + { + "epoch": 1.5, + "learning_rate": 1.0448111246791898e-06, + "loss": 0.7393, + "step": 58660 + }, + { + "epoch": 1.5, + "learning_rate": 1.0447834820037487e-06, + "loss": 0.7441, + "step": 58661 + }, + { + "epoch": 1.5, + "learning_rate": 1.044755839294019e-06, + "loss": 0.7148, + "step": 58662 + }, + { + "epoch": 1.5, + "learning_rate": 1.044728196550022e-06, + "loss": 0.5586, + "step": 58663 + }, + { + "epoch": 1.5, + "learning_rate": 1.0447005537717784e-06, + "loss": 0.8389, + "step": 58664 + }, + { + "epoch": 1.5, + "learning_rate": 1.0446729109593098e-06, + "loss": 0.6426, + "step": 58665 + }, + { + "epoch": 1.5, + "learning_rate": 1.044645268112637e-06, + "loss": 0.5996, + "step": 58666 + }, + { + "epoch": 1.5, + "learning_rate": 1.0446176252317815e-06, + "loss": 0.5227, + "step": 58667 + }, + { + "epoch": 1.5, + "learning_rate": 1.0445899823167645e-06, + "loss": 0.575, + "step": 58668 + }, + { + "epoch": 1.5, + "learning_rate": 1.044562339367607e-06, + "loss": 0.5474, + "step": 58669 + }, + { + "epoch": 1.5, + "learning_rate": 1.0445346963843297e-06, + "loss": 0.7422, + "step": 58670 + }, + { + "epoch": 1.5, + "learning_rate": 1.044507053366955e-06, + "loss": 0.6772, + "step": 58671 + }, + { + "epoch": 1.5, + "learning_rate": 1.0444794103155026e-06, + "loss": 0.5298, + "step": 58672 + }, + { + "epoch": 1.5, + "learning_rate": 1.0444517672299946e-06, + "loss": 0.625, + "step": 58673 + }, + { + "epoch": 1.5, + "learning_rate": 1.0444241241104522e-06, + "loss": 0.5879, + "step": 58674 + }, + { + "epoch": 1.5, + "learning_rate": 1.0443964809568957e-06, + "loss": 0.3336, + "step": 58675 + }, + { + "epoch": 1.5, + "learning_rate": 1.0443688377693472e-06, + "loss": 0.4768, + "step": 58676 + }, + { + "epoch": 1.5, + "learning_rate": 1.0443411945478273e-06, + "loss": 0.4497, + "step": 58677 + }, + { + "epoch": 1.5, + "learning_rate": 1.044313551292358e-06, + "loss": 0.6851, + "step": 58678 + }, + { + "epoch": 1.5, + "learning_rate": 1.0442859080029593e-06, + "loss": 0.5322, + "step": 58679 + }, + { + "epoch": 1.5, + "learning_rate": 1.0442582646796532e-06, + "loss": 0.6367, + "step": 58680 + }, + { + "epoch": 1.5, + "learning_rate": 1.0442306213224603e-06, + "loss": 0.7881, + "step": 58681 + }, + { + "epoch": 1.5, + "learning_rate": 1.044202977931402e-06, + "loss": 0.7305, + "step": 58682 + }, + { + "epoch": 1.5, + "learning_rate": 1.0441753345064999e-06, + "loss": 0.8281, + "step": 58683 + }, + { + "epoch": 1.5, + "learning_rate": 1.0441476910477748e-06, + "loss": 0.5469, + "step": 58684 + }, + { + "epoch": 1.5, + "learning_rate": 1.0441200475552473e-06, + "loss": 0.7891, + "step": 58685 + }, + { + "epoch": 1.5, + "learning_rate": 1.0440924040289396e-06, + "loss": 0.5791, + "step": 58686 + }, + { + "epoch": 1.5, + "learning_rate": 1.044064760468872e-06, + "loss": 0.6631, + "step": 58687 + }, + { + "epoch": 1.5, + "learning_rate": 1.0440371168750666e-06, + "loss": 0.6055, + "step": 58688 + }, + { + "epoch": 1.5, + "learning_rate": 1.0440094732475435e-06, + "loss": 0.5894, + "step": 58689 + }, + { + "epoch": 1.5, + "learning_rate": 1.0439818295863246e-06, + "loss": 0.7217, + "step": 58690 + }, + { + "epoch": 1.5, + "learning_rate": 1.0439541858914306e-06, + "loss": 0.5195, + "step": 58691 + }, + { + "epoch": 1.5, + "learning_rate": 1.0439265421628832e-06, + "loss": 0.582, + "step": 58692 + }, + { + "epoch": 1.5, + "learning_rate": 1.043898898400703e-06, + "loss": 0.6084, + "step": 58693 + }, + { + "epoch": 1.5, + "learning_rate": 1.0438712546049115e-06, + "loss": 0.5107, + "step": 58694 + }, + { + "epoch": 1.5, + "learning_rate": 1.04384361077553e-06, + "loss": 0.6006, + "step": 58695 + }, + { + "epoch": 1.5, + "learning_rate": 1.0438159669125795e-06, + "loss": 0.5933, + "step": 58696 + }, + { + "epoch": 1.5, + "learning_rate": 1.0437883230160807e-06, + "loss": 0.6284, + "step": 58697 + }, + { + "epoch": 1.5, + "learning_rate": 1.0437606790860554e-06, + "loss": 0.6001, + "step": 58698 + }, + { + "epoch": 1.5, + "learning_rate": 1.0437330351225247e-06, + "loss": 0.6201, + "step": 58699 + }, + { + "epoch": 1.5, + "learning_rate": 1.0437053911255093e-06, + "loss": 0.6279, + "step": 58700 + }, + { + "epoch": 1.5, + "learning_rate": 1.043677747095031e-06, + "loss": 0.6069, + "step": 58701 + }, + { + "epoch": 1.5, + "learning_rate": 1.0436501030311105e-06, + "loss": 0.6455, + "step": 58702 + }, + { + "epoch": 1.5, + "learning_rate": 1.0436224589337695e-06, + "loss": 0.5942, + "step": 58703 + }, + { + "epoch": 1.5, + "learning_rate": 1.0435948148030282e-06, + "loss": 0.6689, + "step": 58704 + }, + { + "epoch": 1.5, + "learning_rate": 1.0435671706389089e-06, + "loss": 0.5508, + "step": 58705 + }, + { + "epoch": 1.5, + "learning_rate": 1.0435395264414317e-06, + "loss": 0.6914, + "step": 58706 + }, + { + "epoch": 1.5, + "learning_rate": 1.0435118822106185e-06, + "loss": 0.7178, + "step": 58707 + }, + { + "epoch": 1.5, + "learning_rate": 1.0434842379464906e-06, + "loss": 0.5938, + "step": 58708 + }, + { + "epoch": 1.5, + "learning_rate": 1.0434565936490685e-06, + "loss": 0.6025, + "step": 58709 + }, + { + "epoch": 1.5, + "learning_rate": 1.0434289493183738e-06, + "loss": 0.7324, + "step": 58710 + }, + { + "epoch": 1.5, + "learning_rate": 1.0434013049544273e-06, + "loss": 0.5627, + "step": 58711 + }, + { + "epoch": 1.5, + "learning_rate": 1.0433736605572505e-06, + "loss": 0.7178, + "step": 58712 + }, + { + "epoch": 1.5, + "learning_rate": 1.0433460161268649e-06, + "loss": 0.6475, + "step": 58713 + }, + { + "epoch": 1.5, + "learning_rate": 1.0433183716632908e-06, + "loss": 0.6699, + "step": 58714 + }, + { + "epoch": 1.5, + "learning_rate": 1.04329072716655e-06, + "loss": 0.7461, + "step": 58715 + }, + { + "epoch": 1.5, + "learning_rate": 1.0432630826366632e-06, + "loss": 0.6836, + "step": 58716 + }, + { + "epoch": 1.5, + "learning_rate": 1.043235438073652e-06, + "loss": 0.7227, + "step": 58717 + }, + { + "epoch": 1.5, + "learning_rate": 1.0432077934775377e-06, + "loss": 0.6362, + "step": 58718 + }, + { + "epoch": 1.5, + "learning_rate": 1.0431801488483408e-06, + "loss": 0.689, + "step": 58719 + }, + { + "epoch": 1.51, + "learning_rate": 1.0431525041860829e-06, + "loss": 0.6157, + "step": 58720 + }, + { + "epoch": 1.51, + "learning_rate": 1.0431248594907852e-06, + "loss": 0.792, + "step": 58721 + }, + { + "epoch": 1.51, + "learning_rate": 1.0430972147624686e-06, + "loss": 0.6973, + "step": 58722 + }, + { + "epoch": 1.51, + "learning_rate": 1.0430695700011547e-06, + "loss": 0.6572, + "step": 58723 + }, + { + "epoch": 1.51, + "learning_rate": 1.0430419252068644e-06, + "loss": 0.7617, + "step": 58724 + }, + { + "epoch": 1.51, + "learning_rate": 1.0430142803796187e-06, + "loss": 0.5459, + "step": 58725 + }, + { + "epoch": 1.51, + "learning_rate": 1.0429866355194393e-06, + "loss": 0.7461, + "step": 58726 + }, + { + "epoch": 1.51, + "learning_rate": 1.0429589906263465e-06, + "loss": 0.6611, + "step": 58727 + }, + { + "epoch": 1.51, + "learning_rate": 1.0429313457003625e-06, + "loss": 0.6047, + "step": 58728 + }, + { + "epoch": 1.51, + "learning_rate": 1.0429037007415075e-06, + "loss": 0.4412, + "step": 58729 + }, + { + "epoch": 1.51, + "learning_rate": 1.0428760557498034e-06, + "loss": 0.6816, + "step": 58730 + }, + { + "epoch": 1.51, + "learning_rate": 1.042848410725271e-06, + "loss": 0.667, + "step": 58731 + }, + { + "epoch": 1.51, + "learning_rate": 1.0428207656679313e-06, + "loss": 0.7041, + "step": 58732 + }, + { + "epoch": 1.51, + "learning_rate": 1.042793120577806e-06, + "loss": 0.6924, + "step": 58733 + }, + { + "epoch": 1.51, + "learning_rate": 1.042765475454916e-06, + "loss": 0.8447, + "step": 58734 + }, + { + "epoch": 1.51, + "learning_rate": 1.0427378302992821e-06, + "loss": 0.6641, + "step": 58735 + }, + { + "epoch": 1.51, + "learning_rate": 1.0427101851109261e-06, + "loss": 0.6748, + "step": 58736 + }, + { + "epoch": 1.51, + "learning_rate": 1.0426825398898687e-06, + "loss": 0.5391, + "step": 58737 + }, + { + "epoch": 1.51, + "learning_rate": 1.0426548946361315e-06, + "loss": 0.5601, + "step": 58738 + }, + { + "epoch": 1.51, + "learning_rate": 1.0426272493497353e-06, + "loss": 0.5444, + "step": 58739 + }, + { + "epoch": 1.51, + "learning_rate": 1.0425996040307012e-06, + "loss": 0.5571, + "step": 58740 + }, + { + "epoch": 1.51, + "learning_rate": 1.0425719586790508e-06, + "loss": 0.623, + "step": 58741 + }, + { + "epoch": 1.51, + "learning_rate": 1.0425443132948048e-06, + "loss": 0.6758, + "step": 58742 + }, + { + "epoch": 1.51, + "learning_rate": 1.0425166678779848e-06, + "loss": 0.6143, + "step": 58743 + }, + { + "epoch": 1.51, + "learning_rate": 1.0424890224286115e-06, + "loss": 0.5557, + "step": 58744 + }, + { + "epoch": 1.51, + "learning_rate": 1.0424613769467065e-06, + "loss": 0.6963, + "step": 58745 + }, + { + "epoch": 1.51, + "learning_rate": 1.0424337314322907e-06, + "loss": 0.6445, + "step": 58746 + }, + { + "epoch": 1.51, + "learning_rate": 1.0424060858853852e-06, + "loss": 0.7212, + "step": 58747 + }, + { + "epoch": 1.51, + "learning_rate": 1.0423784403060117e-06, + "loss": 0.6001, + "step": 58748 + }, + { + "epoch": 1.51, + "learning_rate": 1.0423507946941907e-06, + "loss": 0.4915, + "step": 58749 + }, + { + "epoch": 1.51, + "learning_rate": 1.0423231490499436e-06, + "loss": 0.6125, + "step": 58750 + }, + { + "epoch": 1.51, + "learning_rate": 1.0422955033732917e-06, + "loss": 0.6719, + "step": 58751 + }, + { + "epoch": 1.51, + "learning_rate": 1.0422678576642559e-06, + "loss": 0.5439, + "step": 58752 + }, + { + "epoch": 1.51, + "learning_rate": 1.0422402119228579e-06, + "loss": 0.8643, + "step": 58753 + }, + { + "epoch": 1.51, + "learning_rate": 1.042212566149118e-06, + "loss": 0.5845, + "step": 58754 + }, + { + "epoch": 1.51, + "learning_rate": 1.0421849203430584e-06, + "loss": 0.4346, + "step": 58755 + }, + { + "epoch": 1.51, + "learning_rate": 1.0421572745046995e-06, + "loss": 0.8096, + "step": 58756 + }, + { + "epoch": 1.51, + "learning_rate": 1.0421296286340629e-06, + "loss": 0.7412, + "step": 58757 + }, + { + "epoch": 1.51, + "learning_rate": 1.0421019827311694e-06, + "loss": 0.6187, + "step": 58758 + }, + { + "epoch": 1.51, + "learning_rate": 1.0420743367960403e-06, + "loss": 0.5757, + "step": 58759 + }, + { + "epoch": 1.51, + "learning_rate": 1.042046690828697e-06, + "loss": 0.6357, + "step": 58760 + }, + { + "epoch": 1.51, + "learning_rate": 1.0420190448291603e-06, + "loss": 0.7432, + "step": 58761 + }, + { + "epoch": 1.51, + "learning_rate": 1.0419913987974515e-06, + "loss": 0.5493, + "step": 58762 + }, + { + "epoch": 1.51, + "learning_rate": 1.041963752733592e-06, + "loss": 0.6699, + "step": 58763 + }, + { + "epoch": 1.51, + "learning_rate": 1.0419361066376026e-06, + "loss": 0.6797, + "step": 58764 + }, + { + "epoch": 1.51, + "learning_rate": 1.0419084605095048e-06, + "loss": 0.7002, + "step": 58765 + }, + { + "epoch": 1.51, + "learning_rate": 1.0418808143493196e-06, + "loss": 0.6548, + "step": 58766 + }, + { + "epoch": 1.51, + "learning_rate": 1.0418531681570682e-06, + "loss": 0.5938, + "step": 58767 + }, + { + "epoch": 1.51, + "learning_rate": 1.0418255219327718e-06, + "loss": 0.5659, + "step": 58768 + }, + { + "epoch": 1.51, + "learning_rate": 1.0417978756764515e-06, + "loss": 0.6006, + "step": 58769 + }, + { + "epoch": 1.51, + "learning_rate": 1.0417702293881285e-06, + "loss": 0.5493, + "step": 58770 + }, + { + "epoch": 1.51, + "learning_rate": 1.0417425830678237e-06, + "loss": 0.7393, + "step": 58771 + }, + { + "epoch": 1.51, + "learning_rate": 1.041714936715559e-06, + "loss": 0.4741, + "step": 58772 + }, + { + "epoch": 1.51, + "learning_rate": 1.0416872903313548e-06, + "loss": 0.5869, + "step": 58773 + }, + { + "epoch": 1.51, + "learning_rate": 1.0416596439152326e-06, + "loss": 0.7373, + "step": 58774 + }, + { + "epoch": 1.51, + "learning_rate": 1.0416319974672132e-06, + "loss": 0.6943, + "step": 58775 + }, + { + "epoch": 1.51, + "learning_rate": 1.0416043509873186e-06, + "loss": 0.6816, + "step": 58776 + }, + { + "epoch": 1.51, + "learning_rate": 1.041576704475569e-06, + "loss": 0.7051, + "step": 58777 + }, + { + "epoch": 1.51, + "learning_rate": 1.0415490579319866e-06, + "loss": 0.5557, + "step": 58778 + }, + { + "epoch": 1.51, + "learning_rate": 1.0415214113565915e-06, + "loss": 0.447, + "step": 58779 + }, + { + "epoch": 1.51, + "learning_rate": 1.0414937647494058e-06, + "loss": 0.4597, + "step": 58780 + }, + { + "epoch": 1.51, + "learning_rate": 1.0414661181104497e-06, + "loss": 0.6978, + "step": 58781 + }, + { + "epoch": 1.51, + "learning_rate": 1.0414384714397452e-06, + "loss": 0.7979, + "step": 58782 + }, + { + "epoch": 1.51, + "learning_rate": 1.0414108247373131e-06, + "loss": 0.7686, + "step": 58783 + }, + { + "epoch": 1.51, + "learning_rate": 1.0413831780031747e-06, + "loss": 0.6675, + "step": 58784 + }, + { + "epoch": 1.51, + "learning_rate": 1.0413555312373512e-06, + "loss": 0.4761, + "step": 58785 + }, + { + "epoch": 1.51, + "learning_rate": 1.0413278844398636e-06, + "loss": 0.6924, + "step": 58786 + }, + { + "epoch": 1.51, + "learning_rate": 1.041300237610733e-06, + "loss": 0.5234, + "step": 58787 + }, + { + "epoch": 1.51, + "learning_rate": 1.041272590749981e-06, + "loss": 0.7031, + "step": 58788 + }, + { + "epoch": 1.51, + "learning_rate": 1.0412449438576282e-06, + "loss": 0.6709, + "step": 58789 + }, + { + "epoch": 1.51, + "learning_rate": 1.0412172969336958e-06, + "loss": 0.6411, + "step": 58790 + }, + { + "epoch": 1.51, + "learning_rate": 1.0411896499782059e-06, + "loss": 0.7988, + "step": 58791 + }, + { + "epoch": 1.51, + "learning_rate": 1.0411620029911784e-06, + "loss": 0.6035, + "step": 58792 + }, + { + "epoch": 1.51, + "learning_rate": 1.0411343559726355e-06, + "loss": 0.5701, + "step": 58793 + }, + { + "epoch": 1.51, + "learning_rate": 1.0411067089225975e-06, + "loss": 0.4143, + "step": 58794 + }, + { + "epoch": 1.51, + "learning_rate": 1.0410790618410864e-06, + "loss": 0.4883, + "step": 58795 + }, + { + "epoch": 1.51, + "learning_rate": 1.0410514147281225e-06, + "loss": 0.5679, + "step": 58796 + }, + { + "epoch": 1.51, + "learning_rate": 1.0410237675837277e-06, + "loss": 0.625, + "step": 58797 + }, + { + "epoch": 1.51, + "learning_rate": 1.0409961204079228e-06, + "loss": 0.5234, + "step": 58798 + }, + { + "epoch": 1.51, + "learning_rate": 1.0409684732007292e-06, + "loss": 0.5459, + "step": 58799 + }, + { + "epoch": 1.51, + "learning_rate": 1.0409408259621674e-06, + "loss": 0.8066, + "step": 58800 + }, + { + "epoch": 1.51, + "learning_rate": 1.0409131786922597e-06, + "loss": 0.7163, + "step": 58801 + }, + { + "epoch": 1.51, + "learning_rate": 1.0408855313910264e-06, + "loss": 0.6812, + "step": 58802 + }, + { + "epoch": 1.51, + "learning_rate": 1.040857884058489e-06, + "loss": 0.7236, + "step": 58803 + }, + { + "epoch": 1.51, + "learning_rate": 1.0408302366946687e-06, + "loss": 0.5183, + "step": 58804 + }, + { + "epoch": 1.51, + "learning_rate": 1.0408025892995865e-06, + "loss": 0.7773, + "step": 58805 + }, + { + "epoch": 1.51, + "learning_rate": 1.0407749418732633e-06, + "loss": 0.6299, + "step": 58806 + }, + { + "epoch": 1.51, + "learning_rate": 1.0407472944157209e-06, + "loss": 0.6924, + "step": 58807 + }, + { + "epoch": 1.51, + "learning_rate": 1.0407196469269803e-06, + "loss": 0.3357, + "step": 58808 + }, + { + "epoch": 1.51, + "learning_rate": 1.0406919994070622e-06, + "loss": 0.6499, + "step": 58809 + }, + { + "epoch": 1.51, + "learning_rate": 1.0406643518559884e-06, + "loss": 0.647, + "step": 58810 + }, + { + "epoch": 1.51, + "learning_rate": 1.0406367042737797e-06, + "loss": 0.5857, + "step": 58811 + }, + { + "epoch": 1.51, + "learning_rate": 1.040609056660457e-06, + "loss": 0.6133, + "step": 58812 + }, + { + "epoch": 1.51, + "learning_rate": 1.0405814090160422e-06, + "loss": 0.502, + "step": 58813 + }, + { + "epoch": 1.51, + "learning_rate": 1.040553761340556e-06, + "loss": 0.6597, + "step": 58814 + }, + { + "epoch": 1.51, + "learning_rate": 1.0405261136340198e-06, + "loss": 0.8496, + "step": 58815 + }, + { + "epoch": 1.51, + "learning_rate": 1.0404984658964544e-06, + "loss": 0.7432, + "step": 58816 + }, + { + "epoch": 1.51, + "learning_rate": 1.0404708181278813e-06, + "loss": 0.4575, + "step": 58817 + }, + { + "epoch": 1.51, + "learning_rate": 1.0404431703283215e-06, + "loss": 0.8276, + "step": 58818 + }, + { + "epoch": 1.51, + "learning_rate": 1.0404155224977962e-06, + "loss": 0.6177, + "step": 58819 + }, + { + "epoch": 1.51, + "learning_rate": 1.0403878746363268e-06, + "loss": 0.5623, + "step": 58820 + }, + { + "epoch": 1.51, + "learning_rate": 1.040360226743934e-06, + "loss": 0.709, + "step": 58821 + }, + { + "epoch": 1.51, + "learning_rate": 1.0403325788206394e-06, + "loss": 0.7061, + "step": 58822 + }, + { + "epoch": 1.51, + "learning_rate": 1.040304930866464e-06, + "loss": 0.792, + "step": 58823 + }, + { + "epoch": 1.51, + "learning_rate": 1.0402772828814288e-06, + "loss": 0.5425, + "step": 58824 + }, + { + "epoch": 1.51, + "learning_rate": 1.040249634865555e-06, + "loss": 0.395, + "step": 58825 + }, + { + "epoch": 1.51, + "learning_rate": 1.0402219868188644e-06, + "loss": 0.6372, + "step": 58826 + }, + { + "epoch": 1.51, + "learning_rate": 1.0401943387413772e-06, + "loss": 0.6089, + "step": 58827 + }, + { + "epoch": 1.51, + "learning_rate": 1.0401666906331153e-06, + "loss": 0.6021, + "step": 58828 + }, + { + "epoch": 1.51, + "learning_rate": 1.0401390424940997e-06, + "loss": 0.6641, + "step": 58829 + }, + { + "epoch": 1.51, + "learning_rate": 1.0401113943243512e-06, + "loss": 0.7764, + "step": 58830 + }, + { + "epoch": 1.51, + "learning_rate": 1.0400837461238914e-06, + "loss": 0.6777, + "step": 58831 + }, + { + "epoch": 1.51, + "learning_rate": 1.0400560978927413e-06, + "loss": 0.7568, + "step": 58832 + }, + { + "epoch": 1.51, + "learning_rate": 1.0400284496309222e-06, + "loss": 0.6602, + "step": 58833 + }, + { + "epoch": 1.51, + "learning_rate": 1.040000801338455e-06, + "loss": 0.5764, + "step": 58834 + }, + { + "epoch": 1.51, + "learning_rate": 1.039973153015361e-06, + "loss": 0.5654, + "step": 58835 + }, + { + "epoch": 1.51, + "learning_rate": 1.0399455046616614e-06, + "loss": 0.7085, + "step": 58836 + }, + { + "epoch": 1.51, + "learning_rate": 1.0399178562773776e-06, + "loss": 0.6724, + "step": 58837 + }, + { + "epoch": 1.51, + "learning_rate": 1.0398902078625304e-06, + "loss": 0.6396, + "step": 58838 + }, + { + "epoch": 1.51, + "learning_rate": 1.039862559417141e-06, + "loss": 0.6582, + "step": 58839 + }, + { + "epoch": 1.51, + "learning_rate": 1.0398349109412308e-06, + "loss": 0.5049, + "step": 58840 + }, + { + "epoch": 1.51, + "learning_rate": 1.0398072624348206e-06, + "loss": 0.6309, + "step": 58841 + }, + { + "epoch": 1.51, + "learning_rate": 1.039779613897932e-06, + "loss": 0.5654, + "step": 58842 + }, + { + "epoch": 1.51, + "learning_rate": 1.0397519653305863e-06, + "loss": 0.7061, + "step": 58843 + }, + { + "epoch": 1.51, + "learning_rate": 1.0397243167328039e-06, + "loss": 0.6509, + "step": 58844 + }, + { + "epoch": 1.51, + "learning_rate": 1.0396966681046064e-06, + "loss": 0.5732, + "step": 58845 + }, + { + "epoch": 1.51, + "learning_rate": 1.039669019446015e-06, + "loss": 0.7031, + "step": 58846 + }, + { + "epoch": 1.51, + "learning_rate": 1.039641370757051e-06, + "loss": 0.6846, + "step": 58847 + }, + { + "epoch": 1.51, + "learning_rate": 1.0396137220377357e-06, + "loss": 0.7227, + "step": 58848 + }, + { + "epoch": 1.51, + "learning_rate": 1.0395860732880896e-06, + "loss": 0.5596, + "step": 58849 + }, + { + "epoch": 1.51, + "learning_rate": 1.0395584245081344e-06, + "loss": 0.6084, + "step": 58850 + }, + { + "epoch": 1.51, + "learning_rate": 1.039530775697891e-06, + "loss": 0.6816, + "step": 58851 + }, + { + "epoch": 1.51, + "learning_rate": 1.0395031268573808e-06, + "loss": 0.7471, + "step": 58852 + }, + { + "epoch": 1.51, + "learning_rate": 1.0394754779866249e-06, + "loss": 0.7725, + "step": 58853 + }, + { + "epoch": 1.51, + "learning_rate": 1.0394478290856445e-06, + "loss": 0.7041, + "step": 58854 + }, + { + "epoch": 1.51, + "learning_rate": 1.0394201801544604e-06, + "loss": 0.6309, + "step": 58855 + }, + { + "epoch": 1.51, + "learning_rate": 1.0393925311930944e-06, + "loss": 0.6042, + "step": 58856 + }, + { + "epoch": 1.51, + "learning_rate": 1.039364882201567e-06, + "loss": 0.6333, + "step": 58857 + }, + { + "epoch": 1.51, + "learning_rate": 1.0393372331799005e-06, + "loss": 0.5581, + "step": 58858 + }, + { + "epoch": 1.51, + "learning_rate": 1.0393095841281146e-06, + "loss": 0.6211, + "step": 58859 + }, + { + "epoch": 1.51, + "learning_rate": 1.0392819350462312e-06, + "loss": 0.7061, + "step": 58860 + }, + { + "epoch": 1.51, + "learning_rate": 1.0392542859342714e-06, + "loss": 0.6533, + "step": 58861 + }, + { + "epoch": 1.51, + "learning_rate": 1.0392266367922566e-06, + "loss": 0.7119, + "step": 58862 + }, + { + "epoch": 1.51, + "learning_rate": 1.0391989876202079e-06, + "loss": 0.4331, + "step": 58863 + }, + { + "epoch": 1.51, + "learning_rate": 1.0391713384181462e-06, + "loss": 0.7754, + "step": 58864 + }, + { + "epoch": 1.51, + "learning_rate": 1.0391436891860926e-06, + "loss": 0.543, + "step": 58865 + }, + { + "epoch": 1.51, + "learning_rate": 1.0391160399240689e-06, + "loss": 0.6025, + "step": 58866 + }, + { + "epoch": 1.51, + "learning_rate": 1.0390883906320953e-06, + "loss": 0.5815, + "step": 58867 + }, + { + "epoch": 1.51, + "learning_rate": 1.0390607413101942e-06, + "loss": 0.8203, + "step": 58868 + }, + { + "epoch": 1.51, + "learning_rate": 1.0390330919583854e-06, + "loss": 0.7666, + "step": 58869 + }, + { + "epoch": 1.51, + "learning_rate": 1.0390054425766911e-06, + "loss": 0.4297, + "step": 58870 + }, + { + "epoch": 1.51, + "learning_rate": 1.038977793165132e-06, + "loss": 0.4929, + "step": 58871 + }, + { + "epoch": 1.51, + "learning_rate": 1.0389501437237295e-06, + "loss": 0.7275, + "step": 58872 + }, + { + "epoch": 1.51, + "learning_rate": 1.0389224942525047e-06, + "loss": 0.4639, + "step": 58873 + }, + { + "epoch": 1.51, + "learning_rate": 1.0388948447514786e-06, + "loss": 0.7549, + "step": 58874 + }, + { + "epoch": 1.51, + "learning_rate": 1.0388671952206724e-06, + "loss": 0.6816, + "step": 58875 + }, + { + "epoch": 1.51, + "learning_rate": 1.0388395456601077e-06, + "loss": 0.522, + "step": 58876 + }, + { + "epoch": 1.51, + "learning_rate": 1.0388118960698051e-06, + "loss": 0.5254, + "step": 58877 + }, + { + "epoch": 1.51, + "learning_rate": 1.0387842464497863e-06, + "loss": 0.8662, + "step": 58878 + }, + { + "epoch": 1.51, + "learning_rate": 1.038756596800072e-06, + "loss": 0.6333, + "step": 58879 + }, + { + "epoch": 1.51, + "learning_rate": 1.0387289471206835e-06, + "loss": 0.6631, + "step": 58880 + }, + { + "epoch": 1.51, + "learning_rate": 1.038701297411642e-06, + "loss": 0.5488, + "step": 58881 + }, + { + "epoch": 1.51, + "learning_rate": 1.0386736476729686e-06, + "loss": 0.8271, + "step": 58882 + }, + { + "epoch": 1.51, + "learning_rate": 1.0386459979046852e-06, + "loss": 0.6689, + "step": 58883 + }, + { + "epoch": 1.51, + "learning_rate": 1.0386183481068117e-06, + "loss": 0.5718, + "step": 58884 + }, + { + "epoch": 1.51, + "learning_rate": 1.03859069827937e-06, + "loss": 0.5977, + "step": 58885 + }, + { + "epoch": 1.51, + "learning_rate": 1.0385630484223811e-06, + "loss": 0.7012, + "step": 58886 + }, + { + "epoch": 1.51, + "learning_rate": 1.0385353985358665e-06, + "loss": 0.7812, + "step": 58887 + }, + { + "epoch": 1.51, + "learning_rate": 1.0385077486198473e-06, + "loss": 0.6055, + "step": 58888 + }, + { + "epoch": 1.51, + "learning_rate": 1.038480098674344e-06, + "loss": 0.4277, + "step": 58889 + }, + { + "epoch": 1.51, + "learning_rate": 1.0384524486993783e-06, + "loss": 0.6099, + "step": 58890 + }, + { + "epoch": 1.51, + "learning_rate": 1.0384247986949717e-06, + "loss": 0.6855, + "step": 58891 + }, + { + "epoch": 1.51, + "learning_rate": 1.0383971486611447e-06, + "loss": 0.6582, + "step": 58892 + }, + { + "epoch": 1.51, + "learning_rate": 1.0383694985979193e-06, + "loss": 0.5459, + "step": 58893 + }, + { + "epoch": 1.51, + "learning_rate": 1.0383418485053156e-06, + "loss": 0.8086, + "step": 58894 + }, + { + "epoch": 1.51, + "learning_rate": 1.0383141983833552e-06, + "loss": 0.7764, + "step": 58895 + }, + { + "epoch": 1.51, + "learning_rate": 1.0382865482320595e-06, + "loss": 0.6494, + "step": 58896 + }, + { + "epoch": 1.51, + "learning_rate": 1.0382588980514497e-06, + "loss": 0.6357, + "step": 58897 + }, + { + "epoch": 1.51, + "learning_rate": 1.038231247841547e-06, + "loss": 0.8164, + "step": 58898 + }, + { + "epoch": 1.51, + "learning_rate": 1.038203597602372e-06, + "loss": 0.5947, + "step": 58899 + }, + { + "epoch": 1.51, + "learning_rate": 1.0381759473339465e-06, + "loss": 0.5845, + "step": 58900 + }, + { + "epoch": 1.51, + "learning_rate": 1.0381482970362912e-06, + "loss": 0.7598, + "step": 58901 + }, + { + "epoch": 1.51, + "learning_rate": 1.0381206467094276e-06, + "loss": 0.5449, + "step": 58902 + }, + { + "epoch": 1.51, + "learning_rate": 1.038092996353377e-06, + "loss": 0.583, + "step": 58903 + }, + { + "epoch": 1.51, + "learning_rate": 1.0380653459681602e-06, + "loss": 0.6172, + "step": 58904 + }, + { + "epoch": 1.51, + "learning_rate": 1.0380376955537983e-06, + "loss": 0.5488, + "step": 58905 + }, + { + "epoch": 1.51, + "learning_rate": 1.0380100451103129e-06, + "loss": 0.7598, + "step": 58906 + }, + { + "epoch": 1.51, + "learning_rate": 1.037982394637725e-06, + "loss": 0.6421, + "step": 58907 + }, + { + "epoch": 1.51, + "learning_rate": 1.037954744136056e-06, + "loss": 0.623, + "step": 58908 + }, + { + "epoch": 1.51, + "learning_rate": 1.0379270936053261e-06, + "loss": 0.6562, + "step": 58909 + }, + { + "epoch": 1.51, + "learning_rate": 1.0378994430455577e-06, + "loss": 0.7339, + "step": 58910 + }, + { + "epoch": 1.51, + "learning_rate": 1.037871792456771e-06, + "loss": 0.6367, + "step": 58911 + }, + { + "epoch": 1.51, + "learning_rate": 1.0378441418389878e-06, + "loss": 0.4038, + "step": 58912 + }, + { + "epoch": 1.51, + "learning_rate": 1.0378164911922293e-06, + "loss": 0.7139, + "step": 58913 + }, + { + "epoch": 1.51, + "learning_rate": 1.0377888405165165e-06, + "loss": 0.6494, + "step": 58914 + }, + { + "epoch": 1.51, + "learning_rate": 1.03776118981187e-06, + "loss": 0.7012, + "step": 58915 + }, + { + "epoch": 1.51, + "learning_rate": 1.037733539078312e-06, + "loss": 0.5566, + "step": 58916 + }, + { + "epoch": 1.51, + "learning_rate": 1.0377058883158628e-06, + "loss": 0.7109, + "step": 58917 + }, + { + "epoch": 1.51, + "learning_rate": 1.0376782375245444e-06, + "loss": 0.6665, + "step": 58918 + }, + { + "epoch": 1.51, + "learning_rate": 1.0376505867043773e-06, + "loss": 0.5713, + "step": 58919 + }, + { + "epoch": 1.51, + "learning_rate": 1.0376229358553825e-06, + "loss": 0.6099, + "step": 58920 + }, + { + "epoch": 1.51, + "learning_rate": 1.037595284977582e-06, + "loss": 0.626, + "step": 58921 + }, + { + "epoch": 1.51, + "learning_rate": 1.0375676340709963e-06, + "loss": 0.748, + "step": 58922 + }, + { + "epoch": 1.51, + "learning_rate": 1.0375399831356471e-06, + "loss": 0.5571, + "step": 58923 + }, + { + "epoch": 1.51, + "learning_rate": 1.0375123321715547e-06, + "loss": 0.3448, + "step": 58924 + }, + { + "epoch": 1.51, + "learning_rate": 1.0374846811787411e-06, + "loss": 0.6455, + "step": 58925 + }, + { + "epoch": 1.51, + "learning_rate": 1.037457030157227e-06, + "loss": 0.6484, + "step": 58926 + }, + { + "epoch": 1.51, + "learning_rate": 1.0374293791070342e-06, + "loss": 0.4635, + "step": 58927 + }, + { + "epoch": 1.51, + "learning_rate": 1.0374017280281835e-06, + "loss": 0.4885, + "step": 58928 + }, + { + "epoch": 1.51, + "learning_rate": 1.0373740769206958e-06, + "loss": 0.6797, + "step": 58929 + }, + { + "epoch": 1.51, + "learning_rate": 1.0373464257845926e-06, + "loss": 0.7393, + "step": 58930 + }, + { + "epoch": 1.51, + "learning_rate": 1.0373187746198948e-06, + "loss": 0.5806, + "step": 58931 + }, + { + "epoch": 1.51, + "learning_rate": 1.0372911234266235e-06, + "loss": 0.5996, + "step": 58932 + }, + { + "epoch": 1.51, + "learning_rate": 1.0372634722048008e-06, + "loss": 0.6694, + "step": 58933 + }, + { + "epoch": 1.51, + "learning_rate": 1.0372358209544466e-06, + "loss": 0.593, + "step": 58934 + }, + { + "epoch": 1.51, + "learning_rate": 1.0372081696755828e-06, + "loss": 0.8135, + "step": 58935 + }, + { + "epoch": 1.51, + "learning_rate": 1.0371805183682303e-06, + "loss": 0.5583, + "step": 58936 + }, + { + "epoch": 1.51, + "learning_rate": 1.0371528670324105e-06, + "loss": 0.4648, + "step": 58937 + }, + { + "epoch": 1.51, + "learning_rate": 1.0371252156681445e-06, + "loss": 0.7119, + "step": 58938 + }, + { + "epoch": 1.51, + "learning_rate": 1.0370975642754535e-06, + "loss": 0.625, + "step": 58939 + }, + { + "epoch": 1.51, + "learning_rate": 1.0370699128543582e-06, + "loss": 0.6592, + "step": 58940 + }, + { + "epoch": 1.51, + "learning_rate": 1.0370422614048806e-06, + "loss": 0.7065, + "step": 58941 + }, + { + "epoch": 1.51, + "learning_rate": 1.037014609927041e-06, + "loss": 0.791, + "step": 58942 + }, + { + "epoch": 1.51, + "learning_rate": 1.0369869584208616e-06, + "loss": 0.7324, + "step": 58943 + }, + { + "epoch": 1.51, + "learning_rate": 1.0369593068863628e-06, + "loss": 0.6138, + "step": 58944 + }, + { + "epoch": 1.51, + "learning_rate": 1.0369316553235657e-06, + "loss": 0.6787, + "step": 58945 + }, + { + "epoch": 1.51, + "learning_rate": 1.0369040037324918e-06, + "loss": 0.7256, + "step": 58946 + }, + { + "epoch": 1.51, + "learning_rate": 1.0368763521131623e-06, + "loss": 0.6348, + "step": 58947 + }, + { + "epoch": 1.51, + "learning_rate": 1.0368487004655984e-06, + "loss": 0.5908, + "step": 58948 + }, + { + "epoch": 1.51, + "learning_rate": 1.0368210487898208e-06, + "loss": 0.5139, + "step": 58949 + }, + { + "epoch": 1.51, + "learning_rate": 1.0367933970858513e-06, + "loss": 0.8223, + "step": 58950 + }, + { + "epoch": 1.51, + "learning_rate": 1.0367657453537107e-06, + "loss": 0.749, + "step": 58951 + }, + { + "epoch": 1.51, + "learning_rate": 1.0367380935934205e-06, + "loss": 0.5327, + "step": 58952 + }, + { + "epoch": 1.51, + "learning_rate": 1.0367104418050013e-06, + "loss": 0.7568, + "step": 58953 + }, + { + "epoch": 1.51, + "learning_rate": 1.0366827899884746e-06, + "loss": 0.7197, + "step": 58954 + }, + { + "epoch": 1.51, + "learning_rate": 1.0366551381438618e-06, + "loss": 0.6611, + "step": 58955 + }, + { + "epoch": 1.51, + "learning_rate": 1.0366274862711837e-06, + "loss": 0.5527, + "step": 58956 + }, + { + "epoch": 1.51, + "learning_rate": 1.0365998343704617e-06, + "loss": 0.6875, + "step": 58957 + }, + { + "epoch": 1.51, + "learning_rate": 1.036572182441717e-06, + "loss": 0.5715, + "step": 58958 + }, + { + "epoch": 1.51, + "learning_rate": 1.0365445304849703e-06, + "loss": 0.8408, + "step": 58959 + }, + { + "epoch": 1.51, + "learning_rate": 1.0365168785002432e-06, + "loss": 0.7324, + "step": 58960 + }, + { + "epoch": 1.51, + "learning_rate": 1.0364892264875569e-06, + "loss": 0.7148, + "step": 58961 + }, + { + "epoch": 1.51, + "learning_rate": 1.0364615744469326e-06, + "loss": 0.4624, + "step": 58962 + }, + { + "epoch": 1.51, + "learning_rate": 1.0364339223783914e-06, + "loss": 0.5288, + "step": 58963 + }, + { + "epoch": 1.51, + "learning_rate": 1.036406270281954e-06, + "loss": 0.7148, + "step": 58964 + }, + { + "epoch": 1.51, + "learning_rate": 1.0363786181576424e-06, + "loss": 0.6592, + "step": 58965 + }, + { + "epoch": 1.51, + "learning_rate": 1.0363509660054773e-06, + "loss": 0.4767, + "step": 58966 + }, + { + "epoch": 1.51, + "learning_rate": 1.0363233138254799e-06, + "loss": 0.48, + "step": 58967 + }, + { + "epoch": 1.51, + "learning_rate": 1.0362956616176712e-06, + "loss": 0.6265, + "step": 58968 + }, + { + "epoch": 1.51, + "learning_rate": 1.0362680093820729e-06, + "loss": 0.6831, + "step": 58969 + }, + { + "epoch": 1.51, + "learning_rate": 1.0362403571187054e-06, + "loss": 0.4761, + "step": 58970 + }, + { + "epoch": 1.51, + "learning_rate": 1.0362127048275908e-06, + "loss": 0.5173, + "step": 58971 + }, + { + "epoch": 1.51, + "learning_rate": 1.0361850525087497e-06, + "loss": 0.6069, + "step": 58972 + }, + { + "epoch": 1.51, + "learning_rate": 1.0361574001622034e-06, + "loss": 0.6763, + "step": 58973 + }, + { + "epoch": 1.51, + "learning_rate": 1.0361297477879727e-06, + "loss": 0.6943, + "step": 58974 + }, + { + "epoch": 1.51, + "learning_rate": 1.0361020953860795e-06, + "loss": 0.6704, + "step": 58975 + }, + { + "epoch": 1.51, + "learning_rate": 1.0360744429565443e-06, + "loss": 0.7205, + "step": 58976 + }, + { + "epoch": 1.51, + "learning_rate": 1.036046790499389e-06, + "loss": 0.553, + "step": 58977 + }, + { + "epoch": 1.51, + "learning_rate": 1.0360191380146338e-06, + "loss": 0.5498, + "step": 58978 + }, + { + "epoch": 1.51, + "learning_rate": 1.0359914855023007e-06, + "loss": 0.667, + "step": 58979 + }, + { + "epoch": 1.51, + "learning_rate": 1.0359638329624103e-06, + "loss": 0.6484, + "step": 58980 + }, + { + "epoch": 1.51, + "learning_rate": 1.0359361803949844e-06, + "loss": 0.7568, + "step": 58981 + }, + { + "epoch": 1.51, + "learning_rate": 1.0359085278000436e-06, + "loss": 0.6709, + "step": 58982 + }, + { + "epoch": 1.51, + "learning_rate": 1.0358808751776096e-06, + "loss": 0.5903, + "step": 58983 + }, + { + "epoch": 1.51, + "learning_rate": 1.0358532225277028e-06, + "loss": 0.6172, + "step": 58984 + }, + { + "epoch": 1.51, + "learning_rate": 1.0358255698503453e-06, + "loss": 0.6982, + "step": 58985 + }, + { + "epoch": 1.51, + "learning_rate": 1.0357979171455574e-06, + "loss": 0.7168, + "step": 58986 + }, + { + "epoch": 1.51, + "learning_rate": 1.0357702644133608e-06, + "loss": 0.4629, + "step": 58987 + }, + { + "epoch": 1.51, + "learning_rate": 1.0357426116537766e-06, + "loss": 0.6826, + "step": 58988 + }, + { + "epoch": 1.51, + "learning_rate": 1.035714958866826e-06, + "loss": 0.9453, + "step": 58989 + }, + { + "epoch": 1.51, + "learning_rate": 1.03568730605253e-06, + "loss": 0.5552, + "step": 58990 + }, + { + "epoch": 1.51, + "learning_rate": 1.0356596532109099e-06, + "loss": 0.6846, + "step": 58991 + }, + { + "epoch": 1.51, + "learning_rate": 1.035632000341987e-06, + "loss": 0.6904, + "step": 58992 + }, + { + "epoch": 1.51, + "learning_rate": 1.035604347445782e-06, + "loss": 0.6387, + "step": 58993 + }, + { + "epoch": 1.51, + "learning_rate": 1.0355766945223166e-06, + "loss": 0.6504, + "step": 58994 + }, + { + "epoch": 1.51, + "learning_rate": 1.0355490415716115e-06, + "loss": 0.6816, + "step": 58995 + }, + { + "epoch": 1.51, + "learning_rate": 1.0355213885936885e-06, + "loss": 0.7139, + "step": 58996 + }, + { + "epoch": 1.51, + "learning_rate": 1.0354937355885682e-06, + "loss": 0.7217, + "step": 58997 + }, + { + "epoch": 1.51, + "learning_rate": 1.0354660825562722e-06, + "loss": 0.5776, + "step": 58998 + }, + { + "epoch": 1.51, + "learning_rate": 1.0354384294968213e-06, + "loss": 0.8604, + "step": 58999 + }, + { + "epoch": 1.51, + "learning_rate": 1.0354107764102367e-06, + "loss": 0.5859, + "step": 59000 + }, + { + "epoch": 1.51, + "learning_rate": 1.0353831232965398e-06, + "loss": 0.6768, + "step": 59001 + }, + { + "epoch": 1.51, + "learning_rate": 1.035355470155752e-06, + "loss": 0.7119, + "step": 59002 + }, + { + "epoch": 1.51, + "learning_rate": 1.0353278169878934e-06, + "loss": 0.6465, + "step": 59003 + }, + { + "epoch": 1.51, + "learning_rate": 1.0353001637929867e-06, + "loss": 0.666, + "step": 59004 + }, + { + "epoch": 1.51, + "learning_rate": 1.0352725105710515e-06, + "loss": 0.7305, + "step": 59005 + }, + { + "epoch": 1.51, + "learning_rate": 1.0352448573221102e-06, + "loss": 0.5483, + "step": 59006 + }, + { + "epoch": 1.51, + "learning_rate": 1.0352172040461838e-06, + "loss": 0.4958, + "step": 59007 + }, + { + "epoch": 1.51, + "learning_rate": 1.0351895507432926e-06, + "loss": 0.8193, + "step": 59008 + }, + { + "epoch": 1.51, + "learning_rate": 1.0351618974134588e-06, + "loss": 0.5845, + "step": 59009 + }, + { + "epoch": 1.51, + "learning_rate": 1.0351342440567031e-06, + "loss": 0.6748, + "step": 59010 + }, + { + "epoch": 1.51, + "learning_rate": 1.0351065906730465e-06, + "loss": 0.6719, + "step": 59011 + }, + { + "epoch": 1.51, + "learning_rate": 1.0350789372625105e-06, + "loss": 0.6572, + "step": 59012 + }, + { + "epoch": 1.51, + "learning_rate": 1.0350512838251164e-06, + "loss": 0.6953, + "step": 59013 + }, + { + "epoch": 1.51, + "learning_rate": 1.035023630360885e-06, + "loss": 0.6226, + "step": 59014 + }, + { + "epoch": 1.51, + "learning_rate": 1.0349959768698375e-06, + "loss": 0.832, + "step": 59015 + }, + { + "epoch": 1.51, + "learning_rate": 1.0349683233519951e-06, + "loss": 0.6104, + "step": 59016 + }, + { + "epoch": 1.51, + "learning_rate": 1.0349406698073798e-06, + "loss": 0.6606, + "step": 59017 + }, + { + "epoch": 1.51, + "learning_rate": 1.0349130162360111e-06, + "loss": 0.7087, + "step": 59018 + }, + { + "epoch": 1.51, + "learning_rate": 1.0348853626379116e-06, + "loss": 0.6641, + "step": 59019 + }, + { + "epoch": 1.51, + "learning_rate": 1.034857709013102e-06, + "loss": 0.6577, + "step": 59020 + }, + { + "epoch": 1.51, + "learning_rate": 1.0348300553616031e-06, + "loss": 0.6836, + "step": 59021 + }, + { + "epoch": 1.51, + "learning_rate": 1.034802401683437e-06, + "loss": 0.4834, + "step": 59022 + }, + { + "epoch": 1.51, + "learning_rate": 1.034774747978624e-06, + "loss": 0.5962, + "step": 59023 + }, + { + "epoch": 1.51, + "learning_rate": 1.0347470942471851e-06, + "loss": 0.4722, + "step": 59024 + }, + { + "epoch": 1.51, + "learning_rate": 1.0347194404891427e-06, + "loss": 0.5493, + "step": 59025 + }, + { + "epoch": 1.51, + "learning_rate": 1.0346917867045166e-06, + "loss": 0.7251, + "step": 59026 + }, + { + "epoch": 1.51, + "learning_rate": 1.034664132893329e-06, + "loss": 0.6167, + "step": 59027 + }, + { + "epoch": 1.51, + "learning_rate": 1.0346364790556008e-06, + "loss": 0.3945, + "step": 59028 + }, + { + "epoch": 1.51, + "learning_rate": 1.0346088251913527e-06, + "loss": 0.5795, + "step": 59029 + }, + { + "epoch": 1.51, + "learning_rate": 1.0345811713006063e-06, + "loss": 0.7617, + "step": 59030 + }, + { + "epoch": 1.51, + "learning_rate": 1.0345535173833828e-06, + "loss": 0.5449, + "step": 59031 + }, + { + "epoch": 1.51, + "learning_rate": 1.0345258634397032e-06, + "loss": 0.5752, + "step": 59032 + }, + { + "epoch": 1.51, + "learning_rate": 1.0344982094695885e-06, + "loss": 0.3206, + "step": 59033 + }, + { + "epoch": 1.51, + "learning_rate": 1.0344705554730603e-06, + "loss": 0.499, + "step": 59034 + }, + { + "epoch": 1.51, + "learning_rate": 1.0344429014501394e-06, + "loss": 0.6287, + "step": 59035 + }, + { + "epoch": 1.51, + "learning_rate": 1.0344152474008477e-06, + "loss": 0.5454, + "step": 59036 + }, + { + "epoch": 1.51, + "learning_rate": 1.0343875933252054e-06, + "loss": 0.4938, + "step": 59037 + }, + { + "epoch": 1.51, + "learning_rate": 1.0343599392232343e-06, + "loss": 0.7471, + "step": 59038 + }, + { + "epoch": 1.51, + "learning_rate": 1.034332285094955e-06, + "loss": 0.7607, + "step": 59039 + }, + { + "epoch": 1.51, + "learning_rate": 1.0343046309403894e-06, + "loss": 0.4756, + "step": 59040 + }, + { + "epoch": 1.51, + "learning_rate": 1.034276976759558e-06, + "loss": 0.751, + "step": 59041 + }, + { + "epoch": 1.51, + "learning_rate": 1.034249322552483e-06, + "loss": 0.486, + "step": 59042 + }, + { + "epoch": 1.51, + "learning_rate": 1.034221668319184e-06, + "loss": 0.3964, + "step": 59043 + }, + { + "epoch": 1.51, + "learning_rate": 1.0341940140596837e-06, + "loss": 0.5742, + "step": 59044 + }, + { + "epoch": 1.51, + "learning_rate": 1.034166359774002e-06, + "loss": 0.75, + "step": 59045 + }, + { + "epoch": 1.51, + "learning_rate": 1.0341387054621612e-06, + "loss": 0.6084, + "step": 59046 + }, + { + "epoch": 1.51, + "learning_rate": 1.034111051124182e-06, + "loss": 0.4961, + "step": 59047 + }, + { + "epoch": 1.51, + "learning_rate": 1.0340833967600853e-06, + "loss": 0.4958, + "step": 59048 + }, + { + "epoch": 1.51, + "learning_rate": 1.0340557423698922e-06, + "loss": 0.8477, + "step": 59049 + }, + { + "epoch": 1.51, + "learning_rate": 1.0340280879536247e-06, + "loss": 0.5347, + "step": 59050 + }, + { + "epoch": 1.51, + "learning_rate": 1.0340004335113031e-06, + "loss": 0.5879, + "step": 59051 + }, + { + "epoch": 1.51, + "learning_rate": 1.0339727790429492e-06, + "loss": 0.6079, + "step": 59052 + }, + { + "epoch": 1.51, + "learning_rate": 1.033945124548584e-06, + "loss": 0.7197, + "step": 59053 + }, + { + "epoch": 1.51, + "learning_rate": 1.0339174700282282e-06, + "loss": 0.6157, + "step": 59054 + }, + { + "epoch": 1.51, + "learning_rate": 1.0338898154819035e-06, + "loss": 0.5447, + "step": 59055 + }, + { + "epoch": 1.51, + "learning_rate": 1.0338621609096311e-06, + "loss": 0.5352, + "step": 59056 + }, + { + "epoch": 1.51, + "learning_rate": 1.033834506311432e-06, + "loss": 0.8145, + "step": 59057 + }, + { + "epoch": 1.51, + "learning_rate": 1.0338068516873271e-06, + "loss": 0.7109, + "step": 59058 + }, + { + "epoch": 1.51, + "learning_rate": 1.033779197037338e-06, + "loss": 0.7092, + "step": 59059 + }, + { + "epoch": 1.51, + "learning_rate": 1.0337515423614856e-06, + "loss": 0.3816, + "step": 59060 + }, + { + "epoch": 1.51, + "learning_rate": 1.0337238876597913e-06, + "loss": 0.6191, + "step": 59061 + }, + { + "epoch": 1.51, + "learning_rate": 1.0336962329322763e-06, + "loss": 0.6055, + "step": 59062 + }, + { + "epoch": 1.51, + "learning_rate": 1.0336685781789616e-06, + "loss": 0.7471, + "step": 59063 + }, + { + "epoch": 1.51, + "learning_rate": 1.0336409233998682e-06, + "loss": 0.7939, + "step": 59064 + }, + { + "epoch": 1.51, + "learning_rate": 1.0336132685950178e-06, + "loss": 0.7227, + "step": 59065 + }, + { + "epoch": 1.51, + "learning_rate": 1.033585613764431e-06, + "loss": 0.7178, + "step": 59066 + }, + { + "epoch": 1.51, + "learning_rate": 1.0335579589081295e-06, + "loss": 0.6523, + "step": 59067 + }, + { + "epoch": 1.51, + "learning_rate": 1.033530304026134e-06, + "loss": 0.6553, + "step": 59068 + }, + { + "epoch": 1.51, + "learning_rate": 1.033502649118466e-06, + "loss": 0.5977, + "step": 59069 + }, + { + "epoch": 1.51, + "learning_rate": 1.0334749941851464e-06, + "loss": 0.5127, + "step": 59070 + }, + { + "epoch": 1.51, + "learning_rate": 1.0334473392261966e-06, + "loss": 0.5151, + "step": 59071 + }, + { + "epoch": 1.51, + "learning_rate": 1.033419684241638e-06, + "loss": 0.5703, + "step": 59072 + }, + { + "epoch": 1.51, + "learning_rate": 1.033392029231491e-06, + "loss": 0.6982, + "step": 59073 + }, + { + "epoch": 1.51, + "learning_rate": 1.0333643741957776e-06, + "loss": 0.5781, + "step": 59074 + }, + { + "epoch": 1.51, + "learning_rate": 1.0333367191345186e-06, + "loss": 0.7764, + "step": 59075 + }, + { + "epoch": 1.51, + "learning_rate": 1.033309064047735e-06, + "loss": 0.5571, + "step": 59076 + }, + { + "epoch": 1.51, + "learning_rate": 1.0332814089354482e-06, + "loss": 0.4095, + "step": 59077 + }, + { + "epoch": 1.51, + "learning_rate": 1.0332537537976797e-06, + "loss": 0.5781, + "step": 59078 + }, + { + "epoch": 1.51, + "learning_rate": 1.0332260986344498e-06, + "loss": 0.5693, + "step": 59079 + }, + { + "epoch": 1.51, + "learning_rate": 1.0331984434457808e-06, + "loss": 0.7681, + "step": 59080 + }, + { + "epoch": 1.51, + "learning_rate": 1.0331707882316928e-06, + "loss": 0.6602, + "step": 59081 + }, + { + "epoch": 1.51, + "learning_rate": 1.0331431329922077e-06, + "loss": 0.5859, + "step": 59082 + }, + { + "epoch": 1.51, + "learning_rate": 1.0331154777273464e-06, + "loss": 0.7012, + "step": 59083 + }, + { + "epoch": 1.51, + "learning_rate": 1.0330878224371302e-06, + "loss": 0.5232, + "step": 59084 + }, + { + "epoch": 1.51, + "learning_rate": 1.0330601671215797e-06, + "loss": 0.6426, + "step": 59085 + }, + { + "epoch": 1.51, + "learning_rate": 1.033032511780717e-06, + "loss": 0.564, + "step": 59086 + }, + { + "epoch": 1.51, + "learning_rate": 1.0330048564145628e-06, + "loss": 0.7148, + "step": 59087 + }, + { + "epoch": 1.51, + "learning_rate": 1.0329772010231383e-06, + "loss": 0.6733, + "step": 59088 + }, + { + "epoch": 1.51, + "learning_rate": 1.0329495456064645e-06, + "loss": 0.4561, + "step": 59089 + }, + { + "epoch": 1.51, + "learning_rate": 1.032921890164563e-06, + "loss": 0.665, + "step": 59090 + }, + { + "epoch": 1.51, + "learning_rate": 1.0328942346974543e-06, + "loss": 0.5615, + "step": 59091 + }, + { + "epoch": 1.51, + "learning_rate": 1.0328665792051606e-06, + "loss": 0.6008, + "step": 59092 + }, + { + "epoch": 1.51, + "learning_rate": 1.032838923687702e-06, + "loss": 0.5967, + "step": 59093 + }, + { + "epoch": 1.51, + "learning_rate": 1.0328112681451002e-06, + "loss": 0.7822, + "step": 59094 + }, + { + "epoch": 1.51, + "learning_rate": 1.0327836125773763e-06, + "loss": 0.7148, + "step": 59095 + }, + { + "epoch": 1.51, + "learning_rate": 1.0327559569845517e-06, + "loss": 0.5708, + "step": 59096 + }, + { + "epoch": 1.51, + "learning_rate": 1.0327283013666473e-06, + "loss": 0.4622, + "step": 59097 + }, + { + "epoch": 1.51, + "learning_rate": 1.0327006457236842e-06, + "loss": 0.6123, + "step": 59098 + }, + { + "epoch": 1.51, + "learning_rate": 1.0326729900556839e-06, + "loss": 0.5303, + "step": 59099 + }, + { + "epoch": 1.51, + "learning_rate": 1.032645334362667e-06, + "loss": 0.5542, + "step": 59100 + }, + { + "epoch": 1.51, + "learning_rate": 1.0326176786446556e-06, + "loss": 0.7432, + "step": 59101 + }, + { + "epoch": 1.51, + "learning_rate": 1.0325900229016703e-06, + "loss": 0.6323, + "step": 59102 + }, + { + "epoch": 1.51, + "learning_rate": 1.0325623671337321e-06, + "loss": 0.6211, + "step": 59103 + }, + { + "epoch": 1.51, + "learning_rate": 1.0325347113408622e-06, + "loss": 0.6621, + "step": 59104 + }, + { + "epoch": 1.51, + "learning_rate": 1.0325070555230824e-06, + "loss": 0.5962, + "step": 59105 + }, + { + "epoch": 1.51, + "learning_rate": 1.032479399680413e-06, + "loss": 0.397, + "step": 59106 + }, + { + "epoch": 1.51, + "learning_rate": 1.0324517438128764e-06, + "loss": 0.5908, + "step": 59107 + }, + { + "epoch": 1.51, + "learning_rate": 1.0324240879204922e-06, + "loss": 0.6797, + "step": 59108 + }, + { + "epoch": 1.51, + "learning_rate": 1.0323964320032827e-06, + "loss": 0.4375, + "step": 59109 + }, + { + "epoch": 1.52, + "learning_rate": 1.0323687760612685e-06, + "loss": 0.5958, + "step": 59110 + }, + { + "epoch": 1.52, + "learning_rate": 1.0323411200944712e-06, + "loss": 0.7178, + "step": 59111 + }, + { + "epoch": 1.52, + "learning_rate": 1.032313464102912e-06, + "loss": 0.8262, + "step": 59112 + }, + { + "epoch": 1.52, + "learning_rate": 1.0322858080866117e-06, + "loss": 0.665, + "step": 59113 + }, + { + "epoch": 1.52, + "learning_rate": 1.0322581520455912e-06, + "loss": 0.5854, + "step": 59114 + }, + { + "epoch": 1.52, + "learning_rate": 1.0322304959798727e-06, + "loss": 0.6611, + "step": 59115 + }, + { + "epoch": 1.52, + "learning_rate": 1.0322028398894764e-06, + "loss": 0.6816, + "step": 59116 + }, + { + "epoch": 1.52, + "learning_rate": 1.0321751837744241e-06, + "loss": 0.6904, + "step": 59117 + }, + { + "epoch": 1.52, + "learning_rate": 1.0321475276347368e-06, + "loss": 0.6699, + "step": 59118 + }, + { + "epoch": 1.52, + "learning_rate": 1.0321198714704355e-06, + "loss": 0.8008, + "step": 59119 + }, + { + "epoch": 1.52, + "learning_rate": 1.0320922152815415e-06, + "loss": 0.6626, + "step": 59120 + }, + { + "epoch": 1.52, + "learning_rate": 1.0320645590680762e-06, + "loss": 0.5957, + "step": 59121 + }, + { + "epoch": 1.52, + "learning_rate": 1.0320369028300602e-06, + "loss": 0.6807, + "step": 59122 + }, + { + "epoch": 1.52, + "learning_rate": 1.032009246567515e-06, + "loss": 0.5454, + "step": 59123 + }, + { + "epoch": 1.52, + "learning_rate": 1.031981590280462e-06, + "loss": 0.7246, + "step": 59124 + }, + { + "epoch": 1.52, + "learning_rate": 1.0319539339689222e-06, + "loss": 0.7979, + "step": 59125 + }, + { + "epoch": 1.52, + "learning_rate": 1.0319262776329165e-06, + "loss": 0.7246, + "step": 59126 + }, + { + "epoch": 1.52, + "learning_rate": 1.0318986212724666e-06, + "loss": 0.5698, + "step": 59127 + }, + { + "epoch": 1.52, + "learning_rate": 1.0318709648875933e-06, + "loss": 0.4902, + "step": 59128 + }, + { + "epoch": 1.52, + "learning_rate": 1.0318433084783176e-06, + "loss": 0.6577, + "step": 59129 + }, + { + "epoch": 1.52, + "learning_rate": 1.0318156520446613e-06, + "loss": 0.7197, + "step": 59130 + }, + { + "epoch": 1.52, + "learning_rate": 1.0317879955866448e-06, + "loss": 0.541, + "step": 59131 + }, + { + "epoch": 1.52, + "learning_rate": 1.0317603391042901e-06, + "loss": 0.6821, + "step": 59132 + }, + { + "epoch": 1.52, + "learning_rate": 1.0317326825976177e-06, + "loss": 0.5918, + "step": 59133 + }, + { + "epoch": 1.52, + "learning_rate": 1.0317050260666492e-06, + "loss": 0.647, + "step": 59134 + }, + { + "epoch": 1.52, + "learning_rate": 1.0316773695114056e-06, + "loss": 0.626, + "step": 59135 + }, + { + "epoch": 1.52, + "learning_rate": 1.031649712931908e-06, + "loss": 0.5717, + "step": 59136 + }, + { + "epoch": 1.52, + "learning_rate": 1.0316220563281782e-06, + "loss": 0.8037, + "step": 59137 + }, + { + "epoch": 1.52, + "learning_rate": 1.0315943997002363e-06, + "loss": 0.5596, + "step": 59138 + }, + { + "epoch": 1.52, + "learning_rate": 1.031566743048104e-06, + "loss": 0.7393, + "step": 59139 + }, + { + "epoch": 1.52, + "learning_rate": 1.0315390863718027e-06, + "loss": 0.6042, + "step": 59140 + }, + { + "epoch": 1.52, + "learning_rate": 1.0315114296713533e-06, + "loss": 0.5396, + "step": 59141 + }, + { + "epoch": 1.52, + "learning_rate": 1.031483772946777e-06, + "loss": 0.6133, + "step": 59142 + }, + { + "epoch": 1.52, + "learning_rate": 1.031456116198095e-06, + "loss": 0.7832, + "step": 59143 + }, + { + "epoch": 1.52, + "learning_rate": 1.0314284594253285e-06, + "loss": 0.584, + "step": 59144 + }, + { + "epoch": 1.52, + "learning_rate": 1.0314008026284988e-06, + "loss": 0.5825, + "step": 59145 + }, + { + "epoch": 1.52, + "learning_rate": 1.031373145807627e-06, + "loss": 0.7012, + "step": 59146 + }, + { + "epoch": 1.52, + "learning_rate": 1.0313454889627343e-06, + "loss": 0.6699, + "step": 59147 + }, + { + "epoch": 1.52, + "learning_rate": 1.0313178320938414e-06, + "loss": 0.7822, + "step": 59148 + }, + { + "epoch": 1.52, + "learning_rate": 1.03129017520097e-06, + "loss": 0.6641, + "step": 59149 + }, + { + "epoch": 1.52, + "learning_rate": 1.0312625182841412e-06, + "loss": 0.5669, + "step": 59150 + }, + { + "epoch": 1.52, + "learning_rate": 1.031234861343376e-06, + "loss": 0.6372, + "step": 59151 + }, + { + "epoch": 1.52, + "learning_rate": 1.0312072043786962e-06, + "loss": 0.647, + "step": 59152 + }, + { + "epoch": 1.52, + "learning_rate": 1.0311795473901222e-06, + "loss": 0.7285, + "step": 59153 + }, + { + "epoch": 1.52, + "learning_rate": 1.0311518903776752e-06, + "loss": 0.6738, + "step": 59154 + }, + { + "epoch": 1.52, + "learning_rate": 1.031124233341377e-06, + "loss": 0.7423, + "step": 59155 + }, + { + "epoch": 1.52, + "learning_rate": 1.031096576281248e-06, + "loss": 0.488, + "step": 59156 + }, + { + "epoch": 1.52, + "learning_rate": 1.0310689191973104e-06, + "loss": 0.6472, + "step": 59157 + }, + { + "epoch": 1.52, + "learning_rate": 1.031041262089584e-06, + "loss": 0.5801, + "step": 59158 + }, + { + "epoch": 1.52, + "learning_rate": 1.0310136049580912e-06, + "loss": 0.8027, + "step": 59159 + }, + { + "epoch": 1.52, + "learning_rate": 1.0309859478028527e-06, + "loss": 0.6714, + "step": 59160 + }, + { + "epoch": 1.52, + "learning_rate": 1.0309582906238896e-06, + "loss": 0.5713, + "step": 59161 + }, + { + "epoch": 1.52, + "learning_rate": 1.0309306334212231e-06, + "loss": 0.7559, + "step": 59162 + }, + { + "epoch": 1.52, + "learning_rate": 1.0309029761948745e-06, + "loss": 0.7021, + "step": 59163 + }, + { + "epoch": 1.52, + "learning_rate": 1.0308753189448648e-06, + "loss": 0.6689, + "step": 59164 + }, + { + "epoch": 1.52, + "learning_rate": 1.0308476616712155e-06, + "loss": 0.413, + "step": 59165 + }, + { + "epoch": 1.52, + "learning_rate": 1.0308200043739476e-06, + "loss": 0.562, + "step": 59166 + }, + { + "epoch": 1.52, + "learning_rate": 1.0307923470530819e-06, + "loss": 0.6602, + "step": 59167 + }, + { + "epoch": 1.52, + "learning_rate": 1.0307646897086401e-06, + "loss": 0.582, + "step": 59168 + }, + { + "epoch": 1.52, + "learning_rate": 1.0307370323406432e-06, + "loss": 0.6758, + "step": 59169 + }, + { + "epoch": 1.52, + "learning_rate": 1.0307093749491125e-06, + "loss": 0.6299, + "step": 59170 + }, + { + "epoch": 1.52, + "learning_rate": 1.0306817175340687e-06, + "loss": 0.6709, + "step": 59171 + }, + { + "epoch": 1.52, + "learning_rate": 1.0306540600955338e-06, + "loss": 0.6948, + "step": 59172 + }, + { + "epoch": 1.52, + "learning_rate": 1.0306264026335281e-06, + "loss": 0.6172, + "step": 59173 + }, + { + "epoch": 1.52, + "learning_rate": 1.0305987451480736e-06, + "loss": 0.8633, + "step": 59174 + }, + { + "epoch": 1.52, + "learning_rate": 1.0305710876391905e-06, + "loss": 0.6201, + "step": 59175 + }, + { + "epoch": 1.52, + "learning_rate": 1.0305434301069008e-06, + "loss": 0.6465, + "step": 59176 + }, + { + "epoch": 1.52, + "learning_rate": 1.0305157725512255e-06, + "loss": 0.6709, + "step": 59177 + }, + { + "epoch": 1.52, + "learning_rate": 1.0304881149721857e-06, + "loss": 0.564, + "step": 59178 + }, + { + "epoch": 1.52, + "learning_rate": 1.0304604573698022e-06, + "loss": 0.7559, + "step": 59179 + }, + { + "epoch": 1.52, + "learning_rate": 1.0304327997440966e-06, + "loss": 0.5786, + "step": 59180 + }, + { + "epoch": 1.52, + "learning_rate": 1.0304051420950902e-06, + "loss": 0.8828, + "step": 59181 + }, + { + "epoch": 1.52, + "learning_rate": 1.030377484422804e-06, + "loss": 0.6101, + "step": 59182 + }, + { + "epoch": 1.52, + "learning_rate": 1.030349826727259e-06, + "loss": 0.457, + "step": 59183 + }, + { + "epoch": 1.52, + "learning_rate": 1.0303221690084766e-06, + "loss": 0.4658, + "step": 59184 + }, + { + "epoch": 1.52, + "learning_rate": 1.030294511266478e-06, + "loss": 0.4958, + "step": 59185 + }, + { + "epoch": 1.52, + "learning_rate": 1.030266853501284e-06, + "loss": 0.7144, + "step": 59186 + }, + { + "epoch": 1.52, + "learning_rate": 1.0302391957129166e-06, + "loss": 0.7148, + "step": 59187 + }, + { + "epoch": 1.52, + "learning_rate": 1.0302115379013959e-06, + "loss": 0.6216, + "step": 59188 + }, + { + "epoch": 1.52, + "learning_rate": 1.030183880066744e-06, + "loss": 0.7158, + "step": 59189 + }, + { + "epoch": 1.52, + "learning_rate": 1.0301562222089811e-06, + "loss": 0.604, + "step": 59190 + }, + { + "epoch": 1.52, + "learning_rate": 1.0301285643281297e-06, + "loss": 0.6213, + "step": 59191 + }, + { + "epoch": 1.52, + "learning_rate": 1.03010090642421e-06, + "loss": 0.6602, + "step": 59192 + }, + { + "epoch": 1.52, + "learning_rate": 1.0300732484972433e-06, + "loss": 0.6265, + "step": 59193 + }, + { + "epoch": 1.52, + "learning_rate": 1.030045590547251e-06, + "loss": 0.5864, + "step": 59194 + }, + { + "epoch": 1.52, + "learning_rate": 1.030017932574254e-06, + "loss": 0.645, + "step": 59195 + }, + { + "epoch": 1.52, + "learning_rate": 1.0299902745782736e-06, + "loss": 0.6553, + "step": 59196 + }, + { + "epoch": 1.52, + "learning_rate": 1.0299626165593316e-06, + "loss": 0.626, + "step": 59197 + }, + { + "epoch": 1.52, + "learning_rate": 1.029934958517448e-06, + "loss": 0.6113, + "step": 59198 + }, + { + "epoch": 1.52, + "learning_rate": 1.0299073004526448e-06, + "loss": 0.7109, + "step": 59199 + }, + { + "epoch": 1.52, + "learning_rate": 1.0298796423649428e-06, + "loss": 0.6523, + "step": 59200 + }, + { + "epoch": 1.52, + "learning_rate": 1.0298519842543635e-06, + "loss": 0.5427, + "step": 59201 + }, + { + "epoch": 1.52, + "learning_rate": 1.029824326120928e-06, + "loss": 0.7451, + "step": 59202 + }, + { + "epoch": 1.52, + "learning_rate": 1.0297966679646572e-06, + "loss": 0.6885, + "step": 59203 + }, + { + "epoch": 1.52, + "learning_rate": 1.0297690097855724e-06, + "loss": 0.6216, + "step": 59204 + }, + { + "epoch": 1.52, + "learning_rate": 1.029741351583695e-06, + "loss": 0.814, + "step": 59205 + }, + { + "epoch": 1.52, + "learning_rate": 1.0297136933590457e-06, + "loss": 0.5938, + "step": 59206 + }, + { + "epoch": 1.52, + "learning_rate": 1.0296860351116465e-06, + "loss": 0.6626, + "step": 59207 + }, + { + "epoch": 1.52, + "learning_rate": 1.029658376841518e-06, + "loss": 0.7246, + "step": 59208 + }, + { + "epoch": 1.52, + "learning_rate": 1.0296307185486812e-06, + "loss": 0.5972, + "step": 59209 + }, + { + "epoch": 1.52, + "learning_rate": 1.0296030602331574e-06, + "loss": 0.417, + "step": 59210 + }, + { + "epoch": 1.52, + "learning_rate": 1.0295754018949683e-06, + "loss": 0.5449, + "step": 59211 + }, + { + "epoch": 1.52, + "learning_rate": 1.0295477435341344e-06, + "loss": 0.6182, + "step": 59212 + }, + { + "epoch": 1.52, + "learning_rate": 1.0295200851506772e-06, + "loss": 0.637, + "step": 59213 + }, + { + "epoch": 1.52, + "learning_rate": 1.0294924267446179e-06, + "loss": 0.6792, + "step": 59214 + }, + { + "epoch": 1.52, + "learning_rate": 1.0294647683159773e-06, + "loss": 0.7383, + "step": 59215 + }, + { + "epoch": 1.52, + "learning_rate": 1.029437109864777e-06, + "loss": 0.4993, + "step": 59216 + }, + { + "epoch": 1.52, + "learning_rate": 1.0294094513910386e-06, + "loss": 0.7949, + "step": 59217 + }, + { + "epoch": 1.52, + "learning_rate": 1.0293817928947824e-06, + "loss": 0.7422, + "step": 59218 + }, + { + "epoch": 1.52, + "learning_rate": 1.0293541343760294e-06, + "loss": 0.6094, + "step": 59219 + }, + { + "epoch": 1.52, + "learning_rate": 1.0293264758348018e-06, + "loss": 0.5923, + "step": 59220 + }, + { + "epoch": 1.52, + "learning_rate": 1.02929881727112e-06, + "loss": 0.7129, + "step": 59221 + }, + { + "epoch": 1.52, + "learning_rate": 1.029271158685006e-06, + "loss": 0.7036, + "step": 59222 + }, + { + "epoch": 1.52, + "learning_rate": 1.0292435000764802e-06, + "loss": 0.5996, + "step": 59223 + }, + { + "epoch": 1.52, + "learning_rate": 1.029215841445564e-06, + "loss": 0.5718, + "step": 59224 + }, + { + "epoch": 1.52, + "learning_rate": 1.029188182792278e-06, + "loss": 0.583, + "step": 59225 + }, + { + "epoch": 1.52, + "learning_rate": 1.0291605241166443e-06, + "loss": 0.7754, + "step": 59226 + }, + { + "epoch": 1.52, + "learning_rate": 1.0291328654186839e-06, + "loss": 0.5935, + "step": 59227 + }, + { + "epoch": 1.52, + "learning_rate": 1.029105206698418e-06, + "loss": 0.5693, + "step": 59228 + }, + { + "epoch": 1.52, + "learning_rate": 1.0290775479558671e-06, + "loss": 0.6377, + "step": 59229 + }, + { + "epoch": 1.52, + "learning_rate": 1.029049889191053e-06, + "loss": 0.7368, + "step": 59230 + }, + { + "epoch": 1.52, + "learning_rate": 1.0290222304039966e-06, + "loss": 0.666, + "step": 59231 + }, + { + "epoch": 1.52, + "learning_rate": 1.0289945715947195e-06, + "loss": 0.6465, + "step": 59232 + }, + { + "epoch": 1.52, + "learning_rate": 1.0289669127632426e-06, + "loss": 0.7539, + "step": 59233 + }, + { + "epoch": 1.52, + "learning_rate": 1.0289392539095867e-06, + "loss": 0.4158, + "step": 59234 + }, + { + "epoch": 1.52, + "learning_rate": 1.0289115950337736e-06, + "loss": 0.5889, + "step": 59235 + }, + { + "epoch": 1.52, + "learning_rate": 1.028883936135824e-06, + "loss": 0.666, + "step": 59236 + }, + { + "epoch": 1.52, + "learning_rate": 1.0288562772157602e-06, + "loss": 0.7783, + "step": 59237 + }, + { + "epoch": 1.52, + "learning_rate": 1.0288286182736014e-06, + "loss": 0.7754, + "step": 59238 + }, + { + "epoch": 1.52, + "learning_rate": 1.0288009593093703e-06, + "loss": 0.5869, + "step": 59239 + }, + { + "epoch": 1.52, + "learning_rate": 1.0287733003230873e-06, + "loss": 0.5938, + "step": 59240 + }, + { + "epoch": 1.52, + "learning_rate": 1.0287456413147745e-06, + "loss": 0.3835, + "step": 59241 + }, + { + "epoch": 1.52, + "learning_rate": 1.0287179822844523e-06, + "loss": 0.4558, + "step": 59242 + }, + { + "epoch": 1.52, + "learning_rate": 1.0286903232321418e-06, + "loss": 0.5454, + "step": 59243 + }, + { + "epoch": 1.52, + "learning_rate": 1.0286626641578644e-06, + "loss": 0.686, + "step": 59244 + }, + { + "epoch": 1.52, + "learning_rate": 1.0286350050616418e-06, + "loss": 0.6519, + "step": 59245 + }, + { + "epoch": 1.52, + "learning_rate": 1.0286073459434944e-06, + "loss": 0.7227, + "step": 59246 + }, + { + "epoch": 1.52, + "learning_rate": 1.0285796868034436e-06, + "loss": 0.7783, + "step": 59247 + }, + { + "epoch": 1.52, + "learning_rate": 1.0285520276415105e-06, + "loss": 0.4767, + "step": 59248 + }, + { + "epoch": 1.52, + "learning_rate": 1.0285243684577168e-06, + "loss": 0.5996, + "step": 59249 + }, + { + "epoch": 1.52, + "learning_rate": 1.028496709252083e-06, + "loss": 0.6621, + "step": 59250 + }, + { + "epoch": 1.52, + "learning_rate": 1.0284690500246306e-06, + "loss": 0.6318, + "step": 59251 + }, + { + "epoch": 1.52, + "learning_rate": 1.0284413907753811e-06, + "loss": 0.7056, + "step": 59252 + }, + { + "epoch": 1.52, + "learning_rate": 1.0284137315043549e-06, + "loss": 0.7275, + "step": 59253 + }, + { + "epoch": 1.52, + "learning_rate": 1.0283860722115739e-06, + "loss": 0.7529, + "step": 59254 + }, + { + "epoch": 1.52, + "learning_rate": 1.0283584128970588e-06, + "loss": 0.4888, + "step": 59255 + }, + { + "epoch": 1.52, + "learning_rate": 1.0283307535608311e-06, + "loss": 0.5466, + "step": 59256 + }, + { + "epoch": 1.52, + "learning_rate": 1.0283030942029118e-06, + "loss": 0.6221, + "step": 59257 + }, + { + "epoch": 1.52, + "learning_rate": 1.028275434823322e-06, + "loss": 0.5347, + "step": 59258 + }, + { + "epoch": 1.52, + "learning_rate": 1.028247775422083e-06, + "loss": 0.793, + "step": 59259 + }, + { + "epoch": 1.52, + "learning_rate": 1.0282201159992164e-06, + "loss": 0.7051, + "step": 59260 + }, + { + "epoch": 1.52, + "learning_rate": 1.0281924565547425e-06, + "loss": 0.5767, + "step": 59261 + }, + { + "epoch": 1.52, + "learning_rate": 1.0281647970886833e-06, + "loss": 0.7695, + "step": 59262 + }, + { + "epoch": 1.52, + "learning_rate": 1.0281371376010593e-06, + "loss": 0.667, + "step": 59263 + }, + { + "epoch": 1.52, + "learning_rate": 1.0281094780918919e-06, + "loss": 0.6973, + "step": 59264 + }, + { + "epoch": 1.52, + "learning_rate": 1.0280818185612026e-06, + "loss": 0.5764, + "step": 59265 + }, + { + "epoch": 1.52, + "learning_rate": 1.0280541590090126e-06, + "loss": 0.665, + "step": 59266 + }, + { + "epoch": 1.52, + "learning_rate": 1.0280264994353424e-06, + "loss": 0.4692, + "step": 59267 + }, + { + "epoch": 1.52, + "learning_rate": 1.0279988398402138e-06, + "loss": 0.5913, + "step": 59268 + }, + { + "epoch": 1.52, + "learning_rate": 1.0279711802236474e-06, + "loss": 0.7266, + "step": 59269 + }, + { + "epoch": 1.52, + "learning_rate": 1.0279435205856653e-06, + "loss": 0.6729, + "step": 59270 + }, + { + "epoch": 1.52, + "learning_rate": 1.027915860926288e-06, + "loss": 0.4204, + "step": 59271 + }, + { + "epoch": 1.52, + "learning_rate": 1.0278882012455364e-06, + "loss": 0.5271, + "step": 59272 + }, + { + "epoch": 1.52, + "learning_rate": 1.0278605415434325e-06, + "loss": 0.7573, + "step": 59273 + }, + { + "epoch": 1.52, + "learning_rate": 1.0278328818199968e-06, + "loss": 0.8223, + "step": 59274 + }, + { + "epoch": 1.52, + "learning_rate": 1.0278052220752509e-06, + "loss": 0.5952, + "step": 59275 + }, + { + "epoch": 1.52, + "learning_rate": 1.0277775623092158e-06, + "loss": 0.6309, + "step": 59276 + }, + { + "epoch": 1.52, + "learning_rate": 1.0277499025219128e-06, + "loss": 0.7183, + "step": 59277 + }, + { + "epoch": 1.52, + "learning_rate": 1.0277222427133628e-06, + "loss": 0.511, + "step": 59278 + }, + { + "epoch": 1.52, + "learning_rate": 1.0276945828835872e-06, + "loss": 0.5767, + "step": 59279 + }, + { + "epoch": 1.52, + "learning_rate": 1.0276669230326068e-06, + "loss": 0.6123, + "step": 59280 + }, + { + "epoch": 1.52, + "learning_rate": 1.027639263160444e-06, + "loss": 0.6201, + "step": 59281 + }, + { + "epoch": 1.52, + "learning_rate": 1.0276116032671184e-06, + "loss": 0.5798, + "step": 59282 + }, + { + "epoch": 1.52, + "learning_rate": 1.027583943352652e-06, + "loss": 0.6592, + "step": 59283 + }, + { + "epoch": 1.52, + "learning_rate": 1.0275562834170657e-06, + "loss": 0.5923, + "step": 59284 + }, + { + "epoch": 1.52, + "learning_rate": 1.0275286234603811e-06, + "loss": 0.834, + "step": 59285 + }, + { + "epoch": 1.52, + "learning_rate": 1.0275009634826192e-06, + "loss": 0.6387, + "step": 59286 + }, + { + "epoch": 1.52, + "learning_rate": 1.0274733034838008e-06, + "loss": 0.5908, + "step": 59287 + }, + { + "epoch": 1.52, + "learning_rate": 1.027445643463947e-06, + "loss": 0.585, + "step": 59288 + }, + { + "epoch": 1.52, + "learning_rate": 1.02741798342308e-06, + "loss": 0.6289, + "step": 59289 + }, + { + "epoch": 1.52, + "learning_rate": 1.02739032336122e-06, + "loss": 0.751, + "step": 59290 + }, + { + "epoch": 1.52, + "learning_rate": 1.0273626632783887e-06, + "loss": 0.6172, + "step": 59291 + }, + { + "epoch": 1.52, + "learning_rate": 1.0273350031746069e-06, + "loss": 0.481, + "step": 59292 + }, + { + "epoch": 1.52, + "learning_rate": 1.027307343049896e-06, + "loss": 0.5986, + "step": 59293 + }, + { + "epoch": 1.52, + "learning_rate": 1.027279682904277e-06, + "loss": 0.6855, + "step": 59294 + }, + { + "epoch": 1.52, + "learning_rate": 1.0272520227377713e-06, + "loss": 0.5591, + "step": 59295 + }, + { + "epoch": 1.52, + "learning_rate": 1.0272243625504e-06, + "loss": 0.7227, + "step": 59296 + }, + { + "epoch": 1.52, + "learning_rate": 1.027196702342184e-06, + "loss": 0.5593, + "step": 59297 + }, + { + "epoch": 1.52, + "learning_rate": 1.027169042113145e-06, + "loss": 0.75, + "step": 59298 + }, + { + "epoch": 1.52, + "learning_rate": 1.027141381863304e-06, + "loss": 0.7227, + "step": 59299 + }, + { + "epoch": 1.52, + "learning_rate": 1.0271137215926816e-06, + "loss": 0.6226, + "step": 59300 + }, + { + "epoch": 1.52, + "learning_rate": 1.0270860613013002e-06, + "loss": 0.9805, + "step": 59301 + }, + { + "epoch": 1.52, + "learning_rate": 1.0270584009891799e-06, + "loss": 0.6553, + "step": 59302 + }, + { + "epoch": 1.52, + "learning_rate": 1.0270307406563419e-06, + "loss": 0.6689, + "step": 59303 + }, + { + "epoch": 1.52, + "learning_rate": 1.0270030803028082e-06, + "loss": 0.832, + "step": 59304 + }, + { + "epoch": 1.52, + "learning_rate": 1.0269754199285992e-06, + "loss": 0.5835, + "step": 59305 + }, + { + "epoch": 1.52, + "learning_rate": 1.0269477595337366e-06, + "loss": 0.6743, + "step": 59306 + }, + { + "epoch": 1.52, + "learning_rate": 1.026920099118241e-06, + "loss": 0.5605, + "step": 59307 + }, + { + "epoch": 1.52, + "learning_rate": 1.0268924386821342e-06, + "loss": 0.6118, + "step": 59308 + }, + { + "epoch": 1.52, + "learning_rate": 1.026864778225437e-06, + "loss": 0.7412, + "step": 59309 + }, + { + "epoch": 1.52, + "learning_rate": 1.0268371177481708e-06, + "loss": 0.7598, + "step": 59310 + }, + { + "epoch": 1.52, + "learning_rate": 1.0268094572503564e-06, + "loss": 0.4661, + "step": 59311 + }, + { + "epoch": 1.52, + "learning_rate": 1.0267817967320155e-06, + "loss": 0.6177, + "step": 59312 + }, + { + "epoch": 1.52, + "learning_rate": 1.0267541361931685e-06, + "loss": 0.6265, + "step": 59313 + }, + { + "epoch": 1.52, + "learning_rate": 1.0267264756338376e-06, + "loss": 0.6982, + "step": 59314 + }, + { + "epoch": 1.52, + "learning_rate": 1.0266988150540431e-06, + "loss": 0.5737, + "step": 59315 + }, + { + "epoch": 1.52, + "learning_rate": 1.0266711544538075e-06, + "loss": 0.6953, + "step": 59316 + }, + { + "epoch": 1.52, + "learning_rate": 1.0266434938331498e-06, + "loss": 0.7725, + "step": 59317 + }, + { + "epoch": 1.52, + "learning_rate": 1.026615833192093e-06, + "loss": 0.4285, + "step": 59318 + }, + { + "epoch": 1.52, + "learning_rate": 1.0265881725306576e-06, + "loss": 0.7383, + "step": 59319 + }, + { + "epoch": 1.52, + "learning_rate": 1.026560511848865e-06, + "loss": 0.5381, + "step": 59320 + }, + { + "epoch": 1.52, + "learning_rate": 1.0265328511467358e-06, + "loss": 0.582, + "step": 59321 + }, + { + "epoch": 1.52, + "learning_rate": 1.0265051904242917e-06, + "loss": 0.5229, + "step": 59322 + }, + { + "epoch": 1.52, + "learning_rate": 1.0264775296815542e-06, + "loss": 0.667, + "step": 59323 + }, + { + "epoch": 1.52, + "learning_rate": 1.0264498689185436e-06, + "loss": 0.6099, + "step": 59324 + }, + { + "epoch": 1.52, + "learning_rate": 1.026422208135282e-06, + "loss": 0.5491, + "step": 59325 + }, + { + "epoch": 1.52, + "learning_rate": 1.02639454733179e-06, + "loss": 0.5532, + "step": 59326 + }, + { + "epoch": 1.52, + "learning_rate": 1.026366886508089e-06, + "loss": 0.5376, + "step": 59327 + }, + { + "epoch": 1.52, + "learning_rate": 1.0263392256641997e-06, + "loss": 0.7539, + "step": 59328 + }, + { + "epoch": 1.52, + "learning_rate": 1.0263115648001442e-06, + "loss": 0.6948, + "step": 59329 + }, + { + "epoch": 1.52, + "learning_rate": 1.0262839039159426e-06, + "loss": 0.4434, + "step": 59330 + }, + { + "epoch": 1.52, + "learning_rate": 1.026256243011617e-06, + "loss": 0.4946, + "step": 59331 + }, + { + "epoch": 1.52, + "learning_rate": 1.026228582087188e-06, + "loss": 0.54, + "step": 59332 + }, + { + "epoch": 1.52, + "learning_rate": 1.0262009211426773e-06, + "loss": 0.6797, + "step": 59333 + }, + { + "epoch": 1.52, + "learning_rate": 1.0261732601781052e-06, + "loss": 0.6362, + "step": 59334 + }, + { + "epoch": 1.52, + "learning_rate": 1.0261455991934938e-06, + "loss": 0.6089, + "step": 59335 + }, + { + "epoch": 1.52, + "learning_rate": 1.026117938188864e-06, + "loss": 0.6411, + "step": 59336 + }, + { + "epoch": 1.52, + "learning_rate": 1.0260902771642367e-06, + "loss": 0.7017, + "step": 59337 + }, + { + "epoch": 1.52, + "learning_rate": 1.0260626161196334e-06, + "loss": 0.7676, + "step": 59338 + }, + { + "epoch": 1.52, + "learning_rate": 1.026034955055075e-06, + "loss": 0.6572, + "step": 59339 + }, + { + "epoch": 1.52, + "learning_rate": 1.0260072939705827e-06, + "loss": 0.8301, + "step": 59340 + }, + { + "epoch": 1.52, + "learning_rate": 1.0259796328661782e-06, + "loss": 0.6343, + "step": 59341 + }, + { + "epoch": 1.52, + "learning_rate": 1.0259519717418822e-06, + "loss": 0.7197, + "step": 59342 + }, + { + "epoch": 1.52, + "learning_rate": 1.0259243105977159e-06, + "loss": 0.5833, + "step": 59343 + }, + { + "epoch": 1.52, + "learning_rate": 1.0258966494337004e-06, + "loss": 0.9023, + "step": 59344 + }, + { + "epoch": 1.52, + "learning_rate": 1.0258689882498573e-06, + "loss": 0.4688, + "step": 59345 + }, + { + "epoch": 1.52, + "learning_rate": 1.0258413270462074e-06, + "loss": 0.6382, + "step": 59346 + }, + { + "epoch": 1.52, + "learning_rate": 1.025813665822772e-06, + "loss": 0.3816, + "step": 59347 + }, + { + "epoch": 1.52, + "learning_rate": 1.0257860045795722e-06, + "loss": 0.7686, + "step": 59348 + }, + { + "epoch": 1.52, + "learning_rate": 1.025758343316629e-06, + "loss": 0.71, + "step": 59349 + }, + { + "epoch": 1.52, + "learning_rate": 1.0257306820339642e-06, + "loss": 0.7285, + "step": 59350 + }, + { + "epoch": 1.52, + "learning_rate": 1.0257030207315986e-06, + "loss": 0.6035, + "step": 59351 + }, + { + "epoch": 1.52, + "learning_rate": 1.0256753594095532e-06, + "loss": 0.5229, + "step": 59352 + }, + { + "epoch": 1.52, + "learning_rate": 1.0256476980678492e-06, + "loss": 0.5835, + "step": 59353 + }, + { + "epoch": 1.52, + "learning_rate": 1.0256200367065085e-06, + "loss": 0.52, + "step": 59354 + }, + { + "epoch": 1.52, + "learning_rate": 1.0255923753255511e-06, + "loss": 0.7139, + "step": 59355 + }, + { + "epoch": 1.52, + "learning_rate": 1.0255647139249993e-06, + "loss": 0.8535, + "step": 59356 + }, + { + "epoch": 1.52, + "learning_rate": 1.0255370525048735e-06, + "loss": 0.5415, + "step": 59357 + }, + { + "epoch": 1.52, + "learning_rate": 1.0255093910651953e-06, + "loss": 0.7051, + "step": 59358 + }, + { + "epoch": 1.52, + "learning_rate": 1.0254817296059854e-06, + "loss": 0.707, + "step": 59359 + }, + { + "epoch": 1.52, + "learning_rate": 1.0254540681272656e-06, + "loss": 0.7012, + "step": 59360 + }, + { + "epoch": 1.52, + "learning_rate": 1.0254264066290567e-06, + "loss": 0.73, + "step": 59361 + }, + { + "epoch": 1.52, + "learning_rate": 1.0253987451113801e-06, + "loss": 0.7383, + "step": 59362 + }, + { + "epoch": 1.52, + "learning_rate": 1.0253710835742566e-06, + "loss": 0.585, + "step": 59363 + }, + { + "epoch": 1.52, + "learning_rate": 1.025343422017708e-06, + "loss": 0.834, + "step": 59364 + }, + { + "epoch": 1.52, + "learning_rate": 1.0253157604417545e-06, + "loss": 0.6111, + "step": 59365 + }, + { + "epoch": 1.52, + "learning_rate": 1.0252880988464186e-06, + "loss": 0.5825, + "step": 59366 + }, + { + "epoch": 1.52, + "learning_rate": 1.0252604372317204e-06, + "loss": 0.6387, + "step": 59367 + }, + { + "epoch": 1.52, + "learning_rate": 1.0252327755976812e-06, + "loss": 0.835, + "step": 59368 + }, + { + "epoch": 1.52, + "learning_rate": 1.0252051139443227e-06, + "loss": 0.7148, + "step": 59369 + }, + { + "epoch": 1.52, + "learning_rate": 1.0251774522716658e-06, + "loss": 0.6157, + "step": 59370 + }, + { + "epoch": 1.52, + "learning_rate": 1.025149790579732e-06, + "loss": 0.7061, + "step": 59371 + }, + { + "epoch": 1.52, + "learning_rate": 1.0251221288685416e-06, + "loss": 0.5215, + "step": 59372 + }, + { + "epoch": 1.52, + "learning_rate": 1.0250944671381169e-06, + "loss": 0.6875, + "step": 59373 + }, + { + "epoch": 1.52, + "learning_rate": 1.0250668053884778e-06, + "loss": 0.5693, + "step": 59374 + }, + { + "epoch": 1.52, + "learning_rate": 1.0250391436196469e-06, + "loss": 0.6626, + "step": 59375 + }, + { + "epoch": 1.52, + "learning_rate": 1.0250114818316442e-06, + "loss": 0.4661, + "step": 59376 + }, + { + "epoch": 1.52, + "learning_rate": 1.0249838200244918e-06, + "loss": 0.7178, + "step": 59377 + }, + { + "epoch": 1.52, + "learning_rate": 1.02495615819821e-06, + "loss": 0.8125, + "step": 59378 + }, + { + "epoch": 1.52, + "learning_rate": 1.0249284963528207e-06, + "loss": 0.4993, + "step": 59379 + }, + { + "epoch": 1.52, + "learning_rate": 1.0249008344883445e-06, + "loss": 0.5596, + "step": 59380 + }, + { + "epoch": 1.52, + "learning_rate": 1.0248731726048033e-06, + "loss": 0.7139, + "step": 59381 + }, + { + "epoch": 1.52, + "learning_rate": 1.0248455107022177e-06, + "loss": 0.6807, + "step": 59382 + }, + { + "epoch": 1.52, + "learning_rate": 1.024817848780609e-06, + "loss": 0.7354, + "step": 59383 + }, + { + "epoch": 1.52, + "learning_rate": 1.0247901868399982e-06, + "loss": 0.4683, + "step": 59384 + }, + { + "epoch": 1.52, + "learning_rate": 1.0247625248804068e-06, + "loss": 0.7432, + "step": 59385 + }, + { + "epoch": 1.52, + "learning_rate": 1.024734862901856e-06, + "loss": 0.5918, + "step": 59386 + }, + { + "epoch": 1.52, + "learning_rate": 1.0247072009043667e-06, + "loss": 0.6445, + "step": 59387 + }, + { + "epoch": 1.52, + "learning_rate": 1.0246795388879603e-06, + "loss": 0.5732, + "step": 59388 + }, + { + "epoch": 1.52, + "learning_rate": 1.0246518768526581e-06, + "loss": 0.6709, + "step": 59389 + }, + { + "epoch": 1.52, + "learning_rate": 1.0246242147984807e-06, + "loss": 0.6758, + "step": 59390 + }, + { + "epoch": 1.52, + "learning_rate": 1.0245965527254501e-06, + "loss": 0.8398, + "step": 59391 + }, + { + "epoch": 1.52, + "learning_rate": 1.024568890633587e-06, + "loss": 0.5322, + "step": 59392 + }, + { + "epoch": 1.52, + "learning_rate": 1.0245412285229123e-06, + "loss": 0.7119, + "step": 59393 + }, + { + "epoch": 1.52, + "learning_rate": 1.0245135663934476e-06, + "loss": 0.6294, + "step": 59394 + }, + { + "epoch": 1.52, + "learning_rate": 1.0244859042452141e-06, + "loss": 0.6313, + "step": 59395 + }, + { + "epoch": 1.52, + "learning_rate": 1.024458242078233e-06, + "loss": 0.7529, + "step": 59396 + }, + { + "epoch": 1.52, + "learning_rate": 1.024430579892525e-06, + "loss": 0.561, + "step": 59397 + }, + { + "epoch": 1.52, + "learning_rate": 1.024402917688112e-06, + "loss": 0.875, + "step": 59398 + }, + { + "epoch": 1.52, + "learning_rate": 1.0243752554650145e-06, + "loss": 0.6416, + "step": 59399 + }, + { + "epoch": 1.52, + "learning_rate": 1.0243475932232542e-06, + "loss": 0.623, + "step": 59400 + }, + { + "epoch": 1.52, + "learning_rate": 1.0243199309628522e-06, + "loss": 0.5015, + "step": 59401 + }, + { + "epoch": 1.52, + "learning_rate": 1.0242922686838294e-06, + "loss": 0.5576, + "step": 59402 + }, + { + "epoch": 1.52, + "learning_rate": 1.0242646063862068e-06, + "loss": 0.6274, + "step": 59403 + }, + { + "epoch": 1.52, + "learning_rate": 1.0242369440700063e-06, + "loss": 0.3384, + "step": 59404 + }, + { + "epoch": 1.52, + "learning_rate": 1.0242092817352483e-06, + "loss": 0.6777, + "step": 59405 + }, + { + "epoch": 1.52, + "learning_rate": 1.024181619381955e-06, + "loss": 0.4412, + "step": 59406 + }, + { + "epoch": 1.52, + "learning_rate": 1.0241539570101462e-06, + "loss": 0.7373, + "step": 59407 + }, + { + "epoch": 1.52, + "learning_rate": 1.0241262946198443e-06, + "loss": 0.7402, + "step": 59408 + }, + { + "epoch": 1.52, + "learning_rate": 1.0240986322110698e-06, + "loss": 0.5752, + "step": 59409 + }, + { + "epoch": 1.52, + "learning_rate": 1.0240709697838444e-06, + "loss": 0.5327, + "step": 59410 + }, + { + "epoch": 1.52, + "learning_rate": 1.0240433073381888e-06, + "loss": 0.6152, + "step": 59411 + }, + { + "epoch": 1.52, + "learning_rate": 1.024015644874124e-06, + "loss": 0.5579, + "step": 59412 + }, + { + "epoch": 1.52, + "learning_rate": 1.023987982391672e-06, + "loss": 0.6108, + "step": 59413 + }, + { + "epoch": 1.52, + "learning_rate": 1.0239603198908534e-06, + "loss": 0.6255, + "step": 59414 + }, + { + "epoch": 1.52, + "learning_rate": 1.0239326573716893e-06, + "loss": 0.5479, + "step": 59415 + }, + { + "epoch": 1.52, + "learning_rate": 1.0239049948342014e-06, + "loss": 0.71, + "step": 59416 + }, + { + "epoch": 1.52, + "learning_rate": 1.0238773322784102e-06, + "loss": 0.6792, + "step": 59417 + }, + { + "epoch": 1.52, + "learning_rate": 1.0238496697043372e-06, + "loss": 0.6221, + "step": 59418 + }, + { + "epoch": 1.52, + "learning_rate": 1.0238220071120037e-06, + "loss": 0.8418, + "step": 59419 + }, + { + "epoch": 1.52, + "learning_rate": 1.0237943445014307e-06, + "loss": 0.6157, + "step": 59420 + }, + { + "epoch": 1.52, + "learning_rate": 1.02376668187264e-06, + "loss": 0.6895, + "step": 59421 + }, + { + "epoch": 1.52, + "learning_rate": 1.0237390192256517e-06, + "loss": 0.707, + "step": 59422 + }, + { + "epoch": 1.52, + "learning_rate": 1.0237113565604878e-06, + "loss": 0.5166, + "step": 59423 + }, + { + "epoch": 1.52, + "learning_rate": 1.023683693877169e-06, + "loss": 0.6572, + "step": 59424 + }, + { + "epoch": 1.52, + "learning_rate": 1.0236560311757167e-06, + "loss": 0.7603, + "step": 59425 + }, + { + "epoch": 1.52, + "learning_rate": 1.0236283684561523e-06, + "loss": 0.6895, + "step": 59426 + }, + { + "epoch": 1.52, + "learning_rate": 1.0236007057184965e-06, + "loss": 0.7002, + "step": 59427 + }, + { + "epoch": 1.52, + "learning_rate": 1.0235730429627708e-06, + "loss": 0.5215, + "step": 59428 + }, + { + "epoch": 1.52, + "learning_rate": 1.0235453801889964e-06, + "loss": 0.7095, + "step": 59429 + }, + { + "epoch": 1.52, + "learning_rate": 1.023517717397194e-06, + "loss": 0.6626, + "step": 59430 + }, + { + "epoch": 1.52, + "learning_rate": 1.0234900545873855e-06, + "loss": 0.6875, + "step": 59431 + }, + { + "epoch": 1.52, + "learning_rate": 1.0234623917595917e-06, + "loss": 0.5957, + "step": 59432 + }, + { + "epoch": 1.52, + "learning_rate": 1.0234347289138338e-06, + "loss": 0.5942, + "step": 59433 + }, + { + "epoch": 1.52, + "learning_rate": 1.0234070660501332e-06, + "loss": 0.6841, + "step": 59434 + }, + { + "epoch": 1.52, + "learning_rate": 1.0233794031685106e-06, + "loss": 0.7617, + "step": 59435 + }, + { + "epoch": 1.52, + "learning_rate": 1.0233517402689877e-06, + "loss": 0.6479, + "step": 59436 + }, + { + "epoch": 1.52, + "learning_rate": 1.0233240773515852e-06, + "loss": 0.4231, + "step": 59437 + }, + { + "epoch": 1.52, + "learning_rate": 1.0232964144163247e-06, + "loss": 0.7207, + "step": 59438 + }, + { + "epoch": 1.52, + "learning_rate": 1.023268751463227e-06, + "loss": 0.4351, + "step": 59439 + }, + { + "epoch": 1.52, + "learning_rate": 1.0232410884923137e-06, + "loss": 0.7026, + "step": 59440 + }, + { + "epoch": 1.52, + "learning_rate": 1.0232134255036059e-06, + "loss": 0.5266, + "step": 59441 + }, + { + "epoch": 1.52, + "learning_rate": 1.0231857624971245e-06, + "loss": 0.7246, + "step": 59442 + }, + { + "epoch": 1.52, + "learning_rate": 1.0231580994728906e-06, + "loss": 0.6514, + "step": 59443 + }, + { + "epoch": 1.52, + "learning_rate": 1.023130436430926e-06, + "loss": 0.8066, + "step": 59444 + }, + { + "epoch": 1.52, + "learning_rate": 1.023102773371251e-06, + "loss": 0.6831, + "step": 59445 + }, + { + "epoch": 1.52, + "learning_rate": 1.0230751102938877e-06, + "loss": 0.6309, + "step": 59446 + }, + { + "epoch": 1.52, + "learning_rate": 1.0230474471988567e-06, + "loss": 0.7168, + "step": 59447 + }, + { + "epoch": 1.52, + "learning_rate": 1.0230197840861794e-06, + "loss": 0.7559, + "step": 59448 + }, + { + "epoch": 1.52, + "learning_rate": 1.0229921209558767e-06, + "loss": 0.7012, + "step": 59449 + }, + { + "epoch": 1.52, + "learning_rate": 1.0229644578079702e-06, + "loss": 0.6675, + "step": 59450 + }, + { + "epoch": 1.52, + "learning_rate": 1.0229367946424807e-06, + "loss": 0.6572, + "step": 59451 + }, + { + "epoch": 1.52, + "learning_rate": 1.0229091314594298e-06, + "loss": 0.583, + "step": 59452 + }, + { + "epoch": 1.52, + "learning_rate": 1.0228814682588383e-06, + "loss": 0.5084, + "step": 59453 + }, + { + "epoch": 1.52, + "learning_rate": 1.0228538050407275e-06, + "loss": 0.624, + "step": 59454 + }, + { + "epoch": 1.52, + "learning_rate": 1.0228261418051182e-06, + "loss": 0.3838, + "step": 59455 + }, + { + "epoch": 1.52, + "learning_rate": 1.0227984785520325e-06, + "loss": 0.644, + "step": 59456 + }, + { + "epoch": 1.52, + "learning_rate": 1.0227708152814912e-06, + "loss": 0.5852, + "step": 59457 + }, + { + "epoch": 1.52, + "learning_rate": 1.0227431519935147e-06, + "loss": 0.7354, + "step": 59458 + }, + { + "epoch": 1.52, + "learning_rate": 1.0227154886881254e-06, + "loss": 0.6318, + "step": 59459 + }, + { + "epoch": 1.52, + "learning_rate": 1.0226878253653435e-06, + "loss": 0.5728, + "step": 59460 + }, + { + "epoch": 1.52, + "learning_rate": 1.0226601620251908e-06, + "loss": 0.5874, + "step": 59461 + }, + { + "epoch": 1.52, + "learning_rate": 1.0226324986676882e-06, + "loss": 0.5571, + "step": 59462 + }, + { + "epoch": 1.52, + "learning_rate": 1.022604835292857e-06, + "loss": 0.6743, + "step": 59463 + }, + { + "epoch": 1.52, + "learning_rate": 1.0225771719007182e-06, + "loss": 0.6904, + "step": 59464 + }, + { + "epoch": 1.52, + "learning_rate": 1.0225495084912933e-06, + "loss": 0.7109, + "step": 59465 + }, + { + "epoch": 1.52, + "learning_rate": 1.0225218450646029e-06, + "loss": 0.792, + "step": 59466 + }, + { + "epoch": 1.52, + "learning_rate": 1.022494181620669e-06, + "loss": 0.5693, + "step": 59467 + }, + { + "epoch": 1.52, + "learning_rate": 1.0224665181595118e-06, + "loss": 0.6084, + "step": 59468 + }, + { + "epoch": 1.52, + "learning_rate": 1.0224388546811535e-06, + "loss": 0.8203, + "step": 59469 + }, + { + "epoch": 1.52, + "learning_rate": 1.0224111911856143e-06, + "loss": 0.6143, + "step": 59470 + }, + { + "epoch": 1.52, + "learning_rate": 1.0223835276729167e-06, + "loss": 0.6846, + "step": 59471 + }, + { + "epoch": 1.52, + "learning_rate": 1.0223558641430803e-06, + "loss": 0.5864, + "step": 59472 + }, + { + "epoch": 1.52, + "learning_rate": 1.0223282005961276e-06, + "loss": 0.4028, + "step": 59473 + }, + { + "epoch": 1.52, + "learning_rate": 1.0223005370320787e-06, + "loss": 0.4946, + "step": 59474 + }, + { + "epoch": 1.52, + "learning_rate": 1.0222728734509556e-06, + "loss": 0.6558, + "step": 59475 + }, + { + "epoch": 1.52, + "learning_rate": 1.0222452098527791e-06, + "loss": 0.4904, + "step": 59476 + }, + { + "epoch": 1.52, + "learning_rate": 1.0222175462375703e-06, + "loss": 0.6416, + "step": 59477 + }, + { + "epoch": 1.52, + "learning_rate": 1.022189882605351e-06, + "loss": 0.7314, + "step": 59478 + }, + { + "epoch": 1.52, + "learning_rate": 1.0221622189561417e-06, + "loss": 0.6631, + "step": 59479 + }, + { + "epoch": 1.52, + "learning_rate": 1.0221345552899635e-06, + "loss": 0.8174, + "step": 59480 + }, + { + "epoch": 1.52, + "learning_rate": 1.0221068916068386e-06, + "loss": 0.4692, + "step": 59481 + }, + { + "epoch": 1.52, + "learning_rate": 1.022079227906787e-06, + "loss": 0.7334, + "step": 59482 + }, + { + "epoch": 1.52, + "learning_rate": 1.0220515641898302e-06, + "loss": 0.6162, + "step": 59483 + }, + { + "epoch": 1.52, + "learning_rate": 1.0220239004559896e-06, + "loss": 0.5435, + "step": 59484 + }, + { + "epoch": 1.52, + "learning_rate": 1.0219962367052862e-06, + "loss": 0.4768, + "step": 59485 + }, + { + "epoch": 1.52, + "learning_rate": 1.0219685729377422e-06, + "loss": 0.6367, + "step": 59486 + }, + { + "epoch": 1.52, + "learning_rate": 1.0219409091533769e-06, + "loss": 0.6924, + "step": 59487 + }, + { + "epoch": 1.52, + "learning_rate": 1.0219132453522128e-06, + "loss": 0.6646, + "step": 59488 + }, + { + "epoch": 1.52, + "learning_rate": 1.0218855815342707e-06, + "loss": 0.6934, + "step": 59489 + }, + { + "epoch": 1.52, + "learning_rate": 1.0218579176995715e-06, + "loss": 0.5806, + "step": 59490 + }, + { + "epoch": 1.52, + "learning_rate": 1.0218302538481373e-06, + "loss": 0.3357, + "step": 59491 + }, + { + "epoch": 1.52, + "learning_rate": 1.0218025899799884e-06, + "loss": 0.7119, + "step": 59492 + }, + { + "epoch": 1.52, + "learning_rate": 1.021774926095146e-06, + "loss": 0.5449, + "step": 59493 + }, + { + "epoch": 1.52, + "learning_rate": 1.021747262193632e-06, + "loss": 0.627, + "step": 59494 + }, + { + "epoch": 1.52, + "learning_rate": 1.0217195982754668e-06, + "loss": 0.6816, + "step": 59495 + }, + { + "epoch": 1.52, + "learning_rate": 1.021691934340672e-06, + "loss": 0.8057, + "step": 59496 + }, + { + "epoch": 1.52, + "learning_rate": 1.021664270389269e-06, + "loss": 0.5205, + "step": 59497 + }, + { + "epoch": 1.52, + "learning_rate": 1.0216366064212783e-06, + "loss": 0.6904, + "step": 59498 + }, + { + "epoch": 1.52, + "learning_rate": 1.0216089424367214e-06, + "loss": 0.751, + "step": 59499 + }, + { + "epoch": 1.53, + "learning_rate": 1.0215812784356195e-06, + "loss": 0.7119, + "step": 59500 + }, + { + "epoch": 1.53, + "learning_rate": 1.0215536144179942e-06, + "loss": 0.7061, + "step": 59501 + }, + { + "epoch": 1.53, + "learning_rate": 1.0215259503838658e-06, + "loss": 0.6826, + "step": 59502 + }, + { + "epoch": 1.53, + "learning_rate": 1.0214982863332562e-06, + "loss": 0.5996, + "step": 59503 + }, + { + "epoch": 1.53, + "learning_rate": 1.0214706222661863e-06, + "loss": 0.6587, + "step": 59504 + }, + { + "epoch": 1.53, + "learning_rate": 1.0214429581826773e-06, + "loss": 0.6758, + "step": 59505 + }, + { + "epoch": 1.53, + "learning_rate": 1.0214152940827505e-06, + "loss": 0.7812, + "step": 59506 + }, + { + "epoch": 1.53, + "learning_rate": 1.0213876299664273e-06, + "loss": 0.4482, + "step": 59507 + }, + { + "epoch": 1.53, + "learning_rate": 1.021359965833728e-06, + "loss": 0.5518, + "step": 59508 + }, + { + "epoch": 1.53, + "learning_rate": 1.0213323016846746e-06, + "loss": 0.4028, + "step": 59509 + }, + { + "epoch": 1.53, + "learning_rate": 1.021304637519288e-06, + "loss": 0.5471, + "step": 59510 + }, + { + "epoch": 1.53, + "learning_rate": 1.0212769733375897e-06, + "loss": 0.6533, + "step": 59511 + }, + { + "epoch": 1.53, + "learning_rate": 1.0212493091396002e-06, + "loss": 0.665, + "step": 59512 + }, + { + "epoch": 1.53, + "learning_rate": 1.0212216449253412e-06, + "loss": 0.6279, + "step": 59513 + }, + { + "epoch": 1.53, + "learning_rate": 1.0211939806948337e-06, + "loss": 0.502, + "step": 59514 + }, + { + "epoch": 1.53, + "learning_rate": 1.0211663164480993e-06, + "loss": 0.5435, + "step": 59515 + }, + { + "epoch": 1.53, + "learning_rate": 1.0211386521851585e-06, + "loss": 0.584, + "step": 59516 + }, + { + "epoch": 1.53, + "learning_rate": 1.021110987906033e-06, + "loss": 0.5996, + "step": 59517 + }, + { + "epoch": 1.53, + "learning_rate": 1.0210833236107434e-06, + "loss": 0.6211, + "step": 59518 + }, + { + "epoch": 1.53, + "learning_rate": 1.0210556592993118e-06, + "loss": 0.5725, + "step": 59519 + }, + { + "epoch": 1.53, + "learning_rate": 1.0210279949717585e-06, + "loss": 0.6899, + "step": 59520 + }, + { + "epoch": 1.53, + "learning_rate": 1.0210003306281052e-06, + "loss": 0.605, + "step": 59521 + }, + { + "epoch": 1.53, + "learning_rate": 1.0209726662683729e-06, + "loss": 0.7393, + "step": 59522 + }, + { + "epoch": 1.53, + "learning_rate": 1.0209450018925825e-06, + "loss": 0.6216, + "step": 59523 + }, + { + "epoch": 1.53, + "learning_rate": 1.0209173375007559e-06, + "loss": 0.6426, + "step": 59524 + }, + { + "epoch": 1.53, + "learning_rate": 1.0208896730929135e-06, + "loss": 0.5181, + "step": 59525 + }, + { + "epoch": 1.53, + "learning_rate": 1.0208620086690771e-06, + "loss": 0.6104, + "step": 59526 + }, + { + "epoch": 1.53, + "learning_rate": 1.0208343442292676e-06, + "loss": 0.7578, + "step": 59527 + }, + { + "epoch": 1.53, + "learning_rate": 1.020806679773506e-06, + "loss": 0.6069, + "step": 59528 + }, + { + "epoch": 1.53, + "learning_rate": 1.0207790153018135e-06, + "loss": 0.7246, + "step": 59529 + }, + { + "epoch": 1.53, + "learning_rate": 1.020751350814212e-06, + "loss": 0.4556, + "step": 59530 + }, + { + "epoch": 1.53, + "learning_rate": 1.020723686310722e-06, + "loss": 0.7207, + "step": 59531 + }, + { + "epoch": 1.53, + "learning_rate": 1.0206960217913648e-06, + "loss": 0.6396, + "step": 59532 + }, + { + "epoch": 1.53, + "learning_rate": 1.0206683572561613e-06, + "loss": 0.8232, + "step": 59533 + }, + { + "epoch": 1.53, + "learning_rate": 1.0206406927051334e-06, + "loss": 0.6265, + "step": 59534 + }, + { + "epoch": 1.53, + "learning_rate": 1.0206130281383017e-06, + "loss": 0.4194, + "step": 59535 + }, + { + "epoch": 1.53, + "learning_rate": 1.0205853635556877e-06, + "loss": 0.6382, + "step": 59536 + }, + { + "epoch": 1.53, + "learning_rate": 1.020557698957312e-06, + "loss": 0.5742, + "step": 59537 + }, + { + "epoch": 1.53, + "learning_rate": 1.0205300343431967e-06, + "loss": 0.7305, + "step": 59538 + }, + { + "epoch": 1.53, + "learning_rate": 1.020502369713362e-06, + "loss": 0.8447, + "step": 59539 + }, + { + "epoch": 1.53, + "learning_rate": 1.0204747050678302e-06, + "loss": 0.5732, + "step": 59540 + }, + { + "epoch": 1.53, + "learning_rate": 1.0204470404066215e-06, + "loss": 0.2485, + "step": 59541 + }, + { + "epoch": 1.53, + "learning_rate": 1.0204193757297575e-06, + "loss": 0.7246, + "step": 59542 + }, + { + "epoch": 1.53, + "learning_rate": 1.0203917110372594e-06, + "loss": 0.4927, + "step": 59543 + }, + { + "epoch": 1.53, + "learning_rate": 1.0203640463291481e-06, + "loss": 0.584, + "step": 59544 + }, + { + "epoch": 1.53, + "learning_rate": 1.0203363816054451e-06, + "loss": 0.6465, + "step": 59545 + }, + { + "epoch": 1.53, + "learning_rate": 1.0203087168661713e-06, + "loss": 0.5508, + "step": 59546 + }, + { + "epoch": 1.53, + "learning_rate": 1.0202810521113483e-06, + "loss": 0.7427, + "step": 59547 + }, + { + "epoch": 1.53, + "learning_rate": 1.0202533873409968e-06, + "loss": 0.5903, + "step": 59548 + }, + { + "epoch": 1.53, + "learning_rate": 1.0202257225551385e-06, + "loss": 0.6836, + "step": 59549 + }, + { + "epoch": 1.53, + "learning_rate": 1.0201980577537941e-06, + "loss": 0.7988, + "step": 59550 + }, + { + "epoch": 1.53, + "learning_rate": 1.020170392936985e-06, + "loss": 0.6416, + "step": 59551 + }, + { + "epoch": 1.53, + "learning_rate": 1.0201427281047324e-06, + "loss": 0.6216, + "step": 59552 + }, + { + "epoch": 1.53, + "learning_rate": 1.0201150632570574e-06, + "loss": 0.6187, + "step": 59553 + }, + { + "epoch": 1.53, + "learning_rate": 1.0200873983939813e-06, + "loss": 0.7246, + "step": 59554 + }, + { + "epoch": 1.53, + "learning_rate": 1.0200597335155251e-06, + "loss": 0.6973, + "step": 59555 + }, + { + "epoch": 1.53, + "learning_rate": 1.0200320686217102e-06, + "loss": 0.5332, + "step": 59556 + }, + { + "epoch": 1.53, + "learning_rate": 1.0200044037125577e-06, + "loss": 0.6069, + "step": 59557 + }, + { + "epoch": 1.53, + "learning_rate": 1.0199767387880884e-06, + "loss": 0.7842, + "step": 59558 + }, + { + "epoch": 1.53, + "learning_rate": 1.0199490738483242e-06, + "loss": 0.7617, + "step": 59559 + }, + { + "epoch": 1.53, + "learning_rate": 1.019921408893286e-06, + "loss": 0.6196, + "step": 59560 + }, + { + "epoch": 1.53, + "learning_rate": 1.0198937439229947e-06, + "loss": 0.3867, + "step": 59561 + }, + { + "epoch": 1.53, + "learning_rate": 1.0198660789374712e-06, + "loss": 0.6204, + "step": 59562 + }, + { + "epoch": 1.53, + "learning_rate": 1.019838413936738e-06, + "loss": 0.6826, + "step": 59563 + }, + { + "epoch": 1.53, + "learning_rate": 1.0198107489208148e-06, + "loss": 0.7256, + "step": 59564 + }, + { + "epoch": 1.53, + "learning_rate": 1.0197830838897237e-06, + "loss": 0.8037, + "step": 59565 + }, + { + "epoch": 1.53, + "learning_rate": 1.0197554188434856e-06, + "loss": 0.7007, + "step": 59566 + }, + { + "epoch": 1.53, + "learning_rate": 1.0197277537821216e-06, + "loss": 0.5283, + "step": 59567 + }, + { + "epoch": 1.53, + "learning_rate": 1.019700088705653e-06, + "loss": 0.791, + "step": 59568 + }, + { + "epoch": 1.53, + "learning_rate": 1.0196724236141008e-06, + "loss": 0.832, + "step": 59569 + }, + { + "epoch": 1.53, + "learning_rate": 1.0196447585074868e-06, + "loss": 0.8604, + "step": 59570 + }, + { + "epoch": 1.53, + "learning_rate": 1.0196170933858311e-06, + "loss": 0.75, + "step": 59571 + }, + { + "epoch": 1.53, + "learning_rate": 1.0195894282491561e-06, + "loss": 0.873, + "step": 59572 + }, + { + "epoch": 1.53, + "learning_rate": 1.0195617630974819e-06, + "loss": 0.7256, + "step": 59573 + }, + { + "epoch": 1.53, + "learning_rate": 1.0195340979308304e-06, + "loss": 0.5046, + "step": 59574 + }, + { + "epoch": 1.53, + "learning_rate": 1.0195064327492226e-06, + "loss": 0.6826, + "step": 59575 + }, + { + "epoch": 1.53, + "learning_rate": 1.0194787675526796e-06, + "loss": 0.4978, + "step": 59576 + }, + { + "epoch": 1.53, + "learning_rate": 1.0194511023412222e-06, + "loss": 0.6875, + "step": 59577 + }, + { + "epoch": 1.53, + "learning_rate": 1.0194234371148724e-06, + "loss": 0.5635, + "step": 59578 + }, + { + "epoch": 1.53, + "learning_rate": 1.0193957718736507e-06, + "loss": 0.7119, + "step": 59579 + }, + { + "epoch": 1.53, + "learning_rate": 1.019368106617579e-06, + "loss": 0.7246, + "step": 59580 + }, + { + "epoch": 1.53, + "learning_rate": 1.0193404413466774e-06, + "loss": 0.6084, + "step": 59581 + }, + { + "epoch": 1.53, + "learning_rate": 1.0193127760609683e-06, + "loss": 0.6738, + "step": 59582 + }, + { + "epoch": 1.53, + "learning_rate": 1.0192851107604718e-06, + "loss": 0.4426, + "step": 59583 + }, + { + "epoch": 1.53, + "learning_rate": 1.01925744544521e-06, + "loss": 0.3772, + "step": 59584 + }, + { + "epoch": 1.53, + "learning_rate": 1.0192297801152036e-06, + "loss": 0.6477, + "step": 59585 + }, + { + "epoch": 1.53, + "learning_rate": 1.0192021147704734e-06, + "loss": 0.4814, + "step": 59586 + }, + { + "epoch": 1.53, + "learning_rate": 1.0191744494110415e-06, + "loss": 0.469, + "step": 59587 + }, + { + "epoch": 1.53, + "learning_rate": 1.0191467840369285e-06, + "loss": 0.7178, + "step": 59588 + }, + { + "epoch": 1.53, + "learning_rate": 1.0191191186481556e-06, + "loss": 0.4893, + "step": 59589 + }, + { + "epoch": 1.53, + "learning_rate": 1.0190914532447442e-06, + "loss": 0.6135, + "step": 59590 + }, + { + "epoch": 1.53, + "learning_rate": 1.0190637878267151e-06, + "loss": 0.7891, + "step": 59591 + }, + { + "epoch": 1.53, + "learning_rate": 1.01903612239409e-06, + "loss": 0.6846, + "step": 59592 + }, + { + "epoch": 1.53, + "learning_rate": 1.0190084569468897e-06, + "loss": 0.665, + "step": 59593 + }, + { + "epoch": 1.53, + "learning_rate": 1.0189807914851354e-06, + "loss": 0.6333, + "step": 59594 + }, + { + "epoch": 1.53, + "learning_rate": 1.0189531260088489e-06, + "loss": 0.5837, + "step": 59595 + }, + { + "epoch": 1.53, + "learning_rate": 1.0189254605180501e-06, + "loss": 0.5918, + "step": 59596 + }, + { + "epoch": 1.53, + "learning_rate": 1.0188977950127614e-06, + "loss": 0.6289, + "step": 59597 + }, + { + "epoch": 1.53, + "learning_rate": 1.0188701294930033e-06, + "loss": 0.6973, + "step": 59598 + }, + { + "epoch": 1.53, + "learning_rate": 1.0188424639587973e-06, + "loss": 0.748, + "step": 59599 + }, + { + "epoch": 1.53, + "learning_rate": 1.0188147984101647e-06, + "loss": 0.71, + "step": 59600 + }, + { + "epoch": 1.53, + "learning_rate": 1.0187871328471265e-06, + "loss": 0.5713, + "step": 59601 + }, + { + "epoch": 1.53, + "learning_rate": 1.0187594672697033e-06, + "loss": 0.6904, + "step": 59602 + }, + { + "epoch": 1.53, + "learning_rate": 1.0187318016779175e-06, + "loss": 0.7158, + "step": 59603 + }, + { + "epoch": 1.53, + "learning_rate": 1.0187041360717889e-06, + "loss": 0.7744, + "step": 59604 + }, + { + "epoch": 1.53, + "learning_rate": 1.01867647045134e-06, + "loss": 0.7803, + "step": 59605 + }, + { + "epoch": 1.53, + "learning_rate": 1.0186488048165913e-06, + "loss": 0.7891, + "step": 59606 + }, + { + "epoch": 1.53, + "learning_rate": 1.018621139167564e-06, + "loss": 0.626, + "step": 59607 + }, + { + "epoch": 1.53, + "learning_rate": 1.0185934735042792e-06, + "loss": 0.7314, + "step": 59608 + }, + { + "epoch": 1.53, + "learning_rate": 1.0185658078267584e-06, + "loss": 0.8184, + "step": 59609 + }, + { + "epoch": 1.53, + "learning_rate": 1.0185381421350227e-06, + "loss": 0.6768, + "step": 59610 + }, + { + "epoch": 1.53, + "learning_rate": 1.0185104764290929e-06, + "loss": 0.668, + "step": 59611 + }, + { + "epoch": 1.53, + "learning_rate": 1.0184828107089907e-06, + "loss": 0.8281, + "step": 59612 + }, + { + "epoch": 1.53, + "learning_rate": 1.018455144974737e-06, + "loss": 0.7988, + "step": 59613 + }, + { + "epoch": 1.53, + "learning_rate": 1.018427479226353e-06, + "loss": 0.6074, + "step": 59614 + }, + { + "epoch": 1.53, + "learning_rate": 1.0183998134638601e-06, + "loss": 0.6897, + "step": 59615 + }, + { + "epoch": 1.53, + "learning_rate": 1.018372147687279e-06, + "loss": 0.6982, + "step": 59616 + }, + { + "epoch": 1.53, + "learning_rate": 1.0183444818966313e-06, + "loss": 0.6006, + "step": 59617 + }, + { + "epoch": 1.53, + "learning_rate": 1.0183168160919385e-06, + "loss": 0.574, + "step": 59618 + }, + { + "epoch": 1.53, + "learning_rate": 1.0182891502732207e-06, + "loss": 0.7051, + "step": 59619 + }, + { + "epoch": 1.53, + "learning_rate": 1.0182614844405004e-06, + "loss": 0.8018, + "step": 59620 + }, + { + "epoch": 1.53, + "learning_rate": 1.0182338185937975e-06, + "loss": 0.7773, + "step": 59621 + }, + { + "epoch": 1.53, + "learning_rate": 1.0182061527331343e-06, + "loss": 0.5901, + "step": 59622 + }, + { + "epoch": 1.53, + "learning_rate": 1.018178486858531e-06, + "loss": 0.2466, + "step": 59623 + }, + { + "epoch": 1.53, + "learning_rate": 1.0181508209700096e-06, + "loss": 0.4519, + "step": 59624 + }, + { + "epoch": 1.53, + "learning_rate": 1.0181231550675908e-06, + "loss": 0.5034, + "step": 59625 + }, + { + "epoch": 1.53, + "learning_rate": 1.0180954891512963e-06, + "loss": 0.7529, + "step": 59626 + }, + { + "epoch": 1.53, + "learning_rate": 1.0180678232211464e-06, + "loss": 0.5933, + "step": 59627 + }, + { + "epoch": 1.53, + "learning_rate": 1.018040157277163e-06, + "loss": 0.6064, + "step": 59628 + }, + { + "epoch": 1.53, + "learning_rate": 1.0180124913193671e-06, + "loss": 0.6836, + "step": 59629 + }, + { + "epoch": 1.53, + "learning_rate": 1.0179848253477798e-06, + "loss": 0.6172, + "step": 59630 + }, + { + "epoch": 1.53, + "learning_rate": 1.0179571593624225e-06, + "loss": 0.4814, + "step": 59631 + }, + { + "epoch": 1.53, + "learning_rate": 1.0179294933633163e-06, + "loss": 0.5737, + "step": 59632 + }, + { + "epoch": 1.53, + "learning_rate": 1.017901827350482e-06, + "loss": 0.5583, + "step": 59633 + }, + { + "epoch": 1.53, + "learning_rate": 1.0178741613239412e-06, + "loss": 0.5767, + "step": 59634 + }, + { + "epoch": 1.53, + "learning_rate": 1.0178464952837152e-06, + "loss": 0.5791, + "step": 59635 + }, + { + "epoch": 1.53, + "learning_rate": 1.0178188292298246e-06, + "loss": 0.5913, + "step": 59636 + }, + { + "epoch": 1.53, + "learning_rate": 1.0177911631622913e-06, + "loss": 0.568, + "step": 59637 + }, + { + "epoch": 1.53, + "learning_rate": 1.0177634970811357e-06, + "loss": 0.7061, + "step": 59638 + }, + { + "epoch": 1.53, + "learning_rate": 1.0177358309863798e-06, + "loss": 0.6616, + "step": 59639 + }, + { + "epoch": 1.53, + "learning_rate": 1.0177081648780443e-06, + "loss": 0.6987, + "step": 59640 + }, + { + "epoch": 1.53, + "learning_rate": 1.0176804987561505e-06, + "loss": 0.6089, + "step": 59641 + }, + { + "epoch": 1.53, + "learning_rate": 1.0176528326207193e-06, + "loss": 0.6577, + "step": 59642 + }, + { + "epoch": 1.53, + "learning_rate": 1.0176251664717724e-06, + "loss": 0.6943, + "step": 59643 + }, + { + "epoch": 1.53, + "learning_rate": 1.0175975003093305e-06, + "loss": 0.5161, + "step": 59644 + }, + { + "epoch": 1.53, + "learning_rate": 1.0175698341334154e-06, + "loss": 0.5854, + "step": 59645 + }, + { + "epoch": 1.53, + "learning_rate": 1.0175421679440474e-06, + "loss": 0.7207, + "step": 59646 + }, + { + "epoch": 1.53, + "learning_rate": 1.0175145017412485e-06, + "loss": 0.6895, + "step": 59647 + }, + { + "epoch": 1.53, + "learning_rate": 1.0174868355250393e-06, + "loss": 0.667, + "step": 59648 + }, + { + "epoch": 1.53, + "learning_rate": 1.0174591692954415e-06, + "loss": 0.5386, + "step": 59649 + }, + { + "epoch": 1.53, + "learning_rate": 1.017431503052476e-06, + "loss": 0.8076, + "step": 59650 + }, + { + "epoch": 1.53, + "learning_rate": 1.0174038367961639e-06, + "loss": 0.6631, + "step": 59651 + }, + { + "epoch": 1.53, + "learning_rate": 1.0173761705265262e-06, + "loss": 0.6372, + "step": 59652 + }, + { + "epoch": 1.53, + "learning_rate": 1.0173485042435848e-06, + "loss": 0.7939, + "step": 59653 + }, + { + "epoch": 1.53, + "learning_rate": 1.01732083794736e-06, + "loss": 0.7422, + "step": 59654 + }, + { + "epoch": 1.53, + "learning_rate": 1.017293171637874e-06, + "loss": 0.5459, + "step": 59655 + }, + { + "epoch": 1.53, + "learning_rate": 1.0172655053151472e-06, + "loss": 0.5664, + "step": 59656 + }, + { + "epoch": 1.53, + "learning_rate": 1.0172378389792006e-06, + "loss": 0.6099, + "step": 59657 + }, + { + "epoch": 1.53, + "learning_rate": 1.0172101726300564e-06, + "loss": 0.6689, + "step": 59658 + }, + { + "epoch": 1.53, + "learning_rate": 1.0171825062677347e-06, + "loss": 0.6982, + "step": 59659 + }, + { + "epoch": 1.53, + "learning_rate": 1.0171548398922577e-06, + "loss": 0.5051, + "step": 59660 + }, + { + "epoch": 1.53, + "learning_rate": 1.0171271735036453e-06, + "loss": 0.8027, + "step": 59661 + }, + { + "epoch": 1.53, + "learning_rate": 1.0170995071019199e-06, + "loss": 0.5928, + "step": 59662 + }, + { + "epoch": 1.53, + "learning_rate": 1.017071840687102e-06, + "loss": 0.6025, + "step": 59663 + }, + { + "epoch": 1.53, + "learning_rate": 1.0170441742592132e-06, + "loss": 0.5801, + "step": 59664 + }, + { + "epoch": 1.53, + "learning_rate": 1.0170165078182743e-06, + "loss": 0.5859, + "step": 59665 + }, + { + "epoch": 1.53, + "learning_rate": 1.0169888413643066e-06, + "loss": 0.7354, + "step": 59666 + }, + { + "epoch": 1.53, + "learning_rate": 1.0169611748973312e-06, + "loss": 0.6982, + "step": 59667 + }, + { + "epoch": 1.53, + "learning_rate": 1.0169335084173695e-06, + "loss": 0.5535, + "step": 59668 + }, + { + "epoch": 1.53, + "learning_rate": 1.0169058419244425e-06, + "loss": 0.6245, + "step": 59669 + }, + { + "epoch": 1.53, + "learning_rate": 1.016878175418572e-06, + "loss": 0.7188, + "step": 59670 + }, + { + "epoch": 1.53, + "learning_rate": 1.016850508899778e-06, + "loss": 0.6426, + "step": 59671 + }, + { + "epoch": 1.53, + "learning_rate": 1.0168228423680828e-06, + "loss": 0.7007, + "step": 59672 + }, + { + "epoch": 1.53, + "learning_rate": 1.0167951758235067e-06, + "loss": 0.6851, + "step": 59673 + }, + { + "epoch": 1.53, + "learning_rate": 1.0167675092660716e-06, + "loss": 0.5918, + "step": 59674 + }, + { + "epoch": 1.53, + "learning_rate": 1.0167398426957984e-06, + "loss": 0.6758, + "step": 59675 + }, + { + "epoch": 1.53, + "learning_rate": 1.0167121761127082e-06, + "loss": 0.7256, + "step": 59676 + }, + { + "epoch": 1.53, + "learning_rate": 1.0166845095168224e-06, + "loss": 0.7734, + "step": 59677 + }, + { + "epoch": 1.53, + "learning_rate": 1.016656842908162e-06, + "loss": 0.582, + "step": 59678 + }, + { + "epoch": 1.53, + "learning_rate": 1.0166291762867479e-06, + "loss": 0.7295, + "step": 59679 + }, + { + "epoch": 1.53, + "learning_rate": 1.016601509652602e-06, + "loss": 0.6436, + "step": 59680 + }, + { + "epoch": 1.53, + "learning_rate": 1.0165738430057448e-06, + "loss": 0.5828, + "step": 59681 + }, + { + "epoch": 1.53, + "learning_rate": 1.0165461763461978e-06, + "loss": 0.7002, + "step": 59682 + }, + { + "epoch": 1.53, + "learning_rate": 1.0165185096739823e-06, + "loss": 0.6626, + "step": 59683 + }, + { + "epoch": 1.53, + "learning_rate": 1.0164908429891193e-06, + "loss": 0.6611, + "step": 59684 + }, + { + "epoch": 1.53, + "learning_rate": 1.0164631762916302e-06, + "loss": 0.5142, + "step": 59685 + }, + { + "epoch": 1.53, + "learning_rate": 1.0164355095815356e-06, + "loss": 0.6558, + "step": 59686 + }, + { + "epoch": 1.53, + "learning_rate": 1.0164078428588573e-06, + "loss": 0.5786, + "step": 59687 + }, + { + "epoch": 1.53, + "learning_rate": 1.0163801761236162e-06, + "loss": 0.8125, + "step": 59688 + }, + { + "epoch": 1.53, + "learning_rate": 1.0163525093758335e-06, + "loss": 0.4976, + "step": 59689 + }, + { + "epoch": 1.53, + "learning_rate": 1.0163248426155308e-06, + "loss": 0.6621, + "step": 59690 + }, + { + "epoch": 1.53, + "learning_rate": 1.0162971758427287e-06, + "loss": 0.6069, + "step": 59691 + }, + { + "epoch": 1.53, + "learning_rate": 1.0162695090574485e-06, + "loss": 0.6006, + "step": 59692 + }, + { + "epoch": 1.53, + "learning_rate": 1.0162418422597116e-06, + "loss": 0.5327, + "step": 59693 + }, + { + "epoch": 1.53, + "learning_rate": 1.0162141754495388e-06, + "loss": 0.5908, + "step": 59694 + }, + { + "epoch": 1.53, + "learning_rate": 1.016186508626952e-06, + "loss": 0.7129, + "step": 59695 + }, + { + "epoch": 1.53, + "learning_rate": 1.0161588417919718e-06, + "loss": 0.7119, + "step": 59696 + }, + { + "epoch": 1.53, + "learning_rate": 1.0161311749446193e-06, + "loss": 0.5703, + "step": 59697 + }, + { + "epoch": 1.53, + "learning_rate": 1.016103508084916e-06, + "loss": 0.7002, + "step": 59698 + }, + { + "epoch": 1.53, + "learning_rate": 1.0160758412128831e-06, + "loss": 0.5029, + "step": 59699 + }, + { + "epoch": 1.53, + "learning_rate": 1.0160481743285416e-06, + "loss": 0.5327, + "step": 59700 + }, + { + "epoch": 1.53, + "learning_rate": 1.0160205074319125e-06, + "loss": 0.6978, + "step": 59701 + }, + { + "epoch": 1.53, + "learning_rate": 1.0159928405230176e-06, + "loss": 0.5752, + "step": 59702 + }, + { + "epoch": 1.53, + "learning_rate": 1.0159651736018775e-06, + "loss": 0.9062, + "step": 59703 + }, + { + "epoch": 1.53, + "learning_rate": 1.0159375066685135e-06, + "loss": 0.7871, + "step": 59704 + }, + { + "epoch": 1.53, + "learning_rate": 1.0159098397229474e-06, + "loss": 0.6123, + "step": 59705 + }, + { + "epoch": 1.53, + "learning_rate": 1.0158821727651996e-06, + "loss": 0.6631, + "step": 59706 + }, + { + "epoch": 1.53, + "learning_rate": 1.0158545057952912e-06, + "loss": 0.583, + "step": 59707 + }, + { + "epoch": 1.53, + "learning_rate": 1.015826838813244e-06, + "loss": 0.7139, + "step": 59708 + }, + { + "epoch": 1.53, + "learning_rate": 1.0157991718190789e-06, + "loss": 0.6738, + "step": 59709 + }, + { + "epoch": 1.53, + "learning_rate": 1.0157715048128175e-06, + "loss": 0.3671, + "step": 59710 + }, + { + "epoch": 1.53, + "learning_rate": 1.01574383779448e-06, + "loss": 0.5496, + "step": 59711 + }, + { + "epoch": 1.53, + "learning_rate": 1.0157161707640884e-06, + "loss": 0.5559, + "step": 59712 + }, + { + "epoch": 1.53, + "learning_rate": 1.0156885037216636e-06, + "loss": 0.6553, + "step": 59713 + }, + { + "epoch": 1.53, + "learning_rate": 1.015660836667227e-06, + "loss": 0.8184, + "step": 59714 + }, + { + "epoch": 1.53, + "learning_rate": 1.0156331696007994e-06, + "loss": 0.6992, + "step": 59715 + }, + { + "epoch": 1.53, + "learning_rate": 1.0156055025224024e-06, + "loss": 0.7246, + "step": 59716 + }, + { + "epoch": 1.53, + "learning_rate": 1.0155778354320567e-06, + "loss": 0.6328, + "step": 59717 + }, + { + "epoch": 1.53, + "learning_rate": 1.015550168329784e-06, + "loss": 0.6309, + "step": 59718 + }, + { + "epoch": 1.53, + "learning_rate": 1.015522501215605e-06, + "loss": 0.7539, + "step": 59719 + }, + { + "epoch": 1.53, + "learning_rate": 1.0154948340895415e-06, + "loss": 0.7178, + "step": 59720 + }, + { + "epoch": 1.53, + "learning_rate": 1.0154671669516142e-06, + "loss": 0.7031, + "step": 59721 + }, + { + "epoch": 1.53, + "learning_rate": 1.0154394998018445e-06, + "loss": 0.6943, + "step": 59722 + }, + { + "epoch": 1.53, + "learning_rate": 1.0154118326402531e-06, + "loss": 0.3767, + "step": 59723 + }, + { + "epoch": 1.53, + "learning_rate": 1.0153841654668618e-06, + "loss": 0.6299, + "step": 59724 + }, + { + "epoch": 1.53, + "learning_rate": 1.0153564982816918e-06, + "loss": 0.6982, + "step": 59725 + }, + { + "epoch": 1.53, + "learning_rate": 1.0153288310847636e-06, + "loss": 0.7754, + "step": 59726 + }, + { + "epoch": 1.53, + "learning_rate": 1.015301163876099e-06, + "loss": 0.9277, + "step": 59727 + }, + { + "epoch": 1.53, + "learning_rate": 1.0152734966557187e-06, + "loss": 0.6104, + "step": 59728 + }, + { + "epoch": 1.53, + "learning_rate": 1.0152458294236447e-06, + "loss": 0.6729, + "step": 59729 + }, + { + "epoch": 1.53, + "learning_rate": 1.0152181621798976e-06, + "loss": 0.4128, + "step": 59730 + }, + { + "epoch": 1.53, + "learning_rate": 1.0151904949244984e-06, + "loss": 0.7397, + "step": 59731 + }, + { + "epoch": 1.53, + "learning_rate": 1.0151628276574686e-06, + "loss": 0.7109, + "step": 59732 + }, + { + "epoch": 1.53, + "learning_rate": 1.0151351603788294e-06, + "loss": 0.8369, + "step": 59733 + }, + { + "epoch": 1.53, + "learning_rate": 1.015107493088602e-06, + "loss": 0.6445, + "step": 59734 + }, + { + "epoch": 1.53, + "learning_rate": 1.0150798257868074e-06, + "loss": 0.5894, + "step": 59735 + }, + { + "epoch": 1.53, + "learning_rate": 1.0150521584734668e-06, + "loss": 0.6914, + "step": 59736 + }, + { + "epoch": 1.53, + "learning_rate": 1.0150244911486014e-06, + "loss": 0.6133, + "step": 59737 + }, + { + "epoch": 1.53, + "learning_rate": 1.0149968238122326e-06, + "loss": 0.562, + "step": 59738 + }, + { + "epoch": 1.53, + "learning_rate": 1.0149691564643813e-06, + "loss": 0.5601, + "step": 59739 + }, + { + "epoch": 1.53, + "learning_rate": 1.014941489105069e-06, + "loss": 0.7881, + "step": 59740 + }, + { + "epoch": 1.53, + "learning_rate": 1.0149138217343164e-06, + "loss": 0.6475, + "step": 59741 + }, + { + "epoch": 1.53, + "learning_rate": 1.0148861543521452e-06, + "loss": 0.5596, + "step": 59742 + }, + { + "epoch": 1.53, + "learning_rate": 1.0148584869585764e-06, + "loss": 0.8262, + "step": 59743 + }, + { + "epoch": 1.53, + "learning_rate": 1.0148308195536308e-06, + "loss": 0.6982, + "step": 59744 + }, + { + "epoch": 1.53, + "learning_rate": 1.01480315213733e-06, + "loss": 0.6211, + "step": 59745 + }, + { + "epoch": 1.53, + "learning_rate": 1.0147754847096955e-06, + "loss": 0.7422, + "step": 59746 + }, + { + "epoch": 1.53, + "learning_rate": 1.0147478172707474e-06, + "loss": 0.5957, + "step": 59747 + }, + { + "epoch": 1.53, + "learning_rate": 1.0147201498205083e-06, + "loss": 0.542, + "step": 59748 + }, + { + "epoch": 1.53, + "learning_rate": 1.0146924823589982e-06, + "loss": 0.8447, + "step": 59749 + }, + { + "epoch": 1.53, + "learning_rate": 1.0146648148862392e-06, + "loss": 0.561, + "step": 59750 + }, + { + "epoch": 1.53, + "learning_rate": 1.0146371474022517e-06, + "loss": 0.5747, + "step": 59751 + }, + { + "epoch": 1.53, + "learning_rate": 1.0146094799070573e-06, + "loss": 0.5459, + "step": 59752 + }, + { + "epoch": 1.53, + "learning_rate": 1.014581812400677e-06, + "loss": 0.7822, + "step": 59753 + }, + { + "epoch": 1.53, + "learning_rate": 1.014554144883132e-06, + "loss": 0.4893, + "step": 59754 + }, + { + "epoch": 1.53, + "learning_rate": 1.0145264773544437e-06, + "loss": 0.7236, + "step": 59755 + }, + { + "epoch": 1.53, + "learning_rate": 1.0144988098146333e-06, + "loss": 0.6313, + "step": 59756 + }, + { + "epoch": 1.53, + "learning_rate": 1.0144711422637213e-06, + "loss": 0.7207, + "step": 59757 + }, + { + "epoch": 1.53, + "learning_rate": 1.0144434747017299e-06, + "loss": 0.6455, + "step": 59758 + }, + { + "epoch": 1.53, + "learning_rate": 1.0144158071286794e-06, + "loss": 0.7314, + "step": 59759 + }, + { + "epoch": 1.53, + "learning_rate": 1.014388139544592e-06, + "loss": 0.7783, + "step": 59760 + }, + { + "epoch": 1.53, + "learning_rate": 1.0143604719494878e-06, + "loss": 0.4931, + "step": 59761 + }, + { + "epoch": 1.53, + "learning_rate": 1.0143328043433886e-06, + "loss": 0.7004, + "step": 59762 + }, + { + "epoch": 1.53, + "learning_rate": 1.014305136726315e-06, + "loss": 0.623, + "step": 59763 + }, + { + "epoch": 1.53, + "learning_rate": 1.0142774690982894e-06, + "loss": 0.79, + "step": 59764 + }, + { + "epoch": 1.53, + "learning_rate": 1.0142498014593317e-06, + "loss": 0.5896, + "step": 59765 + }, + { + "epoch": 1.53, + "learning_rate": 1.0142221338094637e-06, + "loss": 0.6836, + "step": 59766 + }, + { + "epoch": 1.53, + "learning_rate": 1.0141944661487064e-06, + "loss": 0.7207, + "step": 59767 + }, + { + "epoch": 1.53, + "learning_rate": 1.0141667984770812e-06, + "loss": 0.605, + "step": 59768 + }, + { + "epoch": 1.53, + "learning_rate": 1.0141391307946088e-06, + "loss": 0.7715, + "step": 59769 + }, + { + "epoch": 1.53, + "learning_rate": 1.014111463101311e-06, + "loss": 0.5693, + "step": 59770 + }, + { + "epoch": 1.53, + "learning_rate": 1.0140837953972088e-06, + "loss": 0.6846, + "step": 59771 + }, + { + "epoch": 1.53, + "learning_rate": 1.0140561276823229e-06, + "loss": 0.6929, + "step": 59772 + }, + { + "epoch": 1.53, + "learning_rate": 1.0140284599566752e-06, + "loss": 0.6206, + "step": 59773 + }, + { + "epoch": 1.53, + "learning_rate": 1.0140007922202862e-06, + "loss": 0.5635, + "step": 59774 + }, + { + "epoch": 1.53, + "learning_rate": 1.0139731244731779e-06, + "loss": 0.5752, + "step": 59775 + }, + { + "epoch": 1.53, + "learning_rate": 1.0139454567153707e-06, + "loss": 0.7634, + "step": 59776 + }, + { + "epoch": 1.53, + "learning_rate": 1.0139177889468864e-06, + "loss": 0.7559, + "step": 59777 + }, + { + "epoch": 1.53, + "learning_rate": 1.0138901211677456e-06, + "loss": 0.8848, + "step": 59778 + }, + { + "epoch": 1.53, + "learning_rate": 1.0138624533779698e-06, + "loss": 0.7979, + "step": 59779 + }, + { + "epoch": 1.53, + "learning_rate": 1.0138347855775801e-06, + "loss": 0.7012, + "step": 59780 + }, + { + "epoch": 1.53, + "learning_rate": 1.013807117766598e-06, + "loss": 0.8018, + "step": 59781 + }, + { + "epoch": 1.53, + "learning_rate": 1.0137794499450442e-06, + "loss": 0.6499, + "step": 59782 + }, + { + "epoch": 1.53, + "learning_rate": 1.0137517821129403e-06, + "loss": 0.626, + "step": 59783 + }, + { + "epoch": 1.53, + "learning_rate": 1.013724114270307e-06, + "loss": 0.5959, + "step": 59784 + }, + { + "epoch": 1.53, + "learning_rate": 1.0136964464171662e-06, + "loss": 0.7441, + "step": 59785 + }, + { + "epoch": 1.53, + "learning_rate": 1.0136687785535385e-06, + "loss": 0.6196, + "step": 59786 + }, + { + "epoch": 1.53, + "learning_rate": 1.0136411106794451e-06, + "loss": 0.6689, + "step": 59787 + }, + { + "epoch": 1.53, + "learning_rate": 1.0136134427949071e-06, + "loss": 0.6826, + "step": 59788 + }, + { + "epoch": 1.53, + "learning_rate": 1.0135857748999467e-06, + "loss": 0.7354, + "step": 59789 + }, + { + "epoch": 1.53, + "learning_rate": 1.0135581069945837e-06, + "loss": 0.46, + "step": 59790 + }, + { + "epoch": 1.53, + "learning_rate": 1.0135304390788398e-06, + "loss": 0.7354, + "step": 59791 + }, + { + "epoch": 1.53, + "learning_rate": 1.0135027711527367e-06, + "loss": 0.5822, + "step": 59792 + }, + { + "epoch": 1.53, + "learning_rate": 1.0134751032162946e-06, + "loss": 0.6748, + "step": 59793 + }, + { + "epoch": 1.53, + "learning_rate": 1.0134474352695358e-06, + "loss": 0.5498, + "step": 59794 + }, + { + "epoch": 1.53, + "learning_rate": 1.0134197673124805e-06, + "loss": 0.4709, + "step": 59795 + }, + { + "epoch": 1.53, + "learning_rate": 1.0133920993451506e-06, + "loss": 0.5996, + "step": 59796 + }, + { + "epoch": 1.53, + "learning_rate": 1.0133644313675667e-06, + "loss": 0.7041, + "step": 59797 + }, + { + "epoch": 1.53, + "learning_rate": 1.0133367633797504e-06, + "loss": 0.6528, + "step": 59798 + }, + { + "epoch": 1.53, + "learning_rate": 1.0133090953817228e-06, + "loss": 0.6738, + "step": 59799 + }, + { + "epoch": 1.53, + "learning_rate": 1.013281427373505e-06, + "loss": 0.5791, + "step": 59800 + }, + { + "epoch": 1.53, + "learning_rate": 1.0132537593551183e-06, + "loss": 0.6064, + "step": 59801 + }, + { + "epoch": 1.53, + "learning_rate": 1.0132260913265837e-06, + "loss": 0.7129, + "step": 59802 + }, + { + "epoch": 1.53, + "learning_rate": 1.0131984232879226e-06, + "loss": 0.6121, + "step": 59803 + }, + { + "epoch": 1.53, + "learning_rate": 1.013170755239156e-06, + "loss": 0.4087, + "step": 59804 + }, + { + "epoch": 1.53, + "learning_rate": 1.0131430871803052e-06, + "loss": 0.4971, + "step": 59805 + }, + { + "epoch": 1.53, + "learning_rate": 1.0131154191113914e-06, + "loss": 0.6846, + "step": 59806 + }, + { + "epoch": 1.53, + "learning_rate": 1.0130877510324355e-06, + "loss": 0.7686, + "step": 59807 + }, + { + "epoch": 1.53, + "learning_rate": 1.013060082943459e-06, + "loss": 0.6592, + "step": 59808 + }, + { + "epoch": 1.53, + "learning_rate": 1.0130324148444829e-06, + "loss": 0.5713, + "step": 59809 + }, + { + "epoch": 1.53, + "learning_rate": 1.0130047467355286e-06, + "loss": 0.7764, + "step": 59810 + }, + { + "epoch": 1.53, + "learning_rate": 1.0129770786166173e-06, + "loss": 0.542, + "step": 59811 + }, + { + "epoch": 1.53, + "learning_rate": 1.01294941048777e-06, + "loss": 0.5562, + "step": 59812 + }, + { + "epoch": 1.53, + "learning_rate": 1.0129217423490078e-06, + "loss": 0.4797, + "step": 59813 + }, + { + "epoch": 1.53, + "learning_rate": 1.012894074200352e-06, + "loss": 0.8652, + "step": 59814 + }, + { + "epoch": 1.53, + "learning_rate": 1.012866406041824e-06, + "loss": 0.6631, + "step": 59815 + }, + { + "epoch": 1.53, + "learning_rate": 1.0128387378734444e-06, + "loss": 0.7598, + "step": 59816 + }, + { + "epoch": 1.53, + "learning_rate": 1.0128110696952352e-06, + "loss": 0.585, + "step": 59817 + }, + { + "epoch": 1.53, + "learning_rate": 1.0127834015072168e-06, + "loss": 0.5522, + "step": 59818 + }, + { + "epoch": 1.53, + "learning_rate": 1.012755733309411e-06, + "loss": 0.4041, + "step": 59819 + }, + { + "epoch": 1.53, + "learning_rate": 1.0127280651018387e-06, + "loss": 0.5005, + "step": 59820 + }, + { + "epoch": 1.53, + "learning_rate": 1.0127003968845212e-06, + "loss": 0.5854, + "step": 59821 + }, + { + "epoch": 1.53, + "learning_rate": 1.0126727286574793e-06, + "loss": 0.6631, + "step": 59822 + }, + { + "epoch": 1.53, + "learning_rate": 1.0126450604207346e-06, + "loss": 0.7656, + "step": 59823 + }, + { + "epoch": 1.53, + "learning_rate": 1.012617392174308e-06, + "loss": 0.4229, + "step": 59824 + }, + { + "epoch": 1.53, + "learning_rate": 1.0125897239182213e-06, + "loss": 0.6963, + "step": 59825 + }, + { + "epoch": 1.53, + "learning_rate": 1.0125620556524948e-06, + "loss": 0.8701, + "step": 59826 + }, + { + "epoch": 1.53, + "learning_rate": 1.01253438737715e-06, + "loss": 0.4637, + "step": 59827 + }, + { + "epoch": 1.53, + "learning_rate": 1.0125067190922086e-06, + "loss": 0.7129, + "step": 59828 + }, + { + "epoch": 1.53, + "learning_rate": 1.0124790507976912e-06, + "loss": 0.8867, + "step": 59829 + }, + { + "epoch": 1.53, + "learning_rate": 1.0124513824936193e-06, + "loss": 0.5278, + "step": 59830 + }, + { + "epoch": 1.53, + "learning_rate": 1.0124237141800139e-06, + "loss": 0.7588, + "step": 59831 + }, + { + "epoch": 1.53, + "learning_rate": 1.012396045856896e-06, + "loss": 0.5566, + "step": 59832 + }, + { + "epoch": 1.53, + "learning_rate": 1.0123683775242873e-06, + "loss": 0.6914, + "step": 59833 + }, + { + "epoch": 1.53, + "learning_rate": 1.0123407091822084e-06, + "loss": 0.6187, + "step": 59834 + }, + { + "epoch": 1.53, + "learning_rate": 1.012313040830681e-06, + "loss": 0.71, + "step": 59835 + }, + { + "epoch": 1.53, + "learning_rate": 1.0122853724697263e-06, + "loss": 0.5798, + "step": 59836 + }, + { + "epoch": 1.53, + "learning_rate": 1.0122577040993647e-06, + "loss": 0.4875, + "step": 59837 + }, + { + "epoch": 1.53, + "learning_rate": 1.0122300357196183e-06, + "loss": 0.8237, + "step": 59838 + }, + { + "epoch": 1.53, + "learning_rate": 1.012202367330508e-06, + "loss": 0.707, + "step": 59839 + }, + { + "epoch": 1.53, + "learning_rate": 1.0121746989320547e-06, + "loss": 0.6797, + "step": 59840 + }, + { + "epoch": 1.53, + "learning_rate": 1.0121470305242799e-06, + "loss": 0.5013, + "step": 59841 + }, + { + "epoch": 1.53, + "learning_rate": 1.0121193621072047e-06, + "loss": 0.574, + "step": 59842 + }, + { + "epoch": 1.53, + "learning_rate": 1.0120916936808498e-06, + "loss": 0.8086, + "step": 59843 + }, + { + "epoch": 1.53, + "learning_rate": 1.0120640252452377e-06, + "loss": 0.7354, + "step": 59844 + }, + { + "epoch": 1.53, + "learning_rate": 1.0120363568003883e-06, + "loss": 0.5576, + "step": 59845 + }, + { + "epoch": 1.53, + "learning_rate": 1.012008688346323e-06, + "loss": 0.5605, + "step": 59846 + }, + { + "epoch": 1.53, + "learning_rate": 1.0119810198830635e-06, + "loss": 0.7563, + "step": 59847 + }, + { + "epoch": 1.53, + "learning_rate": 1.0119533514106304e-06, + "loss": 0.6318, + "step": 59848 + }, + { + "epoch": 1.53, + "learning_rate": 1.0119256829290454e-06, + "loss": 0.5859, + "step": 59849 + }, + { + "epoch": 1.53, + "learning_rate": 1.0118980144383296e-06, + "loss": 0.6094, + "step": 59850 + }, + { + "epoch": 1.53, + "learning_rate": 1.0118703459385037e-06, + "loss": 0.6797, + "step": 59851 + }, + { + "epoch": 1.53, + "learning_rate": 1.0118426774295894e-06, + "loss": 0.5565, + "step": 59852 + }, + { + "epoch": 1.53, + "learning_rate": 1.0118150089116076e-06, + "loss": 0.5762, + "step": 59853 + }, + { + "epoch": 1.53, + "learning_rate": 1.0117873403845797e-06, + "loss": 0.6685, + "step": 59854 + }, + { + "epoch": 1.53, + "learning_rate": 1.0117596718485268e-06, + "loss": 0.71, + "step": 59855 + }, + { + "epoch": 1.53, + "learning_rate": 1.0117320033034698e-06, + "loss": 0.793, + "step": 59856 + }, + { + "epoch": 1.53, + "learning_rate": 1.0117043347494304e-06, + "loss": 0.6787, + "step": 59857 + }, + { + "epoch": 1.53, + "learning_rate": 1.0116766661864295e-06, + "loss": 0.7119, + "step": 59858 + }, + { + "epoch": 1.53, + "learning_rate": 1.0116489976144885e-06, + "loss": 0.5421, + "step": 59859 + }, + { + "epoch": 1.53, + "learning_rate": 1.011621329033628e-06, + "loss": 0.7754, + "step": 59860 + }, + { + "epoch": 1.53, + "learning_rate": 1.0115936604438697e-06, + "loss": 0.627, + "step": 59861 + }, + { + "epoch": 1.53, + "learning_rate": 1.0115659918452347e-06, + "loss": 0.6797, + "step": 59862 + }, + { + "epoch": 1.53, + "learning_rate": 1.0115383232377441e-06, + "loss": 0.6924, + "step": 59863 + }, + { + "epoch": 1.53, + "learning_rate": 1.0115106546214194e-06, + "loss": 0.7217, + "step": 59864 + }, + { + "epoch": 1.53, + "learning_rate": 1.0114829859962814e-06, + "loss": 0.4402, + "step": 59865 + }, + { + "epoch": 1.53, + "learning_rate": 1.0114553173623512e-06, + "loss": 0.5667, + "step": 59866 + }, + { + "epoch": 1.53, + "learning_rate": 1.0114276487196505e-06, + "loss": 0.3584, + "step": 59867 + }, + { + "epoch": 1.53, + "learning_rate": 1.0113999800681998e-06, + "loss": 0.554, + "step": 59868 + }, + { + "epoch": 1.53, + "learning_rate": 1.011372311408021e-06, + "loss": 0.7383, + "step": 59869 + }, + { + "epoch": 1.53, + "learning_rate": 1.0113446427391348e-06, + "loss": 0.8745, + "step": 59870 + }, + { + "epoch": 1.53, + "learning_rate": 1.0113169740615625e-06, + "loss": 0.5791, + "step": 59871 + }, + { + "epoch": 1.53, + "learning_rate": 1.0112893053753254e-06, + "loss": 0.748, + "step": 59872 + }, + { + "epoch": 1.53, + "learning_rate": 1.0112616366804446e-06, + "loss": 0.6719, + "step": 59873 + }, + { + "epoch": 1.53, + "learning_rate": 1.0112339679769414e-06, + "loss": 0.8779, + "step": 59874 + }, + { + "epoch": 1.53, + "learning_rate": 1.0112062992648365e-06, + "loss": 0.6069, + "step": 59875 + }, + { + "epoch": 1.53, + "learning_rate": 1.0111786305441517e-06, + "loss": 0.5693, + "step": 59876 + }, + { + "epoch": 1.53, + "learning_rate": 1.0111509618149078e-06, + "loss": 0.7559, + "step": 59877 + }, + { + "epoch": 1.53, + "learning_rate": 1.011123293077126e-06, + "loss": 0.6758, + "step": 59878 + }, + { + "epoch": 1.53, + "learning_rate": 1.011095624330828e-06, + "loss": 0.5947, + "step": 59879 + }, + { + "epoch": 1.53, + "learning_rate": 1.0110679555760343e-06, + "loss": 0.5295, + "step": 59880 + }, + { + "epoch": 1.53, + "learning_rate": 1.0110402868127666e-06, + "loss": 0.6553, + "step": 59881 + }, + { + "epoch": 1.53, + "learning_rate": 1.0110126180410457e-06, + "loss": 0.6274, + "step": 59882 + }, + { + "epoch": 1.53, + "learning_rate": 1.0109849492608928e-06, + "loss": 0.7808, + "step": 59883 + }, + { + "epoch": 1.53, + "learning_rate": 1.0109572804723297e-06, + "loss": 0.5605, + "step": 59884 + }, + { + "epoch": 1.53, + "learning_rate": 1.0109296116753767e-06, + "loss": 0.7705, + "step": 59885 + }, + { + "epoch": 1.53, + "learning_rate": 1.0109019428700555e-06, + "loss": 0.5918, + "step": 59886 + }, + { + "epoch": 1.53, + "learning_rate": 1.0108742740563872e-06, + "loss": 0.498, + "step": 59887 + }, + { + "epoch": 1.53, + "learning_rate": 1.0108466052343932e-06, + "loss": 0.6582, + "step": 59888 + }, + { + "epoch": 1.53, + "learning_rate": 1.0108189364040942e-06, + "loss": 0.7773, + "step": 59889 + }, + { + "epoch": 1.54, + "learning_rate": 1.0107912675655117e-06, + "loss": 0.7637, + "step": 59890 + }, + { + "epoch": 1.54, + "learning_rate": 1.0107635987186666e-06, + "loss": 0.6602, + "step": 59891 + }, + { + "epoch": 1.54, + "learning_rate": 1.0107359298635807e-06, + "loss": 0.6445, + "step": 59892 + }, + { + "epoch": 1.54, + "learning_rate": 1.0107082610002744e-06, + "loss": 0.7793, + "step": 59893 + }, + { + "epoch": 1.54, + "learning_rate": 1.0106805921287698e-06, + "loss": 0.5635, + "step": 59894 + }, + { + "epoch": 1.54, + "learning_rate": 1.0106529232490871e-06, + "loss": 0.7744, + "step": 59895 + }, + { + "epoch": 1.54, + "learning_rate": 1.0106252543612482e-06, + "loss": 0.6045, + "step": 59896 + }, + { + "epoch": 1.54, + "learning_rate": 1.0105975854652736e-06, + "loss": 0.6572, + "step": 59897 + }, + { + "epoch": 1.54, + "learning_rate": 1.0105699165611854e-06, + "loss": 0.6309, + "step": 59898 + }, + { + "epoch": 1.54, + "learning_rate": 1.0105422476490042e-06, + "loss": 0.8232, + "step": 59899 + }, + { + "epoch": 1.54, + "learning_rate": 1.010514578728751e-06, + "loss": 0.7803, + "step": 59900 + }, + { + "epoch": 1.54, + "learning_rate": 1.0104869098004476e-06, + "loss": 0.9287, + "step": 59901 + }, + { + "epoch": 1.54, + "learning_rate": 1.010459240864115e-06, + "loss": 0.6147, + "step": 59902 + }, + { + "epoch": 1.54, + "learning_rate": 1.0104315719197736e-06, + "loss": 0.668, + "step": 59903 + }, + { + "epoch": 1.54, + "learning_rate": 1.0104039029674455e-06, + "loss": 0.6719, + "step": 59904 + }, + { + "epoch": 1.54, + "learning_rate": 1.010376234007152e-06, + "loss": 0.5923, + "step": 59905 + }, + { + "epoch": 1.54, + "learning_rate": 1.0103485650389135e-06, + "loss": 0.6104, + "step": 59906 + }, + { + "epoch": 1.54, + "learning_rate": 1.0103208960627517e-06, + "loss": 0.4648, + "step": 59907 + }, + { + "epoch": 1.54, + "learning_rate": 1.0102932270786874e-06, + "loss": 0.5532, + "step": 59908 + }, + { + "epoch": 1.54, + "learning_rate": 1.0102655580867428e-06, + "loss": 0.792, + "step": 59909 + }, + { + "epoch": 1.54, + "learning_rate": 1.0102378890869375e-06, + "loss": 0.6943, + "step": 59910 + }, + { + "epoch": 1.54, + "learning_rate": 1.0102102200792938e-06, + "loss": 0.7305, + "step": 59911 + }, + { + "epoch": 1.54, + "learning_rate": 1.0101825510638326e-06, + "loss": 0.3728, + "step": 59912 + }, + { + "epoch": 1.54, + "learning_rate": 1.0101548820405753e-06, + "loss": 0.4618, + "step": 59913 + }, + { + "epoch": 1.54, + "learning_rate": 1.0101272130095429e-06, + "loss": 0.7852, + "step": 59914 + }, + { + "epoch": 1.54, + "learning_rate": 1.0100995439707565e-06, + "loss": 0.6309, + "step": 59915 + }, + { + "epoch": 1.54, + "learning_rate": 1.010071874924237e-06, + "loss": 0.5938, + "step": 59916 + }, + { + "epoch": 1.54, + "learning_rate": 1.0100442058700062e-06, + "loss": 0.6631, + "step": 59917 + }, + { + "epoch": 1.54, + "learning_rate": 1.0100165368080848e-06, + "loss": 0.502, + "step": 59918 + }, + { + "epoch": 1.54, + "learning_rate": 1.0099888677384944e-06, + "loss": 0.8232, + "step": 59919 + }, + { + "epoch": 1.54, + "learning_rate": 1.0099611986612559e-06, + "loss": 0.6885, + "step": 59920 + }, + { + "epoch": 1.54, + "learning_rate": 1.009933529576391e-06, + "loss": 0.4452, + "step": 59921 + }, + { + "epoch": 1.54, + "learning_rate": 1.0099058604839196e-06, + "loss": 0.5957, + "step": 59922 + }, + { + "epoch": 1.54, + "learning_rate": 1.0098781913838646e-06, + "loss": 0.7383, + "step": 59923 + }, + { + "epoch": 1.54, + "learning_rate": 1.009850522276246e-06, + "loss": 0.3878, + "step": 59924 + }, + { + "epoch": 1.54, + "learning_rate": 1.0098228531610848e-06, + "loss": 0.7441, + "step": 59925 + }, + { + "epoch": 1.54, + "learning_rate": 1.0097951840384034e-06, + "loss": 0.5552, + "step": 59926 + }, + { + "epoch": 1.54, + "learning_rate": 1.009767514908222e-06, + "loss": 0.79, + "step": 59927 + }, + { + "epoch": 1.54, + "learning_rate": 1.009739845770562e-06, + "loss": 0.7598, + "step": 59928 + }, + { + "epoch": 1.54, + "learning_rate": 1.0097121766254449e-06, + "loss": 0.6198, + "step": 59929 + }, + { + "epoch": 1.54, + "learning_rate": 1.0096845074728912e-06, + "loss": 0.7686, + "step": 59930 + }, + { + "epoch": 1.54, + "learning_rate": 1.0096568383129227e-06, + "loss": 0.6787, + "step": 59931 + }, + { + "epoch": 1.54, + "learning_rate": 1.0096291691455606e-06, + "loss": 0.5408, + "step": 59932 + }, + { + "epoch": 1.54, + "learning_rate": 1.0096014999708256e-06, + "loss": 0.6348, + "step": 59933 + }, + { + "epoch": 1.54, + "learning_rate": 1.0095738307887397e-06, + "loss": 0.6758, + "step": 59934 + }, + { + "epoch": 1.54, + "learning_rate": 1.0095461615993231e-06, + "loss": 0.6484, + "step": 59935 + }, + { + "epoch": 1.54, + "learning_rate": 1.0095184924025975e-06, + "loss": 0.7979, + "step": 59936 + }, + { + "epoch": 1.54, + "learning_rate": 1.009490823198584e-06, + "loss": 0.5439, + "step": 59937 + }, + { + "epoch": 1.54, + "learning_rate": 1.009463153987304e-06, + "loss": 0.5127, + "step": 59938 + }, + { + "epoch": 1.54, + "learning_rate": 1.0094354847687783e-06, + "loss": 0.5957, + "step": 59939 + }, + { + "epoch": 1.54, + "learning_rate": 1.0094078155430285e-06, + "loss": 0.6279, + "step": 59940 + }, + { + "epoch": 1.54, + "learning_rate": 1.0093801463100753e-06, + "loss": 0.751, + "step": 59941 + }, + { + "epoch": 1.54, + "learning_rate": 1.0093524770699403e-06, + "loss": 0.6191, + "step": 59942 + }, + { + "epoch": 1.54, + "learning_rate": 1.0093248078226444e-06, + "loss": 0.6719, + "step": 59943 + }, + { + "epoch": 1.54, + "learning_rate": 1.009297138568209e-06, + "loss": 0.6973, + "step": 59944 + }, + { + "epoch": 1.54, + "learning_rate": 1.0092694693066555e-06, + "loss": 0.6719, + "step": 59945 + }, + { + "epoch": 1.54, + "learning_rate": 1.0092418000380043e-06, + "loss": 0.5933, + "step": 59946 + }, + { + "epoch": 1.54, + "learning_rate": 1.0092141307622774e-06, + "loss": 0.7427, + "step": 59947 + }, + { + "epoch": 1.54, + "learning_rate": 1.0091864614794955e-06, + "loss": 0.7363, + "step": 59948 + }, + { + "epoch": 1.54, + "learning_rate": 1.0091587921896804e-06, + "loss": 0.6807, + "step": 59949 + }, + { + "epoch": 1.54, + "learning_rate": 1.0091311228928522e-06, + "loss": 0.6475, + "step": 59950 + }, + { + "epoch": 1.54, + "learning_rate": 1.009103453589033e-06, + "loss": 0.6187, + "step": 59951 + }, + { + "epoch": 1.54, + "learning_rate": 1.0090757842782436e-06, + "loss": 0.5903, + "step": 59952 + }, + { + "epoch": 1.54, + "learning_rate": 1.0090481149605055e-06, + "loss": 0.4103, + "step": 59953 + }, + { + "epoch": 1.54, + "learning_rate": 1.0090204456358396e-06, + "loss": 0.5996, + "step": 59954 + }, + { + "epoch": 1.54, + "learning_rate": 1.0089927763042672e-06, + "loss": 0.7881, + "step": 59955 + }, + { + "epoch": 1.54, + "learning_rate": 1.0089651069658093e-06, + "loss": 0.748, + "step": 59956 + }, + { + "epoch": 1.54, + "learning_rate": 1.0089374376204872e-06, + "loss": 0.5623, + "step": 59957 + }, + { + "epoch": 1.54, + "learning_rate": 1.008909768268322e-06, + "loss": 0.6899, + "step": 59958 + }, + { + "epoch": 1.54, + "learning_rate": 1.0088820989093357e-06, + "loss": 0.8389, + "step": 59959 + }, + { + "epoch": 1.54, + "learning_rate": 1.008854429543548e-06, + "loss": 0.5933, + "step": 59960 + }, + { + "epoch": 1.54, + "learning_rate": 1.0088267601709813e-06, + "loss": 0.6293, + "step": 59961 + }, + { + "epoch": 1.54, + "learning_rate": 1.008799090791656e-06, + "loss": 0.7607, + "step": 59962 + }, + { + "epoch": 1.54, + "learning_rate": 1.008771421405594e-06, + "loss": 0.5068, + "step": 59963 + }, + { + "epoch": 1.54, + "learning_rate": 1.008743752012816e-06, + "loss": 0.6787, + "step": 59964 + }, + { + "epoch": 1.54, + "learning_rate": 1.0087160826133434e-06, + "loss": 0.5649, + "step": 59965 + }, + { + "epoch": 1.54, + "learning_rate": 1.0086884132071972e-06, + "loss": 0.6338, + "step": 59966 + }, + { + "epoch": 1.54, + "learning_rate": 1.0086607437943985e-06, + "loss": 0.7261, + "step": 59967 + }, + { + "epoch": 1.54, + "learning_rate": 1.0086330743749687e-06, + "loss": 0.5742, + "step": 59968 + }, + { + "epoch": 1.54, + "learning_rate": 1.0086054049489292e-06, + "loss": 0.6279, + "step": 59969 + }, + { + "epoch": 1.54, + "learning_rate": 1.008577735516301e-06, + "loss": 0.5205, + "step": 59970 + }, + { + "epoch": 1.54, + "learning_rate": 1.0085500660771049e-06, + "loss": 0.5962, + "step": 59971 + }, + { + "epoch": 1.54, + "learning_rate": 1.0085223966313626e-06, + "loss": 0.7822, + "step": 59972 + }, + { + "epoch": 1.54, + "learning_rate": 1.008494727179095e-06, + "loss": 0.8594, + "step": 59973 + }, + { + "epoch": 1.54, + "learning_rate": 1.0084670577203236e-06, + "loss": 0.7695, + "step": 59974 + }, + { + "epoch": 1.54, + "learning_rate": 1.008439388255069e-06, + "loss": 0.6782, + "step": 59975 + }, + { + "epoch": 1.54, + "learning_rate": 1.008411718783353e-06, + "loss": 0.5991, + "step": 59976 + }, + { + "epoch": 1.54, + "learning_rate": 1.0083840493051964e-06, + "loss": 0.6533, + "step": 59977 + }, + { + "epoch": 1.54, + "learning_rate": 1.0083563798206206e-06, + "loss": 0.6826, + "step": 59978 + }, + { + "epoch": 1.54, + "learning_rate": 1.0083287103296467e-06, + "loss": 0.7334, + "step": 59979 + }, + { + "epoch": 1.54, + "learning_rate": 1.008301040832296e-06, + "loss": 0.6279, + "step": 59980 + }, + { + "epoch": 1.54, + "learning_rate": 1.0082733713285893e-06, + "loss": 0.6904, + "step": 59981 + }, + { + "epoch": 1.54, + "learning_rate": 1.0082457018185483e-06, + "loss": 0.5288, + "step": 59982 + }, + { + "epoch": 1.54, + "learning_rate": 1.0082180323021937e-06, + "loss": 0.5874, + "step": 59983 + }, + { + "epoch": 1.54, + "learning_rate": 1.0081903627795474e-06, + "loss": 0.6235, + "step": 59984 + }, + { + "epoch": 1.54, + "learning_rate": 1.0081626932506297e-06, + "loss": 0.5815, + "step": 59985 + }, + { + "epoch": 1.54, + "learning_rate": 1.0081350237154625e-06, + "loss": 0.7266, + "step": 59986 + }, + { + "epoch": 1.54, + "learning_rate": 1.0081073541740663e-06, + "loss": 0.5562, + "step": 59987 + }, + { + "epoch": 1.54, + "learning_rate": 1.008079684626463e-06, + "loss": 0.6802, + "step": 59988 + }, + { + "epoch": 1.54, + "learning_rate": 1.0080520150726731e-06, + "loss": 0.6147, + "step": 59989 + }, + { + "epoch": 1.54, + "learning_rate": 1.0080243455127184e-06, + "loss": 0.6729, + "step": 59990 + }, + { + "epoch": 1.54, + "learning_rate": 1.00799667594662e-06, + "loss": 0.625, + "step": 59991 + }, + { + "epoch": 1.54, + "learning_rate": 1.0079690063743984e-06, + "loss": 0.5186, + "step": 59992 + }, + { + "epoch": 1.54, + "learning_rate": 1.0079413367960756e-06, + "loss": 0.5469, + "step": 59993 + }, + { + "epoch": 1.54, + "learning_rate": 1.0079136672116725e-06, + "loss": 0.5332, + "step": 59994 + }, + { + "epoch": 1.54, + "learning_rate": 1.0078859976212106e-06, + "loss": 0.6523, + "step": 59995 + }, + { + "epoch": 1.54, + "learning_rate": 1.0078583280247102e-06, + "loss": 0.5415, + "step": 59996 + }, + { + "epoch": 1.54, + "learning_rate": 1.0078306584221934e-06, + "loss": 0.4824, + "step": 59997 + }, + { + "epoch": 1.54, + "learning_rate": 1.0078029888136808e-06, + "loss": 0.7109, + "step": 59998 + }, + { + "epoch": 1.54, + "learning_rate": 1.007775319199194e-06, + "loss": 0.6172, + "step": 59999 + }, + { + "epoch": 1.54, + "learning_rate": 1.0077476495787537e-06, + "loss": 0.7861, + "step": 60000 + }, + { + "epoch": 1.54, + "learning_rate": 1.0077199799523817e-06, + "loss": 0.6147, + "step": 60001 + }, + { + "epoch": 1.54, + "learning_rate": 1.0076923103200988e-06, + "loss": 0.6504, + "step": 60002 + }, + { + "epoch": 1.54, + "learning_rate": 1.007664640681926e-06, + "loss": 0.6758, + "step": 60003 + }, + { + "epoch": 1.54, + "learning_rate": 1.007636971037885e-06, + "loss": 0.646, + "step": 60004 + }, + { + "epoch": 1.54, + "learning_rate": 1.0076093013879966e-06, + "loss": 0.5085, + "step": 60005 + }, + { + "epoch": 1.54, + "learning_rate": 1.0075816317322823e-06, + "loss": 0.6406, + "step": 60006 + }, + { + "epoch": 1.54, + "learning_rate": 1.007553962070763e-06, + "loss": 0.5791, + "step": 60007 + }, + { + "epoch": 1.54, + "learning_rate": 1.0075262924034598e-06, + "loss": 0.5474, + "step": 60008 + }, + { + "epoch": 1.54, + "learning_rate": 1.0074986227303941e-06, + "loss": 0.5283, + "step": 60009 + }, + { + "epoch": 1.54, + "learning_rate": 1.0074709530515873e-06, + "loss": 0.5752, + "step": 60010 + }, + { + "epoch": 1.54, + "learning_rate": 1.0074432833670603e-06, + "loss": 0.7285, + "step": 60011 + }, + { + "epoch": 1.54, + "learning_rate": 1.0074156136768338e-06, + "loss": 0.6914, + "step": 60012 + }, + { + "epoch": 1.54, + "learning_rate": 1.00738794398093e-06, + "loss": 0.7441, + "step": 60013 + }, + { + "epoch": 1.54, + "learning_rate": 1.0073602742793697e-06, + "loss": 0.6746, + "step": 60014 + }, + { + "epoch": 1.54, + "learning_rate": 1.0073326045721735e-06, + "loss": 0.5845, + "step": 60015 + }, + { + "epoch": 1.54, + "learning_rate": 1.0073049348593634e-06, + "loss": 0.5962, + "step": 60016 + }, + { + "epoch": 1.54, + "learning_rate": 1.0072772651409601e-06, + "loss": 0.6367, + "step": 60017 + }, + { + "epoch": 1.54, + "learning_rate": 1.007249595416985e-06, + "loss": 0.4041, + "step": 60018 + }, + { + "epoch": 1.54, + "learning_rate": 1.0072219256874594e-06, + "loss": 0.6875, + "step": 60019 + }, + { + "epoch": 1.54, + "learning_rate": 1.0071942559524044e-06, + "loss": 0.5161, + "step": 60020 + }, + { + "epoch": 1.54, + "learning_rate": 1.0071665862118406e-06, + "loss": 0.7578, + "step": 60021 + }, + { + "epoch": 1.54, + "learning_rate": 1.0071389164657898e-06, + "loss": 0.6685, + "step": 60022 + }, + { + "epoch": 1.54, + "learning_rate": 1.007111246714273e-06, + "loss": 0.7705, + "step": 60023 + }, + { + "epoch": 1.54, + "learning_rate": 1.0070835769573118e-06, + "loss": 0.5806, + "step": 60024 + }, + { + "epoch": 1.54, + "learning_rate": 1.0070559071949267e-06, + "loss": 0.5693, + "step": 60025 + }, + { + "epoch": 1.54, + "learning_rate": 1.0070282374271395e-06, + "loss": 0.6201, + "step": 60026 + }, + { + "epoch": 1.54, + "learning_rate": 1.0070005676539707e-06, + "loss": 0.8076, + "step": 60027 + }, + { + "epoch": 1.54, + "learning_rate": 1.0069728978754423e-06, + "loss": 0.5425, + "step": 60028 + }, + { + "epoch": 1.54, + "learning_rate": 1.006945228091575e-06, + "loss": 0.7354, + "step": 60029 + }, + { + "epoch": 1.54, + "learning_rate": 1.0069175583023901e-06, + "loss": 0.6104, + "step": 60030 + }, + { + "epoch": 1.54, + "learning_rate": 1.0068898885079085e-06, + "loss": 0.5293, + "step": 60031 + }, + { + "epoch": 1.54, + "learning_rate": 1.0068622187081517e-06, + "loss": 0.5615, + "step": 60032 + }, + { + "epoch": 1.54, + "learning_rate": 1.0068345489031406e-06, + "loss": 0.5, + "step": 60033 + }, + { + "epoch": 1.54, + "learning_rate": 1.006806879092897e-06, + "loss": 0.5669, + "step": 60034 + }, + { + "epoch": 1.54, + "learning_rate": 1.0067792092774417e-06, + "loss": 0.6621, + "step": 60035 + }, + { + "epoch": 1.54, + "learning_rate": 1.0067515394567957e-06, + "loss": 0.6626, + "step": 60036 + }, + { + "epoch": 1.54, + "learning_rate": 1.0067238696309804e-06, + "loss": 0.7451, + "step": 60037 + }, + { + "epoch": 1.54, + "learning_rate": 1.006696199800017e-06, + "loss": 0.6069, + "step": 60038 + }, + { + "epoch": 1.54, + "learning_rate": 1.0066685299639264e-06, + "loss": 0.4805, + "step": 60039 + }, + { + "epoch": 1.54, + "learning_rate": 1.00664086012273e-06, + "loss": 0.7539, + "step": 60040 + }, + { + "epoch": 1.54, + "learning_rate": 1.0066131902764491e-06, + "loss": 0.7568, + "step": 60041 + }, + { + "epoch": 1.54, + "learning_rate": 1.0065855204251049e-06, + "loss": 0.5173, + "step": 60042 + }, + { + "epoch": 1.54, + "learning_rate": 1.0065578505687185e-06, + "loss": 0.6086, + "step": 60043 + }, + { + "epoch": 1.54, + "learning_rate": 1.006530180707311e-06, + "loss": 0.473, + "step": 60044 + }, + { + "epoch": 1.54, + "learning_rate": 1.0065025108409038e-06, + "loss": 0.6768, + "step": 60045 + }, + { + "epoch": 1.54, + "learning_rate": 1.0064748409695173e-06, + "loss": 0.605, + "step": 60046 + }, + { + "epoch": 1.54, + "learning_rate": 1.006447171093174e-06, + "loss": 0.627, + "step": 60047 + }, + { + "epoch": 1.54, + "learning_rate": 1.0064195012118939e-06, + "loss": 0.4822, + "step": 60048 + }, + { + "epoch": 1.54, + "learning_rate": 1.0063918313256991e-06, + "loss": 0.4761, + "step": 60049 + }, + { + "epoch": 1.54, + "learning_rate": 1.0063641614346102e-06, + "loss": 0.6006, + "step": 60050 + }, + { + "epoch": 1.54, + "learning_rate": 1.0063364915386485e-06, + "loss": 0.6597, + "step": 60051 + }, + { + "epoch": 1.54, + "learning_rate": 1.0063088216378352e-06, + "loss": 0.7993, + "step": 60052 + }, + { + "epoch": 1.54, + "learning_rate": 1.0062811517321917e-06, + "loss": 0.4128, + "step": 60053 + }, + { + "epoch": 1.54, + "learning_rate": 1.006253481821739e-06, + "loss": 0.5306, + "step": 60054 + }, + { + "epoch": 1.54, + "learning_rate": 1.0062258119064984e-06, + "loss": 0.6035, + "step": 60055 + }, + { + "epoch": 1.54, + "learning_rate": 1.0061981419864905e-06, + "loss": 0.6465, + "step": 60056 + }, + { + "epoch": 1.54, + "learning_rate": 1.0061704720617375e-06, + "loss": 0.6089, + "step": 60057 + }, + { + "epoch": 1.54, + "learning_rate": 1.0061428021322596e-06, + "loss": 0.6396, + "step": 60058 + }, + { + "epoch": 1.54, + "learning_rate": 1.0061151321980787e-06, + "loss": 0.6079, + "step": 60059 + }, + { + "epoch": 1.54, + "learning_rate": 1.0060874622592156e-06, + "loss": 0.6519, + "step": 60060 + }, + { + "epoch": 1.54, + "learning_rate": 1.0060597923156918e-06, + "loss": 0.7021, + "step": 60061 + }, + { + "epoch": 1.54, + "learning_rate": 1.006032122367528e-06, + "loss": 0.6455, + "step": 60062 + }, + { + "epoch": 1.54, + "learning_rate": 1.0060044524147457e-06, + "loss": 0.7363, + "step": 60063 + }, + { + "epoch": 1.54, + "learning_rate": 1.0059767824573667e-06, + "loss": 0.5117, + "step": 60064 + }, + { + "epoch": 1.54, + "learning_rate": 1.005949112495411e-06, + "loss": 0.4927, + "step": 60065 + }, + { + "epoch": 1.54, + "learning_rate": 1.0059214425289003e-06, + "loss": 0.7402, + "step": 60066 + }, + { + "epoch": 1.54, + "learning_rate": 1.0058937725578557e-06, + "loss": 0.7021, + "step": 60067 + }, + { + "epoch": 1.54, + "learning_rate": 1.005866102582299e-06, + "loss": 0.5708, + "step": 60068 + }, + { + "epoch": 1.54, + "learning_rate": 1.0058384326022506e-06, + "loss": 0.7539, + "step": 60069 + }, + { + "epoch": 1.54, + "learning_rate": 1.0058107626177323e-06, + "loss": 0.6787, + "step": 60070 + }, + { + "epoch": 1.54, + "learning_rate": 1.0057830926287645e-06, + "loss": 0.5649, + "step": 60071 + }, + { + "epoch": 1.54, + "learning_rate": 1.005755422635369e-06, + "loss": 0.6182, + "step": 60072 + }, + { + "epoch": 1.54, + "learning_rate": 1.0057277526375668e-06, + "loss": 0.6313, + "step": 60073 + }, + { + "epoch": 1.54, + "learning_rate": 1.0057000826353796e-06, + "loss": 0.6309, + "step": 60074 + }, + { + "epoch": 1.54, + "learning_rate": 1.0056724126288276e-06, + "loss": 0.5007, + "step": 60075 + }, + { + "epoch": 1.54, + "learning_rate": 1.0056447426179326e-06, + "loss": 0.7012, + "step": 60076 + }, + { + "epoch": 1.54, + "learning_rate": 1.0056170726027157e-06, + "loss": 0.6748, + "step": 60077 + }, + { + "epoch": 1.54, + "learning_rate": 1.005589402583198e-06, + "loss": 0.7627, + "step": 60078 + }, + { + "epoch": 1.54, + "learning_rate": 1.0055617325594007e-06, + "loss": 0.5957, + "step": 60079 + }, + { + "epoch": 1.54, + "learning_rate": 1.005534062531345e-06, + "loss": 0.7061, + "step": 60080 + }, + { + "epoch": 1.54, + "learning_rate": 1.0055063924990526e-06, + "loss": 0.5654, + "step": 60081 + }, + { + "epoch": 1.54, + "learning_rate": 1.0054787224625436e-06, + "loss": 0.5459, + "step": 60082 + }, + { + "epoch": 1.54, + "learning_rate": 1.0054510524218402e-06, + "loss": 0.7686, + "step": 60083 + }, + { + "epoch": 1.54, + "learning_rate": 1.0054233823769632e-06, + "loss": 0.6733, + "step": 60084 + }, + { + "epoch": 1.54, + "learning_rate": 1.0053957123279337e-06, + "loss": 0.7705, + "step": 60085 + }, + { + "epoch": 1.54, + "learning_rate": 1.0053680422747727e-06, + "loss": 0.6714, + "step": 60086 + }, + { + "epoch": 1.54, + "learning_rate": 1.0053403722175018e-06, + "loss": 0.4596, + "step": 60087 + }, + { + "epoch": 1.54, + "learning_rate": 1.005312702156142e-06, + "loss": 0.8486, + "step": 60088 + }, + { + "epoch": 1.54, + "learning_rate": 1.0052850320907147e-06, + "loss": 0.5015, + "step": 60089 + }, + { + "epoch": 1.54, + "learning_rate": 1.0052573620212405e-06, + "loss": 0.481, + "step": 60090 + }, + { + "epoch": 1.54, + "learning_rate": 1.0052296919477415e-06, + "loss": 0.5908, + "step": 60091 + }, + { + "epoch": 1.54, + "learning_rate": 1.005202021870238e-06, + "loss": 0.5354, + "step": 60092 + }, + { + "epoch": 1.54, + "learning_rate": 1.0051743517887517e-06, + "loss": 0.6914, + "step": 60093 + }, + { + "epoch": 1.54, + "learning_rate": 1.0051466817033035e-06, + "loss": 0.6006, + "step": 60094 + }, + { + "epoch": 1.54, + "learning_rate": 1.0051190116139148e-06, + "loss": 0.6738, + "step": 60095 + }, + { + "epoch": 1.54, + "learning_rate": 1.0050913415206065e-06, + "loss": 0.6233, + "step": 60096 + }, + { + "epoch": 1.54, + "learning_rate": 1.0050636714234004e-06, + "loss": 0.6709, + "step": 60097 + }, + { + "epoch": 1.54, + "learning_rate": 1.005036001322317e-06, + "loss": 0.5103, + "step": 60098 + }, + { + "epoch": 1.54, + "learning_rate": 1.0050083312173778e-06, + "loss": 0.6895, + "step": 60099 + }, + { + "epoch": 1.54, + "learning_rate": 1.004980661108604e-06, + "loss": 0.7451, + "step": 60100 + }, + { + "epoch": 1.54, + "learning_rate": 1.0049529909960168e-06, + "loss": 0.6064, + "step": 60101 + }, + { + "epoch": 1.54, + "learning_rate": 1.0049253208796372e-06, + "loss": 0.8926, + "step": 60102 + }, + { + "epoch": 1.54, + "learning_rate": 1.0048976507594866e-06, + "loss": 0.6123, + "step": 60103 + }, + { + "epoch": 1.54, + "learning_rate": 1.004869980635586e-06, + "loss": 0.6499, + "step": 60104 + }, + { + "epoch": 1.54, + "learning_rate": 1.0048423105079566e-06, + "loss": 0.6709, + "step": 60105 + }, + { + "epoch": 1.54, + "learning_rate": 1.00481464037662e-06, + "loss": 0.5034, + "step": 60106 + }, + { + "epoch": 1.54, + "learning_rate": 1.0047869702415967e-06, + "loss": 0.665, + "step": 60107 + }, + { + "epoch": 1.54, + "learning_rate": 1.0047593001029084e-06, + "loss": 0.6699, + "step": 60108 + }, + { + "epoch": 1.54, + "learning_rate": 1.0047316299605762e-06, + "loss": 0.7256, + "step": 60109 + }, + { + "epoch": 1.54, + "learning_rate": 1.0047039598146212e-06, + "loss": 0.7793, + "step": 60110 + }, + { + "epoch": 1.54, + "learning_rate": 1.0046762896650642e-06, + "loss": 0.79, + "step": 60111 + }, + { + "epoch": 1.54, + "learning_rate": 1.0046486195119272e-06, + "loss": 0.5295, + "step": 60112 + }, + { + "epoch": 1.54, + "learning_rate": 1.004620949355231e-06, + "loss": 0.6631, + "step": 60113 + }, + { + "epoch": 1.54, + "learning_rate": 1.0045932791949967e-06, + "loss": 0.6162, + "step": 60114 + }, + { + "epoch": 1.54, + "learning_rate": 1.0045656090312453e-06, + "loss": 0.6543, + "step": 60115 + }, + { + "epoch": 1.54, + "learning_rate": 1.0045379388639984e-06, + "loss": 0.7676, + "step": 60116 + }, + { + "epoch": 1.54, + "learning_rate": 1.0045102686932768e-06, + "loss": 0.4463, + "step": 60117 + }, + { + "epoch": 1.54, + "learning_rate": 1.004482598519102e-06, + "loss": 0.7959, + "step": 60118 + }, + { + "epoch": 1.54, + "learning_rate": 1.0044549283414954e-06, + "loss": 0.5361, + "step": 60119 + }, + { + "epoch": 1.54, + "learning_rate": 1.0044272581604779e-06, + "loss": 0.7056, + "step": 60120 + }, + { + "epoch": 1.54, + "learning_rate": 1.0043995879760701e-06, + "loss": 0.4377, + "step": 60121 + }, + { + "epoch": 1.54, + "learning_rate": 1.004371917788294e-06, + "loss": 0.5593, + "step": 60122 + }, + { + "epoch": 1.54, + "learning_rate": 1.0043442475971705e-06, + "loss": 0.7285, + "step": 60123 + }, + { + "epoch": 1.54, + "learning_rate": 1.0043165774027207e-06, + "loss": 0.5244, + "step": 60124 + }, + { + "epoch": 1.54, + "learning_rate": 1.0042889072049663e-06, + "loss": 0.5249, + "step": 60125 + }, + { + "epoch": 1.54, + "learning_rate": 1.0042612370039276e-06, + "loss": 0.5913, + "step": 60126 + }, + { + "epoch": 1.54, + "learning_rate": 1.0042335667996265e-06, + "loss": 0.5762, + "step": 60127 + }, + { + "epoch": 1.54, + "learning_rate": 1.0042058965920841e-06, + "loss": 0.5957, + "step": 60128 + }, + { + "epoch": 1.54, + "learning_rate": 1.0041782263813212e-06, + "loss": 0.7148, + "step": 60129 + }, + { + "epoch": 1.54, + "learning_rate": 1.0041505561673592e-06, + "loss": 0.6528, + "step": 60130 + }, + { + "epoch": 1.54, + "learning_rate": 1.0041228859502195e-06, + "loss": 0.5476, + "step": 60131 + }, + { + "epoch": 1.54, + "learning_rate": 1.0040952157299228e-06, + "loss": 0.6299, + "step": 60132 + }, + { + "epoch": 1.54, + "learning_rate": 1.0040675455064911e-06, + "loss": 0.5935, + "step": 60133 + }, + { + "epoch": 1.54, + "learning_rate": 1.0040398752799446e-06, + "loss": 0.5527, + "step": 60134 + }, + { + "epoch": 1.54, + "learning_rate": 1.0040122050503052e-06, + "loss": 0.5742, + "step": 60135 + }, + { + "epoch": 1.54, + "learning_rate": 1.0039845348175935e-06, + "loss": 0.4805, + "step": 60136 + }, + { + "epoch": 1.54, + "learning_rate": 1.0039568645818314e-06, + "loss": 0.52, + "step": 60137 + }, + { + "epoch": 1.54, + "learning_rate": 1.0039291943430397e-06, + "loss": 0.71, + "step": 60138 + }, + { + "epoch": 1.54, + "learning_rate": 1.0039015241012396e-06, + "loss": 0.5337, + "step": 60139 + }, + { + "epoch": 1.54, + "learning_rate": 1.003873853856452e-06, + "loss": 0.7881, + "step": 60140 + }, + { + "epoch": 1.54, + "learning_rate": 1.0038461836086984e-06, + "loss": 0.7461, + "step": 60141 + }, + { + "epoch": 1.54, + "learning_rate": 1.0038185133580001e-06, + "loss": 0.6104, + "step": 60142 + }, + { + "epoch": 1.54, + "learning_rate": 1.0037908431043781e-06, + "loss": 0.6396, + "step": 60143 + }, + { + "epoch": 1.54, + "learning_rate": 1.0037631728478538e-06, + "loss": 0.5122, + "step": 60144 + }, + { + "epoch": 1.54, + "learning_rate": 1.0037355025884482e-06, + "loss": 0.7124, + "step": 60145 + }, + { + "epoch": 1.54, + "learning_rate": 1.003707832326182e-06, + "loss": 0.5923, + "step": 60146 + }, + { + "epoch": 1.54, + "learning_rate": 1.0036801620610775e-06, + "loss": 0.6245, + "step": 60147 + }, + { + "epoch": 1.54, + "learning_rate": 1.003652491793155e-06, + "loss": 0.6582, + "step": 60148 + }, + { + "epoch": 1.54, + "learning_rate": 1.003624821522436e-06, + "loss": 0.707, + "step": 60149 + }, + { + "epoch": 1.54, + "learning_rate": 1.0035971512489414e-06, + "loss": 0.6826, + "step": 60150 + }, + { + "epoch": 1.54, + "learning_rate": 1.0035694809726927e-06, + "loss": 0.5928, + "step": 60151 + }, + { + "epoch": 1.54, + "learning_rate": 1.0035418106937111e-06, + "loss": 0.6904, + "step": 60152 + }, + { + "epoch": 1.54, + "learning_rate": 1.003514140412018e-06, + "loss": 0.6016, + "step": 60153 + }, + { + "epoch": 1.54, + "learning_rate": 1.003486470127634e-06, + "loss": 0.707, + "step": 60154 + }, + { + "epoch": 1.54, + "learning_rate": 1.0034587998405806e-06, + "loss": 0.7017, + "step": 60155 + }, + { + "epoch": 1.54, + "learning_rate": 1.003431129550879e-06, + "loss": 0.4719, + "step": 60156 + }, + { + "epoch": 1.54, + "learning_rate": 1.00340345925855e-06, + "loss": 0.6016, + "step": 60157 + }, + { + "epoch": 1.54, + "learning_rate": 1.0033757889636159e-06, + "loss": 0.6406, + "step": 60158 + }, + { + "epoch": 1.54, + "learning_rate": 1.0033481186660964e-06, + "loss": 0.5723, + "step": 60159 + }, + { + "epoch": 1.54, + "learning_rate": 1.0033204483660138e-06, + "loss": 0.7852, + "step": 60160 + }, + { + "epoch": 1.54, + "learning_rate": 1.0032927780633884e-06, + "loss": 0.7988, + "step": 60161 + }, + { + "epoch": 1.54, + "learning_rate": 1.0032651077582424e-06, + "loss": 0.5034, + "step": 60162 + }, + { + "epoch": 1.54, + "learning_rate": 1.0032374374505963e-06, + "loss": 0.5688, + "step": 60163 + }, + { + "epoch": 1.54, + "learning_rate": 1.0032097671404713e-06, + "loss": 0.5439, + "step": 60164 + }, + { + "epoch": 1.54, + "learning_rate": 1.0031820968278888e-06, + "loss": 0.6143, + "step": 60165 + }, + { + "epoch": 1.54, + "learning_rate": 1.00315442651287e-06, + "loss": 0.668, + "step": 60166 + }, + { + "epoch": 1.54, + "learning_rate": 1.0031267561954357e-06, + "loss": 0.7832, + "step": 60167 + }, + { + "epoch": 1.54, + "learning_rate": 1.003099085875608e-06, + "loss": 0.7334, + "step": 60168 + }, + { + "epoch": 1.54, + "learning_rate": 1.003071415553407e-06, + "loss": 0.8301, + "step": 60169 + }, + { + "epoch": 1.54, + "learning_rate": 1.0030437452288543e-06, + "loss": 0.6785, + "step": 60170 + }, + { + "epoch": 1.54, + "learning_rate": 1.0030160749019713e-06, + "loss": 0.5601, + "step": 60171 + }, + { + "epoch": 1.54, + "learning_rate": 1.002988404572779e-06, + "loss": 0.5518, + "step": 60172 + }, + { + "epoch": 1.54, + "learning_rate": 1.002960734241299e-06, + "loss": 0.6606, + "step": 60173 + }, + { + "epoch": 1.54, + "learning_rate": 1.0029330639075515e-06, + "loss": 0.7402, + "step": 60174 + }, + { + "epoch": 1.54, + "learning_rate": 1.0029053935715585e-06, + "loss": 0.6836, + "step": 60175 + }, + { + "epoch": 1.54, + "learning_rate": 1.002877723233341e-06, + "loss": 0.4028, + "step": 60176 + }, + { + "epoch": 1.54, + "learning_rate": 1.0028500528929201e-06, + "loss": 0.8057, + "step": 60177 + }, + { + "epoch": 1.54, + "learning_rate": 1.0028223825503173e-06, + "loss": 0.8066, + "step": 60178 + }, + { + "epoch": 1.54, + "learning_rate": 1.0027947122055533e-06, + "loss": 0.6768, + "step": 60179 + }, + { + "epoch": 1.54, + "learning_rate": 1.0027670418586493e-06, + "loss": 0.6699, + "step": 60180 + }, + { + "epoch": 1.54, + "learning_rate": 1.0027393715096273e-06, + "loss": 0.707, + "step": 60181 + }, + { + "epoch": 1.54, + "learning_rate": 1.0027117011585073e-06, + "loss": 0.625, + "step": 60182 + }, + { + "epoch": 1.54, + "learning_rate": 1.0026840308053115e-06, + "loss": 0.5796, + "step": 60183 + }, + { + "epoch": 1.54, + "learning_rate": 1.0026563604500604e-06, + "loss": 0.6001, + "step": 60184 + }, + { + "epoch": 1.54, + "learning_rate": 1.0026286900927756e-06, + "loss": 0.5295, + "step": 60185 + }, + { + "epoch": 1.54, + "learning_rate": 1.002601019733478e-06, + "loss": 0.688, + "step": 60186 + }, + { + "epoch": 1.54, + "learning_rate": 1.0025733493721892e-06, + "loss": 0.6338, + "step": 60187 + }, + { + "epoch": 1.54, + "learning_rate": 1.0025456790089298e-06, + "loss": 0.8564, + "step": 60188 + }, + { + "epoch": 1.54, + "learning_rate": 1.0025180086437214e-06, + "loss": 0.5303, + "step": 60189 + }, + { + "epoch": 1.54, + "learning_rate": 1.002490338276585e-06, + "loss": 0.5442, + "step": 60190 + }, + { + "epoch": 1.54, + "learning_rate": 1.002462667907542e-06, + "loss": 0.5757, + "step": 60191 + }, + { + "epoch": 1.54, + "learning_rate": 1.002434997536613e-06, + "loss": 0.6729, + "step": 60192 + }, + { + "epoch": 1.54, + "learning_rate": 1.0024073271638203e-06, + "loss": 0.5165, + "step": 60193 + }, + { + "epoch": 1.54, + "learning_rate": 1.0023796567891842e-06, + "loss": 0.5688, + "step": 60194 + }, + { + "epoch": 1.54, + "learning_rate": 1.002351986412726e-06, + "loss": 0.6377, + "step": 60195 + }, + { + "epoch": 1.54, + "learning_rate": 1.002324316034467e-06, + "loss": 0.6899, + "step": 60196 + }, + { + "epoch": 1.54, + "learning_rate": 1.0022966456544282e-06, + "loss": 0.7656, + "step": 60197 + }, + { + "epoch": 1.54, + "learning_rate": 1.0022689752726315e-06, + "loss": 0.6777, + "step": 60198 + }, + { + "epoch": 1.54, + "learning_rate": 1.002241304889097e-06, + "loss": 0.5797, + "step": 60199 + }, + { + "epoch": 1.54, + "learning_rate": 1.0022136345038468e-06, + "loss": 0.5132, + "step": 60200 + }, + { + "epoch": 1.54, + "learning_rate": 1.0021859641169012e-06, + "loss": 0.5386, + "step": 60201 + }, + { + "epoch": 1.54, + "learning_rate": 1.0021582937282824e-06, + "loss": 0.6709, + "step": 60202 + }, + { + "epoch": 1.54, + "learning_rate": 1.0021306233380112e-06, + "loss": 0.5337, + "step": 60203 + }, + { + "epoch": 1.54, + "learning_rate": 1.0021029529461085e-06, + "loss": 0.51, + "step": 60204 + }, + { + "epoch": 1.54, + "learning_rate": 1.0020752825525956e-06, + "loss": 0.748, + "step": 60205 + }, + { + "epoch": 1.54, + "learning_rate": 1.0020476121574937e-06, + "loss": 0.5137, + "step": 60206 + }, + { + "epoch": 1.54, + "learning_rate": 1.002019941760824e-06, + "loss": 0.6523, + "step": 60207 + }, + { + "epoch": 1.54, + "learning_rate": 1.0019922713626082e-06, + "loss": 0.6201, + "step": 60208 + }, + { + "epoch": 1.54, + "learning_rate": 1.0019646009628664e-06, + "loss": 0.7549, + "step": 60209 + }, + { + "epoch": 1.54, + "learning_rate": 1.0019369305616208e-06, + "loss": 0.5972, + "step": 60210 + }, + { + "epoch": 1.54, + "learning_rate": 1.0019092601588918e-06, + "loss": 0.6206, + "step": 60211 + }, + { + "epoch": 1.54, + "learning_rate": 1.0018815897547012e-06, + "loss": 0.6193, + "step": 60212 + }, + { + "epoch": 1.54, + "learning_rate": 1.00185391934907e-06, + "loss": 0.6025, + "step": 60213 + }, + { + "epoch": 1.54, + "learning_rate": 1.001826248942019e-06, + "loss": 0.7393, + "step": 60214 + }, + { + "epoch": 1.54, + "learning_rate": 1.0017985785335702e-06, + "loss": 0.6816, + "step": 60215 + }, + { + "epoch": 1.54, + "learning_rate": 1.001770908123744e-06, + "loss": 0.7607, + "step": 60216 + }, + { + "epoch": 1.54, + "learning_rate": 1.0017432377125621e-06, + "loss": 0.5811, + "step": 60217 + }, + { + "epoch": 1.54, + "learning_rate": 1.0017155673000454e-06, + "loss": 0.5757, + "step": 60218 + }, + { + "epoch": 1.54, + "learning_rate": 1.0016878968862152e-06, + "loss": 0.5703, + "step": 60219 + }, + { + "epoch": 1.54, + "learning_rate": 1.0016602264710924e-06, + "loss": 0.604, + "step": 60220 + }, + { + "epoch": 1.54, + "learning_rate": 1.001632556054699e-06, + "loss": 0.459, + "step": 60221 + }, + { + "epoch": 1.54, + "learning_rate": 1.0016048856370549e-06, + "loss": 0.7949, + "step": 60222 + }, + { + "epoch": 1.54, + "learning_rate": 1.0015772152181827e-06, + "loss": 0.8184, + "step": 60223 + }, + { + "epoch": 1.54, + "learning_rate": 1.0015495447981026e-06, + "loss": 0.5781, + "step": 60224 + }, + { + "epoch": 1.54, + "learning_rate": 1.001521874376836e-06, + "loss": 0.7134, + "step": 60225 + }, + { + "epoch": 1.54, + "learning_rate": 1.0014942039544042e-06, + "loss": 0.6992, + "step": 60226 + }, + { + "epoch": 1.54, + "learning_rate": 1.0014665335308285e-06, + "loss": 0.873, + "step": 60227 + }, + { + "epoch": 1.54, + "learning_rate": 1.00143886310613e-06, + "loss": 0.8086, + "step": 60228 + }, + { + "epoch": 1.54, + "learning_rate": 1.0014111926803297e-06, + "loss": 0.6494, + "step": 60229 + }, + { + "epoch": 1.54, + "learning_rate": 1.0013835222534488e-06, + "loss": 0.7881, + "step": 60230 + }, + { + "epoch": 1.54, + "learning_rate": 1.0013558518255087e-06, + "loss": 0.7275, + "step": 60231 + }, + { + "epoch": 1.54, + "learning_rate": 1.0013281813965303e-06, + "loss": 0.6042, + "step": 60232 + }, + { + "epoch": 1.54, + "learning_rate": 1.0013005109665353e-06, + "loss": 0.6392, + "step": 60233 + }, + { + "epoch": 1.54, + "learning_rate": 1.0012728405355444e-06, + "loss": 0.6592, + "step": 60234 + }, + { + "epoch": 1.54, + "learning_rate": 1.0012451701035792e-06, + "loss": 0.6455, + "step": 60235 + }, + { + "epoch": 1.54, + "learning_rate": 1.0012174996706602e-06, + "loss": 0.6794, + "step": 60236 + }, + { + "epoch": 1.54, + "learning_rate": 1.0011898292368093e-06, + "loss": 0.7324, + "step": 60237 + }, + { + "epoch": 1.54, + "learning_rate": 1.0011621588020474e-06, + "loss": 0.4565, + "step": 60238 + }, + { + "epoch": 1.54, + "learning_rate": 1.0011344883663953e-06, + "loss": 0.5864, + "step": 60239 + }, + { + "epoch": 1.54, + "learning_rate": 1.001106817929875e-06, + "loss": 0.5425, + "step": 60240 + }, + { + "epoch": 1.54, + "learning_rate": 1.001079147492507e-06, + "loss": 0.7979, + "step": 60241 + }, + { + "epoch": 1.54, + "learning_rate": 1.001051477054313e-06, + "loss": 0.7158, + "step": 60242 + }, + { + "epoch": 1.54, + "learning_rate": 1.0010238066153137e-06, + "loss": 0.9268, + "step": 60243 + }, + { + "epoch": 1.54, + "learning_rate": 1.0009961361755308e-06, + "loss": 0.7725, + "step": 60244 + }, + { + "epoch": 1.54, + "learning_rate": 1.0009684657349848e-06, + "loss": 0.627, + "step": 60245 + }, + { + "epoch": 1.54, + "learning_rate": 1.0009407952936978e-06, + "loss": 0.5664, + "step": 60246 + }, + { + "epoch": 1.54, + "learning_rate": 1.00091312485169e-06, + "loss": 0.6504, + "step": 60247 + }, + { + "epoch": 1.54, + "learning_rate": 1.0008854544089835e-06, + "loss": 0.5271, + "step": 60248 + }, + { + "epoch": 1.54, + "learning_rate": 1.0008577839655988e-06, + "loss": 0.6689, + "step": 60249 + }, + { + "epoch": 1.54, + "learning_rate": 1.0008301135215572e-06, + "loss": 0.5752, + "step": 60250 + }, + { + "epoch": 1.54, + "learning_rate": 1.00080244307688e-06, + "loss": 0.7422, + "step": 60251 + }, + { + "epoch": 1.54, + "learning_rate": 1.0007747726315886e-06, + "loss": 0.5908, + "step": 60252 + }, + { + "epoch": 1.54, + "learning_rate": 1.0007471021857041e-06, + "loss": 0.6245, + "step": 60253 + }, + { + "epoch": 1.54, + "learning_rate": 1.0007194317392475e-06, + "loss": 0.5303, + "step": 60254 + }, + { + "epoch": 1.54, + "learning_rate": 1.0006917612922398e-06, + "loss": 0.4619, + "step": 60255 + }, + { + "epoch": 1.54, + "learning_rate": 1.0006640908447027e-06, + "loss": 0.4778, + "step": 60256 + }, + { + "epoch": 1.54, + "learning_rate": 1.000636420396657e-06, + "loss": 0.6582, + "step": 60257 + }, + { + "epoch": 1.54, + "learning_rate": 1.0006087499481243e-06, + "loss": 0.7783, + "step": 60258 + }, + { + "epoch": 1.54, + "learning_rate": 1.0005810794991255e-06, + "loss": 0.5913, + "step": 60259 + }, + { + "epoch": 1.54, + "learning_rate": 1.0005534090496815e-06, + "loss": 0.7363, + "step": 60260 + }, + { + "epoch": 1.54, + "learning_rate": 1.0005257385998139e-06, + "loss": 0.626, + "step": 60261 + }, + { + "epoch": 1.54, + "learning_rate": 1.0004980681495436e-06, + "loss": 0.5239, + "step": 60262 + }, + { + "epoch": 1.54, + "learning_rate": 1.0004703976988925e-06, + "loss": 0.4545, + "step": 60263 + }, + { + "epoch": 1.54, + "learning_rate": 1.0004427272478807e-06, + "loss": 0.7773, + "step": 60264 + }, + { + "epoch": 1.54, + "learning_rate": 1.0004150567965298e-06, + "loss": 0.7275, + "step": 60265 + }, + { + "epoch": 1.54, + "learning_rate": 1.0003873863448616e-06, + "loss": 0.9746, + "step": 60266 + }, + { + "epoch": 1.54, + "learning_rate": 1.0003597158928965e-06, + "loss": 0.5538, + "step": 60267 + }, + { + "epoch": 1.54, + "learning_rate": 1.000332045440656e-06, + "loss": 0.6333, + "step": 60268 + }, + { + "epoch": 1.54, + "learning_rate": 1.0003043749881615e-06, + "loss": 0.5977, + "step": 60269 + }, + { + "epoch": 1.54, + "learning_rate": 1.0002767045354336e-06, + "loss": 0.4883, + "step": 60270 + }, + { + "epoch": 1.54, + "learning_rate": 1.0002490340824942e-06, + "loss": 0.5415, + "step": 60271 + }, + { + "epoch": 1.54, + "learning_rate": 1.0002213636293638e-06, + "loss": 0.6055, + "step": 60272 + }, + { + "epoch": 1.54, + "learning_rate": 1.0001936931760643e-06, + "loss": 0.8164, + "step": 60273 + }, + { + "epoch": 1.54, + "learning_rate": 1.000166022722616e-06, + "loss": 0.7295, + "step": 60274 + }, + { + "epoch": 1.54, + "learning_rate": 1.0001383522690411e-06, + "loss": 0.575, + "step": 60275 + }, + { + "epoch": 1.54, + "learning_rate": 1.00011068181536e-06, + "loss": 0.749, + "step": 60276 + }, + { + "epoch": 1.54, + "learning_rate": 1.0000830113615942e-06, + "loss": 0.4927, + "step": 60277 + }, + { + "epoch": 1.54, + "learning_rate": 1.0000553409077647e-06, + "loss": 0.5247, + "step": 60278 + }, + { + "epoch": 1.54, + "learning_rate": 1.0000276704538927e-06, + "loss": 0.7324, + "step": 60279 + }, + { + "epoch": 1.55, + "learning_rate": 1e-06, + "loss": 0.7705, + "step": 60280 + }, + { + "epoch": 1.55, + "learning_rate": 9.999723295461072e-07, + "loss": 0.7637, + "step": 60281 + }, + { + "epoch": 1.55, + "learning_rate": 9.999446590922352e-07, + "loss": 0.7344, + "step": 60282 + }, + { + "epoch": 1.55, + "learning_rate": 9.99916988638406e-07, + "loss": 0.7314, + "step": 60283 + }, + { + "epoch": 1.55, + "learning_rate": 9.9988931818464e-07, + "loss": 0.4971, + "step": 60284 + }, + { + "epoch": 1.55, + "learning_rate": 9.998616477309592e-07, + "loss": 0.668, + "step": 60285 + }, + { + "epoch": 1.55, + "learning_rate": 9.99833977277384e-07, + "loss": 0.6865, + "step": 60286 + }, + { + "epoch": 1.55, + "learning_rate": 9.998063068239358e-07, + "loss": 0.5713, + "step": 60287 + }, + { + "epoch": 1.55, + "learning_rate": 9.997786363706362e-07, + "loss": 0.5596, + "step": 60288 + }, + { + "epoch": 1.55, + "learning_rate": 9.99750965917506e-07, + "loss": 0.6802, + "step": 60289 + }, + { + "epoch": 1.55, + "learning_rate": 9.997232954645663e-07, + "loss": 0.6846, + "step": 60290 + }, + { + "epoch": 1.55, + "learning_rate": 9.996956250118384e-07, + "loss": 0.7295, + "step": 60291 + }, + { + "epoch": 1.55, + "learning_rate": 9.996679545593439e-07, + "loss": 0.6768, + "step": 60292 + }, + { + "epoch": 1.55, + "learning_rate": 9.996402841071032e-07, + "loss": 0.5918, + "step": 60293 + }, + { + "epoch": 1.55, + "learning_rate": 9.996126136551383e-07, + "loss": 0.8623, + "step": 60294 + }, + { + "epoch": 1.55, + "learning_rate": 9.995849432034703e-07, + "loss": 0.7861, + "step": 60295 + }, + { + "epoch": 1.55, + "learning_rate": 9.995572727521195e-07, + "loss": 0.6943, + "step": 60296 + }, + { + "epoch": 1.55, + "learning_rate": 9.995296023011079e-07, + "loss": 0.4783, + "step": 60297 + }, + { + "epoch": 1.55, + "learning_rate": 9.995019318504565e-07, + "loss": 0.5502, + "step": 60298 + }, + { + "epoch": 1.55, + "learning_rate": 9.994742614001863e-07, + "loss": 0.6118, + "step": 60299 + }, + { + "epoch": 1.55, + "learning_rate": 9.994465909503186e-07, + "loss": 0.7256, + "step": 60300 + }, + { + "epoch": 1.55, + "learning_rate": 9.994189205008747e-07, + "loss": 0.6523, + "step": 60301 + }, + { + "epoch": 1.55, + "learning_rate": 9.993912500518758e-07, + "loss": 0.7832, + "step": 60302 + }, + { + "epoch": 1.55, + "learning_rate": 9.993635796033427e-07, + "loss": 0.5573, + "step": 60303 + }, + { + "epoch": 1.55, + "learning_rate": 9.993359091552972e-07, + "loss": 0.4624, + "step": 60304 + }, + { + "epoch": 1.55, + "learning_rate": 9.993082387077603e-07, + "loss": 0.7188, + "step": 60305 + }, + { + "epoch": 1.55, + "learning_rate": 9.992805682607527e-07, + "loss": 0.7246, + "step": 60306 + }, + { + "epoch": 1.55, + "learning_rate": 9.992528978142962e-07, + "loss": 0.6367, + "step": 60307 + }, + { + "epoch": 1.55, + "learning_rate": 9.992252273684113e-07, + "loss": 0.6646, + "step": 60308 + }, + { + "epoch": 1.55, + "learning_rate": 9.9919755692312e-07, + "loss": 0.7266, + "step": 60309 + }, + { + "epoch": 1.55, + "learning_rate": 9.991698864784429e-07, + "loss": 0.5603, + "step": 60310 + }, + { + "epoch": 1.55, + "learning_rate": 9.991422160344013e-07, + "loss": 0.5034, + "step": 60311 + }, + { + "epoch": 1.55, + "learning_rate": 9.991145455910164e-07, + "loss": 0.563, + "step": 60312 + }, + { + "epoch": 1.55, + "learning_rate": 9.9908687514831e-07, + "loss": 0.749, + "step": 60313 + }, + { + "epoch": 1.55, + "learning_rate": 9.990592047063022e-07, + "loss": 0.8057, + "step": 60314 + }, + { + "epoch": 1.55, + "learning_rate": 9.990315342650154e-07, + "loss": 0.6445, + "step": 60315 + }, + { + "epoch": 1.55, + "learning_rate": 9.990038638244695e-07, + "loss": 0.5535, + "step": 60316 + }, + { + "epoch": 1.55, + "learning_rate": 9.989761933846864e-07, + "loss": 0.8467, + "step": 60317 + }, + { + "epoch": 1.55, + "learning_rate": 9.98948522945687e-07, + "loss": 0.6509, + "step": 60318 + }, + { + "epoch": 1.55, + "learning_rate": 9.98920852507493e-07, + "loss": 0.5624, + "step": 60319 + }, + { + "epoch": 1.55, + "learning_rate": 9.988931820701251e-07, + "loss": 0.6631, + "step": 60320 + }, + { + "epoch": 1.55, + "learning_rate": 9.988655116336046e-07, + "loss": 0.5481, + "step": 60321 + }, + { + "epoch": 1.55, + "learning_rate": 9.988378411979527e-07, + "loss": 0.5747, + "step": 60322 + }, + { + "epoch": 1.55, + "learning_rate": 9.988101707631908e-07, + "loss": 0.7188, + "step": 60323 + }, + { + "epoch": 1.55, + "learning_rate": 9.987825003293397e-07, + "loss": 0.7695, + "step": 60324 + }, + { + "epoch": 1.55, + "learning_rate": 9.987548298964211e-07, + "loss": 0.7036, + "step": 60325 + }, + { + "epoch": 1.55, + "learning_rate": 9.98727159464456e-07, + "loss": 0.6816, + "step": 60326 + }, + { + "epoch": 1.55, + "learning_rate": 9.986994890334648e-07, + "loss": 0.6533, + "step": 60327 + }, + { + "epoch": 1.55, + "learning_rate": 9.986718186034698e-07, + "loss": 0.7344, + "step": 60328 + }, + { + "epoch": 1.55, + "learning_rate": 9.986441481744912e-07, + "loss": 0.4391, + "step": 60329 + }, + { + "epoch": 1.55, + "learning_rate": 9.986164777465513e-07, + "loss": 0.5654, + "step": 60330 + }, + { + "epoch": 1.55, + "learning_rate": 9.985888073196702e-07, + "loss": 0.8242, + "step": 60331 + }, + { + "epoch": 1.55, + "learning_rate": 9.985611368938702e-07, + "loss": 0.577, + "step": 60332 + }, + { + "epoch": 1.55, + "learning_rate": 9.985334664691712e-07, + "loss": 0.5747, + "step": 60333 + }, + { + "epoch": 1.55, + "learning_rate": 9.985057960455957e-07, + "loss": 0.7734, + "step": 60334 + }, + { + "epoch": 1.55, + "learning_rate": 9.98478125623164e-07, + "loss": 0.7012, + "step": 60335 + }, + { + "epoch": 1.55, + "learning_rate": 9.984504552018977e-07, + "loss": 0.6101, + "step": 60336 + }, + { + "epoch": 1.55, + "learning_rate": 9.984227847818174e-07, + "loss": 0.7617, + "step": 60337 + }, + { + "epoch": 1.55, + "learning_rate": 9.98395114362945e-07, + "loss": 0.4521, + "step": 60338 + }, + { + "epoch": 1.55, + "learning_rate": 9.98367443945301e-07, + "loss": 0.7695, + "step": 60339 + }, + { + "epoch": 1.55, + "learning_rate": 9.983397735289075e-07, + "loss": 0.6626, + "step": 60340 + }, + { + "epoch": 1.55, + "learning_rate": 9.983121031137847e-07, + "loss": 0.585, + "step": 60341 + }, + { + "epoch": 1.55, + "learning_rate": 9.982844326999545e-07, + "loss": 0.6816, + "step": 60342 + }, + { + "epoch": 1.55, + "learning_rate": 9.982567622874378e-07, + "loss": 0.8237, + "step": 60343 + }, + { + "epoch": 1.55, + "learning_rate": 9.982290918762558e-07, + "loss": 0.7266, + "step": 60344 + }, + { + "epoch": 1.55, + "learning_rate": 9.982014214664301e-07, + "loss": 0.8037, + "step": 60345 + }, + { + "epoch": 1.55, + "learning_rate": 9.981737510579809e-07, + "loss": 0.707, + "step": 60346 + }, + { + "epoch": 1.55, + "learning_rate": 9.9814608065093e-07, + "loss": 0.6455, + "step": 60347 + }, + { + "epoch": 1.55, + "learning_rate": 9.98118410245299e-07, + "loss": 0.7744, + "step": 60348 + }, + { + "epoch": 1.55, + "learning_rate": 9.980907398411082e-07, + "loss": 0.7402, + "step": 60349 + }, + { + "epoch": 1.55, + "learning_rate": 9.980630694383794e-07, + "loss": 0.5732, + "step": 60350 + }, + { + "epoch": 1.55, + "learning_rate": 9.980353990371337e-07, + "loss": 0.8701, + "step": 60351 + }, + { + "epoch": 1.55, + "learning_rate": 9.98007728637392e-07, + "loss": 0.6528, + "step": 60352 + }, + { + "epoch": 1.55, + "learning_rate": 9.97980058239176e-07, + "loss": 0.6377, + "step": 60353 + }, + { + "epoch": 1.55, + "learning_rate": 9.979523878425064e-07, + "loss": 0.7041, + "step": 60354 + }, + { + "epoch": 1.55, + "learning_rate": 9.97924717447405e-07, + "loss": 0.6797, + "step": 60355 + }, + { + "epoch": 1.55, + "learning_rate": 9.978970470538918e-07, + "loss": 0.6431, + "step": 60356 + }, + { + "epoch": 1.55, + "learning_rate": 9.978693766619892e-07, + "loss": 0.5562, + "step": 60357 + }, + { + "epoch": 1.55, + "learning_rate": 9.978417062717175e-07, + "loss": 0.7607, + "step": 60358 + }, + { + "epoch": 1.55, + "learning_rate": 9.978140358830987e-07, + "loss": 0.6108, + "step": 60359 + }, + { + "epoch": 1.55, + "learning_rate": 9.977863654961533e-07, + "loss": 0.6836, + "step": 60360 + }, + { + "epoch": 1.55, + "learning_rate": 9.97758695110903e-07, + "loss": 0.6821, + "step": 60361 + }, + { + "epoch": 1.55, + "learning_rate": 9.977310247273687e-07, + "loss": 0.6553, + "step": 60362 + }, + { + "epoch": 1.55, + "learning_rate": 9.977033543455715e-07, + "loss": 0.7334, + "step": 60363 + }, + { + "epoch": 1.55, + "learning_rate": 9.976756839655328e-07, + "loss": 0.5081, + "step": 60364 + }, + { + "epoch": 1.55, + "learning_rate": 9.976480135872742e-07, + "loss": 0.5137, + "step": 60365 + }, + { + "epoch": 1.55, + "learning_rate": 9.976203432108161e-07, + "loss": 0.707, + "step": 60366 + }, + { + "epoch": 1.55, + "learning_rate": 9.975926728361798e-07, + "loss": 0.7207, + "step": 60367 + }, + { + "epoch": 1.55, + "learning_rate": 9.975650024633868e-07, + "loss": 0.5654, + "step": 60368 + }, + { + "epoch": 1.55, + "learning_rate": 9.97537332092458e-07, + "loss": 0.6362, + "step": 60369 + }, + { + "epoch": 1.55, + "learning_rate": 9.97509661723415e-07, + "loss": 0.4802, + "step": 60370 + }, + { + "epoch": 1.55, + "learning_rate": 9.974819913562788e-07, + "loss": 0.583, + "step": 60371 + }, + { + "epoch": 1.55, + "learning_rate": 9.974543209910701e-07, + "loss": 0.6748, + "step": 60372 + }, + { + "epoch": 1.55, + "learning_rate": 9.97426650627811e-07, + "loss": 0.7305, + "step": 60373 + }, + { + "epoch": 1.55, + "learning_rate": 9.973989802665218e-07, + "loss": 0.6777, + "step": 60374 + }, + { + "epoch": 1.55, + "learning_rate": 9.973713099072246e-07, + "loss": 0.5249, + "step": 60375 + }, + { + "epoch": 1.55, + "learning_rate": 9.9734363954994e-07, + "loss": 0.5957, + "step": 60376 + }, + { + "epoch": 1.55, + "learning_rate": 9.973159691946886e-07, + "loss": 0.791, + "step": 60377 + }, + { + "epoch": 1.55, + "learning_rate": 9.972882988414928e-07, + "loss": 0.6313, + "step": 60378 + }, + { + "epoch": 1.55, + "learning_rate": 9.972606284903729e-07, + "loss": 0.7393, + "step": 60379 + }, + { + "epoch": 1.55, + "learning_rate": 9.972329581413506e-07, + "loss": 0.6211, + "step": 60380 + }, + { + "epoch": 1.55, + "learning_rate": 9.972052877944468e-07, + "loss": 0.708, + "step": 60381 + }, + { + "epoch": 1.55, + "learning_rate": 9.971776174496828e-07, + "loss": 0.7686, + "step": 60382 + }, + { + "epoch": 1.55, + "learning_rate": 9.971499471070798e-07, + "loss": 0.6772, + "step": 60383 + }, + { + "epoch": 1.55, + "learning_rate": 9.97122276766659e-07, + "loss": 0.5923, + "step": 60384 + }, + { + "epoch": 1.55, + "learning_rate": 9.970946064284416e-07, + "loss": 0.8496, + "step": 60385 + }, + { + "epoch": 1.55, + "learning_rate": 9.970669360924486e-07, + "loss": 0.5586, + "step": 60386 + }, + { + "epoch": 1.55, + "learning_rate": 9.970392657587014e-07, + "loss": 0.5947, + "step": 60387 + }, + { + "epoch": 1.55, + "learning_rate": 9.970115954272212e-07, + "loss": 0.6265, + "step": 60388 + }, + { + "epoch": 1.55, + "learning_rate": 9.969839250980288e-07, + "loss": 0.749, + "step": 60389 + }, + { + "epoch": 1.55, + "learning_rate": 9.969562547711459e-07, + "loss": 0.5977, + "step": 60390 + }, + { + "epoch": 1.55, + "learning_rate": 9.969285844465931e-07, + "loss": 0.7051, + "step": 60391 + }, + { + "epoch": 1.55, + "learning_rate": 9.969009141243922e-07, + "loss": 0.7051, + "step": 60392 + }, + { + "epoch": 1.55, + "learning_rate": 9.968732438045642e-07, + "loss": 0.6692, + "step": 60393 + }, + { + "epoch": 1.55, + "learning_rate": 9.9684557348713e-07, + "loss": 0.2661, + "step": 60394 + }, + { + "epoch": 1.55, + "learning_rate": 9.968179031721116e-07, + "loss": 0.6196, + "step": 60395 + }, + { + "epoch": 1.55, + "learning_rate": 9.967902328595289e-07, + "loss": 0.5874, + "step": 60396 + }, + { + "epoch": 1.55, + "learning_rate": 9.967625625494038e-07, + "loss": 0.6836, + "step": 60397 + }, + { + "epoch": 1.55, + "learning_rate": 9.967348922417577e-07, + "loss": 0.6621, + "step": 60398 + }, + { + "epoch": 1.55, + "learning_rate": 9.967072219366115e-07, + "loss": 0.5674, + "step": 60399 + }, + { + "epoch": 1.55, + "learning_rate": 9.966795516339863e-07, + "loss": 0.5516, + "step": 60400 + }, + { + "epoch": 1.55, + "learning_rate": 9.966518813339037e-07, + "loss": 0.6528, + "step": 60401 + }, + { + "epoch": 1.55, + "learning_rate": 9.966242110363843e-07, + "loss": 0.5772, + "step": 60402 + }, + { + "epoch": 1.55, + "learning_rate": 9.965965407414497e-07, + "loss": 0.6558, + "step": 60403 + }, + { + "epoch": 1.55, + "learning_rate": 9.965688704491209e-07, + "loss": 0.5571, + "step": 60404 + }, + { + "epoch": 1.55, + "learning_rate": 9.965412001594197e-07, + "loss": 0.6665, + "step": 60405 + }, + { + "epoch": 1.55, + "learning_rate": 9.965135298723662e-07, + "loss": 0.7598, + "step": 60406 + }, + { + "epoch": 1.55, + "learning_rate": 9.964858595879823e-07, + "loss": 0.6738, + "step": 60407 + }, + { + "epoch": 1.55, + "learning_rate": 9.964581893062888e-07, + "loss": 0.5864, + "step": 60408 + }, + { + "epoch": 1.55, + "learning_rate": 9.964305190273072e-07, + "loss": 0.613, + "step": 60409 + }, + { + "epoch": 1.55, + "learning_rate": 9.964028487510585e-07, + "loss": 0.6123, + "step": 60410 + }, + { + "epoch": 1.55, + "learning_rate": 9.963751784775642e-07, + "loss": 0.6865, + "step": 60411 + }, + { + "epoch": 1.55, + "learning_rate": 9.96347508206845e-07, + "loss": 0.5181, + "step": 60412 + }, + { + "epoch": 1.55, + "learning_rate": 9.963198379389226e-07, + "loss": 0.5457, + "step": 60413 + }, + { + "epoch": 1.55, + "learning_rate": 9.962921676738178e-07, + "loss": 0.5444, + "step": 60414 + }, + { + "epoch": 1.55, + "learning_rate": 9.96264497411552e-07, + "loss": 0.7949, + "step": 60415 + }, + { + "epoch": 1.55, + "learning_rate": 9.962368271521466e-07, + "loss": 0.7764, + "step": 60416 + }, + { + "epoch": 1.55, + "learning_rate": 9.96209156895622e-07, + "loss": 0.5508, + "step": 60417 + }, + { + "epoch": 1.55, + "learning_rate": 9.96181486642e-07, + "loss": 0.457, + "step": 60418 + }, + { + "epoch": 1.55, + "learning_rate": 9.961538163913015e-07, + "loss": 0.5962, + "step": 60419 + }, + { + "epoch": 1.55, + "learning_rate": 9.96126146143548e-07, + "loss": 0.8086, + "step": 60420 + }, + { + "epoch": 1.55, + "learning_rate": 9.960984758987606e-07, + "loss": 0.6675, + "step": 60421 + }, + { + "epoch": 1.55, + "learning_rate": 9.960708056569604e-07, + "loss": 0.7178, + "step": 60422 + }, + { + "epoch": 1.55, + "learning_rate": 9.960431354181685e-07, + "loss": 0.5913, + "step": 60423 + }, + { + "epoch": 1.55, + "learning_rate": 9.960154651824062e-07, + "loss": 0.6714, + "step": 60424 + }, + { + "epoch": 1.55, + "learning_rate": 9.95987794949695e-07, + "loss": 0.4756, + "step": 60425 + }, + { + "epoch": 1.55, + "learning_rate": 9.959601247200556e-07, + "loss": 0.6289, + "step": 60426 + }, + { + "epoch": 1.55, + "learning_rate": 9.959324544935092e-07, + "loss": 0.5896, + "step": 60427 + }, + { + "epoch": 1.55, + "learning_rate": 9.959047842700772e-07, + "loss": 0.5957, + "step": 60428 + }, + { + "epoch": 1.55, + "learning_rate": 9.958771140497806e-07, + "loss": 0.7588, + "step": 60429 + }, + { + "epoch": 1.55, + "learning_rate": 9.958494438326408e-07, + "loss": 0.542, + "step": 60430 + }, + { + "epoch": 1.55, + "learning_rate": 9.958217736186787e-07, + "loss": 0.7695, + "step": 60431 + }, + { + "epoch": 1.55, + "learning_rate": 9.95794103407916e-07, + "loss": 0.7061, + "step": 60432 + }, + { + "epoch": 1.55, + "learning_rate": 9.957664332003734e-07, + "loss": 0.6426, + "step": 60433 + }, + { + "epoch": 1.55, + "learning_rate": 9.957387629960723e-07, + "loss": 0.6865, + "step": 60434 + }, + { + "epoch": 1.55, + "learning_rate": 9.95711092795034e-07, + "loss": 0.6455, + "step": 60435 + }, + { + "epoch": 1.55, + "learning_rate": 9.956834225972792e-07, + "loss": 0.5928, + "step": 60436 + }, + { + "epoch": 1.55, + "learning_rate": 9.956557524028297e-07, + "loss": 0.4871, + "step": 60437 + }, + { + "epoch": 1.55, + "learning_rate": 9.95628082211706e-07, + "loss": 0.6592, + "step": 60438 + }, + { + "epoch": 1.55, + "learning_rate": 9.9560041202393e-07, + "loss": 0.6533, + "step": 60439 + }, + { + "epoch": 1.55, + "learning_rate": 9.955727418395223e-07, + "loss": 0.5703, + "step": 60440 + }, + { + "epoch": 1.55, + "learning_rate": 9.955450716585048e-07, + "loss": 0.6157, + "step": 60441 + }, + { + "epoch": 1.55, + "learning_rate": 9.955174014808976e-07, + "loss": 0.7144, + "step": 60442 + }, + { + "epoch": 1.55, + "learning_rate": 9.95489731306723e-07, + "loss": 0.5686, + "step": 60443 + }, + { + "epoch": 1.55, + "learning_rate": 9.954620611360017e-07, + "loss": 0.707, + "step": 60444 + }, + { + "epoch": 1.55, + "learning_rate": 9.95434390968755e-07, + "loss": 0.624, + "step": 60445 + }, + { + "epoch": 1.55, + "learning_rate": 9.954067208050034e-07, + "loss": 0.6235, + "step": 60446 + }, + { + "epoch": 1.55, + "learning_rate": 9.953790506447692e-07, + "loss": 0.7422, + "step": 60447 + }, + { + "epoch": 1.55, + "learning_rate": 9.953513804880727e-07, + "loss": 0.665, + "step": 60448 + }, + { + "epoch": 1.55, + "learning_rate": 9.953237103349357e-07, + "loss": 0.5537, + "step": 60449 + }, + { + "epoch": 1.55, + "learning_rate": 9.952960401853787e-07, + "loss": 0.7295, + "step": 60450 + }, + { + "epoch": 1.55, + "learning_rate": 9.95268370039424e-07, + "loss": 0.5166, + "step": 60451 + }, + { + "epoch": 1.55, + "learning_rate": 9.952406998970913e-07, + "loss": 0.6851, + "step": 60452 + }, + { + "epoch": 1.55, + "learning_rate": 9.952130297584032e-07, + "loss": 0.5947, + "step": 60453 + }, + { + "epoch": 1.55, + "learning_rate": 9.9518535962338e-07, + "loss": 0.564, + "step": 60454 + }, + { + "epoch": 1.55, + "learning_rate": 9.951576894920433e-07, + "loss": 0.7627, + "step": 60455 + }, + { + "epoch": 1.55, + "learning_rate": 9.95130019364414e-07, + "loss": 0.5652, + "step": 60456 + }, + { + "epoch": 1.55, + "learning_rate": 9.951023492405135e-07, + "loss": 0.625, + "step": 60457 + }, + { + "epoch": 1.55, + "learning_rate": 9.95074679120363e-07, + "loss": 0.7637, + "step": 60458 + }, + { + "epoch": 1.55, + "learning_rate": 9.950470090039831e-07, + "loss": 0.6499, + "step": 60459 + }, + { + "epoch": 1.55, + "learning_rate": 9.95019338891396e-07, + "loss": 0.6465, + "step": 60460 + }, + { + "epoch": 1.55, + "learning_rate": 9.949916687826223e-07, + "loss": 0.71, + "step": 60461 + }, + { + "epoch": 1.55, + "learning_rate": 9.94963998677683e-07, + "loss": 0.4968, + "step": 60462 + }, + { + "epoch": 1.55, + "learning_rate": 9.949363285765997e-07, + "loss": 0.4373, + "step": 60463 + }, + { + "epoch": 1.55, + "learning_rate": 9.949086584793932e-07, + "loss": 0.8281, + "step": 60464 + }, + { + "epoch": 1.55, + "learning_rate": 9.948809883860853e-07, + "loss": 0.7627, + "step": 60465 + }, + { + "epoch": 1.55, + "learning_rate": 9.948533182966966e-07, + "loss": 0.7373, + "step": 60466 + }, + { + "epoch": 1.55, + "learning_rate": 9.948256482112484e-07, + "loss": 0.6328, + "step": 60467 + }, + { + "epoch": 1.55, + "learning_rate": 9.947979781297621e-07, + "loss": 0.75, + "step": 60468 + }, + { + "epoch": 1.55, + "learning_rate": 9.947703080522586e-07, + "loss": 0.6865, + "step": 60469 + }, + { + "epoch": 1.55, + "learning_rate": 9.947426379787594e-07, + "loss": 0.8193, + "step": 60470 + }, + { + "epoch": 1.55, + "learning_rate": 9.947149679092852e-07, + "loss": 0.6113, + "step": 60471 + }, + { + "epoch": 1.55, + "learning_rate": 9.946872978438578e-07, + "loss": 0.7549, + "step": 60472 + }, + { + "epoch": 1.55, + "learning_rate": 9.94659627782498e-07, + "loss": 0.8779, + "step": 60473 + }, + { + "epoch": 1.55, + "learning_rate": 9.94631957725227e-07, + "loss": 0.7422, + "step": 60474 + }, + { + "epoch": 1.55, + "learning_rate": 9.946042876720666e-07, + "loss": 0.6152, + "step": 60475 + }, + { + "epoch": 1.55, + "learning_rate": 9.94576617623037e-07, + "loss": 0.7129, + "step": 60476 + }, + { + "epoch": 1.55, + "learning_rate": 9.945489475781599e-07, + "loss": 0.6533, + "step": 60477 + }, + { + "epoch": 1.55, + "learning_rate": 9.945212775374563e-07, + "loss": 0.6885, + "step": 60478 + }, + { + "epoch": 1.55, + "learning_rate": 9.944936075009475e-07, + "loss": 0.6963, + "step": 60479 + }, + { + "epoch": 1.55, + "learning_rate": 9.944659374686548e-07, + "loss": 0.7026, + "step": 60480 + }, + { + "epoch": 1.55, + "learning_rate": 9.944382674405992e-07, + "loss": 0.594, + "step": 60481 + }, + { + "epoch": 1.55, + "learning_rate": 9.94410597416802e-07, + "loss": 0.7402, + "step": 60482 + }, + { + "epoch": 1.55, + "learning_rate": 9.943829273972843e-07, + "loss": 0.6196, + "step": 60483 + }, + { + "epoch": 1.55, + "learning_rate": 9.943552573820673e-07, + "loss": 0.6318, + "step": 60484 + }, + { + "epoch": 1.55, + "learning_rate": 9.943275873711728e-07, + "loss": 0.7109, + "step": 60485 + }, + { + "epoch": 1.55, + "learning_rate": 9.942999173646208e-07, + "loss": 0.6011, + "step": 60486 + }, + { + "epoch": 1.55, + "learning_rate": 9.942722473624333e-07, + "loss": 0.8623, + "step": 60487 + }, + { + "epoch": 1.55, + "learning_rate": 9.94244577364631e-07, + "loss": 0.665, + "step": 60488 + }, + { + "epoch": 1.55, + "learning_rate": 9.942169073712355e-07, + "loss": 0.7461, + "step": 60489 + }, + { + "epoch": 1.55, + "learning_rate": 9.941892373822678e-07, + "loss": 0.6675, + "step": 60490 + }, + { + "epoch": 1.55, + "learning_rate": 9.941615673977493e-07, + "loss": 0.5985, + "step": 60491 + }, + { + "epoch": 1.55, + "learning_rate": 9.941338974177007e-07, + "loss": 0.6045, + "step": 60492 + }, + { + "epoch": 1.55, + "learning_rate": 9.94106227442144e-07, + "loss": 0.5308, + "step": 60493 + }, + { + "epoch": 1.55, + "learning_rate": 9.940785574710994e-07, + "loss": 0.8789, + "step": 60494 + }, + { + "epoch": 1.55, + "learning_rate": 9.940508875045891e-07, + "loss": 0.6953, + "step": 60495 + }, + { + "epoch": 1.55, + "learning_rate": 9.940232175426336e-07, + "loss": 0.6416, + "step": 60496 + }, + { + "epoch": 1.55, + "learning_rate": 9.939955475852542e-07, + "loss": 0.7256, + "step": 60497 + }, + { + "epoch": 1.55, + "learning_rate": 9.939678776324719e-07, + "loss": 0.6294, + "step": 60498 + }, + { + "epoch": 1.55, + "learning_rate": 9.939402076843084e-07, + "loss": 0.6426, + "step": 60499 + }, + { + "epoch": 1.55, + "learning_rate": 9.939125377407843e-07, + "loss": 0.6499, + "step": 60500 + }, + { + "epoch": 1.55, + "learning_rate": 9.938848678019214e-07, + "loss": 0.6782, + "step": 60501 + }, + { + "epoch": 1.55, + "learning_rate": 9.938571978677403e-07, + "loss": 0.7051, + "step": 60502 + }, + { + "epoch": 1.55, + "learning_rate": 9.938295279382626e-07, + "loss": 0.8506, + "step": 60503 + }, + { + "epoch": 1.55, + "learning_rate": 9.938018580135092e-07, + "loss": 0.7344, + "step": 60504 + }, + { + "epoch": 1.55, + "learning_rate": 9.93774188093502e-07, + "loss": 0.5771, + "step": 60505 + }, + { + "epoch": 1.55, + "learning_rate": 9.937465181782613e-07, + "loss": 0.5654, + "step": 60506 + }, + { + "epoch": 1.55, + "learning_rate": 9.937188482678082e-07, + "loss": 0.7588, + "step": 60507 + }, + { + "epoch": 1.55, + "learning_rate": 9.936911783621647e-07, + "loss": 0.6196, + "step": 60508 + }, + { + "epoch": 1.55, + "learning_rate": 9.936635084613514e-07, + "loss": 0.7002, + "step": 60509 + }, + { + "epoch": 1.55, + "learning_rate": 9.9363583856539e-07, + "loss": 0.5679, + "step": 60510 + }, + { + "epoch": 1.55, + "learning_rate": 9.936081686743008e-07, + "loss": 0.5186, + "step": 60511 + }, + { + "epoch": 1.55, + "learning_rate": 9.935804987881058e-07, + "loss": 0.7295, + "step": 60512 + }, + { + "epoch": 1.55, + "learning_rate": 9.93552828906826e-07, + "loss": 0.6396, + "step": 60513 + }, + { + "epoch": 1.55, + "learning_rate": 9.935251590304824e-07, + "loss": 0.6719, + "step": 60514 + }, + { + "epoch": 1.55, + "learning_rate": 9.934974891590965e-07, + "loss": 0.543, + "step": 60515 + }, + { + "epoch": 1.55, + "learning_rate": 9.934698192926893e-07, + "loss": 0.7559, + "step": 60516 + }, + { + "epoch": 1.55, + "learning_rate": 9.934421494312816e-07, + "loss": 0.707, + "step": 60517 + }, + { + "epoch": 1.55, + "learning_rate": 9.93414479574895e-07, + "loss": 0.5161, + "step": 60518 + }, + { + "epoch": 1.55, + "learning_rate": 9.933868097235508e-07, + "loss": 0.4829, + "step": 60519 + }, + { + "epoch": 1.55, + "learning_rate": 9.9335913987727e-07, + "loss": 0.4512, + "step": 60520 + }, + { + "epoch": 1.55, + "learning_rate": 9.933314700360735e-07, + "loss": 0.584, + "step": 60521 + }, + { + "epoch": 1.55, + "learning_rate": 9.93303800199983e-07, + "loss": 0.5981, + "step": 60522 + }, + { + "epoch": 1.55, + "learning_rate": 9.932761303690195e-07, + "loss": 0.7036, + "step": 60523 + }, + { + "epoch": 1.55, + "learning_rate": 9.932484605432042e-07, + "loss": 0.7188, + "step": 60524 + }, + { + "epoch": 1.55, + "learning_rate": 9.932207907225586e-07, + "loss": 0.5693, + "step": 60525 + }, + { + "epoch": 1.55, + "learning_rate": 9.93193120907103e-07, + "loss": 0.2461, + "step": 60526 + }, + { + "epoch": 1.55, + "learning_rate": 9.931654510968593e-07, + "loss": 0.7266, + "step": 60527 + }, + { + "epoch": 1.55, + "learning_rate": 9.931377812918484e-07, + "loss": 0.6611, + "step": 60528 + }, + { + "epoch": 1.55, + "learning_rate": 9.931101114920916e-07, + "loss": 0.6899, + "step": 60529 + }, + { + "epoch": 1.55, + "learning_rate": 9.9308244169761e-07, + "loss": 0.6895, + "step": 60530 + }, + { + "epoch": 1.55, + "learning_rate": 9.93054771908425e-07, + "loss": 0.7344, + "step": 60531 + }, + { + "epoch": 1.55, + "learning_rate": 9.930271021245574e-07, + "loss": 0.6841, + "step": 60532 + }, + { + "epoch": 1.55, + "learning_rate": 9.92999432346029e-07, + "loss": 0.752, + "step": 60533 + }, + { + "epoch": 1.55, + "learning_rate": 9.929717625728606e-07, + "loss": 0.6299, + "step": 60534 + }, + { + "epoch": 1.55, + "learning_rate": 9.929440928050734e-07, + "loss": 0.6357, + "step": 60535 + }, + { + "epoch": 1.55, + "learning_rate": 9.929164230426884e-07, + "loss": 0.6592, + "step": 60536 + }, + { + "epoch": 1.55, + "learning_rate": 9.928887532857269e-07, + "loss": 0.5347, + "step": 60537 + }, + { + "epoch": 1.55, + "learning_rate": 9.928610835342101e-07, + "loss": 0.7705, + "step": 60538 + }, + { + "epoch": 1.55, + "learning_rate": 9.928334137881595e-07, + "loss": 0.748, + "step": 60539 + }, + { + "epoch": 1.55, + "learning_rate": 9.92805744047596e-07, + "loss": 0.5693, + "step": 60540 + }, + { + "epoch": 1.55, + "learning_rate": 9.927780743125407e-07, + "loss": 0.4807, + "step": 60541 + }, + { + "epoch": 1.55, + "learning_rate": 9.927504045830148e-07, + "loss": 0.5027, + "step": 60542 + }, + { + "epoch": 1.55, + "learning_rate": 9.927227348590398e-07, + "loss": 0.6377, + "step": 60543 + }, + { + "epoch": 1.55, + "learning_rate": 9.926950651406363e-07, + "loss": 0.7129, + "step": 60544 + }, + { + "epoch": 1.55, + "learning_rate": 9.926673954278264e-07, + "loss": 0.7529, + "step": 60545 + }, + { + "epoch": 1.55, + "learning_rate": 9.926397257206307e-07, + "loss": 0.6045, + "step": 60546 + }, + { + "epoch": 1.55, + "learning_rate": 9.9261205601907e-07, + "loss": 0.6016, + "step": 60547 + }, + { + "epoch": 1.55, + "learning_rate": 9.92584386323166e-07, + "loss": 0.7617, + "step": 60548 + }, + { + "epoch": 1.55, + "learning_rate": 9.925567166329398e-07, + "loss": 0.6133, + "step": 60549 + }, + { + "epoch": 1.55, + "learning_rate": 9.925290469484128e-07, + "loss": 0.5754, + "step": 60550 + }, + { + "epoch": 1.55, + "learning_rate": 9.92501377269606e-07, + "loss": 0.6406, + "step": 60551 + }, + { + "epoch": 1.55, + "learning_rate": 9.924737075965402e-07, + "loss": 0.6665, + "step": 60552 + }, + { + "epoch": 1.55, + "learning_rate": 9.924460379292371e-07, + "loss": 0.7891, + "step": 60553 + }, + { + "epoch": 1.55, + "learning_rate": 9.924183682677176e-07, + "loss": 0.79, + "step": 60554 + }, + { + "epoch": 1.55, + "learning_rate": 9.923906986120035e-07, + "loss": 0.5815, + "step": 60555 + }, + { + "epoch": 1.55, + "learning_rate": 9.923630289621152e-07, + "loss": 0.6855, + "step": 60556 + }, + { + "epoch": 1.55, + "learning_rate": 9.92335359318074e-07, + "loss": 0.6416, + "step": 60557 + }, + { + "epoch": 1.55, + "learning_rate": 9.923076896799013e-07, + "loss": 0.8984, + "step": 60558 + }, + { + "epoch": 1.55, + "learning_rate": 9.922800200476185e-07, + "loss": 0.8232, + "step": 60559 + }, + { + "epoch": 1.55, + "learning_rate": 9.922523504212462e-07, + "loss": 0.7285, + "step": 60560 + }, + { + "epoch": 1.55, + "learning_rate": 9.92224680800806e-07, + "loss": 0.5928, + "step": 60561 + }, + { + "epoch": 1.55, + "learning_rate": 9.921970111863192e-07, + "loss": 0.5542, + "step": 60562 + }, + { + "epoch": 1.55, + "learning_rate": 9.921693415778066e-07, + "loss": 0.5701, + "step": 60563 + }, + { + "epoch": 1.55, + "learning_rate": 9.921416719752897e-07, + "loss": 0.6665, + "step": 60564 + }, + { + "epoch": 1.55, + "learning_rate": 9.921140023787897e-07, + "loss": 0.708, + "step": 60565 + }, + { + "epoch": 1.55, + "learning_rate": 9.920863327883274e-07, + "loss": 0.6016, + "step": 60566 + }, + { + "epoch": 1.55, + "learning_rate": 9.920586632039243e-07, + "loss": 0.7227, + "step": 60567 + }, + { + "epoch": 1.55, + "learning_rate": 9.920309936256017e-07, + "loss": 0.5791, + "step": 60568 + }, + { + "epoch": 1.55, + "learning_rate": 9.920033240533802e-07, + "loss": 0.5645, + "step": 60569 + }, + { + "epoch": 1.55, + "learning_rate": 9.919756544872815e-07, + "loss": 1.0068, + "step": 60570 + }, + { + "epoch": 1.55, + "learning_rate": 9.919479849273268e-07, + "loss": 0.4917, + "step": 60571 + }, + { + "epoch": 1.55, + "learning_rate": 9.919203153735372e-07, + "loss": 0.7275, + "step": 60572 + }, + { + "epoch": 1.55, + "learning_rate": 9.918926458259337e-07, + "loss": 0.7656, + "step": 60573 + }, + { + "epoch": 1.55, + "learning_rate": 9.918649762845376e-07, + "loss": 0.6328, + "step": 60574 + }, + { + "epoch": 1.55, + "learning_rate": 9.918373067493705e-07, + "loss": 0.6147, + "step": 60575 + }, + { + "epoch": 1.55, + "learning_rate": 9.91809637220453e-07, + "loss": 0.6895, + "step": 60576 + }, + { + "epoch": 1.55, + "learning_rate": 9.917819676978064e-07, + "loss": 0.709, + "step": 60577 + }, + { + "epoch": 1.55, + "learning_rate": 9.917542981814518e-07, + "loss": 0.5693, + "step": 60578 + }, + { + "epoch": 1.55, + "learning_rate": 9.917266286714106e-07, + "loss": 0.8076, + "step": 60579 + }, + { + "epoch": 1.55, + "learning_rate": 9.91698959167704e-07, + "loss": 0.6758, + "step": 60580 + }, + { + "epoch": 1.55, + "learning_rate": 9.916712896703532e-07, + "loss": 0.5542, + "step": 60581 + }, + { + "epoch": 1.55, + "learning_rate": 9.916436201793791e-07, + "loss": 0.6694, + "step": 60582 + }, + { + "epoch": 1.55, + "learning_rate": 9.916159506948033e-07, + "loss": 0.6465, + "step": 60583 + }, + { + "epoch": 1.55, + "learning_rate": 9.915882812166472e-07, + "loss": 0.8535, + "step": 60584 + }, + { + "epoch": 1.55, + "learning_rate": 9.91560611744931e-07, + "loss": 0.6675, + "step": 60585 + }, + { + "epoch": 1.55, + "learning_rate": 9.915329422796767e-07, + "loss": 0.6006, + "step": 60586 + }, + { + "epoch": 1.55, + "learning_rate": 9.915052728209052e-07, + "loss": 0.7812, + "step": 60587 + }, + { + "epoch": 1.55, + "learning_rate": 9.914776033686375e-07, + "loss": 0.73, + "step": 60588 + }, + { + "epoch": 1.55, + "learning_rate": 9.914499339228953e-07, + "loss": 0.5088, + "step": 60589 + }, + { + "epoch": 1.55, + "learning_rate": 9.914222644836992e-07, + "loss": 0.6931, + "step": 60590 + }, + { + "epoch": 1.55, + "learning_rate": 9.913945950510707e-07, + "loss": 0.6152, + "step": 60591 + }, + { + "epoch": 1.55, + "learning_rate": 9.91366925625031e-07, + "loss": 0.5117, + "step": 60592 + }, + { + "epoch": 1.55, + "learning_rate": 9.913392562056014e-07, + "loss": 0.5791, + "step": 60593 + }, + { + "epoch": 1.55, + "learning_rate": 9.913115867928032e-07, + "loss": 0.5659, + "step": 60594 + }, + { + "epoch": 1.55, + "learning_rate": 9.91283917386657e-07, + "loss": 0.5684, + "step": 60595 + }, + { + "epoch": 1.55, + "learning_rate": 9.912562479871842e-07, + "loss": 0.5933, + "step": 60596 + }, + { + "epoch": 1.55, + "learning_rate": 9.91228578594406e-07, + "loss": 0.7979, + "step": 60597 + }, + { + "epoch": 1.55, + "learning_rate": 9.91200909208344e-07, + "loss": 0.7637, + "step": 60598 + }, + { + "epoch": 1.55, + "learning_rate": 9.911732398290188e-07, + "loss": 0.7344, + "step": 60599 + }, + { + "epoch": 1.55, + "learning_rate": 9.91145570456452e-07, + "loss": 0.6338, + "step": 60600 + }, + { + "epoch": 1.55, + "learning_rate": 9.911179010906645e-07, + "loss": 0.637, + "step": 60601 + }, + { + "epoch": 1.55, + "learning_rate": 9.910902317316778e-07, + "loss": 0.582, + "step": 60602 + }, + { + "epoch": 1.55, + "learning_rate": 9.910625623795125e-07, + "loss": 0.6821, + "step": 60603 + }, + { + "epoch": 1.55, + "learning_rate": 9.91034893034191e-07, + "loss": 0.6802, + "step": 60604 + }, + { + "epoch": 1.55, + "learning_rate": 9.910072236957331e-07, + "loss": 0.4978, + "step": 60605 + }, + { + "epoch": 1.55, + "learning_rate": 9.909795543641607e-07, + "loss": 0.6211, + "step": 60606 + }, + { + "epoch": 1.55, + "learning_rate": 9.909518850394946e-07, + "loss": 0.5867, + "step": 60607 + }, + { + "epoch": 1.55, + "learning_rate": 9.909242157217565e-07, + "loss": 0.5938, + "step": 60608 + }, + { + "epoch": 1.55, + "learning_rate": 9.90896546410967e-07, + "loss": 0.5732, + "step": 60609 + }, + { + "epoch": 1.55, + "learning_rate": 9.908688771071477e-07, + "loss": 0.5112, + "step": 60610 + }, + { + "epoch": 1.55, + "learning_rate": 9.908412078103198e-07, + "loss": 0.6118, + "step": 60611 + }, + { + "epoch": 1.55, + "learning_rate": 9.908135385205044e-07, + "loss": 0.6572, + "step": 60612 + }, + { + "epoch": 1.55, + "learning_rate": 9.907858692377225e-07, + "loss": 0.5695, + "step": 60613 + }, + { + "epoch": 1.55, + "learning_rate": 9.907581999619956e-07, + "loss": 0.6655, + "step": 60614 + }, + { + "epoch": 1.55, + "learning_rate": 9.907305306933448e-07, + "loss": 0.7793, + "step": 60615 + }, + { + "epoch": 1.55, + "learning_rate": 9.90702861431791e-07, + "loss": 0.5444, + "step": 60616 + }, + { + "epoch": 1.55, + "learning_rate": 9.906751921773557e-07, + "loss": 0.6816, + "step": 60617 + }, + { + "epoch": 1.55, + "learning_rate": 9.906475229300597e-07, + "loss": 0.7031, + "step": 60618 + }, + { + "epoch": 1.55, + "learning_rate": 9.906198536899249e-07, + "loss": 0.6333, + "step": 60619 + }, + { + "epoch": 1.55, + "learning_rate": 9.905921844569716e-07, + "loss": 0.5903, + "step": 60620 + }, + { + "epoch": 1.55, + "learning_rate": 9.905645152312218e-07, + "loss": 0.6431, + "step": 60621 + }, + { + "epoch": 1.55, + "learning_rate": 9.905368460126959e-07, + "loss": 0.488, + "step": 60622 + }, + { + "epoch": 1.55, + "learning_rate": 9.90509176801416e-07, + "loss": 0.6406, + "step": 60623 + }, + { + "epoch": 1.55, + "learning_rate": 9.904815075974028e-07, + "loss": 0.7051, + "step": 60624 + }, + { + "epoch": 1.55, + "learning_rate": 9.904538384006772e-07, + "loss": 0.5442, + "step": 60625 + }, + { + "epoch": 1.55, + "learning_rate": 9.904261692112606e-07, + "loss": 0.6787, + "step": 60626 + }, + { + "epoch": 1.55, + "learning_rate": 9.903985000291743e-07, + "loss": 0.6787, + "step": 60627 + }, + { + "epoch": 1.55, + "learning_rate": 9.903708308544393e-07, + "loss": 0.8682, + "step": 60628 + }, + { + "epoch": 1.55, + "learning_rate": 9.903431616870772e-07, + "loss": 0.7822, + "step": 60629 + }, + { + "epoch": 1.55, + "learning_rate": 9.903154925271088e-07, + "loss": 0.71, + "step": 60630 + }, + { + "epoch": 1.55, + "learning_rate": 9.902878233745553e-07, + "loss": 0.4467, + "step": 60631 + }, + { + "epoch": 1.55, + "learning_rate": 9.902601542294379e-07, + "loss": 0.4531, + "step": 60632 + }, + { + "epoch": 1.55, + "learning_rate": 9.90232485091778e-07, + "loss": 0.7158, + "step": 60633 + }, + { + "epoch": 1.55, + "learning_rate": 9.90204815961597e-07, + "loss": 0.7373, + "step": 60634 + }, + { + "epoch": 1.55, + "learning_rate": 9.901771468389152e-07, + "loss": 0.605, + "step": 60635 + }, + { + "epoch": 1.55, + "learning_rate": 9.901494777237544e-07, + "loss": 0.6533, + "step": 60636 + }, + { + "epoch": 1.55, + "learning_rate": 9.901218086161355e-07, + "loss": 0.9014, + "step": 60637 + }, + { + "epoch": 1.55, + "learning_rate": 9.900941395160803e-07, + "loss": 0.7305, + "step": 60638 + }, + { + "epoch": 1.55, + "learning_rate": 9.900664704236092e-07, + "loss": 0.583, + "step": 60639 + }, + { + "epoch": 1.55, + "learning_rate": 9.90038801338744e-07, + "loss": 0.6069, + "step": 60640 + }, + { + "epoch": 1.55, + "learning_rate": 9.900111322615055e-07, + "loss": 0.5979, + "step": 60641 + }, + { + "epoch": 1.55, + "learning_rate": 9.89983463191915e-07, + "loss": 0.5586, + "step": 60642 + }, + { + "epoch": 1.55, + "learning_rate": 9.89955794129994e-07, + "loss": 0.6514, + "step": 60643 + }, + { + "epoch": 1.55, + "learning_rate": 9.899281250757634e-07, + "loss": 0.6704, + "step": 60644 + }, + { + "epoch": 1.55, + "learning_rate": 9.899004560292438e-07, + "loss": 0.7222, + "step": 60645 + }, + { + "epoch": 1.55, + "learning_rate": 9.898727869904574e-07, + "loss": 0.4342, + "step": 60646 + }, + { + "epoch": 1.55, + "learning_rate": 9.898451179594248e-07, + "loss": 0.5474, + "step": 60647 + }, + { + "epoch": 1.55, + "learning_rate": 9.898174489361673e-07, + "loss": 0.6172, + "step": 60648 + }, + { + "epoch": 1.55, + "learning_rate": 9.89789779920706e-07, + "loss": 0.5228, + "step": 60649 + }, + { + "epoch": 1.55, + "learning_rate": 9.897621109130626e-07, + "loss": 0.7666, + "step": 60650 + }, + { + "epoch": 1.55, + "learning_rate": 9.897344419132573e-07, + "loss": 0.4736, + "step": 60651 + }, + { + "epoch": 1.55, + "learning_rate": 9.897067729213123e-07, + "loss": 0.6953, + "step": 60652 + }, + { + "epoch": 1.55, + "learning_rate": 9.896791039372482e-07, + "loss": 0.6416, + "step": 60653 + }, + { + "epoch": 1.55, + "learning_rate": 9.896514349610866e-07, + "loss": 0.7266, + "step": 60654 + }, + { + "epoch": 1.55, + "learning_rate": 9.896237659928483e-07, + "loss": 0.6826, + "step": 60655 + }, + { + "epoch": 1.55, + "learning_rate": 9.895960970325544e-07, + "loss": 0.5879, + "step": 60656 + }, + { + "epoch": 1.55, + "learning_rate": 9.895684280802264e-07, + "loss": 0.5605, + "step": 60657 + }, + { + "epoch": 1.55, + "learning_rate": 9.895407591358852e-07, + "loss": 0.6375, + "step": 60658 + }, + { + "epoch": 1.55, + "learning_rate": 9.895130901995526e-07, + "loss": 0.6621, + "step": 60659 + }, + { + "epoch": 1.55, + "learning_rate": 9.89485421271249e-07, + "loss": 0.7173, + "step": 60660 + }, + { + "epoch": 1.55, + "learning_rate": 9.89457752350996e-07, + "loss": 0.665, + "step": 60661 + }, + { + "epoch": 1.55, + "learning_rate": 9.894300834388147e-07, + "loss": 0.5425, + "step": 60662 + }, + { + "epoch": 1.55, + "learning_rate": 9.894024145347263e-07, + "loss": 0.6475, + "step": 60663 + }, + { + "epoch": 1.55, + "learning_rate": 9.893747456387522e-07, + "loss": 0.5139, + "step": 60664 + }, + { + "epoch": 1.55, + "learning_rate": 9.893470767509132e-07, + "loss": 0.5759, + "step": 60665 + }, + { + "epoch": 1.55, + "learning_rate": 9.893194078712305e-07, + "loss": 0.5042, + "step": 60666 + }, + { + "epoch": 1.55, + "learning_rate": 9.892917389997256e-07, + "loss": 0.749, + "step": 60667 + }, + { + "epoch": 1.55, + "learning_rate": 9.892640701364194e-07, + "loss": 0.6646, + "step": 60668 + }, + { + "epoch": 1.55, + "learning_rate": 9.892364012813333e-07, + "loss": 0.7021, + "step": 60669 + }, + { + "epoch": 1.56, + "learning_rate": 9.892087324344884e-07, + "loss": 0.604, + "step": 60670 + }, + { + "epoch": 1.56, + "learning_rate": 9.89181063595906e-07, + "loss": 0.7666, + "step": 60671 + }, + { + "epoch": 1.56, + "learning_rate": 9.891533947656067e-07, + "loss": 0.6675, + "step": 60672 + }, + { + "epoch": 1.56, + "learning_rate": 9.891257259436127e-07, + "loss": 0.748, + "step": 60673 + }, + { + "epoch": 1.56, + "learning_rate": 9.890980571299446e-07, + "loss": 0.7588, + "step": 60674 + }, + { + "epoch": 1.56, + "learning_rate": 9.890703883246234e-07, + "loss": 0.7588, + "step": 60675 + }, + { + "epoch": 1.56, + "learning_rate": 9.890427195276704e-07, + "loss": 0.6797, + "step": 60676 + }, + { + "epoch": 1.56, + "learning_rate": 9.890150507391071e-07, + "loss": 0.7549, + "step": 60677 + }, + { + "epoch": 1.56, + "learning_rate": 9.889873819589544e-07, + "loss": 0.5635, + "step": 60678 + }, + { + "epoch": 1.56, + "learning_rate": 9.889597131872335e-07, + "loss": 0.5991, + "step": 60679 + }, + { + "epoch": 1.56, + "learning_rate": 9.889320444239656e-07, + "loss": 0.6689, + "step": 60680 + }, + { + "epoch": 1.56, + "learning_rate": 9.88904375669172e-07, + "loss": 0.6748, + "step": 60681 + }, + { + "epoch": 1.56, + "learning_rate": 9.888767069228737e-07, + "loss": 0.5649, + "step": 60682 + }, + { + "epoch": 1.56, + "learning_rate": 9.888490381850923e-07, + "loss": 0.748, + "step": 60683 + }, + { + "epoch": 1.56, + "learning_rate": 9.888213694558486e-07, + "loss": 0.5127, + "step": 60684 + }, + { + "epoch": 1.56, + "learning_rate": 9.887937007351636e-07, + "loss": 0.6675, + "step": 60685 + }, + { + "epoch": 1.56, + "learning_rate": 9.887660320230592e-07, + "loss": 0.5952, + "step": 60686 + }, + { + "epoch": 1.56, + "learning_rate": 9.887383633195556e-07, + "loss": 0.5259, + "step": 60687 + }, + { + "epoch": 1.56, + "learning_rate": 9.887106946246747e-07, + "loss": 0.6699, + "step": 60688 + }, + { + "epoch": 1.56, + "learning_rate": 9.886830259384374e-07, + "loss": 0.4629, + "step": 60689 + }, + { + "epoch": 1.56, + "learning_rate": 9.886553572608653e-07, + "loss": 0.6309, + "step": 60690 + }, + { + "epoch": 1.56, + "learning_rate": 9.88627688591979e-07, + "loss": 0.7676, + "step": 60691 + }, + { + "epoch": 1.56, + "learning_rate": 9.886000199318e-07, + "loss": 0.7646, + "step": 60692 + }, + { + "epoch": 1.56, + "learning_rate": 9.885723512803494e-07, + "loss": 0.7842, + "step": 60693 + }, + { + "epoch": 1.56, + "learning_rate": 9.885446826376492e-07, + "loss": 0.6826, + "step": 60694 + }, + { + "epoch": 1.56, + "learning_rate": 9.88517014003719e-07, + "loss": 0.5723, + "step": 60695 + }, + { + "epoch": 1.56, + "learning_rate": 9.884893453785809e-07, + "loss": 0.6177, + "step": 60696 + }, + { + "epoch": 1.56, + "learning_rate": 9.884616767622558e-07, + "loss": 0.563, + "step": 60697 + }, + { + "epoch": 1.56, + "learning_rate": 9.884340081547655e-07, + "loss": 0.6418, + "step": 60698 + }, + { + "epoch": 1.56, + "learning_rate": 9.884063395561302e-07, + "loss": 0.5928, + "step": 60699 + }, + { + "epoch": 1.56, + "learning_rate": 9.883786709663721e-07, + "loss": 0.6182, + "step": 60700 + }, + { + "epoch": 1.56, + "learning_rate": 9.883510023855117e-07, + "loss": 0.5571, + "step": 60701 + }, + { + "epoch": 1.56, + "learning_rate": 9.883233338135705e-07, + "loss": 0.5728, + "step": 60702 + }, + { + "epoch": 1.56, + "learning_rate": 9.882956652505695e-07, + "loss": 0.3381, + "step": 60703 + }, + { + "epoch": 1.56, + "learning_rate": 9.882679966965303e-07, + "loss": 0.6675, + "step": 60704 + }, + { + "epoch": 1.56, + "learning_rate": 9.882403281514735e-07, + "loss": 0.6191, + "step": 60705 + }, + { + "epoch": 1.56, + "learning_rate": 9.882126596154202e-07, + "loss": 0.7852, + "step": 60706 + }, + { + "epoch": 1.56, + "learning_rate": 9.881849910883925e-07, + "loss": 0.47, + "step": 60707 + }, + { + "epoch": 1.56, + "learning_rate": 9.881573225704105e-07, + "loss": 0.5353, + "step": 60708 + }, + { + "epoch": 1.56, + "learning_rate": 9.881296540614964e-07, + "loss": 0.5688, + "step": 60709 + }, + { + "epoch": 1.56, + "learning_rate": 9.881019855616705e-07, + "loss": 0.6406, + "step": 60710 + }, + { + "epoch": 1.56, + "learning_rate": 9.880743170709545e-07, + "loss": 0.6504, + "step": 60711 + }, + { + "epoch": 1.56, + "learning_rate": 9.880466485893693e-07, + "loss": 0.6973, + "step": 60712 + }, + { + "epoch": 1.56, + "learning_rate": 9.880189801169364e-07, + "loss": 0.6289, + "step": 60713 + }, + { + "epoch": 1.56, + "learning_rate": 9.879913116536772e-07, + "loss": 0.6094, + "step": 60714 + }, + { + "epoch": 1.56, + "learning_rate": 9.87963643199612e-07, + "loss": 0.8193, + "step": 60715 + }, + { + "epoch": 1.56, + "learning_rate": 9.879359747547626e-07, + "loss": 0.644, + "step": 60716 + }, + { + "epoch": 1.56, + "learning_rate": 9.879083063191501e-07, + "loss": 0.4155, + "step": 60717 + }, + { + "epoch": 1.56, + "learning_rate": 9.878806378927954e-07, + "loss": 0.5391, + "step": 60718 + }, + { + "epoch": 1.56, + "learning_rate": 9.878529694757202e-07, + "loss": 0.4857, + "step": 60719 + }, + { + "epoch": 1.56, + "learning_rate": 9.878253010679453e-07, + "loss": 0.7021, + "step": 60720 + }, + { + "epoch": 1.56, + "learning_rate": 9.87797632669492e-07, + "loss": 0.583, + "step": 60721 + }, + { + "epoch": 1.56, + "learning_rate": 9.877699642803814e-07, + "loss": 0.53, + "step": 60722 + }, + { + "epoch": 1.56, + "learning_rate": 9.87742295900635e-07, + "loss": 0.6841, + "step": 60723 + }, + { + "epoch": 1.56, + "learning_rate": 9.87714627530274e-07, + "loss": 0.6748, + "step": 60724 + }, + { + "epoch": 1.56, + "learning_rate": 9.87686959169319e-07, + "loss": 0.7324, + "step": 60725 + }, + { + "epoch": 1.56, + "learning_rate": 9.876592908177917e-07, + "loss": 0.6982, + "step": 60726 + }, + { + "epoch": 1.56, + "learning_rate": 9.876316224757128e-07, + "loss": 0.6797, + "step": 60727 + }, + { + "epoch": 1.56, + "learning_rate": 9.876039541431041e-07, + "loss": 0.6694, + "step": 60728 + }, + { + "epoch": 1.56, + "learning_rate": 9.875762858199863e-07, + "loss": 0.5552, + "step": 60729 + }, + { + "epoch": 1.56, + "learning_rate": 9.875486175063808e-07, + "loss": 0.6475, + "step": 60730 + }, + { + "epoch": 1.56, + "learning_rate": 9.875209492023087e-07, + "loss": 0.6997, + "step": 60731 + }, + { + "epoch": 1.56, + "learning_rate": 9.874932809077913e-07, + "loss": 0.458, + "step": 60732 + }, + { + "epoch": 1.56, + "learning_rate": 9.874656126228499e-07, + "loss": 0.6084, + "step": 60733 + }, + { + "epoch": 1.56, + "learning_rate": 9.874379443475055e-07, + "loss": 0.5913, + "step": 60734 + }, + { + "epoch": 1.56, + "learning_rate": 9.87410276081779e-07, + "loss": 0.6626, + "step": 60735 + }, + { + "epoch": 1.56, + "learning_rate": 9.873826078256921e-07, + "loss": 0.606, + "step": 60736 + }, + { + "epoch": 1.56, + "learning_rate": 9.873549395792655e-07, + "loss": 0.6388, + "step": 60737 + }, + { + "epoch": 1.56, + "learning_rate": 9.873272713425208e-07, + "loss": 0.6406, + "step": 60738 + }, + { + "epoch": 1.56, + "learning_rate": 9.87299603115479e-07, + "loss": 0.7197, + "step": 60739 + }, + { + "epoch": 1.56, + "learning_rate": 9.872719348981614e-07, + "loss": 0.5583, + "step": 60740 + }, + { + "epoch": 1.56, + "learning_rate": 9.872442666905888e-07, + "loss": 0.6348, + "step": 60741 + }, + { + "epoch": 1.56, + "learning_rate": 9.872165984927831e-07, + "loss": 0.6738, + "step": 60742 + }, + { + "epoch": 1.56, + "learning_rate": 9.871889303047647e-07, + "loss": 0.6094, + "step": 60743 + }, + { + "epoch": 1.56, + "learning_rate": 9.871612621265555e-07, + "loss": 0.7002, + "step": 60744 + }, + { + "epoch": 1.56, + "learning_rate": 9.871335939581762e-07, + "loss": 0.624, + "step": 60745 + }, + { + "epoch": 1.56, + "learning_rate": 9.87105925799648e-07, + "loss": 0.6882, + "step": 60746 + }, + { + "epoch": 1.56, + "learning_rate": 9.870782576509923e-07, + "loss": 0.5571, + "step": 60747 + }, + { + "epoch": 1.56, + "learning_rate": 9.8705058951223e-07, + "loss": 0.7202, + "step": 60748 + }, + { + "epoch": 1.56, + "learning_rate": 9.870229213833826e-07, + "loss": 0.7295, + "step": 60749 + }, + { + "epoch": 1.56, + "learning_rate": 9.869952532644715e-07, + "loss": 0.5601, + "step": 60750 + }, + { + "epoch": 1.56, + "learning_rate": 9.86967585155517e-07, + "loss": 0.5586, + "step": 60751 + }, + { + "epoch": 1.56, + "learning_rate": 9.86939917056541e-07, + "loss": 0.6172, + "step": 60752 + }, + { + "epoch": 1.56, + "learning_rate": 9.869122489675645e-07, + "loss": 0.5552, + "step": 60753 + }, + { + "epoch": 1.56, + "learning_rate": 9.86884580888609e-07, + "loss": 0.7637, + "step": 60754 + }, + { + "epoch": 1.56, + "learning_rate": 9.868569128196952e-07, + "loss": 0.6436, + "step": 60755 + }, + { + "epoch": 1.56, + "learning_rate": 9.868292447608442e-07, + "loss": 0.6025, + "step": 60756 + }, + { + "epoch": 1.56, + "learning_rate": 9.868015767120775e-07, + "loss": 0.5936, + "step": 60757 + }, + { + "epoch": 1.56, + "learning_rate": 9.867739086734162e-07, + "loss": 0.7051, + "step": 60758 + }, + { + "epoch": 1.56, + "learning_rate": 9.867462406448818e-07, + "loss": 0.561, + "step": 60759 + }, + { + "epoch": 1.56, + "learning_rate": 9.867185726264948e-07, + "loss": 0.6196, + "step": 60760 + }, + { + "epoch": 1.56, + "learning_rate": 9.866909046182771e-07, + "loss": 0.7471, + "step": 60761 + }, + { + "epoch": 1.56, + "learning_rate": 9.866632366202493e-07, + "loss": 0.7998, + "step": 60762 + }, + { + "epoch": 1.56, + "learning_rate": 9.866355686324332e-07, + "loss": 0.7339, + "step": 60763 + }, + { + "epoch": 1.56, + "learning_rate": 9.866079006548497e-07, + "loss": 0.7197, + "step": 60764 + }, + { + "epoch": 1.56, + "learning_rate": 9.865802326875194e-07, + "loss": 0.8125, + "step": 60765 + }, + { + "epoch": 1.56, + "learning_rate": 9.865525647304644e-07, + "loss": 0.709, + "step": 60766 + }, + { + "epoch": 1.56, + "learning_rate": 9.865248967837055e-07, + "loss": 0.5068, + "step": 60767 + }, + { + "epoch": 1.56, + "learning_rate": 9.864972288472634e-07, + "loss": 0.5835, + "step": 60768 + }, + { + "epoch": 1.56, + "learning_rate": 9.8646956092116e-07, + "loss": 0.3438, + "step": 60769 + }, + { + "epoch": 1.56, + "learning_rate": 9.864418930054164e-07, + "loss": 0.793, + "step": 60770 + }, + { + "epoch": 1.56, + "learning_rate": 9.864142251000535e-07, + "loss": 0.7266, + "step": 60771 + }, + { + "epoch": 1.56, + "learning_rate": 9.863865572050925e-07, + "loss": 0.7617, + "step": 60772 + }, + { + "epoch": 1.56, + "learning_rate": 9.863588893205548e-07, + "loss": 0.585, + "step": 60773 + }, + { + "epoch": 1.56, + "learning_rate": 9.863312214464618e-07, + "loss": 0.7959, + "step": 60774 + }, + { + "epoch": 1.56, + "learning_rate": 9.86303553582834e-07, + "loss": 0.665, + "step": 60775 + }, + { + "epoch": 1.56, + "learning_rate": 9.86275885729693e-07, + "loss": 0.7383, + "step": 60776 + }, + { + "epoch": 1.56, + "learning_rate": 9.862482178870598e-07, + "loss": 0.6436, + "step": 60777 + }, + { + "epoch": 1.56, + "learning_rate": 9.862205500549557e-07, + "loss": 0.6738, + "step": 60778 + }, + { + "epoch": 1.56, + "learning_rate": 9.861928822334018e-07, + "loss": 0.6846, + "step": 60779 + }, + { + "epoch": 1.56, + "learning_rate": 9.861652144224198e-07, + "loss": 0.4863, + "step": 60780 + }, + { + "epoch": 1.56, + "learning_rate": 9.861375466220299e-07, + "loss": 0.7559, + "step": 60781 + }, + { + "epoch": 1.56, + "learning_rate": 9.861098788322544e-07, + "loss": 0.6362, + "step": 60782 + }, + { + "epoch": 1.56, + "learning_rate": 9.860822110531135e-07, + "loss": 0.48, + "step": 60783 + }, + { + "epoch": 1.56, + "learning_rate": 9.860545432846295e-07, + "loss": 0.6499, + "step": 60784 + }, + { + "epoch": 1.56, + "learning_rate": 9.860268755268222e-07, + "loss": 0.5376, + "step": 60785 + }, + { + "epoch": 1.56, + "learning_rate": 9.859992077797139e-07, + "loss": 0.6455, + "step": 60786 + }, + { + "epoch": 1.56, + "learning_rate": 9.85971540043325e-07, + "loss": 0.6973, + "step": 60787 + }, + { + "epoch": 1.56, + "learning_rate": 9.859438723176772e-07, + "loss": 0.6606, + "step": 60788 + }, + { + "epoch": 1.56, + "learning_rate": 9.859162046027913e-07, + "loss": 0.6411, + "step": 60789 + }, + { + "epoch": 1.56, + "learning_rate": 9.85888536898689e-07, + "loss": 0.8457, + "step": 60790 + }, + { + "epoch": 1.56, + "learning_rate": 9.85860869205391e-07, + "loss": 0.7627, + "step": 60791 + }, + { + "epoch": 1.56, + "learning_rate": 9.85833201522919e-07, + "loss": 0.5786, + "step": 60792 + }, + { + "epoch": 1.56, + "learning_rate": 9.858055338512935e-07, + "loss": 0.6172, + "step": 60793 + }, + { + "epoch": 1.56, + "learning_rate": 9.857778661905366e-07, + "loss": 0.6255, + "step": 60794 + }, + { + "epoch": 1.56, + "learning_rate": 9.857501985406685e-07, + "loss": 0.6504, + "step": 60795 + }, + { + "epoch": 1.56, + "learning_rate": 9.857225309017108e-07, + "loss": 0.6826, + "step": 60796 + }, + { + "epoch": 1.56, + "learning_rate": 9.856948632736849e-07, + "loss": 0.6787, + "step": 60797 + }, + { + "epoch": 1.56, + "learning_rate": 9.856671956566113e-07, + "loss": 0.625, + "step": 60798 + }, + { + "epoch": 1.56, + "learning_rate": 9.856395280505121e-07, + "loss": 0.7061, + "step": 60799 + }, + { + "epoch": 1.56, + "learning_rate": 9.85611860455408e-07, + "loss": 0.7451, + "step": 60800 + }, + { + "epoch": 1.56, + "learning_rate": 9.855841928713203e-07, + "loss": 0.5212, + "step": 60801 + }, + { + "epoch": 1.56, + "learning_rate": 9.8555652529827e-07, + "loss": 0.6992, + "step": 60802 + }, + { + "epoch": 1.56, + "learning_rate": 9.855288577362784e-07, + "loss": 0.6685, + "step": 60803 + }, + { + "epoch": 1.56, + "learning_rate": 9.85501190185367e-07, + "loss": 0.708, + "step": 60804 + }, + { + "epoch": 1.56, + "learning_rate": 9.854735226455564e-07, + "loss": 0.6108, + "step": 60805 + }, + { + "epoch": 1.56, + "learning_rate": 9.85445855116868e-07, + "loss": 0.7012, + "step": 60806 + }, + { + "epoch": 1.56, + "learning_rate": 9.854181875993232e-07, + "loss": 0.6895, + "step": 60807 + }, + { + "epoch": 1.56, + "learning_rate": 9.853905200929429e-07, + "loss": 0.8359, + "step": 60808 + }, + { + "epoch": 1.56, + "learning_rate": 9.853628525977485e-07, + "loss": 0.5256, + "step": 60809 + }, + { + "epoch": 1.56, + "learning_rate": 9.853351851137607e-07, + "loss": 0.7397, + "step": 60810 + }, + { + "epoch": 1.56, + "learning_rate": 9.853075176410017e-07, + "loss": 0.7256, + "step": 60811 + }, + { + "epoch": 1.56, + "learning_rate": 9.852798501794917e-07, + "loss": 0.5217, + "step": 60812 + }, + { + "epoch": 1.56, + "learning_rate": 9.85252182729252e-07, + "loss": 0.6836, + "step": 60813 + }, + { + "epoch": 1.56, + "learning_rate": 9.852245152903049e-07, + "loss": 0.6479, + "step": 60814 + }, + { + "epoch": 1.56, + "learning_rate": 9.851968478626698e-07, + "loss": 0.6162, + "step": 60815 + }, + { + "epoch": 1.56, + "learning_rate": 9.851691804463693e-07, + "loss": 0.6235, + "step": 60816 + }, + { + "epoch": 1.56, + "learning_rate": 9.851415130414238e-07, + "loss": 0.8105, + "step": 60817 + }, + { + "epoch": 1.56, + "learning_rate": 9.851138456478549e-07, + "loss": 0.7793, + "step": 60818 + }, + { + "epoch": 1.56, + "learning_rate": 9.850861782656835e-07, + "loss": 0.8496, + "step": 60819 + }, + { + "epoch": 1.56, + "learning_rate": 9.850585108949311e-07, + "loss": 0.7529, + "step": 60820 + }, + { + "epoch": 1.56, + "learning_rate": 9.850308435356186e-07, + "loss": 0.6758, + "step": 60821 + }, + { + "epoch": 1.56, + "learning_rate": 9.850031761877673e-07, + "loss": 0.7451, + "step": 60822 + }, + { + "epoch": 1.56, + "learning_rate": 9.849755088513985e-07, + "loss": 0.5602, + "step": 60823 + }, + { + "epoch": 1.56, + "learning_rate": 9.849478415265334e-07, + "loss": 0.4722, + "step": 60824 + }, + { + "epoch": 1.56, + "learning_rate": 9.849201742131927e-07, + "loss": 0.7061, + "step": 60825 + }, + { + "epoch": 1.56, + "learning_rate": 9.848925069113981e-07, + "loss": 0.8359, + "step": 60826 + }, + { + "epoch": 1.56, + "learning_rate": 9.848648396211705e-07, + "loss": 0.5546, + "step": 60827 + }, + { + "epoch": 1.56, + "learning_rate": 9.848371723425315e-07, + "loss": 0.5664, + "step": 60828 + }, + { + "epoch": 1.56, + "learning_rate": 9.848095050755015e-07, + "loss": 0.6211, + "step": 60829 + }, + { + "epoch": 1.56, + "learning_rate": 9.847818378201025e-07, + "loss": 0.563, + "step": 60830 + }, + { + "epoch": 1.56, + "learning_rate": 9.847541705763552e-07, + "loss": 0.6475, + "step": 60831 + }, + { + "epoch": 1.56, + "learning_rate": 9.84726503344281e-07, + "loss": 0.7334, + "step": 60832 + }, + { + "epoch": 1.56, + "learning_rate": 9.846988361239009e-07, + "loss": 0.5088, + "step": 60833 + }, + { + "epoch": 1.56, + "learning_rate": 9.846711689152366e-07, + "loss": 0.6567, + "step": 60834 + }, + { + "epoch": 1.56, + "learning_rate": 9.846435017183085e-07, + "loss": 0.668, + "step": 60835 + }, + { + "epoch": 1.56, + "learning_rate": 9.846158345331381e-07, + "loss": 0.5813, + "step": 60836 + }, + { + "epoch": 1.56, + "learning_rate": 9.84588167359747e-07, + "loss": 0.7031, + "step": 60837 + }, + { + "epoch": 1.56, + "learning_rate": 9.845605001981557e-07, + "loss": 0.5449, + "step": 60838 + }, + { + "epoch": 1.56, + "learning_rate": 9.84532833048386e-07, + "loss": 0.6978, + "step": 60839 + }, + { + "epoch": 1.56, + "learning_rate": 9.845051659104584e-07, + "loss": 0.6602, + "step": 60840 + }, + { + "epoch": 1.56, + "learning_rate": 9.844774987843946e-07, + "loss": 0.6191, + "step": 60841 + }, + { + "epoch": 1.56, + "learning_rate": 9.84449831670216e-07, + "loss": 0.6973, + "step": 60842 + }, + { + "epoch": 1.56, + "learning_rate": 9.84422164567943e-07, + "loss": 0.4824, + "step": 60843 + }, + { + "epoch": 1.56, + "learning_rate": 9.84394497477598e-07, + "loss": 0.5425, + "step": 60844 + }, + { + "epoch": 1.56, + "learning_rate": 9.843668303992007e-07, + "loss": 0.7871, + "step": 60845 + }, + { + "epoch": 1.56, + "learning_rate": 9.843391633327731e-07, + "loss": 0.5996, + "step": 60846 + }, + { + "epoch": 1.56, + "learning_rate": 9.843114962783363e-07, + "loss": 0.7021, + "step": 60847 + }, + { + "epoch": 1.56, + "learning_rate": 9.842838292359115e-07, + "loss": 0.6104, + "step": 60848 + }, + { + "epoch": 1.56, + "learning_rate": 9.842561622055199e-07, + "loss": 0.6758, + "step": 60849 + }, + { + "epoch": 1.56, + "learning_rate": 9.842284951871826e-07, + "loss": 0.5513, + "step": 60850 + }, + { + "epoch": 1.56, + "learning_rate": 9.842008281809208e-07, + "loss": 0.5596, + "step": 60851 + }, + { + "epoch": 1.56, + "learning_rate": 9.841731611867557e-07, + "loss": 0.4653, + "step": 60852 + }, + { + "epoch": 1.56, + "learning_rate": 9.841454942047087e-07, + "loss": 0.6558, + "step": 60853 + }, + { + "epoch": 1.56, + "learning_rate": 9.841178272348007e-07, + "loss": 0.6738, + "step": 60854 + }, + { + "epoch": 1.56, + "learning_rate": 9.840901602770527e-07, + "loss": 0.6777, + "step": 60855 + }, + { + "epoch": 1.56, + "learning_rate": 9.840624933314864e-07, + "loss": 0.7256, + "step": 60856 + }, + { + "epoch": 1.56, + "learning_rate": 9.840348263981226e-07, + "loss": 0.6201, + "step": 60857 + }, + { + "epoch": 1.56, + "learning_rate": 9.840071594769825e-07, + "loss": 0.6753, + "step": 60858 + }, + { + "epoch": 1.56, + "learning_rate": 9.839794925680874e-07, + "loss": 0.7007, + "step": 60859 + }, + { + "epoch": 1.56, + "learning_rate": 9.839518256714583e-07, + "loss": 0.5044, + "step": 60860 + }, + { + "epoch": 1.56, + "learning_rate": 9.83924158787117e-07, + "loss": 0.8047, + "step": 60861 + }, + { + "epoch": 1.56, + "learning_rate": 9.838964919150839e-07, + "loss": 0.583, + "step": 60862 + }, + { + "epoch": 1.56, + "learning_rate": 9.838688250553806e-07, + "loss": 0.6885, + "step": 60863 + }, + { + "epoch": 1.56, + "learning_rate": 9.838411582080286e-07, + "loss": 0.6973, + "step": 60864 + }, + { + "epoch": 1.56, + "learning_rate": 9.83813491373048e-07, + "loss": 0.6914, + "step": 60865 + }, + { + "epoch": 1.56, + "learning_rate": 9.837858245504611e-07, + "loss": 0.6553, + "step": 60866 + }, + { + "epoch": 1.56, + "learning_rate": 9.837581577402885e-07, + "loss": 0.7246, + "step": 60867 + }, + { + "epoch": 1.56, + "learning_rate": 9.837304909425516e-07, + "loss": 0.6143, + "step": 60868 + }, + { + "epoch": 1.56, + "learning_rate": 9.837028241572712e-07, + "loss": 0.6182, + "step": 60869 + }, + { + "epoch": 1.56, + "learning_rate": 9.83675157384469e-07, + "loss": 0.5664, + "step": 60870 + }, + { + "epoch": 1.56, + "learning_rate": 9.83647490624166e-07, + "loss": 0.4873, + "step": 60871 + }, + { + "epoch": 1.56, + "learning_rate": 9.836198238763835e-07, + "loss": 0.5488, + "step": 60872 + }, + { + "epoch": 1.56, + "learning_rate": 9.835921571411428e-07, + "loss": 0.7588, + "step": 60873 + }, + { + "epoch": 1.56, + "learning_rate": 9.835644904184645e-07, + "loss": 0.7666, + "step": 60874 + }, + { + "epoch": 1.56, + "learning_rate": 9.8353682370837e-07, + "loss": 0.5935, + "step": 60875 + }, + { + "epoch": 1.56, + "learning_rate": 9.835091570108808e-07, + "loss": 0.6777, + "step": 60876 + }, + { + "epoch": 1.56, + "learning_rate": 9.834814903260177e-07, + "loss": 0.6758, + "step": 60877 + }, + { + "epoch": 1.56, + "learning_rate": 9.834538236538022e-07, + "loss": 0.6621, + "step": 60878 + }, + { + "epoch": 1.56, + "learning_rate": 9.83426156994255e-07, + "loss": 0.6001, + "step": 60879 + }, + { + "epoch": 1.56, + "learning_rate": 9.83398490347398e-07, + "loss": 0.7686, + "step": 60880 + }, + { + "epoch": 1.56, + "learning_rate": 9.833708237132518e-07, + "loss": 0.5254, + "step": 60881 + }, + { + "epoch": 1.56, + "learning_rate": 9.833431570918382e-07, + "loss": 0.6748, + "step": 60882 + }, + { + "epoch": 1.56, + "learning_rate": 9.83315490483178e-07, + "loss": 0.5039, + "step": 60883 + }, + { + "epoch": 1.56, + "learning_rate": 9.832878238872917e-07, + "loss": 0.5809, + "step": 60884 + }, + { + "epoch": 1.56, + "learning_rate": 9.832601573042017e-07, + "loss": 0.7783, + "step": 60885 + }, + { + "epoch": 1.56, + "learning_rate": 9.832324907339283e-07, + "loss": 0.4893, + "step": 60886 + }, + { + "epoch": 1.56, + "learning_rate": 9.832048241764932e-07, + "loss": 0.6372, + "step": 60887 + }, + { + "epoch": 1.56, + "learning_rate": 9.831771576319173e-07, + "loss": 0.665, + "step": 60888 + }, + { + "epoch": 1.56, + "learning_rate": 9.83149491100222e-07, + "loss": 0.6758, + "step": 60889 + }, + { + "epoch": 1.56, + "learning_rate": 9.83121824581428e-07, + "loss": 0.6777, + "step": 60890 + }, + { + "epoch": 1.56, + "learning_rate": 9.830941580755572e-07, + "loss": 0.7393, + "step": 60891 + }, + { + "epoch": 1.56, + "learning_rate": 9.830664915826302e-07, + "loss": 0.6082, + "step": 60892 + }, + { + "epoch": 1.56, + "learning_rate": 9.830388251026691e-07, + "loss": 0.6504, + "step": 60893 + }, + { + "epoch": 1.56, + "learning_rate": 9.830111586356938e-07, + "loss": 0.8008, + "step": 60894 + }, + { + "epoch": 1.56, + "learning_rate": 9.829834921817263e-07, + "loss": 0.6108, + "step": 60895 + }, + { + "epoch": 1.56, + "learning_rate": 9.82955825740787e-07, + "loss": 0.6143, + "step": 60896 + }, + { + "epoch": 1.56, + "learning_rate": 9.829281593128981e-07, + "loss": 0.6064, + "step": 60897 + }, + { + "epoch": 1.56, + "learning_rate": 9.829004928980803e-07, + "loss": 0.6073, + "step": 60898 + }, + { + "epoch": 1.56, + "learning_rate": 9.828728264963546e-07, + "loss": 0.6914, + "step": 60899 + }, + { + "epoch": 1.56, + "learning_rate": 9.828451601077424e-07, + "loss": 0.707, + "step": 60900 + }, + { + "epoch": 1.56, + "learning_rate": 9.828174937322652e-07, + "loss": 0.6021, + "step": 60901 + }, + { + "epoch": 1.56, + "learning_rate": 9.827898273699435e-07, + "loss": 0.6313, + "step": 60902 + }, + { + "epoch": 1.56, + "learning_rate": 9.827621610207993e-07, + "loss": 0.7539, + "step": 60903 + }, + { + "epoch": 1.56, + "learning_rate": 9.82734494684853e-07, + "loss": 0.6353, + "step": 60904 + }, + { + "epoch": 1.56, + "learning_rate": 9.82706828362126e-07, + "loss": 0.6714, + "step": 60905 + }, + { + "epoch": 1.56, + "learning_rate": 9.826791620526399e-07, + "loss": 0.6538, + "step": 60906 + }, + { + "epoch": 1.56, + "learning_rate": 9.82651495756415e-07, + "loss": 0.5698, + "step": 60907 + }, + { + "epoch": 1.56, + "learning_rate": 9.826238294734737e-07, + "loss": 0.5266, + "step": 60908 + }, + { + "epoch": 1.56, + "learning_rate": 9.82596163203836e-07, + "loss": 0.5205, + "step": 60909 + }, + { + "epoch": 1.56, + "learning_rate": 9.82568496947524e-07, + "loss": 0.6328, + "step": 60910 + }, + { + "epoch": 1.56, + "learning_rate": 9.825408307045582e-07, + "loss": 0.6758, + "step": 60911 + }, + { + "epoch": 1.56, + "learning_rate": 9.825131644749604e-07, + "loss": 0.7178, + "step": 60912 + }, + { + "epoch": 1.56, + "learning_rate": 9.824854982587517e-07, + "loss": 0.5781, + "step": 60913 + }, + { + "epoch": 1.56, + "learning_rate": 9.824578320559527e-07, + "loss": 0.751, + "step": 60914 + }, + { + "epoch": 1.56, + "learning_rate": 9.82430165866585e-07, + "loss": 0.646, + "step": 60915 + }, + { + "epoch": 1.56, + "learning_rate": 9.824024996906696e-07, + "loss": 0.7461, + "step": 60916 + }, + { + "epoch": 1.56, + "learning_rate": 9.823748335282275e-07, + "loss": 0.5369, + "step": 60917 + }, + { + "epoch": 1.56, + "learning_rate": 9.823471673792806e-07, + "loss": 0.5518, + "step": 60918 + }, + { + "epoch": 1.56, + "learning_rate": 9.823195012438496e-07, + "loss": 0.499, + "step": 60919 + }, + { + "epoch": 1.56, + "learning_rate": 9.822918351219558e-07, + "loss": 0.6523, + "step": 60920 + }, + { + "epoch": 1.56, + "learning_rate": 9.822641690136201e-07, + "loss": 0.5681, + "step": 60921 + }, + { + "epoch": 1.56, + "learning_rate": 9.82236502918864e-07, + "loss": 0.7588, + "step": 60922 + }, + { + "epoch": 1.56, + "learning_rate": 9.82208836837709e-07, + "loss": 0.6572, + "step": 60923 + }, + { + "epoch": 1.56, + "learning_rate": 9.821811707701753e-07, + "loss": 0.509, + "step": 60924 + }, + { + "epoch": 1.56, + "learning_rate": 9.82153504716285e-07, + "loss": 0.7373, + "step": 60925 + }, + { + "epoch": 1.56, + "learning_rate": 9.821258386760587e-07, + "loss": 0.5264, + "step": 60926 + }, + { + "epoch": 1.56, + "learning_rate": 9.82098172649518e-07, + "loss": 0.4202, + "step": 60927 + }, + { + "epoch": 1.56, + "learning_rate": 9.820705066366838e-07, + "loss": 0.5679, + "step": 60928 + }, + { + "epoch": 1.56, + "learning_rate": 9.820428406375774e-07, + "loss": 0.667, + "step": 60929 + }, + { + "epoch": 1.56, + "learning_rate": 9.8201517465222e-07, + "loss": 0.6709, + "step": 60930 + }, + { + "epoch": 1.56, + "learning_rate": 9.819875086806328e-07, + "loss": 0.562, + "step": 60931 + }, + { + "epoch": 1.56, + "learning_rate": 9.819598427228368e-07, + "loss": 0.6655, + "step": 60932 + }, + { + "epoch": 1.56, + "learning_rate": 9.81932176778854e-07, + "loss": 0.7803, + "step": 60933 + }, + { + "epoch": 1.56, + "learning_rate": 9.81904510848704e-07, + "loss": 0.668, + "step": 60934 + }, + { + "epoch": 1.56, + "learning_rate": 9.818768449324094e-07, + "loss": 0.5349, + "step": 60935 + }, + { + "epoch": 1.56, + "learning_rate": 9.818491790299905e-07, + "loss": 0.585, + "step": 60936 + }, + { + "epoch": 1.56, + "learning_rate": 9.81821513141469e-07, + "loss": 0.6289, + "step": 60937 + }, + { + "epoch": 1.56, + "learning_rate": 9.817938472668659e-07, + "loss": 0.4854, + "step": 60938 + }, + { + "epoch": 1.56, + "learning_rate": 9.817661814062026e-07, + "loss": 0.6514, + "step": 60939 + }, + { + "epoch": 1.56, + "learning_rate": 9.817385155594997e-07, + "loss": 0.5459, + "step": 60940 + }, + { + "epoch": 1.56, + "learning_rate": 9.817108497267792e-07, + "loss": 0.4534, + "step": 60941 + }, + { + "epoch": 1.56, + "learning_rate": 9.816831839080614e-07, + "loss": 0.5558, + "step": 60942 + }, + { + "epoch": 1.56, + "learning_rate": 9.816555181033686e-07, + "loss": 0.6206, + "step": 60943 + }, + { + "epoch": 1.56, + "learning_rate": 9.81627852312721e-07, + "loss": 0.5386, + "step": 60944 + }, + { + "epoch": 1.56, + "learning_rate": 9.8160018653614e-07, + "loss": 0.4768, + "step": 60945 + }, + { + "epoch": 1.56, + "learning_rate": 9.81572520773647e-07, + "loss": 0.6357, + "step": 60946 + }, + { + "epoch": 1.56, + "learning_rate": 9.815448550252632e-07, + "loss": 0.6245, + "step": 60947 + }, + { + "epoch": 1.56, + "learning_rate": 9.815171892910094e-07, + "loss": 0.6973, + "step": 60948 + }, + { + "epoch": 1.56, + "learning_rate": 9.814895235709072e-07, + "loss": 0.5933, + "step": 60949 + }, + { + "epoch": 1.56, + "learning_rate": 9.814618578649774e-07, + "loss": 0.6523, + "step": 60950 + }, + { + "epoch": 1.56, + "learning_rate": 9.814341921732417e-07, + "loss": 0.6982, + "step": 60951 + }, + { + "epoch": 1.56, + "learning_rate": 9.814065264957207e-07, + "loss": 0.6826, + "step": 60952 + }, + { + "epoch": 1.56, + "learning_rate": 9.813788608324363e-07, + "loss": 0.7104, + "step": 60953 + }, + { + "epoch": 1.56, + "learning_rate": 9.813511951834088e-07, + "loss": 0.5635, + "step": 60954 + }, + { + "epoch": 1.56, + "learning_rate": 9.8132352954866e-07, + "loss": 0.6567, + "step": 60955 + }, + { + "epoch": 1.56, + "learning_rate": 9.81295863928211e-07, + "loss": 0.6738, + "step": 60956 + }, + { + "epoch": 1.56, + "learning_rate": 9.812681983220827e-07, + "loss": 0.4839, + "step": 60957 + }, + { + "epoch": 1.56, + "learning_rate": 9.812405327302967e-07, + "loss": 0.709, + "step": 60958 + }, + { + "epoch": 1.56, + "learning_rate": 9.812128671528736e-07, + "loss": 0.7783, + "step": 60959 + }, + { + "epoch": 1.56, + "learning_rate": 9.811852015898352e-07, + "loss": 0.519, + "step": 60960 + }, + { + "epoch": 1.56, + "learning_rate": 9.811575360412024e-07, + "loss": 0.8018, + "step": 60961 + }, + { + "epoch": 1.56, + "learning_rate": 9.811298705069964e-07, + "loss": 0.7393, + "step": 60962 + }, + { + "epoch": 1.56, + "learning_rate": 9.811022049872389e-07, + "loss": 0.5239, + "step": 60963 + }, + { + "epoch": 1.56, + "learning_rate": 9.8107453948195e-07, + "loss": 0.7334, + "step": 60964 + }, + { + "epoch": 1.56, + "learning_rate": 9.810468739911515e-07, + "loss": 0.4501, + "step": 60965 + }, + { + "epoch": 1.56, + "learning_rate": 9.810192085148645e-07, + "loss": 0.6562, + "step": 60966 + }, + { + "epoch": 1.56, + "learning_rate": 9.809915430531102e-07, + "loss": 0.6348, + "step": 60967 + }, + { + "epoch": 1.56, + "learning_rate": 9.809638776059101e-07, + "loss": 0.6357, + "step": 60968 + }, + { + "epoch": 1.56, + "learning_rate": 9.809362121732848e-07, + "loss": 0.3662, + "step": 60969 + }, + { + "epoch": 1.56, + "learning_rate": 9.80908546755256e-07, + "loss": 0.6577, + "step": 60970 + }, + { + "epoch": 1.56, + "learning_rate": 9.808808813518441e-07, + "loss": 0.4836, + "step": 60971 + }, + { + "epoch": 1.56, + "learning_rate": 9.808532159630714e-07, + "loss": 0.5376, + "step": 60972 + }, + { + "epoch": 1.56, + "learning_rate": 9.808255505889587e-07, + "loss": 0.6257, + "step": 60973 + }, + { + "epoch": 1.56, + "learning_rate": 9.807978852295265e-07, + "loss": 0.6123, + "step": 60974 + }, + { + "epoch": 1.56, + "learning_rate": 9.807702198847967e-07, + "loss": 0.4752, + "step": 60975 + }, + { + "epoch": 1.56, + "learning_rate": 9.8074255455479e-07, + "loss": 0.5537, + "step": 60976 + }, + { + "epoch": 1.56, + "learning_rate": 9.80714889239528e-07, + "loss": 0.623, + "step": 60977 + }, + { + "epoch": 1.56, + "learning_rate": 9.806872239390316e-07, + "loss": 0.5981, + "step": 60978 + }, + { + "epoch": 1.56, + "learning_rate": 9.806595586533225e-07, + "loss": 0.572, + "step": 60979 + }, + { + "epoch": 1.56, + "learning_rate": 9.80631893382421e-07, + "loss": 0.6846, + "step": 60980 + }, + { + "epoch": 1.56, + "learning_rate": 9.80604228126349e-07, + "loss": 0.5056, + "step": 60981 + }, + { + "epoch": 1.56, + "learning_rate": 9.805765628851273e-07, + "loss": 0.6396, + "step": 60982 + }, + { + "epoch": 1.56, + "learning_rate": 9.80548897658778e-07, + "loss": 0.376, + "step": 60983 + }, + { + "epoch": 1.56, + "learning_rate": 9.805212324473208e-07, + "loss": 0.5879, + "step": 60984 + }, + { + "epoch": 1.56, + "learning_rate": 9.804935672507777e-07, + "loss": 0.5342, + "step": 60985 + }, + { + "epoch": 1.56, + "learning_rate": 9.804659020691695e-07, + "loss": 0.6406, + "step": 60986 + }, + { + "epoch": 1.56, + "learning_rate": 9.804382369025182e-07, + "loss": 0.6035, + "step": 60987 + }, + { + "epoch": 1.56, + "learning_rate": 9.80410571750844e-07, + "loss": 0.6343, + "step": 60988 + }, + { + "epoch": 1.56, + "learning_rate": 9.803829066141688e-07, + "loss": 0.5669, + "step": 60989 + }, + { + "epoch": 1.56, + "learning_rate": 9.803552414925132e-07, + "loss": 0.666, + "step": 60990 + }, + { + "epoch": 1.56, + "learning_rate": 9.80327576385899e-07, + "loss": 0.5042, + "step": 60991 + }, + { + "epoch": 1.56, + "learning_rate": 9.802999112943467e-07, + "loss": 0.624, + "step": 60992 + }, + { + "epoch": 1.56, + "learning_rate": 9.802722462178785e-07, + "loss": 0.6748, + "step": 60993 + }, + { + "epoch": 1.56, + "learning_rate": 9.802445811565147e-07, + "loss": 0.675, + "step": 60994 + }, + { + "epoch": 1.56, + "learning_rate": 9.802169161102764e-07, + "loss": 0.6743, + "step": 60995 + }, + { + "epoch": 1.56, + "learning_rate": 9.801892510791853e-07, + "loss": 0.7734, + "step": 60996 + }, + { + "epoch": 1.56, + "learning_rate": 9.80161586063262e-07, + "loss": 0.7871, + "step": 60997 + }, + { + "epoch": 1.56, + "learning_rate": 9.801339210625287e-07, + "loss": 0.7598, + "step": 60998 + }, + { + "epoch": 1.56, + "learning_rate": 9.801062560770054e-07, + "loss": 0.668, + "step": 60999 + }, + { + "epoch": 1.56, + "learning_rate": 9.800785911067142e-07, + "loss": 0.6389, + "step": 61000 + }, + { + "epoch": 1.56, + "learning_rate": 9.800509261516757e-07, + "loss": 0.7178, + "step": 61001 + }, + { + "epoch": 1.56, + "learning_rate": 9.800232612119113e-07, + "loss": 0.4868, + "step": 61002 + }, + { + "epoch": 1.56, + "learning_rate": 9.799955962874426e-07, + "loss": 0.5591, + "step": 61003 + }, + { + "epoch": 1.56, + "learning_rate": 9.7996793137829e-07, + "loss": 0.4751, + "step": 61004 + }, + { + "epoch": 1.56, + "learning_rate": 9.79940266484475e-07, + "loss": 0.4846, + "step": 61005 + }, + { + "epoch": 1.56, + "learning_rate": 9.799126016060188e-07, + "loss": 0.5884, + "step": 61006 + }, + { + "epoch": 1.56, + "learning_rate": 9.798849367429427e-07, + "loss": 0.6509, + "step": 61007 + }, + { + "epoch": 1.56, + "learning_rate": 9.798572718952677e-07, + "loss": 0.6855, + "step": 61008 + }, + { + "epoch": 1.56, + "learning_rate": 9.798296070630149e-07, + "loss": 0.7063, + "step": 61009 + }, + { + "epoch": 1.56, + "learning_rate": 9.798019422462058e-07, + "loss": 0.6851, + "step": 61010 + }, + { + "epoch": 1.56, + "learning_rate": 9.797742774448614e-07, + "loss": 0.7529, + "step": 61011 + }, + { + "epoch": 1.56, + "learning_rate": 9.797466126590029e-07, + "loss": 0.4448, + "step": 61012 + }, + { + "epoch": 1.56, + "learning_rate": 9.79718947888652e-07, + "loss": 0.5659, + "step": 61013 + }, + { + "epoch": 1.56, + "learning_rate": 9.796912831338286e-07, + "loss": 0.6465, + "step": 61014 + }, + { + "epoch": 1.56, + "learning_rate": 9.796636183945552e-07, + "loss": 0.5288, + "step": 61015 + }, + { + "epoch": 1.56, + "learning_rate": 9.79635953670852e-07, + "loss": 0.5364, + "step": 61016 + }, + { + "epoch": 1.56, + "learning_rate": 9.79608288962741e-07, + "loss": 0.7461, + "step": 61017 + }, + { + "epoch": 1.56, + "learning_rate": 9.795806242702424e-07, + "loss": 0.7017, + "step": 61018 + }, + { + "epoch": 1.56, + "learning_rate": 9.795529595933786e-07, + "loss": 0.5864, + "step": 61019 + }, + { + "epoch": 1.56, + "learning_rate": 9.795252949321699e-07, + "loss": 0.5273, + "step": 61020 + }, + { + "epoch": 1.56, + "learning_rate": 9.794976302866376e-07, + "loss": 0.625, + "step": 61021 + }, + { + "epoch": 1.56, + "learning_rate": 9.794699656568032e-07, + "loss": 0.7383, + "step": 61022 + }, + { + "epoch": 1.56, + "learning_rate": 9.79442301042688e-07, + "loss": 0.708, + "step": 61023 + }, + { + "epoch": 1.56, + "learning_rate": 9.794146364443124e-07, + "loss": 0.7085, + "step": 61024 + }, + { + "epoch": 1.56, + "learning_rate": 9.793869718616984e-07, + "loss": 0.7451, + "step": 61025 + }, + { + "epoch": 1.56, + "learning_rate": 9.793593072948665e-07, + "loss": 0.6572, + "step": 61026 + }, + { + "epoch": 1.56, + "learning_rate": 9.793316427438386e-07, + "loss": 0.6572, + "step": 61027 + }, + { + "epoch": 1.56, + "learning_rate": 9.793039782086351e-07, + "loss": 0.4731, + "step": 61028 + }, + { + "epoch": 1.56, + "learning_rate": 9.792763136892782e-07, + "loss": 0.5835, + "step": 61029 + }, + { + "epoch": 1.56, + "learning_rate": 9.792486491857878e-07, + "loss": 0.7178, + "step": 61030 + }, + { + "epoch": 1.56, + "learning_rate": 9.792209846981861e-07, + "loss": 0.6665, + "step": 61031 + }, + { + "epoch": 1.56, + "learning_rate": 9.791933202264939e-07, + "loss": 0.5322, + "step": 61032 + }, + { + "epoch": 1.56, + "learning_rate": 9.791656557707326e-07, + "loss": 0.7832, + "step": 61033 + }, + { + "epoch": 1.56, + "learning_rate": 9.791379913309232e-07, + "loss": 0.6182, + "step": 61034 + }, + { + "epoch": 1.56, + "learning_rate": 9.791103269070864e-07, + "loss": 0.7373, + "step": 61035 + }, + { + "epoch": 1.56, + "learning_rate": 9.790826624992443e-07, + "loss": 0.7178, + "step": 61036 + }, + { + "epoch": 1.56, + "learning_rate": 9.790549981074176e-07, + "loss": 0.7422, + "step": 61037 + }, + { + "epoch": 1.56, + "learning_rate": 9.790273337316273e-07, + "loss": 0.5347, + "step": 61038 + }, + { + "epoch": 1.56, + "learning_rate": 9.78999669371895e-07, + "loss": 0.9043, + "step": 61039 + }, + { + "epoch": 1.56, + "learning_rate": 9.789720050282414e-07, + "loss": 0.6631, + "step": 61040 + }, + { + "epoch": 1.56, + "learning_rate": 9.789443407006883e-07, + "loss": 0.7734, + "step": 61041 + }, + { + "epoch": 1.56, + "learning_rate": 9.789166763892563e-07, + "loss": 0.7373, + "step": 61042 + }, + { + "epoch": 1.56, + "learning_rate": 9.788890120939673e-07, + "loss": 0.5139, + "step": 61043 + }, + { + "epoch": 1.56, + "learning_rate": 9.788613478148416e-07, + "loss": 0.709, + "step": 61044 + }, + { + "epoch": 1.56, + "learning_rate": 9.788336835519008e-07, + "loss": 0.7236, + "step": 61045 + }, + { + "epoch": 1.56, + "learning_rate": 9.788060193051663e-07, + "loss": 0.4851, + "step": 61046 + }, + { + "epoch": 1.56, + "learning_rate": 9.787783550746587e-07, + "loss": 0.6436, + "step": 61047 + }, + { + "epoch": 1.56, + "learning_rate": 9.787506908603999e-07, + "loss": 0.5546, + "step": 61048 + }, + { + "epoch": 1.56, + "learning_rate": 9.787230266624104e-07, + "loss": 0.6592, + "step": 61049 + }, + { + "epoch": 1.56, + "learning_rate": 9.78695362480712e-07, + "loss": 0.5291, + "step": 61050 + }, + { + "epoch": 1.56, + "learning_rate": 9.786676983153251e-07, + "loss": 0.3342, + "step": 61051 + }, + { + "epoch": 1.56, + "learning_rate": 9.78640034166272e-07, + "loss": 0.6543, + "step": 61052 + }, + { + "epoch": 1.56, + "learning_rate": 9.78612370033573e-07, + "loss": 0.667, + "step": 61053 + }, + { + "epoch": 1.56, + "learning_rate": 9.785847059172496e-07, + "loss": 0.752, + "step": 61054 + }, + { + "epoch": 1.56, + "learning_rate": 9.785570418173226e-07, + "loss": 0.6006, + "step": 61055 + }, + { + "epoch": 1.56, + "learning_rate": 9.785293777338138e-07, + "loss": 0.6289, + "step": 61056 + }, + { + "epoch": 1.56, + "learning_rate": 9.785017136667439e-07, + "loss": 0.6416, + "step": 61057 + }, + { + "epoch": 1.56, + "learning_rate": 9.784740496161343e-07, + "loss": 0.6387, + "step": 61058 + }, + { + "epoch": 1.56, + "learning_rate": 9.78446385582006e-07, + "loss": 0.6836, + "step": 61059 + }, + { + "epoch": 1.56, + "learning_rate": 9.784187215643804e-07, + "loss": 0.6641, + "step": 61060 + }, + { + "epoch": 1.57, + "learning_rate": 9.783910575632785e-07, + "loss": 0.5264, + "step": 61061 + }, + { + "epoch": 1.57, + "learning_rate": 9.783633935787218e-07, + "loss": 0.5344, + "step": 61062 + }, + { + "epoch": 1.57, + "learning_rate": 9.783357296107314e-07, + "loss": 0.6777, + "step": 61063 + }, + { + "epoch": 1.57, + "learning_rate": 9.78308065659328e-07, + "loss": 0.8232, + "step": 61064 + }, + { + "epoch": 1.57, + "learning_rate": 9.782804017245333e-07, + "loss": 0.6436, + "step": 61065 + }, + { + "epoch": 1.57, + "learning_rate": 9.782527378063682e-07, + "loss": 0.6348, + "step": 61066 + }, + { + "epoch": 1.57, + "learning_rate": 9.78225073904854e-07, + "loss": 0.6187, + "step": 61067 + }, + { + "epoch": 1.57, + "learning_rate": 9.781974100200115e-07, + "loss": 0.6494, + "step": 61068 + }, + { + "epoch": 1.57, + "learning_rate": 9.781697461518628e-07, + "loss": 0.5181, + "step": 61069 + }, + { + "epoch": 1.57, + "learning_rate": 9.78142082300428e-07, + "loss": 0.6221, + "step": 61070 + }, + { + "epoch": 1.57, + "learning_rate": 9.781144184657292e-07, + "loss": 0.5933, + "step": 61071 + }, + { + "epoch": 1.57, + "learning_rate": 9.78086754647787e-07, + "loss": 0.8154, + "step": 61072 + }, + { + "epoch": 1.57, + "learning_rate": 9.780590908466235e-07, + "loss": 0.6748, + "step": 61073 + }, + { + "epoch": 1.57, + "learning_rate": 9.780314270622584e-07, + "loss": 0.7158, + "step": 61074 + }, + { + "epoch": 1.57, + "learning_rate": 9.780037632947137e-07, + "loss": 0.5032, + "step": 61075 + }, + { + "epoch": 1.57, + "learning_rate": 9.779760995440103e-07, + "loss": 0.7285, + "step": 61076 + }, + { + "epoch": 1.57, + "learning_rate": 9.7794843581017e-07, + "loss": 0.5964, + "step": 61077 + }, + { + "epoch": 1.57, + "learning_rate": 9.779207720932132e-07, + "loss": 0.5481, + "step": 61078 + }, + { + "epoch": 1.57, + "learning_rate": 9.778931083931615e-07, + "loss": 0.6431, + "step": 61079 + }, + { + "epoch": 1.57, + "learning_rate": 9.778654447100362e-07, + "loss": 0.5439, + "step": 61080 + }, + { + "epoch": 1.57, + "learning_rate": 9.778377810438582e-07, + "loss": 0.5151, + "step": 61081 + }, + { + "epoch": 1.57, + "learning_rate": 9.77810117394649e-07, + "loss": 0.5405, + "step": 61082 + }, + { + "epoch": 1.57, + "learning_rate": 9.777824537624296e-07, + "loss": 0.7686, + "step": 61083 + }, + { + "epoch": 1.57, + "learning_rate": 9.77754790147221e-07, + "loss": 0.6885, + "step": 61084 + }, + { + "epoch": 1.57, + "learning_rate": 9.777271265490443e-07, + "loss": 0.6611, + "step": 61085 + }, + { + "epoch": 1.57, + "learning_rate": 9.776994629679214e-07, + "loss": 0.498, + "step": 61086 + }, + { + "epoch": 1.57, + "learning_rate": 9.776717994038726e-07, + "loss": 0.4708, + "step": 61087 + }, + { + "epoch": 1.57, + "learning_rate": 9.776441358569196e-07, + "loss": 0.5017, + "step": 61088 + }, + { + "epoch": 1.57, + "learning_rate": 9.776164723270833e-07, + "loss": 0.582, + "step": 61089 + }, + { + "epoch": 1.57, + "learning_rate": 9.775888088143854e-07, + "loss": 0.5513, + "step": 61090 + }, + { + "epoch": 1.57, + "learning_rate": 9.775611453188464e-07, + "loss": 0.5508, + "step": 61091 + }, + { + "epoch": 1.57, + "learning_rate": 9.775334818404879e-07, + "loss": 0.7207, + "step": 61092 + }, + { + "epoch": 1.57, + "learning_rate": 9.775058183793313e-07, + "loss": 0.7578, + "step": 61093 + }, + { + "epoch": 1.57, + "learning_rate": 9.774781549353972e-07, + "loss": 0.6309, + "step": 61094 + }, + { + "epoch": 1.57, + "learning_rate": 9.774504915087069e-07, + "loss": 0.7803, + "step": 61095 + }, + { + "epoch": 1.57, + "learning_rate": 9.77422828099282e-07, + "loss": 0.5283, + "step": 61096 + }, + { + "epoch": 1.57, + "learning_rate": 9.77395164707143e-07, + "loss": 0.5811, + "step": 61097 + }, + { + "epoch": 1.57, + "learning_rate": 9.773675013323119e-07, + "loss": 0.8672, + "step": 61098 + }, + { + "epoch": 1.57, + "learning_rate": 9.77339837974809e-07, + "loss": 0.6992, + "step": 61099 + }, + { + "epoch": 1.57, + "learning_rate": 9.773121746346564e-07, + "loss": 0.7041, + "step": 61100 + }, + { + "epoch": 1.57, + "learning_rate": 9.772845113118745e-07, + "loss": 0.5869, + "step": 61101 + }, + { + "epoch": 1.57, + "learning_rate": 9.77256848006485e-07, + "loss": 0.7275, + "step": 61102 + }, + { + "epoch": 1.57, + "learning_rate": 9.772291847185092e-07, + "loss": 0.7285, + "step": 61103 + }, + { + "epoch": 1.57, + "learning_rate": 9.772015214479674e-07, + "loss": 0.6445, + "step": 61104 + }, + { + "epoch": 1.57, + "learning_rate": 9.771738581948817e-07, + "loss": 0.595, + "step": 61105 + }, + { + "epoch": 1.57, + "learning_rate": 9.771461949592726e-07, + "loss": 0.4692, + "step": 61106 + }, + { + "epoch": 1.57, + "learning_rate": 9.771185317411618e-07, + "loss": 0.7607, + "step": 61107 + }, + { + "epoch": 1.57, + "learning_rate": 9.770908685405701e-07, + "loss": 0.6152, + "step": 61108 + }, + { + "epoch": 1.57, + "learning_rate": 9.770632053575192e-07, + "loss": 0.543, + "step": 61109 + }, + { + "epoch": 1.57, + "learning_rate": 9.770355421920299e-07, + "loss": 0.4549, + "step": 61110 + }, + { + "epoch": 1.57, + "learning_rate": 9.770078790441232e-07, + "loss": 0.6572, + "step": 61111 + }, + { + "epoch": 1.57, + "learning_rate": 9.769802159138207e-07, + "loss": 0.6265, + "step": 61112 + }, + { + "epoch": 1.57, + "learning_rate": 9.769525528011436e-07, + "loss": 0.7202, + "step": 61113 + }, + { + "epoch": 1.57, + "learning_rate": 9.769248897061124e-07, + "loss": 0.687, + "step": 61114 + }, + { + "epoch": 1.57, + "learning_rate": 9.76897226628749e-07, + "loss": 0.7354, + "step": 61115 + }, + { + "epoch": 1.57, + "learning_rate": 9.768695635690742e-07, + "loss": 0.5244, + "step": 61116 + }, + { + "epoch": 1.57, + "learning_rate": 9.768419005271095e-07, + "loss": 0.6982, + "step": 61117 + }, + { + "epoch": 1.57, + "learning_rate": 9.768142375028756e-07, + "loss": 0.6953, + "step": 61118 + }, + { + "epoch": 1.57, + "learning_rate": 9.767865744963942e-07, + "loss": 0.6489, + "step": 61119 + }, + { + "epoch": 1.57, + "learning_rate": 9.767589115076862e-07, + "loss": 0.5972, + "step": 61120 + }, + { + "epoch": 1.57, + "learning_rate": 9.767312485367728e-07, + "loss": 0.5928, + "step": 61121 + }, + { + "epoch": 1.57, + "learning_rate": 9.767035855836752e-07, + "loss": 0.5491, + "step": 61122 + }, + { + "epoch": 1.57, + "learning_rate": 9.766759226484147e-07, + "loss": 0.729, + "step": 61123 + }, + { + "epoch": 1.57, + "learning_rate": 9.766482597310124e-07, + "loss": 0.4917, + "step": 61124 + }, + { + "epoch": 1.57, + "learning_rate": 9.766205968314893e-07, + "loss": 0.5488, + "step": 61125 + }, + { + "epoch": 1.57, + "learning_rate": 9.76592933949867e-07, + "loss": 0.6235, + "step": 61126 + }, + { + "epoch": 1.57, + "learning_rate": 9.765652710861663e-07, + "loss": 0.625, + "step": 61127 + }, + { + "epoch": 1.57, + "learning_rate": 9.765376082404082e-07, + "loss": 0.5513, + "step": 61128 + }, + { + "epoch": 1.57, + "learning_rate": 9.765099454126144e-07, + "loss": 0.5452, + "step": 61129 + }, + { + "epoch": 1.57, + "learning_rate": 9.764822826028058e-07, + "loss": 0.6479, + "step": 61130 + }, + { + "epoch": 1.57, + "learning_rate": 9.764546198110037e-07, + "loss": 0.5557, + "step": 61131 + }, + { + "epoch": 1.57, + "learning_rate": 9.764269570372292e-07, + "loss": 0.7354, + "step": 61132 + }, + { + "epoch": 1.57, + "learning_rate": 9.763992942815036e-07, + "loss": 0.5225, + "step": 61133 + }, + { + "epoch": 1.57, + "learning_rate": 9.76371631543848e-07, + "loss": 0.6885, + "step": 61134 + }, + { + "epoch": 1.57, + "learning_rate": 9.763439688242832e-07, + "loss": 0.5327, + "step": 61135 + }, + { + "epoch": 1.57, + "learning_rate": 9.763163061228311e-07, + "loss": 0.6816, + "step": 61136 + }, + { + "epoch": 1.57, + "learning_rate": 9.762886434395121e-07, + "loss": 0.5806, + "step": 61137 + }, + { + "epoch": 1.57, + "learning_rate": 9.762609807743482e-07, + "loss": 0.7373, + "step": 61138 + }, + { + "epoch": 1.57, + "learning_rate": 9.762333181273599e-07, + "loss": 0.6548, + "step": 61139 + }, + { + "epoch": 1.57, + "learning_rate": 9.762056554985688e-07, + "loss": 0.6309, + "step": 61140 + }, + { + "epoch": 1.57, + "learning_rate": 9.76177992887996e-07, + "loss": 0.563, + "step": 61141 + }, + { + "epoch": 1.57, + "learning_rate": 9.761503302956625e-07, + "loss": 0.5972, + "step": 61142 + }, + { + "epoch": 1.57, + "learning_rate": 9.7612266772159e-07, + "loss": 0.5762, + "step": 61143 + }, + { + "epoch": 1.57, + "learning_rate": 9.76095005165799e-07, + "loss": 0.6587, + "step": 61144 + }, + { + "epoch": 1.57, + "learning_rate": 9.760673426283108e-07, + "loss": 0.4727, + "step": 61145 + }, + { + "epoch": 1.57, + "learning_rate": 9.760396801091468e-07, + "loss": 0.8438, + "step": 61146 + }, + { + "epoch": 1.57, + "learning_rate": 9.76012017608328e-07, + "loss": 0.6328, + "step": 61147 + }, + { + "epoch": 1.57, + "learning_rate": 9.759843551258758e-07, + "loss": 0.478, + "step": 61148 + }, + { + "epoch": 1.57, + "learning_rate": 9.759566926618113e-07, + "loss": 0.624, + "step": 61149 + }, + { + "epoch": 1.57, + "learning_rate": 9.759290302161557e-07, + "loss": 0.6934, + "step": 61150 + }, + { + "epoch": 1.57, + "learning_rate": 9.7590136778893e-07, + "loss": 0.7373, + "step": 61151 + }, + { + "epoch": 1.57, + "learning_rate": 9.758737053801556e-07, + "loss": 0.5991, + "step": 61152 + }, + { + "epoch": 1.57, + "learning_rate": 9.75846042989854e-07, + "loss": 0.6699, + "step": 61153 + }, + { + "epoch": 1.57, + "learning_rate": 9.758183806180454e-07, + "loss": 0.6343, + "step": 61154 + }, + { + "epoch": 1.57, + "learning_rate": 9.757907182647516e-07, + "loss": 0.6455, + "step": 61155 + }, + { + "epoch": 1.57, + "learning_rate": 9.757630559299936e-07, + "loss": 0.7007, + "step": 61156 + }, + { + "epoch": 1.57, + "learning_rate": 9.75735393613793e-07, + "loss": 0.6865, + "step": 61157 + }, + { + "epoch": 1.57, + "learning_rate": 9.757077313161707e-07, + "loss": 0.6003, + "step": 61158 + }, + { + "epoch": 1.57, + "learning_rate": 9.75680069037148e-07, + "loss": 0.6299, + "step": 61159 + }, + { + "epoch": 1.57, + "learning_rate": 9.756524067767457e-07, + "loss": 0.6992, + "step": 61160 + }, + { + "epoch": 1.57, + "learning_rate": 9.756247445349854e-07, + "loss": 0.6143, + "step": 61161 + }, + { + "epoch": 1.57, + "learning_rate": 9.755970823118877e-07, + "loss": 0.6025, + "step": 61162 + }, + { + "epoch": 1.57, + "learning_rate": 9.755694201074752e-07, + "loss": 0.5796, + "step": 61163 + }, + { + "epoch": 1.57, + "learning_rate": 9.755417579217673e-07, + "loss": 0.6943, + "step": 61164 + }, + { + "epoch": 1.57, + "learning_rate": 9.75514095754786e-07, + "loss": 0.8027, + "step": 61165 + }, + { + "epoch": 1.57, + "learning_rate": 9.754864336065523e-07, + "loss": 0.707, + "step": 61166 + }, + { + "epoch": 1.57, + "learning_rate": 9.754587714770878e-07, + "loss": 0.5803, + "step": 61167 + }, + { + "epoch": 1.57, + "learning_rate": 9.754311093664132e-07, + "loss": 0.5264, + "step": 61168 + }, + { + "epoch": 1.57, + "learning_rate": 9.7540344727455e-07, + "loss": 0.6128, + "step": 61169 + }, + { + "epoch": 1.57, + "learning_rate": 9.75375785201519e-07, + "loss": 0.4795, + "step": 61170 + }, + { + "epoch": 1.57, + "learning_rate": 9.75348123147342e-07, + "loss": 0.6289, + "step": 61171 + }, + { + "epoch": 1.57, + "learning_rate": 9.7532046111204e-07, + "loss": 0.7197, + "step": 61172 + }, + { + "epoch": 1.57, + "learning_rate": 9.752927990956332e-07, + "loss": 0.6367, + "step": 61173 + }, + { + "epoch": 1.57, + "learning_rate": 9.75265137098144e-07, + "loss": 0.6484, + "step": 61174 + }, + { + "epoch": 1.57, + "learning_rate": 9.75237475119593e-07, + "loss": 0.481, + "step": 61175 + }, + { + "epoch": 1.57, + "learning_rate": 9.75209813160002e-07, + "loss": 0.9219, + "step": 61176 + }, + { + "epoch": 1.57, + "learning_rate": 9.751821512193912e-07, + "loss": 0.6172, + "step": 61177 + }, + { + "epoch": 1.57, + "learning_rate": 9.751544892977825e-07, + "loss": 0.7021, + "step": 61178 + }, + { + "epoch": 1.57, + "learning_rate": 9.751268273951968e-07, + "loss": 0.499, + "step": 61179 + }, + { + "epoch": 1.57, + "learning_rate": 9.750991655116554e-07, + "loss": 0.6621, + "step": 61180 + }, + { + "epoch": 1.57, + "learning_rate": 9.750715036471792e-07, + "loss": 0.7007, + "step": 61181 + }, + { + "epoch": 1.57, + "learning_rate": 9.750438418017903e-07, + "loss": 0.7246, + "step": 61182 + }, + { + "epoch": 1.57, + "learning_rate": 9.750161799755085e-07, + "loss": 0.3639, + "step": 61183 + }, + { + "epoch": 1.57, + "learning_rate": 9.749885181683559e-07, + "loss": 0.6255, + "step": 61184 + }, + { + "epoch": 1.57, + "learning_rate": 9.749608563803532e-07, + "loss": 0.6025, + "step": 61185 + }, + { + "epoch": 1.57, + "learning_rate": 9.749331946115221e-07, + "loss": 0.8447, + "step": 61186 + }, + { + "epoch": 1.57, + "learning_rate": 9.749055328618835e-07, + "loss": 0.6929, + "step": 61187 + }, + { + "epoch": 1.57, + "learning_rate": 9.748778711314583e-07, + "loss": 0.4937, + "step": 61188 + }, + { + "epoch": 1.57, + "learning_rate": 9.74850209420268e-07, + "loss": 0.6328, + "step": 61189 + }, + { + "epoch": 1.57, + "learning_rate": 9.748225477283341e-07, + "loss": 0.5112, + "step": 61190 + }, + { + "epoch": 1.57, + "learning_rate": 9.74794886055677e-07, + "loss": 0.5508, + "step": 61191 + }, + { + "epoch": 1.57, + "learning_rate": 9.747672244023187e-07, + "loss": 0.6028, + "step": 61192 + }, + { + "epoch": 1.57, + "learning_rate": 9.7473956276828e-07, + "loss": 0.7549, + "step": 61193 + }, + { + "epoch": 1.57, + "learning_rate": 9.747119011535815e-07, + "loss": 0.7725, + "step": 61194 + }, + { + "epoch": 1.57, + "learning_rate": 9.746842395582454e-07, + "loss": 0.7485, + "step": 61195 + }, + { + "epoch": 1.57, + "learning_rate": 9.746565779822921e-07, + "loss": 0.5923, + "step": 61196 + }, + { + "epoch": 1.57, + "learning_rate": 9.746289164257433e-07, + "loss": 0.5752, + "step": 61197 + }, + { + "epoch": 1.57, + "learning_rate": 9.746012548886198e-07, + "loss": 0.8032, + "step": 61198 + }, + { + "epoch": 1.57, + "learning_rate": 9.745735933709432e-07, + "loss": 0.7559, + "step": 61199 + }, + { + "epoch": 1.57, + "learning_rate": 9.745459318727345e-07, + "loss": 0.6602, + "step": 61200 + }, + { + "epoch": 1.57, + "learning_rate": 9.745182703940145e-07, + "loss": 0.6562, + "step": 61201 + }, + { + "epoch": 1.57, + "learning_rate": 9.74490608934805e-07, + "loss": 0.7461, + "step": 61202 + }, + { + "epoch": 1.57, + "learning_rate": 9.744629474951269e-07, + "loss": 0.6406, + "step": 61203 + }, + { + "epoch": 1.57, + "learning_rate": 9.74435286075001e-07, + "loss": 0.7373, + "step": 61204 + }, + { + "epoch": 1.57, + "learning_rate": 9.74407624674449e-07, + "loss": 0.6152, + "step": 61205 + }, + { + "epoch": 1.57, + "learning_rate": 9.743799632934916e-07, + "loss": 0.6846, + "step": 61206 + }, + { + "epoch": 1.57, + "learning_rate": 9.743523019321507e-07, + "loss": 0.5527, + "step": 61207 + }, + { + "epoch": 1.57, + "learning_rate": 9.743246405904467e-07, + "loss": 0.531, + "step": 61208 + }, + { + "epoch": 1.57, + "learning_rate": 9.742969792684015e-07, + "loss": 0.6958, + "step": 61209 + }, + { + "epoch": 1.57, + "learning_rate": 9.742693179660357e-07, + "loss": 0.6729, + "step": 61210 + }, + { + "epoch": 1.57, + "learning_rate": 9.742416566833708e-07, + "loss": 0.5466, + "step": 61211 + }, + { + "epoch": 1.57, + "learning_rate": 9.742139954204282e-07, + "loss": 0.4937, + "step": 61212 + }, + { + "epoch": 1.57, + "learning_rate": 9.741863341772282e-07, + "loss": 0.7285, + "step": 61213 + }, + { + "epoch": 1.57, + "learning_rate": 9.74158672953793e-07, + "loss": 0.7842, + "step": 61214 + }, + { + "epoch": 1.57, + "learning_rate": 9.741310117501428e-07, + "loss": 0.7002, + "step": 61215 + }, + { + "epoch": 1.57, + "learning_rate": 9.741033505662995e-07, + "loss": 0.8623, + "step": 61216 + }, + { + "epoch": 1.57, + "learning_rate": 9.740756894022842e-07, + "loss": 0.7393, + "step": 61217 + }, + { + "epoch": 1.57, + "learning_rate": 9.74048028258118e-07, + "loss": 0.748, + "step": 61218 + }, + { + "epoch": 1.57, + "learning_rate": 9.740203671338219e-07, + "loss": 0.5308, + "step": 61219 + }, + { + "epoch": 1.57, + "learning_rate": 9.73992706029417e-07, + "loss": 0.751, + "step": 61220 + }, + { + "epoch": 1.57, + "learning_rate": 9.739650449449251e-07, + "loss": 0.7197, + "step": 61221 + }, + { + "epoch": 1.57, + "learning_rate": 9.73937383880367e-07, + "loss": 0.6367, + "step": 61222 + }, + { + "epoch": 1.57, + "learning_rate": 9.739097228357634e-07, + "loss": 0.7871, + "step": 61223 + }, + { + "epoch": 1.57, + "learning_rate": 9.738820618111363e-07, + "loss": 0.5142, + "step": 61224 + }, + { + "epoch": 1.57, + "learning_rate": 9.73854400806506e-07, + "loss": 0.4839, + "step": 61225 + }, + { + "epoch": 1.57, + "learning_rate": 9.738267398218947e-07, + "loss": 0.7192, + "step": 61226 + }, + { + "epoch": 1.57, + "learning_rate": 9.737990788573229e-07, + "loss": 0.7119, + "step": 61227 + }, + { + "epoch": 1.57, + "learning_rate": 9.737714179128121e-07, + "loss": 0.6826, + "step": 61228 + }, + { + "epoch": 1.57, + "learning_rate": 9.73743756988383e-07, + "loss": 0.6504, + "step": 61229 + }, + { + "epoch": 1.57, + "learning_rate": 9.737160960840573e-07, + "loss": 0.6621, + "step": 61230 + }, + { + "epoch": 1.57, + "learning_rate": 9.736884351998557e-07, + "loss": 0.4495, + "step": 61231 + }, + { + "epoch": 1.57, + "learning_rate": 9.736607743358004e-07, + "loss": 0.6963, + "step": 61232 + }, + { + "epoch": 1.57, + "learning_rate": 9.736331134919112e-07, + "loss": 0.6284, + "step": 61233 + }, + { + "epoch": 1.57, + "learning_rate": 9.7360545266821e-07, + "loss": 0.8301, + "step": 61234 + }, + { + "epoch": 1.57, + "learning_rate": 9.73577791864718e-07, + "loss": 0.6338, + "step": 61235 + }, + { + "epoch": 1.57, + "learning_rate": 9.735501310814563e-07, + "loss": 0.5437, + "step": 61236 + }, + { + "epoch": 1.57, + "learning_rate": 9.73522470318446e-07, + "loss": 0.7275, + "step": 61237 + }, + { + "epoch": 1.57, + "learning_rate": 9.734948095757082e-07, + "loss": 0.6233, + "step": 61238 + }, + { + "epoch": 1.57, + "learning_rate": 9.73467148853264e-07, + "loss": 0.5801, + "step": 61239 + }, + { + "epoch": 1.57, + "learning_rate": 9.734394881511352e-07, + "loss": 0.7861, + "step": 61240 + }, + { + "epoch": 1.57, + "learning_rate": 9.734118274693423e-07, + "loss": 0.5747, + "step": 61241 + }, + { + "epoch": 1.57, + "learning_rate": 9.73384166807907e-07, + "loss": 0.835, + "step": 61242 + }, + { + "epoch": 1.57, + "learning_rate": 9.733565061668503e-07, + "loss": 0.7695, + "step": 61243 + }, + { + "epoch": 1.57, + "learning_rate": 9.73328845546193e-07, + "loss": 0.5195, + "step": 61244 + }, + { + "epoch": 1.57, + "learning_rate": 9.733011849459568e-07, + "loss": 0.667, + "step": 61245 + }, + { + "epoch": 1.57, + "learning_rate": 9.732735243661623e-07, + "loss": 0.5278, + "step": 61246 + }, + { + "epoch": 1.57, + "learning_rate": 9.732458638068314e-07, + "loss": 0.7461, + "step": 61247 + }, + { + "epoch": 1.57, + "learning_rate": 9.732182032679846e-07, + "loss": 0.5159, + "step": 61248 + }, + { + "epoch": 1.57, + "learning_rate": 9.731905427496437e-07, + "loss": 0.5, + "step": 61249 + }, + { + "epoch": 1.57, + "learning_rate": 9.731628822518291e-07, + "loss": 0.6387, + "step": 61250 + }, + { + "epoch": 1.57, + "learning_rate": 9.73135221774563e-07, + "loss": 0.7695, + "step": 61251 + }, + { + "epoch": 1.57, + "learning_rate": 9.73107561317866e-07, + "loss": 0.6426, + "step": 61252 + }, + { + "epoch": 1.57, + "learning_rate": 9.730799008817592e-07, + "loss": 0.3396, + "step": 61253 + }, + { + "epoch": 1.57, + "learning_rate": 9.730522404662637e-07, + "loss": 0.6338, + "step": 61254 + }, + { + "epoch": 1.57, + "learning_rate": 9.73024580071401e-07, + "loss": 0.6045, + "step": 61255 + }, + { + "epoch": 1.57, + "learning_rate": 9.72996919697192e-07, + "loss": 0.7871, + "step": 61256 + }, + { + "epoch": 1.57, + "learning_rate": 9.72969259343658e-07, + "loss": 0.4629, + "step": 61257 + }, + { + "epoch": 1.57, + "learning_rate": 9.729415990108203e-07, + "loss": 0.6562, + "step": 61258 + }, + { + "epoch": 1.57, + "learning_rate": 9.729139386986999e-07, + "loss": 0.5967, + "step": 61259 + }, + { + "epoch": 1.57, + "learning_rate": 9.72886278407318e-07, + "loss": 0.6279, + "step": 61260 + }, + { + "epoch": 1.57, + "learning_rate": 9.72858618136696e-07, + "loss": 0.8145, + "step": 61261 + }, + { + "epoch": 1.57, + "learning_rate": 9.728309578868551e-07, + "loss": 0.6533, + "step": 61262 + }, + { + "epoch": 1.57, + "learning_rate": 9.72803297657816e-07, + "loss": 0.7471, + "step": 61263 + }, + { + "epoch": 1.57, + "learning_rate": 9.727756374496003e-07, + "loss": 0.5056, + "step": 61264 + }, + { + "epoch": 1.57, + "learning_rate": 9.727479772622288e-07, + "loss": 0.5708, + "step": 61265 + }, + { + "epoch": 1.57, + "learning_rate": 9.727203170957231e-07, + "loss": 0.6851, + "step": 61266 + }, + { + "epoch": 1.57, + "learning_rate": 9.72692656950104e-07, + "loss": 0.5996, + "step": 61267 + }, + { + "epoch": 1.57, + "learning_rate": 9.726649968253933e-07, + "loss": 0.5793, + "step": 61268 + }, + { + "epoch": 1.57, + "learning_rate": 9.726373367216112e-07, + "loss": 0.7139, + "step": 61269 + }, + { + "epoch": 1.57, + "learning_rate": 9.7260967663878e-07, + "loss": 0.668, + "step": 61270 + }, + { + "epoch": 1.57, + "learning_rate": 9.725820165769196e-07, + "loss": 0.6963, + "step": 61271 + }, + { + "epoch": 1.57, + "learning_rate": 9.72554356536053e-07, + "loss": 0.4697, + "step": 61272 + }, + { + "epoch": 1.57, + "learning_rate": 9.725266965161995e-07, + "loss": 0.6597, + "step": 61273 + }, + { + "epoch": 1.57, + "learning_rate": 9.724990365173812e-07, + "loss": 0.6875, + "step": 61274 + }, + { + "epoch": 1.57, + "learning_rate": 9.72471376539619e-07, + "loss": 0.5327, + "step": 61275 + }, + { + "epoch": 1.57, + "learning_rate": 9.724437165829344e-07, + "loss": 0.7529, + "step": 61276 + }, + { + "epoch": 1.57, + "learning_rate": 9.724160566473481e-07, + "loss": 0.5229, + "step": 61277 + }, + { + "epoch": 1.57, + "learning_rate": 9.723883967328818e-07, + "loss": 0.7334, + "step": 61278 + }, + { + "epoch": 1.57, + "learning_rate": 9.72360736839556e-07, + "loss": 0.5879, + "step": 61279 + }, + { + "epoch": 1.57, + "learning_rate": 9.723330769673928e-07, + "loss": 0.6602, + "step": 61280 + }, + { + "epoch": 1.57, + "learning_rate": 9.723054171164127e-07, + "loss": 0.5977, + "step": 61281 + }, + { + "epoch": 1.57, + "learning_rate": 9.722777572866373e-07, + "loss": 0.7861, + "step": 61282 + }, + { + "epoch": 1.57, + "learning_rate": 9.722500974780875e-07, + "loss": 0.6875, + "step": 61283 + }, + { + "epoch": 1.57, + "learning_rate": 9.722224376907843e-07, + "loss": 0.3678, + "step": 61284 + }, + { + "epoch": 1.57, + "learning_rate": 9.721947779247493e-07, + "loss": 0.6919, + "step": 61285 + }, + { + "epoch": 1.57, + "learning_rate": 9.721671181800031e-07, + "loss": 0.7148, + "step": 61286 + }, + { + "epoch": 1.57, + "learning_rate": 9.721394584565677e-07, + "loss": 0.5737, + "step": 61287 + }, + { + "epoch": 1.57, + "learning_rate": 9.721117987544635e-07, + "loss": 0.7188, + "step": 61288 + }, + { + "epoch": 1.57, + "learning_rate": 9.720841390737121e-07, + "loss": 0.5781, + "step": 61289 + }, + { + "epoch": 1.57, + "learning_rate": 9.720564794143348e-07, + "loss": 0.6826, + "step": 61290 + }, + { + "epoch": 1.57, + "learning_rate": 9.720288197763523e-07, + "loss": 0.5381, + "step": 61291 + }, + { + "epoch": 1.57, + "learning_rate": 9.720011601597866e-07, + "loss": 0.7666, + "step": 61292 + }, + { + "epoch": 1.57, + "learning_rate": 9.71973500564658e-07, + "loss": 0.7207, + "step": 61293 + }, + { + "epoch": 1.57, + "learning_rate": 9.719458409909877e-07, + "loss": 0.6191, + "step": 61294 + }, + { + "epoch": 1.57, + "learning_rate": 9.719181814387975e-07, + "loss": 0.6934, + "step": 61295 + }, + { + "epoch": 1.57, + "learning_rate": 9.71890521908108e-07, + "loss": 0.4392, + "step": 61296 + }, + { + "epoch": 1.57, + "learning_rate": 9.718628623989408e-07, + "loss": 0.7109, + "step": 61297 + }, + { + "epoch": 1.57, + "learning_rate": 9.718352029113168e-07, + "loss": 0.48, + "step": 61298 + }, + { + "epoch": 1.57, + "learning_rate": 9.718075434452574e-07, + "loss": 0.5203, + "step": 61299 + }, + { + "epoch": 1.57, + "learning_rate": 9.717798840007835e-07, + "loss": 0.8047, + "step": 61300 + }, + { + "epoch": 1.57, + "learning_rate": 9.717522245779167e-07, + "loss": 0.5278, + "step": 61301 + }, + { + "epoch": 1.57, + "learning_rate": 9.717245651766782e-07, + "loss": 0.6538, + "step": 61302 + }, + { + "epoch": 1.57, + "learning_rate": 9.716969057970883e-07, + "loss": 0.6343, + "step": 61303 + }, + { + "epoch": 1.57, + "learning_rate": 9.71669246439169e-07, + "loss": 0.5679, + "step": 61304 + }, + { + "epoch": 1.57, + "learning_rate": 9.71641587102941e-07, + "loss": 0.4775, + "step": 61305 + }, + { + "epoch": 1.57, + "learning_rate": 9.716139277884263e-07, + "loss": 0.7761, + "step": 61306 + }, + { + "epoch": 1.57, + "learning_rate": 9.715862684956452e-07, + "loss": 0.5243, + "step": 61307 + }, + { + "epoch": 1.57, + "learning_rate": 9.71558609224619e-07, + "loss": 0.8184, + "step": 61308 + }, + { + "epoch": 1.57, + "learning_rate": 9.715309499753695e-07, + "loss": 0.4261, + "step": 61309 + }, + { + "epoch": 1.57, + "learning_rate": 9.71503290747917e-07, + "loss": 0.5771, + "step": 61310 + }, + { + "epoch": 1.57, + "learning_rate": 9.714756315422834e-07, + "loss": 0.5815, + "step": 61311 + }, + { + "epoch": 1.57, + "learning_rate": 9.714479723584898e-07, + "loss": 0.7476, + "step": 61312 + }, + { + "epoch": 1.57, + "learning_rate": 9.714203131965568e-07, + "loss": 0.6558, + "step": 61313 + }, + { + "epoch": 1.57, + "learning_rate": 9.71392654056506e-07, + "loss": 0.6445, + "step": 61314 + }, + { + "epoch": 1.57, + "learning_rate": 9.713649949383583e-07, + "loss": 0.5718, + "step": 61315 + }, + { + "epoch": 1.57, + "learning_rate": 9.713373358421355e-07, + "loss": 0.6431, + "step": 61316 + }, + { + "epoch": 1.57, + "learning_rate": 9.71309676767858e-07, + "loss": 0.6919, + "step": 61317 + }, + { + "epoch": 1.57, + "learning_rate": 9.712820177155478e-07, + "loss": 0.5109, + "step": 61318 + }, + { + "epoch": 1.57, + "learning_rate": 9.712543586852252e-07, + "loss": 0.3787, + "step": 61319 + }, + { + "epoch": 1.57, + "learning_rate": 9.712266996769122e-07, + "loss": 0.668, + "step": 61320 + }, + { + "epoch": 1.57, + "learning_rate": 9.711990406906294e-07, + "loss": 0.4607, + "step": 61321 + }, + { + "epoch": 1.57, + "learning_rate": 9.711713817263985e-07, + "loss": 0.6758, + "step": 61322 + }, + { + "epoch": 1.57, + "learning_rate": 9.711437227842404e-07, + "loss": 0.9092, + "step": 61323 + }, + { + "epoch": 1.57, + "learning_rate": 9.711160638641759e-07, + "loss": 0.5404, + "step": 61324 + }, + { + "epoch": 1.57, + "learning_rate": 9.710884049662263e-07, + "loss": 0.5874, + "step": 61325 + }, + { + "epoch": 1.57, + "learning_rate": 9.710607460904132e-07, + "loss": 0.4418, + "step": 61326 + }, + { + "epoch": 1.57, + "learning_rate": 9.710330872367575e-07, + "loss": 0.6337, + "step": 61327 + }, + { + "epoch": 1.57, + "learning_rate": 9.710054284052806e-07, + "loss": 0.7334, + "step": 61328 + }, + { + "epoch": 1.57, + "learning_rate": 9.709777695960031e-07, + "loss": 0.8887, + "step": 61329 + }, + { + "epoch": 1.57, + "learning_rate": 9.70950110808947e-07, + "loss": 0.626, + "step": 61330 + }, + { + "epoch": 1.57, + "learning_rate": 9.709224520441328e-07, + "loss": 0.6738, + "step": 61331 + }, + { + "epoch": 1.57, + "learning_rate": 9.708947933015824e-07, + "loss": 0.6128, + "step": 61332 + }, + { + "epoch": 1.57, + "learning_rate": 9.708671345813163e-07, + "loss": 0.7705, + "step": 61333 + }, + { + "epoch": 1.57, + "learning_rate": 9.708394758833557e-07, + "loss": 0.5479, + "step": 61334 + }, + { + "epoch": 1.57, + "learning_rate": 9.70811817207722e-07, + "loss": 0.6245, + "step": 61335 + }, + { + "epoch": 1.57, + "learning_rate": 9.707841585544362e-07, + "loss": 0.6533, + "step": 61336 + }, + { + "epoch": 1.57, + "learning_rate": 9.7075649992352e-07, + "loss": 0.4175, + "step": 61337 + }, + { + "epoch": 1.57, + "learning_rate": 9.70728841314994e-07, + "loss": 0.7471, + "step": 61338 + }, + { + "epoch": 1.57, + "learning_rate": 9.707011827288796e-07, + "loss": 0.5356, + "step": 61339 + }, + { + "epoch": 1.57, + "learning_rate": 9.706735241651979e-07, + "loss": 0.5884, + "step": 61340 + }, + { + "epoch": 1.57, + "learning_rate": 9.706458656239701e-07, + "loss": 0.4736, + "step": 61341 + }, + { + "epoch": 1.57, + "learning_rate": 9.70618207105218e-07, + "loss": 0.6338, + "step": 61342 + }, + { + "epoch": 1.57, + "learning_rate": 9.70590548608962e-07, + "loss": 0.7061, + "step": 61343 + }, + { + "epoch": 1.57, + "learning_rate": 9.705628901352228e-07, + "loss": 0.7148, + "step": 61344 + }, + { + "epoch": 1.57, + "learning_rate": 9.705352316840228e-07, + "loss": 0.5459, + "step": 61345 + }, + { + "epoch": 1.57, + "learning_rate": 9.705075732553822e-07, + "loss": 0.687, + "step": 61346 + }, + { + "epoch": 1.57, + "learning_rate": 9.70479914849323e-07, + "loss": 0.7656, + "step": 61347 + }, + { + "epoch": 1.57, + "learning_rate": 9.704522564658657e-07, + "loss": 0.532, + "step": 61348 + }, + { + "epoch": 1.57, + "learning_rate": 9.704245981050318e-07, + "loss": 0.6973, + "step": 61349 + }, + { + "epoch": 1.57, + "learning_rate": 9.703969397668423e-07, + "loss": 0.7783, + "step": 61350 + }, + { + "epoch": 1.57, + "learning_rate": 9.703692814513188e-07, + "loss": 0.8232, + "step": 61351 + }, + { + "epoch": 1.57, + "learning_rate": 9.703416231584824e-07, + "loss": 0.6631, + "step": 61352 + }, + { + "epoch": 1.57, + "learning_rate": 9.703139648883536e-07, + "loss": 0.6689, + "step": 61353 + }, + { + "epoch": 1.57, + "learning_rate": 9.702863066409542e-07, + "loss": 0.6094, + "step": 61354 + }, + { + "epoch": 1.57, + "learning_rate": 9.70258648416305e-07, + "loss": 0.5381, + "step": 61355 + }, + { + "epoch": 1.57, + "learning_rate": 9.702309902144277e-07, + "loss": 0.626, + "step": 61356 + }, + { + "epoch": 1.57, + "learning_rate": 9.702033320353427e-07, + "loss": 0.6299, + "step": 61357 + }, + { + "epoch": 1.57, + "learning_rate": 9.70175673879072e-07, + "loss": 0.7236, + "step": 61358 + }, + { + "epoch": 1.57, + "learning_rate": 9.701480157456364e-07, + "loss": 0.7324, + "step": 61359 + }, + { + "epoch": 1.57, + "learning_rate": 9.701203576350571e-07, + "loss": 0.5066, + "step": 61360 + }, + { + "epoch": 1.57, + "learning_rate": 9.700926995473551e-07, + "loss": 0.5635, + "step": 61361 + }, + { + "epoch": 1.57, + "learning_rate": 9.700650414825523e-07, + "loss": 0.5811, + "step": 61362 + }, + { + "epoch": 1.57, + "learning_rate": 9.700373834406687e-07, + "loss": 0.6113, + "step": 61363 + }, + { + "epoch": 1.57, + "learning_rate": 9.700097254217265e-07, + "loss": 0.7056, + "step": 61364 + }, + { + "epoch": 1.57, + "learning_rate": 9.699820674257462e-07, + "loss": 0.6553, + "step": 61365 + }, + { + "epoch": 1.57, + "learning_rate": 9.699544094527492e-07, + "loss": 0.7065, + "step": 61366 + }, + { + "epoch": 1.57, + "learning_rate": 9.699267515027568e-07, + "loss": 0.6191, + "step": 61367 + }, + { + "epoch": 1.57, + "learning_rate": 9.698990935757901e-07, + "loss": 0.6338, + "step": 61368 + }, + { + "epoch": 1.57, + "learning_rate": 9.698714356718702e-07, + "loss": 0.7632, + "step": 61369 + }, + { + "epoch": 1.57, + "learning_rate": 9.698437777910185e-07, + "loss": 0.3727, + "step": 61370 + }, + { + "epoch": 1.57, + "learning_rate": 9.698161199332558e-07, + "loss": 0.4746, + "step": 61371 + }, + { + "epoch": 1.57, + "learning_rate": 9.69788462098604e-07, + "loss": 0.7109, + "step": 61372 + }, + { + "epoch": 1.57, + "learning_rate": 9.697608042870837e-07, + "loss": 0.5916, + "step": 61373 + }, + { + "epoch": 1.57, + "learning_rate": 9.697331464987158e-07, + "loss": 0.623, + "step": 61374 + }, + { + "epoch": 1.57, + "learning_rate": 9.69705488733522e-07, + "loss": 0.6772, + "step": 61375 + }, + { + "epoch": 1.57, + "learning_rate": 9.696778309915233e-07, + "loss": 0.4282, + "step": 61376 + }, + { + "epoch": 1.57, + "learning_rate": 9.69650173272741e-07, + "loss": 0.6616, + "step": 61377 + }, + { + "epoch": 1.57, + "learning_rate": 9.696225155771958e-07, + "loss": 0.7104, + "step": 61378 + }, + { + "epoch": 1.57, + "learning_rate": 9.695948579049097e-07, + "loss": 0.5989, + "step": 61379 + }, + { + "epoch": 1.57, + "learning_rate": 9.695672002559033e-07, + "loss": 0.707, + "step": 61380 + }, + { + "epoch": 1.57, + "learning_rate": 9.695395426301977e-07, + "loss": 0.6816, + "step": 61381 + }, + { + "epoch": 1.57, + "learning_rate": 9.695118850278147e-07, + "loss": 0.7188, + "step": 61382 + }, + { + "epoch": 1.57, + "learning_rate": 9.694842274487748e-07, + "loss": 0.645, + "step": 61383 + }, + { + "epoch": 1.57, + "learning_rate": 9.694565698930991e-07, + "loss": 0.6968, + "step": 61384 + }, + { + "epoch": 1.57, + "learning_rate": 9.694289123608096e-07, + "loss": 0.6338, + "step": 61385 + }, + { + "epoch": 1.57, + "learning_rate": 9.694012548519266e-07, + "loss": 0.4893, + "step": 61386 + }, + { + "epoch": 1.57, + "learning_rate": 9.693735973664718e-07, + "loss": 0.6978, + "step": 61387 + }, + { + "epoch": 1.57, + "learning_rate": 9.69345939904466e-07, + "loss": 0.5757, + "step": 61388 + }, + { + "epoch": 1.57, + "learning_rate": 9.69318282465931e-07, + "loss": 0.6553, + "step": 61389 + }, + { + "epoch": 1.57, + "learning_rate": 9.692906250508874e-07, + "loss": 0.6753, + "step": 61390 + }, + { + "epoch": 1.57, + "learning_rate": 9.692629676593565e-07, + "loss": 0.7529, + "step": 61391 + }, + { + "epoch": 1.57, + "learning_rate": 9.6923531029136e-07, + "loss": 0.689, + "step": 61392 + }, + { + "epoch": 1.57, + "learning_rate": 9.69207652946918e-07, + "loss": 0.6729, + "step": 61393 + }, + { + "epoch": 1.57, + "learning_rate": 9.691799956260528e-07, + "loss": 0.666, + "step": 61394 + }, + { + "epoch": 1.57, + "learning_rate": 9.691523383287844e-07, + "loss": 0.4927, + "step": 61395 + }, + { + "epoch": 1.57, + "learning_rate": 9.69124681055135e-07, + "loss": 0.6689, + "step": 61396 + }, + { + "epoch": 1.57, + "learning_rate": 9.690970238051256e-07, + "loss": 0.5488, + "step": 61397 + }, + { + "epoch": 1.57, + "learning_rate": 9.690693665787768e-07, + "loss": 0.5833, + "step": 61398 + }, + { + "epoch": 1.57, + "learning_rate": 9.690417093761105e-07, + "loss": 0.5627, + "step": 61399 + }, + { + "epoch": 1.57, + "learning_rate": 9.690140521971472e-07, + "loss": 0.6191, + "step": 61400 + }, + { + "epoch": 1.57, + "learning_rate": 9.689863950419087e-07, + "loss": 0.6641, + "step": 61401 + }, + { + "epoch": 1.57, + "learning_rate": 9.68958737910416e-07, + "loss": 0.7344, + "step": 61402 + }, + { + "epoch": 1.57, + "learning_rate": 9.6893108080269e-07, + "loss": 0.5315, + "step": 61403 + }, + { + "epoch": 1.57, + "learning_rate": 9.68903423718752e-07, + "loss": 0.7529, + "step": 61404 + }, + { + "epoch": 1.57, + "learning_rate": 9.68875766658623e-07, + "loss": 0.5244, + "step": 61405 + }, + { + "epoch": 1.57, + "learning_rate": 9.68848109622325e-07, + "loss": 0.6318, + "step": 61406 + }, + { + "epoch": 1.57, + "learning_rate": 9.68820452609878e-07, + "loss": 0.8496, + "step": 61407 + }, + { + "epoch": 1.57, + "learning_rate": 9.68792795621304e-07, + "loss": 0.6558, + "step": 61408 + }, + { + "epoch": 1.57, + "learning_rate": 9.687651386566237e-07, + "loss": 0.5947, + "step": 61409 + }, + { + "epoch": 1.57, + "learning_rate": 9.687374817158587e-07, + "loss": 0.4824, + "step": 61410 + }, + { + "epoch": 1.57, + "learning_rate": 9.687098247990297e-07, + "loss": 0.7266, + "step": 61411 + }, + { + "epoch": 1.57, + "learning_rate": 9.686821679061587e-07, + "loss": 0.5688, + "step": 61412 + }, + { + "epoch": 1.57, + "learning_rate": 9.68654511037266e-07, + "loss": 0.7139, + "step": 61413 + }, + { + "epoch": 1.57, + "learning_rate": 9.686268541923732e-07, + "loss": 0.7393, + "step": 61414 + }, + { + "epoch": 1.57, + "learning_rate": 9.685991973715011e-07, + "loss": 0.4573, + "step": 61415 + }, + { + "epoch": 1.57, + "learning_rate": 9.685715405746714e-07, + "loss": 0.8174, + "step": 61416 + }, + { + "epoch": 1.57, + "learning_rate": 9.68543883801905e-07, + "loss": 0.5273, + "step": 61417 + }, + { + "epoch": 1.57, + "learning_rate": 9.685162270532231e-07, + "loss": 0.5737, + "step": 61418 + }, + { + "epoch": 1.57, + "learning_rate": 9.684885703286466e-07, + "loss": 0.8008, + "step": 61419 + }, + { + "epoch": 1.57, + "learning_rate": 9.684609136281974e-07, + "loss": 0.7734, + "step": 61420 + }, + { + "epoch": 1.57, + "learning_rate": 9.684332569518959e-07, + "loss": 0.5747, + "step": 61421 + }, + { + "epoch": 1.57, + "learning_rate": 9.68405600299764e-07, + "loss": 0.7275, + "step": 61422 + }, + { + "epoch": 1.57, + "learning_rate": 9.683779436718223e-07, + "loss": 0.6953, + "step": 61423 + }, + { + "epoch": 1.57, + "learning_rate": 9.683502870680918e-07, + "loss": 0.6111, + "step": 61424 + }, + { + "epoch": 1.57, + "learning_rate": 9.683226304885945e-07, + "loss": 0.5342, + "step": 61425 + }, + { + "epoch": 1.57, + "learning_rate": 9.682949739333507e-07, + "loss": 0.6631, + "step": 61426 + }, + { + "epoch": 1.57, + "learning_rate": 9.682673174023822e-07, + "loss": 0.4697, + "step": 61427 + }, + { + "epoch": 1.57, + "learning_rate": 9.682396608957098e-07, + "loss": 0.5684, + "step": 61428 + }, + { + "epoch": 1.57, + "learning_rate": 9.68212004413355e-07, + "loss": 0.6826, + "step": 61429 + }, + { + "epoch": 1.57, + "learning_rate": 9.681843479553386e-07, + "loss": 0.3916, + "step": 61430 + }, + { + "epoch": 1.57, + "learning_rate": 9.681566915216823e-07, + "loss": 0.8154, + "step": 61431 + }, + { + "epoch": 1.57, + "learning_rate": 9.68129035112407e-07, + "loss": 0.6865, + "step": 61432 + }, + { + "epoch": 1.57, + "learning_rate": 9.681013787275338e-07, + "loss": 0.543, + "step": 61433 + }, + { + "epoch": 1.57, + "learning_rate": 9.680737223670836e-07, + "loss": 0.6641, + "step": 61434 + }, + { + "epoch": 1.57, + "learning_rate": 9.680460660310782e-07, + "loss": 0.6367, + "step": 61435 + }, + { + "epoch": 1.57, + "learning_rate": 9.68018409719538e-07, + "loss": 0.8086, + "step": 61436 + }, + { + "epoch": 1.57, + "learning_rate": 9.67990753432485e-07, + "loss": 0.5693, + "step": 61437 + }, + { + "epoch": 1.57, + "learning_rate": 9.679630971699397e-07, + "loss": 0.6348, + "step": 61438 + }, + { + "epoch": 1.57, + "learning_rate": 9.67935440931924e-07, + "loss": 0.7715, + "step": 61439 + }, + { + "epoch": 1.57, + "learning_rate": 9.679077847184582e-07, + "loss": 0.728, + "step": 61440 + }, + { + "epoch": 1.57, + "learning_rate": 9.678801285295644e-07, + "loss": 0.5024, + "step": 61441 + }, + { + "epoch": 1.57, + "learning_rate": 9.678524723652633e-07, + "loss": 0.8652, + "step": 61442 + }, + { + "epoch": 1.57, + "learning_rate": 9.67824816225576e-07, + "loss": 0.5698, + "step": 61443 + }, + { + "epoch": 1.57, + "learning_rate": 9.677971601105236e-07, + "loss": 0.6313, + "step": 61444 + }, + { + "epoch": 1.57, + "learning_rate": 9.677695040201272e-07, + "loss": 0.6001, + "step": 61445 + }, + { + "epoch": 1.57, + "learning_rate": 9.677418479544087e-07, + "loss": 0.688, + "step": 61446 + }, + { + "epoch": 1.57, + "learning_rate": 9.677141919133884e-07, + "loss": 0.6963, + "step": 61447 + }, + { + "epoch": 1.57, + "learning_rate": 9.676865358970882e-07, + "loss": 0.7524, + "step": 61448 + }, + { + "epoch": 1.57, + "learning_rate": 9.676588799055285e-07, + "loss": 0.6592, + "step": 61449 + }, + { + "epoch": 1.57, + "learning_rate": 9.676312239387314e-07, + "loss": 0.5669, + "step": 61450 + }, + { + "epoch": 1.58, + "learning_rate": 9.676035679967172e-07, + "loss": 0.626, + "step": 61451 + }, + { + "epoch": 1.58, + "learning_rate": 9.675759120795082e-07, + "loss": 0.532, + "step": 61452 + }, + { + "epoch": 1.58, + "learning_rate": 9.67548256187124e-07, + "loss": 0.5752, + "step": 61453 + }, + { + "epoch": 1.58, + "learning_rate": 9.675206003195868e-07, + "loss": 0.6494, + "step": 61454 + }, + { + "epoch": 1.58, + "learning_rate": 9.674929444769177e-07, + "loss": 0.6631, + "step": 61455 + }, + { + "epoch": 1.58, + "learning_rate": 9.674652886591377e-07, + "loss": 0.3945, + "step": 61456 + }, + { + "epoch": 1.58, + "learning_rate": 9.67437632866268e-07, + "loss": 0.6235, + "step": 61457 + }, + { + "epoch": 1.58, + "learning_rate": 9.674099770983299e-07, + "loss": 0.6758, + "step": 61458 + }, + { + "epoch": 1.58, + "learning_rate": 9.67382321355344e-07, + "loss": 0.6416, + "step": 61459 + }, + { + "epoch": 1.58, + "learning_rate": 9.673546656373326e-07, + "loss": 0.5869, + "step": 61460 + }, + { + "epoch": 1.58, + "learning_rate": 9.67327009944316e-07, + "loss": 0.606, + "step": 61461 + }, + { + "epoch": 1.58, + "learning_rate": 9.672993542763157e-07, + "loss": 0.7891, + "step": 61462 + }, + { + "epoch": 1.58, + "learning_rate": 9.672716986333529e-07, + "loss": 0.5386, + "step": 61463 + }, + { + "epoch": 1.58, + "learning_rate": 9.672440430154484e-07, + "loss": 0.6724, + "step": 61464 + }, + { + "epoch": 1.58, + "learning_rate": 9.672163874226238e-07, + "loss": 0.752, + "step": 61465 + }, + { + "epoch": 1.58, + "learning_rate": 9.671887318548997e-07, + "loss": 0.7051, + "step": 61466 + }, + { + "epoch": 1.58, + "learning_rate": 9.67161076312298e-07, + "loss": 0.6143, + "step": 61467 + }, + { + "epoch": 1.58, + "learning_rate": 9.671334207948395e-07, + "loss": 0.7905, + "step": 61468 + }, + { + "epoch": 1.58, + "learning_rate": 9.671057653025454e-07, + "loss": 0.5875, + "step": 61469 + }, + { + "epoch": 1.58, + "learning_rate": 9.670781098354372e-07, + "loss": 0.6733, + "step": 61470 + }, + { + "epoch": 1.58, + "learning_rate": 9.670504543935358e-07, + "loss": 0.5986, + "step": 61471 + }, + { + "epoch": 1.58, + "learning_rate": 9.670227989768618e-07, + "loss": 0.5327, + "step": 61472 + }, + { + "epoch": 1.58, + "learning_rate": 9.669951435854375e-07, + "loss": 0.6768, + "step": 61473 + }, + { + "epoch": 1.58, + "learning_rate": 9.669674882192829e-07, + "loss": 0.5241, + "step": 61474 + }, + { + "epoch": 1.58, + "learning_rate": 9.669398328784203e-07, + "loss": 0.6724, + "step": 61475 + }, + { + "epoch": 1.58, + "learning_rate": 9.6691217756287e-07, + "loss": 0.6289, + "step": 61476 + }, + { + "epoch": 1.58, + "learning_rate": 9.668845222726535e-07, + "loss": 0.7441, + "step": 61477 + }, + { + "epoch": 1.58, + "learning_rate": 9.668568670077922e-07, + "loss": 0.4766, + "step": 61478 + }, + { + "epoch": 1.58, + "learning_rate": 9.668292117683071e-07, + "loss": 0.8262, + "step": 61479 + }, + { + "epoch": 1.58, + "learning_rate": 9.66801556554219e-07, + "loss": 0.3895, + "step": 61480 + }, + { + "epoch": 1.58, + "learning_rate": 9.6677390136555e-07, + "loss": 0.748, + "step": 61481 + }, + { + "epoch": 1.58, + "learning_rate": 9.667462462023206e-07, + "loss": 0.606, + "step": 61482 + }, + { + "epoch": 1.58, + "learning_rate": 9.667185910645517e-07, + "loss": 0.5337, + "step": 61483 + }, + { + "epoch": 1.58, + "learning_rate": 9.666909359522652e-07, + "loss": 0.6504, + "step": 61484 + }, + { + "epoch": 1.58, + "learning_rate": 9.666632808654815e-07, + "loss": 0.6855, + "step": 61485 + }, + { + "epoch": 1.58, + "learning_rate": 9.666356258042226e-07, + "loss": 0.8535, + "step": 61486 + }, + { + "epoch": 1.58, + "learning_rate": 9.66607970768509e-07, + "loss": 0.4211, + "step": 61487 + }, + { + "epoch": 1.58, + "learning_rate": 9.665803157583622e-07, + "loss": 0.668, + "step": 61488 + }, + { + "epoch": 1.58, + "learning_rate": 9.665526607738033e-07, + "loss": 0.5232, + "step": 61489 + }, + { + "epoch": 1.58, + "learning_rate": 9.665250058148535e-07, + "loss": 0.5203, + "step": 61490 + }, + { + "epoch": 1.58, + "learning_rate": 9.664973508815342e-07, + "loss": 0.6318, + "step": 61491 + }, + { + "epoch": 1.58, + "learning_rate": 9.664696959738662e-07, + "loss": 0.6006, + "step": 61492 + }, + { + "epoch": 1.58, + "learning_rate": 9.664420410918706e-07, + "loss": 0.7705, + "step": 61493 + }, + { + "epoch": 1.58, + "learning_rate": 9.664143862355692e-07, + "loss": 0.623, + "step": 61494 + }, + { + "epoch": 1.58, + "learning_rate": 9.663867314049823e-07, + "loss": 0.519, + "step": 61495 + }, + { + "epoch": 1.58, + "learning_rate": 9.663590766001317e-07, + "loss": 0.6226, + "step": 61496 + }, + { + "epoch": 1.58, + "learning_rate": 9.663314218210383e-07, + "loss": 0.5669, + "step": 61497 + }, + { + "epoch": 1.58, + "learning_rate": 9.663037670677236e-07, + "loss": 0.7393, + "step": 61498 + }, + { + "epoch": 1.58, + "learning_rate": 9.662761123402084e-07, + "loss": 0.6797, + "step": 61499 + }, + { + "epoch": 1.58, + "learning_rate": 9.66248457638514e-07, + "loss": 0.792, + "step": 61500 + }, + { + "epoch": 1.58, + "learning_rate": 9.66220802962662e-07, + "loss": 0.5913, + "step": 61501 + }, + { + "epoch": 1.58, + "learning_rate": 9.66193148312673e-07, + "loss": 0.6099, + "step": 61502 + }, + { + "epoch": 1.58, + "learning_rate": 9.661654936885682e-07, + "loss": 0.6172, + "step": 61503 + }, + { + "epoch": 1.58, + "learning_rate": 9.66137839090369e-07, + "loss": 0.666, + "step": 61504 + }, + { + "epoch": 1.58, + "learning_rate": 9.661101845180964e-07, + "loss": 0.6431, + "step": 61505 + }, + { + "epoch": 1.58, + "learning_rate": 9.660825299717719e-07, + "loss": 0.7227, + "step": 61506 + }, + { + "epoch": 1.58, + "learning_rate": 9.66054875451416e-07, + "loss": 0.5049, + "step": 61507 + }, + { + "epoch": 1.58, + "learning_rate": 9.660272209570509e-07, + "loss": 0.6392, + "step": 61508 + }, + { + "epoch": 1.58, + "learning_rate": 9.659995664886966e-07, + "loss": 0.7334, + "step": 61509 + }, + { + "epoch": 1.58, + "learning_rate": 9.659719120463754e-07, + "loss": 0.6226, + "step": 61510 + }, + { + "epoch": 1.58, + "learning_rate": 9.659442576301079e-07, + "loss": 0.4514, + "step": 61511 + }, + { + "epoch": 1.58, + "learning_rate": 9.65916603239915e-07, + "loss": 0.3894, + "step": 61512 + }, + { + "epoch": 1.58, + "learning_rate": 9.658889488758184e-07, + "loss": 0.5908, + "step": 61513 + }, + { + "epoch": 1.58, + "learning_rate": 9.658612945378387e-07, + "loss": 0.583, + "step": 61514 + }, + { + "epoch": 1.58, + "learning_rate": 9.65833640225998e-07, + "loss": 0.5947, + "step": 61515 + }, + { + "epoch": 1.58, + "learning_rate": 9.658059859403164e-07, + "loss": 0.72, + "step": 61516 + }, + { + "epoch": 1.58, + "learning_rate": 9.657783316808159e-07, + "loss": 0.6455, + "step": 61517 + }, + { + "epoch": 1.58, + "learning_rate": 9.657506774475172e-07, + "loss": 0.6572, + "step": 61518 + }, + { + "epoch": 1.58, + "learning_rate": 9.657230232404418e-07, + "loss": 0.71, + "step": 61519 + }, + { + "epoch": 1.58, + "learning_rate": 9.656953690596103e-07, + "loss": 0.7461, + "step": 61520 + }, + { + "epoch": 1.58, + "learning_rate": 9.656677149050449e-07, + "loss": 0.7432, + "step": 61521 + }, + { + "epoch": 1.58, + "learning_rate": 9.65640060776766e-07, + "loss": 0.751, + "step": 61522 + }, + { + "epoch": 1.58, + "learning_rate": 9.656124066747947e-07, + "loss": 0.8052, + "step": 61523 + }, + { + "epoch": 1.58, + "learning_rate": 9.655847525991524e-07, + "loss": 0.6025, + "step": 61524 + }, + { + "epoch": 1.58, + "learning_rate": 9.655570985498605e-07, + "loss": 0.6826, + "step": 61525 + }, + { + "epoch": 1.58, + "learning_rate": 9.655294445269396e-07, + "loss": 0.8037, + "step": 61526 + }, + { + "epoch": 1.58, + "learning_rate": 9.655017905304114e-07, + "loss": 0.7534, + "step": 61527 + }, + { + "epoch": 1.58, + "learning_rate": 9.65474136560297e-07, + "loss": 0.5708, + "step": 61528 + }, + { + "epoch": 1.58, + "learning_rate": 9.654464826166173e-07, + "loss": 0.6426, + "step": 61529 + }, + { + "epoch": 1.58, + "learning_rate": 9.654188286993936e-07, + "loss": 0.5266, + "step": 61530 + }, + { + "epoch": 1.58, + "learning_rate": 9.653911748086476e-07, + "loss": 0.7598, + "step": 61531 + }, + { + "epoch": 1.58, + "learning_rate": 9.653635209443995e-07, + "loss": 0.4529, + "step": 61532 + }, + { + "epoch": 1.58, + "learning_rate": 9.65335867106671e-07, + "loss": 0.584, + "step": 61533 + }, + { + "epoch": 1.58, + "learning_rate": 9.653082132954833e-07, + "loss": 0.5776, + "step": 61534 + }, + { + "epoch": 1.58, + "learning_rate": 9.652805595108574e-07, + "loss": 0.5928, + "step": 61535 + }, + { + "epoch": 1.58, + "learning_rate": 9.652529057528148e-07, + "loss": 0.6641, + "step": 61536 + }, + { + "epoch": 1.58, + "learning_rate": 9.652252520213762e-07, + "loss": 0.6611, + "step": 61537 + }, + { + "epoch": 1.58, + "learning_rate": 9.651975983165632e-07, + "loss": 0.667, + "step": 61538 + }, + { + "epoch": 1.58, + "learning_rate": 9.651699446383966e-07, + "loss": 0.5239, + "step": 61539 + }, + { + "epoch": 1.58, + "learning_rate": 9.65142290986898e-07, + "loss": 0.5981, + "step": 61540 + }, + { + "epoch": 1.58, + "learning_rate": 9.651146373620885e-07, + "loss": 0.5908, + "step": 61541 + }, + { + "epoch": 1.58, + "learning_rate": 9.65086983763989e-07, + "loss": 0.6006, + "step": 61542 + }, + { + "epoch": 1.58, + "learning_rate": 9.650593301926205e-07, + "loss": 0.7246, + "step": 61543 + }, + { + "epoch": 1.58, + "learning_rate": 9.650316766480048e-07, + "loss": 0.5771, + "step": 61544 + }, + { + "epoch": 1.58, + "learning_rate": 9.650040231301624e-07, + "loss": 0.7637, + "step": 61545 + }, + { + "epoch": 1.58, + "learning_rate": 9.649763696391152e-07, + "loss": 0.6987, + "step": 61546 + }, + { + "epoch": 1.58, + "learning_rate": 9.649487161748835e-07, + "loss": 0.5962, + "step": 61547 + }, + { + "epoch": 1.58, + "learning_rate": 9.649210627374894e-07, + "loss": 0.7358, + "step": 61548 + }, + { + "epoch": 1.58, + "learning_rate": 9.648934093269532e-07, + "loss": 0.7666, + "step": 61549 + }, + { + "epoch": 1.58, + "learning_rate": 9.648657559432968e-07, + "loss": 0.6001, + "step": 61550 + }, + { + "epoch": 1.58, + "learning_rate": 9.648381025865415e-07, + "loss": 0.6558, + "step": 61551 + }, + { + "epoch": 1.58, + "learning_rate": 9.648104492567075e-07, + "loss": 0.4612, + "step": 61552 + }, + { + "epoch": 1.58, + "learning_rate": 9.647827959538167e-07, + "loss": 0.5488, + "step": 61553 + }, + { + "epoch": 1.58, + "learning_rate": 9.647551426778898e-07, + "loss": 0.499, + "step": 61554 + }, + { + "epoch": 1.58, + "learning_rate": 9.647274894289484e-07, + "loss": 0.6182, + "step": 61555 + }, + { + "epoch": 1.58, + "learning_rate": 9.646998362070135e-07, + "loss": 0.4961, + "step": 61556 + }, + { + "epoch": 1.58, + "learning_rate": 9.646721830121065e-07, + "loss": 0.6816, + "step": 61557 + }, + { + "epoch": 1.58, + "learning_rate": 9.646445298442482e-07, + "loss": 0.8066, + "step": 61558 + }, + { + "epoch": 1.58, + "learning_rate": 9.6461687670346e-07, + "loss": 0.4504, + "step": 61559 + }, + { + "epoch": 1.58, + "learning_rate": 9.645892235897632e-07, + "loss": 0.6934, + "step": 61560 + }, + { + "epoch": 1.58, + "learning_rate": 9.64561570503179e-07, + "loss": 0.6758, + "step": 61561 + }, + { + "epoch": 1.58, + "learning_rate": 9.64533917443728e-07, + "loss": 0.6602, + "step": 61562 + }, + { + "epoch": 1.58, + "learning_rate": 9.64506264411432e-07, + "loss": 0.7773, + "step": 61563 + }, + { + "epoch": 1.58, + "learning_rate": 9.644786114063114e-07, + "loss": 0.7202, + "step": 61564 + }, + { + "epoch": 1.58, + "learning_rate": 9.644509584283884e-07, + "loss": 0.7129, + "step": 61565 + }, + { + "epoch": 1.58, + "learning_rate": 9.644233054776834e-07, + "loss": 0.6699, + "step": 61566 + }, + { + "epoch": 1.58, + "learning_rate": 9.64395652554218e-07, + "loss": 0.4277, + "step": 61567 + }, + { + "epoch": 1.58, + "learning_rate": 9.64367999658013e-07, + "loss": 0.6021, + "step": 61568 + }, + { + "epoch": 1.58, + "learning_rate": 9.6434034678909e-07, + "loss": 0.4104, + "step": 61569 + }, + { + "epoch": 1.58, + "learning_rate": 9.643126939474699e-07, + "loss": 0.7109, + "step": 61570 + }, + { + "epoch": 1.58, + "learning_rate": 9.642850411331742e-07, + "loss": 0.6235, + "step": 61571 + }, + { + "epoch": 1.58, + "learning_rate": 9.642573883462235e-07, + "loss": 0.7227, + "step": 61572 + }, + { + "epoch": 1.58, + "learning_rate": 9.642297355866391e-07, + "loss": 0.7471, + "step": 61573 + }, + { + "epoch": 1.58, + "learning_rate": 9.642020828544427e-07, + "loss": 0.6836, + "step": 61574 + }, + { + "epoch": 1.58, + "learning_rate": 9.641744301496549e-07, + "loss": 0.6895, + "step": 61575 + }, + { + "epoch": 1.58, + "learning_rate": 9.64146777472297e-07, + "loss": 0.5042, + "step": 61576 + }, + { + "epoch": 1.58, + "learning_rate": 9.641191248223904e-07, + "loss": 0.4296, + "step": 61577 + }, + { + "epoch": 1.58, + "learning_rate": 9.640914721999563e-07, + "loss": 0.5493, + "step": 61578 + }, + { + "epoch": 1.58, + "learning_rate": 9.640638196050157e-07, + "loss": 0.4976, + "step": 61579 + }, + { + "epoch": 1.58, + "learning_rate": 9.640361670375894e-07, + "loss": 0.6367, + "step": 61580 + }, + { + "epoch": 1.58, + "learning_rate": 9.640085144976996e-07, + "loss": 0.5991, + "step": 61581 + }, + { + "epoch": 1.58, + "learning_rate": 9.639808619853665e-07, + "loss": 0.4822, + "step": 61582 + }, + { + "epoch": 1.58, + "learning_rate": 9.639532095006113e-07, + "loss": 0.6357, + "step": 61583 + }, + { + "epoch": 1.58, + "learning_rate": 9.639255570434558e-07, + "loss": 0.7324, + "step": 61584 + }, + { + "epoch": 1.58, + "learning_rate": 9.638979046139206e-07, + "loss": 0.7715, + "step": 61585 + }, + { + "epoch": 1.58, + "learning_rate": 9.638702522120273e-07, + "loss": 0.7334, + "step": 61586 + }, + { + "epoch": 1.58, + "learning_rate": 9.638425998377967e-07, + "loss": 0.668, + "step": 61587 + }, + { + "epoch": 1.58, + "learning_rate": 9.638149474912504e-07, + "loss": 0.4666, + "step": 61588 + }, + { + "epoch": 1.58, + "learning_rate": 9.63787295172409e-07, + "loss": 0.4268, + "step": 61589 + }, + { + "epoch": 1.58, + "learning_rate": 9.637596428812943e-07, + "loss": 0.5122, + "step": 61590 + }, + { + "epoch": 1.58, + "learning_rate": 9.637319906179275e-07, + "loss": 0.7166, + "step": 61591 + }, + { + "epoch": 1.58, + "learning_rate": 9.63704338382329e-07, + "loss": 0.5332, + "step": 61592 + }, + { + "epoch": 1.58, + "learning_rate": 9.636766861745205e-07, + "loss": 0.7178, + "step": 61593 + }, + { + "epoch": 1.58, + "learning_rate": 9.636490339945228e-07, + "loss": 0.6064, + "step": 61594 + }, + { + "epoch": 1.58, + "learning_rate": 9.636213818423577e-07, + "loss": 0.7207, + "step": 61595 + }, + { + "epoch": 1.58, + "learning_rate": 9.635937297180461e-07, + "loss": 0.791, + "step": 61596 + }, + { + "epoch": 1.58, + "learning_rate": 9.635660776216087e-07, + "loss": 0.7354, + "step": 61597 + }, + { + "epoch": 1.58, + "learning_rate": 9.635384255530675e-07, + "loss": 0.585, + "step": 61598 + }, + { + "epoch": 1.58, + "learning_rate": 9.63510773512443e-07, + "loss": 0.4575, + "step": 61599 + }, + { + "epoch": 1.58, + "learning_rate": 9.634831214997567e-07, + "loss": 0.5488, + "step": 61600 + }, + { + "epoch": 1.58, + "learning_rate": 9.6345546951503e-07, + "loss": 0.5718, + "step": 61601 + }, + { + "epoch": 1.58, + "learning_rate": 9.634278175582834e-07, + "loss": 0.7061, + "step": 61602 + }, + { + "epoch": 1.58, + "learning_rate": 9.634001656295386e-07, + "loss": 0.6543, + "step": 61603 + }, + { + "epoch": 1.58, + "learning_rate": 9.633725137288165e-07, + "loss": 0.6357, + "step": 61604 + }, + { + "epoch": 1.58, + "learning_rate": 9.633448618561383e-07, + "loss": 0.3599, + "step": 61605 + }, + { + "epoch": 1.58, + "learning_rate": 9.633172100115253e-07, + "loss": 0.6982, + "step": 61606 + }, + { + "epoch": 1.58, + "learning_rate": 9.632895581949988e-07, + "loss": 0.6558, + "step": 61607 + }, + { + "epoch": 1.58, + "learning_rate": 9.632619064065795e-07, + "loss": 0.5283, + "step": 61608 + }, + { + "epoch": 1.58, + "learning_rate": 9.632342546462892e-07, + "loss": 0.583, + "step": 61609 + }, + { + "epoch": 1.58, + "learning_rate": 9.632066029141484e-07, + "loss": 0.626, + "step": 61610 + }, + { + "epoch": 1.58, + "learning_rate": 9.63178951210179e-07, + "loss": 0.7715, + "step": 61611 + }, + { + "epoch": 1.58, + "learning_rate": 9.631512995344018e-07, + "loss": 0.6133, + "step": 61612 + }, + { + "epoch": 1.58, + "learning_rate": 9.631236478868378e-07, + "loss": 0.603, + "step": 61613 + }, + { + "epoch": 1.58, + "learning_rate": 9.63095996267508e-07, + "loss": 0.624, + "step": 61614 + }, + { + "epoch": 1.58, + "learning_rate": 9.630683446764345e-07, + "loss": 0.5068, + "step": 61615 + }, + { + "epoch": 1.58, + "learning_rate": 9.630406931136374e-07, + "loss": 0.748, + "step": 61616 + }, + { + "epoch": 1.58, + "learning_rate": 9.630130415791386e-07, + "loss": 0.7637, + "step": 61617 + }, + { + "epoch": 1.58, + "learning_rate": 9.629853900729586e-07, + "loss": 0.5967, + "step": 61618 + }, + { + "epoch": 1.58, + "learning_rate": 9.629577385951194e-07, + "loss": 0.6772, + "step": 61619 + }, + { + "epoch": 1.58, + "learning_rate": 9.629300871456415e-07, + "loss": 0.7686, + "step": 61620 + }, + { + "epoch": 1.58, + "learning_rate": 9.629024357245469e-07, + "loss": 0.708, + "step": 61621 + }, + { + "epoch": 1.58, + "learning_rate": 9.628747843318558e-07, + "loss": 0.5854, + "step": 61622 + }, + { + "epoch": 1.58, + "learning_rate": 9.628471329675897e-07, + "loss": 0.6411, + "step": 61623 + }, + { + "epoch": 1.58, + "learning_rate": 9.628194816317699e-07, + "loss": 0.7197, + "step": 61624 + }, + { + "epoch": 1.58, + "learning_rate": 9.627918303244171e-07, + "loss": 0.6763, + "step": 61625 + }, + { + "epoch": 1.58, + "learning_rate": 9.627641790455535e-07, + "loss": 0.449, + "step": 61626 + }, + { + "epoch": 1.58, + "learning_rate": 9.627365277951994e-07, + "loss": 0.666, + "step": 61627 + }, + { + "epoch": 1.58, + "learning_rate": 9.627088765733762e-07, + "loss": 0.6499, + "step": 61628 + }, + { + "epoch": 1.58, + "learning_rate": 9.62681225380105e-07, + "loss": 0.625, + "step": 61629 + }, + { + "epoch": 1.58, + "learning_rate": 9.626535742154073e-07, + "loss": 0.7422, + "step": 61630 + }, + { + "epoch": 1.58, + "learning_rate": 9.626259230793043e-07, + "loss": 0.6523, + "step": 61631 + }, + { + "epoch": 1.58, + "learning_rate": 9.625982719718167e-07, + "loss": 0.7988, + "step": 61632 + }, + { + "epoch": 1.58, + "learning_rate": 9.625706208929657e-07, + "loss": 0.668, + "step": 61633 + }, + { + "epoch": 1.58, + "learning_rate": 9.625429698427728e-07, + "loss": 0.7236, + "step": 61634 + }, + { + "epoch": 1.58, + "learning_rate": 9.625153188212588e-07, + "loss": 0.8213, + "step": 61635 + }, + { + "epoch": 1.58, + "learning_rate": 9.624876678284452e-07, + "loss": 0.6543, + "step": 61636 + }, + { + "epoch": 1.58, + "learning_rate": 9.62460016864353e-07, + "loss": 0.6577, + "step": 61637 + }, + { + "epoch": 1.58, + "learning_rate": 9.624323659290036e-07, + "loss": 0.4976, + "step": 61638 + }, + { + "epoch": 1.58, + "learning_rate": 9.62404715022418e-07, + "loss": 0.6416, + "step": 61639 + }, + { + "epoch": 1.58, + "learning_rate": 9.623770641446172e-07, + "loss": 0.493, + "step": 61640 + }, + { + "epoch": 1.58, + "learning_rate": 9.62349413295623e-07, + "loss": 0.5718, + "step": 61641 + }, + { + "epoch": 1.58, + "learning_rate": 9.623217624754557e-07, + "loss": 0.5129, + "step": 61642 + }, + { + "epoch": 1.58, + "learning_rate": 9.622941116841373e-07, + "loss": 0.6313, + "step": 61643 + }, + { + "epoch": 1.58, + "learning_rate": 9.62266460921688e-07, + "loss": 0.6543, + "step": 61644 + }, + { + "epoch": 1.58, + "learning_rate": 9.622388101881299e-07, + "loss": 0.6338, + "step": 61645 + }, + { + "epoch": 1.58, + "learning_rate": 9.622111594834837e-07, + "loss": 0.4424, + "step": 61646 + }, + { + "epoch": 1.58, + "learning_rate": 9.621835088077706e-07, + "loss": 0.7803, + "step": 61647 + }, + { + "epoch": 1.58, + "learning_rate": 9.62155858161012e-07, + "loss": 0.6421, + "step": 61648 + }, + { + "epoch": 1.58, + "learning_rate": 9.621282075432287e-07, + "loss": 0.5938, + "step": 61649 + }, + { + "epoch": 1.58, + "learning_rate": 9.621005569544424e-07, + "loss": 0.5356, + "step": 61650 + }, + { + "epoch": 1.58, + "learning_rate": 9.620729063946742e-07, + "loss": 0.6865, + "step": 61651 + }, + { + "epoch": 1.58, + "learning_rate": 9.620452558639444e-07, + "loss": 0.7227, + "step": 61652 + }, + { + "epoch": 1.58, + "learning_rate": 9.620176053622752e-07, + "loss": 0.6963, + "step": 61653 + }, + { + "epoch": 1.58, + "learning_rate": 9.61989954889687e-07, + "loss": 0.626, + "step": 61654 + }, + { + "epoch": 1.58, + "learning_rate": 9.619623044462018e-07, + "loss": 0.552, + "step": 61655 + }, + { + "epoch": 1.58, + "learning_rate": 9.619346540318397e-07, + "loss": 0.6086, + "step": 61656 + }, + { + "epoch": 1.58, + "learning_rate": 9.619070036466232e-07, + "loss": 0.6138, + "step": 61657 + }, + { + "epoch": 1.58, + "learning_rate": 9.618793532905723e-07, + "loss": 0.6689, + "step": 61658 + }, + { + "epoch": 1.58, + "learning_rate": 9.618517029637088e-07, + "loss": 0.3191, + "step": 61659 + }, + { + "epoch": 1.58, + "learning_rate": 9.618240526660534e-07, + "loss": 0.708, + "step": 61660 + }, + { + "epoch": 1.58, + "learning_rate": 9.61796402397628e-07, + "loss": 0.5283, + "step": 61661 + }, + { + "epoch": 1.58, + "learning_rate": 9.617687521584534e-07, + "loss": 0.7788, + "step": 61662 + }, + { + "epoch": 1.58, + "learning_rate": 9.617411019485502e-07, + "loss": 0.5762, + "step": 61663 + }, + { + "epoch": 1.58, + "learning_rate": 9.617134517679404e-07, + "loss": 0.5405, + "step": 61664 + }, + { + "epoch": 1.58, + "learning_rate": 9.616858016166447e-07, + "loss": 0.6821, + "step": 61665 + }, + { + "epoch": 1.58, + "learning_rate": 9.616581514946846e-07, + "loss": 0.7852, + "step": 61666 + }, + { + "epoch": 1.58, + "learning_rate": 9.616305014020809e-07, + "loss": 0.7432, + "step": 61667 + }, + { + "epoch": 1.58, + "learning_rate": 9.61602851338855e-07, + "loss": 0.5564, + "step": 61668 + }, + { + "epoch": 1.58, + "learning_rate": 9.615752013050284e-07, + "loss": 0.5366, + "step": 61669 + }, + { + "epoch": 1.58, + "learning_rate": 9.615475513006214e-07, + "loss": 0.5908, + "step": 61670 + }, + { + "epoch": 1.58, + "learning_rate": 9.615199013256561e-07, + "loss": 0.5171, + "step": 61671 + }, + { + "epoch": 1.58, + "learning_rate": 9.61492251380153e-07, + "loss": 0.6504, + "step": 61672 + }, + { + "epoch": 1.58, + "learning_rate": 9.614646014641334e-07, + "loss": 0.5913, + "step": 61673 + }, + { + "epoch": 1.58, + "learning_rate": 9.614369515776188e-07, + "loss": 0.5981, + "step": 61674 + }, + { + "epoch": 1.58, + "learning_rate": 9.6140930172063e-07, + "loss": 0.7939, + "step": 61675 + }, + { + "epoch": 1.58, + "learning_rate": 9.613816518931885e-07, + "loss": 0.5391, + "step": 61676 + }, + { + "epoch": 1.58, + "learning_rate": 9.61354002095315e-07, + "loss": 0.5908, + "step": 61677 + }, + { + "epoch": 1.58, + "learning_rate": 9.613263523270313e-07, + "loss": 0.7393, + "step": 61678 + }, + { + "epoch": 1.58, + "learning_rate": 9.612987025883577e-07, + "loss": 0.6558, + "step": 61679 + }, + { + "epoch": 1.58, + "learning_rate": 9.612710528793164e-07, + "loss": 0.5732, + "step": 61680 + }, + { + "epoch": 1.58, + "learning_rate": 9.612434031999282e-07, + "loss": 0.4714, + "step": 61681 + }, + { + "epoch": 1.58, + "learning_rate": 9.612157535502138e-07, + "loss": 0.6475, + "step": 61682 + }, + { + "epoch": 1.58, + "learning_rate": 9.611881039301948e-07, + "loss": 0.6528, + "step": 61683 + }, + { + "epoch": 1.58, + "learning_rate": 9.611604543398922e-07, + "loss": 0.6367, + "step": 61684 + }, + { + "epoch": 1.58, + "learning_rate": 9.611328047793275e-07, + "loss": 0.6543, + "step": 61685 + }, + { + "epoch": 1.58, + "learning_rate": 9.611051552485215e-07, + "loss": 0.7236, + "step": 61686 + }, + { + "epoch": 1.58, + "learning_rate": 9.610775057474954e-07, + "loss": 0.6006, + "step": 61687 + }, + { + "epoch": 1.58, + "learning_rate": 9.610498562762706e-07, + "loss": 0.7607, + "step": 61688 + }, + { + "epoch": 1.58, + "learning_rate": 9.61022206834868e-07, + "loss": 0.5713, + "step": 61689 + }, + { + "epoch": 1.58, + "learning_rate": 9.60994557423309e-07, + "loss": 0.7646, + "step": 61690 + }, + { + "epoch": 1.58, + "learning_rate": 9.609669080416147e-07, + "loss": 0.6387, + "step": 61691 + }, + { + "epoch": 1.58, + "learning_rate": 9.609392586898061e-07, + "loss": 0.3875, + "step": 61692 + }, + { + "epoch": 1.58, + "learning_rate": 9.609116093679048e-07, + "loss": 0.6592, + "step": 61693 + }, + { + "epoch": 1.58, + "learning_rate": 9.608839600759312e-07, + "loss": 0.5747, + "step": 61694 + }, + { + "epoch": 1.58, + "learning_rate": 9.608563108139073e-07, + "loss": 0.6855, + "step": 61695 + }, + { + "epoch": 1.58, + "learning_rate": 9.60828661581854e-07, + "loss": 0.4943, + "step": 61696 + }, + { + "epoch": 1.58, + "learning_rate": 9.608010123797923e-07, + "loss": 0.5142, + "step": 61697 + }, + { + "epoch": 1.58, + "learning_rate": 9.60773363207743e-07, + "loss": 0.6509, + "step": 61698 + }, + { + "epoch": 1.58, + "learning_rate": 9.607457140657283e-07, + "loss": 0.7314, + "step": 61699 + }, + { + "epoch": 1.58, + "learning_rate": 9.607180649537685e-07, + "loss": 0.8223, + "step": 61700 + }, + { + "epoch": 1.58, + "learning_rate": 9.606904158718856e-07, + "loss": 0.6401, + "step": 61701 + }, + { + "epoch": 1.58, + "learning_rate": 9.606627668200998e-07, + "loss": 0.6157, + "step": 61702 + }, + { + "epoch": 1.58, + "learning_rate": 9.60635117798433e-07, + "loss": 0.5398, + "step": 61703 + }, + { + "epoch": 1.58, + "learning_rate": 9.606074688069058e-07, + "loss": 0.4568, + "step": 61704 + }, + { + "epoch": 1.58, + "learning_rate": 9.605798198455395e-07, + "loss": 0.7295, + "step": 61705 + }, + { + "epoch": 1.58, + "learning_rate": 9.605521709143556e-07, + "loss": 0.6626, + "step": 61706 + }, + { + "epoch": 1.58, + "learning_rate": 9.605245220133753e-07, + "loss": 0.6523, + "step": 61707 + }, + { + "epoch": 1.58, + "learning_rate": 9.604968731426191e-07, + "loss": 0.625, + "step": 61708 + }, + { + "epoch": 1.58, + "learning_rate": 9.60469224302109e-07, + "loss": 0.6641, + "step": 61709 + }, + { + "epoch": 1.58, + "learning_rate": 9.604415754918656e-07, + "loss": 0.699, + "step": 61710 + }, + { + "epoch": 1.58, + "learning_rate": 9.604139267119105e-07, + "loss": 0.6641, + "step": 61711 + }, + { + "epoch": 1.58, + "learning_rate": 9.603862779622646e-07, + "loss": 0.6709, + "step": 61712 + }, + { + "epoch": 1.58, + "learning_rate": 9.603586292429489e-07, + "loss": 0.5723, + "step": 61713 + }, + { + "epoch": 1.58, + "learning_rate": 9.60330980553985e-07, + "loss": 0.5786, + "step": 61714 + }, + { + "epoch": 1.58, + "learning_rate": 9.603033318953935e-07, + "loss": 0.5415, + "step": 61715 + }, + { + "epoch": 1.58, + "learning_rate": 9.602756832671963e-07, + "loss": 0.5161, + "step": 61716 + }, + { + "epoch": 1.58, + "learning_rate": 9.602480346694136e-07, + "loss": 0.7588, + "step": 61717 + }, + { + "epoch": 1.58, + "learning_rate": 9.602203861020679e-07, + "loss": 0.616, + "step": 61718 + }, + { + "epoch": 1.58, + "learning_rate": 9.60192737565179e-07, + "loss": 0.6826, + "step": 61719 + }, + { + "epoch": 1.58, + "learning_rate": 9.60165089058769e-07, + "loss": 0.4333, + "step": 61720 + }, + { + "epoch": 1.58, + "learning_rate": 9.601374405828593e-07, + "loss": 0.7559, + "step": 61721 + }, + { + "epoch": 1.58, + "learning_rate": 9.6010979213747e-07, + "loss": 0.6172, + "step": 61722 + }, + { + "epoch": 1.58, + "learning_rate": 9.600821437226225e-07, + "loss": 0.6594, + "step": 61723 + }, + { + "epoch": 1.58, + "learning_rate": 9.600544953383385e-07, + "loss": 0.4338, + "step": 61724 + }, + { + "epoch": 1.58, + "learning_rate": 9.60026846984639e-07, + "loss": 0.7109, + "step": 61725 + }, + { + "epoch": 1.58, + "learning_rate": 9.599991986615452e-07, + "loss": 0.5352, + "step": 61726 + }, + { + "epoch": 1.58, + "learning_rate": 9.59971550369078e-07, + "loss": 0.6411, + "step": 61727 + }, + { + "epoch": 1.58, + "learning_rate": 9.599439021072586e-07, + "loss": 0.7729, + "step": 61728 + }, + { + "epoch": 1.58, + "learning_rate": 9.599162538761085e-07, + "loss": 0.4937, + "step": 61729 + }, + { + "epoch": 1.58, + "learning_rate": 9.598886056756487e-07, + "loss": 0.7261, + "step": 61730 + }, + { + "epoch": 1.58, + "learning_rate": 9.598609575059006e-07, + "loss": 0.407, + "step": 61731 + }, + { + "epoch": 1.58, + "learning_rate": 9.598333093668846e-07, + "loss": 0.5642, + "step": 61732 + }, + { + "epoch": 1.58, + "learning_rate": 9.598056612586229e-07, + "loss": 0.6699, + "step": 61733 + }, + { + "epoch": 1.58, + "learning_rate": 9.597780131811357e-07, + "loss": 0.5316, + "step": 61734 + }, + { + "epoch": 1.58, + "learning_rate": 9.597503651344448e-07, + "loss": 0.6543, + "step": 61735 + }, + { + "epoch": 1.58, + "learning_rate": 9.59722717118571e-07, + "loss": 0.6758, + "step": 61736 + }, + { + "epoch": 1.58, + "learning_rate": 9.596950691335361e-07, + "loss": 0.6465, + "step": 61737 + }, + { + "epoch": 1.58, + "learning_rate": 9.596674211793605e-07, + "loss": 0.7178, + "step": 61738 + }, + { + "epoch": 1.58, + "learning_rate": 9.59639773256066e-07, + "loss": 0.4648, + "step": 61739 + }, + { + "epoch": 1.58, + "learning_rate": 9.596121253636729e-07, + "loss": 0.6577, + "step": 61740 + }, + { + "epoch": 1.58, + "learning_rate": 9.59584477502204e-07, + "loss": 0.6787, + "step": 61741 + }, + { + "epoch": 1.58, + "learning_rate": 9.595568296716786e-07, + "loss": 0.5386, + "step": 61742 + }, + { + "epoch": 1.58, + "learning_rate": 9.595291818721188e-07, + "loss": 0.7666, + "step": 61743 + }, + { + "epoch": 1.58, + "learning_rate": 9.595015341035455e-07, + "loss": 0.5469, + "step": 61744 + }, + { + "epoch": 1.58, + "learning_rate": 9.594738863659803e-07, + "loss": 0.4487, + "step": 61745 + }, + { + "epoch": 1.58, + "learning_rate": 9.594462386594438e-07, + "loss": 0.5015, + "step": 61746 + }, + { + "epoch": 1.58, + "learning_rate": 9.594185909839577e-07, + "loss": 0.7354, + "step": 61747 + }, + { + "epoch": 1.58, + "learning_rate": 9.593909433395426e-07, + "loss": 0.5073, + "step": 61748 + }, + { + "epoch": 1.58, + "learning_rate": 9.593632957262202e-07, + "loss": 0.6333, + "step": 61749 + }, + { + "epoch": 1.58, + "learning_rate": 9.593356481440115e-07, + "loss": 0.6377, + "step": 61750 + }, + { + "epoch": 1.58, + "learning_rate": 9.593080005929378e-07, + "loss": 0.551, + "step": 61751 + }, + { + "epoch": 1.58, + "learning_rate": 9.5928035307302e-07, + "loss": 0.7295, + "step": 61752 + }, + { + "epoch": 1.58, + "learning_rate": 9.59252705584279e-07, + "loss": 0.7734, + "step": 61753 + }, + { + "epoch": 1.58, + "learning_rate": 9.592250581267368e-07, + "loss": 0.5841, + "step": 61754 + }, + { + "epoch": 1.58, + "learning_rate": 9.591974107004136e-07, + "loss": 0.8115, + "step": 61755 + }, + { + "epoch": 1.58, + "learning_rate": 9.591697633053314e-07, + "loss": 0.6025, + "step": 61756 + }, + { + "epoch": 1.58, + "learning_rate": 9.591421159415108e-07, + "loss": 0.6475, + "step": 61757 + }, + { + "epoch": 1.58, + "learning_rate": 9.591144686089735e-07, + "loss": 0.6084, + "step": 61758 + }, + { + "epoch": 1.58, + "learning_rate": 9.590868213077404e-07, + "loss": 0.8398, + "step": 61759 + }, + { + "epoch": 1.58, + "learning_rate": 9.590591740378327e-07, + "loss": 0.7686, + "step": 61760 + }, + { + "epoch": 1.58, + "learning_rate": 9.590315267992712e-07, + "loss": 0.7637, + "step": 61761 + }, + { + "epoch": 1.58, + "learning_rate": 9.590038795920776e-07, + "loss": 0.5205, + "step": 61762 + }, + { + "epoch": 1.58, + "learning_rate": 9.589762324162725e-07, + "loss": 0.6836, + "step": 61763 + }, + { + "epoch": 1.58, + "learning_rate": 9.589485852718777e-07, + "loss": 0.5947, + "step": 61764 + }, + { + "epoch": 1.58, + "learning_rate": 9.58920938158914e-07, + "loss": 0.6777, + "step": 61765 + }, + { + "epoch": 1.58, + "learning_rate": 9.588932910774027e-07, + "loss": 0.6719, + "step": 61766 + }, + { + "epoch": 1.58, + "learning_rate": 9.588656440273646e-07, + "loss": 0.6113, + "step": 61767 + }, + { + "epoch": 1.58, + "learning_rate": 9.588379970088215e-07, + "loss": 0.5601, + "step": 61768 + }, + { + "epoch": 1.58, + "learning_rate": 9.58810350021794e-07, + "loss": 0.5659, + "step": 61769 + }, + { + "epoch": 1.58, + "learning_rate": 9.587827030663041e-07, + "loss": 0.6865, + "step": 61770 + }, + { + "epoch": 1.58, + "learning_rate": 9.587550561423721e-07, + "loss": 0.7402, + "step": 61771 + }, + { + "epoch": 1.58, + "learning_rate": 9.587274092500192e-07, + "loss": 0.603, + "step": 61772 + }, + { + "epoch": 1.58, + "learning_rate": 9.586997623892671e-07, + "loss": 0.7227, + "step": 61773 + }, + { + "epoch": 1.58, + "learning_rate": 9.586721155601363e-07, + "loss": 0.6846, + "step": 61774 + }, + { + "epoch": 1.58, + "learning_rate": 9.586444687626487e-07, + "loss": 0.5178, + "step": 61775 + }, + { + "epoch": 1.58, + "learning_rate": 9.586168219968254e-07, + "loss": 0.5518, + "step": 61776 + }, + { + "epoch": 1.58, + "learning_rate": 9.585891752626868e-07, + "loss": 0.7695, + "step": 61777 + }, + { + "epoch": 1.58, + "learning_rate": 9.585615285602547e-07, + "loss": 0.4602, + "step": 61778 + }, + { + "epoch": 1.58, + "learning_rate": 9.585338818895502e-07, + "loss": 0.6343, + "step": 61779 + }, + { + "epoch": 1.58, + "learning_rate": 9.585062352505946e-07, + "loss": 0.624, + "step": 61780 + }, + { + "epoch": 1.58, + "learning_rate": 9.584785886434086e-07, + "loss": 0.6294, + "step": 61781 + }, + { + "epoch": 1.58, + "learning_rate": 9.584509420680135e-07, + "loss": 0.6719, + "step": 61782 + }, + { + "epoch": 1.58, + "learning_rate": 9.58423295524431e-07, + "loss": 0.7002, + "step": 61783 + }, + { + "epoch": 1.58, + "learning_rate": 9.583956490126814e-07, + "loss": 0.5298, + "step": 61784 + }, + { + "epoch": 1.58, + "learning_rate": 9.583680025327867e-07, + "loss": 0.7588, + "step": 61785 + }, + { + "epoch": 1.58, + "learning_rate": 9.583403560847675e-07, + "loss": 0.4594, + "step": 61786 + }, + { + "epoch": 1.58, + "learning_rate": 9.583127096686453e-07, + "loss": 0.5571, + "step": 61787 + }, + { + "epoch": 1.58, + "learning_rate": 9.58285063284441e-07, + "loss": 0.6982, + "step": 61788 + }, + { + "epoch": 1.58, + "learning_rate": 9.582574169321762e-07, + "loss": 0.5469, + "step": 61789 + }, + { + "epoch": 1.58, + "learning_rate": 9.582297706118718e-07, + "loss": 0.6074, + "step": 61790 + }, + { + "epoch": 1.58, + "learning_rate": 9.582021243235487e-07, + "loss": 0.6289, + "step": 61791 + }, + { + "epoch": 1.58, + "learning_rate": 9.581744780672283e-07, + "loss": 0.7227, + "step": 61792 + }, + { + "epoch": 1.58, + "learning_rate": 9.58146831842932e-07, + "loss": 0.6914, + "step": 61793 + }, + { + "epoch": 1.58, + "learning_rate": 9.581191856506803e-07, + "loss": 0.7246, + "step": 61794 + }, + { + "epoch": 1.58, + "learning_rate": 9.580915394904953e-07, + "loss": 0.7705, + "step": 61795 + }, + { + "epoch": 1.58, + "learning_rate": 9.580638933623973e-07, + "loss": 0.5115, + "step": 61796 + }, + { + "epoch": 1.58, + "learning_rate": 9.58036247266408e-07, + "loss": 0.5595, + "step": 61797 + }, + { + "epoch": 1.58, + "learning_rate": 9.580086012025484e-07, + "loss": 0.6753, + "step": 61798 + }, + { + "epoch": 1.58, + "learning_rate": 9.579809551708398e-07, + "loss": 0.6929, + "step": 61799 + }, + { + "epoch": 1.58, + "learning_rate": 9.579533091713034e-07, + "loss": 0.5366, + "step": 61800 + }, + { + "epoch": 1.58, + "learning_rate": 9.579256632039598e-07, + "loss": 0.7832, + "step": 61801 + }, + { + "epoch": 1.58, + "learning_rate": 9.57898017268831e-07, + "loss": 0.5342, + "step": 61802 + }, + { + "epoch": 1.58, + "learning_rate": 9.578703713659372e-07, + "loss": 0.6895, + "step": 61803 + }, + { + "epoch": 1.58, + "learning_rate": 9.578427254953007e-07, + "loss": 0.751, + "step": 61804 + }, + { + "epoch": 1.58, + "learning_rate": 9.578150796569417e-07, + "loss": 0.8105, + "step": 61805 + }, + { + "epoch": 1.58, + "learning_rate": 9.577874338508819e-07, + "loss": 0.7588, + "step": 61806 + }, + { + "epoch": 1.58, + "learning_rate": 9.57759788077142e-07, + "loss": 0.7549, + "step": 61807 + }, + { + "epoch": 1.58, + "learning_rate": 9.57732142335744e-07, + "loss": 0.6409, + "step": 61808 + }, + { + "epoch": 1.58, + "learning_rate": 9.577044966267082e-07, + "loss": 0.877, + "step": 61809 + }, + { + "epoch": 1.58, + "learning_rate": 9.576768509500568e-07, + "loss": 0.7119, + "step": 61810 + }, + { + "epoch": 1.58, + "learning_rate": 9.576492053058096e-07, + "loss": 0.6133, + "step": 61811 + }, + { + "epoch": 1.58, + "learning_rate": 9.576215596939888e-07, + "loss": 0.5669, + "step": 61812 + }, + { + "epoch": 1.58, + "learning_rate": 9.575939141146147e-07, + "loss": 0.7559, + "step": 61813 + }, + { + "epoch": 1.58, + "learning_rate": 9.575662685677094e-07, + "loss": 0.7998, + "step": 61814 + }, + { + "epoch": 1.58, + "learning_rate": 9.575386230532936e-07, + "loss": 0.791, + "step": 61815 + }, + { + "epoch": 1.58, + "learning_rate": 9.575109775713886e-07, + "loss": 0.5601, + "step": 61816 + }, + { + "epoch": 1.58, + "learning_rate": 9.574833321220151e-07, + "loss": 0.6387, + "step": 61817 + }, + { + "epoch": 1.58, + "learning_rate": 9.57455686705195e-07, + "loss": 0.4011, + "step": 61818 + }, + { + "epoch": 1.58, + "learning_rate": 9.57428041320949e-07, + "loss": 0.5176, + "step": 61819 + }, + { + "epoch": 1.58, + "learning_rate": 9.57400395969299e-07, + "loss": 0.6084, + "step": 61820 + }, + { + "epoch": 1.58, + "learning_rate": 9.573727506502648e-07, + "loss": 0.4901, + "step": 61821 + }, + { + "epoch": 1.58, + "learning_rate": 9.573451053638686e-07, + "loss": 0.6396, + "step": 61822 + }, + { + "epoch": 1.58, + "learning_rate": 9.573174601101312e-07, + "loss": 0.4089, + "step": 61823 + }, + { + "epoch": 1.58, + "learning_rate": 9.57289814889074e-07, + "loss": 0.6084, + "step": 61824 + }, + { + "epoch": 1.58, + "learning_rate": 9.572621697007178e-07, + "loss": 0.6411, + "step": 61825 + }, + { + "epoch": 1.58, + "learning_rate": 9.572345245450841e-07, + "loss": 0.7266, + "step": 61826 + }, + { + "epoch": 1.58, + "learning_rate": 9.57206879422194e-07, + "loss": 0.6025, + "step": 61827 + }, + { + "epoch": 1.58, + "learning_rate": 9.571792343320684e-07, + "loss": 0.7378, + "step": 61828 + }, + { + "epoch": 1.58, + "learning_rate": 9.57151589274729e-07, + "loss": 0.6797, + "step": 61829 + }, + { + "epoch": 1.58, + "learning_rate": 9.57123944250197e-07, + "loss": 0.5596, + "step": 61830 + }, + { + "epoch": 1.58, + "learning_rate": 9.570962992584928e-07, + "loss": 0.6904, + "step": 61831 + }, + { + "epoch": 1.58, + "learning_rate": 9.570686542996378e-07, + "loss": 0.5645, + "step": 61832 + }, + { + "epoch": 1.58, + "learning_rate": 9.570410093736537e-07, + "loss": 0.572, + "step": 61833 + }, + { + "epoch": 1.58, + "learning_rate": 9.570133644805609e-07, + "loss": 0.5603, + "step": 61834 + }, + { + "epoch": 1.58, + "learning_rate": 9.569857196203814e-07, + "loss": 0.5615, + "step": 61835 + }, + { + "epoch": 1.58, + "learning_rate": 9.569580747931357e-07, + "loss": 0.7715, + "step": 61836 + }, + { + "epoch": 1.58, + "learning_rate": 9.569304299988452e-07, + "loss": 0.5496, + "step": 61837 + }, + { + "epoch": 1.58, + "learning_rate": 9.56902785237531e-07, + "loss": 0.5205, + "step": 61838 + }, + { + "epoch": 1.58, + "learning_rate": 9.568751405092147e-07, + "loss": 0.6841, + "step": 61839 + }, + { + "epoch": 1.58, + "learning_rate": 9.568474958139173e-07, + "loss": 0.793, + "step": 61840 + }, + { + "epoch": 1.59, + "learning_rate": 9.568198511516593e-07, + "loss": 0.606, + "step": 61841 + }, + { + "epoch": 1.59, + "learning_rate": 9.567922065224628e-07, + "loss": 0.6963, + "step": 61842 + }, + { + "epoch": 1.59, + "learning_rate": 9.56764561926348e-07, + "loss": 0.6299, + "step": 61843 + }, + { + "epoch": 1.59, + "learning_rate": 9.56736917363337e-07, + "loss": 0.7305, + "step": 61844 + }, + { + "epoch": 1.59, + "learning_rate": 9.567092728334502e-07, + "loss": 0.665, + "step": 61845 + }, + { + "epoch": 1.59, + "learning_rate": 9.566816283367093e-07, + "loss": 0.5249, + "step": 61846 + }, + { + "epoch": 1.59, + "learning_rate": 9.566539838731352e-07, + "loss": 0.4888, + "step": 61847 + }, + { + "epoch": 1.59, + "learning_rate": 9.566263394427494e-07, + "loss": 0.5615, + "step": 61848 + }, + { + "epoch": 1.59, + "learning_rate": 9.565986950455726e-07, + "loss": 0.5494, + "step": 61849 + }, + { + "epoch": 1.59, + "learning_rate": 9.565710506816268e-07, + "loss": 0.4373, + "step": 61850 + }, + { + "epoch": 1.59, + "learning_rate": 9.565434063509317e-07, + "loss": 0.8018, + "step": 61851 + }, + { + "epoch": 1.59, + "learning_rate": 9.565157620535097e-07, + "loss": 0.3726, + "step": 61852 + }, + { + "epoch": 1.59, + "learning_rate": 9.564881177893814e-07, + "loss": 0.5945, + "step": 61853 + }, + { + "epoch": 1.59, + "learning_rate": 9.564604735585682e-07, + "loss": 0.6575, + "step": 61854 + }, + { + "epoch": 1.59, + "learning_rate": 9.564328293610912e-07, + "loss": 0.6228, + "step": 61855 + }, + { + "epoch": 1.59, + "learning_rate": 9.564051851969717e-07, + "loss": 0.6484, + "step": 61856 + }, + { + "epoch": 1.59, + "learning_rate": 9.563775410662304e-07, + "loss": 0.79, + "step": 61857 + }, + { + "epoch": 1.59, + "learning_rate": 9.563498969688894e-07, + "loss": 0.6689, + "step": 61858 + }, + { + "epoch": 1.59, + "learning_rate": 9.563222529049686e-07, + "loss": 0.6902, + "step": 61859 + }, + { + "epoch": 1.59, + "learning_rate": 9.562946088744906e-07, + "loss": 0.6621, + "step": 61860 + }, + { + "epoch": 1.59, + "learning_rate": 9.562669648774754e-07, + "loss": 0.6572, + "step": 61861 + }, + { + "epoch": 1.59, + "learning_rate": 9.562393209139445e-07, + "loss": 0.8711, + "step": 61862 + }, + { + "epoch": 1.59, + "learning_rate": 9.562116769839195e-07, + "loss": 0.6069, + "step": 61863 + }, + { + "epoch": 1.59, + "learning_rate": 9.561840330874206e-07, + "loss": 0.6543, + "step": 61864 + }, + { + "epoch": 1.59, + "learning_rate": 9.5615638922447e-07, + "loss": 0.7744, + "step": 61865 + }, + { + "epoch": 1.59, + "learning_rate": 9.561287453950884e-07, + "loss": 0.533, + "step": 61866 + }, + { + "epoch": 1.59, + "learning_rate": 9.56101101599297e-07, + "loss": 0.6519, + "step": 61867 + }, + { + "epoch": 1.59, + "learning_rate": 9.56073457837117e-07, + "loss": 0.5522, + "step": 61868 + }, + { + "epoch": 1.59, + "learning_rate": 9.560458141085693e-07, + "loss": 0.6201, + "step": 61869 + }, + { + "epoch": 1.59, + "learning_rate": 9.560181704136755e-07, + "loss": 0.6836, + "step": 61870 + }, + { + "epoch": 1.59, + "learning_rate": 9.559905267524568e-07, + "loss": 0.6719, + "step": 61871 + }, + { + "epoch": 1.59, + "learning_rate": 9.559628831249337e-07, + "loss": 0.6816, + "step": 61872 + }, + { + "epoch": 1.59, + "learning_rate": 9.55935239531128e-07, + "loss": 0.5591, + "step": 61873 + }, + { + "epoch": 1.59, + "learning_rate": 9.559075959710603e-07, + "loss": 0.4646, + "step": 61874 + }, + { + "epoch": 1.59, + "learning_rate": 9.558799524447526e-07, + "loss": 0.6104, + "step": 61875 + }, + { + "epoch": 1.59, + "learning_rate": 9.558523089522254e-07, + "loss": 0.668, + "step": 61876 + }, + { + "epoch": 1.59, + "learning_rate": 9.558246654935e-07, + "loss": 0.6963, + "step": 61877 + }, + { + "epoch": 1.59, + "learning_rate": 9.557970220685976e-07, + "loss": 0.7432, + "step": 61878 + }, + { + "epoch": 1.59, + "learning_rate": 9.557693786775397e-07, + "loss": 0.541, + "step": 61879 + }, + { + "epoch": 1.59, + "learning_rate": 9.557417353203471e-07, + "loss": 0.6079, + "step": 61880 + }, + { + "epoch": 1.59, + "learning_rate": 9.557140919970408e-07, + "loss": 0.4531, + "step": 61881 + }, + { + "epoch": 1.59, + "learning_rate": 9.556864487076422e-07, + "loss": 0.6499, + "step": 61882 + }, + { + "epoch": 1.59, + "learning_rate": 9.556588054521726e-07, + "loss": 0.5444, + "step": 61883 + }, + { + "epoch": 1.59, + "learning_rate": 9.556311622306528e-07, + "loss": 0.6714, + "step": 61884 + }, + { + "epoch": 1.59, + "learning_rate": 9.556035190431044e-07, + "loss": 0.5049, + "step": 61885 + }, + { + "epoch": 1.59, + "learning_rate": 9.555758758895481e-07, + "loss": 0.7695, + "step": 61886 + }, + { + "epoch": 1.59, + "learning_rate": 9.555482327700053e-07, + "loss": 0.4585, + "step": 61887 + }, + { + "epoch": 1.59, + "learning_rate": 9.555205896844973e-07, + "loss": 0.748, + "step": 61888 + }, + { + "epoch": 1.59, + "learning_rate": 9.554929466330454e-07, + "loss": 0.7432, + "step": 61889 + }, + { + "epoch": 1.59, + "learning_rate": 9.554653036156704e-07, + "loss": 0.6494, + "step": 61890 + }, + { + "epoch": 1.59, + "learning_rate": 9.554376606323933e-07, + "loss": 0.4958, + "step": 61891 + }, + { + "epoch": 1.59, + "learning_rate": 9.554100176832356e-07, + "loss": 0.6357, + "step": 61892 + }, + { + "epoch": 1.59, + "learning_rate": 9.553823747682184e-07, + "loss": 0.7529, + "step": 61893 + }, + { + "epoch": 1.59, + "learning_rate": 9.55354731887363e-07, + "loss": 0.7178, + "step": 61894 + }, + { + "epoch": 1.59, + "learning_rate": 9.553270890406903e-07, + "loss": 0.4391, + "step": 61895 + }, + { + "epoch": 1.59, + "learning_rate": 9.552994462282217e-07, + "loss": 0.7012, + "step": 61896 + }, + { + "epoch": 1.59, + "learning_rate": 9.55271803449978e-07, + "loss": 0.5161, + "step": 61897 + }, + { + "epoch": 1.59, + "learning_rate": 9.552441607059809e-07, + "loss": 0.6562, + "step": 61898 + }, + { + "epoch": 1.59, + "learning_rate": 9.55216517996251e-07, + "loss": 0.6904, + "step": 61899 + }, + { + "epoch": 1.59, + "learning_rate": 9.551888753208105e-07, + "loss": 0.5854, + "step": 61900 + }, + { + "epoch": 1.59, + "learning_rate": 9.55161232679679e-07, + "loss": 0.6338, + "step": 61901 + }, + { + "epoch": 1.59, + "learning_rate": 9.55133590072879e-07, + "loss": 0.5752, + "step": 61902 + }, + { + "epoch": 1.59, + "learning_rate": 9.55105947500431e-07, + "loss": 0.583, + "step": 61903 + }, + { + "epoch": 1.59, + "learning_rate": 9.55078304962356e-07, + "loss": 0.6204, + "step": 61904 + }, + { + "epoch": 1.59, + "learning_rate": 9.550506624586757e-07, + "loss": 0.7412, + "step": 61905 + }, + { + "epoch": 1.59, + "learning_rate": 9.55023019989411e-07, + "loss": 0.6504, + "step": 61906 + }, + { + "epoch": 1.59, + "learning_rate": 9.549953775545832e-07, + "loss": 0.7695, + "step": 61907 + }, + { + "epoch": 1.59, + "learning_rate": 9.549677351542133e-07, + "loss": 0.5449, + "step": 61908 + }, + { + "epoch": 1.59, + "learning_rate": 9.549400927883225e-07, + "loss": 0.4722, + "step": 61909 + }, + { + "epoch": 1.59, + "learning_rate": 9.549124504569321e-07, + "loss": 0.5757, + "step": 61910 + }, + { + "epoch": 1.59, + "learning_rate": 9.548848081600633e-07, + "loss": 0.7598, + "step": 61911 + }, + { + "epoch": 1.59, + "learning_rate": 9.548571658977369e-07, + "loss": 0.5757, + "step": 61912 + }, + { + "epoch": 1.59, + "learning_rate": 9.548295236699745e-07, + "loss": 0.6338, + "step": 61913 + }, + { + "epoch": 1.59, + "learning_rate": 9.548018814767966e-07, + "loss": 0.4045, + "step": 61914 + }, + { + "epoch": 1.59, + "learning_rate": 9.547742393182252e-07, + "loss": 0.5967, + "step": 61915 + }, + { + "epoch": 1.59, + "learning_rate": 9.547465971942809e-07, + "loss": 0.7109, + "step": 61916 + }, + { + "epoch": 1.59, + "learning_rate": 9.547189551049853e-07, + "loss": 0.7559, + "step": 61917 + }, + { + "epoch": 1.59, + "learning_rate": 9.54691313050359e-07, + "loss": 0.5425, + "step": 61918 + }, + { + "epoch": 1.59, + "learning_rate": 9.546636710304237e-07, + "loss": 0.6348, + "step": 61919 + }, + { + "epoch": 1.59, + "learning_rate": 9.546360290452005e-07, + "loss": 0.667, + "step": 61920 + }, + { + "epoch": 1.59, + "learning_rate": 9.546083870947103e-07, + "loss": 0.5874, + "step": 61921 + }, + { + "epoch": 1.59, + "learning_rate": 9.545807451789741e-07, + "loss": 0.6689, + "step": 61922 + }, + { + "epoch": 1.59, + "learning_rate": 9.545531032980135e-07, + "loss": 0.6738, + "step": 61923 + }, + { + "epoch": 1.59, + "learning_rate": 9.545254614518494e-07, + "loss": 0.6274, + "step": 61924 + }, + { + "epoch": 1.59, + "learning_rate": 9.544978196405032e-07, + "loss": 0.5903, + "step": 61925 + }, + { + "epoch": 1.59, + "learning_rate": 9.544701778639957e-07, + "loss": 0.772, + "step": 61926 + }, + { + "epoch": 1.59, + "learning_rate": 9.544425361223487e-07, + "loss": 0.5024, + "step": 61927 + }, + { + "epoch": 1.59, + "learning_rate": 9.544148944155825e-07, + "loss": 0.6436, + "step": 61928 + }, + { + "epoch": 1.59, + "learning_rate": 9.54387252743719e-07, + "loss": 0.4553, + "step": 61929 + }, + { + "epoch": 1.59, + "learning_rate": 9.543596111067794e-07, + "loss": 0.751, + "step": 61930 + }, + { + "epoch": 1.59, + "learning_rate": 9.54331969504784e-07, + "loss": 0.6943, + "step": 61931 + }, + { + "epoch": 1.59, + "learning_rate": 9.543043279377549e-07, + "loss": 0.6914, + "step": 61932 + }, + { + "epoch": 1.59, + "learning_rate": 9.542766864057125e-07, + "loss": 0.8125, + "step": 61933 + }, + { + "epoch": 1.59, + "learning_rate": 9.542490449086785e-07, + "loss": 0.5635, + "step": 61934 + }, + { + "epoch": 1.59, + "learning_rate": 9.542214034466739e-07, + "loss": 0.8135, + "step": 61935 + }, + { + "epoch": 1.59, + "learning_rate": 9.541937620197197e-07, + "loss": 0.6279, + "step": 61936 + }, + { + "epoch": 1.59, + "learning_rate": 9.541661206278374e-07, + "loss": 0.6494, + "step": 61937 + }, + { + "epoch": 1.59, + "learning_rate": 9.54138479271048e-07, + "loss": 0.707, + "step": 61938 + }, + { + "epoch": 1.59, + "learning_rate": 9.541108379493727e-07, + "loss": 0.6792, + "step": 61939 + }, + { + "epoch": 1.59, + "learning_rate": 9.54083196662833e-07, + "loss": 0.5474, + "step": 61940 + }, + { + "epoch": 1.59, + "learning_rate": 9.540555554114491e-07, + "loss": 0.5957, + "step": 61941 + }, + { + "epoch": 1.59, + "learning_rate": 9.54027914195243e-07, + "loss": 0.5557, + "step": 61942 + }, + { + "epoch": 1.59, + "learning_rate": 9.540002730142354e-07, + "loss": 0.6719, + "step": 61943 + }, + { + "epoch": 1.59, + "learning_rate": 9.539726318684479e-07, + "loss": 0.5684, + "step": 61944 + }, + { + "epoch": 1.59, + "learning_rate": 9.539449907579012e-07, + "loss": 0.5581, + "step": 61945 + }, + { + "epoch": 1.59, + "learning_rate": 9.539173496826169e-07, + "loss": 0.4077, + "step": 61946 + }, + { + "epoch": 1.59, + "learning_rate": 9.538897086426158e-07, + "loss": 0.6055, + "step": 61947 + }, + { + "epoch": 1.59, + "learning_rate": 9.538620676379194e-07, + "loss": 0.7637, + "step": 61948 + }, + { + "epoch": 1.59, + "learning_rate": 9.538344266685483e-07, + "loss": 0.7617, + "step": 61949 + }, + { + "epoch": 1.59, + "learning_rate": 9.538067857345248e-07, + "loss": 0.5361, + "step": 61950 + }, + { + "epoch": 1.59, + "learning_rate": 9.537791448358689e-07, + "loss": 0.7031, + "step": 61951 + }, + { + "epoch": 1.59, + "learning_rate": 9.537515039726022e-07, + "loss": 0.6865, + "step": 61952 + }, + { + "epoch": 1.59, + "learning_rate": 9.537238631447458e-07, + "loss": 0.8125, + "step": 61953 + }, + { + "epoch": 1.59, + "learning_rate": 9.536962223523207e-07, + "loss": 0.5786, + "step": 61954 + }, + { + "epoch": 1.59, + "learning_rate": 9.536685815953488e-07, + "loss": 0.7129, + "step": 61955 + }, + { + "epoch": 1.59, + "learning_rate": 9.536409408738505e-07, + "loss": 0.6855, + "step": 61956 + }, + { + "epoch": 1.59, + "learning_rate": 9.536133001878471e-07, + "loss": 0.7051, + "step": 61957 + }, + { + "epoch": 1.59, + "learning_rate": 9.5358565953736e-07, + "loss": 0.7417, + "step": 61958 + }, + { + "epoch": 1.59, + "learning_rate": 9.535580189224099e-07, + "loss": 0.439, + "step": 61959 + }, + { + "epoch": 1.59, + "learning_rate": 9.535303783430188e-07, + "loss": 0.522, + "step": 61960 + }, + { + "epoch": 1.59, + "learning_rate": 9.535027377992072e-07, + "loss": 0.636, + "step": 61961 + }, + { + "epoch": 1.59, + "learning_rate": 9.534750972909962e-07, + "loss": 0.6343, + "step": 61962 + }, + { + "epoch": 1.59, + "learning_rate": 9.534474568184073e-07, + "loss": 0.5181, + "step": 61963 + }, + { + "epoch": 1.59, + "learning_rate": 9.534198163814614e-07, + "loss": 0.4386, + "step": 61964 + }, + { + "epoch": 1.59, + "learning_rate": 9.533921759801801e-07, + "loss": 0.7871, + "step": 61965 + }, + { + "epoch": 1.59, + "learning_rate": 9.53364535614584e-07, + "loss": 0.6021, + "step": 61966 + }, + { + "epoch": 1.59, + "learning_rate": 9.533368952846946e-07, + "loss": 0.7139, + "step": 61967 + }, + { + "epoch": 1.59, + "learning_rate": 9.53309254990533e-07, + "loss": 0.8203, + "step": 61968 + }, + { + "epoch": 1.59, + "learning_rate": 9.532816147321203e-07, + "loss": 0.7188, + "step": 61969 + }, + { + "epoch": 1.59, + "learning_rate": 9.532539745094782e-07, + "loss": 0.5815, + "step": 61970 + }, + { + "epoch": 1.59, + "learning_rate": 9.532263343226268e-07, + "loss": 0.7373, + "step": 61971 + }, + { + "epoch": 1.59, + "learning_rate": 9.531986941715882e-07, + "loss": 0.5698, + "step": 61972 + }, + { + "epoch": 1.59, + "learning_rate": 9.53171054056383e-07, + "loss": 0.6641, + "step": 61973 + }, + { + "epoch": 1.59, + "learning_rate": 9.531434139770325e-07, + "loss": 0.6514, + "step": 61974 + }, + { + "epoch": 1.59, + "learning_rate": 9.531157739335582e-07, + "loss": 0.6436, + "step": 61975 + }, + { + "epoch": 1.59, + "learning_rate": 9.530881339259806e-07, + "loss": 0.7969, + "step": 61976 + }, + { + "epoch": 1.59, + "learning_rate": 9.530604939543215e-07, + "loss": 0.7363, + "step": 61977 + }, + { + "epoch": 1.59, + "learning_rate": 9.530328540186018e-07, + "loss": 0.605, + "step": 61978 + }, + { + "epoch": 1.59, + "learning_rate": 9.530052141188427e-07, + "loss": 0.6494, + "step": 61979 + }, + { + "epoch": 1.59, + "learning_rate": 9.529775742550656e-07, + "loss": 0.7627, + "step": 61980 + }, + { + "epoch": 1.59, + "learning_rate": 9.529499344272911e-07, + "loss": 0.5078, + "step": 61981 + }, + { + "epoch": 1.59, + "learning_rate": 9.529222946355408e-07, + "loss": 0.4312, + "step": 61982 + }, + { + "epoch": 1.59, + "learning_rate": 9.528946548798356e-07, + "loss": 0.6235, + "step": 61983 + }, + { + "epoch": 1.59, + "learning_rate": 9.528670151601968e-07, + "loss": 0.8359, + "step": 61984 + }, + { + "epoch": 1.59, + "learning_rate": 9.528393754766455e-07, + "loss": 0.7617, + "step": 61985 + }, + { + "epoch": 1.59, + "learning_rate": 9.528117358292031e-07, + "loss": 0.4795, + "step": 61986 + }, + { + "epoch": 1.59, + "learning_rate": 9.527840962178904e-07, + "loss": 0.6157, + "step": 61987 + }, + { + "epoch": 1.59, + "learning_rate": 9.527564566427289e-07, + "loss": 0.5508, + "step": 61988 + }, + { + "epoch": 1.59, + "learning_rate": 9.527288171037395e-07, + "loss": 0.6047, + "step": 61989 + }, + { + "epoch": 1.59, + "learning_rate": 9.527011776009441e-07, + "loss": 0.752, + "step": 61990 + }, + { + "epoch": 1.59, + "learning_rate": 9.526735381343624e-07, + "loss": 0.5918, + "step": 61991 + }, + { + "epoch": 1.59, + "learning_rate": 9.526458987040169e-07, + "loss": 0.6865, + "step": 61992 + }, + { + "epoch": 1.59, + "learning_rate": 9.526182593099279e-07, + "loss": 0.6367, + "step": 61993 + }, + { + "epoch": 1.59, + "learning_rate": 9.525906199521171e-07, + "loss": 0.667, + "step": 61994 + }, + { + "epoch": 1.59, + "learning_rate": 9.525629806306053e-07, + "loss": 0.6484, + "step": 61995 + }, + { + "epoch": 1.59, + "learning_rate": 9.525353413454141e-07, + "loss": 0.5154, + "step": 61996 + }, + { + "epoch": 1.59, + "learning_rate": 9.525077020965641e-07, + "loss": 0.5786, + "step": 61997 + }, + { + "epoch": 1.59, + "learning_rate": 9.52480062884077e-07, + "loss": 0.4736, + "step": 61998 + }, + { + "epoch": 1.59, + "learning_rate": 9.524524237079736e-07, + "loss": 0.624, + "step": 61999 + }, + { + "epoch": 1.59, + "learning_rate": 9.524247845682756e-07, + "loss": 0.604, + "step": 62000 + }, + { + "epoch": 1.59, + "learning_rate": 9.523971454650035e-07, + "loss": 0.7588, + "step": 62001 + }, + { + "epoch": 1.59, + "learning_rate": 9.523695063981784e-07, + "loss": 0.6621, + "step": 62002 + }, + { + "epoch": 1.59, + "learning_rate": 9.523418673678222e-07, + "loss": 0.3718, + "step": 62003 + }, + { + "epoch": 1.59, + "learning_rate": 9.523142283739553e-07, + "loss": 0.4351, + "step": 62004 + }, + { + "epoch": 1.59, + "learning_rate": 9.522865894165994e-07, + "loss": 0.5708, + "step": 62005 + }, + { + "epoch": 1.59, + "learning_rate": 9.522589504957754e-07, + "loss": 0.626, + "step": 62006 + }, + { + "epoch": 1.59, + "learning_rate": 9.522313116115046e-07, + "loss": 0.6748, + "step": 62007 + }, + { + "epoch": 1.59, + "learning_rate": 9.52203672763808e-07, + "loss": 0.5635, + "step": 62008 + }, + { + "epoch": 1.59, + "learning_rate": 9.521760339527069e-07, + "loss": 0.5776, + "step": 62009 + }, + { + "epoch": 1.59, + "learning_rate": 9.521483951782228e-07, + "loss": 0.5581, + "step": 62010 + }, + { + "epoch": 1.59, + "learning_rate": 9.521207564403761e-07, + "loss": 0.7393, + "step": 62011 + }, + { + "epoch": 1.59, + "learning_rate": 9.520931177391883e-07, + "loss": 0.5786, + "step": 62012 + }, + { + "epoch": 1.59, + "learning_rate": 9.520654790746806e-07, + "loss": 0.8105, + "step": 62013 + }, + { + "epoch": 1.59, + "learning_rate": 9.52037840446874e-07, + "loss": 0.6504, + "step": 62014 + }, + { + "epoch": 1.59, + "learning_rate": 9.520102018557902e-07, + "loss": 0.5103, + "step": 62015 + }, + { + "epoch": 1.59, + "learning_rate": 9.519825633014495e-07, + "loss": 0.7295, + "step": 62016 + }, + { + "epoch": 1.59, + "learning_rate": 9.51954924783874e-07, + "loss": 0.7275, + "step": 62017 + }, + { + "epoch": 1.59, + "learning_rate": 9.519272863030841e-07, + "loss": 0.7217, + "step": 62018 + }, + { + "epoch": 1.59, + "learning_rate": 9.518996478591015e-07, + "loss": 0.4031, + "step": 62019 + }, + { + "epoch": 1.59, + "learning_rate": 9.518720094519472e-07, + "loss": 0.4856, + "step": 62020 + }, + { + "epoch": 1.59, + "learning_rate": 9.518443710816421e-07, + "loss": 0.5181, + "step": 62021 + }, + { + "epoch": 1.59, + "learning_rate": 9.518167327482077e-07, + "loss": 0.7529, + "step": 62022 + }, + { + "epoch": 1.59, + "learning_rate": 9.517890944516646e-07, + "loss": 0.6865, + "step": 62023 + }, + { + "epoch": 1.59, + "learning_rate": 9.517614561920347e-07, + "loss": 0.752, + "step": 62024 + }, + { + "epoch": 1.59, + "learning_rate": 9.517338179693387e-07, + "loss": 0.7417, + "step": 62025 + }, + { + "epoch": 1.59, + "learning_rate": 9.51706179783598e-07, + "loss": 0.6826, + "step": 62026 + }, + { + "epoch": 1.59, + "learning_rate": 9.516785416348335e-07, + "loss": 0.6216, + "step": 62027 + }, + { + "epoch": 1.59, + "learning_rate": 9.516509035230668e-07, + "loss": 0.6602, + "step": 62028 + }, + { + "epoch": 1.59, + "learning_rate": 9.516232654483187e-07, + "loss": 0.5713, + "step": 62029 + }, + { + "epoch": 1.59, + "learning_rate": 9.515956274106107e-07, + "loss": 0.7285, + "step": 62030 + }, + { + "epoch": 1.59, + "learning_rate": 9.515679894099633e-07, + "loss": 0.5693, + "step": 62031 + }, + { + "epoch": 1.59, + "learning_rate": 9.515403514463982e-07, + "loss": 0.5225, + "step": 62032 + }, + { + "epoch": 1.59, + "learning_rate": 9.515127135199362e-07, + "loss": 0.7168, + "step": 62033 + }, + { + "epoch": 1.59, + "learning_rate": 9.51485075630599e-07, + "loss": 0.5249, + "step": 62034 + }, + { + "epoch": 1.59, + "learning_rate": 9.514574377784072e-07, + "loss": 0.4597, + "step": 62035 + }, + { + "epoch": 1.59, + "learning_rate": 9.514297999633822e-07, + "loss": 0.665, + "step": 62036 + }, + { + "epoch": 1.59, + "learning_rate": 9.514021621855452e-07, + "loss": 0.4883, + "step": 62037 + }, + { + "epoch": 1.59, + "learning_rate": 9.513745244449175e-07, + "loss": 0.6348, + "step": 62038 + }, + { + "epoch": 1.59, + "learning_rate": 9.513468867415199e-07, + "loss": 0.6064, + "step": 62039 + }, + { + "epoch": 1.59, + "learning_rate": 9.513192490753741e-07, + "loss": 0.4253, + "step": 62040 + }, + { + "epoch": 1.59, + "learning_rate": 9.512916114465009e-07, + "loss": 0.7183, + "step": 62041 + }, + { + "epoch": 1.59, + "learning_rate": 9.51263973854921e-07, + "loss": 0.5698, + "step": 62042 + }, + { + "epoch": 1.59, + "learning_rate": 9.512363363006563e-07, + "loss": 0.6777, + "step": 62043 + }, + { + "epoch": 1.59, + "learning_rate": 9.512086987837276e-07, + "loss": 0.7793, + "step": 62044 + }, + { + "epoch": 1.59, + "learning_rate": 9.511810613041562e-07, + "loss": 0.7285, + "step": 62045 + }, + { + "epoch": 1.59, + "learning_rate": 9.511534238619634e-07, + "loss": 0.6299, + "step": 62046 + }, + { + "epoch": 1.59, + "learning_rate": 9.511257864571699e-07, + "loss": 0.7017, + "step": 62047 + }, + { + "epoch": 1.59, + "learning_rate": 9.510981490897973e-07, + "loss": 0.6729, + "step": 62048 + }, + { + "epoch": 1.59, + "learning_rate": 9.510705117598664e-07, + "loss": 0.644, + "step": 62049 + }, + { + "epoch": 1.59, + "learning_rate": 9.510428744673991e-07, + "loss": 0.4419, + "step": 62050 + }, + { + "epoch": 1.59, + "learning_rate": 9.510152372124156e-07, + "loss": 0.5234, + "step": 62051 + }, + { + "epoch": 1.59, + "learning_rate": 9.509875999949374e-07, + "loss": 0.4214, + "step": 62052 + }, + { + "epoch": 1.59, + "learning_rate": 9.509599628149859e-07, + "loss": 0.7002, + "step": 62053 + }, + { + "epoch": 1.59, + "learning_rate": 9.50932325672582e-07, + "loss": 0.7891, + "step": 62054 + }, + { + "epoch": 1.59, + "learning_rate": 9.509046885677471e-07, + "loss": 0.6855, + "step": 62055 + }, + { + "epoch": 1.59, + "learning_rate": 9.508770515005019e-07, + "loss": 0.5908, + "step": 62056 + }, + { + "epoch": 1.59, + "learning_rate": 9.508494144708683e-07, + "loss": 0.6172, + "step": 62057 + }, + { + "epoch": 1.59, + "learning_rate": 9.508217774788667e-07, + "loss": 0.8174, + "step": 62058 + }, + { + "epoch": 1.59, + "learning_rate": 9.50794140524519e-07, + "loss": 0.6216, + "step": 62059 + }, + { + "epoch": 1.59, + "learning_rate": 9.507665036078458e-07, + "loss": 0.7432, + "step": 62060 + }, + { + "epoch": 1.59, + "learning_rate": 9.507388667288683e-07, + "loss": 0.6499, + "step": 62061 + }, + { + "epoch": 1.59, + "learning_rate": 9.507112298876079e-07, + "loss": 0.657, + "step": 62062 + }, + { + "epoch": 1.59, + "learning_rate": 9.506835930840856e-07, + "loss": 0.6641, + "step": 62063 + }, + { + "epoch": 1.59, + "learning_rate": 9.506559563183226e-07, + "loss": 0.7412, + "step": 62064 + }, + { + "epoch": 1.59, + "learning_rate": 9.506283195903401e-07, + "loss": 0.6216, + "step": 62065 + }, + { + "epoch": 1.59, + "learning_rate": 9.506006829001591e-07, + "loss": 0.7539, + "step": 62066 + }, + { + "epoch": 1.59, + "learning_rate": 9.50573046247801e-07, + "loss": 0.7598, + "step": 62067 + }, + { + "epoch": 1.59, + "learning_rate": 9.505454096332866e-07, + "loss": 0.4873, + "step": 62068 + }, + { + "epoch": 1.59, + "learning_rate": 9.505177730566378e-07, + "loss": 0.5879, + "step": 62069 + }, + { + "epoch": 1.59, + "learning_rate": 9.504901365178751e-07, + "loss": 0.7422, + "step": 62070 + }, + { + "epoch": 1.59, + "learning_rate": 9.504625000170195e-07, + "loss": 0.6348, + "step": 62071 + }, + { + "epoch": 1.59, + "learning_rate": 9.504348635540928e-07, + "loss": 0.7539, + "step": 62072 + }, + { + "epoch": 1.59, + "learning_rate": 9.504072271291157e-07, + "loss": 0.4907, + "step": 62073 + }, + { + "epoch": 1.59, + "learning_rate": 9.503795907421096e-07, + "loss": 0.6641, + "step": 62074 + }, + { + "epoch": 1.59, + "learning_rate": 9.503519543930953e-07, + "loss": 0.5186, + "step": 62075 + }, + { + "epoch": 1.59, + "learning_rate": 9.503243180820946e-07, + "loss": 0.876, + "step": 62076 + }, + { + "epoch": 1.59, + "learning_rate": 9.502966818091281e-07, + "loss": 0.5786, + "step": 62077 + }, + { + "epoch": 1.59, + "learning_rate": 9.502690455742172e-07, + "loss": 0.5942, + "step": 62078 + }, + { + "epoch": 1.59, + "learning_rate": 9.502414093773832e-07, + "loss": 0.5503, + "step": 62079 + }, + { + "epoch": 1.59, + "learning_rate": 9.502137732186467e-07, + "loss": 0.4368, + "step": 62080 + }, + { + "epoch": 1.59, + "learning_rate": 9.501861370980295e-07, + "loss": 0.6499, + "step": 62081 + }, + { + "epoch": 1.59, + "learning_rate": 9.501585010155524e-07, + "loss": 0.5222, + "step": 62082 + }, + { + "epoch": 1.59, + "learning_rate": 9.501308649712365e-07, + "loss": 0.5591, + "step": 62083 + }, + { + "epoch": 1.59, + "learning_rate": 9.501032289651033e-07, + "loss": 0.5967, + "step": 62084 + }, + { + "epoch": 1.59, + "learning_rate": 9.500755929971734e-07, + "loss": 0.8379, + "step": 62085 + }, + { + "epoch": 1.59, + "learning_rate": 9.500479570674687e-07, + "loss": 0.7114, + "step": 62086 + }, + { + "epoch": 1.59, + "learning_rate": 9.500203211760099e-07, + "loss": 0.7212, + "step": 62087 + }, + { + "epoch": 1.59, + "learning_rate": 9.499926853228182e-07, + "loss": 0.6475, + "step": 62088 + }, + { + "epoch": 1.59, + "learning_rate": 9.499650495079151e-07, + "loss": 0.6152, + "step": 62089 + }, + { + "epoch": 1.59, + "learning_rate": 9.499374137313209e-07, + "loss": 0.7656, + "step": 62090 + }, + { + "epoch": 1.59, + "learning_rate": 9.499097779930578e-07, + "loss": 0.604, + "step": 62091 + }, + { + "epoch": 1.59, + "learning_rate": 9.498821422931462e-07, + "loss": 0.5112, + "step": 62092 + }, + { + "epoch": 1.59, + "learning_rate": 9.498545066316076e-07, + "loss": 0.5586, + "step": 62093 + }, + { + "epoch": 1.59, + "learning_rate": 9.498268710084631e-07, + "loss": 0.4924, + "step": 62094 + }, + { + "epoch": 1.59, + "learning_rate": 9.497992354237338e-07, + "loss": 0.5645, + "step": 62095 + }, + { + "epoch": 1.59, + "learning_rate": 9.497715998774409e-07, + "loss": 0.6113, + "step": 62096 + }, + { + "epoch": 1.59, + "learning_rate": 9.497439643696057e-07, + "loss": 0.6035, + "step": 62097 + }, + { + "epoch": 1.59, + "learning_rate": 9.497163289002491e-07, + "loss": 0.7219, + "step": 62098 + }, + { + "epoch": 1.59, + "learning_rate": 9.49688693469393e-07, + "loss": 0.7056, + "step": 62099 + }, + { + "epoch": 1.59, + "learning_rate": 9.496610580770573e-07, + "loss": 0.8398, + "step": 62100 + }, + { + "epoch": 1.59, + "learning_rate": 9.496334227232641e-07, + "loss": 0.4678, + "step": 62101 + }, + { + "epoch": 1.59, + "learning_rate": 9.496057874080339e-07, + "loss": 0.6689, + "step": 62102 + }, + { + "epoch": 1.59, + "learning_rate": 9.495781521313886e-07, + "loss": 0.7041, + "step": 62103 + }, + { + "epoch": 1.59, + "learning_rate": 9.495505168933487e-07, + "loss": 0.5391, + "step": 62104 + }, + { + "epoch": 1.59, + "learning_rate": 9.495228816939359e-07, + "loss": 0.6069, + "step": 62105 + }, + { + "epoch": 1.59, + "learning_rate": 9.494952465331708e-07, + "loss": 0.6572, + "step": 62106 + }, + { + "epoch": 1.59, + "learning_rate": 9.494676114110753e-07, + "loss": 0.6106, + "step": 62107 + }, + { + "epoch": 1.59, + "learning_rate": 9.494399763276697e-07, + "loss": 0.5853, + "step": 62108 + }, + { + "epoch": 1.59, + "learning_rate": 9.494123412829761e-07, + "loss": 0.5288, + "step": 62109 + }, + { + "epoch": 1.59, + "learning_rate": 9.493847062770148e-07, + "loss": 0.7861, + "step": 62110 + }, + { + "epoch": 1.59, + "learning_rate": 9.493570713098073e-07, + "loss": 0.5864, + "step": 62111 + }, + { + "epoch": 1.59, + "learning_rate": 9.493294363813749e-07, + "loss": 0.6741, + "step": 62112 + }, + { + "epoch": 1.59, + "learning_rate": 9.493018014917383e-07, + "loss": 0.5498, + "step": 62113 + }, + { + "epoch": 1.59, + "learning_rate": 9.492741666409193e-07, + "loss": 0.376, + "step": 62114 + }, + { + "epoch": 1.59, + "learning_rate": 9.492465318289386e-07, + "loss": 0.7656, + "step": 62115 + }, + { + "epoch": 1.59, + "learning_rate": 9.492188970558175e-07, + "loss": 0.666, + "step": 62116 + }, + { + "epoch": 1.59, + "learning_rate": 9.491912623215771e-07, + "loss": 0.6953, + "step": 62117 + }, + { + "epoch": 1.59, + "learning_rate": 9.491636276262388e-07, + "loss": 0.7178, + "step": 62118 + }, + { + "epoch": 1.59, + "learning_rate": 9.491359929698237e-07, + "loss": 0.4448, + "step": 62119 + }, + { + "epoch": 1.59, + "learning_rate": 9.491083583523527e-07, + "loss": 0.7173, + "step": 62120 + }, + { + "epoch": 1.59, + "learning_rate": 9.49080723773847e-07, + "loss": 0.6177, + "step": 62121 + }, + { + "epoch": 1.59, + "learning_rate": 9.490530892343278e-07, + "loss": 0.6191, + "step": 62122 + }, + { + "epoch": 1.59, + "learning_rate": 9.490254547338162e-07, + "loss": 0.425, + "step": 62123 + }, + { + "epoch": 1.59, + "learning_rate": 9.489978202723338e-07, + "loss": 0.5879, + "step": 62124 + }, + { + "epoch": 1.59, + "learning_rate": 9.489701858499011e-07, + "loss": 0.6875, + "step": 62125 + }, + { + "epoch": 1.59, + "learning_rate": 9.489425514665398e-07, + "loss": 0.707, + "step": 62126 + }, + { + "epoch": 1.59, + "learning_rate": 9.489149171222705e-07, + "loss": 0.4863, + "step": 62127 + }, + { + "epoch": 1.59, + "learning_rate": 9.488872828171152e-07, + "loss": 0.7061, + "step": 62128 + }, + { + "epoch": 1.59, + "learning_rate": 9.488596485510945e-07, + "loss": 0.6055, + "step": 62129 + }, + { + "epoch": 1.59, + "learning_rate": 9.488320143242293e-07, + "loss": 0.3149, + "step": 62130 + }, + { + "epoch": 1.59, + "learning_rate": 9.488043801365413e-07, + "loss": 0.6509, + "step": 62131 + }, + { + "epoch": 1.59, + "learning_rate": 9.487767459880513e-07, + "loss": 0.6338, + "step": 62132 + }, + { + "epoch": 1.59, + "learning_rate": 9.487491118787807e-07, + "loss": 0.7109, + "step": 62133 + }, + { + "epoch": 1.59, + "learning_rate": 9.487214778087503e-07, + "loss": 0.5107, + "step": 62134 + }, + { + "epoch": 1.59, + "learning_rate": 9.486938437779818e-07, + "loss": 0.6108, + "step": 62135 + }, + { + "epoch": 1.59, + "learning_rate": 9.486662097864961e-07, + "loss": 0.6392, + "step": 62136 + }, + { + "epoch": 1.59, + "learning_rate": 9.48638575834314e-07, + "loss": 0.6436, + "step": 62137 + }, + { + "epoch": 1.59, + "learning_rate": 9.486109419214572e-07, + "loss": 0.5251, + "step": 62138 + }, + { + "epoch": 1.59, + "learning_rate": 9.485833080479469e-07, + "loss": 0.4761, + "step": 62139 + }, + { + "epoch": 1.59, + "learning_rate": 9.485556742138036e-07, + "loss": 0.6616, + "step": 62140 + }, + { + "epoch": 1.59, + "learning_rate": 9.48528040419049e-07, + "loss": 0.6074, + "step": 62141 + }, + { + "epoch": 1.59, + "learning_rate": 9.485004066637039e-07, + "loss": 0.6045, + "step": 62142 + }, + { + "epoch": 1.59, + "learning_rate": 9.4847277294779e-07, + "loss": 0.6763, + "step": 62143 + }, + { + "epoch": 1.59, + "learning_rate": 9.484451392713278e-07, + "loss": 0.5664, + "step": 62144 + }, + { + "epoch": 1.59, + "learning_rate": 9.48417505634339e-07, + "loss": 0.5552, + "step": 62145 + }, + { + "epoch": 1.59, + "learning_rate": 9.483898720368442e-07, + "loss": 0.7441, + "step": 62146 + }, + { + "epoch": 1.59, + "learning_rate": 9.483622384788654e-07, + "loss": 0.7002, + "step": 62147 + }, + { + "epoch": 1.59, + "learning_rate": 9.483346049604229e-07, + "loss": 0.6262, + "step": 62148 + }, + { + "epoch": 1.59, + "learning_rate": 9.483069714815387e-07, + "loss": 0.5972, + "step": 62149 + }, + { + "epoch": 1.59, + "learning_rate": 9.482793380422332e-07, + "loss": 0.7285, + "step": 62150 + }, + { + "epoch": 1.59, + "learning_rate": 9.482517046425276e-07, + "loss": 0.5947, + "step": 62151 + }, + { + "epoch": 1.59, + "learning_rate": 9.482240712824435e-07, + "loss": 0.6187, + "step": 62152 + }, + { + "epoch": 1.59, + "learning_rate": 9.48196437962002e-07, + "loss": 0.6123, + "step": 62153 + }, + { + "epoch": 1.59, + "learning_rate": 9.481688046812237e-07, + "loss": 0.5947, + "step": 62154 + }, + { + "epoch": 1.59, + "learning_rate": 9.481411714401305e-07, + "loss": 0.6333, + "step": 62155 + }, + { + "epoch": 1.59, + "learning_rate": 9.48113538238743e-07, + "loss": 0.7129, + "step": 62156 + }, + { + "epoch": 1.59, + "learning_rate": 9.480859050770827e-07, + "loss": 0.6699, + "step": 62157 + }, + { + "epoch": 1.59, + "learning_rate": 9.480582719551705e-07, + "loss": 0.8203, + "step": 62158 + }, + { + "epoch": 1.59, + "learning_rate": 9.480306388730281e-07, + "loss": 0.4741, + "step": 62159 + }, + { + "epoch": 1.59, + "learning_rate": 9.480030058306761e-07, + "loss": 0.6353, + "step": 62160 + }, + { + "epoch": 1.59, + "learning_rate": 9.479753728281355e-07, + "loss": 0.5079, + "step": 62161 + }, + { + "epoch": 1.59, + "learning_rate": 9.47947739865428e-07, + "loss": 0.6914, + "step": 62162 + }, + { + "epoch": 1.59, + "learning_rate": 9.479201069425743e-07, + "loss": 0.5161, + "step": 62163 + }, + { + "epoch": 1.59, + "learning_rate": 9.47892474059596e-07, + "loss": 0.6543, + "step": 62164 + }, + { + "epoch": 1.59, + "learning_rate": 9.478648412165139e-07, + "loss": 0.7803, + "step": 62165 + }, + { + "epoch": 1.59, + "learning_rate": 9.478372084133495e-07, + "loss": 0.6807, + "step": 62166 + }, + { + "epoch": 1.59, + "learning_rate": 9.478095756501235e-07, + "loss": 0.7363, + "step": 62167 + }, + { + "epoch": 1.59, + "learning_rate": 9.477819429268574e-07, + "loss": 0.7637, + "step": 62168 + }, + { + "epoch": 1.59, + "learning_rate": 9.477543102435726e-07, + "loss": 0.5029, + "step": 62169 + }, + { + "epoch": 1.59, + "learning_rate": 9.477266776002894e-07, + "loss": 0.6733, + "step": 62170 + }, + { + "epoch": 1.59, + "learning_rate": 9.476990449970297e-07, + "loss": 0.7148, + "step": 62171 + }, + { + "epoch": 1.59, + "learning_rate": 9.476714124338147e-07, + "loss": 0.708, + "step": 62172 + }, + { + "epoch": 1.59, + "learning_rate": 9.476437799106648e-07, + "loss": 0.6548, + "step": 62173 + }, + { + "epoch": 1.59, + "learning_rate": 9.47616147427602e-07, + "loss": 0.79, + "step": 62174 + }, + { + "epoch": 1.59, + "learning_rate": 9.475885149846469e-07, + "loss": 0.5215, + "step": 62175 + }, + { + "epoch": 1.59, + "learning_rate": 9.47560882581821e-07, + "loss": 0.6704, + "step": 62176 + }, + { + "epoch": 1.59, + "learning_rate": 9.47533250219145e-07, + "loss": 0.5735, + "step": 62177 + }, + { + "epoch": 1.59, + "learning_rate": 9.475056178966408e-07, + "loss": 0.5908, + "step": 62178 + }, + { + "epoch": 1.59, + "learning_rate": 9.474779856143292e-07, + "loss": 0.5645, + "step": 62179 + }, + { + "epoch": 1.59, + "learning_rate": 9.47450353372231e-07, + "loss": 0.6006, + "step": 62180 + }, + { + "epoch": 1.59, + "learning_rate": 9.474227211703678e-07, + "loss": 0.6216, + "step": 62181 + }, + { + "epoch": 1.59, + "learning_rate": 9.473950890087604e-07, + "loss": 0.5889, + "step": 62182 + }, + { + "epoch": 1.59, + "learning_rate": 9.473674568874304e-07, + "loss": 0.6094, + "step": 62183 + }, + { + "epoch": 1.59, + "learning_rate": 9.473398248063984e-07, + "loss": 0.6523, + "step": 62184 + }, + { + "epoch": 1.59, + "learning_rate": 9.473121927656862e-07, + "loss": 0.6118, + "step": 62185 + }, + { + "epoch": 1.59, + "learning_rate": 9.472845607653144e-07, + "loss": 0.5469, + "step": 62186 + }, + { + "epoch": 1.59, + "learning_rate": 9.472569288053045e-07, + "loss": 0.5233, + "step": 62187 + }, + { + "epoch": 1.59, + "learning_rate": 9.472292968856774e-07, + "loss": 0.6924, + "step": 62188 + }, + { + "epoch": 1.59, + "learning_rate": 9.47201665006455e-07, + "loss": 0.7363, + "step": 62189 + }, + { + "epoch": 1.59, + "learning_rate": 9.471740331676573e-07, + "loss": 0.6577, + "step": 62190 + }, + { + "epoch": 1.59, + "learning_rate": 9.471464013693062e-07, + "loss": 0.6621, + "step": 62191 + }, + { + "epoch": 1.59, + "learning_rate": 9.471187696114225e-07, + "loss": 0.5979, + "step": 62192 + }, + { + "epoch": 1.59, + "learning_rate": 9.470911378940276e-07, + "loss": 0.6504, + "step": 62193 + }, + { + "epoch": 1.59, + "learning_rate": 9.470635062171425e-07, + "loss": 0.7129, + "step": 62194 + }, + { + "epoch": 1.59, + "learning_rate": 9.470358745807886e-07, + "loss": 0.6553, + "step": 62195 + }, + { + "epoch": 1.59, + "learning_rate": 9.470082429849867e-07, + "loss": 0.7246, + "step": 62196 + }, + { + "epoch": 1.59, + "learning_rate": 9.469806114297583e-07, + "loss": 0.516, + "step": 62197 + }, + { + "epoch": 1.59, + "learning_rate": 9.469529799151243e-07, + "loss": 0.5913, + "step": 62198 + }, + { + "epoch": 1.59, + "learning_rate": 9.469253484411064e-07, + "loss": 0.6587, + "step": 62199 + }, + { + "epoch": 1.59, + "learning_rate": 9.46897717007725e-07, + "loss": 0.7559, + "step": 62200 + }, + { + "epoch": 1.59, + "learning_rate": 9.468700856150014e-07, + "loss": 0.5911, + "step": 62201 + }, + { + "epoch": 1.59, + "learning_rate": 9.468424542629572e-07, + "loss": 0.519, + "step": 62202 + }, + { + "epoch": 1.59, + "learning_rate": 9.46814822951613e-07, + "loss": 0.6729, + "step": 62203 + }, + { + "epoch": 1.59, + "learning_rate": 9.467871916809906e-07, + "loss": 0.6777, + "step": 62204 + }, + { + "epoch": 1.59, + "learning_rate": 9.467595604511104e-07, + "loss": 0.6719, + "step": 62205 + }, + { + "epoch": 1.59, + "learning_rate": 9.467319292619941e-07, + "loss": 0.7734, + "step": 62206 + }, + { + "epoch": 1.59, + "learning_rate": 9.467042981136627e-07, + "loss": 0.6387, + "step": 62207 + }, + { + "epoch": 1.59, + "learning_rate": 9.466766670061375e-07, + "loss": 0.6836, + "step": 62208 + }, + { + "epoch": 1.59, + "learning_rate": 9.466490359394399e-07, + "loss": 0.6221, + "step": 62209 + }, + { + "epoch": 1.59, + "learning_rate": 9.466214049135904e-07, + "loss": 0.8076, + "step": 62210 + }, + { + "epoch": 1.59, + "learning_rate": 9.465937739286101e-07, + "loss": 0.6211, + "step": 62211 + }, + { + "epoch": 1.59, + "learning_rate": 9.465661429845207e-07, + "loss": 0.4642, + "step": 62212 + }, + { + "epoch": 1.59, + "learning_rate": 9.465385120813429e-07, + "loss": 0.6885, + "step": 62213 + }, + { + "epoch": 1.59, + "learning_rate": 9.465108812190985e-07, + "loss": 0.6548, + "step": 62214 + }, + { + "epoch": 1.59, + "learning_rate": 9.464832503978079e-07, + "loss": 0.3291, + "step": 62215 + }, + { + "epoch": 1.59, + "learning_rate": 9.464556196174929e-07, + "loss": 0.5129, + "step": 62216 + }, + { + "epoch": 1.59, + "learning_rate": 9.464279888781741e-07, + "loss": 0.5498, + "step": 62217 + }, + { + "epoch": 1.59, + "learning_rate": 9.464003581798731e-07, + "loss": 0.751, + "step": 62218 + }, + { + "epoch": 1.59, + "learning_rate": 9.463727275226113e-07, + "loss": 0.6016, + "step": 62219 + }, + { + "epoch": 1.59, + "learning_rate": 9.463450969064088e-07, + "loss": 0.6738, + "step": 62220 + }, + { + "epoch": 1.59, + "learning_rate": 9.463174663312878e-07, + "loss": 0.7598, + "step": 62221 + }, + { + "epoch": 1.59, + "learning_rate": 9.462898357972687e-07, + "loss": 0.6841, + "step": 62222 + }, + { + "epoch": 1.59, + "learning_rate": 9.462622053043733e-07, + "loss": 0.5264, + "step": 62223 + }, + { + "epoch": 1.59, + "learning_rate": 9.462345748526222e-07, + "loss": 0.5146, + "step": 62224 + }, + { + "epoch": 1.59, + "learning_rate": 9.46206944442037e-07, + "loss": 0.4814, + "step": 62225 + }, + { + "epoch": 1.59, + "learning_rate": 9.461793140726387e-07, + "loss": 0.7461, + "step": 62226 + }, + { + "epoch": 1.59, + "learning_rate": 9.46151683744448e-07, + "loss": 0.6582, + "step": 62227 + }, + { + "epoch": 1.59, + "learning_rate": 9.46124053457487e-07, + "loss": 0.7559, + "step": 62228 + }, + { + "epoch": 1.59, + "learning_rate": 9.460964232117764e-07, + "loss": 0.5396, + "step": 62229 + }, + { + "epoch": 1.59, + "learning_rate": 9.460687930073369e-07, + "loss": 0.44, + "step": 62230 + }, + { + "epoch": 1.6, + "learning_rate": 9.460411628441904e-07, + "loss": 0.5938, + "step": 62231 + }, + { + "epoch": 1.6, + "learning_rate": 9.460135327223573e-07, + "loss": 0.7402, + "step": 62232 + }, + { + "epoch": 1.6, + "learning_rate": 9.459859026418593e-07, + "loss": 0.4114, + "step": 62233 + }, + { + "epoch": 1.6, + "learning_rate": 9.459582726027174e-07, + "loss": 0.6602, + "step": 62234 + }, + { + "epoch": 1.6, + "learning_rate": 9.459306426049528e-07, + "loss": 0.7427, + "step": 62235 + }, + { + "epoch": 1.6, + "learning_rate": 9.459030126485865e-07, + "loss": 0.6016, + "step": 62236 + }, + { + "epoch": 1.6, + "learning_rate": 9.4587538273364e-07, + "loss": 0.6504, + "step": 62237 + }, + { + "epoch": 1.6, + "learning_rate": 9.458477528601339e-07, + "loss": 0.7285, + "step": 62238 + }, + { + "epoch": 1.6, + "learning_rate": 9.458201230280903e-07, + "loss": 0.5547, + "step": 62239 + }, + { + "epoch": 1.6, + "learning_rate": 9.457924932375295e-07, + "loss": 0.4927, + "step": 62240 + }, + { + "epoch": 1.6, + "learning_rate": 9.457648634884726e-07, + "loss": 0.7529, + "step": 62241 + }, + { + "epoch": 1.6, + "learning_rate": 9.457372337809413e-07, + "loss": 0.5869, + "step": 62242 + }, + { + "epoch": 1.6, + "learning_rate": 9.457096041149562e-07, + "loss": 0.5132, + "step": 62243 + }, + { + "epoch": 1.6, + "learning_rate": 9.456819744905391e-07, + "loss": 0.8008, + "step": 62244 + }, + { + "epoch": 1.6, + "learning_rate": 9.456543449077108e-07, + "loss": 0.7197, + "step": 62245 + }, + { + "epoch": 1.6, + "learning_rate": 9.456267153664922e-07, + "loss": 0.668, + "step": 62246 + }, + { + "epoch": 1.6, + "learning_rate": 9.455990858669049e-07, + "loss": 0.6802, + "step": 62247 + }, + { + "epoch": 1.6, + "learning_rate": 9.455714564089697e-07, + "loss": 0.7568, + "step": 62248 + }, + { + "epoch": 1.6, + "learning_rate": 9.455438269927085e-07, + "loss": 0.5898, + "step": 62249 + }, + { + "epoch": 1.6, + "learning_rate": 9.455161976181415e-07, + "loss": 0.582, + "step": 62250 + }, + { + "epoch": 1.6, + "learning_rate": 9.454885682852901e-07, + "loss": 0.7129, + "step": 62251 + }, + { + "epoch": 1.6, + "learning_rate": 9.454609389941758e-07, + "loss": 0.5752, + "step": 62252 + }, + { + "epoch": 1.6, + "learning_rate": 9.454333097448194e-07, + "loss": 0.7539, + "step": 62253 + }, + { + "epoch": 1.6, + "learning_rate": 9.454056805372423e-07, + "loss": 0.7549, + "step": 62254 + }, + { + "epoch": 1.6, + "learning_rate": 9.453780513714654e-07, + "loss": 0.494, + "step": 62255 + }, + { + "epoch": 1.6, + "learning_rate": 9.453504222475103e-07, + "loss": 0.5854, + "step": 62256 + }, + { + "epoch": 1.6, + "learning_rate": 9.453227931653975e-07, + "loss": 0.5444, + "step": 62257 + }, + { + "epoch": 1.6, + "learning_rate": 9.452951641251489e-07, + "loss": 0.6299, + "step": 62258 + }, + { + "epoch": 1.6, + "learning_rate": 9.452675351267853e-07, + "loss": 0.667, + "step": 62259 + }, + { + "epoch": 1.6, + "learning_rate": 9.452399061703275e-07, + "loss": 0.8516, + "step": 62260 + }, + { + "epoch": 1.6, + "learning_rate": 9.452122772557973e-07, + "loss": 0.9287, + "step": 62261 + }, + { + "epoch": 1.6, + "learning_rate": 9.451846483832155e-07, + "loss": 0.564, + "step": 62262 + }, + { + "epoch": 1.6, + "learning_rate": 9.451570195526029e-07, + "loss": 0.5381, + "step": 62263 + }, + { + "epoch": 1.6, + "learning_rate": 9.451293907639814e-07, + "loss": 0.5542, + "step": 62264 + }, + { + "epoch": 1.6, + "learning_rate": 9.451017620173717e-07, + "loss": 0.5717, + "step": 62265 + }, + { + "epoch": 1.6, + "learning_rate": 9.450741333127951e-07, + "loss": 0.6484, + "step": 62266 + }, + { + "epoch": 1.6, + "learning_rate": 9.450465046502726e-07, + "loss": 0.4825, + "step": 62267 + }, + { + "epoch": 1.6, + "learning_rate": 9.450188760298256e-07, + "loss": 0.6038, + "step": 62268 + }, + { + "epoch": 1.6, + "learning_rate": 9.449912474514754e-07, + "loss": 0.3607, + "step": 62269 + }, + { + "epoch": 1.6, + "learning_rate": 9.449636189152425e-07, + "loss": 0.5649, + "step": 62270 + }, + { + "epoch": 1.6, + "learning_rate": 9.449359904211484e-07, + "loss": 0.6152, + "step": 62271 + }, + { + "epoch": 1.6, + "learning_rate": 9.449083619692143e-07, + "loss": 0.6211, + "step": 62272 + }, + { + "epoch": 1.6, + "learning_rate": 9.448807335594614e-07, + "loss": 0.7266, + "step": 62273 + }, + { + "epoch": 1.6, + "learning_rate": 9.448531051919106e-07, + "loss": 0.5273, + "step": 62274 + }, + { + "epoch": 1.6, + "learning_rate": 9.448254768665836e-07, + "loss": 0.7275, + "step": 62275 + }, + { + "epoch": 1.6, + "learning_rate": 9.447978485835008e-07, + "loss": 0.7976, + "step": 62276 + }, + { + "epoch": 1.6, + "learning_rate": 9.44770220342684e-07, + "loss": 0.8037, + "step": 62277 + }, + { + "epoch": 1.6, + "learning_rate": 9.44742592144154e-07, + "loss": 0.5215, + "step": 62278 + }, + { + "epoch": 1.6, + "learning_rate": 9.447149639879326e-07, + "loss": 0.7197, + "step": 62279 + }, + { + "epoch": 1.6, + "learning_rate": 9.446873358740398e-07, + "loss": 0.4393, + "step": 62280 + }, + { + "epoch": 1.6, + "learning_rate": 9.446597078024976e-07, + "loss": 0.4438, + "step": 62281 + }, + { + "epoch": 1.6, + "learning_rate": 9.446320797733267e-07, + "loss": 0.5527, + "step": 62282 + }, + { + "epoch": 1.6, + "learning_rate": 9.446044517865487e-07, + "loss": 0.6274, + "step": 62283 + }, + { + "epoch": 1.6, + "learning_rate": 9.445768238421841e-07, + "loss": 0.8359, + "step": 62284 + }, + { + "epoch": 1.6, + "learning_rate": 9.445491959402549e-07, + "loss": 0.7295, + "step": 62285 + }, + { + "epoch": 1.6, + "learning_rate": 9.445215680807817e-07, + "loss": 0.7061, + "step": 62286 + }, + { + "epoch": 1.6, + "learning_rate": 9.444939402637858e-07, + "loss": 0.7432, + "step": 62287 + }, + { + "epoch": 1.6, + "learning_rate": 9.444663124892882e-07, + "loss": 0.6855, + "step": 62288 + }, + { + "epoch": 1.6, + "learning_rate": 9.444386847573107e-07, + "loss": 0.457, + "step": 62289 + }, + { + "epoch": 1.6, + "learning_rate": 9.444110570678736e-07, + "loss": 0.6562, + "step": 62290 + }, + { + "epoch": 1.6, + "learning_rate": 9.443834294209983e-07, + "loss": 0.6138, + "step": 62291 + }, + { + "epoch": 1.6, + "learning_rate": 9.443558018167062e-07, + "loss": 0.6313, + "step": 62292 + }, + { + "epoch": 1.6, + "learning_rate": 9.443281742550179e-07, + "loss": 0.4912, + "step": 62293 + }, + { + "epoch": 1.6, + "learning_rate": 9.443005467359555e-07, + "loss": 0.4243, + "step": 62294 + }, + { + "epoch": 1.6, + "learning_rate": 9.442729192595392e-07, + "loss": 0.5923, + "step": 62295 + }, + { + "epoch": 1.6, + "learning_rate": 9.442452918257908e-07, + "loss": 0.4585, + "step": 62296 + }, + { + "epoch": 1.6, + "learning_rate": 9.442176644347311e-07, + "loss": 0.7324, + "step": 62297 + }, + { + "epoch": 1.6, + "learning_rate": 9.441900370863815e-07, + "loss": 0.6387, + "step": 62298 + }, + { + "epoch": 1.6, + "learning_rate": 9.441624097807632e-07, + "loss": 0.6152, + "step": 62299 + }, + { + "epoch": 1.6, + "learning_rate": 9.441347825178972e-07, + "loss": 0.8389, + "step": 62300 + }, + { + "epoch": 1.6, + "learning_rate": 9.441071552978042e-07, + "loss": 0.6826, + "step": 62301 + }, + { + "epoch": 1.6, + "learning_rate": 9.44079528120506e-07, + "loss": 0.687, + "step": 62302 + }, + { + "epoch": 1.6, + "learning_rate": 9.440519009860233e-07, + "loss": 0.6333, + "step": 62303 + }, + { + "epoch": 1.6, + "learning_rate": 9.440242738943778e-07, + "loss": 0.5781, + "step": 62304 + }, + { + "epoch": 1.6, + "learning_rate": 9.4399664684559e-07, + "loss": 0.666, + "step": 62305 + }, + { + "epoch": 1.6, + "learning_rate": 9.439690198396817e-07, + "loss": 0.5825, + "step": 62306 + }, + { + "epoch": 1.6, + "learning_rate": 9.439413928766735e-07, + "loss": 0.666, + "step": 62307 + }, + { + "epoch": 1.6, + "learning_rate": 9.43913765956587e-07, + "loss": 0.6118, + "step": 62308 + }, + { + "epoch": 1.6, + "learning_rate": 9.438861390794434e-07, + "loss": 0.5776, + "step": 62309 + }, + { + "epoch": 1.6, + "learning_rate": 9.438585122452631e-07, + "loss": 0.6328, + "step": 62310 + }, + { + "epoch": 1.6, + "learning_rate": 9.438308854540681e-07, + "loss": 0.4883, + "step": 62311 + }, + { + "epoch": 1.6, + "learning_rate": 9.43803258705879e-07, + "loss": 0.5649, + "step": 62312 + }, + { + "epoch": 1.6, + "learning_rate": 9.437756320007172e-07, + "loss": 0.6807, + "step": 62313 + }, + { + "epoch": 1.6, + "learning_rate": 9.437480053386038e-07, + "loss": 0.4487, + "step": 62314 + }, + { + "epoch": 1.6, + "learning_rate": 9.4372037871956e-07, + "loss": 0.5539, + "step": 62315 + }, + { + "epoch": 1.6, + "learning_rate": 9.43692752143607e-07, + "loss": 0.5591, + "step": 62316 + }, + { + "epoch": 1.6, + "learning_rate": 9.436651256107656e-07, + "loss": 0.7109, + "step": 62317 + }, + { + "epoch": 1.6, + "learning_rate": 9.436374991210575e-07, + "loss": 0.5071, + "step": 62318 + }, + { + "epoch": 1.6, + "learning_rate": 9.436098726745039e-07, + "loss": 0.4346, + "step": 62319 + }, + { + "epoch": 1.6, + "learning_rate": 9.43582246271125e-07, + "loss": 0.6816, + "step": 62320 + }, + { + "epoch": 1.6, + "learning_rate": 9.435546199109428e-07, + "loss": 0.686, + "step": 62321 + }, + { + "epoch": 1.6, + "learning_rate": 9.435269935939782e-07, + "loss": 0.5586, + "step": 62322 + }, + { + "epoch": 1.6, + "learning_rate": 9.434993673202524e-07, + "loss": 0.5476, + "step": 62323 + }, + { + "epoch": 1.6, + "learning_rate": 9.434717410897865e-07, + "loss": 0.5679, + "step": 62324 + }, + { + "epoch": 1.6, + "learning_rate": 9.434441149026018e-07, + "loss": 0.6875, + "step": 62325 + }, + { + "epoch": 1.6, + "learning_rate": 9.434164887587191e-07, + "loss": 0.7256, + "step": 62326 + }, + { + "epoch": 1.6, + "learning_rate": 9.4338886265816e-07, + "loss": 0.6401, + "step": 62327 + }, + { + "epoch": 1.6, + "learning_rate": 9.433612366009453e-07, + "loss": 0.5649, + "step": 62328 + }, + { + "epoch": 1.6, + "learning_rate": 9.433336105870968e-07, + "loss": 0.6753, + "step": 62329 + }, + { + "epoch": 1.6, + "learning_rate": 9.433059846166348e-07, + "loss": 0.613, + "step": 62330 + }, + { + "epoch": 1.6, + "learning_rate": 9.432783586895806e-07, + "loss": 0.6064, + "step": 62331 + }, + { + "epoch": 1.6, + "learning_rate": 9.432507328059558e-07, + "loss": 0.5549, + "step": 62332 + }, + { + "epoch": 1.6, + "learning_rate": 9.432231069657811e-07, + "loss": 0.7334, + "step": 62333 + }, + { + "epoch": 1.6, + "learning_rate": 9.431954811690781e-07, + "loss": 0.5986, + "step": 62334 + }, + { + "epoch": 1.6, + "learning_rate": 9.431678554158677e-07, + "loss": 0.6904, + "step": 62335 + }, + { + "epoch": 1.6, + "learning_rate": 9.431402297061707e-07, + "loss": 0.5833, + "step": 62336 + }, + { + "epoch": 1.6, + "learning_rate": 9.43112604040009e-07, + "loss": 0.5358, + "step": 62337 + }, + { + "epoch": 1.6, + "learning_rate": 9.430849784174031e-07, + "loss": 0.4495, + "step": 62338 + }, + { + "epoch": 1.6, + "learning_rate": 9.430573528383747e-07, + "loss": 0.7246, + "step": 62339 + }, + { + "epoch": 1.6, + "learning_rate": 9.430297273029446e-07, + "loss": 0.7539, + "step": 62340 + }, + { + "epoch": 1.6, + "learning_rate": 9.430021018111338e-07, + "loss": 0.6914, + "step": 62341 + }, + { + "epoch": 1.6, + "learning_rate": 9.429744763629639e-07, + "loss": 0.6294, + "step": 62342 + }, + { + "epoch": 1.6, + "learning_rate": 9.429468509584556e-07, + "loss": 0.6187, + "step": 62343 + }, + { + "epoch": 1.6, + "learning_rate": 9.429192255976304e-07, + "loss": 0.6436, + "step": 62344 + }, + { + "epoch": 1.6, + "learning_rate": 9.428916002805092e-07, + "loss": 0.6167, + "step": 62345 + }, + { + "epoch": 1.6, + "learning_rate": 9.428639750071135e-07, + "loss": 0.478, + "step": 62346 + }, + { + "epoch": 1.6, + "learning_rate": 9.428363497774639e-07, + "loss": 0.7715, + "step": 62347 + }, + { + "epoch": 1.6, + "learning_rate": 9.428087245915822e-07, + "loss": 0.4993, + "step": 62348 + }, + { + "epoch": 1.6, + "learning_rate": 9.427810994494894e-07, + "loss": 0.6816, + "step": 62349 + }, + { + "epoch": 1.6, + "learning_rate": 9.427534743512061e-07, + "loss": 0.7061, + "step": 62350 + }, + { + "epoch": 1.6, + "learning_rate": 9.42725849296754e-07, + "loss": 0.6714, + "step": 62351 + }, + { + "epoch": 1.6, + "learning_rate": 9.426982242861541e-07, + "loss": 0.6143, + "step": 62352 + }, + { + "epoch": 1.6, + "learning_rate": 9.426705993194273e-07, + "loss": 0.6787, + "step": 62353 + }, + { + "epoch": 1.6, + "learning_rate": 9.426429743965952e-07, + "loss": 0.6621, + "step": 62354 + }, + { + "epoch": 1.6, + "learning_rate": 9.426153495176786e-07, + "loss": 0.3123, + "step": 62355 + }, + { + "epoch": 1.6, + "learning_rate": 9.425877246826988e-07, + "loss": 0.605, + "step": 62356 + }, + { + "epoch": 1.6, + "learning_rate": 9.42560099891677e-07, + "loss": 0.6187, + "step": 62357 + }, + { + "epoch": 1.6, + "learning_rate": 9.425324751446345e-07, + "loss": 0.8174, + "step": 62358 + }, + { + "epoch": 1.6, + "learning_rate": 9.425048504415922e-07, + "loss": 0.6304, + "step": 62359 + }, + { + "epoch": 1.6, + "learning_rate": 9.424772257825709e-07, + "loss": 0.4212, + "step": 62360 + }, + { + "epoch": 1.6, + "learning_rate": 9.424496011675925e-07, + "loss": 0.6738, + "step": 62361 + }, + { + "epoch": 1.6, + "learning_rate": 9.424219765966774e-07, + "loss": 0.6631, + "step": 62362 + }, + { + "epoch": 1.6, + "learning_rate": 9.423943520698476e-07, + "loss": 0.4971, + "step": 62363 + }, + { + "epoch": 1.6, + "learning_rate": 9.423667275871234e-07, + "loss": 0.4692, + "step": 62364 + }, + { + "epoch": 1.6, + "learning_rate": 9.423391031485267e-07, + "loss": 0.6416, + "step": 62365 + }, + { + "epoch": 1.6, + "learning_rate": 9.423114787540781e-07, + "loss": 0.6026, + "step": 62366 + }, + { + "epoch": 1.6, + "learning_rate": 9.42283854403799e-07, + "loss": 0.7383, + "step": 62367 + }, + { + "epoch": 1.6, + "learning_rate": 9.422562300977108e-07, + "loss": 0.6016, + "step": 62368 + }, + { + "epoch": 1.6, + "learning_rate": 9.422286058358341e-07, + "loss": 0.6807, + "step": 62369 + }, + { + "epoch": 1.6, + "learning_rate": 9.422009816181901e-07, + "loss": 0.5537, + "step": 62370 + }, + { + "epoch": 1.6, + "learning_rate": 9.421733574448003e-07, + "loss": 0.6035, + "step": 62371 + }, + { + "epoch": 1.6, + "learning_rate": 9.421457333156856e-07, + "loss": 0.3418, + "step": 62372 + }, + { + "epoch": 1.6, + "learning_rate": 9.421181092308674e-07, + "loss": 0.4365, + "step": 62373 + }, + { + "epoch": 1.6, + "learning_rate": 9.420904851903665e-07, + "loss": 0.5728, + "step": 62374 + }, + { + "epoch": 1.6, + "learning_rate": 9.420628611942045e-07, + "loss": 0.6885, + "step": 62375 + }, + { + "epoch": 1.6, + "learning_rate": 9.420352372424021e-07, + "loss": 0.5122, + "step": 62376 + }, + { + "epoch": 1.6, + "learning_rate": 9.420076133349808e-07, + "loss": 0.4312, + "step": 62377 + }, + { + "epoch": 1.6, + "learning_rate": 9.419799894719619e-07, + "loss": 0.6689, + "step": 62378 + }, + { + "epoch": 1.6, + "learning_rate": 9.419523656533658e-07, + "loss": 0.5518, + "step": 62379 + }, + { + "epoch": 1.6, + "learning_rate": 9.419247418792143e-07, + "loss": 0.6021, + "step": 62380 + }, + { + "epoch": 1.6, + "learning_rate": 9.418971181495281e-07, + "loss": 0.4268, + "step": 62381 + }, + { + "epoch": 1.6, + "learning_rate": 9.418694944643289e-07, + "loss": 0.71, + "step": 62382 + }, + { + "epoch": 1.6, + "learning_rate": 9.418418708236373e-07, + "loss": 0.6699, + "step": 62383 + }, + { + "epoch": 1.6, + "learning_rate": 9.418142472274749e-07, + "loss": 0.6133, + "step": 62384 + }, + { + "epoch": 1.6, + "learning_rate": 9.417866236758625e-07, + "loss": 0.7559, + "step": 62385 + }, + { + "epoch": 1.6, + "learning_rate": 9.417590001688215e-07, + "loss": 0.6699, + "step": 62386 + }, + { + "epoch": 1.6, + "learning_rate": 9.417313767063728e-07, + "loss": 0.6064, + "step": 62387 + }, + { + "epoch": 1.6, + "learning_rate": 9.417037532885385e-07, + "loss": 0.4929, + "step": 62388 + }, + { + "epoch": 1.6, + "learning_rate": 9.41676129915338e-07, + "loss": 0.6895, + "step": 62389 + }, + { + "epoch": 1.6, + "learning_rate": 9.416485065867939e-07, + "loss": 0.6719, + "step": 62390 + }, + { + "epoch": 1.6, + "learning_rate": 9.416208833029266e-07, + "loss": 0.4021, + "step": 62391 + }, + { + "epoch": 1.6, + "learning_rate": 9.415932600637576e-07, + "loss": 0.5247, + "step": 62392 + }, + { + "epoch": 1.6, + "learning_rate": 9.415656368693078e-07, + "loss": 0.7705, + "step": 62393 + }, + { + "epoch": 1.6, + "learning_rate": 9.415380137195987e-07, + "loss": 0.5725, + "step": 62394 + }, + { + "epoch": 1.6, + "learning_rate": 9.41510390614651e-07, + "loss": 0.644, + "step": 62395 + }, + { + "epoch": 1.6, + "learning_rate": 9.414827675544865e-07, + "loss": 0.5498, + "step": 62396 + }, + { + "epoch": 1.6, + "learning_rate": 9.414551445391256e-07, + "loss": 0.7432, + "step": 62397 + }, + { + "epoch": 1.6, + "learning_rate": 9.414275215685903e-07, + "loss": 0.749, + "step": 62398 + }, + { + "epoch": 1.6, + "learning_rate": 9.413998986429009e-07, + "loss": 0.6328, + "step": 62399 + }, + { + "epoch": 1.6, + "learning_rate": 9.413722757620789e-07, + "loss": 0.6904, + "step": 62400 + }, + { + "epoch": 1.6, + "learning_rate": 9.413446529261455e-07, + "loss": 0.6855, + "step": 62401 + }, + { + "epoch": 1.6, + "learning_rate": 9.413170301351217e-07, + "loss": 0.5386, + "step": 62402 + }, + { + "epoch": 1.6, + "learning_rate": 9.412894073890289e-07, + "loss": 0.6606, + "step": 62403 + }, + { + "epoch": 1.6, + "learning_rate": 9.412617846878879e-07, + "loss": 0.6729, + "step": 62404 + }, + { + "epoch": 1.6, + "learning_rate": 9.412341620317201e-07, + "loss": 0.7998, + "step": 62405 + }, + { + "epoch": 1.6, + "learning_rate": 9.412065394205467e-07, + "loss": 0.7598, + "step": 62406 + }, + { + "epoch": 1.6, + "learning_rate": 9.411789168543887e-07, + "loss": 0.5032, + "step": 62407 + }, + { + "epoch": 1.6, + "learning_rate": 9.411512943332677e-07, + "loss": 0.6104, + "step": 62408 + }, + { + "epoch": 1.6, + "learning_rate": 9.411236718572041e-07, + "loss": 0.7578, + "step": 62409 + }, + { + "epoch": 1.6, + "learning_rate": 9.410960494262192e-07, + "loss": 0.5389, + "step": 62410 + }, + { + "epoch": 1.6, + "learning_rate": 9.410684270403347e-07, + "loss": 0.7188, + "step": 62411 + }, + { + "epoch": 1.6, + "learning_rate": 9.41040804699571e-07, + "loss": 0.7129, + "step": 62412 + }, + { + "epoch": 1.6, + "learning_rate": 9.4101318240395e-07, + "loss": 0.6357, + "step": 62413 + }, + { + "epoch": 1.6, + "learning_rate": 9.409855601534922e-07, + "loss": 0.666, + "step": 62414 + }, + { + "epoch": 1.6, + "learning_rate": 9.409579379482192e-07, + "loss": 0.584, + "step": 62415 + }, + { + "epoch": 1.6, + "learning_rate": 9.409303157881519e-07, + "loss": 0.791, + "step": 62416 + }, + { + "epoch": 1.6, + "learning_rate": 9.409026936733117e-07, + "loss": 0.6216, + "step": 62417 + }, + { + "epoch": 1.6, + "learning_rate": 9.408750716037198e-07, + "loss": 0.4746, + "step": 62418 + }, + { + "epoch": 1.6, + "learning_rate": 9.408474495793968e-07, + "loss": 0.7046, + "step": 62419 + }, + { + "epoch": 1.6, + "learning_rate": 9.408198276003642e-07, + "loss": 0.7314, + "step": 62420 + }, + { + "epoch": 1.6, + "learning_rate": 9.40792205666643e-07, + "loss": 0.562, + "step": 62421 + }, + { + "epoch": 1.6, + "learning_rate": 9.407645837782548e-07, + "loss": 0.627, + "step": 62422 + }, + { + "epoch": 1.6, + "learning_rate": 9.407369619352203e-07, + "loss": 0.6211, + "step": 62423 + }, + { + "epoch": 1.6, + "learning_rate": 9.407093401375607e-07, + "loss": 0.8408, + "step": 62424 + }, + { + "epoch": 1.6, + "learning_rate": 9.406817183852975e-07, + "loss": 0.6602, + "step": 62425 + }, + { + "epoch": 1.6, + "learning_rate": 9.406540966784512e-07, + "loss": 0.6953, + "step": 62426 + }, + { + "epoch": 1.6, + "learning_rate": 9.406264750170436e-07, + "loss": 0.5596, + "step": 62427 + }, + { + "epoch": 1.6, + "learning_rate": 9.405988534010958e-07, + "loss": 0.6699, + "step": 62428 + }, + { + "epoch": 1.6, + "learning_rate": 9.405712318306283e-07, + "loss": 0.6392, + "step": 62429 + }, + { + "epoch": 1.6, + "learning_rate": 9.40543610305663e-07, + "loss": 0.6182, + "step": 62430 + }, + { + "epoch": 1.6, + "learning_rate": 9.405159888262203e-07, + "loss": 0.6357, + "step": 62431 + }, + { + "epoch": 1.6, + "learning_rate": 9.40488367392322e-07, + "loss": 0.6846, + "step": 62432 + }, + { + "epoch": 1.6, + "learning_rate": 9.404607460039889e-07, + "loss": 0.5879, + "step": 62433 + }, + { + "epoch": 1.6, + "learning_rate": 9.404331246612425e-07, + "loss": 0.582, + "step": 62434 + }, + { + "epoch": 1.6, + "learning_rate": 9.404055033641036e-07, + "loss": 0.3972, + "step": 62435 + }, + { + "epoch": 1.6, + "learning_rate": 9.403778821125935e-07, + "loss": 0.6475, + "step": 62436 + }, + { + "epoch": 1.6, + "learning_rate": 9.403502609067331e-07, + "loss": 0.4285, + "step": 62437 + }, + { + "epoch": 1.6, + "learning_rate": 9.403226397465442e-07, + "loss": 0.5962, + "step": 62438 + }, + { + "epoch": 1.6, + "learning_rate": 9.402950186320474e-07, + "loss": 0.4026, + "step": 62439 + }, + { + "epoch": 1.6, + "learning_rate": 9.402673975632637e-07, + "loss": 0.7041, + "step": 62440 + }, + { + "epoch": 1.6, + "learning_rate": 9.402397765402147e-07, + "loss": 0.5796, + "step": 62441 + }, + { + "epoch": 1.6, + "learning_rate": 9.402121555629214e-07, + "loss": 0.6147, + "step": 62442 + }, + { + "epoch": 1.6, + "learning_rate": 9.401845346314046e-07, + "loss": 0.6128, + "step": 62443 + }, + { + "epoch": 1.6, + "learning_rate": 9.401569137456861e-07, + "loss": 0.7412, + "step": 62444 + }, + { + "epoch": 1.6, + "learning_rate": 9.401292929057864e-07, + "loss": 0.6597, + "step": 62445 + }, + { + "epoch": 1.6, + "learning_rate": 9.401016721117271e-07, + "loss": 0.5869, + "step": 62446 + }, + { + "epoch": 1.6, + "learning_rate": 9.40074051363529e-07, + "loss": 0.6069, + "step": 62447 + }, + { + "epoch": 1.6, + "learning_rate": 9.40046430661214e-07, + "loss": 0.708, + "step": 62448 + }, + { + "epoch": 1.6, + "learning_rate": 9.400188100048024e-07, + "loss": 0.3684, + "step": 62449 + }, + { + "epoch": 1.6, + "learning_rate": 9.399911893943154e-07, + "loss": 0.5663, + "step": 62450 + }, + { + "epoch": 1.6, + "learning_rate": 9.399635688297746e-07, + "loss": 0.5349, + "step": 62451 + }, + { + "epoch": 1.6, + "learning_rate": 9.399359483112008e-07, + "loss": 0.4644, + "step": 62452 + }, + { + "epoch": 1.6, + "learning_rate": 9.399083278386154e-07, + "loss": 0.7056, + "step": 62453 + }, + { + "epoch": 1.6, + "learning_rate": 9.398807074120393e-07, + "loss": 0.3629, + "step": 62454 + }, + { + "epoch": 1.6, + "learning_rate": 9.398530870314939e-07, + "loss": 0.6465, + "step": 62455 + }, + { + "epoch": 1.6, + "learning_rate": 9.39825466697e-07, + "loss": 0.7393, + "step": 62456 + }, + { + "epoch": 1.6, + "learning_rate": 9.397978464085793e-07, + "loss": 0.605, + "step": 62457 + }, + { + "epoch": 1.6, + "learning_rate": 9.397702261662527e-07, + "loss": 0.5293, + "step": 62458 + }, + { + "epoch": 1.6, + "learning_rate": 9.397426059700412e-07, + "loss": 0.4128, + "step": 62459 + }, + { + "epoch": 1.6, + "learning_rate": 9.397149858199658e-07, + "loss": 0.5996, + "step": 62460 + }, + { + "epoch": 1.6, + "learning_rate": 9.39687365716048e-07, + "loss": 0.6099, + "step": 62461 + }, + { + "epoch": 1.6, + "learning_rate": 9.396597456583087e-07, + "loss": 0.7441, + "step": 62462 + }, + { + "epoch": 1.6, + "learning_rate": 9.396321256467692e-07, + "loss": 0.5566, + "step": 62463 + }, + { + "epoch": 1.6, + "learning_rate": 9.396045056814504e-07, + "loss": 0.5537, + "step": 62464 + }, + { + "epoch": 1.6, + "learning_rate": 9.39576885762374e-07, + "loss": 0.4681, + "step": 62465 + }, + { + "epoch": 1.6, + "learning_rate": 9.395492658895605e-07, + "loss": 0.5273, + "step": 62466 + }, + { + "epoch": 1.6, + "learning_rate": 9.395216460630317e-07, + "loss": 0.7822, + "step": 62467 + }, + { + "epoch": 1.6, + "learning_rate": 9.394940262828084e-07, + "loss": 0.7217, + "step": 62468 + }, + { + "epoch": 1.6, + "learning_rate": 9.394664065489114e-07, + "loss": 0.6436, + "step": 62469 + }, + { + "epoch": 1.6, + "learning_rate": 9.394387868613625e-07, + "loss": 0.5035, + "step": 62470 + }, + { + "epoch": 1.6, + "learning_rate": 9.394111672201822e-07, + "loss": 0.8418, + "step": 62471 + }, + { + "epoch": 1.6, + "learning_rate": 9.393835476253922e-07, + "loss": 0.6084, + "step": 62472 + }, + { + "epoch": 1.6, + "learning_rate": 9.393559280770133e-07, + "loss": 0.5776, + "step": 62473 + }, + { + "epoch": 1.6, + "learning_rate": 9.393283085750669e-07, + "loss": 0.709, + "step": 62474 + }, + { + "epoch": 1.6, + "learning_rate": 9.393006891195739e-07, + "loss": 0.7578, + "step": 62475 + }, + { + "epoch": 1.6, + "learning_rate": 9.392730697105558e-07, + "loss": 0.5972, + "step": 62476 + }, + { + "epoch": 1.6, + "learning_rate": 9.392454503480332e-07, + "loss": 0.7529, + "step": 62477 + }, + { + "epoch": 1.6, + "learning_rate": 9.392178310320283e-07, + "loss": 0.7344, + "step": 62478 + }, + { + "epoch": 1.6, + "learning_rate": 9.391902117625608e-07, + "loss": 0.4397, + "step": 62479 + }, + { + "epoch": 1.6, + "learning_rate": 9.391625925396527e-07, + "loss": 0.5405, + "step": 62480 + }, + { + "epoch": 1.6, + "learning_rate": 9.391349733633249e-07, + "loss": 0.7588, + "step": 62481 + }, + { + "epoch": 1.6, + "learning_rate": 9.391073542335989e-07, + "loss": 0.6133, + "step": 62482 + }, + { + "epoch": 1.6, + "learning_rate": 9.390797351504953e-07, + "loss": 0.4644, + "step": 62483 + }, + { + "epoch": 1.6, + "learning_rate": 9.390521161140358e-07, + "loss": 0.5037, + "step": 62484 + }, + { + "epoch": 1.6, + "learning_rate": 9.390244971242411e-07, + "loss": 0.6484, + "step": 62485 + }, + { + "epoch": 1.6, + "learning_rate": 9.389968781811327e-07, + "loss": 0.5459, + "step": 62486 + }, + { + "epoch": 1.6, + "learning_rate": 9.389692592847314e-07, + "loss": 0.6768, + "step": 62487 + }, + { + "epoch": 1.6, + "learning_rate": 9.38941640435059e-07, + "loss": 0.6689, + "step": 62488 + }, + { + "epoch": 1.6, + "learning_rate": 9.389140216321359e-07, + "loss": 0.6777, + "step": 62489 + }, + { + "epoch": 1.6, + "learning_rate": 9.388864028759833e-07, + "loss": 0.6616, + "step": 62490 + }, + { + "epoch": 1.6, + "learning_rate": 9.388587841666228e-07, + "loss": 0.4568, + "step": 62491 + }, + { + "epoch": 1.6, + "learning_rate": 9.388311655040751e-07, + "loss": 0.5425, + "step": 62492 + }, + { + "epoch": 1.6, + "learning_rate": 9.388035468883619e-07, + "loss": 0.7109, + "step": 62493 + }, + { + "epoch": 1.6, + "learning_rate": 9.387759283195036e-07, + "loss": 0.5532, + "step": 62494 + }, + { + "epoch": 1.6, + "learning_rate": 9.387483097975221e-07, + "loss": 0.6431, + "step": 62495 + }, + { + "epoch": 1.6, + "learning_rate": 9.387206913224379e-07, + "loss": 0.5234, + "step": 62496 + }, + { + "epoch": 1.6, + "learning_rate": 9.386930728942728e-07, + "loss": 0.5605, + "step": 62497 + }, + { + "epoch": 1.6, + "learning_rate": 9.386654545130477e-07, + "loss": 0.646, + "step": 62498 + }, + { + "epoch": 1.6, + "learning_rate": 9.386378361787835e-07, + "loss": 0.5356, + "step": 62499 + }, + { + "epoch": 1.6, + "learning_rate": 9.386102178915012e-07, + "loss": 0.6792, + "step": 62500 + }, + { + "epoch": 1.6, + "learning_rate": 9.385825996512224e-07, + "loss": 0.6943, + "step": 62501 + }, + { + "epoch": 1.6, + "learning_rate": 9.38554981457968e-07, + "loss": 0.5645, + "step": 62502 + }, + { + "epoch": 1.6, + "learning_rate": 9.385273633117594e-07, + "loss": 0.6304, + "step": 62503 + }, + { + "epoch": 1.6, + "learning_rate": 9.384997452126174e-07, + "loss": 0.6113, + "step": 62504 + }, + { + "epoch": 1.6, + "learning_rate": 9.384721271605634e-07, + "loss": 0.6309, + "step": 62505 + }, + { + "epoch": 1.6, + "learning_rate": 9.384445091556184e-07, + "loss": 0.5864, + "step": 62506 + }, + { + "epoch": 1.6, + "learning_rate": 9.384168911978036e-07, + "loss": 0.676, + "step": 62507 + }, + { + "epoch": 1.6, + "learning_rate": 9.383892732871406e-07, + "loss": 0.4158, + "step": 62508 + }, + { + "epoch": 1.6, + "learning_rate": 9.383616554236496e-07, + "loss": 0.7144, + "step": 62509 + }, + { + "epoch": 1.6, + "learning_rate": 9.383340376073524e-07, + "loss": 0.5322, + "step": 62510 + }, + { + "epoch": 1.6, + "learning_rate": 9.383064198382697e-07, + "loss": 0.6182, + "step": 62511 + }, + { + "epoch": 1.6, + "learning_rate": 9.382788021164234e-07, + "loss": 0.5981, + "step": 62512 + }, + { + "epoch": 1.6, + "learning_rate": 9.382511844418338e-07, + "loss": 0.5715, + "step": 62513 + }, + { + "epoch": 1.6, + "learning_rate": 9.382235668145227e-07, + "loss": 0.7935, + "step": 62514 + }, + { + "epoch": 1.6, + "learning_rate": 9.381959492345109e-07, + "loss": 0.6465, + "step": 62515 + }, + { + "epoch": 1.6, + "learning_rate": 9.381683317018195e-07, + "loss": 0.6553, + "step": 62516 + }, + { + "epoch": 1.6, + "learning_rate": 9.381407142164699e-07, + "loss": 0.6301, + "step": 62517 + }, + { + "epoch": 1.6, + "learning_rate": 9.381130967784833e-07, + "loss": 0.6284, + "step": 62518 + }, + { + "epoch": 1.6, + "learning_rate": 9.380854793878804e-07, + "loss": 0.5215, + "step": 62519 + }, + { + "epoch": 1.6, + "learning_rate": 9.380578620446828e-07, + "loss": 0.4424, + "step": 62520 + }, + { + "epoch": 1.6, + "learning_rate": 9.380302447489111e-07, + "loss": 0.6348, + "step": 62521 + }, + { + "epoch": 1.6, + "learning_rate": 9.38002627500587e-07, + "loss": 0.606, + "step": 62522 + }, + { + "epoch": 1.6, + "learning_rate": 9.379750102997312e-07, + "loss": 0.6421, + "step": 62523 + }, + { + "epoch": 1.6, + "learning_rate": 9.379473931463655e-07, + "loss": 0.53, + "step": 62524 + }, + { + "epoch": 1.6, + "learning_rate": 9.379197760405102e-07, + "loss": 0.6221, + "step": 62525 + }, + { + "epoch": 1.6, + "learning_rate": 9.378921589821872e-07, + "loss": 0.4111, + "step": 62526 + }, + { + "epoch": 1.6, + "learning_rate": 9.37864541971417e-07, + "loss": 0.6475, + "step": 62527 + }, + { + "epoch": 1.6, + "learning_rate": 9.378369250082217e-07, + "loss": 0.7695, + "step": 62528 + }, + { + "epoch": 1.6, + "learning_rate": 9.378093080926215e-07, + "loss": 0.5835, + "step": 62529 + }, + { + "epoch": 1.6, + "learning_rate": 9.377816912246376e-07, + "loss": 0.6328, + "step": 62530 + }, + { + "epoch": 1.6, + "learning_rate": 9.377540744042916e-07, + "loss": 0.5903, + "step": 62531 + }, + { + "epoch": 1.6, + "learning_rate": 9.377264576316044e-07, + "loss": 0.8008, + "step": 62532 + }, + { + "epoch": 1.6, + "learning_rate": 9.37698840906597e-07, + "loss": 0.6807, + "step": 62533 + }, + { + "epoch": 1.6, + "learning_rate": 9.37671224229291e-07, + "loss": 0.4851, + "step": 62534 + }, + { + "epoch": 1.6, + "learning_rate": 9.376436075997071e-07, + "loss": 0.5444, + "step": 62535 + }, + { + "epoch": 1.6, + "learning_rate": 9.376159910178667e-07, + "loss": 0.5239, + "step": 62536 + }, + { + "epoch": 1.6, + "learning_rate": 9.375883744837907e-07, + "loss": 0.5977, + "step": 62537 + }, + { + "epoch": 1.6, + "learning_rate": 9.375607579975009e-07, + "loss": 0.623, + "step": 62538 + }, + { + "epoch": 1.6, + "learning_rate": 9.375331415590178e-07, + "loss": 0.4878, + "step": 62539 + }, + { + "epoch": 1.6, + "learning_rate": 9.375055251683624e-07, + "loss": 0.5181, + "step": 62540 + }, + { + "epoch": 1.6, + "learning_rate": 9.374779088255564e-07, + "loss": 0.6689, + "step": 62541 + }, + { + "epoch": 1.6, + "learning_rate": 9.374502925306203e-07, + "loss": 0.5703, + "step": 62542 + }, + { + "epoch": 1.6, + "learning_rate": 9.374226762835759e-07, + "loss": 0.47, + "step": 62543 + }, + { + "epoch": 1.6, + "learning_rate": 9.37395060084444e-07, + "loss": 0.7549, + "step": 62544 + }, + { + "epoch": 1.6, + "learning_rate": 9.37367443933246e-07, + "loss": 0.6943, + "step": 62545 + }, + { + "epoch": 1.6, + "learning_rate": 9.373398278300027e-07, + "loss": 0.7412, + "step": 62546 + }, + { + "epoch": 1.6, + "learning_rate": 9.373122117747356e-07, + "loss": 0.6158, + "step": 62547 + }, + { + "epoch": 1.6, + "learning_rate": 9.372845957674658e-07, + "loss": 0.4146, + "step": 62548 + }, + { + "epoch": 1.6, + "learning_rate": 9.372569798082142e-07, + "loss": 0.6045, + "step": 62549 + }, + { + "epoch": 1.6, + "learning_rate": 9.372293638970016e-07, + "loss": 0.5801, + "step": 62550 + }, + { + "epoch": 1.6, + "learning_rate": 9.3720174803385e-07, + "loss": 0.7646, + "step": 62551 + }, + { + "epoch": 1.6, + "learning_rate": 9.371741322187799e-07, + "loss": 0.541, + "step": 62552 + }, + { + "epoch": 1.6, + "learning_rate": 9.371465164518128e-07, + "loss": 0.5508, + "step": 62553 + }, + { + "epoch": 1.6, + "learning_rate": 9.371189007329696e-07, + "loss": 0.7441, + "step": 62554 + }, + { + "epoch": 1.6, + "learning_rate": 9.370912850622719e-07, + "loss": 0.8262, + "step": 62555 + }, + { + "epoch": 1.6, + "learning_rate": 9.370636694397401e-07, + "loss": 0.5229, + "step": 62556 + }, + { + "epoch": 1.6, + "learning_rate": 9.370360538653961e-07, + "loss": 0.6157, + "step": 62557 + }, + { + "epoch": 1.6, + "learning_rate": 9.370084383392608e-07, + "loss": 0.6113, + "step": 62558 + }, + { + "epoch": 1.6, + "learning_rate": 9.369808228613548e-07, + "loss": 0.5513, + "step": 62559 + }, + { + "epoch": 1.6, + "learning_rate": 9.369532074316999e-07, + "loss": 0.4302, + "step": 62560 + }, + { + "epoch": 1.6, + "learning_rate": 9.36925592050317e-07, + "loss": 0.6509, + "step": 62561 + }, + { + "epoch": 1.6, + "learning_rate": 9.368979767172272e-07, + "loss": 0.8359, + "step": 62562 + }, + { + "epoch": 1.6, + "learning_rate": 9.368703614324518e-07, + "loss": 0.752, + "step": 62563 + }, + { + "epoch": 1.6, + "learning_rate": 9.368427461960119e-07, + "loss": 0.4971, + "step": 62564 + }, + { + "epoch": 1.6, + "learning_rate": 9.368151310079285e-07, + "loss": 0.791, + "step": 62565 + }, + { + "epoch": 1.6, + "learning_rate": 9.36787515868223e-07, + "loss": 0.6934, + "step": 62566 + }, + { + "epoch": 1.6, + "learning_rate": 9.367599007769161e-07, + "loss": 0.6992, + "step": 62567 + }, + { + "epoch": 1.6, + "learning_rate": 9.367322857340299e-07, + "loss": 0.8164, + "step": 62568 + }, + { + "epoch": 1.6, + "learning_rate": 9.367046707395843e-07, + "loss": 0.5947, + "step": 62569 + }, + { + "epoch": 1.6, + "learning_rate": 9.366770557936012e-07, + "loss": 0.6045, + "step": 62570 + }, + { + "epoch": 1.6, + "learning_rate": 9.366494408961014e-07, + "loss": 0.6265, + "step": 62571 + }, + { + "epoch": 1.6, + "learning_rate": 9.366218260471064e-07, + "loss": 0.7871, + "step": 62572 + }, + { + "epoch": 1.6, + "learning_rate": 9.36594211246637e-07, + "loss": 0.749, + "step": 62573 + }, + { + "epoch": 1.6, + "learning_rate": 9.365665964947146e-07, + "loss": 0.5723, + "step": 62574 + }, + { + "epoch": 1.6, + "learning_rate": 9.3653898179136e-07, + "loss": 0.5381, + "step": 62575 + }, + { + "epoch": 1.6, + "learning_rate": 9.36511367136595e-07, + "loss": 0.6265, + "step": 62576 + }, + { + "epoch": 1.6, + "learning_rate": 9.3648375253044e-07, + "loss": 0.6387, + "step": 62577 + }, + { + "epoch": 1.6, + "learning_rate": 9.364561379729167e-07, + "loss": 0.7891, + "step": 62578 + }, + { + "epoch": 1.6, + "learning_rate": 9.364285234640461e-07, + "loss": 0.6294, + "step": 62579 + }, + { + "epoch": 1.6, + "learning_rate": 9.36400909003849e-07, + "loss": 0.5088, + "step": 62580 + }, + { + "epoch": 1.6, + "learning_rate": 9.363732945923469e-07, + "loss": 0.5864, + "step": 62581 + }, + { + "epoch": 1.6, + "learning_rate": 9.363456802295606e-07, + "loss": 0.5786, + "step": 62582 + }, + { + "epoch": 1.6, + "learning_rate": 9.363180659155119e-07, + "loss": 0.6416, + "step": 62583 + }, + { + "epoch": 1.6, + "learning_rate": 9.362904516502212e-07, + "loss": 0.564, + "step": 62584 + }, + { + "epoch": 1.6, + "learning_rate": 9.3626283743371e-07, + "loss": 0.7695, + "step": 62585 + }, + { + "epoch": 1.6, + "learning_rate": 9.362352232659995e-07, + "loss": 0.5354, + "step": 62586 + }, + { + "epoch": 1.6, + "learning_rate": 9.362076091471109e-07, + "loss": 0.6841, + "step": 62587 + }, + { + "epoch": 1.6, + "learning_rate": 9.361799950770653e-07, + "loss": 0.5435, + "step": 62588 + }, + { + "epoch": 1.6, + "learning_rate": 9.361523810558836e-07, + "loss": 0.7139, + "step": 62589 + }, + { + "epoch": 1.6, + "learning_rate": 9.361247670835868e-07, + "loss": 0.5889, + "step": 62590 + }, + { + "epoch": 1.6, + "learning_rate": 9.360971531601967e-07, + "loss": 0.6133, + "step": 62591 + }, + { + "epoch": 1.6, + "learning_rate": 9.360695392857336e-07, + "loss": 0.3765, + "step": 62592 + }, + { + "epoch": 1.6, + "learning_rate": 9.360419254602195e-07, + "loss": 0.6992, + "step": 62593 + }, + { + "epoch": 1.6, + "learning_rate": 9.36014311683675e-07, + "loss": 0.5952, + "step": 62594 + }, + { + "epoch": 1.6, + "learning_rate": 9.359866979561215e-07, + "loss": 0.6895, + "step": 62595 + }, + { + "epoch": 1.6, + "learning_rate": 9.359590842775798e-07, + "loss": 0.6899, + "step": 62596 + }, + { + "epoch": 1.6, + "learning_rate": 9.359314706480716e-07, + "loss": 0.708, + "step": 62597 + }, + { + "epoch": 1.6, + "learning_rate": 9.35903857067618e-07, + "loss": 0.4442, + "step": 62598 + }, + { + "epoch": 1.6, + "learning_rate": 9.358762435362393e-07, + "loss": 0.6421, + "step": 62599 + }, + { + "epoch": 1.6, + "learning_rate": 9.358486300539575e-07, + "loss": 0.4393, + "step": 62600 + }, + { + "epoch": 1.6, + "learning_rate": 9.358210166207932e-07, + "loss": 0.7256, + "step": 62601 + }, + { + "epoch": 1.6, + "learning_rate": 9.35793403236768e-07, + "loss": 0.6309, + "step": 62602 + }, + { + "epoch": 1.6, + "learning_rate": 9.357657899019027e-07, + "loss": 0.7549, + "step": 62603 + }, + { + "epoch": 1.6, + "learning_rate": 9.357381766162187e-07, + "loss": 0.6938, + "step": 62604 + }, + { + "epoch": 1.6, + "learning_rate": 9.357105633797371e-07, + "loss": 0.6895, + "step": 62605 + }, + { + "epoch": 1.6, + "learning_rate": 9.356829501924788e-07, + "loss": 0.521, + "step": 62606 + }, + { + "epoch": 1.6, + "learning_rate": 9.356553370544653e-07, + "loss": 0.7261, + "step": 62607 + }, + { + "epoch": 1.6, + "learning_rate": 9.356277239657176e-07, + "loss": 0.7461, + "step": 62608 + }, + { + "epoch": 1.6, + "learning_rate": 9.356001109262564e-07, + "loss": 0.4991, + "step": 62609 + }, + { + "epoch": 1.6, + "learning_rate": 9.355724979361036e-07, + "loss": 0.6528, + "step": 62610 + }, + { + "epoch": 1.6, + "learning_rate": 9.355448849952797e-07, + "loss": 0.6743, + "step": 62611 + }, + { + "epoch": 1.6, + "learning_rate": 9.355172721038063e-07, + "loss": 0.3672, + "step": 62612 + }, + { + "epoch": 1.6, + "learning_rate": 9.354896592617041e-07, + "loss": 0.7217, + "step": 62613 + }, + { + "epoch": 1.6, + "learning_rate": 9.354620464689949e-07, + "loss": 0.6743, + "step": 62614 + }, + { + "epoch": 1.6, + "learning_rate": 9.35434433725699e-07, + "loss": 0.8545, + "step": 62615 + }, + { + "epoch": 1.6, + "learning_rate": 9.354068210318383e-07, + "loss": 0.6543, + "step": 62616 + }, + { + "epoch": 1.6, + "learning_rate": 9.353792083874334e-07, + "loss": 0.4402, + "step": 62617 + }, + { + "epoch": 1.6, + "learning_rate": 9.353515957925061e-07, + "loss": 0.6963, + "step": 62618 + }, + { + "epoch": 1.6, + "learning_rate": 9.35323983247077e-07, + "loss": 0.5459, + "step": 62619 + }, + { + "epoch": 1.6, + "learning_rate": 9.35296370751167e-07, + "loss": 0.666, + "step": 62620 + }, + { + "epoch": 1.61, + "learning_rate": 9.352687583047978e-07, + "loss": 0.8037, + "step": 62621 + }, + { + "epoch": 1.61, + "learning_rate": 9.352411459079904e-07, + "loss": 0.6914, + "step": 62622 + }, + { + "epoch": 1.61, + "learning_rate": 9.352135335607657e-07, + "loss": 0.48, + "step": 62623 + }, + { + "epoch": 1.61, + "learning_rate": 9.351859212631452e-07, + "loss": 0.6001, + "step": 62624 + }, + { + "epoch": 1.61, + "learning_rate": 9.351583090151496e-07, + "loss": 0.6316, + "step": 62625 + }, + { + "epoch": 1.61, + "learning_rate": 9.351306968168006e-07, + "loss": 0.6533, + "step": 62626 + }, + { + "epoch": 1.61, + "learning_rate": 9.351030846681187e-07, + "loss": 0.5764, + "step": 62627 + }, + { + "epoch": 1.61, + "learning_rate": 9.350754725691259e-07, + "loss": 0.7617, + "step": 62628 + }, + { + "epoch": 1.61, + "learning_rate": 9.350478605198427e-07, + "loss": 0.749, + "step": 62629 + }, + { + "epoch": 1.61, + "learning_rate": 9.3502024852029e-07, + "loss": 0.7041, + "step": 62630 + }, + { + "epoch": 1.61, + "learning_rate": 9.349926365704895e-07, + "loss": 0.6895, + "step": 62631 + }, + { + "epoch": 1.61, + "learning_rate": 9.349650246704622e-07, + "loss": 0.5076, + "step": 62632 + }, + { + "epoch": 1.61, + "learning_rate": 9.349374128202291e-07, + "loss": 0.6187, + "step": 62633 + }, + { + "epoch": 1.61, + "learning_rate": 9.349098010198113e-07, + "loss": 0.647, + "step": 62634 + }, + { + "epoch": 1.61, + "learning_rate": 9.348821892692304e-07, + "loss": 0.4836, + "step": 62635 + }, + { + "epoch": 1.61, + "learning_rate": 9.348545775685068e-07, + "loss": 0.6357, + "step": 62636 + }, + { + "epoch": 1.61, + "learning_rate": 9.348269659176624e-07, + "loss": 0.5806, + "step": 62637 + }, + { + "epoch": 1.61, + "learning_rate": 9.347993543167182e-07, + "loss": 0.4961, + "step": 62638 + }, + { + "epoch": 1.61, + "learning_rate": 9.347717427656949e-07, + "loss": 0.5923, + "step": 62639 + }, + { + "epoch": 1.61, + "learning_rate": 9.347441312646137e-07, + "loss": 0.4724, + "step": 62640 + }, + { + "epoch": 1.61, + "learning_rate": 9.347165198134961e-07, + "loss": 0.7021, + "step": 62641 + }, + { + "epoch": 1.61, + "learning_rate": 9.346889084123629e-07, + "loss": 0.5493, + "step": 62642 + }, + { + "epoch": 1.61, + "learning_rate": 9.346612970612355e-07, + "loss": 0.6558, + "step": 62643 + }, + { + "epoch": 1.61, + "learning_rate": 9.346336857601349e-07, + "loss": 0.6484, + "step": 62644 + }, + { + "epoch": 1.61, + "learning_rate": 9.346060745090824e-07, + "loss": 0.5571, + "step": 62645 + }, + { + "epoch": 1.61, + "learning_rate": 9.345784633080987e-07, + "loss": 0.6675, + "step": 62646 + }, + { + "epoch": 1.61, + "learning_rate": 9.345508521572059e-07, + "loss": 0.4613, + "step": 62647 + }, + { + "epoch": 1.61, + "learning_rate": 9.345232410564241e-07, + "loss": 0.7056, + "step": 62648 + }, + { + "epoch": 1.61, + "learning_rate": 9.344956300057747e-07, + "loss": 0.4182, + "step": 62649 + }, + { + "epoch": 1.61, + "learning_rate": 9.344680190052793e-07, + "loss": 0.5493, + "step": 62650 + }, + { + "epoch": 1.61, + "learning_rate": 9.344404080549584e-07, + "loss": 0.6792, + "step": 62651 + }, + { + "epoch": 1.61, + "learning_rate": 9.344127971548336e-07, + "loss": 0.7104, + "step": 62652 + }, + { + "epoch": 1.61, + "learning_rate": 9.343851863049259e-07, + "loss": 0.519, + "step": 62653 + }, + { + "epoch": 1.61, + "learning_rate": 9.343575755052565e-07, + "loss": 0.4983, + "step": 62654 + }, + { + "epoch": 1.61, + "learning_rate": 9.343299647558463e-07, + "loss": 0.7021, + "step": 62655 + }, + { + "epoch": 1.61, + "learning_rate": 9.343023540567169e-07, + "loss": 0.6777, + "step": 62656 + }, + { + "epoch": 1.61, + "learning_rate": 9.342747434078894e-07, + "loss": 0.6206, + "step": 62657 + }, + { + "epoch": 1.61, + "learning_rate": 9.342471328093844e-07, + "loss": 0.6729, + "step": 62658 + }, + { + "epoch": 1.61, + "learning_rate": 9.342195222612231e-07, + "loss": 0.7607, + "step": 62659 + }, + { + "epoch": 1.61, + "learning_rate": 9.341919117634272e-07, + "loss": 0.7656, + "step": 62660 + }, + { + "epoch": 1.61, + "learning_rate": 9.341643013160173e-07, + "loss": 0.7715, + "step": 62661 + }, + { + "epoch": 1.61, + "learning_rate": 9.34136690919015e-07, + "loss": 0.6606, + "step": 62662 + }, + { + "epoch": 1.61, + "learning_rate": 9.341090805724408e-07, + "loss": 0.5261, + "step": 62663 + }, + { + "epoch": 1.61, + "learning_rate": 9.340814702763166e-07, + "loss": 0.3267, + "step": 62664 + }, + { + "epoch": 1.61, + "learning_rate": 9.340538600306631e-07, + "loss": 0.5103, + "step": 62665 + }, + { + "epoch": 1.61, + "learning_rate": 9.340262498355016e-07, + "loss": 0.6133, + "step": 62666 + }, + { + "epoch": 1.61, + "learning_rate": 9.339986396908534e-07, + "loss": 0.5127, + "step": 62667 + }, + { + "epoch": 1.61, + "learning_rate": 9.33971029596739e-07, + "loss": 0.6108, + "step": 62668 + }, + { + "epoch": 1.61, + "learning_rate": 9.339434195531802e-07, + "loss": 0.5061, + "step": 62669 + }, + { + "epoch": 1.61, + "learning_rate": 9.339158095601977e-07, + "loss": 0.624, + "step": 62670 + }, + { + "epoch": 1.61, + "learning_rate": 9.33888199617813e-07, + "loss": 0.624, + "step": 62671 + }, + { + "epoch": 1.61, + "learning_rate": 9.338605897260467e-07, + "loss": 0.7139, + "step": 62672 + }, + { + "epoch": 1.61, + "learning_rate": 9.338329798849207e-07, + "loss": 0.6592, + "step": 62673 + }, + { + "epoch": 1.61, + "learning_rate": 9.338053700944554e-07, + "loss": 0.707, + "step": 62674 + }, + { + "epoch": 1.61, + "learning_rate": 9.337777603546726e-07, + "loss": 0.6606, + "step": 62675 + }, + { + "epoch": 1.61, + "learning_rate": 9.337501506655928e-07, + "loss": 0.6621, + "step": 62676 + }, + { + "epoch": 1.61, + "learning_rate": 9.337225410272382e-07, + "loss": 0.623, + "step": 62677 + }, + { + "epoch": 1.61, + "learning_rate": 9.336949314396286e-07, + "loss": 0.5532, + "step": 62678 + }, + { + "epoch": 1.61, + "learning_rate": 9.336673219027858e-07, + "loss": 0.5476, + "step": 62679 + }, + { + "epoch": 1.61, + "learning_rate": 9.336397124167309e-07, + "loss": 0.4976, + "step": 62680 + }, + { + "epoch": 1.61, + "learning_rate": 9.33612102981485e-07, + "loss": 0.7046, + "step": 62681 + }, + { + "epoch": 1.61, + "learning_rate": 9.335844935970691e-07, + "loss": 0.7236, + "step": 62682 + }, + { + "epoch": 1.61, + "learning_rate": 9.335568842635049e-07, + "loss": 0.6846, + "step": 62683 + }, + { + "epoch": 1.61, + "learning_rate": 9.335292749808127e-07, + "loss": 0.8428, + "step": 62684 + }, + { + "epoch": 1.61, + "learning_rate": 9.335016657490144e-07, + "loss": 0.6055, + "step": 62685 + }, + { + "epoch": 1.61, + "learning_rate": 9.334740565681306e-07, + "loss": 0.6953, + "step": 62686 + }, + { + "epoch": 1.61, + "learning_rate": 9.33446447438183e-07, + "loss": 0.4355, + "step": 62687 + }, + { + "epoch": 1.61, + "learning_rate": 9.334188383591923e-07, + "loss": 0.561, + "step": 62688 + }, + { + "epoch": 1.61, + "learning_rate": 9.333912293311794e-07, + "loss": 0.6611, + "step": 62689 + }, + { + "epoch": 1.61, + "learning_rate": 9.333636203541662e-07, + "loss": 0.6826, + "step": 62690 + }, + { + "epoch": 1.61, + "learning_rate": 9.333360114281729e-07, + "loss": 0.6401, + "step": 62691 + }, + { + "epoch": 1.61, + "learning_rate": 9.333084025532216e-07, + "loss": 0.6318, + "step": 62692 + }, + { + "epoch": 1.61, + "learning_rate": 9.332807937293327e-07, + "loss": 0.4622, + "step": 62693 + }, + { + "epoch": 1.61, + "learning_rate": 9.332531849565279e-07, + "loss": 0.5474, + "step": 62694 + }, + { + "epoch": 1.61, + "learning_rate": 9.332255762348279e-07, + "loss": 0.7715, + "step": 62695 + }, + { + "epoch": 1.61, + "learning_rate": 9.331979675642538e-07, + "loss": 0.4868, + "step": 62696 + }, + { + "epoch": 1.61, + "learning_rate": 9.331703589448275e-07, + "loss": 0.6294, + "step": 62697 + }, + { + "epoch": 1.61, + "learning_rate": 9.331427503765694e-07, + "loss": 0.5947, + "step": 62698 + }, + { + "epoch": 1.61, + "learning_rate": 9.331151418595005e-07, + "loss": 0.7324, + "step": 62699 + }, + { + "epoch": 1.61, + "learning_rate": 9.330875333936426e-07, + "loss": 0.7217, + "step": 62700 + }, + { + "epoch": 1.61, + "learning_rate": 9.33059924979016e-07, + "loss": 0.6509, + "step": 62701 + }, + { + "epoch": 1.61, + "learning_rate": 9.330323166156428e-07, + "loss": 0.7227, + "step": 62702 + }, + { + "epoch": 1.61, + "learning_rate": 9.330047083035435e-07, + "loss": 0.6133, + "step": 62703 + }, + { + "epoch": 1.61, + "learning_rate": 9.329771000427395e-07, + "loss": 0.6133, + "step": 62704 + }, + { + "epoch": 1.61, + "learning_rate": 9.329494918332517e-07, + "loss": 0.6953, + "step": 62705 + }, + { + "epoch": 1.61, + "learning_rate": 9.329218836751016e-07, + "loss": 0.5986, + "step": 62706 + }, + { + "epoch": 1.61, + "learning_rate": 9.328942755683104e-07, + "loss": 0.5952, + "step": 62707 + }, + { + "epoch": 1.61, + "learning_rate": 9.328666675128985e-07, + "loss": 0.686, + "step": 62708 + }, + { + "epoch": 1.61, + "learning_rate": 9.328390595088877e-07, + "loss": 0.6445, + "step": 62709 + }, + { + "epoch": 1.61, + "learning_rate": 9.328114515562985e-07, + "loss": 0.5703, + "step": 62710 + }, + { + "epoch": 1.61, + "learning_rate": 9.32783843655153e-07, + "loss": 0.5803, + "step": 62711 + }, + { + "epoch": 1.61, + "learning_rate": 9.327562358054718e-07, + "loss": 0.5894, + "step": 62712 + }, + { + "epoch": 1.61, + "learning_rate": 9.327286280072757e-07, + "loss": 0.4177, + "step": 62713 + }, + { + "epoch": 1.61, + "learning_rate": 9.327010202605865e-07, + "loss": 0.6885, + "step": 62714 + }, + { + "epoch": 1.61, + "learning_rate": 9.326734125654249e-07, + "loss": 0.8569, + "step": 62715 + }, + { + "epoch": 1.61, + "learning_rate": 9.326458049218122e-07, + "loss": 0.814, + "step": 62716 + }, + { + "epoch": 1.61, + "learning_rate": 9.326181973297699e-07, + "loss": 0.7646, + "step": 62717 + }, + { + "epoch": 1.61, + "learning_rate": 9.325905897893182e-07, + "loss": 0.4868, + "step": 62718 + }, + { + "epoch": 1.61, + "learning_rate": 9.325629823004791e-07, + "loss": 0.6797, + "step": 62719 + }, + { + "epoch": 1.61, + "learning_rate": 9.325353748632731e-07, + "loss": 0.6084, + "step": 62720 + }, + { + "epoch": 1.61, + "learning_rate": 9.325077674777219e-07, + "loss": 0.6533, + "step": 62721 + }, + { + "epoch": 1.61, + "learning_rate": 9.324801601438462e-07, + "loss": 0.6963, + "step": 62722 + }, + { + "epoch": 1.61, + "learning_rate": 9.324525528616676e-07, + "loss": 0.5962, + "step": 62723 + }, + { + "epoch": 1.61, + "learning_rate": 9.324249456312066e-07, + "loss": 0.6626, + "step": 62724 + }, + { + "epoch": 1.61, + "learning_rate": 9.323973384524851e-07, + "loss": 0.542, + "step": 62725 + }, + { + "epoch": 1.61, + "learning_rate": 9.323697313255236e-07, + "loss": 0.5181, + "step": 62726 + }, + { + "epoch": 1.61, + "learning_rate": 9.32342124250344e-07, + "loss": 0.4622, + "step": 62727 + }, + { + "epoch": 1.61, + "learning_rate": 9.323145172269665e-07, + "loss": 0.6348, + "step": 62728 + }, + { + "epoch": 1.61, + "learning_rate": 9.322869102554128e-07, + "loss": 0.6245, + "step": 62729 + }, + { + "epoch": 1.61, + "learning_rate": 9.322593033357036e-07, + "loss": 0.6611, + "step": 62730 + }, + { + "epoch": 1.61, + "learning_rate": 9.322316964678607e-07, + "loss": 0.6553, + "step": 62731 + }, + { + "epoch": 1.61, + "learning_rate": 9.322040896519046e-07, + "loss": 0.5811, + "step": 62732 + }, + { + "epoch": 1.61, + "learning_rate": 9.321764828878567e-07, + "loss": 0.6284, + "step": 62733 + }, + { + "epoch": 1.61, + "learning_rate": 9.321488761757383e-07, + "loss": 0.627, + "step": 62734 + }, + { + "epoch": 1.61, + "learning_rate": 9.321212695155703e-07, + "loss": 0.7861, + "step": 62735 + }, + { + "epoch": 1.61, + "learning_rate": 9.320936629073739e-07, + "loss": 0.5027, + "step": 62736 + }, + { + "epoch": 1.61, + "learning_rate": 9.320660563511706e-07, + "loss": 0.7061, + "step": 62737 + }, + { + "epoch": 1.61, + "learning_rate": 9.32038449846981e-07, + "loss": 0.7041, + "step": 62738 + }, + { + "epoch": 1.61, + "learning_rate": 9.320108433948263e-07, + "loss": 0.5557, + "step": 62739 + }, + { + "epoch": 1.61, + "learning_rate": 9.319832369947279e-07, + "loss": 0.7275, + "step": 62740 + }, + { + "epoch": 1.61, + "learning_rate": 9.319556306467066e-07, + "loss": 0.5786, + "step": 62741 + }, + { + "epoch": 1.61, + "learning_rate": 9.319280243507839e-07, + "loss": 0.7295, + "step": 62742 + }, + { + "epoch": 1.61, + "learning_rate": 9.319004181069806e-07, + "loss": 0.668, + "step": 62743 + }, + { + "epoch": 1.61, + "learning_rate": 9.318728119153183e-07, + "loss": 0.6895, + "step": 62744 + }, + { + "epoch": 1.61, + "learning_rate": 9.318452057758176e-07, + "loss": 0.6226, + "step": 62745 + }, + { + "epoch": 1.61, + "learning_rate": 9.318175996885002e-07, + "loss": 0.791, + "step": 62746 + }, + { + "epoch": 1.61, + "learning_rate": 9.31789993653387e-07, + "loss": 0.5972, + "step": 62747 + }, + { + "epoch": 1.61, + "learning_rate": 9.317623876704988e-07, + "loss": 0.6533, + "step": 62748 + }, + { + "epoch": 1.61, + "learning_rate": 9.31734781739857e-07, + "loss": 0.6074, + "step": 62749 + }, + { + "epoch": 1.61, + "learning_rate": 9.317071758614828e-07, + "loss": 0.8213, + "step": 62750 + }, + { + "epoch": 1.61, + "learning_rate": 9.316795700353971e-07, + "loss": 0.4839, + "step": 62751 + }, + { + "epoch": 1.61, + "learning_rate": 9.316519642616214e-07, + "loss": 0.7002, + "step": 62752 + }, + { + "epoch": 1.61, + "learning_rate": 9.316243585401765e-07, + "loss": 0.7627, + "step": 62753 + }, + { + "epoch": 1.61, + "learning_rate": 9.315967528710839e-07, + "loss": 0.7822, + "step": 62754 + }, + { + "epoch": 1.61, + "learning_rate": 9.315691472543642e-07, + "loss": 0.5444, + "step": 62755 + }, + { + "epoch": 1.61, + "learning_rate": 9.315415416900392e-07, + "loss": 0.5405, + "step": 62756 + }, + { + "epoch": 1.61, + "learning_rate": 9.315139361781299e-07, + "loss": 0.6357, + "step": 62757 + }, + { + "epoch": 1.61, + "learning_rate": 9.314863307186567e-07, + "loss": 0.5566, + "step": 62758 + }, + { + "epoch": 1.61, + "learning_rate": 9.314587253116415e-07, + "loss": 0.6279, + "step": 62759 + }, + { + "epoch": 1.61, + "learning_rate": 9.31431119957105e-07, + "loss": 0.5298, + "step": 62760 + }, + { + "epoch": 1.61, + "learning_rate": 9.314035146550688e-07, + "loss": 0.6621, + "step": 62761 + }, + { + "epoch": 1.61, + "learning_rate": 9.313759094055535e-07, + "loss": 0.6465, + "step": 62762 + }, + { + "epoch": 1.61, + "learning_rate": 9.313483042085808e-07, + "loss": 0.6582, + "step": 62763 + }, + { + "epoch": 1.61, + "learning_rate": 9.313206990641713e-07, + "loss": 0.425, + "step": 62764 + }, + { + "epoch": 1.61, + "learning_rate": 9.312930939723465e-07, + "loss": 0.6097, + "step": 62765 + }, + { + "epoch": 1.61, + "learning_rate": 9.312654889331274e-07, + "loss": 0.5688, + "step": 62766 + }, + { + "epoch": 1.61, + "learning_rate": 9.312378839465357e-07, + "loss": 0.4829, + "step": 62767 + }, + { + "epoch": 1.61, + "learning_rate": 9.312102790125913e-07, + "loss": 0.8828, + "step": 62768 + }, + { + "epoch": 1.61, + "learning_rate": 9.311826741313164e-07, + "loss": 0.5918, + "step": 62769 + }, + { + "epoch": 1.61, + "learning_rate": 9.311550693027313e-07, + "loss": 0.7158, + "step": 62770 + }, + { + "epoch": 1.61, + "learning_rate": 9.311274645268579e-07, + "loss": 0.5869, + "step": 62771 + }, + { + "epoch": 1.61, + "learning_rate": 9.310998598037169e-07, + "loss": 0.6724, + "step": 62772 + }, + { + "epoch": 1.61, + "learning_rate": 9.310722551333298e-07, + "loss": 0.5237, + "step": 62773 + }, + { + "epoch": 1.61, + "learning_rate": 9.310446505157172e-07, + "loss": 0.6641, + "step": 62774 + }, + { + "epoch": 1.61, + "learning_rate": 9.310170459509008e-07, + "loss": 0.5486, + "step": 62775 + }, + { + "epoch": 1.61, + "learning_rate": 9.309894414389012e-07, + "loss": 0.7314, + "step": 62776 + }, + { + "epoch": 1.61, + "learning_rate": 9.309618369797403e-07, + "loss": 0.7148, + "step": 62777 + }, + { + "epoch": 1.61, + "learning_rate": 9.309342325734385e-07, + "loss": 0.5, + "step": 62778 + }, + { + "epoch": 1.61, + "learning_rate": 9.309066282200171e-07, + "loss": 0.5605, + "step": 62779 + }, + { + "epoch": 1.61, + "learning_rate": 9.308790239194973e-07, + "loss": 0.5811, + "step": 62780 + }, + { + "epoch": 1.61, + "learning_rate": 9.308514196719002e-07, + "loss": 0.625, + "step": 62781 + }, + { + "epoch": 1.61, + "learning_rate": 9.308238154772472e-07, + "loss": 0.7158, + "step": 62782 + }, + { + "epoch": 1.61, + "learning_rate": 9.30796211335559e-07, + "loss": 0.6465, + "step": 62783 + }, + { + "epoch": 1.61, + "learning_rate": 9.307686072468572e-07, + "loss": 0.5649, + "step": 62784 + }, + { + "epoch": 1.61, + "learning_rate": 9.307410032111626e-07, + "loss": 0.5021, + "step": 62785 + }, + { + "epoch": 1.61, + "learning_rate": 9.307133992284962e-07, + "loss": 0.5332, + "step": 62786 + }, + { + "epoch": 1.61, + "learning_rate": 9.306857952988798e-07, + "loss": 0.5291, + "step": 62787 + }, + { + "epoch": 1.61, + "learning_rate": 9.306581914223339e-07, + "loss": 0.7285, + "step": 62788 + }, + { + "epoch": 1.61, + "learning_rate": 9.306305875988796e-07, + "loss": 0.7666, + "step": 62789 + }, + { + "epoch": 1.61, + "learning_rate": 9.306029838285387e-07, + "loss": 0.5466, + "step": 62790 + }, + { + "epoch": 1.61, + "learning_rate": 9.305753801113316e-07, + "loss": 0.6294, + "step": 62791 + }, + { + "epoch": 1.61, + "learning_rate": 9.305477764472798e-07, + "loss": 0.7861, + "step": 62792 + }, + { + "epoch": 1.61, + "learning_rate": 9.305201728364042e-07, + "loss": 0.5547, + "step": 62793 + }, + { + "epoch": 1.61, + "learning_rate": 9.304925692787264e-07, + "loss": 0.4888, + "step": 62794 + }, + { + "epoch": 1.61, + "learning_rate": 9.304649657742669e-07, + "loss": 0.7021, + "step": 62795 + }, + { + "epoch": 1.61, + "learning_rate": 9.304373623230476e-07, + "loss": 0.5435, + "step": 62796 + }, + { + "epoch": 1.61, + "learning_rate": 9.304097589250892e-07, + "loss": 0.7344, + "step": 62797 + }, + { + "epoch": 1.61, + "learning_rate": 9.303821555804126e-07, + "loss": 0.8164, + "step": 62798 + }, + { + "epoch": 1.61, + "learning_rate": 9.303545522890393e-07, + "loss": 0.3901, + "step": 62799 + }, + { + "epoch": 1.61, + "learning_rate": 9.303269490509902e-07, + "loss": 0.6064, + "step": 62800 + }, + { + "epoch": 1.61, + "learning_rate": 9.302993458662867e-07, + "loss": 0.3881, + "step": 62801 + }, + { + "epoch": 1.61, + "learning_rate": 9.302717427349498e-07, + "loss": 0.5884, + "step": 62802 + }, + { + "epoch": 1.61, + "learning_rate": 9.302441396570003e-07, + "loss": 0.6885, + "step": 62803 + }, + { + "epoch": 1.61, + "learning_rate": 9.3021653663246e-07, + "loss": 0.7324, + "step": 62804 + }, + { + "epoch": 1.61, + "learning_rate": 9.301889336613494e-07, + "loss": 0.665, + "step": 62805 + }, + { + "epoch": 1.61, + "learning_rate": 9.301613307436902e-07, + "loss": 0.8252, + "step": 62806 + }, + { + "epoch": 1.61, + "learning_rate": 9.301337278795034e-07, + "loss": 0.5444, + "step": 62807 + }, + { + "epoch": 1.61, + "learning_rate": 9.301061250688095e-07, + "loss": 0.6904, + "step": 62808 + }, + { + "epoch": 1.61, + "learning_rate": 9.300785223116305e-07, + "loss": 0.6807, + "step": 62809 + }, + { + "epoch": 1.61, + "learning_rate": 9.30050919607987e-07, + "loss": 0.6445, + "step": 62810 + }, + { + "epoch": 1.61, + "learning_rate": 9.300233169579003e-07, + "loss": 0.5439, + "step": 62811 + }, + { + "epoch": 1.61, + "learning_rate": 9.299957143613915e-07, + "loss": 0.7393, + "step": 62812 + }, + { + "epoch": 1.61, + "learning_rate": 9.299681118184819e-07, + "loss": 0.3955, + "step": 62813 + }, + { + "epoch": 1.61, + "learning_rate": 9.299405093291922e-07, + "loss": 0.6914, + "step": 62814 + }, + { + "epoch": 1.61, + "learning_rate": 9.299129068935442e-07, + "loss": 0.6841, + "step": 62815 + }, + { + "epoch": 1.61, + "learning_rate": 9.298853045115584e-07, + "loss": 0.6318, + "step": 62816 + }, + { + "epoch": 1.61, + "learning_rate": 9.298577021832565e-07, + "loss": 0.7598, + "step": 62817 + }, + { + "epoch": 1.61, + "learning_rate": 9.298300999086593e-07, + "loss": 0.7402, + "step": 62818 + }, + { + "epoch": 1.61, + "learning_rate": 9.298024976877878e-07, + "loss": 0.6787, + "step": 62819 + }, + { + "epoch": 1.61, + "learning_rate": 9.297748955206633e-07, + "loss": 0.6504, + "step": 62820 + }, + { + "epoch": 1.61, + "learning_rate": 9.297472934073069e-07, + "loss": 0.5303, + "step": 62821 + }, + { + "epoch": 1.61, + "learning_rate": 9.297196913477397e-07, + "loss": 0.6973, + "step": 62822 + }, + { + "epoch": 1.61, + "learning_rate": 9.296920893419831e-07, + "loss": 0.6787, + "step": 62823 + }, + { + "epoch": 1.61, + "learning_rate": 9.296644873900577e-07, + "loss": 0.5786, + "step": 62824 + }, + { + "epoch": 1.61, + "learning_rate": 9.296368854919854e-07, + "loss": 0.6553, + "step": 62825 + }, + { + "epoch": 1.61, + "learning_rate": 9.296092836477865e-07, + "loss": 0.5815, + "step": 62826 + }, + { + "epoch": 1.61, + "learning_rate": 9.295816818574831e-07, + "loss": 0.606, + "step": 62827 + }, + { + "epoch": 1.61, + "learning_rate": 9.295540801210955e-07, + "loss": 0.6377, + "step": 62828 + }, + { + "epoch": 1.61, + "learning_rate": 9.295264784386449e-07, + "loss": 0.6152, + "step": 62829 + }, + { + "epoch": 1.61, + "learning_rate": 9.294988768101528e-07, + "loss": 0.7744, + "step": 62830 + }, + { + "epoch": 1.61, + "learning_rate": 9.2947127523564e-07, + "loss": 0.5483, + "step": 62831 + }, + { + "epoch": 1.61, + "learning_rate": 9.294436737151279e-07, + "loss": 0.6763, + "step": 62832 + }, + { + "epoch": 1.61, + "learning_rate": 9.294160722486375e-07, + "loss": 0.7373, + "step": 62833 + }, + { + "epoch": 1.61, + "learning_rate": 9.293884708361901e-07, + "loss": 0.615, + "step": 62834 + }, + { + "epoch": 1.61, + "learning_rate": 9.293608694778065e-07, + "loss": 0.7974, + "step": 62835 + }, + { + "epoch": 1.61, + "learning_rate": 9.293332681735083e-07, + "loss": 0.604, + "step": 62836 + }, + { + "epoch": 1.61, + "learning_rate": 9.293056669233164e-07, + "loss": 0.6279, + "step": 62837 + }, + { + "epoch": 1.61, + "learning_rate": 9.292780657272518e-07, + "loss": 0.6533, + "step": 62838 + }, + { + "epoch": 1.61, + "learning_rate": 9.292504645853355e-07, + "loss": 0.6855, + "step": 62839 + }, + { + "epoch": 1.61, + "learning_rate": 9.292228634975891e-07, + "loss": 0.5459, + "step": 62840 + }, + { + "epoch": 1.61, + "learning_rate": 9.291952624640333e-07, + "loss": 0.4248, + "step": 62841 + }, + { + "epoch": 1.61, + "learning_rate": 9.291676614846897e-07, + "loss": 0.5444, + "step": 62842 + }, + { + "epoch": 1.61, + "learning_rate": 9.291400605595788e-07, + "loss": 0.6719, + "step": 62843 + }, + { + "epoch": 1.61, + "learning_rate": 9.291124596887224e-07, + "loss": 0.6963, + "step": 62844 + }, + { + "epoch": 1.61, + "learning_rate": 9.290848588721412e-07, + "loss": 0.6562, + "step": 62845 + }, + { + "epoch": 1.61, + "learning_rate": 9.290572581098565e-07, + "loss": 0.5859, + "step": 62846 + }, + { + "epoch": 1.61, + "learning_rate": 9.290296574018896e-07, + "loss": 0.6064, + "step": 62847 + }, + { + "epoch": 1.61, + "learning_rate": 9.290020567482611e-07, + "loss": 0.5522, + "step": 62848 + }, + { + "epoch": 1.61, + "learning_rate": 9.289744561489927e-07, + "loss": 0.6885, + "step": 62849 + }, + { + "epoch": 1.61, + "learning_rate": 9.289468556041051e-07, + "loss": 0.5974, + "step": 62850 + }, + { + "epoch": 1.61, + "learning_rate": 9.289192551136198e-07, + "loss": 0.8018, + "step": 62851 + }, + { + "epoch": 1.61, + "learning_rate": 9.288916546775576e-07, + "loss": 0.5747, + "step": 62852 + }, + { + "epoch": 1.61, + "learning_rate": 9.288640542959398e-07, + "loss": 0.7441, + "step": 62853 + }, + { + "epoch": 1.61, + "learning_rate": 9.288364539687875e-07, + "loss": 0.5137, + "step": 62854 + }, + { + "epoch": 1.61, + "learning_rate": 9.288088536961221e-07, + "loss": 0.8545, + "step": 62855 + }, + { + "epoch": 1.61, + "learning_rate": 9.287812534779642e-07, + "loss": 0.575, + "step": 62856 + }, + { + "epoch": 1.61, + "learning_rate": 9.287536533143357e-07, + "loss": 0.3889, + "step": 62857 + }, + { + "epoch": 1.61, + "learning_rate": 9.287260532052569e-07, + "loss": 0.6279, + "step": 62858 + }, + { + "epoch": 1.61, + "learning_rate": 9.286984531507493e-07, + "loss": 0.5254, + "step": 62859 + }, + { + "epoch": 1.61, + "learning_rate": 9.286708531508338e-07, + "loss": 0.7559, + "step": 62860 + }, + { + "epoch": 1.61, + "learning_rate": 9.286432532055321e-07, + "loss": 0.3954, + "step": 62861 + }, + { + "epoch": 1.61, + "learning_rate": 9.286156533148647e-07, + "loss": 0.7529, + "step": 62862 + }, + { + "epoch": 1.61, + "learning_rate": 9.285880534788532e-07, + "loss": 0.7227, + "step": 62863 + }, + { + "epoch": 1.61, + "learning_rate": 9.285604536975183e-07, + "loss": 0.7168, + "step": 62864 + }, + { + "epoch": 1.61, + "learning_rate": 9.285328539708817e-07, + "loss": 0.7109, + "step": 62865 + }, + { + "epoch": 1.61, + "learning_rate": 9.285052542989639e-07, + "loss": 0.6973, + "step": 62866 + }, + { + "epoch": 1.61, + "learning_rate": 9.284776546817867e-07, + "loss": 0.6299, + "step": 62867 + }, + { + "epoch": 1.61, + "learning_rate": 9.284500551193708e-07, + "loss": 0.5991, + "step": 62868 + }, + { + "epoch": 1.61, + "learning_rate": 9.284224556117372e-07, + "loss": 0.7197, + "step": 62869 + }, + { + "epoch": 1.61, + "learning_rate": 9.283948561589074e-07, + "loss": 0.7119, + "step": 62870 + }, + { + "epoch": 1.61, + "learning_rate": 9.283672567609021e-07, + "loss": 0.6221, + "step": 62871 + }, + { + "epoch": 1.61, + "learning_rate": 9.283396574177429e-07, + "loss": 0.4966, + "step": 62872 + }, + { + "epoch": 1.61, + "learning_rate": 9.283120581294505e-07, + "loss": 0.7617, + "step": 62873 + }, + { + "epoch": 1.61, + "learning_rate": 9.282844588960466e-07, + "loss": 0.6304, + "step": 62874 + }, + { + "epoch": 1.61, + "learning_rate": 9.28256859717552e-07, + "loss": 0.6621, + "step": 62875 + }, + { + "epoch": 1.61, + "learning_rate": 9.282292605939876e-07, + "loss": 0.7656, + "step": 62876 + }, + { + "epoch": 1.61, + "learning_rate": 9.28201661525375e-07, + "loss": 0.6113, + "step": 62877 + }, + { + "epoch": 1.61, + "learning_rate": 9.281740625117351e-07, + "loss": 0.4568, + "step": 62878 + }, + { + "epoch": 1.61, + "learning_rate": 9.281464635530886e-07, + "loss": 0.7588, + "step": 62879 + }, + { + "epoch": 1.61, + "learning_rate": 9.281188646494574e-07, + "loss": 0.521, + "step": 62880 + }, + { + "epoch": 1.61, + "learning_rate": 9.280912658008621e-07, + "loss": 0.6758, + "step": 62881 + }, + { + "epoch": 1.61, + "learning_rate": 9.280636670073241e-07, + "loss": 0.6353, + "step": 62882 + }, + { + "epoch": 1.61, + "learning_rate": 9.280360682688643e-07, + "loss": 0.7617, + "step": 62883 + }, + { + "epoch": 1.61, + "learning_rate": 9.280084695855042e-07, + "loss": 0.573, + "step": 62884 + }, + { + "epoch": 1.61, + "learning_rate": 9.279808709572644e-07, + "loss": 0.6782, + "step": 62885 + }, + { + "epoch": 1.61, + "learning_rate": 9.279532723841667e-07, + "loss": 0.6132, + "step": 62886 + }, + { + "epoch": 1.61, + "learning_rate": 9.27925673866232e-07, + "loss": 0.8027, + "step": 62887 + }, + { + "epoch": 1.61, + "learning_rate": 9.278980754034807e-07, + "loss": 0.4673, + "step": 62888 + }, + { + "epoch": 1.61, + "learning_rate": 9.27870476995935e-07, + "loss": 0.6514, + "step": 62889 + }, + { + "epoch": 1.61, + "learning_rate": 9.278428786436152e-07, + "loss": 0.5732, + "step": 62890 + }, + { + "epoch": 1.61, + "learning_rate": 9.278152803465431e-07, + "loss": 0.6963, + "step": 62891 + }, + { + "epoch": 1.61, + "learning_rate": 9.277876821047395e-07, + "loss": 0.7188, + "step": 62892 + }, + { + "epoch": 1.61, + "learning_rate": 9.277600839182252e-07, + "loss": 0.4927, + "step": 62893 + }, + { + "epoch": 1.61, + "learning_rate": 9.277324857870222e-07, + "loss": 0.7822, + "step": 62894 + }, + { + "epoch": 1.61, + "learning_rate": 9.277048877111506e-07, + "loss": 0.626, + "step": 62895 + }, + { + "epoch": 1.61, + "learning_rate": 9.276772896906325e-07, + "loss": 0.5361, + "step": 62896 + }, + { + "epoch": 1.61, + "learning_rate": 9.276496917254886e-07, + "loss": 0.8057, + "step": 62897 + }, + { + "epoch": 1.61, + "learning_rate": 9.276220938157395e-07, + "loss": 0.6309, + "step": 62898 + }, + { + "epoch": 1.61, + "learning_rate": 9.275944959614072e-07, + "loss": 0.2593, + "step": 62899 + }, + { + "epoch": 1.61, + "learning_rate": 9.275668981625122e-07, + "loss": 0.5708, + "step": 62900 + }, + { + "epoch": 1.61, + "learning_rate": 9.275393004190763e-07, + "loss": 0.6748, + "step": 62901 + }, + { + "epoch": 1.61, + "learning_rate": 9.275117027311198e-07, + "loss": 0.5981, + "step": 62902 + }, + { + "epoch": 1.61, + "learning_rate": 9.274841050986645e-07, + "loss": 0.6196, + "step": 62903 + }, + { + "epoch": 1.61, + "learning_rate": 9.274565075217311e-07, + "loss": 0.7085, + "step": 62904 + }, + { + "epoch": 1.61, + "learning_rate": 9.274289100003411e-07, + "loss": 0.8379, + "step": 62905 + }, + { + "epoch": 1.61, + "learning_rate": 9.274013125345153e-07, + "loss": 0.5479, + "step": 62906 + }, + { + "epoch": 1.61, + "learning_rate": 9.273737151242754e-07, + "loss": 0.5952, + "step": 62907 + }, + { + "epoch": 1.61, + "learning_rate": 9.273461177696418e-07, + "loss": 0.6133, + "step": 62908 + }, + { + "epoch": 1.61, + "learning_rate": 9.27318520470636e-07, + "loss": 0.5339, + "step": 62909 + }, + { + "epoch": 1.61, + "learning_rate": 9.272909232272787e-07, + "loss": 0.5056, + "step": 62910 + }, + { + "epoch": 1.61, + "learning_rate": 9.272633260395919e-07, + "loss": 0.8418, + "step": 62911 + }, + { + "epoch": 1.61, + "learning_rate": 9.272357289075958e-07, + "loss": 0.6807, + "step": 62912 + }, + { + "epoch": 1.61, + "learning_rate": 9.272081318313123e-07, + "loss": 0.624, + "step": 62913 + }, + { + "epoch": 1.61, + "learning_rate": 9.271805348107618e-07, + "loss": 0.686, + "step": 62914 + }, + { + "epoch": 1.61, + "learning_rate": 9.271529378459662e-07, + "loss": 0.7163, + "step": 62915 + }, + { + "epoch": 1.61, + "learning_rate": 9.271253409369459e-07, + "loss": 0.6626, + "step": 62916 + }, + { + "epoch": 1.61, + "learning_rate": 9.27097744083723e-07, + "loss": 0.5771, + "step": 62917 + }, + { + "epoch": 1.61, + "learning_rate": 9.270701472863176e-07, + "loss": 0.7139, + "step": 62918 + }, + { + "epoch": 1.61, + "learning_rate": 9.270425505447511e-07, + "loss": 0.6719, + "step": 62919 + }, + { + "epoch": 1.61, + "learning_rate": 9.270149538590449e-07, + "loss": 0.6992, + "step": 62920 + }, + { + "epoch": 1.61, + "learning_rate": 9.2698735722922e-07, + "loss": 0.6465, + "step": 62921 + }, + { + "epoch": 1.61, + "learning_rate": 9.269597606552974e-07, + "loss": 0.5657, + "step": 62922 + }, + { + "epoch": 1.61, + "learning_rate": 9.269321641372985e-07, + "loss": 0.7202, + "step": 62923 + }, + { + "epoch": 1.61, + "learning_rate": 9.269045676752443e-07, + "loss": 0.5654, + "step": 62924 + }, + { + "epoch": 1.61, + "learning_rate": 9.268769712691557e-07, + "loss": 0.7783, + "step": 62925 + }, + { + "epoch": 1.61, + "learning_rate": 9.268493749190543e-07, + "loss": 0.7412, + "step": 62926 + }, + { + "epoch": 1.61, + "learning_rate": 9.268217786249611e-07, + "loss": 0.6416, + "step": 62927 + }, + { + "epoch": 1.61, + "learning_rate": 9.267941823868969e-07, + "loss": 0.5996, + "step": 62928 + }, + { + "epoch": 1.61, + "learning_rate": 9.267665862048829e-07, + "loss": 0.7783, + "step": 62929 + }, + { + "epoch": 1.61, + "learning_rate": 9.267389900789405e-07, + "loss": 0.6748, + "step": 62930 + }, + { + "epoch": 1.61, + "learning_rate": 9.267113940090905e-07, + "loss": 0.7588, + "step": 62931 + }, + { + "epoch": 1.61, + "learning_rate": 9.266837979953545e-07, + "loss": 0.6836, + "step": 62932 + }, + { + "epoch": 1.61, + "learning_rate": 9.26656202037753e-07, + "loss": 0.5437, + "step": 62933 + }, + { + "epoch": 1.61, + "learning_rate": 9.266286061363078e-07, + "loss": 0.5068, + "step": 62934 + }, + { + "epoch": 1.61, + "learning_rate": 9.266010102910394e-07, + "loss": 0.4402, + "step": 62935 + }, + { + "epoch": 1.61, + "learning_rate": 9.265734145019695e-07, + "loss": 0.5616, + "step": 62936 + }, + { + "epoch": 1.61, + "learning_rate": 9.265458187691191e-07, + "loss": 0.5713, + "step": 62937 + }, + { + "epoch": 1.61, + "learning_rate": 9.265182230925088e-07, + "loss": 0.7217, + "step": 62938 + }, + { + "epoch": 1.61, + "learning_rate": 9.264906274721603e-07, + "loss": 0.8945, + "step": 62939 + }, + { + "epoch": 1.61, + "learning_rate": 9.264630319080945e-07, + "loss": 0.6807, + "step": 62940 + }, + { + "epoch": 1.61, + "learning_rate": 9.264354364003326e-07, + "loss": 0.668, + "step": 62941 + }, + { + "epoch": 1.61, + "learning_rate": 9.264078409488955e-07, + "loss": 0.5361, + "step": 62942 + }, + { + "epoch": 1.61, + "learning_rate": 9.263802455538049e-07, + "loss": 0.7012, + "step": 62943 + }, + { + "epoch": 1.61, + "learning_rate": 9.263526502150813e-07, + "loss": 0.7764, + "step": 62944 + }, + { + "epoch": 1.61, + "learning_rate": 9.263250549327462e-07, + "loss": 0.5166, + "step": 62945 + }, + { + "epoch": 1.61, + "learning_rate": 9.26297459706821e-07, + "loss": 0.6367, + "step": 62946 + }, + { + "epoch": 1.61, + "learning_rate": 9.26269864537326e-07, + "loss": 0.6367, + "step": 62947 + }, + { + "epoch": 1.61, + "learning_rate": 9.262422694242827e-07, + "loss": 0.7236, + "step": 62948 + }, + { + "epoch": 1.61, + "learning_rate": 9.262146743677125e-07, + "loss": 0.75, + "step": 62949 + }, + { + "epoch": 1.61, + "learning_rate": 9.261870793676361e-07, + "loss": 0.6094, + "step": 62950 + }, + { + "epoch": 1.61, + "learning_rate": 9.261594844240751e-07, + "loss": 0.835, + "step": 62951 + }, + { + "epoch": 1.61, + "learning_rate": 9.261318895370501e-07, + "loss": 0.6719, + "step": 62952 + }, + { + "epoch": 1.61, + "learning_rate": 9.261042947065828e-07, + "loss": 0.4995, + "step": 62953 + }, + { + "epoch": 1.61, + "learning_rate": 9.260766999326939e-07, + "loss": 0.7158, + "step": 62954 + }, + { + "epoch": 1.61, + "learning_rate": 9.260491052154048e-07, + "loss": 0.6289, + "step": 62955 + }, + { + "epoch": 1.61, + "learning_rate": 9.260215105547367e-07, + "loss": 0.4543, + "step": 62956 + }, + { + "epoch": 1.61, + "learning_rate": 9.259939159507101e-07, + "loss": 0.359, + "step": 62957 + }, + { + "epoch": 1.61, + "learning_rate": 9.259663214033468e-07, + "loss": 0.5796, + "step": 62958 + }, + { + "epoch": 1.61, + "learning_rate": 9.259387269126675e-07, + "loss": 0.4028, + "step": 62959 + }, + { + "epoch": 1.61, + "learning_rate": 9.259111324786937e-07, + "loss": 0.6938, + "step": 62960 + }, + { + "epoch": 1.61, + "learning_rate": 9.258835381014461e-07, + "loss": 0.6904, + "step": 62961 + }, + { + "epoch": 1.61, + "learning_rate": 9.258559437809462e-07, + "loss": 0.6646, + "step": 62962 + }, + { + "epoch": 1.61, + "learning_rate": 9.258283495172149e-07, + "loss": 0.7744, + "step": 62963 + }, + { + "epoch": 1.61, + "learning_rate": 9.258007553102735e-07, + "loss": 0.668, + "step": 62964 + }, + { + "epoch": 1.61, + "learning_rate": 9.257731611601433e-07, + "loss": 0.6172, + "step": 62965 + }, + { + "epoch": 1.61, + "learning_rate": 9.257455670668453e-07, + "loss": 0.6572, + "step": 62966 + }, + { + "epoch": 1.61, + "learning_rate": 9.257179730303999e-07, + "loss": 0.748, + "step": 62967 + }, + { + "epoch": 1.61, + "learning_rate": 9.256903790508292e-07, + "loss": 0.79, + "step": 62968 + }, + { + "epoch": 1.61, + "learning_rate": 9.256627851281537e-07, + "loss": 0.635, + "step": 62969 + }, + { + "epoch": 1.61, + "learning_rate": 9.256351912623951e-07, + "loss": 0.6279, + "step": 62970 + }, + { + "epoch": 1.61, + "learning_rate": 9.256075974535739e-07, + "loss": 0.7051, + "step": 62971 + }, + { + "epoch": 1.61, + "learning_rate": 9.255800037017117e-07, + "loss": 0.4048, + "step": 62972 + }, + { + "epoch": 1.61, + "learning_rate": 9.255524100068293e-07, + "loss": 0.7134, + "step": 62973 + }, + { + "epoch": 1.61, + "learning_rate": 9.255248163689483e-07, + "loss": 0.7559, + "step": 62974 + }, + { + "epoch": 1.61, + "learning_rate": 9.254972227880893e-07, + "loss": 0.6155, + "step": 62975 + }, + { + "epoch": 1.61, + "learning_rate": 9.25469629264274e-07, + "loss": 0.6934, + "step": 62976 + }, + { + "epoch": 1.61, + "learning_rate": 9.25442035797523e-07, + "loss": 0.5825, + "step": 62977 + }, + { + "epoch": 1.61, + "learning_rate": 9.254144423878574e-07, + "loss": 0.5576, + "step": 62978 + }, + { + "epoch": 1.61, + "learning_rate": 9.253868490352987e-07, + "loss": 0.6973, + "step": 62979 + }, + { + "epoch": 1.61, + "learning_rate": 9.253592557398677e-07, + "loss": 0.7832, + "step": 62980 + }, + { + "epoch": 1.61, + "learning_rate": 9.25331662501586e-07, + "loss": 0.481, + "step": 62981 + }, + { + "epoch": 1.61, + "learning_rate": 9.253040693204741e-07, + "loss": 0.6987, + "step": 62982 + }, + { + "epoch": 1.61, + "learning_rate": 9.252764761965534e-07, + "loss": 0.8145, + "step": 62983 + }, + { + "epoch": 1.61, + "learning_rate": 9.252488831298454e-07, + "loss": 0.5916, + "step": 62984 + }, + { + "epoch": 1.61, + "learning_rate": 9.252212901203706e-07, + "loss": 0.6489, + "step": 62985 + }, + { + "epoch": 1.61, + "learning_rate": 9.251936971681508e-07, + "loss": 0.584, + "step": 62986 + }, + { + "epoch": 1.61, + "learning_rate": 9.251661042732065e-07, + "loss": 0.6641, + "step": 62987 + }, + { + "epoch": 1.61, + "learning_rate": 9.251385114355589e-07, + "loss": 0.564, + "step": 62988 + }, + { + "epoch": 1.61, + "learning_rate": 9.251109186552295e-07, + "loss": 0.6934, + "step": 62989 + }, + { + "epoch": 1.61, + "learning_rate": 9.250833259322391e-07, + "loss": 0.9033, + "step": 62990 + }, + { + "epoch": 1.61, + "learning_rate": 9.250557332666091e-07, + "loss": 0.6904, + "step": 62991 + }, + { + "epoch": 1.61, + "learning_rate": 9.250281406583602e-07, + "loss": 0.6416, + "step": 62992 + }, + { + "epoch": 1.61, + "learning_rate": 9.250005481075141e-07, + "loss": 0.7646, + "step": 62993 + }, + { + "epoch": 1.61, + "learning_rate": 9.249729556140915e-07, + "loss": 0.7515, + "step": 62994 + }, + { + "epoch": 1.61, + "learning_rate": 9.249453631781138e-07, + "loss": 0.6416, + "step": 62995 + }, + { + "epoch": 1.61, + "learning_rate": 9.249177707996021e-07, + "loss": 0.6499, + "step": 62996 + }, + { + "epoch": 1.61, + "learning_rate": 9.248901784785771e-07, + "loss": 0.5967, + "step": 62997 + }, + { + "epoch": 1.61, + "learning_rate": 9.248625862150604e-07, + "loss": 0.7407, + "step": 62998 + }, + { + "epoch": 1.61, + "learning_rate": 9.248349940090727e-07, + "loss": 0.6904, + "step": 62999 + }, + { + "epoch": 1.61, + "learning_rate": 9.248074018606356e-07, + "loss": 0.7148, + "step": 63000 + }, + { + "epoch": 1.61, + "learning_rate": 9.247798097697702e-07, + "loss": 0.606, + "step": 63001 + }, + { + "epoch": 1.61, + "learning_rate": 9.247522177364971e-07, + "loss": 0.6689, + "step": 63002 + }, + { + "epoch": 1.61, + "learning_rate": 9.24724625760838e-07, + "loss": 0.6719, + "step": 63003 + }, + { + "epoch": 1.61, + "learning_rate": 9.246970338428135e-07, + "loss": 0.6641, + "step": 63004 + }, + { + "epoch": 1.61, + "learning_rate": 9.246694419824454e-07, + "loss": 0.666, + "step": 63005 + }, + { + "epoch": 1.61, + "learning_rate": 9.246418501797545e-07, + "loss": 0.5254, + "step": 63006 + }, + { + "epoch": 1.61, + "learning_rate": 9.246142584347615e-07, + "loss": 0.583, + "step": 63007 + }, + { + "epoch": 1.61, + "learning_rate": 9.245866667474881e-07, + "loss": 0.5634, + "step": 63008 + }, + { + "epoch": 1.61, + "learning_rate": 9.24559075117955e-07, + "loss": 0.6753, + "step": 63009 + }, + { + "epoch": 1.61, + "learning_rate": 9.245314835461839e-07, + "loss": 0.6978, + "step": 63010 + }, + { + "epoch": 1.62, + "learning_rate": 9.245038920321951e-07, + "loss": 0.7334, + "step": 63011 + }, + { + "epoch": 1.62, + "learning_rate": 9.244763005760106e-07, + "loss": 0.6738, + "step": 63012 + }, + { + "epoch": 1.62, + "learning_rate": 9.244487091776508e-07, + "loss": 0.7285, + "step": 63013 + }, + { + "epoch": 1.62, + "learning_rate": 9.244211178371375e-07, + "loss": 0.6084, + "step": 63014 + }, + { + "epoch": 1.62, + "learning_rate": 9.243935265544911e-07, + "loss": 0.7275, + "step": 63015 + }, + { + "epoch": 1.62, + "learning_rate": 9.243659353297336e-07, + "loss": 0.6318, + "step": 63016 + }, + { + "epoch": 1.62, + "learning_rate": 9.243383441628854e-07, + "loss": 0.7236, + "step": 63017 + }, + { + "epoch": 1.62, + "learning_rate": 9.24310753053968e-07, + "loss": 0.6582, + "step": 63018 + }, + { + "epoch": 1.62, + "learning_rate": 9.24283162003002e-07, + "loss": 0.7441, + "step": 63019 + }, + { + "epoch": 1.62, + "learning_rate": 9.24255571010009e-07, + "loss": 0.5457, + "step": 63020 + }, + { + "epoch": 1.62, + "learning_rate": 9.242279800750101e-07, + "loss": 0.79, + "step": 63021 + }, + { + "epoch": 1.62, + "learning_rate": 9.242003891980264e-07, + "loss": 0.7207, + "step": 63022 + }, + { + "epoch": 1.62, + "learning_rate": 9.241727983790788e-07, + "loss": 0.5303, + "step": 63023 + }, + { + "epoch": 1.62, + "learning_rate": 9.241452076181888e-07, + "loss": 0.5952, + "step": 63024 + }, + { + "epoch": 1.62, + "learning_rate": 9.241176169153772e-07, + "loss": 0.6094, + "step": 63025 + }, + { + "epoch": 1.62, + "learning_rate": 9.240900262706655e-07, + "loss": 0.6138, + "step": 63026 + }, + { + "epoch": 1.62, + "learning_rate": 9.240624356840745e-07, + "loss": 0.6631, + "step": 63027 + }, + { + "epoch": 1.62, + "learning_rate": 9.240348451556251e-07, + "loss": 0.7373, + "step": 63028 + }, + { + "epoch": 1.62, + "learning_rate": 9.24007254685339e-07, + "loss": 0.6211, + "step": 63029 + }, + { + "epoch": 1.62, + "learning_rate": 9.239796642732368e-07, + "loss": 0.7432, + "step": 63030 + }, + { + "epoch": 1.62, + "learning_rate": 9.239520739193402e-07, + "loss": 0.8301, + "step": 63031 + }, + { + "epoch": 1.62, + "learning_rate": 9.239244836236697e-07, + "loss": 0.8047, + "step": 63032 + }, + { + "epoch": 1.62, + "learning_rate": 9.238968933862468e-07, + "loss": 0.6309, + "step": 63033 + }, + { + "epoch": 1.62, + "learning_rate": 9.238693032070926e-07, + "loss": 0.6626, + "step": 63034 + }, + { + "epoch": 1.62, + "learning_rate": 9.238417130862282e-07, + "loss": 0.5801, + "step": 63035 + }, + { + "epoch": 1.62, + "learning_rate": 9.23814123023675e-07, + "loss": 0.5128, + "step": 63036 + }, + { + "epoch": 1.62, + "learning_rate": 9.237865330194536e-07, + "loss": 0.6538, + "step": 63037 + }, + { + "epoch": 1.62, + "learning_rate": 9.237589430735851e-07, + "loss": 0.6294, + "step": 63038 + }, + { + "epoch": 1.62, + "learning_rate": 9.237313531860911e-07, + "loss": 0.5007, + "step": 63039 + }, + { + "epoch": 1.62, + "learning_rate": 9.237037633569923e-07, + "loss": 0.5439, + "step": 63040 + }, + { + "epoch": 1.62, + "learning_rate": 9.236761735863102e-07, + "loss": 0.5742, + "step": 63041 + }, + { + "epoch": 1.62, + "learning_rate": 9.236485838740656e-07, + "loss": 0.7871, + "step": 63042 + }, + { + "epoch": 1.62, + "learning_rate": 9.2362099422028e-07, + "loss": 0.5112, + "step": 63043 + }, + { + "epoch": 1.62, + "learning_rate": 9.235934046249739e-07, + "loss": 0.3789, + "step": 63044 + }, + { + "epoch": 1.62, + "learning_rate": 9.235658150881692e-07, + "loss": 0.4921, + "step": 63045 + }, + { + "epoch": 1.62, + "learning_rate": 9.235382256098867e-07, + "loss": 0.5559, + "step": 63046 + }, + { + "epoch": 1.62, + "learning_rate": 9.235106361901472e-07, + "loss": 0.5046, + "step": 63047 + }, + { + "epoch": 1.62, + "learning_rate": 9.234830468289722e-07, + "loss": 0.7236, + "step": 63048 + }, + { + "epoch": 1.62, + "learning_rate": 9.234554575263825e-07, + "loss": 0.6548, + "step": 63049 + }, + { + "epoch": 1.62, + "learning_rate": 9.234278682823997e-07, + "loss": 0.5308, + "step": 63050 + }, + { + "epoch": 1.62, + "learning_rate": 9.234002790970444e-07, + "loss": 0.5898, + "step": 63051 + }, + { + "epoch": 1.62, + "learning_rate": 9.233726899703382e-07, + "loss": 0.6582, + "step": 63052 + }, + { + "epoch": 1.62, + "learning_rate": 9.233451009023019e-07, + "loss": 0.8799, + "step": 63053 + }, + { + "epoch": 1.62, + "learning_rate": 9.23317511892957e-07, + "loss": 0.6084, + "step": 63054 + }, + { + "epoch": 1.62, + "learning_rate": 9.232899229423241e-07, + "loss": 0.6768, + "step": 63055 + }, + { + "epoch": 1.62, + "learning_rate": 9.23262334050425e-07, + "loss": 0.7334, + "step": 63056 + }, + { + "epoch": 1.62, + "learning_rate": 9.232347452172799e-07, + "loss": 0.7393, + "step": 63057 + }, + { + "epoch": 1.62, + "learning_rate": 9.232071564429106e-07, + "loss": 0.6758, + "step": 63058 + }, + { + "epoch": 1.62, + "learning_rate": 9.231795677273379e-07, + "loss": 0.5254, + "step": 63059 + }, + { + "epoch": 1.62, + "learning_rate": 9.231519790705831e-07, + "loss": 0.6738, + "step": 63060 + }, + { + "epoch": 1.62, + "learning_rate": 9.231243904726673e-07, + "loss": 0.7305, + "step": 63061 + }, + { + "epoch": 1.62, + "learning_rate": 9.230968019336118e-07, + "loss": 0.7109, + "step": 63062 + }, + { + "epoch": 1.62, + "learning_rate": 9.230692134534372e-07, + "loss": 0.3699, + "step": 63063 + }, + { + "epoch": 1.62, + "learning_rate": 9.230416250321653e-07, + "loss": 0.5045, + "step": 63064 + }, + { + "epoch": 1.62, + "learning_rate": 9.230140366698167e-07, + "loss": 0.4692, + "step": 63065 + }, + { + "epoch": 1.62, + "learning_rate": 9.229864483664132e-07, + "loss": 0.4692, + "step": 63066 + }, + { + "epoch": 1.62, + "learning_rate": 9.22958860121975e-07, + "loss": 0.6001, + "step": 63067 + }, + { + "epoch": 1.62, + "learning_rate": 9.229312719365235e-07, + "loss": 0.7363, + "step": 63068 + }, + { + "epoch": 1.62, + "learning_rate": 9.229036838100803e-07, + "loss": 0.479, + "step": 63069 + }, + { + "epoch": 1.62, + "learning_rate": 9.22876095742666e-07, + "loss": 0.7617, + "step": 63070 + }, + { + "epoch": 1.62, + "learning_rate": 9.22848507734302e-07, + "loss": 0.6401, + "step": 63071 + }, + { + "epoch": 1.62, + "learning_rate": 9.228209197850095e-07, + "loss": 0.7627, + "step": 63072 + }, + { + "epoch": 1.62, + "learning_rate": 9.227933318948092e-07, + "loss": 0.6807, + "step": 63073 + }, + { + "epoch": 1.62, + "learning_rate": 9.227657440637226e-07, + "loss": 0.6597, + "step": 63074 + }, + { + "epoch": 1.62, + "learning_rate": 9.227381562917707e-07, + "loss": 0.6689, + "step": 63075 + }, + { + "epoch": 1.62, + "learning_rate": 9.22710568578975e-07, + "loss": 0.6309, + "step": 63076 + }, + { + "epoch": 1.62, + "learning_rate": 9.22682980925356e-07, + "loss": 0.8418, + "step": 63077 + }, + { + "epoch": 1.62, + "learning_rate": 9.226553933309349e-07, + "loss": 0.5718, + "step": 63078 + }, + { + "epoch": 1.62, + "learning_rate": 9.226278057957333e-07, + "loss": 0.6865, + "step": 63079 + }, + { + "epoch": 1.62, + "learning_rate": 9.226002183197717e-07, + "loss": 0.437, + "step": 63080 + }, + { + "epoch": 1.62, + "learning_rate": 9.225726309030718e-07, + "loss": 0.6191, + "step": 63081 + }, + { + "epoch": 1.62, + "learning_rate": 9.225450435456543e-07, + "loss": 0.7705, + "step": 63082 + }, + { + "epoch": 1.62, + "learning_rate": 9.225174562475406e-07, + "loss": 0.4085, + "step": 63083 + }, + { + "epoch": 1.62, + "learning_rate": 9.224898690087516e-07, + "loss": 0.6333, + "step": 63084 + }, + { + "epoch": 1.62, + "learning_rate": 9.224622818293087e-07, + "loss": 0.6455, + "step": 63085 + }, + { + "epoch": 1.62, + "learning_rate": 9.224346947092332e-07, + "loss": 0.6572, + "step": 63086 + }, + { + "epoch": 1.62, + "learning_rate": 9.224071076485454e-07, + "loss": 0.6108, + "step": 63087 + }, + { + "epoch": 1.62, + "learning_rate": 9.223795206472671e-07, + "loss": 0.7158, + "step": 63088 + }, + { + "epoch": 1.62, + "learning_rate": 9.223519337054191e-07, + "loss": 0.4478, + "step": 63089 + }, + { + "epoch": 1.62, + "learning_rate": 9.223243468230227e-07, + "loss": 0.4315, + "step": 63090 + }, + { + "epoch": 1.62, + "learning_rate": 9.22296760000099e-07, + "loss": 0.6646, + "step": 63091 + }, + { + "epoch": 1.62, + "learning_rate": 9.222691732366691e-07, + "loss": 0.5991, + "step": 63092 + }, + { + "epoch": 1.62, + "learning_rate": 9.222415865327542e-07, + "loss": 0.6348, + "step": 63093 + }, + { + "epoch": 1.62, + "learning_rate": 9.222139998883751e-07, + "loss": 0.5974, + "step": 63094 + }, + { + "epoch": 1.62, + "learning_rate": 9.221864133035534e-07, + "loss": 0.5981, + "step": 63095 + }, + { + "epoch": 1.62, + "learning_rate": 9.221588267783102e-07, + "loss": 0.6865, + "step": 63096 + }, + { + "epoch": 1.62, + "learning_rate": 9.22131240312666e-07, + "loss": 0.6123, + "step": 63097 + }, + { + "epoch": 1.62, + "learning_rate": 9.221036539066425e-07, + "loss": 0.7188, + "step": 63098 + }, + { + "epoch": 1.62, + "learning_rate": 9.220760675602603e-07, + "loss": 0.6738, + "step": 63099 + }, + { + "epoch": 1.62, + "learning_rate": 9.220484812735414e-07, + "loss": 0.5415, + "step": 63100 + }, + { + "epoch": 1.62, + "learning_rate": 9.220208950465059e-07, + "loss": 0.6875, + "step": 63101 + }, + { + "epoch": 1.62, + "learning_rate": 9.219933088791758e-07, + "loss": 0.5979, + "step": 63102 + }, + { + "epoch": 1.62, + "learning_rate": 9.219657227715716e-07, + "loss": 0.5676, + "step": 63103 + }, + { + "epoch": 1.62, + "learning_rate": 9.219381367237148e-07, + "loss": 0.6543, + "step": 63104 + }, + { + "epoch": 1.62, + "learning_rate": 9.219105507356262e-07, + "loss": 0.5234, + "step": 63105 + }, + { + "epoch": 1.62, + "learning_rate": 9.218829648073275e-07, + "loss": 0.3706, + "step": 63106 + }, + { + "epoch": 1.62, + "learning_rate": 9.218553789388394e-07, + "loss": 0.71, + "step": 63107 + }, + { + "epoch": 1.62, + "learning_rate": 9.218277931301827e-07, + "loss": 0.3783, + "step": 63108 + }, + { + "epoch": 1.62, + "learning_rate": 9.218002073813789e-07, + "loss": 0.5596, + "step": 63109 + }, + { + "epoch": 1.62, + "learning_rate": 9.217726216924493e-07, + "loss": 0.6514, + "step": 63110 + }, + { + "epoch": 1.62, + "learning_rate": 9.217450360634145e-07, + "loss": 0.6455, + "step": 63111 + }, + { + "epoch": 1.62, + "learning_rate": 9.217174504942961e-07, + "loss": 0.6115, + "step": 63112 + }, + { + "epoch": 1.62, + "learning_rate": 9.216898649851151e-07, + "loss": 0.7754, + "step": 63113 + }, + { + "epoch": 1.62, + "learning_rate": 9.216622795358925e-07, + "loss": 0.6655, + "step": 63114 + }, + { + "epoch": 1.62, + "learning_rate": 9.216346941466493e-07, + "loss": 0.606, + "step": 63115 + }, + { + "epoch": 1.62, + "learning_rate": 9.216071088174073e-07, + "loss": 0.5518, + "step": 63116 + }, + { + "epoch": 1.62, + "learning_rate": 9.215795235481871e-07, + "loss": 0.6084, + "step": 63117 + }, + { + "epoch": 1.62, + "learning_rate": 9.215519383390093e-07, + "loss": 0.6787, + "step": 63118 + }, + { + "epoch": 1.62, + "learning_rate": 9.215243531898959e-07, + "loss": 0.7266, + "step": 63119 + }, + { + "epoch": 1.62, + "learning_rate": 9.214967681008677e-07, + "loss": 0.7832, + "step": 63120 + }, + { + "epoch": 1.62, + "learning_rate": 9.214691830719457e-07, + "loss": 0.8086, + "step": 63121 + }, + { + "epoch": 1.62, + "learning_rate": 9.214415981031511e-07, + "loss": 0.4722, + "step": 63122 + }, + { + "epoch": 1.62, + "learning_rate": 9.214140131945053e-07, + "loss": 0.6797, + "step": 63123 + }, + { + "epoch": 1.62, + "learning_rate": 9.213864283460288e-07, + "loss": 0.7646, + "step": 63124 + }, + { + "epoch": 1.62, + "learning_rate": 9.213588435577435e-07, + "loss": 0.5674, + "step": 63125 + }, + { + "epoch": 1.62, + "learning_rate": 9.213312588296703e-07, + "loss": 0.8311, + "step": 63126 + }, + { + "epoch": 1.62, + "learning_rate": 9.213036741618298e-07, + "loss": 1.0, + "step": 63127 + }, + { + "epoch": 1.62, + "learning_rate": 9.212760895542434e-07, + "loss": 0.6826, + "step": 63128 + }, + { + "epoch": 1.62, + "learning_rate": 9.212485050069324e-07, + "loss": 0.4392, + "step": 63129 + }, + { + "epoch": 1.62, + "learning_rate": 9.212209205199177e-07, + "loss": 0.6387, + "step": 63130 + }, + { + "epoch": 1.62, + "learning_rate": 9.211933360932206e-07, + "loss": 0.5635, + "step": 63131 + }, + { + "epoch": 1.62, + "learning_rate": 9.21165751726862e-07, + "loss": 0.5898, + "step": 63132 + }, + { + "epoch": 1.62, + "learning_rate": 9.211381674208633e-07, + "loss": 0.6699, + "step": 63133 + }, + { + "epoch": 1.62, + "learning_rate": 9.211105831752453e-07, + "loss": 0.3584, + "step": 63134 + }, + { + "epoch": 1.62, + "learning_rate": 9.210829989900295e-07, + "loss": 0.6211, + "step": 63135 + }, + { + "epoch": 1.62, + "learning_rate": 9.21055414865237e-07, + "loss": 0.585, + "step": 63136 + }, + { + "epoch": 1.62, + "learning_rate": 9.210278308008883e-07, + "loss": 0.6548, + "step": 63137 + }, + { + "epoch": 1.62, + "learning_rate": 9.210002467970053e-07, + "loss": 0.7471, + "step": 63138 + }, + { + "epoch": 1.62, + "learning_rate": 9.209726628536086e-07, + "loss": 0.6396, + "step": 63139 + }, + { + "epoch": 1.62, + "learning_rate": 9.209450789707195e-07, + "loss": 0.6279, + "step": 63140 + }, + { + "epoch": 1.62, + "learning_rate": 9.209174951483591e-07, + "loss": 0.7402, + "step": 63141 + }, + { + "epoch": 1.62, + "learning_rate": 9.208899113865485e-07, + "loss": 0.5732, + "step": 63142 + }, + { + "epoch": 1.62, + "learning_rate": 9.208623276853088e-07, + "loss": 0.6865, + "step": 63143 + }, + { + "epoch": 1.62, + "learning_rate": 9.208347440446615e-07, + "loss": 0.6482, + "step": 63144 + }, + { + "epoch": 1.62, + "learning_rate": 9.208071604646273e-07, + "loss": 0.7695, + "step": 63145 + }, + { + "epoch": 1.62, + "learning_rate": 9.207795769452275e-07, + "loss": 0.5576, + "step": 63146 + }, + { + "epoch": 1.62, + "learning_rate": 9.20751993486483e-07, + "loss": 0.79, + "step": 63147 + }, + { + "epoch": 1.62, + "learning_rate": 9.20724410088415e-07, + "loss": 0.571, + "step": 63148 + }, + { + "epoch": 1.62, + "learning_rate": 9.206968267510446e-07, + "loss": 0.6431, + "step": 63149 + }, + { + "epoch": 1.62, + "learning_rate": 9.206692434743931e-07, + "loss": 0.728, + "step": 63150 + }, + { + "epoch": 1.62, + "learning_rate": 9.206416602584814e-07, + "loss": 0.7646, + "step": 63151 + }, + { + "epoch": 1.62, + "learning_rate": 9.206140771033309e-07, + "loss": 0.6768, + "step": 63152 + }, + { + "epoch": 1.62, + "learning_rate": 9.205864940089623e-07, + "loss": 0.6479, + "step": 63153 + }, + { + "epoch": 1.62, + "learning_rate": 9.205589109753972e-07, + "loss": 0.7578, + "step": 63154 + }, + { + "epoch": 1.62, + "learning_rate": 9.205313280026563e-07, + "loss": 0.6465, + "step": 63155 + }, + { + "epoch": 1.62, + "learning_rate": 9.205037450907613e-07, + "loss": 0.6592, + "step": 63156 + }, + { + "epoch": 1.62, + "learning_rate": 9.204761622397328e-07, + "loss": 0.5596, + "step": 63157 + }, + { + "epoch": 1.62, + "learning_rate": 9.204485794495919e-07, + "loss": 0.6475, + "step": 63158 + }, + { + "epoch": 1.62, + "learning_rate": 9.204209967203599e-07, + "loss": 0.6914, + "step": 63159 + }, + { + "epoch": 1.62, + "learning_rate": 9.203934140520577e-07, + "loss": 0.8281, + "step": 63160 + }, + { + "epoch": 1.62, + "learning_rate": 9.20365831444707e-07, + "loss": 0.4509, + "step": 63161 + }, + { + "epoch": 1.62, + "learning_rate": 9.20338248898328e-07, + "loss": 0.6211, + "step": 63162 + }, + { + "epoch": 1.62, + "learning_rate": 9.203106664129428e-07, + "loss": 0.6787, + "step": 63163 + }, + { + "epoch": 1.62, + "learning_rate": 9.202830839885719e-07, + "loss": 0.7021, + "step": 63164 + }, + { + "epoch": 1.62, + "learning_rate": 9.202555016252365e-07, + "loss": 0.5879, + "step": 63165 + }, + { + "epoch": 1.62, + "learning_rate": 9.20227919322958e-07, + "loss": 0.7456, + "step": 63166 + }, + { + "epoch": 1.62, + "learning_rate": 9.202003370817574e-07, + "loss": 0.543, + "step": 63167 + }, + { + "epoch": 1.62, + "learning_rate": 9.201727549016554e-07, + "loss": 0.5957, + "step": 63168 + }, + { + "epoch": 1.62, + "learning_rate": 9.201451727826735e-07, + "loss": 0.5046, + "step": 63169 + }, + { + "epoch": 1.62, + "learning_rate": 9.201175907248327e-07, + "loss": 0.6199, + "step": 63170 + }, + { + "epoch": 1.62, + "learning_rate": 9.200900087281545e-07, + "loss": 0.5623, + "step": 63171 + }, + { + "epoch": 1.62, + "learning_rate": 9.200624267926593e-07, + "loss": 0.5432, + "step": 63172 + }, + { + "epoch": 1.62, + "learning_rate": 9.200348449183691e-07, + "loss": 0.7344, + "step": 63173 + }, + { + "epoch": 1.62, + "learning_rate": 9.20007263105304e-07, + "loss": 0.6689, + "step": 63174 + }, + { + "epoch": 1.62, + "learning_rate": 9.19979681353486e-07, + "loss": 0.752, + "step": 63175 + }, + { + "epoch": 1.62, + "learning_rate": 9.199520996629362e-07, + "loss": 0.624, + "step": 63176 + }, + { + "epoch": 1.62, + "learning_rate": 9.199245180336748e-07, + "loss": 0.5308, + "step": 63177 + }, + { + "epoch": 1.62, + "learning_rate": 9.198969364657239e-07, + "loss": 0.7139, + "step": 63178 + }, + { + "epoch": 1.62, + "learning_rate": 9.198693549591039e-07, + "loss": 0.6016, + "step": 63179 + }, + { + "epoch": 1.62, + "learning_rate": 9.198417735138365e-07, + "loss": 0.6274, + "step": 63180 + }, + { + "epoch": 1.62, + "learning_rate": 9.198141921299426e-07, + "loss": 0.6953, + "step": 63181 + }, + { + "epoch": 1.62, + "learning_rate": 9.19786610807443e-07, + "loss": 0.4951, + "step": 63182 + }, + { + "epoch": 1.62, + "learning_rate": 9.197590295463594e-07, + "loss": 0.6475, + "step": 63183 + }, + { + "epoch": 1.62, + "learning_rate": 9.197314483467124e-07, + "loss": 0.7158, + "step": 63184 + }, + { + "epoch": 1.62, + "learning_rate": 9.197038672085235e-07, + "loss": 0.918, + "step": 63185 + }, + { + "epoch": 1.62, + "learning_rate": 9.196762861318139e-07, + "loss": 0.6885, + "step": 63186 + }, + { + "epoch": 1.62, + "learning_rate": 9.196487051166041e-07, + "loss": 0.4902, + "step": 63187 + }, + { + "epoch": 1.62, + "learning_rate": 9.196211241629157e-07, + "loss": 0.7686, + "step": 63188 + }, + { + "epoch": 1.62, + "learning_rate": 9.195935432707696e-07, + "loss": 0.6002, + "step": 63189 + }, + { + "epoch": 1.62, + "learning_rate": 9.195659624401872e-07, + "loss": 0.6611, + "step": 63190 + }, + { + "epoch": 1.62, + "learning_rate": 9.195383816711892e-07, + "loss": 0.5886, + "step": 63191 + }, + { + "epoch": 1.62, + "learning_rate": 9.195108009637971e-07, + "loss": 0.6904, + "step": 63192 + }, + { + "epoch": 1.62, + "learning_rate": 9.194832203180317e-07, + "loss": 0.7285, + "step": 63193 + }, + { + "epoch": 1.62, + "learning_rate": 9.194556397339146e-07, + "loss": 0.6758, + "step": 63194 + }, + { + "epoch": 1.62, + "learning_rate": 9.194280592114664e-07, + "loss": 0.7139, + "step": 63195 + }, + { + "epoch": 1.62, + "learning_rate": 9.194004787507088e-07, + "loss": 0.5449, + "step": 63196 + }, + { + "epoch": 1.62, + "learning_rate": 9.193728983516623e-07, + "loss": 0.6963, + "step": 63197 + }, + { + "epoch": 1.62, + "learning_rate": 9.193453180143483e-07, + "loss": 0.646, + "step": 63198 + }, + { + "epoch": 1.62, + "learning_rate": 9.193177377387877e-07, + "loss": 0.6787, + "step": 63199 + }, + { + "epoch": 1.62, + "learning_rate": 9.19290157525002e-07, + "loss": 0.7256, + "step": 63200 + }, + { + "epoch": 1.62, + "learning_rate": 9.192625773730119e-07, + "loss": 0.6396, + "step": 63201 + }, + { + "epoch": 1.62, + "learning_rate": 9.192349972828389e-07, + "loss": 0.5254, + "step": 63202 + }, + { + "epoch": 1.62, + "learning_rate": 9.192074172545039e-07, + "loss": 0.6787, + "step": 63203 + }, + { + "epoch": 1.62, + "learning_rate": 9.191798372880281e-07, + "loss": 0.6934, + "step": 63204 + }, + { + "epoch": 1.62, + "learning_rate": 9.191522573834324e-07, + "loss": 0.6377, + "step": 63205 + }, + { + "epoch": 1.62, + "learning_rate": 9.191246775407386e-07, + "loss": 0.7139, + "step": 63206 + }, + { + "epoch": 1.62, + "learning_rate": 9.19097097759967e-07, + "loss": 0.5137, + "step": 63207 + }, + { + "epoch": 1.62, + "learning_rate": 9.19069518041139e-07, + "loss": 0.7227, + "step": 63208 + }, + { + "epoch": 1.62, + "learning_rate": 9.190419383842758e-07, + "loss": 0.5347, + "step": 63209 + }, + { + "epoch": 1.62, + "learning_rate": 9.190143587893983e-07, + "loss": 0.5488, + "step": 63210 + }, + { + "epoch": 1.62, + "learning_rate": 9.189867792565279e-07, + "loss": 0.6201, + "step": 63211 + }, + { + "epoch": 1.62, + "learning_rate": 9.189591997856854e-07, + "loss": 0.564, + "step": 63212 + }, + { + "epoch": 1.62, + "learning_rate": 9.189316203768924e-07, + "loss": 0.6343, + "step": 63213 + }, + { + "epoch": 1.62, + "learning_rate": 9.189040410301696e-07, + "loss": 0.6045, + "step": 63214 + }, + { + "epoch": 1.62, + "learning_rate": 9.188764617455383e-07, + "loss": 0.4961, + "step": 63215 + }, + { + "epoch": 1.62, + "learning_rate": 9.188488825230199e-07, + "loss": 0.8291, + "step": 63216 + }, + { + "epoch": 1.62, + "learning_rate": 9.18821303362635e-07, + "loss": 0.5664, + "step": 63217 + }, + { + "epoch": 1.62, + "learning_rate": 9.187937242644045e-07, + "loss": 0.6812, + "step": 63218 + }, + { + "epoch": 1.62, + "learning_rate": 9.187661452283502e-07, + "loss": 0.4111, + "step": 63219 + }, + { + "epoch": 1.62, + "learning_rate": 9.187385662544928e-07, + "loss": 0.5933, + "step": 63220 + }, + { + "epoch": 1.62, + "learning_rate": 9.187109873428537e-07, + "loss": 0.6055, + "step": 63221 + }, + { + "epoch": 1.62, + "learning_rate": 9.186834084934536e-07, + "loss": 0.6504, + "step": 63222 + }, + { + "epoch": 1.62, + "learning_rate": 9.186558297063142e-07, + "loss": 0.6436, + "step": 63223 + }, + { + "epoch": 1.62, + "learning_rate": 9.186282509814559e-07, + "loss": 0.7246, + "step": 63224 + }, + { + "epoch": 1.62, + "learning_rate": 9.186006723189006e-07, + "loss": 0.4796, + "step": 63225 + }, + { + "epoch": 1.62, + "learning_rate": 9.185730937186691e-07, + "loss": 0.5303, + "step": 63226 + }, + { + "epoch": 1.62, + "learning_rate": 9.18545515180782e-07, + "loss": 0.6116, + "step": 63227 + }, + { + "epoch": 1.62, + "learning_rate": 9.185179367052613e-07, + "loss": 0.5449, + "step": 63228 + }, + { + "epoch": 1.62, + "learning_rate": 9.184903582921272e-07, + "loss": 0.6802, + "step": 63229 + }, + { + "epoch": 1.62, + "learning_rate": 9.184627799414017e-07, + "loss": 0.6465, + "step": 63230 + }, + { + "epoch": 1.62, + "learning_rate": 9.18435201653105e-07, + "loss": 0.5786, + "step": 63231 + }, + { + "epoch": 1.62, + "learning_rate": 9.184076234272592e-07, + "loss": 0.7676, + "step": 63232 + }, + { + "epoch": 1.62, + "learning_rate": 9.183800452638845e-07, + "loss": 0.6865, + "step": 63233 + }, + { + "epoch": 1.62, + "learning_rate": 9.183524671630029e-07, + "loss": 0.6016, + "step": 63234 + }, + { + "epoch": 1.62, + "learning_rate": 9.183248891246349e-07, + "loss": 0.4863, + "step": 63235 + }, + { + "epoch": 1.62, + "learning_rate": 9.182973111488021e-07, + "loss": 0.6689, + "step": 63236 + }, + { + "epoch": 1.62, + "learning_rate": 9.182697332355248e-07, + "loss": 0.589, + "step": 63237 + }, + { + "epoch": 1.62, + "learning_rate": 9.182421553848248e-07, + "loss": 0.3691, + "step": 63238 + }, + { + "epoch": 1.62, + "learning_rate": 9.182145775967228e-07, + "loss": 0.7217, + "step": 63239 + }, + { + "epoch": 1.62, + "learning_rate": 9.181869998712404e-07, + "loss": 0.6416, + "step": 63240 + }, + { + "epoch": 1.62, + "learning_rate": 9.181594222083983e-07, + "loss": 0.8184, + "step": 63241 + }, + { + "epoch": 1.62, + "learning_rate": 9.181318446082178e-07, + "loss": 0.6069, + "step": 63242 + }, + { + "epoch": 1.62, + "learning_rate": 9.1810426707072e-07, + "loss": 0.6758, + "step": 63243 + }, + { + "epoch": 1.62, + "learning_rate": 9.18076689595926e-07, + "loss": 0.4662, + "step": 63244 + }, + { + "epoch": 1.62, + "learning_rate": 9.180491121838572e-07, + "loss": 0.6992, + "step": 63245 + }, + { + "epoch": 1.62, + "learning_rate": 9.18021534834534e-07, + "loss": 0.709, + "step": 63246 + }, + { + "epoch": 1.62, + "learning_rate": 9.179939575479782e-07, + "loss": 0.8076, + "step": 63247 + }, + { + "epoch": 1.62, + "learning_rate": 9.179663803242104e-07, + "loss": 0.6108, + "step": 63248 + }, + { + "epoch": 1.62, + "learning_rate": 9.179388031632522e-07, + "loss": 0.6357, + "step": 63249 + }, + { + "epoch": 1.62, + "learning_rate": 9.179112260651242e-07, + "loss": 0.6255, + "step": 63250 + }, + { + "epoch": 1.62, + "learning_rate": 9.178836490298481e-07, + "loss": 0.6475, + "step": 63251 + }, + { + "epoch": 1.62, + "learning_rate": 9.178560720574444e-07, + "loss": 0.6255, + "step": 63252 + }, + { + "epoch": 1.62, + "learning_rate": 9.178284951479349e-07, + "loss": 0.6006, + "step": 63253 + }, + { + "epoch": 1.62, + "learning_rate": 9.178009183013402e-07, + "loss": 0.5796, + "step": 63254 + }, + { + "epoch": 1.62, + "learning_rate": 9.17773341517682e-07, + "loss": 0.6914, + "step": 63255 + }, + { + "epoch": 1.62, + "learning_rate": 9.177457647969803e-07, + "loss": 0.6191, + "step": 63256 + }, + { + "epoch": 1.62, + "learning_rate": 9.177181881392571e-07, + "loss": 0.7212, + "step": 63257 + }, + { + "epoch": 1.62, + "learning_rate": 9.176906115445332e-07, + "loss": 0.5073, + "step": 63258 + }, + { + "epoch": 1.62, + "learning_rate": 9.1766303501283e-07, + "loss": 0.5996, + "step": 63259 + }, + { + "epoch": 1.62, + "learning_rate": 9.176354585441682e-07, + "loss": 0.7373, + "step": 63260 + }, + { + "epoch": 1.62, + "learning_rate": 9.176078821385693e-07, + "loss": 0.6943, + "step": 63261 + }, + { + "epoch": 1.62, + "learning_rate": 9.175803057960541e-07, + "loss": 0.6538, + "step": 63262 + }, + { + "epoch": 1.62, + "learning_rate": 9.175527295166441e-07, + "loss": 0.7617, + "step": 63263 + }, + { + "epoch": 1.62, + "learning_rate": 9.1752515330036e-07, + "loss": 0.5801, + "step": 63264 + }, + { + "epoch": 1.62, + "learning_rate": 9.174975771472234e-07, + "loss": 0.7422, + "step": 63265 + }, + { + "epoch": 1.62, + "learning_rate": 9.17470001057255e-07, + "loss": 0.5435, + "step": 63266 + }, + { + "epoch": 1.62, + "learning_rate": 9.174424250304758e-07, + "loss": 0.6016, + "step": 63267 + }, + { + "epoch": 1.62, + "learning_rate": 9.174148490669073e-07, + "loss": 0.6396, + "step": 63268 + }, + { + "epoch": 1.62, + "learning_rate": 9.173872731665703e-07, + "loss": 0.7471, + "step": 63269 + }, + { + "epoch": 1.62, + "learning_rate": 9.173596973294863e-07, + "loss": 0.4133, + "step": 63270 + }, + { + "epoch": 1.62, + "learning_rate": 9.173321215556761e-07, + "loss": 0.7256, + "step": 63271 + }, + { + "epoch": 1.62, + "learning_rate": 9.173045458451608e-07, + "loss": 0.6655, + "step": 63272 + }, + { + "epoch": 1.62, + "learning_rate": 9.172769701979616e-07, + "loss": 0.6836, + "step": 63273 + }, + { + "epoch": 1.62, + "learning_rate": 9.172493946140995e-07, + "loss": 0.7295, + "step": 63274 + }, + { + "epoch": 1.62, + "learning_rate": 9.172218190935963e-07, + "loss": 0.5166, + "step": 63275 + }, + { + "epoch": 1.62, + "learning_rate": 9.171942436364723e-07, + "loss": 0.4756, + "step": 63276 + }, + { + "epoch": 1.62, + "learning_rate": 9.171666682427486e-07, + "loss": 0.6255, + "step": 63277 + }, + { + "epoch": 1.62, + "learning_rate": 9.171390929124468e-07, + "loss": 0.7314, + "step": 63278 + }, + { + "epoch": 1.62, + "learning_rate": 9.171115176455875e-07, + "loss": 0.6108, + "step": 63279 + }, + { + "epoch": 1.62, + "learning_rate": 9.170839424421923e-07, + "loss": 0.6099, + "step": 63280 + }, + { + "epoch": 1.62, + "learning_rate": 9.17056367302282e-07, + "loss": 0.522, + "step": 63281 + }, + { + "epoch": 1.62, + "learning_rate": 9.170287922258781e-07, + "loss": 0.5967, + "step": 63282 + }, + { + "epoch": 1.62, + "learning_rate": 9.170012172130011e-07, + "loss": 0.7871, + "step": 63283 + }, + { + "epoch": 1.62, + "learning_rate": 9.169736422636725e-07, + "loss": 0.6313, + "step": 63284 + }, + { + "epoch": 1.62, + "learning_rate": 9.169460673779139e-07, + "loss": 0.5791, + "step": 63285 + }, + { + "epoch": 1.62, + "learning_rate": 9.169184925557453e-07, + "loss": 0.5885, + "step": 63286 + }, + { + "epoch": 1.62, + "learning_rate": 9.168909177971886e-07, + "loss": 0.5977, + "step": 63287 + }, + { + "epoch": 1.62, + "learning_rate": 9.168633431022648e-07, + "loss": 0.5537, + "step": 63288 + }, + { + "epoch": 1.62, + "learning_rate": 9.168357684709946e-07, + "loss": 0.7217, + "step": 63289 + }, + { + "epoch": 1.62, + "learning_rate": 9.168081939033996e-07, + "loss": 0.6191, + "step": 63290 + }, + { + "epoch": 1.62, + "learning_rate": 9.167806193995006e-07, + "loss": 0.5798, + "step": 63291 + }, + { + "epoch": 1.62, + "learning_rate": 9.16753044959319e-07, + "loss": 0.834, + "step": 63292 + }, + { + "epoch": 1.62, + "learning_rate": 9.167254705828758e-07, + "loss": 0.6582, + "step": 63293 + }, + { + "epoch": 1.62, + "learning_rate": 9.16697896270192e-07, + "loss": 0.7666, + "step": 63294 + }, + { + "epoch": 1.62, + "learning_rate": 9.166703220212892e-07, + "loss": 0.6328, + "step": 63295 + }, + { + "epoch": 1.62, + "learning_rate": 9.166427478361875e-07, + "loss": 0.554, + "step": 63296 + }, + { + "epoch": 1.62, + "learning_rate": 9.16615173714909e-07, + "loss": 0.5942, + "step": 63297 + }, + { + "epoch": 1.62, + "learning_rate": 9.16587599657474e-07, + "loss": 0.7236, + "step": 63298 + }, + { + "epoch": 1.62, + "learning_rate": 9.165600256639044e-07, + "loss": 0.6475, + "step": 63299 + }, + { + "epoch": 1.62, + "learning_rate": 9.165324517342208e-07, + "loss": 0.6621, + "step": 63300 + }, + { + "epoch": 1.62, + "learning_rate": 9.165048778684445e-07, + "loss": 0.5791, + "step": 63301 + }, + { + "epoch": 1.62, + "learning_rate": 9.164773040665966e-07, + "loss": 0.644, + "step": 63302 + }, + { + "epoch": 1.62, + "learning_rate": 9.164497303286981e-07, + "loss": 0.6943, + "step": 63303 + }, + { + "epoch": 1.62, + "learning_rate": 9.164221566547702e-07, + "loss": 0.7227, + "step": 63304 + }, + { + "epoch": 1.62, + "learning_rate": 9.163945830448346e-07, + "loss": 0.5947, + "step": 63305 + }, + { + "epoch": 1.62, + "learning_rate": 9.163670094989112e-07, + "loss": 0.6543, + "step": 63306 + }, + { + "epoch": 1.62, + "learning_rate": 9.163394360170219e-07, + "loss": 0.6113, + "step": 63307 + }, + { + "epoch": 1.62, + "learning_rate": 9.163118625991875e-07, + "loss": 0.5557, + "step": 63308 + }, + { + "epoch": 1.62, + "learning_rate": 9.162842892454295e-07, + "loss": 0.6301, + "step": 63309 + }, + { + "epoch": 1.62, + "learning_rate": 9.162567159557684e-07, + "loss": 0.7549, + "step": 63310 + }, + { + "epoch": 1.62, + "learning_rate": 9.16229142730226e-07, + "loss": 0.6934, + "step": 63311 + }, + { + "epoch": 1.62, + "learning_rate": 9.162015695688228e-07, + "loss": 0.5815, + "step": 63312 + }, + { + "epoch": 1.62, + "learning_rate": 9.161739964715805e-07, + "loss": 0.6284, + "step": 63313 + }, + { + "epoch": 1.62, + "learning_rate": 9.161464234385197e-07, + "loss": 0.7266, + "step": 63314 + }, + { + "epoch": 1.62, + "learning_rate": 9.161188504696622e-07, + "loss": 0.7256, + "step": 63315 + }, + { + "epoch": 1.62, + "learning_rate": 9.160912775650284e-07, + "loss": 0.6108, + "step": 63316 + }, + { + "epoch": 1.62, + "learning_rate": 9.160637047246394e-07, + "loss": 0.6592, + "step": 63317 + }, + { + "epoch": 1.62, + "learning_rate": 9.160361319485167e-07, + "loss": 0.6641, + "step": 63318 + }, + { + "epoch": 1.62, + "learning_rate": 9.160085592366811e-07, + "loss": 0.728, + "step": 63319 + }, + { + "epoch": 1.62, + "learning_rate": 9.159809865891542e-07, + "loss": 0.5393, + "step": 63320 + }, + { + "epoch": 1.62, + "learning_rate": 9.159534140059565e-07, + "loss": 0.5809, + "step": 63321 + }, + { + "epoch": 1.62, + "learning_rate": 9.159258414871096e-07, + "loss": 0.5581, + "step": 63322 + }, + { + "epoch": 1.62, + "learning_rate": 9.158982690326343e-07, + "loss": 0.5393, + "step": 63323 + }, + { + "epoch": 1.62, + "learning_rate": 9.15870696642552e-07, + "loss": 0.6143, + "step": 63324 + }, + { + "epoch": 1.62, + "learning_rate": 9.158431243168838e-07, + "loss": 0.6279, + "step": 63325 + }, + { + "epoch": 1.62, + "learning_rate": 9.158155520556506e-07, + "loss": 0.709, + "step": 63326 + }, + { + "epoch": 1.62, + "learning_rate": 9.157879798588731e-07, + "loss": 0.5687, + "step": 63327 + }, + { + "epoch": 1.62, + "learning_rate": 9.157604077265733e-07, + "loss": 0.71, + "step": 63328 + }, + { + "epoch": 1.62, + "learning_rate": 9.157328356587715e-07, + "loss": 0.423, + "step": 63329 + }, + { + "epoch": 1.62, + "learning_rate": 9.157052636554895e-07, + "loss": 0.6772, + "step": 63330 + }, + { + "epoch": 1.62, + "learning_rate": 9.156776917167479e-07, + "loss": 0.7695, + "step": 63331 + }, + { + "epoch": 1.62, + "learning_rate": 9.156501198425681e-07, + "loss": 0.5206, + "step": 63332 + }, + { + "epoch": 1.62, + "learning_rate": 9.156225480329711e-07, + "loss": 0.7744, + "step": 63333 + }, + { + "epoch": 1.62, + "learning_rate": 9.155949762879781e-07, + "loss": 0.749, + "step": 63334 + }, + { + "epoch": 1.62, + "learning_rate": 9.155674046076105e-07, + "loss": 0.6992, + "step": 63335 + }, + { + "epoch": 1.62, + "learning_rate": 9.155398329918885e-07, + "loss": 0.5908, + "step": 63336 + }, + { + "epoch": 1.62, + "learning_rate": 9.15512261440834e-07, + "loss": 0.6553, + "step": 63337 + }, + { + "epoch": 1.62, + "learning_rate": 9.154846899544678e-07, + "loss": 0.583, + "step": 63338 + }, + { + "epoch": 1.62, + "learning_rate": 9.154571185328112e-07, + "loss": 0.7939, + "step": 63339 + }, + { + "epoch": 1.62, + "learning_rate": 9.154295471758849e-07, + "loss": 0.7061, + "step": 63340 + }, + { + "epoch": 1.62, + "learning_rate": 9.154019758837106e-07, + "loss": 0.6084, + "step": 63341 + }, + { + "epoch": 1.62, + "learning_rate": 9.153744046563089e-07, + "loss": 0.5168, + "step": 63342 + }, + { + "epoch": 1.62, + "learning_rate": 9.153468334937013e-07, + "loss": 0.6758, + "step": 63343 + }, + { + "epoch": 1.62, + "learning_rate": 9.153192623959089e-07, + "loss": 0.5801, + "step": 63344 + }, + { + "epoch": 1.62, + "learning_rate": 9.152916913629527e-07, + "loss": 0.5552, + "step": 63345 + }, + { + "epoch": 1.62, + "learning_rate": 9.152641203948533e-07, + "loss": 0.6553, + "step": 63346 + }, + { + "epoch": 1.62, + "learning_rate": 9.152365494916325e-07, + "loss": 0.5718, + "step": 63347 + }, + { + "epoch": 1.62, + "learning_rate": 9.15208978653311e-07, + "loss": 0.6799, + "step": 63348 + }, + { + "epoch": 1.62, + "learning_rate": 9.151814078799104e-07, + "loss": 0.6089, + "step": 63349 + }, + { + "epoch": 1.62, + "learning_rate": 9.151538371714512e-07, + "loss": 0.7148, + "step": 63350 + }, + { + "epoch": 1.62, + "learning_rate": 9.15126266527955e-07, + "loss": 0.8633, + "step": 63351 + }, + { + "epoch": 1.62, + "learning_rate": 9.150986959494426e-07, + "loss": 0.6602, + "step": 63352 + }, + { + "epoch": 1.62, + "learning_rate": 9.150711254359353e-07, + "loss": 0.5615, + "step": 63353 + }, + { + "epoch": 1.62, + "learning_rate": 9.150435549874539e-07, + "loss": 0.6001, + "step": 63354 + }, + { + "epoch": 1.62, + "learning_rate": 9.150159846040203e-07, + "loss": 0.6475, + "step": 63355 + }, + { + "epoch": 1.62, + "learning_rate": 9.149884142856548e-07, + "loss": 0.5898, + "step": 63356 + }, + { + "epoch": 1.62, + "learning_rate": 9.149608440323785e-07, + "loss": 0.6797, + "step": 63357 + }, + { + "epoch": 1.62, + "learning_rate": 9.149332738442131e-07, + "loss": 0.7402, + "step": 63358 + }, + { + "epoch": 1.62, + "learning_rate": 9.149057037211791e-07, + "loss": 0.413, + "step": 63359 + }, + { + "epoch": 1.62, + "learning_rate": 9.148781336632981e-07, + "loss": 0.6895, + "step": 63360 + }, + { + "epoch": 1.62, + "learning_rate": 9.148505636705908e-07, + "loss": 0.5342, + "step": 63361 + }, + { + "epoch": 1.62, + "learning_rate": 9.148229937430786e-07, + "loss": 0.7588, + "step": 63362 + }, + { + "epoch": 1.62, + "learning_rate": 9.147954238807826e-07, + "loss": 0.7168, + "step": 63363 + }, + { + "epoch": 1.62, + "learning_rate": 9.147678540837236e-07, + "loss": 0.7412, + "step": 63364 + }, + { + "epoch": 1.62, + "learning_rate": 9.147402843519234e-07, + "loss": 0.7393, + "step": 63365 + }, + { + "epoch": 1.62, + "learning_rate": 9.147127146854023e-07, + "loss": 0.3306, + "step": 63366 + }, + { + "epoch": 1.62, + "learning_rate": 9.146851450841817e-07, + "loss": 0.7275, + "step": 63367 + }, + { + "epoch": 1.62, + "learning_rate": 9.14657575548283e-07, + "loss": 0.6641, + "step": 63368 + }, + { + "epoch": 1.62, + "learning_rate": 9.146300060777268e-07, + "loss": 0.7217, + "step": 63369 + }, + { + "epoch": 1.62, + "learning_rate": 9.146024366725347e-07, + "loss": 0.7959, + "step": 63370 + }, + { + "epoch": 1.62, + "learning_rate": 9.145748673327272e-07, + "loss": 0.5571, + "step": 63371 + }, + { + "epoch": 1.62, + "learning_rate": 9.145472980583263e-07, + "loss": 0.5235, + "step": 63372 + }, + { + "epoch": 1.62, + "learning_rate": 9.145197288493522e-07, + "loss": 0.7368, + "step": 63373 + }, + { + "epoch": 1.62, + "learning_rate": 9.144921597058268e-07, + "loss": 0.7461, + "step": 63374 + }, + { + "epoch": 1.62, + "learning_rate": 9.144645906277708e-07, + "loss": 0.6338, + "step": 63375 + }, + { + "epoch": 1.62, + "learning_rate": 9.144370216152051e-07, + "loss": 0.7842, + "step": 63376 + }, + { + "epoch": 1.62, + "learning_rate": 9.144094526681512e-07, + "loss": 0.7246, + "step": 63377 + }, + { + "epoch": 1.62, + "learning_rate": 9.1438188378663e-07, + "loss": 0.5549, + "step": 63378 + }, + { + "epoch": 1.62, + "learning_rate": 9.143543149706624e-07, + "loss": 0.5574, + "step": 63379 + }, + { + "epoch": 1.62, + "learning_rate": 9.143267462202701e-07, + "loss": 0.7144, + "step": 63380 + }, + { + "epoch": 1.62, + "learning_rate": 9.142991775354734e-07, + "loss": 0.5879, + "step": 63381 + }, + { + "epoch": 1.62, + "learning_rate": 9.142716089162944e-07, + "loss": 0.7256, + "step": 63382 + }, + { + "epoch": 1.62, + "learning_rate": 9.142440403627534e-07, + "loss": 0.6108, + "step": 63383 + }, + { + "epoch": 1.62, + "learning_rate": 9.14216471874872e-07, + "loss": 0.5352, + "step": 63384 + }, + { + "epoch": 1.62, + "learning_rate": 9.141889034526712e-07, + "loss": 0.708, + "step": 63385 + }, + { + "epoch": 1.62, + "learning_rate": 9.141613350961717e-07, + "loss": 0.6172, + "step": 63386 + }, + { + "epoch": 1.62, + "learning_rate": 9.141337668053951e-07, + "loss": 0.6978, + "step": 63387 + }, + { + "epoch": 1.62, + "learning_rate": 9.141061985803621e-07, + "loss": 0.5046, + "step": 63388 + }, + { + "epoch": 1.62, + "learning_rate": 9.140786304210942e-07, + "loss": 0.426, + "step": 63389 + }, + { + "epoch": 1.62, + "learning_rate": 9.140510623276123e-07, + "loss": 0.4487, + "step": 63390 + }, + { + "epoch": 1.62, + "learning_rate": 9.140234942999376e-07, + "loss": 0.6538, + "step": 63391 + }, + { + "epoch": 1.62, + "learning_rate": 9.13995926338091e-07, + "loss": 0.7676, + "step": 63392 + }, + { + "epoch": 1.62, + "learning_rate": 9.13968358442094e-07, + "loss": 0.6274, + "step": 63393 + }, + { + "epoch": 1.62, + "learning_rate": 9.139407906119671e-07, + "loss": 0.562, + "step": 63394 + }, + { + "epoch": 1.62, + "learning_rate": 9.139132228477326e-07, + "loss": 0.6348, + "step": 63395 + }, + { + "epoch": 1.62, + "learning_rate": 9.138856551494102e-07, + "loss": 0.5869, + "step": 63396 + }, + { + "epoch": 1.62, + "learning_rate": 9.138580875170217e-07, + "loss": 0.6157, + "step": 63397 + }, + { + "epoch": 1.62, + "learning_rate": 9.138305199505879e-07, + "loss": 0.6172, + "step": 63398 + }, + { + "epoch": 1.62, + "learning_rate": 9.138029524501303e-07, + "loss": 0.5864, + "step": 63399 + }, + { + "epoch": 1.62, + "learning_rate": 9.137753850156697e-07, + "loss": 0.5913, + "step": 63400 + }, + { + "epoch": 1.62, + "learning_rate": 9.137478176472275e-07, + "loss": 0.5623, + "step": 63401 + }, + { + "epoch": 1.63, + "learning_rate": 9.137202503448243e-07, + "loss": 0.4895, + "step": 63402 + }, + { + "epoch": 1.63, + "learning_rate": 9.136926831084818e-07, + "loss": 0.498, + "step": 63403 + }, + { + "epoch": 1.63, + "learning_rate": 9.136651159382206e-07, + "loss": 0.6411, + "step": 63404 + }, + { + "epoch": 1.63, + "learning_rate": 9.136375488340625e-07, + "loss": 0.5068, + "step": 63405 + }, + { + "epoch": 1.63, + "learning_rate": 9.13609981796028e-07, + "loss": 0.4407, + "step": 63406 + }, + { + "epoch": 1.63, + "learning_rate": 9.135824148241382e-07, + "loss": 0.6038, + "step": 63407 + }, + { + "epoch": 1.63, + "learning_rate": 9.135548479184146e-07, + "loss": 0.6064, + "step": 63408 + }, + { + "epoch": 1.63, + "learning_rate": 9.135272810788777e-07, + "loss": 0.5159, + "step": 63409 + }, + { + "epoch": 1.63, + "learning_rate": 9.134997143055492e-07, + "loss": 0.6187, + "step": 63410 + }, + { + "epoch": 1.63, + "learning_rate": 9.134721475984499e-07, + "loss": 0.4857, + "step": 63411 + }, + { + "epoch": 1.63, + "learning_rate": 9.134445809576011e-07, + "loss": 0.6465, + "step": 63412 + }, + { + "epoch": 1.63, + "learning_rate": 9.134170143830236e-07, + "loss": 0.5845, + "step": 63413 + }, + { + "epoch": 1.63, + "learning_rate": 9.13389447874739e-07, + "loss": 0.6582, + "step": 63414 + }, + { + "epoch": 1.63, + "learning_rate": 9.133618814327684e-07, + "loss": 0.5811, + "step": 63415 + }, + { + "epoch": 1.63, + "learning_rate": 9.133343150571323e-07, + "loss": 0.5197, + "step": 63416 + }, + { + "epoch": 1.63, + "learning_rate": 9.13306748747852e-07, + "loss": 0.6528, + "step": 63417 + }, + { + "epoch": 1.63, + "learning_rate": 9.132791825049488e-07, + "loss": 0.7705, + "step": 63418 + }, + { + "epoch": 1.63, + "learning_rate": 9.132516163284436e-07, + "loss": 0.6245, + "step": 63419 + }, + { + "epoch": 1.63, + "learning_rate": 9.132240502183579e-07, + "loss": 0.5698, + "step": 63420 + }, + { + "epoch": 1.63, + "learning_rate": 9.131964841747124e-07, + "loss": 0.6431, + "step": 63421 + }, + { + "epoch": 1.63, + "learning_rate": 9.131689181975284e-07, + "loss": 0.4824, + "step": 63422 + }, + { + "epoch": 1.63, + "learning_rate": 9.131413522868269e-07, + "loss": 0.7334, + "step": 63423 + }, + { + "epoch": 1.63, + "learning_rate": 9.131137864426293e-07, + "loss": 0.5278, + "step": 63424 + }, + { + "epoch": 1.63, + "learning_rate": 9.130862206649565e-07, + "loss": 0.708, + "step": 63425 + }, + { + "epoch": 1.63, + "learning_rate": 9.130586549538292e-07, + "loss": 0.4844, + "step": 63426 + }, + { + "epoch": 1.63, + "learning_rate": 9.130310893092693e-07, + "loss": 0.7041, + "step": 63427 + }, + { + "epoch": 1.63, + "learning_rate": 9.130035237312972e-07, + "loss": 0.5552, + "step": 63428 + }, + { + "epoch": 1.63, + "learning_rate": 9.129759582199344e-07, + "loss": 0.7129, + "step": 63429 + }, + { + "epoch": 1.63, + "learning_rate": 9.129483927752019e-07, + "loss": 0.6304, + "step": 63430 + }, + { + "epoch": 1.63, + "learning_rate": 9.129208273971208e-07, + "loss": 0.603, + "step": 63431 + }, + { + "epoch": 1.63, + "learning_rate": 9.128932620857122e-07, + "loss": 0.583, + "step": 63432 + }, + { + "epoch": 1.63, + "learning_rate": 9.128656968409974e-07, + "loss": 0.7402, + "step": 63433 + }, + { + "epoch": 1.63, + "learning_rate": 9.128381316629972e-07, + "loss": 0.6885, + "step": 63434 + }, + { + "epoch": 1.63, + "learning_rate": 9.128105665517332e-07, + "loss": 0.6973, + "step": 63435 + }, + { + "epoch": 1.63, + "learning_rate": 9.127830015072255e-07, + "loss": 0.6851, + "step": 63436 + }, + { + "epoch": 1.63, + "learning_rate": 9.127554365294963e-07, + "loss": 0.7471, + "step": 63437 + }, + { + "epoch": 1.63, + "learning_rate": 9.127278716185659e-07, + "loss": 0.7139, + "step": 63438 + }, + { + "epoch": 1.63, + "learning_rate": 9.12700306774456e-07, + "loss": 0.666, + "step": 63439 + }, + { + "epoch": 1.63, + "learning_rate": 9.126727419971873e-07, + "loss": 0.5776, + "step": 63440 + }, + { + "epoch": 1.63, + "learning_rate": 9.126451772867811e-07, + "loss": 0.8916, + "step": 63441 + }, + { + "epoch": 1.63, + "learning_rate": 9.126176126432584e-07, + "loss": 0.5806, + "step": 63442 + }, + { + "epoch": 1.63, + "learning_rate": 9.125900480666406e-07, + "loss": 0.749, + "step": 63443 + }, + { + "epoch": 1.63, + "learning_rate": 9.125624835569483e-07, + "loss": 0.5957, + "step": 63444 + }, + { + "epoch": 1.63, + "learning_rate": 9.125349191142034e-07, + "loss": 0.6963, + "step": 63445 + }, + { + "epoch": 1.63, + "learning_rate": 9.125073547384263e-07, + "loss": 0.469, + "step": 63446 + }, + { + "epoch": 1.63, + "learning_rate": 9.12479790429638e-07, + "loss": 0.5454, + "step": 63447 + }, + { + "epoch": 1.63, + "learning_rate": 9.124522261878601e-07, + "loss": 0.627, + "step": 63448 + }, + { + "epoch": 1.63, + "learning_rate": 9.124246620131133e-07, + "loss": 0.4619, + "step": 63449 + }, + { + "epoch": 1.63, + "learning_rate": 9.123970979054192e-07, + "loss": 0.5345, + "step": 63450 + }, + { + "epoch": 1.63, + "learning_rate": 9.123695338647986e-07, + "loss": 0.6499, + "step": 63451 + }, + { + "epoch": 1.63, + "learning_rate": 9.123419698912723e-07, + "loss": 0.666, + "step": 63452 + }, + { + "epoch": 1.63, + "learning_rate": 9.12314405984862e-07, + "loss": 0.5283, + "step": 63453 + }, + { + "epoch": 1.63, + "learning_rate": 9.122868421455883e-07, + "loss": 0.6519, + "step": 63454 + }, + { + "epoch": 1.63, + "learning_rate": 9.12259278373473e-07, + "loss": 0.6743, + "step": 63455 + }, + { + "epoch": 1.63, + "learning_rate": 9.122317146685365e-07, + "loss": 0.6973, + "step": 63456 + }, + { + "epoch": 1.63, + "learning_rate": 9.122041510308e-07, + "loss": 0.5337, + "step": 63457 + }, + { + "epoch": 1.63, + "learning_rate": 9.121765874602848e-07, + "loss": 0.4929, + "step": 63458 + }, + { + "epoch": 1.63, + "learning_rate": 9.121490239570118e-07, + "loss": 0.6621, + "step": 63459 + }, + { + "epoch": 1.63, + "learning_rate": 9.121214605210025e-07, + "loss": 0.5649, + "step": 63460 + }, + { + "epoch": 1.63, + "learning_rate": 9.120938971522775e-07, + "loss": 0.585, + "step": 63461 + }, + { + "epoch": 1.63, + "learning_rate": 9.120663338508584e-07, + "loss": 0.6768, + "step": 63462 + }, + { + "epoch": 1.63, + "learning_rate": 9.120387706167658e-07, + "loss": 0.5425, + "step": 63463 + }, + { + "epoch": 1.63, + "learning_rate": 9.120112074500213e-07, + "loss": 0.5596, + "step": 63464 + }, + { + "epoch": 1.63, + "learning_rate": 9.119836443506461e-07, + "loss": 0.5022, + "step": 63465 + }, + { + "epoch": 1.63, + "learning_rate": 9.119560813186605e-07, + "loss": 0.4922, + "step": 63466 + }, + { + "epoch": 1.63, + "learning_rate": 9.119285183540863e-07, + "loss": 0.626, + "step": 63467 + }, + { + "epoch": 1.63, + "learning_rate": 9.119009554569444e-07, + "loss": 0.5327, + "step": 63468 + }, + { + "epoch": 1.63, + "learning_rate": 9.118733926272555e-07, + "loss": 0.5015, + "step": 63469 + }, + { + "epoch": 1.63, + "learning_rate": 9.118458298650414e-07, + "loss": 0.8525, + "step": 63470 + }, + { + "epoch": 1.63, + "learning_rate": 9.118182671703227e-07, + "loss": 0.5869, + "step": 63471 + }, + { + "epoch": 1.63, + "learning_rate": 9.11790704543121e-07, + "loss": 0.6387, + "step": 63472 + }, + { + "epoch": 1.63, + "learning_rate": 9.117631419834568e-07, + "loss": 0.7471, + "step": 63473 + }, + { + "epoch": 1.63, + "learning_rate": 9.117355794913517e-07, + "loss": 0.5596, + "step": 63474 + }, + { + "epoch": 1.63, + "learning_rate": 9.117080170668268e-07, + "loss": 0.6191, + "step": 63475 + }, + { + "epoch": 1.63, + "learning_rate": 9.116804547099026e-07, + "loss": 0.668, + "step": 63476 + }, + { + "epoch": 1.63, + "learning_rate": 9.11652892420601e-07, + "loss": 0.5161, + "step": 63477 + }, + { + "epoch": 1.63, + "learning_rate": 9.116253301989423e-07, + "loss": 0.6816, + "step": 63478 + }, + { + "epoch": 1.63, + "learning_rate": 9.115977680449483e-07, + "loss": 0.6895, + "step": 63479 + }, + { + "epoch": 1.63, + "learning_rate": 9.115702059586396e-07, + "loss": 0.7754, + "step": 63480 + }, + { + "epoch": 1.63, + "learning_rate": 9.115426439400378e-07, + "loss": 0.5796, + "step": 63481 + }, + { + "epoch": 1.63, + "learning_rate": 9.115150819891634e-07, + "loss": 0.6152, + "step": 63482 + }, + { + "epoch": 1.63, + "learning_rate": 9.114875201060382e-07, + "loss": 0.499, + "step": 63483 + }, + { + "epoch": 1.63, + "learning_rate": 9.114599582906825e-07, + "loss": 0.6973, + "step": 63484 + }, + { + "epoch": 1.63, + "learning_rate": 9.114323965431186e-07, + "loss": 0.6577, + "step": 63485 + }, + { + "epoch": 1.63, + "learning_rate": 9.114048348633663e-07, + "loss": 0.7007, + "step": 63486 + }, + { + "epoch": 1.63, + "learning_rate": 9.113772732514475e-07, + "loss": 0.5317, + "step": 63487 + }, + { + "epoch": 1.63, + "learning_rate": 9.113497117073826e-07, + "loss": 0.4019, + "step": 63488 + }, + { + "epoch": 1.63, + "learning_rate": 9.113221502311935e-07, + "loss": 0.5679, + "step": 63489 + }, + { + "epoch": 1.63, + "learning_rate": 9.112945888229007e-07, + "loss": 0.5903, + "step": 63490 + }, + { + "epoch": 1.63, + "learning_rate": 9.112670274825258e-07, + "loss": 0.5242, + "step": 63491 + }, + { + "epoch": 1.63, + "learning_rate": 9.112394662100893e-07, + "loss": 0.6162, + "step": 63492 + }, + { + "epoch": 1.63, + "learning_rate": 9.11211905005613e-07, + "loss": 0.5225, + "step": 63493 + }, + { + "epoch": 1.63, + "learning_rate": 9.111843438691174e-07, + "loss": 0.6787, + "step": 63494 + }, + { + "epoch": 1.63, + "learning_rate": 9.111567828006244e-07, + "loss": 0.6489, + "step": 63495 + }, + { + "epoch": 1.63, + "learning_rate": 9.111292218001543e-07, + "loss": 0.582, + "step": 63496 + }, + { + "epoch": 1.63, + "learning_rate": 9.111016608677282e-07, + "loss": 0.7744, + "step": 63497 + }, + { + "epoch": 1.63, + "learning_rate": 9.110741000033678e-07, + "loss": 0.4829, + "step": 63498 + }, + { + "epoch": 1.63, + "learning_rate": 9.110465392070935e-07, + "loss": 0.645, + "step": 63499 + }, + { + "epoch": 1.63, + "learning_rate": 9.110189784789272e-07, + "loss": 0.5054, + "step": 63500 + }, + { + "epoch": 1.63, + "learning_rate": 9.109914178188892e-07, + "loss": 0.6665, + "step": 63501 + }, + { + "epoch": 1.63, + "learning_rate": 9.109638572270012e-07, + "loss": 0.6611, + "step": 63502 + }, + { + "epoch": 1.63, + "learning_rate": 9.109362967032838e-07, + "loss": 0.6284, + "step": 63503 + }, + { + "epoch": 1.63, + "learning_rate": 9.109087362477588e-07, + "loss": 0.8359, + "step": 63504 + }, + { + "epoch": 1.63, + "learning_rate": 9.10881175860447e-07, + "loss": 0.5688, + "step": 63505 + }, + { + "epoch": 1.63, + "learning_rate": 9.108536155413691e-07, + "loss": 0.6245, + "step": 63506 + }, + { + "epoch": 1.63, + "learning_rate": 9.108260552905464e-07, + "loss": 0.625, + "step": 63507 + }, + { + "epoch": 1.63, + "learning_rate": 9.107984951080003e-07, + "loss": 0.6011, + "step": 63508 + }, + { + "epoch": 1.63, + "learning_rate": 9.107709349937514e-07, + "loss": 0.666, + "step": 63509 + }, + { + "epoch": 1.63, + "learning_rate": 9.107433749478213e-07, + "loss": 0.6655, + "step": 63510 + }, + { + "epoch": 1.63, + "learning_rate": 9.107158149702306e-07, + "loss": 0.7676, + "step": 63511 + }, + { + "epoch": 1.63, + "learning_rate": 9.10688255061001e-07, + "loss": 0.5791, + "step": 63512 + }, + { + "epoch": 1.63, + "learning_rate": 9.106606952201531e-07, + "loss": 0.5762, + "step": 63513 + }, + { + "epoch": 1.63, + "learning_rate": 9.106331354477084e-07, + "loss": 0.647, + "step": 63514 + }, + { + "epoch": 1.63, + "learning_rate": 9.106055757436881e-07, + "loss": 0.6494, + "step": 63515 + }, + { + "epoch": 1.63, + "learning_rate": 9.105780161081124e-07, + "loss": 0.6133, + "step": 63516 + }, + { + "epoch": 1.63, + "learning_rate": 9.105504565410034e-07, + "loss": 0.5435, + "step": 63517 + }, + { + "epoch": 1.63, + "learning_rate": 9.105228970423813e-07, + "loss": 0.6338, + "step": 63518 + }, + { + "epoch": 1.63, + "learning_rate": 9.104953376122683e-07, + "loss": 0.6365, + "step": 63519 + }, + { + "epoch": 1.63, + "learning_rate": 9.104677782506844e-07, + "loss": 0.6338, + "step": 63520 + }, + { + "epoch": 1.63, + "learning_rate": 9.104402189576515e-07, + "loss": 0.6016, + "step": 63521 + }, + { + "epoch": 1.63, + "learning_rate": 9.104126597331902e-07, + "loss": 0.6768, + "step": 63522 + }, + { + "epoch": 1.63, + "learning_rate": 9.103851005773221e-07, + "loss": 0.4993, + "step": 63523 + }, + { + "epoch": 1.63, + "learning_rate": 9.103575414900679e-07, + "loss": 0.5659, + "step": 63524 + }, + { + "epoch": 1.63, + "learning_rate": 9.103299824714491e-07, + "loss": 0.5432, + "step": 63525 + }, + { + "epoch": 1.63, + "learning_rate": 9.10302423521486e-07, + "loss": 0.5483, + "step": 63526 + }, + { + "epoch": 1.63, + "learning_rate": 9.102748646402005e-07, + "loss": 0.6475, + "step": 63527 + }, + { + "epoch": 1.63, + "learning_rate": 9.102473058276132e-07, + "loss": 0.708, + "step": 63528 + }, + { + "epoch": 1.63, + "learning_rate": 9.102197470837456e-07, + "loss": 0.6333, + "step": 63529 + }, + { + "epoch": 1.63, + "learning_rate": 9.101921884086184e-07, + "loss": 0.6333, + "step": 63530 + }, + { + "epoch": 1.63, + "learning_rate": 9.101646298022531e-07, + "loss": 0.6187, + "step": 63531 + }, + { + "epoch": 1.63, + "learning_rate": 9.101370712646704e-07, + "loss": 0.7349, + "step": 63532 + }, + { + "epoch": 1.63, + "learning_rate": 9.101095127958918e-07, + "loss": 0.7441, + "step": 63533 + }, + { + "epoch": 1.63, + "learning_rate": 9.100819543959385e-07, + "loss": 0.6191, + "step": 63534 + }, + { + "epoch": 1.63, + "learning_rate": 9.100543960648308e-07, + "loss": 0.5898, + "step": 63535 + }, + { + "epoch": 1.63, + "learning_rate": 9.100268378025906e-07, + "loss": 0.6885, + "step": 63536 + }, + { + "epoch": 1.63, + "learning_rate": 9.099992796092385e-07, + "loss": 0.5376, + "step": 63537 + }, + { + "epoch": 1.63, + "learning_rate": 9.099717214847959e-07, + "loss": 0.666, + "step": 63538 + }, + { + "epoch": 1.63, + "learning_rate": 9.099441634292837e-07, + "loss": 0.6641, + "step": 63539 + }, + { + "epoch": 1.63, + "learning_rate": 9.099166054427234e-07, + "loss": 0.5845, + "step": 63540 + }, + { + "epoch": 1.63, + "learning_rate": 9.098890475251357e-07, + "loss": 1.0518, + "step": 63541 + }, + { + "epoch": 1.63, + "learning_rate": 9.098614896765417e-07, + "loss": 0.7686, + "step": 63542 + }, + { + "epoch": 1.63, + "learning_rate": 9.098339318969628e-07, + "loss": 0.6851, + "step": 63543 + }, + { + "epoch": 1.63, + "learning_rate": 9.0980637418642e-07, + "loss": 0.668, + "step": 63544 + }, + { + "epoch": 1.63, + "learning_rate": 9.097788165449341e-07, + "loss": 0.7637, + "step": 63545 + }, + { + "epoch": 1.63, + "learning_rate": 9.097512589725265e-07, + "loss": 0.5757, + "step": 63546 + }, + { + "epoch": 1.63, + "learning_rate": 9.09723701469218e-07, + "loss": 0.6763, + "step": 63547 + }, + { + "epoch": 1.63, + "learning_rate": 9.0969614403503e-07, + "loss": 0.4348, + "step": 63548 + }, + { + "epoch": 1.63, + "learning_rate": 9.096685866699835e-07, + "loss": 0.6001, + "step": 63549 + }, + { + "epoch": 1.63, + "learning_rate": 9.096410293740997e-07, + "loss": 0.5483, + "step": 63550 + }, + { + "epoch": 1.63, + "learning_rate": 9.096134721473995e-07, + "loss": 0.4819, + "step": 63551 + }, + { + "epoch": 1.63, + "learning_rate": 9.095859149899042e-07, + "loss": 0.5515, + "step": 63552 + }, + { + "epoch": 1.63, + "learning_rate": 9.095583579016347e-07, + "loss": 0.6152, + "step": 63553 + }, + { + "epoch": 1.63, + "learning_rate": 9.095308008826126e-07, + "loss": 0.646, + "step": 63554 + }, + { + "epoch": 1.63, + "learning_rate": 9.095032439328584e-07, + "loss": 0.7393, + "step": 63555 + }, + { + "epoch": 1.63, + "learning_rate": 9.09475687052393e-07, + "loss": 0.5239, + "step": 63556 + }, + { + "epoch": 1.63, + "learning_rate": 9.094481302412385e-07, + "loss": 0.6943, + "step": 63557 + }, + { + "epoch": 1.63, + "learning_rate": 9.094205734994152e-07, + "loss": 0.6709, + "step": 63558 + }, + { + "epoch": 1.63, + "learning_rate": 9.093930168269442e-07, + "loss": 0.564, + "step": 63559 + }, + { + "epoch": 1.63, + "learning_rate": 9.093654602238469e-07, + "loss": 0.6104, + "step": 63560 + }, + { + "epoch": 1.63, + "learning_rate": 9.093379036901442e-07, + "loss": 0.6323, + "step": 63561 + }, + { + "epoch": 1.63, + "learning_rate": 9.093103472258574e-07, + "loss": 0.5659, + "step": 63562 + }, + { + "epoch": 1.63, + "learning_rate": 9.092827908310075e-07, + "loss": 0.623, + "step": 63563 + }, + { + "epoch": 1.63, + "learning_rate": 9.092552345056159e-07, + "loss": 0.8389, + "step": 63564 + }, + { + "epoch": 1.63, + "learning_rate": 9.092276782497031e-07, + "loss": 0.53, + "step": 63565 + }, + { + "epoch": 1.63, + "learning_rate": 9.092001220632904e-07, + "loss": 0.5442, + "step": 63566 + }, + { + "epoch": 1.63, + "learning_rate": 9.091725659463991e-07, + "loss": 0.6387, + "step": 63567 + }, + { + "epoch": 1.63, + "learning_rate": 9.091450098990501e-07, + "loss": 0.5161, + "step": 63568 + }, + { + "epoch": 1.63, + "learning_rate": 9.091174539212647e-07, + "loss": 0.6509, + "step": 63569 + }, + { + "epoch": 1.63, + "learning_rate": 9.090898980130638e-07, + "loss": 0.5659, + "step": 63570 + }, + { + "epoch": 1.63, + "learning_rate": 9.090623421744688e-07, + "loss": 0.542, + "step": 63571 + }, + { + "epoch": 1.63, + "learning_rate": 9.090347864055002e-07, + "loss": 0.5771, + "step": 63572 + }, + { + "epoch": 1.63, + "learning_rate": 9.090072307061798e-07, + "loss": 0.5469, + "step": 63573 + }, + { + "epoch": 1.63, + "learning_rate": 9.089796750765285e-07, + "loss": 0.7383, + "step": 63574 + }, + { + "epoch": 1.63, + "learning_rate": 9.089521195165671e-07, + "loss": 0.5996, + "step": 63575 + }, + { + "epoch": 1.63, + "learning_rate": 9.089245640263168e-07, + "loss": 0.6279, + "step": 63576 + }, + { + "epoch": 1.63, + "learning_rate": 9.088970086057989e-07, + "loss": 0.4722, + "step": 63577 + }, + { + "epoch": 1.63, + "learning_rate": 9.08869453255034e-07, + "loss": 0.5889, + "step": 63578 + }, + { + "epoch": 1.63, + "learning_rate": 9.088418979740441e-07, + "loss": 0.5247, + "step": 63579 + }, + { + "epoch": 1.63, + "learning_rate": 9.088143427628493e-07, + "loss": 0.7061, + "step": 63580 + }, + { + "epoch": 1.63, + "learning_rate": 9.087867876214715e-07, + "loss": 0.7515, + "step": 63581 + }, + { + "epoch": 1.63, + "learning_rate": 9.087592325499312e-07, + "loss": 0.6924, + "step": 63582 + }, + { + "epoch": 1.63, + "learning_rate": 9.0873167754825e-07, + "loss": 0.6953, + "step": 63583 + }, + { + "epoch": 1.63, + "learning_rate": 9.087041226164489e-07, + "loss": 0.7979, + "step": 63584 + }, + { + "epoch": 1.63, + "learning_rate": 9.086765677545485e-07, + "loss": 0.6543, + "step": 63585 + }, + { + "epoch": 1.63, + "learning_rate": 9.086490129625705e-07, + "loss": 0.5566, + "step": 63586 + }, + { + "epoch": 1.63, + "learning_rate": 9.086214582405355e-07, + "loss": 0.7373, + "step": 63587 + }, + { + "epoch": 1.63, + "learning_rate": 9.08593903588465e-07, + "loss": 0.5405, + "step": 63588 + }, + { + "epoch": 1.63, + "learning_rate": 9.085663490063797e-07, + "loss": 0.7754, + "step": 63589 + }, + { + "epoch": 1.63, + "learning_rate": 9.085387944943013e-07, + "loss": 0.5991, + "step": 63590 + }, + { + "epoch": 1.63, + "learning_rate": 9.085112400522504e-07, + "loss": 0.7441, + "step": 63591 + }, + { + "epoch": 1.63, + "learning_rate": 9.084836856802482e-07, + "loss": 0.6396, + "step": 63592 + }, + { + "epoch": 1.63, + "learning_rate": 9.084561313783157e-07, + "loss": 0.4316, + "step": 63593 + }, + { + "epoch": 1.63, + "learning_rate": 9.084285771464748e-07, + "loss": 0.5278, + "step": 63594 + }, + { + "epoch": 1.63, + "learning_rate": 9.084010229847453e-07, + "loss": 0.6699, + "step": 63595 + }, + { + "epoch": 1.63, + "learning_rate": 9.083734688931492e-07, + "loss": 0.8525, + "step": 63596 + }, + { + "epoch": 1.63, + "learning_rate": 9.08345914871707e-07, + "loss": 0.6313, + "step": 63597 + }, + { + "epoch": 1.63, + "learning_rate": 9.083183609204404e-07, + "loss": 0.6494, + "step": 63598 + }, + { + "epoch": 1.63, + "learning_rate": 9.082908070393699e-07, + "loss": 0.7109, + "step": 63599 + }, + { + "epoch": 1.63, + "learning_rate": 9.082632532285173e-07, + "loss": 0.6421, + "step": 63600 + }, + { + "epoch": 1.63, + "learning_rate": 9.082356994879029e-07, + "loss": 0.4519, + "step": 63601 + }, + { + "epoch": 1.63, + "learning_rate": 9.082081458175485e-07, + "loss": 0.5977, + "step": 63602 + }, + { + "epoch": 1.63, + "learning_rate": 9.081805922174747e-07, + "loss": 0.4744, + "step": 63603 + }, + { + "epoch": 1.63, + "learning_rate": 9.081530386877032e-07, + "loss": 0.6533, + "step": 63604 + }, + { + "epoch": 1.63, + "learning_rate": 9.081254852282546e-07, + "loss": 0.4424, + "step": 63605 + }, + { + "epoch": 1.63, + "learning_rate": 9.080979318391498e-07, + "loss": 0.627, + "step": 63606 + }, + { + "epoch": 1.63, + "learning_rate": 9.080703785204103e-07, + "loss": 0.7627, + "step": 63607 + }, + { + "epoch": 1.63, + "learning_rate": 9.08042825272057e-07, + "loss": 0.6174, + "step": 63608 + }, + { + "epoch": 1.63, + "learning_rate": 9.080152720941112e-07, + "loss": 0.6729, + "step": 63609 + }, + { + "epoch": 1.63, + "learning_rate": 9.079877189865937e-07, + "loss": 0.5878, + "step": 63610 + }, + { + "epoch": 1.63, + "learning_rate": 9.079601659495261e-07, + "loss": 0.6836, + "step": 63611 + }, + { + "epoch": 1.63, + "learning_rate": 9.079326129829287e-07, + "loss": 0.7471, + "step": 63612 + }, + { + "epoch": 1.63, + "learning_rate": 9.079050600868236e-07, + "loss": 0.666, + "step": 63613 + }, + { + "epoch": 1.63, + "learning_rate": 9.078775072612314e-07, + "loss": 0.6309, + "step": 63614 + }, + { + "epoch": 1.63, + "learning_rate": 9.078499545061729e-07, + "loss": 0.7744, + "step": 63615 + }, + { + "epoch": 1.63, + "learning_rate": 9.078224018216692e-07, + "loss": 0.6479, + "step": 63616 + }, + { + "epoch": 1.63, + "learning_rate": 9.077948492077421e-07, + "loss": 0.6914, + "step": 63617 + }, + { + "epoch": 1.63, + "learning_rate": 9.077672966644119e-07, + "loss": 0.6172, + "step": 63618 + }, + { + "epoch": 1.63, + "learning_rate": 9.077397441917002e-07, + "loss": 0.8525, + "step": 63619 + }, + { + "epoch": 1.63, + "learning_rate": 9.077121917896278e-07, + "loss": 0.5234, + "step": 63620 + }, + { + "epoch": 1.63, + "learning_rate": 9.07684639458216e-07, + "loss": 0.5488, + "step": 63621 + }, + { + "epoch": 1.63, + "learning_rate": 9.076570871974858e-07, + "loss": 0.7246, + "step": 63622 + }, + { + "epoch": 1.63, + "learning_rate": 9.076295350074584e-07, + "loss": 0.5869, + "step": 63623 + }, + { + "epoch": 1.63, + "learning_rate": 9.076019828881551e-07, + "loss": 0.6324, + "step": 63624 + }, + { + "epoch": 1.63, + "learning_rate": 9.075744308395963e-07, + "loss": 0.6357, + "step": 63625 + }, + { + "epoch": 1.63, + "learning_rate": 9.075468788618037e-07, + "loss": 0.4751, + "step": 63626 + }, + { + "epoch": 1.63, + "learning_rate": 9.075193269547979e-07, + "loss": 0.6133, + "step": 63627 + }, + { + "epoch": 1.63, + "learning_rate": 9.074917751186006e-07, + "loss": 0.6846, + "step": 63628 + }, + { + "epoch": 1.63, + "learning_rate": 9.074642233532323e-07, + "loss": 0.7275, + "step": 63629 + }, + { + "epoch": 1.63, + "learning_rate": 9.074366716587148e-07, + "loss": 0.7622, + "step": 63630 + }, + { + "epoch": 1.63, + "learning_rate": 9.074091200350687e-07, + "loss": 0.7393, + "step": 63631 + }, + { + "epoch": 1.63, + "learning_rate": 9.073815684823149e-07, + "loss": 0.5361, + "step": 63632 + }, + { + "epoch": 1.63, + "learning_rate": 9.07354017000475e-07, + "loss": 0.6558, + "step": 63633 + }, + { + "epoch": 1.63, + "learning_rate": 9.0732646558957e-07, + "loss": 0.709, + "step": 63634 + }, + { + "epoch": 1.63, + "learning_rate": 9.072989142496206e-07, + "loss": 0.6543, + "step": 63635 + }, + { + "epoch": 1.63, + "learning_rate": 9.072713629806483e-07, + "loss": 0.6729, + "step": 63636 + }, + { + "epoch": 1.63, + "learning_rate": 9.072438117826739e-07, + "loss": 0.6504, + "step": 63637 + }, + { + "epoch": 1.63, + "learning_rate": 9.072162606557188e-07, + "loss": 0.426, + "step": 63638 + }, + { + "epoch": 1.63, + "learning_rate": 9.071887095998037e-07, + "loss": 0.6426, + "step": 63639 + }, + { + "epoch": 1.63, + "learning_rate": 9.071611586149503e-07, + "loss": 0.4778, + "step": 63640 + }, + { + "epoch": 1.63, + "learning_rate": 9.071336077011789e-07, + "loss": 0.6567, + "step": 63641 + }, + { + "epoch": 1.63, + "learning_rate": 9.071060568585114e-07, + "loss": 0.7056, + "step": 63642 + }, + { + "epoch": 1.63, + "learning_rate": 9.070785060869682e-07, + "loss": 0.7744, + "step": 63643 + }, + { + "epoch": 1.63, + "learning_rate": 9.070509553865713e-07, + "loss": 0.5459, + "step": 63644 + }, + { + "epoch": 1.63, + "learning_rate": 9.070234047573409e-07, + "loss": 0.7285, + "step": 63645 + }, + { + "epoch": 1.63, + "learning_rate": 9.069958541992981e-07, + "loss": 0.5336, + "step": 63646 + }, + { + "epoch": 1.63, + "learning_rate": 9.069683037124646e-07, + "loss": 0.79, + "step": 63647 + }, + { + "epoch": 1.63, + "learning_rate": 9.069407532968612e-07, + "loss": 0.7871, + "step": 63648 + }, + { + "epoch": 1.63, + "learning_rate": 9.069132029525088e-07, + "loss": 0.521, + "step": 63649 + }, + { + "epoch": 1.63, + "learning_rate": 9.068856526794288e-07, + "loss": 0.6611, + "step": 63650 + }, + { + "epoch": 1.63, + "learning_rate": 9.068581024776421e-07, + "loss": 0.7817, + "step": 63651 + }, + { + "epoch": 1.63, + "learning_rate": 9.0683055234717e-07, + "loss": 0.7637, + "step": 63652 + }, + { + "epoch": 1.63, + "learning_rate": 9.068030022880332e-07, + "loss": 0.4767, + "step": 63653 + }, + { + "epoch": 1.63, + "learning_rate": 9.067754523002535e-07, + "loss": 0.6196, + "step": 63654 + }, + { + "epoch": 1.63, + "learning_rate": 9.067479023838514e-07, + "loss": 0.7783, + "step": 63655 + }, + { + "epoch": 1.63, + "learning_rate": 9.067203525388478e-07, + "loss": 0.4922, + "step": 63656 + }, + { + "epoch": 1.63, + "learning_rate": 9.066928027652645e-07, + "loss": 0.4611, + "step": 63657 + }, + { + "epoch": 1.63, + "learning_rate": 9.06665253063122e-07, + "loss": 0.6729, + "step": 63658 + }, + { + "epoch": 1.63, + "learning_rate": 9.066377034324418e-07, + "loss": 0.5918, + "step": 63659 + }, + { + "epoch": 1.63, + "learning_rate": 9.066101538732446e-07, + "loss": 0.8525, + "step": 63660 + }, + { + "epoch": 1.63, + "learning_rate": 9.065826043855519e-07, + "loss": 0.6592, + "step": 63661 + }, + { + "epoch": 1.63, + "learning_rate": 9.065550549693845e-07, + "loss": 0.707, + "step": 63662 + }, + { + "epoch": 1.63, + "learning_rate": 9.065275056247636e-07, + "loss": 0.5781, + "step": 63663 + }, + { + "epoch": 1.63, + "learning_rate": 9.064999563517107e-07, + "loss": 0.7285, + "step": 63664 + }, + { + "epoch": 1.63, + "learning_rate": 9.06472407150246e-07, + "loss": 0.5989, + "step": 63665 + }, + { + "epoch": 1.63, + "learning_rate": 9.064448580203913e-07, + "loss": 0.5488, + "step": 63666 + }, + { + "epoch": 1.63, + "learning_rate": 9.064173089621674e-07, + "loss": 0.6709, + "step": 63667 + }, + { + "epoch": 1.63, + "learning_rate": 9.063897599755953e-07, + "loss": 0.6504, + "step": 63668 + }, + { + "epoch": 1.63, + "learning_rate": 9.063622110606965e-07, + "loss": 0.626, + "step": 63669 + }, + { + "epoch": 1.63, + "learning_rate": 9.063346622174917e-07, + "loss": 0.6089, + "step": 63670 + }, + { + "epoch": 1.63, + "learning_rate": 9.063071134460022e-07, + "loss": 0.6943, + "step": 63671 + }, + { + "epoch": 1.63, + "learning_rate": 9.062795647462489e-07, + "loss": 0.6631, + "step": 63672 + }, + { + "epoch": 1.63, + "learning_rate": 9.062520161182532e-07, + "loss": 0.5422, + "step": 63673 + }, + { + "epoch": 1.63, + "learning_rate": 9.062244675620362e-07, + "loss": 0.7529, + "step": 63674 + }, + { + "epoch": 1.63, + "learning_rate": 9.061969190776185e-07, + "loss": 0.7178, + "step": 63675 + }, + { + "epoch": 1.63, + "learning_rate": 9.061693706650216e-07, + "loss": 0.6064, + "step": 63676 + }, + { + "epoch": 1.63, + "learning_rate": 9.061418223242664e-07, + "loss": 0.7715, + "step": 63677 + }, + { + "epoch": 1.63, + "learning_rate": 9.061142740553742e-07, + "loss": 0.6367, + "step": 63678 + }, + { + "epoch": 1.63, + "learning_rate": 9.060867258583658e-07, + "loss": 0.6367, + "step": 63679 + }, + { + "epoch": 1.63, + "learning_rate": 9.060591777332628e-07, + "loss": 0.6221, + "step": 63680 + }, + { + "epoch": 1.63, + "learning_rate": 9.060316296800858e-07, + "loss": 0.8096, + "step": 63681 + }, + { + "epoch": 1.63, + "learning_rate": 9.06004081698856e-07, + "loss": 0.5537, + "step": 63682 + }, + { + "epoch": 1.63, + "learning_rate": 9.059765337895945e-07, + "loss": 0.7656, + "step": 63683 + }, + { + "epoch": 1.63, + "learning_rate": 9.059489859523231e-07, + "loss": 0.8555, + "step": 63684 + }, + { + "epoch": 1.63, + "learning_rate": 9.059214381870615e-07, + "loss": 0.5864, + "step": 63685 + }, + { + "epoch": 1.63, + "learning_rate": 9.058938904938319e-07, + "loss": 0.6187, + "step": 63686 + }, + { + "epoch": 1.63, + "learning_rate": 9.058663428726547e-07, + "loss": 0.5947, + "step": 63687 + }, + { + "epoch": 1.63, + "learning_rate": 9.058387953235515e-07, + "loss": 0.623, + "step": 63688 + }, + { + "epoch": 1.63, + "learning_rate": 9.05811247846543e-07, + "loss": 0.6436, + "step": 63689 + }, + { + "epoch": 1.63, + "learning_rate": 9.057837004416507e-07, + "loss": 0.6826, + "step": 63690 + }, + { + "epoch": 1.63, + "learning_rate": 9.057561531088955e-07, + "loss": 0.5107, + "step": 63691 + }, + { + "epoch": 1.63, + "learning_rate": 9.057286058482985e-07, + "loss": 0.6487, + "step": 63692 + }, + { + "epoch": 1.63, + "learning_rate": 9.057010586598805e-07, + "loss": 0.666, + "step": 63693 + }, + { + "epoch": 1.63, + "learning_rate": 9.056735115436633e-07, + "loss": 0.5491, + "step": 63694 + }, + { + "epoch": 1.63, + "learning_rate": 9.056459644996674e-07, + "loss": 0.6885, + "step": 63695 + }, + { + "epoch": 1.63, + "learning_rate": 9.056184175279139e-07, + "loss": 0.5332, + "step": 63696 + }, + { + "epoch": 1.63, + "learning_rate": 9.055908706284242e-07, + "loss": 0.7437, + "step": 63697 + }, + { + "epoch": 1.63, + "learning_rate": 9.055633238012191e-07, + "loss": 0.5122, + "step": 63698 + }, + { + "epoch": 1.63, + "learning_rate": 9.055357770463198e-07, + "loss": 0.6489, + "step": 63699 + }, + { + "epoch": 1.63, + "learning_rate": 9.055082303637473e-07, + "loss": 0.7812, + "step": 63700 + }, + { + "epoch": 1.63, + "learning_rate": 9.054806837535231e-07, + "loss": 0.6279, + "step": 63701 + }, + { + "epoch": 1.63, + "learning_rate": 9.054531372156677e-07, + "loss": 0.4487, + "step": 63702 + }, + { + "epoch": 1.63, + "learning_rate": 9.054255907502027e-07, + "loss": 0.5356, + "step": 63703 + }, + { + "epoch": 1.63, + "learning_rate": 9.053980443571493e-07, + "loss": 0.6543, + "step": 63704 + }, + { + "epoch": 1.63, + "learning_rate": 9.053704980365279e-07, + "loss": 0.6494, + "step": 63705 + }, + { + "epoch": 1.63, + "learning_rate": 9.053429517883598e-07, + "loss": 0.5447, + "step": 63706 + }, + { + "epoch": 1.63, + "learning_rate": 9.053154056126666e-07, + "loss": 0.7441, + "step": 63707 + }, + { + "epoch": 1.63, + "learning_rate": 9.052878595094687e-07, + "loss": 0.7861, + "step": 63708 + }, + { + "epoch": 1.63, + "learning_rate": 9.052603134787878e-07, + "loss": 0.6216, + "step": 63709 + }, + { + "epoch": 1.63, + "learning_rate": 9.052327675206444e-07, + "loss": 0.7031, + "step": 63710 + }, + { + "epoch": 1.63, + "learning_rate": 9.052052216350602e-07, + "loss": 0.4858, + "step": 63711 + }, + { + "epoch": 1.63, + "learning_rate": 9.051776758220557e-07, + "loss": 0.748, + "step": 63712 + }, + { + "epoch": 1.63, + "learning_rate": 9.051501300816527e-07, + "loss": 0.4192, + "step": 63713 + }, + { + "epoch": 1.63, + "learning_rate": 9.051225844138719e-07, + "loss": 0.478, + "step": 63714 + }, + { + "epoch": 1.63, + "learning_rate": 9.05095038818734e-07, + "loss": 0.8457, + "step": 63715 + }, + { + "epoch": 1.63, + "learning_rate": 9.050674932962607e-07, + "loss": 0.5327, + "step": 63716 + }, + { + "epoch": 1.63, + "learning_rate": 9.050399478464727e-07, + "loss": 0.666, + "step": 63717 + }, + { + "epoch": 1.63, + "learning_rate": 9.050124024693915e-07, + "loss": 0.7812, + "step": 63718 + }, + { + "epoch": 1.63, + "learning_rate": 9.049848571650376e-07, + "loss": 0.6943, + "step": 63719 + }, + { + "epoch": 1.63, + "learning_rate": 9.049573119334326e-07, + "loss": 0.7031, + "step": 63720 + }, + { + "epoch": 1.63, + "learning_rate": 9.049297667745975e-07, + "loss": 0.5212, + "step": 63721 + }, + { + "epoch": 1.63, + "learning_rate": 9.049022216885531e-07, + "loss": 0.6328, + "step": 63722 + }, + { + "epoch": 1.63, + "learning_rate": 9.048746766753209e-07, + "loss": 0.5703, + "step": 63723 + }, + { + "epoch": 1.63, + "learning_rate": 9.04847131734922e-07, + "loss": 0.5627, + "step": 63724 + }, + { + "epoch": 1.63, + "learning_rate": 9.048195868673768e-07, + "loss": 0.4658, + "step": 63725 + }, + { + "epoch": 1.63, + "learning_rate": 9.047920420727071e-07, + "loss": 0.666, + "step": 63726 + }, + { + "epoch": 1.63, + "learning_rate": 9.047644973509337e-07, + "loss": 0.3472, + "step": 63727 + }, + { + "epoch": 1.63, + "learning_rate": 9.047369527020778e-07, + "loss": 0.7822, + "step": 63728 + }, + { + "epoch": 1.63, + "learning_rate": 9.047094081261602e-07, + "loss": 0.7363, + "step": 63729 + }, + { + "epoch": 1.63, + "learning_rate": 9.046818636232024e-07, + "loss": 0.6377, + "step": 63730 + }, + { + "epoch": 1.63, + "learning_rate": 9.046543191932252e-07, + "loss": 0.6167, + "step": 63731 + }, + { + "epoch": 1.63, + "learning_rate": 9.0462677483625e-07, + "loss": 0.6602, + "step": 63732 + }, + { + "epoch": 1.63, + "learning_rate": 9.045992305522975e-07, + "loss": 0.6201, + "step": 63733 + }, + { + "epoch": 1.63, + "learning_rate": 9.045716863413894e-07, + "loss": 0.6274, + "step": 63734 + }, + { + "epoch": 1.63, + "learning_rate": 9.045441422035462e-07, + "loss": 0.5591, + "step": 63735 + }, + { + "epoch": 1.63, + "learning_rate": 9.045165981387887e-07, + "loss": 0.6309, + "step": 63736 + }, + { + "epoch": 1.63, + "learning_rate": 9.044890541471389e-07, + "loss": 0.6904, + "step": 63737 + }, + { + "epoch": 1.63, + "learning_rate": 9.044615102286175e-07, + "loss": 0.6738, + "step": 63738 + }, + { + "epoch": 1.63, + "learning_rate": 9.044339663832452e-07, + "loss": 0.8018, + "step": 63739 + }, + { + "epoch": 1.63, + "learning_rate": 9.044064226110436e-07, + "loss": 0.6079, + "step": 63740 + }, + { + "epoch": 1.63, + "learning_rate": 9.043788789120334e-07, + "loss": 0.5459, + "step": 63741 + }, + { + "epoch": 1.63, + "learning_rate": 9.043513352862362e-07, + "loss": 0.6704, + "step": 63742 + }, + { + "epoch": 1.63, + "learning_rate": 9.043237917336725e-07, + "loss": 0.5972, + "step": 63743 + }, + { + "epoch": 1.63, + "learning_rate": 9.042962482543641e-07, + "loss": 0.5538, + "step": 63744 + }, + { + "epoch": 1.63, + "learning_rate": 9.042687048483315e-07, + "loss": 0.6719, + "step": 63745 + }, + { + "epoch": 1.63, + "learning_rate": 9.042411615155957e-07, + "loss": 0.667, + "step": 63746 + }, + { + "epoch": 1.63, + "learning_rate": 9.042136182561782e-07, + "loss": 0.6011, + "step": 63747 + }, + { + "epoch": 1.63, + "learning_rate": 9.041860750700998e-07, + "loss": 0.446, + "step": 63748 + }, + { + "epoch": 1.63, + "learning_rate": 9.04158531957382e-07, + "loss": 0.5063, + "step": 63749 + }, + { + "epoch": 1.63, + "learning_rate": 9.041309889180451e-07, + "loss": 0.8076, + "step": 63750 + }, + { + "epoch": 1.63, + "learning_rate": 9.041034459521111e-07, + "loss": 0.5957, + "step": 63751 + }, + { + "epoch": 1.63, + "learning_rate": 9.040759030596006e-07, + "loss": 0.6237, + "step": 63752 + }, + { + "epoch": 1.63, + "learning_rate": 9.040483602405347e-07, + "loss": 0.7173, + "step": 63753 + }, + { + "epoch": 1.63, + "learning_rate": 9.04020817494935e-07, + "loss": 0.5112, + "step": 63754 + }, + { + "epoch": 1.63, + "learning_rate": 9.039932748228216e-07, + "loss": 0.6797, + "step": 63755 + }, + { + "epoch": 1.63, + "learning_rate": 9.039657322242164e-07, + "loss": 0.5942, + "step": 63756 + }, + { + "epoch": 1.63, + "learning_rate": 9.039381896991402e-07, + "loss": 0.6914, + "step": 63757 + }, + { + "epoch": 1.63, + "learning_rate": 9.03910647247614e-07, + "loss": 0.6084, + "step": 63758 + }, + { + "epoch": 1.63, + "learning_rate": 9.038831048696592e-07, + "loss": 0.667, + "step": 63759 + }, + { + "epoch": 1.63, + "learning_rate": 9.038555625652962e-07, + "loss": 0.427, + "step": 63760 + }, + { + "epoch": 1.63, + "learning_rate": 9.038280203345471e-07, + "loss": 0.5708, + "step": 63761 + }, + { + "epoch": 1.63, + "learning_rate": 9.038004781774321e-07, + "loss": 0.728, + "step": 63762 + }, + { + "epoch": 1.63, + "learning_rate": 9.037729360939729e-07, + "loss": 0.7344, + "step": 63763 + }, + { + "epoch": 1.63, + "learning_rate": 9.037453940841906e-07, + "loss": 0.5962, + "step": 63764 + }, + { + "epoch": 1.63, + "learning_rate": 9.037178521481055e-07, + "loss": 0.7949, + "step": 63765 + }, + { + "epoch": 1.63, + "learning_rate": 9.036903102857395e-07, + "loss": 0.6768, + "step": 63766 + }, + { + "epoch": 1.63, + "learning_rate": 9.036627684971132e-07, + "loss": 0.5679, + "step": 63767 + }, + { + "epoch": 1.63, + "learning_rate": 9.036352267822481e-07, + "loss": 0.5454, + "step": 63768 + }, + { + "epoch": 1.63, + "learning_rate": 9.036076851411647e-07, + "loss": 0.5884, + "step": 63769 + }, + { + "epoch": 1.63, + "learning_rate": 9.035801435738848e-07, + "loss": 0.6582, + "step": 63770 + }, + { + "epoch": 1.63, + "learning_rate": 9.03552602080429e-07, + "loss": 0.6436, + "step": 63771 + }, + { + "epoch": 1.63, + "learning_rate": 9.035250606608186e-07, + "loss": 0.5815, + "step": 63772 + }, + { + "epoch": 1.63, + "learning_rate": 9.034975193150746e-07, + "loss": 0.4535, + "step": 63773 + }, + { + "epoch": 1.63, + "learning_rate": 9.034699780432186e-07, + "loss": 0.7441, + "step": 63774 + }, + { + "epoch": 1.63, + "learning_rate": 9.034424368452707e-07, + "loss": 0.5923, + "step": 63775 + }, + { + "epoch": 1.63, + "learning_rate": 9.034148957212526e-07, + "loss": 0.7266, + "step": 63776 + }, + { + "epoch": 1.63, + "learning_rate": 9.03387354671185e-07, + "loss": 0.5205, + "step": 63777 + }, + { + "epoch": 1.63, + "learning_rate": 9.033598136950897e-07, + "loss": 0.71, + "step": 63778 + }, + { + "epoch": 1.63, + "learning_rate": 9.033322727929868e-07, + "loss": 0.7617, + "step": 63779 + }, + { + "epoch": 1.63, + "learning_rate": 9.033047319648984e-07, + "loss": 0.5615, + "step": 63780 + }, + { + "epoch": 1.63, + "learning_rate": 9.032771912108448e-07, + "loss": 0.623, + "step": 63781 + }, + { + "epoch": 1.63, + "learning_rate": 9.032496505308477e-07, + "loss": 0.6431, + "step": 63782 + }, + { + "epoch": 1.63, + "learning_rate": 9.032221099249276e-07, + "loss": 0.4873, + "step": 63783 + }, + { + "epoch": 1.63, + "learning_rate": 9.031945693931064e-07, + "loss": 0.6226, + "step": 63784 + }, + { + "epoch": 1.63, + "learning_rate": 9.031670289354044e-07, + "loss": 0.6641, + "step": 63785 + }, + { + "epoch": 1.63, + "learning_rate": 9.031394885518428e-07, + "loss": 0.7158, + "step": 63786 + }, + { + "epoch": 1.63, + "learning_rate": 9.03111948242443e-07, + "loss": 0.5234, + "step": 63787 + }, + { + "epoch": 1.63, + "learning_rate": 9.030844080072257e-07, + "loss": 0.6006, + "step": 63788 + }, + { + "epoch": 1.63, + "learning_rate": 9.030568678462124e-07, + "loss": 0.563, + "step": 63789 + }, + { + "epoch": 1.63, + "learning_rate": 9.030293277594237e-07, + "loss": 0.7695, + "step": 63790 + }, + { + "epoch": 1.63, + "learning_rate": 9.030017877468814e-07, + "loss": 0.6914, + "step": 63791 + }, + { + "epoch": 1.64, + "learning_rate": 9.029742478086059e-07, + "loss": 0.6816, + "step": 63792 + }, + { + "epoch": 1.64, + "learning_rate": 9.029467079446186e-07, + "loss": 0.6172, + "step": 63793 + }, + { + "epoch": 1.64, + "learning_rate": 9.02919168154941e-07, + "loss": 0.707, + "step": 63794 + }, + { + "epoch": 1.64, + "learning_rate": 9.028916284395935e-07, + "loss": 0.7188, + "step": 63795 + }, + { + "epoch": 1.64, + "learning_rate": 9.02864088798597e-07, + "loss": 0.7998, + "step": 63796 + }, + { + "epoch": 1.64, + "learning_rate": 9.028365492319734e-07, + "loss": 0.5599, + "step": 63797 + }, + { + "epoch": 1.64, + "learning_rate": 9.02809009739743e-07, + "loss": 0.45, + "step": 63798 + }, + { + "epoch": 1.64, + "learning_rate": 9.027814703219277e-07, + "loss": 0.7871, + "step": 63799 + }, + { + "epoch": 1.64, + "learning_rate": 9.027539309785478e-07, + "loss": 0.7646, + "step": 63800 + }, + { + "epoch": 1.64, + "learning_rate": 9.027263917096249e-07, + "loss": 0.5845, + "step": 63801 + }, + { + "epoch": 1.64, + "learning_rate": 9.026988525151799e-07, + "loss": 0.7861, + "step": 63802 + }, + { + "epoch": 1.64, + "learning_rate": 9.026713133952339e-07, + "loss": 0.7705, + "step": 63803 + }, + { + "epoch": 1.64, + "learning_rate": 9.026437743498084e-07, + "loss": 0.6523, + "step": 63804 + }, + { + "epoch": 1.64, + "learning_rate": 9.026162353789236e-07, + "loss": 0.6035, + "step": 63805 + }, + { + "epoch": 1.64, + "learning_rate": 9.025886964826014e-07, + "loss": 0.5809, + "step": 63806 + }, + { + "epoch": 1.64, + "learning_rate": 9.025611576608622e-07, + "loss": 0.5859, + "step": 63807 + }, + { + "epoch": 1.64, + "learning_rate": 9.025336189137277e-07, + "loss": 0.8203, + "step": 63808 + }, + { + "epoch": 1.64, + "learning_rate": 9.025060802412184e-07, + "loss": 0.7422, + "step": 63809 + }, + { + "epoch": 1.64, + "learning_rate": 9.024785416433562e-07, + "loss": 0.5503, + "step": 63810 + }, + { + "epoch": 1.64, + "learning_rate": 9.024510031201614e-07, + "loss": 0.6787, + "step": 63811 + }, + { + "epoch": 1.64, + "learning_rate": 9.024234646716553e-07, + "loss": 0.5605, + "step": 63812 + }, + { + "epoch": 1.64, + "learning_rate": 9.023959262978593e-07, + "loss": 0.5737, + "step": 63813 + }, + { + "epoch": 1.64, + "learning_rate": 9.023683879987945e-07, + "loss": 0.7773, + "step": 63814 + }, + { + "epoch": 1.64, + "learning_rate": 9.023408497744813e-07, + "loss": 0.644, + "step": 63815 + }, + { + "epoch": 1.64, + "learning_rate": 9.023133116249413e-07, + "loss": 0.8066, + "step": 63816 + }, + { + "epoch": 1.64, + "learning_rate": 9.022857735501953e-07, + "loss": 0.7021, + "step": 63817 + }, + { + "epoch": 1.64, + "learning_rate": 9.022582355502649e-07, + "loss": 0.6091, + "step": 63818 + }, + { + "epoch": 1.64, + "learning_rate": 9.022306976251705e-07, + "loss": 0.6855, + "step": 63819 + }, + { + "epoch": 1.64, + "learning_rate": 9.02203159774934e-07, + "loss": 0.6265, + "step": 63820 + }, + { + "epoch": 1.64, + "learning_rate": 9.021756219995757e-07, + "loss": 0.6504, + "step": 63821 + }, + { + "epoch": 1.64, + "learning_rate": 9.021480842991174e-07, + "loss": 0.7217, + "step": 63822 + }, + { + "epoch": 1.64, + "learning_rate": 9.021205466735794e-07, + "loss": 0.6279, + "step": 63823 + }, + { + "epoch": 1.64, + "learning_rate": 9.020930091229837e-07, + "loss": 0.6611, + "step": 63824 + }, + { + "epoch": 1.64, + "learning_rate": 9.020654716473507e-07, + "loss": 0.6069, + "step": 63825 + }, + { + "epoch": 1.64, + "learning_rate": 9.020379342467014e-07, + "loss": 0.7598, + "step": 63826 + }, + { + "epoch": 1.64, + "learning_rate": 9.020103969210574e-07, + "loss": 0.5703, + "step": 63827 + }, + { + "epoch": 1.64, + "learning_rate": 9.019828596704393e-07, + "loss": 0.6221, + "step": 63828 + }, + { + "epoch": 1.64, + "learning_rate": 9.019553224948687e-07, + "loss": 0.7285, + "step": 63829 + }, + { + "epoch": 1.64, + "learning_rate": 9.019277853943664e-07, + "loss": 0.7627, + "step": 63830 + }, + { + "epoch": 1.64, + "learning_rate": 9.019002483689531e-07, + "loss": 0.6641, + "step": 63831 + }, + { + "epoch": 1.64, + "learning_rate": 9.018727114186506e-07, + "loss": 0.7617, + "step": 63832 + }, + { + "epoch": 1.64, + "learning_rate": 9.018451745434799e-07, + "loss": 0.6797, + "step": 63833 + }, + { + "epoch": 1.64, + "learning_rate": 9.018176377434613e-07, + "loss": 0.6226, + "step": 63834 + }, + { + "epoch": 1.64, + "learning_rate": 9.017901010186167e-07, + "loss": 0.5962, + "step": 63835 + }, + { + "epoch": 1.64, + "learning_rate": 9.017625643689667e-07, + "loss": 0.5962, + "step": 63836 + }, + { + "epoch": 1.64, + "learning_rate": 9.017350277945328e-07, + "loss": 0.6489, + "step": 63837 + }, + { + "epoch": 1.64, + "learning_rate": 9.017074912953357e-07, + "loss": 0.6943, + "step": 63838 + }, + { + "epoch": 1.64, + "learning_rate": 9.016799548713968e-07, + "loss": 0.6113, + "step": 63839 + }, + { + "epoch": 1.64, + "learning_rate": 9.016524185227368e-07, + "loss": 0.7598, + "step": 63840 + }, + { + "epoch": 1.64, + "learning_rate": 9.016248822493773e-07, + "loss": 0.665, + "step": 63841 + }, + { + "epoch": 1.64, + "learning_rate": 9.015973460513389e-07, + "loss": 0.6284, + "step": 63842 + }, + { + "epoch": 1.64, + "learning_rate": 9.015698099286432e-07, + "loss": 0.7939, + "step": 63843 + }, + { + "epoch": 1.64, + "learning_rate": 9.015422738813109e-07, + "loss": 0.6455, + "step": 63844 + }, + { + "epoch": 1.64, + "learning_rate": 9.015147379093629e-07, + "loss": 0.6797, + "step": 63845 + }, + { + "epoch": 1.64, + "learning_rate": 9.014872020128207e-07, + "loss": 0.637, + "step": 63846 + }, + { + "epoch": 1.64, + "learning_rate": 9.014596661917052e-07, + "loss": 0.5396, + "step": 63847 + }, + { + "epoch": 1.64, + "learning_rate": 9.014321304460374e-07, + "loss": 0.6484, + "step": 63848 + }, + { + "epoch": 1.64, + "learning_rate": 9.014045947758387e-07, + "loss": 0.6035, + "step": 63849 + }, + { + "epoch": 1.64, + "learning_rate": 9.013770591811296e-07, + "loss": 0.5537, + "step": 63850 + }, + { + "epoch": 1.64, + "learning_rate": 9.013495236619318e-07, + "loss": 0.6665, + "step": 63851 + }, + { + "epoch": 1.64, + "learning_rate": 9.01321988218266e-07, + "loss": 0.665, + "step": 63852 + }, + { + "epoch": 1.64, + "learning_rate": 9.012944528501538e-07, + "loss": 0.6162, + "step": 63853 + }, + { + "epoch": 1.64, + "learning_rate": 9.012669175576158e-07, + "loss": 0.9404, + "step": 63854 + }, + { + "epoch": 1.64, + "learning_rate": 9.012393823406728e-07, + "loss": 0.6621, + "step": 63855 + }, + { + "epoch": 1.64, + "learning_rate": 9.012118471993466e-07, + "loss": 0.5562, + "step": 63856 + }, + { + "epoch": 1.64, + "learning_rate": 9.011843121336577e-07, + "loss": 0.5503, + "step": 63857 + }, + { + "epoch": 1.64, + "learning_rate": 9.011567771436276e-07, + "loss": 0.4727, + "step": 63858 + }, + { + "epoch": 1.64, + "learning_rate": 9.01129242229277e-07, + "loss": 0.6187, + "step": 63859 + }, + { + "epoch": 1.64, + "learning_rate": 9.011017073906274e-07, + "loss": 0.6006, + "step": 63860 + }, + { + "epoch": 1.64, + "learning_rate": 9.010741726276994e-07, + "loss": 0.6436, + "step": 63861 + }, + { + "epoch": 1.64, + "learning_rate": 9.010466379405148e-07, + "loss": 0.6611, + "step": 63862 + }, + { + "epoch": 1.64, + "learning_rate": 9.010191033290943e-07, + "loss": 0.7578, + "step": 63863 + }, + { + "epoch": 1.64, + "learning_rate": 9.009915687934587e-07, + "loss": 0.6758, + "step": 63864 + }, + { + "epoch": 1.64, + "learning_rate": 9.009640343336291e-07, + "loss": 0.7939, + "step": 63865 + }, + { + "epoch": 1.64, + "learning_rate": 9.00936499949627e-07, + "loss": 0.5532, + "step": 63866 + }, + { + "epoch": 1.64, + "learning_rate": 9.009089656414731e-07, + "loss": 0.5952, + "step": 63867 + }, + { + "epoch": 1.64, + "learning_rate": 9.008814314091888e-07, + "loss": 0.6465, + "step": 63868 + }, + { + "epoch": 1.64, + "learning_rate": 9.008538972527948e-07, + "loss": 0.665, + "step": 63869 + }, + { + "epoch": 1.64, + "learning_rate": 9.008263631723128e-07, + "loss": 0.5276, + "step": 63870 + }, + { + "epoch": 1.64, + "learning_rate": 9.00798829167763e-07, + "loss": 0.5967, + "step": 63871 + }, + { + "epoch": 1.64, + "learning_rate": 9.007712952391673e-07, + "loss": 0.7051, + "step": 63872 + }, + { + "epoch": 1.64, + "learning_rate": 9.007437613865468e-07, + "loss": 0.5972, + "step": 63873 + }, + { + "epoch": 1.64, + "learning_rate": 9.007162276099218e-07, + "loss": 0.6846, + "step": 63874 + }, + { + "epoch": 1.64, + "learning_rate": 9.006886939093139e-07, + "loss": 0.5796, + "step": 63875 + }, + { + "epoch": 1.64, + "learning_rate": 9.006611602847439e-07, + "loss": 0.6035, + "step": 63876 + }, + { + "epoch": 1.64, + "learning_rate": 9.006336267362333e-07, + "loss": 0.5186, + "step": 63877 + }, + { + "epoch": 1.64, + "learning_rate": 9.006060932638029e-07, + "loss": 0.5596, + "step": 63878 + }, + { + "epoch": 1.64, + "learning_rate": 9.005785598674739e-07, + "loss": 0.5447, + "step": 63879 + }, + { + "epoch": 1.64, + "learning_rate": 9.005510265472672e-07, + "loss": 0.5308, + "step": 63880 + }, + { + "epoch": 1.64, + "learning_rate": 9.005234933032041e-07, + "loss": 0.6943, + "step": 63881 + }, + { + "epoch": 1.64, + "learning_rate": 9.004959601353055e-07, + "loss": 0.5474, + "step": 63882 + }, + { + "epoch": 1.64, + "learning_rate": 9.004684270435931e-07, + "loss": 0.5088, + "step": 63883 + }, + { + "epoch": 1.64, + "learning_rate": 9.004408940280869e-07, + "loss": 0.5674, + "step": 63884 + }, + { + "epoch": 1.64, + "learning_rate": 9.004133610888087e-07, + "loss": 0.6499, + "step": 63885 + }, + { + "epoch": 1.64, + "learning_rate": 9.003858282257791e-07, + "loss": 0.5171, + "step": 63886 + }, + { + "epoch": 1.64, + "learning_rate": 9.003582954390198e-07, + "loss": 0.3039, + "step": 63887 + }, + { + "epoch": 1.64, + "learning_rate": 9.003307627285514e-07, + "loss": 0.5312, + "step": 63888 + }, + { + "epoch": 1.64, + "learning_rate": 9.003032300943953e-07, + "loss": 0.6367, + "step": 63889 + }, + { + "epoch": 1.64, + "learning_rate": 9.002756975365723e-07, + "loss": 0.5566, + "step": 63890 + }, + { + "epoch": 1.64, + "learning_rate": 9.002481650551038e-07, + "loss": 0.6392, + "step": 63891 + }, + { + "epoch": 1.64, + "learning_rate": 9.002206326500105e-07, + "loss": 0.7275, + "step": 63892 + }, + { + "epoch": 1.64, + "learning_rate": 9.00193100321314e-07, + "loss": 0.7354, + "step": 63893 + }, + { + "epoch": 1.64, + "learning_rate": 9.001655680690349e-07, + "loss": 0.6743, + "step": 63894 + }, + { + "epoch": 1.64, + "learning_rate": 9.001380358931942e-07, + "loss": 0.6304, + "step": 63895 + }, + { + "epoch": 1.64, + "learning_rate": 9.001105037938135e-07, + "loss": 0.6245, + "step": 63896 + }, + { + "epoch": 1.64, + "learning_rate": 9.000829717709133e-07, + "loss": 0.8574, + "step": 63897 + }, + { + "epoch": 1.64, + "learning_rate": 9.000554398245152e-07, + "loss": 0.6406, + "step": 63898 + }, + { + "epoch": 1.64, + "learning_rate": 9.000279079546399e-07, + "loss": 0.7842, + "step": 63899 + }, + { + "epoch": 1.64, + "learning_rate": 9.000003761613088e-07, + "loss": 0.4658, + "step": 63900 + }, + { + "epoch": 1.64, + "learning_rate": 8.999728444445428e-07, + "loss": 0.5344, + "step": 63901 + }, + { + "epoch": 1.64, + "learning_rate": 8.999453128043628e-07, + "loss": 0.7422, + "step": 63902 + }, + { + "epoch": 1.64, + "learning_rate": 8.999177812407905e-07, + "loss": 0.5435, + "step": 63903 + }, + { + "epoch": 1.64, + "learning_rate": 8.998902497538463e-07, + "loss": 0.6914, + "step": 63904 + }, + { + "epoch": 1.64, + "learning_rate": 8.998627183435513e-07, + "loss": 0.7168, + "step": 63905 + }, + { + "epoch": 1.64, + "learning_rate": 8.998351870099271e-07, + "loss": 0.7236, + "step": 63906 + }, + { + "epoch": 1.64, + "learning_rate": 8.998076557529944e-07, + "loss": 0.5005, + "step": 63907 + }, + { + "epoch": 1.64, + "learning_rate": 8.997801245727743e-07, + "loss": 0.6982, + "step": 63908 + }, + { + "epoch": 1.64, + "learning_rate": 8.997525934692879e-07, + "loss": 0.5491, + "step": 63909 + }, + { + "epoch": 1.64, + "learning_rate": 8.997250624425565e-07, + "loss": 0.5903, + "step": 63910 + }, + { + "epoch": 1.64, + "learning_rate": 8.996975314926009e-07, + "loss": 0.5674, + "step": 63911 + }, + { + "epoch": 1.64, + "learning_rate": 8.996700006194425e-07, + "loss": 0.7031, + "step": 63912 + }, + { + "epoch": 1.64, + "learning_rate": 8.996424698231022e-07, + "loss": 0.626, + "step": 63913 + }, + { + "epoch": 1.64, + "learning_rate": 8.996149391036006e-07, + "loss": 0.5356, + "step": 63914 + }, + { + "epoch": 1.64, + "learning_rate": 8.995874084609596e-07, + "loss": 0.5581, + "step": 63915 + }, + { + "epoch": 1.64, + "learning_rate": 8.995598778951998e-07, + "loss": 0.6875, + "step": 63916 + }, + { + "epoch": 1.64, + "learning_rate": 8.995323474063423e-07, + "loss": 0.5723, + "step": 63917 + }, + { + "epoch": 1.64, + "learning_rate": 8.995048169944082e-07, + "loss": 0.4263, + "step": 63918 + }, + { + "epoch": 1.64, + "learning_rate": 8.994772866594189e-07, + "loss": 0.6509, + "step": 63919 + }, + { + "epoch": 1.64, + "learning_rate": 8.994497564013952e-07, + "loss": 0.6313, + "step": 63920 + }, + { + "epoch": 1.64, + "learning_rate": 8.994222262203579e-07, + "loss": 0.4771, + "step": 63921 + }, + { + "epoch": 1.64, + "learning_rate": 8.993946961163287e-07, + "loss": 0.647, + "step": 63922 + }, + { + "epoch": 1.64, + "learning_rate": 8.993671660893285e-07, + "loss": 0.6069, + "step": 63923 + }, + { + "epoch": 1.64, + "learning_rate": 8.993396361393778e-07, + "loss": 0.7505, + "step": 63924 + }, + { + "epoch": 1.64, + "learning_rate": 8.993121062664984e-07, + "loss": 0.5249, + "step": 63925 + }, + { + "epoch": 1.64, + "learning_rate": 8.992845764707108e-07, + "loss": 0.6436, + "step": 63926 + }, + { + "epoch": 1.64, + "learning_rate": 8.992570467520366e-07, + "loss": 0.5654, + "step": 63927 + }, + { + "epoch": 1.64, + "learning_rate": 8.992295171104963e-07, + "loss": 0.5493, + "step": 63928 + }, + { + "epoch": 1.64, + "learning_rate": 8.992019875461118e-07, + "loss": 0.5474, + "step": 63929 + }, + { + "epoch": 1.64, + "learning_rate": 8.991744580589033e-07, + "loss": 0.5715, + "step": 63930 + }, + { + "epoch": 1.64, + "learning_rate": 8.991469286488926e-07, + "loss": 0.6504, + "step": 63931 + }, + { + "epoch": 1.64, + "learning_rate": 8.991193993161002e-07, + "loss": 0.7217, + "step": 63932 + }, + { + "epoch": 1.64, + "learning_rate": 8.990918700605479e-07, + "loss": 0.8125, + "step": 63933 + }, + { + "epoch": 1.64, + "learning_rate": 8.99064340882256e-07, + "loss": 0.6333, + "step": 63934 + }, + { + "epoch": 1.64, + "learning_rate": 8.990368117812458e-07, + "loss": 0.6226, + "step": 63935 + }, + { + "epoch": 1.64, + "learning_rate": 8.990092827575386e-07, + "loss": 0.876, + "step": 63936 + }, + { + "epoch": 1.64, + "learning_rate": 8.989817538111554e-07, + "loss": 0.5942, + "step": 63937 + }, + { + "epoch": 1.64, + "learning_rate": 8.98954224942117e-07, + "loss": 0.7773, + "step": 63938 + }, + { + "epoch": 1.64, + "learning_rate": 8.98926696150445e-07, + "loss": 0.4991, + "step": 63939 + }, + { + "epoch": 1.64, + "learning_rate": 8.988991674361597e-07, + "loss": 0.5283, + "step": 63940 + }, + { + "epoch": 1.64, + "learning_rate": 8.988716387992832e-07, + "loss": 0.6343, + "step": 63941 + }, + { + "epoch": 1.64, + "learning_rate": 8.988441102398357e-07, + "loss": 0.6636, + "step": 63942 + }, + { + "epoch": 1.64, + "learning_rate": 8.988165817578389e-07, + "loss": 0.6313, + "step": 63943 + }, + { + "epoch": 1.64, + "learning_rate": 8.987890533533136e-07, + "loss": 0.5869, + "step": 63944 + }, + { + "epoch": 1.64, + "learning_rate": 8.987615250262804e-07, + "loss": 0.5586, + "step": 63945 + }, + { + "epoch": 1.64, + "learning_rate": 8.987339967767613e-07, + "loss": 0.5781, + "step": 63946 + }, + { + "epoch": 1.64, + "learning_rate": 8.987064686047766e-07, + "loss": 0.7852, + "step": 63947 + }, + { + "epoch": 1.64, + "learning_rate": 8.986789405103478e-07, + "loss": 0.416, + "step": 63948 + }, + { + "epoch": 1.64, + "learning_rate": 8.98651412493496e-07, + "loss": 0.6514, + "step": 63949 + }, + { + "epoch": 1.64, + "learning_rate": 8.986238845542421e-07, + "loss": 0.6572, + "step": 63950 + }, + { + "epoch": 1.64, + "learning_rate": 8.985963566926071e-07, + "loss": 0.5825, + "step": 63951 + }, + { + "epoch": 1.64, + "learning_rate": 8.985688289086124e-07, + "loss": 0.7168, + "step": 63952 + }, + { + "epoch": 1.64, + "learning_rate": 8.985413012022791e-07, + "loss": 0.5059, + "step": 63953 + }, + { + "epoch": 1.64, + "learning_rate": 8.985137735736278e-07, + "loss": 0.7246, + "step": 63954 + }, + { + "epoch": 1.64, + "learning_rate": 8.984862460226797e-07, + "loss": 0.5205, + "step": 63955 + }, + { + "epoch": 1.64, + "learning_rate": 8.984587185494561e-07, + "loss": 0.6182, + "step": 63956 + }, + { + "epoch": 1.64, + "learning_rate": 8.984311911539779e-07, + "loss": 0.5645, + "step": 63957 + }, + { + "epoch": 1.64, + "learning_rate": 8.984036638362664e-07, + "loss": 0.6206, + "step": 63958 + }, + { + "epoch": 1.64, + "learning_rate": 8.983761365963425e-07, + "loss": 0.5078, + "step": 63959 + }, + { + "epoch": 1.64, + "learning_rate": 8.983486094342273e-07, + "loss": 0.6982, + "step": 63960 + }, + { + "epoch": 1.64, + "learning_rate": 8.983210823499419e-07, + "loss": 0.6338, + "step": 63961 + }, + { + "epoch": 1.64, + "learning_rate": 8.982935553435074e-07, + "loss": 0.7295, + "step": 63962 + }, + { + "epoch": 1.64, + "learning_rate": 8.982660284149452e-07, + "loss": 0.8184, + "step": 63963 + }, + { + "epoch": 1.64, + "learning_rate": 8.982385015642755e-07, + "loss": 0.5718, + "step": 63964 + }, + { + "epoch": 1.64, + "learning_rate": 8.982109747915202e-07, + "loss": 0.5825, + "step": 63965 + }, + { + "epoch": 1.64, + "learning_rate": 8.981834480966997e-07, + "loss": 0.7061, + "step": 63966 + }, + { + "epoch": 1.64, + "learning_rate": 8.981559214798359e-07, + "loss": 0.6318, + "step": 63967 + }, + { + "epoch": 1.64, + "learning_rate": 8.98128394940949e-07, + "loss": 0.533, + "step": 63968 + }, + { + "epoch": 1.64, + "learning_rate": 8.981008684800608e-07, + "loss": 0.6655, + "step": 63969 + }, + { + "epoch": 1.64, + "learning_rate": 8.980733420971918e-07, + "loss": 0.5571, + "step": 63970 + }, + { + "epoch": 1.64, + "learning_rate": 8.980458157923638e-07, + "loss": 0.7246, + "step": 63971 + }, + { + "epoch": 1.64, + "learning_rate": 8.98018289565597e-07, + "loss": 0.7178, + "step": 63972 + }, + { + "epoch": 1.64, + "learning_rate": 8.979907634169137e-07, + "loss": 0.6777, + "step": 63973 + }, + { + "epoch": 1.64, + "learning_rate": 8.979632373463334e-07, + "loss": 0.6934, + "step": 63974 + }, + { + "epoch": 1.64, + "learning_rate": 8.979357113538783e-07, + "loss": 0.4824, + "step": 63975 + }, + { + "epoch": 1.64, + "learning_rate": 8.979081854395687e-07, + "loss": 0.6562, + "step": 63976 + }, + { + "epoch": 1.64, + "learning_rate": 8.978806596034265e-07, + "loss": 0.5078, + "step": 63977 + }, + { + "epoch": 1.64, + "learning_rate": 8.978531338454721e-07, + "loss": 0.5422, + "step": 63978 + }, + { + "epoch": 1.64, + "learning_rate": 8.978256081657271e-07, + "loss": 0.5895, + "step": 63979 + }, + { + "epoch": 1.64, + "learning_rate": 8.977980825642122e-07, + "loss": 0.7598, + "step": 63980 + }, + { + "epoch": 1.64, + "learning_rate": 8.977705570409487e-07, + "loss": 0.6758, + "step": 63981 + }, + { + "epoch": 1.64, + "learning_rate": 8.977430315959575e-07, + "loss": 0.3647, + "step": 63982 + }, + { + "epoch": 1.64, + "learning_rate": 8.977155062292601e-07, + "loss": 0.6128, + "step": 63983 + }, + { + "epoch": 1.64, + "learning_rate": 8.976879809408769e-07, + "loss": 0.6387, + "step": 63984 + }, + { + "epoch": 1.64, + "learning_rate": 8.976604557308293e-07, + "loss": 0.6353, + "step": 63985 + }, + { + "epoch": 1.64, + "learning_rate": 8.976329305991385e-07, + "loss": 0.6592, + "step": 63986 + }, + { + "epoch": 1.64, + "learning_rate": 8.976054055458253e-07, + "loss": 0.8291, + "step": 63987 + }, + { + "epoch": 1.64, + "learning_rate": 8.975778805709111e-07, + "loss": 0.5171, + "step": 63988 + }, + { + "epoch": 1.64, + "learning_rate": 8.975503556744166e-07, + "loss": 0.4854, + "step": 63989 + }, + { + "epoch": 1.64, + "learning_rate": 8.975228308563632e-07, + "loss": 0.6802, + "step": 63990 + }, + { + "epoch": 1.64, + "learning_rate": 8.974953061167721e-07, + "loss": 0.6953, + "step": 63991 + }, + { + "epoch": 1.64, + "learning_rate": 8.974677814556637e-07, + "loss": 0.6167, + "step": 63992 + }, + { + "epoch": 1.64, + "learning_rate": 8.9744025687306e-07, + "loss": 0.792, + "step": 63993 + }, + { + "epoch": 1.64, + "learning_rate": 8.974127323689814e-07, + "loss": 0.5854, + "step": 63994 + }, + { + "epoch": 1.64, + "learning_rate": 8.973852079434489e-07, + "loss": 0.5908, + "step": 63995 + }, + { + "epoch": 1.64, + "learning_rate": 8.97357683596484e-07, + "loss": 0.7305, + "step": 63996 + }, + { + "epoch": 1.64, + "learning_rate": 8.973301593281075e-07, + "loss": 0.6284, + "step": 63997 + }, + { + "epoch": 1.64, + "learning_rate": 8.973026351383407e-07, + "loss": 0.6572, + "step": 63998 + }, + { + "epoch": 1.64, + "learning_rate": 8.972751110272044e-07, + "loss": 0.6748, + "step": 63999 + }, + { + "epoch": 1.64, + "learning_rate": 8.972475869947199e-07, + "loss": 0.6167, + "step": 64000 + }, + { + "epoch": 1.64, + "learning_rate": 8.972200630409081e-07, + "loss": 0.3369, + "step": 64001 + }, + { + "epoch": 1.64, + "learning_rate": 8.971925391657904e-07, + "loss": 0.6929, + "step": 64002 + }, + { + "epoch": 1.64, + "learning_rate": 8.971650153693878e-07, + "loss": 0.647, + "step": 64003 + }, + { + "epoch": 1.64, + "learning_rate": 8.971374916517209e-07, + "loss": 0.5615, + "step": 64004 + }, + { + "epoch": 1.64, + "learning_rate": 8.971099680128113e-07, + "loss": 0.5139, + "step": 64005 + }, + { + "epoch": 1.64, + "learning_rate": 8.970824444526794e-07, + "loss": 0.6807, + "step": 64006 + }, + { + "epoch": 1.64, + "learning_rate": 8.970549209713471e-07, + "loss": 0.6763, + "step": 64007 + }, + { + "epoch": 1.64, + "learning_rate": 8.97027397568835e-07, + "loss": 0.7441, + "step": 64008 + }, + { + "epoch": 1.64, + "learning_rate": 8.969998742451645e-07, + "loss": 0.6377, + "step": 64009 + }, + { + "epoch": 1.64, + "learning_rate": 8.969723510003564e-07, + "loss": 0.626, + "step": 64010 + }, + { + "epoch": 1.64, + "learning_rate": 8.969448278344316e-07, + "loss": 0.5349, + "step": 64011 + }, + { + "epoch": 1.64, + "learning_rate": 8.969173047474116e-07, + "loss": 0.6553, + "step": 64012 + }, + { + "epoch": 1.64, + "learning_rate": 8.968897817393176e-07, + "loss": 0.5186, + "step": 64013 + }, + { + "epoch": 1.64, + "learning_rate": 8.968622588101699e-07, + "loss": 0.7119, + "step": 64014 + }, + { + "epoch": 1.64, + "learning_rate": 8.968347359599901e-07, + "loss": 0.6562, + "step": 64015 + }, + { + "epoch": 1.64, + "learning_rate": 8.968072131887991e-07, + "loss": 0.7881, + "step": 64016 + }, + { + "epoch": 1.64, + "learning_rate": 8.967796904966183e-07, + "loss": 0.6475, + "step": 64017 + }, + { + "epoch": 1.64, + "learning_rate": 8.967521678834683e-07, + "loss": 0.6299, + "step": 64018 + }, + { + "epoch": 1.64, + "learning_rate": 8.967246453493707e-07, + "loss": 0.6152, + "step": 64019 + }, + { + "epoch": 1.64, + "learning_rate": 8.966971228943458e-07, + "loss": 0.7607, + "step": 64020 + }, + { + "epoch": 1.64, + "learning_rate": 8.966696005184157e-07, + "loss": 0.4971, + "step": 64021 + }, + { + "epoch": 1.64, + "learning_rate": 8.966420782216006e-07, + "loss": 0.4658, + "step": 64022 + }, + { + "epoch": 1.64, + "learning_rate": 8.966145560039223e-07, + "loss": 0.624, + "step": 64023 + }, + { + "epoch": 1.64, + "learning_rate": 8.965870338654014e-07, + "loss": 0.4866, + "step": 64024 + }, + { + "epoch": 1.64, + "learning_rate": 8.965595118060587e-07, + "loss": 0.8252, + "step": 64025 + }, + { + "epoch": 1.64, + "learning_rate": 8.965319898259158e-07, + "loss": 0.7305, + "step": 64026 + }, + { + "epoch": 1.64, + "learning_rate": 8.965044679249938e-07, + "loss": 0.667, + "step": 64027 + }, + { + "epoch": 1.64, + "learning_rate": 8.964769461033133e-07, + "loss": 0.6377, + "step": 64028 + }, + { + "epoch": 1.64, + "learning_rate": 8.964494243608957e-07, + "loss": 0.6602, + "step": 64029 + }, + { + "epoch": 1.64, + "learning_rate": 8.964219026977619e-07, + "loss": 0.5317, + "step": 64030 + }, + { + "epoch": 1.64, + "learning_rate": 8.963943811139333e-07, + "loss": 0.8564, + "step": 64031 + }, + { + "epoch": 1.64, + "learning_rate": 8.963668596094305e-07, + "loss": 0.5049, + "step": 64032 + }, + { + "epoch": 1.64, + "learning_rate": 8.963393381842753e-07, + "loss": 0.6021, + "step": 64033 + }, + { + "epoch": 1.64, + "learning_rate": 8.963118168384881e-07, + "loss": 0.5139, + "step": 64034 + }, + { + "epoch": 1.64, + "learning_rate": 8.9628429557209e-07, + "loss": 0.561, + "step": 64035 + }, + { + "epoch": 1.64, + "learning_rate": 8.962567743851024e-07, + "loss": 0.6816, + "step": 64036 + }, + { + "epoch": 1.64, + "learning_rate": 8.962292532775459e-07, + "loss": 0.708, + "step": 64037 + }, + { + "epoch": 1.64, + "learning_rate": 8.962017322494423e-07, + "loss": 0.7695, + "step": 64038 + }, + { + "epoch": 1.64, + "learning_rate": 8.961742113008119e-07, + "loss": 0.6396, + "step": 64039 + }, + { + "epoch": 1.64, + "learning_rate": 8.961466904316764e-07, + "loss": 0.5635, + "step": 64040 + }, + { + "epoch": 1.64, + "learning_rate": 8.961191696420564e-07, + "loss": 0.6279, + "step": 64041 + }, + { + "epoch": 1.64, + "learning_rate": 8.960916489319734e-07, + "loss": 0.6844, + "step": 64042 + }, + { + "epoch": 1.64, + "learning_rate": 8.960641283014485e-07, + "loss": 0.7622, + "step": 64043 + }, + { + "epoch": 1.64, + "learning_rate": 8.960366077505023e-07, + "loss": 0.5918, + "step": 64044 + }, + { + "epoch": 1.64, + "learning_rate": 8.960090872791558e-07, + "loss": 0.6865, + "step": 64045 + }, + { + "epoch": 1.64, + "learning_rate": 8.959815668874305e-07, + "loss": 0.4868, + "step": 64046 + }, + { + "epoch": 1.64, + "learning_rate": 8.959540465753474e-07, + "loss": 0.6025, + "step": 64047 + }, + { + "epoch": 1.64, + "learning_rate": 8.959265263429274e-07, + "loss": 0.5195, + "step": 64048 + }, + { + "epoch": 1.64, + "learning_rate": 8.958990061901917e-07, + "loss": 0.5862, + "step": 64049 + }, + { + "epoch": 1.64, + "learning_rate": 8.958714861171614e-07, + "loss": 0.7705, + "step": 64050 + }, + { + "epoch": 1.64, + "learning_rate": 8.958439661238573e-07, + "loss": 0.6484, + "step": 64051 + }, + { + "epoch": 1.64, + "learning_rate": 8.958164462103009e-07, + "loss": 0.666, + "step": 64052 + }, + { + "epoch": 1.64, + "learning_rate": 8.957889263765134e-07, + "loss": 0.7217, + "step": 64053 + }, + { + "epoch": 1.64, + "learning_rate": 8.957614066225149e-07, + "loss": 0.6484, + "step": 64054 + }, + { + "epoch": 1.64, + "learning_rate": 8.957338869483276e-07, + "loss": 0.6514, + "step": 64055 + }, + { + "epoch": 1.64, + "learning_rate": 8.957063673539716e-07, + "loss": 0.7354, + "step": 64056 + }, + { + "epoch": 1.64, + "learning_rate": 8.956788478394688e-07, + "loss": 0.6914, + "step": 64057 + }, + { + "epoch": 1.64, + "learning_rate": 8.956513284048396e-07, + "loss": 0.583, + "step": 64058 + }, + { + "epoch": 1.64, + "learning_rate": 8.956238090501057e-07, + "loss": 0.7979, + "step": 64059 + }, + { + "epoch": 1.64, + "learning_rate": 8.955962897752876e-07, + "loss": 0.6321, + "step": 64060 + }, + { + "epoch": 1.64, + "learning_rate": 8.955687705804067e-07, + "loss": 0.6553, + "step": 64061 + }, + { + "epoch": 1.64, + "learning_rate": 8.955412514654839e-07, + "loss": 0.6294, + "step": 64062 + }, + { + "epoch": 1.64, + "learning_rate": 8.955137324305409e-07, + "loss": 0.6377, + "step": 64063 + }, + { + "epoch": 1.64, + "learning_rate": 8.954862134755978e-07, + "loss": 0.6841, + "step": 64064 + }, + { + "epoch": 1.64, + "learning_rate": 8.954586946006761e-07, + "loss": 0.7783, + "step": 64065 + }, + { + "epoch": 1.64, + "learning_rate": 8.954311758057969e-07, + "loss": 0.7637, + "step": 64066 + }, + { + "epoch": 1.64, + "learning_rate": 8.954036570909813e-07, + "loss": 0.4819, + "step": 64067 + }, + { + "epoch": 1.64, + "learning_rate": 8.953761384562499e-07, + "loss": 0.604, + "step": 64068 + }, + { + "epoch": 1.64, + "learning_rate": 8.953486199016246e-07, + "loss": 0.8096, + "step": 64069 + }, + { + "epoch": 1.64, + "learning_rate": 8.953211014271259e-07, + "loss": 0.5562, + "step": 64070 + }, + { + "epoch": 1.64, + "learning_rate": 8.952935830327751e-07, + "loss": 0.5811, + "step": 64071 + }, + { + "epoch": 1.64, + "learning_rate": 8.95266064718593e-07, + "loss": 0.6108, + "step": 64072 + }, + { + "epoch": 1.64, + "learning_rate": 8.952385464846014e-07, + "loss": 0.5188, + "step": 64073 + }, + { + "epoch": 1.64, + "learning_rate": 8.952110283308205e-07, + "loss": 0.7266, + "step": 64074 + }, + { + "epoch": 1.64, + "learning_rate": 8.951835102572716e-07, + "loss": 0.7285, + "step": 64075 + }, + { + "epoch": 1.64, + "learning_rate": 8.95155992263976e-07, + "loss": 0.566, + "step": 64076 + }, + { + "epoch": 1.64, + "learning_rate": 8.951284743509544e-07, + "loss": 0.5835, + "step": 64077 + }, + { + "epoch": 1.64, + "learning_rate": 8.951009565182283e-07, + "loss": 0.875, + "step": 64078 + }, + { + "epoch": 1.64, + "learning_rate": 8.950734387658183e-07, + "loss": 0.6562, + "step": 64079 + }, + { + "epoch": 1.64, + "learning_rate": 8.950459210937462e-07, + "loss": 0.4822, + "step": 64080 + }, + { + "epoch": 1.64, + "learning_rate": 8.950184035020321e-07, + "loss": 0.6792, + "step": 64081 + }, + { + "epoch": 1.64, + "learning_rate": 8.949908859906981e-07, + "loss": 0.7402, + "step": 64082 + }, + { + "epoch": 1.64, + "learning_rate": 8.949633685597647e-07, + "loss": 0.3672, + "step": 64083 + }, + { + "epoch": 1.64, + "learning_rate": 8.94935851209253e-07, + "loss": 0.6992, + "step": 64084 + }, + { + "epoch": 1.64, + "learning_rate": 8.949083339391837e-07, + "loss": 0.6172, + "step": 64085 + }, + { + "epoch": 1.64, + "learning_rate": 8.948808167495786e-07, + "loss": 0.5605, + "step": 64086 + }, + { + "epoch": 1.64, + "learning_rate": 8.948532996404582e-07, + "loss": 0.6904, + "step": 64087 + }, + { + "epoch": 1.64, + "learning_rate": 8.948257826118439e-07, + "loss": 0.7588, + "step": 64088 + }, + { + "epoch": 1.64, + "learning_rate": 8.947982656637566e-07, + "loss": 0.6611, + "step": 64089 + }, + { + "epoch": 1.64, + "learning_rate": 8.947707487962175e-07, + "loss": 0.6895, + "step": 64090 + }, + { + "epoch": 1.64, + "learning_rate": 8.947432320092475e-07, + "loss": 0.5669, + "step": 64091 + }, + { + "epoch": 1.64, + "learning_rate": 8.94715715302868e-07, + "loss": 0.6787, + "step": 64092 + }, + { + "epoch": 1.64, + "learning_rate": 8.946881986771e-07, + "loss": 0.6885, + "step": 64093 + }, + { + "epoch": 1.64, + "learning_rate": 8.946606821319639e-07, + "loss": 0.5078, + "step": 64094 + }, + { + "epoch": 1.64, + "learning_rate": 8.946331656674816e-07, + "loss": 0.4719, + "step": 64095 + }, + { + "epoch": 1.64, + "learning_rate": 8.946056492836736e-07, + "loss": 0.4592, + "step": 64096 + }, + { + "epoch": 1.64, + "learning_rate": 8.945781329805613e-07, + "loss": 0.6174, + "step": 64097 + }, + { + "epoch": 1.64, + "learning_rate": 8.945506167581655e-07, + "loss": 0.6177, + "step": 64098 + }, + { + "epoch": 1.64, + "learning_rate": 8.945231006165079e-07, + "loss": 0.7754, + "step": 64099 + }, + { + "epoch": 1.64, + "learning_rate": 8.944955845556088e-07, + "loss": 0.6758, + "step": 64100 + }, + { + "epoch": 1.64, + "learning_rate": 8.944680685754895e-07, + "loss": 0.3979, + "step": 64101 + }, + { + "epoch": 1.64, + "learning_rate": 8.944405526761714e-07, + "loss": 0.5977, + "step": 64102 + }, + { + "epoch": 1.64, + "learning_rate": 8.944130368576754e-07, + "loss": 0.6465, + "step": 64103 + }, + { + "epoch": 1.64, + "learning_rate": 8.943855211200222e-07, + "loss": 0.5957, + "step": 64104 + }, + { + "epoch": 1.64, + "learning_rate": 8.943580054632334e-07, + "loss": 0.5347, + "step": 64105 + }, + { + "epoch": 1.64, + "learning_rate": 8.943304898873294e-07, + "loss": 0.3381, + "step": 64106 + }, + { + "epoch": 1.64, + "learning_rate": 8.94302974392332e-07, + "loss": 0.4387, + "step": 64107 + }, + { + "epoch": 1.64, + "learning_rate": 8.942754589782617e-07, + "loss": 0.6094, + "step": 64108 + }, + { + "epoch": 1.64, + "learning_rate": 8.942479436451401e-07, + "loss": 0.667, + "step": 64109 + }, + { + "epoch": 1.64, + "learning_rate": 8.942204283929879e-07, + "loss": 0.3755, + "step": 64110 + }, + { + "epoch": 1.64, + "learning_rate": 8.941929132218262e-07, + "loss": 0.6562, + "step": 64111 + }, + { + "epoch": 1.64, + "learning_rate": 8.94165398131676e-07, + "loss": 0.625, + "step": 64112 + }, + { + "epoch": 1.64, + "learning_rate": 8.94137883122559e-07, + "loss": 0.4338, + "step": 64113 + }, + { + "epoch": 1.64, + "learning_rate": 8.941103681944955e-07, + "loss": 0.4849, + "step": 64114 + }, + { + "epoch": 1.64, + "learning_rate": 8.940828533475066e-07, + "loss": 0.6377, + "step": 64115 + }, + { + "epoch": 1.64, + "learning_rate": 8.940553385816137e-07, + "loss": 0.6841, + "step": 64116 + }, + { + "epoch": 1.64, + "learning_rate": 8.940278238968379e-07, + "loss": 0.6523, + "step": 64117 + }, + { + "epoch": 1.64, + "learning_rate": 8.940003092931999e-07, + "loss": 0.6245, + "step": 64118 + }, + { + "epoch": 1.64, + "learning_rate": 8.939727947707212e-07, + "loss": 0.6763, + "step": 64119 + }, + { + "epoch": 1.64, + "learning_rate": 8.939452803294224e-07, + "loss": 0.6467, + "step": 64120 + }, + { + "epoch": 1.64, + "learning_rate": 8.93917765969325e-07, + "loss": 0.4954, + "step": 64121 + }, + { + "epoch": 1.64, + "learning_rate": 8.938902516904497e-07, + "loss": 0.5308, + "step": 64122 + }, + { + "epoch": 1.64, + "learning_rate": 8.938627374928182e-07, + "loss": 0.6987, + "step": 64123 + }, + { + "epoch": 1.64, + "learning_rate": 8.938352233764509e-07, + "loss": 0.5625, + "step": 64124 + }, + { + "epoch": 1.64, + "learning_rate": 8.938077093413689e-07, + "loss": 0.7109, + "step": 64125 + }, + { + "epoch": 1.64, + "learning_rate": 8.937801953875937e-07, + "loss": 0.4004, + "step": 64126 + }, + { + "epoch": 1.64, + "learning_rate": 8.937526815151459e-07, + "loss": 0.4854, + "step": 64127 + }, + { + "epoch": 1.64, + "learning_rate": 8.937251677240469e-07, + "loss": 0.7344, + "step": 64128 + }, + { + "epoch": 1.64, + "learning_rate": 8.936976540143175e-07, + "loss": 0.624, + "step": 64129 + }, + { + "epoch": 1.64, + "learning_rate": 8.936701403859791e-07, + "loss": 0.5906, + "step": 64130 + }, + { + "epoch": 1.64, + "learning_rate": 8.936426268390524e-07, + "loss": 0.5288, + "step": 64131 + }, + { + "epoch": 1.64, + "learning_rate": 8.936151133735591e-07, + "loss": 0.552, + "step": 64132 + }, + { + "epoch": 1.64, + "learning_rate": 8.935875999895195e-07, + "loss": 0.4695, + "step": 64133 + }, + { + "epoch": 1.64, + "learning_rate": 8.935600866869551e-07, + "loss": 0.7627, + "step": 64134 + }, + { + "epoch": 1.64, + "learning_rate": 8.935325734658866e-07, + "loss": 0.4861, + "step": 64135 + }, + { + "epoch": 1.64, + "learning_rate": 8.935050603263356e-07, + "loss": 0.5415, + "step": 64136 + }, + { + "epoch": 1.64, + "learning_rate": 8.934775472683224e-07, + "loss": 0.5728, + "step": 64137 + }, + { + "epoch": 1.64, + "learning_rate": 8.93450034291869e-07, + "loss": 0.4638, + "step": 64138 + }, + { + "epoch": 1.64, + "learning_rate": 8.934225213969958e-07, + "loss": 0.792, + "step": 64139 + }, + { + "epoch": 1.64, + "learning_rate": 8.933950085837242e-07, + "loss": 0.7021, + "step": 64140 + }, + { + "epoch": 1.64, + "learning_rate": 8.933674958520749e-07, + "loss": 0.4536, + "step": 64141 + }, + { + "epoch": 1.64, + "learning_rate": 8.933399832020697e-07, + "loss": 0.5796, + "step": 64142 + }, + { + "epoch": 1.64, + "learning_rate": 8.93312470633729e-07, + "loss": 0.6562, + "step": 64143 + }, + { + "epoch": 1.64, + "learning_rate": 8.932849581470737e-07, + "loss": 0.6323, + "step": 64144 + }, + { + "epoch": 1.64, + "learning_rate": 8.932574457421256e-07, + "loss": 0.7617, + "step": 64145 + }, + { + "epoch": 1.64, + "learning_rate": 8.932299334189049e-07, + "loss": 0.6265, + "step": 64146 + }, + { + "epoch": 1.64, + "learning_rate": 8.932024211774335e-07, + "loss": 0.6416, + "step": 64147 + }, + { + "epoch": 1.64, + "learning_rate": 8.931749090177318e-07, + "loss": 0.6011, + "step": 64148 + }, + { + "epoch": 1.64, + "learning_rate": 8.931473969398215e-07, + "loss": 0.3865, + "step": 64149 + }, + { + "epoch": 1.64, + "learning_rate": 8.93119884943723e-07, + "loss": 0.6321, + "step": 64150 + }, + { + "epoch": 1.64, + "learning_rate": 8.93092373029458e-07, + "loss": 0.6714, + "step": 64151 + }, + { + "epoch": 1.64, + "learning_rate": 8.930648611970475e-07, + "loss": 0.5581, + "step": 64152 + }, + { + "epoch": 1.64, + "learning_rate": 8.93037349446512e-07, + "loss": 0.5833, + "step": 64153 + }, + { + "epoch": 1.64, + "learning_rate": 8.930098377778727e-07, + "loss": 0.564, + "step": 64154 + }, + { + "epoch": 1.64, + "learning_rate": 8.92982326191151e-07, + "loss": 0.5591, + "step": 64155 + }, + { + "epoch": 1.64, + "learning_rate": 8.929548146863677e-07, + "loss": 0.5513, + "step": 64156 + }, + { + "epoch": 1.64, + "learning_rate": 8.92927303263544e-07, + "loss": 0.6982, + "step": 64157 + }, + { + "epoch": 1.64, + "learning_rate": 8.928997919227009e-07, + "loss": 0.752, + "step": 64158 + }, + { + "epoch": 1.64, + "learning_rate": 8.928722806638597e-07, + "loss": 0.5358, + "step": 64159 + }, + { + "epoch": 1.64, + "learning_rate": 8.92844769487041e-07, + "loss": 0.5693, + "step": 64160 + }, + { + "epoch": 1.64, + "learning_rate": 8.928172583922664e-07, + "loss": 0.6895, + "step": 64161 + }, + { + "epoch": 1.64, + "learning_rate": 8.92789747379557e-07, + "loss": 0.5068, + "step": 64162 + }, + { + "epoch": 1.64, + "learning_rate": 8.92762236448933e-07, + "loss": 0.6602, + "step": 64163 + }, + { + "epoch": 1.64, + "learning_rate": 8.927347256004162e-07, + "loss": 0.749, + "step": 64164 + }, + { + "epoch": 1.64, + "learning_rate": 8.927072148340273e-07, + "loss": 0.6113, + "step": 64165 + }, + { + "epoch": 1.64, + "learning_rate": 8.926797041497878e-07, + "loss": 0.4634, + "step": 64166 + }, + { + "epoch": 1.64, + "learning_rate": 8.926521935477183e-07, + "loss": 0.7598, + "step": 64167 + }, + { + "epoch": 1.64, + "learning_rate": 8.926246830278403e-07, + "loss": 0.604, + "step": 64168 + }, + { + "epoch": 1.64, + "learning_rate": 8.925971725901745e-07, + "loss": 0.6914, + "step": 64169 + }, + { + "epoch": 1.64, + "learning_rate": 8.925696622347423e-07, + "loss": 0.4893, + "step": 64170 + }, + { + "epoch": 1.64, + "learning_rate": 8.925421519615642e-07, + "loss": 0.6309, + "step": 64171 + }, + { + "epoch": 1.64, + "learning_rate": 8.925146417706625e-07, + "loss": 0.5732, + "step": 64172 + }, + { + "epoch": 1.64, + "learning_rate": 8.924871316620566e-07, + "loss": 0.5649, + "step": 64173 + }, + { + "epoch": 1.64, + "learning_rate": 8.924596216357686e-07, + "loss": 0.6758, + "step": 64174 + }, + { + "epoch": 1.64, + "learning_rate": 8.924321116918191e-07, + "loss": 0.6416, + "step": 64175 + }, + { + "epoch": 1.64, + "learning_rate": 8.924046018302297e-07, + "loss": 0.5967, + "step": 64176 + }, + { + "epoch": 1.64, + "learning_rate": 8.923770920510209e-07, + "loss": 0.7236, + "step": 64177 + }, + { + "epoch": 1.64, + "learning_rate": 8.923495823542141e-07, + "loss": 0.5542, + "step": 64178 + }, + { + "epoch": 1.64, + "learning_rate": 8.923220727398302e-07, + "loss": 0.4839, + "step": 64179 + }, + { + "epoch": 1.64, + "learning_rate": 8.922945632078905e-07, + "loss": 0.5649, + "step": 64180 + }, + { + "epoch": 1.64, + "learning_rate": 8.922670537584156e-07, + "loss": 0.7295, + "step": 64181 + }, + { + "epoch": 1.65, + "learning_rate": 8.922395443914274e-07, + "loss": 0.6328, + "step": 64182 + }, + { + "epoch": 1.65, + "learning_rate": 8.922120351069462e-07, + "loss": 0.4889, + "step": 64183 + }, + { + "epoch": 1.65, + "learning_rate": 8.921845259049931e-07, + "loss": 0.4729, + "step": 64184 + }, + { + "epoch": 1.65, + "learning_rate": 8.921570167855894e-07, + "loss": 0.7119, + "step": 64185 + }, + { + "epoch": 1.65, + "learning_rate": 8.92129507748756e-07, + "loss": 0.7549, + "step": 64186 + }, + { + "epoch": 1.65, + "learning_rate": 8.921019987945144e-07, + "loss": 0.6333, + "step": 64187 + }, + { + "epoch": 1.65, + "learning_rate": 8.920744899228851e-07, + "loss": 0.7715, + "step": 64188 + }, + { + "epoch": 1.65, + "learning_rate": 8.920469811338894e-07, + "loss": 0.4742, + "step": 64189 + }, + { + "epoch": 1.65, + "learning_rate": 8.920194724275486e-07, + "loss": 0.6445, + "step": 64190 + }, + { + "epoch": 1.65, + "learning_rate": 8.919919638038832e-07, + "loss": 0.6528, + "step": 64191 + }, + { + "epoch": 1.65, + "learning_rate": 8.919644552629151e-07, + "loss": 0.5908, + "step": 64192 + }, + { + "epoch": 1.65, + "learning_rate": 8.919369468046644e-07, + "loss": 0.7314, + "step": 64193 + }, + { + "epoch": 1.65, + "learning_rate": 8.919094384291527e-07, + "loss": 0.6196, + "step": 64194 + }, + { + "epoch": 1.65, + "learning_rate": 8.918819301364011e-07, + "loss": 0.6582, + "step": 64195 + }, + { + "epoch": 1.65, + "learning_rate": 8.918544219264302e-07, + "loss": 0.7529, + "step": 64196 + }, + { + "epoch": 1.65, + "learning_rate": 8.918269137992618e-07, + "loss": 0.6548, + "step": 64197 + }, + { + "epoch": 1.65, + "learning_rate": 8.917994057549161e-07, + "loss": 0.6729, + "step": 64198 + }, + { + "epoch": 1.65, + "learning_rate": 8.91771897793415e-07, + "loss": 0.6196, + "step": 64199 + }, + { + "epoch": 1.65, + "learning_rate": 8.917443899147789e-07, + "loss": 0.4061, + "step": 64200 + }, + { + "epoch": 1.65, + "learning_rate": 8.917168821190295e-07, + "loss": 0.6445, + "step": 64201 + }, + { + "epoch": 1.65, + "learning_rate": 8.916893744061875e-07, + "loss": 0.5581, + "step": 64202 + }, + { + "epoch": 1.65, + "learning_rate": 8.916618667762737e-07, + "loss": 0.7109, + "step": 64203 + }, + { + "epoch": 1.65, + "learning_rate": 8.916343592293096e-07, + "loss": 0.8086, + "step": 64204 + }, + { + "epoch": 1.65, + "learning_rate": 8.916068517653159e-07, + "loss": 0.7803, + "step": 64205 + }, + { + "epoch": 1.65, + "learning_rate": 8.91579344384314e-07, + "loss": 0.751, + "step": 64206 + }, + { + "epoch": 1.65, + "learning_rate": 8.915518370863249e-07, + "loss": 0.5835, + "step": 64207 + }, + { + "epoch": 1.65, + "learning_rate": 8.915243298713693e-07, + "loss": 0.6299, + "step": 64208 + }, + { + "epoch": 1.65, + "learning_rate": 8.914968227394687e-07, + "loss": 0.5532, + "step": 64209 + }, + { + "epoch": 1.65, + "learning_rate": 8.914693156906438e-07, + "loss": 0.6816, + "step": 64210 + }, + { + "epoch": 1.65, + "learning_rate": 8.91441808724916e-07, + "loss": 0.7549, + "step": 64211 + }, + { + "epoch": 1.65, + "learning_rate": 8.914143018423066e-07, + "loss": 0.5947, + "step": 64212 + }, + { + "epoch": 1.65, + "learning_rate": 8.913867950428357e-07, + "loss": 0.6523, + "step": 64213 + }, + { + "epoch": 1.65, + "learning_rate": 8.913592883265253e-07, + "loss": 0.6357, + "step": 64214 + }, + { + "epoch": 1.65, + "learning_rate": 8.913317816933958e-07, + "loss": 0.6646, + "step": 64215 + }, + { + "epoch": 1.65, + "learning_rate": 8.913042751434687e-07, + "loss": 0.5974, + "step": 64216 + }, + { + "epoch": 1.65, + "learning_rate": 8.912767686767649e-07, + "loss": 0.7281, + "step": 64217 + }, + { + "epoch": 1.65, + "learning_rate": 8.912492622933055e-07, + "loss": 0.6797, + "step": 64218 + }, + { + "epoch": 1.65, + "learning_rate": 8.912217559931115e-07, + "loss": 0.6055, + "step": 64219 + }, + { + "epoch": 1.65, + "learning_rate": 8.911942497762041e-07, + "loss": 0.7021, + "step": 64220 + }, + { + "epoch": 1.65, + "learning_rate": 8.91166743642604e-07, + "loss": 0.6138, + "step": 64221 + }, + { + "epoch": 1.65, + "learning_rate": 8.91139237592333e-07, + "loss": 0.6184, + "step": 64222 + }, + { + "epoch": 1.65, + "learning_rate": 8.911117316254115e-07, + "loss": 0.4824, + "step": 64223 + }, + { + "epoch": 1.65, + "learning_rate": 8.910842257418607e-07, + "loss": 0.6831, + "step": 64224 + }, + { + "epoch": 1.65, + "learning_rate": 8.910567199417015e-07, + "loss": 0.5986, + "step": 64225 + }, + { + "epoch": 1.65, + "learning_rate": 8.910292142249553e-07, + "loss": 0.7095, + "step": 64226 + }, + { + "epoch": 1.65, + "learning_rate": 8.91001708591643e-07, + "loss": 0.559, + "step": 64227 + }, + { + "epoch": 1.65, + "learning_rate": 8.909742030417858e-07, + "loss": 0.627, + "step": 64228 + }, + { + "epoch": 1.65, + "learning_rate": 8.909466975754043e-07, + "loss": 0.5103, + "step": 64229 + }, + { + "epoch": 1.65, + "learning_rate": 8.909191921925202e-07, + "loss": 0.6436, + "step": 64230 + }, + { + "epoch": 1.65, + "learning_rate": 8.90891686893154e-07, + "loss": 0.7031, + "step": 64231 + }, + { + "epoch": 1.65, + "learning_rate": 8.908641816773276e-07, + "loss": 0.751, + "step": 64232 + }, + { + "epoch": 1.65, + "learning_rate": 8.908366765450611e-07, + "loss": 0.6929, + "step": 64233 + }, + { + "epoch": 1.65, + "learning_rate": 8.908091714963758e-07, + "loss": 0.6738, + "step": 64234 + }, + { + "epoch": 1.65, + "learning_rate": 8.907816665312932e-07, + "loss": 0.445, + "step": 64235 + }, + { + "epoch": 1.65, + "learning_rate": 8.907541616498337e-07, + "loss": 0.6289, + "step": 64236 + }, + { + "epoch": 1.65, + "learning_rate": 8.907266568520189e-07, + "loss": 0.427, + "step": 64237 + }, + { + "epoch": 1.65, + "learning_rate": 8.906991521378696e-07, + "loss": 0.5642, + "step": 64238 + }, + { + "epoch": 1.65, + "learning_rate": 8.906716475074071e-07, + "loss": 0.5898, + "step": 64239 + }, + { + "epoch": 1.65, + "learning_rate": 8.906441429606521e-07, + "loss": 0.7402, + "step": 64240 + }, + { + "epoch": 1.65, + "learning_rate": 8.906166384976259e-07, + "loss": 0.5366, + "step": 64241 + }, + { + "epoch": 1.65, + "learning_rate": 8.9058913411835e-07, + "loss": 0.7432, + "step": 64242 + }, + { + "epoch": 1.65, + "learning_rate": 8.905616298228445e-07, + "loss": 0.9053, + "step": 64243 + }, + { + "epoch": 1.65, + "learning_rate": 8.905341256111309e-07, + "loss": 0.6709, + "step": 64244 + }, + { + "epoch": 1.65, + "learning_rate": 8.905066214832303e-07, + "loss": 0.6077, + "step": 64245 + }, + { + "epoch": 1.65, + "learning_rate": 8.904791174391638e-07, + "loss": 0.6211, + "step": 64246 + }, + { + "epoch": 1.65, + "learning_rate": 8.904516134789524e-07, + "loss": 0.4768, + "step": 64247 + }, + { + "epoch": 1.65, + "learning_rate": 8.904241096026169e-07, + "loss": 0.4883, + "step": 64248 + }, + { + "epoch": 1.65, + "learning_rate": 8.903966058101789e-07, + "loss": 0.6611, + "step": 64249 + }, + { + "epoch": 1.65, + "learning_rate": 8.90369102101659e-07, + "loss": 0.6445, + "step": 64250 + }, + { + "epoch": 1.65, + "learning_rate": 8.903415984770788e-07, + "loss": 0.6726, + "step": 64251 + }, + { + "epoch": 1.65, + "learning_rate": 8.90314094936459e-07, + "loss": 0.7441, + "step": 64252 + }, + { + "epoch": 1.65, + "learning_rate": 8.902865914798204e-07, + "loss": 0.7324, + "step": 64253 + }, + { + "epoch": 1.65, + "learning_rate": 8.902590881071844e-07, + "loss": 0.7041, + "step": 64254 + }, + { + "epoch": 1.65, + "learning_rate": 8.902315848185718e-07, + "loss": 0.6265, + "step": 64255 + }, + { + "epoch": 1.65, + "learning_rate": 8.90204081614004e-07, + "loss": 0.6865, + "step": 64256 + }, + { + "epoch": 1.65, + "learning_rate": 8.901765784935017e-07, + "loss": 0.6045, + "step": 64257 + }, + { + "epoch": 1.65, + "learning_rate": 8.901490754570864e-07, + "loss": 0.8145, + "step": 64258 + }, + { + "epoch": 1.65, + "learning_rate": 8.901215725047786e-07, + "loss": 0.7373, + "step": 64259 + }, + { + "epoch": 1.65, + "learning_rate": 8.900940696365999e-07, + "loss": 0.6353, + "step": 64260 + }, + { + "epoch": 1.65, + "learning_rate": 8.900665668525709e-07, + "loss": 0.5864, + "step": 64261 + }, + { + "epoch": 1.65, + "learning_rate": 8.900390641527136e-07, + "loss": 0.6846, + "step": 64262 + }, + { + "epoch": 1.65, + "learning_rate": 8.900115615370476e-07, + "loss": 0.6572, + "step": 64263 + }, + { + "epoch": 1.65, + "learning_rate": 8.899840590055949e-07, + "loss": 0.636, + "step": 64264 + }, + { + "epoch": 1.65, + "learning_rate": 8.899565565583762e-07, + "loss": 0.7578, + "step": 64265 + }, + { + "epoch": 1.65, + "learning_rate": 8.899290541954128e-07, + "loss": 0.5474, + "step": 64266 + }, + { + "epoch": 1.65, + "learning_rate": 8.899015519167257e-07, + "loss": 0.688, + "step": 64267 + }, + { + "epoch": 1.65, + "learning_rate": 8.89874049722336e-07, + "loss": 0.6155, + "step": 64268 + }, + { + "epoch": 1.65, + "learning_rate": 8.898465476122643e-07, + "loss": 0.6377, + "step": 64269 + }, + { + "epoch": 1.65, + "learning_rate": 8.898190455865324e-07, + "loss": 0.6738, + "step": 64270 + }, + { + "epoch": 1.65, + "learning_rate": 8.897915436451607e-07, + "loss": 0.7451, + "step": 64271 + }, + { + "epoch": 1.65, + "learning_rate": 8.897640417881711e-07, + "loss": 0.5156, + "step": 64272 + }, + { + "epoch": 1.65, + "learning_rate": 8.897365400155838e-07, + "loss": 0.7012, + "step": 64273 + }, + { + "epoch": 1.65, + "learning_rate": 8.897090383274199e-07, + "loss": 0.6382, + "step": 64274 + }, + { + "epoch": 1.65, + "learning_rate": 8.89681536723701e-07, + "loss": 0.4492, + "step": 64275 + }, + { + "epoch": 1.65, + "learning_rate": 8.896540352044477e-07, + "loss": 0.5923, + "step": 64276 + }, + { + "epoch": 1.65, + "learning_rate": 8.896265337696814e-07, + "loss": 0.52, + "step": 64277 + }, + { + "epoch": 1.65, + "learning_rate": 8.895990324194228e-07, + "loss": 0.7461, + "step": 64278 + }, + { + "epoch": 1.65, + "learning_rate": 8.895715311536934e-07, + "loss": 0.5879, + "step": 64279 + }, + { + "epoch": 1.65, + "learning_rate": 8.895440299725139e-07, + "loss": 0.6035, + "step": 64280 + }, + { + "epoch": 1.65, + "learning_rate": 8.895165288759053e-07, + "loss": 0.6011, + "step": 64281 + }, + { + "epoch": 1.65, + "learning_rate": 8.894890278638891e-07, + "loss": 0.5771, + "step": 64282 + }, + { + "epoch": 1.65, + "learning_rate": 8.89461526936486e-07, + "loss": 0.6948, + "step": 64283 + }, + { + "epoch": 1.65, + "learning_rate": 8.89434026093717e-07, + "loss": 0.7422, + "step": 64284 + }, + { + "epoch": 1.65, + "learning_rate": 8.894065253356033e-07, + "loss": 0.584, + "step": 64285 + }, + { + "epoch": 1.65, + "learning_rate": 8.893790246621658e-07, + "loss": 0.7578, + "step": 64286 + }, + { + "epoch": 1.65, + "learning_rate": 8.893515240734259e-07, + "loss": 0.5342, + "step": 64287 + }, + { + "epoch": 1.65, + "learning_rate": 8.893240235694042e-07, + "loss": 0.6448, + "step": 64288 + }, + { + "epoch": 1.65, + "learning_rate": 8.892965231501224e-07, + "loss": 0.606, + "step": 64289 + }, + { + "epoch": 1.65, + "learning_rate": 8.892690228156008e-07, + "loss": 0.6597, + "step": 64290 + }, + { + "epoch": 1.65, + "learning_rate": 8.89241522565861e-07, + "loss": 0.5464, + "step": 64291 + }, + { + "epoch": 1.65, + "learning_rate": 8.892140224009242e-07, + "loss": 0.7246, + "step": 64292 + }, + { + "epoch": 1.65, + "learning_rate": 8.891865223208107e-07, + "loss": 0.5444, + "step": 64293 + }, + { + "epoch": 1.65, + "learning_rate": 8.891590223255421e-07, + "loss": 0.6841, + "step": 64294 + }, + { + "epoch": 1.65, + "learning_rate": 8.891315224151392e-07, + "loss": 0.5674, + "step": 64295 + }, + { + "epoch": 1.65, + "learning_rate": 8.891040225896234e-07, + "loss": 0.4468, + "step": 64296 + }, + { + "epoch": 1.65, + "learning_rate": 8.890765228490155e-07, + "loss": 0.5742, + "step": 64297 + }, + { + "epoch": 1.65, + "learning_rate": 8.890490231933364e-07, + "loss": 0.6611, + "step": 64298 + }, + { + "epoch": 1.65, + "learning_rate": 8.890215236226077e-07, + "loss": 0.6348, + "step": 64299 + }, + { + "epoch": 1.65, + "learning_rate": 8.889940241368496e-07, + "loss": 0.6494, + "step": 64300 + }, + { + "epoch": 1.65, + "learning_rate": 8.889665247360841e-07, + "loss": 0.7012, + "step": 64301 + }, + { + "epoch": 1.65, + "learning_rate": 8.889390254203321e-07, + "loss": 0.6396, + "step": 64302 + }, + { + "epoch": 1.65, + "learning_rate": 8.889115261896139e-07, + "loss": 0.6558, + "step": 64303 + }, + { + "epoch": 1.65, + "learning_rate": 8.888840270439512e-07, + "loss": 0.5552, + "step": 64304 + }, + { + "epoch": 1.65, + "learning_rate": 8.888565279833647e-07, + "loss": 0.6558, + "step": 64305 + }, + { + "epoch": 1.65, + "learning_rate": 8.88829029007876e-07, + "loss": 0.7695, + "step": 64306 + }, + { + "epoch": 1.65, + "learning_rate": 8.888015301175054e-07, + "loss": 0.5601, + "step": 64307 + }, + { + "epoch": 1.65, + "learning_rate": 8.887740313122746e-07, + "loss": 0.5164, + "step": 64308 + }, + { + "epoch": 1.65, + "learning_rate": 8.887465325922041e-07, + "loss": 0.7559, + "step": 64309 + }, + { + "epoch": 1.65, + "learning_rate": 8.887190339573157e-07, + "loss": 0.7227, + "step": 64310 + }, + { + "epoch": 1.65, + "learning_rate": 8.886915354076297e-07, + "loss": 0.7031, + "step": 64311 + }, + { + "epoch": 1.65, + "learning_rate": 8.886640369431678e-07, + "loss": 0.6104, + "step": 64312 + }, + { + "epoch": 1.65, + "learning_rate": 8.886365385639508e-07, + "loss": 0.6353, + "step": 64313 + }, + { + "epoch": 1.65, + "learning_rate": 8.886090402699994e-07, + "loss": 0.5659, + "step": 64314 + }, + { + "epoch": 1.65, + "learning_rate": 8.885815420613348e-07, + "loss": 0.7275, + "step": 64315 + }, + { + "epoch": 1.65, + "learning_rate": 8.885540439379783e-07, + "loss": 0.7197, + "step": 64316 + }, + { + "epoch": 1.65, + "learning_rate": 8.885265458999509e-07, + "loss": 0.7129, + "step": 64317 + }, + { + "epoch": 1.65, + "learning_rate": 8.884990479472736e-07, + "loss": 0.4475, + "step": 64318 + }, + { + "epoch": 1.65, + "learning_rate": 8.884715500799673e-07, + "loss": 0.6479, + "step": 64319 + }, + { + "epoch": 1.65, + "learning_rate": 8.884440522980534e-07, + "loss": 0.5615, + "step": 64320 + }, + { + "epoch": 1.65, + "learning_rate": 8.884165546015526e-07, + "loss": 0.4993, + "step": 64321 + }, + { + "epoch": 1.65, + "learning_rate": 8.883890569904866e-07, + "loss": 0.5938, + "step": 64322 + }, + { + "epoch": 1.65, + "learning_rate": 8.883615594648756e-07, + "loss": 0.5513, + "step": 64323 + }, + { + "epoch": 1.65, + "learning_rate": 8.883340620247409e-07, + "loss": 0.583, + "step": 64324 + }, + { + "epoch": 1.65, + "learning_rate": 8.883065646701039e-07, + "loss": 0.6401, + "step": 64325 + }, + { + "epoch": 1.65, + "learning_rate": 8.882790674009851e-07, + "loss": 0.6426, + "step": 64326 + }, + { + "epoch": 1.65, + "learning_rate": 8.882515702174062e-07, + "loss": 0.6836, + "step": 64327 + }, + { + "epoch": 1.65, + "learning_rate": 8.882240731193876e-07, + "loss": 0.5796, + "step": 64328 + }, + { + "epoch": 1.65, + "learning_rate": 8.881965761069511e-07, + "loss": 0.6248, + "step": 64329 + }, + { + "epoch": 1.65, + "learning_rate": 8.88169079180117e-07, + "loss": 0.7939, + "step": 64330 + }, + { + "epoch": 1.65, + "learning_rate": 8.881415823389069e-07, + "loss": 0.5032, + "step": 64331 + }, + { + "epoch": 1.65, + "learning_rate": 8.881140855833419e-07, + "loss": 0.6592, + "step": 64332 + }, + { + "epoch": 1.65, + "learning_rate": 8.880865889134425e-07, + "loss": 0.7773, + "step": 64333 + }, + { + "epoch": 1.65, + "learning_rate": 8.880590923292299e-07, + "loss": 0.6514, + "step": 64334 + }, + { + "epoch": 1.65, + "learning_rate": 8.880315958307256e-07, + "loss": 0.5369, + "step": 64335 + }, + { + "epoch": 1.65, + "learning_rate": 8.8800409941795e-07, + "loss": 0.7148, + "step": 64336 + }, + { + "epoch": 1.65, + "learning_rate": 8.879766030909249e-07, + "loss": 0.5385, + "step": 64337 + }, + { + "epoch": 1.65, + "learning_rate": 8.879491068496707e-07, + "loss": 0.665, + "step": 64338 + }, + { + "epoch": 1.65, + "learning_rate": 8.879216106942088e-07, + "loss": 0.6699, + "step": 64339 + }, + { + "epoch": 1.65, + "learning_rate": 8.8789411462456e-07, + "loss": 0.5664, + "step": 64340 + }, + { + "epoch": 1.65, + "learning_rate": 8.878666186407458e-07, + "loss": 0.6445, + "step": 64341 + }, + { + "epoch": 1.65, + "learning_rate": 8.878391227427872e-07, + "loss": 0.4833, + "step": 64342 + }, + { + "epoch": 1.65, + "learning_rate": 8.878116269307046e-07, + "loss": 0.8066, + "step": 64343 + }, + { + "epoch": 1.65, + "learning_rate": 8.877841312045195e-07, + "loss": 0.4019, + "step": 64344 + }, + { + "epoch": 1.65, + "learning_rate": 8.877566355642529e-07, + "loss": 0.5435, + "step": 64345 + }, + { + "epoch": 1.65, + "learning_rate": 8.877291400099262e-07, + "loss": 0.6035, + "step": 64346 + }, + { + "epoch": 1.65, + "learning_rate": 8.877016445415597e-07, + "loss": 0.4995, + "step": 64347 + }, + { + "epoch": 1.65, + "learning_rate": 8.876741491591752e-07, + "loss": 0.7939, + "step": 64348 + }, + { + "epoch": 1.65, + "learning_rate": 8.876466538627932e-07, + "loss": 0.7891, + "step": 64349 + }, + { + "epoch": 1.65, + "learning_rate": 8.876191586524352e-07, + "loss": 0.6846, + "step": 64350 + }, + { + "epoch": 1.65, + "learning_rate": 8.875916635281219e-07, + "loss": 0.6072, + "step": 64351 + }, + { + "epoch": 1.65, + "learning_rate": 8.875641684898751e-07, + "loss": 0.8018, + "step": 64352 + }, + { + "epoch": 1.65, + "learning_rate": 8.875366735377145e-07, + "loss": 0.4006, + "step": 64353 + }, + { + "epoch": 1.65, + "learning_rate": 8.875091786716622e-07, + "loss": 0.7607, + "step": 64354 + }, + { + "epoch": 1.65, + "learning_rate": 8.874816838917387e-07, + "loss": 0.7578, + "step": 64355 + }, + { + "epoch": 1.65, + "learning_rate": 8.874541891979657e-07, + "loss": 0.7295, + "step": 64356 + }, + { + "epoch": 1.65, + "learning_rate": 8.874266945903635e-07, + "loss": 0.5474, + "step": 64357 + }, + { + "epoch": 1.65, + "learning_rate": 8.873992000689536e-07, + "loss": 0.6904, + "step": 64358 + }, + { + "epoch": 1.65, + "learning_rate": 8.873717056337569e-07, + "loss": 0.3857, + "step": 64359 + }, + { + "epoch": 1.65, + "learning_rate": 8.873442112847946e-07, + "loss": 0.6172, + "step": 64360 + }, + { + "epoch": 1.65, + "learning_rate": 8.873167170220876e-07, + "loss": 0.7754, + "step": 64361 + }, + { + "epoch": 1.65, + "learning_rate": 8.872892228456573e-07, + "loss": 0.6772, + "step": 64362 + }, + { + "epoch": 1.65, + "learning_rate": 8.872617287555243e-07, + "loss": 0.6411, + "step": 64363 + }, + { + "epoch": 1.65, + "learning_rate": 8.872342347517096e-07, + "loss": 0.4902, + "step": 64364 + }, + { + "epoch": 1.65, + "learning_rate": 8.872067408342346e-07, + "loss": 0.7363, + "step": 64365 + }, + { + "epoch": 1.65, + "learning_rate": 8.871792470031201e-07, + "loss": 0.6689, + "step": 64366 + }, + { + "epoch": 1.65, + "learning_rate": 8.871517532583875e-07, + "loss": 0.7764, + "step": 64367 + }, + { + "epoch": 1.65, + "learning_rate": 8.871242596000573e-07, + "loss": 0.6768, + "step": 64368 + }, + { + "epoch": 1.65, + "learning_rate": 8.870967660281511e-07, + "loss": 0.6826, + "step": 64369 + }, + { + "epoch": 1.65, + "learning_rate": 8.870692725426897e-07, + "loss": 0.6611, + "step": 64370 + }, + { + "epoch": 1.65, + "learning_rate": 8.870417791436939e-07, + "loss": 0.7402, + "step": 64371 + }, + { + "epoch": 1.65, + "learning_rate": 8.870142858311857e-07, + "loss": 0.666, + "step": 64372 + }, + { + "epoch": 1.65, + "learning_rate": 8.86986792605185e-07, + "loss": 0.6421, + "step": 64373 + }, + { + "epoch": 1.65, + "learning_rate": 8.869592994657131e-07, + "loss": 0.6006, + "step": 64374 + }, + { + "epoch": 1.65, + "learning_rate": 8.869318064127917e-07, + "loss": 0.5552, + "step": 64375 + }, + { + "epoch": 1.65, + "learning_rate": 8.86904313446441e-07, + "loss": 0.6055, + "step": 64376 + }, + { + "epoch": 1.65, + "learning_rate": 8.868768205666827e-07, + "loss": 0.6218, + "step": 64377 + }, + { + "epoch": 1.65, + "learning_rate": 8.868493277735375e-07, + "loss": 0.5474, + "step": 64378 + }, + { + "epoch": 1.65, + "learning_rate": 8.868218350670267e-07, + "loss": 0.6157, + "step": 64379 + }, + { + "epoch": 1.65, + "learning_rate": 8.867943424471711e-07, + "loss": 0.4735, + "step": 64380 + }, + { + "epoch": 1.65, + "learning_rate": 8.86766849913992e-07, + "loss": 0.4414, + "step": 64381 + }, + { + "epoch": 1.65, + "learning_rate": 8.867393574675105e-07, + "loss": 0.5229, + "step": 64382 + }, + { + "epoch": 1.65, + "learning_rate": 8.867118651077471e-07, + "loss": 0.7988, + "step": 64383 + }, + { + "epoch": 1.65, + "learning_rate": 8.866843728347234e-07, + "loss": 0.6504, + "step": 64384 + }, + { + "epoch": 1.65, + "learning_rate": 8.8665688064846e-07, + "loss": 0.7773, + "step": 64385 + }, + { + "epoch": 1.65, + "learning_rate": 8.866293885489786e-07, + "loss": 0.5527, + "step": 64386 + }, + { + "epoch": 1.65, + "learning_rate": 8.866018965362997e-07, + "loss": 0.6895, + "step": 64387 + }, + { + "epoch": 1.65, + "learning_rate": 8.865744046104444e-07, + "loss": 0.6865, + "step": 64388 + }, + { + "epoch": 1.65, + "learning_rate": 8.86546912771434e-07, + "loss": 0.6504, + "step": 64389 + }, + { + "epoch": 1.65, + "learning_rate": 8.865194210192892e-07, + "loss": 0.7432, + "step": 64390 + }, + { + "epoch": 1.65, + "learning_rate": 8.864919293540315e-07, + "loss": 0.7012, + "step": 64391 + }, + { + "epoch": 1.65, + "learning_rate": 8.86464437775682e-07, + "loss": 0.6611, + "step": 64392 + }, + { + "epoch": 1.65, + "learning_rate": 8.86436946284261e-07, + "loss": 0.6699, + "step": 64393 + }, + { + "epoch": 1.65, + "learning_rate": 8.864094548797901e-07, + "loss": 0.6904, + "step": 64394 + }, + { + "epoch": 1.65, + "learning_rate": 8.863819635622901e-07, + "loss": 0.5076, + "step": 64395 + }, + { + "epoch": 1.65, + "learning_rate": 8.863544723317825e-07, + "loss": 0.6782, + "step": 64396 + }, + { + "epoch": 1.65, + "learning_rate": 8.863269811882877e-07, + "loss": 0.5107, + "step": 64397 + }, + { + "epoch": 1.65, + "learning_rate": 8.862994901318275e-07, + "loss": 0.5908, + "step": 64398 + }, + { + "epoch": 1.65, + "learning_rate": 8.862719991624222e-07, + "loss": 0.6562, + "step": 64399 + }, + { + "epoch": 1.65, + "learning_rate": 8.862445082800934e-07, + "loss": 0.5686, + "step": 64400 + }, + { + "epoch": 1.65, + "learning_rate": 8.862170174848619e-07, + "loss": 0.6479, + "step": 64401 + }, + { + "epoch": 1.65, + "learning_rate": 8.861895267767491e-07, + "loss": 0.6479, + "step": 64402 + }, + { + "epoch": 1.65, + "learning_rate": 8.861620361557755e-07, + "loss": 0.7197, + "step": 64403 + }, + { + "epoch": 1.65, + "learning_rate": 8.861345456219626e-07, + "loss": 0.6396, + "step": 64404 + }, + { + "epoch": 1.65, + "learning_rate": 8.861070551753308e-07, + "loss": 0.6631, + "step": 64405 + }, + { + "epoch": 1.65, + "learning_rate": 8.860795648159018e-07, + "loss": 0.6387, + "step": 64406 + }, + { + "epoch": 1.65, + "learning_rate": 8.860520745436963e-07, + "loss": 0.5039, + "step": 64407 + }, + { + "epoch": 1.65, + "learning_rate": 8.860245843587357e-07, + "loss": 0.5752, + "step": 64408 + }, + { + "epoch": 1.65, + "learning_rate": 8.859970942610406e-07, + "loss": 0.6157, + "step": 64409 + }, + { + "epoch": 1.65, + "learning_rate": 8.859696042506326e-07, + "loss": 0.689, + "step": 64410 + }, + { + "epoch": 1.65, + "learning_rate": 8.859421143275322e-07, + "loss": 0.5781, + "step": 64411 + }, + { + "epoch": 1.65, + "learning_rate": 8.85914624491761e-07, + "loss": 0.7012, + "step": 64412 + }, + { + "epoch": 1.65, + "learning_rate": 8.858871347433396e-07, + "loss": 0.6064, + "step": 64413 + }, + { + "epoch": 1.65, + "learning_rate": 8.858596450822888e-07, + "loss": 0.5151, + "step": 64414 + }, + { + "epoch": 1.65, + "learning_rate": 8.858321555086305e-07, + "loss": 0.623, + "step": 64415 + }, + { + "epoch": 1.65, + "learning_rate": 8.858046660223848e-07, + "loss": 0.8018, + "step": 64416 + }, + { + "epoch": 1.65, + "learning_rate": 8.857771766235735e-07, + "loss": 0.7188, + "step": 64417 + }, + { + "epoch": 1.65, + "learning_rate": 8.857496873122174e-07, + "loss": 0.4678, + "step": 64418 + }, + { + "epoch": 1.65, + "learning_rate": 8.857221980883374e-07, + "loss": 0.8018, + "step": 64419 + }, + { + "epoch": 1.65, + "learning_rate": 8.856947089519545e-07, + "loss": 0.6611, + "step": 64420 + }, + { + "epoch": 1.65, + "learning_rate": 8.856672199030905e-07, + "loss": 0.6104, + "step": 64421 + }, + { + "epoch": 1.65, + "learning_rate": 8.856397309417655e-07, + "loss": 0.7739, + "step": 64422 + }, + { + "epoch": 1.65, + "learning_rate": 8.856122420680008e-07, + "loss": 0.6807, + "step": 64423 + }, + { + "epoch": 1.65, + "learning_rate": 8.855847532818176e-07, + "loss": 0.7007, + "step": 64424 + }, + { + "epoch": 1.65, + "learning_rate": 8.85557264583237e-07, + "loss": 0.6719, + "step": 64425 + }, + { + "epoch": 1.65, + "learning_rate": 8.855297759722796e-07, + "loss": 0.6494, + "step": 64426 + }, + { + "epoch": 1.65, + "learning_rate": 8.855022874489671e-07, + "loss": 0.6514, + "step": 64427 + }, + { + "epoch": 1.65, + "learning_rate": 8.854747990133201e-07, + "loss": 0.5884, + "step": 64428 + }, + { + "epoch": 1.65, + "learning_rate": 8.8544731066536e-07, + "loss": 0.707, + "step": 64429 + }, + { + "epoch": 1.65, + "learning_rate": 8.854198224051073e-07, + "loss": 0.5247, + "step": 64430 + }, + { + "epoch": 1.65, + "learning_rate": 8.853923342325838e-07, + "loss": 0.6084, + "step": 64431 + }, + { + "epoch": 1.65, + "learning_rate": 8.853648461478099e-07, + "loss": 0.6606, + "step": 64432 + }, + { + "epoch": 1.65, + "learning_rate": 8.853373581508067e-07, + "loss": 0.584, + "step": 64433 + }, + { + "epoch": 1.65, + "learning_rate": 8.853098702415955e-07, + "loss": 0.7324, + "step": 64434 + }, + { + "epoch": 1.65, + "learning_rate": 8.852823824201972e-07, + "loss": 0.7393, + "step": 64435 + }, + { + "epoch": 1.65, + "learning_rate": 8.852548946866332e-07, + "loss": 0.6479, + "step": 64436 + }, + { + "epoch": 1.65, + "learning_rate": 8.852274070409238e-07, + "loss": 0.6821, + "step": 64437 + }, + { + "epoch": 1.65, + "learning_rate": 8.851999194830908e-07, + "loss": 0.5144, + "step": 64438 + }, + { + "epoch": 1.65, + "learning_rate": 8.851724320131548e-07, + "loss": 0.584, + "step": 64439 + }, + { + "epoch": 1.65, + "learning_rate": 8.851449446311372e-07, + "loss": 0.5913, + "step": 64440 + }, + { + "epoch": 1.65, + "learning_rate": 8.85117457337059e-07, + "loss": 0.8652, + "step": 64441 + }, + { + "epoch": 1.65, + "learning_rate": 8.850899701309409e-07, + "loss": 0.6517, + "step": 64442 + }, + { + "epoch": 1.65, + "learning_rate": 8.850624830128038e-07, + "loss": 0.6084, + "step": 64443 + }, + { + "epoch": 1.65, + "learning_rate": 8.850349959826694e-07, + "loss": 0.687, + "step": 64444 + }, + { + "epoch": 1.65, + "learning_rate": 8.850075090405582e-07, + "loss": 0.7686, + "step": 64445 + }, + { + "epoch": 1.65, + "learning_rate": 8.849800221864916e-07, + "loss": 0.6621, + "step": 64446 + }, + { + "epoch": 1.65, + "learning_rate": 8.849525354204903e-07, + "loss": 0.6675, + "step": 64447 + }, + { + "epoch": 1.65, + "learning_rate": 8.849250487425759e-07, + "loss": 0.5974, + "step": 64448 + }, + { + "epoch": 1.65, + "learning_rate": 8.848975621527688e-07, + "loss": 0.5737, + "step": 64449 + }, + { + "epoch": 1.65, + "learning_rate": 8.848700756510905e-07, + "loss": 0.4956, + "step": 64450 + }, + { + "epoch": 1.65, + "learning_rate": 8.848425892375621e-07, + "loss": 0.6709, + "step": 64451 + }, + { + "epoch": 1.65, + "learning_rate": 8.848151029122042e-07, + "loss": 0.6309, + "step": 64452 + }, + { + "epoch": 1.65, + "learning_rate": 8.847876166750381e-07, + "loss": 0.6021, + "step": 64453 + }, + { + "epoch": 1.65, + "learning_rate": 8.847601305260846e-07, + "loss": 0.5864, + "step": 64454 + }, + { + "epoch": 1.65, + "learning_rate": 8.847326444653653e-07, + "loss": 0.7607, + "step": 64455 + }, + { + "epoch": 1.65, + "learning_rate": 8.847051584929006e-07, + "loss": 0.6455, + "step": 64456 + }, + { + "epoch": 1.65, + "learning_rate": 8.846776726087122e-07, + "loss": 0.7891, + "step": 64457 + }, + { + "epoch": 1.65, + "learning_rate": 8.846501868128204e-07, + "loss": 0.5425, + "step": 64458 + }, + { + "epoch": 1.65, + "learning_rate": 8.846227011052471e-07, + "loss": 0.6504, + "step": 64459 + }, + { + "epoch": 1.65, + "learning_rate": 8.845952154860128e-07, + "loss": 0.6006, + "step": 64460 + }, + { + "epoch": 1.65, + "learning_rate": 8.845677299551387e-07, + "loss": 0.4795, + "step": 64461 + }, + { + "epoch": 1.65, + "learning_rate": 8.845402445126456e-07, + "loss": 0.5769, + "step": 64462 + }, + { + "epoch": 1.65, + "learning_rate": 8.845127591585547e-07, + "loss": 0.4531, + "step": 64463 + }, + { + "epoch": 1.65, + "learning_rate": 8.84485273892887e-07, + "loss": 0.5498, + "step": 64464 + }, + { + "epoch": 1.65, + "learning_rate": 8.844577887156638e-07, + "loss": 0.6172, + "step": 64465 + }, + { + "epoch": 1.65, + "learning_rate": 8.844303036269058e-07, + "loss": 0.6274, + "step": 64466 + }, + { + "epoch": 1.65, + "learning_rate": 8.844028186266343e-07, + "loss": 0.6777, + "step": 64467 + }, + { + "epoch": 1.65, + "learning_rate": 8.8437533371487e-07, + "loss": 0.6807, + "step": 64468 + }, + { + "epoch": 1.65, + "learning_rate": 8.843478488916346e-07, + "loss": 0.6172, + "step": 64469 + }, + { + "epoch": 1.65, + "learning_rate": 8.843203641569484e-07, + "loss": 0.7012, + "step": 64470 + }, + { + "epoch": 1.65, + "learning_rate": 8.842928795108332e-07, + "loss": 0.5315, + "step": 64471 + }, + { + "epoch": 1.65, + "learning_rate": 8.842653949533094e-07, + "loss": 0.6445, + "step": 64472 + }, + { + "epoch": 1.65, + "learning_rate": 8.842379104843982e-07, + "loss": 0.5386, + "step": 64473 + }, + { + "epoch": 1.65, + "learning_rate": 8.842104261041207e-07, + "loss": 0.6689, + "step": 64474 + }, + { + "epoch": 1.65, + "learning_rate": 8.841829418124978e-07, + "loss": 0.5591, + "step": 64475 + }, + { + "epoch": 1.65, + "learning_rate": 8.84155457609551e-07, + "loss": 0.5234, + "step": 64476 + }, + { + "epoch": 1.65, + "learning_rate": 8.84127973495301e-07, + "loss": 0.6665, + "step": 64477 + }, + { + "epoch": 1.65, + "learning_rate": 8.841004894697687e-07, + "loss": 0.5962, + "step": 64478 + }, + { + "epoch": 1.65, + "learning_rate": 8.840730055329755e-07, + "loss": 0.6367, + "step": 64479 + }, + { + "epoch": 1.65, + "learning_rate": 8.840455216849421e-07, + "loss": 0.6221, + "step": 64480 + }, + { + "epoch": 1.65, + "learning_rate": 8.8401803792569e-07, + "loss": 0.8145, + "step": 64481 + }, + { + "epoch": 1.65, + "learning_rate": 8.839905542552398e-07, + "loss": 0.6992, + "step": 64482 + }, + { + "epoch": 1.65, + "learning_rate": 8.839630706736125e-07, + "loss": 0.7236, + "step": 64483 + }, + { + "epoch": 1.65, + "learning_rate": 8.839355871808296e-07, + "loss": 0.6758, + "step": 64484 + }, + { + "epoch": 1.65, + "learning_rate": 8.839081037769117e-07, + "loss": 0.4636, + "step": 64485 + }, + { + "epoch": 1.65, + "learning_rate": 8.838806204618802e-07, + "loss": 0.8213, + "step": 64486 + }, + { + "epoch": 1.65, + "learning_rate": 8.838531372357557e-07, + "loss": 0.5645, + "step": 64487 + }, + { + "epoch": 1.65, + "learning_rate": 8.838256540985598e-07, + "loss": 0.7227, + "step": 64488 + }, + { + "epoch": 1.65, + "learning_rate": 8.83798171050313e-07, + "loss": 0.6934, + "step": 64489 + }, + { + "epoch": 1.65, + "learning_rate": 8.837706880910369e-07, + "loss": 0.6064, + "step": 64490 + }, + { + "epoch": 1.65, + "learning_rate": 8.837432052207523e-07, + "loss": 0.7676, + "step": 64491 + }, + { + "epoch": 1.65, + "learning_rate": 8.837157224394797e-07, + "loss": 0.5625, + "step": 64492 + }, + { + "epoch": 1.65, + "learning_rate": 8.836882397472411e-07, + "loss": 0.7031, + "step": 64493 + }, + { + "epoch": 1.65, + "learning_rate": 8.83660757144057e-07, + "loss": 0.5654, + "step": 64494 + }, + { + "epoch": 1.65, + "learning_rate": 8.836332746299481e-07, + "loss": 0.5637, + "step": 64495 + }, + { + "epoch": 1.65, + "learning_rate": 8.836057922049363e-07, + "loss": 0.7339, + "step": 64496 + }, + { + "epoch": 1.65, + "learning_rate": 8.835783098690418e-07, + "loss": 0.5134, + "step": 64497 + }, + { + "epoch": 1.65, + "learning_rate": 8.835508276222863e-07, + "loss": 0.792, + "step": 64498 + }, + { + "epoch": 1.65, + "learning_rate": 8.835233454646904e-07, + "loss": 0.5835, + "step": 64499 + }, + { + "epoch": 1.65, + "learning_rate": 8.834958633962756e-07, + "loss": 0.5259, + "step": 64500 + }, + { + "epoch": 1.65, + "learning_rate": 8.834683814170627e-07, + "loss": 0.7305, + "step": 64501 + }, + { + "epoch": 1.65, + "learning_rate": 8.834408995270725e-07, + "loss": 0.6826, + "step": 64502 + }, + { + "epoch": 1.65, + "learning_rate": 8.834134177263263e-07, + "loss": 0.6455, + "step": 64503 + }, + { + "epoch": 1.65, + "learning_rate": 8.833859360148448e-07, + "loss": 0.8037, + "step": 64504 + }, + { + "epoch": 1.65, + "learning_rate": 8.833584543926497e-07, + "loss": 0.5952, + "step": 64505 + }, + { + "epoch": 1.65, + "learning_rate": 8.833309728597613e-07, + "loss": 0.8604, + "step": 64506 + }, + { + "epoch": 1.65, + "learning_rate": 8.833034914162014e-07, + "loss": 0.6094, + "step": 64507 + }, + { + "epoch": 1.65, + "learning_rate": 8.832760100619903e-07, + "loss": 0.709, + "step": 64508 + }, + { + "epoch": 1.65, + "learning_rate": 8.832485287971496e-07, + "loss": 0.6328, + "step": 64509 + }, + { + "epoch": 1.65, + "learning_rate": 8.832210476217e-07, + "loss": 0.5293, + "step": 64510 + }, + { + "epoch": 1.65, + "learning_rate": 8.831935665356631e-07, + "loss": 0.5386, + "step": 64511 + }, + { + "epoch": 1.65, + "learning_rate": 8.831660855390593e-07, + "loss": 0.7529, + "step": 64512 + }, + { + "epoch": 1.65, + "learning_rate": 8.831386046319098e-07, + "loss": 0.6479, + "step": 64513 + }, + { + "epoch": 1.65, + "learning_rate": 8.831111238142356e-07, + "loss": 0.7026, + "step": 64514 + }, + { + "epoch": 1.65, + "learning_rate": 8.830836430860579e-07, + "loss": 0.6367, + "step": 64515 + }, + { + "epoch": 1.65, + "learning_rate": 8.830561624473976e-07, + "loss": 0.667, + "step": 64516 + }, + { + "epoch": 1.65, + "learning_rate": 8.830286818982759e-07, + "loss": 0.7119, + "step": 64517 + }, + { + "epoch": 1.65, + "learning_rate": 8.830012014387136e-07, + "loss": 0.7227, + "step": 64518 + }, + { + "epoch": 1.65, + "learning_rate": 8.829737210687321e-07, + "loss": 0.6582, + "step": 64519 + }, + { + "epoch": 1.65, + "learning_rate": 8.829462407883522e-07, + "loss": 0.7959, + "step": 64520 + }, + { + "epoch": 1.65, + "learning_rate": 8.829187605975952e-07, + "loss": 0.7412, + "step": 64521 + }, + { + "epoch": 1.65, + "learning_rate": 8.828912804964818e-07, + "loss": 0.5151, + "step": 64522 + }, + { + "epoch": 1.65, + "learning_rate": 8.828638004850328e-07, + "loss": 0.7344, + "step": 64523 + }, + { + "epoch": 1.65, + "learning_rate": 8.828363205632701e-07, + "loss": 0.6768, + "step": 64524 + }, + { + "epoch": 1.65, + "learning_rate": 8.828088407312137e-07, + "loss": 0.5542, + "step": 64525 + }, + { + "epoch": 1.65, + "learning_rate": 8.827813609888856e-07, + "loss": 0.584, + "step": 64526 + }, + { + "epoch": 1.65, + "learning_rate": 8.827538813363062e-07, + "loss": 0.8418, + "step": 64527 + }, + { + "epoch": 1.65, + "learning_rate": 8.827264017734969e-07, + "loss": 0.5063, + "step": 64528 + }, + { + "epoch": 1.65, + "learning_rate": 8.826989223004785e-07, + "loss": 0.6602, + "step": 64529 + }, + { + "epoch": 1.65, + "learning_rate": 8.826714429172723e-07, + "loss": 0.7344, + "step": 64530 + }, + { + "epoch": 1.65, + "learning_rate": 8.826439636238993e-07, + "loss": 0.623, + "step": 64531 + }, + { + "epoch": 1.65, + "learning_rate": 8.826164844203802e-07, + "loss": 0.7437, + "step": 64532 + }, + { + "epoch": 1.65, + "learning_rate": 8.825890053067362e-07, + "loss": 0.4678, + "step": 64533 + }, + { + "epoch": 1.65, + "learning_rate": 8.825615262829886e-07, + "loss": 0.7021, + "step": 64534 + }, + { + "epoch": 1.65, + "learning_rate": 8.82534047349158e-07, + "loss": 0.7007, + "step": 64535 + }, + { + "epoch": 1.65, + "learning_rate": 8.825065685052659e-07, + "loss": 0.6826, + "step": 64536 + }, + { + "epoch": 1.65, + "learning_rate": 8.824790897513328e-07, + "loss": 0.6377, + "step": 64537 + }, + { + "epoch": 1.65, + "learning_rate": 8.824516110873803e-07, + "loss": 0.7622, + "step": 64538 + }, + { + "epoch": 1.65, + "learning_rate": 8.824241325134291e-07, + "loss": 0.7158, + "step": 64539 + }, + { + "epoch": 1.65, + "learning_rate": 8.823966540295005e-07, + "loss": 0.5776, + "step": 64540 + }, + { + "epoch": 1.65, + "learning_rate": 8.823691756356155e-07, + "loss": 0.6079, + "step": 64541 + }, + { + "epoch": 1.65, + "learning_rate": 8.823416973317946e-07, + "loss": 0.6592, + "step": 64542 + }, + { + "epoch": 1.65, + "learning_rate": 8.823142191180596e-07, + "loss": 0.4427, + "step": 64543 + }, + { + "epoch": 1.65, + "learning_rate": 8.82286740994431e-07, + "loss": 0.6006, + "step": 64544 + }, + { + "epoch": 1.65, + "learning_rate": 8.8225926296093e-07, + "loss": 0.6797, + "step": 64545 + }, + { + "epoch": 1.65, + "learning_rate": 8.822317850175775e-07, + "loss": 0.6963, + "step": 64546 + }, + { + "epoch": 1.65, + "learning_rate": 8.822043071643951e-07, + "loss": 0.6113, + "step": 64547 + }, + { + "epoch": 1.65, + "learning_rate": 8.821768294014031e-07, + "loss": 0.4442, + "step": 64548 + }, + { + "epoch": 1.65, + "learning_rate": 8.821493517286231e-07, + "loss": 0.4866, + "step": 64549 + }, + { + "epoch": 1.65, + "learning_rate": 8.821218741460761e-07, + "loss": 0.6367, + "step": 64550 + }, + { + "epoch": 1.65, + "learning_rate": 8.820943966537829e-07, + "loss": 0.6245, + "step": 64551 + }, + { + "epoch": 1.65, + "learning_rate": 8.820669192517644e-07, + "loss": 0.7168, + "step": 64552 + }, + { + "epoch": 1.65, + "learning_rate": 8.820394419400418e-07, + "loss": 0.6421, + "step": 64553 + }, + { + "epoch": 1.65, + "learning_rate": 8.820119647186363e-07, + "loss": 0.4469, + "step": 64554 + }, + { + "epoch": 1.65, + "learning_rate": 8.819844875875688e-07, + "loss": 0.8711, + "step": 64555 + }, + { + "epoch": 1.65, + "learning_rate": 8.819570105468602e-07, + "loss": 0.5873, + "step": 64556 + }, + { + "epoch": 1.65, + "learning_rate": 8.819295335965319e-07, + "loss": 0.8535, + "step": 64557 + }, + { + "epoch": 1.65, + "learning_rate": 8.819020567366044e-07, + "loss": 0.7153, + "step": 64558 + }, + { + "epoch": 1.65, + "learning_rate": 8.818745799670994e-07, + "loss": 0.6021, + "step": 64559 + }, + { + "epoch": 1.65, + "learning_rate": 8.818471032880374e-07, + "loss": 0.606, + "step": 64560 + }, + { + "epoch": 1.65, + "learning_rate": 8.818196266994401e-07, + "loss": 0.665, + "step": 64561 + }, + { + "epoch": 1.65, + "learning_rate": 8.817921502013278e-07, + "loss": 0.7119, + "step": 64562 + }, + { + "epoch": 1.65, + "learning_rate": 8.817646737937216e-07, + "loss": 0.6299, + "step": 64563 + }, + { + "epoch": 1.65, + "learning_rate": 8.81737197476643e-07, + "loss": 0.4985, + "step": 64564 + }, + { + "epoch": 1.65, + "learning_rate": 8.817097212501125e-07, + "loss": 0.6445, + "step": 64565 + }, + { + "epoch": 1.65, + "learning_rate": 8.816822451141517e-07, + "loss": 0.8154, + "step": 64566 + }, + { + "epoch": 1.65, + "learning_rate": 8.816547690687813e-07, + "loss": 0.6455, + "step": 64567 + }, + { + "epoch": 1.65, + "learning_rate": 8.816272931140222e-07, + "loss": 0.6562, + "step": 64568 + }, + { + "epoch": 1.65, + "learning_rate": 8.815998172498959e-07, + "loss": 0.498, + "step": 64569 + }, + { + "epoch": 1.65, + "learning_rate": 8.81572341476423e-07, + "loss": 0.7256, + "step": 64570 + }, + { + "epoch": 1.65, + "learning_rate": 8.81544865793625e-07, + "loss": 0.4746, + "step": 64571 + }, + { + "epoch": 1.66, + "learning_rate": 8.815173902015226e-07, + "loss": 0.5016, + "step": 64572 + }, + { + "epoch": 1.66, + "learning_rate": 8.814899147001367e-07, + "loss": 0.7197, + "step": 64573 + }, + { + "epoch": 1.66, + "learning_rate": 8.814624392894886e-07, + "loss": 0.4905, + "step": 64574 + }, + { + "epoch": 1.66, + "learning_rate": 8.814349639695991e-07, + "loss": 0.6182, + "step": 64575 + }, + { + "epoch": 1.66, + "learning_rate": 8.814074887404895e-07, + "loss": 0.8154, + "step": 64576 + }, + { + "epoch": 1.66, + "learning_rate": 8.813800136021806e-07, + "loss": 0.541, + "step": 64577 + }, + { + "epoch": 1.66, + "learning_rate": 8.813525385546939e-07, + "loss": 0.5288, + "step": 64578 + }, + { + "epoch": 1.66, + "learning_rate": 8.813250635980497e-07, + "loss": 0.6631, + "step": 64579 + }, + { + "epoch": 1.66, + "learning_rate": 8.812975887322698e-07, + "loss": 0.6528, + "step": 64580 + }, + { + "epoch": 1.66, + "learning_rate": 8.81270113957375e-07, + "loss": 0.665, + "step": 64581 + }, + { + "epoch": 1.66, + "learning_rate": 8.812426392733858e-07, + "loss": 0.6895, + "step": 64582 + }, + { + "epoch": 1.66, + "learning_rate": 8.812151646803238e-07, + "loss": 0.5654, + "step": 64583 + }, + { + "epoch": 1.66, + "learning_rate": 8.811876901782099e-07, + "loss": 0.4512, + "step": 64584 + }, + { + "epoch": 1.66, + "learning_rate": 8.811602157670652e-07, + "loss": 0.4785, + "step": 64585 + }, + { + "epoch": 1.66, + "learning_rate": 8.811327414469107e-07, + "loss": 0.6406, + "step": 64586 + }, + { + "epoch": 1.66, + "learning_rate": 8.81105267217767e-07, + "loss": 0.5967, + "step": 64587 + }, + { + "epoch": 1.66, + "learning_rate": 8.810777930796559e-07, + "loss": 0.8525, + "step": 64588 + }, + { + "epoch": 1.66, + "learning_rate": 8.810503190325979e-07, + "loss": 0.7949, + "step": 64589 + }, + { + "epoch": 1.66, + "learning_rate": 8.810228450766143e-07, + "loss": 0.5654, + "step": 64590 + }, + { + "epoch": 1.66, + "learning_rate": 8.809953712117263e-07, + "loss": 0.7178, + "step": 64591 + }, + { + "epoch": 1.66, + "learning_rate": 8.809678974379543e-07, + "loss": 0.6147, + "step": 64592 + }, + { + "epoch": 1.66, + "learning_rate": 8.809404237553198e-07, + "loss": 0.6973, + "step": 64593 + }, + { + "epoch": 1.66, + "learning_rate": 8.809129501638436e-07, + "loss": 0.6782, + "step": 64594 + }, + { + "epoch": 1.66, + "learning_rate": 8.80885476663547e-07, + "loss": 0.6357, + "step": 64595 + }, + { + "epoch": 1.66, + "learning_rate": 8.808580032544509e-07, + "loss": 0.7822, + "step": 64596 + }, + { + "epoch": 1.66, + "learning_rate": 8.808305299365765e-07, + "loss": 0.5864, + "step": 64597 + }, + { + "epoch": 1.66, + "learning_rate": 8.808030567099443e-07, + "loss": 0.7568, + "step": 64598 + }, + { + "epoch": 1.66, + "learning_rate": 8.807755835745761e-07, + "loss": 0.6318, + "step": 64599 + }, + { + "epoch": 1.66, + "learning_rate": 8.807481105304922e-07, + "loss": 0.5959, + "step": 64600 + }, + { + "epoch": 1.66, + "learning_rate": 8.807206375777146e-07, + "loss": 0.6152, + "step": 64601 + }, + { + "epoch": 1.66, + "learning_rate": 8.806931647162634e-07, + "loss": 0.8203, + "step": 64602 + }, + { + "epoch": 1.66, + "learning_rate": 8.806656919461599e-07, + "loss": 0.5337, + "step": 64603 + }, + { + "epoch": 1.66, + "learning_rate": 8.806382192674251e-07, + "loss": 0.6216, + "step": 64604 + }, + { + "epoch": 1.66, + "learning_rate": 8.806107466800803e-07, + "loss": 0.5352, + "step": 64605 + }, + { + "epoch": 1.66, + "learning_rate": 8.805832741841461e-07, + "loss": 0.6406, + "step": 64606 + }, + { + "epoch": 1.66, + "learning_rate": 8.80555801779644e-07, + "loss": 0.7422, + "step": 64607 + }, + { + "epoch": 1.66, + "learning_rate": 8.805283294665947e-07, + "loss": 0.5474, + "step": 64608 + }, + { + "epoch": 1.66, + "learning_rate": 8.805008572450196e-07, + "loss": 0.5938, + "step": 64609 + }, + { + "epoch": 1.66, + "learning_rate": 8.804733851149392e-07, + "loss": 0.5269, + "step": 64610 + }, + { + "epoch": 1.66, + "learning_rate": 8.804459130763752e-07, + "loss": 0.5679, + "step": 64611 + }, + { + "epoch": 1.66, + "learning_rate": 8.804184411293482e-07, + "loss": 0.5244, + "step": 64612 + }, + { + "epoch": 1.66, + "learning_rate": 8.803909692738791e-07, + "loss": 0.6543, + "step": 64613 + }, + { + "epoch": 1.66, + "learning_rate": 8.803634975099893e-07, + "loss": 0.6001, + "step": 64614 + }, + { + "epoch": 1.66, + "learning_rate": 8.803360258376994e-07, + "loss": 0.7441, + "step": 64615 + }, + { + "epoch": 1.66, + "learning_rate": 8.80308554257031e-07, + "loss": 0.7402, + "step": 64616 + }, + { + "epoch": 1.66, + "learning_rate": 8.802810827680045e-07, + "loss": 0.5742, + "step": 64617 + }, + { + "epoch": 1.66, + "learning_rate": 8.802536113706415e-07, + "loss": 0.6152, + "step": 64618 + }, + { + "epoch": 1.66, + "learning_rate": 8.802261400649628e-07, + "loss": 0.7852, + "step": 64619 + }, + { + "epoch": 1.66, + "learning_rate": 8.801986688509894e-07, + "loss": 0.5312, + "step": 64620 + }, + { + "epoch": 1.66, + "learning_rate": 8.801711977287428e-07, + "loss": 0.4028, + "step": 64621 + }, + { + "epoch": 1.66, + "learning_rate": 8.801437266982432e-07, + "loss": 0.5176, + "step": 64622 + }, + { + "epoch": 1.66, + "learning_rate": 8.801162557595118e-07, + "loss": 0.5791, + "step": 64623 + }, + { + "epoch": 1.66, + "learning_rate": 8.800887849125702e-07, + "loss": 0.6016, + "step": 64624 + }, + { + "epoch": 1.66, + "learning_rate": 8.800613141574389e-07, + "loss": 0.8672, + "step": 64625 + }, + { + "epoch": 1.66, + "learning_rate": 8.800338434941393e-07, + "loss": 0.8735, + "step": 64626 + }, + { + "epoch": 1.66, + "learning_rate": 8.800063729226921e-07, + "loss": 0.7822, + "step": 64627 + }, + { + "epoch": 1.66, + "learning_rate": 8.799789024431188e-07, + "loss": 0.438, + "step": 64628 + }, + { + "epoch": 1.66, + "learning_rate": 8.799514320554397e-07, + "loss": 0.7451, + "step": 64629 + }, + { + "epoch": 1.66, + "learning_rate": 8.799239617596767e-07, + "loss": 0.6553, + "step": 64630 + }, + { + "epoch": 1.66, + "learning_rate": 8.798964915558505e-07, + "loss": 0.6846, + "step": 64631 + }, + { + "epoch": 1.66, + "learning_rate": 8.798690214439815e-07, + "loss": 0.8926, + "step": 64632 + }, + { + "epoch": 1.66, + "learning_rate": 8.798415514240917e-07, + "loss": 0.604, + "step": 64633 + }, + { + "epoch": 1.66, + "learning_rate": 8.798140814962014e-07, + "loss": 0.8232, + "step": 64634 + }, + { + "epoch": 1.66, + "learning_rate": 8.797866116603321e-07, + "loss": 0.6855, + "step": 64635 + }, + { + "epoch": 1.66, + "learning_rate": 8.797591419165045e-07, + "loss": 0.6152, + "step": 64636 + }, + { + "epoch": 1.66, + "learning_rate": 8.7973167226474e-07, + "loss": 0.6694, + "step": 64637 + }, + { + "epoch": 1.66, + "learning_rate": 8.797042027050592e-07, + "loss": 0.4227, + "step": 64638 + }, + { + "epoch": 1.66, + "learning_rate": 8.796767332374835e-07, + "loss": 0.6387, + "step": 64639 + }, + { + "epoch": 1.66, + "learning_rate": 8.796492638620339e-07, + "loss": 0.5159, + "step": 64640 + }, + { + "epoch": 1.66, + "learning_rate": 8.796217945787315e-07, + "loss": 0.5269, + "step": 64641 + }, + { + "epoch": 1.66, + "learning_rate": 8.795943253875968e-07, + "loss": 0.6025, + "step": 64642 + }, + { + "epoch": 1.66, + "learning_rate": 8.795668562886513e-07, + "loss": 0.6035, + "step": 64643 + }, + { + "epoch": 1.66, + "learning_rate": 8.795393872819158e-07, + "loss": 0.665, + "step": 64644 + }, + { + "epoch": 1.66, + "learning_rate": 8.795119183674116e-07, + "loss": 0.6104, + "step": 64645 + }, + { + "epoch": 1.66, + "learning_rate": 8.794844495451593e-07, + "loss": 0.6631, + "step": 64646 + }, + { + "epoch": 1.66, + "learning_rate": 8.794569808151806e-07, + "loss": 0.6714, + "step": 64647 + }, + { + "epoch": 1.66, + "learning_rate": 8.794295121774959e-07, + "loss": 0.5908, + "step": 64648 + }, + { + "epoch": 1.66, + "learning_rate": 8.794020436321266e-07, + "loss": 0.7031, + "step": 64649 + }, + { + "epoch": 1.66, + "learning_rate": 8.793745751790935e-07, + "loss": 0.6753, + "step": 64650 + }, + { + "epoch": 1.66, + "learning_rate": 8.793471068184179e-07, + "loss": 0.6235, + "step": 64651 + }, + { + "epoch": 1.66, + "learning_rate": 8.793196385501208e-07, + "loss": 0.5659, + "step": 64652 + }, + { + "epoch": 1.66, + "learning_rate": 8.792921703742227e-07, + "loss": 0.6201, + "step": 64653 + }, + { + "epoch": 1.66, + "learning_rate": 8.792647022907454e-07, + "loss": 0.8359, + "step": 64654 + }, + { + "epoch": 1.66, + "learning_rate": 8.792372342997092e-07, + "loss": 0.7305, + "step": 64655 + }, + { + "epoch": 1.66, + "learning_rate": 8.792097664011358e-07, + "loss": 0.6533, + "step": 64656 + }, + { + "epoch": 1.66, + "learning_rate": 8.791822985950459e-07, + "loss": 0.4971, + "step": 64657 + }, + { + "epoch": 1.66, + "learning_rate": 8.791548308814602e-07, + "loss": 0.707, + "step": 64658 + }, + { + "epoch": 1.66, + "learning_rate": 8.791273632604005e-07, + "loss": 0.5859, + "step": 64659 + }, + { + "epoch": 1.66, + "learning_rate": 8.790998957318871e-07, + "loss": 0.6233, + "step": 64660 + }, + { + "epoch": 1.66, + "learning_rate": 8.790724282959419e-07, + "loss": 0.7207, + "step": 64661 + }, + { + "epoch": 1.66, + "learning_rate": 8.790449609525851e-07, + "loss": 0.668, + "step": 64662 + }, + { + "epoch": 1.66, + "learning_rate": 8.790174937018377e-07, + "loss": 0.55, + "step": 64663 + }, + { + "epoch": 1.66, + "learning_rate": 8.789900265437215e-07, + "loss": 0.8936, + "step": 64664 + }, + { + "epoch": 1.66, + "learning_rate": 8.789625594782566e-07, + "loss": 0.6064, + "step": 64665 + }, + { + "epoch": 1.66, + "learning_rate": 8.789350925054648e-07, + "loss": 0.75, + "step": 64666 + }, + { + "epoch": 1.66, + "learning_rate": 8.789076256253666e-07, + "loss": 0.5903, + "step": 64667 + }, + { + "epoch": 1.66, + "learning_rate": 8.788801588379837e-07, + "loss": 0.7656, + "step": 64668 + }, + { + "epoch": 1.66, + "learning_rate": 8.788526921433363e-07, + "loss": 0.7266, + "step": 64669 + }, + { + "epoch": 1.66, + "learning_rate": 8.788252255414459e-07, + "loss": 0.6958, + "step": 64670 + }, + { + "epoch": 1.66, + "learning_rate": 8.787977590323339e-07, + "loss": 0.7393, + "step": 64671 + }, + { + "epoch": 1.66, + "learning_rate": 8.787702926160204e-07, + "loss": 0.7441, + "step": 64672 + }, + { + "epoch": 1.66, + "learning_rate": 8.787428262925269e-07, + "loss": 0.6038, + "step": 64673 + }, + { + "epoch": 1.66, + "learning_rate": 8.787153600618746e-07, + "loss": 0.666, + "step": 64674 + }, + { + "epoch": 1.66, + "learning_rate": 8.786878939240842e-07, + "loss": 0.7266, + "step": 64675 + }, + { + "epoch": 1.66, + "learning_rate": 8.786604278791772e-07, + "loss": 0.6924, + "step": 64676 + }, + { + "epoch": 1.66, + "learning_rate": 8.78632961927174e-07, + "loss": 0.5327, + "step": 64677 + }, + { + "epoch": 1.66, + "learning_rate": 8.786054960680962e-07, + "loss": 0.79, + "step": 64678 + }, + { + "epoch": 1.66, + "learning_rate": 8.785780303019644e-07, + "loss": 0.5894, + "step": 64679 + }, + { + "epoch": 1.66, + "learning_rate": 8.785505646288e-07, + "loss": 0.5684, + "step": 64680 + }, + { + "epoch": 1.66, + "learning_rate": 8.78523099048624e-07, + "loss": 0.5732, + "step": 64681 + }, + { + "epoch": 1.66, + "learning_rate": 8.784956335614569e-07, + "loss": 0.509, + "step": 64682 + }, + { + "epoch": 1.66, + "learning_rate": 8.784681681673204e-07, + "loss": 0.8623, + "step": 64683 + }, + { + "epoch": 1.66, + "learning_rate": 8.78440702866235e-07, + "loss": 0.604, + "step": 64684 + }, + { + "epoch": 1.66, + "learning_rate": 8.784132376582221e-07, + "loss": 0.5679, + "step": 64685 + }, + { + "epoch": 1.66, + "learning_rate": 8.783857725433024e-07, + "loss": 0.7988, + "step": 64686 + }, + { + "epoch": 1.66, + "learning_rate": 8.783583075214973e-07, + "loss": 0.6387, + "step": 64687 + }, + { + "epoch": 1.66, + "learning_rate": 8.783308425928275e-07, + "loss": 0.5669, + "step": 64688 + }, + { + "epoch": 1.66, + "learning_rate": 8.783033777573144e-07, + "loss": 0.5225, + "step": 64689 + }, + { + "epoch": 1.66, + "learning_rate": 8.782759130149785e-07, + "loss": 0.79, + "step": 64690 + }, + { + "epoch": 1.66, + "learning_rate": 8.782484483658417e-07, + "loss": 0.6465, + "step": 64691 + }, + { + "epoch": 1.66, + "learning_rate": 8.782209838099241e-07, + "loss": 0.6528, + "step": 64692 + }, + { + "epoch": 1.66, + "learning_rate": 8.781935193472473e-07, + "loss": 0.4194, + "step": 64693 + }, + { + "epoch": 1.66, + "learning_rate": 8.781660549778317e-07, + "loss": 0.7422, + "step": 64694 + }, + { + "epoch": 1.66, + "learning_rate": 8.781385907016991e-07, + "loss": 0.5317, + "step": 64695 + }, + { + "epoch": 1.66, + "learning_rate": 8.781111265188699e-07, + "loss": 0.6064, + "step": 64696 + }, + { + "epoch": 1.66, + "learning_rate": 8.780836624293656e-07, + "loss": 0.606, + "step": 64697 + }, + { + "epoch": 1.66, + "learning_rate": 8.780561984332069e-07, + "loss": 0.6011, + "step": 64698 + }, + { + "epoch": 1.66, + "learning_rate": 8.780287345304151e-07, + "loss": 0.6279, + "step": 64699 + }, + { + "epoch": 1.66, + "learning_rate": 8.780012707210109e-07, + "loss": 0.7178, + "step": 64700 + }, + { + "epoch": 1.66, + "learning_rate": 8.77973807005016e-07, + "loss": 0.6729, + "step": 64701 + }, + { + "epoch": 1.66, + "learning_rate": 8.779463433824507e-07, + "loss": 0.5908, + "step": 64702 + }, + { + "epoch": 1.66, + "learning_rate": 8.77918879853336e-07, + "loss": 0.7832, + "step": 64703 + }, + { + "epoch": 1.66, + "learning_rate": 8.778914164176934e-07, + "loss": 0.6108, + "step": 64704 + }, + { + "epoch": 1.66, + "learning_rate": 8.778639530755436e-07, + "loss": 0.6738, + "step": 64705 + }, + { + "epoch": 1.66, + "learning_rate": 8.77836489826908e-07, + "loss": 0.6973, + "step": 64706 + }, + { + "epoch": 1.66, + "learning_rate": 8.77809026671807e-07, + "loss": 0.8076, + "step": 64707 + }, + { + "epoch": 1.66, + "learning_rate": 8.777815636102624e-07, + "loss": 0.6641, + "step": 64708 + }, + { + "epoch": 1.66, + "learning_rate": 8.777541006422945e-07, + "loss": 0.6711, + "step": 64709 + }, + { + "epoch": 1.66, + "learning_rate": 8.77726637767925e-07, + "loss": 0.5757, + "step": 64710 + }, + { + "epoch": 1.66, + "learning_rate": 8.776991749871747e-07, + "loss": 0.542, + "step": 64711 + }, + { + "epoch": 1.66, + "learning_rate": 8.776717123000643e-07, + "loss": 0.4817, + "step": 64712 + }, + { + "epoch": 1.66, + "learning_rate": 8.776442497066149e-07, + "loss": 0.7422, + "step": 64713 + }, + { + "epoch": 1.66, + "learning_rate": 8.776167872068479e-07, + "loss": 0.7734, + "step": 64714 + }, + { + "epoch": 1.66, + "learning_rate": 8.775893248007839e-07, + "loss": 0.5913, + "step": 64715 + }, + { + "epoch": 1.66, + "learning_rate": 8.775618624884442e-07, + "loss": 0.7686, + "step": 64716 + }, + { + "epoch": 1.66, + "learning_rate": 8.775344002698496e-07, + "loss": 0.571, + "step": 64717 + }, + { + "epoch": 1.66, + "learning_rate": 8.775069381450215e-07, + "loss": 0.6309, + "step": 64718 + }, + { + "epoch": 1.66, + "learning_rate": 8.774794761139805e-07, + "loss": 0.6846, + "step": 64719 + }, + { + "epoch": 1.66, + "learning_rate": 8.774520141767483e-07, + "loss": 0.707, + "step": 64720 + }, + { + "epoch": 1.66, + "learning_rate": 8.774245523333452e-07, + "loss": 0.543, + "step": 64721 + }, + { + "epoch": 1.66, + "learning_rate": 8.773970905837922e-07, + "loss": 0.645, + "step": 64722 + }, + { + "epoch": 1.66, + "learning_rate": 8.773696289281109e-07, + "loss": 0.6519, + "step": 64723 + }, + { + "epoch": 1.66, + "learning_rate": 8.77342167366322e-07, + "loss": 0.6689, + "step": 64724 + }, + { + "epoch": 1.66, + "learning_rate": 8.773147058984465e-07, + "loss": 0.834, + "step": 64725 + }, + { + "epoch": 1.66, + "learning_rate": 8.772872445245053e-07, + "loss": 0.6748, + "step": 64726 + }, + { + "epoch": 1.66, + "learning_rate": 8.7725978324452e-07, + "loss": 0.646, + "step": 64727 + }, + { + "epoch": 1.66, + "learning_rate": 8.772323220585108e-07, + "loss": 0.6982, + "step": 64728 + }, + { + "epoch": 1.66, + "learning_rate": 8.772048609664996e-07, + "loss": 0.5708, + "step": 64729 + }, + { + "epoch": 1.66, + "learning_rate": 8.771773999685071e-07, + "loss": 0.7002, + "step": 64730 + }, + { + "epoch": 1.66, + "learning_rate": 8.77149939064554e-07, + "loss": 0.6548, + "step": 64731 + }, + { + "epoch": 1.66, + "learning_rate": 8.771224782546614e-07, + "loss": 0.5254, + "step": 64732 + }, + { + "epoch": 1.66, + "learning_rate": 8.770950175388507e-07, + "loss": 0.6733, + "step": 64733 + }, + { + "epoch": 1.66, + "learning_rate": 8.770675569171423e-07, + "loss": 0.5479, + "step": 64734 + }, + { + "epoch": 1.66, + "learning_rate": 8.770400963895579e-07, + "loss": 0.599, + "step": 64735 + }, + { + "epoch": 1.66, + "learning_rate": 8.770126359561181e-07, + "loss": 0.6641, + "step": 64736 + }, + { + "epoch": 1.66, + "learning_rate": 8.769851756168443e-07, + "loss": 0.5369, + "step": 64737 + }, + { + "epoch": 1.66, + "learning_rate": 8.76957715371757e-07, + "loss": 0.5126, + "step": 64738 + }, + { + "epoch": 1.66, + "learning_rate": 8.769302552208778e-07, + "loss": 0.6172, + "step": 64739 + }, + { + "epoch": 1.66, + "learning_rate": 8.769027951642276e-07, + "loss": 0.7061, + "step": 64740 + }, + { + "epoch": 1.66, + "learning_rate": 8.768753352018269e-07, + "loss": 0.646, + "step": 64741 + }, + { + "epoch": 1.66, + "learning_rate": 8.768478753336974e-07, + "loss": 0.5479, + "step": 64742 + }, + { + "epoch": 1.66, + "learning_rate": 8.768204155598593e-07, + "loss": 0.6938, + "step": 64743 + }, + { + "epoch": 1.66, + "learning_rate": 8.767929558803347e-07, + "loss": 0.6611, + "step": 64744 + }, + { + "epoch": 1.66, + "learning_rate": 8.767654962951437e-07, + "loss": 0.6299, + "step": 64745 + }, + { + "epoch": 1.66, + "learning_rate": 8.767380368043078e-07, + "loss": 0.481, + "step": 64746 + }, + { + "epoch": 1.66, + "learning_rate": 8.767105774078478e-07, + "loss": 0.5928, + "step": 64747 + }, + { + "epoch": 1.66, + "learning_rate": 8.76683118105785e-07, + "loss": 0.7998, + "step": 64748 + }, + { + "epoch": 1.66, + "learning_rate": 8.766556588981404e-07, + "loss": 0.6904, + "step": 64749 + }, + { + "epoch": 1.66, + "learning_rate": 8.76628199784935e-07, + "loss": 0.6528, + "step": 64750 + }, + { + "epoch": 1.66, + "learning_rate": 8.766007407661893e-07, + "loss": 0.626, + "step": 64751 + }, + { + "epoch": 1.66, + "learning_rate": 8.76573281841925e-07, + "loss": 0.7012, + "step": 64752 + }, + { + "epoch": 1.66, + "learning_rate": 8.765458230121626e-07, + "loss": 0.6953, + "step": 64753 + }, + { + "epoch": 1.66, + "learning_rate": 8.765183642769236e-07, + "loss": 0.4121, + "step": 64754 + }, + { + "epoch": 1.66, + "learning_rate": 8.764909056362286e-07, + "loss": 0.5435, + "step": 64755 + }, + { + "epoch": 1.66, + "learning_rate": 8.764634470900991e-07, + "loss": 0.7656, + "step": 64756 + }, + { + "epoch": 1.66, + "learning_rate": 8.764359886385556e-07, + "loss": 0.5903, + "step": 64757 + }, + { + "epoch": 1.66, + "learning_rate": 8.764085302816196e-07, + "loss": 0.5957, + "step": 64758 + }, + { + "epoch": 1.66, + "learning_rate": 8.763810720193118e-07, + "loss": 0.6963, + "step": 64759 + }, + { + "epoch": 1.66, + "learning_rate": 8.763536138516536e-07, + "loss": 0.4824, + "step": 64760 + }, + { + "epoch": 1.66, + "learning_rate": 8.763261557786656e-07, + "loss": 0.6372, + "step": 64761 + }, + { + "epoch": 1.66, + "learning_rate": 8.762986978003688e-07, + "loss": 0.6387, + "step": 64762 + }, + { + "epoch": 1.66, + "learning_rate": 8.762712399167846e-07, + "loss": 0.8613, + "step": 64763 + }, + { + "epoch": 1.66, + "learning_rate": 8.762437821279335e-07, + "loss": 0.6968, + "step": 64764 + }, + { + "epoch": 1.66, + "learning_rate": 8.762163244338371e-07, + "loss": 0.6895, + "step": 64765 + }, + { + "epoch": 1.66, + "learning_rate": 8.761888668345162e-07, + "loss": 0.7383, + "step": 64766 + }, + { + "epoch": 1.66, + "learning_rate": 8.761614093299916e-07, + "loss": 0.7446, + "step": 64767 + }, + { + "epoch": 1.66, + "learning_rate": 8.761339519202848e-07, + "loss": 0.5527, + "step": 64768 + }, + { + "epoch": 1.66, + "learning_rate": 8.761064946054162e-07, + "loss": 0.625, + "step": 64769 + }, + { + "epoch": 1.66, + "learning_rate": 8.760790373854076e-07, + "loss": 0.5068, + "step": 64770 + }, + { + "epoch": 1.66, + "learning_rate": 8.760515802602793e-07, + "loss": 0.6309, + "step": 64771 + }, + { + "epoch": 1.66, + "learning_rate": 8.760241232300526e-07, + "loss": 0.6582, + "step": 64772 + }, + { + "epoch": 1.66, + "learning_rate": 8.759966662947487e-07, + "loss": 0.5605, + "step": 64773 + }, + { + "epoch": 1.66, + "learning_rate": 8.75969209454388e-07, + "loss": 0.6401, + "step": 64774 + }, + { + "epoch": 1.66, + "learning_rate": 8.759417527089924e-07, + "loss": 0.4548, + "step": 64775 + }, + { + "epoch": 1.66, + "learning_rate": 8.759142960585822e-07, + "loss": 0.5903, + "step": 64776 + }, + { + "epoch": 1.66, + "learning_rate": 8.75886839503179e-07, + "loss": 0.626, + "step": 64777 + }, + { + "epoch": 1.66, + "learning_rate": 8.758593830428032e-07, + "loss": 0.7236, + "step": 64778 + }, + { + "epoch": 1.66, + "learning_rate": 8.758319266774766e-07, + "loss": 0.6587, + "step": 64779 + }, + { + "epoch": 1.66, + "learning_rate": 8.758044704072198e-07, + "loss": 0.6802, + "step": 64780 + }, + { + "epoch": 1.66, + "learning_rate": 8.757770142320536e-07, + "loss": 0.6128, + "step": 64781 + }, + { + "epoch": 1.66, + "learning_rate": 8.757495581519991e-07, + "loss": 0.6929, + "step": 64782 + }, + { + "epoch": 1.66, + "learning_rate": 8.757221021670777e-07, + "loss": 0.6836, + "step": 64783 + }, + { + "epoch": 1.66, + "learning_rate": 8.756946462773099e-07, + "loss": 0.6973, + "step": 64784 + }, + { + "epoch": 1.66, + "learning_rate": 8.756671904827172e-07, + "loss": 0.6108, + "step": 64785 + }, + { + "epoch": 1.66, + "learning_rate": 8.756397347833203e-07, + "loss": 0.5938, + "step": 64786 + }, + { + "epoch": 1.66, + "learning_rate": 8.756122791791404e-07, + "loss": 0.6353, + "step": 64787 + }, + { + "epoch": 1.66, + "learning_rate": 8.755848236701982e-07, + "loss": 0.5803, + "step": 64788 + }, + { + "epoch": 1.66, + "learning_rate": 8.755573682565154e-07, + "loss": 0.5701, + "step": 64789 + }, + { + "epoch": 1.66, + "learning_rate": 8.755299129381126e-07, + "loss": 0.5869, + "step": 64790 + }, + { + "epoch": 1.66, + "learning_rate": 8.755024577150105e-07, + "loss": 0.6328, + "step": 64791 + }, + { + "epoch": 1.66, + "learning_rate": 8.754750025872308e-07, + "loss": 0.6943, + "step": 64792 + }, + { + "epoch": 1.66, + "learning_rate": 8.754475475547937e-07, + "loss": 0.7832, + "step": 64793 + }, + { + "epoch": 1.66, + "learning_rate": 8.75420092617721e-07, + "loss": 0.7295, + "step": 64794 + }, + { + "epoch": 1.66, + "learning_rate": 8.753926377760333e-07, + "loss": 0.4084, + "step": 64795 + }, + { + "epoch": 1.66, + "learning_rate": 8.753651830297517e-07, + "loss": 0.5603, + "step": 64796 + }, + { + "epoch": 1.66, + "learning_rate": 8.753377283788972e-07, + "loss": 0.6162, + "step": 64797 + }, + { + "epoch": 1.66, + "learning_rate": 8.75310273823491e-07, + "loss": 0.593, + "step": 64798 + }, + { + "epoch": 1.66, + "learning_rate": 8.75282819363554e-07, + "loss": 0.688, + "step": 64799 + }, + { + "epoch": 1.66, + "learning_rate": 8.752553649991076e-07, + "loss": 0.5508, + "step": 64800 + }, + { + "epoch": 1.66, + "learning_rate": 8.752279107301719e-07, + "loss": 0.666, + "step": 64801 + }, + { + "epoch": 1.66, + "learning_rate": 8.752004565567687e-07, + "loss": 0.877, + "step": 64802 + }, + { + "epoch": 1.66, + "learning_rate": 8.751730024789185e-07, + "loss": 0.5889, + "step": 64803 + }, + { + "epoch": 1.66, + "learning_rate": 8.751455484966428e-07, + "loss": 0.6016, + "step": 64804 + }, + { + "epoch": 1.66, + "learning_rate": 8.751180946099621e-07, + "loss": 0.502, + "step": 64805 + }, + { + "epoch": 1.66, + "learning_rate": 8.750906408188981e-07, + "loss": 0.5509, + "step": 64806 + }, + { + "epoch": 1.66, + "learning_rate": 8.750631871234712e-07, + "loss": 0.5557, + "step": 64807 + }, + { + "epoch": 1.66, + "learning_rate": 8.750357335237029e-07, + "loss": 0.4956, + "step": 64808 + }, + { + "epoch": 1.66, + "learning_rate": 8.750082800196138e-07, + "loss": 0.6191, + "step": 64809 + }, + { + "epoch": 1.66, + "learning_rate": 8.749808266112255e-07, + "loss": 0.5967, + "step": 64810 + }, + { + "epoch": 1.66, + "learning_rate": 8.749533732985583e-07, + "loss": 0.6904, + "step": 64811 + }, + { + "epoch": 1.66, + "learning_rate": 8.749259200816335e-07, + "loss": 0.6914, + "step": 64812 + }, + { + "epoch": 1.66, + "learning_rate": 8.748984669604724e-07, + "loss": 0.7124, + "step": 64813 + }, + { + "epoch": 1.66, + "learning_rate": 8.748710139350954e-07, + "loss": 0.5244, + "step": 64814 + }, + { + "epoch": 1.66, + "learning_rate": 8.748435610055244e-07, + "loss": 0.6772, + "step": 64815 + }, + { + "epoch": 1.66, + "learning_rate": 8.748161081717795e-07, + "loss": 0.7432, + "step": 64816 + }, + { + "epoch": 1.66, + "learning_rate": 8.747886554338824e-07, + "loss": 0.6431, + "step": 64817 + }, + { + "epoch": 1.66, + "learning_rate": 8.747612027918537e-07, + "loss": 0.5659, + "step": 64818 + }, + { + "epoch": 1.66, + "learning_rate": 8.747337502457148e-07, + "loss": 0.8506, + "step": 64819 + }, + { + "epoch": 1.66, + "learning_rate": 8.747062977954867e-07, + "loss": 0.6836, + "step": 64820 + }, + { + "epoch": 1.66, + "learning_rate": 8.7467884544119e-07, + "loss": 0.6567, + "step": 64821 + }, + { + "epoch": 1.66, + "learning_rate": 8.746513931828458e-07, + "loss": 0.5664, + "step": 64822 + }, + { + "epoch": 1.66, + "learning_rate": 8.746239410204754e-07, + "loss": 0.6426, + "step": 64823 + }, + { + "epoch": 1.66, + "learning_rate": 8.745964889540995e-07, + "loss": 0.6812, + "step": 64824 + }, + { + "epoch": 1.66, + "learning_rate": 8.745690369837395e-07, + "loss": 0.6787, + "step": 64825 + }, + { + "epoch": 1.66, + "learning_rate": 8.74541585109416e-07, + "loss": 0.6807, + "step": 64826 + }, + { + "epoch": 1.66, + "learning_rate": 8.745141333311506e-07, + "loss": 0.6714, + "step": 64827 + }, + { + "epoch": 1.66, + "learning_rate": 8.744866816489635e-07, + "loss": 0.792, + "step": 64828 + }, + { + "epoch": 1.66, + "learning_rate": 8.744592300628765e-07, + "loss": 0.6196, + "step": 64829 + }, + { + "epoch": 1.66, + "learning_rate": 8.744317785729106e-07, + "loss": 0.5586, + "step": 64830 + }, + { + "epoch": 1.66, + "learning_rate": 8.744043271790859e-07, + "loss": 0.5668, + "step": 64831 + }, + { + "epoch": 1.66, + "learning_rate": 8.743768758814244e-07, + "loss": 0.6836, + "step": 64832 + }, + { + "epoch": 1.66, + "learning_rate": 8.743494246799465e-07, + "loss": 0.7861, + "step": 64833 + }, + { + "epoch": 1.66, + "learning_rate": 8.743219735746737e-07, + "loss": 0.519, + "step": 64834 + }, + { + "epoch": 1.66, + "learning_rate": 8.742945225656264e-07, + "loss": 0.8115, + "step": 64835 + }, + { + "epoch": 1.66, + "learning_rate": 8.742670716528264e-07, + "loss": 0.7007, + "step": 64836 + }, + { + "epoch": 1.66, + "learning_rate": 8.742396208362941e-07, + "loss": 0.6006, + "step": 64837 + }, + { + "epoch": 1.66, + "learning_rate": 8.742121701160508e-07, + "loss": 0.6733, + "step": 64838 + }, + { + "epoch": 1.66, + "learning_rate": 8.741847194921176e-07, + "loss": 0.6514, + "step": 64839 + }, + { + "epoch": 1.66, + "learning_rate": 8.741572689645156e-07, + "loss": 0.665, + "step": 64840 + }, + { + "epoch": 1.66, + "learning_rate": 8.741298185332651e-07, + "loss": 0.6499, + "step": 64841 + }, + { + "epoch": 1.66, + "learning_rate": 8.741023681983879e-07, + "loss": 0.7451, + "step": 64842 + }, + { + "epoch": 1.66, + "learning_rate": 8.740749179599045e-07, + "loss": 0.5413, + "step": 64843 + }, + { + "epoch": 1.66, + "learning_rate": 8.740474678178363e-07, + "loss": 0.6914, + "step": 64844 + }, + { + "epoch": 1.66, + "learning_rate": 8.740200177722039e-07, + "loss": 0.6304, + "step": 64845 + }, + { + "epoch": 1.66, + "learning_rate": 8.739925678230288e-07, + "loss": 0.5542, + "step": 64846 + }, + { + "epoch": 1.66, + "learning_rate": 8.739651179703318e-07, + "loss": 0.5459, + "step": 64847 + }, + { + "epoch": 1.66, + "learning_rate": 8.739376682141339e-07, + "loss": 0.5928, + "step": 64848 + }, + { + "epoch": 1.66, + "learning_rate": 8.73910218554456e-07, + "loss": 0.5957, + "step": 64849 + }, + { + "epoch": 1.66, + "learning_rate": 8.738827689913198e-07, + "loss": 0.6357, + "step": 64850 + }, + { + "epoch": 1.66, + "learning_rate": 8.738553195247453e-07, + "loss": 0.7656, + "step": 64851 + }, + { + "epoch": 1.66, + "learning_rate": 8.738278701547539e-07, + "loss": 0.6094, + "step": 64852 + }, + { + "epoch": 1.66, + "learning_rate": 8.738004208813669e-07, + "loss": 0.6196, + "step": 64853 + }, + { + "epoch": 1.66, + "learning_rate": 8.73772971704605e-07, + "loss": 0.6528, + "step": 64854 + }, + { + "epoch": 1.66, + "learning_rate": 8.737455226244894e-07, + "loss": 0.6128, + "step": 64855 + }, + { + "epoch": 1.66, + "learning_rate": 8.737180736410411e-07, + "loss": 0.6211, + "step": 64856 + }, + { + "epoch": 1.66, + "learning_rate": 8.736906247542808e-07, + "loss": 0.5396, + "step": 64857 + }, + { + "epoch": 1.66, + "learning_rate": 8.736631759642302e-07, + "loss": 0.5283, + "step": 64858 + }, + { + "epoch": 1.66, + "learning_rate": 8.736357272709094e-07, + "loss": 0.6238, + "step": 64859 + }, + { + "epoch": 1.66, + "learning_rate": 8.736082786743405e-07, + "loss": 0.5254, + "step": 64860 + }, + { + "epoch": 1.66, + "learning_rate": 8.735808301745436e-07, + "loss": 0.5708, + "step": 64861 + }, + { + "epoch": 1.66, + "learning_rate": 8.735533817715399e-07, + "loss": 0.7793, + "step": 64862 + }, + { + "epoch": 1.66, + "learning_rate": 8.735259334653508e-07, + "loss": 0.7021, + "step": 64863 + }, + { + "epoch": 1.66, + "learning_rate": 8.734984852559969e-07, + "loss": 0.6036, + "step": 64864 + }, + { + "epoch": 1.66, + "learning_rate": 8.734710371434996e-07, + "loss": 0.6382, + "step": 64865 + }, + { + "epoch": 1.66, + "learning_rate": 8.734435891278794e-07, + "loss": 0.4995, + "step": 64866 + }, + { + "epoch": 1.66, + "learning_rate": 8.734161412091578e-07, + "loss": 0.54, + "step": 64867 + }, + { + "epoch": 1.66, + "learning_rate": 8.733886933873556e-07, + "loss": 0.4243, + "step": 64868 + }, + { + "epoch": 1.66, + "learning_rate": 8.73361245662494e-07, + "loss": 0.6582, + "step": 64869 + }, + { + "epoch": 1.66, + "learning_rate": 8.733337980345941e-07, + "loss": 0.7686, + "step": 64870 + }, + { + "epoch": 1.66, + "learning_rate": 8.733063505036762e-07, + "loss": 0.4672, + "step": 64871 + }, + { + "epoch": 1.66, + "learning_rate": 8.73278903069762e-07, + "loss": 0.7109, + "step": 64872 + }, + { + "epoch": 1.66, + "learning_rate": 8.732514557328725e-07, + "loss": 0.5977, + "step": 64873 + }, + { + "epoch": 1.66, + "learning_rate": 8.732240084930281e-07, + "loss": 0.5366, + "step": 64874 + }, + { + "epoch": 1.66, + "learning_rate": 8.731965613502505e-07, + "loss": 0.5513, + "step": 64875 + }, + { + "epoch": 1.66, + "learning_rate": 8.731691143045603e-07, + "loss": 0.4143, + "step": 64876 + }, + { + "epoch": 1.66, + "learning_rate": 8.731416673559789e-07, + "loss": 0.5508, + "step": 64877 + }, + { + "epoch": 1.66, + "learning_rate": 8.731142205045269e-07, + "loss": 0.603, + "step": 64878 + }, + { + "epoch": 1.66, + "learning_rate": 8.730867737502257e-07, + "loss": 0.5713, + "step": 64879 + }, + { + "epoch": 1.66, + "learning_rate": 8.730593270930963e-07, + "loss": 0.6333, + "step": 64880 + }, + { + "epoch": 1.66, + "learning_rate": 8.730318805331591e-07, + "loss": 0.7119, + "step": 64881 + }, + { + "epoch": 1.66, + "learning_rate": 8.730044340704359e-07, + "loss": 0.666, + "step": 64882 + }, + { + "epoch": 1.66, + "learning_rate": 8.72976987704947e-07, + "loss": 0.6436, + "step": 64883 + }, + { + "epoch": 1.66, + "learning_rate": 8.729495414367141e-07, + "loss": 0.7324, + "step": 64884 + }, + { + "epoch": 1.66, + "learning_rate": 8.729220952657576e-07, + "loss": 0.8232, + "step": 64885 + }, + { + "epoch": 1.66, + "learning_rate": 8.72894649192099e-07, + "loss": 0.6504, + "step": 64886 + }, + { + "epoch": 1.66, + "learning_rate": 8.72867203215759e-07, + "loss": 0.5979, + "step": 64887 + }, + { + "epoch": 1.66, + "learning_rate": 8.728397573367589e-07, + "loss": 0.6152, + "step": 64888 + }, + { + "epoch": 1.66, + "learning_rate": 8.728123115551193e-07, + "loss": 0.5151, + "step": 64889 + }, + { + "epoch": 1.66, + "learning_rate": 8.727848658708621e-07, + "loss": 0.6826, + "step": 64890 + }, + { + "epoch": 1.66, + "learning_rate": 8.727574202840071e-07, + "loss": 0.5446, + "step": 64891 + }, + { + "epoch": 1.66, + "learning_rate": 8.727299747945761e-07, + "loss": 0.603, + "step": 64892 + }, + { + "epoch": 1.66, + "learning_rate": 8.727025294025896e-07, + "loss": 0.6221, + "step": 64893 + }, + { + "epoch": 1.66, + "learning_rate": 8.726750841080692e-07, + "loss": 0.5811, + "step": 64894 + }, + { + "epoch": 1.66, + "learning_rate": 8.726476389110355e-07, + "loss": 0.5493, + "step": 64895 + }, + { + "epoch": 1.66, + "learning_rate": 8.726201938115098e-07, + "loss": 0.603, + "step": 64896 + }, + { + "epoch": 1.66, + "learning_rate": 8.725927488095127e-07, + "loss": 0.6357, + "step": 64897 + }, + { + "epoch": 1.66, + "learning_rate": 8.725653039050658e-07, + "loss": 0.5764, + "step": 64898 + }, + { + "epoch": 1.66, + "learning_rate": 8.725378590981895e-07, + "loss": 0.6079, + "step": 64899 + }, + { + "epoch": 1.66, + "learning_rate": 8.725104143889055e-07, + "loss": 0.6934, + "step": 64900 + }, + { + "epoch": 1.66, + "learning_rate": 8.724829697772342e-07, + "loss": 0.6001, + "step": 64901 + }, + { + "epoch": 1.66, + "learning_rate": 8.724555252631967e-07, + "loss": 0.6665, + "step": 64902 + }, + { + "epoch": 1.66, + "learning_rate": 8.724280808468143e-07, + "loss": 0.4741, + "step": 64903 + }, + { + "epoch": 1.66, + "learning_rate": 8.724006365281076e-07, + "loss": 0.7178, + "step": 64904 + }, + { + "epoch": 1.66, + "learning_rate": 8.72373192307098e-07, + "loss": 0.6738, + "step": 64905 + }, + { + "epoch": 1.66, + "learning_rate": 8.723457481838064e-07, + "loss": 0.5212, + "step": 64906 + }, + { + "epoch": 1.66, + "learning_rate": 8.723183041582538e-07, + "loss": 0.7393, + "step": 64907 + }, + { + "epoch": 1.66, + "learning_rate": 8.72290860230461e-07, + "loss": 0.5016, + "step": 64908 + }, + { + "epoch": 1.66, + "learning_rate": 8.722634164004496e-07, + "loss": 0.5996, + "step": 64909 + }, + { + "epoch": 1.66, + "learning_rate": 8.722359726682403e-07, + "loss": 0.4175, + "step": 64910 + }, + { + "epoch": 1.66, + "learning_rate": 8.722085290338539e-07, + "loss": 0.5913, + "step": 64911 + }, + { + "epoch": 1.66, + "learning_rate": 8.721810854973112e-07, + "loss": 0.6748, + "step": 64912 + }, + { + "epoch": 1.66, + "learning_rate": 8.72153642058634e-07, + "loss": 0.647, + "step": 64913 + }, + { + "epoch": 1.66, + "learning_rate": 8.721261987178426e-07, + "loss": 0.6211, + "step": 64914 + }, + { + "epoch": 1.66, + "learning_rate": 8.720987554749585e-07, + "loss": 0.6201, + "step": 64915 + }, + { + "epoch": 1.66, + "learning_rate": 8.720713123300022e-07, + "loss": 0.3367, + "step": 64916 + }, + { + "epoch": 1.66, + "learning_rate": 8.720438692829953e-07, + "loss": 0.6606, + "step": 64917 + }, + { + "epoch": 1.66, + "learning_rate": 8.720164263339583e-07, + "loss": 0.708, + "step": 64918 + }, + { + "epoch": 1.66, + "learning_rate": 8.719889834829126e-07, + "loss": 0.3324, + "step": 64919 + }, + { + "epoch": 1.66, + "learning_rate": 8.719615407298793e-07, + "loss": 0.5801, + "step": 64920 + }, + { + "epoch": 1.66, + "learning_rate": 8.719340980748788e-07, + "loss": 0.8564, + "step": 64921 + }, + { + "epoch": 1.66, + "learning_rate": 8.719066555179326e-07, + "loss": 0.604, + "step": 64922 + }, + { + "epoch": 1.66, + "learning_rate": 8.718792130590613e-07, + "loss": 0.7402, + "step": 64923 + }, + { + "epoch": 1.66, + "learning_rate": 8.718517706982865e-07, + "loss": 0.5396, + "step": 64924 + }, + { + "epoch": 1.66, + "learning_rate": 8.718243284356287e-07, + "loss": 0.6582, + "step": 64925 + }, + { + "epoch": 1.66, + "learning_rate": 8.717968862711094e-07, + "loss": 0.6216, + "step": 64926 + }, + { + "epoch": 1.66, + "learning_rate": 8.71769444204749e-07, + "loss": 0.6904, + "step": 64927 + }, + { + "epoch": 1.66, + "learning_rate": 8.717420022365692e-07, + "loss": 0.5234, + "step": 64928 + }, + { + "epoch": 1.66, + "learning_rate": 8.717145603665904e-07, + "loss": 0.5747, + "step": 64929 + }, + { + "epoch": 1.66, + "learning_rate": 8.716871185948342e-07, + "loss": 0.6279, + "step": 64930 + }, + { + "epoch": 1.66, + "learning_rate": 8.716596769213209e-07, + "loss": 0.6641, + "step": 64931 + }, + { + "epoch": 1.66, + "learning_rate": 8.716322353460721e-07, + "loss": 0.6982, + "step": 64932 + }, + { + "epoch": 1.66, + "learning_rate": 8.716047938691084e-07, + "loss": 0.6792, + "step": 64933 + }, + { + "epoch": 1.66, + "learning_rate": 8.715773524904511e-07, + "loss": 0.667, + "step": 64934 + }, + { + "epoch": 1.66, + "learning_rate": 8.71549911210121e-07, + "loss": 0.6504, + "step": 64935 + }, + { + "epoch": 1.66, + "learning_rate": 8.715224700281394e-07, + "loss": 0.5967, + "step": 64936 + }, + { + "epoch": 1.66, + "learning_rate": 8.714950289445269e-07, + "loss": 0.4773, + "step": 64937 + }, + { + "epoch": 1.66, + "learning_rate": 8.714675879593049e-07, + "loss": 0.7803, + "step": 64938 + }, + { + "epoch": 1.66, + "learning_rate": 8.714401470724942e-07, + "loss": 0.5513, + "step": 64939 + }, + { + "epoch": 1.66, + "learning_rate": 8.714127062841162e-07, + "loss": 0.6121, + "step": 64940 + }, + { + "epoch": 1.66, + "learning_rate": 8.713852655941914e-07, + "loss": 0.4902, + "step": 64941 + }, + { + "epoch": 1.66, + "learning_rate": 8.713578250027408e-07, + "loss": 0.6885, + "step": 64942 + }, + { + "epoch": 1.66, + "learning_rate": 8.713303845097859e-07, + "loss": 0.6748, + "step": 64943 + }, + { + "epoch": 1.66, + "learning_rate": 8.71302944115347e-07, + "loss": 0.4602, + "step": 64944 + }, + { + "epoch": 1.66, + "learning_rate": 8.712755038194458e-07, + "loss": 0.3499, + "step": 64945 + }, + { + "epoch": 1.66, + "learning_rate": 8.71248063622103e-07, + "loss": 0.75, + "step": 64946 + }, + { + "epoch": 1.66, + "learning_rate": 8.712206235233395e-07, + "loss": 0.5879, + "step": 64947 + }, + { + "epoch": 1.66, + "learning_rate": 8.711931835231766e-07, + "loss": 0.4783, + "step": 64948 + }, + { + "epoch": 1.66, + "learning_rate": 8.71165743621635e-07, + "loss": 0.6665, + "step": 64949 + }, + { + "epoch": 1.66, + "learning_rate": 8.711383038187362e-07, + "loss": 0.6826, + "step": 64950 + }, + { + "epoch": 1.66, + "learning_rate": 8.711108641145008e-07, + "loss": 0.8467, + "step": 64951 + }, + { + "epoch": 1.66, + "learning_rate": 8.710834245089495e-07, + "loss": 0.8262, + "step": 64952 + }, + { + "epoch": 1.66, + "learning_rate": 8.71055985002104e-07, + "loss": 0.5732, + "step": 64953 + }, + { + "epoch": 1.66, + "learning_rate": 8.710285455939848e-07, + "loss": 0.605, + "step": 64954 + }, + { + "epoch": 1.66, + "learning_rate": 8.710011062846133e-07, + "loss": 0.6064, + "step": 64955 + }, + { + "epoch": 1.66, + "learning_rate": 8.709736670740102e-07, + "loss": 0.7109, + "step": 64956 + }, + { + "epoch": 1.66, + "learning_rate": 8.709462279621968e-07, + "loss": 0.5942, + "step": 64957 + }, + { + "epoch": 1.66, + "learning_rate": 8.709187889491936e-07, + "loss": 0.603, + "step": 64958 + }, + { + "epoch": 1.66, + "learning_rate": 8.708913500350223e-07, + "loss": 0.6611, + "step": 64959 + }, + { + "epoch": 1.66, + "learning_rate": 8.708639112197037e-07, + "loss": 0.7061, + "step": 64960 + }, + { + "epoch": 1.66, + "learning_rate": 8.708364725032583e-07, + "loss": 0.6426, + "step": 64961 + }, + { + "epoch": 1.67, + "learning_rate": 8.708090338857076e-07, + "loss": 0.5288, + "step": 64962 + }, + { + "epoch": 1.67, + "learning_rate": 8.707815953670726e-07, + "loss": 0.5923, + "step": 64963 + }, + { + "epoch": 1.67, + "learning_rate": 8.707541569473739e-07, + "loss": 0.6875, + "step": 64964 + }, + { + "epoch": 1.67, + "learning_rate": 8.70726718626633e-07, + "loss": 0.2667, + "step": 64965 + }, + { + "epoch": 1.67, + "learning_rate": 8.706992804048705e-07, + "loss": 0.6123, + "step": 64966 + }, + { + "epoch": 1.67, + "learning_rate": 8.706718422821079e-07, + "loss": 0.7188, + "step": 64967 + }, + { + "epoch": 1.67, + "learning_rate": 8.706444042583656e-07, + "loss": 0.5947, + "step": 64968 + }, + { + "epoch": 1.67, + "learning_rate": 8.706169663336652e-07, + "loss": 0.6455, + "step": 64969 + }, + { + "epoch": 1.67, + "learning_rate": 8.705895285080277e-07, + "loss": 0.6711, + "step": 64970 + }, + { + "epoch": 1.67, + "learning_rate": 8.705620907814733e-07, + "loss": 0.626, + "step": 64971 + }, + { + "epoch": 1.67, + "learning_rate": 8.705346531540238e-07, + "loss": 0.7764, + "step": 64972 + }, + { + "epoch": 1.67, + "learning_rate": 8.705072156256998e-07, + "loss": 0.6333, + "step": 64973 + }, + { + "epoch": 1.67, + "learning_rate": 8.704797781965227e-07, + "loss": 0.4651, + "step": 64974 + }, + { + "epoch": 1.67, + "learning_rate": 8.704523408665131e-07, + "loss": 0.7539, + "step": 64975 + }, + { + "epoch": 1.67, + "learning_rate": 8.704249036356923e-07, + "loss": 0.5554, + "step": 64976 + }, + { + "epoch": 1.67, + "learning_rate": 8.70397466504081e-07, + "loss": 0.7031, + "step": 64977 + }, + { + "epoch": 1.67, + "learning_rate": 8.703700294717007e-07, + "loss": 0.6997, + "step": 64978 + }, + { + "epoch": 1.67, + "learning_rate": 8.703425925385718e-07, + "loss": 0.751, + "step": 64979 + }, + { + "epoch": 1.67, + "learning_rate": 8.703151557047164e-07, + "loss": 0.6592, + "step": 64980 + }, + { + "epoch": 1.67, + "learning_rate": 8.702877189701538e-07, + "loss": 0.7393, + "step": 64981 + }, + { + "epoch": 1.67, + "learning_rate": 8.702602823349063e-07, + "loss": 0.6362, + "step": 64982 + }, + { + "epoch": 1.67, + "learning_rate": 8.702328457989945e-07, + "loss": 0.52, + "step": 64983 + }, + { + "epoch": 1.67, + "learning_rate": 8.702054093624393e-07, + "loss": 0.6196, + "step": 64984 + }, + { + "epoch": 1.67, + "learning_rate": 8.701779730252619e-07, + "loss": 0.6123, + "step": 64985 + }, + { + "epoch": 1.67, + "learning_rate": 8.701505367874834e-07, + "loss": 0.4768, + "step": 64986 + }, + { + "epoch": 1.67, + "learning_rate": 8.701231006491245e-07, + "loss": 0.7158, + "step": 64987 + }, + { + "epoch": 1.67, + "learning_rate": 8.700956646102064e-07, + "loss": 0.7373, + "step": 64988 + }, + { + "epoch": 1.67, + "learning_rate": 8.700682286707501e-07, + "loss": 0.4431, + "step": 64989 + }, + { + "epoch": 1.67, + "learning_rate": 8.700407928307769e-07, + "loss": 0.6196, + "step": 64990 + }, + { + "epoch": 1.67, + "learning_rate": 8.700133570903073e-07, + "loss": 0.7451, + "step": 64991 + }, + { + "epoch": 1.67, + "learning_rate": 8.699859214493622e-07, + "loss": 0.7812, + "step": 64992 + }, + { + "epoch": 1.67, + "learning_rate": 8.699584859079632e-07, + "loss": 0.573, + "step": 64993 + }, + { + "epoch": 1.67, + "learning_rate": 8.699310504661308e-07, + "loss": 0.4912, + "step": 64994 + }, + { + "epoch": 1.67, + "learning_rate": 8.699036151238863e-07, + "loss": 0.6177, + "step": 64995 + }, + { + "epoch": 1.67, + "learning_rate": 8.698761798812507e-07, + "loss": 0.7803, + "step": 64996 + }, + { + "epoch": 1.67, + "learning_rate": 8.698487447382447e-07, + "loss": 0.6924, + "step": 64997 + }, + { + "epoch": 1.67, + "learning_rate": 8.698213096948897e-07, + "loss": 0.7012, + "step": 64998 + }, + { + "epoch": 1.67, + "learning_rate": 8.697938747512066e-07, + "loss": 0.7021, + "step": 64999 + }, + { + "epoch": 1.67, + "learning_rate": 8.697664399072166e-07, + "loss": 0.6416, + "step": 65000 } ], "logging_steps": 1.0, "max_steps": 117048, "num_train_epochs": 3, "save_steps": 5000, - "total_flos": 779052670156800.0, + "total_flos": 1687867611955200.0, "trial_name": null, "trial_params": null }