{ "best_metric": null, "best_model_checkpoint": null, "epoch": 1.9547461258777878, "global_step": 1620000, "is_hyper_param_search": false, "is_local_process_zero": true, "is_world_process_zero": true, "log_history": [ { "epoch": 0.00012066332248268406, "learning_rate": 1.0000000000000001e-07, "loss": 10.998963623046874, "step": 100 }, { "epoch": 0.00024132664496536813, "learning_rate": 2.0000000000000002e-07, "loss": 10.867801513671875, "step": 200 }, { "epoch": 0.0003619899674480522, "learning_rate": 3.0000000000000004e-07, "loss": 10.671025390625, "step": 300 }, { "epoch": 0.00048265328993073625, "learning_rate": 4.0000000000000003e-07, "loss": 10.47958740234375, "step": 400 }, { "epoch": 0.0006033166124134203, "learning_rate": 5.000000000000001e-07, "loss": 10.36065185546875, "step": 500 }, { "epoch": 0.0007239799348961044, "learning_rate": 6.000000000000001e-07, "loss": 10.27036865234375, "step": 600 }, { "epoch": 0.0008446432573787884, "learning_rate": 7.000000000000001e-07, "loss": 10.198671264648437, "step": 700 }, { "epoch": 0.0009653065798614725, "learning_rate": 8.000000000000001e-07, "loss": 10.139332275390625, "step": 800 }, { "epoch": 0.0010859699023441566, "learning_rate": 9.000000000000001e-07, "loss": 10.094085083007812, "step": 900 }, { "epoch": 0.0012066332248268407, "learning_rate": 1.0000000000000002e-06, "loss": 10.038567504882813, "step": 1000 }, { "epoch": 0.0013272965473095247, "learning_rate": 1.1e-06, "loss": 9.995147705078125, "step": 1100 }, { "epoch": 0.0014479598697922087, "learning_rate": 1.2000000000000002e-06, "loss": 9.927572021484375, "step": 1200 }, { "epoch": 0.0015686231922748927, "learning_rate": 1.3e-06, "loss": 9.875374755859376, "step": 1300 }, { "epoch": 0.0016892865147575768, "learning_rate": 1.4000000000000001e-06, "loss": 9.811220092773437, "step": 1400 }, { "epoch": 0.001809949837240261, "learning_rate": 1.5e-06, "loss": 9.74679931640625, "step": 1500 }, { "epoch": 0.001930613159722945, "learning_rate": 1.6000000000000001e-06, "loss": 9.663087768554687, "step": 1600 }, { "epoch": 0.002051276482205629, "learning_rate": 1.7000000000000002e-06, "loss": 9.591069946289062, "step": 1700 }, { "epoch": 0.0021719398046883133, "learning_rate": 1.8000000000000001e-06, "loss": 9.529061889648437, "step": 1800 }, { "epoch": 0.002292603127170997, "learning_rate": 1.9000000000000002e-06, "loss": 9.4752197265625, "step": 1900 }, { "epoch": 0.0024132664496536813, "learning_rate": 2.0000000000000003e-06, "loss": 9.4010302734375, "step": 2000 }, { "epoch": 0.002533929772136365, "learning_rate": 2.1000000000000002e-06, "loss": 9.35108642578125, "step": 2100 }, { "epoch": 0.0026545930946190494, "learning_rate": 2.2e-06, "loss": 9.2584326171875, "step": 2200 }, { "epoch": 0.002775256417101733, "learning_rate": 2.3000000000000004e-06, "loss": 9.214194946289062, "step": 2300 }, { "epoch": 0.0028959197395844174, "learning_rate": 2.4000000000000003e-06, "loss": 9.132109985351562, "step": 2400 }, { "epoch": 0.0030165830620671017, "learning_rate": 2.5e-06, "loss": 9.047922973632813, "step": 2500 }, { "epoch": 0.0031372463845497855, "learning_rate": 2.6e-06, "loss": 8.99282958984375, "step": 2600 }, { "epoch": 0.0032579097070324697, "learning_rate": 2.7000000000000004e-06, "loss": 8.95028076171875, "step": 2700 }, { "epoch": 0.0033785730295151535, "learning_rate": 2.8000000000000003e-06, "loss": 8.865433349609376, "step": 2800 }, { "epoch": 0.0034992363519978377, "learning_rate": 2.9e-06, "loss": 8.848460083007813, "step": 2900 }, { "epoch": 0.003619899674480522, "learning_rate": 3e-06, "loss": 8.786046752929687, "step": 3000 }, { "epoch": 0.003740562996963206, "learning_rate": 3.1000000000000004e-06, "loss": 8.73739501953125, "step": 3100 }, { "epoch": 0.00386122631944589, "learning_rate": 3.2000000000000003e-06, "loss": 8.654747924804688, "step": 3200 }, { "epoch": 0.003981889641928574, "learning_rate": 3.3000000000000006e-06, "loss": 8.638505859375, "step": 3300 }, { "epoch": 0.004102552964411258, "learning_rate": 3.4000000000000005e-06, "loss": 8.57900390625, "step": 3400 }, { "epoch": 0.004223216286893942, "learning_rate": 3.5e-06, "loss": 8.544164428710937, "step": 3500 }, { "epoch": 0.0043438796093766266, "learning_rate": 3.6000000000000003e-06, "loss": 8.50919189453125, "step": 3600 }, { "epoch": 0.00446454293185931, "learning_rate": 3.7e-06, "loss": 8.48513671875, "step": 3700 }, { "epoch": 0.004585206254341994, "learning_rate": 3.8000000000000005e-06, "loss": 8.434906005859375, "step": 3800 }, { "epoch": 0.004705869576824678, "learning_rate": 3.900000000000001e-06, "loss": 8.401183471679687, "step": 3900 }, { "epoch": 0.004826532899307363, "learning_rate": 4.000000000000001e-06, "loss": 8.37177001953125, "step": 4000 }, { "epoch": 0.0049471962217900465, "learning_rate": 4.1e-06, "loss": 8.339204711914062, "step": 4100 }, { "epoch": 0.00506785954427273, "learning_rate": 4.2000000000000004e-06, "loss": 8.3411181640625, "step": 4200 }, { "epoch": 0.005188522866755415, "learning_rate": 4.3e-06, "loss": 8.30220947265625, "step": 4300 }, { "epoch": 0.005309186189238099, "learning_rate": 4.4e-06, "loss": 8.303151245117187, "step": 4400 }, { "epoch": 0.0054298495117207825, "learning_rate": 4.5e-06, "loss": 8.252617797851563, "step": 4500 }, { "epoch": 0.005550512834203466, "learning_rate": 4.600000000000001e-06, "loss": 8.258956909179688, "step": 4600 }, { "epoch": 0.005671176156686151, "learning_rate": 4.7e-06, "loss": 8.244758911132813, "step": 4700 }, { "epoch": 0.005791839479168835, "learning_rate": 4.800000000000001e-06, "loss": 8.21389404296875, "step": 4800 }, { "epoch": 0.005912502801651519, "learning_rate": 4.9000000000000005e-06, "loss": 8.185855712890625, "step": 4900 }, { "epoch": 0.006033166124134203, "learning_rate": 5e-06, "loss": 8.198721923828124, "step": 5000 }, { "epoch": 0.006153829446616887, "learning_rate": 5.1e-06, "loss": 8.184302368164062, "step": 5100 }, { "epoch": 0.006274492769099571, "learning_rate": 5.2e-06, "loss": 8.141995849609375, "step": 5200 }, { "epoch": 0.006395156091582255, "learning_rate": 5.300000000000001e-06, "loss": 8.149254150390625, "step": 5300 }, { "epoch": 0.006515819414064939, "learning_rate": 5.400000000000001e-06, "loss": 8.134349365234375, "step": 5400 }, { "epoch": 0.006636482736547623, "learning_rate": 5.500000000000001e-06, "loss": 8.126637573242187, "step": 5500 }, { "epoch": 0.006757146059030307, "learning_rate": 5.600000000000001e-06, "loss": 8.11840087890625, "step": 5600 }, { "epoch": 0.006877809381512992, "learning_rate": 5.7e-06, "loss": 8.152865600585937, "step": 5700 }, { "epoch": 0.0069984727039956755, "learning_rate": 5.8e-06, "loss": 8.106795654296874, "step": 5800 }, { "epoch": 0.007119136026478359, "learning_rate": 5.9e-06, "loss": 8.087644653320313, "step": 5900 }, { "epoch": 0.007239799348961044, "learning_rate": 6e-06, "loss": 8.071045532226563, "step": 6000 }, { "epoch": 0.007360462671443728, "learning_rate": 6.1e-06, "loss": 8.07795654296875, "step": 6100 }, { "epoch": 0.007481125993926412, "learning_rate": 6.200000000000001e-06, "loss": 8.07419677734375, "step": 6200 }, { "epoch": 0.007601789316409095, "learning_rate": 6.300000000000001e-06, "loss": 8.054071655273438, "step": 6300 }, { "epoch": 0.00772245263889178, "learning_rate": 6.4000000000000006e-06, "loss": 8.069452514648438, "step": 6400 }, { "epoch": 0.007843115961374464, "learning_rate": 6.5000000000000004e-06, "loss": 8.062046508789063, "step": 6500 }, { "epoch": 0.007963779283857149, "learning_rate": 6.600000000000001e-06, "loss": 8.041135864257813, "step": 6600 }, { "epoch": 0.008084442606339831, "learning_rate": 6.700000000000001e-06, "loss": 8.0472509765625, "step": 6700 }, { "epoch": 0.008205105928822516, "learning_rate": 6.800000000000001e-06, "loss": 8.015521240234374, "step": 6800 }, { "epoch": 0.0083257692513052, "learning_rate": 6.9e-06, "loss": 7.99987060546875, "step": 6900 }, { "epoch": 0.008446432573787884, "learning_rate": 7e-06, "loss": 8.021083374023437, "step": 7000 }, { "epoch": 0.008567095896270568, "learning_rate": 7.100000000000001e-06, "loss": 8.009032592773437, "step": 7100 }, { "epoch": 0.008687759218753253, "learning_rate": 7.2000000000000005e-06, "loss": 7.98518798828125, "step": 7200 }, { "epoch": 0.008808422541235936, "learning_rate": 7.3e-06, "loss": 7.98792724609375, "step": 7300 }, { "epoch": 0.00892908586371862, "learning_rate": 7.4e-06, "loss": 7.98720703125, "step": 7400 }, { "epoch": 0.009049749186201304, "learning_rate": 7.500000000000001e-06, "loss": 7.946220092773437, "step": 7500 }, { "epoch": 0.009170412508683988, "learning_rate": 7.600000000000001e-06, "loss": 7.945390014648438, "step": 7600 }, { "epoch": 0.009291075831166673, "learning_rate": 7.7e-06, "loss": 7.98837158203125, "step": 7700 }, { "epoch": 0.009411739153649356, "learning_rate": 7.800000000000002e-06, "loss": 7.9614019775390625, "step": 7800 }, { "epoch": 0.00953240247613204, "learning_rate": 7.9e-06, "loss": 7.951765747070312, "step": 7900 }, { "epoch": 0.009653065798614725, "learning_rate": 8.000000000000001e-06, "loss": 7.924186401367187, "step": 8000 }, { "epoch": 0.009773729121097408, "learning_rate": 8.1e-06, "loss": 7.929385375976563, "step": 8100 }, { "epoch": 0.009894392443580093, "learning_rate": 8.2e-06, "loss": 7.926139526367187, "step": 8200 }, { "epoch": 0.010015055766062778, "learning_rate": 8.3e-06, "loss": 7.90500244140625, "step": 8300 }, { "epoch": 0.01013571908854546, "learning_rate": 8.400000000000001e-06, "loss": 7.927145385742188, "step": 8400 }, { "epoch": 0.010256382411028145, "learning_rate": 8.5e-06, "loss": 7.9099884033203125, "step": 8500 }, { "epoch": 0.01037704573351083, "learning_rate": 8.6e-06, "loss": 7.90431640625, "step": 8600 }, { "epoch": 0.010497709055993513, "learning_rate": 8.700000000000001e-06, "loss": 7.885325927734375, "step": 8700 }, { "epoch": 0.010618372378476197, "learning_rate": 8.8e-06, "loss": 7.895731201171875, "step": 8800 }, { "epoch": 0.01073903570095888, "learning_rate": 8.900000000000001e-06, "loss": 7.873722534179688, "step": 8900 }, { "epoch": 0.010859699023441565, "learning_rate": 9e-06, "loss": 7.867328491210937, "step": 9000 }, { "epoch": 0.01098036234592425, "learning_rate": 9.100000000000001e-06, "loss": 7.870953369140625, "step": 9100 }, { "epoch": 0.011101025668406933, "learning_rate": 9.200000000000002e-06, "loss": 7.89510498046875, "step": 9200 }, { "epoch": 0.011221688990889617, "learning_rate": 9.3e-06, "loss": 7.866868896484375, "step": 9300 }, { "epoch": 0.011342352313372302, "learning_rate": 9.4e-06, "loss": 7.843492431640625, "step": 9400 }, { "epoch": 0.011463015635854985, "learning_rate": 9.5e-06, "loss": 7.845059204101562, "step": 9500 }, { "epoch": 0.01158367895833767, "learning_rate": 9.600000000000001e-06, "loss": 7.835038452148438, "step": 9600 }, { "epoch": 0.011704342280820354, "learning_rate": 9.7e-06, "loss": 7.848790893554687, "step": 9700 }, { "epoch": 0.011825005603303037, "learning_rate": 9.800000000000001e-06, "loss": 7.842159423828125, "step": 9800 }, { "epoch": 0.011945668925785722, "learning_rate": 9.9e-06, "loss": 7.8275146484375, "step": 9900 }, { "epoch": 0.012066332248268407, "learning_rate": 1e-05, "loss": 7.826830444335937, "step": 10000 }, { "epoch": 0.01218699557075109, "learning_rate": 9.999596164532263e-06, "loss": 7.812598876953125, "step": 10100 }, { "epoch": 0.012307658893233774, "learning_rate": 9.999192329064525e-06, "loss": 7.807442626953125, "step": 10200 }, { "epoch": 0.012428322215716459, "learning_rate": 9.998788493596787e-06, "loss": 7.79939697265625, "step": 10300 }, { "epoch": 0.012548985538199142, "learning_rate": 9.998384658129047e-06, "loss": 7.804387817382812, "step": 10400 }, { "epoch": 0.012669648860681827, "learning_rate": 9.997980822661309e-06, "loss": 7.799457397460937, "step": 10500 }, { "epoch": 0.01279031218316451, "learning_rate": 9.99757698719357e-06, "loss": 7.800637817382812, "step": 10600 }, { "epoch": 0.012910975505647194, "learning_rate": 9.997173151725831e-06, "loss": 7.776885986328125, "step": 10700 }, { "epoch": 0.013031638828129879, "learning_rate": 9.996769316258093e-06, "loss": 7.790662231445313, "step": 10800 }, { "epoch": 0.013152302150612562, "learning_rate": 9.996365480790355e-06, "loss": 7.780765991210938, "step": 10900 }, { "epoch": 0.013272965473095246, "learning_rate": 9.995961645322617e-06, "loss": 7.776314697265625, "step": 11000 }, { "epoch": 0.013393628795577931, "learning_rate": 9.99555780985488e-06, "loss": 7.753301391601562, "step": 11100 }, { "epoch": 0.013514292118060614, "learning_rate": 9.995153974387141e-06, "loss": 7.774302368164062, "step": 11200 }, { "epoch": 0.013634955440543299, "learning_rate": 9.994750138919402e-06, "loss": 7.761792602539063, "step": 11300 }, { "epoch": 0.013755618763025983, "learning_rate": 9.994346303451663e-06, "loss": 7.756895751953125, "step": 11400 }, { "epoch": 0.013876282085508666, "learning_rate": 9.993942467983925e-06, "loss": 7.756287231445312, "step": 11500 }, { "epoch": 0.013996945407991351, "learning_rate": 9.993538632516186e-06, "loss": 7.74819580078125, "step": 11600 }, { "epoch": 0.014117608730474036, "learning_rate": 9.993134797048448e-06, "loss": 7.748518676757812, "step": 11700 }, { "epoch": 0.014238272052956719, "learning_rate": 9.99273096158071e-06, "loss": 7.73031005859375, "step": 11800 }, { "epoch": 0.014358935375439403, "learning_rate": 9.992327126112972e-06, "loss": 7.731920776367187, "step": 11900 }, { "epoch": 0.014479598697922088, "learning_rate": 9.991923290645234e-06, "loss": 7.719931030273438, "step": 12000 }, { "epoch": 0.014600262020404771, "learning_rate": 9.991519455177494e-06, "loss": 7.723886108398437, "step": 12100 }, { "epoch": 0.014720925342887456, "learning_rate": 9.991115619709756e-06, "loss": 7.706294555664062, "step": 12200 }, { "epoch": 0.014841588665370139, "learning_rate": 9.990711784242018e-06, "loss": 7.7386846923828125, "step": 12300 }, { "epoch": 0.014962251987852823, "learning_rate": 9.99030794877428e-06, "loss": 7.722437744140625, "step": 12400 }, { "epoch": 0.015082915310335508, "learning_rate": 9.989904113306542e-06, "loss": 7.702894287109375, "step": 12500 }, { "epoch": 0.01520357863281819, "learning_rate": 9.989500277838802e-06, "loss": 7.699403076171875, "step": 12600 }, { "epoch": 0.015324241955300875, "learning_rate": 9.989096442371064e-06, "loss": 7.70286865234375, "step": 12700 }, { "epoch": 0.01544490527778356, "learning_rate": 9.988692606903326e-06, "loss": 7.727252197265625, "step": 12800 }, { "epoch": 0.015565568600266243, "learning_rate": 9.988288771435586e-06, "loss": 7.681318969726562, "step": 12900 }, { "epoch": 0.015686231922748928, "learning_rate": 9.987884935967848e-06, "loss": 7.681355590820313, "step": 13000 }, { "epoch": 0.01580689524523161, "learning_rate": 9.98748110050011e-06, "loss": 7.669380493164063, "step": 13100 }, { "epoch": 0.015927558567714297, "learning_rate": 9.987077265032372e-06, "loss": 7.691492309570313, "step": 13200 }, { "epoch": 0.01604822189019698, "learning_rate": 9.986673429564634e-06, "loss": 7.735159301757813, "step": 13300 }, { "epoch": 0.016168885212679663, "learning_rate": 9.986269594096896e-06, "loss": 7.67091552734375, "step": 13400 }, { "epoch": 0.01628954853516235, "learning_rate": 9.985865758629157e-06, "loss": 7.673142700195313, "step": 13500 }, { "epoch": 0.016410211857645032, "learning_rate": 9.985461923161419e-06, "loss": 7.694071044921875, "step": 13600 }, { "epoch": 0.016530875180127715, "learning_rate": 9.98505808769368e-06, "loss": 7.685897216796875, "step": 13700 }, { "epoch": 0.0166515385026104, "learning_rate": 9.984654252225941e-06, "loss": 7.67085693359375, "step": 13800 }, { "epoch": 0.016772201825093085, "learning_rate": 9.984250416758203e-06, "loss": 7.652900390625, "step": 13900 }, { "epoch": 0.016892865147575768, "learning_rate": 9.983846581290465e-06, "loss": 7.666927490234375, "step": 14000 }, { "epoch": 0.017013528470058454, "learning_rate": 9.983442745822727e-06, "loss": 7.651405029296875, "step": 14100 }, { "epoch": 0.017134191792541137, "learning_rate": 9.983038910354989e-06, "loss": 7.638584594726563, "step": 14200 }, { "epoch": 0.01725485511502382, "learning_rate": 9.98263507488725e-06, "loss": 7.643876953125, "step": 14300 }, { "epoch": 0.017375518437506506, "learning_rate": 9.982231239419513e-06, "loss": 7.6271630859375, "step": 14400 }, { "epoch": 0.01749618175998919, "learning_rate": 9.981827403951773e-06, "loss": 7.63806884765625, "step": 14500 }, { "epoch": 0.017616845082471872, "learning_rate": 9.981423568484035e-06, "loss": 7.62742919921875, "step": 14600 }, { "epoch": 0.017737508404954555, "learning_rate": 9.981019733016295e-06, "loss": 7.642492065429687, "step": 14700 }, { "epoch": 0.01785817172743724, "learning_rate": 9.980615897548557e-06, "loss": 7.6192822265625, "step": 14800 }, { "epoch": 0.017978835049919924, "learning_rate": 9.98021206208082e-06, "loss": 7.607686157226563, "step": 14900 }, { "epoch": 0.018099498372402607, "learning_rate": 9.979808226613081e-06, "loss": 7.62489501953125, "step": 15000 }, { "epoch": 0.018220161694885294, "learning_rate": 9.979404391145343e-06, "loss": 7.608429565429687, "step": 15100 }, { "epoch": 0.018340825017367977, "learning_rate": 9.979000555677605e-06, "loss": 7.597339477539062, "step": 15200 }, { "epoch": 0.01846148833985066, "learning_rate": 9.978596720209867e-06, "loss": 7.593267211914062, "step": 15300 }, { "epoch": 0.018582151662333346, "learning_rate": 9.978192884742128e-06, "loss": 7.600186157226562, "step": 15400 }, { "epoch": 0.01870281498481603, "learning_rate": 9.97778904927439e-06, "loss": 7.575609130859375, "step": 15500 }, { "epoch": 0.018823478307298712, "learning_rate": 9.977385213806652e-06, "loss": 7.578140869140625, "step": 15600 }, { "epoch": 0.0189441416297814, "learning_rate": 9.976981378338912e-06, "loss": 7.588411865234375, "step": 15700 }, { "epoch": 0.01906480495226408, "learning_rate": 9.976577542871174e-06, "loss": 7.566851806640625, "step": 15800 }, { "epoch": 0.019185468274746764, "learning_rate": 9.976173707403436e-06, "loss": 7.549029541015625, "step": 15900 }, { "epoch": 0.01930613159722945, "learning_rate": 9.975769871935698e-06, "loss": 7.562918701171875, "step": 16000 }, { "epoch": 0.019426794919712134, "learning_rate": 9.97536603646796e-06, "loss": 7.537685546875, "step": 16100 }, { "epoch": 0.019547458242194816, "learning_rate": 9.97496220100022e-06, "loss": 7.517478637695312, "step": 16200 }, { "epoch": 0.019668121564677503, "learning_rate": 9.974558365532482e-06, "loss": 7.5180731201171875, "step": 16300 }, { "epoch": 0.019788784887160186, "learning_rate": 9.974154530064744e-06, "loss": 7.493146362304688, "step": 16400 }, { "epoch": 0.01990944820964287, "learning_rate": 9.973750694597006e-06, "loss": 7.484447021484375, "step": 16500 }, { "epoch": 0.020030111532125555, "learning_rate": 9.973346859129266e-06, "loss": 7.502681274414062, "step": 16600 }, { "epoch": 0.020150774854608238, "learning_rate": 9.972943023661528e-06, "loss": 7.45322998046875, "step": 16700 }, { "epoch": 0.02027143817709092, "learning_rate": 9.97253918819379e-06, "loss": 7.495328369140625, "step": 16800 }, { "epoch": 0.020392101499573607, "learning_rate": 9.972135352726052e-06, "loss": 7.466298828125, "step": 16900 }, { "epoch": 0.02051276482205629, "learning_rate": 9.971731517258312e-06, "loss": 7.4412060546875, "step": 17000 }, { "epoch": 0.020633428144538973, "learning_rate": 9.971327681790574e-06, "loss": 7.4665283203125, "step": 17100 }, { "epoch": 0.02075409146702166, "learning_rate": 9.970923846322836e-06, "loss": 7.432006225585938, "step": 17200 }, { "epoch": 0.020874754789504343, "learning_rate": 9.970520010855098e-06, "loss": 7.4205126953125, "step": 17300 }, { "epoch": 0.020995418111987026, "learning_rate": 9.97011617538736e-06, "loss": 7.412860107421875, "step": 17400 }, { "epoch": 0.021116081434469712, "learning_rate": 9.969712339919622e-06, "loss": 7.390285034179687, "step": 17500 }, { "epoch": 0.021236744756952395, "learning_rate": 9.969308504451883e-06, "loss": 7.388471069335938, "step": 17600 }, { "epoch": 0.021357408079435078, "learning_rate": 9.968904668984145e-06, "loss": 7.357642822265625, "step": 17700 }, { "epoch": 0.02147807140191776, "learning_rate": 9.968500833516405e-06, "loss": 7.374608154296875, "step": 17800 }, { "epoch": 0.021598734724400447, "learning_rate": 9.968096998048667e-06, "loss": 7.348936767578125, "step": 17900 }, { "epoch": 0.02171939804688313, "learning_rate": 9.967693162580929e-06, "loss": 7.326118774414063, "step": 18000 }, { "epoch": 0.021840061369365813, "learning_rate": 9.967289327113191e-06, "loss": 7.3109765625, "step": 18100 }, { "epoch": 0.0219607246918485, "learning_rate": 9.966885491645453e-06, "loss": 7.311011962890625, "step": 18200 }, { "epoch": 0.022081388014331182, "learning_rate": 9.966481656177715e-06, "loss": 7.274530029296875, "step": 18300 }, { "epoch": 0.022202051336813865, "learning_rate": 9.966077820709977e-06, "loss": 7.23897705078125, "step": 18400 }, { "epoch": 0.022322714659296552, "learning_rate": 9.965673985242237e-06, "loss": 7.2407861328125, "step": 18500 }, { "epoch": 0.022443377981779235, "learning_rate": 9.965270149774499e-06, "loss": 7.240975341796875, "step": 18600 }, { "epoch": 0.022564041304261918, "learning_rate": 9.964866314306761e-06, "loss": 7.222609252929687, "step": 18700 }, { "epoch": 0.022684704626744604, "learning_rate": 9.964462478839021e-06, "loss": 7.2113800048828125, "step": 18800 }, { "epoch": 0.022805367949227287, "learning_rate": 9.964058643371283e-06, "loss": 7.19686767578125, "step": 18900 }, { "epoch": 0.02292603127170997, "learning_rate": 9.963654807903545e-06, "loss": 7.1889306640625, "step": 19000 }, { "epoch": 0.023046694594192656, "learning_rate": 9.963250972435807e-06, "loss": 7.175922241210937, "step": 19100 }, { "epoch": 0.02316735791667534, "learning_rate": 9.96284713696807e-06, "loss": 7.178650512695312, "step": 19200 }, { "epoch": 0.023288021239158022, "learning_rate": 9.962443301500331e-06, "loss": 7.181878662109375, "step": 19300 }, { "epoch": 0.02340868456164071, "learning_rate": 9.962039466032592e-06, "loss": 7.137700805664062, "step": 19400 }, { "epoch": 0.02352934788412339, "learning_rate": 9.961635630564854e-06, "loss": 7.1376220703125, "step": 19500 }, { "epoch": 0.023650011206606075, "learning_rate": 9.961231795097116e-06, "loss": 7.112848510742188, "step": 19600 }, { "epoch": 0.02377067452908876, "learning_rate": 9.960827959629376e-06, "loss": 7.077623291015625, "step": 19700 }, { "epoch": 0.023891337851571444, "learning_rate": 9.960424124161638e-06, "loss": 7.10410888671875, "step": 19800 }, { "epoch": 0.024012001174054127, "learning_rate": 9.9600202886939e-06, "loss": 7.04318359375, "step": 19900 }, { "epoch": 0.024132664496536813, "learning_rate": 9.959616453226162e-06, "loss": 7.05190185546875, "step": 20000 }, { "epoch": 0.024253327819019496, "learning_rate": 9.959212617758424e-06, "loss": 7.062595825195313, "step": 20100 }, { "epoch": 0.02437399114150218, "learning_rate": 9.958808782290684e-06, "loss": 7.040302734375, "step": 20200 }, { "epoch": 0.024494654463984866, "learning_rate": 9.958404946822946e-06, "loss": 7.060929565429688, "step": 20300 }, { "epoch": 0.02461531778646755, "learning_rate": 9.958001111355208e-06, "loss": 7.056749267578125, "step": 20400 }, { "epoch": 0.02473598110895023, "learning_rate": 9.95759727588747e-06, "loss": 7.02091796875, "step": 20500 }, { "epoch": 0.024856644431432918, "learning_rate": 9.957193440419732e-06, "loss": 7.011871337890625, "step": 20600 }, { "epoch": 0.0249773077539156, "learning_rate": 9.956789604951992e-06, "loss": 7.002923583984375, "step": 20700 }, { "epoch": 0.025097971076398284, "learning_rate": 9.956385769484254e-06, "loss": 6.983974609375, "step": 20800 }, { "epoch": 0.025218634398880967, "learning_rate": 9.955981934016516e-06, "loss": 6.9759765625, "step": 20900 }, { "epoch": 0.025339297721363653, "learning_rate": 9.955578098548778e-06, "loss": 6.959908447265625, "step": 21000 }, { "epoch": 0.025459961043846336, "learning_rate": 9.955174263081039e-06, "loss": 6.96692626953125, "step": 21100 }, { "epoch": 0.02558062436632902, "learning_rate": 9.9547704276133e-06, "loss": 6.933953857421875, "step": 21200 }, { "epoch": 0.025701287688811705, "learning_rate": 9.954366592145562e-06, "loss": 6.96384033203125, "step": 21300 }, { "epoch": 0.02582195101129439, "learning_rate": 9.953962756677824e-06, "loss": 6.8951177978515625, "step": 21400 }, { "epoch": 0.02594261433377707, "learning_rate": 9.953558921210086e-06, "loss": 6.91238037109375, "step": 21500 }, { "epoch": 0.026063277656259758, "learning_rate": 9.953155085742347e-06, "loss": 6.896270141601563, "step": 21600 }, { "epoch": 0.02618394097874244, "learning_rate": 9.952751250274609e-06, "loss": 6.896909790039063, "step": 21700 }, { "epoch": 0.026304604301225123, "learning_rate": 9.95234741480687e-06, "loss": 6.881757202148438, "step": 21800 }, { "epoch": 0.02642526762370781, "learning_rate": 9.951943579339131e-06, "loss": 6.8531689453125, "step": 21900 }, { "epoch": 0.026545930946190493, "learning_rate": 9.951539743871393e-06, "loss": 6.872998046875, "step": 22000 }, { "epoch": 0.026666594268673176, "learning_rate": 9.951135908403655e-06, "loss": 6.854584350585937, "step": 22100 }, { "epoch": 0.026787257591155862, "learning_rate": 9.950732072935917e-06, "loss": 6.827476806640625, "step": 22200 }, { "epoch": 0.026907920913638545, "learning_rate": 9.950328237468179e-06, "loss": 6.831190185546875, "step": 22300 }, { "epoch": 0.027028584236121228, "learning_rate": 9.949924402000441e-06, "loss": 6.7924261474609375, "step": 22400 }, { "epoch": 0.027149247558603914, "learning_rate": 9.949520566532703e-06, "loss": 6.790482177734375, "step": 22500 }, { "epoch": 0.027269910881086597, "learning_rate": 9.949116731064963e-06, "loss": 6.803350219726562, "step": 22600 }, { "epoch": 0.02739057420356928, "learning_rate": 9.948712895597225e-06, "loss": 6.785421752929688, "step": 22700 }, { "epoch": 0.027511237526051967, "learning_rate": 9.948309060129485e-06, "loss": 6.777293701171875, "step": 22800 }, { "epoch": 0.02763190084853465, "learning_rate": 9.947905224661747e-06, "loss": 6.767362060546875, "step": 22900 }, { "epoch": 0.027752564171017333, "learning_rate": 9.94750138919401e-06, "loss": 6.742926025390625, "step": 23000 }, { "epoch": 0.02787322749350002, "learning_rate": 9.947097553726271e-06, "loss": 6.78175048828125, "step": 23100 }, { "epoch": 0.027993890815982702, "learning_rate": 9.946693718258533e-06, "loss": 6.729476318359375, "step": 23200 }, { "epoch": 0.028114554138465385, "learning_rate": 9.946289882790795e-06, "loss": 6.729383544921875, "step": 23300 }, { "epoch": 0.02823521746094807, "learning_rate": 9.945886047323057e-06, "loss": 6.723148193359375, "step": 23400 }, { "epoch": 0.028355880783430754, "learning_rate": 9.945482211855318e-06, "loss": 6.739766235351563, "step": 23500 }, { "epoch": 0.028476544105913437, "learning_rate": 9.94507837638758e-06, "loss": 6.685776977539063, "step": 23600 }, { "epoch": 0.028597207428396124, "learning_rate": 9.944674540919842e-06, "loss": 6.71983154296875, "step": 23700 }, { "epoch": 0.028717870750878807, "learning_rate": 9.944270705452102e-06, "loss": 6.673611450195312, "step": 23800 }, { "epoch": 0.02883853407336149, "learning_rate": 9.943866869984364e-06, "loss": 6.659153442382813, "step": 23900 }, { "epoch": 0.028959197395844176, "learning_rate": 9.943463034516626e-06, "loss": 6.669003295898437, "step": 24000 }, { "epoch": 0.02907986071832686, "learning_rate": 9.943059199048888e-06, "loss": 6.634718017578125, "step": 24100 }, { "epoch": 0.029200524040809542, "learning_rate": 9.94265536358115e-06, "loss": 6.655950317382812, "step": 24200 }, { "epoch": 0.029321187363292225, "learning_rate": 9.94225152811341e-06, "loss": 6.658018188476563, "step": 24300 }, { "epoch": 0.02944185068577491, "learning_rate": 9.941847692645672e-06, "loss": 6.616795654296875, "step": 24400 }, { "epoch": 0.029562514008257594, "learning_rate": 9.941443857177934e-06, "loss": 6.64441650390625, "step": 24500 }, { "epoch": 0.029683177330740277, "learning_rate": 9.941040021710196e-06, "loss": 6.600654907226563, "step": 24600 }, { "epoch": 0.029803840653222963, "learning_rate": 9.940636186242458e-06, "loss": 6.606512451171875, "step": 24700 }, { "epoch": 0.029924503975705646, "learning_rate": 9.940232350774718e-06, "loss": 6.615017700195312, "step": 24800 }, { "epoch": 0.03004516729818833, "learning_rate": 9.93982851530698e-06, "loss": 6.570202026367188, "step": 24900 }, { "epoch": 0.030165830620671016, "learning_rate": 9.939424679839242e-06, "loss": 6.583402099609375, "step": 25000 }, { "epoch": 0.0302864939431537, "learning_rate": 9.939020844371503e-06, "loss": 6.571268310546875, "step": 25100 }, { "epoch": 0.03040715726563638, "learning_rate": 9.938617008903765e-06, "loss": 6.569072265625, "step": 25200 }, { "epoch": 0.030527820588119068, "learning_rate": 9.938213173436027e-06, "loss": 6.567750244140625, "step": 25300 }, { "epoch": 0.03064848391060175, "learning_rate": 9.937809337968289e-06, "loss": 6.578480834960938, "step": 25400 }, { "epoch": 0.030769147233084434, "learning_rate": 9.93740550250055e-06, "loss": 6.548373413085938, "step": 25500 }, { "epoch": 0.03088981055556712, "learning_rate": 9.937001667032812e-06, "loss": 6.56265380859375, "step": 25600 }, { "epoch": 0.031010473878049803, "learning_rate": 9.936597831565073e-06, "loss": 6.53989501953125, "step": 25700 }, { "epoch": 0.031131137200532486, "learning_rate": 9.936193996097335e-06, "loss": 6.511539916992188, "step": 25800 }, { "epoch": 0.03125180052301517, "learning_rate": 9.935790160629597e-06, "loss": 6.52816650390625, "step": 25900 }, { "epoch": 0.031372463845497855, "learning_rate": 9.935386325161857e-06, "loss": 6.500388793945312, "step": 26000 }, { "epoch": 0.03149312716798054, "learning_rate": 9.934982489694119e-06, "loss": 6.523255004882812, "step": 26100 }, { "epoch": 0.03161379049046322, "learning_rate": 9.934578654226381e-06, "loss": 6.49367919921875, "step": 26200 }, { "epoch": 0.03173445381294591, "learning_rate": 9.934174818758643e-06, "loss": 6.478309326171875, "step": 26300 }, { "epoch": 0.031855117135428594, "learning_rate": 9.933770983290905e-06, "loss": 6.448147583007812, "step": 26400 }, { "epoch": 0.031975780457911274, "learning_rate": 9.933367147823167e-06, "loss": 6.495176391601563, "step": 26500 }, { "epoch": 0.03209644378039396, "learning_rate": 9.932963312355429e-06, "loss": 6.46186767578125, "step": 26600 }, { "epoch": 0.032217107102876646, "learning_rate": 9.93255947688769e-06, "loss": 6.471776123046875, "step": 26700 }, { "epoch": 0.032337770425359326, "learning_rate": 9.932155641419951e-06, "loss": 6.472383422851562, "step": 26800 }, { "epoch": 0.03245843374784201, "learning_rate": 9.931751805952211e-06, "loss": 6.4738720703125, "step": 26900 }, { "epoch": 0.0325790970703247, "learning_rate": 9.931347970484473e-06, "loss": 6.445848999023437, "step": 27000 }, { "epoch": 0.03269976039280738, "learning_rate": 9.930944135016735e-06, "loss": 6.462876586914063, "step": 27100 }, { "epoch": 0.032820423715290065, "learning_rate": 9.930540299548997e-06, "loss": 6.435804443359375, "step": 27200 }, { "epoch": 0.03294108703777275, "learning_rate": 9.93013646408126e-06, "loss": 6.43695068359375, "step": 27300 }, { "epoch": 0.03306175036025543, "learning_rate": 9.929732628613521e-06, "loss": 6.411896362304687, "step": 27400 }, { "epoch": 0.03318241368273812, "learning_rate": 9.929328793145783e-06, "loss": 6.4326409912109375, "step": 27500 }, { "epoch": 0.0333030770052208, "learning_rate": 9.928924957678044e-06, "loss": 6.415225830078125, "step": 27600 }, { "epoch": 0.03342374032770348, "learning_rate": 9.928521122210306e-06, "loss": 6.409244384765625, "step": 27700 }, { "epoch": 0.03354440365018617, "learning_rate": 9.928117286742568e-06, "loss": 6.386112060546875, "step": 27800 }, { "epoch": 0.033665066972668856, "learning_rate": 9.927713451274828e-06, "loss": 6.3937005615234375, "step": 27900 }, { "epoch": 0.033785730295151535, "learning_rate": 9.92730961580709e-06, "loss": 6.390086059570312, "step": 28000 }, { "epoch": 0.03390639361763422, "learning_rate": 9.926905780339352e-06, "loss": 6.386889038085937, "step": 28100 }, { "epoch": 0.03402705694011691, "learning_rate": 9.926501944871614e-06, "loss": 6.370198974609375, "step": 28200 }, { "epoch": 0.03414772026259959, "learning_rate": 9.926098109403876e-06, "loss": 6.3718328857421875, "step": 28300 }, { "epoch": 0.034268383585082274, "learning_rate": 9.925694273936136e-06, "loss": 6.381991577148438, "step": 28400 }, { "epoch": 0.03438904690756496, "learning_rate": 9.925290438468398e-06, "loss": 6.355091552734375, "step": 28500 }, { "epoch": 0.03450971023004764, "learning_rate": 9.92488660300066e-06, "loss": 6.332806396484375, "step": 28600 }, { "epoch": 0.034630373552530326, "learning_rate": 9.924482767532922e-06, "loss": 6.320509643554687, "step": 28700 }, { "epoch": 0.03475103687501301, "learning_rate": 9.924078932065182e-06, "loss": 6.34507080078125, "step": 28800 }, { "epoch": 0.03487170019749569, "learning_rate": 9.923675096597444e-06, "loss": 6.32692626953125, "step": 28900 }, { "epoch": 0.03499236351997838, "learning_rate": 9.923271261129706e-06, "loss": 6.352927856445312, "step": 29000 }, { "epoch": 0.03511302684246106, "learning_rate": 9.922867425661968e-06, "loss": 6.342001953125, "step": 29100 }, { "epoch": 0.035233690164943744, "learning_rate": 9.922463590194229e-06, "loss": 6.319302368164062, "step": 29200 }, { "epoch": 0.03535435348742643, "learning_rate": 9.92205975472649e-06, "loss": 6.307904052734375, "step": 29300 }, { "epoch": 0.03547501680990911, "learning_rate": 9.921655919258753e-06, "loss": 6.295087280273438, "step": 29400 }, { "epoch": 0.035595680132391797, "learning_rate": 9.921252083791015e-06, "loss": 6.290713500976563, "step": 29500 }, { "epoch": 0.03571634345487448, "learning_rate": 9.920848248323277e-06, "loss": 6.285931396484375, "step": 29600 }, { "epoch": 0.03583700677735716, "learning_rate": 9.920444412855539e-06, "loss": 6.309791870117188, "step": 29700 }, { "epoch": 0.03595767009983985, "learning_rate": 9.920040577387799e-06, "loss": 6.302537841796875, "step": 29800 }, { "epoch": 0.036078333422322535, "learning_rate": 9.91963674192006e-06, "loss": 6.308652954101563, "step": 29900 }, { "epoch": 0.036198996744805215, "learning_rate": 9.919232906452321e-06, "loss": 6.258733520507812, "step": 30000 }, { "epoch": 0.0363196600672879, "learning_rate": 9.918829070984583e-06, "loss": 6.288374633789062, "step": 30100 }, { "epoch": 0.03644032338977059, "learning_rate": 9.918425235516845e-06, "loss": 6.268796997070313, "step": 30200 }, { "epoch": 0.03656098671225327, "learning_rate": 9.918021400049107e-06, "loss": 6.256526489257812, "step": 30300 }, { "epoch": 0.03668165003473595, "learning_rate": 9.917617564581369e-06, "loss": 6.274508056640625, "step": 30400 }, { "epoch": 0.03680231335721864, "learning_rate": 9.917213729113631e-06, "loss": 6.27301025390625, "step": 30500 }, { "epoch": 0.03692297667970132, "learning_rate": 9.916809893645893e-06, "loss": 6.24278076171875, "step": 30600 }, { "epoch": 0.037043640002184006, "learning_rate": 9.916406058178153e-06, "loss": 6.2477734375, "step": 30700 }, { "epoch": 0.03716430332466669, "learning_rate": 9.916002222710415e-06, "loss": 6.243428955078125, "step": 30800 }, { "epoch": 0.03728496664714937, "learning_rate": 9.915598387242677e-06, "loss": 6.238870239257812, "step": 30900 }, { "epoch": 0.03740562996963206, "learning_rate": 9.915194551774938e-06, "loss": 6.225955810546875, "step": 31000 }, { "epoch": 0.037526293292114744, "learning_rate": 9.9147907163072e-06, "loss": 6.218800659179688, "step": 31100 }, { "epoch": 0.037646956614597424, "learning_rate": 9.914386880839461e-06, "loss": 6.21949462890625, "step": 31200 }, { "epoch": 0.03776761993708011, "learning_rate": 9.913983045371723e-06, "loss": 6.182770385742187, "step": 31300 }, { "epoch": 0.0378882832595628, "learning_rate": 9.913579209903985e-06, "loss": 6.196390991210937, "step": 31400 }, { "epoch": 0.038008946582045476, "learning_rate": 9.913175374436247e-06, "loss": 6.185361328125, "step": 31500 }, { "epoch": 0.03812960990452816, "learning_rate": 9.91277153896851e-06, "loss": 6.214140014648438, "step": 31600 }, { "epoch": 0.03825027322701085, "learning_rate": 9.91236770350077e-06, "loss": 6.208532104492187, "step": 31700 }, { "epoch": 0.03837093654949353, "learning_rate": 9.911963868033032e-06, "loss": 6.163168334960938, "step": 31800 }, { "epoch": 0.038491599871976215, "learning_rate": 9.911560032565292e-06, "loss": 6.170020751953125, "step": 31900 }, { "epoch": 0.0386122631944589, "learning_rate": 9.911156197097554e-06, "loss": 6.167660522460937, "step": 32000 }, { "epoch": 0.03873292651694158, "learning_rate": 9.910752361629816e-06, "loss": 6.15995361328125, "step": 32100 }, { "epoch": 0.03885358983942427, "learning_rate": 9.910348526162078e-06, "loss": 6.178750610351562, "step": 32200 }, { "epoch": 0.038974253161906953, "learning_rate": 9.90994469069434e-06, "loss": 6.160189208984375, "step": 32300 }, { "epoch": 0.03909491648438963, "learning_rate": 9.909540855226602e-06, "loss": 6.1517181396484375, "step": 32400 }, { "epoch": 0.03921557980687232, "learning_rate": 9.909137019758862e-06, "loss": 6.173123168945312, "step": 32500 }, { "epoch": 0.039336243129355006, "learning_rate": 9.908733184291124e-06, "loss": 6.134052124023437, "step": 32600 }, { "epoch": 0.039456906451837685, "learning_rate": 9.908329348823386e-06, "loss": 6.1498785400390625, "step": 32700 }, { "epoch": 0.03957756977432037, "learning_rate": 9.907925513355648e-06, "loss": 6.165042724609375, "step": 32800 }, { "epoch": 0.03969823309680306, "learning_rate": 9.907521677887908e-06, "loss": 6.1348779296875, "step": 32900 }, { "epoch": 0.03981889641928574, "learning_rate": 9.90711784242017e-06, "loss": 6.134515991210938, "step": 33000 }, { "epoch": 0.039939559741768424, "learning_rate": 9.906714006952432e-06, "loss": 6.169119873046875, "step": 33100 }, { "epoch": 0.04006022306425111, "learning_rate": 9.906310171484694e-06, "loss": 6.122115478515625, "step": 33200 }, { "epoch": 0.04018088638673379, "learning_rate": 9.905906336016955e-06, "loss": 6.1315069580078125, "step": 33300 }, { "epoch": 0.040301549709216476, "learning_rate": 9.905502500549217e-06, "loss": 6.11522216796875, "step": 33400 }, { "epoch": 0.04042221303169916, "learning_rate": 9.905098665081479e-06, "loss": 6.1282586669921875, "step": 33500 }, { "epoch": 0.04054287635418184, "learning_rate": 9.90469482961374e-06, "loss": 6.114356689453125, "step": 33600 }, { "epoch": 0.04066353967666453, "learning_rate": 9.904290994146003e-06, "loss": 6.118187255859375, "step": 33700 }, { "epoch": 0.040784202999147215, "learning_rate": 9.903887158678263e-06, "loss": 6.131346435546875, "step": 33800 }, { "epoch": 0.040904866321629894, "learning_rate": 9.903483323210525e-06, "loss": 6.07158447265625, "step": 33900 }, { "epoch": 0.04102552964411258, "learning_rate": 9.903079487742787e-06, "loss": 6.1041943359375, "step": 34000 }, { "epoch": 0.04114619296659527, "learning_rate": 9.902675652275047e-06, "loss": 6.083723754882812, "step": 34100 }, { "epoch": 0.04126685628907795, "learning_rate": 9.902271816807309e-06, "loss": 6.080000610351562, "step": 34200 }, { "epoch": 0.04138751961156063, "learning_rate": 9.901867981339571e-06, "loss": 6.075195922851562, "step": 34300 }, { "epoch": 0.04150818293404332, "learning_rate": 9.901464145871833e-06, "loss": 6.10289306640625, "step": 34400 }, { "epoch": 0.041628846256526, "learning_rate": 9.901060310404095e-06, "loss": 6.061969604492187, "step": 34500 }, { "epoch": 0.041749509579008685, "learning_rate": 9.900656474936357e-06, "loss": 6.068685302734375, "step": 34600 }, { "epoch": 0.04187017290149137, "learning_rate": 9.900252639468619e-06, "loss": 6.074742431640625, "step": 34700 }, { "epoch": 0.04199083622397405, "learning_rate": 9.89984880400088e-06, "loss": 6.040508422851563, "step": 34800 }, { "epoch": 0.04211149954645674, "learning_rate": 9.899444968533141e-06, "loss": 6.060413208007812, "step": 34900 }, { "epoch": 0.042232162868939424, "learning_rate": 9.899041133065402e-06, "loss": 6.077679443359375, "step": 35000 }, { "epoch": 0.042352826191422104, "learning_rate": 9.898637297597664e-06, "loss": 6.033153076171875, "step": 35100 }, { "epoch": 0.04247348951390479, "learning_rate": 9.898233462129926e-06, "loss": 6.03320556640625, "step": 35200 }, { "epoch": 0.04259415283638747, "learning_rate": 9.897829626662188e-06, "loss": 6.057587280273437, "step": 35300 }, { "epoch": 0.042714816158870156, "learning_rate": 9.89742579119445e-06, "loss": 6.067791748046875, "step": 35400 }, { "epoch": 0.04283547948135284, "learning_rate": 9.897021955726711e-06, "loss": 6.061552124023438, "step": 35500 }, { "epoch": 0.04295614280383552, "learning_rate": 9.896618120258973e-06, "loss": 6.047073974609375, "step": 35600 }, { "epoch": 0.04307680612631821, "learning_rate": 9.896214284791234e-06, "loss": 6.028131103515625, "step": 35700 }, { "epoch": 0.043197469448800895, "learning_rate": 9.895810449323496e-06, "loss": 6.0347705078125, "step": 35800 }, { "epoch": 0.043318132771283574, "learning_rate": 9.895406613855758e-06, "loss": 6.010587768554688, "step": 35900 }, { "epoch": 0.04343879609376626, "learning_rate": 9.895002778388018e-06, "loss": 6.03420166015625, "step": 36000 }, { "epoch": 0.04355945941624895, "learning_rate": 9.89459894292028e-06, "loss": 6.025477905273437, "step": 36100 }, { "epoch": 0.043680122738731626, "learning_rate": 9.894195107452542e-06, "loss": 6.012522583007812, "step": 36200 }, { "epoch": 0.04380078606121431, "learning_rate": 9.893791271984804e-06, "loss": 5.981051025390625, "step": 36300 }, { "epoch": 0.043921449383697, "learning_rate": 9.893387436517066e-06, "loss": 6.0163201904296875, "step": 36400 }, { "epoch": 0.04404211270617968, "learning_rate": 9.892983601049328e-06, "loss": 6.000119018554687, "step": 36500 }, { "epoch": 0.044162776028662365, "learning_rate": 9.892579765581588e-06, "loss": 6.0064239501953125, "step": 36600 }, { "epoch": 0.04428343935114505, "learning_rate": 9.89217593011385e-06, "loss": 5.995327758789062, "step": 36700 }, { "epoch": 0.04440410267362773, "learning_rate": 9.891772094646112e-06, "loss": 5.96276123046875, "step": 36800 }, { "epoch": 0.04452476599611042, "learning_rate": 9.891368259178372e-06, "loss": 5.97086181640625, "step": 36900 }, { "epoch": 0.044645429318593104, "learning_rate": 9.890964423710634e-06, "loss": 5.97990234375, "step": 37000 }, { "epoch": 0.04476609264107578, "learning_rate": 9.890560588242896e-06, "loss": 5.986522827148438, "step": 37100 }, { "epoch": 0.04488675596355847, "learning_rate": 9.890156752775158e-06, "loss": 6.0063623046875, "step": 37200 }, { "epoch": 0.045007419286041156, "learning_rate": 9.88975291730742e-06, "loss": 5.954756469726562, "step": 37300 }, { "epoch": 0.045128082608523835, "learning_rate": 9.88934908183968e-06, "loss": 5.989403076171875, "step": 37400 }, { "epoch": 0.04524874593100652, "learning_rate": 9.888945246371943e-06, "loss": 5.97143310546875, "step": 37500 }, { "epoch": 0.04536940925348921, "learning_rate": 9.888541410904205e-06, "loss": 5.985697021484375, "step": 37600 }, { "epoch": 0.04549007257597189, "learning_rate": 9.888137575436467e-06, "loss": 5.979300537109375, "step": 37700 }, { "epoch": 0.045610735898454574, "learning_rate": 9.887733739968729e-06, "loss": 5.945584106445312, "step": 37800 }, { "epoch": 0.04573139922093726, "learning_rate": 9.887329904500989e-06, "loss": 5.941597290039063, "step": 37900 }, { "epoch": 0.04585206254341994, "learning_rate": 9.886926069033251e-06, "loss": 5.938487548828125, "step": 38000 }, { "epoch": 0.045972725865902626, "learning_rate": 9.886522233565513e-06, "loss": 5.946324462890625, "step": 38100 }, { "epoch": 0.04609338918838531, "learning_rate": 9.886118398097773e-06, "loss": 5.954590454101562, "step": 38200 }, { "epoch": 0.04621405251086799, "learning_rate": 9.885714562630035e-06, "loss": 5.935897216796875, "step": 38300 }, { "epoch": 0.04633471583335068, "learning_rate": 9.885310727162297e-06, "loss": 5.946389770507812, "step": 38400 }, { "epoch": 0.046455379155833365, "learning_rate": 9.884906891694559e-06, "loss": 5.924605712890625, "step": 38500 }, { "epoch": 0.046576042478316045, "learning_rate": 9.884503056226821e-06, "loss": 5.8884765625, "step": 38600 }, { "epoch": 0.04669670580079873, "learning_rate": 9.884099220759083e-06, "loss": 5.920947875976562, "step": 38700 }, { "epoch": 0.04681736912328142, "learning_rate": 9.883695385291345e-06, "loss": 5.917391357421875, "step": 38800 }, { "epoch": 0.0469380324457641, "learning_rate": 9.883291549823605e-06, "loss": 5.922462768554688, "step": 38900 }, { "epoch": 0.04705869576824678, "learning_rate": 9.882887714355867e-06, "loss": 5.899052124023438, "step": 39000 }, { "epoch": 0.04717935909072947, "learning_rate": 9.882483878888128e-06, "loss": 5.926414184570312, "step": 39100 }, { "epoch": 0.04730002241321215, "learning_rate": 9.88208004342039e-06, "loss": 5.90779296875, "step": 39200 }, { "epoch": 0.047420685735694836, "learning_rate": 9.881676207952652e-06, "loss": 5.891823120117188, "step": 39300 }, { "epoch": 0.04754134905817752, "learning_rate": 9.881272372484914e-06, "loss": 5.90169189453125, "step": 39400 }, { "epoch": 0.0476620123806602, "learning_rate": 9.880868537017176e-06, "loss": 5.892493896484375, "step": 39500 }, { "epoch": 0.04778267570314289, "learning_rate": 9.880464701549438e-06, "loss": 5.870087890625, "step": 39600 }, { "epoch": 0.047903339025625574, "learning_rate": 9.8800608660817e-06, "loss": 5.886649780273437, "step": 39700 }, { "epoch": 0.048024002348108254, "learning_rate": 9.87965703061396e-06, "loss": 5.894774780273438, "step": 39800 }, { "epoch": 0.04814466567059094, "learning_rate": 9.879253195146222e-06, "loss": 5.86189208984375, "step": 39900 }, { "epoch": 0.048265328993073627, "learning_rate": 9.878849359678484e-06, "loss": 5.86906005859375, "step": 40000 }, { "epoch": 0.048385992315556306, "learning_rate": 9.878445524210744e-06, "loss": 5.907960815429687, "step": 40100 }, { "epoch": 0.04850665563803899, "learning_rate": 9.878041688743006e-06, "loss": 5.850534057617187, "step": 40200 }, { "epoch": 0.04862731896052168, "learning_rate": 9.877637853275268e-06, "loss": 5.88085693359375, "step": 40300 }, { "epoch": 0.04874798228300436, "learning_rate": 9.87723401780753e-06, "loss": 5.872523803710937, "step": 40400 }, { "epoch": 0.048868645605487045, "learning_rate": 9.876830182339792e-06, "loss": 5.859061889648437, "step": 40500 }, { "epoch": 0.04898930892796973, "learning_rate": 9.876426346872052e-06, "loss": 5.855042114257812, "step": 40600 }, { "epoch": 0.04910997225045241, "learning_rate": 9.876022511404314e-06, "loss": 5.862298583984375, "step": 40700 }, { "epoch": 0.0492306355729351, "learning_rate": 9.875618675936576e-06, "loss": 5.823678588867187, "step": 40800 }, { "epoch": 0.04935129889541778, "learning_rate": 9.875214840468838e-06, "loss": 5.839556884765625, "step": 40900 }, { "epoch": 0.04947196221790046, "learning_rate": 9.874811005001098e-06, "loss": 5.82404052734375, "step": 41000 }, { "epoch": 0.04959262554038315, "learning_rate": 9.87440716953336e-06, "loss": 5.824871215820313, "step": 41100 }, { "epoch": 0.049713288862865836, "learning_rate": 9.874003334065622e-06, "loss": 5.827488403320313, "step": 41200 }, { "epoch": 0.049833952185348515, "learning_rate": 9.873599498597884e-06, "loss": 5.848665771484375, "step": 41300 }, { "epoch": 0.0499546155078312, "learning_rate": 9.873195663130146e-06, "loss": 5.826472778320312, "step": 41400 }, { "epoch": 0.05007527883031389, "learning_rate": 9.872791827662407e-06, "loss": 5.829556274414062, "step": 41500 }, { "epoch": 0.05019594215279657, "learning_rate": 9.872387992194669e-06, "loss": 5.819097290039062, "step": 41600 }, { "epoch": 0.050316605475279254, "learning_rate": 9.87198415672693e-06, "loss": 5.812535400390625, "step": 41700 }, { "epoch": 0.05043726879776193, "learning_rate": 9.871580321259193e-06, "loss": 5.79991943359375, "step": 41800 }, { "epoch": 0.05055793212024462, "learning_rate": 9.871176485791455e-06, "loss": 5.77990234375, "step": 41900 }, { "epoch": 0.050678595442727306, "learning_rate": 9.870772650323715e-06, "loss": 5.809010009765625, "step": 42000 }, { "epoch": 0.050799258765209986, "learning_rate": 9.870368814855977e-06, "loss": 5.794039306640625, "step": 42100 }, { "epoch": 0.05091992208769267, "learning_rate": 9.869964979388239e-06, "loss": 5.773182373046875, "step": 42200 }, { "epoch": 0.05104058541017536, "learning_rate": 9.8695611439205e-06, "loss": 5.795257568359375, "step": 42300 }, { "epoch": 0.05116124873265804, "learning_rate": 9.869157308452761e-06, "loss": 5.828724975585938, "step": 42400 }, { "epoch": 0.051281912055140724, "learning_rate": 9.868753472985023e-06, "loss": 5.810231323242188, "step": 42500 }, { "epoch": 0.05140257537762341, "learning_rate": 9.868349637517285e-06, "loss": 5.766407470703125, "step": 42600 }, { "epoch": 0.05152323870010609, "learning_rate": 9.867945802049547e-06, "loss": 5.799169311523437, "step": 42700 }, { "epoch": 0.05164390202258878, "learning_rate": 9.867541966581809e-06, "loss": 5.8177978515625, "step": 42800 }, { "epoch": 0.05176456534507146, "learning_rate": 9.86713813111407e-06, "loss": 5.7826611328125, "step": 42900 }, { "epoch": 0.05188522866755414, "learning_rate": 9.866734295646331e-06, "loss": 5.781925659179688, "step": 43000 }, { "epoch": 0.05200589199003683, "learning_rate": 9.866330460178593e-06, "loss": 5.7845916748046875, "step": 43100 }, { "epoch": 0.052126555312519515, "learning_rate": 9.865926624710854e-06, "loss": 5.79017822265625, "step": 43200 }, { "epoch": 0.052247218635002195, "learning_rate": 9.865522789243116e-06, "loss": 5.769013061523437, "step": 43300 }, { "epoch": 0.05236788195748488, "learning_rate": 9.865118953775378e-06, "loss": 5.766888427734375, "step": 43400 }, { "epoch": 0.05248854527996757, "learning_rate": 9.86471511830764e-06, "loss": 5.764293212890625, "step": 43500 }, { "epoch": 0.05260920860245025, "learning_rate": 9.864311282839902e-06, "loss": 5.7430487060546875, "step": 43600 }, { "epoch": 0.05272987192493293, "learning_rate": 9.863907447372164e-06, "loss": 5.750333251953125, "step": 43700 }, { "epoch": 0.05285053524741562, "learning_rate": 9.863503611904426e-06, "loss": 5.78717529296875, "step": 43800 }, { "epoch": 0.0529711985698983, "learning_rate": 9.863099776436686e-06, "loss": 5.78459228515625, "step": 43900 }, { "epoch": 0.053091861892380986, "learning_rate": 9.862695940968948e-06, "loss": 5.7740380859375, "step": 44000 }, { "epoch": 0.05321252521486367, "learning_rate": 9.862292105501208e-06, "loss": 5.722774658203125, "step": 44100 }, { "epoch": 0.05333318853734635, "learning_rate": 9.86188827003347e-06, "loss": 5.745663452148437, "step": 44200 }, { "epoch": 0.05345385185982904, "learning_rate": 9.861484434565732e-06, "loss": 5.737649536132812, "step": 44300 }, { "epoch": 0.053574515182311724, "learning_rate": 9.861080599097994e-06, "loss": 5.747950439453125, "step": 44400 }, { "epoch": 0.053695178504794404, "learning_rate": 9.860676763630256e-06, "loss": 5.738473510742187, "step": 44500 }, { "epoch": 0.05381584182727709, "learning_rate": 9.860272928162518e-06, "loss": 5.716368408203125, "step": 44600 }, { "epoch": 0.05393650514975978, "learning_rate": 9.859869092694778e-06, "loss": 5.750637817382812, "step": 44700 }, { "epoch": 0.054057168472242456, "learning_rate": 9.85946525722704e-06, "loss": 5.746980590820312, "step": 44800 }, { "epoch": 0.05417783179472514, "learning_rate": 9.859061421759302e-06, "loss": 5.73247314453125, "step": 44900 }, { "epoch": 0.05429849511720783, "learning_rate": 9.858657586291564e-06, "loss": 5.742887573242188, "step": 45000 }, { "epoch": 0.05441915843969051, "learning_rate": 9.858253750823825e-06, "loss": 5.718990478515625, "step": 45100 }, { "epoch": 0.054539821762173195, "learning_rate": 9.857849915356087e-06, "loss": 5.700264282226563, "step": 45200 }, { "epoch": 0.05466048508465588, "learning_rate": 9.857446079888348e-06, "loss": 5.7020849609375, "step": 45300 }, { "epoch": 0.05478114840713856, "learning_rate": 9.85704224442061e-06, "loss": 5.697625732421875, "step": 45400 }, { "epoch": 0.05490181172962125, "learning_rate": 9.85663840895287e-06, "loss": 5.695245361328125, "step": 45500 }, { "epoch": 0.055022475052103934, "learning_rate": 9.856234573485133e-06, "loss": 5.713543090820313, "step": 45600 }, { "epoch": 0.05514313837458661, "learning_rate": 9.855830738017395e-06, "loss": 5.684797973632812, "step": 45700 }, { "epoch": 0.0552638016970693, "learning_rate": 9.855426902549657e-06, "loss": 5.691742553710937, "step": 45800 }, { "epoch": 0.055384465019551986, "learning_rate": 9.855023067081919e-06, "loss": 5.704517211914062, "step": 45900 }, { "epoch": 0.055505128342034665, "learning_rate": 9.854619231614179e-06, "loss": 5.6752166748046875, "step": 46000 }, { "epoch": 0.05562579166451735, "learning_rate": 9.854215396146441e-06, "loss": 5.681259765625, "step": 46100 }, { "epoch": 0.05574645498700004, "learning_rate": 9.853811560678703e-06, "loss": 5.696261596679688, "step": 46200 }, { "epoch": 0.05586711830948272, "learning_rate": 9.853407725210965e-06, "loss": 5.70001953125, "step": 46300 }, { "epoch": 0.055987781631965404, "learning_rate": 9.853003889743225e-06, "loss": 5.69338134765625, "step": 46400 }, { "epoch": 0.05610844495444809, "learning_rate": 9.852600054275487e-06, "loss": 5.696197509765625, "step": 46500 }, { "epoch": 0.05622910827693077, "learning_rate": 9.85219621880775e-06, "loss": 5.712601928710938, "step": 46600 }, { "epoch": 0.056349771599413456, "learning_rate": 9.851792383340011e-06, "loss": 5.650829467773438, "step": 46700 }, { "epoch": 0.05647043492189614, "learning_rate": 9.851388547872273e-06, "loss": 5.642108154296875, "step": 46800 }, { "epoch": 0.05659109824437882, "learning_rate": 9.850984712404535e-06, "loss": 5.658579711914062, "step": 46900 }, { "epoch": 0.05671176156686151, "learning_rate": 9.850580876936795e-06, "loss": 5.652801513671875, "step": 47000 }, { "epoch": 0.056832424889344195, "learning_rate": 9.850177041469057e-06, "loss": 5.683375854492187, "step": 47100 }, { "epoch": 0.056953088211826874, "learning_rate": 9.849773206001318e-06, "loss": 5.64796630859375, "step": 47200 }, { "epoch": 0.05707375153430956, "learning_rate": 9.84936937053358e-06, "loss": 5.649228515625, "step": 47300 }, { "epoch": 0.05719441485679225, "learning_rate": 9.848965535065842e-06, "loss": 5.65912841796875, "step": 47400 }, { "epoch": 0.05731507817927493, "learning_rate": 9.848561699598104e-06, "loss": 5.653483276367187, "step": 47500 }, { "epoch": 0.05743574150175761, "learning_rate": 9.848157864130366e-06, "loss": 5.6471826171875, "step": 47600 }, { "epoch": 0.0575564048242403, "learning_rate": 9.847754028662628e-06, "loss": 5.65800048828125, "step": 47700 }, { "epoch": 0.05767706814672298, "learning_rate": 9.84735019319489e-06, "loss": 5.6379833984375, "step": 47800 }, { "epoch": 0.057797731469205665, "learning_rate": 9.84694635772715e-06, "loss": 5.633699340820312, "step": 47900 }, { "epoch": 0.05791839479168835, "learning_rate": 9.846542522259412e-06, "loss": 5.66202392578125, "step": 48000 }, { "epoch": 0.05803905811417103, "learning_rate": 9.846138686791674e-06, "loss": 5.6377734375, "step": 48100 }, { "epoch": 0.05815972143665372, "learning_rate": 9.845734851323934e-06, "loss": 5.629166870117188, "step": 48200 }, { "epoch": 0.0582803847591364, "learning_rate": 9.845331015856196e-06, "loss": 5.624560546875, "step": 48300 }, { "epoch": 0.058401048081619084, "learning_rate": 9.844927180388458e-06, "loss": 5.6068878173828125, "step": 48400 }, { "epoch": 0.05852171140410177, "learning_rate": 9.84452334492072e-06, "loss": 5.632612915039062, "step": 48500 }, { "epoch": 0.05864237472658445, "learning_rate": 9.844119509452982e-06, "loss": 5.59102294921875, "step": 48600 }, { "epoch": 0.058763038049067136, "learning_rate": 9.843715673985244e-06, "loss": 5.6015252685546875, "step": 48700 }, { "epoch": 0.05888370137154982, "learning_rate": 9.843311838517504e-06, "loss": 5.610700073242188, "step": 48800 }, { "epoch": 0.0590043646940325, "learning_rate": 9.842908003049766e-06, "loss": 5.6188427734375, "step": 48900 }, { "epoch": 0.05912502801651519, "learning_rate": 9.842504167582028e-06, "loss": 5.6034698486328125, "step": 49000 }, { "epoch": 0.059245691338997875, "learning_rate": 9.842100332114289e-06, "loss": 5.592289428710938, "step": 49100 }, { "epoch": 0.059366354661480554, "learning_rate": 9.84169649664655e-06, "loss": 5.59678466796875, "step": 49200 }, { "epoch": 0.05948701798396324, "learning_rate": 9.841292661178813e-06, "loss": 5.584678344726562, "step": 49300 }, { "epoch": 0.05960768130644593, "learning_rate": 9.840888825711075e-06, "loss": 5.604636840820312, "step": 49400 }, { "epoch": 0.059728344628928606, "learning_rate": 9.840484990243337e-06, "loss": 5.59030029296875, "step": 49500 }, { "epoch": 0.05984900795141129, "learning_rate": 9.840081154775597e-06, "loss": 5.601084594726562, "step": 49600 }, { "epoch": 0.05996967127389398, "learning_rate": 9.839677319307859e-06, "loss": 5.613219604492188, "step": 49700 }, { "epoch": 0.06009033459637666, "learning_rate": 9.83927348384012e-06, "loss": 5.557407836914063, "step": 49800 }, { "epoch": 0.060210997918859345, "learning_rate": 9.838869648372383e-06, "loss": 5.575147094726563, "step": 49900 }, { "epoch": 0.06033166124134203, "learning_rate": 9.838465812904645e-06, "loss": 5.553262939453125, "step": 50000 }, { "epoch": 0.06045232456382471, "learning_rate": 9.838061977436905e-06, "loss": 5.550405883789063, "step": 50100 }, { "epoch": 0.0605729878863074, "learning_rate": 9.837658141969167e-06, "loss": 5.579466552734375, "step": 50200 }, { "epoch": 0.060693651208790084, "learning_rate": 9.837254306501429e-06, "loss": 5.56111328125, "step": 50300 }, { "epoch": 0.06081431453127276, "learning_rate": 9.83685047103369e-06, "loss": 5.578643798828125, "step": 50400 }, { "epoch": 0.06093497785375545, "learning_rate": 9.836446635565951e-06, "loss": 5.561683349609375, "step": 50500 }, { "epoch": 0.061055641176238136, "learning_rate": 9.836042800098213e-06, "loss": 5.570487060546875, "step": 50600 }, { "epoch": 0.061176304498720815, "learning_rate": 9.835638964630475e-06, "loss": 5.524298095703125, "step": 50700 }, { "epoch": 0.0612969678212035, "learning_rate": 9.835235129162737e-06, "loss": 5.562306518554688, "step": 50800 }, { "epoch": 0.06141763114368619, "learning_rate": 9.834831293695e-06, "loss": 5.566176147460937, "step": 50900 }, { "epoch": 0.06153829446616887, "learning_rate": 9.83442745822726e-06, "loss": 5.533325805664062, "step": 51000 }, { "epoch": 0.061658957788651554, "learning_rate": 9.834023622759521e-06, "loss": 5.5660498046875, "step": 51100 }, { "epoch": 0.06177962111113424, "learning_rate": 9.833619787291783e-06, "loss": 5.52291748046875, "step": 51200 }, { "epoch": 0.06190028443361692, "learning_rate": 9.833215951824044e-06, "loss": 5.526439208984375, "step": 51300 }, { "epoch": 0.062020947756099606, "learning_rate": 9.832812116356306e-06, "loss": 5.51739990234375, "step": 51400 }, { "epoch": 0.06214161107858229, "learning_rate": 9.832408280888568e-06, "loss": 5.55761474609375, "step": 51500 }, { "epoch": 0.06226227440106497, "learning_rate": 9.83200444542083e-06, "loss": 5.556441650390625, "step": 51600 }, { "epoch": 0.06238293772354766, "learning_rate": 9.831600609953092e-06, "loss": 5.51667724609375, "step": 51700 }, { "epoch": 0.06250360104603034, "learning_rate": 9.831196774485354e-06, "loss": 5.497745971679688, "step": 51800 }, { "epoch": 0.06262426436851302, "learning_rate": 9.830792939017616e-06, "loss": 5.506736450195312, "step": 51900 }, { "epoch": 0.06274492769099571, "learning_rate": 9.830389103549876e-06, "loss": 5.5475836181640625, "step": 52000 }, { "epoch": 0.0628655910134784, "learning_rate": 9.829985268082138e-06, "loss": 5.504075317382813, "step": 52100 }, { "epoch": 0.06298625433596108, "learning_rate": 9.829581432614398e-06, "loss": 5.52787109375, "step": 52200 }, { "epoch": 0.06310691765844376, "learning_rate": 9.82917759714666e-06, "loss": 5.494723510742188, "step": 52300 }, { "epoch": 0.06322758098092644, "learning_rate": 9.828773761678922e-06, "loss": 5.514593505859375, "step": 52400 }, { "epoch": 0.06334824430340913, "learning_rate": 9.828369926211184e-06, "loss": 5.506063232421875, "step": 52500 }, { "epoch": 0.06346890762589182, "learning_rate": 9.827966090743446e-06, "loss": 5.525193481445313, "step": 52600 }, { "epoch": 0.0635895709483745, "learning_rate": 9.827562255275708e-06, "loss": 5.536563720703125, "step": 52700 }, { "epoch": 0.06371023427085719, "learning_rate": 9.82715841980797e-06, "loss": 5.473799438476562, "step": 52800 }, { "epoch": 0.06383089759333986, "learning_rate": 9.82675458434023e-06, "loss": 5.494265747070313, "step": 52900 }, { "epoch": 0.06395156091582255, "learning_rate": 9.826350748872492e-06, "loss": 5.47943603515625, "step": 53000 }, { "epoch": 0.06407222423830523, "learning_rate": 9.825946913404754e-06, "loss": 5.489384155273438, "step": 53100 }, { "epoch": 0.06419288756078792, "learning_rate": 9.825543077937015e-06, "loss": 5.486170654296875, "step": 53200 }, { "epoch": 0.0643135508832706, "learning_rate": 9.825139242469277e-06, "loss": 5.4916314697265625, "step": 53300 }, { "epoch": 0.06443421420575329, "learning_rate": 9.824735407001539e-06, "loss": 5.490230102539062, "step": 53400 }, { "epoch": 0.06455487752823597, "learning_rate": 9.8243315715338e-06, "loss": 5.4870233154296875, "step": 53500 }, { "epoch": 0.06467554085071865, "learning_rate": 9.823927736066063e-06, "loss": 5.458673706054688, "step": 53600 }, { "epoch": 0.06479620417320134, "learning_rate": 9.823523900598323e-06, "loss": 5.498256225585937, "step": 53700 }, { "epoch": 0.06491686749568402, "learning_rate": 9.823120065130585e-06, "loss": 5.452241821289062, "step": 53800 }, { "epoch": 0.06503753081816671, "learning_rate": 9.822716229662847e-06, "loss": 5.48254150390625, "step": 53900 }, { "epoch": 0.0651581941406494, "learning_rate": 9.822312394195109e-06, "loss": 5.49094970703125, "step": 54000 }, { "epoch": 0.06527885746313207, "learning_rate": 9.82190855872737e-06, "loss": 5.470156860351563, "step": 54100 }, { "epoch": 0.06539952078561476, "learning_rate": 9.821504723259631e-06, "loss": 5.458375244140625, "step": 54200 }, { "epoch": 0.06552018410809744, "learning_rate": 9.821100887791893e-06, "loss": 5.4711083984375, "step": 54300 }, { "epoch": 0.06564084743058013, "learning_rate": 9.820697052324155e-06, "loss": 5.451007080078125, "step": 54400 }, { "epoch": 0.06576151075306282, "learning_rate": 9.820293216856415e-06, "loss": 5.4637518310546875, "step": 54500 }, { "epoch": 0.0658821740755455, "learning_rate": 9.819889381388677e-06, "loss": 5.446215209960937, "step": 54600 }, { "epoch": 0.06600283739802817, "learning_rate": 9.81948554592094e-06, "loss": 5.457670288085938, "step": 54700 }, { "epoch": 0.06612350072051086, "learning_rate": 9.819081710453201e-06, "loss": 5.455287475585937, "step": 54800 }, { "epoch": 0.06624416404299355, "learning_rate": 9.818677874985463e-06, "loss": 5.436695556640625, "step": 54900 }, { "epoch": 0.06636482736547623, "learning_rate": 9.818274039517725e-06, "loss": 5.45849853515625, "step": 55000 }, { "epoch": 0.06648549068795892, "learning_rate": 9.817870204049985e-06, "loss": 5.436983032226562, "step": 55100 }, { "epoch": 0.0666061540104416, "learning_rate": 9.817466368582247e-06, "loss": 5.450509033203125, "step": 55200 }, { "epoch": 0.06672681733292428, "learning_rate": 9.81706253311451e-06, "loss": 5.440614013671875, "step": 55300 }, { "epoch": 0.06684748065540697, "learning_rate": 9.81665869764677e-06, "loss": 5.450062866210938, "step": 55400 }, { "epoch": 0.06696814397788965, "learning_rate": 9.816254862179032e-06, "loss": 5.440513305664062, "step": 55500 }, { "epoch": 0.06708880730037234, "learning_rate": 9.815851026711294e-06, "loss": 5.45876953125, "step": 55600 }, { "epoch": 0.06720947062285502, "learning_rate": 9.815447191243556e-06, "loss": 5.445390014648438, "step": 55700 }, { "epoch": 0.06733013394533771, "learning_rate": 9.815043355775818e-06, "loss": 5.438015747070312, "step": 55800 }, { "epoch": 0.06745079726782038, "learning_rate": 9.81463952030808e-06, "loss": 5.417323608398437, "step": 55900 }, { "epoch": 0.06757146059030307, "learning_rate": 9.814235684840342e-06, "loss": 5.4468841552734375, "step": 56000 }, { "epoch": 0.06769212391278576, "learning_rate": 9.813831849372602e-06, "loss": 5.424739379882812, "step": 56100 }, { "epoch": 0.06781278723526844, "learning_rate": 9.813428013904864e-06, "loss": 5.445565795898437, "step": 56200 }, { "epoch": 0.06793345055775113, "learning_rate": 9.813024178437124e-06, "loss": 5.397311401367188, "step": 56300 }, { "epoch": 0.06805411388023382, "learning_rate": 9.812620342969386e-06, "loss": 5.42822998046875, "step": 56400 }, { "epoch": 0.06817477720271649, "learning_rate": 9.812216507501648e-06, "loss": 5.4188385009765625, "step": 56500 }, { "epoch": 0.06829544052519917, "learning_rate": 9.81181267203391e-06, "loss": 5.391190795898438, "step": 56600 }, { "epoch": 0.06841610384768186, "learning_rate": 9.811408836566172e-06, "loss": 5.405062255859375, "step": 56700 }, { "epoch": 0.06853676717016455, "learning_rate": 9.811005001098434e-06, "loss": 5.404650268554687, "step": 56800 }, { "epoch": 0.06865743049264723, "learning_rate": 9.810601165630696e-06, "loss": 5.415482788085938, "step": 56900 }, { "epoch": 0.06877809381512992, "learning_rate": 9.810197330162956e-06, "loss": 5.415482177734375, "step": 57000 }, { "epoch": 0.06889875713761259, "learning_rate": 9.809793494695218e-06, "loss": 5.37707763671875, "step": 57100 }, { "epoch": 0.06901942046009528, "learning_rate": 9.80938965922748e-06, "loss": 5.413468017578125, "step": 57200 }, { "epoch": 0.06914008378257797, "learning_rate": 9.80898582375974e-06, "loss": 5.379092407226563, "step": 57300 }, { "epoch": 0.06926074710506065, "learning_rate": 9.808581988292003e-06, "loss": 5.39713623046875, "step": 57400 }, { "epoch": 0.06938141042754334, "learning_rate": 9.808178152824265e-06, "loss": 5.401636352539063, "step": 57500 }, { "epoch": 0.06950207375002602, "learning_rate": 9.807774317356527e-06, "loss": 5.393638916015625, "step": 57600 }, { "epoch": 0.0696227370725087, "learning_rate": 9.807370481888789e-06, "loss": 5.391743774414063, "step": 57700 }, { "epoch": 0.06974340039499138, "learning_rate": 9.806966646421049e-06, "loss": 5.345445556640625, "step": 57800 }, { "epoch": 0.06986406371747407, "learning_rate": 9.80656281095331e-06, "loss": 5.348238525390625, "step": 57900 }, { "epoch": 0.06998472703995676, "learning_rate": 9.806158975485573e-06, "loss": 5.375379028320313, "step": 58000 }, { "epoch": 0.07010539036243944, "learning_rate": 9.805755140017835e-06, "loss": 5.3898388671875, "step": 58100 }, { "epoch": 0.07022605368492212, "learning_rate": 9.805351304550095e-06, "loss": 5.37486328125, "step": 58200 }, { "epoch": 0.0703467170074048, "learning_rate": 9.804947469082357e-06, "loss": 5.377813110351562, "step": 58300 }, { "epoch": 0.07046738032988749, "learning_rate": 9.804543633614619e-06, "loss": 5.381748046875, "step": 58400 }, { "epoch": 0.07058804365237017, "learning_rate": 9.804139798146881e-06, "loss": 5.348593139648438, "step": 58500 }, { "epoch": 0.07070870697485286, "learning_rate": 9.803735962679141e-06, "loss": 5.369475708007813, "step": 58600 }, { "epoch": 0.07082937029733555, "learning_rate": 9.803332127211403e-06, "loss": 5.3422998046875, "step": 58700 }, { "epoch": 0.07095003361981822, "learning_rate": 9.802928291743665e-06, "loss": 5.3921356201171875, "step": 58800 }, { "epoch": 0.0710706969423009, "learning_rate": 9.802524456275927e-06, "loss": 5.365232543945313, "step": 58900 }, { "epoch": 0.07119136026478359, "learning_rate": 9.80212062080819e-06, "loss": 5.341582641601563, "step": 59000 }, { "epoch": 0.07131202358726628, "learning_rate": 9.801716785340451e-06, "loss": 5.3381201171875, "step": 59100 }, { "epoch": 0.07143268690974897, "learning_rate": 9.801312949872712e-06, "loss": 5.333232421875, "step": 59200 }, { "epoch": 0.07155335023223165, "learning_rate": 9.800909114404974e-06, "loss": 5.338631591796875, "step": 59300 }, { "epoch": 0.07167401355471432, "learning_rate": 9.800505278937234e-06, "loss": 5.317579345703125, "step": 59400 }, { "epoch": 0.07179467687719701, "learning_rate": 9.800101443469496e-06, "loss": 5.331469116210937, "step": 59500 }, { "epoch": 0.0719153401996797, "learning_rate": 9.799697608001758e-06, "loss": 5.339337768554688, "step": 59600 }, { "epoch": 0.07203600352216238, "learning_rate": 9.79929377253402e-06, "loss": 5.327628173828125, "step": 59700 }, { "epoch": 0.07215666684464507, "learning_rate": 9.798889937066282e-06, "loss": 5.363141479492188, "step": 59800 }, { "epoch": 0.07227733016712776, "learning_rate": 9.798486101598544e-06, "loss": 5.346229858398438, "step": 59900 }, { "epoch": 0.07239799348961043, "learning_rate": 9.798082266130806e-06, "loss": 5.3337109375, "step": 60000 }, { "epoch": 0.07251865681209312, "learning_rate": 9.797678430663066e-06, "loss": 5.371128540039063, "step": 60100 }, { "epoch": 0.0726393201345758, "learning_rate": 9.797274595195328e-06, "loss": 5.325468139648438, "step": 60200 }, { "epoch": 0.07275998345705849, "learning_rate": 9.79687075972759e-06, "loss": 5.351263427734375, "step": 60300 }, { "epoch": 0.07288064677954117, "learning_rate": 9.79646692425985e-06, "loss": 5.302833251953125, "step": 60400 }, { "epoch": 0.07300131010202386, "learning_rate": 9.796063088792112e-06, "loss": 5.320345458984375, "step": 60500 }, { "epoch": 0.07312197342450653, "learning_rate": 9.795659253324374e-06, "loss": 5.30924560546875, "step": 60600 }, { "epoch": 0.07324263674698922, "learning_rate": 9.795255417856636e-06, "loss": 5.312813110351563, "step": 60700 }, { "epoch": 0.0733633000694719, "learning_rate": 9.794851582388898e-06, "loss": 5.312037963867187, "step": 60800 }, { "epoch": 0.0734839633919546, "learning_rate": 9.79444774692116e-06, "loss": 5.3346142578125, "step": 60900 }, { "epoch": 0.07360462671443728, "learning_rate": 9.79404391145342e-06, "loss": 5.290857543945313, "step": 61000 }, { "epoch": 0.07372529003691997, "learning_rate": 9.793640075985682e-06, "loss": 5.333678588867188, "step": 61100 }, { "epoch": 0.07384595335940264, "learning_rate": 9.793236240517944e-06, "loss": 5.278713989257812, "step": 61200 }, { "epoch": 0.07396661668188532, "learning_rate": 9.792832405050205e-06, "loss": 5.292643432617187, "step": 61300 }, { "epoch": 0.07408728000436801, "learning_rate": 9.792428569582467e-06, "loss": 5.316370849609375, "step": 61400 }, { "epoch": 0.0742079433268507, "learning_rate": 9.792024734114729e-06, "loss": 5.312543334960938, "step": 61500 }, { "epoch": 0.07432860664933338, "learning_rate": 9.79162089864699e-06, "loss": 5.278667602539063, "step": 61600 }, { "epoch": 0.07444926997181607, "learning_rate": 9.791217063179253e-06, "loss": 5.2681646728515625, "step": 61700 }, { "epoch": 0.07456993329429874, "learning_rate": 9.790813227711515e-06, "loss": 5.295643310546875, "step": 61800 }, { "epoch": 0.07469059661678143, "learning_rate": 9.790409392243775e-06, "loss": 5.30662353515625, "step": 61900 }, { "epoch": 0.07481125993926412, "learning_rate": 9.790005556776037e-06, "loss": 5.2986328125, "step": 62000 }, { "epoch": 0.0749319232617468, "learning_rate": 9.789601721308299e-06, "loss": 5.298446044921875, "step": 62100 }, { "epoch": 0.07505258658422949, "learning_rate": 9.78919788584056e-06, "loss": 5.273689575195313, "step": 62200 }, { "epoch": 0.07517324990671218, "learning_rate": 9.788794050372821e-06, "loss": 5.304020385742188, "step": 62300 }, { "epoch": 0.07529391322919485, "learning_rate": 9.788390214905083e-06, "loss": 5.283749389648437, "step": 62400 }, { "epoch": 0.07541457655167753, "learning_rate": 9.787986379437345e-06, "loss": 5.284664916992187, "step": 62500 }, { "epoch": 0.07553523987416022, "learning_rate": 9.787582543969607e-06, "loss": 5.242105712890625, "step": 62600 }, { "epoch": 0.0756559031966429, "learning_rate": 9.787178708501867e-06, "loss": 5.273545532226563, "step": 62700 }, { "epoch": 0.0757765665191256, "learning_rate": 9.78677487303413e-06, "loss": 5.291265869140625, "step": 62800 }, { "epoch": 0.07589722984160828, "learning_rate": 9.786371037566391e-06, "loss": 5.2325592041015625, "step": 62900 }, { "epoch": 0.07601789316409095, "learning_rate": 9.785967202098653e-06, "loss": 5.281777954101562, "step": 63000 }, { "epoch": 0.07613855648657364, "learning_rate": 9.785563366630915e-06, "loss": 5.252301635742188, "step": 63100 }, { "epoch": 0.07625921980905633, "learning_rate": 9.785159531163176e-06, "loss": 5.271336669921875, "step": 63200 }, { "epoch": 0.07637988313153901, "learning_rate": 9.784755695695438e-06, "loss": 5.248751831054688, "step": 63300 }, { "epoch": 0.0765005464540217, "learning_rate": 9.7843518602277e-06, "loss": 5.28734130859375, "step": 63400 }, { "epoch": 0.07662120977650438, "learning_rate": 9.78394802475996e-06, "loss": 5.259991455078125, "step": 63500 }, { "epoch": 0.07674187309898706, "learning_rate": 9.783544189292222e-06, "loss": 5.244822998046875, "step": 63600 }, { "epoch": 0.07686253642146974, "learning_rate": 9.783140353824484e-06, "loss": 5.237239990234375, "step": 63700 }, { "epoch": 0.07698319974395243, "learning_rate": 9.782736518356746e-06, "loss": 5.25580078125, "step": 63800 }, { "epoch": 0.07710386306643512, "learning_rate": 9.782332682889008e-06, "loss": 5.237862548828125, "step": 63900 }, { "epoch": 0.0772245263889178, "learning_rate": 9.78192884742127e-06, "loss": 5.2344818115234375, "step": 64000 }, { "epoch": 0.07734518971140047, "learning_rate": 9.781525011953532e-06, "loss": 5.210677490234375, "step": 64100 }, { "epoch": 0.07746585303388316, "learning_rate": 9.781121176485792e-06, "loss": 5.2437255859375, "step": 64200 }, { "epoch": 0.07758651635636585, "learning_rate": 9.780717341018054e-06, "loss": 5.2295465087890625, "step": 64300 }, { "epoch": 0.07770717967884853, "learning_rate": 9.780313505550314e-06, "loss": 5.21697265625, "step": 64400 }, { "epoch": 0.07782784300133122, "learning_rate": 9.779909670082576e-06, "loss": 5.272308959960937, "step": 64500 }, { "epoch": 0.07794850632381391, "learning_rate": 9.779505834614838e-06, "loss": 5.207241821289062, "step": 64600 }, { "epoch": 0.07806916964629658, "learning_rate": 9.7791019991471e-06, "loss": 5.221626586914063, "step": 64700 }, { "epoch": 0.07818983296877927, "learning_rate": 9.778698163679362e-06, "loss": 5.228670654296875, "step": 64800 }, { "epoch": 0.07831049629126195, "learning_rate": 9.778294328211624e-06, "loss": 5.212542114257812, "step": 64900 }, { "epoch": 0.07843115961374464, "learning_rate": 9.777890492743886e-06, "loss": 5.1939501953125, "step": 65000 }, { "epoch": 0.07855182293622733, "learning_rate": 9.777486657276146e-06, "loss": 5.21961669921875, "step": 65100 }, { "epoch": 0.07867248625871001, "learning_rate": 9.777082821808408e-06, "loss": 5.210693969726562, "step": 65200 }, { "epoch": 0.07879314958119268, "learning_rate": 9.77667898634067e-06, "loss": 5.213010864257813, "step": 65300 }, { "epoch": 0.07891381290367537, "learning_rate": 9.77627515087293e-06, "loss": 5.203443603515625, "step": 65400 }, { "epoch": 0.07903447622615806, "learning_rate": 9.775871315405193e-06, "loss": 5.190748291015625, "step": 65500 }, { "epoch": 0.07915513954864074, "learning_rate": 9.775467479937455e-06, "loss": 5.1969976806640625, "step": 65600 }, { "epoch": 0.07927580287112343, "learning_rate": 9.775063644469717e-06, "loss": 5.207017822265625, "step": 65700 }, { "epoch": 0.07939646619360612, "learning_rate": 9.774659809001979e-06, "loss": 5.158209228515625, "step": 65800 }, { "epoch": 0.07951712951608879, "learning_rate": 9.774255973534239e-06, "loss": 5.209757080078125, "step": 65900 }, { "epoch": 0.07963779283857148, "learning_rate": 9.773852138066501e-06, "loss": 5.1891015625, "step": 66000 }, { "epoch": 0.07975845616105416, "learning_rate": 9.773448302598763e-06, "loss": 5.185696411132812, "step": 66100 }, { "epoch": 0.07987911948353685, "learning_rate": 9.773044467131025e-06, "loss": 5.192301635742187, "step": 66200 }, { "epoch": 0.07999978280601953, "learning_rate": 9.772640631663285e-06, "loss": 5.201160888671875, "step": 66300 }, { "epoch": 0.08012044612850222, "learning_rate": 9.772236796195547e-06, "loss": 5.201710815429688, "step": 66400 }, { "epoch": 0.0802411094509849, "learning_rate": 9.771832960727809e-06, "loss": 5.205989379882812, "step": 66500 }, { "epoch": 0.08036177277346758, "learning_rate": 9.771429125260071e-06, "loss": 5.183333129882812, "step": 66600 }, { "epoch": 0.08048243609595027, "learning_rate": 9.771025289792333e-06, "loss": 5.190036010742188, "step": 66700 }, { "epoch": 0.08060309941843295, "learning_rate": 9.770621454324593e-06, "loss": 5.178285522460937, "step": 66800 }, { "epoch": 0.08072376274091564, "learning_rate": 9.770217618856855e-06, "loss": 5.192055053710938, "step": 66900 }, { "epoch": 0.08084442606339833, "learning_rate": 9.769813783389117e-06, "loss": 5.202462768554687, "step": 67000 }, { "epoch": 0.080965089385881, "learning_rate": 9.76940994792138e-06, "loss": 5.140267333984375, "step": 67100 }, { "epoch": 0.08108575270836368, "learning_rate": 9.769006112453641e-06, "loss": 5.167439575195313, "step": 67200 }, { "epoch": 0.08120641603084637, "learning_rate": 9.768602276985902e-06, "loss": 5.2037286376953125, "step": 67300 }, { "epoch": 0.08132707935332906, "learning_rate": 9.768198441518164e-06, "loss": 5.164884643554688, "step": 67400 }, { "epoch": 0.08144774267581174, "learning_rate": 9.767794606050426e-06, "loss": 5.17246826171875, "step": 67500 }, { "epoch": 0.08156840599829443, "learning_rate": 9.767390770582686e-06, "loss": 5.15818603515625, "step": 67600 }, { "epoch": 0.0816890693207771, "learning_rate": 9.766986935114948e-06, "loss": 5.151226196289063, "step": 67700 }, { "epoch": 0.08180973264325979, "learning_rate": 9.76658309964721e-06, "loss": 5.15694091796875, "step": 67800 }, { "epoch": 0.08193039596574248, "learning_rate": 9.766179264179472e-06, "loss": 5.159863891601563, "step": 67900 }, { "epoch": 0.08205105928822516, "learning_rate": 9.765775428711734e-06, "loss": 5.170521240234375, "step": 68000 }, { "epoch": 0.08217172261070785, "learning_rate": 9.765371593243996e-06, "loss": 5.14292724609375, "step": 68100 }, { "epoch": 0.08229238593319053, "learning_rate": 9.764967757776258e-06, "loss": 5.156976928710938, "step": 68200 }, { "epoch": 0.0824130492556732, "learning_rate": 9.764563922308518e-06, "loss": 5.152540893554687, "step": 68300 }, { "epoch": 0.0825337125781559, "learning_rate": 9.76416008684078e-06, "loss": 5.16983154296875, "step": 68400 }, { "epoch": 0.08265437590063858, "learning_rate": 9.76375625137304e-06, "loss": 5.146065673828125, "step": 68500 }, { "epoch": 0.08277503922312127, "learning_rate": 9.763352415905302e-06, "loss": 5.119190673828125, "step": 68600 }, { "epoch": 0.08289570254560395, "learning_rate": 9.762948580437564e-06, "loss": 5.125591430664063, "step": 68700 }, { "epoch": 0.08301636586808664, "learning_rate": 9.762544744969826e-06, "loss": 5.17458740234375, "step": 68800 }, { "epoch": 0.08313702919056931, "learning_rate": 9.762140909502088e-06, "loss": 5.173352661132813, "step": 68900 }, { "epoch": 0.083257692513052, "learning_rate": 9.76173707403435e-06, "loss": 5.160217895507812, "step": 69000 }, { "epoch": 0.08337835583553468, "learning_rate": 9.761333238566612e-06, "loss": 5.165855102539062, "step": 69100 }, { "epoch": 0.08349901915801737, "learning_rate": 9.760929403098873e-06, "loss": 5.143590087890625, "step": 69200 }, { "epoch": 0.08361968248050006, "learning_rate": 9.760525567631134e-06, "loss": 5.137591552734375, "step": 69300 }, { "epoch": 0.08374034580298274, "learning_rate": 9.760121732163396e-06, "loss": 5.131078491210937, "step": 69400 }, { "epoch": 0.08386100912546542, "learning_rate": 9.759717896695657e-06, "loss": 5.101188659667969, "step": 69500 }, { "epoch": 0.0839816724479481, "learning_rate": 9.759314061227919e-06, "loss": 5.096486206054688, "step": 69600 }, { "epoch": 0.08410233577043079, "learning_rate": 9.75891022576018e-06, "loss": 5.105284118652344, "step": 69700 }, { "epoch": 0.08422299909291348, "learning_rate": 9.758506390292443e-06, "loss": 5.142880859375, "step": 69800 }, { "epoch": 0.08434366241539616, "learning_rate": 9.758102554824705e-06, "loss": 5.14042236328125, "step": 69900 }, { "epoch": 0.08446432573787885, "learning_rate": 9.757698719356965e-06, "loss": 5.126434326171875, "step": 70000 }, { "epoch": 0.08458498906036152, "learning_rate": 9.757294883889227e-06, "loss": 5.136691284179688, "step": 70100 }, { "epoch": 0.08470565238284421, "learning_rate": 9.756891048421489e-06, "loss": 5.160778198242188, "step": 70200 }, { "epoch": 0.0848263157053269, "learning_rate": 9.756487212953751e-06, "loss": 5.119503173828125, "step": 70300 }, { "epoch": 0.08494697902780958, "learning_rate": 9.756083377486011e-06, "loss": 5.148392333984375, "step": 70400 }, { "epoch": 0.08506764235029227, "learning_rate": 9.755679542018273e-06, "loss": 5.1181948852539065, "step": 70500 }, { "epoch": 0.08518830567277494, "learning_rate": 9.755275706550535e-06, "loss": 5.115385131835938, "step": 70600 }, { "epoch": 0.08530896899525763, "learning_rate": 9.754871871082797e-06, "loss": 5.105375366210938, "step": 70700 }, { "epoch": 0.08542963231774031, "learning_rate": 9.754468035615057e-06, "loss": 5.084530944824219, "step": 70800 }, { "epoch": 0.085550295640223, "learning_rate": 9.75406420014732e-06, "loss": 5.155774536132813, "step": 70900 }, { "epoch": 0.08567095896270568, "learning_rate": 9.753660364679581e-06, "loss": 5.116604614257812, "step": 71000 }, { "epoch": 0.08579162228518837, "learning_rate": 9.753256529211843e-06, "loss": 5.0745150756835935, "step": 71100 }, { "epoch": 0.08591228560767104, "learning_rate": 9.752852693744105e-06, "loss": 5.102546081542969, "step": 71200 }, { "epoch": 0.08603294893015373, "learning_rate": 9.752448858276367e-06, "loss": 5.091918334960938, "step": 71300 }, { "epoch": 0.08615361225263642, "learning_rate": 9.752045022808628e-06, "loss": 5.106720886230469, "step": 71400 }, { "epoch": 0.0862742755751191, "learning_rate": 9.75164118734089e-06, "loss": 5.116187438964844, "step": 71500 }, { "epoch": 0.08639493889760179, "learning_rate": 9.75123735187315e-06, "loss": 5.068934326171875, "step": 71600 }, { "epoch": 0.08651560222008448, "learning_rate": 9.750833516405412e-06, "loss": 5.076722717285156, "step": 71700 }, { "epoch": 0.08663626554256715, "learning_rate": 9.750429680937674e-06, "loss": 5.0759515380859375, "step": 71800 }, { "epoch": 0.08675692886504983, "learning_rate": 9.750025845469936e-06, "loss": 5.0674676513671875, "step": 71900 }, { "epoch": 0.08687759218753252, "learning_rate": 9.749622010002198e-06, "loss": 5.062613525390625, "step": 72000 }, { "epoch": 0.08699825551001521, "learning_rate": 9.74921817453446e-06, "loss": 5.085945739746093, "step": 72100 }, { "epoch": 0.0871189188324979, "learning_rate": 9.748814339066722e-06, "loss": 5.070661926269532, "step": 72200 }, { "epoch": 0.08723958215498058, "learning_rate": 9.748410503598982e-06, "loss": 5.0639105224609375, "step": 72300 }, { "epoch": 0.08736024547746325, "learning_rate": 9.748006668131244e-06, "loss": 5.0563897705078125, "step": 72400 }, { "epoch": 0.08748090879994594, "learning_rate": 9.747602832663506e-06, "loss": 5.087702941894531, "step": 72500 }, { "epoch": 0.08760157212242863, "learning_rate": 9.747198997195766e-06, "loss": 5.096186218261718, "step": 72600 }, { "epoch": 0.08772223544491131, "learning_rate": 9.746795161728028e-06, "loss": 5.075828857421875, "step": 72700 }, { "epoch": 0.087842898767394, "learning_rate": 9.74639132626029e-06, "loss": 5.065995788574218, "step": 72800 }, { "epoch": 0.08796356208987668, "learning_rate": 9.745987490792552e-06, "loss": 5.065982971191406, "step": 72900 }, { "epoch": 0.08808422541235936, "learning_rate": 9.745583655324814e-06, "loss": 5.0935498046875, "step": 73000 }, { "epoch": 0.08820488873484204, "learning_rate": 9.745179819857076e-06, "loss": 5.057830200195313, "step": 73100 }, { "epoch": 0.08832555205732473, "learning_rate": 9.744775984389338e-06, "loss": 5.07429443359375, "step": 73200 }, { "epoch": 0.08844621537980742, "learning_rate": 9.744372148921599e-06, "loss": 5.056070251464844, "step": 73300 }, { "epoch": 0.0885668787022901, "learning_rate": 9.74396831345386e-06, "loss": 5.0279473876953125, "step": 73400 }, { "epoch": 0.08868754202477279, "learning_rate": 9.74356447798612e-06, "loss": 5.027820739746094, "step": 73500 }, { "epoch": 0.08880820534725546, "learning_rate": 9.743160642518383e-06, "loss": 5.057041625976563, "step": 73600 }, { "epoch": 0.08892886866973815, "learning_rate": 9.742756807050645e-06, "loss": 5.04556640625, "step": 73700 }, { "epoch": 0.08904953199222083, "learning_rate": 9.742352971582907e-06, "loss": 5.0384423828125, "step": 73800 }, { "epoch": 0.08917019531470352, "learning_rate": 9.741949136115169e-06, "loss": 5.0619985961914065, "step": 73900 }, { "epoch": 0.08929085863718621, "learning_rate": 9.74154530064743e-06, "loss": 5.019390563964844, "step": 74000 }, { "epoch": 0.0894115219596689, "learning_rate": 9.741141465179691e-06, "loss": 5.043472900390625, "step": 74100 }, { "epoch": 0.08953218528215157, "learning_rate": 9.740737629711953e-06, "loss": 5.038667907714844, "step": 74200 }, { "epoch": 0.08965284860463425, "learning_rate": 9.740333794244215e-06, "loss": 5.0395071411132815, "step": 74300 }, { "epoch": 0.08977351192711694, "learning_rate": 9.739929958776477e-06, "loss": 5.0318997192382815, "step": 74400 }, { "epoch": 0.08989417524959963, "learning_rate": 9.739526123308737e-06, "loss": 5.012469177246094, "step": 74500 }, { "epoch": 0.09001483857208231, "learning_rate": 9.739122287841e-06, "loss": 5.035643005371094, "step": 74600 }, { "epoch": 0.090135501894565, "learning_rate": 9.738718452373261e-06, "loss": 5.027536010742187, "step": 74700 }, { "epoch": 0.09025616521704767, "learning_rate": 9.738314616905523e-06, "loss": 5.043776245117187, "step": 74800 }, { "epoch": 0.09037682853953036, "learning_rate": 9.737910781437783e-06, "loss": 5.01318115234375, "step": 74900 }, { "epoch": 0.09049749186201304, "learning_rate": 9.737506945970045e-06, "loss": 5.0130615234375, "step": 75000 }, { "epoch": 0.09061815518449573, "learning_rate": 9.737103110502307e-06, "loss": 5.016927490234375, "step": 75100 }, { "epoch": 0.09073881850697842, "learning_rate": 9.73669927503457e-06, "loss": 5.021900939941406, "step": 75200 }, { "epoch": 0.0908594818294611, "learning_rate": 9.736295439566831e-06, "loss": 5.039082946777344, "step": 75300 }, { "epoch": 0.09098014515194378, "learning_rate": 9.735891604099092e-06, "loss": 5.025408325195312, "step": 75400 }, { "epoch": 0.09110080847442646, "learning_rate": 9.735487768631354e-06, "loss": 4.999896545410156, "step": 75500 }, { "epoch": 0.09122147179690915, "learning_rate": 9.735083933163616e-06, "loss": 5.0109646606445315, "step": 75600 }, { "epoch": 0.09134213511939183, "learning_rate": 9.734680097695876e-06, "loss": 5.01272705078125, "step": 75700 }, { "epoch": 0.09146279844187452, "learning_rate": 9.734276262228138e-06, "loss": 4.993172302246093, "step": 75800 }, { "epoch": 0.09158346176435721, "learning_rate": 9.7338724267604e-06, "loss": 5.027442321777344, "step": 75900 }, { "epoch": 0.09170412508683988, "learning_rate": 9.733468591292662e-06, "loss": 5.016123046875, "step": 76000 }, { "epoch": 0.09182478840932257, "learning_rate": 9.733064755824924e-06, "loss": 5.013028869628906, "step": 76100 }, { "epoch": 0.09194545173180525, "learning_rate": 9.732660920357186e-06, "loss": 4.973556213378906, "step": 76200 }, { "epoch": 0.09206611505428794, "learning_rate": 9.732257084889448e-06, "loss": 5.0146942138671875, "step": 76300 }, { "epoch": 0.09218677837677063, "learning_rate": 9.731853249421708e-06, "loss": 4.992164611816406, "step": 76400 }, { "epoch": 0.09230744169925331, "learning_rate": 9.73144941395397e-06, "loss": 4.999853210449219, "step": 76500 }, { "epoch": 0.09242810502173598, "learning_rate": 9.73104557848623e-06, "loss": 4.986173706054688, "step": 76600 }, { "epoch": 0.09254876834421867, "learning_rate": 9.730641743018492e-06, "loss": 5.011735534667968, "step": 76700 }, { "epoch": 0.09266943166670136, "learning_rate": 9.730237907550754e-06, "loss": 5.000827941894531, "step": 76800 }, { "epoch": 0.09279009498918404, "learning_rate": 9.729834072083016e-06, "loss": 4.992151489257813, "step": 76900 }, { "epoch": 0.09291075831166673, "learning_rate": 9.729430236615278e-06, "loss": 4.989145812988281, "step": 77000 }, { "epoch": 0.0930314216341494, "learning_rate": 9.72902640114754e-06, "loss": 5.0138681030273435, "step": 77100 }, { "epoch": 0.09315208495663209, "learning_rate": 9.728622565679802e-06, "loss": 4.996145324707031, "step": 77200 }, { "epoch": 0.09327274827911478, "learning_rate": 9.728218730212063e-06, "loss": 4.9842221069335935, "step": 77300 }, { "epoch": 0.09339341160159746, "learning_rate": 9.727814894744325e-06, "loss": 4.972623291015625, "step": 77400 }, { "epoch": 0.09351407492408015, "learning_rate": 9.727411059276587e-06, "loss": 4.973984069824219, "step": 77500 }, { "epoch": 0.09363473824656283, "learning_rate": 9.727007223808847e-06, "loss": 4.984323120117187, "step": 77600 }, { "epoch": 0.09375540156904551, "learning_rate": 9.726603388341109e-06, "loss": 4.98031982421875, "step": 77700 }, { "epoch": 0.0938760648915282, "learning_rate": 9.72619955287337e-06, "loss": 4.959669799804687, "step": 77800 }, { "epoch": 0.09399672821401088, "learning_rate": 9.725795717405633e-06, "loss": 4.968257751464844, "step": 77900 }, { "epoch": 0.09411739153649357, "learning_rate": 9.725391881937895e-06, "loss": 4.966848754882813, "step": 78000 }, { "epoch": 0.09423805485897625, "learning_rate": 9.724988046470157e-06, "loss": 4.976156311035156, "step": 78100 }, { "epoch": 0.09435871818145894, "learning_rate": 9.724584211002417e-06, "loss": 4.9650640869140625, "step": 78200 }, { "epoch": 0.09447938150394161, "learning_rate": 9.724180375534679e-06, "loss": 5.000171203613281, "step": 78300 }, { "epoch": 0.0946000448264243, "learning_rate": 9.723776540066941e-06, "loss": 4.980813903808594, "step": 78400 }, { "epoch": 0.09472070814890698, "learning_rate": 9.723372704599201e-06, "loss": 4.964000854492188, "step": 78500 }, { "epoch": 0.09484137147138967, "learning_rate": 9.722968869131463e-06, "loss": 4.972636108398437, "step": 78600 }, { "epoch": 0.09496203479387236, "learning_rate": 9.722565033663725e-06, "loss": 4.949419555664062, "step": 78700 }, { "epoch": 0.09508269811635504, "learning_rate": 9.722161198195987e-06, "loss": 4.97333740234375, "step": 78800 }, { "epoch": 0.09520336143883772, "learning_rate": 9.72175736272825e-06, "loss": 4.967134704589844, "step": 78900 }, { "epoch": 0.0953240247613204, "learning_rate": 9.72135352726051e-06, "loss": 4.9573486328125, "step": 79000 }, { "epoch": 0.09544468808380309, "learning_rate": 9.720949691792772e-06, "loss": 4.946339111328125, "step": 79100 }, { "epoch": 0.09556535140628578, "learning_rate": 9.720545856325033e-06, "loss": 4.958375244140625, "step": 79200 }, { "epoch": 0.09568601472876846, "learning_rate": 9.720142020857295e-06, "loss": 4.967229919433594, "step": 79300 }, { "epoch": 0.09580667805125115, "learning_rate": 9.719738185389557e-06, "loss": 4.963417358398438, "step": 79400 }, { "epoch": 0.09592734137373382, "learning_rate": 9.719334349921818e-06, "loss": 4.937957153320313, "step": 79500 }, { "epoch": 0.09604800469621651, "learning_rate": 9.71893051445408e-06, "loss": 4.933610534667968, "step": 79600 }, { "epoch": 0.0961686680186992, "learning_rate": 9.718526678986342e-06, "loss": 4.95427978515625, "step": 79700 }, { "epoch": 0.09628933134118188, "learning_rate": 9.718122843518602e-06, "loss": 4.928057250976562, "step": 79800 }, { "epoch": 0.09640999466366457, "learning_rate": 9.717719008050864e-06, "loss": 4.925322875976563, "step": 79900 }, { "epoch": 0.09653065798614725, "learning_rate": 9.717315172583126e-06, "loss": 4.908415222167969, "step": 80000 }, { "epoch": 0.09665132130862993, "learning_rate": 9.716911337115388e-06, "loss": 4.9557421875, "step": 80100 }, { "epoch": 0.09677198463111261, "learning_rate": 9.71650750164765e-06, "loss": 4.940488891601563, "step": 80200 }, { "epoch": 0.0968926479535953, "learning_rate": 9.716103666179912e-06, "loss": 4.938771362304688, "step": 80300 }, { "epoch": 0.09701331127607798, "learning_rate": 9.715699830712174e-06, "loss": 4.942922973632813, "step": 80400 }, { "epoch": 0.09713397459856067, "learning_rate": 9.715295995244434e-06, "loss": 4.9132516479492185, "step": 80500 }, { "epoch": 0.09725463792104336, "learning_rate": 9.714892159776696e-06, "loss": 4.945633239746094, "step": 80600 }, { "epoch": 0.09737530124352603, "learning_rate": 9.714488324308956e-06, "loss": 4.918882141113281, "step": 80700 }, { "epoch": 0.09749596456600872, "learning_rate": 9.714084488841218e-06, "loss": 4.931737060546875, "step": 80800 }, { "epoch": 0.0976166278884914, "learning_rate": 9.71368065337348e-06, "loss": 4.926199951171875, "step": 80900 }, { "epoch": 0.09773729121097409, "learning_rate": 9.713276817905742e-06, "loss": 4.918571472167969, "step": 81000 }, { "epoch": 0.09785795453345678, "learning_rate": 9.712872982438004e-06, "loss": 4.9157711791992185, "step": 81100 }, { "epoch": 0.09797861785593946, "learning_rate": 9.712469146970266e-06, "loss": 4.908008422851562, "step": 81200 }, { "epoch": 0.09809928117842213, "learning_rate": 9.712065311502528e-06, "loss": 4.907994995117187, "step": 81300 }, { "epoch": 0.09821994450090482, "learning_rate": 9.711661476034789e-06, "loss": 4.899029846191406, "step": 81400 }, { "epoch": 0.09834060782338751, "learning_rate": 9.71125764056705e-06, "loss": 4.894893798828125, "step": 81500 }, { "epoch": 0.0984612711458702, "learning_rate": 9.710853805099313e-06, "loss": 4.921471252441406, "step": 81600 }, { "epoch": 0.09858193446835288, "learning_rate": 9.710449969631573e-06, "loss": 4.907397766113281, "step": 81700 }, { "epoch": 0.09870259779083557, "learning_rate": 9.710046134163835e-06, "loss": 4.908330383300782, "step": 81800 }, { "epoch": 0.09882326111331824, "learning_rate": 9.709642298696097e-06, "loss": 4.893409729003906, "step": 81900 }, { "epoch": 0.09894392443580093, "learning_rate": 9.709238463228359e-06, "loss": 4.886049194335937, "step": 82000 }, { "epoch": 0.09906458775828361, "learning_rate": 9.70883462776062e-06, "loss": 4.882464294433594, "step": 82100 }, { "epoch": 0.0991852510807663, "learning_rate": 9.708430792292883e-06, "loss": 4.888573303222656, "step": 82200 }, { "epoch": 0.09930591440324898, "learning_rate": 9.708026956825143e-06, "loss": 4.882120361328125, "step": 82300 }, { "epoch": 0.09942657772573167, "learning_rate": 9.707623121357405e-06, "loss": 4.903425903320312, "step": 82400 }, { "epoch": 0.09954724104821434, "learning_rate": 9.707219285889667e-06, "loss": 4.868942565917969, "step": 82500 }, { "epoch": 0.09966790437069703, "learning_rate": 9.706815450421927e-06, "loss": 4.895352783203125, "step": 82600 }, { "epoch": 0.09978856769317972, "learning_rate": 9.70641161495419e-06, "loss": 4.913453063964844, "step": 82700 }, { "epoch": 0.0999092310156624, "learning_rate": 9.706007779486451e-06, "loss": 4.8864443969726565, "step": 82800 }, { "epoch": 0.10002989433814509, "learning_rate": 9.705603944018713e-06, "loss": 4.874024353027344, "step": 82900 }, { "epoch": 0.10015055766062778, "learning_rate": 9.705200108550975e-06, "loss": 4.913255615234375, "step": 83000 }, { "epoch": 0.10027122098311045, "learning_rate": 9.704796273083236e-06, "loss": 4.861760864257812, "step": 83100 }, { "epoch": 0.10039188430559313, "learning_rate": 9.704392437615498e-06, "loss": 4.886510009765625, "step": 83200 }, { "epoch": 0.10051254762807582, "learning_rate": 9.70398860214776e-06, "loss": 4.860154418945313, "step": 83300 }, { "epoch": 0.10063321095055851, "learning_rate": 9.703584766680022e-06, "loss": 4.873463745117188, "step": 83400 }, { "epoch": 0.1007538742730412, "learning_rate": 9.703180931212283e-06, "loss": 4.890827331542969, "step": 83500 }, { "epoch": 0.10087453759552387, "learning_rate": 9.702777095744544e-06, "loss": 4.879186401367187, "step": 83600 }, { "epoch": 0.10099520091800655, "learning_rate": 9.702373260276806e-06, "loss": 4.876583251953125, "step": 83700 }, { "epoch": 0.10111586424048924, "learning_rate": 9.701969424809068e-06, "loss": 4.86263671875, "step": 83800 }, { "epoch": 0.10123652756297193, "learning_rate": 9.701565589341328e-06, "loss": 4.866602783203125, "step": 83900 }, { "epoch": 0.10135719088545461, "learning_rate": 9.70116175387359e-06, "loss": 4.905928344726562, "step": 84000 }, { "epoch": 0.1014778542079373, "learning_rate": 9.700757918405852e-06, "loss": 4.867268371582031, "step": 84100 }, { "epoch": 0.10159851753041997, "learning_rate": 9.700354082938114e-06, "loss": 4.870028381347656, "step": 84200 }, { "epoch": 0.10171918085290266, "learning_rate": 9.699950247470376e-06, "loss": 4.886224670410156, "step": 84300 }, { "epoch": 0.10183984417538534, "learning_rate": 9.699546412002638e-06, "loss": 4.862721862792969, "step": 84400 }, { "epoch": 0.10196050749786803, "learning_rate": 9.699142576534898e-06, "loss": 4.869748840332031, "step": 84500 }, { "epoch": 0.10208117082035072, "learning_rate": 9.69873874106716e-06, "loss": 4.842414245605469, "step": 84600 }, { "epoch": 0.1022018341428334, "learning_rate": 9.698334905599422e-06, "loss": 4.873136291503906, "step": 84700 }, { "epoch": 0.10232249746531608, "learning_rate": 9.697931070131682e-06, "loss": 4.825064697265625, "step": 84800 }, { "epoch": 0.10244316078779876, "learning_rate": 9.697527234663944e-06, "loss": 4.85788818359375, "step": 84900 }, { "epoch": 0.10256382411028145, "learning_rate": 9.697123399196206e-06, "loss": 4.894467468261719, "step": 85000 }, { "epoch": 0.10268448743276413, "learning_rate": 9.696719563728468e-06, "loss": 4.841428527832031, "step": 85100 }, { "epoch": 0.10280515075524682, "learning_rate": 9.69631572826073e-06, "loss": 4.850602722167968, "step": 85200 }, { "epoch": 0.10292581407772951, "learning_rate": 9.695911892792992e-06, "loss": 4.853901062011719, "step": 85300 }, { "epoch": 0.10304647740021218, "learning_rate": 9.695508057325254e-06, "loss": 4.848119201660157, "step": 85400 }, { "epoch": 0.10316714072269487, "learning_rate": 9.695104221857515e-06, "loss": 4.851161499023437, "step": 85500 }, { "epoch": 0.10328780404517755, "learning_rate": 9.694700386389777e-06, "loss": 4.804761962890625, "step": 85600 }, { "epoch": 0.10340846736766024, "learning_rate": 9.694296550922037e-06, "loss": 4.843150024414062, "step": 85700 }, { "epoch": 0.10352913069014293, "learning_rate": 9.693892715454299e-06, "loss": 4.845422973632813, "step": 85800 }, { "epoch": 0.10364979401262561, "learning_rate": 9.693488879986561e-06, "loss": 4.843452758789063, "step": 85900 }, { "epoch": 0.10377045733510828, "learning_rate": 9.693085044518823e-06, "loss": 4.856632385253906, "step": 86000 }, { "epoch": 0.10389112065759097, "learning_rate": 9.692681209051085e-06, "loss": 4.823756713867187, "step": 86100 }, { "epoch": 0.10401178398007366, "learning_rate": 9.692277373583347e-06, "loss": 4.834161987304688, "step": 86200 }, { "epoch": 0.10413244730255634, "learning_rate": 9.691873538115607e-06, "loss": 4.850711059570313, "step": 86300 }, { "epoch": 0.10425311062503903, "learning_rate": 9.691469702647869e-06, "loss": 4.828718566894532, "step": 86400 }, { "epoch": 0.10437377394752172, "learning_rate": 9.691065867180131e-06, "loss": 4.8225927734375, "step": 86500 }, { "epoch": 0.10449443727000439, "learning_rate": 9.690662031712393e-06, "loss": 4.8287655639648435, "step": 86600 }, { "epoch": 0.10461510059248708, "learning_rate": 9.690258196244653e-06, "loss": 4.809221801757812, "step": 86700 }, { "epoch": 0.10473576391496976, "learning_rate": 9.689854360776915e-06, "loss": 4.803803405761719, "step": 86800 }, { "epoch": 0.10485642723745245, "learning_rate": 9.689450525309177e-06, "loss": 4.820423889160156, "step": 86900 }, { "epoch": 0.10497709055993514, "learning_rate": 9.68904668984144e-06, "loss": 4.808703002929687, "step": 87000 }, { "epoch": 0.10509775388241782, "learning_rate": 9.6886428543737e-06, "loss": 4.8158642578125, "step": 87100 }, { "epoch": 0.1052184172049005, "learning_rate": 9.688239018905962e-06, "loss": 4.816473388671875, "step": 87200 }, { "epoch": 0.10533908052738318, "learning_rate": 9.687835183438224e-06, "loss": 4.785604858398438, "step": 87300 }, { "epoch": 0.10545974384986587, "learning_rate": 9.687431347970486e-06, "loss": 4.79506103515625, "step": 87400 }, { "epoch": 0.10558040717234855, "learning_rate": 9.687027512502748e-06, "loss": 4.809523315429687, "step": 87500 }, { "epoch": 0.10570107049483124, "learning_rate": 9.686623677035008e-06, "loss": 4.778346557617187, "step": 87600 }, { "epoch": 0.10582173381731393, "learning_rate": 9.68621984156727e-06, "loss": 4.822114562988281, "step": 87700 }, { "epoch": 0.1059423971397966, "learning_rate": 9.685816006099532e-06, "loss": 4.785655212402344, "step": 87800 }, { "epoch": 0.10606306046227928, "learning_rate": 9.685412170631794e-06, "loss": 4.827339172363281, "step": 87900 }, { "epoch": 0.10618372378476197, "learning_rate": 9.685008335164054e-06, "loss": 4.80163330078125, "step": 88000 }, { "epoch": 0.10630438710724466, "learning_rate": 9.684604499696316e-06, "loss": 4.787745666503906, "step": 88100 }, { "epoch": 0.10642505042972734, "learning_rate": 9.684200664228578e-06, "loss": 4.800241088867187, "step": 88200 }, { "epoch": 0.10654571375221003, "learning_rate": 9.68379682876084e-06, "loss": 4.812076721191406, "step": 88300 }, { "epoch": 0.1066663770746927, "learning_rate": 9.683392993293102e-06, "loss": 4.784380493164062, "step": 88400 }, { "epoch": 0.10678704039717539, "learning_rate": 9.682989157825364e-06, "loss": 4.791062316894531, "step": 88500 }, { "epoch": 0.10690770371965808, "learning_rate": 9.682585322357624e-06, "loss": 4.775936279296875, "step": 88600 }, { "epoch": 0.10702836704214076, "learning_rate": 9.682181486889886e-06, "loss": 4.784500732421875, "step": 88700 }, { "epoch": 0.10714903036462345, "learning_rate": 9.681777651422147e-06, "loss": 4.803079833984375, "step": 88800 }, { "epoch": 0.10726969368710614, "learning_rate": 9.681373815954409e-06, "loss": 4.794912719726563, "step": 88900 }, { "epoch": 0.10739035700958881, "learning_rate": 9.68096998048667e-06, "loss": 4.7925244140625, "step": 89000 }, { "epoch": 0.1075110203320715, "learning_rate": 9.680566145018932e-06, "loss": 4.777199401855468, "step": 89100 }, { "epoch": 0.10763168365455418, "learning_rate": 9.680162309551194e-06, "loss": 4.778366394042969, "step": 89200 }, { "epoch": 0.10775234697703687, "learning_rate": 9.679758474083456e-06, "loss": 4.776029663085938, "step": 89300 }, { "epoch": 0.10787301029951955, "learning_rate": 9.679354638615718e-06, "loss": 4.753299865722656, "step": 89400 }, { "epoch": 0.10799367362200224, "learning_rate": 9.678950803147979e-06, "loss": 4.788411254882813, "step": 89500 }, { "epoch": 0.10811433694448491, "learning_rate": 9.67854696768024e-06, "loss": 4.8108148193359375, "step": 89600 }, { "epoch": 0.1082350002669676, "learning_rate": 9.678143132212503e-06, "loss": 4.770762634277344, "step": 89700 }, { "epoch": 0.10835566358945029, "learning_rate": 9.677739296744763e-06, "loss": 4.769071350097656, "step": 89800 }, { "epoch": 0.10847632691193297, "learning_rate": 9.677335461277025e-06, "loss": 4.78750244140625, "step": 89900 }, { "epoch": 0.10859699023441566, "learning_rate": 9.676931625809287e-06, "loss": 4.77056640625, "step": 90000 }, { "epoch": 0.10871765355689833, "learning_rate": 9.676527790341549e-06, "loss": 4.7862374877929685, "step": 90100 }, { "epoch": 0.10883831687938102, "learning_rate": 9.676123954873811e-06, "loss": 4.737091674804687, "step": 90200 }, { "epoch": 0.1089589802018637, "learning_rate": 9.675720119406073e-06, "loss": 4.722448425292969, "step": 90300 }, { "epoch": 0.10907964352434639, "learning_rate": 9.675316283938333e-06, "loss": 4.7578128051757815, "step": 90400 }, { "epoch": 0.10920030684682908, "learning_rate": 9.674912448470595e-06, "loss": 4.75033447265625, "step": 90500 }, { "epoch": 0.10932097016931176, "learning_rate": 9.674508613002857e-06, "loss": 4.728914794921875, "step": 90600 }, { "epoch": 0.10944163349179444, "learning_rate": 9.674104777535117e-06, "loss": 4.737483520507812, "step": 90700 }, { "epoch": 0.10956229681427712, "learning_rate": 9.67370094206738e-06, "loss": 4.750766906738281, "step": 90800 }, { "epoch": 0.10968296013675981, "learning_rate": 9.673297106599641e-06, "loss": 4.759916687011719, "step": 90900 }, { "epoch": 0.1098036234592425, "learning_rate": 9.672893271131903e-06, "loss": 4.754288635253906, "step": 91000 }, { "epoch": 0.10992428678172518, "learning_rate": 9.672489435664165e-06, "loss": 4.7359814453125, "step": 91100 }, { "epoch": 0.11004495010420787, "learning_rate": 9.672085600196426e-06, "loss": 4.7439111328125, "step": 91200 }, { "epoch": 0.11016561342669054, "learning_rate": 9.671681764728688e-06, "loss": 4.73325927734375, "step": 91300 }, { "epoch": 0.11028627674917323, "learning_rate": 9.67127792926095e-06, "loss": 4.771037902832031, "step": 91400 }, { "epoch": 0.11040694007165591, "learning_rate": 9.670874093793212e-06, "loss": 4.7424014282226565, "step": 91500 }, { "epoch": 0.1105276033941386, "learning_rate": 9.670470258325474e-06, "loss": 4.757178955078125, "step": 91600 }, { "epoch": 0.11064826671662129, "learning_rate": 9.670066422857734e-06, "loss": 4.728418884277343, "step": 91700 }, { "epoch": 0.11076893003910397, "learning_rate": 9.669662587389996e-06, "loss": 4.741020202636719, "step": 91800 }, { "epoch": 0.11088959336158664, "learning_rate": 9.669258751922258e-06, "loss": 4.755391845703125, "step": 91900 }, { "epoch": 0.11101025668406933, "learning_rate": 9.668854916454518e-06, "loss": 4.733238830566406, "step": 92000 }, { "epoch": 0.11113092000655202, "learning_rate": 9.66845108098678e-06, "loss": 4.754249877929688, "step": 92100 }, { "epoch": 0.1112515833290347, "learning_rate": 9.668047245519042e-06, "loss": 4.741124877929687, "step": 92200 }, { "epoch": 0.11137224665151739, "learning_rate": 9.667643410051304e-06, "loss": 4.741844787597656, "step": 92300 }, { "epoch": 0.11149290997400008, "learning_rate": 9.667239574583566e-06, "loss": 4.70602294921875, "step": 92400 }, { "epoch": 0.11161357329648275, "learning_rate": 9.666835739115828e-06, "loss": 4.732904357910156, "step": 92500 }, { "epoch": 0.11173423661896544, "learning_rate": 9.666431903648088e-06, "loss": 4.720787353515625, "step": 92600 }, { "epoch": 0.11185489994144812, "learning_rate": 9.66602806818035e-06, "loss": 4.731036987304687, "step": 92700 }, { "epoch": 0.11197556326393081, "learning_rate": 9.665624232712612e-06, "loss": 4.728709716796875, "step": 92800 }, { "epoch": 0.1120962265864135, "learning_rate": 9.665220397244873e-06, "loss": 4.719226989746094, "step": 92900 }, { "epoch": 0.11221688990889618, "learning_rate": 9.664816561777135e-06, "loss": 4.7157666015625, "step": 93000 }, { "epoch": 0.11233755323137885, "learning_rate": 9.664412726309397e-06, "loss": 4.7111337280273435, "step": 93100 }, { "epoch": 0.11245821655386154, "learning_rate": 9.664008890841659e-06, "loss": 4.713517150878906, "step": 93200 }, { "epoch": 0.11257887987634423, "learning_rate": 9.66360505537392e-06, "loss": 4.706962585449219, "step": 93300 }, { "epoch": 0.11269954319882691, "learning_rate": 9.663201219906182e-06, "loss": 4.721396484375, "step": 93400 }, { "epoch": 0.1128202065213096, "learning_rate": 9.662797384438444e-06, "loss": 4.731193237304687, "step": 93500 }, { "epoch": 0.11294086984379229, "learning_rate": 9.662393548970705e-06, "loss": 4.722343139648437, "step": 93600 }, { "epoch": 0.11306153316627496, "learning_rate": 9.661989713502967e-06, "loss": 4.701794128417969, "step": 93700 }, { "epoch": 0.11318219648875764, "learning_rate": 9.661585878035227e-06, "loss": 4.6912774658203125, "step": 93800 }, { "epoch": 0.11330285981124033, "learning_rate": 9.661182042567489e-06, "loss": 4.714636535644531, "step": 93900 }, { "epoch": 0.11342352313372302, "learning_rate": 9.660778207099751e-06, "loss": 4.71160888671875, "step": 94000 }, { "epoch": 0.1135441864562057, "learning_rate": 9.660374371632013e-06, "loss": 4.710344848632812, "step": 94100 }, { "epoch": 0.11366484977868839, "learning_rate": 9.659970536164275e-06, "loss": 4.702177429199219, "step": 94200 }, { "epoch": 0.11378551310117106, "learning_rate": 9.659566700696537e-06, "loss": 4.699169006347656, "step": 94300 }, { "epoch": 0.11390617642365375, "learning_rate": 9.659162865228799e-06, "loss": 4.69635986328125, "step": 94400 }, { "epoch": 0.11402683974613644, "learning_rate": 9.65875902976106e-06, "loss": 4.693934936523437, "step": 94500 }, { "epoch": 0.11414750306861912, "learning_rate": 9.658355194293321e-06, "loss": 4.700142211914063, "step": 94600 }, { "epoch": 0.11426816639110181, "learning_rate": 9.657951358825583e-06, "loss": 4.660438537597656, "step": 94700 }, { "epoch": 0.1143888297135845, "learning_rate": 9.657547523357843e-06, "loss": 4.706804809570312, "step": 94800 }, { "epoch": 0.11450949303606717, "learning_rate": 9.657143687890105e-06, "loss": 4.686411437988281, "step": 94900 }, { "epoch": 0.11463015635854985, "learning_rate": 9.656739852422367e-06, "loss": 4.704990234375, "step": 95000 }, { "epoch": 0.11475081968103254, "learning_rate": 9.65633601695463e-06, "loss": 4.678945617675781, "step": 95100 }, { "epoch": 0.11487148300351523, "learning_rate": 9.655932181486891e-06, "loss": 4.6987918090820315, "step": 95200 }, { "epoch": 0.11499214632599791, "learning_rate": 9.655528346019152e-06, "loss": 4.716113586425781, "step": 95300 }, { "epoch": 0.1151128096484806, "learning_rate": 9.655124510551414e-06, "loss": 4.678018188476562, "step": 95400 }, { "epoch": 0.11523347297096327, "learning_rate": 9.654720675083676e-06, "loss": 4.681973266601562, "step": 95500 }, { "epoch": 0.11535413629344596, "learning_rate": 9.654316839615938e-06, "loss": 4.708043212890625, "step": 95600 }, { "epoch": 0.11547479961592864, "learning_rate": 9.6539130041482e-06, "loss": 4.685238342285157, "step": 95700 }, { "epoch": 0.11559546293841133, "learning_rate": 9.65350916868046e-06, "loss": 4.6925115966796875, "step": 95800 }, { "epoch": 0.11571612626089402, "learning_rate": 9.653105333212722e-06, "loss": 4.63882568359375, "step": 95900 }, { "epoch": 0.1158367895833767, "learning_rate": 9.652701497744984e-06, "loss": 4.678868103027344, "step": 96000 }, { "epoch": 0.11595745290585938, "learning_rate": 9.652297662277244e-06, "loss": 4.679849243164062, "step": 96100 }, { "epoch": 0.11607811622834206, "learning_rate": 9.651893826809506e-06, "loss": 4.697474060058593, "step": 96200 }, { "epoch": 0.11619877955082475, "learning_rate": 9.651489991341768e-06, "loss": 4.663589782714844, "step": 96300 }, { "epoch": 0.11631944287330744, "learning_rate": 9.65108615587403e-06, "loss": 4.677477416992187, "step": 96400 }, { "epoch": 0.11644010619579012, "learning_rate": 9.650682320406292e-06, "loss": 4.647117309570312, "step": 96500 }, { "epoch": 0.1165607695182728, "learning_rate": 9.650278484938554e-06, "loss": 4.643777465820312, "step": 96600 }, { "epoch": 0.11668143284075548, "learning_rate": 9.649874649470814e-06, "loss": 4.6652224731445315, "step": 96700 }, { "epoch": 0.11680209616323817, "learning_rate": 9.649470814003076e-06, "loss": 4.657362060546875, "step": 96800 }, { "epoch": 0.11692275948572085, "learning_rate": 9.649066978535338e-06, "loss": 4.674615173339844, "step": 96900 }, { "epoch": 0.11704342280820354, "learning_rate": 9.648663143067599e-06, "loss": 4.679769592285156, "step": 97000 }, { "epoch": 0.11716408613068623, "learning_rate": 9.64825930759986e-06, "loss": 4.653609619140625, "step": 97100 }, { "epoch": 0.1172847494531689, "learning_rate": 9.647855472132123e-06, "loss": 4.664938354492188, "step": 97200 }, { "epoch": 0.11740541277565159, "learning_rate": 9.647451636664385e-06, "loss": 4.677825927734375, "step": 97300 }, { "epoch": 0.11752607609813427, "learning_rate": 9.647047801196647e-06, "loss": 4.654386596679688, "step": 97400 }, { "epoch": 0.11764673942061696, "learning_rate": 9.646643965728909e-06, "loss": 4.682733154296875, "step": 97500 }, { "epoch": 0.11776740274309964, "learning_rate": 9.64624013026117e-06, "loss": 4.636017761230469, "step": 97600 }, { "epoch": 0.11788806606558233, "learning_rate": 9.64583629479343e-06, "loss": 4.643951416015625, "step": 97700 }, { "epoch": 0.118008729388065, "learning_rate": 9.645432459325693e-06, "loss": 4.623200378417969, "step": 97800 }, { "epoch": 0.11812939271054769, "learning_rate": 9.645028623857953e-06, "loss": 4.645050964355469, "step": 97900 }, { "epoch": 0.11825005603303038, "learning_rate": 9.644624788390215e-06, "loss": 4.64683349609375, "step": 98000 }, { "epoch": 0.11837071935551306, "learning_rate": 9.644220952922477e-06, "loss": 4.662095031738281, "step": 98100 }, { "epoch": 0.11849138267799575, "learning_rate": 9.643817117454739e-06, "loss": 4.666967468261719, "step": 98200 }, { "epoch": 0.11861204600047844, "learning_rate": 9.643413281987001e-06, "loss": 4.644697875976562, "step": 98300 }, { "epoch": 0.11873270932296111, "learning_rate": 9.643009446519263e-06, "loss": 4.6283261108398435, "step": 98400 }, { "epoch": 0.1188533726454438, "learning_rate": 9.642605611051525e-06, "loss": 4.625231628417969, "step": 98500 }, { "epoch": 0.11897403596792648, "learning_rate": 9.642201775583785e-06, "loss": 4.631438598632813, "step": 98600 }, { "epoch": 0.11909469929040917, "learning_rate": 9.641797940116047e-06, "loss": 4.632507934570312, "step": 98700 }, { "epoch": 0.11921536261289185, "learning_rate": 9.64139410464831e-06, "loss": 4.62410400390625, "step": 98800 }, { "epoch": 0.11933602593537454, "learning_rate": 9.64099026918057e-06, "loss": 4.644050598144531, "step": 98900 }, { "epoch": 0.11945668925785721, "learning_rate": 9.640586433712831e-06, "loss": 4.642160034179687, "step": 99000 }, { "epoch": 0.1195773525803399, "learning_rate": 9.640182598245093e-06, "loss": 4.639566345214844, "step": 99100 }, { "epoch": 0.11969801590282259, "learning_rate": 9.639778762777355e-06, "loss": 4.6316439819335935, "step": 99200 }, { "epoch": 0.11981867922530527, "learning_rate": 9.639374927309617e-06, "loss": 4.651192321777343, "step": 99300 }, { "epoch": 0.11993934254778796, "learning_rate": 9.638971091841878e-06, "loss": 4.610224609375, "step": 99400 }, { "epoch": 0.12006000587027064, "learning_rate": 9.63856725637414e-06, "loss": 4.625392761230469, "step": 99500 }, { "epoch": 0.12018066919275332, "learning_rate": 9.638163420906402e-06, "loss": 4.602829895019531, "step": 99600 }, { "epoch": 0.120301332515236, "learning_rate": 9.637759585438664e-06, "loss": 4.594230041503907, "step": 99700 }, { "epoch": 0.12042199583771869, "learning_rate": 9.637355749970924e-06, "loss": 4.585758361816406, "step": 99800 }, { "epoch": 0.12054265916020138, "learning_rate": 9.636951914503186e-06, "loss": 4.6115719604492185, "step": 99900 }, { "epoch": 0.12066332248268406, "learning_rate": 9.636548079035448e-06, "loss": 4.627333068847657, "step": 100000 }, { "epoch": 0.12078398580516675, "learning_rate": 9.63614424356771e-06, "loss": 4.614095153808594, "step": 100100 }, { "epoch": 0.12090464912764942, "learning_rate": 9.63574040809997e-06, "loss": 4.606982421875, "step": 100200 }, { "epoch": 0.12102531245013211, "learning_rate": 9.635336572632232e-06, "loss": 4.619635009765625, "step": 100300 }, { "epoch": 0.1211459757726148, "learning_rate": 9.634932737164494e-06, "loss": 4.618819580078125, "step": 100400 }, { "epoch": 0.12126663909509748, "learning_rate": 9.634528901696756e-06, "loss": 4.615993041992187, "step": 100500 }, { "epoch": 0.12138730241758017, "learning_rate": 9.634125066229018e-06, "loss": 4.600937194824219, "step": 100600 }, { "epoch": 0.12150796574006285, "learning_rate": 9.63372123076128e-06, "loss": 4.617173156738281, "step": 100700 }, { "epoch": 0.12162862906254553, "learning_rate": 9.63331739529354e-06, "loss": 4.597644348144531, "step": 100800 }, { "epoch": 0.12174929238502821, "learning_rate": 9.632913559825802e-06, "loss": 4.587833862304688, "step": 100900 }, { "epoch": 0.1218699557075109, "learning_rate": 9.632509724358063e-06, "loss": 4.642342529296875, "step": 101000 }, { "epoch": 0.12199061902999359, "learning_rate": 9.632105888890325e-06, "loss": 4.589096984863281, "step": 101100 }, { "epoch": 0.12211128235247627, "learning_rate": 9.631702053422587e-06, "loss": 4.626454467773438, "step": 101200 }, { "epoch": 0.12223194567495896, "learning_rate": 9.631298217954849e-06, "loss": 4.596427917480469, "step": 101300 }, { "epoch": 0.12235260899744163, "learning_rate": 9.63089438248711e-06, "loss": 4.597868347167969, "step": 101400 }, { "epoch": 0.12247327231992432, "learning_rate": 9.630490547019373e-06, "loss": 4.6363897705078125, "step": 101500 }, { "epoch": 0.122593935642407, "learning_rate": 9.630086711551635e-06, "loss": 4.584929809570313, "step": 101600 }, { "epoch": 0.12271459896488969, "learning_rate": 9.629682876083895e-06, "loss": 4.581707153320313, "step": 101700 }, { "epoch": 0.12283526228737238, "learning_rate": 9.629279040616157e-06, "loss": 4.606552734375, "step": 101800 }, { "epoch": 0.12295592560985506, "learning_rate": 9.628875205148419e-06, "loss": 4.596510009765625, "step": 101900 }, { "epoch": 0.12307658893233774, "learning_rate": 9.628471369680679e-06, "loss": 4.600588684082031, "step": 102000 }, { "epoch": 0.12319725225482042, "learning_rate": 9.628067534212941e-06, "loss": 4.584922790527344, "step": 102100 }, { "epoch": 0.12331791557730311, "learning_rate": 9.627663698745203e-06, "loss": 4.573536071777344, "step": 102200 }, { "epoch": 0.1234385788997858, "learning_rate": 9.627259863277465e-06, "loss": 4.591594543457031, "step": 102300 }, { "epoch": 0.12355924222226848, "learning_rate": 9.626856027809727e-06, "loss": 4.5871514892578125, "step": 102400 }, { "epoch": 0.12367990554475117, "learning_rate": 9.626452192341989e-06, "loss": 4.576618957519531, "step": 102500 }, { "epoch": 0.12380056886723384, "learning_rate": 9.62604835687425e-06, "loss": 4.589746704101563, "step": 102600 }, { "epoch": 0.12392123218971653, "learning_rate": 9.625644521406511e-06, "loss": 4.559208374023438, "step": 102700 }, { "epoch": 0.12404189551219921, "learning_rate": 9.625240685938773e-06, "loss": 4.580867919921875, "step": 102800 }, { "epoch": 0.1241625588346819, "learning_rate": 9.624836850471034e-06, "loss": 4.589192199707031, "step": 102900 }, { "epoch": 0.12428322215716459, "learning_rate": 9.624433015003296e-06, "loss": 4.562888793945312, "step": 103000 }, { "epoch": 0.12440388547964726, "learning_rate": 9.624029179535558e-06, "loss": 4.571641540527343, "step": 103100 }, { "epoch": 0.12452454880212994, "learning_rate": 9.62362534406782e-06, "loss": 4.557775573730469, "step": 103200 }, { "epoch": 0.12464521212461263, "learning_rate": 9.623221508600081e-06, "loss": 4.56920654296875, "step": 103300 }, { "epoch": 0.12476587544709532, "learning_rate": 9.622817673132343e-06, "loss": 4.5724484252929685, "step": 103400 }, { "epoch": 0.124886538769578, "learning_rate": 9.622413837664604e-06, "loss": 4.571834716796875, "step": 103500 }, { "epoch": 0.12500720209206068, "learning_rate": 9.622010002196866e-06, "loss": 4.554250793457031, "step": 103600 }, { "epoch": 0.12512786541454338, "learning_rate": 9.621606166729128e-06, "loss": 4.5702078247070315, "step": 103700 }, { "epoch": 0.12524852873702605, "learning_rate": 9.62120233126139e-06, "loss": 4.584476013183593, "step": 103800 }, { "epoch": 0.12536919205950875, "learning_rate": 9.62079849579365e-06, "loss": 4.565232849121093, "step": 103900 }, { "epoch": 0.12548985538199142, "learning_rate": 9.620394660325912e-06, "loss": 4.563414001464844, "step": 104000 }, { "epoch": 0.1256105187044741, "learning_rate": 9.619990824858174e-06, "loss": 4.559494323730469, "step": 104100 }, { "epoch": 0.1257311820269568, "learning_rate": 9.619586989390436e-06, "loss": 4.534017944335938, "step": 104200 }, { "epoch": 0.12585184534943947, "learning_rate": 9.619183153922696e-06, "loss": 4.578702392578125, "step": 104300 }, { "epoch": 0.12597250867192217, "learning_rate": 9.618779318454958e-06, "loss": 4.575626831054688, "step": 104400 }, { "epoch": 0.12609317199440484, "learning_rate": 9.61837548298722e-06, "loss": 4.5360650634765625, "step": 104500 }, { "epoch": 0.1262138353168875, "learning_rate": 9.617971647519482e-06, "loss": 4.535835266113281, "step": 104600 }, { "epoch": 0.1263344986393702, "learning_rate": 9.617567812051744e-06, "loss": 4.560310363769531, "step": 104700 }, { "epoch": 0.12645516196185289, "learning_rate": 9.617163976584004e-06, "loss": 4.557838439941406, "step": 104800 }, { "epoch": 0.12657582528433559, "learning_rate": 9.616760141116266e-06, "loss": 4.553232727050781, "step": 104900 }, { "epoch": 0.12669648860681826, "learning_rate": 9.616356305648528e-06, "loss": 4.531650085449218, "step": 105000 }, { "epoch": 0.12681715192930096, "learning_rate": 9.615952470180789e-06, "loss": 4.5613400268554685, "step": 105100 }, { "epoch": 0.12693781525178363, "learning_rate": 9.61554863471305e-06, "loss": 4.540119018554687, "step": 105200 }, { "epoch": 0.1270584785742663, "learning_rate": 9.615144799245313e-06, "loss": 4.541902465820312, "step": 105300 }, { "epoch": 0.127179141896749, "learning_rate": 9.614740963777575e-06, "loss": 4.54156005859375, "step": 105400 }, { "epoch": 0.12729980521923168, "learning_rate": 9.614337128309837e-06, "loss": 4.518712158203125, "step": 105500 }, { "epoch": 0.12742046854171438, "learning_rate": 9.613933292842099e-06, "loss": 4.5665869140625, "step": 105600 }, { "epoch": 0.12754113186419705, "learning_rate": 9.61352945737436e-06, "loss": 4.523365783691406, "step": 105700 }, { "epoch": 0.12766179518667972, "learning_rate": 9.613125621906621e-06, "loss": 4.531428833007812, "step": 105800 }, { "epoch": 0.12778245850916242, "learning_rate": 9.612721786438883e-06, "loss": 4.523320007324219, "step": 105900 }, { "epoch": 0.1279031218316451, "learning_rate": 9.612317950971143e-06, "loss": 4.526325073242187, "step": 106000 }, { "epoch": 0.1280237851541278, "learning_rate": 9.611914115503405e-06, "loss": 4.555354919433594, "step": 106100 }, { "epoch": 0.12814444847661047, "learning_rate": 9.611510280035667e-06, "loss": 4.529878845214844, "step": 106200 }, { "epoch": 0.12826511179909317, "learning_rate": 9.611106444567929e-06, "loss": 4.527799987792969, "step": 106300 }, { "epoch": 0.12838577512157584, "learning_rate": 9.610702609100191e-06, "loss": 4.535277099609375, "step": 106400 }, { "epoch": 0.1285064384440585, "learning_rate": 9.610298773632453e-06, "loss": 4.510034790039063, "step": 106500 }, { "epoch": 0.1286271017665412, "learning_rate": 9.609894938164715e-06, "loss": 4.517027587890625, "step": 106600 }, { "epoch": 0.12874776508902389, "learning_rate": 9.609491102696975e-06, "loss": 4.513541259765625, "step": 106700 }, { "epoch": 0.12886842841150659, "learning_rate": 9.609087267229237e-06, "loss": 4.532938537597656, "step": 106800 }, { "epoch": 0.12898909173398926, "learning_rate": 9.6086834317615e-06, "loss": 4.523807067871093, "step": 106900 }, { "epoch": 0.12910975505647193, "learning_rate": 9.60827959629376e-06, "loss": 4.536944274902344, "step": 107000 }, { "epoch": 0.12923041837895463, "learning_rate": 9.607875760826022e-06, "loss": 4.547731323242187, "step": 107100 }, { "epoch": 0.1293510817014373, "learning_rate": 9.607471925358284e-06, "loss": 4.500527954101562, "step": 107200 }, { "epoch": 0.12947174502392, "learning_rate": 9.607068089890546e-06, "loss": 4.509184875488281, "step": 107300 }, { "epoch": 0.12959240834640268, "learning_rate": 9.606664254422808e-06, "loss": 4.506120300292968, "step": 107400 }, { "epoch": 0.12971307166888538, "learning_rate": 9.606260418955068e-06, "loss": 4.5154855346679685, "step": 107500 }, { "epoch": 0.12983373499136805, "learning_rate": 9.60585658348733e-06, "loss": 4.532999267578125, "step": 107600 }, { "epoch": 0.12995439831385072, "learning_rate": 9.605452748019592e-06, "loss": 4.532502136230469, "step": 107700 }, { "epoch": 0.13007506163633342, "learning_rate": 9.605048912551854e-06, "loss": 4.498631591796875, "step": 107800 }, { "epoch": 0.1301957249588161, "learning_rate": 9.604645077084114e-06, "loss": 4.540263977050781, "step": 107900 }, { "epoch": 0.1303163882812988, "learning_rate": 9.604241241616376e-06, "loss": 4.516459045410156, "step": 108000 }, { "epoch": 0.13043705160378147, "learning_rate": 9.603837406148638e-06, "loss": 4.507551574707032, "step": 108100 }, { "epoch": 0.13055771492626414, "learning_rate": 9.6034335706809e-06, "loss": 4.481290588378906, "step": 108200 }, { "epoch": 0.13067837824874684, "learning_rate": 9.603029735213162e-06, "loss": 4.516636047363281, "step": 108300 }, { "epoch": 0.1307990415712295, "learning_rate": 9.602625899745422e-06, "loss": 4.498446655273438, "step": 108400 }, { "epoch": 0.1309197048937122, "learning_rate": 9.602222064277684e-06, "loss": 4.496758117675781, "step": 108500 }, { "epoch": 0.13104036821619489, "learning_rate": 9.601818228809946e-06, "loss": 4.514501037597657, "step": 108600 }, { "epoch": 0.13116103153867759, "learning_rate": 9.601414393342208e-06, "loss": 4.525939331054688, "step": 108700 }, { "epoch": 0.13128169486116026, "learning_rate": 9.60101055787447e-06, "loss": 4.491955261230469, "step": 108800 }, { "epoch": 0.13140235818364293, "learning_rate": 9.60060672240673e-06, "loss": 4.504250183105468, "step": 108900 }, { "epoch": 0.13152302150612563, "learning_rate": 9.600202886938992e-06, "loss": 4.5038973999023435, "step": 109000 }, { "epoch": 0.1316436848286083, "learning_rate": 9.599799051471254e-06, "loss": 4.478483581542969, "step": 109100 }, { "epoch": 0.131764348151091, "learning_rate": 9.599395216003515e-06, "loss": 4.497598876953125, "step": 109200 }, { "epoch": 0.13188501147357368, "learning_rate": 9.598991380535777e-06, "loss": 4.518112487792969, "step": 109300 }, { "epoch": 0.13200567479605635, "learning_rate": 9.598587545068039e-06, "loss": 4.495831298828125, "step": 109400 }, { "epoch": 0.13212633811853905, "learning_rate": 9.5981837096003e-06, "loss": 4.465983581542969, "step": 109500 }, { "epoch": 0.13224700144102172, "learning_rate": 9.597779874132563e-06, "loss": 4.517566528320312, "step": 109600 }, { "epoch": 0.13236766476350442, "learning_rate": 9.597376038664825e-06, "loss": 4.489622192382813, "step": 109700 }, { "epoch": 0.1324883280859871, "learning_rate": 9.596972203197087e-06, "loss": 4.4957275390625, "step": 109800 }, { "epoch": 0.13260899140846977, "learning_rate": 9.596568367729347e-06, "loss": 4.512953491210937, "step": 109900 }, { "epoch": 0.13272965473095247, "learning_rate": 9.596164532261609e-06, "loss": 4.487915649414062, "step": 110000 }, { "epoch": 0.13285031805343514, "learning_rate": 9.59576069679387e-06, "loss": 4.477689514160156, "step": 110100 }, { "epoch": 0.13297098137591784, "learning_rate": 9.595356861326131e-06, "loss": 4.457083740234375, "step": 110200 }, { "epoch": 0.1330916446984005, "learning_rate": 9.594953025858393e-06, "loss": 4.4653662109375, "step": 110300 }, { "epoch": 0.1332123080208832, "learning_rate": 9.594549190390655e-06, "loss": 4.469291687011719, "step": 110400 }, { "epoch": 0.13333297134336589, "learning_rate": 9.594145354922917e-06, "loss": 4.486278381347656, "step": 110500 }, { "epoch": 0.13345363466584856, "learning_rate": 9.593741519455179e-06, "loss": 4.490919189453125, "step": 110600 }, { "epoch": 0.13357429798833126, "learning_rate": 9.593337683987441e-06, "loss": 4.4483575439453125, "step": 110700 }, { "epoch": 0.13369496131081393, "learning_rate": 9.592933848519701e-06, "loss": 4.45943359375, "step": 110800 }, { "epoch": 0.13381562463329663, "learning_rate": 9.592530013051963e-06, "loss": 4.465886535644532, "step": 110900 }, { "epoch": 0.1339362879557793, "learning_rate": 9.592126177584225e-06, "loss": 4.440640563964844, "step": 111000 }, { "epoch": 0.13405695127826198, "learning_rate": 9.591722342116486e-06, "loss": 4.476104736328125, "step": 111100 }, { "epoch": 0.13417761460074468, "learning_rate": 9.591318506648748e-06, "loss": 4.466950988769531, "step": 111200 }, { "epoch": 0.13429827792322735, "learning_rate": 9.59091467118101e-06, "loss": 4.44192138671875, "step": 111300 }, { "epoch": 0.13441894124571005, "learning_rate": 9.590510835713272e-06, "loss": 4.460939331054687, "step": 111400 }, { "epoch": 0.13453960456819272, "learning_rate": 9.590107000245534e-06, "loss": 4.462611083984375, "step": 111500 }, { "epoch": 0.13466026789067542, "learning_rate": 9.589703164777794e-06, "loss": 4.46771484375, "step": 111600 }, { "epoch": 0.1347809312131581, "learning_rate": 9.589299329310056e-06, "loss": 4.469099731445312, "step": 111700 }, { "epoch": 0.13490159453564077, "learning_rate": 9.588895493842318e-06, "loss": 4.476997985839843, "step": 111800 }, { "epoch": 0.13502225785812347, "learning_rate": 9.58849165837458e-06, "loss": 4.453414001464844, "step": 111900 }, { "epoch": 0.13514292118060614, "learning_rate": 9.58808782290684e-06, "loss": 4.475471496582031, "step": 112000 }, { "epoch": 0.13526358450308884, "learning_rate": 9.587683987439102e-06, "loss": 4.473577575683594, "step": 112100 }, { "epoch": 0.1353842478255715, "learning_rate": 9.587280151971364e-06, "loss": 4.458526000976563, "step": 112200 }, { "epoch": 0.13550491114805419, "learning_rate": 9.586876316503626e-06, "loss": 4.440609436035157, "step": 112300 }, { "epoch": 0.13562557447053689, "learning_rate": 9.586472481035886e-06, "loss": 4.463949584960938, "step": 112400 }, { "epoch": 0.13574623779301956, "learning_rate": 9.586068645568148e-06, "loss": 4.4455328369140625, "step": 112500 }, { "epoch": 0.13586690111550226, "learning_rate": 9.58566481010041e-06, "loss": 4.45734375, "step": 112600 }, { "epoch": 0.13598756443798493, "learning_rate": 9.585260974632672e-06, "loss": 4.432592468261719, "step": 112700 }, { "epoch": 0.13610822776046763, "learning_rate": 9.584857139164934e-06, "loss": 4.418620910644531, "step": 112800 }, { "epoch": 0.1362288910829503, "learning_rate": 9.584453303697196e-06, "loss": 4.41904052734375, "step": 112900 }, { "epoch": 0.13634955440543298, "learning_rate": 9.584049468229456e-06, "loss": 4.441593017578125, "step": 113000 }, { "epoch": 0.13647021772791568, "learning_rate": 9.583645632761718e-06, "loss": 4.4470431518554685, "step": 113100 }, { "epoch": 0.13659088105039835, "learning_rate": 9.58324179729398e-06, "loss": 4.4390283203125, "step": 113200 }, { "epoch": 0.13671154437288105, "learning_rate": 9.58283796182624e-06, "loss": 4.445567321777344, "step": 113300 }, { "epoch": 0.13683220769536372, "learning_rate": 9.582434126358503e-06, "loss": 4.437692565917969, "step": 113400 }, { "epoch": 0.1369528710178464, "learning_rate": 9.582030290890765e-06, "loss": 4.465968322753906, "step": 113500 }, { "epoch": 0.1370735343403291, "learning_rate": 9.581626455423027e-06, "loss": 4.4066619873046875, "step": 113600 }, { "epoch": 0.13719419766281177, "learning_rate": 9.581222619955289e-06, "loss": 4.454749755859375, "step": 113700 }, { "epoch": 0.13731486098529447, "learning_rate": 9.58081878448755e-06, "loss": 4.4673834228515625, "step": 113800 }, { "epoch": 0.13743552430777714, "learning_rate": 9.580414949019811e-06, "loss": 4.453739318847656, "step": 113900 }, { "epoch": 0.13755618763025984, "learning_rate": 9.580011113552073e-06, "loss": 4.429642639160156, "step": 114000 }, { "epoch": 0.1376768509527425, "learning_rate": 9.579607278084335e-06, "loss": 4.4275906372070315, "step": 114100 }, { "epoch": 0.13779751427522519, "learning_rate": 9.579203442616595e-06, "loss": 4.430051879882813, "step": 114200 }, { "epoch": 0.13791817759770789, "learning_rate": 9.578799607148857e-06, "loss": 4.434742126464844, "step": 114300 }, { "epoch": 0.13803884092019056, "learning_rate": 9.57839577168112e-06, "loss": 4.432896423339844, "step": 114400 }, { "epoch": 0.13815950424267326, "learning_rate": 9.577991936213381e-06, "loss": 4.445202331542969, "step": 114500 }, { "epoch": 0.13828016756515593, "learning_rate": 9.577588100745643e-06, "loss": 4.4600350952148435, "step": 114600 }, { "epoch": 0.1384008308876386, "learning_rate": 9.577184265277905e-06, "loss": 4.4270016479492185, "step": 114700 }, { "epoch": 0.1385214942101213, "learning_rate": 9.576780429810167e-06, "loss": 4.434621887207031, "step": 114800 }, { "epoch": 0.13864215753260398, "learning_rate": 9.576376594342427e-06, "loss": 4.406890869140625, "step": 114900 }, { "epoch": 0.13876282085508668, "learning_rate": 9.57597275887469e-06, "loss": 4.410062866210938, "step": 115000 }, { "epoch": 0.13888348417756935, "learning_rate": 9.57556892340695e-06, "loss": 4.430516357421875, "step": 115100 }, { "epoch": 0.13900414750005205, "learning_rate": 9.575165087939212e-06, "loss": 4.400594787597656, "step": 115200 }, { "epoch": 0.13912481082253472, "learning_rate": 9.574761252471474e-06, "loss": 4.425685424804687, "step": 115300 }, { "epoch": 0.1392454741450174, "learning_rate": 9.574357417003736e-06, "loss": 4.393196105957031, "step": 115400 }, { "epoch": 0.1393661374675001, "learning_rate": 9.573953581535998e-06, "loss": 4.400187683105469, "step": 115500 }, { "epoch": 0.13948680078998277, "learning_rate": 9.57354974606826e-06, "loss": 4.415928649902344, "step": 115600 }, { "epoch": 0.13960746411246547, "learning_rate": 9.57314591060052e-06, "loss": 4.41013671875, "step": 115700 }, { "epoch": 0.13972812743494814, "learning_rate": 9.572742075132782e-06, "loss": 4.4073974609375, "step": 115800 }, { "epoch": 0.1398487907574308, "learning_rate": 9.572338239665044e-06, "loss": 4.400917663574218, "step": 115900 }, { "epoch": 0.1399694540799135, "learning_rate": 9.571934404197306e-06, "loss": 4.448593444824219, "step": 116000 }, { "epoch": 0.14009011740239619, "learning_rate": 9.571530568729566e-06, "loss": 4.393462524414063, "step": 116100 }, { "epoch": 0.1402107807248789, "learning_rate": 9.571126733261828e-06, "loss": 4.4335107421875, "step": 116200 }, { "epoch": 0.14033144404736156, "learning_rate": 9.57072289779409e-06, "loss": 4.392406311035156, "step": 116300 }, { "epoch": 0.14045210736984423, "learning_rate": 9.570319062326352e-06, "loss": 4.394865417480469, "step": 116400 }, { "epoch": 0.14057277069232693, "learning_rate": 9.569915226858612e-06, "loss": 4.381990051269531, "step": 116500 }, { "epoch": 0.1406934340148096, "learning_rate": 9.569511391390874e-06, "loss": 4.418711242675781, "step": 116600 }, { "epoch": 0.1408140973372923, "learning_rate": 9.569107555923136e-06, "loss": 4.386910400390625, "step": 116700 }, { "epoch": 0.14093476065977498, "learning_rate": 9.568703720455398e-06, "loss": 4.409456481933594, "step": 116800 }, { "epoch": 0.14105542398225768, "learning_rate": 9.56829988498766e-06, "loss": 4.389706420898437, "step": 116900 }, { "epoch": 0.14117608730474035, "learning_rate": 9.56789604951992e-06, "loss": 4.406465759277344, "step": 117000 }, { "epoch": 0.14129675062722302, "learning_rate": 9.567492214052183e-06, "loss": 4.351282958984375, "step": 117100 }, { "epoch": 0.14141741394970572, "learning_rate": 9.567088378584445e-06, "loss": 4.409855041503906, "step": 117200 }, { "epoch": 0.1415380772721884, "learning_rate": 9.566684543116705e-06, "loss": 4.378627624511719, "step": 117300 }, { "epoch": 0.1416587405946711, "learning_rate": 9.566280707648967e-06, "loss": 4.415323486328125, "step": 117400 }, { "epoch": 0.14177940391715377, "learning_rate": 9.565876872181229e-06, "loss": 4.38979736328125, "step": 117500 }, { "epoch": 0.14190006723963644, "learning_rate": 9.56547303671349e-06, "loss": 4.387171020507813, "step": 117600 }, { "epoch": 0.14202073056211914, "learning_rate": 9.565069201245753e-06, "loss": 4.388475036621093, "step": 117700 }, { "epoch": 0.1421413938846018, "learning_rate": 9.564665365778015e-06, "loss": 4.3392642211914065, "step": 117800 }, { "epoch": 0.1422620572070845, "learning_rate": 9.564261530310277e-06, "loss": 4.374033813476562, "step": 117900 }, { "epoch": 0.14238272052956719, "learning_rate": 9.563857694842537e-06, "loss": 4.3949432373046875, "step": 118000 }, { "epoch": 0.1425033838520499, "learning_rate": 9.563453859374799e-06, "loss": 4.41203369140625, "step": 118100 }, { "epoch": 0.14262404717453256, "learning_rate": 9.56305002390706e-06, "loss": 4.352719421386719, "step": 118200 }, { "epoch": 0.14274471049701523, "learning_rate": 9.562646188439321e-06, "loss": 4.3942086791992185, "step": 118300 }, { "epoch": 0.14286537381949793, "learning_rate": 9.562242352971583e-06, "loss": 4.374820251464843, "step": 118400 }, { "epoch": 0.1429860371419806, "learning_rate": 9.561838517503845e-06, "loss": 4.379683837890625, "step": 118500 }, { "epoch": 0.1431067004644633, "learning_rate": 9.561434682036107e-06, "loss": 4.376545715332031, "step": 118600 }, { "epoch": 0.14322736378694598, "learning_rate": 9.56103084656837e-06, "loss": 4.389849243164062, "step": 118700 }, { "epoch": 0.14334802710942865, "learning_rate": 9.560627011100631e-06, "loss": 4.3559716796875, "step": 118800 }, { "epoch": 0.14346869043191135, "learning_rate": 9.560223175632891e-06, "loss": 4.365683898925782, "step": 118900 }, { "epoch": 0.14358935375439402, "learning_rate": 9.559819340165153e-06, "loss": 4.386561889648437, "step": 119000 }, { "epoch": 0.14371001707687672, "learning_rate": 9.559415504697415e-06, "loss": 4.356888427734375, "step": 119100 }, { "epoch": 0.1438306803993594, "learning_rate": 9.559011669229676e-06, "loss": 4.371274719238281, "step": 119200 }, { "epoch": 0.1439513437218421, "learning_rate": 9.558607833761938e-06, "loss": 4.351863098144531, "step": 119300 }, { "epoch": 0.14407200704432477, "learning_rate": 9.5582039982942e-06, "loss": 4.347482299804687, "step": 119400 }, { "epoch": 0.14419267036680744, "learning_rate": 9.557800162826462e-06, "loss": 4.378409423828125, "step": 119500 }, { "epoch": 0.14431333368929014, "learning_rate": 9.557396327358724e-06, "loss": 4.374012145996094, "step": 119600 }, { "epoch": 0.1444339970117728, "learning_rate": 9.556992491890986e-06, "loss": 4.375729675292969, "step": 119700 }, { "epoch": 0.1445546603342555, "learning_rate": 9.556588656423246e-06, "loss": 4.373175354003906, "step": 119800 }, { "epoch": 0.1446753236567382, "learning_rate": 9.556184820955508e-06, "loss": 4.3620947265625, "step": 119900 }, { "epoch": 0.14479598697922086, "learning_rate": 9.55578098548777e-06, "loss": 4.358991088867188, "step": 120000 }, { "epoch": 0.14491665030170356, "learning_rate": 9.55537715002003e-06, "loss": 4.350498352050781, "step": 120100 }, { "epoch": 0.14503731362418623, "learning_rate": 9.554973314552292e-06, "loss": 4.350937194824219, "step": 120200 }, { "epoch": 0.14515797694666893, "learning_rate": 9.554569479084554e-06, "loss": 4.331032409667968, "step": 120300 }, { "epoch": 0.1452786402691516, "learning_rate": 9.554165643616816e-06, "loss": 4.3107452392578125, "step": 120400 }, { "epoch": 0.1453993035916343, "learning_rate": 9.553761808149078e-06, "loss": 4.337636413574219, "step": 120500 }, { "epoch": 0.14551996691411698, "learning_rate": 9.553357972681338e-06, "loss": 4.359307861328125, "step": 120600 }, { "epoch": 0.14564063023659965, "learning_rate": 9.5529541372136e-06, "loss": 4.340976257324218, "step": 120700 }, { "epoch": 0.14576129355908235, "learning_rate": 9.552550301745862e-06, "loss": 4.384718933105469, "step": 120800 }, { "epoch": 0.14588195688156502, "learning_rate": 9.552146466278124e-06, "loss": 4.3548126220703125, "step": 120900 }, { "epoch": 0.14600262020404772, "learning_rate": 9.551742630810386e-06, "loss": 4.36437744140625, "step": 121000 }, { "epoch": 0.1461232835265304, "learning_rate": 9.551338795342647e-06, "loss": 4.35047119140625, "step": 121100 }, { "epoch": 0.14624394684901307, "learning_rate": 9.550934959874909e-06, "loss": 4.325852355957031, "step": 121200 }, { "epoch": 0.14636461017149577, "learning_rate": 9.55053112440717e-06, "loss": 4.342714233398437, "step": 121300 }, { "epoch": 0.14648527349397844, "learning_rate": 9.55012728893943e-06, "loss": 4.33703369140625, "step": 121400 }, { "epoch": 0.14660593681646114, "learning_rate": 9.549723453471693e-06, "loss": 4.339054565429688, "step": 121500 }, { "epoch": 0.1467266001389438, "learning_rate": 9.549319618003955e-06, "loss": 4.337333984375, "step": 121600 }, { "epoch": 0.1468472634614265, "learning_rate": 9.548915782536217e-06, "loss": 4.377168273925781, "step": 121700 }, { "epoch": 0.1469679267839092, "learning_rate": 9.548511947068479e-06, "loss": 4.317802124023437, "step": 121800 }, { "epoch": 0.14708859010639186, "learning_rate": 9.54810811160074e-06, "loss": 4.320137939453125, "step": 121900 }, { "epoch": 0.14720925342887456, "learning_rate": 9.547704276133001e-06, "loss": 4.329671936035156, "step": 122000 }, { "epoch": 0.14732991675135723, "learning_rate": 9.547300440665263e-06, "loss": 4.316641845703125, "step": 122100 }, { "epoch": 0.14745058007383993, "learning_rate": 9.546896605197525e-06, "loss": 4.347405700683594, "step": 122200 }, { "epoch": 0.1475712433963226, "learning_rate": 9.546492769729785e-06, "loss": 4.331479797363281, "step": 122300 }, { "epoch": 0.14769190671880528, "learning_rate": 9.546088934262047e-06, "loss": 4.31545166015625, "step": 122400 }, { "epoch": 0.14781257004128798, "learning_rate": 9.54568509879431e-06, "loss": 4.32429443359375, "step": 122500 }, { "epoch": 0.14793323336377065, "learning_rate": 9.545281263326571e-06, "loss": 4.3228302001953125, "step": 122600 }, { "epoch": 0.14805389668625335, "learning_rate": 9.544877427858833e-06, "loss": 4.308872680664063, "step": 122700 }, { "epoch": 0.14817456000873602, "learning_rate": 9.544473592391095e-06, "loss": 4.337101440429688, "step": 122800 }, { "epoch": 0.1482952233312187, "learning_rate": 9.544069756923357e-06, "loss": 4.331028137207031, "step": 122900 }, { "epoch": 0.1484158866537014, "learning_rate": 9.543665921455617e-06, "loss": 4.325223388671875, "step": 123000 }, { "epoch": 0.14853654997618407, "learning_rate": 9.54326208598788e-06, "loss": 4.3249508666992185, "step": 123100 }, { "epoch": 0.14865721329866677, "learning_rate": 9.54285825052014e-06, "loss": 4.341258850097656, "step": 123200 }, { "epoch": 0.14877787662114944, "learning_rate": 9.542454415052402e-06, "loss": 4.3162838745117185, "step": 123300 }, { "epoch": 0.14889853994363214, "learning_rate": 9.542050579584664e-06, "loss": 4.314066162109375, "step": 123400 }, { "epoch": 0.1490192032661148, "learning_rate": 9.541646744116926e-06, "loss": 4.327146911621094, "step": 123500 }, { "epoch": 0.1491398665885975, "learning_rate": 9.541242908649188e-06, "loss": 4.281849670410156, "step": 123600 }, { "epoch": 0.1492605299110802, "learning_rate": 9.54083907318145e-06, "loss": 4.31343505859375, "step": 123700 }, { "epoch": 0.14938119323356286, "learning_rate": 9.540435237713712e-06, "loss": 4.310948486328125, "step": 123800 }, { "epoch": 0.14950185655604556, "learning_rate": 9.540031402245972e-06, "loss": 4.299508056640625, "step": 123900 }, { "epoch": 0.14962251987852823, "learning_rate": 9.539627566778234e-06, "loss": 4.28039794921875, "step": 124000 }, { "epoch": 0.1497431832010109, "learning_rate": 9.539223731310496e-06, "loss": 4.311947326660157, "step": 124100 }, { "epoch": 0.1498638465234936, "learning_rate": 9.538819895842756e-06, "loss": 4.342105712890625, "step": 124200 }, { "epoch": 0.14998450984597628, "learning_rate": 9.538416060375018e-06, "loss": 4.314954833984375, "step": 124300 }, { "epoch": 0.15010517316845898, "learning_rate": 9.53801222490728e-06, "loss": 4.325047912597657, "step": 124400 }, { "epoch": 0.15022583649094165, "learning_rate": 9.537608389439542e-06, "loss": 4.295559692382812, "step": 124500 }, { "epoch": 0.15034649981342435, "learning_rate": 9.537204553971804e-06, "loss": 4.326130981445313, "step": 124600 }, { "epoch": 0.15046716313590702, "learning_rate": 9.536800718504064e-06, "loss": 4.280221557617187, "step": 124700 }, { "epoch": 0.1505878264583897, "learning_rate": 9.536396883036326e-06, "loss": 4.321505737304688, "step": 124800 }, { "epoch": 0.1507084897808724, "learning_rate": 9.535993047568588e-06, "loss": 4.304708557128906, "step": 124900 }, { "epoch": 0.15082915310335507, "learning_rate": 9.53558921210085e-06, "loss": 4.320899658203125, "step": 125000 }, { "epoch": 0.15094981642583777, "learning_rate": 9.535185376633112e-06, "loss": 4.311892700195313, "step": 125100 }, { "epoch": 0.15107047974832044, "learning_rate": 9.534781541165373e-06, "loss": 4.304443359375, "step": 125200 }, { "epoch": 0.1511911430708031, "learning_rate": 9.534377705697635e-06, "loss": 4.29806884765625, "step": 125300 }, { "epoch": 0.1513118063932858, "learning_rate": 9.533973870229897e-06, "loss": 4.282315368652344, "step": 125400 }, { "epoch": 0.1514324697157685, "learning_rate": 9.533570034762157e-06, "loss": 4.294893188476562, "step": 125500 }, { "epoch": 0.1515531330382512, "learning_rate": 9.533166199294419e-06, "loss": 4.278684997558594, "step": 125600 }, { "epoch": 0.15167379636073386, "learning_rate": 9.53276236382668e-06, "loss": 4.298463745117187, "step": 125700 }, { "epoch": 0.15179445968321656, "learning_rate": 9.532358528358943e-06, "loss": 4.276971435546875, "step": 125800 }, { "epoch": 0.15191512300569923, "learning_rate": 9.531954692891205e-06, "loss": 4.266158752441406, "step": 125900 }, { "epoch": 0.1520357863281819, "learning_rate": 9.531550857423467e-06, "loss": 4.272743835449218, "step": 126000 }, { "epoch": 0.1521564496506646, "learning_rate": 9.531147021955727e-06, "loss": 4.277969055175781, "step": 126100 }, { "epoch": 0.15227711297314728, "learning_rate": 9.530743186487989e-06, "loss": 4.287745361328125, "step": 126200 }, { "epoch": 0.15239777629562998, "learning_rate": 9.530339351020251e-06, "loss": 4.300249633789062, "step": 126300 }, { "epoch": 0.15251843961811265, "learning_rate": 9.529935515552511e-06, "loss": 4.285774841308593, "step": 126400 }, { "epoch": 0.15263910294059532, "learning_rate": 9.529531680084773e-06, "loss": 4.305826721191406, "step": 126500 }, { "epoch": 0.15275976626307802, "learning_rate": 9.529127844617035e-06, "loss": 4.295311279296875, "step": 126600 }, { "epoch": 0.1528804295855607, "learning_rate": 9.528724009149297e-06, "loss": 4.2653350830078125, "step": 126700 }, { "epoch": 0.1530010929080434, "learning_rate": 9.52832017368156e-06, "loss": 4.296410827636719, "step": 126800 }, { "epoch": 0.15312175623052607, "learning_rate": 9.527916338213821e-06, "loss": 4.288053283691406, "step": 126900 }, { "epoch": 0.15324241955300877, "learning_rate": 9.527512502746083e-06, "loss": 4.275084228515625, "step": 127000 }, { "epoch": 0.15336308287549144, "learning_rate": 9.527108667278344e-06, "loss": 4.290885009765625, "step": 127100 }, { "epoch": 0.1534837461979741, "learning_rate": 9.526704831810605e-06, "loss": 4.274404907226563, "step": 127200 }, { "epoch": 0.1536044095204568, "learning_rate": 9.526300996342866e-06, "loss": 4.293334350585938, "step": 127300 }, { "epoch": 0.1537250728429395, "learning_rate": 9.525897160875128e-06, "loss": 4.264752197265625, "step": 127400 }, { "epoch": 0.1538457361654222, "learning_rate": 9.52549332540739e-06, "loss": 4.257093505859375, "step": 127500 }, { "epoch": 0.15396639948790486, "learning_rate": 9.525089489939652e-06, "loss": 4.267686157226563, "step": 127600 }, { "epoch": 0.15408706281038753, "learning_rate": 9.524685654471914e-06, "loss": 4.289052734375, "step": 127700 }, { "epoch": 0.15420772613287023, "learning_rate": 9.524281819004176e-06, "loss": 4.2693087768554685, "step": 127800 }, { "epoch": 0.1543283894553529, "learning_rate": 9.523877983536436e-06, "loss": 4.302455139160156, "step": 127900 }, { "epoch": 0.1544490527778356, "learning_rate": 9.523474148068698e-06, "loss": 4.255574645996094, "step": 128000 }, { "epoch": 0.15456971610031828, "learning_rate": 9.52307031260096e-06, "loss": 4.264149169921875, "step": 128100 }, { "epoch": 0.15469037942280095, "learning_rate": 9.522666477133222e-06, "loss": 4.245845031738281, "step": 128200 }, { "epoch": 0.15481104274528365, "learning_rate": 9.522262641665482e-06, "loss": 4.248517150878906, "step": 128300 }, { "epoch": 0.15493170606776632, "learning_rate": 9.521858806197744e-06, "loss": 4.2542047119140625, "step": 128400 }, { "epoch": 0.15505236939024902, "learning_rate": 9.521454970730006e-06, "loss": 4.2518923950195315, "step": 128500 }, { "epoch": 0.1551730327127317, "learning_rate": 9.521051135262268e-06, "loss": 4.2552798461914065, "step": 128600 }, { "epoch": 0.1552936960352144, "learning_rate": 9.52064729979453e-06, "loss": 4.248907470703125, "step": 128700 }, { "epoch": 0.15541435935769707, "learning_rate": 9.52024346432679e-06, "loss": 4.2556304931640625, "step": 128800 }, { "epoch": 0.15553502268017974, "learning_rate": 9.519839628859052e-06, "loss": 4.2737353515625, "step": 128900 }, { "epoch": 0.15565568600266244, "learning_rate": 9.519435793391314e-06, "loss": 4.246327819824219, "step": 129000 }, { "epoch": 0.1557763493251451, "learning_rate": 9.519031957923576e-06, "loss": 4.262615051269531, "step": 129100 }, { "epoch": 0.15589701264762781, "learning_rate": 9.518628122455837e-06, "loss": 4.2385009765625, "step": 129200 }, { "epoch": 0.1560176759701105, "learning_rate": 9.518224286988099e-06, "loss": 4.2525567626953125, "step": 129300 }, { "epoch": 0.15613833929259316, "learning_rate": 9.51782045152036e-06, "loss": 4.260746765136719, "step": 129400 }, { "epoch": 0.15625900261507586, "learning_rate": 9.517416616052623e-06, "loss": 4.245251159667969, "step": 129500 }, { "epoch": 0.15637966593755853, "learning_rate": 9.517012780584883e-06, "loss": 4.228903198242188, "step": 129600 }, { "epoch": 0.15650032926004123, "learning_rate": 9.516608945117145e-06, "loss": 4.230923461914062, "step": 129700 }, { "epoch": 0.1566209925825239, "learning_rate": 9.516205109649407e-06, "loss": 4.2522366333007815, "step": 129800 }, { "epoch": 0.1567416559050066, "learning_rate": 9.515801274181669e-06, "loss": 4.241545104980469, "step": 129900 }, { "epoch": 0.15686231922748928, "learning_rate": 9.51539743871393e-06, "loss": 4.218800048828125, "step": 130000 }, { "epoch": 0.15698298254997195, "learning_rate": 9.514993603246193e-06, "loss": 4.24559326171875, "step": 130100 }, { "epoch": 0.15710364587245465, "learning_rate": 9.514589767778453e-06, "loss": 4.23311767578125, "step": 130200 }, { "epoch": 0.15722430919493732, "learning_rate": 9.514185932310715e-06, "loss": 4.249968566894531, "step": 130300 }, { "epoch": 0.15734497251742002, "learning_rate": 9.513782096842975e-06, "loss": 4.238301086425781, "step": 130400 }, { "epoch": 0.1574656358399027, "learning_rate": 9.513378261375237e-06, "loss": 4.258863525390625, "step": 130500 }, { "epoch": 0.15758629916238537, "learning_rate": 9.5129744259075e-06, "loss": 4.228417053222656, "step": 130600 }, { "epoch": 0.15770696248486807, "learning_rate": 9.512570590439761e-06, "loss": 4.212883605957031, "step": 130700 }, { "epoch": 0.15782762580735074, "learning_rate": 9.512166754972023e-06, "loss": 4.241891784667969, "step": 130800 }, { "epoch": 0.15794828912983344, "learning_rate": 9.511762919504285e-06, "loss": 4.2326287841796875, "step": 130900 }, { "epoch": 0.1580689524523161, "learning_rate": 9.511359084036547e-06, "loss": 4.238702392578125, "step": 131000 }, { "epoch": 0.15818961577479881, "learning_rate": 9.510955248568808e-06, "loss": 4.253780517578125, "step": 131100 }, { "epoch": 0.1583102790972815, "learning_rate": 9.51055141310107e-06, "loss": 4.240475769042969, "step": 131200 }, { "epoch": 0.15843094241976416, "learning_rate": 9.510147577633332e-06, "loss": 4.236222229003906, "step": 131300 }, { "epoch": 0.15855160574224686, "learning_rate": 9.509743742165592e-06, "loss": 4.194006652832031, "step": 131400 }, { "epoch": 0.15867226906472953, "learning_rate": 9.509339906697854e-06, "loss": 4.239622192382813, "step": 131500 }, { "epoch": 0.15879293238721223, "learning_rate": 9.508936071230116e-06, "loss": 4.252107849121094, "step": 131600 }, { "epoch": 0.1589135957096949, "learning_rate": 9.508532235762378e-06, "loss": 4.230406188964844, "step": 131700 }, { "epoch": 0.15903425903217758, "learning_rate": 9.50812840029464e-06, "loss": 4.215827941894531, "step": 131800 }, { "epoch": 0.15915492235466028, "learning_rate": 9.507724564826902e-06, "loss": 4.215340576171875, "step": 131900 }, { "epoch": 0.15927558567714295, "learning_rate": 9.507320729359162e-06, "loss": 4.2347238159179685, "step": 132000 }, { "epoch": 0.15939624899962565, "learning_rate": 9.506916893891424e-06, "loss": 4.237113647460937, "step": 132100 }, { "epoch": 0.15951691232210832, "learning_rate": 9.506513058423686e-06, "loss": 4.220930786132812, "step": 132200 }, { "epoch": 0.15963757564459102, "learning_rate": 9.506109222955946e-06, "loss": 4.192018432617187, "step": 132300 }, { "epoch": 0.1597582389670737, "learning_rate": 9.505705387488208e-06, "loss": 4.224645385742187, "step": 132400 }, { "epoch": 0.15987890228955637, "learning_rate": 9.50530155202047e-06, "loss": 4.231823425292969, "step": 132500 }, { "epoch": 0.15999956561203907, "learning_rate": 9.504897716552732e-06, "loss": 4.199769287109375, "step": 132600 }, { "epoch": 0.16012022893452174, "learning_rate": 9.504493881084994e-06, "loss": 4.216982421875, "step": 132700 }, { "epoch": 0.16024089225700444, "learning_rate": 9.504090045617254e-06, "loss": 4.201979675292969, "step": 132800 }, { "epoch": 0.16036155557948711, "learning_rate": 9.503686210149516e-06, "loss": 4.249957580566406, "step": 132900 }, { "epoch": 0.1604822189019698, "learning_rate": 9.503282374681778e-06, "loss": 4.234060668945313, "step": 133000 }, { "epoch": 0.1606028822244525, "learning_rate": 9.50287853921404e-06, "loss": 4.198249206542969, "step": 133100 }, { "epoch": 0.16072354554693516, "learning_rate": 9.502474703746302e-06, "loss": 4.212026977539063, "step": 133200 }, { "epoch": 0.16084420886941786, "learning_rate": 9.502070868278563e-06, "loss": 4.194464111328125, "step": 133300 }, { "epoch": 0.16096487219190053, "learning_rate": 9.501667032810825e-06, "loss": 4.19867919921875, "step": 133400 }, { "epoch": 0.16108553551438323, "learning_rate": 9.501263197343087e-06, "loss": 4.195557556152344, "step": 133500 }, { "epoch": 0.1612061988368659, "learning_rate": 9.500859361875349e-06, "loss": 4.191703491210937, "step": 133600 }, { "epoch": 0.16132686215934858, "learning_rate": 9.500455526407609e-06, "loss": 4.226734924316406, "step": 133700 }, { "epoch": 0.16144752548183128, "learning_rate": 9.500051690939871e-06, "loss": 4.220860290527344, "step": 133800 }, { "epoch": 0.16156818880431395, "learning_rate": 9.499647855472133e-06, "loss": 4.218114013671875, "step": 133900 }, { "epoch": 0.16168885212679665, "learning_rate": 9.499244020004395e-06, "loss": 4.2, "step": 134000 }, { "epoch": 0.16180951544927932, "learning_rate": 9.498840184536657e-06, "loss": 4.182944641113282, "step": 134100 }, { "epoch": 0.161930178771762, "learning_rate": 9.498436349068917e-06, "loss": 4.156382141113281, "step": 134200 }, { "epoch": 0.1620508420942447, "learning_rate": 9.498032513601179e-06, "loss": 4.207982788085937, "step": 134300 }, { "epoch": 0.16217150541672737, "learning_rate": 9.497628678133441e-06, "loss": 4.20839111328125, "step": 134400 }, { "epoch": 0.16229216873921007, "learning_rate": 9.497224842665701e-06, "loss": 4.201115112304688, "step": 134500 }, { "epoch": 0.16241283206169274, "learning_rate": 9.496821007197963e-06, "loss": 4.1791293334960935, "step": 134600 }, { "epoch": 0.1625334953841754, "learning_rate": 9.496417171730225e-06, "loss": 4.187546997070313, "step": 134700 }, { "epoch": 0.16265415870665811, "learning_rate": 9.496013336262487e-06, "loss": 4.196438293457032, "step": 134800 }, { "epoch": 0.1627748220291408, "learning_rate": 9.49560950079475e-06, "loss": 4.191497802734375, "step": 134900 }, { "epoch": 0.1628954853516235, "learning_rate": 9.495205665327011e-06, "loss": 4.215068054199219, "step": 135000 }, { "epoch": 0.16301614867410616, "learning_rate": 9.494801829859273e-06, "loss": 4.167944641113281, "step": 135100 }, { "epoch": 0.16313681199658886, "learning_rate": 9.494397994391534e-06, "loss": 4.205506591796875, "step": 135200 }, { "epoch": 0.16325747531907153, "learning_rate": 9.493994158923796e-06, "loss": 4.181203308105469, "step": 135300 }, { "epoch": 0.1633781386415542, "learning_rate": 9.493590323456056e-06, "loss": 4.181968383789062, "step": 135400 }, { "epoch": 0.1634988019640369, "learning_rate": 9.493186487988318e-06, "loss": 4.188661193847656, "step": 135500 }, { "epoch": 0.16361946528651958, "learning_rate": 9.49278265252058e-06, "loss": 4.200094604492188, "step": 135600 }, { "epoch": 0.16374012860900228, "learning_rate": 9.492378817052842e-06, "loss": 4.158785705566406, "step": 135700 }, { "epoch": 0.16386079193148495, "learning_rate": 9.491974981585104e-06, "loss": 4.159096374511718, "step": 135800 }, { "epoch": 0.16398145525396762, "learning_rate": 9.491571146117366e-06, "loss": 4.218682556152344, "step": 135900 }, { "epoch": 0.16410211857645032, "learning_rate": 9.491167310649628e-06, "loss": 4.178736572265625, "step": 136000 }, { "epoch": 0.164222781898933, "learning_rate": 9.490763475181888e-06, "loss": 4.1625192260742185, "step": 136100 }, { "epoch": 0.1643434452214157, "learning_rate": 9.49035963971415e-06, "loss": 4.173831787109375, "step": 136200 }, { "epoch": 0.16446410854389837, "learning_rate": 9.489955804246412e-06, "loss": 4.172528381347656, "step": 136300 }, { "epoch": 0.16458477186638107, "learning_rate": 9.489551968778672e-06, "loss": 4.1877224731445315, "step": 136400 }, { "epoch": 0.16470543518886374, "learning_rate": 9.489148133310934e-06, "loss": 4.170550231933594, "step": 136500 }, { "epoch": 0.1648260985113464, "learning_rate": 9.488744297843196e-06, "loss": 4.178667602539062, "step": 136600 }, { "epoch": 0.16494676183382911, "learning_rate": 9.488340462375458e-06, "loss": 4.193502807617188, "step": 136700 }, { "epoch": 0.1650674251563118, "learning_rate": 9.48793662690772e-06, "loss": 4.14175537109375, "step": 136800 }, { "epoch": 0.1651880884787945, "learning_rate": 9.48753279143998e-06, "loss": 4.170281982421875, "step": 136900 }, { "epoch": 0.16530875180127716, "learning_rate": 9.487128955972243e-06, "loss": 4.183246765136719, "step": 137000 }, { "epoch": 0.16542941512375983, "learning_rate": 9.486725120504504e-06, "loss": 4.175970458984375, "step": 137100 }, { "epoch": 0.16555007844624253, "learning_rate": 9.486321285036766e-06, "loss": 4.146685485839844, "step": 137200 }, { "epoch": 0.1656707417687252, "learning_rate": 9.485917449569028e-06, "loss": 4.153794250488281, "step": 137300 }, { "epoch": 0.1657914050912079, "learning_rate": 9.485513614101289e-06, "loss": 4.156079711914063, "step": 137400 }, { "epoch": 0.16591206841369058, "learning_rate": 9.48510977863355e-06, "loss": 4.1634674072265625, "step": 137500 }, { "epoch": 0.16603273173617328, "learning_rate": 9.484705943165813e-06, "loss": 4.172157897949218, "step": 137600 }, { "epoch": 0.16615339505865595, "learning_rate": 9.484302107698073e-06, "loss": 4.152699584960938, "step": 137700 }, { "epoch": 0.16627405838113862, "learning_rate": 9.483898272230335e-06, "loss": 4.132930297851562, "step": 137800 }, { "epoch": 0.16639472170362132, "learning_rate": 9.483494436762597e-06, "loss": 4.167182312011719, "step": 137900 }, { "epoch": 0.166515385026104, "learning_rate": 9.483090601294859e-06, "loss": 4.155087585449219, "step": 138000 }, { "epoch": 0.1666360483485867, "learning_rate": 9.482686765827121e-06, "loss": 4.171703491210938, "step": 138100 }, { "epoch": 0.16675671167106937, "learning_rate": 9.482282930359383e-06, "loss": 4.159670104980469, "step": 138200 }, { "epoch": 0.16687737499355204, "learning_rate": 9.481879094891643e-06, "loss": 4.147190856933594, "step": 138300 }, { "epoch": 0.16699803831603474, "learning_rate": 9.481475259423905e-06, "loss": 4.144685363769531, "step": 138400 }, { "epoch": 0.16711870163851741, "learning_rate": 9.481071423956167e-06, "loss": 4.152030334472657, "step": 138500 }, { "epoch": 0.16723936496100011, "learning_rate": 9.480667588488427e-06, "loss": 4.16162109375, "step": 138600 }, { "epoch": 0.1673600282834828, "learning_rate": 9.48026375302069e-06, "loss": 4.141409912109375, "step": 138700 }, { "epoch": 0.1674806916059655, "learning_rate": 9.479859917552951e-06, "loss": 4.161637573242188, "step": 138800 }, { "epoch": 0.16760135492844816, "learning_rate": 9.479456082085213e-06, "loss": 4.149785461425782, "step": 138900 }, { "epoch": 0.16772201825093083, "learning_rate": 9.479052246617475e-06, "loss": 4.137402648925781, "step": 139000 }, { "epoch": 0.16784268157341353, "learning_rate": 9.478648411149737e-06, "loss": 4.164827270507812, "step": 139100 }, { "epoch": 0.1679633448958962, "learning_rate": 9.478244575682e-06, "loss": 4.136315612792969, "step": 139200 }, { "epoch": 0.1680840082183789, "learning_rate": 9.47784074021426e-06, "loss": 4.13937744140625, "step": 139300 }, { "epoch": 0.16820467154086158, "learning_rate": 9.477436904746522e-06, "loss": 4.138125305175781, "step": 139400 }, { "epoch": 0.16832533486334425, "learning_rate": 9.477033069278782e-06, "loss": 4.1315478515625, "step": 139500 }, { "epoch": 0.16844599818582695, "learning_rate": 9.476629233811044e-06, "loss": 4.156204833984375, "step": 139600 }, { "epoch": 0.16856666150830962, "learning_rate": 9.476225398343306e-06, "loss": 4.163810119628907, "step": 139700 }, { "epoch": 0.16868732483079232, "learning_rate": 9.475821562875568e-06, "loss": 4.1622900390625, "step": 139800 }, { "epoch": 0.168807988153275, "learning_rate": 9.47541772740783e-06, "loss": 4.164542236328125, "step": 139900 }, { "epoch": 0.1689286514757577, "learning_rate": 9.475013891940092e-06, "loss": 4.1283544921875, "step": 140000 }, { "epoch": 0.16904931479824037, "learning_rate": 9.474610056472354e-06, "loss": 4.169474487304687, "step": 140100 }, { "epoch": 0.16916997812072304, "learning_rate": 9.474206221004614e-06, "loss": 4.153294677734375, "step": 140200 }, { "epoch": 0.16929064144320574, "learning_rate": 9.473802385536876e-06, "loss": 4.14068115234375, "step": 140300 }, { "epoch": 0.16941130476568841, "learning_rate": 9.473398550069138e-06, "loss": 4.134254455566406, "step": 140400 }, { "epoch": 0.16953196808817111, "learning_rate": 9.472994714601398e-06, "loss": 4.139063110351563, "step": 140500 }, { "epoch": 0.1696526314106538, "learning_rate": 9.47259087913366e-06, "loss": 4.143599853515625, "step": 140600 }, { "epoch": 0.16977329473313646, "learning_rate": 9.472187043665922e-06, "loss": 4.115407409667969, "step": 140700 }, { "epoch": 0.16989395805561916, "learning_rate": 9.471783208198184e-06, "loss": 4.142363586425781, "step": 140800 }, { "epoch": 0.17001462137810183, "learning_rate": 9.471379372730446e-06, "loss": 4.128663024902344, "step": 140900 }, { "epoch": 0.17013528470058453, "learning_rate": 9.470975537262707e-06, "loss": 4.125610961914062, "step": 141000 }, { "epoch": 0.1702559480230672, "learning_rate": 9.470571701794969e-06, "loss": 4.129360961914062, "step": 141100 }, { "epoch": 0.17037661134554988, "learning_rate": 9.47016786632723e-06, "loss": 4.167195739746094, "step": 141200 }, { "epoch": 0.17049727466803258, "learning_rate": 9.469764030859493e-06, "loss": 4.1093988037109375, "step": 141300 }, { "epoch": 0.17061793799051525, "learning_rate": 9.469360195391753e-06, "loss": 4.131300048828125, "step": 141400 }, { "epoch": 0.17073860131299795, "learning_rate": 9.468956359924015e-06, "loss": 4.122879943847656, "step": 141500 }, { "epoch": 0.17085926463548062, "learning_rate": 9.468552524456277e-06, "loss": 4.110649108886719, "step": 141600 }, { "epoch": 0.17097992795796332, "learning_rate": 9.468148688988539e-06, "loss": 4.117805786132813, "step": 141700 }, { "epoch": 0.171100591280446, "learning_rate": 9.467744853520799e-06, "loss": 4.1547119140625, "step": 141800 }, { "epoch": 0.17122125460292867, "learning_rate": 9.467341018053061e-06, "loss": 4.142525329589843, "step": 141900 }, { "epoch": 0.17134191792541137, "learning_rate": 9.466937182585323e-06, "loss": 4.132686462402344, "step": 142000 }, { "epoch": 0.17146258124789404, "learning_rate": 9.466533347117585e-06, "loss": 4.126594543457031, "step": 142100 }, { "epoch": 0.17158324457037674, "learning_rate": 9.466129511649847e-06, "loss": 4.121519470214844, "step": 142200 }, { "epoch": 0.17170390789285941, "learning_rate": 9.465725676182109e-06, "loss": 4.1388766479492185, "step": 142300 }, { "epoch": 0.1718245712153421, "learning_rate": 9.46532184071437e-06, "loss": 4.122481994628906, "step": 142400 }, { "epoch": 0.1719452345378248, "learning_rate": 9.464918005246631e-06, "loss": 4.111268920898437, "step": 142500 }, { "epoch": 0.17206589786030746, "learning_rate": 9.464514169778891e-06, "loss": 4.127690124511719, "step": 142600 }, { "epoch": 0.17218656118279016, "learning_rate": 9.464110334311153e-06, "loss": 4.116007995605469, "step": 142700 }, { "epoch": 0.17230722450527283, "learning_rate": 9.463706498843415e-06, "loss": 4.094861450195313, "step": 142800 }, { "epoch": 0.17242788782775553, "learning_rate": 9.463302663375677e-06, "loss": 4.121034240722656, "step": 142900 }, { "epoch": 0.1725485511502382, "learning_rate": 9.46289882790794e-06, "loss": 4.107123718261719, "step": 143000 }, { "epoch": 0.17266921447272088, "learning_rate": 9.462494992440201e-06, "loss": 4.114708251953125, "step": 143100 }, { "epoch": 0.17278987779520358, "learning_rate": 9.462091156972463e-06, "loss": 4.089667663574219, "step": 143200 }, { "epoch": 0.17291054111768625, "learning_rate": 9.461687321504724e-06, "loss": 4.112540893554687, "step": 143300 }, { "epoch": 0.17303120444016895, "learning_rate": 9.461283486036986e-06, "loss": 4.1080169677734375, "step": 143400 }, { "epoch": 0.17315186776265162, "learning_rate": 9.460879650569248e-06, "loss": 4.09574462890625, "step": 143500 }, { "epoch": 0.1732725310851343, "learning_rate": 9.460475815101508e-06, "loss": 4.110877990722656, "step": 143600 }, { "epoch": 0.173393194407617, "learning_rate": 9.46007197963377e-06, "loss": 4.111781005859375, "step": 143700 }, { "epoch": 0.17351385773009967, "learning_rate": 9.459668144166032e-06, "loss": 4.116029968261719, "step": 143800 }, { "epoch": 0.17363452105258237, "learning_rate": 9.459264308698294e-06, "loss": 4.083573303222656, "step": 143900 }, { "epoch": 0.17375518437506504, "learning_rate": 9.458860473230556e-06, "loss": 4.128597412109375, "step": 144000 }, { "epoch": 0.17387584769754774, "learning_rate": 9.458456637762818e-06, "loss": 4.100955200195313, "step": 144100 }, { "epoch": 0.17399651102003041, "learning_rate": 9.45805280229508e-06, "loss": 4.0837774658203125, "step": 144200 }, { "epoch": 0.1741171743425131, "learning_rate": 9.45764896682734e-06, "loss": 4.0916552734375, "step": 144300 }, { "epoch": 0.1742378376649958, "learning_rate": 9.457245131359602e-06, "loss": 4.099443969726562, "step": 144400 }, { "epoch": 0.17435850098747846, "learning_rate": 9.456841295891862e-06, "loss": 4.098468933105469, "step": 144500 }, { "epoch": 0.17447916430996116, "learning_rate": 9.456437460424124e-06, "loss": 4.083135070800782, "step": 144600 }, { "epoch": 0.17459982763244383, "learning_rate": 9.456033624956386e-06, "loss": 4.0824978637695315, "step": 144700 }, { "epoch": 0.1747204909549265, "learning_rate": 9.455629789488648e-06, "loss": 4.101973266601562, "step": 144800 }, { "epoch": 0.1748411542774092, "learning_rate": 9.45522595402091e-06, "loss": 4.093297424316407, "step": 144900 }, { "epoch": 0.17496181759989188, "learning_rate": 9.454822118553172e-06, "loss": 4.081582946777344, "step": 145000 }, { "epoch": 0.17508248092237458, "learning_rate": 9.454418283085433e-06, "loss": 4.115688781738282, "step": 145100 }, { "epoch": 0.17520314424485725, "learning_rate": 9.454014447617695e-06, "loss": 4.111075439453125, "step": 145200 }, { "epoch": 0.17532380756733995, "learning_rate": 9.453610612149957e-06, "loss": 4.104603271484375, "step": 145300 }, { "epoch": 0.17544447088982262, "learning_rate": 9.453206776682219e-06, "loss": 4.097171630859375, "step": 145400 }, { "epoch": 0.1755651342123053, "learning_rate": 9.452802941214479e-06, "loss": 4.0814361572265625, "step": 145500 }, { "epoch": 0.175685797534788, "learning_rate": 9.45239910574674e-06, "loss": 4.098536682128906, "step": 145600 }, { "epoch": 0.17580646085727067, "learning_rate": 9.451995270279003e-06, "loss": 4.097376098632813, "step": 145700 }, { "epoch": 0.17592712417975337, "learning_rate": 9.451591434811265e-06, "loss": 4.0992578125, "step": 145800 }, { "epoch": 0.17604778750223604, "learning_rate": 9.451187599343525e-06, "loss": 4.086771240234375, "step": 145900 }, { "epoch": 0.17616845082471871, "learning_rate": 9.450783763875787e-06, "loss": 4.094929504394531, "step": 146000 }, { "epoch": 0.17628911414720141, "learning_rate": 9.450379928408049e-06, "loss": 4.1046044921875, "step": 146100 }, { "epoch": 0.1764097774696841, "learning_rate": 9.449976092940311e-06, "loss": 4.060028686523437, "step": 146200 }, { "epoch": 0.1765304407921668, "learning_rate": 9.449572257472573e-06, "loss": 4.093073425292968, "step": 146300 }, { "epoch": 0.17665110411464946, "learning_rate": 9.449168422004833e-06, "loss": 4.060162963867188, "step": 146400 }, { "epoch": 0.17677176743713216, "learning_rate": 9.448764586537095e-06, "loss": 4.09326904296875, "step": 146500 }, { "epoch": 0.17689243075961483, "learning_rate": 9.448360751069357e-06, "loss": 4.03947265625, "step": 146600 }, { "epoch": 0.1770130940820975, "learning_rate": 9.447956915601618e-06, "loss": 4.081064758300781, "step": 146700 }, { "epoch": 0.1771337574045802, "learning_rate": 9.44755308013388e-06, "loss": 4.06759521484375, "step": 146800 }, { "epoch": 0.17725442072706288, "learning_rate": 9.447149244666141e-06, "loss": 4.101948547363281, "step": 146900 }, { "epoch": 0.17737508404954558, "learning_rate": 9.446745409198403e-06, "loss": 4.0613775634765625, "step": 147000 }, { "epoch": 0.17749574737202825, "learning_rate": 9.446341573730665e-06, "loss": 4.08305908203125, "step": 147100 }, { "epoch": 0.17761641069451092, "learning_rate": 9.445937738262927e-06, "loss": 4.054884338378907, "step": 147200 }, { "epoch": 0.17773707401699362, "learning_rate": 9.44553390279519e-06, "loss": 4.066440734863281, "step": 147300 }, { "epoch": 0.1778577373394763, "learning_rate": 9.44513006732745e-06, "loss": 4.063131713867188, "step": 147400 }, { "epoch": 0.177978400661959, "learning_rate": 9.444726231859712e-06, "loss": 4.0764794921875, "step": 147500 }, { "epoch": 0.17809906398444167, "learning_rate": 9.444322396391972e-06, "loss": 4.0662298583984375, "step": 147600 }, { "epoch": 0.17821972730692434, "learning_rate": 9.443918560924234e-06, "loss": 4.077352294921875, "step": 147700 }, { "epoch": 0.17834039062940704, "learning_rate": 9.443514725456496e-06, "loss": 4.088600158691406, "step": 147800 }, { "epoch": 0.17846105395188971, "learning_rate": 9.443110889988758e-06, "loss": 4.0680224609375, "step": 147900 }, { "epoch": 0.17858171727437241, "learning_rate": 9.44270705452102e-06, "loss": 4.052131958007813, "step": 148000 }, { "epoch": 0.1787023805968551, "learning_rate": 9.442303219053282e-06, "loss": 4.058963928222656, "step": 148100 }, { "epoch": 0.1788230439193378, "learning_rate": 9.441899383585544e-06, "loss": 4.080462341308594, "step": 148200 }, { "epoch": 0.17894370724182046, "learning_rate": 9.441495548117804e-06, "loss": 4.058490905761719, "step": 148300 }, { "epoch": 0.17906437056430313, "learning_rate": 9.441091712650066e-06, "loss": 4.058789672851563, "step": 148400 }, { "epoch": 0.17918503388678583, "learning_rate": 9.440687877182328e-06, "loss": 4.058347473144531, "step": 148500 }, { "epoch": 0.1793056972092685, "learning_rate": 9.440284041714588e-06, "loss": 4.04501708984375, "step": 148600 }, { "epoch": 0.1794263605317512, "learning_rate": 9.43988020624685e-06, "loss": 4.074843444824219, "step": 148700 }, { "epoch": 0.17954702385423388, "learning_rate": 9.439476370779112e-06, "loss": 4.060300598144531, "step": 148800 }, { "epoch": 0.17966768717671655, "learning_rate": 9.439072535311374e-06, "loss": 4.050150756835937, "step": 148900 }, { "epoch": 0.17978835049919925, "learning_rate": 9.438668699843636e-06, "loss": 4.049259338378906, "step": 149000 }, { "epoch": 0.17990901382168192, "learning_rate": 9.438264864375898e-06, "loss": 4.045036010742187, "step": 149100 }, { "epoch": 0.18002967714416462, "learning_rate": 9.437861028908159e-06, "loss": 4.089662170410156, "step": 149200 }, { "epoch": 0.1801503404666473, "learning_rate": 9.43745719344042e-06, "loss": 4.047580871582031, "step": 149300 }, { "epoch": 0.18027100378913, "learning_rate": 9.437053357972683e-06, "loss": 4.08689697265625, "step": 149400 }, { "epoch": 0.18039166711161267, "learning_rate": 9.436649522504943e-06, "loss": 4.0404141235351565, "step": 149500 }, { "epoch": 0.18051233043409534, "learning_rate": 9.436245687037205e-06, "loss": 4.0890960693359375, "step": 149600 }, { "epoch": 0.18063299375657804, "learning_rate": 9.435841851569467e-06, "loss": 4.05540283203125, "step": 149700 }, { "epoch": 0.18075365707906071, "learning_rate": 9.435438016101729e-06, "loss": 4.025476379394531, "step": 149800 }, { "epoch": 0.18087432040154341, "learning_rate": 9.43503418063399e-06, "loss": 4.0574777221679685, "step": 149900 }, { "epoch": 0.1809949837240261, "learning_rate": 9.434630345166251e-06, "loss": 4.03138916015625, "step": 150000 }, { "epoch": 0.18111564704650876, "learning_rate": 9.434226509698513e-06, "loss": 4.055688171386719, "step": 150100 }, { "epoch": 0.18123631036899146, "learning_rate": 9.433822674230775e-06, "loss": 4.031493530273438, "step": 150200 }, { "epoch": 0.18135697369147413, "learning_rate": 9.433418838763037e-06, "loss": 4.042034606933594, "step": 150300 }, { "epoch": 0.18147763701395683, "learning_rate": 9.433015003295299e-06, "loss": 4.044190368652344, "step": 150400 }, { "epoch": 0.1815983003364395, "learning_rate": 9.43261116782756e-06, "loss": 4.054629516601563, "step": 150500 }, { "epoch": 0.1817189636589222, "learning_rate": 9.432207332359821e-06, "loss": 4.025072631835937, "step": 150600 }, { "epoch": 0.18183962698140488, "learning_rate": 9.431803496892083e-06, "loss": 4.047225341796875, "step": 150700 }, { "epoch": 0.18196029030388755, "learning_rate": 9.431399661424344e-06, "loss": 4.048432312011719, "step": 150800 }, { "epoch": 0.18208095362637025, "learning_rate": 9.430995825956606e-06, "loss": 4.036373291015625, "step": 150900 }, { "epoch": 0.18220161694885292, "learning_rate": 9.430591990488868e-06, "loss": 4.003193359375, "step": 151000 }, { "epoch": 0.18232228027133562, "learning_rate": 9.43018815502113e-06, "loss": 4.0211181640625, "step": 151100 }, { "epoch": 0.1824429435938183, "learning_rate": 9.429784319553391e-06, "loss": 4.069910888671875, "step": 151200 }, { "epoch": 0.18256360691630097, "learning_rate": 9.429380484085653e-06, "loss": 4.06355712890625, "step": 151300 }, { "epoch": 0.18268427023878367, "learning_rate": 9.428976648617915e-06, "loss": 4.048116760253906, "step": 151400 }, { "epoch": 0.18280493356126634, "learning_rate": 9.428572813150176e-06, "loss": 4.045962829589843, "step": 151500 }, { "epoch": 0.18292559688374904, "learning_rate": 9.428168977682438e-06, "loss": 4.045631713867188, "step": 151600 }, { "epoch": 0.18304626020623171, "learning_rate": 9.427765142214698e-06, "loss": 4.052801818847656, "step": 151700 }, { "epoch": 0.18316692352871441, "learning_rate": 9.42736130674696e-06, "loss": 4.02794189453125, "step": 151800 }, { "epoch": 0.1832875868511971, "learning_rate": 9.426957471279222e-06, "loss": 4.015117492675781, "step": 151900 }, { "epoch": 0.18340825017367976, "learning_rate": 9.426553635811484e-06, "loss": 4.010919189453125, "step": 152000 }, { "epoch": 0.18352891349616246, "learning_rate": 9.426149800343746e-06, "loss": 4.0254150390625, "step": 152100 }, { "epoch": 0.18364957681864513, "learning_rate": 9.425745964876008e-06, "loss": 3.99409423828125, "step": 152200 }, { "epoch": 0.18377024014112783, "learning_rate": 9.42534212940827e-06, "loss": 4.019951477050781, "step": 152300 }, { "epoch": 0.1838909034636105, "learning_rate": 9.42493829394053e-06, "loss": 4.041195678710937, "step": 152400 }, { "epoch": 0.18401156678609318, "learning_rate": 9.424534458472792e-06, "loss": 4.027416381835938, "step": 152500 }, { "epoch": 0.18413223010857588, "learning_rate": 9.424130623005054e-06, "loss": 4.043953552246093, "step": 152600 }, { "epoch": 0.18425289343105855, "learning_rate": 9.423726787537314e-06, "loss": 4.022510070800781, "step": 152700 }, { "epoch": 0.18437355675354125, "learning_rate": 9.423322952069576e-06, "loss": 4.009160461425782, "step": 152800 }, { "epoch": 0.18449422007602392, "learning_rate": 9.422919116601838e-06, "loss": 4.020636901855469, "step": 152900 }, { "epoch": 0.18461488339850662, "learning_rate": 9.4225152811341e-06, "loss": 4.0316464233398435, "step": 153000 }, { "epoch": 0.1847355467209893, "learning_rate": 9.422111445666362e-06, "loss": 4.0219183349609375, "step": 153100 }, { "epoch": 0.18485621004347197, "learning_rate": 9.421707610198623e-06, "loss": 4.01727294921875, "step": 153200 }, { "epoch": 0.18497687336595467, "learning_rate": 9.421303774730885e-06, "loss": 4.0125732421875, "step": 153300 }, { "epoch": 0.18509753668843734, "learning_rate": 9.420899939263147e-06, "loss": 4.007660827636719, "step": 153400 }, { "epoch": 0.18521820001092004, "learning_rate": 9.420496103795409e-06, "loss": 3.996183166503906, "step": 153500 }, { "epoch": 0.18533886333340271, "learning_rate": 9.420092268327669e-06, "loss": 4.0167715454101565, "step": 153600 }, { "epoch": 0.1854595266558854, "learning_rate": 9.419688432859931e-06, "loss": 4.02603515625, "step": 153700 }, { "epoch": 0.1855801899783681, "learning_rate": 9.419284597392193e-06, "loss": 4.006358947753906, "step": 153800 }, { "epoch": 0.18570085330085076, "learning_rate": 9.418880761924455e-06, "loss": 4.02930908203125, "step": 153900 }, { "epoch": 0.18582151662333346, "learning_rate": 9.418476926456715e-06, "loss": 4.024056396484375, "step": 154000 }, { "epoch": 0.18594217994581613, "learning_rate": 9.418073090988977e-06, "loss": 4.001048889160156, "step": 154100 }, { "epoch": 0.1860628432682988, "learning_rate": 9.417669255521239e-06, "loss": 4.017117919921875, "step": 154200 }, { "epoch": 0.1861835065907815, "learning_rate": 9.417265420053501e-06, "loss": 3.9995022583007813, "step": 154300 }, { "epoch": 0.18630416991326418, "learning_rate": 9.416861584585763e-06, "loss": 3.9941656494140627, "step": 154400 }, { "epoch": 0.18642483323574688, "learning_rate": 9.416457749118025e-06, "loss": 3.992108154296875, "step": 154500 }, { "epoch": 0.18654549655822955, "learning_rate": 9.416053913650285e-06, "loss": 4.011061706542969, "step": 154600 }, { "epoch": 0.18666615988071225, "learning_rate": 9.415650078182547e-06, "loss": 4.010173034667969, "step": 154700 }, { "epoch": 0.18678682320319492, "learning_rate": 9.41524624271481e-06, "loss": 4.005847778320312, "step": 154800 }, { "epoch": 0.1869074865256776, "learning_rate": 9.41484240724707e-06, "loss": 4.026692504882813, "step": 154900 }, { "epoch": 0.1870281498481603, "learning_rate": 9.414438571779332e-06, "loss": 4.003030700683594, "step": 155000 }, { "epoch": 0.18714881317064297, "learning_rate": 9.414034736311594e-06, "loss": 3.986455078125, "step": 155100 }, { "epoch": 0.18726947649312567, "learning_rate": 9.413630900843856e-06, "loss": 3.9916006469726564, "step": 155200 }, { "epoch": 0.18739013981560834, "learning_rate": 9.413227065376118e-06, "loss": 4.001815185546875, "step": 155300 }, { "epoch": 0.18751080313809101, "learning_rate": 9.41282322990838e-06, "loss": 4.031525573730469, "step": 155400 }, { "epoch": 0.18763146646057371, "learning_rate": 9.41241939444064e-06, "loss": 4.016306762695312, "step": 155500 }, { "epoch": 0.1877521297830564, "learning_rate": 9.412015558972902e-06, "loss": 4.017903747558594, "step": 155600 }, { "epoch": 0.1878727931055391, "learning_rate": 9.411611723505164e-06, "loss": 3.995350646972656, "step": 155700 }, { "epoch": 0.18799345642802176, "learning_rate": 9.411207888037424e-06, "loss": 4.006609497070312, "step": 155800 }, { "epoch": 0.18811411975050446, "learning_rate": 9.410804052569686e-06, "loss": 4.022078247070312, "step": 155900 }, { "epoch": 0.18823478307298713, "learning_rate": 9.410400217101948e-06, "loss": 4.009051208496094, "step": 156000 }, { "epoch": 0.1883554463954698, "learning_rate": 9.40999638163421e-06, "loss": 4.0004119873046875, "step": 156100 }, { "epoch": 0.1884761097179525, "learning_rate": 9.409592546166472e-06, "loss": 3.9963970947265626, "step": 156200 }, { "epoch": 0.18859677304043518, "learning_rate": 9.409188710698734e-06, "loss": 3.958802490234375, "step": 156300 }, { "epoch": 0.18871743636291788, "learning_rate": 9.408784875230996e-06, "loss": 3.995546875, "step": 156400 }, { "epoch": 0.18883809968540055, "learning_rate": 9.408381039763256e-06, "loss": 4.009895935058593, "step": 156500 }, { "epoch": 0.18895876300788322, "learning_rate": 9.407977204295518e-06, "loss": 4.016905517578125, "step": 156600 }, { "epoch": 0.18907942633036592, "learning_rate": 9.407573368827779e-06, "loss": 3.996622314453125, "step": 156700 }, { "epoch": 0.1892000896528486, "learning_rate": 9.40716953336004e-06, "loss": 3.9768637084960936, "step": 156800 }, { "epoch": 0.1893207529753313, "learning_rate": 9.406765697892302e-06, "loss": 3.9941397094726563, "step": 156900 }, { "epoch": 0.18944141629781397, "learning_rate": 9.406361862424564e-06, "loss": 4.000443725585938, "step": 157000 }, { "epoch": 0.18956207962029667, "learning_rate": 9.405958026956826e-06, "loss": 3.9986016845703123, "step": 157100 }, { "epoch": 0.18968274294277934, "learning_rate": 9.405554191489088e-06, "loss": 3.9812774658203125, "step": 157200 }, { "epoch": 0.18980340626526201, "learning_rate": 9.405150356021349e-06, "loss": 3.9898141479492186, "step": 157300 }, { "epoch": 0.18992406958774471, "learning_rate": 9.40474652055361e-06, "loss": 3.9905380249023437, "step": 157400 }, { "epoch": 0.1900447329102274, "learning_rate": 9.404342685085873e-06, "loss": 3.9934176635742187, "step": 157500 }, { "epoch": 0.1901653962327101, "learning_rate": 9.403938849618135e-06, "loss": 3.9773764038085937, "step": 157600 }, { "epoch": 0.19028605955519276, "learning_rate": 9.403535014150395e-06, "loss": 3.9768081665039063, "step": 157700 }, { "epoch": 0.19040672287767543, "learning_rate": 9.403131178682657e-06, "loss": 3.9774356079101563, "step": 157800 }, { "epoch": 0.19052738620015813, "learning_rate": 9.402727343214919e-06, "loss": 3.984882507324219, "step": 157900 }, { "epoch": 0.1906480495226408, "learning_rate": 9.402323507747181e-06, "loss": 3.9816928100585938, "step": 158000 }, { "epoch": 0.1907687128451235, "learning_rate": 9.401919672279441e-06, "loss": 3.9713653564453124, "step": 158100 }, { "epoch": 0.19088937616760618, "learning_rate": 9.401515836811703e-06, "loss": 3.97996337890625, "step": 158200 }, { "epoch": 0.19101003949008888, "learning_rate": 9.401112001343965e-06, "loss": 3.9983935546875, "step": 158300 }, { "epoch": 0.19113070281257155, "learning_rate": 9.400708165876227e-06, "loss": 3.979936218261719, "step": 158400 }, { "epoch": 0.19125136613505422, "learning_rate": 9.400304330408489e-06, "loss": 3.9622076416015624, "step": 158500 }, { "epoch": 0.19137202945753692, "learning_rate": 9.39990049494075e-06, "loss": 3.994253845214844, "step": 158600 }, { "epoch": 0.1914926927800196, "learning_rate": 9.399496659473011e-06, "loss": 3.9754034423828126, "step": 158700 }, { "epoch": 0.1916133561025023, "learning_rate": 9.399092824005273e-06, "loss": 3.9619406127929686, "step": 158800 }, { "epoch": 0.19173401942498497, "learning_rate": 9.398688988537534e-06, "loss": 3.9780078125, "step": 158900 }, { "epoch": 0.19185468274746764, "learning_rate": 9.398285153069796e-06, "loss": 3.9652264404296873, "step": 159000 }, { "epoch": 0.19197534606995034, "learning_rate": 9.397881317602058e-06, "loss": 3.9717974853515625, "step": 159100 }, { "epoch": 0.19209600939243301, "learning_rate": 9.39747748213432e-06, "loss": 3.9876675415039062, "step": 159200 }, { "epoch": 0.19221667271491572, "learning_rate": 9.397073646666582e-06, "loss": 3.9908966064453124, "step": 159300 }, { "epoch": 0.1923373360373984, "learning_rate": 9.396669811198844e-06, "loss": 3.9443743896484373, "step": 159400 }, { "epoch": 0.1924579993598811, "learning_rate": 9.396265975731106e-06, "loss": 3.967160339355469, "step": 159500 }, { "epoch": 0.19257866268236376, "learning_rate": 9.395862140263366e-06, "loss": 3.9705538940429688, "step": 159600 }, { "epoch": 0.19269932600484643, "learning_rate": 9.395458304795628e-06, "loss": 4.003659973144531, "step": 159700 }, { "epoch": 0.19281998932732913, "learning_rate": 9.395054469327888e-06, "loss": 3.961138916015625, "step": 159800 }, { "epoch": 0.1929406526498118, "learning_rate": 9.39465063386015e-06, "loss": 3.9472125244140623, "step": 159900 }, { "epoch": 0.1930613159722945, "learning_rate": 9.394246798392412e-06, "loss": 3.961947021484375, "step": 160000 }, { "epoch": 0.19318197929477718, "learning_rate": 9.393842962924674e-06, "loss": 3.9489144897460937, "step": 160100 }, { "epoch": 0.19330264261725985, "learning_rate": 9.393439127456936e-06, "loss": 3.948178405761719, "step": 160200 }, { "epoch": 0.19342330593974255, "learning_rate": 9.393035291989198e-06, "loss": 3.9760037231445313, "step": 160300 }, { "epoch": 0.19354396926222522, "learning_rate": 9.39263145652146e-06, "loss": 3.9468838500976564, "step": 160400 }, { "epoch": 0.19366463258470792, "learning_rate": 9.39222762105372e-06, "loss": 3.9636865234375, "step": 160500 }, { "epoch": 0.1937852959071906, "learning_rate": 9.391823785585982e-06, "loss": 3.98802978515625, "step": 160600 }, { "epoch": 0.19390595922967327, "learning_rate": 9.391419950118244e-06, "loss": 3.943309020996094, "step": 160700 }, { "epoch": 0.19402662255215597, "learning_rate": 9.391016114650505e-06, "loss": 3.945246276855469, "step": 160800 }, { "epoch": 0.19414728587463864, "learning_rate": 9.390612279182767e-06, "loss": 3.943849792480469, "step": 160900 }, { "epoch": 0.19426794919712134, "learning_rate": 9.390208443715029e-06, "loss": 3.965051574707031, "step": 161000 }, { "epoch": 0.19438861251960401, "learning_rate": 9.38980460824729e-06, "loss": 3.9563021850585938, "step": 161100 }, { "epoch": 0.19450927584208672, "learning_rate": 9.389400772779552e-06, "loss": 3.9251171875, "step": 161200 }, { "epoch": 0.1946299391645694, "learning_rate": 9.388996937311814e-06, "loss": 3.9312396240234375, "step": 161300 }, { "epoch": 0.19475060248705206, "learning_rate": 9.388593101844075e-06, "loss": 3.945506591796875, "step": 161400 }, { "epoch": 0.19487126580953476, "learning_rate": 9.388189266376337e-06, "loss": 3.963096923828125, "step": 161500 }, { "epoch": 0.19499192913201743, "learning_rate": 9.387785430908599e-06, "loss": 3.951310729980469, "step": 161600 }, { "epoch": 0.19511259245450013, "learning_rate": 9.387381595440859e-06, "loss": 3.966768798828125, "step": 161700 }, { "epoch": 0.1952332557769828, "learning_rate": 9.386977759973121e-06, "loss": 3.9963201904296874, "step": 161800 }, { "epoch": 0.19535391909946548, "learning_rate": 9.386573924505383e-06, "loss": 3.9126287841796876, "step": 161900 }, { "epoch": 0.19547458242194818, "learning_rate": 9.386170089037645e-06, "loss": 3.967998046875, "step": 162000 }, { "epoch": 0.19559524574443085, "learning_rate": 9.385766253569907e-06, "loss": 3.973890686035156, "step": 162100 }, { "epoch": 0.19571590906691355, "learning_rate": 9.385362418102167e-06, "loss": 3.9504486083984376, "step": 162200 }, { "epoch": 0.19583657238939622, "learning_rate": 9.38495858263443e-06, "loss": 3.937174987792969, "step": 162300 }, { "epoch": 0.19595723571187892, "learning_rate": 9.384554747166691e-06, "loss": 3.95936279296875, "step": 162400 }, { "epoch": 0.1960778990343616, "learning_rate": 9.384150911698953e-06, "loss": 3.938043212890625, "step": 162500 }, { "epoch": 0.19619856235684427, "learning_rate": 9.383747076231215e-06, "loss": 3.968492431640625, "step": 162600 }, { "epoch": 0.19631922567932697, "learning_rate": 9.383343240763475e-06, "loss": 3.9378448486328126, "step": 162700 }, { "epoch": 0.19643988900180964, "learning_rate": 9.382939405295737e-06, "loss": 3.951314697265625, "step": 162800 }, { "epoch": 0.19656055232429234, "learning_rate": 9.382535569828e-06, "loss": 3.9318060302734374, "step": 162900 }, { "epoch": 0.19668121564677502, "learning_rate": 9.38213173436026e-06, "loss": 3.9562448120117186, "step": 163000 }, { "epoch": 0.1968018789692577, "learning_rate": 9.381727898892522e-06, "loss": 3.9357901000976563, "step": 163100 }, { "epoch": 0.1969225422917404, "learning_rate": 9.381324063424784e-06, "loss": 3.9316226196289064, "step": 163200 }, { "epoch": 0.19704320561422306, "learning_rate": 9.380920227957046e-06, "loss": 3.9586306762695314, "step": 163300 }, { "epoch": 0.19716386893670576, "learning_rate": 9.380516392489308e-06, "loss": 3.938726501464844, "step": 163400 }, { "epoch": 0.19728453225918843, "learning_rate": 9.38011255702157e-06, "loss": 3.940384826660156, "step": 163500 }, { "epoch": 0.19740519558167113, "learning_rate": 9.37970872155383e-06, "loss": 3.9382730102539063, "step": 163600 }, { "epoch": 0.1975258589041538, "learning_rate": 9.379304886086092e-06, "loss": 3.929862060546875, "step": 163700 }, { "epoch": 0.19764652222663648, "learning_rate": 9.378901050618354e-06, "loss": 3.934556884765625, "step": 163800 }, { "epoch": 0.19776718554911918, "learning_rate": 9.378497215150614e-06, "loss": 3.936484375, "step": 163900 }, { "epoch": 0.19788784887160185, "learning_rate": 9.378093379682876e-06, "loss": 3.9157168579101564, "step": 164000 }, { "epoch": 0.19800851219408455, "learning_rate": 9.377689544215138e-06, "loss": 3.92895263671875, "step": 164100 }, { "epoch": 0.19812917551656722, "learning_rate": 9.3772857087474e-06, "loss": 3.927414855957031, "step": 164200 }, { "epoch": 0.1982498388390499, "learning_rate": 9.376881873279662e-06, "loss": 3.9280136108398436, "step": 164300 }, { "epoch": 0.1983705021615326, "learning_rate": 9.376478037811924e-06, "loss": 3.951353759765625, "step": 164400 }, { "epoch": 0.19849116548401527, "learning_rate": 9.376074202344186e-06, "loss": 3.9360696411132814, "step": 164500 }, { "epoch": 0.19861182880649797, "learning_rate": 9.375670366876446e-06, "loss": 3.921869201660156, "step": 164600 }, { "epoch": 0.19873249212898064, "learning_rate": 9.375266531408708e-06, "loss": 3.925499267578125, "step": 164700 }, { "epoch": 0.19885315545146334, "learning_rate": 9.374862695940969e-06, "loss": 3.946710510253906, "step": 164800 }, { "epoch": 0.19897381877394602, "learning_rate": 9.37445886047323e-06, "loss": 3.8890890502929687, "step": 164900 }, { "epoch": 0.1990944820964287, "learning_rate": 9.374055025005493e-06, "loss": 3.9316473388671875, "step": 165000 }, { "epoch": 0.1992151454189114, "learning_rate": 9.373651189537755e-06, "loss": 3.92435546875, "step": 165100 }, { "epoch": 0.19933580874139406, "learning_rate": 9.373247354070017e-06, "loss": 3.9189715576171875, "step": 165200 }, { "epoch": 0.19945647206387676, "learning_rate": 9.372843518602279e-06, "loss": 3.904657287597656, "step": 165300 }, { "epoch": 0.19957713538635943, "learning_rate": 9.37243968313454e-06, "loss": 3.9273565673828124, "step": 165400 }, { "epoch": 0.1996977987088421, "learning_rate": 9.3720358476668e-06, "loss": 3.94675537109375, "step": 165500 }, { "epoch": 0.1998184620313248, "learning_rate": 9.371632012199063e-06, "loss": 3.9269332885742188, "step": 165600 }, { "epoch": 0.19993912535380748, "learning_rate": 9.371228176731325e-06, "loss": 3.9447283935546875, "step": 165700 }, { "epoch": 0.20005978867629018, "learning_rate": 9.370824341263585e-06, "loss": 3.9161105346679688, "step": 165800 }, { "epoch": 0.20018045199877285, "learning_rate": 9.370420505795847e-06, "loss": 3.913367919921875, "step": 165900 }, { "epoch": 0.20030111532125555, "learning_rate": 9.370016670328109e-06, "loss": 3.90974365234375, "step": 166000 }, { "epoch": 0.20042177864373822, "learning_rate": 9.369612834860371e-06, "loss": 3.916065979003906, "step": 166100 }, { "epoch": 0.2005424419662209, "learning_rate": 9.369208999392633e-06, "loss": 3.9042202758789064, "step": 166200 }, { "epoch": 0.2006631052887036, "learning_rate": 9.368805163924893e-06, "loss": 3.9106549072265624, "step": 166300 }, { "epoch": 0.20078376861118627, "learning_rate": 9.368401328457155e-06, "loss": 3.9116033935546874, "step": 166400 }, { "epoch": 0.20090443193366897, "learning_rate": 9.367997492989417e-06, "loss": 3.9169955444335938, "step": 166500 }, { "epoch": 0.20102509525615164, "learning_rate": 9.36759365752168e-06, "loss": 3.897344055175781, "step": 166600 }, { "epoch": 0.20114575857863431, "learning_rate": 9.367189822053941e-06, "loss": 3.8958749389648437, "step": 166700 }, { "epoch": 0.20126642190111702, "learning_rate": 9.366785986586201e-06, "loss": 3.917710266113281, "step": 166800 }, { "epoch": 0.2013870852235997, "learning_rate": 9.366382151118463e-06, "loss": 3.93051025390625, "step": 166900 }, { "epoch": 0.2015077485460824, "learning_rate": 9.365978315650725e-06, "loss": 3.91257080078125, "step": 167000 }, { "epoch": 0.20162841186856506, "learning_rate": 9.365574480182986e-06, "loss": 3.8849337768554686, "step": 167100 }, { "epoch": 0.20174907519104773, "learning_rate": 9.365170644715248e-06, "loss": 3.9154803466796877, "step": 167200 }, { "epoch": 0.20186973851353043, "learning_rate": 9.36476680924751e-06, "loss": 3.9124334716796874, "step": 167300 }, { "epoch": 0.2019904018360131, "learning_rate": 9.364362973779772e-06, "loss": 3.9076419067382813, "step": 167400 }, { "epoch": 0.2021110651584958, "learning_rate": 9.363959138312034e-06, "loss": 3.9181591796875, "step": 167500 }, { "epoch": 0.20223172848097848, "learning_rate": 9.363555302844296e-06, "loss": 3.9095223999023436, "step": 167600 }, { "epoch": 0.20235239180346118, "learning_rate": 9.363151467376556e-06, "loss": 3.9223626708984374, "step": 167700 }, { "epoch": 0.20247305512594385, "learning_rate": 9.362747631908818e-06, "loss": 3.908642578125, "step": 167800 }, { "epoch": 0.20259371844842652, "learning_rate": 9.36234379644108e-06, "loss": 3.912618408203125, "step": 167900 }, { "epoch": 0.20271438177090922, "learning_rate": 9.36193996097334e-06, "loss": 3.891865234375, "step": 168000 }, { "epoch": 0.2028350450933919, "learning_rate": 9.361536125505602e-06, "loss": 3.887584533691406, "step": 168100 }, { "epoch": 0.2029557084158746, "learning_rate": 9.361132290037864e-06, "loss": 3.902679443359375, "step": 168200 }, { "epoch": 0.20307637173835727, "learning_rate": 9.360728454570126e-06, "loss": 3.901674499511719, "step": 168300 }, { "epoch": 0.20319703506083994, "learning_rate": 9.360324619102388e-06, "loss": 3.8855657958984375, "step": 168400 }, { "epoch": 0.20331769838332264, "learning_rate": 9.35992078363465e-06, "loss": 3.9087725830078126, "step": 168500 }, { "epoch": 0.20343836170580532, "learning_rate": 9.359516948166912e-06, "loss": 3.8916744995117187, "step": 168600 }, { "epoch": 0.20355902502828802, "learning_rate": 9.359113112699172e-06, "loss": 3.903193054199219, "step": 168700 }, { "epoch": 0.2036796883507707, "learning_rate": 9.358709277231434e-06, "loss": 3.9031878662109376, "step": 168800 }, { "epoch": 0.2038003516732534, "learning_rate": 9.358305441763695e-06, "loss": 3.8811785888671877, "step": 168900 }, { "epoch": 0.20392101499573606, "learning_rate": 9.357901606295957e-06, "loss": 3.9057913208007813, "step": 169000 }, { "epoch": 0.20404167831821873, "learning_rate": 9.357497770828219e-06, "loss": 3.9004705810546874, "step": 169100 }, { "epoch": 0.20416234164070143, "learning_rate": 9.35709393536048e-06, "loss": 3.9152734375, "step": 169200 }, { "epoch": 0.2042830049631841, "learning_rate": 9.356690099892743e-06, "loss": 3.8760000610351564, "step": 169300 }, { "epoch": 0.2044036682856668, "learning_rate": 9.356286264425005e-06, "loss": 3.8949551391601562, "step": 169400 }, { "epoch": 0.20452433160814948, "learning_rate": 9.355882428957265e-06, "loss": 3.9081497192382812, "step": 169500 }, { "epoch": 0.20464499493063215, "learning_rate": 9.355478593489527e-06, "loss": 3.891767578125, "step": 169600 }, { "epoch": 0.20476565825311485, "learning_rate": 9.355074758021789e-06, "loss": 3.9051165771484375, "step": 169700 }, { "epoch": 0.20488632157559752, "learning_rate": 9.35467092255405e-06, "loss": 3.880681457519531, "step": 169800 }, { "epoch": 0.20500698489808022, "learning_rate": 9.354267087086311e-06, "loss": 3.882630615234375, "step": 169900 }, { "epoch": 0.2051276482205629, "learning_rate": 9.353863251618573e-06, "loss": 3.9082928466796876, "step": 170000 }, { "epoch": 0.2052483115430456, "learning_rate": 9.353459416150835e-06, "loss": 3.9023587036132814, "step": 170100 }, { "epoch": 0.20536897486552827, "learning_rate": 9.353055580683097e-06, "loss": 3.9219537353515626, "step": 170200 }, { "epoch": 0.20548963818801094, "learning_rate": 9.352651745215359e-06, "loss": 3.891326599121094, "step": 170300 }, { "epoch": 0.20561030151049364, "learning_rate": 9.35224790974762e-06, "loss": 3.893621826171875, "step": 170400 }, { "epoch": 0.20573096483297632, "learning_rate": 9.351844074279881e-06, "loss": 3.890181579589844, "step": 170500 }, { "epoch": 0.20585162815545902, "learning_rate": 9.351440238812143e-06, "loss": 3.882404479980469, "step": 170600 }, { "epoch": 0.2059722914779417, "learning_rate": 9.351036403344405e-06, "loss": 3.9055499267578124, "step": 170700 }, { "epoch": 0.20609295480042436, "learning_rate": 9.350632567876666e-06, "loss": 3.8784725952148436, "step": 170800 }, { "epoch": 0.20621361812290706, "learning_rate": 9.350228732408927e-06, "loss": 3.8956500244140626, "step": 170900 }, { "epoch": 0.20633428144538973, "learning_rate": 9.34982489694119e-06, "loss": 3.8820159912109373, "step": 171000 }, { "epoch": 0.20645494476787243, "learning_rate": 9.349421061473451e-06, "loss": 3.862356872558594, "step": 171100 }, { "epoch": 0.2065756080903551, "learning_rate": 9.349017226005712e-06, "loss": 3.8845086669921876, "step": 171200 }, { "epoch": 0.2066962714128378, "learning_rate": 9.348613390537974e-06, "loss": 3.8948565673828126, "step": 171300 }, { "epoch": 0.20681693473532048, "learning_rate": 9.348209555070236e-06, "loss": 3.9076422119140624, "step": 171400 }, { "epoch": 0.20693759805780315, "learning_rate": 9.347805719602498e-06, "loss": 3.8729852294921874, "step": 171500 }, { "epoch": 0.20705826138028585, "learning_rate": 9.34740188413476e-06, "loss": 3.870924072265625, "step": 171600 }, { "epoch": 0.20717892470276852, "learning_rate": 9.346998048667022e-06, "loss": 3.8728848266601563, "step": 171700 }, { "epoch": 0.20729958802525122, "learning_rate": 9.346594213199282e-06, "loss": 3.8923126220703126, "step": 171800 }, { "epoch": 0.2074202513477339, "learning_rate": 9.346190377731544e-06, "loss": 3.875132751464844, "step": 171900 }, { "epoch": 0.20754091467021657, "learning_rate": 9.345786542263804e-06, "loss": 3.858740234375, "step": 172000 }, { "epoch": 0.20766157799269927, "learning_rate": 9.345382706796066e-06, "loss": 3.896944885253906, "step": 172100 }, { "epoch": 0.20778224131518194, "learning_rate": 9.344978871328328e-06, "loss": 3.865123596191406, "step": 172200 }, { "epoch": 0.20790290463766464, "learning_rate": 9.34457503586059e-06, "loss": 3.870838317871094, "step": 172300 }, { "epoch": 0.20802356796014732, "learning_rate": 9.344171200392852e-06, "loss": 3.852091979980469, "step": 172400 }, { "epoch": 0.20814423128263002, "learning_rate": 9.343767364925114e-06, "loss": 3.8722979736328127, "step": 172500 }, { "epoch": 0.2082648946051127, "learning_rate": 9.343363529457376e-06, "loss": 3.868000793457031, "step": 172600 }, { "epoch": 0.20838555792759536, "learning_rate": 9.342959693989636e-06, "loss": 3.8725985717773437, "step": 172700 }, { "epoch": 0.20850622125007806, "learning_rate": 9.342555858521898e-06, "loss": 3.8823471069335938, "step": 172800 }, { "epoch": 0.20862688457256073, "learning_rate": 9.34215202305416e-06, "loss": 3.8700616455078123, "step": 172900 }, { "epoch": 0.20874754789504343, "learning_rate": 9.34174818758642e-06, "loss": 3.8738943481445314, "step": 173000 }, { "epoch": 0.2088682112175261, "learning_rate": 9.341344352118683e-06, "loss": 3.851153564453125, "step": 173100 }, { "epoch": 0.20898887454000878, "learning_rate": 9.340940516650945e-06, "loss": 3.8581884765625, "step": 173200 }, { "epoch": 0.20910953786249148, "learning_rate": 9.340536681183207e-06, "loss": 3.873965148925781, "step": 173300 }, { "epoch": 0.20923020118497415, "learning_rate": 9.340132845715469e-06, "loss": 3.8880624389648437, "step": 173400 }, { "epoch": 0.20935086450745685, "learning_rate": 9.33972901024773e-06, "loss": 3.8819808959960938, "step": 173500 }, { "epoch": 0.20947152782993952, "learning_rate": 9.339325174779991e-06, "loss": 3.8697860717773436, "step": 173600 }, { "epoch": 0.2095921911524222, "learning_rate": 9.338921339312253e-06, "loss": 3.8486712646484373, "step": 173700 }, { "epoch": 0.2097128544749049, "learning_rate": 9.338517503844515e-06, "loss": 3.879408264160156, "step": 173800 }, { "epoch": 0.20983351779738757, "learning_rate": 9.338113668376775e-06, "loss": 3.878307189941406, "step": 173900 }, { "epoch": 0.20995418111987027, "learning_rate": 9.337709832909037e-06, "loss": 3.856025390625, "step": 174000 }, { "epoch": 0.21007484444235294, "learning_rate": 9.337305997441299e-06, "loss": 3.864388427734375, "step": 174100 }, { "epoch": 0.21019550776483564, "learning_rate": 9.336902161973561e-06, "loss": 3.840981140136719, "step": 174200 }, { "epoch": 0.21031617108731832, "learning_rate": 9.336498326505823e-06, "loss": 3.8313128662109377, "step": 174300 }, { "epoch": 0.210436834409801, "learning_rate": 9.336094491038083e-06, "loss": 3.880459899902344, "step": 174400 }, { "epoch": 0.2105574977322837, "learning_rate": 9.335690655570345e-06, "loss": 3.8525216674804685, "step": 174500 }, { "epoch": 0.21067816105476636, "learning_rate": 9.335286820102607e-06, "loss": 3.859064636230469, "step": 174600 }, { "epoch": 0.21079882437724906, "learning_rate": 9.33488298463487e-06, "loss": 3.8755914306640626, "step": 174700 }, { "epoch": 0.21091948769973173, "learning_rate": 9.334479149167131e-06, "loss": 3.8529559326171876, "step": 174800 }, { "epoch": 0.2110401510222144, "learning_rate": 9.334075313699392e-06, "loss": 3.8421771240234377, "step": 174900 }, { "epoch": 0.2111608143446971, "learning_rate": 9.333671478231654e-06, "loss": 3.8353622436523436, "step": 175000 }, { "epoch": 0.21128147766717978, "learning_rate": 9.333267642763916e-06, "loss": 3.879399719238281, "step": 175100 }, { "epoch": 0.21140214098966248, "learning_rate": 9.332863807296177e-06, "loss": 3.85759765625, "step": 175200 }, { "epoch": 0.21152280431214515, "learning_rate": 9.332459971828438e-06, "loss": 3.827712097167969, "step": 175300 }, { "epoch": 0.21164346763462785, "learning_rate": 9.3320561363607e-06, "loss": 3.87615966796875, "step": 175400 }, { "epoch": 0.21176413095711052, "learning_rate": 9.331652300892962e-06, "loss": 3.8824026489257815, "step": 175500 }, { "epoch": 0.2118847942795932, "learning_rate": 9.331248465425224e-06, "loss": 3.8432635498046874, "step": 175600 }, { "epoch": 0.2120054576020759, "learning_rate": 9.330844629957486e-06, "loss": 3.834368896484375, "step": 175700 }, { "epoch": 0.21212612092455857, "learning_rate": 9.330440794489746e-06, "loss": 3.8644479370117186, "step": 175800 }, { "epoch": 0.21224678424704127, "learning_rate": 9.330036959022008e-06, "loss": 3.830558166503906, "step": 175900 }, { "epoch": 0.21236744756952394, "learning_rate": 9.32963312355427e-06, "loss": 3.849298095703125, "step": 176000 }, { "epoch": 0.21248811089200662, "learning_rate": 9.32922928808653e-06, "loss": 3.871258544921875, "step": 176100 }, { "epoch": 0.21260877421448932, "learning_rate": 9.328825452618792e-06, "loss": 3.8467529296875, "step": 176200 }, { "epoch": 0.212729437536972, "learning_rate": 9.328421617151054e-06, "loss": 3.833404541015625, "step": 176300 }, { "epoch": 0.2128501008594547, "learning_rate": 9.328017781683316e-06, "loss": 3.8632907104492187, "step": 176400 }, { "epoch": 0.21297076418193736, "learning_rate": 9.327613946215578e-06, "loss": 3.8525067138671876, "step": 176500 }, { "epoch": 0.21309142750442006, "learning_rate": 9.32721011074784e-06, "loss": 3.8538772583007814, "step": 176600 }, { "epoch": 0.21321209082690273, "learning_rate": 9.326806275280102e-06, "loss": 3.8527908325195312, "step": 176700 }, { "epoch": 0.2133327541493854, "learning_rate": 9.326402439812362e-06, "loss": 3.8154119873046874, "step": 176800 }, { "epoch": 0.2134534174718681, "learning_rate": 9.325998604344624e-06, "loss": 3.833676452636719, "step": 176900 }, { "epoch": 0.21357408079435078, "learning_rate": 9.325594768876885e-06, "loss": 3.8553839111328125, "step": 177000 }, { "epoch": 0.21369474411683348, "learning_rate": 9.325190933409147e-06, "loss": 3.8368209838867187, "step": 177100 }, { "epoch": 0.21381540743931615, "learning_rate": 9.324787097941409e-06, "loss": 3.82350830078125, "step": 177200 }, { "epoch": 0.21393607076179882, "learning_rate": 9.32438326247367e-06, "loss": 3.8502886962890623, "step": 177300 }, { "epoch": 0.21405673408428152, "learning_rate": 9.323979427005933e-06, "loss": 3.850924377441406, "step": 177400 }, { "epoch": 0.2141773974067642, "learning_rate": 9.323575591538195e-06, "loss": 3.8369631958007813, "step": 177500 }, { "epoch": 0.2142980607292469, "learning_rate": 9.323171756070457e-06, "loss": 3.81966552734375, "step": 177600 }, { "epoch": 0.21441872405172957, "learning_rate": 9.322767920602717e-06, "loss": 3.8794818115234375, "step": 177700 }, { "epoch": 0.21453938737421227, "learning_rate": 9.322364085134979e-06, "loss": 3.82856689453125, "step": 177800 }, { "epoch": 0.21466005069669494, "learning_rate": 9.321960249667241e-06, "loss": 3.8288058471679687, "step": 177900 }, { "epoch": 0.21478071401917762, "learning_rate": 9.321556414199501e-06, "loss": 3.831231689453125, "step": 178000 }, { "epoch": 0.21490137734166032, "learning_rate": 9.321152578731763e-06, "loss": 3.8515533447265624, "step": 178100 }, { "epoch": 0.215022040664143, "learning_rate": 9.320748743264025e-06, "loss": 3.857205505371094, "step": 178200 }, { "epoch": 0.2151427039866257, "learning_rate": 9.320344907796287e-06, "loss": 3.8408935546875, "step": 178300 }, { "epoch": 0.21526336730910836, "learning_rate": 9.319941072328549e-06, "loss": 3.83988525390625, "step": 178400 }, { "epoch": 0.21538403063159103, "learning_rate": 9.31953723686081e-06, "loss": 3.828887634277344, "step": 178500 }, { "epoch": 0.21550469395407373, "learning_rate": 9.319133401393071e-06, "loss": 3.840606994628906, "step": 178600 }, { "epoch": 0.2156253572765564, "learning_rate": 9.318729565925333e-06, "loss": 3.832397155761719, "step": 178700 }, { "epoch": 0.2157460205990391, "learning_rate": 9.318325730457595e-06, "loss": 3.8263336181640626, "step": 178800 }, { "epoch": 0.21586668392152178, "learning_rate": 9.317921894989856e-06, "loss": 3.80751708984375, "step": 178900 }, { "epoch": 0.21598734724400448, "learning_rate": 9.317518059522118e-06, "loss": 3.8040643310546876, "step": 179000 }, { "epoch": 0.21610801056648715, "learning_rate": 9.31711422405438e-06, "loss": 3.814153137207031, "step": 179100 }, { "epoch": 0.21622867388896982, "learning_rate": 9.316710388586642e-06, "loss": 3.8432388305664062, "step": 179200 }, { "epoch": 0.21634933721145252, "learning_rate": 9.316306553118902e-06, "loss": 3.816586608886719, "step": 179300 }, { "epoch": 0.2164700005339352, "learning_rate": 9.315902717651164e-06, "loss": 3.861735534667969, "step": 179400 }, { "epoch": 0.2165906638564179, "learning_rate": 9.315498882183426e-06, "loss": 3.8271188354492187, "step": 179500 }, { "epoch": 0.21671132717890057, "learning_rate": 9.315095046715688e-06, "loss": 3.8121441650390624, "step": 179600 }, { "epoch": 0.21683199050138324, "learning_rate": 9.31469121124795e-06, "loss": 3.8089938354492188, "step": 179700 }, { "epoch": 0.21695265382386594, "learning_rate": 9.314287375780212e-06, "loss": 3.844149475097656, "step": 179800 }, { "epoch": 0.21707331714634862, "learning_rate": 9.313883540312472e-06, "loss": 3.8364193725585936, "step": 179900 }, { "epoch": 0.21719398046883132, "learning_rate": 9.313479704844734e-06, "loss": 3.8371978759765626, "step": 180000 }, { "epoch": 0.217314643791314, "learning_rate": 9.313075869376996e-06, "loss": 3.8046685791015626, "step": 180100 }, { "epoch": 0.21743530711379666, "learning_rate": 9.312672033909256e-06, "loss": 3.8093197631835936, "step": 180200 }, { "epoch": 0.21755597043627936, "learning_rate": 9.312268198441518e-06, "loss": 3.820914001464844, "step": 180300 }, { "epoch": 0.21767663375876203, "learning_rate": 9.31186436297378e-06, "loss": 3.8356719970703126, "step": 180400 }, { "epoch": 0.21779729708124473, "learning_rate": 9.311460527506042e-06, "loss": 3.805845031738281, "step": 180500 }, { "epoch": 0.2179179604037274, "learning_rate": 9.311056692038304e-06, "loss": 3.83080078125, "step": 180600 }, { "epoch": 0.2180386237262101, "learning_rate": 9.310652856570566e-06, "loss": 3.8284832763671877, "step": 180700 }, { "epoch": 0.21815928704869278, "learning_rate": 9.310249021102828e-06, "loss": 3.7746923828125, "step": 180800 }, { "epoch": 0.21827995037117545, "learning_rate": 9.309845185635088e-06, "loss": 3.8273052978515625, "step": 180900 }, { "epoch": 0.21840061369365815, "learning_rate": 9.30944135016735e-06, "loss": 3.7906207275390624, "step": 181000 }, { "epoch": 0.21852127701614082, "learning_rate": 9.30903751469961e-06, "loss": 3.8062454223632813, "step": 181100 }, { "epoch": 0.21864194033862352, "learning_rate": 9.308633679231873e-06, "loss": 3.8278863525390623, "step": 181200 }, { "epoch": 0.2187626036611062, "learning_rate": 9.308229843764135e-06, "loss": 3.845267639160156, "step": 181300 }, { "epoch": 0.21888326698358887, "learning_rate": 9.307826008296397e-06, "loss": 3.819762878417969, "step": 181400 }, { "epoch": 0.21900393030607157, "learning_rate": 9.307422172828659e-06, "loss": 3.8009677124023438, "step": 181500 }, { "epoch": 0.21912459362855424, "learning_rate": 9.30701833736092e-06, "loss": 3.803919677734375, "step": 181600 }, { "epoch": 0.21924525695103694, "learning_rate": 9.306614501893183e-06, "loss": 3.797157897949219, "step": 181700 }, { "epoch": 0.21936592027351962, "learning_rate": 9.306210666425443e-06, "loss": 3.83072509765625, "step": 181800 }, { "epoch": 0.21948658359600232, "learning_rate": 9.305806830957705e-06, "loss": 3.7823165893554687, "step": 181900 }, { "epoch": 0.219607246918485, "learning_rate": 9.305402995489967e-06, "loss": 3.815687255859375, "step": 182000 }, { "epoch": 0.21972791024096766, "learning_rate": 9.304999160022227e-06, "loss": 3.82070556640625, "step": 182100 }, { "epoch": 0.21984857356345036, "learning_rate": 9.30459532455449e-06, "loss": 3.798536682128906, "step": 182200 }, { "epoch": 0.21996923688593303, "learning_rate": 9.304191489086751e-06, "loss": 3.8398867797851564, "step": 182300 }, { "epoch": 0.22008990020841573, "learning_rate": 9.303787653619013e-06, "loss": 3.8175033569335937, "step": 182400 }, { "epoch": 0.2202105635308984, "learning_rate": 9.303383818151275e-06, "loss": 3.8130667114257815, "step": 182500 }, { "epoch": 0.22033122685338108, "learning_rate": 9.302979982683535e-06, "loss": 3.8300772094726563, "step": 182600 }, { "epoch": 0.22045189017586378, "learning_rate": 9.302576147215797e-06, "loss": 3.801288757324219, "step": 182700 }, { "epoch": 0.22057255349834645, "learning_rate": 9.30217231174806e-06, "loss": 3.803774719238281, "step": 182800 }, { "epoch": 0.22069321682082915, "learning_rate": 9.301768476280321e-06, "loss": 3.7768594360351564, "step": 182900 }, { "epoch": 0.22081388014331182, "learning_rate": 9.301364640812582e-06, "loss": 3.8130340576171875, "step": 183000 }, { "epoch": 0.22093454346579453, "learning_rate": 9.300960805344844e-06, "loss": 3.803114013671875, "step": 183100 }, { "epoch": 0.2210552067882772, "learning_rate": 9.300556969877106e-06, "loss": 3.8122787475585938, "step": 183200 }, { "epoch": 0.22117587011075987, "learning_rate": 9.300153134409368e-06, "loss": 3.7887149047851563, "step": 183300 }, { "epoch": 0.22129653343324257, "learning_rate": 9.299749298941628e-06, "loss": 3.8040652465820313, "step": 183400 }, { "epoch": 0.22141719675572524, "learning_rate": 9.29934546347389e-06, "loss": 3.8092083740234375, "step": 183500 }, { "epoch": 0.22153786007820794, "learning_rate": 9.298941628006152e-06, "loss": 3.800281982421875, "step": 183600 }, { "epoch": 0.22165852340069062, "learning_rate": 9.298537792538414e-06, "loss": 3.8207421875, "step": 183700 }, { "epoch": 0.2217791867231733, "learning_rate": 9.298133957070676e-06, "loss": 3.8118405151367187, "step": 183800 }, { "epoch": 0.221899850045656, "learning_rate": 9.297730121602938e-06, "loss": 3.782644958496094, "step": 183900 }, { "epoch": 0.22202051336813866, "learning_rate": 9.297326286135198e-06, "loss": 3.8218756103515625, "step": 184000 }, { "epoch": 0.22214117669062136, "learning_rate": 9.29692245066746e-06, "loss": 3.771357421875, "step": 184100 }, { "epoch": 0.22226184001310403, "learning_rate": 9.29651861519972e-06, "loss": 3.796797180175781, "step": 184200 }, { "epoch": 0.22238250333558673, "learning_rate": 9.296114779731982e-06, "loss": 3.788507995605469, "step": 184300 }, { "epoch": 0.2225031666580694, "learning_rate": 9.295710944264244e-06, "loss": 3.787674560546875, "step": 184400 }, { "epoch": 0.22262382998055208, "learning_rate": 9.295307108796506e-06, "loss": 3.7998928833007812, "step": 184500 }, { "epoch": 0.22274449330303478, "learning_rate": 9.294903273328768e-06, "loss": 3.7879794311523436, "step": 184600 }, { "epoch": 0.22286515662551745, "learning_rate": 9.29449943786103e-06, "loss": 3.7838589477539064, "step": 184700 }, { "epoch": 0.22298581994800015, "learning_rate": 9.294095602393292e-06, "loss": 3.8012313842773438, "step": 184800 }, { "epoch": 0.22310648327048282, "learning_rate": 9.293691766925553e-06, "loss": 3.784291076660156, "step": 184900 }, { "epoch": 0.2232271465929655, "learning_rate": 9.293287931457815e-06, "loss": 3.8197982788085936, "step": 185000 }, { "epoch": 0.2233478099154482, "learning_rate": 9.292884095990076e-06, "loss": 3.8027383422851564, "step": 185100 }, { "epoch": 0.22346847323793087, "learning_rate": 9.292480260522337e-06, "loss": 3.7904058837890626, "step": 185200 }, { "epoch": 0.22358913656041357, "learning_rate": 9.292076425054599e-06, "loss": 3.794341735839844, "step": 185300 }, { "epoch": 0.22370979988289624, "learning_rate": 9.29167258958686e-06, "loss": 3.791290588378906, "step": 185400 }, { "epoch": 0.22383046320537894, "learning_rate": 9.291268754119123e-06, "loss": 3.8027297973632814, "step": 185500 }, { "epoch": 0.22395112652786162, "learning_rate": 9.290864918651385e-06, "loss": 3.7950787353515625, "step": 185600 }, { "epoch": 0.2240717898503443, "learning_rate": 9.290461083183647e-06, "loss": 3.767216796875, "step": 185700 }, { "epoch": 0.224192453172827, "learning_rate": 9.290057247715909e-06, "loss": 3.77049560546875, "step": 185800 }, { "epoch": 0.22431311649530966, "learning_rate": 9.289653412248169e-06, "loss": 3.7954052734375, "step": 185900 }, { "epoch": 0.22443377981779236, "learning_rate": 9.289249576780431e-06, "loss": 3.794927978515625, "step": 186000 }, { "epoch": 0.22455444314027503, "learning_rate": 9.288845741312691e-06, "loss": 3.8113580322265626, "step": 186100 }, { "epoch": 0.2246751064627577, "learning_rate": 9.288441905844953e-06, "loss": 3.784781188964844, "step": 186200 }, { "epoch": 0.2247957697852404, "learning_rate": 9.288038070377215e-06, "loss": 3.7929623413085936, "step": 186300 }, { "epoch": 0.22491643310772308, "learning_rate": 9.287634234909477e-06, "loss": 3.799100341796875, "step": 186400 }, { "epoch": 0.22503709643020578, "learning_rate": 9.28723039944174e-06, "loss": 3.7763958740234376, "step": 186500 }, { "epoch": 0.22515775975268845, "learning_rate": 9.286826563974001e-06, "loss": 3.769142761230469, "step": 186600 }, { "epoch": 0.22527842307517112, "learning_rate": 9.286422728506261e-06, "loss": 3.782398986816406, "step": 186700 }, { "epoch": 0.22539908639765383, "learning_rate": 9.286018893038523e-06, "loss": 3.7773593139648436, "step": 186800 }, { "epoch": 0.2255197497201365, "learning_rate": 9.285615057570785e-06, "loss": 3.775775146484375, "step": 186900 }, { "epoch": 0.2256404130426192, "learning_rate": 9.285211222103047e-06, "loss": 3.769295349121094, "step": 187000 }, { "epoch": 0.22576107636510187, "learning_rate": 9.284807386635308e-06, "loss": 3.772156982421875, "step": 187100 }, { "epoch": 0.22588173968758457, "learning_rate": 9.28440355116757e-06, "loss": 3.75919677734375, "step": 187200 }, { "epoch": 0.22600240301006724, "learning_rate": 9.283999715699832e-06, "loss": 3.76804443359375, "step": 187300 }, { "epoch": 0.22612306633254992, "learning_rate": 9.283595880232094e-06, "loss": 3.7640045166015623, "step": 187400 }, { "epoch": 0.22624372965503262, "learning_rate": 9.283192044764354e-06, "loss": 3.7552081298828126, "step": 187500 }, { "epoch": 0.2263643929775153, "learning_rate": 9.282788209296616e-06, "loss": 3.7742254638671877, "step": 187600 }, { "epoch": 0.226485056299998, "learning_rate": 9.282384373828878e-06, "loss": 3.7708554077148437, "step": 187700 }, { "epoch": 0.22660571962248066, "learning_rate": 9.28198053836114e-06, "loss": 3.781942138671875, "step": 187800 }, { "epoch": 0.22672638294496333, "learning_rate": 9.281576702893402e-06, "loss": 3.7824172973632812, "step": 187900 }, { "epoch": 0.22684704626744603, "learning_rate": 9.281172867425662e-06, "loss": 3.7651132202148436, "step": 188000 }, { "epoch": 0.2269677095899287, "learning_rate": 9.280769031957924e-06, "loss": 3.771176452636719, "step": 188100 }, { "epoch": 0.2270883729124114, "learning_rate": 9.280365196490186e-06, "loss": 3.8021160888671877, "step": 188200 }, { "epoch": 0.22720903623489408, "learning_rate": 9.279961361022446e-06, "loss": 3.779035949707031, "step": 188300 }, { "epoch": 0.22732969955737678, "learning_rate": 9.279557525554708e-06, "loss": 3.78049072265625, "step": 188400 }, { "epoch": 0.22745036287985945, "learning_rate": 9.27915369008697e-06, "loss": 3.7830355834960936, "step": 188500 }, { "epoch": 0.22757102620234212, "learning_rate": 9.278749854619232e-06, "loss": 3.775142822265625, "step": 188600 }, { "epoch": 0.22769168952482483, "learning_rate": 9.278346019151494e-06, "loss": 3.7713577270507814, "step": 188700 }, { "epoch": 0.2278123528473075, "learning_rate": 9.277942183683756e-06, "loss": 3.764349060058594, "step": 188800 }, { "epoch": 0.2279330161697902, "learning_rate": 9.277538348216018e-06, "loss": 3.7626797485351564, "step": 188900 }, { "epoch": 0.22805367949227287, "learning_rate": 9.277134512748279e-06, "loss": 3.7513308715820313, "step": 189000 }, { "epoch": 0.22817434281475554, "learning_rate": 9.27673067728054e-06, "loss": 3.7844378662109377, "step": 189100 }, { "epoch": 0.22829500613723824, "learning_rate": 9.2763268418128e-06, "loss": 3.776136474609375, "step": 189200 }, { "epoch": 0.22841566945972092, "learning_rate": 9.275923006345063e-06, "loss": 3.766302490234375, "step": 189300 }, { "epoch": 0.22853633278220362, "learning_rate": 9.275519170877325e-06, "loss": 3.7739431762695315, "step": 189400 }, { "epoch": 0.2286569961046863, "learning_rate": 9.275115335409587e-06, "loss": 3.746210632324219, "step": 189500 }, { "epoch": 0.228777659427169, "learning_rate": 9.274711499941849e-06, "loss": 3.7465924072265624, "step": 189600 }, { "epoch": 0.22889832274965166, "learning_rate": 9.27430766447411e-06, "loss": 3.7799801635742187, "step": 189700 }, { "epoch": 0.22901898607213433, "learning_rate": 9.273903829006373e-06, "loss": 3.725357666015625, "step": 189800 }, { "epoch": 0.22913964939461703, "learning_rate": 9.273499993538633e-06, "loss": 3.75540283203125, "step": 189900 }, { "epoch": 0.2292603127170997, "learning_rate": 9.273096158070895e-06, "loss": 3.7522036743164064, "step": 190000 }, { "epoch": 0.2293809760395824, "learning_rate": 9.272692322603157e-06, "loss": 3.7510440063476564, "step": 190100 }, { "epoch": 0.22950163936206508, "learning_rate": 9.272288487135417e-06, "loss": 3.727488708496094, "step": 190200 }, { "epoch": 0.22962230268454775, "learning_rate": 9.27188465166768e-06, "loss": 3.780382080078125, "step": 190300 }, { "epoch": 0.22974296600703045, "learning_rate": 9.271480816199941e-06, "loss": 3.7685797119140627, "step": 190400 }, { "epoch": 0.22986362932951312, "learning_rate": 9.271076980732203e-06, "loss": 3.7479373168945314, "step": 190500 }, { "epoch": 0.22998429265199583, "learning_rate": 9.270673145264465e-06, "loss": 3.75752197265625, "step": 190600 }, { "epoch": 0.2301049559744785, "learning_rate": 9.270269309796727e-06, "loss": 3.7632522583007812, "step": 190700 }, { "epoch": 0.2302256192969612, "learning_rate": 9.269865474328987e-06, "loss": 3.7460955810546874, "step": 190800 }, { "epoch": 0.23034628261944387, "learning_rate": 9.26946163886125e-06, "loss": 3.7422393798828124, "step": 190900 }, { "epoch": 0.23046694594192654, "learning_rate": 9.269057803393511e-06, "loss": 3.7621484375, "step": 191000 }, { "epoch": 0.23058760926440924, "learning_rate": 9.268653967925772e-06, "loss": 3.7656124877929686, "step": 191100 }, { "epoch": 0.23070827258689192, "learning_rate": 9.268250132458034e-06, "loss": 3.7832489013671875, "step": 191200 }, { "epoch": 0.23082893590937462, "learning_rate": 9.267846296990296e-06, "loss": 3.7495806884765623, "step": 191300 }, { "epoch": 0.2309495992318573, "learning_rate": 9.267442461522558e-06, "loss": 3.776719970703125, "step": 191400 }, { "epoch": 0.23107026255433996, "learning_rate": 9.26703862605482e-06, "loss": 3.7207135009765624, "step": 191500 }, { "epoch": 0.23119092587682266, "learning_rate": 9.26663479058708e-06, "loss": 3.7676181030273437, "step": 191600 }, { "epoch": 0.23131158919930533, "learning_rate": 9.266230955119342e-06, "loss": 3.753806457519531, "step": 191700 }, { "epoch": 0.23143225252178803, "learning_rate": 9.265827119651604e-06, "loss": 3.731363525390625, "step": 191800 }, { "epoch": 0.2315529158442707, "learning_rate": 9.265423284183866e-06, "loss": 3.77650146484375, "step": 191900 }, { "epoch": 0.2316735791667534, "learning_rate": 9.265019448716128e-06, "loss": 3.758489074707031, "step": 192000 }, { "epoch": 0.23179424248923608, "learning_rate": 9.264615613248388e-06, "loss": 3.737186279296875, "step": 192100 }, { "epoch": 0.23191490581171875, "learning_rate": 9.26421177778065e-06, "loss": 3.7510443115234375, "step": 192200 }, { "epoch": 0.23203556913420145, "learning_rate": 9.263807942312912e-06, "loss": 3.7581683349609376, "step": 192300 }, { "epoch": 0.23215623245668413, "learning_rate": 9.263404106845172e-06, "loss": 3.7492074584960937, "step": 192400 }, { "epoch": 0.23227689577916683, "learning_rate": 9.263000271377434e-06, "loss": 3.7553305053710937, "step": 192500 }, { "epoch": 0.2323975591016495, "learning_rate": 9.262596435909696e-06, "loss": 3.746603698730469, "step": 192600 }, { "epoch": 0.23251822242413217, "learning_rate": 9.262192600441958e-06, "loss": 3.7663336181640625, "step": 192700 }, { "epoch": 0.23263888574661487, "learning_rate": 9.26178876497422e-06, "loss": 3.7619973754882814, "step": 192800 }, { "epoch": 0.23275954906909754, "learning_rate": 9.261384929506482e-06, "loss": 3.777813720703125, "step": 192900 }, { "epoch": 0.23288021239158024, "learning_rate": 9.260981094038743e-06, "loss": 3.7624166870117186, "step": 193000 }, { "epoch": 0.23300087571406292, "learning_rate": 9.260577258571005e-06, "loss": 3.783835144042969, "step": 193100 }, { "epoch": 0.2331215390365456, "learning_rate": 9.260173423103267e-06, "loss": 3.7421395874023435, "step": 193200 }, { "epoch": 0.2332422023590283, "learning_rate": 9.259769587635527e-06, "loss": 3.709068603515625, "step": 193300 }, { "epoch": 0.23336286568151096, "learning_rate": 9.259365752167789e-06, "loss": 3.7289178466796873, "step": 193400 }, { "epoch": 0.23348352900399366, "learning_rate": 9.25896191670005e-06, "loss": 3.746418762207031, "step": 193500 }, { "epoch": 0.23360419232647633, "learning_rate": 9.258558081232313e-06, "loss": 3.744023742675781, "step": 193600 }, { "epoch": 0.23372485564895903, "learning_rate": 9.258154245764575e-06, "loss": 3.7015484619140624, "step": 193700 }, { "epoch": 0.2338455189714417, "learning_rate": 9.257750410296837e-06, "loss": 3.74681640625, "step": 193800 }, { "epoch": 0.23396618229392438, "learning_rate": 9.257346574829099e-06, "loss": 3.7518820190429687, "step": 193900 }, { "epoch": 0.23408684561640708, "learning_rate": 9.256942739361359e-06, "loss": 3.73414794921875, "step": 194000 }, { "epoch": 0.23420750893888975, "learning_rate": 9.256538903893621e-06, "loss": 3.717051696777344, "step": 194100 }, { "epoch": 0.23432817226137245, "learning_rate": 9.256135068425881e-06, "loss": 3.7203155517578126, "step": 194200 }, { "epoch": 0.23444883558385513, "learning_rate": 9.255731232958143e-06, "loss": 3.705076904296875, "step": 194300 }, { "epoch": 0.2345694989063378, "learning_rate": 9.255327397490405e-06, "loss": 3.7366397094726564, "step": 194400 }, { "epoch": 0.2346901622288205, "learning_rate": 9.254923562022667e-06, "loss": 3.734712829589844, "step": 194500 }, { "epoch": 0.23481082555130317, "learning_rate": 9.25451972655493e-06, "loss": 3.7418222045898437, "step": 194600 }, { "epoch": 0.23493148887378587, "learning_rate": 9.254115891087191e-06, "loss": 3.7293902587890626, "step": 194700 }, { "epoch": 0.23505215219626854, "learning_rate": 9.253712055619452e-06, "loss": 3.7267974853515624, "step": 194800 }, { "epoch": 0.23517281551875124, "learning_rate": 9.253308220151714e-06, "loss": 3.7221417236328125, "step": 194900 }, { "epoch": 0.23529347884123392, "learning_rate": 9.252904384683975e-06, "loss": 3.7525979614257814, "step": 195000 }, { "epoch": 0.2354141421637166, "learning_rate": 9.252500549216237e-06, "loss": 3.731783752441406, "step": 195100 }, { "epoch": 0.2355348054861993, "learning_rate": 9.252096713748498e-06, "loss": 3.7116549682617186, "step": 195200 }, { "epoch": 0.23565546880868196, "learning_rate": 9.25169287828076e-06, "loss": 3.7166778564453127, "step": 195300 }, { "epoch": 0.23577613213116466, "learning_rate": 9.251289042813022e-06, "loss": 3.7092495727539063, "step": 195400 }, { "epoch": 0.23589679545364733, "learning_rate": 9.250885207345284e-06, "loss": 3.7323504638671876, "step": 195500 }, { "epoch": 0.23601745877613, "learning_rate": 9.250481371877546e-06, "loss": 3.7345516967773436, "step": 195600 }, { "epoch": 0.2361381220986127, "learning_rate": 9.250077536409806e-06, "loss": 3.7101144409179687, "step": 195700 }, { "epoch": 0.23625878542109538, "learning_rate": 9.249673700942068e-06, "loss": 3.735495910644531, "step": 195800 }, { "epoch": 0.23637944874357808, "learning_rate": 9.24926986547433e-06, "loss": 3.755951232910156, "step": 195900 }, { "epoch": 0.23650011206606075, "learning_rate": 9.248866030006592e-06, "loss": 3.7482965087890623, "step": 196000 }, { "epoch": 0.23662077538854345, "learning_rate": 9.248462194538854e-06, "loss": 3.7130587768554686, "step": 196100 }, { "epoch": 0.23674143871102613, "learning_rate": 9.248058359071114e-06, "loss": 3.7413601684570312, "step": 196200 }, { "epoch": 0.2368621020335088, "learning_rate": 9.247654523603376e-06, "loss": 3.7243948364257813, "step": 196300 }, { "epoch": 0.2369827653559915, "learning_rate": 9.247250688135638e-06, "loss": 3.7133111572265625, "step": 196400 }, { "epoch": 0.23710342867847417, "learning_rate": 9.246846852667898e-06, "loss": 3.7211761474609375, "step": 196500 }, { "epoch": 0.23722409200095687, "learning_rate": 9.24644301720016e-06, "loss": 3.7363665771484373, "step": 196600 }, { "epoch": 0.23734475532343954, "learning_rate": 9.246039181732422e-06, "loss": 3.726129150390625, "step": 196700 }, { "epoch": 0.23746541864592222, "learning_rate": 9.245635346264684e-06, "loss": 3.7107388305664064, "step": 196800 }, { "epoch": 0.23758608196840492, "learning_rate": 9.245231510796946e-06, "loss": 3.7372119140625, "step": 196900 }, { "epoch": 0.2377067452908876, "learning_rate": 9.244827675329208e-06, "loss": 3.71290771484375, "step": 197000 }, { "epoch": 0.2378274086133703, "learning_rate": 9.244423839861469e-06, "loss": 3.7061029052734376, "step": 197100 }, { "epoch": 0.23794807193585296, "learning_rate": 9.24402000439373e-06, "loss": 3.7164041137695314, "step": 197200 }, { "epoch": 0.23806873525833566, "learning_rate": 9.243616168925993e-06, "loss": 3.712121887207031, "step": 197300 }, { "epoch": 0.23818939858081833, "learning_rate": 9.243212333458253e-06, "loss": 3.736483154296875, "step": 197400 }, { "epoch": 0.238310061903301, "learning_rate": 9.242808497990515e-06, "loss": 3.722565002441406, "step": 197500 }, { "epoch": 0.2384307252257837, "learning_rate": 9.242404662522777e-06, "loss": 3.7054348754882813, "step": 197600 }, { "epoch": 0.23855138854826638, "learning_rate": 9.242000827055039e-06, "loss": 3.7192474365234376, "step": 197700 }, { "epoch": 0.23867205187074908, "learning_rate": 9.2415969915873e-06, "loss": 3.716965637207031, "step": 197800 }, { "epoch": 0.23879271519323175, "learning_rate": 9.241193156119563e-06, "loss": 3.7091140747070312, "step": 197900 }, { "epoch": 0.23891337851571443, "learning_rate": 9.240789320651825e-06, "loss": 3.6944842529296875, "step": 198000 }, { "epoch": 0.23903404183819713, "learning_rate": 9.240385485184085e-06, "loss": 3.728592529296875, "step": 198100 }, { "epoch": 0.2391547051606798, "learning_rate": 9.239981649716347e-06, "loss": 3.74075439453125, "step": 198200 }, { "epoch": 0.2392753684831625, "learning_rate": 9.239577814248607e-06, "loss": 3.7070867919921877, "step": 198300 }, { "epoch": 0.23939603180564517, "learning_rate": 9.23917397878087e-06, "loss": 3.7243670654296874, "step": 198400 }, { "epoch": 0.23951669512812787, "learning_rate": 9.238770143313131e-06, "loss": 3.74302490234375, "step": 198500 }, { "epoch": 0.23963735845061054, "learning_rate": 9.238366307845393e-06, "loss": 3.7204736328125, "step": 198600 }, { "epoch": 0.23975802177309322, "learning_rate": 9.237962472377655e-06, "loss": 3.72676513671875, "step": 198700 }, { "epoch": 0.23987868509557592, "learning_rate": 9.237558636909917e-06, "loss": 3.714619445800781, "step": 198800 }, { "epoch": 0.2399993484180586, "learning_rate": 9.237154801442178e-06, "loss": 3.722392883300781, "step": 198900 }, { "epoch": 0.2401200117405413, "learning_rate": 9.23675096597444e-06, "loss": 3.7029483032226564, "step": 199000 }, { "epoch": 0.24024067506302396, "learning_rate": 9.236347130506702e-06, "loss": 3.6963409423828124, "step": 199100 }, { "epoch": 0.24036133838550663, "learning_rate": 9.235943295038964e-06, "loss": 3.7217718505859376, "step": 199200 }, { "epoch": 0.24048200170798933, "learning_rate": 9.235539459571224e-06, "loss": 3.7127450561523436, "step": 199300 }, { "epoch": 0.240602665030472, "learning_rate": 9.235135624103486e-06, "loss": 3.7036624145507813, "step": 199400 }, { "epoch": 0.2407233283529547, "learning_rate": 9.234731788635748e-06, "loss": 3.705352478027344, "step": 199500 }, { "epoch": 0.24084399167543738, "learning_rate": 9.23432795316801e-06, "loss": 3.6987686157226562, "step": 199600 }, { "epoch": 0.24096465499792005, "learning_rate": 9.23392411770027e-06, "loss": 3.707328186035156, "step": 199700 }, { "epoch": 0.24108531832040275, "learning_rate": 9.233520282232532e-06, "loss": 3.7200494384765626, "step": 199800 }, { "epoch": 0.24120598164288543, "learning_rate": 9.233116446764794e-06, "loss": 3.69326904296875, "step": 199900 }, { "epoch": 0.24132664496536813, "learning_rate": 9.232712611297056e-06, "loss": 3.7053985595703125, "step": 200000 }, { "epoch": 0.2414473082878508, "learning_rate": 9.232308775829318e-06, "loss": 3.7000717163085937, "step": 200100 }, { "epoch": 0.2415679716103335, "learning_rate": 9.231904940361578e-06, "loss": 3.6976361083984375, "step": 200200 }, { "epoch": 0.24168863493281617, "learning_rate": 9.23150110489384e-06, "loss": 3.673581848144531, "step": 200300 }, { "epoch": 0.24180929825529884, "learning_rate": 9.231097269426102e-06, "loss": 3.7136459350585938, "step": 200400 }, { "epoch": 0.24192996157778154, "learning_rate": 9.230693433958364e-06, "loss": 3.695909423828125, "step": 200500 }, { "epoch": 0.24205062490026422, "learning_rate": 9.230289598490624e-06, "loss": 3.674058532714844, "step": 200600 }, { "epoch": 0.24217128822274692, "learning_rate": 9.229885763022886e-06, "loss": 3.7147845458984374, "step": 200700 }, { "epoch": 0.2422919515452296, "learning_rate": 9.229481927555148e-06, "loss": 3.695434265136719, "step": 200800 }, { "epoch": 0.24241261486771226, "learning_rate": 9.22907809208741e-06, "loss": 3.6836480712890625, "step": 200900 }, { "epoch": 0.24253327819019496, "learning_rate": 9.228674256619672e-06, "loss": 3.6956515502929688, "step": 201000 }, { "epoch": 0.24265394151267763, "learning_rate": 9.228270421151934e-06, "loss": 3.6742889404296877, "step": 201100 }, { "epoch": 0.24277460483516033, "learning_rate": 9.227866585684195e-06, "loss": 3.69082763671875, "step": 201200 }, { "epoch": 0.242895268157643, "learning_rate": 9.227462750216457e-06, "loss": 3.7146572875976562, "step": 201300 }, { "epoch": 0.2430159314801257, "learning_rate": 9.227058914748717e-06, "loss": 3.7032601928710935, "step": 201400 }, { "epoch": 0.24313659480260838, "learning_rate": 9.226655079280979e-06, "loss": 3.695606384277344, "step": 201500 }, { "epoch": 0.24325725812509105, "learning_rate": 9.226251243813241e-06, "loss": 3.710067138671875, "step": 201600 }, { "epoch": 0.24337792144757375, "learning_rate": 9.225847408345503e-06, "loss": 3.6949334716796876, "step": 201700 }, { "epoch": 0.24349858477005643, "learning_rate": 9.225443572877765e-06, "loss": 3.694286193847656, "step": 201800 }, { "epoch": 0.24361924809253913, "learning_rate": 9.225039737410027e-06, "loss": 3.702607421875, "step": 201900 }, { "epoch": 0.2437399114150218, "learning_rate": 9.224635901942289e-06, "loss": 3.700819396972656, "step": 202000 }, { "epoch": 0.24386057473750447, "learning_rate": 9.224232066474549e-06, "loss": 3.7006906127929686, "step": 202100 }, { "epoch": 0.24398123805998717, "learning_rate": 9.223828231006811e-06, "loss": 3.707624816894531, "step": 202200 }, { "epoch": 0.24410190138246984, "learning_rate": 9.223424395539073e-06, "loss": 3.6560491943359374, "step": 202300 }, { "epoch": 0.24422256470495254, "learning_rate": 9.223020560071333e-06, "loss": 3.68814453125, "step": 202400 }, { "epoch": 0.24434322802743522, "learning_rate": 9.222616724603595e-06, "loss": 3.6900540161132813, "step": 202500 }, { "epoch": 0.24446389134991792, "learning_rate": 9.222212889135857e-06, "loss": 3.7148141479492187, "step": 202600 }, { "epoch": 0.2445845546724006, "learning_rate": 9.22180905366812e-06, "loss": 3.6685494995117187, "step": 202700 }, { "epoch": 0.24470521799488326, "learning_rate": 9.221405218200381e-06, "loss": 3.7073245239257813, "step": 202800 }, { "epoch": 0.24482588131736596, "learning_rate": 9.221001382732643e-06, "loss": 3.683519287109375, "step": 202900 }, { "epoch": 0.24494654463984863, "learning_rate": 9.220597547264904e-06, "loss": 3.6927325439453127, "step": 203000 }, { "epoch": 0.24506720796233133, "learning_rate": 9.220193711797166e-06, "loss": 3.6921255493164065, "step": 203100 }, { "epoch": 0.245187871284814, "learning_rate": 9.219789876329428e-06, "loss": 3.674447021484375, "step": 203200 }, { "epoch": 0.24530853460729668, "learning_rate": 9.219386040861688e-06, "loss": 3.699053955078125, "step": 203300 }, { "epoch": 0.24542919792977938, "learning_rate": 9.21898220539395e-06, "loss": 3.6666455078125, "step": 203400 }, { "epoch": 0.24554986125226205, "learning_rate": 9.218578369926212e-06, "loss": 3.687672424316406, "step": 203500 }, { "epoch": 0.24567052457474475, "learning_rate": 9.218174534458474e-06, "loss": 3.6936688232421875, "step": 203600 }, { "epoch": 0.24579118789722743, "learning_rate": 9.217770698990736e-06, "loss": 3.718658447265625, "step": 203700 }, { "epoch": 0.24591185121971013, "learning_rate": 9.217366863522996e-06, "loss": 3.6747882080078127, "step": 203800 }, { "epoch": 0.2460325145421928, "learning_rate": 9.216963028055258e-06, "loss": 3.6771527099609376, "step": 203900 }, { "epoch": 0.24615317786467547, "learning_rate": 9.21655919258752e-06, "loss": 3.701468200683594, "step": 204000 }, { "epoch": 0.24627384118715817, "learning_rate": 9.216155357119782e-06, "loss": 3.661234130859375, "step": 204100 }, { "epoch": 0.24639450450964084, "learning_rate": 9.215751521652044e-06, "loss": 3.68523193359375, "step": 204200 }, { "epoch": 0.24651516783212354, "learning_rate": 9.215347686184304e-06, "loss": 3.6767242431640623, "step": 204300 }, { "epoch": 0.24663583115460622, "learning_rate": 9.214943850716566e-06, "loss": 3.685646667480469, "step": 204400 }, { "epoch": 0.2467564944770889, "learning_rate": 9.214540015248828e-06, "loss": 3.6798504638671874, "step": 204500 }, { "epoch": 0.2468771577995716, "learning_rate": 9.214136179781089e-06, "loss": 3.669855041503906, "step": 204600 }, { "epoch": 0.24699782112205426, "learning_rate": 9.21373234431335e-06, "loss": 3.669905700683594, "step": 204700 }, { "epoch": 0.24711848444453696, "learning_rate": 9.213328508845612e-06, "loss": 3.6896548461914063, "step": 204800 }, { "epoch": 0.24723914776701963, "learning_rate": 9.212924673377874e-06, "loss": 3.68878662109375, "step": 204900 }, { "epoch": 0.24735981108950233, "learning_rate": 9.212520837910136e-06, "loss": 3.6997946166992186, "step": 205000 }, { "epoch": 0.247480474411985, "learning_rate": 9.212117002442398e-06, "loss": 3.6602401733398438, "step": 205100 }, { "epoch": 0.24760113773446768, "learning_rate": 9.211713166974659e-06, "loss": 3.6706509399414062, "step": 205200 }, { "epoch": 0.24772180105695038, "learning_rate": 9.21130933150692e-06, "loss": 3.7057321166992185, "step": 205300 }, { "epoch": 0.24784246437943305, "learning_rate": 9.210905496039183e-06, "loss": 3.6448834228515623, "step": 205400 }, { "epoch": 0.24796312770191575, "learning_rate": 9.210501660571443e-06, "loss": 3.686228942871094, "step": 205500 }, { "epoch": 0.24808379102439843, "learning_rate": 9.210097825103705e-06, "loss": 3.662328186035156, "step": 205600 }, { "epoch": 0.2482044543468811, "learning_rate": 9.209693989635967e-06, "loss": 3.638558044433594, "step": 205700 }, { "epoch": 0.2483251176693638, "learning_rate": 9.209290154168229e-06, "loss": 3.6871527099609374, "step": 205800 }, { "epoch": 0.24844578099184647, "learning_rate": 9.208886318700491e-06, "loss": 3.6697811889648437, "step": 205900 }, { "epoch": 0.24856644431432917, "learning_rate": 9.208482483232753e-06, "loss": 3.6819342041015624, "step": 206000 }, { "epoch": 0.24868710763681184, "learning_rate": 9.208078647765015e-06, "loss": 3.679654846191406, "step": 206100 }, { "epoch": 0.24880777095929452, "learning_rate": 9.207674812297275e-06, "loss": 3.680423583984375, "step": 206200 }, { "epoch": 0.24892843428177722, "learning_rate": 9.207270976829537e-06, "loss": 3.64692138671875, "step": 206300 }, { "epoch": 0.2490490976042599, "learning_rate": 9.206867141361797e-06, "loss": 3.659390869140625, "step": 206400 }, { "epoch": 0.2491697609267426, "learning_rate": 9.20646330589406e-06, "loss": 3.6611419677734376, "step": 206500 }, { "epoch": 0.24929042424922526, "learning_rate": 9.206059470426321e-06, "loss": 3.6673675537109376, "step": 206600 }, { "epoch": 0.24941108757170796, "learning_rate": 9.205655634958583e-06, "loss": 3.6616448974609375, "step": 206700 }, { "epoch": 0.24953175089419063, "learning_rate": 9.205251799490845e-06, "loss": 3.6692333984375, "step": 206800 }, { "epoch": 0.2496524142166733, "learning_rate": 9.204847964023107e-06, "loss": 3.6917459106445314, "step": 206900 }, { "epoch": 0.249773077539156, "learning_rate": 9.20444412855537e-06, "loss": 3.6804791259765626, "step": 207000 }, { "epoch": 0.24989374086163868, "learning_rate": 9.20404029308763e-06, "loss": 3.6656124877929686, "step": 207100 }, { "epoch": 0.25001440418412135, "learning_rate": 9.203636457619892e-06, "loss": 3.690818176269531, "step": 207200 }, { "epoch": 0.2501350675066041, "learning_rate": 9.203232622152154e-06, "loss": 3.6568429565429685, "step": 207300 }, { "epoch": 0.25025573082908675, "learning_rate": 9.202828786684414e-06, "loss": 3.6728955078125, "step": 207400 }, { "epoch": 0.2503763941515694, "learning_rate": 9.202424951216676e-06, "loss": 3.6812142944335937, "step": 207500 }, { "epoch": 0.2504970574740521, "learning_rate": 9.202021115748938e-06, "loss": 3.6532241821289064, "step": 207600 }, { "epoch": 0.25061772079653477, "learning_rate": 9.2016172802812e-06, "loss": 3.6612088012695314, "step": 207700 }, { "epoch": 0.2507383841190175, "learning_rate": 9.201213444813462e-06, "loss": 3.669891662597656, "step": 207800 }, { "epoch": 0.25085904744150017, "learning_rate": 9.200809609345722e-06, "loss": 3.652283935546875, "step": 207900 }, { "epoch": 0.25097971076398284, "learning_rate": 9.200405773877984e-06, "loss": 3.6692623901367187, "step": 208000 }, { "epoch": 0.2511003740864655, "learning_rate": 9.200001938410246e-06, "loss": 3.6599322509765626, "step": 208100 }, { "epoch": 0.2512210374089482, "learning_rate": 9.199598102942508e-06, "loss": 3.6554437255859376, "step": 208200 }, { "epoch": 0.2513417007314309, "learning_rate": 9.19919426747477e-06, "loss": 3.6617669677734375, "step": 208300 }, { "epoch": 0.2514623640539136, "learning_rate": 9.19879043200703e-06, "loss": 3.6685800170898437, "step": 208400 }, { "epoch": 0.25158302737639626, "learning_rate": 9.198386596539292e-06, "loss": 3.6759603881835936, "step": 208500 }, { "epoch": 0.25170369069887893, "learning_rate": 9.197982761071554e-06, "loss": 3.6685281372070313, "step": 208600 }, { "epoch": 0.2518243540213616, "learning_rate": 9.197578925603815e-06, "loss": 3.65275146484375, "step": 208700 }, { "epoch": 0.25194501734384434, "learning_rate": 9.197175090136077e-06, "loss": 3.665533447265625, "step": 208800 }, { "epoch": 0.252065680666327, "learning_rate": 9.196771254668339e-06, "loss": 3.656330871582031, "step": 208900 }, { "epoch": 0.2521863439888097, "learning_rate": 9.1963674192006e-06, "loss": 3.6645635986328124, "step": 209000 }, { "epoch": 0.25230700731129235, "learning_rate": 9.195963583732862e-06, "loss": 3.6672955322265626, "step": 209100 }, { "epoch": 0.252427670633775, "learning_rate": 9.195559748265124e-06, "loss": 3.643277893066406, "step": 209200 }, { "epoch": 0.25254833395625775, "learning_rate": 9.195155912797385e-06, "loss": 3.662528381347656, "step": 209300 }, { "epoch": 0.2526689972787404, "learning_rate": 9.194752077329647e-06, "loss": 3.638275146484375, "step": 209400 }, { "epoch": 0.2527896606012231, "learning_rate": 9.194348241861909e-06, "loss": 3.694941101074219, "step": 209500 }, { "epoch": 0.25291032392370577, "learning_rate": 9.193944406394169e-06, "loss": 3.640216064453125, "step": 209600 }, { "epoch": 0.2530309872461885, "learning_rate": 9.193540570926431e-06, "loss": 3.6376080322265625, "step": 209700 }, { "epoch": 0.25315165056867117, "learning_rate": 9.193136735458693e-06, "loss": 3.655018310546875, "step": 209800 }, { "epoch": 0.25327231389115384, "learning_rate": 9.192732899990955e-06, "loss": 3.6468634033203124, "step": 209900 }, { "epoch": 0.2533929772136365, "learning_rate": 9.192329064523217e-06, "loss": 3.677126159667969, "step": 210000 }, { "epoch": 0.2535136405361192, "learning_rate": 9.191925229055479e-06, "loss": 3.63465087890625, "step": 210100 }, { "epoch": 0.2536343038586019, "learning_rate": 9.191521393587741e-06, "loss": 3.6564712524414062, "step": 210200 }, { "epoch": 0.2537549671810846, "learning_rate": 9.191117558120001e-06, "loss": 3.666081848144531, "step": 210300 }, { "epoch": 0.25387563050356726, "learning_rate": 9.190713722652263e-06, "loss": 3.654061279296875, "step": 210400 }, { "epoch": 0.25399629382604993, "learning_rate": 9.190309887184523e-06, "loss": 3.659622802734375, "step": 210500 }, { "epoch": 0.2541169571485326, "learning_rate": 9.189906051716785e-06, "loss": 3.645521545410156, "step": 210600 }, { "epoch": 0.25423762047101534, "learning_rate": 9.189502216249047e-06, "loss": 3.634986572265625, "step": 210700 }, { "epoch": 0.254358283793498, "learning_rate": 9.18909838078131e-06, "loss": 3.6290347290039064, "step": 210800 }, { "epoch": 0.2544789471159807, "learning_rate": 9.188694545313571e-06, "loss": 3.6444961547851564, "step": 210900 }, { "epoch": 0.25459961043846335, "learning_rate": 9.188290709845833e-06, "loss": 3.62194580078125, "step": 211000 }, { "epoch": 0.254720273760946, "learning_rate": 9.187886874378095e-06, "loss": 3.651019287109375, "step": 211100 }, { "epoch": 0.25484093708342875, "learning_rate": 9.187483038910356e-06, "loss": 3.6369573974609377, "step": 211200 }, { "epoch": 0.2549616004059114, "learning_rate": 9.187079203442618e-06, "loss": 3.64165283203125, "step": 211300 }, { "epoch": 0.2550822637283941, "learning_rate": 9.18667536797488e-06, "loss": 3.655348205566406, "step": 211400 }, { "epoch": 0.25520292705087677, "learning_rate": 9.18627153250714e-06, "loss": 3.6637094116210935, "step": 211500 }, { "epoch": 0.25532359037335944, "learning_rate": 9.185867697039402e-06, "loss": 3.632470703125, "step": 211600 }, { "epoch": 0.25544425369584217, "learning_rate": 9.185463861571664e-06, "loss": 3.6434896850585936, "step": 211700 }, { "epoch": 0.25556491701832484, "learning_rate": 9.185060026103926e-06, "loss": 3.6458233642578124, "step": 211800 }, { "epoch": 0.2556855803408075, "learning_rate": 9.184656190636188e-06, "loss": 3.6436273193359376, "step": 211900 }, { "epoch": 0.2558062436632902, "learning_rate": 9.184252355168448e-06, "loss": 3.647513732910156, "step": 212000 }, { "epoch": 0.25592690698577286, "learning_rate": 9.18384851970071e-06, "loss": 3.6456484985351563, "step": 212100 }, { "epoch": 0.2560475703082556, "learning_rate": 9.183444684232972e-06, "loss": 3.6340908813476562, "step": 212200 }, { "epoch": 0.25616823363073826, "learning_rate": 9.183040848765234e-06, "loss": 3.64902587890625, "step": 212300 }, { "epoch": 0.25628889695322093, "learning_rate": 9.182637013297494e-06, "loss": 3.6336788940429687, "step": 212400 }, { "epoch": 0.2564095602757036, "learning_rate": 9.182233177829756e-06, "loss": 3.6513107299804686, "step": 212500 }, { "epoch": 0.25653022359818634, "learning_rate": 9.181829342362018e-06, "loss": 3.6526837158203125, "step": 212600 }, { "epoch": 0.256650886920669, "learning_rate": 9.18142550689428e-06, "loss": 3.6647525024414063, "step": 212700 }, { "epoch": 0.2567715502431517, "learning_rate": 9.18102167142654e-06, "loss": 3.6526068115234374, "step": 212800 }, { "epoch": 0.25689221356563435, "learning_rate": 9.180617835958803e-06, "loss": 3.6386724853515626, "step": 212900 }, { "epoch": 0.257012876888117, "learning_rate": 9.180214000491065e-06, "loss": 3.6438592529296874, "step": 213000 }, { "epoch": 0.25713354021059975, "learning_rate": 9.179810165023327e-06, "loss": 3.634393615722656, "step": 213100 }, { "epoch": 0.2572542035330824, "learning_rate": 9.179406329555589e-06, "loss": 3.6205813598632814, "step": 213200 }, { "epoch": 0.2573748668555651, "learning_rate": 9.17900249408785e-06, "loss": 3.6506982421875, "step": 213300 }, { "epoch": 0.25749553017804777, "learning_rate": 9.17859865862011e-06, "loss": 3.641763000488281, "step": 213400 }, { "epoch": 0.25761619350053044, "learning_rate": 9.178194823152373e-06, "loss": 3.643809814453125, "step": 213500 }, { "epoch": 0.25773685682301317, "learning_rate": 9.177790987684633e-06, "loss": 3.614754943847656, "step": 213600 }, { "epoch": 0.25785752014549584, "learning_rate": 9.177387152216895e-06, "loss": 3.6188323974609373, "step": 213700 }, { "epoch": 0.2579781834679785, "learning_rate": 9.176983316749157e-06, "loss": 3.6238937377929688, "step": 213800 }, { "epoch": 0.2580988467904612, "learning_rate": 9.176579481281419e-06, "loss": 3.64358642578125, "step": 213900 }, { "epoch": 0.25821951011294386, "learning_rate": 9.176175645813681e-06, "loss": 3.6493756103515627, "step": 214000 }, { "epoch": 0.2583401734354266, "learning_rate": 9.175771810345943e-06, "loss": 3.6419134521484375, "step": 214100 }, { "epoch": 0.25846083675790926, "learning_rate": 9.175367974878205e-06, "loss": 3.6235174560546874, "step": 214200 }, { "epoch": 0.25858150008039194, "learning_rate": 9.174964139410465e-06, "loss": 3.6091348266601564, "step": 214300 }, { "epoch": 0.2587021634028746, "learning_rate": 9.174560303942727e-06, "loss": 3.5955380249023436, "step": 214400 }, { "epoch": 0.2588228267253573, "learning_rate": 9.17415646847499e-06, "loss": 3.6241519165039064, "step": 214500 }, { "epoch": 0.25894349004784, "learning_rate": 9.17375263300725e-06, "loss": 3.62678466796875, "step": 214600 }, { "epoch": 0.2590641533703227, "learning_rate": 9.173348797539511e-06, "loss": 3.608099060058594, "step": 214700 }, { "epoch": 0.25918481669280535, "learning_rate": 9.172944962071773e-06, "loss": 3.628077087402344, "step": 214800 }, { "epoch": 0.259305480015288, "learning_rate": 9.172541126604035e-06, "loss": 3.631988525390625, "step": 214900 }, { "epoch": 0.25942614333777075, "learning_rate": 9.172137291136297e-06, "loss": 3.6361068725585937, "step": 215000 }, { "epoch": 0.2595468066602534, "learning_rate": 9.17173345566856e-06, "loss": 3.6112255859375, "step": 215100 }, { "epoch": 0.2596674699827361, "learning_rate": 9.17132962020082e-06, "loss": 3.6156387329101562, "step": 215200 }, { "epoch": 0.25978813330521877, "learning_rate": 9.170925784733082e-06, "loss": 3.6196099853515626, "step": 215300 }, { "epoch": 0.25990879662770144, "learning_rate": 9.170521949265344e-06, "loss": 3.632629699707031, "step": 215400 }, { "epoch": 0.26002945995018417, "learning_rate": 9.170118113797604e-06, "loss": 3.6325814819335935, "step": 215500 }, { "epoch": 0.26015012327266684, "learning_rate": 9.169714278329866e-06, "loss": 3.651593017578125, "step": 215600 }, { "epoch": 0.2602707865951495, "learning_rate": 9.169310442862128e-06, "loss": 3.63134033203125, "step": 215700 }, { "epoch": 0.2603914499176322, "learning_rate": 9.16890660739439e-06, "loss": 3.6174700927734373, "step": 215800 }, { "epoch": 0.26051211324011486, "learning_rate": 9.168502771926652e-06, "loss": 3.6308102416992187, "step": 215900 }, { "epoch": 0.2606327765625976, "learning_rate": 9.168098936458914e-06, "loss": 3.63929443359375, "step": 216000 }, { "epoch": 0.26075343988508026, "learning_rate": 9.167695100991174e-06, "loss": 3.635963134765625, "step": 216100 }, { "epoch": 0.26087410320756294, "learning_rate": 9.167291265523436e-06, "loss": 3.5966302490234376, "step": 216200 }, { "epoch": 0.2609947665300456, "learning_rate": 9.166887430055698e-06, "loss": 3.617817687988281, "step": 216300 }, { "epoch": 0.2611154298525283, "learning_rate": 9.16648359458796e-06, "loss": 3.591999816894531, "step": 216400 }, { "epoch": 0.261236093175011, "learning_rate": 9.16607975912022e-06, "loss": 3.6028131103515624, "step": 216500 }, { "epoch": 0.2613567564974937, "learning_rate": 9.165675923652482e-06, "loss": 3.6028277587890627, "step": 216600 }, { "epoch": 0.26147741981997635, "learning_rate": 9.165272088184744e-06, "loss": 3.631822204589844, "step": 216700 }, { "epoch": 0.261598083142459, "learning_rate": 9.164868252717006e-06, "loss": 3.6150082397460936, "step": 216800 }, { "epoch": 0.2617187464649417, "learning_rate": 9.164464417249267e-06, "loss": 3.644293212890625, "step": 216900 }, { "epoch": 0.2618394097874244, "learning_rate": 9.164060581781529e-06, "loss": 3.6161553955078123, "step": 217000 }, { "epoch": 0.2619600731099071, "learning_rate": 9.16365674631379e-06, "loss": 3.6294183349609375, "step": 217100 }, { "epoch": 0.26208073643238977, "learning_rate": 9.163252910846053e-06, "loss": 3.5988278198242187, "step": 217200 }, { "epoch": 0.26220139975487244, "learning_rate": 9.162849075378315e-06, "loss": 3.6180953979492188, "step": 217300 }, { "epoch": 0.26232206307735517, "learning_rate": 9.162445239910575e-06, "loss": 3.6175637817382813, "step": 217400 }, { "epoch": 0.26244272639983784, "learning_rate": 9.162041404442837e-06, "loss": 3.625796203613281, "step": 217500 }, { "epoch": 0.2625633897223205, "learning_rate": 9.161637568975099e-06, "loss": 3.6257003784179687, "step": 217600 }, { "epoch": 0.2626840530448032, "learning_rate": 9.161233733507359e-06, "loss": 3.6023458862304687, "step": 217700 }, { "epoch": 0.26280471636728586, "learning_rate": 9.160829898039621e-06, "loss": 3.6290814208984377, "step": 217800 }, { "epoch": 0.2629253796897686, "learning_rate": 9.160426062571883e-06, "loss": 3.65021484375, "step": 217900 }, { "epoch": 0.26304604301225126, "learning_rate": 9.160022227104145e-06, "loss": 3.615780029296875, "step": 218000 }, { "epoch": 0.26316670633473394, "learning_rate": 9.159618391636407e-06, "loss": 3.5862045288085938, "step": 218100 }, { "epoch": 0.2632873696572166, "learning_rate": 9.159214556168669e-06, "loss": 3.6121966552734377, "step": 218200 }, { "epoch": 0.2634080329796993, "learning_rate": 9.158810720700931e-06, "loss": 3.6020855712890625, "step": 218300 }, { "epoch": 0.263528696302182, "learning_rate": 9.158406885233191e-06, "loss": 3.609804992675781, "step": 218400 }, { "epoch": 0.2636493596246647, "learning_rate": 9.158003049765453e-06, "loss": 3.603859558105469, "step": 218500 }, { "epoch": 0.26377002294714735, "learning_rate": 9.157599214297714e-06, "loss": 3.6394342041015624, "step": 218600 }, { "epoch": 0.26389068626963, "learning_rate": 9.157195378829976e-06, "loss": 3.5866665649414062, "step": 218700 }, { "epoch": 0.2640113495921127, "learning_rate": 9.156791543362238e-06, "loss": 3.6207781982421876, "step": 218800 }, { "epoch": 0.2641320129145954, "learning_rate": 9.1563877078945e-06, "loss": 3.6049310302734376, "step": 218900 }, { "epoch": 0.2642526762370781, "learning_rate": 9.155983872426761e-06, "loss": 3.5931475830078123, "step": 219000 }, { "epoch": 0.26437333955956077, "learning_rate": 9.155580036959023e-06, "loss": 3.6016531372070313, "step": 219100 }, { "epoch": 0.26449400288204344, "learning_rate": 9.155176201491285e-06, "loss": 3.5916448974609376, "step": 219200 }, { "epoch": 0.2646146662045261, "learning_rate": 9.154772366023546e-06, "loss": 3.626486511230469, "step": 219300 }, { "epoch": 0.26473532952700884, "learning_rate": 9.154368530555808e-06, "loss": 3.5957351684570313, "step": 219400 }, { "epoch": 0.2648559928494915, "learning_rate": 9.15396469508807e-06, "loss": 3.6146258544921874, "step": 219500 }, { "epoch": 0.2649766561719742, "learning_rate": 9.15356085962033e-06, "loss": 3.587324523925781, "step": 219600 }, { "epoch": 0.26509731949445686, "learning_rate": 9.153157024152592e-06, "loss": 3.622711486816406, "step": 219700 }, { "epoch": 0.26521798281693953, "learning_rate": 9.152753188684854e-06, "loss": 3.609224548339844, "step": 219800 }, { "epoch": 0.26533864613942226, "learning_rate": 9.152349353217116e-06, "loss": 3.61752197265625, "step": 219900 }, { "epoch": 0.26545930946190494, "learning_rate": 9.151945517749378e-06, "loss": 3.6301898193359374, "step": 220000 }, { "epoch": 0.2655799727843876, "learning_rate": 9.151541682281638e-06, "loss": 3.624359436035156, "step": 220100 }, { "epoch": 0.2657006361068703, "learning_rate": 9.1511378468139e-06, "loss": 3.6032644653320314, "step": 220200 }, { "epoch": 0.265821299429353, "learning_rate": 9.150734011346162e-06, "loss": 3.602689208984375, "step": 220300 }, { "epoch": 0.2659419627518357, "learning_rate": 9.150330175878424e-06, "loss": 3.6062646484375, "step": 220400 }, { "epoch": 0.26606262607431835, "learning_rate": 9.149926340410684e-06, "loss": 3.589921569824219, "step": 220500 }, { "epoch": 0.266183289396801, "learning_rate": 9.149522504942946e-06, "loss": 3.6008013916015624, "step": 220600 }, { "epoch": 0.2663039527192837, "learning_rate": 9.149118669475208e-06, "loss": 3.5856967163085938, "step": 220700 }, { "epoch": 0.2664246160417664, "learning_rate": 9.14871483400747e-06, "loss": 3.616685791015625, "step": 220800 }, { "epoch": 0.2665452793642491, "learning_rate": 9.14831099853973e-06, "loss": 3.5684024047851564, "step": 220900 }, { "epoch": 0.26666594268673177, "learning_rate": 9.147907163071993e-06, "loss": 3.6155990600585937, "step": 221000 }, { "epoch": 0.26678660600921444, "learning_rate": 9.147503327604255e-06, "loss": 3.5665682983398437, "step": 221100 }, { "epoch": 0.2669072693316971, "learning_rate": 9.147099492136517e-06, "loss": 3.6033291625976562, "step": 221200 }, { "epoch": 0.26702793265417984, "learning_rate": 9.146695656668779e-06, "loss": 3.583944091796875, "step": 221300 }, { "epoch": 0.2671485959766625, "learning_rate": 9.14629182120104e-06, "loss": 3.6123919677734375, "step": 221400 }, { "epoch": 0.2672692592991452, "learning_rate": 9.145887985733301e-06, "loss": 3.590823059082031, "step": 221500 }, { "epoch": 0.26738992262162786, "learning_rate": 9.145484150265563e-06, "loss": 3.5947357177734376, "step": 221600 }, { "epoch": 0.26751058594411053, "learning_rate": 9.145080314797825e-06, "loss": 3.6045773315429686, "step": 221700 }, { "epoch": 0.26763124926659326, "learning_rate": 9.144676479330085e-06, "loss": 3.6083160400390626, "step": 221800 }, { "epoch": 0.26775191258907594, "learning_rate": 9.144272643862347e-06, "loss": 3.6236557006835937, "step": 221900 }, { "epoch": 0.2678725759115586, "learning_rate": 9.143868808394609e-06, "loss": 3.625653076171875, "step": 222000 }, { "epoch": 0.2679932392340413, "learning_rate": 9.143464972926871e-06, "loss": 3.6005319213867186, "step": 222100 }, { "epoch": 0.26811390255652395, "learning_rate": 9.143061137459133e-06, "loss": 3.6062551879882814, "step": 222200 }, { "epoch": 0.2682345658790067, "learning_rate": 9.142657301991395e-06, "loss": 3.593189697265625, "step": 222300 }, { "epoch": 0.26835522920148935, "learning_rate": 9.142253466523657e-06, "loss": 3.6193814086914062, "step": 222400 }, { "epoch": 0.268475892523972, "learning_rate": 9.141849631055917e-06, "loss": 3.6072567749023436, "step": 222500 }, { "epoch": 0.2685965558464547, "learning_rate": 9.14144579558818e-06, "loss": 3.6080941772460937, "step": 222600 }, { "epoch": 0.2687172191689374, "learning_rate": 9.14104196012044e-06, "loss": 3.5828091430664064, "step": 222700 }, { "epoch": 0.2688378824914201, "learning_rate": 9.140638124652702e-06, "loss": 3.569569396972656, "step": 222800 }, { "epoch": 0.26895854581390277, "learning_rate": 9.140234289184964e-06, "loss": 3.5858114624023436, "step": 222900 }, { "epoch": 0.26907920913638544, "learning_rate": 9.139830453717226e-06, "loss": 3.586725158691406, "step": 223000 }, { "epoch": 0.2691998724588681, "learning_rate": 9.139426618249488e-06, "loss": 3.5938870239257814, "step": 223100 }, { "epoch": 0.26932053578135084, "learning_rate": 9.13902278278175e-06, "loss": 3.5902413940429687, "step": 223200 }, { "epoch": 0.2694411991038335, "learning_rate": 9.138618947314011e-06, "loss": 3.583902587890625, "step": 223300 }, { "epoch": 0.2695618624263162, "learning_rate": 9.138215111846272e-06, "loss": 3.5930902099609376, "step": 223400 }, { "epoch": 0.26968252574879886, "learning_rate": 9.137811276378534e-06, "loss": 3.579262390136719, "step": 223500 }, { "epoch": 0.26980318907128154, "learning_rate": 9.137407440910796e-06, "loss": 3.557735595703125, "step": 223600 }, { "epoch": 0.26992385239376426, "learning_rate": 9.137003605443056e-06, "loss": 3.571603088378906, "step": 223700 }, { "epoch": 0.27004451571624694, "learning_rate": 9.136599769975318e-06, "loss": 3.5692864990234376, "step": 223800 }, { "epoch": 0.2701651790387296, "learning_rate": 9.13619593450758e-06, "loss": 3.5735678100585937, "step": 223900 }, { "epoch": 0.2702858423612123, "learning_rate": 9.135792099039842e-06, "loss": 3.5645697021484377, "step": 224000 }, { "epoch": 0.27040650568369495, "learning_rate": 9.135388263572104e-06, "loss": 3.5668536376953126, "step": 224100 }, { "epoch": 0.2705271690061777, "learning_rate": 9.134984428104364e-06, "loss": 3.590341796875, "step": 224200 }, { "epoch": 0.27064783232866035, "learning_rate": 9.134580592636626e-06, "loss": 3.5697021484375, "step": 224300 }, { "epoch": 0.270768495651143, "learning_rate": 9.134176757168888e-06, "loss": 3.5751992797851564, "step": 224400 }, { "epoch": 0.2708891589736257, "learning_rate": 9.13377292170115e-06, "loss": 3.585551452636719, "step": 224500 }, { "epoch": 0.27100982229610837, "learning_rate": 9.13336908623341e-06, "loss": 3.5663882446289064, "step": 224600 }, { "epoch": 0.2711304856185911, "learning_rate": 9.132965250765672e-06, "loss": 3.5887960815429687, "step": 224700 }, { "epoch": 0.27125114894107377, "learning_rate": 9.132561415297934e-06, "loss": 3.5697503662109376, "step": 224800 }, { "epoch": 0.27137181226355644, "learning_rate": 9.132157579830196e-06, "loss": 3.5834054565429687, "step": 224900 }, { "epoch": 0.2714924755860391, "learning_rate": 9.131753744362457e-06, "loss": 3.592548828125, "step": 225000 }, { "epoch": 0.2716131389085218, "learning_rate": 9.131349908894719e-06, "loss": 3.5807876586914062, "step": 225100 }, { "epoch": 0.2717338022310045, "learning_rate": 9.13094607342698e-06, "loss": 3.57626708984375, "step": 225200 }, { "epoch": 0.2718544655534872, "learning_rate": 9.130542237959243e-06, "loss": 3.6006484985351563, "step": 225300 }, { "epoch": 0.27197512887596986, "learning_rate": 9.130138402491505e-06, "loss": 3.560160827636719, "step": 225400 }, { "epoch": 0.27209579219845254, "learning_rate": 9.129734567023767e-06, "loss": 3.574559326171875, "step": 225500 }, { "epoch": 0.27221645552093526, "learning_rate": 9.129330731556027e-06, "loss": 3.5735488891601563, "step": 225600 }, { "epoch": 0.27233711884341794, "learning_rate": 9.128926896088289e-06, "loss": 3.5712103271484374, "step": 225700 }, { "epoch": 0.2724577821659006, "learning_rate": 9.12852306062055e-06, "loss": 3.5774057006835935, "step": 225800 }, { "epoch": 0.2725784454883833, "learning_rate": 9.128119225152811e-06, "loss": 3.581417236328125, "step": 225900 }, { "epoch": 0.27269910881086595, "learning_rate": 9.127715389685073e-06, "loss": 3.5692376708984375, "step": 226000 }, { "epoch": 0.2728197721333487, "learning_rate": 9.127311554217335e-06, "loss": 3.5908126831054688, "step": 226100 }, { "epoch": 0.27294043545583135, "learning_rate": 9.126907718749597e-06, "loss": 3.5904833984375, "step": 226200 }, { "epoch": 0.273061098778314, "learning_rate": 9.126503883281859e-06, "loss": 3.5807513427734374, "step": 226300 }, { "epoch": 0.2731817621007967, "learning_rate": 9.126100047814121e-06, "loss": 3.540194396972656, "step": 226400 }, { "epoch": 0.27330242542327937, "learning_rate": 9.125696212346381e-06, "loss": 3.5534262084960937, "step": 226500 }, { "epoch": 0.2734230887457621, "learning_rate": 9.125292376878643e-06, "loss": 3.570113220214844, "step": 226600 }, { "epoch": 0.27354375206824477, "learning_rate": 9.124888541410905e-06, "loss": 3.57446533203125, "step": 226700 }, { "epoch": 0.27366441539072744, "learning_rate": 9.124484705943166e-06, "loss": 3.5702655029296877, "step": 226800 }, { "epoch": 0.2737850787132101, "learning_rate": 9.124080870475428e-06, "loss": 3.5850836181640626, "step": 226900 }, { "epoch": 0.2739057420356928, "learning_rate": 9.12367703500769e-06, "loss": 3.5583111572265627, "step": 227000 }, { "epoch": 0.2740264053581755, "learning_rate": 9.123273199539952e-06, "loss": 3.5519818115234374, "step": 227100 }, { "epoch": 0.2741470686806582, "learning_rate": 9.122869364072214e-06, "loss": 3.594349365234375, "step": 227200 }, { "epoch": 0.27426773200314086, "learning_rate": 9.122465528604476e-06, "loss": 3.573846740722656, "step": 227300 }, { "epoch": 0.27438839532562354, "learning_rate": 9.122061693136738e-06, "loss": 3.58361572265625, "step": 227400 }, { "epoch": 0.2745090586481062, "learning_rate": 9.121657857668998e-06, "loss": 3.5692919921875, "step": 227500 }, { "epoch": 0.27462972197058894, "learning_rate": 9.12125402220126e-06, "loss": 3.5698699951171875, "step": 227600 }, { "epoch": 0.2747503852930716, "learning_rate": 9.12085018673352e-06, "loss": 3.5634820556640623, "step": 227700 }, { "epoch": 0.2748710486155543, "learning_rate": 9.120446351265782e-06, "loss": 3.5794137573242186, "step": 227800 }, { "epoch": 0.27499171193803695, "learning_rate": 9.120042515798044e-06, "loss": 3.5800238037109375, "step": 227900 }, { "epoch": 0.2751123752605197, "learning_rate": 9.119638680330306e-06, "loss": 3.561803283691406, "step": 228000 }, { "epoch": 0.27523303858300235, "learning_rate": 9.119234844862568e-06, "loss": 3.55359375, "step": 228100 }, { "epoch": 0.275353701905485, "learning_rate": 9.11883100939483e-06, "loss": 3.5770248413085937, "step": 228200 }, { "epoch": 0.2754743652279677, "learning_rate": 9.11842717392709e-06, "loss": 3.54753662109375, "step": 228300 }, { "epoch": 0.27559502855045037, "learning_rate": 9.118023338459352e-06, "loss": 3.5572323608398437, "step": 228400 }, { "epoch": 0.2757156918729331, "learning_rate": 9.117619502991614e-06, "loss": 3.55868896484375, "step": 228500 }, { "epoch": 0.27583635519541577, "learning_rate": 9.117215667523876e-06, "loss": 3.5834515380859373, "step": 228600 }, { "epoch": 0.27595701851789844, "learning_rate": 9.116811832056137e-06, "loss": 3.5615060424804685, "step": 228700 }, { "epoch": 0.2760776818403811, "learning_rate": 9.116407996588398e-06, "loss": 3.562529296875, "step": 228800 }, { "epoch": 0.2761983451628638, "learning_rate": 9.11600416112066e-06, "loss": 3.5629953002929686, "step": 228900 }, { "epoch": 0.2763190084853465, "learning_rate": 9.115600325652922e-06, "loss": 3.5576663208007813, "step": 229000 }, { "epoch": 0.2764396718078292, "learning_rate": 9.115196490185183e-06, "loss": 3.5684384155273436, "step": 229100 }, { "epoch": 0.27656033513031186, "learning_rate": 9.114792654717445e-06, "loss": 3.542799987792969, "step": 229200 }, { "epoch": 0.27668099845279454, "learning_rate": 9.114388819249707e-06, "loss": 3.544237060546875, "step": 229300 }, { "epoch": 0.2768016617752772, "learning_rate": 9.113984983781969e-06, "loss": 3.5936245727539062, "step": 229400 }, { "epoch": 0.27692232509775994, "learning_rate": 9.11358114831423e-06, "loss": 3.5565670776367186, "step": 229500 }, { "epoch": 0.2770429884202426, "learning_rate": 9.113177312846491e-06, "loss": 3.585528564453125, "step": 229600 }, { "epoch": 0.2771636517427253, "learning_rate": 9.112773477378753e-06, "loss": 3.54026611328125, "step": 229700 }, { "epoch": 0.27728431506520795, "learning_rate": 9.112369641911015e-06, "loss": 3.5612591552734374, "step": 229800 }, { "epoch": 0.2774049783876906, "learning_rate": 9.111965806443275e-06, "loss": 3.54359619140625, "step": 229900 }, { "epoch": 0.27752564171017335, "learning_rate": 9.111561970975537e-06, "loss": 3.5542388916015626, "step": 230000 }, { "epoch": 0.277646305032656, "learning_rate": 9.1111581355078e-06, "loss": 3.5533367919921877, "step": 230100 }, { "epoch": 0.2777669683551387, "learning_rate": 9.110754300040061e-06, "loss": 3.5700363159179687, "step": 230200 }, { "epoch": 0.27788763167762137, "learning_rate": 9.110350464572323e-06, "loss": 3.6037078857421876, "step": 230300 }, { "epoch": 0.2780082950001041, "learning_rate": 9.109946629104585e-06, "loss": 3.5694659423828123, "step": 230400 }, { "epoch": 0.2781289583225868, "learning_rate": 9.109542793636847e-06, "loss": 3.5792169189453125, "step": 230500 }, { "epoch": 0.27824962164506944, "learning_rate": 9.109138958169107e-06, "loss": 3.570884094238281, "step": 230600 }, { "epoch": 0.2783702849675521, "learning_rate": 9.10873512270137e-06, "loss": 3.5491015625, "step": 230700 }, { "epoch": 0.2784909482900348, "learning_rate": 9.10833128723363e-06, "loss": 3.541947937011719, "step": 230800 }, { "epoch": 0.2786116116125175, "learning_rate": 9.107927451765892e-06, "loss": 3.558038635253906, "step": 230900 }, { "epoch": 0.2787322749350002, "learning_rate": 9.107523616298154e-06, "loss": 3.5654672241210936, "step": 231000 }, { "epoch": 0.27885293825748286, "learning_rate": 9.107119780830416e-06, "loss": 3.572138366699219, "step": 231100 }, { "epoch": 0.27897360157996554, "learning_rate": 9.106715945362678e-06, "loss": 3.5210507202148436, "step": 231200 }, { "epoch": 0.2790942649024482, "learning_rate": 9.10631210989494e-06, "loss": 3.54669677734375, "step": 231300 }, { "epoch": 0.27921492822493094, "learning_rate": 9.105908274427202e-06, "loss": 3.5767861938476564, "step": 231400 }, { "epoch": 0.2793355915474136, "learning_rate": 9.105504438959462e-06, "loss": 3.534457092285156, "step": 231500 }, { "epoch": 0.2794562548698963, "learning_rate": 9.105100603491724e-06, "loss": 3.5653506469726564, "step": 231600 }, { "epoch": 0.27957691819237895, "learning_rate": 9.104696768023986e-06, "loss": 3.568785400390625, "step": 231700 }, { "epoch": 0.2796975815148616, "learning_rate": 9.104292932556246e-06, "loss": 3.569420166015625, "step": 231800 }, { "epoch": 0.27981824483734435, "learning_rate": 9.103889097088508e-06, "loss": 3.5457232666015623, "step": 231900 }, { "epoch": 0.279938908159827, "learning_rate": 9.10348526162077e-06, "loss": 3.5601092529296876, "step": 232000 }, { "epoch": 0.2800595714823097, "learning_rate": 9.103081426153032e-06, "loss": 3.5472662353515627, "step": 232100 }, { "epoch": 0.28018023480479237, "learning_rate": 9.102677590685294e-06, "loss": 3.559073486328125, "step": 232200 }, { "epoch": 0.28030089812727504, "learning_rate": 9.102273755217556e-06, "loss": 3.5434954833984373, "step": 232300 }, { "epoch": 0.2804215614497578, "learning_rate": 9.101869919749816e-06, "loss": 3.5494454956054686, "step": 232400 }, { "epoch": 0.28054222477224044, "learning_rate": 9.101466084282078e-06, "loss": 3.5655535888671874, "step": 232500 }, { "epoch": 0.2806628880947231, "learning_rate": 9.10106224881434e-06, "loss": 3.55737060546875, "step": 232600 }, { "epoch": 0.2807835514172058, "learning_rate": 9.1006584133466e-06, "loss": 3.5257229614257812, "step": 232700 }, { "epoch": 0.28090421473968846, "learning_rate": 9.100254577878863e-06, "loss": 3.560521545410156, "step": 232800 }, { "epoch": 0.2810248780621712, "learning_rate": 9.099850742411125e-06, "loss": 3.540338134765625, "step": 232900 }, { "epoch": 0.28114554138465386, "learning_rate": 9.099446906943387e-06, "loss": 3.5388763427734373, "step": 233000 }, { "epoch": 0.28126620470713654, "learning_rate": 9.099043071475648e-06, "loss": 3.5608856201171877, "step": 233100 }, { "epoch": 0.2813868680296192, "learning_rate": 9.098639236007909e-06, "loss": 3.511635437011719, "step": 233200 }, { "epoch": 0.28150753135210194, "learning_rate": 9.09823540054017e-06, "loss": 3.5601321411132814, "step": 233300 }, { "epoch": 0.2816281946745846, "learning_rate": 9.097831565072433e-06, "loss": 3.574920654296875, "step": 233400 }, { "epoch": 0.2817488579970673, "learning_rate": 9.097427729604695e-06, "loss": 3.5440493774414064, "step": 233500 }, { "epoch": 0.28186952131954995, "learning_rate": 9.097023894136957e-06, "loss": 3.51092529296875, "step": 233600 }, { "epoch": 0.2819901846420326, "learning_rate": 9.096620058669217e-06, "loss": 3.562699890136719, "step": 233700 }, { "epoch": 0.28211084796451535, "learning_rate": 9.096216223201479e-06, "loss": 3.5338290405273436, "step": 233800 }, { "epoch": 0.282231511286998, "learning_rate": 9.095812387733741e-06, "loss": 3.523289794921875, "step": 233900 }, { "epoch": 0.2823521746094807, "learning_rate": 9.095408552266001e-06, "loss": 3.556551818847656, "step": 234000 }, { "epoch": 0.28247283793196337, "learning_rate": 9.095004716798263e-06, "loss": 3.524173583984375, "step": 234100 }, { "epoch": 0.28259350125444604, "learning_rate": 9.094600881330525e-06, "loss": 3.546764221191406, "step": 234200 }, { "epoch": 0.2827141645769288, "learning_rate": 9.094197045862787e-06, "loss": 3.547751159667969, "step": 234300 }, { "epoch": 0.28283482789941145, "learning_rate": 9.09379321039505e-06, "loss": 3.5356320190429686, "step": 234400 }, { "epoch": 0.2829554912218941, "learning_rate": 9.093389374927311e-06, "loss": 3.5340701293945314, "step": 234500 }, { "epoch": 0.2830761545443768, "learning_rate": 9.092985539459571e-06, "loss": 3.54810302734375, "step": 234600 }, { "epoch": 0.28319681786685946, "learning_rate": 9.092581703991833e-06, "loss": 3.55381103515625, "step": 234700 }, { "epoch": 0.2833174811893422, "learning_rate": 9.092177868524095e-06, "loss": 3.533924865722656, "step": 234800 }, { "epoch": 0.28343814451182486, "learning_rate": 9.091774033056356e-06, "loss": 3.5165390014648437, "step": 234900 }, { "epoch": 0.28355880783430754, "learning_rate": 9.091370197588618e-06, "loss": 3.5360092163085937, "step": 235000 }, { "epoch": 0.2836794711567902, "learning_rate": 9.09096636212088e-06, "loss": 3.530864562988281, "step": 235100 }, { "epoch": 0.2838001344792729, "learning_rate": 9.090562526653142e-06, "loss": 3.551382751464844, "step": 235200 }, { "epoch": 0.2839207978017556, "learning_rate": 9.090158691185404e-06, "loss": 3.5360488891601562, "step": 235300 }, { "epoch": 0.2840414611242383, "learning_rate": 9.089754855717666e-06, "loss": 3.555943908691406, "step": 235400 }, { "epoch": 0.28416212444672095, "learning_rate": 9.089351020249928e-06, "loss": 3.5365390014648437, "step": 235500 }, { "epoch": 0.2842827877692036, "learning_rate": 9.088947184782188e-06, "loss": 3.5623223876953123, "step": 235600 }, { "epoch": 0.28440345109168635, "learning_rate": 9.08854334931445e-06, "loss": 3.5370941162109375, "step": 235700 }, { "epoch": 0.284524114414169, "learning_rate": 9.08813951384671e-06, "loss": 3.561373291015625, "step": 235800 }, { "epoch": 0.2846447777366517, "learning_rate": 9.087735678378972e-06, "loss": 3.523375244140625, "step": 235900 }, { "epoch": 0.28476544105913437, "learning_rate": 9.087331842911234e-06, "loss": 3.549563293457031, "step": 236000 }, { "epoch": 0.28488610438161704, "learning_rate": 9.086928007443496e-06, "loss": 3.5181460571289063, "step": 236100 }, { "epoch": 0.2850067677040998, "learning_rate": 9.086524171975758e-06, "loss": 3.5442230224609377, "step": 236200 }, { "epoch": 0.28512743102658245, "learning_rate": 9.08612033650802e-06, "loss": 3.5504837036132812, "step": 236300 }, { "epoch": 0.2852480943490651, "learning_rate": 9.08571650104028e-06, "loss": 3.5411907958984377, "step": 236400 }, { "epoch": 0.2853687576715478, "learning_rate": 9.085312665572542e-06, "loss": 3.547847900390625, "step": 236500 }, { "epoch": 0.28548942099403046, "learning_rate": 9.084908830104804e-06, "loss": 3.4919146728515624, "step": 236600 }, { "epoch": 0.2856100843165132, "learning_rate": 9.084504994637066e-06, "loss": 3.54189453125, "step": 236700 }, { "epoch": 0.28573074763899586, "learning_rate": 9.084101159169327e-06, "loss": 3.547510070800781, "step": 236800 }, { "epoch": 0.28585141096147854, "learning_rate": 9.083697323701589e-06, "loss": 3.552120361328125, "step": 236900 }, { "epoch": 0.2859720742839612, "learning_rate": 9.08329348823385e-06, "loss": 3.5490631103515624, "step": 237000 }, { "epoch": 0.2860927376064439, "learning_rate": 9.082889652766113e-06, "loss": 3.5557119750976565, "step": 237100 }, { "epoch": 0.2862134009289266, "learning_rate": 9.082485817298375e-06, "loss": 3.5196078491210936, "step": 237200 }, { "epoch": 0.2863340642514093, "learning_rate": 9.082081981830635e-06, "loss": 3.520566101074219, "step": 237300 }, { "epoch": 0.28645472757389195, "learning_rate": 9.081678146362897e-06, "loss": 3.5224969482421873, "step": 237400 }, { "epoch": 0.2865753908963746, "learning_rate": 9.081274310895159e-06, "loss": 3.5348040771484377, "step": 237500 }, { "epoch": 0.2866960542188573, "learning_rate": 9.08087047542742e-06, "loss": 3.523841552734375, "step": 237600 }, { "epoch": 0.28681671754134, "learning_rate": 9.080466639959683e-06, "loss": 3.539947204589844, "step": 237700 }, { "epoch": 0.2869373808638227, "learning_rate": 9.080062804491943e-06, "loss": 3.528543701171875, "step": 237800 }, { "epoch": 0.28705804418630537, "learning_rate": 9.079658969024205e-06, "loss": 3.5332635498046874, "step": 237900 }, { "epoch": 0.28717870750878804, "learning_rate": 9.079255133556467e-06, "loss": 3.5342922973632813, "step": 238000 }, { "epoch": 0.2872993708312707, "learning_rate": 9.078851298088727e-06, "loss": 3.511679992675781, "step": 238100 }, { "epoch": 0.28742003415375345, "learning_rate": 9.07844746262099e-06, "loss": 3.529948425292969, "step": 238200 }, { "epoch": 0.2875406974762361, "learning_rate": 9.078043627153251e-06, "loss": 3.533457946777344, "step": 238300 }, { "epoch": 0.2876613607987188, "learning_rate": 9.077639791685513e-06, "loss": 3.502527160644531, "step": 238400 }, { "epoch": 0.28778202412120146, "learning_rate": 9.077235956217775e-06, "loss": 3.5142483520507812, "step": 238500 }, { "epoch": 0.2879026874436842, "learning_rate": 9.076832120750037e-06, "loss": 3.549124755859375, "step": 238600 }, { "epoch": 0.28802335076616686, "learning_rate": 9.076428285282297e-06, "loss": 3.5248681640625, "step": 238700 }, { "epoch": 0.28814401408864954, "learning_rate": 9.07602444981456e-06, "loss": 3.5463262939453126, "step": 238800 }, { "epoch": 0.2882646774111322, "learning_rate": 9.075620614346821e-06, "loss": 3.5553033447265623, "step": 238900 }, { "epoch": 0.2883853407336149, "learning_rate": 9.075216778879082e-06, "loss": 3.5349688720703125, "step": 239000 }, { "epoch": 0.2885060040560976, "learning_rate": 9.074812943411344e-06, "loss": 3.5142343139648435, "step": 239100 }, { "epoch": 0.2886266673785803, "learning_rate": 9.074409107943606e-06, "loss": 3.503292236328125, "step": 239200 }, { "epoch": 0.28874733070106295, "learning_rate": 9.074005272475868e-06, "loss": 3.555716247558594, "step": 239300 }, { "epoch": 0.2888679940235456, "learning_rate": 9.07360143700813e-06, "loss": 3.532054748535156, "step": 239400 }, { "epoch": 0.2889886573460283, "learning_rate": 9.073197601540392e-06, "loss": 3.523057556152344, "step": 239500 }, { "epoch": 0.289109320668511, "learning_rate": 9.072793766072654e-06, "loss": 3.517941589355469, "step": 239600 }, { "epoch": 0.2892299839909937, "learning_rate": 9.072389930604914e-06, "loss": 3.51544189453125, "step": 239700 }, { "epoch": 0.2893506473134764, "learning_rate": 9.071986095137176e-06, "loss": 3.5075982666015624, "step": 239800 }, { "epoch": 0.28947131063595904, "learning_rate": 9.071582259669436e-06, "loss": 3.543909912109375, "step": 239900 }, { "epoch": 0.2895919739584417, "learning_rate": 9.071178424201698e-06, "loss": 3.523030090332031, "step": 240000 }, { "epoch": 0.28971263728092445, "learning_rate": 9.07077458873396e-06, "loss": 3.519525451660156, "step": 240100 }, { "epoch": 0.2898333006034071, "learning_rate": 9.070370753266222e-06, "loss": 3.4934246826171873, "step": 240200 }, { "epoch": 0.2899539639258898, "learning_rate": 9.069966917798484e-06, "loss": 3.5160708618164063, "step": 240300 }, { "epoch": 0.29007462724837246, "learning_rate": 9.069563082330746e-06, "loss": 3.4987454223632812, "step": 240400 }, { "epoch": 0.29019529057085514, "learning_rate": 9.069159246863006e-06, "loss": 3.52860595703125, "step": 240500 }, { "epoch": 0.29031595389333786, "learning_rate": 9.068755411395268e-06, "loss": 3.5318927001953124, "step": 240600 }, { "epoch": 0.29043661721582054, "learning_rate": 9.06835157592753e-06, "loss": 3.5177487182617186, "step": 240700 }, { "epoch": 0.2905572805383032, "learning_rate": 9.067947740459792e-06, "loss": 3.516593322753906, "step": 240800 }, { "epoch": 0.2906779438607859, "learning_rate": 9.067543904992053e-06, "loss": 3.533345947265625, "step": 240900 }, { "epoch": 0.2907986071832686, "learning_rate": 9.067140069524315e-06, "loss": 3.52850830078125, "step": 241000 }, { "epoch": 0.2909192705057513, "learning_rate": 9.066736234056577e-06, "loss": 3.49110107421875, "step": 241100 }, { "epoch": 0.29103993382823395, "learning_rate": 9.066332398588839e-06, "loss": 3.52057861328125, "step": 241200 }, { "epoch": 0.2911605971507166, "learning_rate": 9.065928563121099e-06, "loss": 3.5335784912109376, "step": 241300 }, { "epoch": 0.2912812604731993, "learning_rate": 9.065524727653361e-06, "loss": 3.51269287109375, "step": 241400 }, { "epoch": 0.291401923795682, "learning_rate": 9.065120892185623e-06, "loss": 3.5162054443359376, "step": 241500 }, { "epoch": 0.2915225871181647, "learning_rate": 9.064717056717885e-06, "loss": 3.530340270996094, "step": 241600 }, { "epoch": 0.2916432504406474, "learning_rate": 9.064313221250147e-06, "loss": 3.5295834350585937, "step": 241700 }, { "epoch": 0.29176391376313004, "learning_rate": 9.063909385782407e-06, "loss": 3.5167926025390623, "step": 241800 }, { "epoch": 0.2918845770856127, "learning_rate": 9.063505550314669e-06, "loss": 3.51607177734375, "step": 241900 }, { "epoch": 0.29200524040809545, "learning_rate": 9.063101714846931e-06, "loss": 3.4878125, "step": 242000 }, { "epoch": 0.2921259037305781, "learning_rate": 9.062697879379193e-06, "loss": 3.5096075439453127, "step": 242100 }, { "epoch": 0.2922465670530608, "learning_rate": 9.062294043911453e-06, "loss": 3.486436767578125, "step": 242200 }, { "epoch": 0.29236723037554346, "learning_rate": 9.061890208443715e-06, "loss": 3.5291424560546876, "step": 242300 }, { "epoch": 0.29248789369802614, "learning_rate": 9.061486372975977e-06, "loss": 3.5026568603515624, "step": 242400 }, { "epoch": 0.29260855702050886, "learning_rate": 9.06108253750824e-06, "loss": 3.522607727050781, "step": 242500 }, { "epoch": 0.29272922034299154, "learning_rate": 9.060678702040501e-06, "loss": 3.50931640625, "step": 242600 }, { "epoch": 0.2928498836654742, "learning_rate": 9.060274866572763e-06, "loss": 3.530660400390625, "step": 242700 }, { "epoch": 0.2929705469879569, "learning_rate": 9.059871031105024e-06, "loss": 3.5016534423828123, "step": 242800 }, { "epoch": 0.29309121031043955, "learning_rate": 9.059467195637286e-06, "loss": 3.5031503295898436, "step": 242900 }, { "epoch": 0.2932118736329223, "learning_rate": 9.059063360169546e-06, "loss": 3.4879962158203126, "step": 243000 }, { "epoch": 0.29333253695540495, "learning_rate": 9.058659524701808e-06, "loss": 3.487945861816406, "step": 243100 }, { "epoch": 0.2934532002778876, "learning_rate": 9.05825568923407e-06, "loss": 3.4756591796875, "step": 243200 }, { "epoch": 0.2935738636003703, "learning_rate": 9.057851853766332e-06, "loss": 3.479200439453125, "step": 243300 }, { "epoch": 0.293694526922853, "learning_rate": 9.057448018298594e-06, "loss": 3.5223843383789064, "step": 243400 }, { "epoch": 0.2938151902453357, "learning_rate": 9.057044182830856e-06, "loss": 3.508787841796875, "step": 243500 }, { "epoch": 0.2939358535678184, "learning_rate": 9.056640347363118e-06, "loss": 3.522214660644531, "step": 243600 }, { "epoch": 0.29405651689030105, "learning_rate": 9.056236511895378e-06, "loss": 3.505821533203125, "step": 243700 }, { "epoch": 0.2941771802127837, "learning_rate": 9.05583267642764e-06, "loss": 3.524658508300781, "step": 243800 }, { "epoch": 0.29429784353526645, "learning_rate": 9.055428840959902e-06, "loss": 3.4910598754882813, "step": 243900 }, { "epoch": 0.2944185068577491, "learning_rate": 9.055025005492162e-06, "loss": 3.5071173095703125, "step": 244000 }, { "epoch": 0.2945391701802318, "learning_rate": 9.054621170024424e-06, "loss": 3.5092437744140623, "step": 244100 }, { "epoch": 0.29465983350271446, "learning_rate": 9.054217334556686e-06, "loss": 3.504959716796875, "step": 244200 }, { "epoch": 0.29478049682519714, "learning_rate": 9.053813499088948e-06, "loss": 3.512716979980469, "step": 244300 }, { "epoch": 0.29490116014767986, "learning_rate": 9.05340966362121e-06, "loss": 3.5111618041992188, "step": 244400 }, { "epoch": 0.29502182347016254, "learning_rate": 9.053005828153472e-06, "loss": 3.4888232421875, "step": 244500 }, { "epoch": 0.2951424867926452, "learning_rate": 9.052601992685732e-06, "loss": 3.49567138671875, "step": 244600 }, { "epoch": 0.2952631501151279, "learning_rate": 9.052198157217994e-06, "loss": 3.5268939208984373, "step": 244700 }, { "epoch": 0.29538381343761055, "learning_rate": 9.051794321750256e-06, "loss": 3.4814801025390625, "step": 244800 }, { "epoch": 0.2955044767600933, "learning_rate": 9.051390486282517e-06, "loss": 3.5128665161132813, "step": 244900 }, { "epoch": 0.29562514008257595, "learning_rate": 9.050986650814779e-06, "loss": 3.5191455078125, "step": 245000 }, { "epoch": 0.2957458034050586, "learning_rate": 9.05058281534704e-06, "loss": 3.4879742431640626, "step": 245100 }, { "epoch": 0.2958664667275413, "learning_rate": 9.050178979879303e-06, "loss": 3.487076416015625, "step": 245200 }, { "epoch": 0.29598713005002397, "learning_rate": 9.049775144411565e-06, "loss": 3.495189208984375, "step": 245300 }, { "epoch": 0.2961077933725067, "learning_rate": 9.049371308943825e-06, "loss": 3.523011474609375, "step": 245400 }, { "epoch": 0.2962284566949894, "learning_rate": 9.048967473476087e-06, "loss": 3.5369317626953123, "step": 245500 }, { "epoch": 0.29634912001747205, "learning_rate": 9.048563638008349e-06, "loss": 3.493325500488281, "step": 245600 }, { "epoch": 0.2964697833399547, "learning_rate": 9.048159802540611e-06, "loss": 3.4990829467773437, "step": 245700 }, { "epoch": 0.2965904466624374, "learning_rate": 9.047755967072873e-06, "loss": 3.4918212890625, "step": 245800 }, { "epoch": 0.2967111099849201, "learning_rate": 9.047352131605133e-06, "loss": 3.5048931884765624, "step": 245900 }, { "epoch": 0.2968317733074028, "learning_rate": 9.046948296137395e-06, "loss": 3.501866760253906, "step": 246000 }, { "epoch": 0.29695243662988546, "learning_rate": 9.046544460669657e-06, "loss": 3.4870660400390623, "step": 246100 }, { "epoch": 0.29707309995236814, "learning_rate": 9.046140625201917e-06, "loss": 3.496470947265625, "step": 246200 }, { "epoch": 0.29719376327485086, "learning_rate": 9.04573678973418e-06, "loss": 3.4828750610351564, "step": 246300 }, { "epoch": 0.29731442659733354, "learning_rate": 9.045332954266441e-06, "loss": 3.51740966796875, "step": 246400 }, { "epoch": 0.2974350899198162, "learning_rate": 9.044929118798703e-06, "loss": 3.495346984863281, "step": 246500 }, { "epoch": 0.2975557532422989, "learning_rate": 9.044525283330965e-06, "loss": 3.4912945556640627, "step": 246600 }, { "epoch": 0.29767641656478155, "learning_rate": 9.044121447863227e-06, "loss": 3.474295654296875, "step": 246700 }, { "epoch": 0.2977970798872643, "learning_rate": 9.043717612395488e-06, "loss": 3.5308804321289062, "step": 246800 }, { "epoch": 0.29791774320974695, "learning_rate": 9.04331377692775e-06, "loss": 3.511390380859375, "step": 246900 }, { "epoch": 0.2980384065322296, "learning_rate": 9.042909941460012e-06, "loss": 3.5071051025390627, "step": 247000 }, { "epoch": 0.2981590698547123, "learning_rate": 9.042506105992272e-06, "loss": 3.499173583984375, "step": 247100 }, { "epoch": 0.298279733177195, "learning_rate": 9.042102270524534e-06, "loss": 3.4815493774414064, "step": 247200 }, { "epoch": 0.2984003964996777, "learning_rate": 9.041698435056796e-06, "loss": 3.486444091796875, "step": 247300 }, { "epoch": 0.2985210598221604, "learning_rate": 9.041294599589058e-06, "loss": 3.53158447265625, "step": 247400 }, { "epoch": 0.29864172314464305, "learning_rate": 9.04089076412132e-06, "loss": 3.4900189208984376, "step": 247500 }, { "epoch": 0.2987623864671257, "learning_rate": 9.040486928653582e-06, "loss": 3.4843649291992187, "step": 247600 }, { "epoch": 0.2988830497896084, "learning_rate": 9.040083093185844e-06, "loss": 3.5197415161132812, "step": 247700 }, { "epoch": 0.2990037131120911, "learning_rate": 9.039679257718104e-06, "loss": 3.4803619384765625, "step": 247800 }, { "epoch": 0.2991243764345738, "learning_rate": 9.039275422250366e-06, "loss": 3.492481994628906, "step": 247900 }, { "epoch": 0.29924503975705646, "learning_rate": 9.038871586782626e-06, "loss": 3.4937982177734375, "step": 248000 }, { "epoch": 0.29936570307953914, "learning_rate": 9.038467751314888e-06, "loss": 3.4978997802734373, "step": 248100 }, { "epoch": 0.2994863664020218, "learning_rate": 9.03806391584715e-06, "loss": 3.4873727416992186, "step": 248200 }, { "epoch": 0.29960702972450454, "learning_rate": 9.037660080379412e-06, "loss": 3.463453369140625, "step": 248300 }, { "epoch": 0.2997276930469872, "learning_rate": 9.037256244911674e-06, "loss": 3.4962835693359375, "step": 248400 }, { "epoch": 0.2998483563694699, "learning_rate": 9.036852409443936e-06, "loss": 3.4929794311523437, "step": 248500 }, { "epoch": 0.29996901969195255, "learning_rate": 9.036448573976198e-06, "loss": 3.4812042236328127, "step": 248600 }, { "epoch": 0.3000896830144353, "learning_rate": 9.036044738508458e-06, "loss": 3.54179443359375, "step": 248700 }, { "epoch": 0.30021034633691795, "learning_rate": 9.03564090304072e-06, "loss": 3.4588742065429687, "step": 248800 }, { "epoch": 0.3003310096594006, "learning_rate": 9.035237067572982e-06, "loss": 3.4777667236328127, "step": 248900 }, { "epoch": 0.3004516729818833, "learning_rate": 9.034833232105243e-06, "loss": 3.4772689819335936, "step": 249000 }, { "epoch": 0.300572336304366, "learning_rate": 9.034429396637505e-06, "loss": 3.4955755615234376, "step": 249100 }, { "epoch": 0.3006929996268487, "learning_rate": 9.034025561169767e-06, "loss": 3.4750491333007814, "step": 249200 }, { "epoch": 0.3008136629493314, "learning_rate": 9.033621725702029e-06, "loss": 3.4789614868164063, "step": 249300 }, { "epoch": 0.30093432627181405, "learning_rate": 9.03321789023429e-06, "loss": 3.484339294433594, "step": 249400 }, { "epoch": 0.3010549895942967, "learning_rate": 9.032814054766551e-06, "loss": 3.492952880859375, "step": 249500 }, { "epoch": 0.3011756529167794, "learning_rate": 9.032410219298813e-06, "loss": 3.4924002075195313, "step": 249600 }, { "epoch": 0.3012963162392621, "learning_rate": 9.032006383831075e-06, "loss": 3.479683532714844, "step": 249700 }, { "epoch": 0.3014169795617448, "learning_rate": 9.031602548363337e-06, "loss": 3.49135986328125, "step": 249800 }, { "epoch": 0.30153764288422746, "learning_rate": 9.031198712895597e-06, "loss": 3.4717813110351563, "step": 249900 }, { "epoch": 0.30165830620671014, "learning_rate": 9.03079487742786e-06, "loss": 3.507582092285156, "step": 250000 }, { "epoch": 0.3017789695291928, "learning_rate": 9.030391041960121e-06, "loss": 3.4800839233398437, "step": 250100 }, { "epoch": 0.30189963285167554, "learning_rate": 9.029987206492383e-06, "loss": 3.4723468017578125, "step": 250200 }, { "epoch": 0.3020202961741582, "learning_rate": 9.029583371024643e-06, "loss": 3.460505065917969, "step": 250300 }, { "epoch": 0.3021409594966409, "learning_rate": 9.029179535556905e-06, "loss": 3.4752301025390624, "step": 250400 }, { "epoch": 0.30226162281912355, "learning_rate": 9.028775700089167e-06, "loss": 3.4550735473632814, "step": 250500 }, { "epoch": 0.3023822861416062, "learning_rate": 9.02837186462143e-06, "loss": 3.459894714355469, "step": 250600 }, { "epoch": 0.30250294946408895, "learning_rate": 9.027968029153691e-06, "loss": 3.491341552734375, "step": 250700 }, { "epoch": 0.3026236127865716, "learning_rate": 9.027564193685953e-06, "loss": 3.4609600830078127, "step": 250800 }, { "epoch": 0.3027442761090543, "learning_rate": 9.027160358218214e-06, "loss": 3.4603173828125, "step": 250900 }, { "epoch": 0.302864939431537, "learning_rate": 9.026756522750476e-06, "loss": 3.4639407348632814, "step": 251000 }, { "epoch": 0.30298560275401965, "learning_rate": 9.026352687282736e-06, "loss": 3.47100830078125, "step": 251100 }, { "epoch": 0.3031062660765024, "learning_rate": 9.025948851814998e-06, "loss": 3.4888729858398437, "step": 251200 }, { "epoch": 0.30322692939898505, "learning_rate": 9.02554501634726e-06, "loss": 3.490747375488281, "step": 251300 }, { "epoch": 0.3033475927214677, "learning_rate": 9.025141180879522e-06, "loss": 3.4747659301757814, "step": 251400 }, { "epoch": 0.3034682560439504, "learning_rate": 9.024737345411784e-06, "loss": 3.468287353515625, "step": 251500 }, { "epoch": 0.3035889193664331, "learning_rate": 9.024333509944046e-06, "loss": 3.4877108764648437, "step": 251600 }, { "epoch": 0.3037095826889158, "learning_rate": 9.023929674476308e-06, "loss": 3.481889343261719, "step": 251700 }, { "epoch": 0.30383024601139846, "learning_rate": 9.02352583900857e-06, "loss": 3.4864935302734374, "step": 251800 }, { "epoch": 0.30395090933388114, "learning_rate": 9.02312200354083e-06, "loss": 3.4692153930664062, "step": 251900 }, { "epoch": 0.3040715726563638, "learning_rate": 9.022718168073092e-06, "loss": 3.477308349609375, "step": 252000 }, { "epoch": 0.30419223597884654, "learning_rate": 9.022314332605352e-06, "loss": 3.4716461181640623, "step": 252100 }, { "epoch": 0.3043128993013292, "learning_rate": 9.021910497137614e-06, "loss": 3.4954263305664064, "step": 252200 }, { "epoch": 0.3044335626238119, "learning_rate": 9.021506661669876e-06, "loss": 3.446484375, "step": 252300 }, { "epoch": 0.30455422594629455, "learning_rate": 9.021102826202138e-06, "loss": 3.4822540283203125, "step": 252400 }, { "epoch": 0.3046748892687772, "learning_rate": 9.0206989907344e-06, "loss": 3.4629345703125, "step": 252500 }, { "epoch": 0.30479555259125996, "learning_rate": 9.020295155266662e-06, "loss": 3.49714599609375, "step": 252600 }, { "epoch": 0.3049162159137426, "learning_rate": 9.019891319798924e-06, "loss": 3.4701107788085936, "step": 252700 }, { "epoch": 0.3050368792362253, "learning_rate": 9.019487484331185e-06, "loss": 3.4754180908203125, "step": 252800 }, { "epoch": 0.305157542558708, "learning_rate": 9.019083648863446e-06, "loss": 3.4624261474609375, "step": 252900 }, { "epoch": 0.30527820588119065, "learning_rate": 9.018679813395708e-06, "loss": 3.47029296875, "step": 253000 }, { "epoch": 0.3053988692036734, "learning_rate": 9.018275977927969e-06, "loss": 3.449705810546875, "step": 253100 }, { "epoch": 0.30551953252615605, "learning_rate": 9.01787214246023e-06, "loss": 3.4592404174804687, "step": 253200 }, { "epoch": 0.3056401958486387, "learning_rate": 9.017468306992493e-06, "loss": 3.4513589477539064, "step": 253300 }, { "epoch": 0.3057608591711214, "learning_rate": 9.017064471524755e-06, "loss": 3.45432373046875, "step": 253400 }, { "epoch": 0.30588152249360406, "learning_rate": 9.016660636057017e-06, "loss": 3.4828924560546874, "step": 253500 }, { "epoch": 0.3060021858160868, "learning_rate": 9.016256800589277e-06, "loss": 3.487909851074219, "step": 253600 }, { "epoch": 0.30612284913856946, "learning_rate": 9.015852965121539e-06, "loss": 3.48064697265625, "step": 253700 }, { "epoch": 0.30624351246105214, "learning_rate": 9.015449129653801e-06, "loss": 3.459417724609375, "step": 253800 }, { "epoch": 0.3063641757835348, "learning_rate": 9.015045294186063e-06, "loss": 3.430541687011719, "step": 253900 }, { "epoch": 0.30648483910601754, "learning_rate": 9.014641458718323e-06, "loss": 3.4528570556640625, "step": 254000 }, { "epoch": 0.3066055024285002, "learning_rate": 9.014237623250585e-06, "loss": 3.4385220336914064, "step": 254100 }, { "epoch": 0.3067261657509829, "learning_rate": 9.013833787782847e-06, "loss": 3.4766796875, "step": 254200 }, { "epoch": 0.30684682907346555, "learning_rate": 9.01342995231511e-06, "loss": 3.4515109252929688, "step": 254300 }, { "epoch": 0.3069674923959482, "learning_rate": 9.01302611684737e-06, "loss": 3.466062316894531, "step": 254400 }, { "epoch": 0.30708815571843096, "learning_rate": 9.012622281379631e-06, "loss": 3.459525451660156, "step": 254500 }, { "epoch": 0.3072088190409136, "learning_rate": 9.012218445911893e-06, "loss": 3.4751983642578126, "step": 254600 }, { "epoch": 0.3073294823633963, "learning_rate": 9.011814610444155e-06, "loss": 3.4866497802734373, "step": 254700 }, { "epoch": 0.307450145685879, "learning_rate": 9.011410774976417e-06, "loss": 3.47266845703125, "step": 254800 }, { "epoch": 0.30757080900836165, "learning_rate": 9.01100693950868e-06, "loss": 3.452107238769531, "step": 254900 }, { "epoch": 0.3076914723308444, "learning_rate": 9.01060310404094e-06, "loss": 3.4435076904296875, "step": 255000 }, { "epoch": 0.30781213565332705, "learning_rate": 9.010199268573202e-06, "loss": 3.458359375, "step": 255100 }, { "epoch": 0.3079327989758097, "learning_rate": 9.009795433105462e-06, "loss": 3.4515771484375, "step": 255200 }, { "epoch": 0.3080534622982924, "learning_rate": 9.009391597637724e-06, "loss": 3.4601556396484376, "step": 255300 }, { "epoch": 0.30817412562077506, "learning_rate": 9.008987762169986e-06, "loss": 3.4779644775390626, "step": 255400 }, { "epoch": 0.3082947889432578, "learning_rate": 9.008583926702248e-06, "loss": 3.443705749511719, "step": 255500 }, { "epoch": 0.30841545226574046, "learning_rate": 9.00818009123451e-06, "loss": 3.4390463256835937, "step": 255600 }, { "epoch": 0.30853611558822314, "learning_rate": 9.007776255766772e-06, "loss": 3.4790573120117188, "step": 255700 }, { "epoch": 0.3086567789107058, "learning_rate": 9.007372420299034e-06, "loss": 3.4838552856445313, "step": 255800 }, { "epoch": 0.3087774422331885, "learning_rate": 9.006968584831294e-06, "loss": 3.491734619140625, "step": 255900 }, { "epoch": 0.3088981055556712, "learning_rate": 9.006564749363556e-06, "loss": 3.4590802001953125, "step": 256000 }, { "epoch": 0.3090187688781539, "learning_rate": 9.006160913895818e-06, "loss": 3.4694879150390623, "step": 256100 }, { "epoch": 0.30913943220063655, "learning_rate": 9.005757078428078e-06, "loss": 3.476360168457031, "step": 256200 }, { "epoch": 0.3092600955231192, "learning_rate": 9.00535324296034e-06, "loss": 3.4748306274414062, "step": 256300 }, { "epoch": 0.3093807588456019, "learning_rate": 9.004949407492602e-06, "loss": 3.4740774536132815, "step": 256400 }, { "epoch": 0.30950142216808463, "learning_rate": 9.004545572024864e-06, "loss": 3.4562893676757813, "step": 256500 }, { "epoch": 0.3096220854905673, "learning_rate": 9.004141736557126e-06, "loss": 3.4700558471679686, "step": 256600 }, { "epoch": 0.30974274881305, "learning_rate": 9.003737901089388e-06, "loss": 3.483645324707031, "step": 256700 }, { "epoch": 0.30986341213553265, "learning_rate": 9.003334065621649e-06, "loss": 3.4599957275390625, "step": 256800 }, { "epoch": 0.3099840754580154, "learning_rate": 9.00293023015391e-06, "loss": 3.4322518920898437, "step": 256900 }, { "epoch": 0.31010473878049805, "learning_rate": 9.002526394686173e-06, "loss": 3.4546319580078126, "step": 257000 }, { "epoch": 0.3102254021029807, "learning_rate": 9.002122559218433e-06, "loss": 3.4382232666015624, "step": 257100 }, { "epoch": 0.3103460654254634, "learning_rate": 9.001718723750695e-06, "loss": 3.4302105712890625, "step": 257200 }, { "epoch": 0.31046672874794606, "learning_rate": 9.001314888282957e-06, "loss": 3.4439813232421876, "step": 257300 }, { "epoch": 0.3105873920704288, "learning_rate": 9.000911052815219e-06, "loss": 3.4578170776367188, "step": 257400 }, { "epoch": 0.31070805539291146, "learning_rate": 9.00050721734748e-06, "loss": 3.4609609985351564, "step": 257500 }, { "epoch": 0.31082871871539414, "learning_rate": 9.000103381879743e-06, "loss": 3.446241455078125, "step": 257600 }, { "epoch": 0.3109493820378768, "learning_rate": 8.999699546412003e-06, "loss": 3.454146728515625, "step": 257700 }, { "epoch": 0.3110700453603595, "learning_rate": 8.999295710944265e-06, "loss": 3.4278073120117187, "step": 257800 }, { "epoch": 0.3111907086828422, "learning_rate": 8.998891875476527e-06, "loss": 3.448636779785156, "step": 257900 }, { "epoch": 0.3113113720053249, "learning_rate": 8.998488040008789e-06, "loss": 3.4290347290039063, "step": 258000 }, { "epoch": 0.31143203532780755, "learning_rate": 8.99808420454105e-06, "loss": 3.467711181640625, "step": 258100 }, { "epoch": 0.3115526986502902, "learning_rate": 8.997680369073311e-06, "loss": 3.486952209472656, "step": 258200 }, { "epoch": 0.3116733619727729, "learning_rate": 8.997276533605573e-06, "loss": 3.483233642578125, "step": 258300 }, { "epoch": 0.31179402529525563, "learning_rate": 8.996872698137835e-06, "loss": 3.4470220947265626, "step": 258400 }, { "epoch": 0.3119146886177383, "learning_rate": 8.996468862670095e-06, "loss": 3.45255615234375, "step": 258500 }, { "epoch": 0.312035351940221, "learning_rate": 8.996065027202357e-06, "loss": 3.4778948974609376, "step": 258600 }, { "epoch": 0.31215601526270365, "learning_rate": 8.99566119173462e-06, "loss": 3.448267517089844, "step": 258700 }, { "epoch": 0.3122766785851863, "learning_rate": 8.995257356266881e-06, "loss": 3.4616732788085938, "step": 258800 }, { "epoch": 0.31239734190766905, "learning_rate": 8.994853520799143e-06, "loss": 3.4321258544921873, "step": 258900 }, { "epoch": 0.3125180052301517, "learning_rate": 8.994449685331404e-06, "loss": 3.4414938354492186, "step": 259000 }, { "epoch": 0.3126386685526344, "learning_rate": 8.994045849863666e-06, "loss": 3.442357482910156, "step": 259100 }, { "epoch": 0.31275933187511706, "learning_rate": 8.993642014395928e-06, "loss": 3.451965026855469, "step": 259200 }, { "epoch": 0.3128799951975998, "learning_rate": 8.993238178928188e-06, "loss": 3.4376675415039064, "step": 259300 }, { "epoch": 0.31300065852008246, "learning_rate": 8.99283434346045e-06, "loss": 3.4315447998046875, "step": 259400 }, { "epoch": 0.31312132184256514, "learning_rate": 8.992430507992712e-06, "loss": 3.4639126586914064, "step": 259500 }, { "epoch": 0.3132419851650478, "learning_rate": 8.992026672524974e-06, "loss": 3.438892517089844, "step": 259600 }, { "epoch": 0.3133626484875305, "learning_rate": 8.991622837057236e-06, "loss": 3.4461026000976562, "step": 259700 }, { "epoch": 0.3134833118100132, "learning_rate": 8.991219001589498e-06, "loss": 3.430269775390625, "step": 259800 }, { "epoch": 0.3136039751324959, "learning_rate": 8.99081516612176e-06, "loss": 3.4286233520507814, "step": 259900 }, { "epoch": 0.31372463845497855, "learning_rate": 8.99041133065402e-06, "loss": 3.4094638061523437, "step": 260000 }, { "epoch": 0.3138453017774612, "learning_rate": 8.990007495186282e-06, "loss": 3.471685485839844, "step": 260100 }, { "epoch": 0.3139659650999439, "learning_rate": 8.989603659718542e-06, "loss": 3.441114807128906, "step": 260200 }, { "epoch": 0.31408662842242663, "learning_rate": 8.989199824250804e-06, "loss": 3.4295526123046876, "step": 260300 }, { "epoch": 0.3142072917449093, "learning_rate": 8.988795988783066e-06, "loss": 3.449185485839844, "step": 260400 }, { "epoch": 0.314327955067392, "learning_rate": 8.988392153315328e-06, "loss": 3.433816223144531, "step": 260500 }, { "epoch": 0.31444861838987465, "learning_rate": 8.98798831784759e-06, "loss": 3.4271749877929687, "step": 260600 }, { "epoch": 0.3145692817123573, "learning_rate": 8.987584482379852e-06, "loss": 3.426239318847656, "step": 260700 }, { "epoch": 0.31468994503484005, "learning_rate": 8.987180646912114e-06, "loss": 3.441658630371094, "step": 260800 }, { "epoch": 0.3148106083573227, "learning_rate": 8.986776811444375e-06, "loss": 3.446959228515625, "step": 260900 }, { "epoch": 0.3149312716798054, "learning_rate": 8.986372975976637e-06, "loss": 3.4415554809570312, "step": 261000 }, { "epoch": 0.31505193500228806, "learning_rate": 8.985969140508899e-06, "loss": 3.459325866699219, "step": 261100 }, { "epoch": 0.31517259832477074, "learning_rate": 8.985565305041159e-06, "loss": 3.4426275634765626, "step": 261200 }, { "epoch": 0.31529326164725346, "learning_rate": 8.98516146957342e-06, "loss": 3.4380389404296876, "step": 261300 }, { "epoch": 0.31541392496973614, "learning_rate": 8.984757634105683e-06, "loss": 3.4577291870117186, "step": 261400 }, { "epoch": 0.3155345882922188, "learning_rate": 8.984353798637945e-06, "loss": 3.4526336669921873, "step": 261500 }, { "epoch": 0.3156552516147015, "learning_rate": 8.983949963170207e-06, "loss": 3.4343365478515624, "step": 261600 }, { "epoch": 0.3157759149371842, "learning_rate": 8.983546127702467e-06, "loss": 3.4428106689453126, "step": 261700 }, { "epoch": 0.3158965782596669, "learning_rate": 8.983142292234729e-06, "loss": 3.4348904418945314, "step": 261800 }, { "epoch": 0.31601724158214956, "learning_rate": 8.982738456766991e-06, "loss": 3.439107666015625, "step": 261900 }, { "epoch": 0.3161379049046322, "learning_rate": 8.982334621299253e-06, "loss": 3.4811529541015624, "step": 262000 }, { "epoch": 0.3162585682271149, "learning_rate": 8.981930785831513e-06, "loss": 3.425936279296875, "step": 262100 }, { "epoch": 0.31637923154959763, "learning_rate": 8.981526950363775e-06, "loss": 3.4206106567382815, "step": 262200 }, { "epoch": 0.3164998948720803, "learning_rate": 8.981123114896037e-06, "loss": 3.430743408203125, "step": 262300 }, { "epoch": 0.316620558194563, "learning_rate": 8.9807192794283e-06, "loss": 3.445758972167969, "step": 262400 }, { "epoch": 0.31674122151704565, "learning_rate": 8.980315443960561e-06, "loss": 3.429609375, "step": 262500 }, { "epoch": 0.3168618848395283, "learning_rate": 8.979911608492822e-06, "loss": 3.4421597290039063, "step": 262600 }, { "epoch": 0.31698254816201105, "learning_rate": 8.979507773025083e-06, "loss": 3.43178466796875, "step": 262700 }, { "epoch": 0.3171032114844937, "learning_rate": 8.979103937557345e-06, "loss": 3.4656103515625, "step": 262800 }, { "epoch": 0.3172238748069764, "learning_rate": 8.978700102089607e-06, "loss": 3.4023223876953126, "step": 262900 }, { "epoch": 0.31734453812945906, "learning_rate": 8.97829626662187e-06, "loss": 3.416497802734375, "step": 263000 }, { "epoch": 0.31746520145194174, "learning_rate": 8.97789243115413e-06, "loss": 3.4252813720703124, "step": 263100 }, { "epoch": 0.31758586477442446, "learning_rate": 8.977488595686392e-06, "loss": 3.4430691528320314, "step": 263200 }, { "epoch": 0.31770652809690714, "learning_rate": 8.977084760218654e-06, "loss": 3.426926574707031, "step": 263300 }, { "epoch": 0.3178271914193898, "learning_rate": 8.976680924750914e-06, "loss": 3.4162826538085938, "step": 263400 }, { "epoch": 0.3179478547418725, "learning_rate": 8.976277089283176e-06, "loss": 3.4495684814453127, "step": 263500 }, { "epoch": 0.31806851806435515, "learning_rate": 8.975873253815438e-06, "loss": 3.443098449707031, "step": 263600 }, { "epoch": 0.3181891813868379, "learning_rate": 8.9754694183477e-06, "loss": 3.4121856689453125, "step": 263700 }, { "epoch": 0.31830984470932056, "learning_rate": 8.975065582879962e-06, "loss": 3.4222564697265625, "step": 263800 }, { "epoch": 0.3184305080318032, "learning_rate": 8.974661747412224e-06, "loss": 3.457413635253906, "step": 263900 }, { "epoch": 0.3185511713542859, "learning_rate": 8.974257911944486e-06, "loss": 3.4241983032226564, "step": 264000 }, { "epoch": 0.3186718346767686, "learning_rate": 8.973854076476746e-06, "loss": 3.471674499511719, "step": 264100 }, { "epoch": 0.3187924979992513, "learning_rate": 8.973450241009008e-06, "loss": 3.458307800292969, "step": 264200 }, { "epoch": 0.318913161321734, "learning_rate": 8.973046405541268e-06, "loss": 3.4418869018554688, "step": 264300 }, { "epoch": 0.31903382464421665, "learning_rate": 8.97264257007353e-06, "loss": 3.424395751953125, "step": 264400 }, { "epoch": 0.3191544879666993, "learning_rate": 8.972238734605792e-06, "loss": 3.43928955078125, "step": 264500 }, { "epoch": 0.31927515128918205, "learning_rate": 8.971834899138054e-06, "loss": 3.4374850463867186, "step": 264600 }, { "epoch": 0.3193958146116647, "learning_rate": 8.971431063670316e-06, "loss": 3.413984375, "step": 264700 }, { "epoch": 0.3195164779341474, "learning_rate": 8.971027228202578e-06, "loss": 3.422423095703125, "step": 264800 }, { "epoch": 0.31963714125663006, "learning_rate": 8.97062339273484e-06, "loss": 3.4129583740234377, "step": 264900 }, { "epoch": 0.31975780457911274, "learning_rate": 8.9702195572671e-06, "loss": 3.4327459716796875, "step": 265000 }, { "epoch": 0.31987846790159546, "learning_rate": 8.969815721799363e-06, "loss": 3.452320251464844, "step": 265100 }, { "epoch": 0.31999913122407814, "learning_rate": 8.969411886331625e-06, "loss": 3.4316326904296877, "step": 265200 }, { "epoch": 0.3201197945465608, "learning_rate": 8.969008050863885e-06, "loss": 3.422105407714844, "step": 265300 }, { "epoch": 0.3202404578690435, "learning_rate": 8.968604215396147e-06, "loss": 3.448186340332031, "step": 265400 }, { "epoch": 0.32036112119152615, "learning_rate": 8.968200379928409e-06, "loss": 3.4348150634765626, "step": 265500 }, { "epoch": 0.3204817845140089, "learning_rate": 8.96779654446067e-06, "loss": 3.4232470703125, "step": 265600 }, { "epoch": 0.32060244783649156, "learning_rate": 8.967392708992933e-06, "loss": 3.420945739746094, "step": 265700 }, { "epoch": 0.32072311115897423, "learning_rate": 8.966988873525193e-06, "loss": 3.418802490234375, "step": 265800 }, { "epoch": 0.3208437744814569, "learning_rate": 8.966585038057455e-06, "loss": 3.4635491943359376, "step": 265900 }, { "epoch": 0.3209644378039396, "learning_rate": 8.966181202589717e-06, "loss": 3.439429931640625, "step": 266000 }, { "epoch": 0.3210851011264223, "learning_rate": 8.965777367121979e-06, "loss": 3.417015380859375, "step": 266100 }, { "epoch": 0.321205764448905, "learning_rate": 8.96537353165424e-06, "loss": 3.4199600219726562, "step": 266200 }, { "epoch": 0.32132642777138765, "learning_rate": 8.964969696186501e-06, "loss": 3.389524230957031, "step": 266300 }, { "epoch": 0.3214470910938703, "learning_rate": 8.964565860718763e-06, "loss": 3.4148764038085937, "step": 266400 }, { "epoch": 0.321567754416353, "learning_rate": 8.964162025251025e-06, "loss": 3.430206298828125, "step": 266500 }, { "epoch": 0.3216884177388357, "learning_rate": 8.963758189783286e-06, "loss": 3.4072830200195314, "step": 266600 }, { "epoch": 0.3218090810613184, "learning_rate": 8.963354354315548e-06, "loss": 3.4197808837890626, "step": 266700 }, { "epoch": 0.32192974438380106, "learning_rate": 8.96295051884781e-06, "loss": 3.4132696533203126, "step": 266800 }, { "epoch": 0.32205040770628374, "learning_rate": 8.962546683380072e-06, "loss": 3.3937384033203126, "step": 266900 }, { "epoch": 0.32217107102876646, "learning_rate": 8.962142847912333e-06, "loss": 3.4091748046875, "step": 267000 }, { "epoch": 0.32229173435124914, "learning_rate": 8.961739012444595e-06, "loss": 3.4112197875976564, "step": 267100 }, { "epoch": 0.3224123976737318, "learning_rate": 8.961335176976856e-06, "loss": 3.434464111328125, "step": 267200 }, { "epoch": 0.3225330609962145, "learning_rate": 8.960931341509118e-06, "loss": 3.4558660888671877, "step": 267300 }, { "epoch": 0.32265372431869715, "learning_rate": 8.960527506041378e-06, "loss": 3.422171936035156, "step": 267400 }, { "epoch": 0.3227743876411799, "learning_rate": 8.96012367057364e-06, "loss": 3.4338082885742187, "step": 267500 }, { "epoch": 0.32289505096366256, "learning_rate": 8.959719835105902e-06, "loss": 3.4131838989257814, "step": 267600 }, { "epoch": 0.32301571428614523, "learning_rate": 8.959315999638164e-06, "loss": 3.405376281738281, "step": 267700 }, { "epoch": 0.3231363776086279, "learning_rate": 8.958912164170426e-06, "loss": 3.41404541015625, "step": 267800 }, { "epoch": 0.3232570409311106, "learning_rate": 8.958508328702688e-06, "loss": 3.4180859375, "step": 267900 }, { "epoch": 0.3233777042535933, "learning_rate": 8.95810449323495e-06, "loss": 3.4190237426757815, "step": 268000 }, { "epoch": 0.323498367576076, "learning_rate": 8.95770065776721e-06, "loss": 3.431121826171875, "step": 268100 }, { "epoch": 0.32361903089855865, "learning_rate": 8.957296822299472e-06, "loss": 3.3913348388671873, "step": 268200 }, { "epoch": 0.3237396942210413, "learning_rate": 8.956892986831734e-06, "loss": 3.414170837402344, "step": 268300 }, { "epoch": 0.323860357543524, "learning_rate": 8.956489151363994e-06, "loss": 3.4269586181640626, "step": 268400 }, { "epoch": 0.3239810208660067, "learning_rate": 8.956085315896256e-06, "loss": 3.4055206298828127, "step": 268500 }, { "epoch": 0.3241016841884894, "learning_rate": 8.955681480428518e-06, "loss": 3.427828674316406, "step": 268600 }, { "epoch": 0.32422234751097206, "learning_rate": 8.95527764496078e-06, "loss": 3.4393997192382812, "step": 268700 }, { "epoch": 0.32434301083345474, "learning_rate": 8.954873809493042e-06, "loss": 3.4129901123046875, "step": 268800 }, { "epoch": 0.3244636741559374, "learning_rate": 8.954469974025304e-06, "loss": 3.407271423339844, "step": 268900 }, { "epoch": 0.32458433747842014, "learning_rate": 8.954066138557566e-06, "loss": 3.4225839233398436, "step": 269000 }, { "epoch": 0.3247050008009028, "learning_rate": 8.953662303089827e-06, "loss": 3.4220285034179687, "step": 269100 }, { "epoch": 0.3248256641233855, "learning_rate": 8.953258467622089e-06, "loss": 3.430135498046875, "step": 269200 }, { "epoch": 0.32494632744586815, "learning_rate": 8.952854632154349e-06, "loss": 3.402149963378906, "step": 269300 }, { "epoch": 0.3250669907683508, "learning_rate": 8.952450796686611e-06, "loss": 3.4288433837890624, "step": 269400 }, { "epoch": 0.32518765409083356, "learning_rate": 8.952046961218873e-06, "loss": 3.3944317626953127, "step": 269500 }, { "epoch": 0.32530831741331623, "learning_rate": 8.951643125751135e-06, "loss": 3.42071044921875, "step": 269600 }, { "epoch": 0.3254289807357989, "learning_rate": 8.951239290283397e-06, "loss": 3.4072747802734376, "step": 269700 }, { "epoch": 0.3255496440582816, "learning_rate": 8.950835454815659e-06, "loss": 3.4286843872070314, "step": 269800 }, { "epoch": 0.3256703073807643, "learning_rate": 8.950431619347919e-06, "loss": 3.4127377319335936, "step": 269900 }, { "epoch": 0.325790970703247, "learning_rate": 8.950027783880181e-06, "loss": 3.410301513671875, "step": 270000 }, { "epoch": 0.32591163402572965, "learning_rate": 8.949623948412443e-06, "loss": 3.4120755004882812, "step": 270100 }, { "epoch": 0.3260322973482123, "learning_rate": 8.949220112944705e-06, "loss": 3.4109710693359374, "step": 270200 }, { "epoch": 0.326152960670695, "learning_rate": 8.948816277476965e-06, "loss": 3.431054992675781, "step": 270300 }, { "epoch": 0.3262736239931777, "learning_rate": 8.948412442009227e-06, "loss": 3.435937805175781, "step": 270400 }, { "epoch": 0.3263942873156604, "learning_rate": 8.94800860654149e-06, "loss": 3.4051300048828126, "step": 270500 }, { "epoch": 0.32651495063814306, "learning_rate": 8.947604771073751e-06, "loss": 3.402293395996094, "step": 270600 }, { "epoch": 0.32663561396062574, "learning_rate": 8.947200935606012e-06, "loss": 3.4104534912109377, "step": 270700 }, { "epoch": 0.3267562772831084, "learning_rate": 8.946797100138274e-06, "loss": 3.450542297363281, "step": 270800 }, { "epoch": 0.32687694060559114, "learning_rate": 8.946393264670536e-06, "loss": 3.404408264160156, "step": 270900 }, { "epoch": 0.3269976039280738, "learning_rate": 8.945989429202798e-06, "loss": 3.3864266967773435, "step": 271000 }, { "epoch": 0.3271182672505565, "learning_rate": 8.94558559373506e-06, "loss": 3.438731384277344, "step": 271100 }, { "epoch": 0.32723893057303916, "learning_rate": 8.94518175826732e-06, "loss": 3.3691412353515626, "step": 271200 }, { "epoch": 0.3273595938955218, "learning_rate": 8.944777922799582e-06, "loss": 3.418052978515625, "step": 271300 }, { "epoch": 0.32748025721800456, "learning_rate": 8.944374087331844e-06, "loss": 3.402443542480469, "step": 271400 }, { "epoch": 0.32760092054048723, "learning_rate": 8.943970251864104e-06, "loss": 3.4133282470703126, "step": 271500 }, { "epoch": 0.3277215838629699, "learning_rate": 8.943566416396366e-06, "loss": 3.4210699462890624, "step": 271600 }, { "epoch": 0.3278422471854526, "learning_rate": 8.943162580928628e-06, "loss": 3.394195556640625, "step": 271700 }, { "epoch": 0.32796291050793525, "learning_rate": 8.94275874546089e-06, "loss": 3.3984625244140627, "step": 271800 }, { "epoch": 0.328083573830418, "learning_rate": 8.942354909993152e-06, "loss": 3.4185125732421877, "step": 271900 }, { "epoch": 0.32820423715290065, "learning_rate": 8.941951074525414e-06, "loss": 3.3967440795898436, "step": 272000 }, { "epoch": 0.3283249004753833, "learning_rate": 8.941547239057676e-06, "loss": 3.404901123046875, "step": 272100 }, { "epoch": 0.328445563797866, "learning_rate": 8.941143403589936e-06, "loss": 3.434716796875, "step": 272200 }, { "epoch": 0.3285662271203487, "learning_rate": 8.940739568122198e-06, "loss": 3.386178283691406, "step": 272300 }, { "epoch": 0.3286868904428314, "learning_rate": 8.940335732654459e-06, "loss": 3.3972821044921875, "step": 272400 }, { "epoch": 0.32880755376531406, "learning_rate": 8.93993189718672e-06, "loss": 3.3879278564453124, "step": 272500 }, { "epoch": 0.32892821708779674, "learning_rate": 8.939528061718982e-06, "loss": 3.4064971923828127, "step": 272600 }, { "epoch": 0.3290488804102794, "learning_rate": 8.939124226251244e-06, "loss": 3.384049987792969, "step": 272700 }, { "epoch": 0.32916954373276214, "learning_rate": 8.938720390783506e-06, "loss": 3.4083456420898437, "step": 272800 }, { "epoch": 0.3292902070552448, "learning_rate": 8.938316555315768e-06, "loss": 3.392106018066406, "step": 272900 }, { "epoch": 0.3294108703777275, "learning_rate": 8.93791271984803e-06, "loss": 3.3937637329101564, "step": 273000 }, { "epoch": 0.32953153370021016, "learning_rate": 8.93750888438029e-06, "loss": 3.4171212768554686, "step": 273100 }, { "epoch": 0.3296521970226928, "learning_rate": 8.937105048912553e-06, "loss": 3.382413635253906, "step": 273200 }, { "epoch": 0.32977286034517556, "learning_rate": 8.936701213444815e-06, "loss": 3.412478332519531, "step": 273300 }, { "epoch": 0.32989352366765823, "learning_rate": 8.936297377977075e-06, "loss": 3.3814852905273436, "step": 273400 }, { "epoch": 0.3300141869901409, "learning_rate": 8.935893542509337e-06, "loss": 3.3921054077148436, "step": 273500 }, { "epoch": 0.3301348503126236, "learning_rate": 8.935489707041599e-06, "loss": 3.406640625, "step": 273600 }, { "epoch": 0.33025551363510625, "learning_rate": 8.935085871573861e-06, "loss": 3.408719177246094, "step": 273700 }, { "epoch": 0.330376176957589, "learning_rate": 8.934682036106123e-06, "loss": 3.3929583740234377, "step": 273800 }, { "epoch": 0.33049684028007165, "learning_rate": 8.934278200638385e-06, "loss": 3.3913949584960936, "step": 273900 }, { "epoch": 0.3306175036025543, "learning_rate": 8.933874365170645e-06, "loss": 3.404845886230469, "step": 274000 }, { "epoch": 0.330738166925037, "learning_rate": 8.933470529702907e-06, "loss": 3.4157815551757813, "step": 274100 }, { "epoch": 0.33085883024751966, "learning_rate": 8.933066694235169e-06, "loss": 3.4067898559570313, "step": 274200 }, { "epoch": 0.3309794935700024, "learning_rate": 8.93266285876743e-06, "loss": 3.3764547729492187, "step": 274300 }, { "epoch": 0.33110015689248506, "learning_rate": 8.932259023299691e-06, "loss": 3.409166259765625, "step": 274400 }, { "epoch": 0.33122082021496774, "learning_rate": 8.931855187831953e-06, "loss": 3.3862844848632814, "step": 274500 }, { "epoch": 0.3313414835374504, "learning_rate": 8.931451352364215e-06, "loss": 3.386566467285156, "step": 274600 }, { "epoch": 0.33146214685993314, "learning_rate": 8.931047516896477e-06, "loss": 3.3982144165039063, "step": 274700 }, { "epoch": 0.3315828101824158, "learning_rate": 8.930643681428738e-06, "loss": 3.400815124511719, "step": 274800 }, { "epoch": 0.3317034735048985, "learning_rate": 8.930239845961e-06, "loss": 3.4145538330078127, "step": 274900 }, { "epoch": 0.33182413682738116, "learning_rate": 8.929836010493262e-06, "loss": 3.4297802734375, "step": 275000 }, { "epoch": 0.33194480014986383, "learning_rate": 8.929432175025524e-06, "loss": 3.41453857421875, "step": 275100 }, { "epoch": 0.33206546347234656, "learning_rate": 8.929028339557786e-06, "loss": 3.4054510498046877, "step": 275200 }, { "epoch": 0.33218612679482923, "learning_rate": 8.928624504090046e-06, "loss": 3.40883056640625, "step": 275300 }, { "epoch": 0.3323067901173119, "learning_rate": 8.928220668622308e-06, "loss": 3.395893859863281, "step": 275400 }, { "epoch": 0.3324274534397946, "learning_rate": 8.92781683315457e-06, "loss": 3.373174133300781, "step": 275500 }, { "epoch": 0.33254811676227725, "learning_rate": 8.92741299768683e-06, "loss": 3.391562194824219, "step": 275600 }, { "epoch": 0.33266878008476, "learning_rate": 8.927009162219092e-06, "loss": 3.4045245361328127, "step": 275700 }, { "epoch": 0.33278944340724265, "learning_rate": 8.926605326751354e-06, "loss": 3.406170654296875, "step": 275800 }, { "epoch": 0.3329101067297253, "learning_rate": 8.926201491283616e-06, "loss": 3.4026727294921875, "step": 275900 }, { "epoch": 0.333030770052208, "learning_rate": 8.925797655815878e-06, "loss": 3.394820556640625, "step": 276000 }, { "epoch": 0.33315143337469066, "learning_rate": 8.92539382034814e-06, "loss": 3.3794119262695315, "step": 276100 }, { "epoch": 0.3332720966971734, "learning_rate": 8.9249899848804e-06, "loss": 3.368946228027344, "step": 276200 }, { "epoch": 0.33339276001965606, "learning_rate": 8.924586149412662e-06, "loss": 3.4138827514648438, "step": 276300 }, { "epoch": 0.33351342334213874, "learning_rate": 8.924182313944924e-06, "loss": 3.3815133666992185, "step": 276400 }, { "epoch": 0.3336340866646214, "learning_rate": 8.923778478477185e-06, "loss": 3.359302673339844, "step": 276500 }, { "epoch": 0.3337547499871041, "learning_rate": 8.923374643009447e-06, "loss": 3.376070251464844, "step": 276600 }, { "epoch": 0.3338754133095868, "learning_rate": 8.922970807541709e-06, "loss": 3.35724853515625, "step": 276700 }, { "epoch": 0.3339960766320695, "learning_rate": 8.92256697207397e-06, "loss": 3.362991943359375, "step": 276800 }, { "epoch": 0.33411673995455216, "learning_rate": 8.922163136606232e-06, "loss": 3.383186950683594, "step": 276900 }, { "epoch": 0.33423740327703483, "learning_rate": 8.921759301138494e-06, "loss": 3.3990017700195314, "step": 277000 }, { "epoch": 0.3343580665995175, "learning_rate": 8.921355465670756e-06, "loss": 3.3729241943359374, "step": 277100 }, { "epoch": 0.33447872992200023, "learning_rate": 8.920951630203017e-06, "loss": 3.3886309814453126, "step": 277200 }, { "epoch": 0.3345993932444829, "learning_rate": 8.920547794735279e-06, "loss": 3.3883697509765627, "step": 277300 }, { "epoch": 0.3347200565669656, "learning_rate": 8.920143959267539e-06, "loss": 3.39986083984375, "step": 277400 }, { "epoch": 0.33484071988944825, "learning_rate": 8.919740123799801e-06, "loss": 3.388621826171875, "step": 277500 }, { "epoch": 0.334961383211931, "learning_rate": 8.919336288332063e-06, "loss": 3.39012451171875, "step": 277600 }, { "epoch": 0.33508204653441365, "learning_rate": 8.918932452864325e-06, "loss": 3.415402526855469, "step": 277700 }, { "epoch": 0.3352027098568963, "learning_rate": 8.918528617396587e-06, "loss": 3.3778555297851565, "step": 277800 }, { "epoch": 0.335323373179379, "learning_rate": 8.918124781928849e-06, "loss": 3.38413818359375, "step": 277900 }, { "epoch": 0.33544403650186166, "learning_rate": 8.917720946461111e-06, "loss": 3.4044259643554686, "step": 278000 }, { "epoch": 0.3355646998243444, "learning_rate": 8.917317110993371e-06, "loss": 3.384930419921875, "step": 278100 }, { "epoch": 0.33568536314682706, "learning_rate": 8.916913275525633e-06, "loss": 3.389382629394531, "step": 278200 }, { "epoch": 0.33580602646930974, "learning_rate": 8.916509440057895e-06, "loss": 3.363320617675781, "step": 278300 }, { "epoch": 0.3359266897917924, "learning_rate": 8.916105604590155e-06, "loss": 3.376626281738281, "step": 278400 }, { "epoch": 0.3360473531142751, "learning_rate": 8.915701769122417e-06, "loss": 3.387845153808594, "step": 278500 }, { "epoch": 0.3361680164367578, "learning_rate": 8.91529793365468e-06, "loss": 3.382444152832031, "step": 278600 }, { "epoch": 0.3362886797592405, "learning_rate": 8.914894098186941e-06, "loss": 3.3610235595703126, "step": 278700 }, { "epoch": 0.33640934308172316, "learning_rate": 8.914490262719203e-06, "loss": 3.3461782836914065, "step": 278800 }, { "epoch": 0.33653000640420583, "learning_rate": 8.914086427251464e-06, "loss": 3.344154968261719, "step": 278900 }, { "epoch": 0.3366506697266885, "learning_rate": 8.913682591783726e-06, "loss": 3.3894277954101564, "step": 279000 }, { "epoch": 0.33677133304917123, "learning_rate": 8.913278756315988e-06, "loss": 3.3843310546875, "step": 279100 }, { "epoch": 0.3368919963716539, "learning_rate": 8.91287492084825e-06, "loss": 3.392698059082031, "step": 279200 }, { "epoch": 0.3370126596941366, "learning_rate": 8.912471085380512e-06, "loss": 3.420693054199219, "step": 279300 }, { "epoch": 0.33713332301661925, "learning_rate": 8.912067249912772e-06, "loss": 3.367318115234375, "step": 279400 }, { "epoch": 0.3372539863391019, "learning_rate": 8.911663414445034e-06, "loss": 3.385009765625, "step": 279500 }, { "epoch": 0.33737464966158465, "learning_rate": 8.911259578977296e-06, "loss": 3.3924191284179686, "step": 279600 }, { "epoch": 0.3374953129840673, "learning_rate": 8.910855743509556e-06, "loss": 3.3769635009765624, "step": 279700 }, { "epoch": 0.33761597630655, "learning_rate": 8.910451908041818e-06, "loss": 3.3821453857421875, "step": 279800 }, { "epoch": 0.33773663962903266, "learning_rate": 8.91004807257408e-06, "loss": 3.37096435546875, "step": 279900 }, { "epoch": 0.3378573029515154, "learning_rate": 8.909644237106342e-06, "loss": 3.3777685546875, "step": 280000 }, { "epoch": 0.33797796627399807, "learning_rate": 8.909240401638604e-06, "loss": 3.3721749877929685, "step": 280100 }, { "epoch": 0.33809862959648074, "learning_rate": 8.908836566170866e-06, "loss": 3.395386962890625, "step": 280200 }, { "epoch": 0.3382192929189634, "learning_rate": 8.908432730703126e-06, "loss": 3.3792495727539062, "step": 280300 }, { "epoch": 0.3383399562414461, "learning_rate": 8.908028895235388e-06, "loss": 3.3678704833984376, "step": 280400 }, { "epoch": 0.3384606195639288, "learning_rate": 8.90762505976765e-06, "loss": 3.3860684204101563, "step": 280500 }, { "epoch": 0.3385812828864115, "learning_rate": 8.90722122429991e-06, "loss": 3.38067626953125, "step": 280600 }, { "epoch": 0.33870194620889416, "learning_rate": 8.906817388832173e-06, "loss": 3.4077716064453125, "step": 280700 }, { "epoch": 0.33882260953137683, "learning_rate": 8.906413553364435e-06, "loss": 3.38542236328125, "step": 280800 }, { "epoch": 0.3389432728538595, "learning_rate": 8.906009717896697e-06, "loss": 3.342257385253906, "step": 280900 }, { "epoch": 0.33906393617634223, "learning_rate": 8.905605882428959e-06, "loss": 3.411065979003906, "step": 281000 }, { "epoch": 0.3391845994988249, "learning_rate": 8.90520204696122e-06, "loss": 3.3679949951171877, "step": 281100 }, { "epoch": 0.3393052628213076, "learning_rate": 8.904798211493482e-06, "loss": 3.3774600219726563, "step": 281200 }, { "epoch": 0.33942592614379025, "learning_rate": 8.904394376025743e-06, "loss": 3.389027099609375, "step": 281300 }, { "epoch": 0.3395465894662729, "learning_rate": 8.903990540558005e-06, "loss": 3.4046002197265626, "step": 281400 }, { "epoch": 0.33966725278875565, "learning_rate": 8.903586705090265e-06, "loss": 3.37701416015625, "step": 281500 }, { "epoch": 0.3397879161112383, "learning_rate": 8.903182869622527e-06, "loss": 3.3534051513671876, "step": 281600 }, { "epoch": 0.339908579433721, "learning_rate": 8.902779034154789e-06, "loss": 3.368833312988281, "step": 281700 }, { "epoch": 0.34002924275620366, "learning_rate": 8.902375198687051e-06, "loss": 3.3513803100585937, "step": 281800 }, { "epoch": 0.34014990607868634, "learning_rate": 8.901971363219313e-06, "loss": 3.3462094116210936, "step": 281900 }, { "epoch": 0.34027056940116907, "learning_rate": 8.901567527751575e-06, "loss": 3.391901550292969, "step": 282000 }, { "epoch": 0.34039123272365174, "learning_rate": 8.901163692283835e-06, "loss": 3.37974609375, "step": 282100 }, { "epoch": 0.3405118960461344, "learning_rate": 8.900759856816097e-06, "loss": 3.3770928955078126, "step": 282200 }, { "epoch": 0.3406325593686171, "learning_rate": 8.90035602134836e-06, "loss": 3.3966827392578125, "step": 282300 }, { "epoch": 0.34075322269109976, "learning_rate": 8.899952185880621e-06, "loss": 3.3758489990234377, "step": 282400 }, { "epoch": 0.3408738860135825, "learning_rate": 8.899548350412881e-06, "loss": 3.412453308105469, "step": 282500 }, { "epoch": 0.34099454933606516, "learning_rate": 8.899144514945143e-06, "loss": 3.3762371826171873, "step": 282600 }, { "epoch": 0.34111521265854783, "learning_rate": 8.898740679477405e-06, "loss": 3.3829190063476564, "step": 282700 }, { "epoch": 0.3412358759810305, "learning_rate": 8.898336844009667e-06, "loss": 3.3675518798828126, "step": 282800 }, { "epoch": 0.34135653930351323, "learning_rate": 8.89793300854193e-06, "loss": 3.3886773681640623, "step": 282900 }, { "epoch": 0.3414772026259959, "learning_rate": 8.89752917307419e-06, "loss": 3.3868609619140626, "step": 283000 }, { "epoch": 0.3415978659484786, "learning_rate": 8.897125337606452e-06, "loss": 3.3706756591796876, "step": 283100 }, { "epoch": 0.34171852927096125, "learning_rate": 8.896721502138714e-06, "loss": 3.3764334106445313, "step": 283200 }, { "epoch": 0.3418391925934439, "learning_rate": 8.896317666670976e-06, "loss": 3.352802734375, "step": 283300 }, { "epoch": 0.34195985591592665, "learning_rate": 8.895913831203236e-06, "loss": 3.391837158203125, "step": 283400 }, { "epoch": 0.3420805192384093, "learning_rate": 8.895509995735498e-06, "loss": 3.388258972167969, "step": 283500 }, { "epoch": 0.342201182560892, "learning_rate": 8.89510616026776e-06, "loss": 3.361815185546875, "step": 283600 }, { "epoch": 0.34232184588337466, "learning_rate": 8.894702324800022e-06, "loss": 3.342745666503906, "step": 283700 }, { "epoch": 0.34244250920585734, "learning_rate": 8.894298489332282e-06, "loss": 3.3899136352539063, "step": 283800 }, { "epoch": 0.34256317252834007, "learning_rate": 8.893894653864544e-06, "loss": 3.3812921142578123, "step": 283900 }, { "epoch": 0.34268383585082274, "learning_rate": 8.893490818396806e-06, "loss": 3.3620645141601564, "step": 284000 }, { "epoch": 0.3428044991733054, "learning_rate": 8.893086982929068e-06, "loss": 3.3420245361328127, "step": 284100 }, { "epoch": 0.3429251624957881, "learning_rate": 8.89268314746133e-06, "loss": 3.374725036621094, "step": 284200 }, { "epoch": 0.34304582581827076, "learning_rate": 8.892279311993592e-06, "loss": 3.3634933471679687, "step": 284300 }, { "epoch": 0.3431664891407535, "learning_rate": 8.891875476525852e-06, "loss": 3.358265686035156, "step": 284400 }, { "epoch": 0.34328715246323616, "learning_rate": 8.891471641058114e-06, "loss": 3.3755764770507812, "step": 284500 }, { "epoch": 0.34340781578571883, "learning_rate": 8.891067805590375e-06, "loss": 3.360271301269531, "step": 284600 }, { "epoch": 0.3435284791082015, "learning_rate": 8.890663970122637e-06, "loss": 3.3660818481445314, "step": 284700 }, { "epoch": 0.3436491424306842, "learning_rate": 8.890260134654899e-06, "loss": 3.367215881347656, "step": 284800 }, { "epoch": 0.3437698057531669, "learning_rate": 8.88985629918716e-06, "loss": 3.3591278076171873, "step": 284900 }, { "epoch": 0.3438904690756496, "learning_rate": 8.889452463719423e-06, "loss": 3.3559494018554688, "step": 285000 }, { "epoch": 0.34401113239813225, "learning_rate": 8.889048628251685e-06, "loss": 3.3690521240234377, "step": 285100 }, { "epoch": 0.3441317957206149, "learning_rate": 8.888644792783947e-06, "loss": 3.3683761596679687, "step": 285200 }, { "epoch": 0.34425245904309765, "learning_rate": 8.888240957316207e-06, "loss": 3.3877032470703123, "step": 285300 }, { "epoch": 0.3443731223655803, "learning_rate": 8.887837121848469e-06, "loss": 3.348993225097656, "step": 285400 }, { "epoch": 0.344493785688063, "learning_rate": 8.88743328638073e-06, "loss": 3.358624267578125, "step": 285500 }, { "epoch": 0.34461444901054566, "learning_rate": 8.887029450912991e-06, "loss": 3.3711981201171874, "step": 285600 }, { "epoch": 0.34473511233302834, "learning_rate": 8.886625615445253e-06, "loss": 3.3545632934570313, "step": 285700 }, { "epoch": 0.34485577565551107, "learning_rate": 8.886221779977515e-06, "loss": 3.377494201660156, "step": 285800 }, { "epoch": 0.34497643897799374, "learning_rate": 8.885817944509777e-06, "loss": 3.332389221191406, "step": 285900 }, { "epoch": 0.3450971023004764, "learning_rate": 8.885414109042039e-06, "loss": 3.38436279296875, "step": 286000 }, { "epoch": 0.3452177656229591, "learning_rate": 8.885010273574301e-06, "loss": 3.3601043701171873, "step": 286100 }, { "epoch": 0.34533842894544176, "learning_rate": 8.884606438106561e-06, "loss": 3.349520568847656, "step": 286200 }, { "epoch": 0.3454590922679245, "learning_rate": 8.884202602638823e-06, "loss": 3.3518450927734373, "step": 286300 }, { "epoch": 0.34557975559040716, "learning_rate": 8.883798767171085e-06, "loss": 3.3643002319335937, "step": 286400 }, { "epoch": 0.34570041891288983, "learning_rate": 8.883394931703346e-06, "loss": 3.386228332519531, "step": 286500 }, { "epoch": 0.3458210822353725, "learning_rate": 8.882991096235608e-06, "loss": 3.3288198852539064, "step": 286600 }, { "epoch": 0.3459417455578552, "learning_rate": 8.88258726076787e-06, "loss": 3.368284912109375, "step": 286700 }, { "epoch": 0.3460624088803379, "learning_rate": 8.882183425300131e-06, "loss": 3.3436083984375, "step": 286800 }, { "epoch": 0.3461830722028206, "learning_rate": 8.881779589832393e-06, "loss": 3.3695303344726564, "step": 286900 }, { "epoch": 0.34630373552530325, "learning_rate": 8.881375754364654e-06, "loss": 3.3454019165039064, "step": 287000 }, { "epoch": 0.3464243988477859, "learning_rate": 8.880971918896916e-06, "loss": 3.3680816650390626, "step": 287100 }, { "epoch": 0.3465450621702686, "learning_rate": 8.880568083429178e-06, "loss": 3.356971435546875, "step": 287200 }, { "epoch": 0.3466657254927513, "learning_rate": 8.88016424796144e-06, "loss": 3.343841857910156, "step": 287300 }, { "epoch": 0.346786388815234, "learning_rate": 8.879760412493702e-06, "loss": 3.34329345703125, "step": 287400 }, { "epoch": 0.34690705213771666, "learning_rate": 8.879356577025962e-06, "loss": 3.3465447998046876, "step": 287500 }, { "epoch": 0.34702771546019934, "learning_rate": 8.878952741558224e-06, "loss": 3.362466125488281, "step": 287600 }, { "epoch": 0.34714837878268207, "learning_rate": 8.878548906090486e-06, "loss": 3.350896301269531, "step": 287700 }, { "epoch": 0.34726904210516474, "learning_rate": 8.878145070622746e-06, "loss": 3.349106750488281, "step": 287800 }, { "epoch": 0.3473897054276474, "learning_rate": 8.877741235155008e-06, "loss": 3.3594305419921877, "step": 287900 }, { "epoch": 0.3475103687501301, "learning_rate": 8.87733739968727e-06, "loss": 3.356083984375, "step": 288000 }, { "epoch": 0.34763103207261276, "learning_rate": 8.876933564219532e-06, "loss": 3.3537591552734374, "step": 288100 }, { "epoch": 0.3477516953950955, "learning_rate": 8.876529728751794e-06, "loss": 3.356206970214844, "step": 288200 }, { "epoch": 0.34787235871757816, "learning_rate": 8.876125893284056e-06, "loss": 3.345203552246094, "step": 288300 }, { "epoch": 0.34799302204006083, "learning_rate": 8.875722057816316e-06, "loss": 3.3486846923828124, "step": 288400 }, { "epoch": 0.3481136853625435, "learning_rate": 8.875318222348578e-06, "loss": 3.3630889892578124, "step": 288500 }, { "epoch": 0.3482343486850262, "learning_rate": 8.87491438688084e-06, "loss": 3.3618679809570313, "step": 288600 }, { "epoch": 0.3483550120075089, "learning_rate": 8.8745105514131e-06, "loss": 3.3436550903320312, "step": 288700 }, { "epoch": 0.3484756753299916, "learning_rate": 8.874106715945363e-06, "loss": 3.339142150878906, "step": 288800 }, { "epoch": 0.34859633865247425, "learning_rate": 8.873702880477625e-06, "loss": 3.3261767578125, "step": 288900 }, { "epoch": 0.3487170019749569, "learning_rate": 8.873299045009887e-06, "loss": 3.356783752441406, "step": 289000 }, { "epoch": 0.3488376652974396, "learning_rate": 8.872895209542149e-06, "loss": 3.3261572265625, "step": 289100 }, { "epoch": 0.3489583286199223, "learning_rate": 8.87249137407441e-06, "loss": 3.35098388671875, "step": 289200 }, { "epoch": 0.349078991942405, "learning_rate": 8.872087538606673e-06, "loss": 3.3693197631835936, "step": 289300 }, { "epoch": 0.34919965526488767, "learning_rate": 8.871683703138933e-06, "loss": 3.3170135498046873, "step": 289400 }, { "epoch": 0.34932031858737034, "learning_rate": 8.871279867671195e-06, "loss": 3.3583859252929686, "step": 289500 }, { "epoch": 0.349440981909853, "learning_rate": 8.870876032203455e-06, "loss": 3.3346939086914062, "step": 289600 }, { "epoch": 0.34956164523233574, "learning_rate": 8.870472196735717e-06, "loss": 3.3283795166015624, "step": 289700 }, { "epoch": 0.3496823085548184, "learning_rate": 8.870068361267979e-06, "loss": 3.3797503662109376, "step": 289800 }, { "epoch": 0.3498029718773011, "learning_rate": 8.869664525800241e-06, "loss": 3.3343365478515623, "step": 289900 }, { "epoch": 0.34992363519978376, "learning_rate": 8.869260690332503e-06, "loss": 3.3282159423828124, "step": 290000 }, { "epoch": 0.35004429852226643, "learning_rate": 8.868856854864765e-06, "loss": 3.363509521484375, "step": 290100 }, { "epoch": 0.35016496184474916, "learning_rate": 8.868453019397027e-06, "loss": 3.357915344238281, "step": 290200 }, { "epoch": 0.35028562516723183, "learning_rate": 8.868049183929287e-06, "loss": 3.3282785034179687, "step": 290300 }, { "epoch": 0.3504062884897145, "learning_rate": 8.86764534846155e-06, "loss": 3.35484130859375, "step": 290400 }, { "epoch": 0.3505269518121972, "learning_rate": 8.867241512993811e-06, "loss": 3.3576254272460937, "step": 290500 }, { "epoch": 0.3506476151346799, "learning_rate": 8.866837677526072e-06, "loss": 3.3507846069335936, "step": 290600 }, { "epoch": 0.3507682784571626, "learning_rate": 8.866433842058334e-06, "loss": 3.3488534545898436, "step": 290700 }, { "epoch": 0.35088894177964525, "learning_rate": 8.866030006590596e-06, "loss": 3.3541641235351562, "step": 290800 }, { "epoch": 0.3510096051021279, "learning_rate": 8.865626171122858e-06, "loss": 3.3707708740234374, "step": 290900 }, { "epoch": 0.3511302684246106, "learning_rate": 8.86522233565512e-06, "loss": 3.3741864013671874, "step": 291000 }, { "epoch": 0.3512509317470933, "learning_rate": 8.86481850018738e-06, "loss": 3.3598983764648436, "step": 291100 }, { "epoch": 0.351371595069576, "learning_rate": 8.864414664719642e-06, "loss": 3.33818359375, "step": 291200 }, { "epoch": 0.35149225839205867, "learning_rate": 8.864010829251904e-06, "loss": 3.328935241699219, "step": 291300 }, { "epoch": 0.35161292171454134, "learning_rate": 8.863606993784166e-06, "loss": 3.3236929321289064, "step": 291400 }, { "epoch": 0.351733585037024, "learning_rate": 8.863203158316426e-06, "loss": 3.3363943481445313, "step": 291500 }, { "epoch": 0.35185424835950674, "learning_rate": 8.862799322848688e-06, "loss": 3.3711962890625, "step": 291600 }, { "epoch": 0.3519749116819894, "learning_rate": 8.86239548738095e-06, "loss": 3.3208868408203127, "step": 291700 }, { "epoch": 0.3520955750044721, "learning_rate": 8.861991651913212e-06, "loss": 3.3388897705078127, "step": 291800 }, { "epoch": 0.35221623832695476, "learning_rate": 8.861587816445472e-06, "loss": 3.3541644287109373, "step": 291900 }, { "epoch": 0.35233690164943743, "learning_rate": 8.861183980977734e-06, "loss": 3.3478387451171874, "step": 292000 }, { "epoch": 0.35245756497192016, "learning_rate": 8.860780145509996e-06, "loss": 3.3465670776367187, "step": 292100 }, { "epoch": 0.35257822829440283, "learning_rate": 8.860376310042258e-06, "loss": 3.3381646728515624, "step": 292200 }, { "epoch": 0.3526988916168855, "learning_rate": 8.85997247457452e-06, "loss": 3.342335510253906, "step": 292300 }, { "epoch": 0.3528195549393682, "learning_rate": 8.859568639106782e-06, "loss": 3.331907043457031, "step": 292400 }, { "epoch": 0.35294021826185085, "learning_rate": 8.859164803639042e-06, "loss": 3.3521966552734375, "step": 292500 }, { "epoch": 0.3530608815843336, "learning_rate": 8.858760968171304e-06, "loss": 3.33973876953125, "step": 292600 }, { "epoch": 0.35318154490681625, "learning_rate": 8.858357132703565e-06, "loss": 3.349891357421875, "step": 292700 }, { "epoch": 0.3533022082292989, "learning_rate": 8.857953297235827e-06, "loss": 3.3384039306640627, "step": 292800 }, { "epoch": 0.3534228715517816, "learning_rate": 8.857549461768089e-06, "loss": 3.3312451171875, "step": 292900 }, { "epoch": 0.3535435348742643, "learning_rate": 8.85714562630035e-06, "loss": 3.351846008300781, "step": 293000 }, { "epoch": 0.353664198196747, "learning_rate": 8.856741790832613e-06, "loss": 3.3284475708007815, "step": 293100 }, { "epoch": 0.35378486151922967, "learning_rate": 8.856337955364875e-06, "loss": 3.3351480102539064, "step": 293200 }, { "epoch": 0.35390552484171234, "learning_rate": 8.855934119897137e-06, "loss": 3.3484158325195312, "step": 293300 }, { "epoch": 0.354026188164195, "learning_rate": 8.855530284429399e-06, "loss": 3.349937744140625, "step": 293400 }, { "epoch": 0.35414685148667774, "learning_rate": 8.855126448961659e-06, "loss": 3.3387371826171877, "step": 293500 }, { "epoch": 0.3542675148091604, "learning_rate": 8.854722613493921e-06, "loss": 3.34574951171875, "step": 293600 }, { "epoch": 0.3543881781316431, "learning_rate": 8.854318778026181e-06, "loss": 3.3603726196289063, "step": 293700 }, { "epoch": 0.35450884145412576, "learning_rate": 8.853914942558443e-06, "loss": 3.340113525390625, "step": 293800 }, { "epoch": 0.35462950477660843, "learning_rate": 8.853511107090705e-06, "loss": 3.3261257934570314, "step": 293900 }, { "epoch": 0.35475016809909116, "learning_rate": 8.853107271622967e-06, "loss": 3.3126797485351562, "step": 294000 }, { "epoch": 0.35487083142157383, "learning_rate": 8.852703436155229e-06, "loss": 3.329942321777344, "step": 294100 }, { "epoch": 0.3549914947440565, "learning_rate": 8.852299600687491e-06, "loss": 3.34689208984375, "step": 294200 }, { "epoch": 0.3551121580665392, "learning_rate": 8.851895765219753e-06, "loss": 3.3400753784179686, "step": 294300 }, { "epoch": 0.35523282138902185, "learning_rate": 8.851491929752013e-06, "loss": 3.3322042846679687, "step": 294400 }, { "epoch": 0.3553534847115046, "learning_rate": 8.851088094284275e-06, "loss": 3.3032736206054687, "step": 294500 }, { "epoch": 0.35547414803398725, "learning_rate": 8.850684258816537e-06, "loss": 3.3311907958984377, "step": 294600 }, { "epoch": 0.3555948113564699, "learning_rate": 8.850280423348798e-06, "loss": 3.3651763916015627, "step": 294700 }, { "epoch": 0.3557154746789526, "learning_rate": 8.84987658788106e-06, "loss": 3.313255615234375, "step": 294800 }, { "epoch": 0.35583613800143526, "learning_rate": 8.849472752413322e-06, "loss": 3.3502621459960937, "step": 294900 }, { "epoch": 0.355956801323918, "learning_rate": 8.849068916945584e-06, "loss": 3.32615966796875, "step": 295000 }, { "epoch": 0.35607746464640067, "learning_rate": 8.848665081477846e-06, "loss": 3.3292901611328123, "step": 295100 }, { "epoch": 0.35619812796888334, "learning_rate": 8.848261246010106e-06, "loss": 3.35273681640625, "step": 295200 }, { "epoch": 0.356318791291366, "learning_rate": 8.847857410542368e-06, "loss": 3.3344461059570314, "step": 295300 }, { "epoch": 0.3564394546138487, "learning_rate": 8.84745357507463e-06, "loss": 3.3574578857421873, "step": 295400 }, { "epoch": 0.3565601179363314, "learning_rate": 8.847049739606892e-06, "loss": 3.3437017822265624, "step": 295500 }, { "epoch": 0.3566807812588141, "learning_rate": 8.846645904139152e-06, "loss": 3.3250396728515623, "step": 295600 }, { "epoch": 0.35680144458129676, "learning_rate": 8.846242068671414e-06, "loss": 3.352808837890625, "step": 295700 }, { "epoch": 0.35692210790377943, "learning_rate": 8.845838233203676e-06, "loss": 3.3430130004882814, "step": 295800 }, { "epoch": 0.35704277122626216, "learning_rate": 8.845434397735938e-06, "loss": 3.2995059204101564, "step": 295900 }, { "epoch": 0.35716343454874483, "learning_rate": 8.845030562268198e-06, "loss": 3.323347473144531, "step": 296000 }, { "epoch": 0.3572840978712275, "learning_rate": 8.84462672680046e-06, "loss": 3.3315829467773437, "step": 296100 }, { "epoch": 0.3574047611937102, "learning_rate": 8.844222891332722e-06, "loss": 3.3295867919921873, "step": 296200 }, { "epoch": 0.35752542451619285, "learning_rate": 8.843819055864984e-06, "loss": 3.330219421386719, "step": 296300 }, { "epoch": 0.3576460878386756, "learning_rate": 8.843415220397246e-06, "loss": 3.31962646484375, "step": 296400 }, { "epoch": 0.35776675116115825, "learning_rate": 8.843011384929508e-06, "loss": 3.3472137451171875, "step": 296500 }, { "epoch": 0.3578874144836409, "learning_rate": 8.842607549461768e-06, "loss": 3.3337026977539064, "step": 296600 }, { "epoch": 0.3580080778061236, "learning_rate": 8.84220371399403e-06, "loss": 3.3129229736328125, "step": 296700 }, { "epoch": 0.35812874112860626, "learning_rate": 8.84179987852629e-06, "loss": 3.307882995605469, "step": 296800 }, { "epoch": 0.358249404451089, "learning_rate": 8.841396043058553e-06, "loss": 3.3341461181640626, "step": 296900 }, { "epoch": 0.35837006777357167, "learning_rate": 8.840992207590815e-06, "loss": 3.301899108886719, "step": 297000 }, { "epoch": 0.35849073109605434, "learning_rate": 8.840588372123077e-06, "loss": 3.3152227783203125, "step": 297100 }, { "epoch": 0.358611394418537, "learning_rate": 8.840184536655339e-06, "loss": 3.345552673339844, "step": 297200 }, { "epoch": 0.3587320577410197, "learning_rate": 8.8397807011876e-06, "loss": 3.3410565185546877, "step": 297300 }, { "epoch": 0.3588527210635024, "learning_rate": 8.839376865719863e-06, "loss": 3.3193359375, "step": 297400 }, { "epoch": 0.3589733843859851, "learning_rate": 8.838973030252123e-06, "loss": 3.33230712890625, "step": 297500 }, { "epoch": 0.35909404770846776, "learning_rate": 8.838569194784385e-06, "loss": 3.32958251953125, "step": 297600 }, { "epoch": 0.35921471103095043, "learning_rate": 8.838165359316647e-06, "loss": 3.328432922363281, "step": 297700 }, { "epoch": 0.3593353743534331, "learning_rate": 8.837761523848907e-06, "loss": 3.3343017578125, "step": 297800 }, { "epoch": 0.35945603767591583, "learning_rate": 8.83735768838117e-06, "loss": 3.33526123046875, "step": 297900 }, { "epoch": 0.3595767009983985, "learning_rate": 8.836953852913431e-06, "loss": 3.3219537353515625, "step": 298000 }, { "epoch": 0.3596973643208812, "learning_rate": 8.836550017445693e-06, "loss": 3.316231994628906, "step": 298100 }, { "epoch": 0.35981802764336385, "learning_rate": 8.836146181977955e-06, "loss": 3.3348828125, "step": 298200 }, { "epoch": 0.3599386909658466, "learning_rate": 8.835742346510217e-06, "loss": 3.3322988891601564, "step": 298300 }, { "epoch": 0.36005935428832925, "learning_rate": 8.835338511042479e-06, "loss": 3.3408843994140627, "step": 298400 }, { "epoch": 0.3601800176108119, "learning_rate": 8.83493467557474e-06, "loss": 3.3089837646484375, "step": 298500 }, { "epoch": 0.3603006809332946, "learning_rate": 8.834530840107001e-06, "loss": 3.305108947753906, "step": 298600 }, { "epoch": 0.36042134425577727, "learning_rate": 8.834127004639262e-06, "loss": 3.3198333740234376, "step": 298700 }, { "epoch": 0.36054200757826, "learning_rate": 8.833723169171524e-06, "loss": 3.325597839355469, "step": 298800 }, { "epoch": 0.36066267090074267, "learning_rate": 8.833319333703786e-06, "loss": 3.316040344238281, "step": 298900 }, { "epoch": 0.36078333422322534, "learning_rate": 8.832915498236048e-06, "loss": 3.3172955322265625, "step": 299000 }, { "epoch": 0.360903997545708, "learning_rate": 8.83251166276831e-06, "loss": 3.325193176269531, "step": 299100 }, { "epoch": 0.3610246608681907, "learning_rate": 8.832107827300572e-06, "loss": 3.31294189453125, "step": 299200 }, { "epoch": 0.3611453241906734, "learning_rate": 8.831703991832832e-06, "loss": 3.324296875, "step": 299300 }, { "epoch": 0.3612659875131561, "learning_rate": 8.831300156365094e-06, "loss": 3.333157958984375, "step": 299400 }, { "epoch": 0.36138665083563876, "learning_rate": 8.830896320897356e-06, "loss": 3.3377294921875, "step": 299500 }, { "epoch": 0.36150731415812143, "learning_rate": 8.830492485429618e-06, "loss": 3.3260113525390627, "step": 299600 }, { "epoch": 0.3616279774806041, "learning_rate": 8.830088649961878e-06, "loss": 3.3337860107421875, "step": 299700 }, { "epoch": 0.36174864080308683, "learning_rate": 8.82968481449414e-06, "loss": 3.31935546875, "step": 299800 }, { "epoch": 0.3618693041255695, "learning_rate": 8.829280979026402e-06, "loss": 3.2990069580078125, "step": 299900 }, { "epoch": 0.3619899674480522, "learning_rate": 8.828877143558664e-06, "loss": 3.31140380859375, "step": 300000 }, { "epoch": 0.36211063077053485, "learning_rate": 8.828473308090924e-06, "loss": 3.30639892578125, "step": 300100 }, { "epoch": 0.3622312940930175, "learning_rate": 8.828069472623186e-06, "loss": 3.322403869628906, "step": 300200 }, { "epoch": 0.36235195741550025, "learning_rate": 8.827665637155448e-06, "loss": 3.304969482421875, "step": 300300 }, { "epoch": 0.3624726207379829, "learning_rate": 8.82726180168771e-06, "loss": 3.3136441040039064, "step": 300400 }, { "epoch": 0.3625932840604656, "learning_rate": 8.826857966219972e-06, "loss": 3.31540283203125, "step": 300500 }, { "epoch": 0.36271394738294827, "learning_rate": 8.826454130752233e-06, "loss": 3.3179580688476564, "step": 300600 }, { "epoch": 0.362834610705431, "learning_rate": 8.826050295284495e-06, "loss": 3.3205157470703126, "step": 300700 }, { "epoch": 0.36295527402791367, "learning_rate": 8.825646459816757e-06, "loss": 3.3216207885742186, "step": 300800 }, { "epoch": 0.36307593735039634, "learning_rate": 8.825242624349017e-06, "loss": 3.3189358520507812, "step": 300900 }, { "epoch": 0.363196600672879, "learning_rate": 8.824838788881279e-06, "loss": 3.3213543701171875, "step": 301000 }, { "epoch": 0.3633172639953617, "learning_rate": 8.82443495341354e-06, "loss": 3.331612548828125, "step": 301100 }, { "epoch": 0.3634379273178444, "learning_rate": 8.824031117945803e-06, "loss": 3.3322308349609373, "step": 301200 }, { "epoch": 0.3635585906403271, "learning_rate": 8.823627282478065e-06, "loss": 3.319403076171875, "step": 301300 }, { "epoch": 0.36367925396280976, "learning_rate": 8.823223447010327e-06, "loss": 3.3143212890625, "step": 301400 }, { "epoch": 0.36379991728529243, "learning_rate": 8.822819611542589e-06, "loss": 3.316423034667969, "step": 301500 }, { "epoch": 0.3639205806077751, "learning_rate": 8.822415776074849e-06, "loss": 3.313104553222656, "step": 301600 }, { "epoch": 0.36404124393025783, "learning_rate": 8.822011940607111e-06, "loss": 3.32320068359375, "step": 301700 }, { "epoch": 0.3641619072527405, "learning_rate": 8.821608105139371e-06, "loss": 3.287771911621094, "step": 301800 }, { "epoch": 0.3642825705752232, "learning_rate": 8.821204269671633e-06, "loss": 3.29591552734375, "step": 301900 }, { "epoch": 0.36440323389770585, "learning_rate": 8.820800434203895e-06, "loss": 3.317733154296875, "step": 302000 }, { "epoch": 0.3645238972201885, "learning_rate": 8.820396598736157e-06, "loss": 3.2830380249023436, "step": 302100 }, { "epoch": 0.36464456054267125, "learning_rate": 8.81999276326842e-06, "loss": 3.3182296752929688, "step": 302200 }, { "epoch": 0.3647652238651539, "learning_rate": 8.819588927800681e-06, "loss": 3.3193603515625, "step": 302300 }, { "epoch": 0.3648858871876366, "learning_rate": 8.819185092332943e-06, "loss": 3.3257107543945312, "step": 302400 }, { "epoch": 0.36500655051011927, "learning_rate": 8.818781256865203e-06, "loss": 3.315701599121094, "step": 302500 }, { "epoch": 0.36512721383260194, "learning_rate": 8.818377421397465e-06, "loss": 3.3238140869140627, "step": 302600 }, { "epoch": 0.36524787715508467, "learning_rate": 8.817973585929727e-06, "loss": 3.3311126708984373, "step": 302700 }, { "epoch": 0.36536854047756734, "learning_rate": 8.817569750461988e-06, "loss": 3.3201943969726564, "step": 302800 }, { "epoch": 0.36548920380005, "learning_rate": 8.81716591499425e-06, "loss": 3.323199462890625, "step": 302900 }, { "epoch": 0.3656098671225327, "learning_rate": 8.816762079526512e-06, "loss": 3.333154296875, "step": 303000 }, { "epoch": 0.36573053044501536, "learning_rate": 8.816358244058774e-06, "loss": 3.2910009765625, "step": 303100 }, { "epoch": 0.3658511937674981, "learning_rate": 8.815954408591036e-06, "loss": 3.312349548339844, "step": 303200 }, { "epoch": 0.36597185708998076, "learning_rate": 8.815550573123296e-06, "loss": 3.2939016723632815, "step": 303300 }, { "epoch": 0.36609252041246343, "learning_rate": 8.815146737655558e-06, "loss": 3.3060198974609376, "step": 303400 }, { "epoch": 0.3662131837349461, "learning_rate": 8.81474290218782e-06, "loss": 3.3187295532226564, "step": 303500 }, { "epoch": 0.36633384705742883, "learning_rate": 8.814339066720082e-06, "loss": 3.319930114746094, "step": 303600 }, { "epoch": 0.3664545103799115, "learning_rate": 8.813935231252342e-06, "loss": 3.338509216308594, "step": 303700 }, { "epoch": 0.3665751737023942, "learning_rate": 8.813531395784604e-06, "loss": 3.3211935424804686, "step": 303800 }, { "epoch": 0.36669583702487685, "learning_rate": 8.813127560316866e-06, "loss": 3.304140930175781, "step": 303900 }, { "epoch": 0.3668165003473595, "learning_rate": 8.812723724849128e-06, "loss": 3.3051583862304685, "step": 304000 }, { "epoch": 0.36693716366984225, "learning_rate": 8.81231988938139e-06, "loss": 3.298758239746094, "step": 304100 }, { "epoch": 0.3670578269923249, "learning_rate": 8.81191605391365e-06, "loss": 3.31005126953125, "step": 304200 }, { "epoch": 0.3671784903148076, "learning_rate": 8.811512218445912e-06, "loss": 3.285517578125, "step": 304300 }, { "epoch": 0.36729915363729027, "learning_rate": 8.811108382978174e-06, "loss": 3.31759765625, "step": 304400 }, { "epoch": 0.36741981695977294, "learning_rate": 8.810704547510436e-06, "loss": 3.324541015625, "step": 304500 }, { "epoch": 0.36754048028225567, "learning_rate": 8.810300712042698e-06, "loss": 3.2998089599609375, "step": 304600 }, { "epoch": 0.36766114360473834, "learning_rate": 8.809896876574959e-06, "loss": 3.315268859863281, "step": 304700 }, { "epoch": 0.367781806927221, "learning_rate": 8.80949304110722e-06, "loss": 3.324373779296875, "step": 304800 }, { "epoch": 0.3679024702497037, "learning_rate": 8.809089205639483e-06, "loss": 3.3101516723632813, "step": 304900 }, { "epoch": 0.36802313357218636, "learning_rate": 8.808685370171743e-06, "loss": 3.3062335205078126, "step": 305000 }, { "epoch": 0.3681437968946691, "learning_rate": 8.808281534704005e-06, "loss": 3.283702392578125, "step": 305100 }, { "epoch": 0.36826446021715176, "learning_rate": 8.807877699236267e-06, "loss": 3.3325180053710937, "step": 305200 }, { "epoch": 0.36838512353963443, "learning_rate": 8.807473863768529e-06, "loss": 3.3021621704101562, "step": 305300 }, { "epoch": 0.3685057868621171, "learning_rate": 8.80707002830079e-06, "loss": 3.340378723144531, "step": 305400 }, { "epoch": 0.3686264501845998, "learning_rate": 8.806666192833053e-06, "loss": 3.3138494873046875, "step": 305500 }, { "epoch": 0.3687471135070825, "learning_rate": 8.806262357365313e-06, "loss": 3.295240478515625, "step": 305600 }, { "epoch": 0.3688677768295652, "learning_rate": 8.805858521897575e-06, "loss": 3.3037368774414064, "step": 305700 }, { "epoch": 0.36898844015204785, "learning_rate": 8.805454686429837e-06, "loss": 3.2917221069335936, "step": 305800 }, { "epoch": 0.3691091034745305, "learning_rate": 8.805050850962097e-06, "loss": 3.296153259277344, "step": 305900 }, { "epoch": 0.36922976679701325, "learning_rate": 8.80464701549436e-06, "loss": 3.2916195678710936, "step": 306000 }, { "epoch": 0.3693504301194959, "learning_rate": 8.804243180026621e-06, "loss": 3.3197772216796877, "step": 306100 }, { "epoch": 0.3694710934419786, "learning_rate": 8.803839344558883e-06, "loss": 3.3021240234375, "step": 306200 }, { "epoch": 0.36959175676446127, "learning_rate": 8.803435509091145e-06, "loss": 3.2962762451171876, "step": 306300 }, { "epoch": 0.36971242008694394, "learning_rate": 8.803031673623407e-06, "loss": 3.324712219238281, "step": 306400 }, { "epoch": 0.36983308340942667, "learning_rate": 8.80262783815567e-06, "loss": 3.3221090698242186, "step": 306500 }, { "epoch": 0.36995374673190934, "learning_rate": 8.80222400268793e-06, "loss": 3.3229052734375, "step": 306600 }, { "epoch": 0.370074410054392, "learning_rate": 8.801820167220191e-06, "loss": 3.3020254516601564, "step": 306700 }, { "epoch": 0.3701950733768747, "learning_rate": 8.801416331752452e-06, "loss": 3.301183166503906, "step": 306800 }, { "epoch": 0.37031573669935736, "learning_rate": 8.801012496284714e-06, "loss": 3.3134396362304686, "step": 306900 }, { "epoch": 0.3704364000218401, "learning_rate": 8.800608660816976e-06, "loss": 3.3111557006835937, "step": 307000 }, { "epoch": 0.37055706334432276, "learning_rate": 8.800204825349238e-06, "loss": 3.3167425537109376, "step": 307100 }, { "epoch": 0.37067772666680543, "learning_rate": 8.7998009898815e-06, "loss": 3.3008447265625, "step": 307200 }, { "epoch": 0.3707983899892881, "learning_rate": 8.799397154413762e-06, "loss": 3.285044860839844, "step": 307300 }, { "epoch": 0.3709190533117708, "learning_rate": 8.798993318946022e-06, "loss": 3.2854852294921875, "step": 307400 }, { "epoch": 0.3710397166342535, "learning_rate": 8.798589483478284e-06, "loss": 3.2860568237304686, "step": 307500 }, { "epoch": 0.3711603799567362, "learning_rate": 8.798185648010546e-06, "loss": 3.3158724975585936, "step": 307600 }, { "epoch": 0.37128104327921885, "learning_rate": 8.797781812542808e-06, "loss": 3.2934579467773437, "step": 307700 }, { "epoch": 0.3714017066017015, "learning_rate": 8.797377977075068e-06, "loss": 3.3062152099609374, "step": 307800 }, { "epoch": 0.3715223699241842, "learning_rate": 8.79697414160733e-06, "loss": 3.3139215087890626, "step": 307900 }, { "epoch": 0.3716430332466669, "learning_rate": 8.796570306139592e-06, "loss": 3.3147311401367188, "step": 308000 }, { "epoch": 0.3717636965691496, "learning_rate": 8.796166470671854e-06, "loss": 3.3254104614257813, "step": 308100 }, { "epoch": 0.37188435989163227, "learning_rate": 8.795762635204114e-06, "loss": 3.285187072753906, "step": 308200 }, { "epoch": 0.37200502321411494, "learning_rate": 8.795358799736376e-06, "loss": 3.296063232421875, "step": 308300 }, { "epoch": 0.3721256865365976, "learning_rate": 8.794954964268638e-06, "loss": 3.310453186035156, "step": 308400 }, { "epoch": 0.37224634985908034, "learning_rate": 8.7945511288009e-06, "loss": 3.3133758544921874, "step": 308500 }, { "epoch": 0.372367013181563, "learning_rate": 8.794147293333162e-06, "loss": 3.298341979980469, "step": 308600 }, { "epoch": 0.3724876765040457, "learning_rate": 8.793743457865424e-06, "loss": 3.3225396728515624, "step": 308700 }, { "epoch": 0.37260833982652836, "learning_rate": 8.793339622397685e-06, "loss": 3.2861734008789063, "step": 308800 }, { "epoch": 0.3727290031490111, "learning_rate": 8.792935786929947e-06, "loss": 3.273369140625, "step": 308900 }, { "epoch": 0.37284966647149376, "learning_rate": 8.792531951462209e-06, "loss": 3.312192687988281, "step": 309000 }, { "epoch": 0.37297032979397643, "learning_rate": 8.792128115994469e-06, "loss": 3.2700869750976564, "step": 309100 }, { "epoch": 0.3730909931164591, "learning_rate": 8.791724280526731e-06, "loss": 3.3293157958984376, "step": 309200 }, { "epoch": 0.3732116564389418, "learning_rate": 8.791320445058993e-06, "loss": 3.2952374267578124, "step": 309300 }, { "epoch": 0.3733323197614245, "learning_rate": 8.790916609591255e-06, "loss": 3.282659912109375, "step": 309400 }, { "epoch": 0.3734529830839072, "learning_rate": 8.790512774123517e-06, "loss": 3.280079345703125, "step": 309500 }, { "epoch": 0.37357364640638985, "learning_rate": 8.790108938655779e-06, "loss": 3.324193420410156, "step": 309600 }, { "epoch": 0.3736943097288725, "learning_rate": 8.789705103188039e-06, "loss": 3.320880126953125, "step": 309700 }, { "epoch": 0.3738149730513552, "learning_rate": 8.789301267720301e-06, "loss": 3.278819885253906, "step": 309800 }, { "epoch": 0.3739356363738379, "learning_rate": 8.788897432252563e-06, "loss": 3.288790283203125, "step": 309900 }, { "epoch": 0.3740562996963206, "learning_rate": 8.788493596784823e-06, "loss": 3.293543395996094, "step": 310000 }, { "epoch": 0.37417696301880327, "learning_rate": 8.788089761317085e-06, "loss": 3.289220886230469, "step": 310100 }, { "epoch": 0.37429762634128594, "learning_rate": 8.787685925849347e-06, "loss": 3.284038391113281, "step": 310200 }, { "epoch": 0.3744182896637686, "learning_rate": 8.78728209038161e-06, "loss": 3.311800231933594, "step": 310300 }, { "epoch": 0.37453895298625134, "learning_rate": 8.786878254913871e-06, "loss": 3.317510681152344, "step": 310400 }, { "epoch": 0.374659616308734, "learning_rate": 8.786474419446133e-06, "loss": 3.2828073120117187, "step": 310500 }, { "epoch": 0.3747802796312167, "learning_rate": 8.786070583978395e-06, "loss": 3.2694500732421874, "step": 310600 }, { "epoch": 0.37490094295369936, "learning_rate": 8.785666748510656e-06, "loss": 3.3128778076171876, "step": 310700 }, { "epoch": 0.37502160627618203, "learning_rate": 8.785262913042917e-06, "loss": 3.27744873046875, "step": 310800 }, { "epoch": 0.37514226959866476, "learning_rate": 8.784859077575178e-06, "loss": 3.2939593505859377, "step": 310900 }, { "epoch": 0.37526293292114743, "learning_rate": 8.78445524210744e-06, "loss": 3.3001422119140624, "step": 311000 }, { "epoch": 0.3753835962436301, "learning_rate": 8.784051406639702e-06, "loss": 3.2914654541015627, "step": 311100 }, { "epoch": 0.3755042595661128, "learning_rate": 8.783647571171964e-06, "loss": 3.287436828613281, "step": 311200 }, { "epoch": 0.3756249228885955, "learning_rate": 8.783243735704226e-06, "loss": 3.29072509765625, "step": 311300 }, { "epoch": 0.3757455862110782, "learning_rate": 8.782839900236488e-06, "loss": 3.2698114013671873, "step": 311400 }, { "epoch": 0.37586624953356085, "learning_rate": 8.782436064768748e-06, "loss": 3.304375, "step": 311500 }, { "epoch": 0.3759869128560435, "learning_rate": 8.78203222930101e-06, "loss": 3.2887890625, "step": 311600 }, { "epoch": 0.3761075761785262, "learning_rate": 8.781628393833272e-06, "loss": 3.292602844238281, "step": 311700 }, { "epoch": 0.3762282395010089, "learning_rate": 8.781224558365534e-06, "loss": 3.285872497558594, "step": 311800 }, { "epoch": 0.3763489028234916, "learning_rate": 8.780820722897794e-06, "loss": 3.301965637207031, "step": 311900 }, { "epoch": 0.37646956614597427, "learning_rate": 8.780416887430056e-06, "loss": 3.281133117675781, "step": 312000 }, { "epoch": 0.37659022946845694, "learning_rate": 8.780013051962318e-06, "loss": 3.2999783325195313, "step": 312100 }, { "epoch": 0.3767108927909396, "learning_rate": 8.77960921649458e-06, "loss": 3.3032260131835938, "step": 312200 }, { "epoch": 0.37683155611342234, "learning_rate": 8.77920538102684e-06, "loss": 3.28312255859375, "step": 312300 }, { "epoch": 0.376952219435905, "learning_rate": 8.778801545559102e-06, "loss": 3.308909912109375, "step": 312400 }, { "epoch": 0.3770728827583877, "learning_rate": 8.778397710091364e-06, "loss": 3.25122314453125, "step": 312500 }, { "epoch": 0.37719354608087036, "learning_rate": 8.777993874623626e-06, "loss": 3.2880038452148437, "step": 312600 }, { "epoch": 0.37731420940335303, "learning_rate": 8.777590039155888e-06, "loss": 3.3010659790039063, "step": 312700 }, { "epoch": 0.37743487272583576, "learning_rate": 8.777186203688149e-06, "loss": 3.279433288574219, "step": 312800 }, { "epoch": 0.37755553604831843, "learning_rate": 8.77678236822041e-06, "loss": 3.300711669921875, "step": 312900 }, { "epoch": 0.3776761993708011, "learning_rate": 8.776378532752673e-06, "loss": 3.277568359375, "step": 313000 }, { "epoch": 0.3777968626932838, "learning_rate": 8.775974697284933e-06, "loss": 3.2576052856445314, "step": 313100 }, { "epoch": 0.37791752601576645, "learning_rate": 8.775570861817195e-06, "loss": 3.2829791259765626, "step": 313200 }, { "epoch": 0.3780381893382492, "learning_rate": 8.775167026349457e-06, "loss": 3.281400451660156, "step": 313300 }, { "epoch": 0.37815885266073185, "learning_rate": 8.774763190881719e-06, "loss": 3.284503173828125, "step": 313400 }, { "epoch": 0.3782795159832145, "learning_rate": 8.77435935541398e-06, "loss": 3.308751525878906, "step": 313500 }, { "epoch": 0.3784001793056972, "learning_rate": 8.773955519946243e-06, "loss": 3.2616864013671876, "step": 313600 }, { "epoch": 0.3785208426281799, "learning_rate": 8.773551684478505e-06, "loss": 3.2837033081054687, "step": 313700 }, { "epoch": 0.3786415059506626, "learning_rate": 8.773147849010765e-06, "loss": 3.279918518066406, "step": 313800 }, { "epoch": 0.37876216927314527, "learning_rate": 8.772744013543027e-06, "loss": 3.2851162719726563, "step": 313900 }, { "epoch": 0.37888283259562794, "learning_rate": 8.772340178075287e-06, "loss": 3.2467465209960937, "step": 314000 }, { "epoch": 0.3790034959181106, "learning_rate": 8.77193634260755e-06, "loss": 3.2915631103515626, "step": 314100 }, { "epoch": 0.37912415924059334, "learning_rate": 8.771532507139811e-06, "loss": 3.273829040527344, "step": 314200 }, { "epoch": 0.379244822563076, "learning_rate": 8.771128671672073e-06, "loss": 3.238301086425781, "step": 314300 }, { "epoch": 0.3793654858855587, "learning_rate": 8.770724836204335e-06, "loss": 3.2906304931640626, "step": 314400 }, { "epoch": 0.37948614920804136, "learning_rate": 8.770321000736597e-06, "loss": 3.2664248657226564, "step": 314500 }, { "epoch": 0.37960681253052403, "learning_rate": 8.76991716526886e-06, "loss": 3.274669494628906, "step": 314600 }, { "epoch": 0.37972747585300676, "learning_rate": 8.76951332980112e-06, "loss": 3.2747454833984375, "step": 314700 }, { "epoch": 0.37984813917548943, "learning_rate": 8.769109494333382e-06, "loss": 3.295265808105469, "step": 314800 }, { "epoch": 0.3799688024979721, "learning_rate": 8.768705658865644e-06, "loss": 3.2701620483398437, "step": 314900 }, { "epoch": 0.3800894658204548, "learning_rate": 8.768301823397904e-06, "loss": 3.2717471313476563, "step": 315000 }, { "epoch": 0.38021012914293745, "learning_rate": 8.767897987930166e-06, "loss": 3.2744296264648436, "step": 315100 }, { "epoch": 0.3803307924654202, "learning_rate": 8.767494152462428e-06, "loss": 3.27110107421875, "step": 315200 }, { "epoch": 0.38045145578790285, "learning_rate": 8.76709031699469e-06, "loss": 3.2762799072265625, "step": 315300 }, { "epoch": 0.3805721191103855, "learning_rate": 8.766686481526952e-06, "loss": 3.2894537353515627, "step": 315400 }, { "epoch": 0.3806927824328682, "learning_rate": 8.766282646059214e-06, "loss": 3.2854052734375, "step": 315500 }, { "epoch": 0.38081344575535087, "learning_rate": 8.765878810591474e-06, "loss": 3.2787136840820312, "step": 315600 }, { "epoch": 0.3809341090778336, "learning_rate": 8.765474975123736e-06, "loss": 3.2867681884765627, "step": 315700 }, { "epoch": 0.38105477240031627, "learning_rate": 8.765071139655998e-06, "loss": 3.2680532836914065, "step": 315800 }, { "epoch": 0.38117543572279894, "learning_rate": 8.764667304188258e-06, "loss": 3.2739834594726562, "step": 315900 }, { "epoch": 0.3812960990452816, "learning_rate": 8.76426346872052e-06, "loss": 3.285141906738281, "step": 316000 }, { "epoch": 0.3814167623677643, "learning_rate": 8.763859633252782e-06, "loss": 3.2821109008789064, "step": 316100 }, { "epoch": 0.381537425690247, "learning_rate": 8.763455797785044e-06, "loss": 3.26627197265625, "step": 316200 }, { "epoch": 0.3816580890127297, "learning_rate": 8.763051962317306e-06, "loss": 3.240209655761719, "step": 316300 }, { "epoch": 0.38177875233521236, "learning_rate": 8.762648126849566e-06, "loss": 3.2754672241210936, "step": 316400 }, { "epoch": 0.38189941565769503, "learning_rate": 8.762244291381828e-06, "loss": 3.2747296142578124, "step": 316500 }, { "epoch": 0.38202007898017776, "learning_rate": 8.76184045591409e-06, "loss": 3.2793539428710936, "step": 316600 }, { "epoch": 0.38214074230266043, "learning_rate": 8.761436620446352e-06, "loss": 3.2627667236328124, "step": 316700 }, { "epoch": 0.3822614056251431, "learning_rate": 8.761032784978614e-06, "loss": 3.2436148071289064, "step": 316800 }, { "epoch": 0.3823820689476258, "learning_rate": 8.760628949510875e-06, "loss": 3.2827850341796876, "step": 316900 }, { "epoch": 0.38250273227010845, "learning_rate": 8.760225114043137e-06, "loss": 3.2916610717773436, "step": 317000 }, { "epoch": 0.3826233955925912, "learning_rate": 8.759821278575399e-06, "loss": 3.2335391235351563, "step": 317100 }, { "epoch": 0.38274405891507385, "learning_rate": 8.759417443107659e-06, "loss": 3.2764181518554687, "step": 317200 }, { "epoch": 0.3828647222375565, "learning_rate": 8.759013607639921e-06, "loss": 3.256866760253906, "step": 317300 }, { "epoch": 0.3829853855600392, "learning_rate": 8.758609772172183e-06, "loss": 3.2746463012695313, "step": 317400 }, { "epoch": 0.38310604888252187, "learning_rate": 8.758205936704445e-06, "loss": 3.246959228515625, "step": 317500 }, { "epoch": 0.3832267122050046, "learning_rate": 8.757802101236707e-06, "loss": 3.2848907470703126, "step": 317600 }, { "epoch": 0.38334737552748727, "learning_rate": 8.757398265768969e-06, "loss": 3.2458203125, "step": 317700 }, { "epoch": 0.38346803884996994, "learning_rate": 8.756994430301229e-06, "loss": 3.279761962890625, "step": 317800 }, { "epoch": 0.3835887021724526, "learning_rate": 8.756590594833491e-06, "loss": 3.292417297363281, "step": 317900 }, { "epoch": 0.3837093654949353, "learning_rate": 8.756186759365753e-06, "loss": 3.251089782714844, "step": 318000 }, { "epoch": 0.383830028817418, "learning_rate": 8.755782923898013e-06, "loss": 3.2748980712890625, "step": 318100 }, { "epoch": 0.3839506921399007, "learning_rate": 8.755379088430275e-06, "loss": 3.306053466796875, "step": 318200 }, { "epoch": 0.38407135546238336, "learning_rate": 8.754975252962537e-06, "loss": 3.2929010009765625, "step": 318300 }, { "epoch": 0.38419201878486603, "learning_rate": 8.7545714174948e-06, "loss": 3.269003601074219, "step": 318400 }, { "epoch": 0.3843126821073487, "learning_rate": 8.754167582027061e-06, "loss": 3.2758865356445312, "step": 318500 }, { "epoch": 0.38443334542983143, "learning_rate": 8.753763746559323e-06, "loss": 3.2650885009765624, "step": 318600 }, { "epoch": 0.3845540087523141, "learning_rate": 8.753359911091585e-06, "loss": 3.2991177368164064, "step": 318700 }, { "epoch": 0.3846746720747968, "learning_rate": 8.752956075623846e-06, "loss": 3.2663214111328127, "step": 318800 }, { "epoch": 0.38479533539727945, "learning_rate": 8.752552240156108e-06, "loss": 3.241009521484375, "step": 318900 }, { "epoch": 0.3849159987197622, "learning_rate": 8.752148404688368e-06, "loss": 3.2705615234375, "step": 319000 }, { "epoch": 0.38503666204224485, "learning_rate": 8.75174456922063e-06, "loss": 3.2790011596679687, "step": 319100 }, { "epoch": 0.3851573253647275, "learning_rate": 8.751340733752892e-06, "loss": 3.2712957763671877, "step": 319200 }, { "epoch": 0.3852779886872102, "learning_rate": 8.750936898285154e-06, "loss": 3.2643399047851562, "step": 319300 }, { "epoch": 0.38539865200969287, "learning_rate": 8.750533062817416e-06, "loss": 3.2708502197265625, "step": 319400 }, { "epoch": 0.3855193153321756, "learning_rate": 8.750129227349678e-06, "loss": 3.2638134765625, "step": 319500 }, { "epoch": 0.38563997865465827, "learning_rate": 8.74972539188194e-06, "loss": 3.2642227172851563, "step": 319600 }, { "epoch": 0.38576064197714094, "learning_rate": 8.7493215564142e-06, "loss": 3.246645812988281, "step": 319700 }, { "epoch": 0.3858813052996236, "learning_rate": 8.748917720946462e-06, "loss": 3.251583251953125, "step": 319800 }, { "epoch": 0.3860019686221063, "learning_rate": 8.748513885478724e-06, "loss": 3.2594647216796875, "step": 319900 }, { "epoch": 0.386122631944589, "learning_rate": 8.748110050010984e-06, "loss": 3.285966796875, "step": 320000 }, { "epoch": 0.3862432952670717, "learning_rate": 8.747706214543246e-06, "loss": 3.2659402465820313, "step": 320100 }, { "epoch": 0.38636395858955436, "learning_rate": 8.747302379075508e-06, "loss": 3.2546759033203125, "step": 320200 }, { "epoch": 0.38648462191203703, "learning_rate": 8.74689854360777e-06, "loss": 3.242425842285156, "step": 320300 }, { "epoch": 0.3866052852345197, "learning_rate": 8.746494708140032e-06, "loss": 3.2424041748046877, "step": 320400 }, { "epoch": 0.38672594855700243, "learning_rate": 8.746090872672293e-06, "loss": 3.2470562744140623, "step": 320500 }, { "epoch": 0.3868466118794851, "learning_rate": 8.745687037204554e-06, "loss": 3.30968017578125, "step": 320600 }, { "epoch": 0.3869672752019678, "learning_rate": 8.745283201736816e-06, "loss": 3.225361328125, "step": 320700 }, { "epoch": 0.38708793852445045, "learning_rate": 8.744879366269078e-06, "loss": 3.250545654296875, "step": 320800 }, { "epoch": 0.3872086018469331, "learning_rate": 8.74447553080134e-06, "loss": 3.2445709228515627, "step": 320900 }, { "epoch": 0.38732926516941585, "learning_rate": 8.7440716953336e-06, "loss": 3.270658264160156, "step": 321000 }, { "epoch": 0.3874499284918985, "learning_rate": 8.743667859865863e-06, "loss": 3.2479019165039062, "step": 321100 }, { "epoch": 0.3875705918143812, "learning_rate": 8.743264024398125e-06, "loss": 3.2724932861328124, "step": 321200 }, { "epoch": 0.38769125513686387, "learning_rate": 8.742860188930385e-06, "loss": 3.264521484375, "step": 321300 }, { "epoch": 0.38781191845934654, "learning_rate": 8.742456353462647e-06, "loss": 3.254627380371094, "step": 321400 }, { "epoch": 0.38793258178182927, "learning_rate": 8.742052517994909e-06, "loss": 3.267957763671875, "step": 321500 }, { "epoch": 0.38805324510431194, "learning_rate": 8.741648682527171e-06, "loss": 3.25322021484375, "step": 321600 }, { "epoch": 0.3881739084267946, "learning_rate": 8.741244847059433e-06, "loss": 3.270889892578125, "step": 321700 }, { "epoch": 0.3882945717492773, "learning_rate": 8.740841011591695e-06, "loss": 3.24781982421875, "step": 321800 }, { "epoch": 0.38841523507176, "learning_rate": 8.740437176123955e-06, "loss": 3.23787353515625, "step": 321900 }, { "epoch": 0.3885358983942427, "learning_rate": 8.740033340656217e-06, "loss": 3.2627996826171874, "step": 322000 }, { "epoch": 0.38865656171672536, "learning_rate": 8.739629505188477e-06, "loss": 3.2830990600585936, "step": 322100 }, { "epoch": 0.38877722503920803, "learning_rate": 8.73922566972074e-06, "loss": 3.249563903808594, "step": 322200 }, { "epoch": 0.3888978883616907, "learning_rate": 8.738821834253001e-06, "loss": 3.262378845214844, "step": 322300 }, { "epoch": 0.38901855168417343, "learning_rate": 8.738417998785263e-06, "loss": 3.242977294921875, "step": 322400 }, { "epoch": 0.3891392150066561, "learning_rate": 8.738014163317525e-06, "loss": 3.2355126953125, "step": 322500 }, { "epoch": 0.3892598783291388, "learning_rate": 8.737610327849787e-06, "loss": 3.258695373535156, "step": 322600 }, { "epoch": 0.38938054165162145, "learning_rate": 8.73720649238205e-06, "loss": 3.2482220458984377, "step": 322700 }, { "epoch": 0.3895012049741041, "learning_rate": 8.736802656914311e-06, "loss": 3.2713168334960936, "step": 322800 }, { "epoch": 0.38962186829658685, "learning_rate": 8.736398821446572e-06, "loss": 3.280970153808594, "step": 322900 }, { "epoch": 0.3897425316190695, "learning_rate": 8.735994985978834e-06, "loss": 3.267020263671875, "step": 323000 }, { "epoch": 0.3898631949415522, "learning_rate": 8.735591150511094e-06, "loss": 3.2653927612304687, "step": 323100 }, { "epoch": 0.38998385826403487, "learning_rate": 8.735187315043356e-06, "loss": 3.2459262084960936, "step": 323200 }, { "epoch": 0.39010452158651754, "learning_rate": 8.734783479575618e-06, "loss": 3.2473968505859374, "step": 323300 }, { "epoch": 0.39022518490900027, "learning_rate": 8.73437964410788e-06, "loss": 3.240254211425781, "step": 323400 }, { "epoch": 0.39034584823148294, "learning_rate": 8.733975808640142e-06, "loss": 3.2710537719726562, "step": 323500 }, { "epoch": 0.3904665115539656, "learning_rate": 8.733571973172404e-06, "loss": 3.2615786743164064, "step": 323600 }, { "epoch": 0.3905871748764483, "learning_rate": 8.733168137704664e-06, "loss": 3.2791656494140624, "step": 323700 }, { "epoch": 0.39070783819893096, "learning_rate": 8.732764302236926e-06, "loss": 3.2612799072265624, "step": 323800 }, { "epoch": 0.3908285015214137, "learning_rate": 8.732360466769188e-06, "loss": 3.252030029296875, "step": 323900 }, { "epoch": 0.39094916484389636, "learning_rate": 8.73195663130145e-06, "loss": 3.2781024169921875, "step": 324000 }, { "epoch": 0.39106982816637903, "learning_rate": 8.73155279583371e-06, "loss": 3.237001647949219, "step": 324100 }, { "epoch": 0.3911904914888617, "learning_rate": 8.731148960365972e-06, "loss": 3.275115966796875, "step": 324200 }, { "epoch": 0.39131115481134443, "learning_rate": 8.730745124898234e-06, "loss": 3.255198974609375, "step": 324300 }, { "epoch": 0.3914318181338271, "learning_rate": 8.730341289430496e-06, "loss": 3.256047668457031, "step": 324400 }, { "epoch": 0.3915524814563098, "learning_rate": 8.729937453962758e-06, "loss": 3.2424325561523437, "step": 324500 }, { "epoch": 0.39167314477879245, "learning_rate": 8.729533618495019e-06, "loss": 3.2617816162109374, "step": 324600 }, { "epoch": 0.3917938081012751, "learning_rate": 8.72912978302728e-06, "loss": 3.2746548461914062, "step": 324700 }, { "epoch": 0.39191447142375785, "learning_rate": 8.728725947559543e-06, "loss": 3.250362548828125, "step": 324800 }, { "epoch": 0.3920351347462405, "learning_rate": 8.728322112091804e-06, "loss": 3.2543563842773438, "step": 324900 }, { "epoch": 0.3921557980687232, "learning_rate": 8.727918276624065e-06, "loss": 3.2623782348632813, "step": 325000 }, { "epoch": 0.39227646139120587, "learning_rate": 8.727514441156327e-06, "loss": 3.2224575805664064, "step": 325100 }, { "epoch": 0.39239712471368854, "learning_rate": 8.727110605688589e-06, "loss": 3.261824035644531, "step": 325200 }, { "epoch": 0.39251778803617127, "learning_rate": 8.72670677022085e-06, "loss": 3.2519992065429686, "step": 325300 }, { "epoch": 0.39263845135865394, "learning_rate": 8.726302934753111e-06, "loss": 3.256750183105469, "step": 325400 }, { "epoch": 0.3927591146811366, "learning_rate": 8.725899099285373e-06, "loss": 3.2094772338867186, "step": 325500 }, { "epoch": 0.3928797780036193, "learning_rate": 8.725495263817635e-06, "loss": 3.266548767089844, "step": 325600 }, { "epoch": 0.39300044132610196, "learning_rate": 8.725091428349897e-06, "loss": 3.2751498413085938, "step": 325700 }, { "epoch": 0.3931211046485847, "learning_rate": 8.724687592882159e-06, "loss": 3.220372314453125, "step": 325800 }, { "epoch": 0.39324176797106736, "learning_rate": 8.724283757414421e-06, "loss": 3.2622271728515626, "step": 325900 }, { "epoch": 0.39336243129355003, "learning_rate": 8.723879921946681e-06, "loss": 3.2347183227539062, "step": 326000 }, { "epoch": 0.3934830946160327, "learning_rate": 8.723476086478943e-06, "loss": 3.2430880737304686, "step": 326100 }, { "epoch": 0.3936037579385154, "learning_rate": 8.723072251011203e-06, "loss": 3.2468997192382814, "step": 326200 }, { "epoch": 0.3937244212609981, "learning_rate": 8.722668415543465e-06, "loss": 3.2621139526367187, "step": 326300 }, { "epoch": 0.3938450845834808, "learning_rate": 8.722264580075727e-06, "loss": 3.274239501953125, "step": 326400 }, { "epoch": 0.39396574790596345, "learning_rate": 8.72186074460799e-06, "loss": 3.256181640625, "step": 326500 }, { "epoch": 0.3940864112284461, "learning_rate": 8.721456909140251e-06, "loss": 3.2360659790039064, "step": 326600 }, { "epoch": 0.39420707455092885, "learning_rate": 8.721053073672513e-06, "loss": 3.2457891845703126, "step": 326700 }, { "epoch": 0.3943277378734115, "learning_rate": 8.720649238204775e-06, "loss": 3.2437158203125, "step": 326800 }, { "epoch": 0.3944484011958942, "learning_rate": 8.720245402737036e-06, "loss": 3.2530947875976564, "step": 326900 }, { "epoch": 0.39456906451837687, "learning_rate": 8.719841567269298e-06, "loss": 3.2392318725585936, "step": 327000 }, { "epoch": 0.39468972784085954, "learning_rate": 8.71943773180156e-06, "loss": 3.2624307250976563, "step": 327100 }, { "epoch": 0.39481039116334227, "learning_rate": 8.71903389633382e-06, "loss": 3.2410653686523436, "step": 327200 }, { "epoch": 0.39493105448582494, "learning_rate": 8.718630060866082e-06, "loss": 3.2493820190429688, "step": 327300 }, { "epoch": 0.3950517178083076, "learning_rate": 8.718226225398344e-06, "loss": 3.224849853515625, "step": 327400 }, { "epoch": 0.3951723811307903, "learning_rate": 8.717822389930606e-06, "loss": 3.2115936279296875, "step": 327500 }, { "epoch": 0.39529304445327296, "learning_rate": 8.717418554462868e-06, "loss": 3.220730895996094, "step": 327600 }, { "epoch": 0.3954137077757557, "learning_rate": 8.71701471899513e-06, "loss": 3.2486026000976564, "step": 327700 }, { "epoch": 0.39553437109823836, "learning_rate": 8.71661088352739e-06, "loss": 3.2581307983398435, "step": 327800 }, { "epoch": 0.39565503442072103, "learning_rate": 8.716207048059652e-06, "loss": 3.2488836669921874, "step": 327900 }, { "epoch": 0.3957756977432037, "learning_rate": 8.715803212591914e-06, "loss": 3.2595529174804687, "step": 328000 }, { "epoch": 0.3958963610656864, "learning_rate": 8.715399377124174e-06, "loss": 3.2381057739257812, "step": 328100 }, { "epoch": 0.3960170243881691, "learning_rate": 8.714995541656436e-06, "loss": 3.240838623046875, "step": 328200 }, { "epoch": 0.3961376877106518, "learning_rate": 8.714591706188698e-06, "loss": 3.22958251953125, "step": 328300 }, { "epoch": 0.39625835103313445, "learning_rate": 8.71418787072096e-06, "loss": 3.2588885498046873, "step": 328400 }, { "epoch": 0.3963790143556171, "learning_rate": 8.713784035253222e-06, "loss": 3.2506768798828123, "step": 328500 }, { "epoch": 0.3964996776780998, "learning_rate": 8.713380199785483e-06, "loss": 3.239845886230469, "step": 328600 }, { "epoch": 0.3966203410005825, "learning_rate": 8.712976364317745e-06, "loss": 3.229544982910156, "step": 328700 }, { "epoch": 0.3967410043230652, "learning_rate": 8.712572528850007e-06, "loss": 3.237188415527344, "step": 328800 }, { "epoch": 0.39686166764554787, "learning_rate": 8.712168693382269e-06, "loss": 3.222325439453125, "step": 328900 }, { "epoch": 0.39698233096803054, "learning_rate": 8.71176485791453e-06, "loss": 3.2317233276367188, "step": 329000 }, { "epoch": 0.3971029942905132, "learning_rate": 8.71136102244679e-06, "loss": 3.2449880981445314, "step": 329100 }, { "epoch": 0.39722365761299594, "learning_rate": 8.710957186979053e-06, "loss": 3.247603454589844, "step": 329200 }, { "epoch": 0.3973443209354786, "learning_rate": 8.710553351511315e-06, "loss": 3.245472106933594, "step": 329300 }, { "epoch": 0.3974649842579613, "learning_rate": 8.710149516043577e-06, "loss": 3.2534674072265624, "step": 329400 }, { "epoch": 0.39758564758044396, "learning_rate": 8.709745680575837e-06, "loss": 3.260495300292969, "step": 329500 }, { "epoch": 0.3977063109029267, "learning_rate": 8.709341845108099e-06, "loss": 3.2542568969726564, "step": 329600 }, { "epoch": 0.39782697422540936, "learning_rate": 8.708938009640361e-06, "loss": 3.215430908203125, "step": 329700 }, { "epoch": 0.39794763754789203, "learning_rate": 8.708534174172623e-06, "loss": 3.2525616455078126, "step": 329800 }, { "epoch": 0.3980683008703747, "learning_rate": 8.708130338704885e-06, "loss": 3.2172467041015627, "step": 329900 }, { "epoch": 0.3981889641928574, "learning_rate": 8.707726503237145e-06, "loss": 3.227056579589844, "step": 330000 }, { "epoch": 0.3983096275153401, "learning_rate": 8.707322667769407e-06, "loss": 3.2540380859375, "step": 330100 }, { "epoch": 0.3984302908378228, "learning_rate": 8.70691883230167e-06, "loss": 3.2183956909179687, "step": 330200 }, { "epoch": 0.39855095416030545, "learning_rate": 8.70651499683393e-06, "loss": 3.222982177734375, "step": 330300 }, { "epoch": 0.3986716174827881, "learning_rate": 8.706111161366192e-06, "loss": 3.2263897705078124, "step": 330400 }, { "epoch": 0.3987922808052708, "learning_rate": 8.705707325898453e-06, "loss": 3.2129312133789063, "step": 330500 }, { "epoch": 0.3989129441277535, "learning_rate": 8.705303490430715e-06, "loss": 3.240805358886719, "step": 330600 }, { "epoch": 0.3990336074502362, "learning_rate": 8.704899654962977e-06, "loss": 3.2541278076171873, "step": 330700 }, { "epoch": 0.39915427077271887, "learning_rate": 8.70449581949524e-06, "loss": 3.23765625, "step": 330800 }, { "epoch": 0.39927493409520154, "learning_rate": 8.704091984027501e-06, "loss": 3.23277587890625, "step": 330900 }, { "epoch": 0.3993955974176842, "learning_rate": 8.703688148559762e-06, "loss": 3.2397525024414064, "step": 331000 }, { "epoch": 0.39951626074016694, "learning_rate": 8.703284313092024e-06, "loss": 3.2474267578125, "step": 331100 }, { "epoch": 0.3996369240626496, "learning_rate": 8.702880477624284e-06, "loss": 3.213720397949219, "step": 331200 }, { "epoch": 0.3997575873851323, "learning_rate": 8.702476642156546e-06, "loss": 3.209533386230469, "step": 331300 }, { "epoch": 0.39987825070761496, "learning_rate": 8.702072806688808e-06, "loss": 3.2245709228515627, "step": 331400 }, { "epoch": 0.39999891403009763, "learning_rate": 8.70166897122107e-06, "loss": 3.258290100097656, "step": 331500 }, { "epoch": 0.40011957735258036, "learning_rate": 8.701265135753332e-06, "loss": 3.2603057861328124, "step": 331600 }, { "epoch": 0.40024024067506303, "learning_rate": 8.700861300285594e-06, "loss": 3.2535665893554686, "step": 331700 }, { "epoch": 0.4003609039975457, "learning_rate": 8.700457464817856e-06, "loss": 3.2403680419921876, "step": 331800 }, { "epoch": 0.4004815673200284, "learning_rate": 8.700053629350116e-06, "loss": 3.223586120605469, "step": 331900 }, { "epoch": 0.4006022306425111, "learning_rate": 8.699649793882378e-06, "loss": 3.216365966796875, "step": 332000 }, { "epoch": 0.4007228939649938, "learning_rate": 8.69924595841464e-06, "loss": 3.230245361328125, "step": 332100 }, { "epoch": 0.40084355728747645, "learning_rate": 8.6988421229469e-06, "loss": 3.2543609619140623, "step": 332200 }, { "epoch": 0.4009642206099591, "learning_rate": 8.698438287479162e-06, "loss": 3.2624642944335935, "step": 332300 }, { "epoch": 0.4010848839324418, "learning_rate": 8.698034452011424e-06, "loss": 3.2456478881835937, "step": 332400 }, { "epoch": 0.4012055472549245, "learning_rate": 8.697630616543686e-06, "loss": 3.2356918334960936, "step": 332500 }, { "epoch": 0.4013262105774072, "learning_rate": 8.697226781075948e-06, "loss": 3.2194866943359375, "step": 332600 }, { "epoch": 0.40144687389988987, "learning_rate": 8.696822945608209e-06, "loss": 3.2380975341796874, "step": 332700 }, { "epoch": 0.40156753722237254, "learning_rate": 8.69641911014047e-06, "loss": 3.2371475219726564, "step": 332800 }, { "epoch": 0.4016882005448552, "learning_rate": 8.696015274672733e-06, "loss": 3.220198669433594, "step": 332900 }, { "epoch": 0.40180886386733794, "learning_rate": 8.695611439204995e-06, "loss": 3.241708068847656, "step": 333000 }, { "epoch": 0.4019295271898206, "learning_rate": 8.695207603737255e-06, "loss": 3.1977859497070313, "step": 333100 }, { "epoch": 0.4020501905123033, "learning_rate": 8.694803768269517e-06, "loss": 3.2426321411132815, "step": 333200 }, { "epoch": 0.40217085383478596, "learning_rate": 8.694399932801779e-06, "loss": 3.1952053833007814, "step": 333300 }, { "epoch": 0.40229151715726863, "learning_rate": 8.69399609733404e-06, "loss": 3.238172912597656, "step": 333400 }, { "epoch": 0.40241218047975136, "learning_rate": 8.693592261866301e-06, "loss": 3.2227496337890624, "step": 333500 }, { "epoch": 0.40253284380223403, "learning_rate": 8.693188426398563e-06, "loss": 3.240567321777344, "step": 333600 }, { "epoch": 0.4026535071247167, "learning_rate": 8.692784590930825e-06, "loss": 3.2373675537109374, "step": 333700 }, { "epoch": 0.4027741704471994, "learning_rate": 8.692380755463087e-06, "loss": 3.22337158203125, "step": 333800 }, { "epoch": 0.40289483376968205, "learning_rate": 8.691976919995349e-06, "loss": 3.219118347167969, "step": 333900 }, { "epoch": 0.4030154970921648, "learning_rate": 8.691573084527611e-06, "loss": 3.2311080932617187, "step": 334000 }, { "epoch": 0.40313616041464745, "learning_rate": 8.691169249059871e-06, "loss": 3.2483099365234374, "step": 334100 }, { "epoch": 0.4032568237371301, "learning_rate": 8.690765413592133e-06, "loss": 3.266927490234375, "step": 334200 }, { "epoch": 0.4033774870596128, "learning_rate": 8.690361578124394e-06, "loss": 3.2319259643554688, "step": 334300 }, { "epoch": 0.40349815038209547, "learning_rate": 8.689957742656656e-06, "loss": 3.2280313110351564, "step": 334400 }, { "epoch": 0.4036188137045782, "learning_rate": 8.689553907188918e-06, "loss": 3.253345642089844, "step": 334500 }, { "epoch": 0.40373947702706087, "learning_rate": 8.68915007172118e-06, "loss": 3.239232482910156, "step": 334600 }, { "epoch": 0.40386014034954354, "learning_rate": 8.688746236253442e-06, "loss": 3.25429443359375, "step": 334700 }, { "epoch": 0.4039808036720262, "learning_rate": 8.688342400785703e-06, "loss": 3.234934997558594, "step": 334800 }, { "epoch": 0.40410146699450894, "learning_rate": 8.687938565317965e-06, "loss": 3.2206710815429687, "step": 334900 }, { "epoch": 0.4042221303169916, "learning_rate": 8.687534729850227e-06, "loss": 3.2517941284179686, "step": 335000 }, { "epoch": 0.4043427936394743, "learning_rate": 8.687130894382488e-06, "loss": 3.2393963623046873, "step": 335100 }, { "epoch": 0.40446345696195696, "learning_rate": 8.68672705891475e-06, "loss": 3.226715393066406, "step": 335200 }, { "epoch": 0.40458412028443963, "learning_rate": 8.68632322344701e-06, "loss": 3.2386956787109376, "step": 335300 }, { "epoch": 0.40470478360692236, "learning_rate": 8.685919387979272e-06, "loss": 3.2447048950195314, "step": 335400 }, { "epoch": 0.40482544692940503, "learning_rate": 8.685515552511534e-06, "loss": 3.218361511230469, "step": 335500 }, { "epoch": 0.4049461102518877, "learning_rate": 8.685111717043796e-06, "loss": 3.209727783203125, "step": 335600 }, { "epoch": 0.4050667735743704, "learning_rate": 8.684707881576058e-06, "loss": 3.227924499511719, "step": 335700 }, { "epoch": 0.40518743689685305, "learning_rate": 8.68430404610832e-06, "loss": 3.2397885131835937, "step": 335800 }, { "epoch": 0.4053081002193358, "learning_rate": 8.683900210640582e-06, "loss": 3.23482666015625, "step": 335900 }, { "epoch": 0.40542876354181845, "learning_rate": 8.683496375172842e-06, "loss": 3.214422302246094, "step": 336000 }, { "epoch": 0.4055494268643011, "learning_rate": 8.683092539705104e-06, "loss": 3.2211929321289063, "step": 336100 }, { "epoch": 0.4056700901867838, "learning_rate": 8.682688704237366e-06, "loss": 3.197298583984375, "step": 336200 }, { "epoch": 0.40579075350926647, "learning_rate": 8.682284868769626e-06, "loss": 3.244281921386719, "step": 336300 }, { "epoch": 0.4059114168317492, "learning_rate": 8.681881033301888e-06, "loss": 3.2218942260742187, "step": 336400 }, { "epoch": 0.40603208015423187, "learning_rate": 8.68147719783415e-06, "loss": 3.2383651733398438, "step": 336500 }, { "epoch": 0.40615274347671454, "learning_rate": 8.681073362366412e-06, "loss": 3.211350402832031, "step": 336600 }, { "epoch": 0.4062734067991972, "learning_rate": 8.680669526898674e-06, "loss": 3.2161904907226564, "step": 336700 }, { "epoch": 0.4063940701216799, "learning_rate": 8.680265691430935e-06, "loss": 3.2426333618164063, "step": 336800 }, { "epoch": 0.4065147334441626, "learning_rate": 8.679861855963197e-06, "loss": 3.204479064941406, "step": 336900 }, { "epoch": 0.4066353967666453, "learning_rate": 8.679458020495459e-06, "loss": 3.25840576171875, "step": 337000 }, { "epoch": 0.40675606008912796, "learning_rate": 8.67905418502772e-06, "loss": 3.205541687011719, "step": 337100 }, { "epoch": 0.40687672341161063, "learning_rate": 8.678650349559981e-06, "loss": 3.2392449951171876, "step": 337200 }, { "epoch": 0.40699738673409336, "learning_rate": 8.678246514092243e-06, "loss": 3.2341339111328127, "step": 337300 }, { "epoch": 0.40711805005657603, "learning_rate": 8.677842678624505e-06, "loss": 3.178050842285156, "step": 337400 }, { "epoch": 0.4072387133790587, "learning_rate": 8.677438843156767e-06, "loss": 3.2221990966796876, "step": 337500 }, { "epoch": 0.4073593767015414, "learning_rate": 8.677035007689027e-06, "loss": 3.2231076049804686, "step": 337600 }, { "epoch": 0.40748004002402405, "learning_rate": 8.676631172221289e-06, "loss": 3.219910888671875, "step": 337700 }, { "epoch": 0.4076007033465068, "learning_rate": 8.676227336753551e-06, "loss": 3.2170254516601564, "step": 337800 }, { "epoch": 0.40772136666898945, "learning_rate": 8.675823501285813e-06, "loss": 3.21661376953125, "step": 337900 }, { "epoch": 0.4078420299914721, "learning_rate": 8.675419665818075e-06, "loss": 3.2232647705078126, "step": 338000 }, { "epoch": 0.4079626933139548, "learning_rate": 8.675015830350337e-06, "loss": 3.235281982421875, "step": 338100 }, { "epoch": 0.40808335663643747, "learning_rate": 8.674611994882597e-06, "loss": 3.229799499511719, "step": 338200 }, { "epoch": 0.4082040199589202, "learning_rate": 8.67420815941486e-06, "loss": 3.2149139404296876, "step": 338300 }, { "epoch": 0.40832468328140287, "learning_rate": 8.67380432394712e-06, "loss": 3.2462454223632813, "step": 338400 }, { "epoch": 0.40844534660388554, "learning_rate": 8.673400488479382e-06, "loss": 3.2204629516601564, "step": 338500 }, { "epoch": 0.4085660099263682, "learning_rate": 8.672996653011644e-06, "loss": 3.2181387329101563, "step": 338600 }, { "epoch": 0.4086866732488509, "learning_rate": 8.672592817543906e-06, "loss": 3.219879455566406, "step": 338700 }, { "epoch": 0.4088073365713336, "learning_rate": 8.672188982076168e-06, "loss": 3.231728210449219, "step": 338800 }, { "epoch": 0.4089279998938163, "learning_rate": 8.67178514660843e-06, "loss": 3.204775085449219, "step": 338900 }, { "epoch": 0.40904866321629896, "learning_rate": 8.671381311140692e-06, "loss": 3.2208401489257814, "step": 339000 }, { "epoch": 0.40916932653878163, "learning_rate": 8.670977475672952e-06, "loss": 3.2086062622070313, "step": 339100 }, { "epoch": 0.4092899898612643, "learning_rate": 8.670573640205214e-06, "loss": 3.197918701171875, "step": 339200 }, { "epoch": 0.40941065318374703, "learning_rate": 8.670169804737476e-06, "loss": 3.2291751098632813, "step": 339300 }, { "epoch": 0.4095313165062297, "learning_rate": 8.669765969269736e-06, "loss": 3.208134765625, "step": 339400 }, { "epoch": 0.4096519798287124, "learning_rate": 8.669362133801998e-06, "loss": 3.2309054565429687, "step": 339500 }, { "epoch": 0.40977264315119505, "learning_rate": 8.66895829833426e-06, "loss": 3.2387905883789063, "step": 339600 }, { "epoch": 0.4098933064736777, "learning_rate": 8.668554462866522e-06, "loss": 3.212843933105469, "step": 339700 }, { "epoch": 0.41001396979616045, "learning_rate": 8.668150627398784e-06, "loss": 3.22937255859375, "step": 339800 }, { "epoch": 0.4101346331186431, "learning_rate": 8.667746791931046e-06, "loss": 3.1962744140625, "step": 339900 }, { "epoch": 0.4102552964411258, "learning_rate": 8.667342956463308e-06, "loss": 3.2106356811523438, "step": 340000 }, { "epoch": 0.41037595976360847, "learning_rate": 8.666939120995568e-06, "loss": 3.209013671875, "step": 340100 }, { "epoch": 0.4104966230860912, "learning_rate": 8.66653528552783e-06, "loss": 3.1933554077148436, "step": 340200 }, { "epoch": 0.41061728640857387, "learning_rate": 8.66613145006009e-06, "loss": 3.2256842041015625, "step": 340300 }, { "epoch": 0.41073794973105654, "learning_rate": 8.665727614592352e-06, "loss": 3.229443359375, "step": 340400 }, { "epoch": 0.4108586130535392, "learning_rate": 8.665323779124614e-06, "loss": 3.230039367675781, "step": 340500 }, { "epoch": 0.4109792763760219, "learning_rate": 8.664919943656876e-06, "loss": 3.2083975219726564, "step": 340600 }, { "epoch": 0.4110999396985046, "learning_rate": 8.664516108189138e-06, "loss": 3.2223355102539064, "step": 340700 }, { "epoch": 0.4112206030209873, "learning_rate": 8.6641122727214e-06, "loss": 3.223494567871094, "step": 340800 }, { "epoch": 0.41134126634346996, "learning_rate": 8.66370843725366e-06, "loss": 3.2406671142578123, "step": 340900 }, { "epoch": 0.41146192966595263, "learning_rate": 8.663304601785923e-06, "loss": 3.242525939941406, "step": 341000 }, { "epoch": 0.4115825929884353, "learning_rate": 8.662900766318185e-06, "loss": 3.222906494140625, "step": 341100 }, { "epoch": 0.41170325631091803, "learning_rate": 8.662496930850447e-06, "loss": 3.231730651855469, "step": 341200 }, { "epoch": 0.4118239196334007, "learning_rate": 8.662093095382707e-06, "loss": 3.198711242675781, "step": 341300 }, { "epoch": 0.4119445829558834, "learning_rate": 8.661689259914969e-06, "loss": 3.226524658203125, "step": 341400 }, { "epoch": 0.41206524627836605, "learning_rate": 8.661285424447231e-06, "loss": 3.202694091796875, "step": 341500 }, { "epoch": 0.4121859096008487, "learning_rate": 8.660881588979493e-06, "loss": 3.239063720703125, "step": 341600 }, { "epoch": 0.41230657292333145, "learning_rate": 8.660477753511753e-06, "loss": 3.2045864868164062, "step": 341700 }, { "epoch": 0.4124272362458141, "learning_rate": 8.660073918044015e-06, "loss": 3.181391296386719, "step": 341800 }, { "epoch": 0.4125478995682968, "learning_rate": 8.659670082576277e-06, "loss": 3.2037448120117187, "step": 341900 }, { "epoch": 0.41266856289077947, "learning_rate": 8.659266247108539e-06, "loss": 3.224603271484375, "step": 342000 }, { "epoch": 0.41278922621326214, "learning_rate": 8.658862411640801e-06, "loss": 3.2082894897460936, "step": 342100 }, { "epoch": 0.41290988953574487, "learning_rate": 8.658458576173061e-06, "loss": 3.183901062011719, "step": 342200 }, { "epoch": 0.41303055285822754, "learning_rate": 8.658054740705323e-06, "loss": 3.2185455322265626, "step": 342300 }, { "epoch": 0.4131512161807102, "learning_rate": 8.657650905237585e-06, "loss": 3.1830328369140624, "step": 342400 }, { "epoch": 0.4132718795031929, "learning_rate": 8.657247069769846e-06, "loss": 3.2155596923828127, "step": 342500 }, { "epoch": 0.4133925428256756, "learning_rate": 8.656843234302108e-06, "loss": 3.1984686279296874, "step": 342600 }, { "epoch": 0.4135132061481583, "learning_rate": 8.65643939883437e-06, "loss": 3.192720947265625, "step": 342700 }, { "epoch": 0.41363386947064096, "learning_rate": 8.656035563366632e-06, "loss": 3.2008929443359375, "step": 342800 }, { "epoch": 0.41375453279312363, "learning_rate": 8.655631727898894e-06, "loss": 3.2165261840820314, "step": 342900 }, { "epoch": 0.4138751961156063, "learning_rate": 8.655227892431156e-06, "loss": 3.2417007446289063, "step": 343000 }, { "epoch": 0.41399585943808903, "learning_rate": 8.654824056963418e-06, "loss": 3.205733337402344, "step": 343100 }, { "epoch": 0.4141165227605717, "learning_rate": 8.654420221495678e-06, "loss": 3.221959228515625, "step": 343200 }, { "epoch": 0.4142371860830544, "learning_rate": 8.65401638602794e-06, "loss": 3.19021728515625, "step": 343300 }, { "epoch": 0.41435784940553705, "learning_rate": 8.6536125505602e-06, "loss": 3.2108798217773438, "step": 343400 }, { "epoch": 0.4144785127280197, "learning_rate": 8.653208715092462e-06, "loss": 3.2116644287109377, "step": 343500 }, { "epoch": 0.41459917605050245, "learning_rate": 8.652804879624724e-06, "loss": 3.2212738037109374, "step": 343600 }, { "epoch": 0.4147198393729851, "learning_rate": 8.652401044156986e-06, "loss": 3.2033590698242187, "step": 343700 }, { "epoch": 0.4148405026954678, "learning_rate": 8.651997208689248e-06, "loss": 3.195982666015625, "step": 343800 }, { "epoch": 0.41496116601795047, "learning_rate": 8.65159337322151e-06, "loss": 3.2180380249023437, "step": 343900 }, { "epoch": 0.41508182934043314, "learning_rate": 8.651189537753772e-06, "loss": 3.1774774169921876, "step": 344000 }, { "epoch": 0.41520249266291587, "learning_rate": 8.650785702286032e-06, "loss": 3.210050048828125, "step": 344100 }, { "epoch": 0.41532315598539854, "learning_rate": 8.650381866818294e-06, "loss": 3.211160888671875, "step": 344200 }, { "epoch": 0.4154438193078812, "learning_rate": 8.649978031350556e-06, "loss": 3.1976614379882813, "step": 344300 }, { "epoch": 0.4155644826303639, "learning_rate": 8.649574195882817e-06, "loss": 3.190289306640625, "step": 344400 }, { "epoch": 0.41568514595284656, "learning_rate": 8.649170360415079e-06, "loss": 3.225347595214844, "step": 344500 }, { "epoch": 0.4158058092753293, "learning_rate": 8.64876652494734e-06, "loss": 3.202977294921875, "step": 344600 }, { "epoch": 0.41592647259781196, "learning_rate": 8.648362689479602e-06, "loss": 3.2093356323242186, "step": 344700 }, { "epoch": 0.41604713592029463, "learning_rate": 8.647958854011864e-06, "loss": 3.1954550170898437, "step": 344800 }, { "epoch": 0.4161677992427773, "learning_rate": 8.647555018544126e-06, "loss": 3.1998214721679688, "step": 344900 }, { "epoch": 0.41628846256526003, "learning_rate": 8.647151183076387e-06, "loss": 3.2063043212890623, "step": 345000 }, { "epoch": 0.4164091258877427, "learning_rate": 8.646747347608649e-06, "loss": 3.22114013671875, "step": 345100 }, { "epoch": 0.4165297892102254, "learning_rate": 8.64634351214091e-06, "loss": 3.223668518066406, "step": 345200 }, { "epoch": 0.41665045253270805, "learning_rate": 8.645939676673171e-06, "loss": 3.206558837890625, "step": 345300 }, { "epoch": 0.4167711158551907, "learning_rate": 8.645535841205433e-06, "loss": 3.205198059082031, "step": 345400 }, { "epoch": 0.41689177917767345, "learning_rate": 8.645132005737695e-06, "loss": 3.192651672363281, "step": 345500 }, { "epoch": 0.4170124425001561, "learning_rate": 8.644728170269957e-06, "loss": 3.2244189453125, "step": 345600 }, { "epoch": 0.4171331058226388, "learning_rate": 8.644324334802219e-06, "loss": 3.2088446044921874, "step": 345700 }, { "epoch": 0.41725376914512147, "learning_rate": 8.64392049933448e-06, "loss": 3.205760192871094, "step": 345800 }, { "epoch": 0.41737443246760414, "learning_rate": 8.643516663866741e-06, "loss": 3.2174618530273436, "step": 345900 }, { "epoch": 0.41749509579008687, "learning_rate": 8.643112828399003e-06, "loss": 3.2103399658203124, "step": 346000 }, { "epoch": 0.41761575911256954, "learning_rate": 8.642708992931265e-06, "loss": 3.2393667602539065, "step": 346100 }, { "epoch": 0.4177364224350522, "learning_rate": 8.642305157463527e-06, "loss": 3.209239196777344, "step": 346200 }, { "epoch": 0.4178570857575349, "learning_rate": 8.641901321995787e-06, "loss": 3.2006735229492187, "step": 346300 }, { "epoch": 0.41797774908001756, "learning_rate": 8.64149748652805e-06, "loss": 3.2213815307617186, "step": 346400 }, { "epoch": 0.4180984124025003, "learning_rate": 8.641093651060311e-06, "loss": 3.1774542236328127, "step": 346500 }, { "epoch": 0.41821907572498296, "learning_rate": 8.640689815592572e-06, "loss": 3.2271368408203127, "step": 346600 }, { "epoch": 0.41833973904746563, "learning_rate": 8.640285980124834e-06, "loss": 3.196385498046875, "step": 346700 }, { "epoch": 0.4184604023699483, "learning_rate": 8.639882144657096e-06, "loss": 3.2082119750976563, "step": 346800 }, { "epoch": 0.418581065692431, "learning_rate": 8.639478309189358e-06, "loss": 3.181191101074219, "step": 346900 }, { "epoch": 0.4187017290149137, "learning_rate": 8.63907447372162e-06, "loss": 3.21628173828125, "step": 347000 }, { "epoch": 0.4188223923373964, "learning_rate": 8.638670638253882e-06, "loss": 3.1893939208984374, "step": 347100 }, { "epoch": 0.41894305565987905, "learning_rate": 8.638266802786142e-06, "loss": 3.2127761840820312, "step": 347200 }, { "epoch": 0.4190637189823617, "learning_rate": 8.637862967318404e-06, "loss": 3.2235122680664063, "step": 347300 }, { "epoch": 0.4191843823048444, "learning_rate": 8.637459131850666e-06, "loss": 3.1816720581054687, "step": 347400 }, { "epoch": 0.4193050456273271, "learning_rate": 8.637055296382926e-06, "loss": 3.2108224487304686, "step": 347500 }, { "epoch": 0.4194257089498098, "learning_rate": 8.636651460915188e-06, "loss": 3.1819384765625, "step": 347600 }, { "epoch": 0.41954637227229247, "learning_rate": 8.63624762544745e-06, "loss": 3.185660705566406, "step": 347700 }, { "epoch": 0.41966703559477514, "learning_rate": 8.635843789979712e-06, "loss": 3.178056640625, "step": 347800 }, { "epoch": 0.41978769891725787, "learning_rate": 8.635439954511974e-06, "loss": 3.2183203125, "step": 347900 }, { "epoch": 0.41990836223974054, "learning_rate": 8.635036119044236e-06, "loss": 3.205784912109375, "step": 348000 }, { "epoch": 0.4200290255622232, "learning_rate": 8.634632283576498e-06, "loss": 3.205758361816406, "step": 348100 }, { "epoch": 0.4201496888847059, "learning_rate": 8.634228448108758e-06, "loss": 3.186525573730469, "step": 348200 }, { "epoch": 0.42027035220718856, "learning_rate": 8.63382461264102e-06, "loss": 3.185724182128906, "step": 348300 }, { "epoch": 0.4203910155296713, "learning_rate": 8.63342077717328e-06, "loss": 3.1968618774414064, "step": 348400 }, { "epoch": 0.42051167885215396, "learning_rate": 8.633016941705543e-06, "loss": 3.1868109130859374, "step": 348500 }, { "epoch": 0.42063234217463663, "learning_rate": 8.632613106237805e-06, "loss": 3.2233200073242188, "step": 348600 }, { "epoch": 0.4207530054971193, "learning_rate": 8.632209270770067e-06, "loss": 3.2074380493164063, "step": 348700 }, { "epoch": 0.420873668819602, "learning_rate": 8.631805435302329e-06, "loss": 3.1990170288085937, "step": 348800 }, { "epoch": 0.4209943321420847, "learning_rate": 8.63140159983459e-06, "loss": 3.205107421875, "step": 348900 }, { "epoch": 0.4211149954645674, "learning_rate": 8.63099776436685e-06, "loss": 3.180198059082031, "step": 349000 }, { "epoch": 0.42123565878705005, "learning_rate": 8.630593928899113e-06, "loss": 3.2174258422851563, "step": 349100 }, { "epoch": 0.4213563221095327, "learning_rate": 8.630190093431375e-06, "loss": 3.212493591308594, "step": 349200 }, { "epoch": 0.4214769854320154, "learning_rate": 8.629786257963637e-06, "loss": 3.188234558105469, "step": 349300 }, { "epoch": 0.4215976487544981, "learning_rate": 8.629382422495897e-06, "loss": 3.2077059936523438, "step": 349400 }, { "epoch": 0.4217183120769808, "learning_rate": 8.628978587028159e-06, "loss": 3.219124450683594, "step": 349500 }, { "epoch": 0.42183897539946347, "learning_rate": 8.628574751560421e-06, "loss": 3.2035372924804686, "step": 349600 }, { "epoch": 0.42195963872194614, "learning_rate": 8.628170916092683e-06, "loss": 3.1906072998046877, "step": 349700 }, { "epoch": 0.4220803020444288, "learning_rate": 8.627767080624943e-06, "loss": 3.204189453125, "step": 349800 }, { "epoch": 0.42220096536691154, "learning_rate": 8.627363245157205e-06, "loss": 3.211806640625, "step": 349900 }, { "epoch": 0.4223216286893942, "learning_rate": 8.626959409689467e-06, "loss": 3.218048095703125, "step": 350000 }, { "epoch": 0.4224422920118769, "learning_rate": 8.62655557422173e-06, "loss": 3.2010458374023436, "step": 350100 }, { "epoch": 0.42256295533435956, "learning_rate": 8.626151738753991e-06, "loss": 3.2027316284179688, "step": 350200 }, { "epoch": 0.4226836186568423, "learning_rate": 8.625747903286253e-06, "loss": 3.193138427734375, "step": 350300 }, { "epoch": 0.42280428197932496, "learning_rate": 8.625344067818513e-06, "loss": 3.2288323974609376, "step": 350400 }, { "epoch": 0.42292494530180763, "learning_rate": 8.624940232350775e-06, "loss": 3.1780859375, "step": 350500 }, { "epoch": 0.4230456086242903, "learning_rate": 8.624536396883037e-06, "loss": 3.2224600219726565, "step": 350600 }, { "epoch": 0.423166271946773, "learning_rate": 8.624132561415298e-06, "loss": 3.1776654052734377, "step": 350700 }, { "epoch": 0.4232869352692557, "learning_rate": 8.62372872594756e-06, "loss": 3.2015042114257812, "step": 350800 }, { "epoch": 0.4234075985917384, "learning_rate": 8.623324890479822e-06, "loss": 3.1626651000976564, "step": 350900 }, { "epoch": 0.42352826191422105, "learning_rate": 8.622921055012084e-06, "loss": 3.226488037109375, "step": 351000 }, { "epoch": 0.4236489252367037, "learning_rate": 8.622517219544346e-06, "loss": 3.1890530395507812, "step": 351100 }, { "epoch": 0.4237695885591864, "learning_rate": 8.622113384076608e-06, "loss": 3.1845584106445313, "step": 351200 }, { "epoch": 0.4238902518816691, "learning_rate": 8.621709548608868e-06, "loss": 3.2036788940429686, "step": 351300 }, { "epoch": 0.4240109152041518, "learning_rate": 8.62130571314113e-06, "loss": 3.202007141113281, "step": 351400 }, { "epoch": 0.42413157852663447, "learning_rate": 8.620901877673392e-06, "loss": 3.1648004150390623, "step": 351500 }, { "epoch": 0.42425224184911714, "learning_rate": 8.620498042205652e-06, "loss": 3.213977966308594, "step": 351600 }, { "epoch": 0.4243729051715998, "learning_rate": 8.620094206737914e-06, "loss": 3.1970068359375, "step": 351700 }, { "epoch": 0.42449356849408254, "learning_rate": 8.619690371270176e-06, "loss": 3.2080477905273437, "step": 351800 }, { "epoch": 0.4246142318165652, "learning_rate": 8.619286535802438e-06, "loss": 3.1725588989257814, "step": 351900 }, { "epoch": 0.4247348951390479, "learning_rate": 8.6188827003347e-06, "loss": 3.1949203491210936, "step": 352000 }, { "epoch": 0.42485555846153056, "learning_rate": 8.618478864866962e-06, "loss": 3.1900143432617187, "step": 352100 }, { "epoch": 0.42497622178401323, "learning_rate": 8.618075029399224e-06, "loss": 3.1891775512695313, "step": 352200 }, { "epoch": 0.42509688510649596, "learning_rate": 8.617671193931484e-06, "loss": 3.1977944946289063, "step": 352300 }, { "epoch": 0.42521754842897863, "learning_rate": 8.617267358463746e-06, "loss": 3.2065228271484374, "step": 352400 }, { "epoch": 0.4253382117514613, "learning_rate": 8.616863522996007e-06, "loss": 3.1953411865234376, "step": 352500 }, { "epoch": 0.425458875073944, "learning_rate": 8.616459687528269e-06, "loss": 3.1885186767578126, "step": 352600 }, { "epoch": 0.42557953839642665, "learning_rate": 8.61605585206053e-06, "loss": 3.1860955810546874, "step": 352700 }, { "epoch": 0.4257002017189094, "learning_rate": 8.615652016592793e-06, "loss": 3.1615304565429687, "step": 352800 }, { "epoch": 0.42582086504139205, "learning_rate": 8.615248181125055e-06, "loss": 3.2005215454101563, "step": 352900 }, { "epoch": 0.4259415283638747, "learning_rate": 8.614844345657317e-06, "loss": 3.1655239868164062, "step": 353000 }, { "epoch": 0.4260621916863574, "learning_rate": 8.614440510189577e-06, "loss": 3.1802490234375, "step": 353100 }, { "epoch": 0.4261828550088401, "learning_rate": 8.614036674721839e-06, "loss": 3.1738934326171875, "step": 353200 }, { "epoch": 0.4263035183313228, "learning_rate": 8.6136328392541e-06, "loss": 3.1935418701171874, "step": 353300 }, { "epoch": 0.42642418165380547, "learning_rate": 8.613229003786363e-06, "loss": 3.168765869140625, "step": 353400 }, { "epoch": 0.42654484497628814, "learning_rate": 8.612825168318623e-06, "loss": 3.1861041259765623, "step": 353500 }, { "epoch": 0.4266655082987708, "learning_rate": 8.612421332850885e-06, "loss": 3.189508972167969, "step": 353600 }, { "epoch": 0.42678617162125354, "learning_rate": 8.612017497383147e-06, "loss": 3.197337341308594, "step": 353700 }, { "epoch": 0.4269068349437362, "learning_rate": 8.611613661915409e-06, "loss": 3.181391296386719, "step": 353800 }, { "epoch": 0.4270274982662189, "learning_rate": 8.61120982644767e-06, "loss": 3.1841604614257815, "step": 353900 }, { "epoch": 0.42714816158870156, "learning_rate": 8.610805990979931e-06, "loss": 3.198205871582031, "step": 354000 }, { "epoch": 0.42726882491118423, "learning_rate": 8.610402155512193e-06, "loss": 3.211336975097656, "step": 354100 }, { "epoch": 0.42738948823366696, "learning_rate": 8.609998320044455e-06, "loss": 3.149882507324219, "step": 354200 }, { "epoch": 0.42751015155614963, "learning_rate": 8.609594484576717e-06, "loss": 3.202339782714844, "step": 354300 }, { "epoch": 0.4276308148786323, "learning_rate": 8.609190649108978e-06, "loss": 3.196155700683594, "step": 354400 }, { "epoch": 0.427751478201115, "learning_rate": 8.60878681364124e-06, "loss": 3.178345947265625, "step": 354500 }, { "epoch": 0.42787214152359765, "learning_rate": 8.608382978173501e-06, "loss": 3.175726318359375, "step": 354600 }, { "epoch": 0.4279928048460804, "learning_rate": 8.607979142705762e-06, "loss": 3.1696160888671874, "step": 354700 }, { "epoch": 0.42811346816856305, "learning_rate": 8.607575307238024e-06, "loss": 3.1580960083007814, "step": 354800 }, { "epoch": 0.4282341314910457, "learning_rate": 8.607171471770286e-06, "loss": 3.1801498413085936, "step": 354900 }, { "epoch": 0.4283547948135284, "learning_rate": 8.606767636302548e-06, "loss": 3.204053955078125, "step": 355000 }, { "epoch": 0.42847545813601107, "learning_rate": 8.60636380083481e-06, "loss": 3.1976077270507814, "step": 355100 }, { "epoch": 0.4285961214584938, "learning_rate": 8.605959965367072e-06, "loss": 3.179556579589844, "step": 355200 }, { "epoch": 0.42871678478097647, "learning_rate": 8.605556129899334e-06, "loss": 3.15634033203125, "step": 355300 }, { "epoch": 0.42883744810345914, "learning_rate": 8.605152294431594e-06, "loss": 3.1712017822265626, "step": 355400 }, { "epoch": 0.4289581114259418, "learning_rate": 8.604748458963856e-06, "loss": 3.194010925292969, "step": 355500 }, { "epoch": 0.42907877474842454, "learning_rate": 8.604344623496116e-06, "loss": 3.1828439331054685, "step": 355600 }, { "epoch": 0.4291994380709072, "learning_rate": 8.603940788028378e-06, "loss": 3.1830108642578123, "step": 355700 }, { "epoch": 0.4293201013933899, "learning_rate": 8.60353695256064e-06, "loss": 3.218525390625, "step": 355800 }, { "epoch": 0.42944076471587256, "learning_rate": 8.603133117092902e-06, "loss": 3.1855133056640623, "step": 355900 }, { "epoch": 0.42956142803835523, "learning_rate": 8.602729281625164e-06, "loss": 3.20457763671875, "step": 356000 }, { "epoch": 0.42968209136083796, "learning_rate": 8.602325446157426e-06, "loss": 3.16480224609375, "step": 356100 }, { "epoch": 0.42980275468332063, "learning_rate": 8.601921610689688e-06, "loss": 3.1808721923828127, "step": 356200 }, { "epoch": 0.4299234180058033, "learning_rate": 8.601517775221948e-06, "loss": 3.193555908203125, "step": 356300 }, { "epoch": 0.430044081328286, "learning_rate": 8.60111393975421e-06, "loss": 3.164589538574219, "step": 356400 }, { "epoch": 0.43016474465076865, "learning_rate": 8.600710104286472e-06, "loss": 3.199861755371094, "step": 356500 }, { "epoch": 0.4302854079732514, "learning_rate": 8.600306268818733e-06, "loss": 3.16435302734375, "step": 356600 }, { "epoch": 0.43040607129573405, "learning_rate": 8.599902433350995e-06, "loss": 3.188094177246094, "step": 356700 }, { "epoch": 0.4305267346182167, "learning_rate": 8.599498597883257e-06, "loss": 3.175874938964844, "step": 356800 }, { "epoch": 0.4306473979406994, "learning_rate": 8.599094762415519e-06, "loss": 3.1786093139648437, "step": 356900 }, { "epoch": 0.43076806126318207, "learning_rate": 8.59869092694778e-06, "loss": 3.161024475097656, "step": 357000 }, { "epoch": 0.4308887245856648, "learning_rate": 8.598287091480043e-06, "loss": 3.1848822021484375, "step": 357100 }, { "epoch": 0.43100938790814747, "learning_rate": 8.597883256012303e-06, "loss": 3.173997802734375, "step": 357200 }, { "epoch": 0.43113005123063014, "learning_rate": 8.597479420544565e-06, "loss": 3.179041442871094, "step": 357300 }, { "epoch": 0.4312507145531128, "learning_rate": 8.597075585076827e-06, "loss": 3.166010437011719, "step": 357400 }, { "epoch": 0.4313713778755955, "learning_rate": 8.596671749609087e-06, "loss": 3.1589715576171873, "step": 357500 }, { "epoch": 0.4314920411980782, "learning_rate": 8.596267914141349e-06, "loss": 3.189253234863281, "step": 357600 }, { "epoch": 0.4316127045205609, "learning_rate": 8.595864078673611e-06, "loss": 3.1857418823242187, "step": 357700 }, { "epoch": 0.43173336784304356, "learning_rate": 8.595460243205873e-06, "loss": 3.1790679931640624, "step": 357800 }, { "epoch": 0.43185403116552623, "learning_rate": 8.595056407738135e-06, "loss": 3.1831463623046874, "step": 357900 }, { "epoch": 0.43197469448800896, "learning_rate": 8.594652572270395e-06, "loss": 3.1714358520507813, "step": 358000 }, { "epoch": 0.43209535781049163, "learning_rate": 8.594248736802657e-06, "loss": 3.189139099121094, "step": 358100 }, { "epoch": 0.4322160211329743, "learning_rate": 8.59384490133492e-06, "loss": 3.1406118774414065, "step": 358200 }, { "epoch": 0.432336684455457, "learning_rate": 8.593441065867181e-06, "loss": 3.1500439453125, "step": 358300 }, { "epoch": 0.43245734777793965, "learning_rate": 8.593037230399443e-06, "loss": 3.208973693847656, "step": 358400 }, { "epoch": 0.4325780111004224, "learning_rate": 8.592633394931704e-06, "loss": 3.1829348754882814, "step": 358500 }, { "epoch": 0.43269867442290505, "learning_rate": 8.592229559463966e-06, "loss": 3.1675155639648436, "step": 358600 }, { "epoch": 0.4328193377453877, "learning_rate": 8.591825723996228e-06, "loss": 3.153431701660156, "step": 358700 }, { "epoch": 0.4329400010678704, "learning_rate": 8.591421888528488e-06, "loss": 3.1683740234375, "step": 358800 }, { "epoch": 0.43306066439035307, "learning_rate": 8.59101805306075e-06, "loss": 3.2201156616210938, "step": 358900 }, { "epoch": 0.4331813277128358, "learning_rate": 8.590614217593012e-06, "loss": 3.1861221313476564, "step": 359000 }, { "epoch": 0.43330199103531847, "learning_rate": 8.590210382125274e-06, "loss": 3.2081201171875, "step": 359100 }, { "epoch": 0.43342265435780114, "learning_rate": 8.589806546657536e-06, "loss": 3.2040924072265624, "step": 359200 }, { "epoch": 0.4335433176802838, "learning_rate": 8.589402711189798e-06, "loss": 3.16206298828125, "step": 359300 }, { "epoch": 0.4336639810027665, "learning_rate": 8.588998875722058e-06, "loss": 3.1880618286132814, "step": 359400 }, { "epoch": 0.4337846443252492, "learning_rate": 8.58859504025432e-06, "loss": 3.1820343017578123, "step": 359500 }, { "epoch": 0.4339053076477319, "learning_rate": 8.588191204786582e-06, "loss": 3.1609405517578124, "step": 359600 }, { "epoch": 0.43402597097021456, "learning_rate": 8.587787369318842e-06, "loss": 3.1588265991210935, "step": 359700 }, { "epoch": 0.43414663429269723, "learning_rate": 8.587383533851104e-06, "loss": 3.148121032714844, "step": 359800 }, { "epoch": 0.4342672976151799, "learning_rate": 8.586979698383366e-06, "loss": 3.1572726440429686, "step": 359900 }, { "epoch": 0.43438796093766263, "learning_rate": 8.586575862915628e-06, "loss": 3.2002822875976564, "step": 360000 }, { "epoch": 0.4345086242601453, "learning_rate": 8.58617202744789e-06, "loss": 3.180852966308594, "step": 360100 }, { "epoch": 0.434629287582628, "learning_rate": 8.585768191980152e-06, "loss": 3.173353576660156, "step": 360200 }, { "epoch": 0.43474995090511065, "learning_rate": 8.585364356512414e-06, "loss": 3.1801852416992187, "step": 360300 }, { "epoch": 0.4348706142275933, "learning_rate": 8.584960521044674e-06, "loss": 3.172731628417969, "step": 360400 }, { "epoch": 0.43499127755007605, "learning_rate": 8.584556685576936e-06, "loss": 3.1771340942382813, "step": 360500 }, { "epoch": 0.4351119408725587, "learning_rate": 8.584152850109197e-06, "loss": 3.1508392333984374, "step": 360600 }, { "epoch": 0.4352326041950414, "learning_rate": 8.583749014641459e-06, "loss": 3.1647915649414062, "step": 360700 }, { "epoch": 0.43535326751752407, "learning_rate": 8.58334517917372e-06, "loss": 3.1881646728515625, "step": 360800 }, { "epoch": 0.4354739308400068, "learning_rate": 8.582941343705983e-06, "loss": 3.12959716796875, "step": 360900 }, { "epoch": 0.43559459416248947, "learning_rate": 8.582537508238245e-06, "loss": 3.2009005737304688, "step": 361000 }, { "epoch": 0.43571525748497214, "learning_rate": 8.582133672770507e-06, "loss": 3.1655712890625, "step": 361100 }, { "epoch": 0.4358359208074548, "learning_rate": 8.581729837302769e-06, "loss": 3.142994384765625, "step": 361200 }, { "epoch": 0.4359565841299375, "learning_rate": 8.581326001835029e-06, "loss": 3.1704888916015626, "step": 361300 }, { "epoch": 0.4360772474524202, "learning_rate": 8.580922166367291e-06, "loss": 3.151007080078125, "step": 361400 }, { "epoch": 0.4361979107749029, "learning_rate": 8.580518330899553e-06, "loss": 3.16232666015625, "step": 361500 }, { "epoch": 0.43631857409738556, "learning_rate": 8.580114495431813e-06, "loss": 3.1726116943359375, "step": 361600 }, { "epoch": 0.43643923741986823, "learning_rate": 8.579710659964075e-06, "loss": 3.1850286865234376, "step": 361700 }, { "epoch": 0.4365599007423509, "learning_rate": 8.579306824496337e-06, "loss": 3.180714416503906, "step": 361800 }, { "epoch": 0.43668056406483363, "learning_rate": 8.578902989028599e-06, "loss": 3.177583923339844, "step": 361900 }, { "epoch": 0.4368012273873163, "learning_rate": 8.578499153560861e-06, "loss": 3.175817565917969, "step": 362000 }, { "epoch": 0.436921890709799, "learning_rate": 8.578095318093121e-06, "loss": 3.182248840332031, "step": 362100 }, { "epoch": 0.43704255403228165, "learning_rate": 8.577691482625383e-06, "loss": 3.1497857666015623, "step": 362200 }, { "epoch": 0.4371632173547643, "learning_rate": 8.577287647157645e-06, "loss": 3.1653057861328127, "step": 362300 }, { "epoch": 0.43728388067724705, "learning_rate": 8.576883811689907e-06, "loss": 3.191617431640625, "step": 362400 }, { "epoch": 0.4374045439997297, "learning_rate": 8.576479976222168e-06, "loss": 3.169830017089844, "step": 362500 }, { "epoch": 0.4375252073222124, "learning_rate": 8.57607614075443e-06, "loss": 3.199478759765625, "step": 362600 }, { "epoch": 0.43764587064469507, "learning_rate": 8.575672305286692e-06, "loss": 3.1641168212890625, "step": 362700 }, { "epoch": 0.43776653396717774, "learning_rate": 8.575268469818954e-06, "loss": 3.182425842285156, "step": 362800 }, { "epoch": 0.43788719728966047, "learning_rate": 8.574864634351214e-06, "loss": 3.176493835449219, "step": 362900 }, { "epoch": 0.43800786061214314, "learning_rate": 8.574460798883476e-06, "loss": 3.163438415527344, "step": 363000 }, { "epoch": 0.4381285239346258, "learning_rate": 8.574056963415738e-06, "loss": 3.163382568359375, "step": 363100 }, { "epoch": 0.4382491872571085, "learning_rate": 8.573653127948e-06, "loss": 3.1730023193359376, "step": 363200 }, { "epoch": 0.4383698505795912, "learning_rate": 8.573249292480262e-06, "loss": 3.1458984375, "step": 363300 }, { "epoch": 0.4384905139020739, "learning_rate": 8.572845457012524e-06, "loss": 3.185274963378906, "step": 363400 }, { "epoch": 0.43861117722455656, "learning_rate": 8.572441621544784e-06, "loss": 3.1657293701171874, "step": 363500 }, { "epoch": 0.43873184054703923, "learning_rate": 8.572037786077046e-06, "loss": 3.1654953002929687, "step": 363600 }, { "epoch": 0.4388525038695219, "learning_rate": 8.571633950609306e-06, "loss": 3.162891540527344, "step": 363700 }, { "epoch": 0.43897316719200463, "learning_rate": 8.571230115141568e-06, "loss": 3.1667965698242186, "step": 363800 }, { "epoch": 0.4390938305144873, "learning_rate": 8.57082627967383e-06, "loss": 3.185269775390625, "step": 363900 }, { "epoch": 0.43921449383697, "learning_rate": 8.570422444206092e-06, "loss": 3.1614620971679686, "step": 364000 }, { "epoch": 0.43933515715945265, "learning_rate": 8.570018608738354e-06, "loss": 3.1583599853515625, "step": 364100 }, { "epoch": 0.4394558204819353, "learning_rate": 8.569614773270616e-06, "loss": 3.1524197387695314, "step": 364200 }, { "epoch": 0.43957648380441805, "learning_rate": 8.569210937802878e-06, "loss": 3.1714382934570313, "step": 364300 }, { "epoch": 0.4396971471269007, "learning_rate": 8.56880710233514e-06, "loss": 3.1352389526367186, "step": 364400 }, { "epoch": 0.4398178104493834, "learning_rate": 8.5684032668674e-06, "loss": 3.155145568847656, "step": 364500 }, { "epoch": 0.43993847377186607, "learning_rate": 8.567999431399662e-06, "loss": 3.165085754394531, "step": 364600 }, { "epoch": 0.44005913709434874, "learning_rate": 8.567595595931923e-06, "loss": 3.1434954833984374, "step": 364700 }, { "epoch": 0.44017980041683147, "learning_rate": 8.567191760464185e-06, "loss": 3.1698394775390626, "step": 364800 }, { "epoch": 0.44030046373931414, "learning_rate": 8.566787924996447e-06, "loss": 3.172398681640625, "step": 364900 }, { "epoch": 0.4404211270617968, "learning_rate": 8.566384089528709e-06, "loss": 3.1468621826171876, "step": 365000 }, { "epoch": 0.4405417903842795, "learning_rate": 8.56598025406097e-06, "loss": 3.1481427001953124, "step": 365100 }, { "epoch": 0.44066245370676216, "learning_rate": 8.565576418593233e-06, "loss": 3.1734017944335937, "step": 365200 }, { "epoch": 0.4407831170292449, "learning_rate": 8.565172583125495e-06, "loss": 3.161773681640625, "step": 365300 }, { "epoch": 0.44090378035172756, "learning_rate": 8.564768747657755e-06, "loss": 3.16112060546875, "step": 365400 }, { "epoch": 0.44102444367421023, "learning_rate": 8.564364912190017e-06, "loss": 3.160003356933594, "step": 365500 }, { "epoch": 0.4411451069966929, "learning_rate": 8.563961076722279e-06, "loss": 3.1549221801757814, "step": 365600 }, { "epoch": 0.4412657703191756, "learning_rate": 8.56355724125454e-06, "loss": 3.1470736694335937, "step": 365700 }, { "epoch": 0.4413864336416583, "learning_rate": 8.563153405786801e-06, "loss": 3.1689163208007813, "step": 365800 }, { "epoch": 0.441507096964141, "learning_rate": 8.562749570319063e-06, "loss": 3.151278076171875, "step": 365900 }, { "epoch": 0.44162776028662365, "learning_rate": 8.562345734851325e-06, "loss": 3.18524658203125, "step": 366000 }, { "epoch": 0.4417484236091063, "learning_rate": 8.561941899383587e-06, "loss": 3.165556640625, "step": 366100 }, { "epoch": 0.44186908693158905, "learning_rate": 8.561538063915847e-06, "loss": 3.1412313842773436, "step": 366200 }, { "epoch": 0.4419897502540717, "learning_rate": 8.56113422844811e-06, "loss": 3.1581845092773437, "step": 366300 }, { "epoch": 0.4421104135765544, "learning_rate": 8.560730392980371e-06, "loss": 3.1530862426757813, "step": 366400 }, { "epoch": 0.44223107689903707, "learning_rate": 8.560326557512633e-06, "loss": 3.1590106201171877, "step": 366500 }, { "epoch": 0.44235174022151974, "learning_rate": 8.559922722044894e-06, "loss": 3.1573910522460937, "step": 366600 }, { "epoch": 0.44247240354400247, "learning_rate": 8.559518886577156e-06, "loss": 3.164007263183594, "step": 366700 }, { "epoch": 0.44259306686648514, "learning_rate": 8.559115051109418e-06, "loss": 3.171766662597656, "step": 366800 }, { "epoch": 0.4427137301889678, "learning_rate": 8.55871121564168e-06, "loss": 3.141598815917969, "step": 366900 }, { "epoch": 0.4428343935114505, "learning_rate": 8.55830738017394e-06, "loss": 3.174053039550781, "step": 367000 }, { "epoch": 0.44295505683393316, "learning_rate": 8.557903544706202e-06, "loss": 3.1652215576171874, "step": 367100 }, { "epoch": 0.4430757201564159, "learning_rate": 8.557499709238464e-06, "loss": 3.15250244140625, "step": 367200 }, { "epoch": 0.44319638347889856, "learning_rate": 8.557095873770726e-06, "loss": 3.1612918090820314, "step": 367300 }, { "epoch": 0.44331704680138123, "learning_rate": 8.556692038302988e-06, "loss": 3.167114562988281, "step": 367400 }, { "epoch": 0.4434377101238639, "learning_rate": 8.55628820283525e-06, "loss": 3.20229248046875, "step": 367500 }, { "epoch": 0.4435583734463466, "learning_rate": 8.55588436736751e-06, "loss": 3.1544873046875, "step": 367600 }, { "epoch": 0.4436790367688293, "learning_rate": 8.555480531899772e-06, "loss": 3.155821533203125, "step": 367700 }, { "epoch": 0.443799700091312, "learning_rate": 8.555076696432032e-06, "loss": 3.1639593505859374, "step": 367800 }, { "epoch": 0.44392036341379465, "learning_rate": 8.554672860964294e-06, "loss": 3.1481503295898436, "step": 367900 }, { "epoch": 0.4440410267362773, "learning_rate": 8.554269025496556e-06, "loss": 3.1459994506835938, "step": 368000 }, { "epoch": 0.44416169005876, "learning_rate": 8.553865190028818e-06, "loss": 3.171048889160156, "step": 368100 }, { "epoch": 0.4442823533812427, "learning_rate": 8.55346135456108e-06, "loss": 3.1597695922851563, "step": 368200 }, { "epoch": 0.4444030167037254, "learning_rate": 8.553057519093342e-06, "loss": 3.1739923095703126, "step": 368300 }, { "epoch": 0.44452368002620807, "learning_rate": 8.552653683625604e-06, "loss": 3.160904541015625, "step": 368400 }, { "epoch": 0.44464434334869074, "learning_rate": 8.552249848157865e-06, "loss": 3.1608096313476564, "step": 368500 }, { "epoch": 0.44476500667117347, "learning_rate": 8.551846012690127e-06, "loss": 3.1560687255859374, "step": 368600 }, { "epoch": 0.44488566999365614, "learning_rate": 8.551442177222388e-06, "loss": 3.1521368408203125, "step": 368700 }, { "epoch": 0.4450063333161388, "learning_rate": 8.551038341754649e-06, "loss": 3.1734774780273436, "step": 368800 }, { "epoch": 0.4451269966386215, "learning_rate": 8.55063450628691e-06, "loss": 3.1270574951171874, "step": 368900 }, { "epoch": 0.44524765996110416, "learning_rate": 8.550230670819173e-06, "loss": 3.16264404296875, "step": 369000 }, { "epoch": 0.4453683232835869, "learning_rate": 8.549826835351435e-06, "loss": 3.163631591796875, "step": 369100 }, { "epoch": 0.44548898660606956, "learning_rate": 8.549422999883697e-06, "loss": 3.1469546508789064, "step": 369200 }, { "epoch": 0.44560964992855223, "learning_rate": 8.549019164415959e-06, "loss": 3.161377258300781, "step": 369300 }, { "epoch": 0.4457303132510349, "learning_rate": 8.548615328948219e-06, "loss": 3.173736877441406, "step": 369400 }, { "epoch": 0.4458509765735176, "learning_rate": 8.548211493480481e-06, "loss": 3.159951477050781, "step": 369500 }, { "epoch": 0.4459716398960003, "learning_rate": 8.547807658012743e-06, "loss": 3.1467889404296874, "step": 369600 }, { "epoch": 0.446092303218483, "learning_rate": 8.547403822545003e-06, "loss": 3.132040710449219, "step": 369700 }, { "epoch": 0.44621296654096565, "learning_rate": 8.546999987077265e-06, "loss": 3.169666748046875, "step": 369800 }, { "epoch": 0.4463336298634483, "learning_rate": 8.546596151609527e-06, "loss": 3.1499310302734376, "step": 369900 }, { "epoch": 0.446454293185931, "learning_rate": 8.54619231614179e-06, "loss": 3.154795837402344, "step": 370000 }, { "epoch": 0.4465749565084137, "learning_rate": 8.545788480674051e-06, "loss": 3.162998046875, "step": 370100 }, { "epoch": 0.4466956198308964, "learning_rate": 8.545384645206311e-06, "loss": 3.1742813110351564, "step": 370200 }, { "epoch": 0.44681628315337907, "learning_rate": 8.544980809738573e-06, "loss": 3.151202392578125, "step": 370300 }, { "epoch": 0.44693694647586174, "learning_rate": 8.544576974270835e-06, "loss": 3.169294738769531, "step": 370400 }, { "epoch": 0.4470576097983444, "learning_rate": 8.544173138803097e-06, "loss": 3.1597335815429686, "step": 370500 }, { "epoch": 0.44717827312082714, "learning_rate": 8.54376930333536e-06, "loss": 3.1634405517578124, "step": 370600 }, { "epoch": 0.4472989364433098, "learning_rate": 8.54336546786762e-06, "loss": 3.171553955078125, "step": 370700 }, { "epoch": 0.4474195997657925, "learning_rate": 8.542961632399882e-06, "loss": 3.1269326782226563, "step": 370800 }, { "epoch": 0.44754026308827516, "learning_rate": 8.542557796932144e-06, "loss": 3.1421353149414064, "step": 370900 }, { "epoch": 0.4476609264107579, "learning_rate": 8.542153961464406e-06, "loss": 3.181333312988281, "step": 371000 }, { "epoch": 0.44778158973324056, "learning_rate": 8.541750125996666e-06, "loss": 3.144024658203125, "step": 371100 }, { "epoch": 0.44790225305572323, "learning_rate": 8.541346290528928e-06, "loss": 3.155126037597656, "step": 371200 }, { "epoch": 0.4480229163782059, "learning_rate": 8.54094245506119e-06, "loss": 3.1495547485351563, "step": 371300 }, { "epoch": 0.4481435797006886, "learning_rate": 8.540538619593452e-06, "loss": 3.1388092041015625, "step": 371400 }, { "epoch": 0.4482642430231713, "learning_rate": 8.540134784125714e-06, "loss": 3.139412841796875, "step": 371500 }, { "epoch": 0.448384906345654, "learning_rate": 8.539730948657974e-06, "loss": 3.142877197265625, "step": 371600 }, { "epoch": 0.44850556966813665, "learning_rate": 8.539327113190236e-06, "loss": 3.1486831665039063, "step": 371700 }, { "epoch": 0.4486262329906193, "learning_rate": 8.538923277722498e-06, "loss": 3.1674664306640623, "step": 371800 }, { "epoch": 0.448746896313102, "learning_rate": 8.538519442254758e-06, "loss": 3.1398745727539064, "step": 371900 }, { "epoch": 0.4488675596355847, "learning_rate": 8.53811560678702e-06, "loss": 3.159801025390625, "step": 372000 }, { "epoch": 0.4489882229580674, "learning_rate": 8.537711771319282e-06, "loss": 3.141025390625, "step": 372100 }, { "epoch": 0.44910888628055007, "learning_rate": 8.537307935851544e-06, "loss": 3.1711880493164064, "step": 372200 }, { "epoch": 0.44922954960303274, "learning_rate": 8.536904100383806e-06, "loss": 3.163363037109375, "step": 372300 }, { "epoch": 0.4493502129255154, "learning_rate": 8.536500264916068e-06, "loss": 3.156895751953125, "step": 372400 }, { "epoch": 0.44947087624799814, "learning_rate": 8.53609642944833e-06, "loss": 3.151407470703125, "step": 372500 }, { "epoch": 0.4495915395704808, "learning_rate": 8.53569259398059e-06, "loss": 3.171239013671875, "step": 372600 }, { "epoch": 0.4497122028929635, "learning_rate": 8.535288758512853e-06, "loss": 3.171841735839844, "step": 372700 }, { "epoch": 0.44983286621544616, "learning_rate": 8.534884923045113e-06, "loss": 3.154608154296875, "step": 372800 }, { "epoch": 0.44995352953792883, "learning_rate": 8.534481087577375e-06, "loss": 3.1462692260742187, "step": 372900 }, { "epoch": 0.45007419286041156, "learning_rate": 8.534077252109637e-06, "loss": 3.1602447509765623, "step": 373000 }, { "epoch": 0.45019485618289423, "learning_rate": 8.533673416641899e-06, "loss": 3.143274230957031, "step": 373100 }, { "epoch": 0.4503155195053769, "learning_rate": 8.53326958117416e-06, "loss": 3.123106689453125, "step": 373200 }, { "epoch": 0.4504361828278596, "learning_rate": 8.532865745706423e-06, "loss": 3.1546035766601563, "step": 373300 }, { "epoch": 0.45055684615034225, "learning_rate": 8.532461910238685e-06, "loss": 3.1678475952148437, "step": 373400 }, { "epoch": 0.450677509472825, "learning_rate": 8.532058074770945e-06, "loss": 3.1607479858398437, "step": 373500 }, { "epoch": 0.45079817279530765, "learning_rate": 8.531654239303207e-06, "loss": 3.16156005859375, "step": 373600 }, { "epoch": 0.4509188361177903, "learning_rate": 8.531250403835469e-06, "loss": 3.14201416015625, "step": 373700 }, { "epoch": 0.451039499440273, "learning_rate": 8.53084656836773e-06, "loss": 3.137664489746094, "step": 373800 }, { "epoch": 0.4511601627627557, "learning_rate": 8.530442732899991e-06, "loss": 3.1570562744140624, "step": 373900 }, { "epoch": 0.4512808260852384, "learning_rate": 8.530038897432253e-06, "loss": 3.12742919921875, "step": 374000 }, { "epoch": 0.45140148940772107, "learning_rate": 8.529635061964515e-06, "loss": 3.1410791015625, "step": 374100 }, { "epoch": 0.45152215273020374, "learning_rate": 8.529231226496777e-06, "loss": 3.154504699707031, "step": 374200 }, { "epoch": 0.4516428160526864, "learning_rate": 8.528827391029037e-06, "loss": 3.14399169921875, "step": 374300 }, { "epoch": 0.45176347937516914, "learning_rate": 8.5284235555613e-06, "loss": 3.1732467651367187, "step": 374400 }, { "epoch": 0.4518841426976518, "learning_rate": 8.528019720093561e-06, "loss": 3.139784240722656, "step": 374500 }, { "epoch": 0.4520048060201345, "learning_rate": 8.527615884625823e-06, "loss": 3.146400146484375, "step": 374600 }, { "epoch": 0.45212546934261716, "learning_rate": 8.527212049158084e-06, "loss": 3.155608825683594, "step": 374700 }, { "epoch": 0.45224613266509983, "learning_rate": 8.526808213690346e-06, "loss": 3.1358660888671874, "step": 374800 }, { "epoch": 0.45236679598758256, "learning_rate": 8.526404378222608e-06, "loss": 3.165531005859375, "step": 374900 }, { "epoch": 0.45248745931006523, "learning_rate": 8.52600054275487e-06, "loss": 3.11739013671875, "step": 375000 }, { "epoch": 0.4526081226325479, "learning_rate": 8.52559670728713e-06, "loss": 3.1539596557617187, "step": 375100 }, { "epoch": 0.4527287859550306, "learning_rate": 8.525192871819392e-06, "loss": 3.1415203857421874, "step": 375200 }, { "epoch": 0.45284944927751325, "learning_rate": 8.524789036351654e-06, "loss": 3.14402587890625, "step": 375300 }, { "epoch": 0.452970112599996, "learning_rate": 8.524385200883916e-06, "loss": 3.143804931640625, "step": 375400 }, { "epoch": 0.45309077592247865, "learning_rate": 8.523981365416178e-06, "loss": 3.127929382324219, "step": 375500 }, { "epoch": 0.4532114392449613, "learning_rate": 8.52357752994844e-06, "loss": 3.1357431030273437, "step": 375600 }, { "epoch": 0.453332102567444, "learning_rate": 8.5231736944807e-06, "loss": 3.1591168212890626, "step": 375700 }, { "epoch": 0.45345276588992667, "learning_rate": 8.522769859012962e-06, "loss": 3.1183770751953124, "step": 375800 }, { "epoch": 0.4535734292124094, "learning_rate": 8.522366023545224e-06, "loss": 3.164037780761719, "step": 375900 }, { "epoch": 0.45369409253489207, "learning_rate": 8.521962188077484e-06, "loss": 3.135923156738281, "step": 376000 }, { "epoch": 0.45381475585737474, "learning_rate": 8.521558352609746e-06, "loss": 3.126140441894531, "step": 376100 }, { "epoch": 0.4539354191798574, "learning_rate": 8.521154517142008e-06, "loss": 3.12957275390625, "step": 376200 }, { "epoch": 0.45405608250234014, "learning_rate": 8.52075068167427e-06, "loss": 3.1425747680664062, "step": 376300 }, { "epoch": 0.4541767458248228, "learning_rate": 8.520346846206532e-06, "loss": 3.1216506958007812, "step": 376400 }, { "epoch": 0.4542974091473055, "learning_rate": 8.519943010738794e-06, "loss": 3.1401470947265624, "step": 376500 }, { "epoch": 0.45441807246978816, "learning_rate": 8.519539175271055e-06, "loss": 3.150085144042969, "step": 376600 }, { "epoch": 0.45453873579227083, "learning_rate": 8.519135339803317e-06, "loss": 3.127613525390625, "step": 376700 }, { "epoch": 0.45465939911475356, "learning_rate": 8.518731504335579e-06, "loss": 3.1407650756835936, "step": 376800 }, { "epoch": 0.45478006243723623, "learning_rate": 8.518327668867839e-06, "loss": 3.147749938964844, "step": 376900 }, { "epoch": 0.4549007257597189, "learning_rate": 8.5179238334001e-06, "loss": 3.1725, "step": 377000 }, { "epoch": 0.4550213890822016, "learning_rate": 8.517519997932363e-06, "loss": 3.126537170410156, "step": 377100 }, { "epoch": 0.45514205240468425, "learning_rate": 8.517116162464625e-06, "loss": 3.153029479980469, "step": 377200 }, { "epoch": 0.455262715727167, "learning_rate": 8.516712326996887e-06, "loss": 3.0733352661132813, "step": 377300 }, { "epoch": 0.45538337904964965, "learning_rate": 8.516308491529149e-06, "loss": 3.164046630859375, "step": 377400 }, { "epoch": 0.4555040423721323, "learning_rate": 8.51590465606141e-06, "loss": 3.1463336181640624, "step": 377500 }, { "epoch": 0.455624705694615, "learning_rate": 8.515500820593671e-06, "loss": 3.1542959594726563, "step": 377600 }, { "epoch": 0.45574536901709767, "learning_rate": 8.515096985125933e-06, "loss": 3.1383633422851562, "step": 377700 }, { "epoch": 0.4558660323395804, "learning_rate": 8.514693149658193e-06, "loss": 3.134474182128906, "step": 377800 }, { "epoch": 0.45598669566206307, "learning_rate": 8.514289314190455e-06, "loss": 3.1476385498046877, "step": 377900 }, { "epoch": 0.45610735898454574, "learning_rate": 8.513885478722717e-06, "loss": 3.119512939453125, "step": 378000 }, { "epoch": 0.4562280223070284, "learning_rate": 8.51348164325498e-06, "loss": 3.1564996337890623, "step": 378100 }, { "epoch": 0.4563486856295111, "learning_rate": 8.513077807787241e-06, "loss": 3.1333682250976564, "step": 378200 }, { "epoch": 0.4564693489519938, "learning_rate": 8.512673972319503e-06, "loss": 3.143529052734375, "step": 378300 }, { "epoch": 0.4565900122744765, "learning_rate": 8.512270136851764e-06, "loss": 3.1058917236328125, "step": 378400 }, { "epoch": 0.45671067559695916, "learning_rate": 8.511866301384025e-06, "loss": 3.1404119873046876, "step": 378500 }, { "epoch": 0.45683133891944183, "learning_rate": 8.511462465916287e-06, "loss": 3.129571533203125, "step": 378600 }, { "epoch": 0.4569520022419245, "learning_rate": 8.51105863044855e-06, "loss": 3.1644186401367187, "step": 378700 }, { "epoch": 0.45707266556440723, "learning_rate": 8.51065479498081e-06, "loss": 3.132996826171875, "step": 378800 }, { "epoch": 0.4571933288868899, "learning_rate": 8.510250959513072e-06, "loss": 3.121293640136719, "step": 378900 }, { "epoch": 0.4573139922093726, "learning_rate": 8.509847124045334e-06, "loss": 3.137345886230469, "step": 379000 }, { "epoch": 0.45743465553185525, "learning_rate": 8.509443288577596e-06, "loss": 3.122278747558594, "step": 379100 }, { "epoch": 0.457555318854338, "learning_rate": 8.509039453109856e-06, "loss": 3.1400909423828125, "step": 379200 }, { "epoch": 0.45767598217682065, "learning_rate": 8.508635617642118e-06, "loss": 3.145557861328125, "step": 379300 }, { "epoch": 0.4577966454993033, "learning_rate": 8.50823178217438e-06, "loss": 3.1471456909179687, "step": 379400 }, { "epoch": 0.457917308821786, "learning_rate": 8.507827946706642e-06, "loss": 3.1113134765625, "step": 379500 }, { "epoch": 0.45803797214426867, "learning_rate": 8.507424111238904e-06, "loss": 3.124092712402344, "step": 379600 }, { "epoch": 0.4581586354667514, "learning_rate": 8.507020275771166e-06, "loss": 3.16373046875, "step": 379700 }, { "epoch": 0.45827929878923407, "learning_rate": 8.506616440303426e-06, "loss": 3.09302490234375, "step": 379800 }, { "epoch": 0.45839996211171674, "learning_rate": 8.506212604835688e-06, "loss": 3.1182241821289063, "step": 379900 }, { "epoch": 0.4585206254341994, "learning_rate": 8.505808769367948e-06, "loss": 3.1402423095703127, "step": 380000 }, { "epoch": 0.4586412887566821, "learning_rate": 8.50540493390021e-06, "loss": 3.1161929321289064, "step": 380100 }, { "epoch": 0.4587619520791648, "learning_rate": 8.505001098432472e-06, "loss": 3.1541259765625, "step": 380200 }, { "epoch": 0.4588826154016475, "learning_rate": 8.504597262964734e-06, "loss": 3.129002990722656, "step": 380300 }, { "epoch": 0.45900327872413016, "learning_rate": 8.504193427496996e-06, "loss": 3.118363037109375, "step": 380400 }, { "epoch": 0.45912394204661283, "learning_rate": 8.503789592029258e-06, "loss": 3.14366943359375, "step": 380500 }, { "epoch": 0.4592446053690955, "learning_rate": 8.50338575656152e-06, "loss": 3.1468746948242186, "step": 380600 }, { "epoch": 0.45936526869157823, "learning_rate": 8.50298192109378e-06, "loss": 3.1465908813476564, "step": 380700 }, { "epoch": 0.4594859320140609, "learning_rate": 8.502578085626043e-06, "loss": 3.1310720825195313, "step": 380800 }, { "epoch": 0.4596065953365436, "learning_rate": 8.502174250158305e-06, "loss": 3.1352825927734376, "step": 380900 }, { "epoch": 0.45972725865902625, "learning_rate": 8.501770414690565e-06, "loss": 3.1203341674804688, "step": 381000 }, { "epoch": 0.4598479219815089, "learning_rate": 8.501366579222827e-06, "loss": 3.087215576171875, "step": 381100 }, { "epoch": 0.45996858530399165, "learning_rate": 8.500962743755089e-06, "loss": 3.139811706542969, "step": 381200 }, { "epoch": 0.4600892486264743, "learning_rate": 8.50055890828735e-06, "loss": 3.137640380859375, "step": 381300 }, { "epoch": 0.460209911948957, "learning_rate": 8.500155072819613e-06, "loss": 3.123800964355469, "step": 381400 }, { "epoch": 0.46033057527143967, "learning_rate": 8.499751237351875e-06, "loss": 3.1358523559570313, "step": 381500 }, { "epoch": 0.4604512385939224, "learning_rate": 8.499347401884137e-06, "loss": 3.121767578125, "step": 381600 }, { "epoch": 0.46057190191640507, "learning_rate": 8.498943566416397e-06, "loss": 3.14825927734375, "step": 381700 }, { "epoch": 0.46069256523888774, "learning_rate": 8.498539730948659e-06, "loss": 3.1300338745117187, "step": 381800 }, { "epoch": 0.4608132285613704, "learning_rate": 8.49813589548092e-06, "loss": 3.13264892578125, "step": 381900 }, { "epoch": 0.4609338918838531, "learning_rate": 8.497732060013181e-06, "loss": 3.1357421875, "step": 382000 }, { "epoch": 0.4610545552063358, "learning_rate": 8.497328224545443e-06, "loss": 3.149007568359375, "step": 382100 }, { "epoch": 0.4611752185288185, "learning_rate": 8.496924389077705e-06, "loss": 3.1301812744140625, "step": 382200 }, { "epoch": 0.46129588185130116, "learning_rate": 8.496520553609967e-06, "loss": 3.1490679931640626, "step": 382300 }, { "epoch": 0.46141654517378383, "learning_rate": 8.49611671814223e-06, "loss": 3.1284271240234376, "step": 382400 }, { "epoch": 0.4615372084962665, "learning_rate": 8.49571288267449e-06, "loss": 3.1376217651367186, "step": 382500 }, { "epoch": 0.46165787181874923, "learning_rate": 8.495309047206752e-06, "loss": 3.1286474609375, "step": 382600 }, { "epoch": 0.4617785351412319, "learning_rate": 8.494905211739014e-06, "loss": 3.1434860229492188, "step": 382700 }, { "epoch": 0.4618991984637146, "learning_rate": 8.494501376271275e-06, "loss": 3.1338992309570313, "step": 382800 }, { "epoch": 0.46201986178619725, "learning_rate": 8.494097540803536e-06, "loss": 3.1025015258789064, "step": 382900 }, { "epoch": 0.4621405251086799, "learning_rate": 8.493693705335798e-06, "loss": 3.1459490966796877, "step": 383000 }, { "epoch": 0.46226118843116265, "learning_rate": 8.49328986986806e-06, "loss": 3.106195983886719, "step": 383100 }, { "epoch": 0.4623818517536453, "learning_rate": 8.492886034400322e-06, "loss": 3.121510314941406, "step": 383200 }, { "epoch": 0.462502515076128, "learning_rate": 8.492482198932582e-06, "loss": 3.1088232421875, "step": 383300 }, { "epoch": 0.46262317839861067, "learning_rate": 8.492078363464844e-06, "loss": 3.127908020019531, "step": 383400 }, { "epoch": 0.46274384172109334, "learning_rate": 8.491674527997106e-06, "loss": 3.147369689941406, "step": 383500 }, { "epoch": 0.46286450504357607, "learning_rate": 8.491270692529368e-06, "loss": 3.1268460083007814, "step": 383600 }, { "epoch": 0.46298516836605874, "learning_rate": 8.49086685706163e-06, "loss": 3.145751647949219, "step": 383700 }, { "epoch": 0.4631058316885414, "learning_rate": 8.49046302159389e-06, "loss": 3.1424606323242186, "step": 383800 }, { "epoch": 0.4632264950110241, "learning_rate": 8.490059186126152e-06, "loss": 3.1460671997070313, "step": 383900 }, { "epoch": 0.4633471583335068, "learning_rate": 8.489655350658414e-06, "loss": 3.1438632202148438, "step": 384000 }, { "epoch": 0.4634678216559895, "learning_rate": 8.489251515190674e-06, "loss": 3.144010009765625, "step": 384100 }, { "epoch": 0.46358848497847216, "learning_rate": 8.488847679722936e-06, "loss": 3.1228207397460936, "step": 384200 }, { "epoch": 0.46370914830095483, "learning_rate": 8.488443844255198e-06, "loss": 3.125281982421875, "step": 384300 }, { "epoch": 0.4638298116234375, "learning_rate": 8.48804000878746e-06, "loss": 3.1420132446289064, "step": 384400 }, { "epoch": 0.46395047494592023, "learning_rate": 8.487636173319722e-06, "loss": 3.121570739746094, "step": 384500 }, { "epoch": 0.4640711382684029, "learning_rate": 8.487232337851984e-06, "loss": 3.120580749511719, "step": 384600 }, { "epoch": 0.4641918015908856, "learning_rate": 8.486828502384246e-06, "loss": 3.1439031982421874, "step": 384700 }, { "epoch": 0.46431246491336825, "learning_rate": 8.486424666916507e-06, "loss": 3.1362924194335937, "step": 384800 }, { "epoch": 0.4644331282358509, "learning_rate": 8.486020831448769e-06, "loss": 3.139161376953125, "step": 384900 }, { "epoch": 0.46455379155833365, "learning_rate": 8.485616995981029e-06, "loss": 3.1094711303710936, "step": 385000 }, { "epoch": 0.4646744548808163, "learning_rate": 8.485213160513291e-06, "loss": 3.129660339355469, "step": 385100 }, { "epoch": 0.464795118203299, "learning_rate": 8.484809325045553e-06, "loss": 3.106048278808594, "step": 385200 }, { "epoch": 0.46491578152578167, "learning_rate": 8.484405489577815e-06, "loss": 3.1188922119140625, "step": 385300 }, { "epoch": 0.46503644484826434, "learning_rate": 8.484001654110077e-06, "loss": 3.1234521484375, "step": 385400 }, { "epoch": 0.46515710817074707, "learning_rate": 8.483597818642339e-06, "loss": 3.1120724487304687, "step": 385500 }, { "epoch": 0.46527777149322974, "learning_rate": 8.4831939831746e-06, "loss": 3.1346871948242185, "step": 385600 }, { "epoch": 0.4653984348157124, "learning_rate": 8.482790147706861e-06, "loss": 3.1387060546875, "step": 385700 }, { "epoch": 0.4655190981381951, "learning_rate": 8.482386312239123e-06, "loss": 3.098907165527344, "step": 385800 }, { "epoch": 0.46563976146067776, "learning_rate": 8.481982476771385e-06, "loss": 3.1122482299804686, "step": 385900 }, { "epoch": 0.4657604247831605, "learning_rate": 8.481578641303645e-06, "loss": 3.138643493652344, "step": 386000 }, { "epoch": 0.46588108810564316, "learning_rate": 8.481174805835907e-06, "loss": 3.121631774902344, "step": 386100 }, { "epoch": 0.46600175142812583, "learning_rate": 8.48077097036817e-06, "loss": 3.136925048828125, "step": 386200 }, { "epoch": 0.4661224147506085, "learning_rate": 8.480367134900431e-06, "loss": 3.1138604736328124, "step": 386300 }, { "epoch": 0.4662430780730912, "learning_rate": 8.479963299432693e-06, "loss": 3.134913330078125, "step": 386400 }, { "epoch": 0.4663637413955739, "learning_rate": 8.479559463964955e-06, "loss": 3.1338992309570313, "step": 386500 }, { "epoch": 0.4664844047180566, "learning_rate": 8.479155628497216e-06, "loss": 3.1130938720703125, "step": 386600 }, { "epoch": 0.46660506804053925, "learning_rate": 8.478751793029478e-06, "loss": 3.1238580322265626, "step": 386700 }, { "epoch": 0.4667257313630219, "learning_rate": 8.47834795756174e-06, "loss": 3.153401184082031, "step": 386800 }, { "epoch": 0.46684639468550465, "learning_rate": 8.477944122094e-06, "loss": 3.1112994384765624, "step": 386900 }, { "epoch": 0.4669670580079873, "learning_rate": 8.477540286626262e-06, "loss": 3.1244522094726563, "step": 387000 }, { "epoch": 0.46708772133047, "learning_rate": 8.477136451158524e-06, "loss": 3.143729553222656, "step": 387100 }, { "epoch": 0.46720838465295267, "learning_rate": 8.476732615690786e-06, "loss": 3.0977691650390624, "step": 387200 }, { "epoch": 0.46732904797543534, "learning_rate": 8.476328780223048e-06, "loss": 3.1258074951171877, "step": 387300 }, { "epoch": 0.46744971129791807, "learning_rate": 8.475924944755308e-06, "loss": 3.1042694091796874, "step": 387400 }, { "epoch": 0.46757037462040074, "learning_rate": 8.47552110928757e-06, "loss": 3.14513427734375, "step": 387500 }, { "epoch": 0.4676910379428834, "learning_rate": 8.475117273819832e-06, "loss": 3.1334906005859375, "step": 387600 }, { "epoch": 0.4678117012653661, "learning_rate": 8.474713438352094e-06, "loss": 3.1305191040039064, "step": 387700 }, { "epoch": 0.46793236458784876, "learning_rate": 8.474309602884356e-06, "loss": 3.1091302490234374, "step": 387800 }, { "epoch": 0.4680530279103315, "learning_rate": 8.473905767416616e-06, "loss": 3.148889465332031, "step": 387900 }, { "epoch": 0.46817369123281416, "learning_rate": 8.473501931948878e-06, "loss": 3.1178985595703126, "step": 388000 }, { "epoch": 0.46829435455529683, "learning_rate": 8.47309809648114e-06, "loss": 3.120003967285156, "step": 388100 }, { "epoch": 0.4684150178777795, "learning_rate": 8.4726942610134e-06, "loss": 3.1320068359375, "step": 388200 }, { "epoch": 0.4685356812002622, "learning_rate": 8.472290425545663e-06, "loss": 3.124786376953125, "step": 388300 }, { "epoch": 0.4686563445227449, "learning_rate": 8.471886590077924e-06, "loss": 3.1269940185546874, "step": 388400 }, { "epoch": 0.4687770078452276, "learning_rate": 8.471482754610186e-06, "loss": 3.0979833984375, "step": 388500 }, { "epoch": 0.46889767116771025, "learning_rate": 8.471078919142448e-06, "loss": 3.1111489868164064, "step": 388600 }, { "epoch": 0.4690183344901929, "learning_rate": 8.47067508367471e-06, "loss": 3.138814697265625, "step": 388700 }, { "epoch": 0.4691389978126756, "learning_rate": 8.47027124820697e-06, "loss": 3.097029113769531, "step": 388800 }, { "epoch": 0.4692596611351583, "learning_rate": 8.469867412739233e-06, "loss": 3.122314147949219, "step": 388900 }, { "epoch": 0.469380324457641, "learning_rate": 8.469463577271495e-06, "loss": 3.1029534912109376, "step": 389000 }, { "epoch": 0.46950098778012367, "learning_rate": 8.469059741803755e-06, "loss": 3.1359765625, "step": 389100 }, { "epoch": 0.46962165110260634, "learning_rate": 8.468655906336017e-06, "loss": 3.1164794921875, "step": 389200 }, { "epoch": 0.46974231442508907, "learning_rate": 8.468252070868279e-06, "loss": 3.1202740478515625, "step": 389300 }, { "epoch": 0.46986297774757174, "learning_rate": 8.467848235400541e-06, "loss": 3.095294189453125, "step": 389400 }, { "epoch": 0.4699836410700544, "learning_rate": 8.467444399932803e-06, "loss": 3.11364013671875, "step": 389500 }, { "epoch": 0.4701043043925371, "learning_rate": 8.467040564465065e-06, "loss": 3.1192578125, "step": 389600 }, { "epoch": 0.47022496771501976, "learning_rate": 8.466636728997327e-06, "loss": 3.1293038940429687, "step": 389700 }, { "epoch": 0.4703456310375025, "learning_rate": 8.466232893529587e-06, "loss": 3.1205938720703124, "step": 389800 }, { "epoch": 0.47046629435998516, "learning_rate": 8.465829058061849e-06, "loss": 3.1202767944335936, "step": 389900 }, { "epoch": 0.47058695768246783, "learning_rate": 8.46542522259411e-06, "loss": 3.1283197021484375, "step": 390000 }, { "epoch": 0.4707076210049505, "learning_rate": 8.465021387126371e-06, "loss": 3.10061279296875, "step": 390100 }, { "epoch": 0.4708282843274332, "learning_rate": 8.464617551658633e-06, "loss": 3.137294921875, "step": 390200 }, { "epoch": 0.4709489476499159, "learning_rate": 8.464213716190895e-06, "loss": 3.0898785400390625, "step": 390300 }, { "epoch": 0.4710696109723986, "learning_rate": 8.463809880723157e-06, "loss": 3.1150802612304687, "step": 390400 }, { "epoch": 0.47119027429488125, "learning_rate": 8.46340604525542e-06, "loss": 3.1151358032226564, "step": 390500 }, { "epoch": 0.4713109376173639, "learning_rate": 8.46300220978768e-06, "loss": 3.107939453125, "step": 390600 }, { "epoch": 0.4714316009398466, "learning_rate": 8.462598374319942e-06, "loss": 3.1264968872070313, "step": 390700 }, { "epoch": 0.4715522642623293, "learning_rate": 8.462194538852204e-06, "loss": 3.122178649902344, "step": 390800 }, { "epoch": 0.471672927584812, "learning_rate": 8.461790703384466e-06, "loss": 3.089374694824219, "step": 390900 }, { "epoch": 0.47179359090729467, "learning_rate": 8.461386867916726e-06, "loss": 3.128847961425781, "step": 391000 }, { "epoch": 0.47191425422977734, "learning_rate": 8.460983032448988e-06, "loss": 3.1029425048828125, "step": 391100 }, { "epoch": 0.47203491755226, "learning_rate": 8.46057919698125e-06, "loss": 3.1005255126953126, "step": 391200 }, { "epoch": 0.47215558087474274, "learning_rate": 8.460175361513512e-06, "loss": 3.1312411499023436, "step": 391300 }, { "epoch": 0.4722762441972254, "learning_rate": 8.459771526045774e-06, "loss": 3.1139947509765626, "step": 391400 }, { "epoch": 0.4723969075197081, "learning_rate": 8.459367690578034e-06, "loss": 3.1184735107421875, "step": 391500 }, { "epoch": 0.47251757084219076, "learning_rate": 8.458963855110296e-06, "loss": 3.1278179931640624, "step": 391600 }, { "epoch": 0.47263823416467343, "learning_rate": 8.458560019642558e-06, "loss": 3.0912960815429686, "step": 391700 }, { "epoch": 0.47275889748715616, "learning_rate": 8.45815618417482e-06, "loss": 3.0673068237304686, "step": 391800 }, { "epoch": 0.47287956080963883, "learning_rate": 8.457752348707082e-06, "loss": 3.118819274902344, "step": 391900 }, { "epoch": 0.4730002241321215, "learning_rate": 8.457348513239342e-06, "loss": 3.1085861206054686, "step": 392000 }, { "epoch": 0.4731208874546042, "learning_rate": 8.456944677771604e-06, "loss": 3.1061740112304688, "step": 392100 }, { "epoch": 0.4732415507770869, "learning_rate": 8.456540842303866e-06, "loss": 3.105338134765625, "step": 392200 }, { "epoch": 0.4733622140995696, "learning_rate": 8.456137006836127e-06, "loss": 3.093358154296875, "step": 392300 }, { "epoch": 0.47348287742205225, "learning_rate": 8.455733171368389e-06, "loss": 3.1238018798828127, "step": 392400 }, { "epoch": 0.4736035407445349, "learning_rate": 8.45532933590065e-06, "loss": 3.1033029174804687, "step": 392500 }, { "epoch": 0.4737242040670176, "learning_rate": 8.454925500432913e-06, "loss": 3.1281802368164064, "step": 392600 }, { "epoch": 0.4738448673895003, "learning_rate": 8.454521664965174e-06, "loss": 3.1319540405273436, "step": 392700 }, { "epoch": 0.473965530711983, "learning_rate": 8.454117829497436e-06, "loss": 3.1147210693359373, "step": 392800 }, { "epoch": 0.47408619403446567, "learning_rate": 8.453713994029697e-06, "loss": 3.1519085693359377, "step": 392900 }, { "epoch": 0.47420685735694834, "learning_rate": 8.453310158561959e-06, "loss": 3.100499267578125, "step": 393000 }, { "epoch": 0.474327520679431, "learning_rate": 8.45290632309422e-06, "loss": 3.1120028686523438, "step": 393100 }, { "epoch": 0.47444818400191374, "learning_rate": 8.452502487626481e-06, "loss": 3.1080838012695313, "step": 393200 }, { "epoch": 0.4745688473243964, "learning_rate": 8.452098652158743e-06, "loss": 3.1241705322265627, "step": 393300 }, { "epoch": 0.4746895106468791, "learning_rate": 8.451694816691005e-06, "loss": 3.1080181884765623, "step": 393400 }, { "epoch": 0.47481017396936176, "learning_rate": 8.451290981223267e-06, "loss": 3.0980453491210938, "step": 393500 }, { "epoch": 0.47493083729184443, "learning_rate": 8.450887145755529e-06, "loss": 3.0788613891601564, "step": 393600 }, { "epoch": 0.47505150061432716, "learning_rate": 8.450483310287791e-06, "loss": 3.136014099121094, "step": 393700 }, { "epoch": 0.47517216393680983, "learning_rate": 8.450079474820053e-06, "loss": 3.120100402832031, "step": 393800 }, { "epoch": 0.4752928272592925, "learning_rate": 8.449675639352313e-06, "loss": 3.1098016357421874, "step": 393900 }, { "epoch": 0.4754134905817752, "learning_rate": 8.449271803884575e-06, "loss": 3.109454345703125, "step": 394000 }, { "epoch": 0.47553415390425785, "learning_rate": 8.448867968416835e-06, "loss": 3.1173699951171874, "step": 394100 }, { "epoch": 0.4756548172267406, "learning_rate": 8.448464132949097e-06, "loss": 3.0544357299804688, "step": 394200 }, { "epoch": 0.47577548054922325, "learning_rate": 8.44806029748136e-06, "loss": 3.098197021484375, "step": 394300 }, { "epoch": 0.4758961438717059, "learning_rate": 8.447656462013621e-06, "loss": 3.088961486816406, "step": 394400 }, { "epoch": 0.4760168071941886, "learning_rate": 8.447252626545883e-06, "loss": 3.0855181884765623, "step": 394500 }, { "epoch": 0.4761374705166713, "learning_rate": 8.446848791078145e-06, "loss": 3.1152850341796876, "step": 394600 }, { "epoch": 0.476258133839154, "learning_rate": 8.446444955610406e-06, "loss": 3.1350958251953127, "step": 394700 }, { "epoch": 0.47637879716163667, "learning_rate": 8.446041120142668e-06, "loss": 3.1023828125, "step": 394800 }, { "epoch": 0.47649946048411934, "learning_rate": 8.44563728467493e-06, "loss": 3.102723388671875, "step": 394900 }, { "epoch": 0.476620123806602, "learning_rate": 8.445233449207192e-06, "loss": 3.107860412597656, "step": 395000 }, { "epoch": 0.47674078712908474, "learning_rate": 8.444829613739452e-06, "loss": 3.10630859375, "step": 395100 }, { "epoch": 0.4768614504515674, "learning_rate": 8.444425778271714e-06, "loss": 3.128507080078125, "step": 395200 }, { "epoch": 0.4769821137740501, "learning_rate": 8.444021942803976e-06, "loss": 3.0866189575195313, "step": 395300 }, { "epoch": 0.47710277709653276, "learning_rate": 8.443618107336238e-06, "loss": 3.0778262329101564, "step": 395400 }, { "epoch": 0.47722344041901543, "learning_rate": 8.443214271868498e-06, "loss": 3.113604736328125, "step": 395500 }, { "epoch": 0.47734410374149816, "learning_rate": 8.44281043640076e-06, "loss": 3.0987164306640627, "step": 395600 }, { "epoch": 0.47746476706398083, "learning_rate": 8.442406600933022e-06, "loss": 3.1265911865234375, "step": 395700 }, { "epoch": 0.4775854303864635, "learning_rate": 8.442002765465284e-06, "loss": 3.0987625122070312, "step": 395800 }, { "epoch": 0.4777060937089462, "learning_rate": 8.441598929997546e-06, "loss": 3.086417236328125, "step": 395900 }, { "epoch": 0.47782675703142885, "learning_rate": 8.441195094529806e-06, "loss": 3.111502380371094, "step": 396000 }, { "epoch": 0.4779474203539116, "learning_rate": 8.440791259062068e-06, "loss": 3.0859475708007813, "step": 396100 }, { "epoch": 0.47806808367639425, "learning_rate": 8.44038742359433e-06, "loss": 3.0990335083007814, "step": 396200 }, { "epoch": 0.4781887469988769, "learning_rate": 8.439983588126592e-06, "loss": 3.116259765625, "step": 396300 }, { "epoch": 0.4783094103213596, "learning_rate": 8.439579752658853e-06, "loss": 3.110775146484375, "step": 396400 }, { "epoch": 0.47843007364384227, "learning_rate": 8.439175917191115e-06, "loss": 3.0855258178710936, "step": 396500 }, { "epoch": 0.478550736966325, "learning_rate": 8.438772081723377e-06, "loss": 3.121785888671875, "step": 396600 }, { "epoch": 0.47867140028880767, "learning_rate": 8.438368246255639e-06, "loss": 3.10590087890625, "step": 396700 }, { "epoch": 0.47879206361129034, "learning_rate": 8.4379644107879e-06, "loss": 3.128548278808594, "step": 396800 }, { "epoch": 0.478912726933773, "learning_rate": 8.437560575320163e-06, "loss": 3.0855377197265623, "step": 396900 }, { "epoch": 0.47903339025625574, "learning_rate": 8.437156739852423e-06, "loss": 3.0881637573242187, "step": 397000 }, { "epoch": 0.4791540535787384, "learning_rate": 8.436752904384685e-06, "loss": 3.0910745239257813, "step": 397100 }, { "epoch": 0.4792747169012211, "learning_rate": 8.436349068916945e-06, "loss": 3.1228036499023437, "step": 397200 }, { "epoch": 0.47939538022370376, "learning_rate": 8.435945233449207e-06, "loss": 3.081323547363281, "step": 397300 }, { "epoch": 0.47951604354618643, "learning_rate": 8.435541397981469e-06, "loss": 3.1056808471679687, "step": 397400 }, { "epoch": 0.47963670686866916, "learning_rate": 8.435137562513731e-06, "loss": 3.089926452636719, "step": 397500 }, { "epoch": 0.47975737019115183, "learning_rate": 8.434733727045993e-06, "loss": 3.0946749877929687, "step": 397600 }, { "epoch": 0.4798780335136345, "learning_rate": 8.434329891578255e-06, "loss": 3.087687683105469, "step": 397700 }, { "epoch": 0.4799986968361172, "learning_rate": 8.433926056110517e-06, "loss": 3.120843505859375, "step": 397800 }, { "epoch": 0.48011936015859985, "learning_rate": 8.433522220642777e-06, "loss": 3.1099539184570313, "step": 397900 }, { "epoch": 0.4802400234810826, "learning_rate": 8.43311838517504e-06, "loss": 3.11024658203125, "step": 398000 }, { "epoch": 0.48036068680356525, "learning_rate": 8.432714549707301e-06, "loss": 3.09318115234375, "step": 398100 }, { "epoch": 0.4804813501260479, "learning_rate": 8.432310714239562e-06, "loss": 3.1173333740234375, "step": 398200 }, { "epoch": 0.4806020134485306, "learning_rate": 8.431906878771823e-06, "loss": 3.097176513671875, "step": 398300 }, { "epoch": 0.48072267677101327, "learning_rate": 8.431503043304085e-06, "loss": 3.1012893676757813, "step": 398400 }, { "epoch": 0.480843340093496, "learning_rate": 8.431099207836347e-06, "loss": 3.1367181396484374, "step": 398500 }, { "epoch": 0.48096400341597867, "learning_rate": 8.43069537236861e-06, "loss": 3.0885751342773435, "step": 398600 }, { "epoch": 0.48108466673846134, "learning_rate": 8.430291536900871e-06, "loss": 3.10408447265625, "step": 398700 }, { "epoch": 0.481205330060944, "learning_rate": 8.429887701433132e-06, "loss": 3.1087435913085937, "step": 398800 }, { "epoch": 0.4813259933834267, "learning_rate": 8.429483865965394e-06, "loss": 3.0896182250976563, "step": 398900 }, { "epoch": 0.4814466567059094, "learning_rate": 8.429080030497656e-06, "loss": 3.0709848022460937, "step": 399000 }, { "epoch": 0.4815673200283921, "learning_rate": 8.428676195029916e-06, "loss": 3.0725668334960936, "step": 399100 }, { "epoch": 0.48168798335087476, "learning_rate": 8.428272359562178e-06, "loss": 3.0570263671875, "step": 399200 }, { "epoch": 0.48180864667335743, "learning_rate": 8.42786852409444e-06, "loss": 3.1007846069335936, "step": 399300 }, { "epoch": 0.4819293099958401, "learning_rate": 8.427464688626702e-06, "loss": 3.06720703125, "step": 399400 }, { "epoch": 0.48204997331832283, "learning_rate": 8.427060853158964e-06, "loss": 3.104925231933594, "step": 399500 }, { "epoch": 0.4821706366408055, "learning_rate": 8.426657017691224e-06, "loss": 3.0758880615234374, "step": 399600 }, { "epoch": 0.4822912999632882, "learning_rate": 8.426253182223486e-06, "loss": 3.1065664672851563, "step": 399700 }, { "epoch": 0.48241196328577085, "learning_rate": 8.425849346755748e-06, "loss": 3.1080535888671874, "step": 399800 }, { "epoch": 0.4825326266082536, "learning_rate": 8.42544551128801e-06, "loss": 3.129813232421875, "step": 399900 }, { "epoch": 0.48265328993073625, "learning_rate": 8.425041675820272e-06, "loss": 3.1167398071289063, "step": 400000 }, { "epoch": 0.4827739532532189, "learning_rate": 8.424637840352532e-06, "loss": 3.1018927001953127, "step": 400100 }, { "epoch": 0.4828946165757016, "learning_rate": 8.424234004884794e-06, "loss": 3.0845901489257814, "step": 400200 }, { "epoch": 0.48301527989818427, "learning_rate": 8.423830169417056e-06, "loss": 3.107624206542969, "step": 400300 }, { "epoch": 0.483135943220667, "learning_rate": 8.423426333949317e-06, "loss": 3.0834930419921873, "step": 400400 }, { "epoch": 0.48325660654314967, "learning_rate": 8.423022498481579e-06, "loss": 3.073968505859375, "step": 400500 }, { "epoch": 0.48337726986563234, "learning_rate": 8.42261866301384e-06, "loss": 3.07536376953125, "step": 400600 }, { "epoch": 0.483497933188115, "learning_rate": 8.422214827546103e-06, "loss": 3.0725445556640625, "step": 400700 }, { "epoch": 0.4836185965105977, "learning_rate": 8.421810992078365e-06, "loss": 3.094947509765625, "step": 400800 }, { "epoch": 0.4837392598330804, "learning_rate": 8.421407156610627e-06, "loss": 3.109068603515625, "step": 400900 }, { "epoch": 0.4838599231555631, "learning_rate": 8.421003321142887e-06, "loss": 3.091180419921875, "step": 401000 }, { "epoch": 0.48398058647804576, "learning_rate": 8.420599485675149e-06, "loss": 3.1118594360351564, "step": 401100 }, { "epoch": 0.48410124980052843, "learning_rate": 8.42019565020741e-06, "loss": 3.098489990234375, "step": 401200 }, { "epoch": 0.4842219131230111, "learning_rate": 8.419791814739671e-06, "loss": 3.0923114013671875, "step": 401300 }, { "epoch": 0.48434257644549383, "learning_rate": 8.419387979271933e-06, "loss": 3.101041564941406, "step": 401400 }, { "epoch": 0.4844632397679765, "learning_rate": 8.418984143804195e-06, "loss": 3.082236633300781, "step": 401500 }, { "epoch": 0.4845839030904592, "learning_rate": 8.418580308336457e-06, "loss": 3.083673400878906, "step": 401600 }, { "epoch": 0.48470456641294185, "learning_rate": 8.418176472868719e-06, "loss": 3.130315246582031, "step": 401700 }, { "epoch": 0.4848252297354245, "learning_rate": 8.417772637400981e-06, "loss": 3.1092239379882813, "step": 401800 }, { "epoch": 0.48494589305790725, "learning_rate": 8.417368801933243e-06, "loss": 3.09388671875, "step": 401900 }, { "epoch": 0.4850665563803899, "learning_rate": 8.416964966465503e-06, "loss": 3.1032403564453124, "step": 402000 }, { "epoch": 0.4851872197028726, "learning_rate": 8.416561130997765e-06, "loss": 3.1174456787109377, "step": 402100 }, { "epoch": 0.48530788302535527, "learning_rate": 8.416157295530026e-06, "loss": 3.0884149169921873, "step": 402200 }, { "epoch": 0.485428546347838, "learning_rate": 8.415753460062288e-06, "loss": 3.1053207397460936, "step": 402300 }, { "epoch": 0.48554920967032067, "learning_rate": 8.41534962459455e-06, "loss": 3.118140869140625, "step": 402400 }, { "epoch": 0.48566987299280334, "learning_rate": 8.414945789126811e-06, "loss": 3.0746533203125, "step": 402500 }, { "epoch": 0.485790536315286, "learning_rate": 8.414541953659073e-06, "loss": 3.0938232421875, "step": 402600 }, { "epoch": 0.4859111996377687, "learning_rate": 8.414138118191335e-06, "loss": 3.070401611328125, "step": 402700 }, { "epoch": 0.4860318629602514, "learning_rate": 8.413734282723597e-06, "loss": 3.123790588378906, "step": 402800 }, { "epoch": 0.4861525262827341, "learning_rate": 8.413330447255858e-06, "loss": 3.1210443115234376, "step": 402900 }, { "epoch": 0.48627318960521676, "learning_rate": 8.41292661178812e-06, "loss": 3.092182922363281, "step": 403000 }, { "epoch": 0.48639385292769943, "learning_rate": 8.412522776320382e-06, "loss": 3.0950628662109376, "step": 403100 }, { "epoch": 0.4865145162501821, "learning_rate": 8.412118940852642e-06, "loss": 3.0670315551757814, "step": 403200 }, { "epoch": 0.48663517957266483, "learning_rate": 8.411715105384904e-06, "loss": 3.098896789550781, "step": 403300 }, { "epoch": 0.4867558428951475, "learning_rate": 8.411311269917166e-06, "loss": 3.085815734863281, "step": 403400 }, { "epoch": 0.4868765062176302, "learning_rate": 8.410907434449428e-06, "loss": 3.1057781982421875, "step": 403500 }, { "epoch": 0.48699716954011285, "learning_rate": 8.41050359898169e-06, "loss": 3.0981674194335938, "step": 403600 }, { "epoch": 0.4871178328625955, "learning_rate": 8.41009976351395e-06, "loss": 3.105654296875, "step": 403700 }, { "epoch": 0.48723849618507825, "learning_rate": 8.409695928046212e-06, "loss": 3.088855895996094, "step": 403800 }, { "epoch": 0.4873591595075609, "learning_rate": 8.409292092578474e-06, "loss": 3.0955364990234373, "step": 403900 }, { "epoch": 0.4874798228300436, "learning_rate": 8.408888257110736e-06, "loss": 3.08198974609375, "step": 404000 }, { "epoch": 0.48760048615252627, "learning_rate": 8.408484421642996e-06, "loss": 3.10002685546875, "step": 404100 }, { "epoch": 0.48772114947500894, "learning_rate": 8.408080586175258e-06, "loss": 3.08379638671875, "step": 404200 }, { "epoch": 0.48784181279749167, "learning_rate": 8.40767675070752e-06, "loss": 3.065028076171875, "step": 404300 }, { "epoch": 0.48796247611997434, "learning_rate": 8.407272915239782e-06, "loss": 3.075791015625, "step": 404400 }, { "epoch": 0.488083139442457, "learning_rate": 8.406869079772043e-06, "loss": 3.1015188598632815, "step": 404500 }, { "epoch": 0.4882038027649397, "learning_rate": 8.406465244304305e-06, "loss": 3.0968704223632812, "step": 404600 }, { "epoch": 0.48832446608742236, "learning_rate": 8.406061408836567e-06, "loss": 3.0848504638671876, "step": 404700 }, { "epoch": 0.4884451294099051, "learning_rate": 8.405657573368829e-06, "loss": 3.0905316162109373, "step": 404800 }, { "epoch": 0.48856579273238776, "learning_rate": 8.40525373790109e-06, "loss": 3.1199295043945314, "step": 404900 }, { "epoch": 0.48868645605487043, "learning_rate": 8.404849902433353e-06, "loss": 3.109422302246094, "step": 405000 }, { "epoch": 0.4888071193773531, "learning_rate": 8.404446066965613e-06, "loss": 3.0794296264648438, "step": 405100 }, { "epoch": 0.48892778269983583, "learning_rate": 8.404042231497875e-06, "loss": 3.09427490234375, "step": 405200 }, { "epoch": 0.4890484460223185, "learning_rate": 8.403638396030135e-06, "loss": 3.0705914306640625, "step": 405300 }, { "epoch": 0.4891691093448012, "learning_rate": 8.403234560562397e-06, "loss": 3.1210516357421874, "step": 405400 }, { "epoch": 0.48928977266728385, "learning_rate": 8.402830725094659e-06, "loss": 3.0909454345703127, "step": 405500 }, { "epoch": 0.4894104359897665, "learning_rate": 8.402426889626921e-06, "loss": 3.084837646484375, "step": 405600 }, { "epoch": 0.48953109931224925, "learning_rate": 8.402023054159183e-06, "loss": 3.0785919189453126, "step": 405700 }, { "epoch": 0.4896517626347319, "learning_rate": 8.401619218691445e-06, "loss": 3.081869812011719, "step": 405800 }, { "epoch": 0.4897724259572146, "learning_rate": 8.401215383223707e-06, "loss": 3.103351745605469, "step": 405900 }, { "epoch": 0.48989308927969727, "learning_rate": 8.400811547755969e-06, "loss": 3.079375, "step": 406000 }, { "epoch": 0.49001375260217994, "learning_rate": 8.40040771228823e-06, "loss": 3.08417724609375, "step": 406100 }, { "epoch": 0.49013441592466267, "learning_rate": 8.400003876820491e-06, "loss": 3.088600769042969, "step": 406200 }, { "epoch": 0.49025507924714534, "learning_rate": 8.399600041352752e-06, "loss": 3.0954666137695312, "step": 406300 }, { "epoch": 0.490375742569628, "learning_rate": 8.399196205885014e-06, "loss": 3.1070513916015625, "step": 406400 }, { "epoch": 0.4904964058921107, "learning_rate": 8.398792370417276e-06, "loss": 3.06857666015625, "step": 406500 }, { "epoch": 0.49061706921459336, "learning_rate": 8.398388534949538e-06, "loss": 3.0771078491210937, "step": 406600 }, { "epoch": 0.4907377325370761, "learning_rate": 8.3979846994818e-06, "loss": 3.0796969604492186, "step": 406700 }, { "epoch": 0.49085839585955876, "learning_rate": 8.397580864014061e-06, "loss": 3.0720809936523437, "step": 406800 }, { "epoch": 0.49097905918204143, "learning_rate": 8.397177028546323e-06, "loss": 3.0769488525390627, "step": 406900 }, { "epoch": 0.4910997225045241, "learning_rate": 8.396773193078584e-06, "loss": 3.0817401123046877, "step": 407000 }, { "epoch": 0.4912203858270068, "learning_rate": 8.396369357610846e-06, "loss": 3.0994720458984375, "step": 407100 }, { "epoch": 0.4913410491494895, "learning_rate": 8.395965522143108e-06, "loss": 3.0987261962890624, "step": 407200 }, { "epoch": 0.4914617124719722, "learning_rate": 8.395561686675368e-06, "loss": 3.086059265136719, "step": 407300 }, { "epoch": 0.49158237579445485, "learning_rate": 8.39515785120763e-06, "loss": 3.09379638671875, "step": 407400 }, { "epoch": 0.4917030391169375, "learning_rate": 8.394754015739892e-06, "loss": 3.0986920166015626, "step": 407500 }, { "epoch": 0.49182370243942025, "learning_rate": 8.394350180272154e-06, "loss": 3.066160888671875, "step": 407600 }, { "epoch": 0.4919443657619029, "learning_rate": 8.393946344804416e-06, "loss": 3.07545654296875, "step": 407700 }, { "epoch": 0.4920650290843856, "learning_rate": 8.393542509336676e-06, "loss": 3.1040966796875, "step": 407800 }, { "epoch": 0.49218569240686827, "learning_rate": 8.393138673868938e-06, "loss": 3.0473764038085935, "step": 407900 }, { "epoch": 0.49230635572935094, "learning_rate": 8.3927348384012e-06, "loss": 3.1065716552734375, "step": 408000 }, { "epoch": 0.49242701905183367, "learning_rate": 8.392331002933462e-06, "loss": 3.0778955078125, "step": 408100 }, { "epoch": 0.49254768237431634, "learning_rate": 8.391927167465722e-06, "loss": 3.090491943359375, "step": 408200 }, { "epoch": 0.492668345696799, "learning_rate": 8.391523331997984e-06, "loss": 3.093789367675781, "step": 408300 }, { "epoch": 0.4927890090192817, "learning_rate": 8.391119496530246e-06, "loss": 3.0637112426757813, "step": 408400 }, { "epoch": 0.49290967234176436, "learning_rate": 8.390715661062508e-06, "loss": 3.0946466064453126, "step": 408500 }, { "epoch": 0.4930303356642471, "learning_rate": 8.390311825594769e-06, "loss": 3.0925286865234374, "step": 408600 }, { "epoch": 0.49315099898672976, "learning_rate": 8.38990799012703e-06, "loss": 3.098787841796875, "step": 408700 }, { "epoch": 0.49327166230921243, "learning_rate": 8.389504154659293e-06, "loss": 3.0761318969726563, "step": 408800 }, { "epoch": 0.4933923256316951, "learning_rate": 8.389100319191555e-06, "loss": 3.078929748535156, "step": 408900 }, { "epoch": 0.4935129889541778, "learning_rate": 8.388696483723817e-06, "loss": 3.0839797973632814, "step": 409000 }, { "epoch": 0.4936336522766605, "learning_rate": 8.388292648256079e-06, "loss": 3.096500244140625, "step": 409100 }, { "epoch": 0.4937543155991432, "learning_rate": 8.387888812788339e-06, "loss": 3.0792950439453124, "step": 409200 }, { "epoch": 0.49387497892162585, "learning_rate": 8.387484977320601e-06, "loss": 3.0995574951171876, "step": 409300 }, { "epoch": 0.4939956422441085, "learning_rate": 8.387081141852861e-06, "loss": 3.1124093627929685, "step": 409400 }, { "epoch": 0.4941163055665912, "learning_rate": 8.386677306385123e-06, "loss": 3.08474853515625, "step": 409500 }, { "epoch": 0.4942369688890739, "learning_rate": 8.386273470917385e-06, "loss": 3.073335876464844, "step": 409600 }, { "epoch": 0.4943576322115566, "learning_rate": 8.385869635449647e-06, "loss": 3.0866018676757814, "step": 409700 }, { "epoch": 0.49447829553403927, "learning_rate": 8.385465799981909e-06, "loss": 3.085537109375, "step": 409800 }, { "epoch": 0.49459895885652194, "learning_rate": 8.385061964514171e-06, "loss": 3.088872375488281, "step": 409900 }, { "epoch": 0.49471962217900467, "learning_rate": 8.384658129046433e-06, "loss": 3.09466064453125, "step": 410000 }, { "epoch": 0.49484028550148734, "learning_rate": 8.384254293578693e-06, "loss": 3.094207763671875, "step": 410100 }, { "epoch": 0.49496094882397, "learning_rate": 8.383850458110955e-06, "loss": 3.102781066894531, "step": 410200 }, { "epoch": 0.4950816121464527, "learning_rate": 8.383446622643217e-06, "loss": 3.0413330078125, "step": 410300 }, { "epoch": 0.49520227546893536, "learning_rate": 8.383042787175478e-06, "loss": 3.0440472412109374, "step": 410400 }, { "epoch": 0.4953229387914181, "learning_rate": 8.38263895170774e-06, "loss": 3.06772705078125, "step": 410500 }, { "epoch": 0.49544360211390076, "learning_rate": 8.382235116240002e-06, "loss": 3.064564208984375, "step": 410600 }, { "epoch": 0.49556426543638343, "learning_rate": 8.381831280772264e-06, "loss": 3.0978408813476563, "step": 410700 }, { "epoch": 0.4956849287588661, "learning_rate": 8.381427445304526e-06, "loss": 3.099930419921875, "step": 410800 }, { "epoch": 0.4958055920813488, "learning_rate": 8.381023609836788e-06, "loss": 3.078155212402344, "step": 410900 }, { "epoch": 0.4959262554038315, "learning_rate": 8.380619774369048e-06, "loss": 3.081851806640625, "step": 411000 }, { "epoch": 0.4960469187263142, "learning_rate": 8.38021593890131e-06, "loss": 3.0806903076171874, "step": 411100 }, { "epoch": 0.49616758204879685, "learning_rate": 8.379812103433572e-06, "loss": 3.0570693969726563, "step": 411200 }, { "epoch": 0.4962882453712795, "learning_rate": 8.379408267965832e-06, "loss": 3.095123596191406, "step": 411300 }, { "epoch": 0.4964089086937622, "learning_rate": 8.379004432498094e-06, "loss": 3.0806570434570313, "step": 411400 }, { "epoch": 0.4965295720162449, "learning_rate": 8.378600597030356e-06, "loss": 3.0630374145507813, "step": 411500 }, { "epoch": 0.4966502353387276, "learning_rate": 8.378196761562618e-06, "loss": 3.0827978515625, "step": 411600 }, { "epoch": 0.49677089866121027, "learning_rate": 8.37779292609488e-06, "loss": 3.0606640625, "step": 411700 }, { "epoch": 0.49689156198369294, "learning_rate": 8.377389090627142e-06, "loss": 3.060072021484375, "step": 411800 }, { "epoch": 0.4970122253061756, "learning_rate": 8.376985255159402e-06, "loss": 3.080679931640625, "step": 411900 }, { "epoch": 0.49713288862865834, "learning_rate": 8.376581419691664e-06, "loss": 3.0780239868164063, "step": 412000 }, { "epoch": 0.497253551951141, "learning_rate": 8.376177584223926e-06, "loss": 3.085160827636719, "step": 412100 }, { "epoch": 0.4973742152736237, "learning_rate": 8.375773748756188e-06, "loss": 3.051485595703125, "step": 412200 }, { "epoch": 0.49749487859610636, "learning_rate": 8.375369913288449e-06, "loss": 3.07180908203125, "step": 412300 }, { "epoch": 0.49761554191858903, "learning_rate": 8.37496607782071e-06, "loss": 3.087249450683594, "step": 412400 }, { "epoch": 0.49773620524107176, "learning_rate": 8.374562242352972e-06, "loss": 3.12490234375, "step": 412500 }, { "epoch": 0.49785686856355443, "learning_rate": 8.374158406885234e-06, "loss": 3.0543276977539064, "step": 412600 }, { "epoch": 0.4979775318860371, "learning_rate": 8.373754571417495e-06, "loss": 3.075504150390625, "step": 412700 }, { "epoch": 0.4980981952085198, "learning_rate": 8.373350735949757e-06, "loss": 3.07824462890625, "step": 412800 }, { "epoch": 0.4982188585310025, "learning_rate": 8.372946900482019e-06, "loss": 3.074071960449219, "step": 412900 }, { "epoch": 0.4983395218534852, "learning_rate": 8.37254306501428e-06, "loss": 3.067923889160156, "step": 413000 }, { "epoch": 0.49846018517596785, "learning_rate": 8.372139229546543e-06, "loss": 3.08997314453125, "step": 413100 }, { "epoch": 0.4985808484984505, "learning_rate": 8.371735394078803e-06, "loss": 3.0839306640625, "step": 413200 }, { "epoch": 0.4987015118209332, "learning_rate": 8.371331558611065e-06, "loss": 3.098357849121094, "step": 413300 }, { "epoch": 0.4988221751434159, "learning_rate": 8.370927723143327e-06, "loss": 3.1040664672851563, "step": 413400 }, { "epoch": 0.4989428384658986, "learning_rate": 8.370523887675587e-06, "loss": 3.033949890136719, "step": 413500 }, { "epoch": 0.49906350178838127, "learning_rate": 8.37012005220785e-06, "loss": 3.0517706298828124, "step": 413600 }, { "epoch": 0.49918416511086394, "learning_rate": 8.369716216740111e-06, "loss": 3.0464508056640627, "step": 413700 }, { "epoch": 0.4993048284333466, "learning_rate": 8.369312381272373e-06, "loss": 3.0998956298828126, "step": 413800 }, { "epoch": 0.49942549175582934, "learning_rate": 8.368908545804635e-06, "loss": 3.0913955688476564, "step": 413900 }, { "epoch": 0.499546155078312, "learning_rate": 8.368504710336897e-06, "loss": 3.069590759277344, "step": 414000 }, { "epoch": 0.4996668184007947, "learning_rate": 8.368100874869159e-06, "loss": 3.06601806640625, "step": 414100 }, { "epoch": 0.49978748172327736, "learning_rate": 8.36769703940142e-06, "loss": 3.0971914672851564, "step": 414200 }, { "epoch": 0.49990814504576003, "learning_rate": 8.367293203933681e-06, "loss": 3.067413635253906, "step": 414300 }, { "epoch": 0.5000288083682427, "learning_rate": 8.366889368465942e-06, "loss": 3.041134948730469, "step": 414400 }, { "epoch": 0.5001494716907254, "learning_rate": 8.366485532998204e-06, "loss": 3.0805117797851564, "step": 414500 }, { "epoch": 0.5002701350132082, "learning_rate": 8.366081697530466e-06, "loss": 3.063617858886719, "step": 414600 }, { "epoch": 0.5003907983356908, "learning_rate": 8.365677862062728e-06, "loss": 3.0628564453125, "step": 414700 }, { "epoch": 0.5005114616581735, "learning_rate": 8.36527402659499e-06, "loss": 3.105867614746094, "step": 414800 }, { "epoch": 0.5006321249806561, "learning_rate": 8.364870191127252e-06, "loss": 3.0685870361328127, "step": 414900 }, { "epoch": 0.5007527883031389, "learning_rate": 8.364466355659514e-06, "loss": 3.044700012207031, "step": 415000 }, { "epoch": 0.5008734516256216, "learning_rate": 8.364062520191774e-06, "loss": 3.0534841918945315, "step": 415100 }, { "epoch": 0.5009941149481042, "learning_rate": 8.363658684724036e-06, "loss": 3.0662347412109376, "step": 415200 }, { "epoch": 0.5011147782705869, "learning_rate": 8.363254849256298e-06, "loss": 3.0634332275390626, "step": 415300 }, { "epoch": 0.5012354415930695, "learning_rate": 8.362851013788558e-06, "loss": 3.0582424926757814, "step": 415400 }, { "epoch": 0.5013561049155523, "learning_rate": 8.36244717832082e-06, "loss": 3.0725778198242186, "step": 415500 }, { "epoch": 0.501476768238035, "learning_rate": 8.362043342853082e-06, "loss": 3.06215087890625, "step": 415600 }, { "epoch": 0.5015974315605176, "learning_rate": 8.361639507385344e-06, "loss": 3.06943603515625, "step": 415700 }, { "epoch": 0.5017180948830003, "learning_rate": 8.361235671917606e-06, "loss": 3.093991394042969, "step": 415800 }, { "epoch": 0.501838758205483, "learning_rate": 8.360831836449866e-06, "loss": 3.05564208984375, "step": 415900 }, { "epoch": 0.5019594215279657, "learning_rate": 8.360428000982128e-06, "loss": 3.0717501831054688, "step": 416000 }, { "epoch": 0.5020800848504484, "learning_rate": 8.36002416551439e-06, "loss": 3.0618905639648437, "step": 416100 }, { "epoch": 0.502200748172931, "learning_rate": 8.359620330046652e-06, "loss": 3.0480221557617186, "step": 416200 }, { "epoch": 0.5023214114954138, "learning_rate": 8.359216494578913e-06, "loss": 3.064105224609375, "step": 416300 }, { "epoch": 0.5024420748178964, "learning_rate": 8.358812659111175e-06, "loss": 3.068736267089844, "step": 416400 }, { "epoch": 0.5025627381403791, "learning_rate": 8.358408823643437e-06, "loss": 3.067481689453125, "step": 416500 }, { "epoch": 0.5026834014628618, "learning_rate": 8.358004988175699e-06, "loss": 3.083235778808594, "step": 416600 }, { "epoch": 0.5028040647853445, "learning_rate": 8.357601152707959e-06, "loss": 3.0538290405273436, "step": 416700 }, { "epoch": 0.5029247281078272, "learning_rate": 8.35719731724022e-06, "loss": 3.0361834716796876, "step": 416800 }, { "epoch": 0.5030453914303098, "learning_rate": 8.356793481772483e-06, "loss": 3.0473150634765624, "step": 416900 }, { "epoch": 0.5031660547527925, "learning_rate": 8.356389646304745e-06, "loss": 3.063091125488281, "step": 417000 }, { "epoch": 0.5032867180752753, "learning_rate": 8.355985810837007e-06, "loss": 3.0621282958984377, "step": 417100 }, { "epoch": 0.5034073813977579, "learning_rate": 8.355581975369269e-06, "loss": 3.0812948608398436, "step": 417200 }, { "epoch": 0.5035280447202406, "learning_rate": 8.355178139901529e-06, "loss": 3.0475759887695313, "step": 417300 }, { "epoch": 0.5036487080427232, "learning_rate": 8.354774304433791e-06, "loss": 3.07255859375, "step": 417400 }, { "epoch": 0.5037693713652059, "learning_rate": 8.354370468966053e-06, "loss": 3.0646743774414062, "step": 417500 }, { "epoch": 0.5038900346876887, "learning_rate": 8.353966633498313e-06, "loss": 3.08345703125, "step": 417600 }, { "epoch": 0.5040106980101713, "learning_rate": 8.353562798030575e-06, "loss": 3.0557269287109374, "step": 417700 }, { "epoch": 0.504131361332654, "learning_rate": 8.353158962562837e-06, "loss": 3.0752493286132814, "step": 417800 }, { "epoch": 0.5042520246551366, "learning_rate": 8.3527551270951e-06, "loss": 3.0719833374023438, "step": 417900 }, { "epoch": 0.5043726879776194, "learning_rate": 8.352351291627361e-06, "loss": 3.0604779052734377, "step": 418000 }, { "epoch": 0.5044933513001021, "learning_rate": 8.351947456159623e-06, "loss": 3.07777587890625, "step": 418100 }, { "epoch": 0.5046140146225847, "learning_rate": 8.351543620691883e-06, "loss": 3.079162902832031, "step": 418200 }, { "epoch": 0.5047346779450674, "learning_rate": 8.351139785224145e-06, "loss": 3.0609991455078127, "step": 418300 }, { "epoch": 0.50485534126755, "learning_rate": 8.350735949756407e-06, "loss": 3.061528625488281, "step": 418400 }, { "epoch": 0.5049760045900328, "learning_rate": 8.350332114288668e-06, "loss": 3.083462829589844, "step": 418500 }, { "epoch": 0.5050966679125155, "learning_rate": 8.34992827882093e-06, "loss": 3.066733093261719, "step": 418600 }, { "epoch": 0.5052173312349981, "learning_rate": 8.349524443353192e-06, "loss": 3.058432312011719, "step": 418700 }, { "epoch": 0.5053379945574809, "learning_rate": 8.349120607885454e-06, "loss": 3.0906692504882813, "step": 418800 }, { "epoch": 0.5054586578799635, "learning_rate": 8.348716772417716e-06, "loss": 3.048239440917969, "step": 418900 }, { "epoch": 0.5055793212024462, "learning_rate": 8.348312936949978e-06, "loss": 3.0807391357421876, "step": 419000 }, { "epoch": 0.5056999845249289, "learning_rate": 8.34790910148224e-06, "loss": 3.098170166015625, "step": 419100 }, { "epoch": 0.5058206478474115, "learning_rate": 8.3475052660145e-06, "loss": 3.056720886230469, "step": 419200 }, { "epoch": 0.5059413111698943, "learning_rate": 8.347101430546762e-06, "loss": 3.087235107421875, "step": 419300 }, { "epoch": 0.506061974492377, "learning_rate": 8.346697595079022e-06, "loss": 3.0625408935546874, "step": 419400 }, { "epoch": 0.5061826378148596, "learning_rate": 8.346293759611284e-06, "loss": 3.047413024902344, "step": 419500 }, { "epoch": 0.5063033011373423, "learning_rate": 8.345889924143546e-06, "loss": 3.032467956542969, "step": 419600 }, { "epoch": 0.506423964459825, "learning_rate": 8.345486088675808e-06, "loss": 3.070262145996094, "step": 419700 }, { "epoch": 0.5065446277823077, "learning_rate": 8.34508225320807e-06, "loss": 3.06198486328125, "step": 419800 }, { "epoch": 0.5066652911047904, "learning_rate": 8.344678417740332e-06, "loss": 3.0581536865234376, "step": 419900 }, { "epoch": 0.506785954427273, "learning_rate": 8.344274582272592e-06, "loss": 3.054132080078125, "step": 420000 }, { "epoch": 0.5069066177497558, "learning_rate": 8.343870746804854e-06, "loss": 3.0500445556640625, "step": 420100 }, { "epoch": 0.5070272810722384, "learning_rate": 8.343466911337116e-06, "loss": 3.069715576171875, "step": 420200 }, { "epoch": 0.5071479443947211, "learning_rate": 8.343063075869378e-06, "loss": 3.061250915527344, "step": 420300 }, { "epoch": 0.5072686077172038, "learning_rate": 8.342659240401639e-06, "loss": 3.065164794921875, "step": 420400 }, { "epoch": 0.5073892710396865, "learning_rate": 8.3422554049339e-06, "loss": 3.071152648925781, "step": 420500 }, { "epoch": 0.5075099343621692, "learning_rate": 8.341851569466163e-06, "loss": 3.0517401123046874, "step": 420600 }, { "epoch": 0.5076305976846518, "learning_rate": 8.341447733998425e-06, "loss": 3.04858642578125, "step": 420700 }, { "epoch": 0.5077512610071345, "learning_rate": 8.341043898530685e-06, "loss": 3.0574853515625, "step": 420800 }, { "epoch": 0.5078719243296173, "learning_rate": 8.340640063062947e-06, "loss": 3.0682489013671876, "step": 420900 }, { "epoch": 0.5079925876520999, "learning_rate": 8.340236227595209e-06, "loss": 3.070512390136719, "step": 421000 }, { "epoch": 0.5081132509745826, "learning_rate": 8.33983239212747e-06, "loss": 3.0714627075195313, "step": 421100 }, { "epoch": 0.5082339142970652, "learning_rate": 8.339428556659733e-06, "loss": 3.052193908691406, "step": 421200 }, { "epoch": 0.5083545776195479, "learning_rate": 8.339024721191995e-06, "loss": 3.048439636230469, "step": 421300 }, { "epoch": 0.5084752409420307, "learning_rate": 8.338620885724255e-06, "loss": 3.068442687988281, "step": 421400 }, { "epoch": 0.5085959042645133, "learning_rate": 8.338217050256517e-06, "loss": 3.0612451171875, "step": 421500 }, { "epoch": 0.508716567586996, "learning_rate": 8.337813214788777e-06, "loss": 3.0792041015625, "step": 421600 }, { "epoch": 0.5088372309094786, "learning_rate": 8.33740937932104e-06, "loss": 3.0510464477539063, "step": 421700 }, { "epoch": 0.5089578942319614, "learning_rate": 8.337005543853301e-06, "loss": 3.0392532348632812, "step": 421800 }, { "epoch": 0.5090785575544441, "learning_rate": 8.336601708385563e-06, "loss": 3.044076232910156, "step": 421900 }, { "epoch": 0.5091992208769267, "learning_rate": 8.336197872917825e-06, "loss": 3.04828369140625, "step": 422000 }, { "epoch": 0.5093198841994094, "learning_rate": 8.335794037450087e-06, "loss": 3.038778076171875, "step": 422100 }, { "epoch": 0.509440547521892, "learning_rate": 8.33539020198235e-06, "loss": 3.0599810791015627, "step": 422200 }, { "epoch": 0.5095612108443748, "learning_rate": 8.33498636651461e-06, "loss": 3.0603094482421875, "step": 422300 }, { "epoch": 0.5096818741668575, "learning_rate": 8.334582531046871e-06, "loss": 3.059103698730469, "step": 422400 }, { "epoch": 0.5098025374893401, "learning_rate": 8.334178695579133e-06, "loss": 3.037176208496094, "step": 422500 }, { "epoch": 0.5099232008118229, "learning_rate": 8.333774860111394e-06, "loss": 3.0613641357421875, "step": 422600 }, { "epoch": 0.5100438641343055, "learning_rate": 8.333371024643656e-06, "loss": 3.067445983886719, "step": 422700 }, { "epoch": 0.5101645274567882, "learning_rate": 8.332967189175918e-06, "loss": 3.075067443847656, "step": 422800 }, { "epoch": 0.5102851907792709, "learning_rate": 8.33256335370818e-06, "loss": 3.0423004150390627, "step": 422900 }, { "epoch": 0.5104058541017535, "learning_rate": 8.332159518240442e-06, "loss": 3.03037841796875, "step": 423000 }, { "epoch": 0.5105265174242363, "learning_rate": 8.331755682772704e-06, "loss": 3.0377597045898437, "step": 423100 }, { "epoch": 0.5106471807467189, "learning_rate": 8.331351847304966e-06, "loss": 3.0459384155273437, "step": 423200 }, { "epoch": 0.5107678440692016, "learning_rate": 8.330948011837226e-06, "loss": 3.0799755859375, "step": 423300 }, { "epoch": 0.5108885073916843, "learning_rate": 8.330544176369488e-06, "loss": 3.0394296264648437, "step": 423400 }, { "epoch": 0.511009170714167, "learning_rate": 8.330140340901748e-06, "loss": 3.0380587768554688, "step": 423500 }, { "epoch": 0.5111298340366497, "learning_rate": 8.32973650543401e-06, "loss": 3.0400350952148436, "step": 423600 }, { "epoch": 0.5112504973591323, "learning_rate": 8.329332669966272e-06, "loss": 3.0556790161132814, "step": 423700 }, { "epoch": 0.511371160681615, "learning_rate": 8.328928834498534e-06, "loss": 3.05145263671875, "step": 423800 }, { "epoch": 0.5114918240040978, "learning_rate": 8.328524999030796e-06, "loss": 3.056429443359375, "step": 423900 }, { "epoch": 0.5116124873265804, "learning_rate": 8.328121163563058e-06, "loss": 3.0487911987304686, "step": 424000 }, { "epoch": 0.5117331506490631, "learning_rate": 8.327717328095318e-06, "loss": 3.0483303833007813, "step": 424100 }, { "epoch": 0.5118538139715457, "learning_rate": 8.32731349262758e-06, "loss": 3.08312255859375, "step": 424200 }, { "epoch": 0.5119744772940285, "learning_rate": 8.326909657159842e-06, "loss": 3.0497344970703124, "step": 424300 }, { "epoch": 0.5120951406165112, "learning_rate": 8.326505821692104e-06, "loss": 3.067230529785156, "step": 424400 }, { "epoch": 0.5122158039389938, "learning_rate": 8.326101986224365e-06, "loss": 3.0073797607421877, "step": 424500 }, { "epoch": 0.5123364672614765, "learning_rate": 8.325698150756627e-06, "loss": 3.0361453247070314, "step": 424600 }, { "epoch": 0.5124571305839593, "learning_rate": 8.325294315288889e-06, "loss": 3.0673797607421873, "step": 424700 }, { "epoch": 0.5125777939064419, "learning_rate": 8.32489047982115e-06, "loss": 3.0618853759765625, "step": 424800 }, { "epoch": 0.5126984572289246, "learning_rate": 8.324486644353411e-06, "loss": 3.039766540527344, "step": 424900 }, { "epoch": 0.5128191205514072, "learning_rate": 8.324082808885673e-06, "loss": 3.0676339721679686, "step": 425000 }, { "epoch": 0.5129397838738899, "learning_rate": 8.323678973417935e-06, "loss": 3.052113037109375, "step": 425100 }, { "epoch": 0.5130604471963727, "learning_rate": 8.323275137950197e-06, "loss": 3.04845947265625, "step": 425200 }, { "epoch": 0.5131811105188553, "learning_rate": 8.322871302482459e-06, "loss": 3.0752008056640623, "step": 425300 }, { "epoch": 0.513301773841338, "learning_rate": 8.322467467014719e-06, "loss": 3.078260803222656, "step": 425400 }, { "epoch": 0.5134224371638206, "learning_rate": 8.322063631546981e-06, "loss": 3.0693145751953126, "step": 425500 }, { "epoch": 0.5135431004863034, "learning_rate": 8.321659796079243e-06, "loss": 3.062494812011719, "step": 425600 }, { "epoch": 0.5136637638087861, "learning_rate": 8.321255960611503e-06, "loss": 3.0423348999023436, "step": 425700 }, { "epoch": 0.5137844271312687, "learning_rate": 8.320852125143765e-06, "loss": 3.0554080200195313, "step": 425800 }, { "epoch": 0.5139050904537514, "learning_rate": 8.320448289676027e-06, "loss": 3.032933349609375, "step": 425900 }, { "epoch": 0.514025753776234, "learning_rate": 8.32004445420829e-06, "loss": 3.0390618896484374, "step": 426000 }, { "epoch": 0.5141464170987168, "learning_rate": 8.319640618740551e-06, "loss": 3.06499755859375, "step": 426100 }, { "epoch": 0.5142670804211995, "learning_rate": 8.319236783272813e-06, "loss": 3.0649758911132814, "step": 426200 }, { "epoch": 0.5143877437436821, "learning_rate": 8.318832947805075e-06, "loss": 3.02170654296875, "step": 426300 }, { "epoch": 0.5145084070661649, "learning_rate": 8.318429112337336e-06, "loss": 3.04176025390625, "step": 426400 }, { "epoch": 0.5146290703886475, "learning_rate": 8.318025276869598e-06, "loss": 3.058222351074219, "step": 426500 }, { "epoch": 0.5147497337111302, "learning_rate": 8.317621441401858e-06, "loss": 3.045534973144531, "step": 426600 }, { "epoch": 0.5148703970336129, "learning_rate": 8.31721760593412e-06, "loss": 3.05906982421875, "step": 426700 }, { "epoch": 0.5149910603560955, "learning_rate": 8.316813770466382e-06, "loss": 3.0301718139648437, "step": 426800 }, { "epoch": 0.5151117236785783, "learning_rate": 8.316409934998644e-06, "loss": 3.071788330078125, "step": 426900 }, { "epoch": 0.5152323870010609, "learning_rate": 8.316006099530906e-06, "loss": 3.033121337890625, "step": 427000 }, { "epoch": 0.5153530503235436, "learning_rate": 8.315602264063168e-06, "loss": 3.0305520629882814, "step": 427100 }, { "epoch": 0.5154737136460263, "learning_rate": 8.31519842859543e-06, "loss": 3.0346124267578123, "step": 427200 }, { "epoch": 0.515594376968509, "learning_rate": 8.31479459312769e-06, "loss": 3.075622253417969, "step": 427300 }, { "epoch": 0.5157150402909917, "learning_rate": 8.314390757659952e-06, "loss": 3.0046380615234374, "step": 427400 }, { "epoch": 0.5158357036134743, "learning_rate": 8.313986922192214e-06, "loss": 3.0335498046875, "step": 427500 }, { "epoch": 0.515956366935957, "learning_rate": 8.313583086724474e-06, "loss": 3.0385031127929687, "step": 427600 }, { "epoch": 0.5160770302584398, "learning_rate": 8.313179251256736e-06, "loss": 3.0766921997070313, "step": 427700 }, { "epoch": 0.5161976935809224, "learning_rate": 8.312775415788998e-06, "loss": 3.0377151489257814, "step": 427800 }, { "epoch": 0.5163183569034051, "learning_rate": 8.31237158032126e-06, "loss": 3.0509808349609373, "step": 427900 }, { "epoch": 0.5164390202258877, "learning_rate": 8.311967744853522e-06, "loss": 3.0555560302734377, "step": 428000 }, { "epoch": 0.5165596835483705, "learning_rate": 8.311563909385784e-06, "loss": 3.039304504394531, "step": 428100 }, { "epoch": 0.5166803468708532, "learning_rate": 8.311160073918044e-06, "loss": 3.058705139160156, "step": 428200 }, { "epoch": 0.5168010101933358, "learning_rate": 8.310756238450306e-06, "loss": 3.056860046386719, "step": 428300 }, { "epoch": 0.5169216735158185, "learning_rate": 8.310352402982568e-06, "loss": 3.046229248046875, "step": 428400 }, { "epoch": 0.5170423368383011, "learning_rate": 8.309948567514829e-06, "loss": 3.0511959838867186, "step": 428500 }, { "epoch": 0.5171630001607839, "learning_rate": 8.30954473204709e-06, "loss": 3.0641293334960937, "step": 428600 }, { "epoch": 0.5172836634832666, "learning_rate": 8.309140896579353e-06, "loss": 3.054437255859375, "step": 428700 }, { "epoch": 0.5174043268057492, "learning_rate": 8.308737061111615e-06, "loss": 3.0301165771484375, "step": 428800 }, { "epoch": 0.5175249901282319, "learning_rate": 8.308333225643877e-06, "loss": 3.0498062133789063, "step": 428900 }, { "epoch": 0.5176456534507146, "learning_rate": 8.307929390176137e-06, "loss": 3.0663275146484374, "step": 429000 }, { "epoch": 0.5177663167731973, "learning_rate": 8.307525554708399e-06, "loss": 3.061188049316406, "step": 429100 }, { "epoch": 0.51788698009568, "learning_rate": 8.307121719240661e-06, "loss": 3.045030212402344, "step": 429200 }, { "epoch": 0.5180076434181626, "learning_rate": 8.306717883772923e-06, "loss": 3.0660830688476564, "step": 429300 }, { "epoch": 0.5181283067406454, "learning_rate": 8.306314048305185e-06, "loss": 3.072074279785156, "step": 429400 }, { "epoch": 0.518248970063128, "learning_rate": 8.305910212837445e-06, "loss": 3.0510189819335936, "step": 429500 }, { "epoch": 0.5183696333856107, "learning_rate": 8.305506377369707e-06, "loss": 3.0200775146484373, "step": 429600 }, { "epoch": 0.5184902967080934, "learning_rate": 8.305102541901969e-06, "loss": 3.0297467041015627, "step": 429700 }, { "epoch": 0.518610960030576, "learning_rate": 8.30469870643423e-06, "loss": 3.053097839355469, "step": 429800 }, { "epoch": 0.5187316233530588, "learning_rate": 8.304294870966491e-06, "loss": 3.050734558105469, "step": 429900 }, { "epoch": 0.5188522866755415, "learning_rate": 8.303891035498753e-06, "loss": 3.05365234375, "step": 430000 }, { "epoch": 0.5189729499980241, "learning_rate": 8.303487200031015e-06, "loss": 3.0288882446289063, "step": 430100 }, { "epoch": 0.5190936133205069, "learning_rate": 8.303083364563277e-06, "loss": 3.063024597167969, "step": 430200 }, { "epoch": 0.5192142766429895, "learning_rate": 8.30267952909554e-06, "loss": 3.037414855957031, "step": 430300 }, { "epoch": 0.5193349399654722, "learning_rate": 8.3022756936278e-06, "loss": 3.055743408203125, "step": 430400 }, { "epoch": 0.5194556032879549, "learning_rate": 8.301871858160062e-06, "loss": 3.052115173339844, "step": 430500 }, { "epoch": 0.5195762666104375, "learning_rate": 8.301468022692324e-06, "loss": 3.0498760986328124, "step": 430600 }, { "epoch": 0.5196969299329203, "learning_rate": 8.301064187224584e-06, "loss": 3.0660003662109374, "step": 430700 }, { "epoch": 0.5198175932554029, "learning_rate": 8.300660351756846e-06, "loss": 3.0593902587890627, "step": 430800 }, { "epoch": 0.5199382565778856, "learning_rate": 8.300256516289108e-06, "loss": 3.0359820556640624, "step": 430900 }, { "epoch": 0.5200589199003683, "learning_rate": 8.29985268082137e-06, "loss": 3.044608154296875, "step": 431000 }, { "epoch": 0.520179583222851, "learning_rate": 8.299448845353632e-06, "loss": 3.043662109375, "step": 431100 }, { "epoch": 0.5203002465453337, "learning_rate": 8.299045009885894e-06, "loss": 3.0331790161132814, "step": 431200 }, { "epoch": 0.5204209098678163, "learning_rate": 8.298641174418156e-06, "loss": 3.06168212890625, "step": 431300 }, { "epoch": 0.520541573190299, "learning_rate": 8.298237338950416e-06, "loss": 3.0216925048828127, "step": 431400 }, { "epoch": 0.5206622365127818, "learning_rate": 8.297833503482678e-06, "loss": 3.04521728515625, "step": 431500 }, { "epoch": 0.5207828998352644, "learning_rate": 8.297429668014938e-06, "loss": 3.06349365234375, "step": 431600 }, { "epoch": 0.5209035631577471, "learning_rate": 8.2970258325472e-06, "loss": 3.015486145019531, "step": 431700 }, { "epoch": 0.5210242264802297, "learning_rate": 8.296621997079462e-06, "loss": 3.049866027832031, "step": 431800 }, { "epoch": 0.5211448898027125, "learning_rate": 8.296218161611724e-06, "loss": 3.0094125366210935, "step": 431900 }, { "epoch": 0.5212655531251952, "learning_rate": 8.295814326143986e-06, "loss": 3.06577880859375, "step": 432000 }, { "epoch": 0.5213862164476778, "learning_rate": 8.295410490676248e-06, "loss": 3.033587646484375, "step": 432100 }, { "epoch": 0.5215068797701605, "learning_rate": 8.29500665520851e-06, "loss": 3.037728576660156, "step": 432200 }, { "epoch": 0.5216275430926431, "learning_rate": 8.29460281974077e-06, "loss": 3.038385314941406, "step": 432300 }, { "epoch": 0.5217482064151259, "learning_rate": 8.294198984273032e-06, "loss": 3.0494979858398437, "step": 432400 }, { "epoch": 0.5218688697376086, "learning_rate": 8.293795148805294e-06, "loss": 3.053844299316406, "step": 432500 }, { "epoch": 0.5219895330600912, "learning_rate": 8.293391313337555e-06, "loss": 3.019091796875, "step": 432600 }, { "epoch": 0.5221101963825739, "learning_rate": 8.292987477869817e-06, "loss": 3.035799560546875, "step": 432700 }, { "epoch": 0.5222308597050566, "learning_rate": 8.292583642402079e-06, "loss": 3.0246429443359375, "step": 432800 }, { "epoch": 0.5223515230275393, "learning_rate": 8.29217980693434e-06, "loss": 3.0304010009765623, "step": 432900 }, { "epoch": 0.522472186350022, "learning_rate": 8.291775971466603e-06, "loss": 3.0269244384765623, "step": 433000 }, { "epoch": 0.5225928496725046, "learning_rate": 8.291372135998863e-06, "loss": 3.0511712646484375, "step": 433100 }, { "epoch": 0.5227135129949874, "learning_rate": 8.290968300531125e-06, "loss": 3.0312127685546875, "step": 433200 }, { "epoch": 0.52283417631747, "learning_rate": 8.290564465063387e-06, "loss": 3.023028564453125, "step": 433300 }, { "epoch": 0.5229548396399527, "learning_rate": 8.290160629595649e-06, "loss": 3.01251220703125, "step": 433400 }, { "epoch": 0.5230755029624354, "learning_rate": 8.28975679412791e-06, "loss": 3.0403378295898436, "step": 433500 }, { "epoch": 0.523196166284918, "learning_rate": 8.289352958660171e-06, "loss": 3.037583923339844, "step": 433600 }, { "epoch": 0.5233168296074008, "learning_rate": 8.288949123192433e-06, "loss": 3.052095947265625, "step": 433700 }, { "epoch": 0.5234374929298834, "learning_rate": 8.288545287724695e-06, "loss": 3.0461572265625, "step": 433800 }, { "epoch": 0.5235581562523661, "learning_rate": 8.288141452256955e-06, "loss": 3.0304461669921876, "step": 433900 }, { "epoch": 0.5236788195748489, "learning_rate": 8.287737616789217e-06, "loss": 3.0209609985351564, "step": 434000 }, { "epoch": 0.5237994828973315, "learning_rate": 8.28733378132148e-06, "loss": 3.01710205078125, "step": 434100 }, { "epoch": 0.5239201462198142, "learning_rate": 8.286929945853741e-06, "loss": 3.0505917358398436, "step": 434200 }, { "epoch": 0.5240408095422968, "learning_rate": 8.286526110386003e-06, "loss": 3.0195462036132814, "step": 434300 }, { "epoch": 0.5241614728647795, "learning_rate": 8.286122274918265e-06, "loss": 3.0492449951171876, "step": 434400 }, { "epoch": 0.5242821361872623, "learning_rate": 8.285718439450526e-06, "loss": 3.0434799194335938, "step": 434500 }, { "epoch": 0.5244027995097449, "learning_rate": 8.285314603982788e-06, "loss": 3.0262298583984375, "step": 434600 }, { "epoch": 0.5245234628322276, "learning_rate": 8.284910768515048e-06, "loss": 3.0278640747070313, "step": 434700 }, { "epoch": 0.5246441261547103, "learning_rate": 8.28450693304731e-06, "loss": 3.027030334472656, "step": 434800 }, { "epoch": 0.524764789477193, "learning_rate": 8.284103097579572e-06, "loss": 3.0209881591796877, "step": 434900 }, { "epoch": 0.5248854527996757, "learning_rate": 8.283699262111834e-06, "loss": 3.0090411376953123, "step": 435000 }, { "epoch": 0.5250061161221583, "learning_rate": 8.283295426644096e-06, "loss": 3.0484347534179688, "step": 435100 }, { "epoch": 0.525126779444641, "learning_rate": 8.282891591176358e-06, "loss": 3.029527282714844, "step": 435200 }, { "epoch": 0.5252474427671238, "learning_rate": 8.28248775570862e-06, "loss": 3.046122741699219, "step": 435300 }, { "epoch": 0.5253681060896064, "learning_rate": 8.282083920240882e-06, "loss": 3.0437503051757813, "step": 435400 }, { "epoch": 0.5254887694120891, "learning_rate": 8.281680084773142e-06, "loss": 3.017331237792969, "step": 435500 }, { "epoch": 0.5256094327345717, "learning_rate": 8.281276249305404e-06, "loss": 3.019862060546875, "step": 435600 }, { "epoch": 0.5257300960570545, "learning_rate": 8.280872413837664e-06, "loss": 3.0174725341796873, "step": 435700 }, { "epoch": 0.5258507593795372, "learning_rate": 8.280468578369926e-06, "loss": 3.0225360107421877, "step": 435800 }, { "epoch": 0.5259714227020198, "learning_rate": 8.280064742902188e-06, "loss": 3.048797607421875, "step": 435900 }, { "epoch": 0.5260920860245025, "learning_rate": 8.27966090743445e-06, "loss": 3.0422622680664064, "step": 436000 }, { "epoch": 0.5262127493469851, "learning_rate": 8.279257071966712e-06, "loss": 3.029744873046875, "step": 436100 }, { "epoch": 0.5263334126694679, "learning_rate": 8.278853236498974e-06, "loss": 3.026267395019531, "step": 436200 }, { "epoch": 0.5264540759919506, "learning_rate": 8.278449401031235e-06, "loss": 3.0416055297851563, "step": 436300 }, { "epoch": 0.5265747393144332, "learning_rate": 8.278045565563496e-06, "loss": 3.0519058227539064, "step": 436400 }, { "epoch": 0.5266954026369159, "learning_rate": 8.277641730095758e-06, "loss": 3.054364013671875, "step": 436500 }, { "epoch": 0.5268160659593986, "learning_rate": 8.27723789462802e-06, "loss": 3.0086798095703124, "step": 436600 }, { "epoch": 0.5269367292818813, "learning_rate": 8.27683405916028e-06, "loss": 3.0447116088867188, "step": 436700 }, { "epoch": 0.527057392604364, "learning_rate": 8.276430223692543e-06, "loss": 3.039418029785156, "step": 436800 }, { "epoch": 0.5271780559268466, "learning_rate": 8.276026388224805e-06, "loss": 3.0420828247070313, "step": 436900 }, { "epoch": 0.5272987192493294, "learning_rate": 8.275622552757067e-06, "loss": 3.056221618652344, "step": 437000 }, { "epoch": 0.527419382571812, "learning_rate": 8.275218717289327e-06, "loss": 3.032608947753906, "step": 437100 }, { "epoch": 0.5275400458942947, "learning_rate": 8.274814881821589e-06, "loss": 3.0226190185546873, "step": 437200 }, { "epoch": 0.5276607092167774, "learning_rate": 8.274411046353851e-06, "loss": 2.998238830566406, "step": 437300 }, { "epoch": 0.52778137253926, "learning_rate": 8.274007210886113e-06, "loss": 3.0441619873046877, "step": 437400 }, { "epoch": 0.5279020358617428, "learning_rate": 8.273603375418375e-06, "loss": 3.0439849853515626, "step": 437500 }, { "epoch": 0.5280226991842254, "learning_rate": 8.273199539950635e-06, "loss": 3.0543450927734375, "step": 437600 }, { "epoch": 0.5281433625067081, "learning_rate": 8.272795704482897e-06, "loss": 3.020230407714844, "step": 437700 }, { "epoch": 0.5282640258291909, "learning_rate": 8.27239186901516e-06, "loss": 3.038050231933594, "step": 437800 }, { "epoch": 0.5283846891516735, "learning_rate": 8.271988033547421e-06, "loss": 3.021733703613281, "step": 437900 }, { "epoch": 0.5285053524741562, "learning_rate": 8.271584198079681e-06, "loss": 3.029966125488281, "step": 438000 }, { "epoch": 0.5286260157966388, "learning_rate": 8.271180362611943e-06, "loss": 3.053952331542969, "step": 438100 }, { "epoch": 0.5287466791191215, "learning_rate": 8.270776527144205e-06, "loss": 3.02169677734375, "step": 438200 }, { "epoch": 0.5288673424416043, "learning_rate": 8.270372691676467e-06, "loss": 3.0531158447265625, "step": 438300 }, { "epoch": 0.5289880057640869, "learning_rate": 8.26996885620873e-06, "loss": 3.0478030395507814, "step": 438400 }, { "epoch": 0.5291086690865696, "learning_rate": 8.269565020740991e-06, "loss": 3.021881103515625, "step": 438500 }, { "epoch": 0.5292293324090522, "learning_rate": 8.269161185273252e-06, "loss": 3.0300494384765626, "step": 438600 }, { "epoch": 0.529349995731535, "learning_rate": 8.268757349805514e-06, "loss": 3.0104168701171874, "step": 438700 }, { "epoch": 0.5294706590540177, "learning_rate": 8.268353514337774e-06, "loss": 3.020096740722656, "step": 438800 }, { "epoch": 0.5295913223765003, "learning_rate": 8.267949678870036e-06, "loss": 3.0495291137695313, "step": 438900 }, { "epoch": 0.529711985698983, "learning_rate": 8.267545843402298e-06, "loss": 3.0659521484375, "step": 439000 }, { "epoch": 0.5298326490214657, "learning_rate": 8.26714200793456e-06, "loss": 3.0177215576171874, "step": 439100 }, { "epoch": 0.5299533123439484, "learning_rate": 8.266738172466822e-06, "loss": 3.036053466796875, "step": 439200 }, { "epoch": 0.5300739756664311, "learning_rate": 8.266334336999084e-06, "loss": 3.007360534667969, "step": 439300 }, { "epoch": 0.5301946389889137, "learning_rate": 8.265930501531346e-06, "loss": 3.0053591918945313, "step": 439400 }, { "epoch": 0.5303153023113965, "learning_rate": 8.265526666063606e-06, "loss": 3.043965148925781, "step": 439500 }, { "epoch": 0.5304359656338791, "learning_rate": 8.265122830595868e-06, "loss": 3.0373468017578125, "step": 439600 }, { "epoch": 0.5305566289563618, "learning_rate": 8.26471899512813e-06, "loss": 3.0461749267578124, "step": 439700 }, { "epoch": 0.5306772922788445, "learning_rate": 8.26431515966039e-06, "loss": 3.0115863037109376, "step": 439800 }, { "epoch": 0.5307979556013271, "learning_rate": 8.263911324192652e-06, "loss": 3.0024359130859377, "step": 439900 }, { "epoch": 0.5309186189238099, "learning_rate": 8.263507488724914e-06, "loss": 3.021661682128906, "step": 440000 }, { "epoch": 0.5310392822462926, "learning_rate": 8.263103653257176e-06, "loss": 3.026658630371094, "step": 440100 }, { "epoch": 0.5311599455687752, "learning_rate": 8.262699817789438e-06, "loss": 3.0172085571289062, "step": 440200 }, { "epoch": 0.5312806088912579, "learning_rate": 8.2622959823217e-06, "loss": 3.02299560546875, "step": 440300 }, { "epoch": 0.5314012722137406, "learning_rate": 8.26189214685396e-06, "loss": 3.0163613891601564, "step": 440400 }, { "epoch": 0.5315219355362233, "learning_rate": 8.261488311386223e-06, "loss": 3.043457336425781, "step": 440500 }, { "epoch": 0.531642598858706, "learning_rate": 8.261084475918485e-06, "loss": 3.0227670288085937, "step": 440600 }, { "epoch": 0.5317632621811886, "learning_rate": 8.260680640450745e-06, "loss": 3.02986328125, "step": 440700 }, { "epoch": 0.5318839255036714, "learning_rate": 8.260276804983007e-06, "loss": 3.028037414550781, "step": 440800 }, { "epoch": 0.532004588826154, "learning_rate": 8.259872969515269e-06, "loss": 3.01552490234375, "step": 440900 }, { "epoch": 0.5321252521486367, "learning_rate": 8.25946913404753e-06, "loss": 3.027689208984375, "step": 441000 }, { "epoch": 0.5322459154711194, "learning_rate": 8.259065298579793e-06, "loss": 3.02337158203125, "step": 441100 }, { "epoch": 0.532366578793602, "learning_rate": 8.258661463112053e-06, "loss": 3.002225036621094, "step": 441200 }, { "epoch": 0.5324872421160848, "learning_rate": 8.258257627644315e-06, "loss": 3.015375671386719, "step": 441300 }, { "epoch": 0.5326079054385674, "learning_rate": 8.257853792176577e-06, "loss": 3.0085568237304687, "step": 441400 }, { "epoch": 0.5327285687610501, "learning_rate": 8.257449956708839e-06, "loss": 3.029344482421875, "step": 441500 }, { "epoch": 0.5328492320835329, "learning_rate": 8.257046121241101e-06, "loss": 3.0445382690429685, "step": 441600 }, { "epoch": 0.5329698954060155, "learning_rate": 8.256642285773361e-06, "loss": 3.036221923828125, "step": 441700 }, { "epoch": 0.5330905587284982, "learning_rate": 8.256238450305623e-06, "loss": 3.022719421386719, "step": 441800 }, { "epoch": 0.5332112220509808, "learning_rate": 8.255834614837885e-06, "loss": 3.015985107421875, "step": 441900 }, { "epoch": 0.5333318853734635, "learning_rate": 8.255430779370145e-06, "loss": 3.007535095214844, "step": 442000 }, { "epoch": 0.5334525486959463, "learning_rate": 8.255026943902407e-06, "loss": 2.9976519775390624, "step": 442100 }, { "epoch": 0.5335732120184289, "learning_rate": 8.25462310843467e-06, "loss": 3.026825256347656, "step": 442200 }, { "epoch": 0.5336938753409116, "learning_rate": 8.254219272966931e-06, "loss": 3.0377377319335936, "step": 442300 }, { "epoch": 0.5338145386633942, "learning_rate": 8.253815437499193e-06, "loss": 3.037503356933594, "step": 442400 }, { "epoch": 0.533935201985877, "learning_rate": 8.253411602031455e-06, "loss": 3.0330621337890626, "step": 442500 }, { "epoch": 0.5340558653083597, "learning_rate": 8.253007766563716e-06, "loss": 3.0423260498046876, "step": 442600 }, { "epoch": 0.5341765286308423, "learning_rate": 8.252603931095978e-06, "loss": 3.013909912109375, "step": 442700 }, { "epoch": 0.534297191953325, "learning_rate": 8.25220009562824e-06, "loss": 3.040461120605469, "step": 442800 }, { "epoch": 0.5344178552758077, "learning_rate": 8.2517962601605e-06, "loss": 3.0267962646484374, "step": 442900 }, { "epoch": 0.5345385185982904, "learning_rate": 8.251392424692762e-06, "loss": 3.031927490234375, "step": 443000 }, { "epoch": 0.5346591819207731, "learning_rate": 8.250988589225024e-06, "loss": 3.0334930419921875, "step": 443100 }, { "epoch": 0.5347798452432557, "learning_rate": 8.250584753757286e-06, "loss": 3.0304254150390624, "step": 443200 }, { "epoch": 0.5349005085657385, "learning_rate": 8.250180918289548e-06, "loss": 3.0278860473632814, "step": 443300 }, { "epoch": 0.5350211718882211, "learning_rate": 8.24977708282181e-06, "loss": 3.04392333984375, "step": 443400 }, { "epoch": 0.5351418352107038, "learning_rate": 8.249373247354072e-06, "loss": 3.0515933227539063, "step": 443500 }, { "epoch": 0.5352624985331865, "learning_rate": 8.248969411886332e-06, "loss": 2.9995220947265624, "step": 443600 }, { "epoch": 0.5353831618556691, "learning_rate": 8.248565576418594e-06, "loss": 3.05199951171875, "step": 443700 }, { "epoch": 0.5355038251781519, "learning_rate": 8.248161740950854e-06, "loss": 3.029063415527344, "step": 443800 }, { "epoch": 0.5356244885006345, "learning_rate": 8.247757905483116e-06, "loss": 3.0162322998046873, "step": 443900 }, { "epoch": 0.5357451518231172, "learning_rate": 8.247354070015378e-06, "loss": 3.0014007568359373, "step": 444000 }, { "epoch": 0.5358658151455999, "learning_rate": 8.24695023454764e-06, "loss": 3.019384765625, "step": 444100 }, { "epoch": 0.5359864784680826, "learning_rate": 8.246546399079902e-06, "loss": 3.014043273925781, "step": 444200 }, { "epoch": 0.5361071417905653, "learning_rate": 8.246142563612164e-06, "loss": 3.0233529663085936, "step": 444300 }, { "epoch": 0.5362278051130479, "learning_rate": 8.245738728144426e-06, "loss": 3.0105099487304687, "step": 444400 }, { "epoch": 0.5363484684355306, "learning_rate": 8.245334892676687e-06, "loss": 3.01185791015625, "step": 444500 }, { "epoch": 0.5364691317580134, "learning_rate": 8.244931057208949e-06, "loss": 3.0508038330078127, "step": 444600 }, { "epoch": 0.536589795080496, "learning_rate": 8.24452722174121e-06, "loss": 3.016676330566406, "step": 444700 }, { "epoch": 0.5367104584029787, "learning_rate": 8.24412338627347e-06, "loss": 3.029635314941406, "step": 444800 }, { "epoch": 0.5368311217254613, "learning_rate": 8.243719550805733e-06, "loss": 3.021878356933594, "step": 444900 }, { "epoch": 0.536951785047944, "learning_rate": 8.243315715337995e-06, "loss": 3.0114556884765626, "step": 445000 }, { "epoch": 0.5370724483704268, "learning_rate": 8.242911879870257e-06, "loss": 3.020982666015625, "step": 445100 }, { "epoch": 0.5371931116929094, "learning_rate": 8.242508044402519e-06, "loss": 3.0232113647460936, "step": 445200 }, { "epoch": 0.5373137750153921, "learning_rate": 8.242104208934779e-06, "loss": 3.005293884277344, "step": 445300 }, { "epoch": 0.5374344383378749, "learning_rate": 8.241700373467041e-06, "loss": 3.03168701171875, "step": 445400 }, { "epoch": 0.5375551016603575, "learning_rate": 8.241296537999303e-06, "loss": 3.009619140625, "step": 445500 }, { "epoch": 0.5376757649828402, "learning_rate": 8.240892702531565e-06, "loss": 3.030387268066406, "step": 445600 }, { "epoch": 0.5377964283053228, "learning_rate": 8.240488867063825e-06, "loss": 3.004181213378906, "step": 445700 }, { "epoch": 0.5379170916278055, "learning_rate": 8.240085031596087e-06, "loss": 3.009443359375, "step": 445800 }, { "epoch": 0.5380377549502883, "learning_rate": 8.23968119612835e-06, "loss": 3.0328079223632813, "step": 445900 }, { "epoch": 0.5381584182727709, "learning_rate": 8.239277360660611e-06, "loss": 3.008001403808594, "step": 446000 }, { "epoch": 0.5382790815952536, "learning_rate": 8.238873525192872e-06, "loss": 3.0023226928710938, "step": 446100 }, { "epoch": 0.5383997449177362, "learning_rate": 8.238469689725134e-06, "loss": 3.0127142333984374, "step": 446200 }, { "epoch": 0.538520408240219, "learning_rate": 8.238065854257395e-06, "loss": 3.0399655151367186, "step": 446300 }, { "epoch": 0.5386410715627017, "learning_rate": 8.237662018789657e-06, "loss": 3.000540771484375, "step": 446400 }, { "epoch": 0.5387617348851843, "learning_rate": 8.23725818332192e-06, "loss": 3.0260101318359376, "step": 446500 }, { "epoch": 0.538882398207667, "learning_rate": 8.236854347854181e-06, "loss": 3.013153381347656, "step": 446600 }, { "epoch": 0.5390030615301497, "learning_rate": 8.236450512386442e-06, "loss": 3.0308767700195314, "step": 446700 }, { "epoch": 0.5391237248526324, "learning_rate": 8.236046676918704e-06, "loss": 3.015799865722656, "step": 446800 }, { "epoch": 0.5392443881751151, "learning_rate": 8.235642841450964e-06, "loss": 3.0192779541015624, "step": 446900 }, { "epoch": 0.5393650514975977, "learning_rate": 8.235239005983226e-06, "loss": 3.0200576782226562, "step": 447000 }, { "epoch": 0.5394857148200805, "learning_rate": 8.234835170515488e-06, "loss": 3.0116571044921874, "step": 447100 }, { "epoch": 0.5396063781425631, "learning_rate": 8.23443133504775e-06, "loss": 3.0280792236328127, "step": 447200 }, { "epoch": 0.5397270414650458, "learning_rate": 8.234027499580012e-06, "loss": 3.02627685546875, "step": 447300 }, { "epoch": 0.5398477047875285, "learning_rate": 8.233623664112274e-06, "loss": 3.011654052734375, "step": 447400 }, { "epoch": 0.5399683681100111, "learning_rate": 8.233219828644536e-06, "loss": 3.0159393310546876, "step": 447500 }, { "epoch": 0.5400890314324939, "learning_rate": 8.232815993176798e-06, "loss": 3.0320013427734374, "step": 447600 }, { "epoch": 0.5402096947549765, "learning_rate": 8.232412157709058e-06, "loss": 2.9989382934570314, "step": 447700 }, { "epoch": 0.5403303580774592, "learning_rate": 8.23200832224132e-06, "loss": 3.0335263061523436, "step": 447800 }, { "epoch": 0.5404510213999419, "learning_rate": 8.23160448677358e-06, "loss": 3.009174499511719, "step": 447900 }, { "epoch": 0.5405716847224246, "learning_rate": 8.231200651305842e-06, "loss": 3.0320751953125, "step": 448000 }, { "epoch": 0.5406923480449073, "learning_rate": 8.230796815838104e-06, "loss": 3.00021728515625, "step": 448100 }, { "epoch": 0.5408130113673899, "learning_rate": 8.230392980370366e-06, "loss": 3.0343118286132813, "step": 448200 }, { "epoch": 0.5409336746898726, "learning_rate": 8.229989144902628e-06, "loss": 3.0097808837890625, "step": 448300 }, { "epoch": 0.5410543380123554, "learning_rate": 8.22958530943489e-06, "loss": 3.0248489379882812, "step": 448400 }, { "epoch": 0.541175001334838, "learning_rate": 8.229181473967152e-06, "loss": 2.9971588134765623, "step": 448500 }, { "epoch": 0.5412956646573207, "learning_rate": 8.228777638499413e-06, "loss": 3.0415640258789063, "step": 448600 }, { "epoch": 0.5414163279798033, "learning_rate": 8.228373803031675e-06, "loss": 3.0337384033203123, "step": 448700 }, { "epoch": 0.541536991302286, "learning_rate": 8.227969967563937e-06, "loss": 3.025321044921875, "step": 448800 }, { "epoch": 0.5416576546247688, "learning_rate": 8.227566132096197e-06, "loss": 3.026483459472656, "step": 448900 }, { "epoch": 0.5417783179472514, "learning_rate": 8.227162296628459e-06, "loss": 3.0326153564453127, "step": 449000 }, { "epoch": 0.5418989812697341, "learning_rate": 8.22675846116072e-06, "loss": 2.998897705078125, "step": 449100 }, { "epoch": 0.5420196445922167, "learning_rate": 8.226354625692983e-06, "loss": 2.9886660766601563, "step": 449200 }, { "epoch": 0.5421403079146995, "learning_rate": 8.225950790225245e-06, "loss": 3.0406594848632813, "step": 449300 }, { "epoch": 0.5422609712371822, "learning_rate": 8.225546954757505e-06, "loss": 3.048433532714844, "step": 449400 }, { "epoch": 0.5423816345596648, "learning_rate": 8.225143119289767e-06, "loss": 3.022899169921875, "step": 449500 }, { "epoch": 0.5425022978821475, "learning_rate": 8.224739283822029e-06, "loss": 3.015343017578125, "step": 449600 }, { "epoch": 0.5426229612046302, "learning_rate": 8.224335448354291e-06, "loss": 3.015889892578125, "step": 449700 }, { "epoch": 0.5427436245271129, "learning_rate": 8.223931612886551e-06, "loss": 3.0024258422851564, "step": 449800 }, { "epoch": 0.5428642878495956, "learning_rate": 8.223527777418813e-06, "loss": 3.009610900878906, "step": 449900 }, { "epoch": 0.5429849511720782, "learning_rate": 8.223123941951075e-06, "loss": 2.999173583984375, "step": 450000 }, { "epoch": 0.543105614494561, "learning_rate": 8.222720106483337e-06, "loss": 3.0015234375, "step": 450100 }, { "epoch": 0.5432262778170436, "learning_rate": 8.222316271015598e-06, "loss": 3.0120281982421875, "step": 450200 }, { "epoch": 0.5433469411395263, "learning_rate": 8.22191243554786e-06, "loss": 2.999786376953125, "step": 450300 }, { "epoch": 0.543467604462009, "learning_rate": 8.221508600080122e-06, "loss": 3.0111660766601562, "step": 450400 }, { "epoch": 0.5435882677844917, "learning_rate": 8.221104764612384e-06, "loss": 3.0109133911132813, "step": 450500 }, { "epoch": 0.5437089311069744, "learning_rate": 8.220700929144645e-06, "loss": 2.984908447265625, "step": 450600 }, { "epoch": 0.5438295944294571, "learning_rate": 8.220297093676907e-06, "loss": 2.9949130249023437, "step": 450700 }, { "epoch": 0.5439502577519397, "learning_rate": 8.219893258209168e-06, "loss": 3.021127014160156, "step": 450800 }, { "epoch": 0.5440709210744225, "learning_rate": 8.21948942274143e-06, "loss": 3.0266192626953123, "step": 450900 }, { "epoch": 0.5441915843969051, "learning_rate": 8.21908558727369e-06, "loss": 3.0105615234375, "step": 451000 }, { "epoch": 0.5443122477193878, "learning_rate": 8.218681751805952e-06, "loss": 3.0360455322265625, "step": 451100 }, { "epoch": 0.5444329110418705, "learning_rate": 8.218277916338214e-06, "loss": 2.9971127319335937, "step": 451200 }, { "epoch": 0.5445535743643531, "learning_rate": 8.217874080870476e-06, "loss": 2.995586242675781, "step": 451300 }, { "epoch": 0.5446742376868359, "learning_rate": 8.217470245402738e-06, "loss": 3.0117559814453125, "step": 451400 }, { "epoch": 0.5447949010093185, "learning_rate": 8.217066409935e-06, "loss": 3.036898498535156, "step": 451500 }, { "epoch": 0.5449155643318012, "learning_rate": 8.216662574467262e-06, "loss": 3.04584228515625, "step": 451600 }, { "epoch": 0.545036227654284, "learning_rate": 8.216258738999522e-06, "loss": 3.030256652832031, "step": 451700 }, { "epoch": 0.5451568909767666, "learning_rate": 8.215854903531784e-06, "loss": 3.0310906982421875, "step": 451800 }, { "epoch": 0.5452775542992493, "learning_rate": 8.215451068064046e-06, "loss": 2.9987249755859375, "step": 451900 }, { "epoch": 0.5453982176217319, "learning_rate": 8.215047232596306e-06, "loss": 2.998523864746094, "step": 452000 }, { "epoch": 0.5455188809442146, "learning_rate": 8.214643397128568e-06, "loss": 3.024566345214844, "step": 452100 }, { "epoch": 0.5456395442666974, "learning_rate": 8.21423956166083e-06, "loss": 3.0222308349609377, "step": 452200 }, { "epoch": 0.54576020758918, "learning_rate": 8.213835726193092e-06, "loss": 3.010903625488281, "step": 452300 }, { "epoch": 0.5458808709116627, "learning_rate": 8.213431890725354e-06, "loss": 3.0244232177734376, "step": 452400 }, { "epoch": 0.5460015342341453, "learning_rate": 8.213028055257616e-06, "loss": 3.0216119384765623, "step": 452500 }, { "epoch": 0.546122197556628, "learning_rate": 8.212624219789877e-06, "loss": 2.999864501953125, "step": 452600 }, { "epoch": 0.5462428608791108, "learning_rate": 8.212220384322139e-06, "loss": 3.0284210205078126, "step": 452700 }, { "epoch": 0.5463635242015934, "learning_rate": 8.2118165488544e-06, "loss": 2.999059143066406, "step": 452800 }, { "epoch": 0.5464841875240761, "learning_rate": 8.211412713386661e-06, "loss": 3.042408142089844, "step": 452900 }, { "epoch": 0.5466048508465587, "learning_rate": 8.211008877918923e-06, "loss": 3.024136962890625, "step": 453000 }, { "epoch": 0.5467255141690415, "learning_rate": 8.210605042451185e-06, "loss": 2.9897027587890626, "step": 453100 }, { "epoch": 0.5468461774915242, "learning_rate": 8.210201206983447e-06, "loss": 3.007030334472656, "step": 453200 }, { "epoch": 0.5469668408140068, "learning_rate": 8.209797371515709e-06, "loss": 3.0133856201171874, "step": 453300 }, { "epoch": 0.5470875041364895, "learning_rate": 8.20939353604797e-06, "loss": 3.0122451782226562, "step": 453400 }, { "epoch": 0.5472081674589722, "learning_rate": 8.208989700580231e-06, "loss": 3.022361145019531, "step": 453500 }, { "epoch": 0.5473288307814549, "learning_rate": 8.208585865112493e-06, "loss": 3.0185812377929686, "step": 453600 }, { "epoch": 0.5474494941039376, "learning_rate": 8.208182029644755e-06, "loss": 2.9914254760742187, "step": 453700 }, { "epoch": 0.5475701574264202, "learning_rate": 8.207778194177017e-06, "loss": 3.001167907714844, "step": 453800 }, { "epoch": 0.547690820748903, "learning_rate": 8.207374358709277e-06, "loss": 3.0201190185546873, "step": 453900 }, { "epoch": 0.5478114840713856, "learning_rate": 8.20697052324154e-06, "loss": 3.0026666259765626, "step": 454000 }, { "epoch": 0.5479321473938683, "learning_rate": 8.206566687773801e-06, "loss": 2.999969787597656, "step": 454100 }, { "epoch": 0.548052810716351, "learning_rate": 8.206162852306063e-06, "loss": 3.0005563354492186, "step": 454200 }, { "epoch": 0.5481734740388337, "learning_rate": 8.205759016838324e-06, "loss": 3.002593994140625, "step": 454300 }, { "epoch": 0.5482941373613164, "learning_rate": 8.205355181370586e-06, "loss": 3.0044915771484373, "step": 454400 }, { "epoch": 0.548414800683799, "learning_rate": 8.204951345902848e-06, "loss": 2.9987005615234374, "step": 454500 }, { "epoch": 0.5485354640062817, "learning_rate": 8.20454751043511e-06, "loss": 3.0016461181640626, "step": 454600 }, { "epoch": 0.5486561273287645, "learning_rate": 8.204143674967372e-06, "loss": 3.0159988403320312, "step": 454700 }, { "epoch": 0.5487767906512471, "learning_rate": 8.203739839499632e-06, "loss": 3.0185556030273437, "step": 454800 }, { "epoch": 0.5488974539737298, "learning_rate": 8.203336004031894e-06, "loss": 2.9955682373046875, "step": 454900 }, { "epoch": 0.5490181172962124, "learning_rate": 8.202932168564156e-06, "loss": 3.0180563354492187, "step": 455000 }, { "epoch": 0.5491387806186951, "learning_rate": 8.202528333096416e-06, "loss": 3.00729248046875, "step": 455100 }, { "epoch": 0.5492594439411779, "learning_rate": 8.202124497628678e-06, "loss": 2.981845703125, "step": 455200 }, { "epoch": 0.5493801072636605, "learning_rate": 8.20172066216094e-06, "loss": 3.0141424560546874, "step": 455300 }, { "epoch": 0.5495007705861432, "learning_rate": 8.201316826693202e-06, "loss": 2.9988238525390627, "step": 455400 }, { "epoch": 0.5496214339086258, "learning_rate": 8.200912991225464e-06, "loss": 3.0104196166992185, "step": 455500 }, { "epoch": 0.5497420972311086, "learning_rate": 8.200509155757726e-06, "loss": 3.0210446166992186, "step": 455600 }, { "epoch": 0.5498627605535913, "learning_rate": 8.200105320289988e-06, "loss": 2.9909295654296875, "step": 455700 }, { "epoch": 0.5499834238760739, "learning_rate": 8.199701484822248e-06, "loss": 3.017538757324219, "step": 455800 }, { "epoch": 0.5501040871985566, "learning_rate": 8.19929764935451e-06, "loss": 3.0219967651367186, "step": 455900 }, { "epoch": 0.5502247505210394, "learning_rate": 8.19889381388677e-06, "loss": 2.9999539184570314, "step": 456000 }, { "epoch": 0.550345413843522, "learning_rate": 8.198489978419033e-06, "loss": 2.9966256713867185, "step": 456100 }, { "epoch": 0.5504660771660047, "learning_rate": 8.198086142951294e-06, "loss": 3.0037548828125, "step": 456200 }, { "epoch": 0.5505867404884873, "learning_rate": 8.197682307483556e-06, "loss": 3.0014892578125, "step": 456300 }, { "epoch": 0.55070740381097, "learning_rate": 8.197278472015818e-06, "loss": 3.0157656860351563, "step": 456400 }, { "epoch": 0.5508280671334528, "learning_rate": 8.19687463654808e-06, "loss": 3.0050479125976564, "step": 456500 }, { "epoch": 0.5509487304559354, "learning_rate": 8.196470801080342e-06, "loss": 2.996612548828125, "step": 456600 }, { "epoch": 0.5510693937784181, "learning_rate": 8.196066965612603e-06, "loss": 3.0021636962890623, "step": 456700 }, { "epoch": 0.5511900571009007, "learning_rate": 8.195663130144865e-06, "loss": 3.01055419921875, "step": 456800 }, { "epoch": 0.5513107204233835, "learning_rate": 8.195259294677127e-06, "loss": 2.991148681640625, "step": 456900 }, { "epoch": 0.5514313837458662, "learning_rate": 8.194855459209387e-06, "loss": 2.985732116699219, "step": 457000 }, { "epoch": 0.5515520470683488, "learning_rate": 8.194451623741649e-06, "loss": 3.0277813720703124, "step": 457100 }, { "epoch": 0.5516727103908315, "learning_rate": 8.194047788273911e-06, "loss": 3.0079150390625, "step": 457200 }, { "epoch": 0.5517933737133142, "learning_rate": 8.193643952806173e-06, "loss": 3.035090026855469, "step": 457300 }, { "epoch": 0.5519140370357969, "learning_rate": 8.193240117338435e-06, "loss": 3.0119354248046877, "step": 457400 }, { "epoch": 0.5520347003582796, "learning_rate": 8.192836281870695e-06, "loss": 3.022391357421875, "step": 457500 }, { "epoch": 0.5521553636807622, "learning_rate": 8.192432446402957e-06, "loss": 2.9878070068359377, "step": 457600 }, { "epoch": 0.552276027003245, "learning_rate": 8.192028610935219e-06, "loss": 2.9676254272460936, "step": 457700 }, { "epoch": 0.5523966903257276, "learning_rate": 8.191624775467481e-06, "loss": 3.000948181152344, "step": 457800 }, { "epoch": 0.5525173536482103, "learning_rate": 8.191220939999741e-06, "loss": 3.0209481811523435, "step": 457900 }, { "epoch": 0.552638016970693, "learning_rate": 8.190817104532003e-06, "loss": 3.016698303222656, "step": 458000 }, { "epoch": 0.5527586802931757, "learning_rate": 8.190413269064265e-06, "loss": 2.993017272949219, "step": 458100 }, { "epoch": 0.5528793436156584, "learning_rate": 8.190009433596527e-06, "loss": 2.995467529296875, "step": 458200 }, { "epoch": 0.553000006938141, "learning_rate": 8.18960559812879e-06, "loss": 2.994551696777344, "step": 458300 }, { "epoch": 0.5531206702606237, "learning_rate": 8.18920176266105e-06, "loss": 2.9993743896484375, "step": 458400 }, { "epoch": 0.5532413335831065, "learning_rate": 8.188797927193312e-06, "loss": 2.995627136230469, "step": 458500 }, { "epoch": 0.5533619969055891, "learning_rate": 8.188394091725574e-06, "loss": 3.0100048828125, "step": 458600 }, { "epoch": 0.5534826602280718, "learning_rate": 8.187990256257836e-06, "loss": 3.0135394287109376, "step": 458700 }, { "epoch": 0.5536033235505544, "learning_rate": 8.187586420790098e-06, "loss": 3.0050653076171874, "step": 458800 }, { "epoch": 0.5537239868730371, "learning_rate": 8.187182585322358e-06, "loss": 2.998879699707031, "step": 458900 }, { "epoch": 0.5538446501955199, "learning_rate": 8.18677874985462e-06, "loss": 3.0019467163085936, "step": 459000 }, { "epoch": 0.5539653135180025, "learning_rate": 8.186374914386882e-06, "loss": 2.9818710327148437, "step": 459100 }, { "epoch": 0.5540859768404852, "learning_rate": 8.185971078919142e-06, "loss": 3.015633544921875, "step": 459200 }, { "epoch": 0.5542066401629678, "learning_rate": 8.185567243451404e-06, "loss": 2.962353515625, "step": 459300 }, { "epoch": 0.5543273034854506, "learning_rate": 8.185163407983666e-06, "loss": 3.020951232910156, "step": 459400 }, { "epoch": 0.5544479668079333, "learning_rate": 8.184759572515928e-06, "loss": 2.986156005859375, "step": 459500 }, { "epoch": 0.5545686301304159, "learning_rate": 8.18435573704819e-06, "loss": 2.994339599609375, "step": 459600 }, { "epoch": 0.5546892934528986, "learning_rate": 8.183951901580452e-06, "loss": 3.0034249877929686, "step": 459700 }, { "epoch": 0.5548099567753813, "learning_rate": 8.183548066112712e-06, "loss": 3.004940185546875, "step": 459800 }, { "epoch": 0.554930620097864, "learning_rate": 8.183144230644974e-06, "loss": 2.9959375, "step": 459900 }, { "epoch": 0.5550512834203467, "learning_rate": 8.182740395177236e-06, "loss": 3.0019882202148436, "step": 460000 }, { "epoch": 0.5551719467428293, "learning_rate": 8.182336559709497e-06, "loss": 2.9806918334960937, "step": 460100 }, { "epoch": 0.555292610065312, "learning_rate": 8.181932724241759e-06, "loss": 3.010456237792969, "step": 460200 }, { "epoch": 0.5554132733877947, "learning_rate": 8.18152888877402e-06, "loss": 3.018319396972656, "step": 460300 }, { "epoch": 0.5555339367102774, "learning_rate": 8.181125053306282e-06, "loss": 3.0150662231445313, "step": 460400 }, { "epoch": 0.5556546000327601, "learning_rate": 8.180721217838544e-06, "loss": 3.0147088623046874, "step": 460500 }, { "epoch": 0.5557752633552427, "learning_rate": 8.180317382370806e-06, "loss": 2.984632568359375, "step": 460600 }, { "epoch": 0.5558959266777255, "learning_rate": 8.179913546903068e-06, "loss": 3.0083657836914064, "step": 460700 }, { "epoch": 0.5560165900002082, "learning_rate": 8.179509711435329e-06, "loss": 2.98829833984375, "step": 460800 }, { "epoch": 0.5561372533226908, "learning_rate": 8.17910587596759e-06, "loss": 3.0026199340820314, "step": 460900 }, { "epoch": 0.5562579166451735, "learning_rate": 8.178702040499851e-06, "loss": 2.98964599609375, "step": 461000 }, { "epoch": 0.5563785799676562, "learning_rate": 8.178298205032113e-06, "loss": 2.9768099975585938, "step": 461100 }, { "epoch": 0.5564992432901389, "learning_rate": 8.177894369564375e-06, "loss": 3.0057339477539062, "step": 461200 }, { "epoch": 0.5566199066126216, "learning_rate": 8.177490534096637e-06, "loss": 3.015718688964844, "step": 461300 }, { "epoch": 0.5567405699351042, "learning_rate": 8.177086698628899e-06, "loss": 3.009690246582031, "step": 461400 }, { "epoch": 0.556861233257587, "learning_rate": 8.176682863161161e-06, "loss": 2.9791058349609374, "step": 461500 }, { "epoch": 0.5569818965800696, "learning_rate": 8.176279027693421e-06, "loss": 2.999722595214844, "step": 461600 }, { "epoch": 0.5571025599025523, "learning_rate": 8.175875192225683e-06, "loss": 3.000059814453125, "step": 461700 }, { "epoch": 0.557223223225035, "learning_rate": 8.175471356757945e-06, "loss": 3.0044793701171875, "step": 461800 }, { "epoch": 0.5573438865475177, "learning_rate": 8.175067521290207e-06, "loss": 3.0161895751953125, "step": 461900 }, { "epoch": 0.5574645498700004, "learning_rate": 8.174663685822467e-06, "loss": 2.9899432373046877, "step": 462000 }, { "epoch": 0.557585213192483, "learning_rate": 8.17425985035473e-06, "loss": 2.975271911621094, "step": 462100 }, { "epoch": 0.5577058765149657, "learning_rate": 8.173856014886991e-06, "loss": 3.000601501464844, "step": 462200 }, { "epoch": 0.5578265398374485, "learning_rate": 8.173452179419253e-06, "loss": 2.9855050659179687, "step": 462300 }, { "epoch": 0.5579472031599311, "learning_rate": 8.173048343951514e-06, "loss": 3.002107849121094, "step": 462400 }, { "epoch": 0.5580678664824138, "learning_rate": 8.172644508483776e-06, "loss": 3.0097360229492187, "step": 462500 }, { "epoch": 0.5581885298048964, "learning_rate": 8.172240673016038e-06, "loss": 3.001328430175781, "step": 462600 }, { "epoch": 0.5583091931273791, "learning_rate": 8.1718368375483e-06, "loss": 3.019193420410156, "step": 462700 }, { "epoch": 0.5584298564498619, "learning_rate": 8.171433002080562e-06, "loss": 2.9669720458984377, "step": 462800 }, { "epoch": 0.5585505197723445, "learning_rate": 8.171029166612824e-06, "loss": 3.005193786621094, "step": 462900 }, { "epoch": 0.5586711830948272, "learning_rate": 8.170625331145084e-06, "loss": 3.0114401245117186, "step": 463000 }, { "epoch": 0.5587918464173098, "learning_rate": 8.170221495677346e-06, "loss": 2.997593994140625, "step": 463100 }, { "epoch": 0.5589125097397926, "learning_rate": 8.169817660209608e-06, "loss": 3.00738037109375, "step": 463200 }, { "epoch": 0.5590331730622753, "learning_rate": 8.169413824741868e-06, "loss": 2.9959030151367188, "step": 463300 }, { "epoch": 0.5591538363847579, "learning_rate": 8.16900998927413e-06, "loss": 3.008182373046875, "step": 463400 }, { "epoch": 0.5592744997072406, "learning_rate": 8.168606153806392e-06, "loss": 2.9801837158203126, "step": 463500 }, { "epoch": 0.5593951630297233, "learning_rate": 8.168202318338654e-06, "loss": 3.0317446899414064, "step": 463600 }, { "epoch": 0.559515826352206, "learning_rate": 8.167798482870916e-06, "loss": 3.0086660766601563, "step": 463700 }, { "epoch": 0.5596364896746887, "learning_rate": 8.167394647403178e-06, "loss": 2.987573547363281, "step": 463800 }, { "epoch": 0.5597571529971713, "learning_rate": 8.166990811935438e-06, "loss": 3.0176132202148436, "step": 463900 }, { "epoch": 0.559877816319654, "learning_rate": 8.1665869764677e-06, "loss": 2.9872970581054688, "step": 464000 }, { "epoch": 0.5599984796421367, "learning_rate": 8.166183140999962e-06, "loss": 3.016565856933594, "step": 464100 }, { "epoch": 0.5601191429646194, "learning_rate": 8.165779305532223e-06, "loss": 3.0058441162109375, "step": 464200 }, { "epoch": 0.5602398062871021, "learning_rate": 8.165375470064485e-06, "loss": 3.0088265991210936, "step": 464300 }, { "epoch": 0.5603604696095847, "learning_rate": 8.164971634596747e-06, "loss": 2.96726806640625, "step": 464400 }, { "epoch": 0.5604811329320675, "learning_rate": 8.164567799129009e-06, "loss": 2.9828610229492187, "step": 464500 }, { "epoch": 0.5606017962545501, "learning_rate": 8.16416396366127e-06, "loss": 2.9877239990234377, "step": 464600 }, { "epoch": 0.5607224595770328, "learning_rate": 8.163760128193532e-06, "loss": 2.983226013183594, "step": 464700 }, { "epoch": 0.5608431228995155, "learning_rate": 8.163356292725794e-06, "loss": 2.9693008422851563, "step": 464800 }, { "epoch": 0.5609637862219982, "learning_rate": 8.162952457258055e-06, "loss": 3.003946533203125, "step": 464900 }, { "epoch": 0.5610844495444809, "learning_rate": 8.162548621790317e-06, "loss": 3.010050048828125, "step": 465000 }, { "epoch": 0.5612051128669635, "learning_rate": 8.162144786322577e-06, "loss": 2.9866204833984376, "step": 465100 }, { "epoch": 0.5613257761894462, "learning_rate": 8.161740950854839e-06, "loss": 3.003884582519531, "step": 465200 }, { "epoch": 0.561446439511929, "learning_rate": 8.161337115387101e-06, "loss": 2.975133361816406, "step": 465300 }, { "epoch": 0.5615671028344116, "learning_rate": 8.160933279919363e-06, "loss": 3.00321044921875, "step": 465400 }, { "epoch": 0.5616877661568943, "learning_rate": 8.160529444451625e-06, "loss": 2.9761087036132814, "step": 465500 }, { "epoch": 0.5618084294793769, "learning_rate": 8.160125608983887e-06, "loss": 2.9978091430664064, "step": 465600 }, { "epoch": 0.5619290928018597, "learning_rate": 8.159721773516147e-06, "loss": 2.985066223144531, "step": 465700 }, { "epoch": 0.5620497561243424, "learning_rate": 8.15931793804841e-06, "loss": 2.9695587158203125, "step": 465800 }, { "epoch": 0.562170419446825, "learning_rate": 8.158914102580671e-06, "loss": 2.9904751586914062, "step": 465900 }, { "epoch": 0.5622910827693077, "learning_rate": 8.158510267112933e-06, "loss": 2.987451171875, "step": 466000 }, { "epoch": 0.5624117460917905, "learning_rate": 8.158106431645193e-06, "loss": 2.9501666259765624, "step": 466100 }, { "epoch": 0.5625324094142731, "learning_rate": 8.157702596177455e-06, "loss": 2.9546029663085935, "step": 466200 }, { "epoch": 0.5626530727367558, "learning_rate": 8.157298760709717e-06, "loss": 2.993612976074219, "step": 466300 }, { "epoch": 0.5627737360592384, "learning_rate": 8.15689492524198e-06, "loss": 3.017295227050781, "step": 466400 }, { "epoch": 0.5628943993817211, "learning_rate": 8.15649108977424e-06, "loss": 3.006566162109375, "step": 466500 }, { "epoch": 0.5630150627042039, "learning_rate": 8.156087254306502e-06, "loss": 2.995247497558594, "step": 466600 }, { "epoch": 0.5631357260266865, "learning_rate": 8.155683418838764e-06, "loss": 2.965714111328125, "step": 466700 }, { "epoch": 0.5632563893491692, "learning_rate": 8.155279583371026e-06, "loss": 2.9988967895507814, "step": 466800 }, { "epoch": 0.5633770526716518, "learning_rate": 8.154875747903288e-06, "loss": 2.9797158813476563, "step": 466900 }, { "epoch": 0.5634977159941346, "learning_rate": 8.154471912435548e-06, "loss": 3.0074114990234375, "step": 467000 }, { "epoch": 0.5636183793166173, "learning_rate": 8.15406807696781e-06, "loss": 2.9966064453125, "step": 467100 }, { "epoch": 0.5637390426390999, "learning_rate": 8.153664241500072e-06, "loss": 3.0003421020507814, "step": 467200 }, { "epoch": 0.5638597059615826, "learning_rate": 8.153260406032332e-06, "loss": 2.9827456665039063, "step": 467300 }, { "epoch": 0.5639803692840653, "learning_rate": 8.152856570564594e-06, "loss": 3.0229400634765624, "step": 467400 }, { "epoch": 0.564101032606548, "learning_rate": 8.152452735096856e-06, "loss": 2.9976632690429685, "step": 467500 }, { "epoch": 0.5642216959290307, "learning_rate": 8.152048899629118e-06, "loss": 2.972752685546875, "step": 467600 }, { "epoch": 0.5643423592515133, "learning_rate": 8.15164506416138e-06, "loss": 3.000854797363281, "step": 467700 }, { "epoch": 0.564463022573996, "learning_rate": 8.151241228693642e-06, "loss": 2.971127624511719, "step": 467800 }, { "epoch": 0.5645836858964787, "learning_rate": 8.150837393225904e-06, "loss": 3.0021893310546877, "step": 467900 }, { "epoch": 0.5647043492189614, "learning_rate": 8.150433557758164e-06, "loss": 2.97356689453125, "step": 468000 }, { "epoch": 0.5648250125414441, "learning_rate": 8.150029722290426e-06, "loss": 3.009740905761719, "step": 468100 }, { "epoch": 0.5649456758639267, "learning_rate": 8.149625886822687e-06, "loss": 2.9869815063476564, "step": 468200 }, { "epoch": 0.5650663391864095, "learning_rate": 8.149222051354949e-06, "loss": 2.9912185668945312, "step": 468300 }, { "epoch": 0.5651870025088921, "learning_rate": 8.14881821588721e-06, "loss": 2.983764343261719, "step": 468400 }, { "epoch": 0.5653076658313748, "learning_rate": 8.148414380419473e-06, "loss": 2.9786697387695313, "step": 468500 }, { "epoch": 0.5654283291538575, "learning_rate": 8.148010544951735e-06, "loss": 2.9820037841796876, "step": 468600 }, { "epoch": 0.5655489924763402, "learning_rate": 8.147606709483997e-06, "loss": 2.9766241455078126, "step": 468700 }, { "epoch": 0.5656696557988229, "learning_rate": 8.147202874016259e-06, "loss": 2.991668395996094, "step": 468800 }, { "epoch": 0.5657903191213055, "learning_rate": 8.146799038548519e-06, "loss": 2.982549743652344, "step": 468900 }, { "epoch": 0.5659109824437882, "learning_rate": 8.14639520308078e-06, "loss": 2.9765692138671875, "step": 469000 }, { "epoch": 0.566031645766271, "learning_rate": 8.145991367613043e-06, "loss": 3.021697998046875, "step": 469100 }, { "epoch": 0.5661523090887536, "learning_rate": 8.145587532145303e-06, "loss": 2.99116455078125, "step": 469200 }, { "epoch": 0.5662729724112363, "learning_rate": 8.145183696677565e-06, "loss": 2.9649371337890624, "step": 469300 }, { "epoch": 0.5663936357337189, "learning_rate": 8.144779861209827e-06, "loss": 2.9671444702148437, "step": 469400 }, { "epoch": 0.5665142990562017, "learning_rate": 8.144376025742089e-06, "loss": 2.999248352050781, "step": 469500 }, { "epoch": 0.5666349623786844, "learning_rate": 8.143972190274351e-06, "loss": 2.952983093261719, "step": 469600 }, { "epoch": 0.566755625701167, "learning_rate": 8.143568354806613e-06, "loss": 2.973188781738281, "step": 469700 }, { "epoch": 0.5668762890236497, "learning_rate": 8.143164519338873e-06, "loss": 2.991272277832031, "step": 469800 }, { "epoch": 0.5669969523461323, "learning_rate": 8.142760683871135e-06, "loss": 2.96271240234375, "step": 469900 }, { "epoch": 0.5671176156686151, "learning_rate": 8.142356848403397e-06, "loss": 2.9962982177734374, "step": 470000 }, { "epoch": 0.5672382789910978, "learning_rate": 8.141953012935658e-06, "loss": 2.9819561767578127, "step": 470100 }, { "epoch": 0.5673589423135804, "learning_rate": 8.14154917746792e-06, "loss": 3.0018905639648437, "step": 470200 }, { "epoch": 0.5674796056360631, "learning_rate": 8.141145342000181e-06, "loss": 2.9827496337890627, "step": 470300 }, { "epoch": 0.5676002689585458, "learning_rate": 8.140741506532443e-06, "loss": 2.9602642822265626, "step": 470400 }, { "epoch": 0.5677209322810285, "learning_rate": 8.140337671064705e-06, "loss": 2.9945339965820312, "step": 470500 }, { "epoch": 0.5678415956035112, "learning_rate": 8.139933835596966e-06, "loss": 2.9567803955078125, "step": 470600 }, { "epoch": 0.5679622589259938, "learning_rate": 8.139530000129228e-06, "loss": 2.9850918579101564, "step": 470700 }, { "epoch": 0.5680829222484766, "learning_rate": 8.13912616466149e-06, "loss": 2.9919552612304687, "step": 470800 }, { "epoch": 0.5682035855709592, "learning_rate": 8.138722329193752e-06, "loss": 3.0009429931640623, "step": 470900 }, { "epoch": 0.5683242488934419, "learning_rate": 8.138318493726014e-06, "loss": 2.999633483886719, "step": 471000 }, { "epoch": 0.5684449122159246, "learning_rate": 8.137914658258274e-06, "loss": 2.994955749511719, "step": 471100 }, { "epoch": 0.5685655755384073, "learning_rate": 8.137510822790536e-06, "loss": 2.9888763427734375, "step": 471200 }, { "epoch": 0.56868623886089, "learning_rate": 8.137106987322798e-06, "loss": 2.994425964355469, "step": 471300 }, { "epoch": 0.5688069021833727, "learning_rate": 8.136703151855058e-06, "loss": 2.98322509765625, "step": 471400 }, { "epoch": 0.5689275655058553, "learning_rate": 8.13629931638732e-06, "loss": 2.9915762329101563, "step": 471500 }, { "epoch": 0.569048228828338, "learning_rate": 8.135895480919582e-06, "loss": 2.9823672485351564, "step": 471600 }, { "epoch": 0.5691688921508207, "learning_rate": 8.135491645451844e-06, "loss": 2.996954345703125, "step": 471700 }, { "epoch": 0.5692895554733034, "learning_rate": 8.135087809984106e-06, "loss": 2.9538153076171874, "step": 471800 }, { "epoch": 0.5694102187957861, "learning_rate": 8.134683974516368e-06, "loss": 2.9856658935546876, "step": 471900 }, { "epoch": 0.5695308821182687, "learning_rate": 8.134280139048628e-06, "loss": 2.98936279296875, "step": 472000 }, { "epoch": 0.5696515454407515, "learning_rate": 8.13387630358089e-06, "loss": 2.9860760498046877, "step": 472100 }, { "epoch": 0.5697722087632341, "learning_rate": 8.133472468113152e-06, "loss": 2.953877258300781, "step": 472200 }, { "epoch": 0.5698928720857168, "learning_rate": 8.133068632645413e-06, "loss": 2.9647430419921874, "step": 472300 }, { "epoch": 0.5700135354081995, "learning_rate": 8.132664797177675e-06, "loss": 2.9823434448242185, "step": 472400 }, { "epoch": 0.5701341987306822, "learning_rate": 8.132260961709937e-06, "loss": 2.963651428222656, "step": 472500 }, { "epoch": 0.5702548620531649, "learning_rate": 8.131857126242199e-06, "loss": 2.985428771972656, "step": 472600 }, { "epoch": 0.5703755253756475, "learning_rate": 8.13145329077446e-06, "loss": 2.963888854980469, "step": 472700 }, { "epoch": 0.5704961886981302, "learning_rate": 8.131049455306723e-06, "loss": 2.9848248291015627, "step": 472800 }, { "epoch": 0.570616852020613, "learning_rate": 8.130645619838985e-06, "loss": 2.960509948730469, "step": 472900 }, { "epoch": 0.5707375153430956, "learning_rate": 8.130241784371245e-06, "loss": 2.9915228271484375, "step": 473000 }, { "epoch": 0.5708581786655783, "learning_rate": 8.129837948903507e-06, "loss": 2.974735107421875, "step": 473100 }, { "epoch": 0.5709788419880609, "learning_rate": 8.129434113435767e-06, "loss": 2.97484375, "step": 473200 }, { "epoch": 0.5710995053105437, "learning_rate": 8.129030277968029e-06, "loss": 2.9823483276367186, "step": 473300 }, { "epoch": 0.5712201686330264, "learning_rate": 8.128626442500291e-06, "loss": 2.9506890869140623, "step": 473400 }, { "epoch": 0.571340831955509, "learning_rate": 8.128222607032553e-06, "loss": 2.9802865600585937, "step": 473500 }, { "epoch": 0.5714614952779917, "learning_rate": 8.127818771564815e-06, "loss": 2.993403015136719, "step": 473600 }, { "epoch": 0.5715821586004743, "learning_rate": 8.127414936097077e-06, "loss": 2.9807058715820314, "step": 473700 }, { "epoch": 0.5717028219229571, "learning_rate": 8.127011100629339e-06, "loss": 2.987046203613281, "step": 473800 }, { "epoch": 0.5718234852454398, "learning_rate": 8.1266072651616e-06, "loss": 2.991500244140625, "step": 473900 }, { "epoch": 0.5719441485679224, "learning_rate": 8.126203429693861e-06, "loss": 2.977865905761719, "step": 474000 }, { "epoch": 0.5720648118904051, "learning_rate": 8.125799594226123e-06, "loss": 2.9773330688476562, "step": 474100 }, { "epoch": 0.5721854752128878, "learning_rate": 8.125395758758384e-06, "loss": 2.970625915527344, "step": 474200 }, { "epoch": 0.5723061385353705, "learning_rate": 8.124991923290646e-06, "loss": 2.999735107421875, "step": 474300 }, { "epoch": 0.5724268018578532, "learning_rate": 8.124588087822908e-06, "loss": 3.0177960205078125, "step": 474400 }, { "epoch": 0.5725474651803358, "learning_rate": 8.12418425235517e-06, "loss": 2.975946044921875, "step": 474500 }, { "epoch": 0.5726681285028186, "learning_rate": 8.123780416887431e-06, "loss": 2.9703582763671874, "step": 474600 }, { "epoch": 0.5727887918253012, "learning_rate": 8.123376581419692e-06, "loss": 2.9667718505859373, "step": 474700 }, { "epoch": 0.5729094551477839, "learning_rate": 8.122972745951954e-06, "loss": 2.9742330932617187, "step": 474800 }, { "epoch": 0.5730301184702666, "learning_rate": 8.122568910484216e-06, "loss": 2.947726135253906, "step": 474900 }, { "epoch": 0.5731507817927493, "learning_rate": 8.122165075016478e-06, "loss": 2.9807330322265626, "step": 475000 }, { "epoch": 0.573271445115232, "learning_rate": 8.121761239548738e-06, "loss": 2.9854776000976564, "step": 475100 }, { "epoch": 0.5733921084377146, "learning_rate": 8.121357404081e-06, "loss": 2.954489440917969, "step": 475200 }, { "epoch": 0.5735127717601973, "learning_rate": 8.120953568613262e-06, "loss": 2.9779437255859373, "step": 475300 }, { "epoch": 0.57363343508268, "learning_rate": 8.120549733145524e-06, "loss": 2.9832638549804686, "step": 475400 }, { "epoch": 0.5737540984051627, "learning_rate": 8.120145897677784e-06, "loss": 2.9620635986328123, "step": 475500 }, { "epoch": 0.5738747617276454, "learning_rate": 8.119742062210046e-06, "loss": 2.987445983886719, "step": 475600 }, { "epoch": 0.573995425050128, "learning_rate": 8.119338226742308e-06, "loss": 2.9681301879882813, "step": 475700 }, { "epoch": 0.5741160883726107, "learning_rate": 8.11893439127457e-06, "loss": 2.9592779541015624, "step": 475800 }, { "epoch": 0.5742367516950935, "learning_rate": 8.118530555806832e-06, "loss": 2.9818679809570314, "step": 475900 }, { "epoch": 0.5743574150175761, "learning_rate": 8.118126720339094e-06, "loss": 3.0136920166015626, "step": 476000 }, { "epoch": 0.5744780783400588, "learning_rate": 8.117722884871354e-06, "loss": 2.9860235595703126, "step": 476100 }, { "epoch": 0.5745987416625414, "learning_rate": 8.117319049403616e-06, "loss": 2.96761962890625, "step": 476200 }, { "epoch": 0.5747194049850242, "learning_rate": 8.116915213935877e-06, "loss": 2.9663983154296876, "step": 476300 }, { "epoch": 0.5748400683075069, "learning_rate": 8.116511378468139e-06, "loss": 2.9492767333984373, "step": 476400 }, { "epoch": 0.5749607316299895, "learning_rate": 8.1161075430004e-06, "loss": 2.986912841796875, "step": 476500 }, { "epoch": 0.5750813949524722, "learning_rate": 8.115703707532663e-06, "loss": 2.9770361328125, "step": 476600 }, { "epoch": 0.575202058274955, "learning_rate": 8.115299872064925e-06, "loss": 2.9979034423828126, "step": 476700 }, { "epoch": 0.5753227215974376, "learning_rate": 8.114896036597187e-06, "loss": 2.969718017578125, "step": 476800 }, { "epoch": 0.5754433849199203, "learning_rate": 8.114492201129449e-06, "loss": 2.981287841796875, "step": 476900 }, { "epoch": 0.5755640482424029, "learning_rate": 8.11408836566171e-06, "loss": 2.987734680175781, "step": 477000 }, { "epoch": 0.5756847115648857, "learning_rate": 8.113684530193971e-06, "loss": 2.979698486328125, "step": 477100 }, { "epoch": 0.5758053748873684, "learning_rate": 8.113280694726233e-06, "loss": 2.964830017089844, "step": 477200 }, { "epoch": 0.575926038209851, "learning_rate": 8.112876859258493e-06, "loss": 2.9503338623046873, "step": 477300 }, { "epoch": 0.5760467015323337, "learning_rate": 8.112473023790755e-06, "loss": 2.9733847045898436, "step": 477400 }, { "epoch": 0.5761673648548163, "learning_rate": 8.112069188323017e-06, "loss": 2.9585009765625, "step": 477500 }, { "epoch": 0.5762880281772991, "learning_rate": 8.111665352855279e-06, "loss": 2.9824008178710937, "step": 477600 }, { "epoch": 0.5764086914997818, "learning_rate": 8.111261517387541e-06, "loss": 2.9772378540039064, "step": 477700 }, { "epoch": 0.5765293548222644, "learning_rate": 8.110857681919803e-06, "loss": 2.9740951538085936, "step": 477800 }, { "epoch": 0.5766500181447471, "learning_rate": 8.110453846452063e-06, "loss": 2.993214111328125, "step": 477900 }, { "epoch": 0.5767706814672298, "learning_rate": 8.110050010984325e-06, "loss": 2.977830810546875, "step": 478000 }, { "epoch": 0.5768913447897125, "learning_rate": 8.109646175516587e-06, "loss": 2.972706604003906, "step": 478100 }, { "epoch": 0.5770120081121952, "learning_rate": 8.10924234004885e-06, "loss": 2.981258544921875, "step": 478200 }, { "epoch": 0.5771326714346778, "learning_rate": 8.10883850458111e-06, "loss": 2.9657022094726564, "step": 478300 }, { "epoch": 0.5772533347571606, "learning_rate": 8.108434669113372e-06, "loss": 2.989014892578125, "step": 478400 }, { "epoch": 0.5773739980796432, "learning_rate": 8.108030833645634e-06, "loss": 2.974716796875, "step": 478500 }, { "epoch": 0.5774946614021259, "learning_rate": 8.107626998177896e-06, "loss": 2.9836196899414062, "step": 478600 }, { "epoch": 0.5776153247246086, "learning_rate": 8.107223162710158e-06, "loss": 2.9681552124023436, "step": 478700 }, { "epoch": 0.5777359880470913, "learning_rate": 8.106819327242418e-06, "loss": 3.008946838378906, "step": 478800 }, { "epoch": 0.577856651369574, "learning_rate": 8.10641549177468e-06, "loss": 2.9639816284179688, "step": 478900 }, { "epoch": 0.5779773146920566, "learning_rate": 8.106011656306942e-06, "loss": 2.9923004150390624, "step": 479000 }, { "epoch": 0.5780979780145393, "learning_rate": 8.105607820839204e-06, "loss": 2.9615414428710936, "step": 479100 }, { "epoch": 0.578218641337022, "learning_rate": 8.105203985371464e-06, "loss": 2.9481521606445313, "step": 479200 }, { "epoch": 0.5783393046595047, "learning_rate": 8.104800149903726e-06, "loss": 2.965667724609375, "step": 479300 }, { "epoch": 0.5784599679819874, "learning_rate": 8.104396314435988e-06, "loss": 2.981436462402344, "step": 479400 }, { "epoch": 0.57858063130447, "learning_rate": 8.10399247896825e-06, "loss": 2.9828228759765625, "step": 479500 }, { "epoch": 0.5787012946269527, "learning_rate": 8.10358864350051e-06, "loss": 2.96062744140625, "step": 479600 }, { "epoch": 0.5788219579494355, "learning_rate": 8.103184808032772e-06, "loss": 2.956165771484375, "step": 479700 }, { "epoch": 0.5789426212719181, "learning_rate": 8.102780972565034e-06, "loss": 2.9961224365234376, "step": 479800 }, { "epoch": 0.5790632845944008, "learning_rate": 8.102377137097296e-06, "loss": 2.9412493896484375, "step": 479900 }, { "epoch": 0.5791839479168834, "learning_rate": 8.101973301629558e-06, "loss": 2.9621832275390627, "step": 480000 }, { "epoch": 0.5793046112393662, "learning_rate": 8.10156946616182e-06, "loss": 2.9854931640625, "step": 480100 }, { "epoch": 0.5794252745618489, "learning_rate": 8.10116563069408e-06, "loss": 2.9970028686523436, "step": 480200 }, { "epoch": 0.5795459378843315, "learning_rate": 8.100761795226342e-06, "loss": 2.9552850341796875, "step": 480300 }, { "epoch": 0.5796666012068142, "learning_rate": 8.100357959758603e-06, "loss": 2.9902328491210937, "step": 480400 }, { "epoch": 0.5797872645292969, "learning_rate": 8.099954124290865e-06, "loss": 2.961526184082031, "step": 480500 }, { "epoch": 0.5799079278517796, "learning_rate": 8.099550288823127e-06, "loss": 2.9639349365234375, "step": 480600 }, { "epoch": 0.5800285911742623, "learning_rate": 8.099146453355389e-06, "loss": 2.966573486328125, "step": 480700 }, { "epoch": 0.5801492544967449, "learning_rate": 8.09874261788765e-06, "loss": 2.9636276245117186, "step": 480800 }, { "epoch": 0.5802699178192277, "learning_rate": 8.098338782419913e-06, "loss": 2.952803649902344, "step": 480900 }, { "epoch": 0.5803905811417103, "learning_rate": 8.097934946952175e-06, "loss": 2.9921038818359373, "step": 481000 }, { "epoch": 0.580511244464193, "learning_rate": 8.097531111484435e-06, "loss": 2.9870700073242187, "step": 481100 }, { "epoch": 0.5806319077866757, "learning_rate": 8.097127276016697e-06, "loss": 2.9667413330078123, "step": 481200 }, { "epoch": 0.5807525711091583, "learning_rate": 8.096723440548959e-06, "loss": 2.9679583740234374, "step": 481300 }, { "epoch": 0.5808732344316411, "learning_rate": 8.09631960508122e-06, "loss": 2.97364990234375, "step": 481400 }, { "epoch": 0.5809938977541237, "learning_rate": 8.095915769613481e-06, "loss": 2.98238037109375, "step": 481500 }, { "epoch": 0.5811145610766064, "learning_rate": 8.095511934145743e-06, "loss": 2.977811279296875, "step": 481600 }, { "epoch": 0.5812352243990891, "learning_rate": 8.095108098678005e-06, "loss": 2.983026428222656, "step": 481700 }, { "epoch": 0.5813558877215718, "learning_rate": 8.094704263210267e-06, "loss": 2.982837829589844, "step": 481800 }, { "epoch": 0.5814765510440545, "learning_rate": 8.094300427742529e-06, "loss": 2.9884658813476563, "step": 481900 }, { "epoch": 0.5815972143665372, "learning_rate": 8.09389659227479e-06, "loss": 2.9661550903320313, "step": 482000 }, { "epoch": 0.5817178776890198, "learning_rate": 8.093492756807051e-06, "loss": 2.973033752441406, "step": 482100 }, { "epoch": 0.5818385410115026, "learning_rate": 8.093088921339313e-06, "loss": 2.973619384765625, "step": 482200 }, { "epoch": 0.5819592043339852, "learning_rate": 8.092685085871574e-06, "loss": 2.9707208251953126, "step": 482300 }, { "epoch": 0.5820798676564679, "learning_rate": 8.092281250403836e-06, "loss": 2.9651748657226564, "step": 482400 }, { "epoch": 0.5822005309789506, "learning_rate": 8.091877414936098e-06, "loss": 2.949432678222656, "step": 482500 }, { "epoch": 0.5823211943014333, "learning_rate": 8.09147357946836e-06, "loss": 2.9793191528320313, "step": 482600 }, { "epoch": 0.582441857623916, "learning_rate": 8.091069744000622e-06, "loss": 2.9813580322265625, "step": 482700 }, { "epoch": 0.5825625209463986, "learning_rate": 8.090665908532882e-06, "loss": 2.961824951171875, "step": 482800 }, { "epoch": 0.5826831842688813, "learning_rate": 8.090262073065144e-06, "loss": 2.9605416870117187, "step": 482900 }, { "epoch": 0.582803847591364, "learning_rate": 8.089858237597406e-06, "loss": 2.952781066894531, "step": 483000 }, { "epoch": 0.5829245109138467, "learning_rate": 8.089454402129668e-06, "loss": 2.9838186645507814, "step": 483100 }, { "epoch": 0.5830451742363294, "learning_rate": 8.08905056666193e-06, "loss": 2.982503662109375, "step": 483200 }, { "epoch": 0.583165837558812, "learning_rate": 8.08864673119419e-06, "loss": 2.9656787109375, "step": 483300 }, { "epoch": 0.5832865008812947, "learning_rate": 8.088242895726452e-06, "loss": 2.9740997314453126, "step": 483400 }, { "epoch": 0.5834071642037775, "learning_rate": 8.087839060258714e-06, "loss": 2.984513854980469, "step": 483500 }, { "epoch": 0.5835278275262601, "learning_rate": 8.087435224790974e-06, "loss": 2.9776446533203127, "step": 483600 }, { "epoch": 0.5836484908487428, "learning_rate": 8.087031389323236e-06, "loss": 2.9530511474609376, "step": 483700 }, { "epoch": 0.5837691541712254, "learning_rate": 8.086627553855498e-06, "loss": 2.9732745361328123, "step": 483800 }, { "epoch": 0.5838898174937082, "learning_rate": 8.08622371838776e-06, "loss": 2.9666485595703125, "step": 483900 }, { "epoch": 0.5840104808161909, "learning_rate": 8.085819882920022e-06, "loss": 2.9661984252929687, "step": 484000 }, { "epoch": 0.5841311441386735, "learning_rate": 8.085416047452284e-06, "loss": 2.9630029296875, "step": 484100 }, { "epoch": 0.5842518074611562, "learning_rate": 8.085012211984545e-06, "loss": 2.9773654174804687, "step": 484200 }, { "epoch": 0.5843724707836389, "learning_rate": 8.084608376516807e-06, "loss": 2.96956298828125, "step": 484300 }, { "epoch": 0.5844931341061216, "learning_rate": 8.084204541049069e-06, "loss": 2.9580194091796876, "step": 484400 }, { "epoch": 0.5846137974286043, "learning_rate": 8.083800705581329e-06, "loss": 2.9955279541015627, "step": 484500 }, { "epoch": 0.5847344607510869, "learning_rate": 8.08339687011359e-06, "loss": 2.9667892456054688, "step": 484600 }, { "epoch": 0.5848551240735697, "learning_rate": 8.082993034645853e-06, "loss": 2.9837551879882813, "step": 484700 }, { "epoch": 0.5849757873960523, "learning_rate": 8.082589199178115e-06, "loss": 2.9466522216796873, "step": 484800 }, { "epoch": 0.585096450718535, "learning_rate": 8.082185363710377e-06, "loss": 2.9726937866210936, "step": 484900 }, { "epoch": 0.5852171140410177, "learning_rate": 8.081781528242639e-06, "loss": 2.9689227294921876, "step": 485000 }, { "epoch": 0.5853377773635003, "learning_rate": 8.0813776927749e-06, "loss": 2.944732971191406, "step": 485100 }, { "epoch": 0.5854584406859831, "learning_rate": 8.080973857307161e-06, "loss": 2.9782815551757813, "step": 485200 }, { "epoch": 0.5855791040084657, "learning_rate": 8.080570021839423e-06, "loss": 2.9612307739257813, "step": 485300 }, { "epoch": 0.5856997673309484, "learning_rate": 8.080166186371683e-06, "loss": 2.940147705078125, "step": 485400 }, { "epoch": 0.5858204306534311, "learning_rate": 8.079762350903945e-06, "loss": 2.9731491088867186, "step": 485500 }, { "epoch": 0.5859410939759138, "learning_rate": 8.079358515436207e-06, "loss": 2.9864181518554687, "step": 485600 }, { "epoch": 0.5860617572983965, "learning_rate": 8.07895467996847e-06, "loss": 2.982764892578125, "step": 485700 }, { "epoch": 0.5861824206208791, "learning_rate": 8.078550844500731e-06, "loss": 2.941102294921875, "step": 485800 }, { "epoch": 0.5863030839433618, "learning_rate": 8.078147009032993e-06, "loss": 2.9511947631835938, "step": 485900 }, { "epoch": 0.5864237472658446, "learning_rate": 8.077743173565255e-06, "loss": 2.9434832763671874, "step": 486000 }, { "epoch": 0.5865444105883272, "learning_rate": 8.077339338097515e-06, "loss": 2.9721939086914064, "step": 486100 }, { "epoch": 0.5866650739108099, "learning_rate": 8.076935502629777e-06, "loss": 2.963254699707031, "step": 486200 }, { "epoch": 0.5867857372332925, "learning_rate": 8.07653166716204e-06, "loss": 2.9630078125, "step": 486300 }, { "epoch": 0.5869064005557753, "learning_rate": 8.0761278316943e-06, "loss": 2.9865576171875, "step": 486400 }, { "epoch": 0.587027063878258, "learning_rate": 8.075723996226562e-06, "loss": 2.9787857055664064, "step": 486500 }, { "epoch": 0.5871477272007406, "learning_rate": 8.075320160758824e-06, "loss": 2.9784112548828126, "step": 486600 }, { "epoch": 0.5872683905232233, "learning_rate": 8.074916325291086e-06, "loss": 2.9550482177734376, "step": 486700 }, { "epoch": 0.587389053845706, "learning_rate": 8.074512489823348e-06, "loss": 2.967176818847656, "step": 486800 }, { "epoch": 0.5875097171681887, "learning_rate": 8.074108654355608e-06, "loss": 2.9666311645507815, "step": 486900 }, { "epoch": 0.5876303804906714, "learning_rate": 8.07370481888787e-06, "loss": 2.939674072265625, "step": 487000 }, { "epoch": 0.587751043813154, "learning_rate": 8.073300983420132e-06, "loss": 2.9351376342773436, "step": 487100 }, { "epoch": 0.5878717071356367, "learning_rate": 8.072897147952394e-06, "loss": 2.9677545166015626, "step": 487200 }, { "epoch": 0.5879923704581195, "learning_rate": 8.072493312484654e-06, "loss": 2.9541204833984374, "step": 487300 }, { "epoch": 0.5881130337806021, "learning_rate": 8.072089477016916e-06, "loss": 2.957548828125, "step": 487400 }, { "epoch": 0.5882336971030848, "learning_rate": 8.071685641549178e-06, "loss": 2.9496249389648437, "step": 487500 }, { "epoch": 0.5883543604255674, "learning_rate": 8.07128180608144e-06, "loss": 2.9719998168945314, "step": 487600 }, { "epoch": 0.5884750237480502, "learning_rate": 8.0708779706137e-06, "loss": 2.9489666748046877, "step": 487700 }, { "epoch": 0.5885956870705329, "learning_rate": 8.070474135145962e-06, "loss": 2.9749627685546876, "step": 487800 }, { "epoch": 0.5887163503930155, "learning_rate": 8.070070299678224e-06, "loss": 2.96795166015625, "step": 487900 }, { "epoch": 0.5888370137154982, "learning_rate": 8.069666464210486e-06, "loss": 2.968385009765625, "step": 488000 }, { "epoch": 0.5889576770379809, "learning_rate": 8.069262628742748e-06, "loss": 2.9446173095703125, "step": 488100 }, { "epoch": 0.5890783403604636, "learning_rate": 8.06885879327501e-06, "loss": 2.942460632324219, "step": 488200 }, { "epoch": 0.5891990036829463, "learning_rate": 8.06845495780727e-06, "loss": 2.9851751708984375, "step": 488300 }, { "epoch": 0.5893196670054289, "learning_rate": 8.068051122339533e-06, "loss": 2.988564453125, "step": 488400 }, { "epoch": 0.5894403303279117, "learning_rate": 8.067647286871793e-06, "loss": 2.958942565917969, "step": 488500 }, { "epoch": 0.5895609936503943, "learning_rate": 8.067243451404055e-06, "loss": 2.9633984375, "step": 488600 }, { "epoch": 0.589681656972877, "learning_rate": 8.066839615936317e-06, "loss": 2.9610614013671874, "step": 488700 }, { "epoch": 0.5898023202953597, "learning_rate": 8.066435780468579e-06, "loss": 2.9576141357421877, "step": 488800 }, { "epoch": 0.5899229836178423, "learning_rate": 8.06603194500084e-06, "loss": 2.9549810791015627, "step": 488900 }, { "epoch": 0.5900436469403251, "learning_rate": 8.065628109533103e-06, "loss": 2.9668426513671875, "step": 489000 }, { "epoch": 0.5901643102628077, "learning_rate": 8.065224274065365e-06, "loss": 2.9712603759765623, "step": 489100 }, { "epoch": 0.5902849735852904, "learning_rate": 8.064820438597625e-06, "loss": 2.960770263671875, "step": 489200 }, { "epoch": 0.5904056369077731, "learning_rate": 8.064416603129887e-06, "loss": 2.9565350341796877, "step": 489300 }, { "epoch": 0.5905263002302558, "learning_rate": 8.064012767662149e-06, "loss": 2.9616189575195313, "step": 489400 }, { "epoch": 0.5906469635527385, "learning_rate": 8.06360893219441e-06, "loss": 2.97448974609375, "step": 489500 }, { "epoch": 0.5907676268752211, "learning_rate": 8.063205096726671e-06, "loss": 2.9743618774414062, "step": 489600 }, { "epoch": 0.5908882901977038, "learning_rate": 8.062801261258933e-06, "loss": 2.9766690063476564, "step": 489700 }, { "epoch": 0.5910089535201866, "learning_rate": 8.062397425791195e-06, "loss": 2.9721905517578127, "step": 489800 }, { "epoch": 0.5911296168426692, "learning_rate": 8.061993590323457e-06, "loss": 2.9808489990234377, "step": 489900 }, { "epoch": 0.5912502801651519, "learning_rate": 8.06158975485572e-06, "loss": 2.945633544921875, "step": 490000 }, { "epoch": 0.5913709434876345, "learning_rate": 8.061185919387981e-06, "loss": 2.958897705078125, "step": 490100 }, { "epoch": 0.5914916068101173, "learning_rate": 8.060782083920241e-06, "loss": 2.9526596069335938, "step": 490200 }, { "epoch": 0.5916122701326, "learning_rate": 8.060378248452503e-06, "loss": 2.95847900390625, "step": 490300 }, { "epoch": 0.5917329334550826, "learning_rate": 8.059974412984764e-06, "loss": 2.9596591186523438, "step": 490400 }, { "epoch": 0.5918535967775653, "learning_rate": 8.059570577517026e-06, "loss": 2.944175109863281, "step": 490500 }, { "epoch": 0.5919742601000479, "learning_rate": 8.059166742049288e-06, "loss": 2.9776235961914064, "step": 490600 }, { "epoch": 0.5920949234225307, "learning_rate": 8.05876290658155e-06, "loss": 2.960718688964844, "step": 490700 }, { "epoch": 0.5922155867450134, "learning_rate": 8.058359071113812e-06, "loss": 2.976762390136719, "step": 490800 }, { "epoch": 0.592336250067496, "learning_rate": 8.057955235646074e-06, "loss": 2.96544677734375, "step": 490900 }, { "epoch": 0.5924569133899787, "learning_rate": 8.057551400178334e-06, "loss": 2.9486407470703124, "step": 491000 }, { "epoch": 0.5925775767124614, "learning_rate": 8.057147564710596e-06, "loss": 2.938033447265625, "step": 491100 }, { "epoch": 0.5926982400349441, "learning_rate": 8.056743729242858e-06, "loss": 2.949468688964844, "step": 491200 }, { "epoch": 0.5928189033574268, "learning_rate": 8.05633989377512e-06, "loss": 2.925229797363281, "step": 491300 }, { "epoch": 0.5929395666799094, "learning_rate": 8.05593605830738e-06, "loss": 2.943150939941406, "step": 491400 }, { "epoch": 0.5930602300023922, "learning_rate": 8.055532222839642e-06, "loss": 2.9539303588867187, "step": 491500 }, { "epoch": 0.5931808933248748, "learning_rate": 8.055128387371904e-06, "loss": 2.9391903686523437, "step": 491600 }, { "epoch": 0.5933015566473575, "learning_rate": 8.054724551904166e-06, "loss": 2.9569131469726564, "step": 491700 }, { "epoch": 0.5934222199698402, "learning_rate": 8.054320716436426e-06, "loss": 2.966691589355469, "step": 491800 }, { "epoch": 0.5935428832923229, "learning_rate": 8.053916880968688e-06, "loss": 2.988161926269531, "step": 491900 }, { "epoch": 0.5936635466148056, "learning_rate": 8.05351304550095e-06, "loss": 2.943126525878906, "step": 492000 }, { "epoch": 0.5937842099372883, "learning_rate": 8.053109210033212e-06, "loss": 2.9560235595703124, "step": 492100 }, { "epoch": 0.5939048732597709, "learning_rate": 8.052705374565474e-06, "loss": 2.952505798339844, "step": 492200 }, { "epoch": 0.5940255365822537, "learning_rate": 8.052301539097736e-06, "loss": 2.96342529296875, "step": 492300 }, { "epoch": 0.5941461999047363, "learning_rate": 8.051897703629997e-06, "loss": 2.9526077270507813, "step": 492400 }, { "epoch": 0.594266863227219, "learning_rate": 8.051493868162259e-06, "loss": 2.992037048339844, "step": 492500 }, { "epoch": 0.5943875265497017, "learning_rate": 8.051090032694519e-06, "loss": 2.9615869140625, "step": 492600 }, { "epoch": 0.5945081898721843, "learning_rate": 8.050686197226781e-06, "loss": 2.97475830078125, "step": 492700 }, { "epoch": 0.5946288531946671, "learning_rate": 8.050282361759043e-06, "loss": 2.9530374145507814, "step": 492800 }, { "epoch": 0.5947495165171497, "learning_rate": 8.049878526291305e-06, "loss": 2.95875732421875, "step": 492900 }, { "epoch": 0.5948701798396324, "learning_rate": 8.049474690823567e-06, "loss": 2.9713275146484377, "step": 493000 }, { "epoch": 0.5949908431621151, "learning_rate": 8.049070855355829e-06, "loss": 2.9611590576171873, "step": 493100 }, { "epoch": 0.5951115064845978, "learning_rate": 8.04866701988809e-06, "loss": 2.96239013671875, "step": 493200 }, { "epoch": 0.5952321698070805, "learning_rate": 8.048263184420351e-06, "loss": 2.9204086303710937, "step": 493300 }, { "epoch": 0.5953528331295631, "learning_rate": 8.047859348952613e-06, "loss": 2.963445129394531, "step": 493400 }, { "epoch": 0.5954734964520458, "learning_rate": 8.047455513484875e-06, "loss": 2.952359924316406, "step": 493500 }, { "epoch": 0.5955941597745286, "learning_rate": 8.047051678017135e-06, "loss": 2.947237243652344, "step": 493600 }, { "epoch": 0.5957148230970112, "learning_rate": 8.046647842549397e-06, "loss": 2.94197021484375, "step": 493700 }, { "epoch": 0.5958354864194939, "learning_rate": 8.04624400708166e-06, "loss": 2.962818603515625, "step": 493800 }, { "epoch": 0.5959561497419765, "learning_rate": 8.045840171613921e-06, "loss": 2.9547216796875, "step": 493900 }, { "epoch": 0.5960768130644593, "learning_rate": 8.045436336146183e-06, "loss": 2.9487380981445312, "step": 494000 }, { "epoch": 0.596197476386942, "learning_rate": 8.045032500678445e-06, "loss": 2.9525277709960935, "step": 494100 }, { "epoch": 0.5963181397094246, "learning_rate": 8.044628665210707e-06, "loss": 2.9557479858398437, "step": 494200 }, { "epoch": 0.5964388030319073, "learning_rate": 8.044224829742967e-06, "loss": 2.96691650390625, "step": 494300 }, { "epoch": 0.59655946635439, "learning_rate": 8.04382099427523e-06, "loss": 2.9398138427734377, "step": 494400 }, { "epoch": 0.5966801296768727, "learning_rate": 8.04341715880749e-06, "loss": 2.93875732421875, "step": 494500 }, { "epoch": 0.5968007929993554, "learning_rate": 8.043013323339752e-06, "loss": 2.964020080566406, "step": 494600 }, { "epoch": 0.596921456321838, "learning_rate": 8.042609487872014e-06, "loss": 2.9571539306640626, "step": 494700 }, { "epoch": 0.5970421196443207, "learning_rate": 8.042205652404276e-06, "loss": 2.975044860839844, "step": 494800 }, { "epoch": 0.5971627829668034, "learning_rate": 8.041801816936538e-06, "loss": 2.965111083984375, "step": 494900 }, { "epoch": 0.5972834462892861, "learning_rate": 8.0413979814688e-06, "loss": 2.9459494018554686, "step": 495000 }, { "epoch": 0.5974041096117688, "learning_rate": 8.04099414600106e-06, "loss": 2.9387896728515623, "step": 495100 }, { "epoch": 0.5975247729342514, "learning_rate": 8.040590310533322e-06, "loss": 2.9479049682617187, "step": 495200 }, { "epoch": 0.5976454362567342, "learning_rate": 8.040186475065584e-06, "loss": 2.9441293334960936, "step": 495300 }, { "epoch": 0.5977660995792168, "learning_rate": 8.039782639597846e-06, "loss": 2.9364984130859373, "step": 495400 }, { "epoch": 0.5978867629016995, "learning_rate": 8.039378804130106e-06, "loss": 2.920135803222656, "step": 495500 }, { "epoch": 0.5980074262241822, "learning_rate": 8.038974968662368e-06, "loss": 2.9691693115234377, "step": 495600 }, { "epoch": 0.5981280895466649, "learning_rate": 8.03857113319463e-06, "loss": 2.9268438720703127, "step": 495700 }, { "epoch": 0.5982487528691476, "learning_rate": 8.038167297726892e-06, "loss": 2.954842834472656, "step": 495800 }, { "epoch": 0.5983694161916302, "learning_rate": 8.037763462259152e-06, "loss": 2.9568231201171873, "step": 495900 }, { "epoch": 0.5984900795141129, "learning_rate": 8.037359626791414e-06, "loss": 2.9504180908203126, "step": 496000 }, { "epoch": 0.5986107428365957, "learning_rate": 8.036955791323676e-06, "loss": 2.93613525390625, "step": 496100 }, { "epoch": 0.5987314061590783, "learning_rate": 8.036551955855938e-06, "loss": 2.949007568359375, "step": 496200 }, { "epoch": 0.598852069481561, "learning_rate": 8.0361481203882e-06, "loss": 2.962759704589844, "step": 496300 }, { "epoch": 0.5989727328040436, "learning_rate": 8.03574428492046e-06, "loss": 2.958729553222656, "step": 496400 }, { "epoch": 0.5990933961265263, "learning_rate": 8.035340449452723e-06, "loss": 2.9451922607421874, "step": 496500 }, { "epoch": 0.5992140594490091, "learning_rate": 8.034936613984985e-06, "loss": 2.956802978515625, "step": 496600 }, { "epoch": 0.5993347227714917, "learning_rate": 8.034532778517245e-06, "loss": 2.9515606689453127, "step": 496700 }, { "epoch": 0.5994553860939744, "learning_rate": 8.034128943049507e-06, "loss": 2.962585144042969, "step": 496800 }, { "epoch": 0.599576049416457, "learning_rate": 8.033725107581769e-06, "loss": 2.9377703857421875, "step": 496900 }, { "epoch": 0.5996967127389398, "learning_rate": 8.033321272114031e-06, "loss": 2.9345822143554687, "step": 497000 }, { "epoch": 0.5998173760614225, "learning_rate": 8.032917436646293e-06, "loss": 2.9454769897460937, "step": 497100 }, { "epoch": 0.5999380393839051, "learning_rate": 8.032513601178555e-06, "loss": 2.972662353515625, "step": 497200 }, { "epoch": 0.6000587027063878, "learning_rate": 8.032109765710817e-06, "loss": 2.954279479980469, "step": 497300 }, { "epoch": 0.6001793660288706, "learning_rate": 8.031705930243077e-06, "loss": 2.928613586425781, "step": 497400 }, { "epoch": 0.6003000293513532, "learning_rate": 8.031302094775339e-06, "loss": 2.937383728027344, "step": 497500 }, { "epoch": 0.6004206926738359, "learning_rate": 8.0308982593076e-06, "loss": 2.954742736816406, "step": 497600 }, { "epoch": 0.6005413559963185, "learning_rate": 8.030494423839861e-06, "loss": 2.9312362670898438, "step": 497700 }, { "epoch": 0.6006620193188013, "learning_rate": 8.030090588372123e-06, "loss": 2.9541384887695314, "step": 497800 }, { "epoch": 0.600782682641284, "learning_rate": 8.029686752904385e-06, "loss": 2.959463806152344, "step": 497900 }, { "epoch": 0.6009033459637666, "learning_rate": 8.029282917436647e-06, "loss": 2.927001953125, "step": 498000 }, { "epoch": 0.6010240092862493, "learning_rate": 8.02887908196891e-06, "loss": 2.9707293701171875, "step": 498100 }, { "epoch": 0.601144672608732, "learning_rate": 8.028475246501171e-06, "loss": 2.944581298828125, "step": 498200 }, { "epoch": 0.6012653359312147, "learning_rate": 8.028071411033432e-06, "loss": 2.954312438964844, "step": 498300 }, { "epoch": 0.6013859992536974, "learning_rate": 8.027667575565694e-06, "loss": 2.9526156616210937, "step": 498400 }, { "epoch": 0.60150666257618, "learning_rate": 8.027263740097956e-06, "loss": 2.949285583496094, "step": 498500 }, { "epoch": 0.6016273258986627, "learning_rate": 8.026859904630216e-06, "loss": 2.980736083984375, "step": 498600 }, { "epoch": 0.6017479892211454, "learning_rate": 8.026456069162478e-06, "loss": 2.949732360839844, "step": 498700 }, { "epoch": 0.6018686525436281, "learning_rate": 8.02605223369474e-06, "loss": 2.9579483032226563, "step": 498800 }, { "epoch": 0.6019893158661108, "learning_rate": 8.025648398227002e-06, "loss": 2.972672424316406, "step": 498900 }, { "epoch": 0.6021099791885934, "learning_rate": 8.025244562759264e-06, "loss": 2.952484436035156, "step": 499000 }, { "epoch": 0.6022306425110762, "learning_rate": 8.024840727291524e-06, "loss": 2.9228143310546875, "step": 499100 }, { "epoch": 0.6023513058335588, "learning_rate": 8.024436891823786e-06, "loss": 2.9677297973632815, "step": 499200 }, { "epoch": 0.6024719691560415, "learning_rate": 8.024033056356048e-06, "loss": 2.968966064453125, "step": 499300 }, { "epoch": 0.6025926324785242, "learning_rate": 8.02362922088831e-06, "loss": 2.9369766235351564, "step": 499400 }, { "epoch": 0.6027132958010069, "learning_rate": 8.02322538542057e-06, "loss": 2.92471435546875, "step": 499500 }, { "epoch": 0.6028339591234896, "learning_rate": 8.022821549952832e-06, "loss": 2.9405337524414064, "step": 499600 }, { "epoch": 0.6029546224459722, "learning_rate": 8.022417714485094e-06, "loss": 2.9437945556640623, "step": 499700 }, { "epoch": 0.6030752857684549, "learning_rate": 8.022013879017356e-06, "loss": 2.9274481201171874, "step": 499800 }, { "epoch": 0.6031959490909377, "learning_rate": 8.021610043549618e-06, "loss": 2.9407730102539062, "step": 499900 }, { "epoch": 0.6033166124134203, "learning_rate": 8.021206208081878e-06, "loss": 2.942716369628906, "step": 500000 }, { "epoch": 0.603437275735903, "learning_rate": 8.02080237261414e-06, "loss": 2.9249346923828123, "step": 500100 }, { "epoch": 0.6035579390583856, "learning_rate": 8.020398537146402e-06, "loss": 2.9676077270507815, "step": 500200 }, { "epoch": 0.6036786023808683, "learning_rate": 8.019994701678664e-06, "loss": 2.953896179199219, "step": 500300 }, { "epoch": 0.6037992657033511, "learning_rate": 8.019590866210926e-06, "loss": 2.9350482177734376, "step": 500400 }, { "epoch": 0.6039199290258337, "learning_rate": 8.019187030743187e-06, "loss": 2.953463134765625, "step": 500500 }, { "epoch": 0.6040405923483164, "learning_rate": 8.018783195275449e-06, "loss": 2.969024658203125, "step": 500600 }, { "epoch": 0.604161255670799, "learning_rate": 8.01837935980771e-06, "loss": 2.936881103515625, "step": 500700 }, { "epoch": 0.6042819189932818, "learning_rate": 8.017975524339971e-06, "loss": 2.9495361328125, "step": 500800 }, { "epoch": 0.6044025823157645, "learning_rate": 8.017571688872233e-06, "loss": 2.9232330322265625, "step": 500900 }, { "epoch": 0.6045232456382471, "learning_rate": 8.017167853404495e-06, "loss": 2.94489501953125, "step": 501000 }, { "epoch": 0.6046439089607298, "learning_rate": 8.016764017936757e-06, "loss": 2.94240234375, "step": 501100 }, { "epoch": 0.6047645722832125, "learning_rate": 8.016360182469019e-06, "loss": 2.937272033691406, "step": 501200 }, { "epoch": 0.6048852356056952, "learning_rate": 8.015956347001281e-06, "loss": 2.96359375, "step": 501300 }, { "epoch": 0.6050058989281779, "learning_rate": 8.015552511533541e-06, "loss": 2.9370523071289063, "step": 501400 }, { "epoch": 0.6051265622506605, "learning_rate": 8.015148676065803e-06, "loss": 2.943509521484375, "step": 501500 }, { "epoch": 0.6052472255731433, "learning_rate": 8.014744840598065e-06, "loss": 2.9520709228515627, "step": 501600 }, { "epoch": 0.6053678888956259, "learning_rate": 8.014341005130325e-06, "loss": 2.924737548828125, "step": 501700 }, { "epoch": 0.6054885522181086, "learning_rate": 8.013937169662587e-06, "loss": 2.9384710693359377, "step": 501800 }, { "epoch": 0.6056092155405913, "learning_rate": 8.01353333419485e-06, "loss": 2.9202166748046876, "step": 501900 }, { "epoch": 0.605729878863074, "learning_rate": 8.013129498727111e-06, "loss": 2.9348904418945314, "step": 502000 }, { "epoch": 0.6058505421855567, "learning_rate": 8.012725663259373e-06, "loss": 2.9645947265625, "step": 502100 }, { "epoch": 0.6059712055080393, "learning_rate": 8.012321827791635e-06, "loss": 2.955181884765625, "step": 502200 }, { "epoch": 0.606091868830522, "learning_rate": 8.011917992323897e-06, "loss": 2.9298760986328123, "step": 502300 }, { "epoch": 0.6062125321530047, "learning_rate": 8.011514156856158e-06, "loss": 2.941722412109375, "step": 502400 }, { "epoch": 0.6063331954754874, "learning_rate": 8.01111032138842e-06, "loss": 2.9457748413085936, "step": 502500 }, { "epoch": 0.6064538587979701, "learning_rate": 8.01070648592068e-06, "loss": 2.9628973388671875, "step": 502600 }, { "epoch": 0.6065745221204528, "learning_rate": 8.010302650452942e-06, "loss": 2.9518466186523438, "step": 502700 }, { "epoch": 0.6066951854429354, "learning_rate": 8.009898814985204e-06, "loss": 2.9688055419921877, "step": 502800 }, { "epoch": 0.6068158487654182, "learning_rate": 8.009494979517466e-06, "loss": 2.9575765991210936, "step": 502900 }, { "epoch": 0.6069365120879008, "learning_rate": 8.009091144049728e-06, "loss": 2.9197097778320313, "step": 503000 }, { "epoch": 0.6070571754103835, "learning_rate": 8.00868730858199e-06, "loss": 2.9297930908203127, "step": 503100 }, { "epoch": 0.6071778387328662, "learning_rate": 8.00828347311425e-06, "loss": 2.9497998046875, "step": 503200 }, { "epoch": 0.6072985020553489, "learning_rate": 8.007879637646512e-06, "loss": 2.9174771118164062, "step": 503300 }, { "epoch": 0.6074191653778316, "learning_rate": 8.007475802178774e-06, "loss": 2.9464212036132813, "step": 503400 }, { "epoch": 0.6075398287003142, "learning_rate": 8.007071966711036e-06, "loss": 2.9540090942382813, "step": 503500 }, { "epoch": 0.6076604920227969, "learning_rate": 8.006668131243296e-06, "loss": 2.935716552734375, "step": 503600 }, { "epoch": 0.6077811553452797, "learning_rate": 8.006264295775558e-06, "loss": 2.9447976684570314, "step": 503700 }, { "epoch": 0.6079018186677623, "learning_rate": 8.00586046030782e-06, "loss": 2.928397216796875, "step": 503800 }, { "epoch": 0.608022481990245, "learning_rate": 8.005456624840082e-06, "loss": 2.9565304565429686, "step": 503900 }, { "epoch": 0.6081431453127276, "learning_rate": 8.005052789372343e-06, "loss": 2.902865295410156, "step": 504000 }, { "epoch": 0.6082638086352103, "learning_rate": 8.004648953904605e-06, "loss": 2.936872863769531, "step": 504100 }, { "epoch": 0.6083844719576931, "learning_rate": 8.004245118436866e-06, "loss": 2.931551208496094, "step": 504200 }, { "epoch": 0.6085051352801757, "learning_rate": 8.003841282969128e-06, "loss": 2.947609558105469, "step": 504300 }, { "epoch": 0.6086257986026584, "learning_rate": 8.00343744750139e-06, "loss": 2.9287814331054687, "step": 504400 }, { "epoch": 0.608746461925141, "learning_rate": 8.00303361203365e-06, "loss": 2.938049621582031, "step": 504500 }, { "epoch": 0.6088671252476238, "learning_rate": 8.002629776565913e-06, "loss": 2.949931945800781, "step": 504600 }, { "epoch": 0.6089877885701065, "learning_rate": 8.002225941098175e-06, "loss": 2.9366058349609374, "step": 504700 }, { "epoch": 0.6091084518925891, "learning_rate": 8.001822105630437e-06, "loss": 2.9943002319335936, "step": 504800 }, { "epoch": 0.6092291152150718, "learning_rate": 8.001418270162697e-06, "loss": 2.940538330078125, "step": 504900 }, { "epoch": 0.6093497785375545, "learning_rate": 8.001014434694959e-06, "loss": 2.934717712402344, "step": 505000 }, { "epoch": 0.6094704418600372, "learning_rate": 8.000610599227221e-06, "loss": 2.958609924316406, "step": 505100 }, { "epoch": 0.6095911051825199, "learning_rate": 8.000206763759483e-06, "loss": 2.96318603515625, "step": 505200 }, { "epoch": 0.6097117685050025, "learning_rate": 7.999802928291745e-06, "loss": 2.9749432373046876, "step": 505300 }, { "epoch": 0.6098324318274853, "learning_rate": 7.999399092824007e-06, "loss": 2.9267352294921873, "step": 505400 }, { "epoch": 0.6099530951499679, "learning_rate": 7.998995257356267e-06, "loss": 2.942299499511719, "step": 505500 }, { "epoch": 0.6100737584724506, "learning_rate": 7.99859142188853e-06, "loss": 2.9731671142578127, "step": 505600 }, { "epoch": 0.6101944217949333, "learning_rate": 7.99818758642079e-06, "loss": 2.950361328125, "step": 505700 }, { "epoch": 0.610315085117416, "learning_rate": 7.997783750953051e-06, "loss": 2.941955871582031, "step": 505800 }, { "epoch": 0.6104357484398987, "learning_rate": 7.997379915485313e-06, "loss": 2.939858703613281, "step": 505900 }, { "epoch": 0.6105564117623813, "learning_rate": 7.996976080017575e-06, "loss": 2.948837890625, "step": 506000 }, { "epoch": 0.610677075084864, "learning_rate": 7.996572244549837e-06, "loss": 2.9474603271484376, "step": 506100 }, { "epoch": 0.6107977384073467, "learning_rate": 7.9961684090821e-06, "loss": 2.9288702392578125, "step": 506200 }, { "epoch": 0.6109184017298294, "learning_rate": 7.995764573614361e-06, "loss": 2.9382174682617186, "step": 506300 }, { "epoch": 0.6110390650523121, "learning_rate": 7.995360738146623e-06, "loss": 2.942349548339844, "step": 506400 }, { "epoch": 0.6111597283747947, "learning_rate": 7.994956902678884e-06, "loss": 2.9141015625, "step": 506500 }, { "epoch": 0.6112803916972774, "learning_rate": 7.994553067211146e-06, "loss": 2.9523745727539064, "step": 506600 }, { "epoch": 0.6114010550197602, "learning_rate": 7.994149231743406e-06, "loss": 2.953815612792969, "step": 506700 }, { "epoch": 0.6115217183422428, "learning_rate": 7.993745396275668e-06, "loss": 2.9407293701171877, "step": 506800 }, { "epoch": 0.6116423816647255, "learning_rate": 7.99334156080793e-06, "loss": 2.9476864624023436, "step": 506900 }, { "epoch": 0.6117630449872081, "learning_rate": 7.992937725340192e-06, "loss": 2.9306097412109375, "step": 507000 }, { "epoch": 0.6118837083096909, "learning_rate": 7.992533889872454e-06, "loss": 2.9344500732421874, "step": 507100 }, { "epoch": 0.6120043716321736, "learning_rate": 7.992130054404716e-06, "loss": 2.9500466918945314, "step": 507200 }, { "epoch": 0.6121250349546562, "learning_rate": 7.991726218936976e-06, "loss": 2.94267578125, "step": 507300 }, { "epoch": 0.6122456982771389, "learning_rate": 7.991322383469238e-06, "loss": 2.9566375732421877, "step": 507400 }, { "epoch": 0.6123663615996215, "learning_rate": 7.9909185480015e-06, "loss": 2.9195281982421877, "step": 507500 }, { "epoch": 0.6124870249221043, "learning_rate": 7.990514712533762e-06, "loss": 2.939086608886719, "step": 507600 }, { "epoch": 0.612607688244587, "learning_rate": 7.990110877066022e-06, "loss": 2.9370703125, "step": 507700 }, { "epoch": 0.6127283515670696, "learning_rate": 7.989707041598284e-06, "loss": 2.941788330078125, "step": 507800 }, { "epoch": 0.6128490148895523, "learning_rate": 7.989303206130546e-06, "loss": 2.9362823486328127, "step": 507900 }, { "epoch": 0.6129696782120351, "learning_rate": 7.988899370662808e-06, "loss": 2.949305114746094, "step": 508000 }, { "epoch": 0.6130903415345177, "learning_rate": 7.988495535195069e-06, "loss": 2.922286376953125, "step": 508100 }, { "epoch": 0.6132110048570004, "learning_rate": 7.98809169972733e-06, "loss": 2.946279296875, "step": 508200 }, { "epoch": 0.613331668179483, "learning_rate": 7.987687864259593e-06, "loss": 2.9381887817382815, "step": 508300 }, { "epoch": 0.6134523315019658, "learning_rate": 7.987284028791855e-06, "loss": 2.9511874389648436, "step": 508400 }, { "epoch": 0.6135729948244485, "learning_rate": 7.986880193324116e-06, "loss": 2.9328399658203126, "step": 508500 }, { "epoch": 0.6136936581469311, "learning_rate": 7.986476357856377e-06, "loss": 2.940248718261719, "step": 508600 }, { "epoch": 0.6138143214694138, "learning_rate": 7.986072522388639e-06, "loss": 2.9078173828125, "step": 508700 }, { "epoch": 0.6139349847918965, "learning_rate": 7.9856686869209e-06, "loss": 2.9195855712890624, "step": 508800 }, { "epoch": 0.6140556481143792, "learning_rate": 7.985264851453161e-06, "loss": 2.923081359863281, "step": 508900 }, { "epoch": 0.6141763114368619, "learning_rate": 7.984861015985423e-06, "loss": 2.9314361572265626, "step": 509000 }, { "epoch": 0.6142969747593445, "learning_rate": 7.984457180517685e-06, "loss": 2.907495422363281, "step": 509100 }, { "epoch": 0.6144176380818273, "learning_rate": 7.984053345049947e-06, "loss": 2.9291592407226563, "step": 509200 }, { "epoch": 0.6145383014043099, "learning_rate": 7.983649509582209e-06, "loss": 2.9413824462890625, "step": 509300 }, { "epoch": 0.6146589647267926, "learning_rate": 7.983245674114471e-06, "loss": 2.926028137207031, "step": 509400 }, { "epoch": 0.6147796280492753, "learning_rate": 7.982841838646733e-06, "loss": 2.928121337890625, "step": 509500 }, { "epoch": 0.614900291371758, "learning_rate": 7.982438003178993e-06, "loss": 2.9601974487304688, "step": 509600 }, { "epoch": 0.6150209546942407, "learning_rate": 7.982034167711255e-06, "loss": 2.9320724487304686, "step": 509700 }, { "epoch": 0.6151416180167233, "learning_rate": 7.981630332243515e-06, "loss": 2.9248001098632814, "step": 509800 }, { "epoch": 0.615262281339206, "learning_rate": 7.981226496775777e-06, "loss": 2.94704833984375, "step": 509900 }, { "epoch": 0.6153829446616887, "learning_rate": 7.98082266130804e-06, "loss": 2.938487854003906, "step": 510000 }, { "epoch": 0.6155036079841714, "learning_rate": 7.980418825840301e-06, "loss": 2.9286630249023435, "step": 510100 }, { "epoch": 0.6156242713066541, "learning_rate": 7.980014990372563e-06, "loss": 2.9487484741210936, "step": 510200 }, { "epoch": 0.6157449346291367, "learning_rate": 7.979611154904825e-06, "loss": 2.9647967529296877, "step": 510300 }, { "epoch": 0.6158655979516194, "learning_rate": 7.979207319437087e-06, "loss": 2.9429425048828124, "step": 510400 }, { "epoch": 0.6159862612741022, "learning_rate": 7.978803483969348e-06, "loss": 2.959300842285156, "step": 510500 }, { "epoch": 0.6161069245965848, "learning_rate": 7.97839964850161e-06, "loss": 2.9324209594726565, "step": 510600 }, { "epoch": 0.6162275879190675, "learning_rate": 7.977995813033872e-06, "loss": 2.931982116699219, "step": 510700 }, { "epoch": 0.6163482512415501, "learning_rate": 7.977591977566132e-06, "loss": 2.9510748291015627, "step": 510800 }, { "epoch": 0.6164689145640329, "learning_rate": 7.977188142098394e-06, "loss": 2.900860595703125, "step": 510900 }, { "epoch": 0.6165895778865156, "learning_rate": 7.976784306630656e-06, "loss": 2.936392517089844, "step": 511000 }, { "epoch": 0.6167102412089982, "learning_rate": 7.976380471162918e-06, "loss": 2.9366650390625, "step": 511100 }, { "epoch": 0.6168309045314809, "learning_rate": 7.97597663569518e-06, "loss": 2.943543701171875, "step": 511200 }, { "epoch": 0.6169515678539635, "learning_rate": 7.975572800227442e-06, "loss": 2.929909362792969, "step": 511300 }, { "epoch": 0.6170722311764463, "learning_rate": 7.975168964759702e-06, "loss": 2.925518798828125, "step": 511400 }, { "epoch": 0.617192894498929, "learning_rate": 7.974765129291964e-06, "loss": 2.9333935546875, "step": 511500 }, { "epoch": 0.6173135578214116, "learning_rate": 7.974361293824226e-06, "loss": 2.924302062988281, "step": 511600 }, { "epoch": 0.6174342211438943, "learning_rate": 7.973957458356486e-06, "loss": 2.9478570556640626, "step": 511700 }, { "epoch": 0.617554884466377, "learning_rate": 7.973553622888748e-06, "loss": 2.9365350341796876, "step": 511800 }, { "epoch": 0.6176755477888597, "learning_rate": 7.97314978742101e-06, "loss": 2.9318582153320314, "step": 511900 }, { "epoch": 0.6177962111113424, "learning_rate": 7.972745951953272e-06, "loss": 2.9342440795898437, "step": 512000 }, { "epoch": 0.617916874433825, "learning_rate": 7.972342116485534e-06, "loss": 2.9170303344726562, "step": 512100 }, { "epoch": 0.6180375377563078, "learning_rate": 7.971938281017795e-06, "loss": 2.8970108032226562, "step": 512200 }, { "epoch": 0.6181582010787904, "learning_rate": 7.971534445550057e-06, "loss": 2.923292541503906, "step": 512300 }, { "epoch": 0.6182788644012731, "learning_rate": 7.971130610082319e-06, "loss": 2.928847351074219, "step": 512400 }, { "epoch": 0.6183995277237558, "learning_rate": 7.97072677461458e-06, "loss": 2.9172064208984376, "step": 512500 }, { "epoch": 0.6185201910462385, "learning_rate": 7.970322939146843e-06, "loss": 2.9376541137695313, "step": 512600 }, { "epoch": 0.6186408543687212, "learning_rate": 7.969919103679103e-06, "loss": 2.9123886108398436, "step": 512700 }, { "epoch": 0.6187615176912038, "learning_rate": 7.969515268211365e-06, "loss": 2.9545639038085936, "step": 512800 }, { "epoch": 0.6188821810136865, "learning_rate": 7.969111432743627e-06, "loss": 2.9437515258789064, "step": 512900 }, { "epoch": 0.6190028443361693, "learning_rate": 7.968707597275887e-06, "loss": 2.9291162109375, "step": 513000 }, { "epoch": 0.6191235076586519, "learning_rate": 7.968303761808149e-06, "loss": 2.9460580444335935, "step": 513100 }, { "epoch": 0.6192441709811346, "learning_rate": 7.967899926340411e-06, "loss": 2.9116244506835938, "step": 513200 }, { "epoch": 0.6193648343036173, "learning_rate": 7.967496090872673e-06, "loss": 2.9105389404296873, "step": 513300 }, { "epoch": 0.6194854976261, "learning_rate": 7.967092255404935e-06, "loss": 2.9243295288085935, "step": 513400 }, { "epoch": 0.6196061609485827, "learning_rate": 7.966688419937197e-06, "loss": 2.9280929565429688, "step": 513500 }, { "epoch": 0.6197268242710653, "learning_rate": 7.966284584469457e-06, "loss": 2.9477328491210937, "step": 513600 }, { "epoch": 0.619847487593548, "learning_rate": 7.96588074900172e-06, "loss": 2.9262680053710937, "step": 513700 }, { "epoch": 0.6199681509160307, "learning_rate": 7.965476913533981e-06, "loss": 2.919295349121094, "step": 513800 }, { "epoch": 0.6200888142385134, "learning_rate": 7.965073078066242e-06, "loss": 2.9143356323242187, "step": 513900 }, { "epoch": 0.6202094775609961, "learning_rate": 7.964669242598504e-06, "loss": 2.9276748657226563, "step": 514000 }, { "epoch": 0.6203301408834787, "learning_rate": 7.964265407130765e-06, "loss": 2.937161865234375, "step": 514100 }, { "epoch": 0.6204508042059614, "learning_rate": 7.963861571663027e-06, "loss": 2.9196502685546877, "step": 514200 }, { "epoch": 0.6205714675284442, "learning_rate": 7.96345773619529e-06, "loss": 2.931656494140625, "step": 514300 }, { "epoch": 0.6206921308509268, "learning_rate": 7.963053900727551e-06, "loss": 2.9033148193359377, "step": 514400 }, { "epoch": 0.6208127941734095, "learning_rate": 7.962650065259813e-06, "loss": 2.92002197265625, "step": 514500 }, { "epoch": 0.6209334574958921, "learning_rate": 7.962246229792074e-06, "loss": 2.919794921875, "step": 514600 }, { "epoch": 0.6210541208183749, "learning_rate": 7.961842394324336e-06, "loss": 2.916904296875, "step": 514700 }, { "epoch": 0.6211747841408576, "learning_rate": 7.961438558856596e-06, "loss": 2.9389263916015627, "step": 514800 }, { "epoch": 0.6212954474633402, "learning_rate": 7.961034723388858e-06, "loss": 2.937230224609375, "step": 514900 }, { "epoch": 0.6214161107858229, "learning_rate": 7.96063088792112e-06, "loss": 2.913074951171875, "step": 515000 }, { "epoch": 0.6215367741083055, "learning_rate": 7.960227052453382e-06, "loss": 2.9199456787109375, "step": 515100 }, { "epoch": 0.6216574374307883, "learning_rate": 7.959823216985644e-06, "loss": 2.933965148925781, "step": 515200 }, { "epoch": 0.621778100753271, "learning_rate": 7.959419381517906e-06, "loss": 2.9413833618164062, "step": 515300 }, { "epoch": 0.6218987640757536, "learning_rate": 7.959015546050168e-06, "loss": 2.9478463745117187, "step": 515400 }, { "epoch": 0.6220194273982363, "learning_rate": 7.958611710582428e-06, "loss": 2.9017559814453127, "step": 515500 }, { "epoch": 0.622140090720719, "learning_rate": 7.95820787511469e-06, "loss": 2.927471008300781, "step": 515600 }, { "epoch": 0.6222607540432017, "learning_rate": 7.957804039646952e-06, "loss": 2.9231170654296874, "step": 515700 }, { "epoch": 0.6223814173656844, "learning_rate": 7.957400204179212e-06, "loss": 2.9155319213867186, "step": 515800 }, { "epoch": 0.622502080688167, "learning_rate": 7.956996368711474e-06, "loss": 2.9355905151367185, "step": 515900 }, { "epoch": 0.6226227440106498, "learning_rate": 7.956592533243736e-06, "loss": 2.915854797363281, "step": 516000 }, { "epoch": 0.6227434073331324, "learning_rate": 7.956188697775998e-06, "loss": 2.937925109863281, "step": 516100 }, { "epoch": 0.6228640706556151, "learning_rate": 7.95578486230826e-06, "loss": 2.958274230957031, "step": 516200 }, { "epoch": 0.6229847339780978, "learning_rate": 7.95538102684052e-06, "loss": 2.900185241699219, "step": 516300 }, { "epoch": 0.6231053973005805, "learning_rate": 7.954977191372783e-06, "loss": 2.9382064819335936, "step": 516400 }, { "epoch": 0.6232260606230632, "learning_rate": 7.954573355905045e-06, "loss": 2.931901550292969, "step": 516500 }, { "epoch": 0.6233467239455458, "learning_rate": 7.954169520437307e-06, "loss": 2.8812347412109376, "step": 516600 }, { "epoch": 0.6234673872680285, "learning_rate": 7.953765684969567e-06, "loss": 2.898975524902344, "step": 516700 }, { "epoch": 0.6235880505905113, "learning_rate": 7.953361849501829e-06, "loss": 2.933077697753906, "step": 516800 }, { "epoch": 0.6237087139129939, "learning_rate": 7.95295801403409e-06, "loss": 2.9323956298828127, "step": 516900 }, { "epoch": 0.6238293772354766, "learning_rate": 7.952554178566353e-06, "loss": 2.9189215087890625, "step": 517000 }, { "epoch": 0.6239500405579592, "learning_rate": 7.952150343098613e-06, "loss": 2.9305963134765625, "step": 517100 }, { "epoch": 0.624070703880442, "learning_rate": 7.951746507630875e-06, "loss": 2.9188876342773438, "step": 517200 }, { "epoch": 0.6241913672029247, "learning_rate": 7.951342672163137e-06, "loss": 2.9377862548828126, "step": 517300 }, { "epoch": 0.6243120305254073, "learning_rate": 7.950938836695399e-06, "loss": 2.9388796997070314, "step": 517400 }, { "epoch": 0.62443269384789, "learning_rate": 7.950535001227661e-06, "loss": 2.920887451171875, "step": 517500 }, { "epoch": 0.6245533571703726, "learning_rate": 7.950131165759923e-06, "loss": 2.8912997436523438, "step": 517600 }, { "epoch": 0.6246740204928554, "learning_rate": 7.949727330292183e-06, "loss": 2.9513134765625, "step": 517700 }, { "epoch": 0.6247946838153381, "learning_rate": 7.949323494824445e-06, "loss": 2.895133056640625, "step": 517800 }, { "epoch": 0.6249153471378207, "learning_rate": 7.948919659356706e-06, "loss": 2.9340667724609375, "step": 517900 }, { "epoch": 0.6250360104603034, "learning_rate": 7.948515823888968e-06, "loss": 2.93799072265625, "step": 518000 }, { "epoch": 0.6251566737827862, "learning_rate": 7.94811198842123e-06, "loss": 2.9283697509765627, "step": 518100 }, { "epoch": 0.6252773371052688, "learning_rate": 7.947708152953492e-06, "loss": 2.9418405151367186, "step": 518200 }, { "epoch": 0.6253980004277515, "learning_rate": 7.947304317485753e-06, "loss": 2.915838317871094, "step": 518300 }, { "epoch": 0.6255186637502341, "learning_rate": 7.946900482018015e-06, "loss": 2.894775085449219, "step": 518400 }, { "epoch": 0.6256393270727169, "learning_rate": 7.946496646550277e-06, "loss": 2.9170150756835938, "step": 518500 }, { "epoch": 0.6257599903951996, "learning_rate": 7.94609281108254e-06, "loss": 2.9279708862304688, "step": 518600 }, { "epoch": 0.6258806537176822, "learning_rate": 7.9456889756148e-06, "loss": 2.9136148071289063, "step": 518700 }, { "epoch": 0.6260013170401649, "learning_rate": 7.945285140147062e-06, "loss": 2.917821960449219, "step": 518800 }, { "epoch": 0.6261219803626475, "learning_rate": 7.944881304679322e-06, "loss": 2.900311279296875, "step": 518900 }, { "epoch": 0.6262426436851303, "learning_rate": 7.944477469211584e-06, "loss": 2.924251708984375, "step": 519000 }, { "epoch": 0.626363307007613, "learning_rate": 7.944073633743846e-06, "loss": 2.939072265625, "step": 519100 }, { "epoch": 0.6264839703300956, "learning_rate": 7.943669798276108e-06, "loss": 2.9273110961914064, "step": 519200 }, { "epoch": 0.6266046336525783, "learning_rate": 7.94326596280837e-06, "loss": 2.8934375, "step": 519300 }, { "epoch": 0.626725296975061, "learning_rate": 7.942862127340632e-06, "loss": 2.9186386108398437, "step": 519400 }, { "epoch": 0.6268459602975437, "learning_rate": 7.942458291872892e-06, "loss": 2.927326354980469, "step": 519500 }, { "epoch": 0.6269666236200264, "learning_rate": 7.942054456405154e-06, "loss": 2.9182174682617186, "step": 519600 }, { "epoch": 0.627087286942509, "learning_rate": 7.941650620937416e-06, "loss": 2.9111480712890625, "step": 519700 }, { "epoch": 0.6272079502649918, "learning_rate": 7.941246785469678e-06, "loss": 2.9423431396484374, "step": 519800 }, { "epoch": 0.6273286135874744, "learning_rate": 7.940842950001938e-06, "loss": 2.922041015625, "step": 519900 }, { "epoch": 0.6274492769099571, "learning_rate": 7.9404391145342e-06, "loss": 2.958108215332031, "step": 520000 }, { "epoch": 0.6275699402324398, "learning_rate": 7.940035279066462e-06, "loss": 2.910821838378906, "step": 520100 }, { "epoch": 0.6276906035549225, "learning_rate": 7.939631443598724e-06, "loss": 2.92248291015625, "step": 520200 }, { "epoch": 0.6278112668774052, "learning_rate": 7.939227608130986e-06, "loss": 2.920801086425781, "step": 520300 }, { "epoch": 0.6279319301998878, "learning_rate": 7.938823772663247e-06, "loss": 2.920839538574219, "step": 520400 }, { "epoch": 0.6280525935223705, "learning_rate": 7.938419937195509e-06, "loss": 2.92770263671875, "step": 520500 }, { "epoch": 0.6281732568448533, "learning_rate": 7.93801610172777e-06, "loss": 2.9224734497070313, "step": 520600 }, { "epoch": 0.6282939201673359, "learning_rate": 7.937612266260033e-06, "loss": 2.9305413818359374, "step": 520700 }, { "epoch": 0.6284145834898186, "learning_rate": 7.937208430792293e-06, "loss": 2.8962722778320313, "step": 520800 }, { "epoch": 0.6285352468123012, "learning_rate": 7.936804595324555e-06, "loss": 2.9308657836914063, "step": 520900 }, { "epoch": 0.628655910134784, "learning_rate": 7.936400759856817e-06, "loss": 2.904207458496094, "step": 521000 }, { "epoch": 0.6287765734572667, "learning_rate": 7.935996924389079e-06, "loss": 2.9203060913085936, "step": 521100 }, { "epoch": 0.6288972367797493, "learning_rate": 7.935593088921339e-06, "loss": 2.916864929199219, "step": 521200 }, { "epoch": 0.629017900102232, "learning_rate": 7.935189253453601e-06, "loss": 2.907156982421875, "step": 521300 }, { "epoch": 0.6291385634247146, "learning_rate": 7.934785417985863e-06, "loss": 2.914400634765625, "step": 521400 }, { "epoch": 0.6292592267471974, "learning_rate": 7.934381582518125e-06, "loss": 2.9265597534179686, "step": 521500 }, { "epoch": 0.6293798900696801, "learning_rate": 7.933977747050387e-06, "loss": 2.9270748901367187, "step": 521600 }, { "epoch": 0.6295005533921627, "learning_rate": 7.933573911582649e-06, "loss": 2.9318606567382814, "step": 521700 }, { "epoch": 0.6296212167146454, "learning_rate": 7.93317007611491e-06, "loss": 2.922077941894531, "step": 521800 }, { "epoch": 0.629741880037128, "learning_rate": 7.932766240647171e-06, "loss": 2.9371435546875, "step": 521900 }, { "epoch": 0.6298625433596108, "learning_rate": 7.932362405179432e-06, "loss": 2.8946109008789063, "step": 522000 }, { "epoch": 0.6299832066820935, "learning_rate": 7.931958569711694e-06, "loss": 2.91708984375, "step": 522100 }, { "epoch": 0.6301038700045761, "learning_rate": 7.931554734243956e-06, "loss": 2.935476989746094, "step": 522200 }, { "epoch": 0.6302245333270589, "learning_rate": 7.931150898776218e-06, "loss": 2.931512756347656, "step": 522300 }, { "epoch": 0.6303451966495415, "learning_rate": 7.93074706330848e-06, "loss": 2.930699462890625, "step": 522400 }, { "epoch": 0.6304658599720242, "learning_rate": 7.930343227840742e-06, "loss": 2.916722717285156, "step": 522500 }, { "epoch": 0.6305865232945069, "learning_rate": 7.929939392373003e-06, "loss": 2.930321044921875, "step": 522600 }, { "epoch": 0.6307071866169895, "learning_rate": 7.929535556905264e-06, "loss": 2.9280126953125, "step": 522700 }, { "epoch": 0.6308278499394723, "learning_rate": 7.929131721437526e-06, "loss": 2.9292257690429686, "step": 522800 }, { "epoch": 0.6309485132619549, "learning_rate": 7.928727885969788e-06, "loss": 2.9129730224609376, "step": 522900 }, { "epoch": 0.6310691765844376, "learning_rate": 7.928324050502048e-06, "loss": 2.9149789428710937, "step": 523000 }, { "epoch": 0.6311898399069203, "learning_rate": 7.92792021503431e-06, "loss": 2.9060940551757812, "step": 523100 }, { "epoch": 0.631310503229403, "learning_rate": 7.927516379566572e-06, "loss": 2.9181484985351562, "step": 523200 }, { "epoch": 0.6314311665518857, "learning_rate": 7.927112544098834e-06, "loss": 2.9121249389648436, "step": 523300 }, { "epoch": 0.6315518298743684, "learning_rate": 7.926708708631096e-06, "loss": 2.9159979248046874, "step": 523400 }, { "epoch": 0.631672493196851, "learning_rate": 7.926304873163358e-06, "loss": 2.948087463378906, "step": 523500 }, { "epoch": 0.6317931565193338, "learning_rate": 7.925901037695618e-06, "loss": 2.930238952636719, "step": 523600 }, { "epoch": 0.6319138198418164, "learning_rate": 7.92549720222788e-06, "loss": 2.912752685546875, "step": 523700 }, { "epoch": 0.6320344831642991, "learning_rate": 7.925093366760142e-06, "loss": 2.9361221313476564, "step": 523800 }, { "epoch": 0.6321551464867818, "learning_rate": 7.924689531292402e-06, "loss": 2.9162432861328127, "step": 523900 }, { "epoch": 0.6322758098092645, "learning_rate": 7.924285695824664e-06, "loss": 2.9198068237304686, "step": 524000 }, { "epoch": 0.6323964731317472, "learning_rate": 7.923881860356926e-06, "loss": 2.9152001953125, "step": 524100 }, { "epoch": 0.6325171364542298, "learning_rate": 7.923478024889188e-06, "loss": 2.9171633911132813, "step": 524200 }, { "epoch": 0.6326377997767125, "learning_rate": 7.92307418942145e-06, "loss": 2.9247210693359373, "step": 524300 }, { "epoch": 0.6327584630991953, "learning_rate": 7.92267035395371e-06, "loss": 2.920307312011719, "step": 524400 }, { "epoch": 0.6328791264216779, "learning_rate": 7.922266518485973e-06, "loss": 2.911843566894531, "step": 524500 }, { "epoch": 0.6329997897441606, "learning_rate": 7.921862683018235e-06, "loss": 2.9048123168945312, "step": 524600 }, { "epoch": 0.6331204530666432, "learning_rate": 7.921458847550497e-06, "loss": 2.8982302856445314, "step": 524700 }, { "epoch": 0.633241116389126, "learning_rate": 7.921055012082759e-06, "loss": 2.9159341430664063, "step": 524800 }, { "epoch": 0.6333617797116087, "learning_rate": 7.920651176615019e-06, "loss": 2.953211364746094, "step": 524900 }, { "epoch": 0.6334824430340913, "learning_rate": 7.920247341147281e-06, "loss": 2.8935418701171876, "step": 525000 }, { "epoch": 0.633603106356574, "learning_rate": 7.919843505679543e-06, "loss": 2.8928067016601564, "step": 525100 }, { "epoch": 0.6337237696790566, "learning_rate": 7.919439670211805e-06, "loss": 2.9214743041992186, "step": 525200 }, { "epoch": 0.6338444330015394, "learning_rate": 7.919035834744065e-06, "loss": 2.9290887451171876, "step": 525300 }, { "epoch": 0.6339650963240221, "learning_rate": 7.918631999276327e-06, "loss": 2.9300689697265625, "step": 525400 }, { "epoch": 0.6340857596465047, "learning_rate": 7.918228163808589e-06, "loss": 2.8972433471679686, "step": 525500 }, { "epoch": 0.6342064229689874, "learning_rate": 7.917824328340851e-06, "loss": 2.8949765014648436, "step": 525600 }, { "epoch": 0.63432708629147, "learning_rate": 7.917420492873113e-06, "loss": 2.91369873046875, "step": 525700 }, { "epoch": 0.6344477496139528, "learning_rate": 7.917016657405373e-06, "loss": 2.900715026855469, "step": 525800 }, { "epoch": 0.6345684129364355, "learning_rate": 7.916612821937635e-06, "loss": 2.9279440307617186, "step": 525900 }, { "epoch": 0.6346890762589181, "learning_rate": 7.916208986469897e-06, "loss": 2.9390029907226562, "step": 526000 }, { "epoch": 0.6348097395814009, "learning_rate": 7.915805151002158e-06, "loss": 2.9287124633789063, "step": 526100 }, { "epoch": 0.6349304029038835, "learning_rate": 7.91540131553442e-06, "loss": 2.89931396484375, "step": 526200 }, { "epoch": 0.6350510662263662, "learning_rate": 7.914997480066682e-06, "loss": 2.9417630004882813, "step": 526300 }, { "epoch": 0.6351717295488489, "learning_rate": 7.914593644598944e-06, "loss": 2.9337152099609374, "step": 526400 }, { "epoch": 0.6352923928713315, "learning_rate": 7.914189809131206e-06, "loss": 2.9253668212890624, "step": 526500 }, { "epoch": 0.6354130561938143, "learning_rate": 7.913785973663468e-06, "loss": 2.9214242553710936, "step": 526600 }, { "epoch": 0.6355337195162969, "learning_rate": 7.91338213819573e-06, "loss": 2.911136474609375, "step": 526700 }, { "epoch": 0.6356543828387796, "learning_rate": 7.91297830272799e-06, "loss": 2.919922180175781, "step": 526800 }, { "epoch": 0.6357750461612623, "learning_rate": 7.912574467260252e-06, "loss": 2.926233825683594, "step": 526900 }, { "epoch": 0.635895709483745, "learning_rate": 7.912170631792512e-06, "loss": 2.8864752197265626, "step": 527000 }, { "epoch": 0.6360163728062277, "learning_rate": 7.911766796324774e-06, "loss": 2.9276934814453126, "step": 527100 }, { "epoch": 0.6361370361287103, "learning_rate": 7.911362960857036e-06, "loss": 2.8995010375976564, "step": 527200 }, { "epoch": 0.636257699451193, "learning_rate": 7.910959125389298e-06, "loss": 2.920686950683594, "step": 527300 }, { "epoch": 0.6363783627736758, "learning_rate": 7.91055528992156e-06, "loss": 2.926412353515625, "step": 527400 }, { "epoch": 0.6364990260961584, "learning_rate": 7.910151454453822e-06, "loss": 2.9265869140625, "step": 527500 }, { "epoch": 0.6366196894186411, "learning_rate": 7.909747618986084e-06, "loss": 2.9085421752929688, "step": 527600 }, { "epoch": 0.6367403527411237, "learning_rate": 7.909343783518344e-06, "loss": 2.9507366943359377, "step": 527700 }, { "epoch": 0.6368610160636065, "learning_rate": 7.908939948050606e-06, "loss": 2.9089315795898436, "step": 527800 }, { "epoch": 0.6369816793860892, "learning_rate": 7.908536112582868e-06, "loss": 2.9272750854492187, "step": 527900 }, { "epoch": 0.6371023427085718, "learning_rate": 7.908132277115129e-06, "loss": 2.8651077270507814, "step": 528000 }, { "epoch": 0.6372230060310545, "learning_rate": 7.90772844164739e-06, "loss": 2.8903424072265627, "step": 528100 }, { "epoch": 0.6373436693535371, "learning_rate": 7.907324606179652e-06, "loss": 2.917109375, "step": 528200 }, { "epoch": 0.6374643326760199, "learning_rate": 7.906920770711914e-06, "loss": 2.90942138671875, "step": 528300 }, { "epoch": 0.6375849959985026, "learning_rate": 7.906516935244176e-06, "loss": 2.9393081665039062, "step": 528400 }, { "epoch": 0.6377056593209852, "learning_rate": 7.906113099776437e-06, "loss": 2.9263076782226562, "step": 528500 }, { "epoch": 0.637826322643468, "learning_rate": 7.905709264308699e-06, "loss": 2.914020690917969, "step": 528600 }, { "epoch": 0.6379469859659507, "learning_rate": 7.90530542884096e-06, "loss": 2.9094778442382814, "step": 528700 }, { "epoch": 0.6380676492884333, "learning_rate": 7.904901593373223e-06, "loss": 2.919495849609375, "step": 528800 }, { "epoch": 0.638188312610916, "learning_rate": 7.904497757905483e-06, "loss": 2.9046136474609376, "step": 528900 }, { "epoch": 0.6383089759333986, "learning_rate": 7.904093922437745e-06, "loss": 2.909035949707031, "step": 529000 }, { "epoch": 0.6384296392558814, "learning_rate": 7.903690086970007e-06, "loss": 2.908266906738281, "step": 529100 }, { "epoch": 0.6385503025783641, "learning_rate": 7.903286251502269e-06, "loss": 2.885537109375, "step": 529200 }, { "epoch": 0.6386709659008467, "learning_rate": 7.90288241603453e-06, "loss": 2.9287509155273437, "step": 529300 }, { "epoch": 0.6387916292233294, "learning_rate": 7.902478580566791e-06, "loss": 2.912772216796875, "step": 529400 }, { "epoch": 0.638912292545812, "learning_rate": 7.902074745099053e-06, "loss": 2.924574279785156, "step": 529500 }, { "epoch": 0.6390329558682948, "learning_rate": 7.901670909631315e-06, "loss": 2.9036474609375, "step": 529600 }, { "epoch": 0.6391536191907775, "learning_rate": 7.901267074163577e-06, "loss": 2.902551574707031, "step": 529700 }, { "epoch": 0.6392742825132601, "learning_rate": 7.900863238695839e-06, "loss": 2.9299160766601564, "step": 529800 }, { "epoch": 0.6393949458357429, "learning_rate": 7.9004594032281e-06, "loss": 2.9189422607421873, "step": 529900 }, { "epoch": 0.6395156091582255, "learning_rate": 7.900055567760361e-06, "loss": 2.919125671386719, "step": 530000 }, { "epoch": 0.6396362724807082, "learning_rate": 7.899651732292623e-06, "loss": 2.889647216796875, "step": 530100 }, { "epoch": 0.6397569358031909, "learning_rate": 7.899247896824884e-06, "loss": 2.9255801391601564, "step": 530200 }, { "epoch": 0.6398775991256735, "learning_rate": 7.898844061357146e-06, "loss": 2.8967352294921875, "step": 530300 }, { "epoch": 0.6399982624481563, "learning_rate": 7.898440225889408e-06, "loss": 2.9440728759765626, "step": 530400 }, { "epoch": 0.6401189257706389, "learning_rate": 7.89803639042167e-06, "loss": 2.9279129028320314, "step": 530500 }, { "epoch": 0.6402395890931216, "learning_rate": 7.897632554953932e-06, "loss": 2.9225119018554686, "step": 530600 }, { "epoch": 0.6403602524156043, "learning_rate": 7.897228719486194e-06, "loss": 2.899134216308594, "step": 530700 }, { "epoch": 0.640480915738087, "learning_rate": 7.896824884018454e-06, "loss": 2.920964660644531, "step": 530800 }, { "epoch": 0.6406015790605697, "learning_rate": 7.896421048550716e-06, "loss": 2.9086627197265624, "step": 530900 }, { "epoch": 0.6407222423830523, "learning_rate": 7.896017213082978e-06, "loss": 2.8920623779296877, "step": 531000 }, { "epoch": 0.640842905705535, "learning_rate": 7.895613377615238e-06, "loss": 2.8837518310546875, "step": 531100 }, { "epoch": 0.6409635690280178, "learning_rate": 7.8952095421475e-06, "loss": 2.91379150390625, "step": 531200 }, { "epoch": 0.6410842323505004, "learning_rate": 7.894805706679762e-06, "loss": 2.931374206542969, "step": 531300 }, { "epoch": 0.6412048956729831, "learning_rate": 7.894401871212024e-06, "loss": 2.9140640258789063, "step": 531400 }, { "epoch": 0.6413255589954657, "learning_rate": 7.893998035744286e-06, "loss": 2.906854553222656, "step": 531500 }, { "epoch": 0.6414462223179485, "learning_rate": 7.893594200276548e-06, "loss": 2.92174560546875, "step": 531600 }, { "epoch": 0.6415668856404312, "learning_rate": 7.89319036480881e-06, "loss": 2.9333343505859375, "step": 531700 }, { "epoch": 0.6416875489629138, "learning_rate": 7.89278652934107e-06, "loss": 2.915685119628906, "step": 531800 }, { "epoch": 0.6418082122853965, "learning_rate": 7.892382693873332e-06, "loss": 2.9405352783203127, "step": 531900 }, { "epoch": 0.6419288756078791, "learning_rate": 7.891978858405593e-06, "loss": 2.8800735473632812, "step": 532000 }, { "epoch": 0.6420495389303619, "learning_rate": 7.891575022937855e-06, "loss": 2.8825479125976563, "step": 532100 }, { "epoch": 0.6421702022528446, "learning_rate": 7.891171187470117e-06, "loss": 2.8957418823242187, "step": 532200 }, { "epoch": 0.6422908655753272, "learning_rate": 7.890767352002379e-06, "loss": 2.9057769775390625, "step": 532300 }, { "epoch": 0.64241152889781, "learning_rate": 7.89036351653464e-06, "loss": 2.9050631713867188, "step": 532400 }, { "epoch": 0.6425321922202926, "learning_rate": 7.889959681066902e-06, "loss": 2.8788491821289064, "step": 532500 }, { "epoch": 0.6426528555427753, "learning_rate": 7.889555845599163e-06, "loss": 2.9095004272460936, "step": 532600 }, { "epoch": 0.642773518865258, "learning_rate": 7.889152010131425e-06, "loss": 2.9180343627929686, "step": 532700 }, { "epoch": 0.6428941821877406, "learning_rate": 7.888748174663687e-06, "loss": 2.930128173828125, "step": 532800 }, { "epoch": 0.6430148455102234, "learning_rate": 7.888344339195949e-06, "loss": 2.9327386474609374, "step": 532900 }, { "epoch": 0.643135508832706, "learning_rate": 7.887940503728209e-06, "loss": 2.9133541870117186, "step": 533000 }, { "epoch": 0.6432561721551887, "learning_rate": 7.887536668260471e-06, "loss": 2.90226806640625, "step": 533100 }, { "epoch": 0.6433768354776714, "learning_rate": 7.887132832792733e-06, "loss": 2.9028521728515626, "step": 533200 }, { "epoch": 0.643497498800154, "learning_rate": 7.886728997324995e-06, "loss": 2.922269592285156, "step": 533300 }, { "epoch": 0.6436181621226368, "learning_rate": 7.886325161857255e-06, "loss": 2.9260598754882814, "step": 533400 }, { "epoch": 0.6437388254451194, "learning_rate": 7.885921326389517e-06, "loss": 2.9319769287109376, "step": 533500 }, { "epoch": 0.6438594887676021, "learning_rate": 7.88551749092178e-06, "loss": 2.901370849609375, "step": 533600 }, { "epoch": 0.6439801520900849, "learning_rate": 7.885113655454041e-06, "loss": 2.9178424072265625, "step": 533700 }, { "epoch": 0.6441008154125675, "learning_rate": 7.884709819986303e-06, "loss": 2.9081576538085936, "step": 533800 }, { "epoch": 0.6442214787350502, "learning_rate": 7.884305984518565e-06, "loss": 2.907099609375, "step": 533900 }, { "epoch": 0.6443421420575329, "learning_rate": 7.883902149050825e-06, "loss": 2.918369140625, "step": 534000 }, { "epoch": 0.6444628053800155, "learning_rate": 7.883498313583087e-06, "loss": 2.9075936889648437, "step": 534100 }, { "epoch": 0.6445834687024983, "learning_rate": 7.883094478115348e-06, "loss": 2.9389569091796877, "step": 534200 }, { "epoch": 0.6447041320249809, "learning_rate": 7.88269064264761e-06, "loss": 2.887899169921875, "step": 534300 }, { "epoch": 0.6448247953474636, "learning_rate": 7.882286807179872e-06, "loss": 2.900060119628906, "step": 534400 }, { "epoch": 0.6449454586699463, "learning_rate": 7.881882971712134e-06, "loss": 2.902264404296875, "step": 534500 }, { "epoch": 0.645066121992429, "learning_rate": 7.881479136244396e-06, "loss": 2.8935296630859373, "step": 534600 }, { "epoch": 0.6451867853149117, "learning_rate": 7.881075300776658e-06, "loss": 2.93751953125, "step": 534700 }, { "epoch": 0.6453074486373943, "learning_rate": 7.88067146530892e-06, "loss": 2.90350830078125, "step": 534800 }, { "epoch": 0.645428111959877, "learning_rate": 7.88026762984118e-06, "loss": 2.890809326171875, "step": 534900 }, { "epoch": 0.6455487752823598, "learning_rate": 7.879863794373442e-06, "loss": 2.91779296875, "step": 535000 }, { "epoch": 0.6456694386048424, "learning_rate": 7.879459958905704e-06, "loss": 2.9179510498046874, "step": 535100 }, { "epoch": 0.6457901019273251, "learning_rate": 7.879056123437964e-06, "loss": 2.9075067138671873, "step": 535200 }, { "epoch": 0.6459107652498077, "learning_rate": 7.878652287970226e-06, "loss": 2.908475646972656, "step": 535300 }, { "epoch": 0.6460314285722905, "learning_rate": 7.878248452502488e-06, "loss": 2.9076922607421873, "step": 535400 }, { "epoch": 0.6461520918947732, "learning_rate": 7.87784461703475e-06, "loss": 2.890078430175781, "step": 535500 }, { "epoch": 0.6462727552172558, "learning_rate": 7.877440781567012e-06, "loss": 2.8760922241210936, "step": 535600 }, { "epoch": 0.6463934185397385, "learning_rate": 7.877036946099274e-06, "loss": 2.93329833984375, "step": 535700 }, { "epoch": 0.6465140818622211, "learning_rate": 7.876633110631536e-06, "loss": 2.9066500854492188, "step": 535800 }, { "epoch": 0.6466347451847039, "learning_rate": 7.876229275163796e-06, "loss": 2.933055419921875, "step": 535900 }, { "epoch": 0.6467554085071866, "learning_rate": 7.875825439696058e-06, "loss": 2.9006198120117186, "step": 536000 }, { "epoch": 0.6468760718296692, "learning_rate": 7.875421604228319e-06, "loss": 2.9125405883789064, "step": 536100 }, { "epoch": 0.646996735152152, "learning_rate": 7.87501776876058e-06, "loss": 2.9205218505859376, "step": 536200 }, { "epoch": 0.6471173984746346, "learning_rate": 7.874613933292843e-06, "loss": 2.9006918334960936, "step": 536300 }, { "epoch": 0.6472380617971173, "learning_rate": 7.874210097825105e-06, "loss": 2.891918029785156, "step": 536400 }, { "epoch": 0.6473587251196, "learning_rate": 7.873806262357367e-06, "loss": 2.9168359375, "step": 536500 }, { "epoch": 0.6474793884420826, "learning_rate": 7.873402426889629e-06, "loss": 2.916479187011719, "step": 536600 }, { "epoch": 0.6476000517645654, "learning_rate": 7.872998591421889e-06, "loss": 2.923353576660156, "step": 536700 }, { "epoch": 0.647720715087048, "learning_rate": 7.87259475595415e-06, "loss": 2.9228530883789063, "step": 536800 }, { "epoch": 0.6478413784095307, "learning_rate": 7.872190920486413e-06, "loss": 2.896103515625, "step": 536900 }, { "epoch": 0.6479620417320134, "learning_rate": 7.871787085018675e-06, "loss": 2.88780029296875, "step": 537000 }, { "epoch": 0.648082705054496, "learning_rate": 7.871383249550935e-06, "loss": 2.892388916015625, "step": 537100 }, { "epoch": 0.6482033683769788, "learning_rate": 7.870979414083197e-06, "loss": 2.903394775390625, "step": 537200 }, { "epoch": 0.6483240316994614, "learning_rate": 7.870575578615459e-06, "loss": 2.889374084472656, "step": 537300 }, { "epoch": 0.6484446950219441, "learning_rate": 7.870171743147721e-06, "loss": 2.9206292724609373, "step": 537400 }, { "epoch": 0.6485653583444269, "learning_rate": 7.869767907679981e-06, "loss": 2.902332458496094, "step": 537500 }, { "epoch": 0.6486860216669095, "learning_rate": 7.869364072212243e-06, "loss": 2.9179312133789064, "step": 537600 }, { "epoch": 0.6488066849893922, "learning_rate": 7.868960236744505e-06, "loss": 2.8813995361328124, "step": 537700 }, { "epoch": 0.6489273483118748, "learning_rate": 7.868556401276767e-06, "loss": 2.92198974609375, "step": 537800 }, { "epoch": 0.6490480116343575, "learning_rate": 7.86815256580903e-06, "loss": 2.8931451416015626, "step": 537900 }, { "epoch": 0.6491686749568403, "learning_rate": 7.86774873034129e-06, "loss": 2.90304443359375, "step": 538000 }, { "epoch": 0.6492893382793229, "learning_rate": 7.867344894873551e-06, "loss": 2.8974130249023435, "step": 538100 }, { "epoch": 0.6494100016018056, "learning_rate": 7.866941059405813e-06, "loss": 2.9123568725585938, "step": 538200 }, { "epoch": 0.6495306649242882, "learning_rate": 7.866537223938074e-06, "loss": 2.8980618286132813, "step": 538300 }, { "epoch": 0.649651328246771, "learning_rate": 7.866133388470336e-06, "loss": 2.9039300537109374, "step": 538400 }, { "epoch": 0.6497719915692537, "learning_rate": 7.865729553002598e-06, "loss": 2.903240051269531, "step": 538500 }, { "epoch": 0.6498926548917363, "learning_rate": 7.86532571753486e-06, "loss": 2.888386535644531, "step": 538600 }, { "epoch": 0.650013318214219, "learning_rate": 7.864921882067122e-06, "loss": 2.865736389160156, "step": 538700 }, { "epoch": 0.6501339815367017, "learning_rate": 7.864518046599384e-06, "loss": 2.8814651489257814, "step": 538800 }, { "epoch": 0.6502546448591844, "learning_rate": 7.864114211131646e-06, "loss": 2.9174713134765624, "step": 538900 }, { "epoch": 0.6503753081816671, "learning_rate": 7.863710375663906e-06, "loss": 2.8867333984375, "step": 539000 }, { "epoch": 0.6504959715041497, "learning_rate": 7.863306540196168e-06, "loss": 2.8783908081054688, "step": 539100 }, { "epoch": 0.6506166348266325, "learning_rate": 7.862902704728428e-06, "loss": 2.9131756591796876, "step": 539200 }, { "epoch": 0.6507372981491152, "learning_rate": 7.86249886926069e-06, "loss": 2.917720947265625, "step": 539300 }, { "epoch": 0.6508579614715978, "learning_rate": 7.862095033792952e-06, "loss": 2.915721130371094, "step": 539400 }, { "epoch": 0.6509786247940805, "learning_rate": 7.861691198325214e-06, "loss": 2.9115286254882813, "step": 539500 }, { "epoch": 0.6510992881165631, "learning_rate": 7.861287362857476e-06, "loss": 2.913331298828125, "step": 539600 }, { "epoch": 0.6512199514390459, "learning_rate": 7.860883527389738e-06, "loss": 2.9298211669921876, "step": 539700 }, { "epoch": 0.6513406147615286, "learning_rate": 7.860479691922e-06, "loss": 2.917668762207031, "step": 539800 }, { "epoch": 0.6514612780840112, "learning_rate": 7.86007585645426e-06, "loss": 2.8871951293945313, "step": 539900 }, { "epoch": 0.651581941406494, "learning_rate": 7.859672020986522e-06, "loss": 2.9174041748046875, "step": 540000 }, { "epoch": 0.6517026047289766, "learning_rate": 7.859268185518784e-06, "loss": 2.891155090332031, "step": 540100 }, { "epoch": 0.6518232680514593, "learning_rate": 7.858864350051045e-06, "loss": 2.8895083618164064, "step": 540200 }, { "epoch": 0.651943931373942, "learning_rate": 7.858460514583307e-06, "loss": 2.8884426879882814, "step": 540300 }, { "epoch": 0.6520645946964246, "learning_rate": 7.858056679115569e-06, "loss": 2.8725735473632814, "step": 540400 }, { "epoch": 0.6521852580189074, "learning_rate": 7.85765284364783e-06, "loss": 2.8968325805664064, "step": 540500 }, { "epoch": 0.65230592134139, "learning_rate": 7.857249008180093e-06, "loss": 2.8704620361328126, "step": 540600 }, { "epoch": 0.6524265846638727, "learning_rate": 7.856845172712355e-06, "loss": 2.915482177734375, "step": 540700 }, { "epoch": 0.6525472479863554, "learning_rate": 7.856441337244615e-06, "loss": 2.9027215576171876, "step": 540800 }, { "epoch": 0.6526679113088381, "learning_rate": 7.856037501776877e-06, "loss": 2.912454833984375, "step": 540900 }, { "epoch": 0.6527885746313208, "learning_rate": 7.855633666309139e-06, "loss": 2.90088134765625, "step": 541000 }, { "epoch": 0.6529092379538034, "learning_rate": 7.855229830841399e-06, "loss": 2.918892822265625, "step": 541100 }, { "epoch": 0.6530299012762861, "learning_rate": 7.854825995373661e-06, "loss": 2.8833172607421873, "step": 541200 }, { "epoch": 0.6531505645987689, "learning_rate": 7.854422159905923e-06, "loss": 2.8815362548828123, "step": 541300 }, { "epoch": 0.6532712279212515, "learning_rate": 7.854018324438185e-06, "loss": 2.908486633300781, "step": 541400 }, { "epoch": 0.6533918912437342, "learning_rate": 7.853614488970447e-06, "loss": 2.8756982421875, "step": 541500 }, { "epoch": 0.6535125545662168, "learning_rate": 7.853210653502707e-06, "loss": 2.8931463623046874, "step": 541600 }, { "epoch": 0.6536332178886995, "learning_rate": 7.85280681803497e-06, "loss": 2.898650817871094, "step": 541700 }, { "epoch": 0.6537538812111823, "learning_rate": 7.852402982567231e-06, "loss": 2.897416687011719, "step": 541800 }, { "epoch": 0.6538745445336649, "learning_rate": 7.851999147099493e-06, "loss": 2.9071905517578127, "step": 541900 }, { "epoch": 0.6539952078561476, "learning_rate": 7.851595311631755e-06, "loss": 2.8878460693359376, "step": 542000 }, { "epoch": 0.6541158711786302, "learning_rate": 7.851191476164016e-06, "loss": 2.900864562988281, "step": 542100 }, { "epoch": 0.654236534501113, "learning_rate": 7.850787640696278e-06, "loss": 2.8920828247070314, "step": 542200 }, { "epoch": 0.6543571978235957, "learning_rate": 7.85038380522854e-06, "loss": 2.870994873046875, "step": 542300 }, { "epoch": 0.6544778611460783, "learning_rate": 7.8499799697608e-06, "loss": 2.911165466308594, "step": 542400 }, { "epoch": 0.654598524468561, "learning_rate": 7.849576134293062e-06, "loss": 2.9239794921875, "step": 542500 }, { "epoch": 0.6547191877910437, "learning_rate": 7.849172298825324e-06, "loss": 2.8798031616210937, "step": 542600 }, { "epoch": 0.6548398511135264, "learning_rate": 7.848768463357586e-06, "loss": 2.885004577636719, "step": 542700 }, { "epoch": 0.6549605144360091, "learning_rate": 7.848364627889848e-06, "loss": 2.8778231811523436, "step": 542800 }, { "epoch": 0.6550811777584917, "learning_rate": 7.84796079242211e-06, "loss": 2.9184939575195314, "step": 542900 }, { "epoch": 0.6552018410809745, "learning_rate": 7.84755695695437e-06, "loss": 2.8894195556640625, "step": 543000 }, { "epoch": 0.6553225044034571, "learning_rate": 7.847153121486632e-06, "loss": 2.8782662963867187, "step": 543100 }, { "epoch": 0.6554431677259398, "learning_rate": 7.846749286018894e-06, "loss": 2.894966735839844, "step": 543200 }, { "epoch": 0.6555638310484225, "learning_rate": 7.846345450551154e-06, "loss": 2.8925051879882813, "step": 543300 }, { "epoch": 0.6556844943709051, "learning_rate": 7.845941615083416e-06, "loss": 2.905179748535156, "step": 543400 }, { "epoch": 0.6558051576933879, "learning_rate": 7.845537779615678e-06, "loss": 2.90675048828125, "step": 543500 }, { "epoch": 0.6559258210158705, "learning_rate": 7.84513394414794e-06, "loss": 2.889992370605469, "step": 543600 }, { "epoch": 0.6560464843383532, "learning_rate": 7.844730108680202e-06, "loss": 2.8882940673828124, "step": 543700 }, { "epoch": 0.656167147660836, "learning_rate": 7.844326273212464e-06, "loss": 2.8928472900390627, "step": 543800 }, { "epoch": 0.6562878109833186, "learning_rate": 7.843922437744726e-06, "loss": 2.8955841064453125, "step": 543900 }, { "epoch": 0.6564084743058013, "learning_rate": 7.843518602276986e-06, "loss": 2.890169677734375, "step": 544000 }, { "epoch": 0.656529137628284, "learning_rate": 7.843114766809248e-06, "loss": 2.8813189697265624, "step": 544100 }, { "epoch": 0.6566498009507666, "learning_rate": 7.842710931341509e-06, "loss": 2.9042623901367186, "step": 544200 }, { "epoch": 0.6567704642732494, "learning_rate": 7.84230709587377e-06, "loss": 2.8564773559570313, "step": 544300 }, { "epoch": 0.656891127595732, "learning_rate": 7.841903260406033e-06, "loss": 2.887789306640625, "step": 544400 }, { "epoch": 0.6570117909182147, "learning_rate": 7.841499424938295e-06, "loss": 2.8893804931640625, "step": 544500 }, { "epoch": 0.6571324542406974, "learning_rate": 7.841095589470557e-06, "loss": 2.893466796875, "step": 544600 }, { "epoch": 0.6572531175631801, "learning_rate": 7.840691754002819e-06, "loss": 2.8943426513671877, "step": 544700 }, { "epoch": 0.6573737808856628, "learning_rate": 7.840287918535079e-06, "loss": 2.911033020019531, "step": 544800 }, { "epoch": 0.6574944442081454, "learning_rate": 7.839884083067341e-06, "loss": 2.89703857421875, "step": 544900 }, { "epoch": 0.6576151075306281, "learning_rate": 7.839480247599603e-06, "loss": 2.886546936035156, "step": 545000 }, { "epoch": 0.6577357708531109, "learning_rate": 7.839076412131865e-06, "loss": 2.8962164306640625, "step": 545100 }, { "epoch": 0.6578564341755935, "learning_rate": 7.838672576664125e-06, "loss": 2.9256500244140624, "step": 545200 }, { "epoch": 0.6579770974980762, "learning_rate": 7.838268741196387e-06, "loss": 2.8784664916992186, "step": 545300 }, { "epoch": 0.6580977608205588, "learning_rate": 7.837864905728649e-06, "loss": 2.907110595703125, "step": 545400 }, { "epoch": 0.6582184241430415, "learning_rate": 7.837461070260911e-06, "loss": 2.900867614746094, "step": 545500 }, { "epoch": 0.6583390874655243, "learning_rate": 7.837057234793173e-06, "loss": 2.909971923828125, "step": 545600 }, { "epoch": 0.6584597507880069, "learning_rate": 7.836653399325433e-06, "loss": 2.9139413452148437, "step": 545700 }, { "epoch": 0.6585804141104896, "learning_rate": 7.836249563857695e-06, "loss": 2.920662841796875, "step": 545800 }, { "epoch": 0.6587010774329722, "learning_rate": 7.835845728389957e-06, "loss": 2.9010275268554686, "step": 545900 }, { "epoch": 0.658821740755455, "learning_rate": 7.83544189292222e-06, "loss": 2.8878598022460937, "step": 546000 }, { "epoch": 0.6589424040779377, "learning_rate": 7.83503805745448e-06, "loss": 2.9176119995117187, "step": 546100 }, { "epoch": 0.6590630674004203, "learning_rate": 7.834634221986742e-06, "loss": 2.9249783325195313, "step": 546200 }, { "epoch": 0.659183730722903, "learning_rate": 7.834230386519004e-06, "loss": 2.901019287109375, "step": 546300 }, { "epoch": 0.6593043940453857, "learning_rate": 7.833826551051266e-06, "loss": 2.8969735717773437, "step": 546400 }, { "epoch": 0.6594250573678684, "learning_rate": 7.833422715583526e-06, "loss": 2.8929318237304686, "step": 546500 }, { "epoch": 0.6595457206903511, "learning_rate": 7.833018880115788e-06, "loss": 2.9113809204101564, "step": 546600 }, { "epoch": 0.6596663840128337, "learning_rate": 7.83261504464805e-06, "loss": 2.8651937866210937, "step": 546700 }, { "epoch": 0.6597870473353165, "learning_rate": 7.832211209180312e-06, "loss": 2.898782958984375, "step": 546800 }, { "epoch": 0.6599077106577991, "learning_rate": 7.831807373712574e-06, "loss": 2.9068112182617187, "step": 546900 }, { "epoch": 0.6600283739802818, "learning_rate": 7.831403538244836e-06, "loss": 2.8640316772460936, "step": 547000 }, { "epoch": 0.6601490373027645, "learning_rate": 7.830999702777096e-06, "loss": 2.8768670654296873, "step": 547100 }, { "epoch": 0.6602697006252471, "learning_rate": 7.830595867309358e-06, "loss": 2.9254611206054686, "step": 547200 }, { "epoch": 0.6603903639477299, "learning_rate": 7.830192031841618e-06, "loss": 2.8940365600585936, "step": 547300 }, { "epoch": 0.6605110272702125, "learning_rate": 7.82978819637388e-06, "loss": 2.888963317871094, "step": 547400 }, { "epoch": 0.6606316905926952, "learning_rate": 7.829384360906142e-06, "loss": 2.8824942016601565, "step": 547500 }, { "epoch": 0.660752353915178, "learning_rate": 7.828980525438404e-06, "loss": 2.8810000610351563, "step": 547600 }, { "epoch": 0.6608730172376606, "learning_rate": 7.828576689970666e-06, "loss": 2.872586975097656, "step": 547700 }, { "epoch": 0.6609936805601433, "learning_rate": 7.828172854502928e-06, "loss": 2.8890869140625, "step": 547800 }, { "epoch": 0.6611143438826259, "learning_rate": 7.82776901903519e-06, "loss": 2.902843017578125, "step": 547900 }, { "epoch": 0.6612350072051086, "learning_rate": 7.827365183567452e-06, "loss": 2.8827139282226564, "step": 548000 }, { "epoch": 0.6613556705275914, "learning_rate": 7.826961348099712e-06, "loss": 2.8952496337890623, "step": 548100 }, { "epoch": 0.661476333850074, "learning_rate": 7.826557512631974e-06, "loss": 2.892314758300781, "step": 548200 }, { "epoch": 0.6615969971725567, "learning_rate": 7.826153677164235e-06, "loss": 2.9087774658203127, "step": 548300 }, { "epoch": 0.6617176604950393, "learning_rate": 7.825749841696497e-06, "loss": 2.8974014282226563, "step": 548400 }, { "epoch": 0.6618383238175221, "learning_rate": 7.825346006228759e-06, "loss": 2.88627685546875, "step": 548500 }, { "epoch": 0.6619589871400048, "learning_rate": 7.82494217076102e-06, "loss": 2.8855911254882813, "step": 548600 }, { "epoch": 0.6620796504624874, "learning_rate": 7.824538335293283e-06, "loss": 2.867442932128906, "step": 548700 }, { "epoch": 0.6622003137849701, "learning_rate": 7.824134499825545e-06, "loss": 2.892622985839844, "step": 548800 }, { "epoch": 0.6623209771074527, "learning_rate": 7.823730664357805e-06, "loss": 2.8662149047851564, "step": 548900 }, { "epoch": 0.6624416404299355, "learning_rate": 7.823326828890067e-06, "loss": 2.9218402099609375, "step": 549000 }, { "epoch": 0.6625623037524182, "learning_rate": 7.822922993422329e-06, "loss": 2.87510009765625, "step": 549100 }, { "epoch": 0.6626829670749008, "learning_rate": 7.822519157954591e-06, "loss": 2.8868499755859376, "step": 549200 }, { "epoch": 0.6628036303973835, "learning_rate": 7.822115322486851e-06, "loss": 2.8812124633789065, "step": 549300 }, { "epoch": 0.6629242937198663, "learning_rate": 7.821711487019113e-06, "loss": 2.9025885009765626, "step": 549400 }, { "epoch": 0.6630449570423489, "learning_rate": 7.821307651551375e-06, "loss": 2.873065185546875, "step": 549500 }, { "epoch": 0.6631656203648316, "learning_rate": 7.820903816083637e-06, "loss": 2.8949411010742185, "step": 549600 }, { "epoch": 0.6632862836873142, "learning_rate": 7.820499980615897e-06, "loss": 2.8904754638671877, "step": 549700 }, { "epoch": 0.663406947009797, "learning_rate": 7.82009614514816e-06, "loss": 2.906838684082031, "step": 549800 }, { "epoch": 0.6635276103322797, "learning_rate": 7.819692309680421e-06, "loss": 2.8911181640625, "step": 549900 }, { "epoch": 0.6636482736547623, "learning_rate": 7.819288474212683e-06, "loss": 2.869093933105469, "step": 550000 }, { "epoch": 0.663768936977245, "learning_rate": 7.818884638744945e-06, "loss": 2.8962200927734374, "step": 550100 }, { "epoch": 0.6638896002997277, "learning_rate": 7.818480803277206e-06, "loss": 2.8813595581054687, "step": 550200 }, { "epoch": 0.6640102636222104, "learning_rate": 7.818076967809468e-06, "loss": 2.9032928466796877, "step": 550300 }, { "epoch": 0.6641309269446931, "learning_rate": 7.81767313234173e-06, "loss": 2.9056414794921874, "step": 550400 }, { "epoch": 0.6642515902671757, "learning_rate": 7.81726929687399e-06, "loss": 2.890927429199219, "step": 550500 }, { "epoch": 0.6643722535896585, "learning_rate": 7.816865461406252e-06, "loss": 2.86630615234375, "step": 550600 }, { "epoch": 0.6644929169121411, "learning_rate": 7.816461625938514e-06, "loss": 2.8881985473632814, "step": 550700 }, { "epoch": 0.6646135802346238, "learning_rate": 7.816057790470776e-06, "loss": 2.9093582153320314, "step": 550800 }, { "epoch": 0.6647342435571065, "learning_rate": 7.815653955003038e-06, "loss": 2.8779608154296876, "step": 550900 }, { "epoch": 0.6648549068795891, "learning_rate": 7.8152501195353e-06, "loss": 2.8884927368164064, "step": 551000 }, { "epoch": 0.6649755702020719, "learning_rate": 7.814846284067562e-06, "loss": 2.8700637817382812, "step": 551100 }, { "epoch": 0.6650962335245545, "learning_rate": 7.814442448599822e-06, "loss": 2.9007708740234377, "step": 551200 }, { "epoch": 0.6652168968470372, "learning_rate": 7.814038613132084e-06, "loss": 2.8968634033203124, "step": 551300 }, { "epoch": 0.66533756016952, "learning_rate": 7.813634777664344e-06, "loss": 2.8800799560546877, "step": 551400 }, { "epoch": 0.6654582234920026, "learning_rate": 7.813230942196606e-06, "loss": 2.9100927734375, "step": 551500 }, { "epoch": 0.6655788868144853, "learning_rate": 7.812827106728868e-06, "loss": 2.918765869140625, "step": 551600 }, { "epoch": 0.6656995501369679, "learning_rate": 7.81242327126113e-06, "loss": 2.8859066772460937, "step": 551700 }, { "epoch": 0.6658202134594506, "learning_rate": 7.812019435793392e-06, "loss": 2.8692236328125, "step": 551800 }, { "epoch": 0.6659408767819334, "learning_rate": 7.811615600325654e-06, "loss": 2.88407958984375, "step": 551900 }, { "epoch": 0.666061540104416, "learning_rate": 7.811211764857916e-06, "loss": 2.8988983154296877, "step": 552000 }, { "epoch": 0.6661822034268987, "learning_rate": 7.810807929390177e-06, "loss": 2.884002990722656, "step": 552100 }, { "epoch": 0.6663028667493813, "learning_rate": 7.810404093922438e-06, "loss": 2.8778765869140623, "step": 552200 }, { "epoch": 0.6664235300718641, "learning_rate": 7.8100002584547e-06, "loss": 2.8798202514648437, "step": 552300 }, { "epoch": 0.6665441933943468, "learning_rate": 7.80959642298696e-06, "loss": 2.880676574707031, "step": 552400 }, { "epoch": 0.6666648567168294, "learning_rate": 7.809192587519223e-06, "loss": 2.888607177734375, "step": 552500 }, { "epoch": 0.6667855200393121, "learning_rate": 7.808788752051485e-06, "loss": 2.883059387207031, "step": 552600 }, { "epoch": 0.6669061833617947, "learning_rate": 7.808384916583747e-06, "loss": 2.8970391845703123, "step": 552700 }, { "epoch": 0.6670268466842775, "learning_rate": 7.807981081116009e-06, "loss": 2.9010162353515625, "step": 552800 }, { "epoch": 0.6671475100067602, "learning_rate": 7.80757724564827e-06, "loss": 2.875140380859375, "step": 552900 }, { "epoch": 0.6672681733292428, "learning_rate": 7.807173410180531e-06, "loss": 2.8983416748046875, "step": 553000 }, { "epoch": 0.6673888366517255, "learning_rate": 7.806769574712793e-06, "loss": 2.8651605224609376, "step": 553100 }, { "epoch": 0.6675094999742082, "learning_rate": 7.806365739245055e-06, "loss": 2.8826727294921874, "step": 553200 }, { "epoch": 0.6676301632966909, "learning_rate": 7.805961903777315e-06, "loss": 2.87650146484375, "step": 553300 }, { "epoch": 0.6677508266191736, "learning_rate": 7.805558068309577e-06, "loss": 2.870502624511719, "step": 553400 }, { "epoch": 0.6678714899416562, "learning_rate": 7.80515423284184e-06, "loss": 2.8962478637695312, "step": 553500 }, { "epoch": 0.667992153264139, "learning_rate": 7.804750397374101e-06, "loss": 2.9070758056640624, "step": 553600 }, { "epoch": 0.6681128165866216, "learning_rate": 7.804346561906363e-06, "loss": 2.87674560546875, "step": 553700 }, { "epoch": 0.6682334799091043, "learning_rate": 7.803942726438623e-06, "loss": 2.872855224609375, "step": 553800 }, { "epoch": 0.668354143231587, "learning_rate": 7.803538890970885e-06, "loss": 2.8738970947265625, "step": 553900 }, { "epoch": 0.6684748065540697, "learning_rate": 7.803135055503147e-06, "loss": 2.862540588378906, "step": 554000 }, { "epoch": 0.6685954698765524, "learning_rate": 7.80273122003541e-06, "loss": 2.900754089355469, "step": 554100 }, { "epoch": 0.668716133199035, "learning_rate": 7.802327384567671e-06, "loss": 2.8874362182617186, "step": 554200 }, { "epoch": 0.6688367965215177, "learning_rate": 7.801923549099932e-06, "loss": 2.8697039794921877, "step": 554300 }, { "epoch": 0.6689574598440005, "learning_rate": 7.801519713632194e-06, "loss": 2.8760580444335937, "step": 554400 }, { "epoch": 0.6690781231664831, "learning_rate": 7.801115878164456e-06, "loss": 2.8804000854492187, "step": 554500 }, { "epoch": 0.6691987864889658, "learning_rate": 7.800712042696716e-06, "loss": 2.889403991699219, "step": 554600 }, { "epoch": 0.6693194498114485, "learning_rate": 7.800308207228978e-06, "loss": 2.8754501342773438, "step": 554700 }, { "epoch": 0.6694401131339311, "learning_rate": 7.79990437176124e-06, "loss": 2.895796203613281, "step": 554800 }, { "epoch": 0.6695607764564139, "learning_rate": 7.799500536293502e-06, "loss": 2.9030282592773435, "step": 554900 }, { "epoch": 0.6696814397788965, "learning_rate": 7.799096700825764e-06, "loss": 2.8908013916015625, "step": 555000 }, { "epoch": 0.6698021031013792, "learning_rate": 7.798692865358026e-06, "loss": 2.875460205078125, "step": 555100 }, { "epoch": 0.669922766423862, "learning_rate": 7.798289029890286e-06, "loss": 2.8758810424804686, "step": 555200 }, { "epoch": 0.6700434297463446, "learning_rate": 7.797885194422548e-06, "loss": 2.8593960571289063, "step": 555300 }, { "epoch": 0.6701640930688273, "learning_rate": 7.79748135895481e-06, "loss": 2.8479013061523437, "step": 555400 }, { "epoch": 0.6702847563913099, "learning_rate": 7.79707752348707e-06, "loss": 2.8833963012695314, "step": 555500 }, { "epoch": 0.6704054197137926, "learning_rate": 7.796673688019332e-06, "loss": 2.8628692626953125, "step": 555600 }, { "epoch": 0.6705260830362754, "learning_rate": 7.796269852551594e-06, "loss": 2.881380310058594, "step": 555700 }, { "epoch": 0.670646746358758, "learning_rate": 7.795866017083856e-06, "loss": 2.838923034667969, "step": 555800 }, { "epoch": 0.6707674096812407, "learning_rate": 7.795462181616118e-06, "loss": 2.894267883300781, "step": 555900 }, { "epoch": 0.6708880730037233, "learning_rate": 7.79505834614838e-06, "loss": 2.883511962890625, "step": 556000 }, { "epoch": 0.6710087363262061, "learning_rate": 7.794654510680642e-06, "loss": 2.87624755859375, "step": 556100 }, { "epoch": 0.6711293996486888, "learning_rate": 7.794250675212903e-06, "loss": 2.878243713378906, "step": 556200 }, { "epoch": 0.6712500629711714, "learning_rate": 7.793846839745165e-06, "loss": 2.8911016845703124, "step": 556300 }, { "epoch": 0.6713707262936541, "learning_rate": 7.793443004277425e-06, "loss": 2.903614196777344, "step": 556400 }, { "epoch": 0.6714913896161367, "learning_rate": 7.793039168809687e-06, "loss": 2.8828045654296877, "step": 556500 }, { "epoch": 0.6716120529386195, "learning_rate": 7.792635333341949e-06, "loss": 2.909044189453125, "step": 556600 }, { "epoch": 0.6717327162611022, "learning_rate": 7.79223149787421e-06, "loss": 2.8577044677734373, "step": 556700 }, { "epoch": 0.6718533795835848, "learning_rate": 7.791827662406473e-06, "loss": 2.886777038574219, "step": 556800 }, { "epoch": 0.6719740429060675, "learning_rate": 7.791423826938735e-06, "loss": 2.8680679321289064, "step": 556900 }, { "epoch": 0.6720947062285502, "learning_rate": 7.791019991470997e-06, "loss": 2.887698059082031, "step": 557000 }, { "epoch": 0.6722153695510329, "learning_rate": 7.790616156003257e-06, "loss": 2.8616558837890627, "step": 557100 }, { "epoch": 0.6723360328735156, "learning_rate": 7.790212320535519e-06, "loss": 2.892606201171875, "step": 557200 }, { "epoch": 0.6724566961959982, "learning_rate": 7.789808485067781e-06, "loss": 2.870316467285156, "step": 557300 }, { "epoch": 0.672577359518481, "learning_rate": 7.789404649600041e-06, "loss": 2.85173095703125, "step": 557400 }, { "epoch": 0.6726980228409636, "learning_rate": 7.789000814132303e-06, "loss": 2.8881787109375, "step": 557500 }, { "epoch": 0.6728186861634463, "learning_rate": 7.788596978664565e-06, "loss": 2.86265625, "step": 557600 }, { "epoch": 0.672939349485929, "learning_rate": 7.788193143196827e-06, "loss": 2.87184814453125, "step": 557700 }, { "epoch": 0.6730600128084117, "learning_rate": 7.78778930772909e-06, "loss": 2.89560302734375, "step": 557800 }, { "epoch": 0.6731806761308944, "learning_rate": 7.78738547226135e-06, "loss": 2.8589797973632813, "step": 557900 }, { "epoch": 0.673301339453377, "learning_rate": 7.786981636793611e-06, "loss": 2.8650192260742187, "step": 558000 }, { "epoch": 0.6734220027758597, "learning_rate": 7.786577801325873e-06, "loss": 2.9020370483398437, "step": 558100 }, { "epoch": 0.6735426660983425, "learning_rate": 7.786173965858135e-06, "loss": 2.876556091308594, "step": 558200 }, { "epoch": 0.6736633294208251, "learning_rate": 7.785770130390396e-06, "loss": 2.868436279296875, "step": 558300 }, { "epoch": 0.6737839927433078, "learning_rate": 7.785366294922658e-06, "loss": 2.885539855957031, "step": 558400 }, { "epoch": 0.6739046560657904, "learning_rate": 7.78496245945492e-06, "loss": 2.886922607421875, "step": 558500 }, { "epoch": 0.6740253193882731, "learning_rate": 7.784558623987182e-06, "loss": 2.8880572509765625, "step": 558600 }, { "epoch": 0.6741459827107559, "learning_rate": 7.784154788519442e-06, "loss": 2.873570556640625, "step": 558700 }, { "epoch": 0.6742666460332385, "learning_rate": 7.783750953051704e-06, "loss": 2.9087109375, "step": 558800 }, { "epoch": 0.6743873093557212, "learning_rate": 7.783347117583966e-06, "loss": 2.8594561767578126, "step": 558900 }, { "epoch": 0.6745079726782038, "learning_rate": 7.782943282116228e-06, "loss": 2.8572076416015624, "step": 559000 }, { "epoch": 0.6746286360006866, "learning_rate": 7.78253944664849e-06, "loss": 2.8629010009765623, "step": 559100 }, { "epoch": 0.6747492993231693, "learning_rate": 7.782135611180752e-06, "loss": 2.88161865234375, "step": 559200 }, { "epoch": 0.6748699626456519, "learning_rate": 7.781731775713012e-06, "loss": 2.8737612915039064, "step": 559300 }, { "epoch": 0.6749906259681346, "learning_rate": 7.781327940245274e-06, "loss": 2.8823065185546874, "step": 559400 }, { "epoch": 0.6751112892906173, "learning_rate": 7.780924104777534e-06, "loss": 2.863649597167969, "step": 559500 }, { "epoch": 0.6752319526131, "learning_rate": 7.780520269309796e-06, "loss": 2.854613952636719, "step": 559600 }, { "epoch": 0.6753526159355827, "learning_rate": 7.780116433842058e-06, "loss": 2.85444091796875, "step": 559700 }, { "epoch": 0.6754732792580653, "learning_rate": 7.77971259837432e-06, "loss": 2.898060607910156, "step": 559800 }, { "epoch": 0.6755939425805481, "learning_rate": 7.779308762906582e-06, "loss": 2.9172439575195312, "step": 559900 }, { "epoch": 0.6757146059030308, "learning_rate": 7.778904927438844e-06, "loss": 2.8942379760742187, "step": 560000 }, { "epoch": 0.6758352692255134, "learning_rate": 7.778501091971106e-06, "loss": 2.8584835815429686, "step": 560100 }, { "epoch": 0.6759559325479961, "learning_rate": 7.778097256503367e-06, "loss": 2.872791748046875, "step": 560200 }, { "epoch": 0.6760765958704787, "learning_rate": 7.777693421035629e-06, "loss": 2.903233947753906, "step": 560300 }, { "epoch": 0.6761972591929615, "learning_rate": 7.77728958556789e-06, "loss": 2.845096435546875, "step": 560400 }, { "epoch": 0.6763179225154442, "learning_rate": 7.776885750100151e-06, "loss": 2.8757818603515624, "step": 560500 }, { "epoch": 0.6764385858379268, "learning_rate": 7.776481914632413e-06, "loss": 2.8799420166015626, "step": 560600 }, { "epoch": 0.6765592491604095, "learning_rate": 7.776078079164675e-06, "loss": 2.8757839965820313, "step": 560700 }, { "epoch": 0.6766799124828922, "learning_rate": 7.775674243696937e-06, "loss": 2.8814715576171874, "step": 560800 }, { "epoch": 0.6768005758053749, "learning_rate": 7.775270408229199e-06, "loss": 2.871025390625, "step": 560900 }, { "epoch": 0.6769212391278576, "learning_rate": 7.77486657276146e-06, "loss": 2.8730758666992187, "step": 561000 }, { "epoch": 0.6770419024503402, "learning_rate": 7.774462737293723e-06, "loss": 2.8659014892578125, "step": 561100 }, { "epoch": 0.677162565772823, "learning_rate": 7.774058901825983e-06, "loss": 2.870810546875, "step": 561200 }, { "epoch": 0.6772832290953056, "learning_rate": 7.773655066358245e-06, "loss": 2.8903762817382814, "step": 561300 }, { "epoch": 0.6774038924177883, "learning_rate": 7.773251230890505e-06, "loss": 2.8667633056640627, "step": 561400 }, { "epoch": 0.677524555740271, "learning_rate": 7.772847395422767e-06, "loss": 2.8895559692382813, "step": 561500 }, { "epoch": 0.6776452190627537, "learning_rate": 7.77244355995503e-06, "loss": 2.868918762207031, "step": 561600 }, { "epoch": 0.6777658823852364, "learning_rate": 7.772039724487291e-06, "loss": 2.854873046875, "step": 561700 }, { "epoch": 0.677886545707719, "learning_rate": 7.771635889019553e-06, "loss": 2.884571533203125, "step": 561800 }, { "epoch": 0.6780072090302017, "learning_rate": 7.771232053551815e-06, "loss": 2.8823175048828125, "step": 561900 }, { "epoch": 0.6781278723526845, "learning_rate": 7.770828218084076e-06, "loss": 2.876451110839844, "step": 562000 }, { "epoch": 0.6782485356751671, "learning_rate": 7.770424382616337e-06, "loss": 2.8530618286132814, "step": 562100 }, { "epoch": 0.6783691989976498, "learning_rate": 7.7700205471486e-06, "loss": 2.8595480346679687, "step": 562200 }, { "epoch": 0.6784898623201324, "learning_rate": 7.769616711680861e-06, "loss": 2.8763507080078123, "step": 562300 }, { "epoch": 0.6786105256426151, "learning_rate": 7.769212876213122e-06, "loss": 2.8865179443359374, "step": 562400 }, { "epoch": 0.6787311889650979, "learning_rate": 7.768809040745384e-06, "loss": 2.8828839111328124, "step": 562500 }, { "epoch": 0.6788518522875805, "learning_rate": 7.768405205277646e-06, "loss": 2.8752972412109377, "step": 562600 }, { "epoch": 0.6789725156100632, "learning_rate": 7.768001369809908e-06, "loss": 2.8934088134765625, "step": 562700 }, { "epoch": 0.6790931789325458, "learning_rate": 7.767597534342168e-06, "loss": 2.8764599609375, "step": 562800 }, { "epoch": 0.6792138422550286, "learning_rate": 7.76719369887443e-06, "loss": 2.8791510009765626, "step": 562900 }, { "epoch": 0.6793345055775113, "learning_rate": 7.766789863406692e-06, "loss": 2.8823703002929686, "step": 563000 }, { "epoch": 0.6794551688999939, "learning_rate": 7.766386027938954e-06, "loss": 2.8865802001953127, "step": 563100 }, { "epoch": 0.6795758322224766, "learning_rate": 7.765982192471216e-06, "loss": 2.876112060546875, "step": 563200 }, { "epoch": 0.6796964955449593, "learning_rate": 7.765578357003478e-06, "loss": 2.8465057373046876, "step": 563300 }, { "epoch": 0.679817158867442, "learning_rate": 7.765174521535738e-06, "loss": 2.87403076171875, "step": 563400 }, { "epoch": 0.6799378221899247, "learning_rate": 7.764770686068e-06, "loss": 2.8897393798828124, "step": 563500 }, { "epoch": 0.6800584855124073, "learning_rate": 7.76436685060026e-06, "loss": 2.874971618652344, "step": 563600 }, { "epoch": 0.6801791488348901, "learning_rate": 7.763963015132522e-06, "loss": 2.8601336669921875, "step": 563700 }, { "epoch": 0.6802998121573727, "learning_rate": 7.763559179664784e-06, "loss": 2.8728759765625, "step": 563800 }, { "epoch": 0.6804204754798554, "learning_rate": 7.763155344197046e-06, "loss": 2.869473876953125, "step": 563900 }, { "epoch": 0.6805411388023381, "learning_rate": 7.762751508729308e-06, "loss": 2.876650390625, "step": 564000 }, { "epoch": 0.6806618021248207, "learning_rate": 7.76234767326157e-06, "loss": 2.8839767456054686, "step": 564100 }, { "epoch": 0.6807824654473035, "learning_rate": 7.761943837793832e-06, "loss": 2.8563507080078123, "step": 564200 }, { "epoch": 0.6809031287697861, "learning_rate": 7.761540002326093e-06, "loss": 2.9017193603515623, "step": 564300 }, { "epoch": 0.6810237920922688, "learning_rate": 7.761136166858355e-06, "loss": 2.8523788452148438, "step": 564400 }, { "epoch": 0.6811444554147515, "learning_rate": 7.760732331390617e-06, "loss": 2.8543975830078123, "step": 564500 }, { "epoch": 0.6812651187372342, "learning_rate": 7.760328495922877e-06, "loss": 2.901194763183594, "step": 564600 }, { "epoch": 0.6813857820597169, "learning_rate": 7.759924660455139e-06, "loss": 2.888547058105469, "step": 564700 }, { "epoch": 0.6815064453821995, "learning_rate": 7.759520824987401e-06, "loss": 2.8899765014648438, "step": 564800 }, { "epoch": 0.6816271087046822, "learning_rate": 7.759116989519663e-06, "loss": 2.892289733886719, "step": 564900 }, { "epoch": 0.681747772027165, "learning_rate": 7.758713154051925e-06, "loss": 2.869903869628906, "step": 565000 }, { "epoch": 0.6818684353496476, "learning_rate": 7.758309318584187e-06, "loss": 2.8770574951171874, "step": 565100 }, { "epoch": 0.6819890986721303, "learning_rate": 7.757905483116447e-06, "loss": 2.9096868896484374, "step": 565200 }, { "epoch": 0.682109761994613, "learning_rate": 7.757501647648709e-06, "loss": 2.8768850708007814, "step": 565300 }, { "epoch": 0.6822304253170957, "learning_rate": 7.757097812180971e-06, "loss": 2.8804562377929686, "step": 565400 }, { "epoch": 0.6823510886395784, "learning_rate": 7.756693976713231e-06, "loss": 2.8872064208984374, "step": 565500 }, { "epoch": 0.682471751962061, "learning_rate": 7.756290141245493e-06, "loss": 2.8703192138671874, "step": 565600 }, { "epoch": 0.6825924152845437, "learning_rate": 7.755886305777755e-06, "loss": 2.847398376464844, "step": 565700 }, { "epoch": 0.6827130786070265, "learning_rate": 7.755482470310017e-06, "loss": 2.879388427734375, "step": 565800 }, { "epoch": 0.6828337419295091, "learning_rate": 7.75507863484228e-06, "loss": 2.9059454345703126, "step": 565900 }, { "epoch": 0.6829544052519918, "learning_rate": 7.75467479937454e-06, "loss": 2.8791693115234374, "step": 566000 }, { "epoch": 0.6830750685744744, "learning_rate": 7.754270963906802e-06, "loss": 2.8903179931640626, "step": 566100 }, { "epoch": 0.6831957318969571, "learning_rate": 7.753867128439064e-06, "loss": 2.8886767578125, "step": 566200 }, { "epoch": 0.6833163952194399, "learning_rate": 7.753463292971326e-06, "loss": 2.874239501953125, "step": 566300 }, { "epoch": 0.6834370585419225, "learning_rate": 7.753059457503587e-06, "loss": 2.88536376953125, "step": 566400 }, { "epoch": 0.6835577218644052, "learning_rate": 7.752655622035848e-06, "loss": 2.879300537109375, "step": 566500 }, { "epoch": 0.6836783851868878, "learning_rate": 7.75225178656811e-06, "loss": 2.8782589721679686, "step": 566600 }, { "epoch": 0.6837990485093706, "learning_rate": 7.751847951100372e-06, "loss": 2.867265625, "step": 566700 }, { "epoch": 0.6839197118318533, "learning_rate": 7.751444115632634e-06, "loss": 2.8794720458984373, "step": 566800 }, { "epoch": 0.6840403751543359, "learning_rate": 7.751040280164894e-06, "loss": 2.8571954345703126, "step": 566900 }, { "epoch": 0.6841610384768186, "learning_rate": 7.750636444697156e-06, "loss": 2.857785949707031, "step": 567000 }, { "epoch": 0.6842817017993013, "learning_rate": 7.750232609229418e-06, "loss": 2.8535577392578126, "step": 567100 }, { "epoch": 0.684402365121784, "learning_rate": 7.74982877376168e-06, "loss": 2.8628280639648436, "step": 567200 }, { "epoch": 0.6845230284442667, "learning_rate": 7.749424938293942e-06, "loss": 2.8665975952148437, "step": 567300 }, { "epoch": 0.6846436917667493, "learning_rate": 7.749021102826202e-06, "loss": 2.8678985595703126, "step": 567400 }, { "epoch": 0.6847643550892321, "learning_rate": 7.748617267358464e-06, "loss": 2.882415771484375, "step": 567500 }, { "epoch": 0.6848850184117147, "learning_rate": 7.748213431890726e-06, "loss": 2.8546875, "step": 567600 }, { "epoch": 0.6850056817341974, "learning_rate": 7.747809596422986e-06, "loss": 2.8489559936523436, "step": 567700 }, { "epoch": 0.6851263450566801, "learning_rate": 7.747405760955248e-06, "loss": 2.883067321777344, "step": 567800 }, { "epoch": 0.6852470083791627, "learning_rate": 7.74700192548751e-06, "loss": 2.880250244140625, "step": 567900 }, { "epoch": 0.6853676717016455, "learning_rate": 7.746598090019772e-06, "loss": 2.9046136474609376, "step": 568000 }, { "epoch": 0.6854883350241281, "learning_rate": 7.746194254552034e-06, "loss": 2.8551254272460938, "step": 568100 }, { "epoch": 0.6856089983466108, "learning_rate": 7.745790419084296e-06, "loss": 2.8562921142578124, "step": 568200 }, { "epoch": 0.6857296616690935, "learning_rate": 7.745386583616558e-06, "loss": 2.8735302734375, "step": 568300 }, { "epoch": 0.6858503249915762, "learning_rate": 7.744982748148819e-06, "loss": 2.8759234619140623, "step": 568400 }, { "epoch": 0.6859709883140589, "learning_rate": 7.74457891268108e-06, "loss": 2.876201477050781, "step": 568500 }, { "epoch": 0.6860916516365415, "learning_rate": 7.744175077213341e-06, "loss": 2.869367980957031, "step": 568600 }, { "epoch": 0.6862123149590242, "learning_rate": 7.743771241745603e-06, "loss": 2.8561962890625, "step": 568700 }, { "epoch": 0.686332978281507, "learning_rate": 7.743367406277865e-06, "loss": 2.859227294921875, "step": 568800 }, { "epoch": 0.6864536416039896, "learning_rate": 7.742963570810127e-06, "loss": 2.875888671875, "step": 568900 }, { "epoch": 0.6865743049264723, "learning_rate": 7.742559735342389e-06, "loss": 2.8876577758789064, "step": 569000 }, { "epoch": 0.6866949682489549, "learning_rate": 7.742155899874651e-06, "loss": 2.861221923828125, "step": 569100 }, { "epoch": 0.6868156315714377, "learning_rate": 7.741752064406913e-06, "loss": 2.8677130126953125, "step": 569200 }, { "epoch": 0.6869362948939204, "learning_rate": 7.741348228939173e-06, "loss": 2.8819265747070313, "step": 569300 }, { "epoch": 0.687056958216403, "learning_rate": 7.740944393471435e-06, "loss": 2.8750811767578126, "step": 569400 }, { "epoch": 0.6871776215388857, "learning_rate": 7.740540558003697e-06, "loss": 2.8770632934570313, "step": 569500 }, { "epoch": 0.6872982848613683, "learning_rate": 7.740136722535957e-06, "loss": 2.865481262207031, "step": 569600 }, { "epoch": 0.6874189481838511, "learning_rate": 7.73973288706822e-06, "loss": 2.8378131103515627, "step": 569700 }, { "epoch": 0.6875396115063338, "learning_rate": 7.739329051600481e-06, "loss": 2.852716979980469, "step": 569800 }, { "epoch": 0.6876602748288164, "learning_rate": 7.738925216132743e-06, "loss": 2.863541259765625, "step": 569900 }, { "epoch": 0.6877809381512991, "learning_rate": 7.738521380665005e-06, "loss": 2.8488308715820314, "step": 570000 }, { "epoch": 0.6879016014737819, "learning_rate": 7.738117545197266e-06, "loss": 2.882537841796875, "step": 570100 }, { "epoch": 0.6880222647962645, "learning_rate": 7.737713709729528e-06, "loss": 2.847112731933594, "step": 570200 }, { "epoch": 0.6881429281187472, "learning_rate": 7.73730987426179e-06, "loss": 2.876348571777344, "step": 570300 }, { "epoch": 0.6882635914412298, "learning_rate": 7.736906038794052e-06, "loss": 2.889609069824219, "step": 570400 }, { "epoch": 0.6883842547637126, "learning_rate": 7.736502203326312e-06, "loss": 2.8449444580078125, "step": 570500 }, { "epoch": 0.6885049180861953, "learning_rate": 7.736098367858574e-06, "loss": 2.8665936279296873, "step": 570600 }, { "epoch": 0.6886255814086779, "learning_rate": 7.735694532390836e-06, "loss": 2.890267333984375, "step": 570700 }, { "epoch": 0.6887462447311606, "learning_rate": 7.735290696923098e-06, "loss": 2.8554742431640623, "step": 570800 }, { "epoch": 0.6888669080536433, "learning_rate": 7.734886861455358e-06, "loss": 2.8798077392578123, "step": 570900 }, { "epoch": 0.688987571376126, "learning_rate": 7.73448302598762e-06, "loss": 2.8675967407226564, "step": 571000 }, { "epoch": 0.6891082346986087, "learning_rate": 7.734079190519882e-06, "loss": 2.8301461791992186, "step": 571100 }, { "epoch": 0.6892288980210913, "learning_rate": 7.733675355052144e-06, "loss": 2.84908935546875, "step": 571200 }, { "epoch": 0.6893495613435741, "learning_rate": 7.733271519584406e-06, "loss": 2.8650912475585937, "step": 571300 }, { "epoch": 0.6894702246660567, "learning_rate": 7.732867684116668e-06, "loss": 2.8545663452148435, "step": 571400 }, { "epoch": 0.6895908879885394, "learning_rate": 7.732463848648928e-06, "loss": 2.8690859985351564, "step": 571500 }, { "epoch": 0.6897115513110221, "learning_rate": 7.73206001318119e-06, "loss": 2.8635479736328127, "step": 571600 }, { "epoch": 0.6898322146335047, "learning_rate": 7.731656177713452e-06, "loss": 2.852455749511719, "step": 571700 }, { "epoch": 0.6899528779559875, "learning_rate": 7.731252342245713e-06, "loss": 2.8488589477539064, "step": 571800 }, { "epoch": 0.6900735412784701, "learning_rate": 7.730848506777975e-06, "loss": 2.8865380859375, "step": 571900 }, { "epoch": 0.6901942046009528, "learning_rate": 7.730444671310236e-06, "loss": 2.874664611816406, "step": 572000 }, { "epoch": 0.6903148679234355, "learning_rate": 7.730040835842498e-06, "loss": 2.8504257202148438, "step": 572100 }, { "epoch": 0.6904355312459182, "learning_rate": 7.72963700037476e-06, "loss": 2.8802975463867186, "step": 572200 }, { "epoch": 0.6905561945684009, "learning_rate": 7.729233164907022e-06, "loss": 2.8815579223632812, "step": 572300 }, { "epoch": 0.6906768578908835, "learning_rate": 7.728829329439283e-06, "loss": 2.8994290161132814, "step": 572400 }, { "epoch": 0.6907975212133662, "learning_rate": 7.728425493971545e-06, "loss": 2.857418212890625, "step": 572500 }, { "epoch": 0.690918184535849, "learning_rate": 7.728021658503807e-06, "loss": 2.8725555419921873, "step": 572600 }, { "epoch": 0.6910388478583316, "learning_rate": 7.727617823036067e-06, "loss": 2.867392578125, "step": 572700 }, { "epoch": 0.6911595111808143, "learning_rate": 7.727213987568329e-06, "loss": 2.870016784667969, "step": 572800 }, { "epoch": 0.6912801745032969, "learning_rate": 7.726810152100591e-06, "loss": 2.853316345214844, "step": 572900 }, { "epoch": 0.6914008378257797, "learning_rate": 7.726406316632853e-06, "loss": 2.8782925415039062, "step": 573000 }, { "epoch": 0.6915215011482624, "learning_rate": 7.726002481165115e-06, "loss": 2.8332757568359375, "step": 573100 }, { "epoch": 0.691642164470745, "learning_rate": 7.725598645697377e-06, "loss": 2.8534942626953126, "step": 573200 }, { "epoch": 0.6917628277932277, "learning_rate": 7.725194810229639e-06, "loss": 2.8601724243164064, "step": 573300 }, { "epoch": 0.6918834911157103, "learning_rate": 7.7247909747619e-06, "loss": 2.872872009277344, "step": 573400 }, { "epoch": 0.6920041544381931, "learning_rate": 7.724387139294161e-06, "loss": 2.8716860961914064, "step": 573500 }, { "epoch": 0.6921248177606758, "learning_rate": 7.723983303826421e-06, "loss": 2.870142517089844, "step": 573600 }, { "epoch": 0.6922454810831584, "learning_rate": 7.723579468358683e-06, "loss": 2.861686096191406, "step": 573700 }, { "epoch": 0.6923661444056411, "learning_rate": 7.723175632890945e-06, "loss": 2.89477294921875, "step": 573800 }, { "epoch": 0.6924868077281238, "learning_rate": 7.722771797423207e-06, "loss": 2.858819580078125, "step": 573900 }, { "epoch": 0.6926074710506065, "learning_rate": 7.72236796195547e-06, "loss": 2.8641656494140624, "step": 574000 }, { "epoch": 0.6927281343730892, "learning_rate": 7.721964126487731e-06, "loss": 2.8659429931640625, "step": 574100 }, { "epoch": 0.6928487976955718, "learning_rate": 7.721560291019992e-06, "loss": 2.86802734375, "step": 574200 }, { "epoch": 0.6929694610180546, "learning_rate": 7.721156455552254e-06, "loss": 2.8383413696289064, "step": 574300 }, { "epoch": 0.6930901243405372, "learning_rate": 7.720752620084516e-06, "loss": 2.8667523193359377, "step": 574400 }, { "epoch": 0.6932107876630199, "learning_rate": 7.720348784616778e-06, "loss": 2.8475680541992188, "step": 574500 }, { "epoch": 0.6933314509855026, "learning_rate": 7.719944949149038e-06, "loss": 2.851126708984375, "step": 574600 }, { "epoch": 0.6934521143079853, "learning_rate": 7.7195411136813e-06, "loss": 2.851023864746094, "step": 574700 }, { "epoch": 0.693572777630468, "learning_rate": 7.719137278213562e-06, "loss": 2.8499740600585937, "step": 574800 }, { "epoch": 0.6936934409529506, "learning_rate": 7.718733442745824e-06, "loss": 2.8620339965820314, "step": 574900 }, { "epoch": 0.6938141042754333, "learning_rate": 7.718329607278084e-06, "loss": 2.8746914672851562, "step": 575000 }, { "epoch": 0.6939347675979161, "learning_rate": 7.717925771810346e-06, "loss": 2.8576153564453124, "step": 575100 }, { "epoch": 0.6940554309203987, "learning_rate": 7.717521936342608e-06, "loss": 2.84666748046875, "step": 575200 }, { "epoch": 0.6941760942428814, "learning_rate": 7.71711810087487e-06, "loss": 2.8798028564453126, "step": 575300 }, { "epoch": 0.6942967575653641, "learning_rate": 7.716714265407132e-06, "loss": 2.8682757568359376, "step": 575400 }, { "epoch": 0.6944174208878467, "learning_rate": 7.716310429939394e-06, "loss": 2.8715280151367186, "step": 575500 }, { "epoch": 0.6945380842103295, "learning_rate": 7.715906594471654e-06, "loss": 2.877300109863281, "step": 575600 }, { "epoch": 0.6946587475328121, "learning_rate": 7.715502759003916e-06, "loss": 2.8766259765625, "step": 575700 }, { "epoch": 0.6947794108552948, "learning_rate": 7.715098923536177e-06, "loss": 2.8907876586914063, "step": 575800 }, { "epoch": 0.6949000741777775, "learning_rate": 7.714695088068439e-06, "loss": 2.8691976928710936, "step": 575900 }, { "epoch": 0.6950207375002602, "learning_rate": 7.7142912526007e-06, "loss": 2.859876708984375, "step": 576000 }, { "epoch": 0.6951414008227429, "learning_rate": 7.713887417132963e-06, "loss": 2.8728204345703126, "step": 576100 }, { "epoch": 0.6952620641452255, "learning_rate": 7.713483581665224e-06, "loss": 2.8735012817382812, "step": 576200 }, { "epoch": 0.6953827274677082, "learning_rate": 7.713079746197486e-06, "loss": 2.8696408081054687, "step": 576300 }, { "epoch": 0.695503390790191, "learning_rate": 7.712675910729748e-06, "loss": 2.8614126586914064, "step": 576400 }, { "epoch": 0.6956240541126736, "learning_rate": 7.712272075262009e-06, "loss": 2.863514709472656, "step": 576500 }, { "epoch": 0.6957447174351563, "learning_rate": 7.71186823979427e-06, "loss": 2.875749206542969, "step": 576600 }, { "epoch": 0.6958653807576389, "learning_rate": 7.711464404326533e-06, "loss": 2.869881286621094, "step": 576700 }, { "epoch": 0.6959860440801217, "learning_rate": 7.711060568858793e-06, "loss": 2.877679443359375, "step": 576800 }, { "epoch": 0.6961067074026044, "learning_rate": 7.710656733391055e-06, "loss": 2.8645761108398435, "step": 576900 }, { "epoch": 0.696227370725087, "learning_rate": 7.710252897923317e-06, "loss": 2.8620050048828123, "step": 577000 }, { "epoch": 0.6963480340475697, "learning_rate": 7.709849062455579e-06, "loss": 2.8769570922851564, "step": 577100 }, { "epoch": 0.6964686973700523, "learning_rate": 7.709445226987841e-06, "loss": 2.856103515625, "step": 577200 }, { "epoch": 0.6965893606925351, "learning_rate": 7.709041391520103e-06, "loss": 2.851171875, "step": 577300 }, { "epoch": 0.6967100240150178, "learning_rate": 7.708637556052365e-06, "loss": 2.864934387207031, "step": 577400 }, { "epoch": 0.6968306873375004, "learning_rate": 7.708233720584625e-06, "loss": 2.8648745727539064, "step": 577500 }, { "epoch": 0.6969513506599831, "learning_rate": 7.707829885116887e-06, "loss": 2.8809881591796875, "step": 577600 }, { "epoch": 0.6970720139824658, "learning_rate": 7.707426049649147e-06, "loss": 2.8629269409179687, "step": 577700 }, { "epoch": 0.6971926773049485, "learning_rate": 7.70702221418141e-06, "loss": 2.8471365356445313, "step": 577800 }, { "epoch": 0.6973133406274312, "learning_rate": 7.706618378713671e-06, "loss": 2.8456512451171876, "step": 577900 }, { "epoch": 0.6974340039499138, "learning_rate": 7.706214543245933e-06, "loss": 2.8593902587890625, "step": 578000 }, { "epoch": 0.6975546672723966, "learning_rate": 7.705810707778195e-06, "loss": 2.888683166503906, "step": 578100 }, { "epoch": 0.6976753305948792, "learning_rate": 7.705406872310457e-06, "loss": 2.86565185546875, "step": 578200 }, { "epoch": 0.6977959939173619, "learning_rate": 7.705003036842718e-06, "loss": 2.8601412963867188, "step": 578300 }, { "epoch": 0.6979166572398446, "learning_rate": 7.70459920137498e-06, "loss": 2.865805969238281, "step": 578400 }, { "epoch": 0.6980373205623273, "learning_rate": 7.704195365907242e-06, "loss": 2.867271728515625, "step": 578500 }, { "epoch": 0.69815798388481, "learning_rate": 7.703791530439504e-06, "loss": 2.8775863647460938, "step": 578600 }, { "epoch": 0.6982786472072926, "learning_rate": 7.703387694971764e-06, "loss": 2.8373922729492187, "step": 578700 }, { "epoch": 0.6983993105297753, "learning_rate": 7.702983859504026e-06, "loss": 2.8459716796875, "step": 578800 }, { "epoch": 0.6985199738522581, "learning_rate": 7.702580024036288e-06, "loss": 2.8858401489257814, "step": 578900 }, { "epoch": 0.6986406371747407, "learning_rate": 7.70217618856855e-06, "loss": 2.8735421752929686, "step": 579000 }, { "epoch": 0.6987613004972234, "learning_rate": 7.70177235310081e-06, "loss": 2.8599142456054687, "step": 579100 }, { "epoch": 0.698881963819706, "learning_rate": 7.701368517633072e-06, "loss": 2.8436068725585937, "step": 579200 }, { "epoch": 0.6990026271421887, "learning_rate": 7.700964682165334e-06, "loss": 2.8749465942382812, "step": 579300 }, { "epoch": 0.6991232904646715, "learning_rate": 7.700560846697596e-06, "loss": 2.8473880004882814, "step": 579400 }, { "epoch": 0.6992439537871541, "learning_rate": 7.700157011229858e-06, "loss": 2.8750433349609374, "step": 579500 }, { "epoch": 0.6993646171096368, "learning_rate": 7.699753175762118e-06, "loss": 2.8686251831054688, "step": 579600 }, { "epoch": 0.6994852804321194, "learning_rate": 7.69934934029438e-06, "loss": 2.8483035278320314, "step": 579700 }, { "epoch": 0.6996059437546022, "learning_rate": 7.698945504826642e-06, "loss": 2.865941162109375, "step": 579800 }, { "epoch": 0.6997266070770849, "learning_rate": 7.698541669358903e-06, "loss": 2.8775344848632813, "step": 579900 }, { "epoch": 0.6998472703995675, "learning_rate": 7.698137833891165e-06, "loss": 2.8662261962890625, "step": 580000 }, { "epoch": 0.6999679337220502, "learning_rate": 7.697733998423427e-06, "loss": 2.8305096435546875, "step": 580100 }, { "epoch": 0.7000885970445329, "learning_rate": 7.697330162955689e-06, "loss": 2.846646423339844, "step": 580200 }, { "epoch": 0.7002092603670156, "learning_rate": 7.69692632748795e-06, "loss": 2.8427920532226563, "step": 580300 }, { "epoch": 0.7003299236894983, "learning_rate": 7.696522492020213e-06, "loss": 2.8501577758789063, "step": 580400 }, { "epoch": 0.7004505870119809, "learning_rate": 7.696118656552474e-06, "loss": 2.856065368652344, "step": 580500 }, { "epoch": 0.7005712503344637, "learning_rate": 7.695714821084735e-06, "loss": 2.86554443359375, "step": 580600 }, { "epoch": 0.7006919136569464, "learning_rate": 7.695310985616997e-06, "loss": 2.861060791015625, "step": 580700 }, { "epoch": 0.700812576979429, "learning_rate": 7.694907150149257e-06, "loss": 2.8796966552734373, "step": 580800 }, { "epoch": 0.7009332403019117, "learning_rate": 7.694503314681519e-06, "loss": 2.846746826171875, "step": 580900 }, { "epoch": 0.7010539036243943, "learning_rate": 7.694099479213781e-06, "loss": 2.8797747802734377, "step": 581000 }, { "epoch": 0.7011745669468771, "learning_rate": 7.693695643746043e-06, "loss": 2.8457540893554687, "step": 581100 }, { "epoch": 0.7012952302693598, "learning_rate": 7.693291808278305e-06, "loss": 2.8617990112304685, "step": 581200 }, { "epoch": 0.7014158935918424, "learning_rate": 7.692887972810567e-06, "loss": 2.8425949096679686, "step": 581300 }, { "epoch": 0.7015365569143251, "learning_rate": 7.692484137342829e-06, "loss": 2.871072082519531, "step": 581400 }, { "epoch": 0.7016572202368078, "learning_rate": 7.69208030187509e-06, "loss": 2.8760720825195314, "step": 581500 }, { "epoch": 0.7017778835592905, "learning_rate": 7.691676466407351e-06, "loss": 2.8598867797851564, "step": 581600 }, { "epoch": 0.7018985468817732, "learning_rate": 7.691272630939613e-06, "loss": 2.848721923828125, "step": 581700 }, { "epoch": 0.7020192102042558, "learning_rate": 7.690868795471873e-06, "loss": 2.879400329589844, "step": 581800 }, { "epoch": 0.7021398735267386, "learning_rate": 7.690464960004135e-06, "loss": 2.8481890869140627, "step": 581900 }, { "epoch": 0.7022605368492212, "learning_rate": 7.690061124536397e-06, "loss": 2.8708651733398436, "step": 582000 }, { "epoch": 0.7023812001717039, "learning_rate": 7.68965728906866e-06, "loss": 2.8634072875976564, "step": 582100 }, { "epoch": 0.7025018634941866, "learning_rate": 7.689253453600921e-06, "loss": 2.8674072265625, "step": 582200 }, { "epoch": 0.7026225268166693, "learning_rate": 7.688849618133183e-06, "loss": 2.850791015625, "step": 582300 }, { "epoch": 0.702743190139152, "learning_rate": 7.688445782665444e-06, "loss": 2.8389996337890624, "step": 582400 }, { "epoch": 0.7028638534616346, "learning_rate": 7.688041947197706e-06, "loss": 2.835662536621094, "step": 582500 }, { "epoch": 0.7029845167841173, "learning_rate": 7.687638111729968e-06, "loss": 2.861239013671875, "step": 582600 }, { "epoch": 0.7031051801066001, "learning_rate": 7.687234276262228e-06, "loss": 2.8550344848632814, "step": 582700 }, { "epoch": 0.7032258434290827, "learning_rate": 7.68683044079449e-06, "loss": 2.8749453735351564, "step": 582800 }, { "epoch": 0.7033465067515654, "learning_rate": 7.686426605326752e-06, "loss": 2.840761413574219, "step": 582900 }, { "epoch": 0.703467170074048, "learning_rate": 7.686022769859014e-06, "loss": 2.824681396484375, "step": 583000 }, { "epoch": 0.7035878333965307, "learning_rate": 7.685618934391276e-06, "loss": 2.8570266723632813, "step": 583100 }, { "epoch": 0.7037084967190135, "learning_rate": 7.685215098923536e-06, "loss": 2.8533200073242186, "step": 583200 }, { "epoch": 0.7038291600414961, "learning_rate": 7.684811263455798e-06, "loss": 2.8620306396484376, "step": 583300 }, { "epoch": 0.7039498233639788, "learning_rate": 7.68440742798806e-06, "loss": 2.8539398193359373, "step": 583400 }, { "epoch": 0.7040704866864614, "learning_rate": 7.684003592520322e-06, "loss": 2.8594931030273436, "step": 583500 }, { "epoch": 0.7041911500089442, "learning_rate": 7.683599757052584e-06, "loss": 2.8342193603515624, "step": 583600 }, { "epoch": 0.7043118133314269, "learning_rate": 7.683195921584844e-06, "loss": 2.847510986328125, "step": 583700 }, { "epoch": 0.7044324766539095, "learning_rate": 7.682792086117106e-06, "loss": 2.8276678466796876, "step": 583800 }, { "epoch": 0.7045531399763922, "learning_rate": 7.682388250649368e-06, "loss": 2.819851989746094, "step": 583900 }, { "epoch": 0.7046738032988749, "learning_rate": 7.681984415181629e-06, "loss": 2.8557998657226564, "step": 584000 }, { "epoch": 0.7047944666213576, "learning_rate": 7.68158057971389e-06, "loss": 2.8221475219726564, "step": 584100 }, { "epoch": 0.7049151299438403, "learning_rate": 7.681176744246153e-06, "loss": 2.8478509521484376, "step": 584200 }, { "epoch": 0.7050357932663229, "learning_rate": 7.680772908778415e-06, "loss": 2.8505010986328125, "step": 584300 }, { "epoch": 0.7051564565888057, "learning_rate": 7.680369073310677e-06, "loss": 2.867825927734375, "step": 584400 }, { "epoch": 0.7052771199112883, "learning_rate": 7.679965237842939e-06, "loss": 2.852281188964844, "step": 584500 }, { "epoch": 0.705397783233771, "learning_rate": 7.679561402375199e-06, "loss": 2.8433111572265624, "step": 584600 }, { "epoch": 0.7055184465562537, "learning_rate": 7.67915756690746e-06, "loss": 2.8510702514648436, "step": 584700 }, { "epoch": 0.7056391098787363, "learning_rate": 7.678753731439723e-06, "loss": 2.847156677246094, "step": 584800 }, { "epoch": 0.7057597732012191, "learning_rate": 7.678349895971983e-06, "loss": 2.862283020019531, "step": 584900 }, { "epoch": 0.7058804365237017, "learning_rate": 7.677946060504245e-06, "loss": 2.870137023925781, "step": 585000 }, { "epoch": 0.7060010998461844, "learning_rate": 7.677542225036507e-06, "loss": 2.858834228515625, "step": 585100 }, { "epoch": 0.7061217631686671, "learning_rate": 7.677138389568769e-06, "loss": 2.8479238891601564, "step": 585200 }, { "epoch": 0.7062424264911498, "learning_rate": 7.676734554101031e-06, "loss": 2.8547308349609377, "step": 585300 }, { "epoch": 0.7063630898136325, "learning_rate": 7.676330718633293e-06, "loss": 2.833609924316406, "step": 585400 }, { "epoch": 0.7064837531361151, "learning_rate": 7.675926883165555e-06, "loss": 2.8622250366210937, "step": 585500 }, { "epoch": 0.7066044164585978, "learning_rate": 7.675523047697815e-06, "loss": 2.842254638671875, "step": 585600 }, { "epoch": 0.7067250797810806, "learning_rate": 7.675119212230077e-06, "loss": 2.854966125488281, "step": 585700 }, { "epoch": 0.7068457431035632, "learning_rate": 7.674715376762338e-06, "loss": 2.8604837036132813, "step": 585800 }, { "epoch": 0.7069664064260459, "learning_rate": 7.6743115412946e-06, "loss": 2.8233154296875, "step": 585900 }, { "epoch": 0.7070870697485286, "learning_rate": 7.673907705826862e-06, "loss": 2.8461572265625, "step": 586000 }, { "epoch": 0.7072077330710113, "learning_rate": 7.673503870359123e-06, "loss": 2.851761779785156, "step": 586100 }, { "epoch": 0.707328396393494, "learning_rate": 7.673100034891385e-06, "loss": 2.8616061401367188, "step": 586200 }, { "epoch": 0.7074490597159766, "learning_rate": 7.672696199423647e-06, "loss": 2.852017517089844, "step": 586300 }, { "epoch": 0.7075697230384593, "learning_rate": 7.672292363955908e-06, "loss": 2.8566278076171874, "step": 586400 }, { "epoch": 0.7076903863609421, "learning_rate": 7.67188852848817e-06, "loss": 2.8473611450195313, "step": 586500 }, { "epoch": 0.7078110496834247, "learning_rate": 7.671484693020432e-06, "loss": 2.87174072265625, "step": 586600 }, { "epoch": 0.7079317130059074, "learning_rate": 7.671080857552694e-06, "loss": 2.8517861938476563, "step": 586700 }, { "epoch": 0.70805237632839, "learning_rate": 7.670677022084954e-06, "loss": 2.862684631347656, "step": 586800 }, { "epoch": 0.7081730396508727, "learning_rate": 7.670273186617216e-06, "loss": 2.8592300415039062, "step": 586900 }, { "epoch": 0.7082937029733555, "learning_rate": 7.669869351149478e-06, "loss": 2.8380801391601564, "step": 587000 }, { "epoch": 0.7084143662958381, "learning_rate": 7.66946551568174e-06, "loss": 2.856009826660156, "step": 587100 }, { "epoch": 0.7085350296183208, "learning_rate": 7.669061680214002e-06, "loss": 2.854145202636719, "step": 587200 }, { "epoch": 0.7086556929408034, "learning_rate": 7.668657844746262e-06, "loss": 2.8359329223632814, "step": 587300 }, { "epoch": 0.7087763562632862, "learning_rate": 7.668254009278524e-06, "loss": 2.8700601196289064, "step": 587400 }, { "epoch": 0.7088970195857689, "learning_rate": 7.667850173810786e-06, "loss": 2.8557757568359374, "step": 587500 }, { "epoch": 0.7090176829082515, "learning_rate": 7.667446338343048e-06, "loss": 2.8446340942382813, "step": 587600 }, { "epoch": 0.7091383462307342, "learning_rate": 7.667042502875308e-06, "loss": 2.8498724365234374, "step": 587700 }, { "epoch": 0.7092590095532169, "learning_rate": 7.66663866740757e-06, "loss": 2.839444274902344, "step": 587800 }, { "epoch": 0.7093796728756996, "learning_rate": 7.666234831939832e-06, "loss": 2.8605221557617186, "step": 587900 }, { "epoch": 0.7095003361981823, "learning_rate": 7.665830996472094e-06, "loss": 2.8712619018554686, "step": 588000 }, { "epoch": 0.7096209995206649, "learning_rate": 7.665427161004355e-06, "loss": 2.851839294433594, "step": 588100 }, { "epoch": 0.7097416628431477, "learning_rate": 7.665023325536617e-06, "loss": 2.8605792236328127, "step": 588200 }, { "epoch": 0.7098623261656303, "learning_rate": 7.664619490068879e-06, "loss": 2.8506231689453125, "step": 588300 }, { "epoch": 0.709982989488113, "learning_rate": 7.66421565460114e-06, "loss": 2.8274185180664064, "step": 588400 }, { "epoch": 0.7101036528105957, "learning_rate": 7.663811819133403e-06, "loss": 2.880670166015625, "step": 588500 }, { "epoch": 0.7102243161330783, "learning_rate": 7.663407983665665e-06, "loss": 2.8383724975585936, "step": 588600 }, { "epoch": 0.7103449794555611, "learning_rate": 7.663004148197925e-06, "loss": 2.846884765625, "step": 588700 }, { "epoch": 0.7104656427780437, "learning_rate": 7.662600312730187e-06, "loss": 2.841048278808594, "step": 588800 }, { "epoch": 0.7105863061005264, "learning_rate": 7.662196477262447e-06, "loss": 2.832183532714844, "step": 588900 }, { "epoch": 0.7107069694230091, "learning_rate": 7.661792641794709e-06, "loss": 2.849126892089844, "step": 589000 }, { "epoch": 0.7108276327454918, "learning_rate": 7.661388806326971e-06, "loss": 2.865208740234375, "step": 589100 }, { "epoch": 0.7109482960679745, "learning_rate": 7.660984970859233e-06, "loss": 2.8427505493164062, "step": 589200 }, { "epoch": 0.7110689593904571, "learning_rate": 7.660581135391495e-06, "loss": 2.8471249389648436, "step": 589300 }, { "epoch": 0.7111896227129398, "learning_rate": 7.660177299923757e-06, "loss": 2.8581051635742187, "step": 589400 }, { "epoch": 0.7113102860354226, "learning_rate": 7.659773464456019e-06, "loss": 2.850183410644531, "step": 589500 }, { "epoch": 0.7114309493579052, "learning_rate": 7.659369628988281e-06, "loss": 2.8320297241210937, "step": 589600 }, { "epoch": 0.7115516126803879, "learning_rate": 7.658965793520541e-06, "loss": 2.8095318603515627, "step": 589700 }, { "epoch": 0.7116722760028705, "learning_rate": 7.658561958052803e-06, "loss": 2.8488092041015625, "step": 589800 }, { "epoch": 0.7117929393253533, "learning_rate": 7.658158122585064e-06, "loss": 2.860452880859375, "step": 589900 }, { "epoch": 0.711913602647836, "learning_rate": 7.657754287117326e-06, "loss": 2.88807373046875, "step": 590000 }, { "epoch": 0.7120342659703186, "learning_rate": 7.657350451649588e-06, "loss": 2.8698056030273436, "step": 590100 }, { "epoch": 0.7121549292928013, "learning_rate": 7.65694661618185e-06, "loss": 2.84966796875, "step": 590200 }, { "epoch": 0.712275592615284, "learning_rate": 7.656542780714112e-06, "loss": 2.8345077514648436, "step": 590300 }, { "epoch": 0.7123962559377667, "learning_rate": 7.656138945246373e-06, "loss": 2.8443502807617187, "step": 590400 }, { "epoch": 0.7125169192602494, "learning_rate": 7.655735109778634e-06, "loss": 2.835208740234375, "step": 590500 }, { "epoch": 0.712637582582732, "learning_rate": 7.655331274310896e-06, "loss": 2.8191632080078124, "step": 590600 }, { "epoch": 0.7127582459052147, "learning_rate": 7.654927438843158e-06, "loss": 2.8341183471679687, "step": 590700 }, { "epoch": 0.7128789092276974, "learning_rate": 7.65452360337542e-06, "loss": 2.831346130371094, "step": 590800 }, { "epoch": 0.7129995725501801, "learning_rate": 7.65411976790768e-06, "loss": 2.8378945922851564, "step": 590900 }, { "epoch": 0.7131202358726628, "learning_rate": 7.653715932439942e-06, "loss": 2.8293966674804687, "step": 591000 }, { "epoch": 0.7132408991951454, "learning_rate": 7.653312096972204e-06, "loss": 2.8608172607421873, "step": 591100 }, { "epoch": 0.7133615625176282, "learning_rate": 7.652908261504466e-06, "loss": 2.87868896484375, "step": 591200 }, { "epoch": 0.7134822258401109, "learning_rate": 7.652504426036726e-06, "loss": 2.8494287109375, "step": 591300 }, { "epoch": 0.7136028891625935, "learning_rate": 7.652100590568988e-06, "loss": 2.852053527832031, "step": 591400 }, { "epoch": 0.7137235524850762, "learning_rate": 7.65169675510125e-06, "loss": 2.867012939453125, "step": 591500 }, { "epoch": 0.7138442158075589, "learning_rate": 7.651292919633512e-06, "loss": 2.8467132568359377, "step": 591600 }, { "epoch": 0.7139648791300416, "learning_rate": 7.650889084165774e-06, "loss": 2.8750851440429686, "step": 591700 }, { "epoch": 0.7140855424525243, "learning_rate": 7.650485248698034e-06, "loss": 2.8647781372070313, "step": 591800 }, { "epoch": 0.7142062057750069, "learning_rate": 7.650081413230296e-06, "loss": 2.858387145996094, "step": 591900 }, { "epoch": 0.7143268690974897, "learning_rate": 7.649677577762558e-06, "loss": 2.8398922729492186, "step": 592000 }, { "epoch": 0.7144475324199723, "learning_rate": 7.64927374229482e-06, "loss": 2.8484786987304687, "step": 592100 }, { "epoch": 0.714568195742455, "learning_rate": 7.64886990682708e-06, "loss": 2.822452392578125, "step": 592200 }, { "epoch": 0.7146888590649377, "learning_rate": 7.648466071359343e-06, "loss": 2.851641845703125, "step": 592300 }, { "epoch": 0.7148095223874203, "learning_rate": 7.648062235891605e-06, "loss": 2.8470709228515627, "step": 592400 }, { "epoch": 0.7149301857099031, "learning_rate": 7.647658400423867e-06, "loss": 2.851204833984375, "step": 592500 }, { "epoch": 0.7150508490323857, "learning_rate": 7.647254564956129e-06, "loss": 2.840595397949219, "step": 592600 }, { "epoch": 0.7151715123548684, "learning_rate": 7.64685072948839e-06, "loss": 2.8561087036132813, "step": 592700 }, { "epoch": 0.7152921756773511, "learning_rate": 7.646446894020651e-06, "loss": 2.830580139160156, "step": 592800 }, { "epoch": 0.7154128389998338, "learning_rate": 7.646043058552913e-06, "loss": 2.8352166748046876, "step": 592900 }, { "epoch": 0.7155335023223165, "learning_rate": 7.645639223085173e-06, "loss": 2.8629534912109373, "step": 593000 }, { "epoch": 0.7156541656447991, "learning_rate": 7.645235387617435e-06, "loss": 2.853104553222656, "step": 593100 }, { "epoch": 0.7157748289672818, "learning_rate": 7.644831552149697e-06, "loss": 2.8582220458984375, "step": 593200 }, { "epoch": 0.7158954922897646, "learning_rate": 7.644427716681959e-06, "loss": 2.8493191528320314, "step": 593300 }, { "epoch": 0.7160161556122472, "learning_rate": 7.644023881214221e-06, "loss": 2.866957702636719, "step": 593400 }, { "epoch": 0.7161368189347299, "learning_rate": 7.643620045746483e-06, "loss": 2.832419738769531, "step": 593500 }, { "epoch": 0.7162574822572125, "learning_rate": 7.643216210278745e-06, "loss": 2.880351257324219, "step": 593600 }, { "epoch": 0.7163781455796953, "learning_rate": 7.642812374811005e-06, "loss": 2.8743853759765625, "step": 593700 }, { "epoch": 0.716498808902178, "learning_rate": 7.642408539343267e-06, "loss": 2.8396533203125, "step": 593800 }, { "epoch": 0.7166194722246606, "learning_rate": 7.64200470387553e-06, "loss": 2.845855712890625, "step": 593900 }, { "epoch": 0.7167401355471433, "learning_rate": 7.64160086840779e-06, "loss": 2.8430340576171873, "step": 594000 }, { "epoch": 0.716860798869626, "learning_rate": 7.641197032940052e-06, "loss": 2.835252380371094, "step": 594100 }, { "epoch": 0.7169814621921087, "learning_rate": 7.640793197472314e-06, "loss": 2.8477993774414063, "step": 594200 }, { "epoch": 0.7171021255145914, "learning_rate": 7.640389362004576e-06, "loss": 2.83353515625, "step": 594300 }, { "epoch": 0.717222788837074, "learning_rate": 7.639985526536838e-06, "loss": 2.838026123046875, "step": 594400 }, { "epoch": 0.7173434521595567, "learning_rate": 7.6395816910691e-06, "loss": 2.8310287475585936, "step": 594500 }, { "epoch": 0.7174641154820394, "learning_rate": 7.63917785560136e-06, "loss": 2.843500061035156, "step": 594600 }, { "epoch": 0.7175847788045221, "learning_rate": 7.638774020133622e-06, "loss": 2.860919189453125, "step": 594700 }, { "epoch": 0.7177054421270048, "learning_rate": 7.638370184665884e-06, "loss": 2.8437673950195315, "step": 594800 }, { "epoch": 0.7178261054494874, "learning_rate": 7.637966349198144e-06, "loss": 2.845377197265625, "step": 594900 }, { "epoch": 0.7179467687719702, "learning_rate": 7.637562513730406e-06, "loss": 2.8584356689453125, "step": 595000 }, { "epoch": 0.7180674320944528, "learning_rate": 7.637158678262668e-06, "loss": 2.8483447265625, "step": 595100 }, { "epoch": 0.7181880954169355, "learning_rate": 7.63675484279493e-06, "loss": 2.830110778808594, "step": 595200 }, { "epoch": 0.7183087587394182, "learning_rate": 7.636351007327192e-06, "loss": 2.831490173339844, "step": 595300 }, { "epoch": 0.7184294220619009, "learning_rate": 7.635947171859452e-06, "loss": 2.880101623535156, "step": 595400 }, { "epoch": 0.7185500853843836, "learning_rate": 7.635543336391714e-06, "loss": 2.814600830078125, "step": 595500 }, { "epoch": 0.7186707487068662, "learning_rate": 7.635139500923976e-06, "loss": 2.8266641235351564, "step": 595600 }, { "epoch": 0.7187914120293489, "learning_rate": 7.634735665456238e-06, "loss": 2.8104318237304686, "step": 595700 }, { "epoch": 0.7189120753518317, "learning_rate": 7.6343318299885e-06, "loss": 2.843552551269531, "step": 595800 }, { "epoch": 0.7190327386743143, "learning_rate": 7.63392799452076e-06, "loss": 2.828013610839844, "step": 595900 }, { "epoch": 0.719153401996797, "learning_rate": 7.633524159053022e-06, "loss": 2.8720211791992187, "step": 596000 }, { "epoch": 0.7192740653192796, "learning_rate": 7.633120323585284e-06, "loss": 2.835665283203125, "step": 596100 }, { "epoch": 0.7193947286417623, "learning_rate": 7.632716488117545e-06, "loss": 2.840772705078125, "step": 596200 }, { "epoch": 0.7195153919642451, "learning_rate": 7.632312652649807e-06, "loss": 2.8577618408203125, "step": 596300 }, { "epoch": 0.7196360552867277, "learning_rate": 7.631908817182069e-06, "loss": 2.844828796386719, "step": 596400 }, { "epoch": 0.7197567186092104, "learning_rate": 7.63150498171433e-06, "loss": 2.8559085083007814, "step": 596500 }, { "epoch": 0.7198773819316931, "learning_rate": 7.631101146246593e-06, "loss": 2.8550439453125, "step": 596600 }, { "epoch": 0.7199980452541758, "learning_rate": 7.630697310778855e-06, "loss": 2.82895263671875, "step": 596700 }, { "epoch": 0.7201187085766585, "learning_rate": 7.630293475311115e-06, "loss": 2.8775347900390624, "step": 596800 }, { "epoch": 0.7202393718991411, "learning_rate": 7.629889639843377e-06, "loss": 2.8132208251953124, "step": 596900 }, { "epoch": 0.7203600352216238, "learning_rate": 7.629485804375639e-06, "loss": 2.855584716796875, "step": 597000 }, { "epoch": 0.7204806985441066, "learning_rate": 7.6290819689079e-06, "loss": 2.835617980957031, "step": 597100 }, { "epoch": 0.7206013618665892, "learning_rate": 7.628678133440161e-06, "loss": 2.833038024902344, "step": 597200 }, { "epoch": 0.7207220251890719, "learning_rate": 7.628274297972423e-06, "loss": 2.8349478149414065, "step": 597300 }, { "epoch": 0.7208426885115545, "learning_rate": 7.627870462504685e-06, "loss": 2.8466970825195315, "step": 597400 }, { "epoch": 0.7209633518340373, "learning_rate": 7.627466627036947e-06, "loss": 2.8552850341796874, "step": 597500 }, { "epoch": 0.72108401515652, "learning_rate": 7.627062791569208e-06, "loss": 2.8689910888671877, "step": 597600 }, { "epoch": 0.7212046784790026, "learning_rate": 7.62665895610147e-06, "loss": 2.848668212890625, "step": 597700 }, { "epoch": 0.7213253418014853, "learning_rate": 7.626255120633732e-06, "loss": 2.8390097045898437, "step": 597800 }, { "epoch": 0.721446005123968, "learning_rate": 7.6258512851659925e-06, "loss": 2.8535665893554687, "step": 597900 }, { "epoch": 0.7215666684464507, "learning_rate": 7.6254474496982545e-06, "loss": 2.8399832153320315, "step": 598000 }, { "epoch": 0.7216873317689334, "learning_rate": 7.6250436142305165e-06, "loss": 2.8328372192382814, "step": 598100 }, { "epoch": 0.721807995091416, "learning_rate": 7.624639778762778e-06, "loss": 2.8236346435546875, "step": 598200 }, { "epoch": 0.7219286584138987, "learning_rate": 7.62423594329504e-06, "loss": 2.839200439453125, "step": 598300 }, { "epoch": 0.7220493217363814, "learning_rate": 7.623832107827302e-06, "loss": 2.858956298828125, "step": 598400 }, { "epoch": 0.7221699850588641, "learning_rate": 7.623428272359564e-06, "loss": 2.83538818359375, "step": 598500 }, { "epoch": 0.7222906483813468, "learning_rate": 7.623024436891825e-06, "loss": 2.8272552490234375, "step": 598600 }, { "epoch": 0.7224113117038294, "learning_rate": 7.622620601424086e-06, "loss": 2.8433087158203123, "step": 598700 }, { "epoch": 0.7225319750263122, "learning_rate": 7.622216765956347e-06, "loss": 2.852114562988281, "step": 598800 }, { "epoch": 0.7226526383487948, "learning_rate": 7.621812930488609e-06, "loss": 2.8037570190429686, "step": 598900 }, { "epoch": 0.7227733016712775, "learning_rate": 7.621409095020871e-06, "loss": 2.860138244628906, "step": 599000 }, { "epoch": 0.7228939649937602, "learning_rate": 7.621005259553133e-06, "loss": 2.849071044921875, "step": 599100 }, { "epoch": 0.7230146283162429, "learning_rate": 7.620601424085394e-06, "loss": 2.834295349121094, "step": 599200 }, { "epoch": 0.7231352916387256, "learning_rate": 7.620197588617656e-06, "loss": 2.86677490234375, "step": 599300 }, { "epoch": 0.7232559549612082, "learning_rate": 7.619793753149918e-06, "loss": 2.8441143798828126, "step": 599400 }, { "epoch": 0.7233766182836909, "learning_rate": 7.619389917682178e-06, "loss": 2.8090560913085936, "step": 599500 }, { "epoch": 0.7234972816061737, "learning_rate": 7.61898608221444e-06, "loss": 2.8088385009765626, "step": 599600 }, { "epoch": 0.7236179449286563, "learning_rate": 7.618582246746702e-06, "loss": 2.8294964599609376, "step": 599700 }, { "epoch": 0.723738608251139, "learning_rate": 7.618178411278963e-06, "loss": 2.8351806640625, "step": 599800 }, { "epoch": 0.7238592715736216, "learning_rate": 7.617774575811225e-06, "loss": 2.8585284423828123, "step": 599900 }, { "epoch": 0.7239799348961043, "learning_rate": 7.617370740343487e-06, "loss": 2.835009765625, "step": 600000 }, { "epoch": 0.7241005982185871, "learning_rate": 7.6169669048757485e-06, "loss": 2.8402664184570314, "step": 600100 }, { "epoch": 0.7242212615410697, "learning_rate": 7.6165630694080105e-06, "loss": 2.8244183349609373, "step": 600200 }, { "epoch": 0.7243419248635524, "learning_rate": 7.616159233940272e-06, "loss": 2.8449526977539064, "step": 600300 }, { "epoch": 0.724462588186035, "learning_rate": 7.615755398472533e-06, "loss": 2.8412411499023436, "step": 600400 }, { "epoch": 0.7245832515085178, "learning_rate": 7.615351563004795e-06, "loss": 2.8219430541992185, "step": 600500 }, { "epoch": 0.7247039148310005, "learning_rate": 7.614947727537057e-06, "loss": 2.832084045410156, "step": 600600 }, { "epoch": 0.7248245781534831, "learning_rate": 7.614543892069318e-06, "loss": 2.8650436401367188, "step": 600700 }, { "epoch": 0.7249452414759658, "learning_rate": 7.61414005660158e-06, "loss": 2.83247314453125, "step": 600800 }, { "epoch": 0.7250659047984485, "learning_rate": 7.613736221133842e-06, "loss": 2.8388943481445312, "step": 600900 }, { "epoch": 0.7251865681209312, "learning_rate": 7.613332385666104e-06, "loss": 2.829284973144531, "step": 601000 }, { "epoch": 0.7253072314434139, "learning_rate": 7.612928550198364e-06, "loss": 2.824978942871094, "step": 601100 }, { "epoch": 0.7254278947658965, "learning_rate": 7.612524714730626e-06, "loss": 2.8546621704101565, "step": 601200 }, { "epoch": 0.7255485580883793, "learning_rate": 7.612120879262887e-06, "loss": 2.8446481323242185, "step": 601300 }, { "epoch": 0.725669221410862, "learning_rate": 7.611717043795149e-06, "loss": 2.8569454956054687, "step": 601400 }, { "epoch": 0.7257898847333446, "learning_rate": 7.611313208327411e-06, "loss": 2.84204345703125, "step": 601500 }, { "epoch": 0.7259105480558273, "learning_rate": 7.610909372859673e-06, "loss": 2.8396881103515623, "step": 601600 }, { "epoch": 0.72603121137831, "learning_rate": 7.610505537391934e-06, "loss": 2.858248596191406, "step": 601700 }, { "epoch": 0.7261518747007927, "learning_rate": 7.610101701924196e-06, "loss": 2.8359979248046874, "step": 601800 }, { "epoch": 0.7262725380232754, "learning_rate": 7.609697866456457e-06, "loss": 2.8368960571289064, "step": 601900 }, { "epoch": 0.726393201345758, "learning_rate": 7.6092940309887186e-06, "loss": 2.844346008300781, "step": 602000 }, { "epoch": 0.7265138646682407, "learning_rate": 7.6088901955209805e-06, "loss": 2.8497967529296875, "step": 602100 }, { "epoch": 0.7266345279907234, "learning_rate": 7.6084863600532425e-06, "loss": 2.818468017578125, "step": 602200 }, { "epoch": 0.7267551913132061, "learning_rate": 7.608082524585504e-06, "loss": 2.84897705078125, "step": 602300 }, { "epoch": 0.7268758546356888, "learning_rate": 7.607678689117766e-06, "loss": 2.8364697265625, "step": 602400 }, { "epoch": 0.7269965179581714, "learning_rate": 7.607274853650028e-06, "loss": 2.8343548583984375, "step": 602500 }, { "epoch": 0.7271171812806542, "learning_rate": 7.606871018182289e-06, "loss": 2.81431640625, "step": 602600 }, { "epoch": 0.7272378446031368, "learning_rate": 7.606467182714551e-06, "loss": 2.8723526000976562, "step": 602700 }, { "epoch": 0.7273585079256195, "learning_rate": 7.606063347246812e-06, "loss": 2.81925537109375, "step": 602800 }, { "epoch": 0.7274791712481022, "learning_rate": 7.605659511779073e-06, "loss": 2.7938177490234377, "step": 602900 }, { "epoch": 0.7275998345705849, "learning_rate": 7.605255676311335e-06, "loss": 2.8298220825195313, "step": 603000 }, { "epoch": 0.7277204978930676, "learning_rate": 7.604851840843597e-06, "loss": 2.842681884765625, "step": 603100 }, { "epoch": 0.7278411612155502, "learning_rate": 7.604448005375858e-06, "loss": 2.8330377197265624, "step": 603200 }, { "epoch": 0.7279618245380329, "learning_rate": 7.60404416990812e-06, "loss": 2.8187625122070314, "step": 603300 }, { "epoch": 0.7280824878605157, "learning_rate": 7.603640334440382e-06, "loss": 2.839820556640625, "step": 603400 }, { "epoch": 0.7282031511829983, "learning_rate": 7.603236498972644e-06, "loss": 2.818056640625, "step": 603500 }, { "epoch": 0.728323814505481, "learning_rate": 7.602832663504904e-06, "loss": 2.8298419189453123, "step": 603600 }, { "epoch": 0.7284444778279636, "learning_rate": 7.602428828037166e-06, "loss": 2.824041442871094, "step": 603700 }, { "epoch": 0.7285651411504463, "learning_rate": 7.6020249925694275e-06, "loss": 2.84650390625, "step": 603800 }, { "epoch": 0.7286858044729291, "learning_rate": 7.6016211571016895e-06, "loss": 2.8340460205078126, "step": 603900 }, { "epoch": 0.7288064677954117, "learning_rate": 7.6012173216339514e-06, "loss": 2.8298089599609373, "step": 604000 }, { "epoch": 0.7289271311178944, "learning_rate": 7.600813486166213e-06, "loss": 2.8144265747070314, "step": 604100 }, { "epoch": 0.729047794440377, "learning_rate": 7.6004096506984746e-06, "loss": 2.8420260620117186, "step": 604200 }, { "epoch": 0.7291684577628598, "learning_rate": 7.6000058152307365e-06, "loss": 2.8317364501953124, "step": 604300 }, { "epoch": 0.7292891210853425, "learning_rate": 7.599601979762997e-06, "loss": 2.854012145996094, "step": 604400 }, { "epoch": 0.7294097844078251, "learning_rate": 7.599198144295259e-06, "loss": 2.852894287109375, "step": 604500 }, { "epoch": 0.7295304477303078, "learning_rate": 7.598794308827521e-06, "loss": 2.8500555419921874, "step": 604600 }, { "epoch": 0.7296511110527905, "learning_rate": 7.598390473359783e-06, "loss": 2.825152587890625, "step": 604700 }, { "epoch": 0.7297717743752732, "learning_rate": 7.597986637892044e-06, "loss": 2.8397869873046875, "step": 604800 }, { "epoch": 0.7298924376977559, "learning_rate": 7.597582802424306e-06, "loss": 2.8551385498046873, "step": 604900 }, { "epoch": 0.7300131010202385, "learning_rate": 7.597178966956568e-06, "loss": 2.8412796020507813, "step": 605000 }, { "epoch": 0.7301337643427213, "learning_rate": 7.596775131488829e-06, "loss": 2.8156011962890624, "step": 605100 }, { "epoch": 0.7302544276652039, "learning_rate": 7.59637129602109e-06, "loss": 2.8235458374023437, "step": 605200 }, { "epoch": 0.7303750909876866, "learning_rate": 7.595967460553352e-06, "loss": 2.8220587158203125, "step": 605300 }, { "epoch": 0.7304957543101693, "learning_rate": 7.595563625085613e-06, "loss": 2.8451638793945313, "step": 605400 }, { "epoch": 0.730616417632652, "learning_rate": 7.595159789617875e-06, "loss": 2.8342608642578124, "step": 605500 }, { "epoch": 0.7307370809551347, "learning_rate": 7.594755954150137e-06, "loss": 2.833648681640625, "step": 605600 }, { "epoch": 0.7308577442776173, "learning_rate": 7.594352118682398e-06, "loss": 2.832721862792969, "step": 605700 }, { "epoch": 0.7309784076001, "learning_rate": 7.59394828321466e-06, "loss": 2.82572265625, "step": 605800 }, { "epoch": 0.7310990709225827, "learning_rate": 7.593544447746922e-06, "loss": 2.8513800048828126, "step": 605900 }, { "epoch": 0.7312197342450654, "learning_rate": 7.593140612279183e-06, "loss": 2.8289996337890626, "step": 606000 }, { "epoch": 0.7313403975675481, "learning_rate": 7.592736776811445e-06, "loss": 2.8240087890625, "step": 606100 }, { "epoch": 0.7314610608900307, "learning_rate": 7.592332941343707e-06, "loss": 2.8449395751953124, "step": 606200 }, { "epoch": 0.7315817242125134, "learning_rate": 7.591929105875968e-06, "loss": 2.8405169677734374, "step": 606300 }, { "epoch": 0.7317023875349962, "learning_rate": 7.59152527040823e-06, "loss": 2.8252545166015626, "step": 606400 }, { "epoch": 0.7318230508574788, "learning_rate": 7.591121434940492e-06, "loss": 2.8312115478515625, "step": 606500 }, { "epoch": 0.7319437141799615, "learning_rate": 7.590717599472754e-06, "loss": 2.820077209472656, "step": 606600 }, { "epoch": 0.7320643775024442, "learning_rate": 7.590313764005015e-06, "loss": 2.823672180175781, "step": 606700 }, { "epoch": 0.7321850408249269, "learning_rate": 7.589909928537276e-06, "loss": 2.8201654052734373, "step": 606800 }, { "epoch": 0.7323057041474096, "learning_rate": 7.589506093069537e-06, "loss": 2.8248065185546873, "step": 606900 }, { "epoch": 0.7324263674698922, "learning_rate": 7.589102257601799e-06, "loss": 2.8089474487304686, "step": 607000 }, { "epoch": 0.7325470307923749, "learning_rate": 7.588698422134061e-06, "loss": 2.8481414794921873, "step": 607100 }, { "epoch": 0.7326676941148577, "learning_rate": 7.588294586666323e-06, "loss": 2.826563720703125, "step": 607200 }, { "epoch": 0.7327883574373403, "learning_rate": 7.587890751198584e-06, "loss": 2.8146597290039064, "step": 607300 }, { "epoch": 0.732909020759823, "learning_rate": 7.587486915730846e-06, "loss": 2.8355548095703127, "step": 607400 }, { "epoch": 0.7330296840823056, "learning_rate": 7.587083080263108e-06, "loss": 2.8327291870117186, "step": 607500 }, { "epoch": 0.7331503474047883, "learning_rate": 7.586679244795369e-06, "loss": 2.835107421875, "step": 607600 }, { "epoch": 0.7332710107272711, "learning_rate": 7.58627540932763e-06, "loss": 2.857324523925781, "step": 607700 }, { "epoch": 0.7333916740497537, "learning_rate": 7.585871573859892e-06, "loss": 2.8485736083984374, "step": 607800 }, { "epoch": 0.7335123373722364, "learning_rate": 7.5854677383921535e-06, "loss": 2.8316030883789063, "step": 607900 }, { "epoch": 0.733633000694719, "learning_rate": 7.5850639029244155e-06, "loss": 2.843360595703125, "step": 608000 }, { "epoch": 0.7337536640172018, "learning_rate": 7.5846600674566775e-06, "loss": 2.8294363403320313, "step": 608100 }, { "epoch": 0.7338743273396845, "learning_rate": 7.584256231988939e-06, "loss": 2.8250167846679686, "step": 608200 }, { "epoch": 0.7339949906621671, "learning_rate": 7.583852396521201e-06, "loss": 2.8388677978515626, "step": 608300 }, { "epoch": 0.7341156539846498, "learning_rate": 7.5834485610534626e-06, "loss": 2.845799865722656, "step": 608400 }, { "epoch": 0.7342363173071325, "learning_rate": 7.583044725585723e-06, "loss": 2.81463623046875, "step": 608500 }, { "epoch": 0.7343569806296152, "learning_rate": 7.582640890117985e-06, "loss": 2.853978576660156, "step": 608600 }, { "epoch": 0.7344776439520979, "learning_rate": 7.582237054650247e-06, "loss": 2.83222412109375, "step": 608700 }, { "epoch": 0.7345983072745805, "learning_rate": 7.581833219182508e-06, "loss": 2.804739990234375, "step": 608800 }, { "epoch": 0.7347189705970633, "learning_rate": 7.58142938371477e-06, "loss": 2.82529052734375, "step": 608900 }, { "epoch": 0.7348396339195459, "learning_rate": 7.581025548247032e-06, "loss": 2.8481216430664062, "step": 609000 }, { "epoch": 0.7349602972420286, "learning_rate": 7.580621712779294e-06, "loss": 2.8316244506835937, "step": 609100 }, { "epoch": 0.7350809605645113, "learning_rate": 7.580217877311555e-06, "loss": 2.8433767700195314, "step": 609200 }, { "epoch": 0.735201623886994, "learning_rate": 7.579814041843816e-06, "loss": 2.8337847900390627, "step": 609300 }, { "epoch": 0.7353222872094767, "learning_rate": 7.579410206376077e-06, "loss": 2.8405975341796874, "step": 609400 }, { "epoch": 0.7354429505319593, "learning_rate": 7.579006370908339e-06, "loss": 2.843521728515625, "step": 609500 }, { "epoch": 0.735563613854442, "learning_rate": 7.578602535440601e-06, "loss": 2.8249505615234374, "step": 609600 }, { "epoch": 0.7356842771769248, "learning_rate": 7.578198699972863e-06, "loss": 2.865635986328125, "step": 609700 }, { "epoch": 0.7358049404994074, "learning_rate": 7.577794864505124e-06, "loss": 2.8307565307617186, "step": 609800 }, { "epoch": 0.7359256038218901, "learning_rate": 7.577391029037386e-06, "loss": 2.7958209228515627, "step": 609900 }, { "epoch": 0.7360462671443727, "learning_rate": 7.576987193569648e-06, "loss": 2.8226547241210938, "step": 610000 }, { "epoch": 0.7361669304668554, "learning_rate": 7.576583358101909e-06, "loss": 2.813846435546875, "step": 610100 }, { "epoch": 0.7362875937893382, "learning_rate": 7.576179522634171e-06, "loss": 2.819149169921875, "step": 610200 }, { "epoch": 0.7364082571118208, "learning_rate": 7.575775687166433e-06, "loss": 2.8468051147460938, "step": 610300 }, { "epoch": 0.7365289204343035, "learning_rate": 7.575371851698694e-06, "loss": 2.8197586059570314, "step": 610400 }, { "epoch": 0.7366495837567861, "learning_rate": 7.574968016230956e-06, "loss": 2.814403381347656, "step": 610500 }, { "epoch": 0.7367702470792689, "learning_rate": 7.574564180763218e-06, "loss": 2.8308221435546876, "step": 610600 }, { "epoch": 0.7368909104017516, "learning_rate": 7.57416034529548e-06, "loss": 2.831101379394531, "step": 610700 }, { "epoch": 0.7370115737242342, "learning_rate": 7.573756509827741e-06, "loss": 2.8293746948242187, "step": 610800 }, { "epoch": 0.7371322370467169, "learning_rate": 7.573352674360002e-06, "loss": 2.850122985839844, "step": 610900 }, { "epoch": 0.7372529003691995, "learning_rate": 7.572948838892263e-06, "loss": 2.8342330932617186, "step": 611000 }, { "epoch": 0.7373735636916823, "learning_rate": 7.572545003424525e-06, "loss": 2.827171630859375, "step": 611100 }, { "epoch": 0.737494227014165, "learning_rate": 7.572141167956787e-06, "loss": 2.822620849609375, "step": 611200 }, { "epoch": 0.7376148903366476, "learning_rate": 7.571737332489049e-06, "loss": 2.8397671508789064, "step": 611300 }, { "epoch": 0.7377355536591303, "learning_rate": 7.57133349702131e-06, "loss": 2.8224777221679687, "step": 611400 }, { "epoch": 0.737856216981613, "learning_rate": 7.570929661553572e-06, "loss": 2.8421759033203124, "step": 611500 }, { "epoch": 0.7379768803040957, "learning_rate": 7.570525826085834e-06, "loss": 2.827149658203125, "step": 611600 }, { "epoch": 0.7380975436265784, "learning_rate": 7.5701219906180944e-06, "loss": 2.8314828491210937, "step": 611700 }, { "epoch": 0.738218206949061, "learning_rate": 7.569718155150356e-06, "loss": 2.797510681152344, "step": 611800 }, { "epoch": 0.7383388702715438, "learning_rate": 7.569314319682618e-06, "loss": 2.8336410522460938, "step": 611900 }, { "epoch": 0.7384595335940265, "learning_rate": 7.5689104842148795e-06, "loss": 2.843047790527344, "step": 612000 }, { "epoch": 0.7385801969165091, "learning_rate": 7.5685066487471415e-06, "loss": 2.8051467895507813, "step": 612100 }, { "epoch": 0.7387008602389918, "learning_rate": 7.5681028132794035e-06, "loss": 2.8253042602539065, "step": 612200 }, { "epoch": 0.7388215235614745, "learning_rate": 7.567698977811665e-06, "loss": 2.781560363769531, "step": 612300 }, { "epoch": 0.7389421868839572, "learning_rate": 7.567295142343927e-06, "loss": 2.8181698608398436, "step": 612400 }, { "epoch": 0.7390628502064399, "learning_rate": 7.566891306876189e-06, "loss": 2.8395892333984376, "step": 612500 }, { "epoch": 0.7391835135289225, "learning_rate": 7.566487471408449e-06, "loss": 2.838157958984375, "step": 612600 }, { "epoch": 0.7393041768514053, "learning_rate": 7.566083635940711e-06, "loss": 2.8269708251953123, "step": 612700 }, { "epoch": 0.7394248401738879, "learning_rate": 7.565679800472973e-06, "loss": 2.8259820556640625, "step": 612800 }, { "epoch": 0.7395455034963706, "learning_rate": 7.565275965005234e-06, "loss": 2.8072039794921877, "step": 612900 }, { "epoch": 0.7396661668188533, "learning_rate": 7.564872129537496e-06, "loss": 2.8385406494140626, "step": 613000 }, { "epoch": 0.739786830141336, "learning_rate": 7.564468294069758e-06, "loss": 2.798528747558594, "step": 613100 }, { "epoch": 0.7399074934638187, "learning_rate": 7.56406445860202e-06, "loss": 2.8339385986328125, "step": 613200 }, { "epoch": 0.7400281567863013, "learning_rate": 7.563660623134281e-06, "loss": 2.8272882080078126, "step": 613300 }, { "epoch": 0.740148820108784, "learning_rate": 7.563256787666542e-06, "loss": 2.8170840454101564, "step": 613400 }, { "epoch": 0.7402694834312668, "learning_rate": 7.562852952198803e-06, "loss": 2.8212686157226563, "step": 613500 }, { "epoch": 0.7403901467537494, "learning_rate": 7.562449116731065e-06, "loss": 2.8304904174804686, "step": 613600 }, { "epoch": 0.7405108100762321, "learning_rate": 7.562045281263327e-06, "loss": 2.83412109375, "step": 613700 }, { "epoch": 0.7406314733987147, "learning_rate": 7.561641445795589e-06, "loss": 2.826516418457031, "step": 613800 }, { "epoch": 0.7407521367211974, "learning_rate": 7.5612376103278504e-06, "loss": 2.813454284667969, "step": 613900 }, { "epoch": 0.7408728000436802, "learning_rate": 7.560833774860112e-06, "loss": 2.8243328857421877, "step": 614000 }, { "epoch": 0.7409934633661628, "learning_rate": 7.560429939392374e-06, "loss": 2.833742980957031, "step": 614100 }, { "epoch": 0.7411141266886455, "learning_rate": 7.560026103924635e-06, "loss": 2.8076470947265624, "step": 614200 }, { "epoch": 0.7412347900111281, "learning_rate": 7.559622268456897e-06, "loss": 2.8299530029296873, "step": 614300 }, { "epoch": 0.7413554533336109, "learning_rate": 7.559218432989159e-06, "loss": 2.819527282714844, "step": 614400 }, { "epoch": 0.7414761166560936, "learning_rate": 7.55881459752142e-06, "loss": 2.8074356079101563, "step": 614500 }, { "epoch": 0.7415967799785762, "learning_rate": 7.558410762053682e-06, "loss": 2.818992004394531, "step": 614600 }, { "epoch": 0.7417174433010589, "learning_rate": 7.558006926585944e-06, "loss": 2.84697021484375, "step": 614700 }, { "epoch": 0.7418381066235415, "learning_rate": 7.557603091118205e-06, "loss": 2.8341073608398437, "step": 614800 }, { "epoch": 0.7419587699460243, "learning_rate": 7.557199255650467e-06, "loss": 2.8070330810546875, "step": 614900 }, { "epoch": 0.742079433268507, "learning_rate": 7.556795420182728e-06, "loss": 2.815440673828125, "step": 615000 }, { "epoch": 0.7422000965909896, "learning_rate": 7.556391584714989e-06, "loss": 2.8568255615234377, "step": 615100 }, { "epoch": 0.7423207599134724, "learning_rate": 7.555987749247251e-06, "loss": 2.8088778686523437, "step": 615200 }, { "epoch": 0.742441423235955, "learning_rate": 7.555583913779513e-06, "loss": 2.8101040649414064, "step": 615300 }, { "epoch": 0.7425620865584377, "learning_rate": 7.555180078311774e-06, "loss": 2.8466583251953126, "step": 615400 }, { "epoch": 0.7426827498809204, "learning_rate": 7.554776242844036e-06, "loss": 2.8294287109375, "step": 615500 }, { "epoch": 0.742803413203403, "learning_rate": 7.554372407376298e-06, "loss": 2.82283935546875, "step": 615600 }, { "epoch": 0.7429240765258858, "learning_rate": 7.55396857190856e-06, "loss": 2.8386404418945315, "step": 615700 }, { "epoch": 0.7430447398483684, "learning_rate": 7.5535647364408205e-06, "loss": 2.8301040649414064, "step": 615800 }, { "epoch": 0.7431654031708511, "learning_rate": 7.5531609009730825e-06, "loss": 2.8170407104492186, "step": 615900 }, { "epoch": 0.7432860664933338, "learning_rate": 7.552757065505344e-06, "loss": 2.8237225341796877, "step": 616000 }, { "epoch": 0.7434067298158165, "learning_rate": 7.5523532300376056e-06, "loss": 2.7910894775390624, "step": 616100 }, { "epoch": 0.7435273931382992, "learning_rate": 7.5519493945698676e-06, "loss": 2.8088031005859375, "step": 616200 }, { "epoch": 0.7436480564607818, "learning_rate": 7.5515455591021295e-06, "loss": 2.810670166015625, "step": 616300 }, { "epoch": 0.7437687197832645, "learning_rate": 7.551141723634391e-06, "loss": 2.8361151123046877, "step": 616400 }, { "epoch": 0.7438893831057473, "learning_rate": 7.550737888166653e-06, "loss": 2.833929138183594, "step": 616500 }, { "epoch": 0.7440100464282299, "learning_rate": 7.550334052698913e-06, "loss": 2.808399658203125, "step": 616600 }, { "epoch": 0.7441307097507126, "learning_rate": 7.549930217231175e-06, "loss": 2.8284747314453127, "step": 616700 }, { "epoch": 0.7442513730731952, "learning_rate": 7.549526381763437e-06, "loss": 2.819230651855469, "step": 616800 }, { "epoch": 0.744372036395678, "learning_rate": 7.549122546295699e-06, "loss": 2.8165911865234374, "step": 616900 }, { "epoch": 0.7444926997181607, "learning_rate": 7.54871871082796e-06, "loss": 2.8294052124023437, "step": 617000 }, { "epoch": 0.7446133630406433, "learning_rate": 7.548314875360222e-06, "loss": 2.812433776855469, "step": 617100 }, { "epoch": 0.744734026363126, "learning_rate": 7.547911039892484e-06, "loss": 2.827803649902344, "step": 617200 }, { "epoch": 0.7448546896856088, "learning_rate": 7.547507204424745e-06, "loss": 2.8532666015625, "step": 617300 }, { "epoch": 0.7449753530080914, "learning_rate": 7.547103368957006e-06, "loss": 2.825555419921875, "step": 617400 }, { "epoch": 0.7450960163305741, "learning_rate": 7.546699533489268e-06, "loss": 2.820987548828125, "step": 617500 }, { "epoch": 0.7452166796530567, "learning_rate": 7.546295698021529e-06, "loss": 2.830040283203125, "step": 617600 }, { "epoch": 0.7453373429755394, "learning_rate": 7.545891862553791e-06, "loss": 2.8361956787109377, "step": 617700 }, { "epoch": 0.7454580062980222, "learning_rate": 7.545488027086053e-06, "loss": 2.8424581909179687, "step": 617800 }, { "epoch": 0.7455786696205048, "learning_rate": 7.5450841916183145e-06, "loss": 2.813293151855469, "step": 617900 }, { "epoch": 0.7456993329429875, "learning_rate": 7.5446803561505765e-06, "loss": 2.8331146240234375, "step": 618000 }, { "epoch": 0.7458199962654701, "learning_rate": 7.5442765206828384e-06, "loss": 2.8351800537109373, "step": 618100 }, { "epoch": 0.7459406595879529, "learning_rate": 7.5438726852151004e-06, "loss": 2.8177914428710937, "step": 618200 }, { "epoch": 0.7460613229104356, "learning_rate": 7.543468849747361e-06, "loss": 2.8362612915039063, "step": 618300 }, { "epoch": 0.7461819862329182, "learning_rate": 7.543065014279623e-06, "loss": 2.8077484130859376, "step": 618400 }, { "epoch": 0.7463026495554009, "learning_rate": 7.542661178811884e-06, "loss": 2.8257672119140627, "step": 618500 }, { "epoch": 0.7464233128778835, "learning_rate": 7.542257343344146e-06, "loss": 2.8363217163085936, "step": 618600 }, { "epoch": 0.7465439762003663, "learning_rate": 7.541853507876408e-06, "loss": 2.8073886108398436, "step": 618700 }, { "epoch": 0.746664639522849, "learning_rate": 7.54144967240867e-06, "loss": 2.8025497436523437, "step": 618800 }, { "epoch": 0.7467853028453316, "learning_rate": 7.541045836940931e-06, "loss": 2.8164547729492186, "step": 618900 }, { "epoch": 0.7469059661678144, "learning_rate": 7.540642001473193e-06, "loss": 2.797499084472656, "step": 619000 }, { "epoch": 0.747026629490297, "learning_rate": 7.540238166005453e-06, "loss": 2.8240225219726565, "step": 619100 }, { "epoch": 0.7471472928127797, "learning_rate": 7.539834330537715e-06, "loss": 2.8514141845703125, "step": 619200 }, { "epoch": 0.7472679561352624, "learning_rate": 7.539430495069977e-06, "loss": 2.8393463134765624, "step": 619300 }, { "epoch": 0.747388619457745, "learning_rate": 7.539026659602239e-06, "loss": 2.8152816772460936, "step": 619400 }, { "epoch": 0.7475092827802278, "learning_rate": 7.5386228241345e-06, "loss": 2.849360046386719, "step": 619500 }, { "epoch": 0.7476299461027104, "learning_rate": 7.538218988666762e-06, "loss": 2.8304534912109376, "step": 619600 }, { "epoch": 0.7477506094251931, "learning_rate": 7.537815153199024e-06, "loss": 2.7997320556640624, "step": 619700 }, { "epoch": 0.7478712727476758, "learning_rate": 7.537411317731285e-06, "loss": 2.8333538818359374, "step": 619800 }, { "epoch": 0.7479919360701585, "learning_rate": 7.5370074822635465e-06, "loss": 2.8378982543945312, "step": 619900 }, { "epoch": 0.7481125993926412, "learning_rate": 7.5366036467958085e-06, "loss": 2.853677062988281, "step": 620000 }, { "epoch": 0.7482332627151238, "learning_rate": 7.53619981132807e-06, "loss": 2.8385684204101564, "step": 620100 }, { "epoch": 0.7483539260376065, "learning_rate": 7.535795975860332e-06, "loss": 2.829327392578125, "step": 620200 }, { "epoch": 0.7484745893600893, "learning_rate": 7.535392140392594e-06, "loss": 2.8047689819335937, "step": 620300 }, { "epoch": 0.7485952526825719, "learning_rate": 7.534988304924855e-06, "loss": 2.817430114746094, "step": 620400 }, { "epoch": 0.7487159160050546, "learning_rate": 7.534584469457117e-06, "loss": 2.8175750732421876, "step": 620500 }, { "epoch": 0.7488365793275372, "learning_rate": 7.534180633989379e-06, "loss": 2.80708251953125, "step": 620600 }, { "epoch": 0.74895724265002, "learning_rate": 7.533776798521639e-06, "loss": 2.8062698364257814, "step": 620700 }, { "epoch": 0.7490779059725027, "learning_rate": 7.533372963053901e-06, "loss": 2.814303283691406, "step": 620800 }, { "epoch": 0.7491985692949853, "learning_rate": 7.532969127586163e-06, "loss": 2.821028747558594, "step": 620900 }, { "epoch": 0.749319232617468, "learning_rate": 7.532565292118424e-06, "loss": 2.8208688354492186, "step": 621000 }, { "epoch": 0.7494398959399506, "learning_rate": 7.532161456650686e-06, "loss": 2.833165588378906, "step": 621100 }, { "epoch": 0.7495605592624334, "learning_rate": 7.531757621182948e-06, "loss": 2.8111578369140626, "step": 621200 }, { "epoch": 0.7496812225849161, "learning_rate": 7.53135378571521e-06, "loss": 2.819300231933594, "step": 621300 }, { "epoch": 0.7498018859073987, "learning_rate": 7.530949950247471e-06, "loss": 2.8168365478515627, "step": 621400 }, { "epoch": 0.7499225492298814, "learning_rate": 7.530546114779732e-06, "loss": 2.84283935546875, "step": 621500 }, { "epoch": 0.7500432125523641, "learning_rate": 7.5301422793119934e-06, "loss": 2.8554141235351564, "step": 621600 }, { "epoch": 0.7501638758748468, "learning_rate": 7.529738443844255e-06, "loss": 2.831490478515625, "step": 621700 }, { "epoch": 0.7502845391973295, "learning_rate": 7.529334608376517e-06, "loss": 2.8194000244140627, "step": 621800 }, { "epoch": 0.7504052025198121, "learning_rate": 7.528930772908779e-06, "loss": 2.8222787475585935, "step": 621900 }, { "epoch": 0.7505258658422949, "learning_rate": 7.5285269374410405e-06, "loss": 2.821630859375, "step": 622000 }, { "epoch": 0.7506465291647775, "learning_rate": 7.5281231019733025e-06, "loss": 2.8231985473632815, "step": 622100 }, { "epoch": 0.7507671924872602, "learning_rate": 7.5277192665055645e-06, "loss": 2.811253967285156, "step": 622200 }, { "epoch": 0.7508878558097429, "learning_rate": 7.527315431037825e-06, "loss": 2.7806607055664063, "step": 622300 }, { "epoch": 0.7510085191322255, "learning_rate": 7.526911595570087e-06, "loss": 2.848405456542969, "step": 622400 }, { "epoch": 0.7511291824547083, "learning_rate": 7.526507760102349e-06, "loss": 2.79271484375, "step": 622500 }, { "epoch": 0.751249845777191, "learning_rate": 7.52610392463461e-06, "loss": 2.8372039794921875, "step": 622600 }, { "epoch": 0.7513705090996736, "learning_rate": 7.525700089166872e-06, "loss": 2.8286602783203123, "step": 622700 }, { "epoch": 0.7514911724221564, "learning_rate": 7.525296253699134e-06, "loss": 2.8279736328125, "step": 622800 }, { "epoch": 0.751611835744639, "learning_rate": 7.524892418231395e-06, "loss": 2.8249545288085938, "step": 622900 }, { "epoch": 0.7517324990671217, "learning_rate": 7.524488582763657e-06, "loss": 2.8132870483398436, "step": 623000 }, { "epoch": 0.7518531623896044, "learning_rate": 7.524084747295919e-06, "loss": 2.8364694213867185, "step": 623100 }, { "epoch": 0.751973825712087, "learning_rate": 7.523680911828179e-06, "loss": 2.8017919921875, "step": 623200 }, { "epoch": 0.7520944890345698, "learning_rate": 7.523277076360441e-06, "loss": 2.8268621826171874, "step": 623300 }, { "epoch": 0.7522151523570524, "learning_rate": 7.522873240892703e-06, "loss": 2.8178338623046875, "step": 623400 }, { "epoch": 0.7523358156795351, "learning_rate": 7.522469405424964e-06, "loss": 2.7910528564453125, "step": 623500 }, { "epoch": 0.7524564790020178, "learning_rate": 7.522065569957226e-06, "loss": 2.8216256713867187, "step": 623600 }, { "epoch": 0.7525771423245005, "learning_rate": 7.521661734489488e-06, "loss": 2.835389404296875, "step": 623700 }, { "epoch": 0.7526978056469832, "learning_rate": 7.52125789902175e-06, "loss": 2.847786865234375, "step": 623800 }, { "epoch": 0.7528184689694658, "learning_rate": 7.520854063554011e-06, "loss": 2.7977569580078123, "step": 623900 }, { "epoch": 0.7529391322919485, "learning_rate": 7.5204502280862725e-06, "loss": 2.8150515747070313, "step": 624000 }, { "epoch": 0.7530597956144313, "learning_rate": 7.520046392618534e-06, "loss": 2.8003094482421873, "step": 624100 }, { "epoch": 0.7531804589369139, "learning_rate": 7.519642557150796e-06, "loss": 2.8240151977539063, "step": 624200 }, { "epoch": 0.7533011222593966, "learning_rate": 7.519238721683058e-06, "loss": 2.8090219116210937, "step": 624300 }, { "epoch": 0.7534217855818792, "learning_rate": 7.51883488621532e-06, "loss": 2.7934942626953125, "step": 624400 }, { "epoch": 0.753542448904362, "learning_rate": 7.518431050747581e-06, "loss": 2.814222717285156, "step": 624500 }, { "epoch": 0.7536631122268447, "learning_rate": 7.518027215279843e-06, "loss": 2.8359490966796876, "step": 624600 }, { "epoch": 0.7537837755493273, "learning_rate": 7.517623379812105e-06, "loss": 2.8103677368164064, "step": 624700 }, { "epoch": 0.75390443887181, "learning_rate": 7.517219544344365e-06, "loss": 2.8218817138671874, "step": 624800 }, { "epoch": 0.7540251021942926, "learning_rate": 7.516815708876627e-06, "loss": 2.8379351806640627, "step": 624900 }, { "epoch": 0.7541457655167754, "learning_rate": 7.516411873408889e-06, "loss": 2.8164877319335937, "step": 625000 }, { "epoch": 0.7542664288392581, "learning_rate": 7.51600803794115e-06, "loss": 2.836911926269531, "step": 625100 }, { "epoch": 0.7543870921617407, "learning_rate": 7.515604202473412e-06, "loss": 2.8158297729492188, "step": 625200 }, { "epoch": 0.7545077554842234, "learning_rate": 7.515200367005674e-06, "loss": 2.832657775878906, "step": 625300 }, { "epoch": 0.7546284188067061, "learning_rate": 7.514796531537936e-06, "loss": 2.838329162597656, "step": 625400 }, { "epoch": 0.7547490821291888, "learning_rate": 7.514392696070197e-06, "loss": 2.80716552734375, "step": 625500 }, { "epoch": 0.7548697454516715, "learning_rate": 7.513988860602458e-06, "loss": 2.838720703125, "step": 625600 }, { "epoch": 0.7549904087741541, "learning_rate": 7.5135850251347195e-06, "loss": 2.814241943359375, "step": 625700 }, { "epoch": 0.7551110720966369, "learning_rate": 7.5131811896669814e-06, "loss": 2.8169039916992187, "step": 625800 }, { "epoch": 0.7552317354191195, "learning_rate": 7.5127773541992434e-06, "loss": 2.82134765625, "step": 625900 }, { "epoch": 0.7553523987416022, "learning_rate": 7.512373518731505e-06, "loss": 2.8186550903320313, "step": 626000 }, { "epoch": 0.7554730620640849, "learning_rate": 7.5119696832637665e-06, "loss": 2.832461242675781, "step": 626100 }, { "epoch": 0.7555937253865675, "learning_rate": 7.5115658477960285e-06, "loss": 2.8221148681640624, "step": 626200 }, { "epoch": 0.7557143887090503, "learning_rate": 7.5111620123282905e-06, "loss": 2.848611145019531, "step": 626300 }, { "epoch": 0.7558350520315329, "learning_rate": 7.510758176860551e-06, "loss": 2.816414794921875, "step": 626400 }, { "epoch": 0.7559557153540156, "learning_rate": 7.510354341392813e-06, "loss": 2.8215090942382814, "step": 626500 }, { "epoch": 0.7560763786764984, "learning_rate": 7.509950505925075e-06, "loss": 2.8143475341796873, "step": 626600 }, { "epoch": 0.756197041998981, "learning_rate": 7.509546670457336e-06, "loss": 2.8294100952148438, "step": 626700 }, { "epoch": 0.7563177053214637, "learning_rate": 7.509142834989598e-06, "loss": 2.81141845703125, "step": 626800 }, { "epoch": 0.7564383686439463, "learning_rate": 7.50873899952186e-06, "loss": 2.807459411621094, "step": 626900 }, { "epoch": 0.756559031966429, "learning_rate": 7.508335164054121e-06, "loss": 2.815330810546875, "step": 627000 }, { "epoch": 0.7566796952889118, "learning_rate": 7.507931328586383e-06, "loss": 2.8179620361328124, "step": 627100 }, { "epoch": 0.7568003586113944, "learning_rate": 7.507527493118644e-06, "loss": 2.8043142700195314, "step": 627200 }, { "epoch": 0.7569210219338771, "learning_rate": 7.507123657650905e-06, "loss": 2.8381643676757813, "step": 627300 }, { "epoch": 0.7570416852563598, "learning_rate": 7.506719822183167e-06, "loss": 2.823447570800781, "step": 627400 }, { "epoch": 0.7571623485788425, "learning_rate": 7.506315986715429e-06, "loss": 2.803863525390625, "step": 627500 }, { "epoch": 0.7572830119013252, "learning_rate": 7.50591215124769e-06, "loss": 2.8209368896484377, "step": 627600 }, { "epoch": 0.7574036752238078, "learning_rate": 7.505508315779952e-06, "loss": 2.810624694824219, "step": 627700 }, { "epoch": 0.7575243385462905, "learning_rate": 7.505104480312214e-06, "loss": 2.8308978271484375, "step": 627800 }, { "epoch": 0.7576450018687733, "learning_rate": 7.504700644844476e-06, "loss": 2.820066223144531, "step": 627900 }, { "epoch": 0.7577656651912559, "learning_rate": 7.5042968093767374e-06, "loss": 2.825129089355469, "step": 628000 }, { "epoch": 0.7578863285137386, "learning_rate": 7.5038929739089986e-06, "loss": 2.7999700927734374, "step": 628100 }, { "epoch": 0.7580069918362212, "learning_rate": 7.50348913844126e-06, "loss": 2.8441912841796877, "step": 628200 }, { "epoch": 0.758127655158704, "learning_rate": 7.503085302973522e-06, "loss": 2.8127236938476563, "step": 628300 }, { "epoch": 0.7582483184811867, "learning_rate": 7.502681467505784e-06, "loss": 2.8064776611328126, "step": 628400 }, { "epoch": 0.7583689818036693, "learning_rate": 7.502277632038046e-06, "loss": 2.81010986328125, "step": 628500 }, { "epoch": 0.758489645126152, "learning_rate": 7.501873796570307e-06, "loss": 2.813505859375, "step": 628600 }, { "epoch": 0.7586103084486346, "learning_rate": 7.501469961102569e-06, "loss": 2.839752502441406, "step": 628700 }, { "epoch": 0.7587309717711174, "learning_rate": 7.501066125634831e-06, "loss": 2.8094476318359374, "step": 628800 }, { "epoch": 0.7588516350936001, "learning_rate": 7.500662290167091e-06, "loss": 2.8255184936523436, "step": 628900 }, { "epoch": 0.7589722984160827, "learning_rate": 7.500258454699353e-06, "loss": 2.7825860595703125, "step": 629000 }, { "epoch": 0.7590929617385654, "learning_rate": 7.499854619231615e-06, "loss": 2.7998233032226563, "step": 629100 }, { "epoch": 0.7592136250610481, "learning_rate": 7.499450783763876e-06, "loss": 2.833280029296875, "step": 629200 }, { "epoch": 0.7593342883835308, "learning_rate": 7.499046948296138e-06, "loss": 2.82797119140625, "step": 629300 }, { "epoch": 0.7594549517060135, "learning_rate": 7.4986431128284e-06, "loss": 2.8048834228515624, "step": 629400 }, { "epoch": 0.7595756150284961, "learning_rate": 7.498239277360661e-06, "loss": 2.840520324707031, "step": 629500 }, { "epoch": 0.7596962783509789, "learning_rate": 7.497835441892923e-06, "loss": 2.8284671020507814, "step": 629600 }, { "epoch": 0.7598169416734615, "learning_rate": 7.497431606425184e-06, "loss": 2.8107119750976564, "step": 629700 }, { "epoch": 0.7599376049959442, "learning_rate": 7.4970277709574455e-06, "loss": 2.817759704589844, "step": 629800 }, { "epoch": 0.7600582683184269, "learning_rate": 7.4966239354897075e-06, "loss": 2.7947119140625, "step": 629900 }, { "epoch": 0.7601789316409095, "learning_rate": 7.4962201000219695e-06, "loss": 2.827834167480469, "step": 630000 }, { "epoch": 0.7602995949633923, "learning_rate": 7.495816264554231e-06, "loss": 2.806748046875, "step": 630100 }, { "epoch": 0.7604202582858749, "learning_rate": 7.495412429086493e-06, "loss": 2.8078036499023438, "step": 630200 }, { "epoch": 0.7605409216083576, "learning_rate": 7.4950085936187546e-06, "loss": 2.7935491943359376, "step": 630300 }, { "epoch": 0.7606615849308404, "learning_rate": 7.4946047581510165e-06, "loss": 2.824662780761719, "step": 630400 }, { "epoch": 0.760782248253323, "learning_rate": 7.494200922683277e-06, "loss": 2.8324224853515627, "step": 630500 }, { "epoch": 0.7609029115758057, "learning_rate": 7.493797087215539e-06, "loss": 2.824881896972656, "step": 630600 }, { "epoch": 0.7610235748982883, "learning_rate": 7.4933932517478e-06, "loss": 2.809110107421875, "step": 630700 }, { "epoch": 0.761144238220771, "learning_rate": 7.492989416280062e-06, "loss": 2.8109576416015627, "step": 630800 }, { "epoch": 0.7612649015432538, "learning_rate": 7.492585580812324e-06, "loss": 2.839380798339844, "step": 630900 }, { "epoch": 0.7613855648657364, "learning_rate": 7.492181745344586e-06, "loss": 2.8052963256835937, "step": 631000 }, { "epoch": 0.7615062281882191, "learning_rate": 7.491777909876847e-06, "loss": 2.8299984741210937, "step": 631100 }, { "epoch": 0.7616268915107017, "learning_rate": 7.491374074409109e-06, "loss": 2.8344342041015627, "step": 631200 }, { "epoch": 0.7617475548331845, "learning_rate": 7.490970238941369e-06, "loss": 2.7963909912109375, "step": 631300 }, { "epoch": 0.7618682181556672, "learning_rate": 7.490566403473631e-06, "loss": 2.819774169921875, "step": 631400 }, { "epoch": 0.7619888814781498, "learning_rate": 7.490162568005893e-06, "loss": 2.829229431152344, "step": 631500 }, { "epoch": 0.7621095448006325, "learning_rate": 7.489758732538155e-06, "loss": 2.7972030639648438, "step": 631600 }, { "epoch": 0.7622302081231151, "learning_rate": 7.489354897070416e-06, "loss": 2.8223831176757814, "step": 631700 }, { "epoch": 0.7623508714455979, "learning_rate": 7.488951061602678e-06, "loss": 2.827274169921875, "step": 631800 }, { "epoch": 0.7624715347680806, "learning_rate": 7.48854722613494e-06, "loss": 2.8172030639648438, "step": 631900 }, { "epoch": 0.7625921980905632, "learning_rate": 7.4881433906672015e-06, "loss": 2.799857177734375, "step": 632000 }, { "epoch": 0.762712861413046, "learning_rate": 7.487739555199463e-06, "loss": 2.80046630859375, "step": 632100 }, { "epoch": 0.7628335247355286, "learning_rate": 7.487335719731725e-06, "loss": 2.8192620849609376, "step": 632200 }, { "epoch": 0.7629541880580113, "learning_rate": 7.486931884263986e-06, "loss": 2.8029095458984377, "step": 632300 }, { "epoch": 0.763074851380494, "learning_rate": 7.486528048796248e-06, "loss": 2.8075775146484374, "step": 632400 }, { "epoch": 0.7631955147029766, "learning_rate": 7.48612421332851e-06, "loss": 2.8197528076171876, "step": 632500 }, { "epoch": 0.7633161780254594, "learning_rate": 7.485720377860771e-06, "loss": 2.798919372558594, "step": 632600 }, { "epoch": 0.7634368413479421, "learning_rate": 7.485316542393033e-06, "loss": 2.815196228027344, "step": 632700 }, { "epoch": 0.7635575046704247, "learning_rate": 7.484912706925295e-06, "loss": 2.795498046875, "step": 632800 }, { "epoch": 0.7636781679929074, "learning_rate": 7.484508871457555e-06, "loss": 2.836619567871094, "step": 632900 }, { "epoch": 0.7637988313153901, "learning_rate": 7.484105035989817e-06, "loss": 2.8059762573242186, "step": 633000 }, { "epoch": 0.7639194946378728, "learning_rate": 7.483701200522079e-06, "loss": 2.806063537597656, "step": 633100 }, { "epoch": 0.7640401579603555, "learning_rate": 7.48329736505434e-06, "loss": 2.806720886230469, "step": 633200 }, { "epoch": 0.7641608212828381, "learning_rate": 7.482893529586602e-06, "loss": 2.82459228515625, "step": 633300 }, { "epoch": 0.7642814846053209, "learning_rate": 7.482489694118864e-06, "loss": 2.8183721923828124, "step": 633400 }, { "epoch": 0.7644021479278035, "learning_rate": 7.482085858651126e-06, "loss": 2.7859466552734373, "step": 633500 }, { "epoch": 0.7645228112502862, "learning_rate": 7.481682023183387e-06, "loss": 2.7920452880859377, "step": 633600 }, { "epoch": 0.7646434745727689, "learning_rate": 7.481278187715649e-06, "loss": 2.826982116699219, "step": 633700 }, { "epoch": 0.7647641378952516, "learning_rate": 7.4808743522479096e-06, "loss": 2.8122933959960936, "step": 633800 }, { "epoch": 0.7648848012177343, "learning_rate": 7.4804705167801715e-06, "loss": 2.8242767333984373, "step": 633900 }, { "epoch": 0.7650054645402169, "learning_rate": 7.4800666813124335e-06, "loss": 2.80056640625, "step": 634000 }, { "epoch": 0.7651261278626996, "learning_rate": 7.4796628458446955e-06, "loss": 2.8149404907226563, "step": 634100 }, { "epoch": 0.7652467911851824, "learning_rate": 7.479259010376957e-06, "loss": 2.8430496215820313, "step": 634200 }, { "epoch": 0.765367454507665, "learning_rate": 7.478855174909219e-06, "loss": 2.825057067871094, "step": 634300 }, { "epoch": 0.7654881178301477, "learning_rate": 7.478451339441481e-06, "loss": 2.7937969970703125, "step": 634400 }, { "epoch": 0.7656087811526303, "learning_rate": 7.478047503973742e-06, "loss": 2.8096853637695314, "step": 634500 }, { "epoch": 0.765729444475113, "learning_rate": 7.477643668506003e-06, "loss": 2.814560546875, "step": 634600 }, { "epoch": 0.7658501077975958, "learning_rate": 7.477239833038265e-06, "loss": 2.814894104003906, "step": 634700 }, { "epoch": 0.7659707711200784, "learning_rate": 7.476835997570526e-06, "loss": 2.8021551513671876, "step": 634800 }, { "epoch": 0.7660914344425611, "learning_rate": 7.476432162102788e-06, "loss": 2.8287619018554686, "step": 634900 }, { "epoch": 0.7662120977650437, "learning_rate": 7.47602832663505e-06, "loss": 2.8066400146484374, "step": 635000 }, { "epoch": 0.7663327610875265, "learning_rate": 7.475624491167311e-06, "loss": 2.8202584838867186, "step": 635100 }, { "epoch": 0.7664534244100092, "learning_rate": 7.475220655699573e-06, "loss": 2.808660583496094, "step": 635200 }, { "epoch": 0.7665740877324918, "learning_rate": 7.474816820231835e-06, "loss": 2.8035342407226564, "step": 635300 }, { "epoch": 0.7666947510549745, "learning_rate": 7.474412984764095e-06, "loss": 2.8066366577148436, "step": 635400 }, { "epoch": 0.7668154143774571, "learning_rate": 7.474009149296357e-06, "loss": 2.8064675903320313, "step": 635500 }, { "epoch": 0.7669360776999399, "learning_rate": 7.473605313828619e-06, "loss": 2.8260287475585937, "step": 635600 }, { "epoch": 0.7670567410224226, "learning_rate": 7.4732014783608804e-06, "loss": 2.81394775390625, "step": 635700 }, { "epoch": 0.7671774043449052, "learning_rate": 7.4727976428931424e-06, "loss": 2.805430908203125, "step": 635800 }, { "epoch": 0.767298067667388, "learning_rate": 7.472393807425404e-06, "loss": 2.825620422363281, "step": 635900 }, { "epoch": 0.7674187309898706, "learning_rate": 7.471989971957666e-06, "loss": 2.8045498657226564, "step": 636000 }, { "epoch": 0.7675393943123533, "learning_rate": 7.4715861364899275e-06, "loss": 2.76764404296875, "step": 636100 }, { "epoch": 0.767660057634836, "learning_rate": 7.471182301022189e-06, "loss": 2.80500244140625, "step": 636200 }, { "epoch": 0.7677807209573186, "learning_rate": 7.47077846555445e-06, "loss": 2.7840670776367187, "step": 636300 }, { "epoch": 0.7679013842798014, "learning_rate": 7.470374630086712e-06, "loss": 2.82157470703125, "step": 636400 }, { "epoch": 0.768022047602284, "learning_rate": 7.469970794618974e-06, "loss": 2.8102056884765627, "step": 636500 }, { "epoch": 0.7681427109247667, "learning_rate": 7.469566959151236e-06, "loss": 2.7919244384765625, "step": 636600 }, { "epoch": 0.7682633742472494, "learning_rate": 7.469163123683497e-06, "loss": 2.8040496826171877, "step": 636700 }, { "epoch": 0.7683840375697321, "learning_rate": 7.468759288215759e-06, "loss": 2.8322763061523437, "step": 636800 }, { "epoch": 0.7685047008922148, "learning_rate": 7.468355452748021e-06, "loss": 2.8125839233398438, "step": 636900 }, { "epoch": 0.7686253642146974, "learning_rate": 7.467951617280281e-06, "loss": 2.81189208984375, "step": 637000 }, { "epoch": 0.7687460275371801, "learning_rate": 7.467547781812543e-06, "loss": 2.7913079833984376, "step": 637100 }, { "epoch": 0.7688666908596629, "learning_rate": 7.467143946344805e-06, "loss": 2.7972946166992188, "step": 637200 }, { "epoch": 0.7689873541821455, "learning_rate": 7.466740110877066e-06, "loss": 2.7843026733398437, "step": 637300 }, { "epoch": 0.7691080175046282, "learning_rate": 7.466336275409328e-06, "loss": 2.8177694702148437, "step": 637400 }, { "epoch": 0.7692286808271108, "learning_rate": 7.46593243994159e-06, "loss": 2.794295654296875, "step": 637500 }, { "epoch": 0.7693493441495936, "learning_rate": 7.465528604473851e-06, "loss": 2.799768981933594, "step": 637600 }, { "epoch": 0.7694700074720763, "learning_rate": 7.465124769006113e-06, "loss": 2.788987731933594, "step": 637700 }, { "epoch": 0.7695906707945589, "learning_rate": 7.4647209335383745e-06, "loss": 2.7929547119140623, "step": 637800 }, { "epoch": 0.7697113341170416, "learning_rate": 7.464317098070636e-06, "loss": 2.7963330078125, "step": 637900 }, { "epoch": 0.7698319974395244, "learning_rate": 7.4639132626028976e-06, "loss": 2.7865264892578123, "step": 638000 }, { "epoch": 0.769952660762007, "learning_rate": 7.4635094271351596e-06, "loss": 2.802998352050781, "step": 638100 }, { "epoch": 0.7700733240844897, "learning_rate": 7.463105591667421e-06, "loss": 2.798790283203125, "step": 638200 }, { "epoch": 0.7701939874069723, "learning_rate": 7.462701756199683e-06, "loss": 2.814588928222656, "step": 638300 }, { "epoch": 0.770314650729455, "learning_rate": 7.462297920731945e-06, "loss": 2.8448245239257814, "step": 638400 }, { "epoch": 0.7704353140519378, "learning_rate": 7.461894085264207e-06, "loss": 2.7995623779296874, "step": 638500 }, { "epoch": 0.7705559773744204, "learning_rate": 7.461490249796468e-06, "loss": 2.7841168212890626, "step": 638600 }, { "epoch": 0.7706766406969031, "learning_rate": 7.461086414328729e-06, "loss": 2.809776611328125, "step": 638700 }, { "epoch": 0.7707973040193857, "learning_rate": 7.46068257886099e-06, "loss": 2.806551513671875, "step": 638800 }, { "epoch": 0.7709179673418685, "learning_rate": 7.460278743393252e-06, "loss": 2.799233093261719, "step": 638900 }, { "epoch": 0.7710386306643512, "learning_rate": 7.459874907925514e-06, "loss": 2.8224993896484376, "step": 639000 }, { "epoch": 0.7711592939868338, "learning_rate": 7.459471072457776e-06, "loss": 2.798675537109375, "step": 639100 }, { "epoch": 0.7712799573093165, "learning_rate": 7.459067236990037e-06, "loss": 2.8178729248046874, "step": 639200 }, { "epoch": 0.7714006206317991, "learning_rate": 7.458663401522299e-06, "loss": 2.787048645019531, "step": 639300 }, { "epoch": 0.7715212839542819, "learning_rate": 7.458259566054561e-06, "loss": 2.8220550537109377, "step": 639400 }, { "epoch": 0.7716419472767646, "learning_rate": 7.457855730586821e-06, "loss": 2.809775390625, "step": 639500 }, { "epoch": 0.7717626105992472, "learning_rate": 7.457451895119083e-06, "loss": 2.8032269287109375, "step": 639600 }, { "epoch": 0.77188327392173, "learning_rate": 7.457048059651345e-06, "loss": 2.802798156738281, "step": 639700 }, { "epoch": 0.7720039372442126, "learning_rate": 7.4566442241836065e-06, "loss": 2.7987185668945314, "step": 639800 }, { "epoch": 0.7721246005666953, "learning_rate": 7.4562403887158685e-06, "loss": 2.8019683837890623, "step": 639900 }, { "epoch": 0.772245263889178, "learning_rate": 7.4558365532481304e-06, "loss": 2.8094406127929688, "step": 640000 }, { "epoch": 0.7723659272116606, "learning_rate": 7.4554327177803924e-06, "loss": 2.781033935546875, "step": 640100 }, { "epoch": 0.7724865905341434, "learning_rate": 7.4550288823126536e-06, "loss": 2.830671691894531, "step": 640200 }, { "epoch": 0.772607253856626, "learning_rate": 7.454625046844915e-06, "loss": 2.8130642700195314, "step": 640300 }, { "epoch": 0.7727279171791087, "learning_rate": 7.454221211377176e-06, "loss": 2.795113830566406, "step": 640400 }, { "epoch": 0.7728485805015914, "learning_rate": 7.453817375909438e-06, "loss": 2.7911883544921876, "step": 640500 }, { "epoch": 0.7729692438240741, "learning_rate": 7.4534135404417e-06, "loss": 2.824063720703125, "step": 640600 }, { "epoch": 0.7730899071465568, "learning_rate": 7.453009704973962e-06, "loss": 2.7955221557617187, "step": 640700 }, { "epoch": 0.7732105704690394, "learning_rate": 7.452605869506223e-06, "loss": 2.810726318359375, "step": 640800 }, { "epoch": 0.7733312337915221, "learning_rate": 7.452202034038485e-06, "loss": 2.8075360107421874, "step": 640900 }, { "epoch": 0.7734518971140049, "learning_rate": 7.451798198570747e-06, "loss": 2.8090118408203124, "step": 641000 }, { "epoch": 0.7735725604364875, "learning_rate": 7.451394363103007e-06, "loss": 2.794954833984375, "step": 641100 }, { "epoch": 0.7736932237589702, "learning_rate": 7.450990527635269e-06, "loss": 2.7930673217773436, "step": 641200 }, { "epoch": 0.7738138870814528, "learning_rate": 7.450586692167531e-06, "loss": 2.783580627441406, "step": 641300 }, { "epoch": 0.7739345504039356, "learning_rate": 7.450182856699792e-06, "loss": 2.7946356201171874, "step": 641400 }, { "epoch": 0.7740552137264183, "learning_rate": 7.449779021232054e-06, "loss": 2.7804501342773436, "step": 641500 }, { "epoch": 0.7741758770489009, "learning_rate": 7.449375185764316e-06, "loss": 2.8231967163085936, "step": 641600 }, { "epoch": 0.7742965403713836, "learning_rate": 7.448971350296577e-06, "loss": 2.797424621582031, "step": 641700 }, { "epoch": 0.7744172036938662, "learning_rate": 7.448567514828839e-06, "loss": 2.8254598999023437, "step": 641800 }, { "epoch": 0.774537867016349, "learning_rate": 7.4481636793611005e-06, "loss": 2.800212097167969, "step": 641900 }, { "epoch": 0.7746585303388317, "learning_rate": 7.447759843893362e-06, "loss": 2.799847412109375, "step": 642000 }, { "epoch": 0.7747791936613143, "learning_rate": 7.447356008425624e-06, "loss": 2.7982672119140624, "step": 642100 }, { "epoch": 0.774899856983797, "learning_rate": 7.446952172957886e-06, "loss": 2.7974948120117187, "step": 642200 }, { "epoch": 0.7750205203062797, "learning_rate": 7.446548337490147e-06, "loss": 2.7808526611328124, "step": 642300 }, { "epoch": 0.7751411836287624, "learning_rate": 7.446144502022409e-06, "loss": 2.7849496459960936, "step": 642400 }, { "epoch": 0.7752618469512451, "learning_rate": 7.445740666554671e-06, "loss": 2.8252993774414064, "step": 642500 }, { "epoch": 0.7753825102737277, "learning_rate": 7.445336831086933e-06, "loss": 2.7983026123046875, "step": 642600 }, { "epoch": 0.7755031735962105, "learning_rate": 7.444932995619193e-06, "loss": 2.8225552368164064, "step": 642700 }, { "epoch": 0.7756238369186931, "learning_rate": 7.444529160151455e-06, "loss": 2.796225280761719, "step": 642800 }, { "epoch": 0.7757445002411758, "learning_rate": 7.444125324683716e-06, "loss": 2.797408142089844, "step": 642900 }, { "epoch": 0.7758651635636585, "learning_rate": 7.443721489215978e-06, "loss": 2.8313677978515623, "step": 643000 }, { "epoch": 0.7759858268861412, "learning_rate": 7.44331765374824e-06, "loss": 2.79855224609375, "step": 643100 }, { "epoch": 0.7761064902086239, "learning_rate": 7.442913818280502e-06, "loss": 2.8013034057617188, "step": 643200 }, { "epoch": 0.7762271535311066, "learning_rate": 7.442509982812763e-06, "loss": 2.791241455078125, "step": 643300 }, { "epoch": 0.7763478168535892, "learning_rate": 7.442106147345025e-06, "loss": 2.803466491699219, "step": 643400 }, { "epoch": 0.776468480176072, "learning_rate": 7.441702311877287e-06, "loss": 2.8065109252929688, "step": 643500 }, { "epoch": 0.7765891434985546, "learning_rate": 7.441298476409547e-06, "loss": 2.8209933471679687, "step": 643600 }, { "epoch": 0.7767098068210373, "learning_rate": 7.440894640941809e-06, "loss": 2.784701232910156, "step": 643700 }, { "epoch": 0.77683047014352, "learning_rate": 7.440490805474071e-06, "loss": 2.811717529296875, "step": 643800 }, { "epoch": 0.7769511334660026, "learning_rate": 7.4400869700063325e-06, "loss": 2.7684066772460936, "step": 643900 }, { "epoch": 0.7770717967884854, "learning_rate": 7.4396831345385945e-06, "loss": 2.8030841064453127, "step": 644000 }, { "epoch": 0.777192460110968, "learning_rate": 7.4392792990708565e-06, "loss": 2.801991271972656, "step": 644100 }, { "epoch": 0.7773131234334507, "learning_rate": 7.438875463603118e-06, "loss": 2.8076577758789063, "step": 644200 }, { "epoch": 0.7774337867559334, "learning_rate": 7.43847162813538e-06, "loss": 2.785273132324219, "step": 644300 }, { "epoch": 0.7775544500784161, "learning_rate": 7.438067792667641e-06, "loss": 2.7681045532226562, "step": 644400 }, { "epoch": 0.7776751134008988, "learning_rate": 7.437663957199902e-06, "loss": 2.8096875, "step": 644500 }, { "epoch": 0.7777957767233814, "learning_rate": 7.437260121732164e-06, "loss": 2.8151321411132812, "step": 644600 }, { "epoch": 0.7779164400458641, "learning_rate": 7.436856286264426e-06, "loss": 2.8049139404296874, "step": 644700 }, { "epoch": 0.7780371033683469, "learning_rate": 7.436452450796687e-06, "loss": 2.7531466674804688, "step": 644800 }, { "epoch": 0.7781577666908295, "learning_rate": 7.436048615328949e-06, "loss": 2.7882122802734375, "step": 644900 }, { "epoch": 0.7782784300133122, "learning_rate": 7.435644779861211e-06, "loss": 2.8069497680664064, "step": 645000 }, { "epoch": 0.7783990933357948, "learning_rate": 7.435240944393473e-06, "loss": 2.8038626098632813, "step": 645100 }, { "epoch": 0.7785197566582776, "learning_rate": 7.434837108925733e-06, "loss": 2.79199462890625, "step": 645200 }, { "epoch": 0.7786404199807603, "learning_rate": 7.434433273457995e-06, "loss": 2.8295538330078127, "step": 645300 }, { "epoch": 0.7787610833032429, "learning_rate": 7.434029437990256e-06, "loss": 2.8368130493164063, "step": 645400 }, { "epoch": 0.7788817466257256, "learning_rate": 7.433625602522518e-06, "loss": 2.80603759765625, "step": 645500 }, { "epoch": 0.7790024099482082, "learning_rate": 7.43322176705478e-06, "loss": 2.794247741699219, "step": 645600 }, { "epoch": 0.779123073270691, "learning_rate": 7.432817931587042e-06, "loss": 2.79450927734375, "step": 645700 }, { "epoch": 0.7792437365931737, "learning_rate": 7.432414096119303e-06, "loss": 2.794268798828125, "step": 645800 }, { "epoch": 0.7793643999156563, "learning_rate": 7.432010260651565e-06, "loss": 2.781707763671875, "step": 645900 }, { "epoch": 0.779485063238139, "learning_rate": 7.431606425183826e-06, "loss": 2.7842803955078126, "step": 646000 }, { "epoch": 0.7796057265606217, "learning_rate": 7.431202589716088e-06, "loss": 2.8273434448242187, "step": 646100 }, { "epoch": 0.7797263898831044, "learning_rate": 7.43079875424835e-06, "loss": 2.7945376586914064, "step": 646200 }, { "epoch": 0.7798470532055871, "learning_rate": 7.430394918780612e-06, "loss": 2.792893981933594, "step": 646300 }, { "epoch": 0.7799677165280697, "learning_rate": 7.429991083312873e-06, "loss": 2.814039611816406, "step": 646400 }, { "epoch": 0.7800883798505525, "learning_rate": 7.429587247845135e-06, "loss": 2.784273681640625, "step": 646500 }, { "epoch": 0.7802090431730351, "learning_rate": 7.429183412377397e-06, "loss": 2.811090087890625, "step": 646600 }, { "epoch": 0.7803297064955178, "learning_rate": 7.428779576909658e-06, "loss": 2.7727545166015624, "step": 646700 }, { "epoch": 0.7804503698180005, "learning_rate": 7.428375741441919e-06, "loss": 2.79545654296875, "step": 646800 }, { "epoch": 0.7805710331404832, "learning_rate": 7.427971905974181e-06, "loss": 2.8199188232421877, "step": 646900 }, { "epoch": 0.7806916964629659, "learning_rate": 7.427568070506442e-06, "loss": 2.8087591552734374, "step": 647000 }, { "epoch": 0.7808123597854485, "learning_rate": 7.427164235038704e-06, "loss": 2.8018902587890624, "step": 647100 }, { "epoch": 0.7809330231079312, "learning_rate": 7.426760399570966e-06, "loss": 2.8068023681640626, "step": 647200 }, { "epoch": 0.781053686430414, "learning_rate": 7.426356564103227e-06, "loss": 2.780206298828125, "step": 647300 }, { "epoch": 0.7811743497528966, "learning_rate": 7.425952728635489e-06, "loss": 2.8132147216796874, "step": 647400 }, { "epoch": 0.7812950130753793, "learning_rate": 7.425548893167751e-06, "loss": 2.7968673706054688, "step": 647500 }, { "epoch": 0.7814156763978619, "learning_rate": 7.4251450577000115e-06, "loss": 2.7901736450195314, "step": 647600 }, { "epoch": 0.7815363397203446, "learning_rate": 7.4247412222322734e-06, "loss": 2.797579650878906, "step": 647700 }, { "epoch": 0.7816570030428274, "learning_rate": 7.4243373867645354e-06, "loss": 2.7747537231445314, "step": 647800 }, { "epoch": 0.78177766636531, "learning_rate": 7.4239335512967966e-06, "loss": 2.792848815917969, "step": 647900 }, { "epoch": 0.7818983296877927, "learning_rate": 7.4235297158290585e-06, "loss": 2.8133364868164064, "step": 648000 }, { "epoch": 0.7820189930102753, "learning_rate": 7.4231258803613205e-06, "loss": 2.8114834594726563, "step": 648100 }, { "epoch": 0.7821396563327581, "learning_rate": 7.4227220448935825e-06, "loss": 2.80548095703125, "step": 648200 }, { "epoch": 0.7822603196552408, "learning_rate": 7.422318209425844e-06, "loss": 2.790826721191406, "step": 648300 }, { "epoch": 0.7823809829777234, "learning_rate": 7.421914373958105e-06, "loss": 2.774923095703125, "step": 648400 }, { "epoch": 0.7825016463002061, "learning_rate": 7.421510538490366e-06, "loss": 2.7789620971679687, "step": 648500 }, { "epoch": 0.7826223096226889, "learning_rate": 7.421106703022628e-06, "loss": 2.8081011962890625, "step": 648600 }, { "epoch": 0.7827429729451715, "learning_rate": 7.42070286755489e-06, "loss": 2.7909561157226563, "step": 648700 }, { "epoch": 0.7828636362676542, "learning_rate": 7.420299032087152e-06, "loss": 2.7952871704101563, "step": 648800 }, { "epoch": 0.7829842995901368, "learning_rate": 7.419895196619413e-06, "loss": 2.8052932739257814, "step": 648900 }, { "epoch": 0.7831049629126196, "learning_rate": 7.419491361151675e-06, "loss": 2.819377136230469, "step": 649000 }, { "epoch": 0.7832256262351023, "learning_rate": 7.419087525683937e-06, "loss": 2.82023681640625, "step": 649100 }, { "epoch": 0.7833462895575849, "learning_rate": 7.418683690216198e-06, "loss": 2.8108856201171877, "step": 649200 }, { "epoch": 0.7834669528800676, "learning_rate": 7.418279854748459e-06, "loss": 2.781102294921875, "step": 649300 }, { "epoch": 0.7835876162025502, "learning_rate": 7.417876019280721e-06, "loss": 2.7746896362304687, "step": 649400 }, { "epoch": 0.783708279525033, "learning_rate": 7.417472183812982e-06, "loss": 2.791792907714844, "step": 649500 }, { "epoch": 0.7838289428475157, "learning_rate": 7.417068348345244e-06, "loss": 2.77331298828125, "step": 649600 }, { "epoch": 0.7839496061699983, "learning_rate": 7.416664512877506e-06, "loss": 2.812242431640625, "step": 649700 }, { "epoch": 0.784070269492481, "learning_rate": 7.4162606774097675e-06, "loss": 2.780318298339844, "step": 649800 }, { "epoch": 0.7841909328149637, "learning_rate": 7.4158568419420294e-06, "loss": 2.813304138183594, "step": 649900 }, { "epoch": 0.7843115961374464, "learning_rate": 7.415453006474291e-06, "loss": 2.8148846435546875, "step": 650000 }, { "epoch": 0.7844322594599291, "learning_rate": 7.415049171006552e-06, "loss": 2.807090148925781, "step": 650100 }, { "epoch": 0.7845529227824117, "learning_rate": 7.414645335538814e-06, "loss": 2.820609436035156, "step": 650200 }, { "epoch": 0.7846735861048945, "learning_rate": 7.414241500071076e-06, "loss": 2.8246429443359373, "step": 650300 }, { "epoch": 0.7847942494273771, "learning_rate": 7.413837664603337e-06, "loss": 2.8008038330078127, "step": 650400 }, { "epoch": 0.7849149127498598, "learning_rate": 7.413433829135599e-06, "loss": 2.79761962890625, "step": 650500 }, { "epoch": 0.7850355760723425, "learning_rate": 7.413029993667861e-06, "loss": 2.8181552124023437, "step": 650600 }, { "epoch": 0.7851562393948252, "learning_rate": 7.412626158200123e-06, "loss": 2.813277282714844, "step": 650700 }, { "epoch": 0.7852769027173079, "learning_rate": 7.412222322732384e-06, "loss": 2.7930374145507812, "step": 650800 }, { "epoch": 0.7853975660397905, "learning_rate": 7.411818487264645e-06, "loss": 2.785684814453125, "step": 650900 }, { "epoch": 0.7855182293622732, "learning_rate": 7.411414651796906e-06, "loss": 2.800728454589844, "step": 651000 }, { "epoch": 0.785638892684756, "learning_rate": 7.411010816329168e-06, "loss": 2.812364196777344, "step": 651100 }, { "epoch": 0.7857595560072386, "learning_rate": 7.41060698086143e-06, "loss": 2.7963671875, "step": 651200 }, { "epoch": 0.7858802193297213, "learning_rate": 7.410203145393692e-06, "loss": 2.78601806640625, "step": 651300 }, { "epoch": 0.7860008826522039, "learning_rate": 7.409799309925953e-06, "loss": 2.7887860107421876, "step": 651400 }, { "epoch": 0.7861215459746866, "learning_rate": 7.409395474458215e-06, "loss": 2.8027056884765624, "step": 651500 }, { "epoch": 0.7862422092971694, "learning_rate": 7.408991638990477e-06, "loss": 2.8188494873046874, "step": 651600 }, { "epoch": 0.786362872619652, "learning_rate": 7.4085878035227375e-06, "loss": 2.806413269042969, "step": 651700 }, { "epoch": 0.7864835359421347, "learning_rate": 7.4081839680549995e-06, "loss": 2.790466613769531, "step": 651800 }, { "epoch": 0.7866041992646173, "learning_rate": 7.4077801325872615e-06, "loss": 2.8119375610351565, "step": 651900 }, { "epoch": 0.7867248625871001, "learning_rate": 7.407376297119523e-06, "loss": 2.8192398071289064, "step": 652000 }, { "epoch": 0.7868455259095828, "learning_rate": 7.406972461651785e-06, "loss": 2.777142333984375, "step": 652100 }, { "epoch": 0.7869661892320654, "learning_rate": 7.4065686261840466e-06, "loss": 2.7916253662109374, "step": 652200 }, { "epoch": 0.7870868525545481, "learning_rate": 7.406164790716308e-06, "loss": 2.8010763549804687, "step": 652300 }, { "epoch": 0.7872075158770308, "learning_rate": 7.40576095524857e-06, "loss": 2.799225158691406, "step": 652400 }, { "epoch": 0.7873281791995135, "learning_rate": 7.405357119780831e-06, "loss": 2.8012130737304686, "step": 652500 }, { "epoch": 0.7874488425219962, "learning_rate": 7.404953284313092e-06, "loss": 2.792757873535156, "step": 652600 }, { "epoch": 0.7875695058444788, "learning_rate": 7.404549448845354e-06, "loss": 2.7983407592773437, "step": 652700 }, { "epoch": 0.7876901691669616, "learning_rate": 7.404145613377616e-06, "loss": 2.7867816162109373, "step": 652800 }, { "epoch": 0.7878108324894442, "learning_rate": 7.403741777909877e-06, "loss": 2.7692584228515624, "step": 652900 }, { "epoch": 0.7879314958119269, "learning_rate": 7.403337942442139e-06, "loss": 2.82015625, "step": 653000 }, { "epoch": 0.7880521591344096, "learning_rate": 7.402934106974401e-06, "loss": 2.781053466796875, "step": 653100 }, { "epoch": 0.7881728224568922, "learning_rate": 7.402530271506663e-06, "loss": 2.7840753173828126, "step": 653200 }, { "epoch": 0.788293485779375, "learning_rate": 7.402126436038923e-06, "loss": 2.784112854003906, "step": 653300 }, { "epoch": 0.7884141491018577, "learning_rate": 7.401722600571185e-06, "loss": 2.772276611328125, "step": 653400 }, { "epoch": 0.7885348124243403, "learning_rate": 7.401318765103446e-06, "loss": 2.7786004638671873, "step": 653500 }, { "epoch": 0.788655475746823, "learning_rate": 7.400914929635708e-06, "loss": 2.8094366455078124, "step": 653600 }, { "epoch": 0.7887761390693057, "learning_rate": 7.40051109416797e-06, "loss": 2.808651123046875, "step": 653700 }, { "epoch": 0.7888968023917884, "learning_rate": 7.400107258700232e-06, "loss": 2.8094168090820313, "step": 653800 }, { "epoch": 0.7890174657142711, "learning_rate": 7.3997034232324935e-06, "loss": 2.786241149902344, "step": 653900 }, { "epoch": 0.7891381290367537, "learning_rate": 7.3992995877647555e-06, "loss": 2.797081298828125, "step": 654000 }, { "epoch": 0.7892587923592365, "learning_rate": 7.3988957522970175e-06, "loss": 2.7973736572265624, "step": 654100 }, { "epoch": 0.7893794556817191, "learning_rate": 7.398491916829278e-06, "loss": 2.7939804077148436, "step": 654200 }, { "epoch": 0.7895001190042018, "learning_rate": 7.39808808136154e-06, "loss": 2.792857360839844, "step": 654300 }, { "epoch": 0.7896207823266845, "learning_rate": 7.397684245893802e-06, "loss": 2.78983642578125, "step": 654400 }, { "epoch": 0.7897414456491672, "learning_rate": 7.397280410426063e-06, "loss": 2.784940490722656, "step": 654500 }, { "epoch": 0.7898621089716499, "learning_rate": 7.396876574958325e-06, "loss": 2.7826373291015627, "step": 654600 }, { "epoch": 0.7899827722941325, "learning_rate": 7.396472739490587e-06, "loss": 2.796996765136719, "step": 654700 }, { "epoch": 0.7901034356166152, "learning_rate": 7.396068904022849e-06, "loss": 2.7768310546875, "step": 654800 }, { "epoch": 0.790224098939098, "learning_rate": 7.39566506855511e-06, "loss": 2.819232177734375, "step": 654900 }, { "epoch": 0.7903447622615806, "learning_rate": 7.395261233087371e-06, "loss": 2.8174673461914064, "step": 655000 }, { "epoch": 0.7904654255840633, "learning_rate": 7.394857397619632e-06, "loss": 2.7847885131835937, "step": 655100 }, { "epoch": 0.7905860889065459, "learning_rate": 7.394453562151894e-06, "loss": 2.784398498535156, "step": 655200 }, { "epoch": 0.7907067522290286, "learning_rate": 7.394049726684156e-06, "loss": 2.8010406494140625, "step": 655300 }, { "epoch": 0.7908274155515114, "learning_rate": 7.393645891216418e-06, "loss": 2.7829110717773435, "step": 655400 }, { "epoch": 0.790948078873994, "learning_rate": 7.393242055748679e-06, "loss": 2.798858642578125, "step": 655500 }, { "epoch": 0.7910687421964767, "learning_rate": 7.392838220280941e-06, "loss": 2.7971316528320314, "step": 655600 }, { "epoch": 0.7911894055189593, "learning_rate": 7.392434384813203e-06, "loss": 2.7993093872070314, "step": 655700 }, { "epoch": 0.7913100688414421, "learning_rate": 7.3920305493454635e-06, "loss": 2.7924017333984374, "step": 655800 }, { "epoch": 0.7914307321639248, "learning_rate": 7.3916267138777255e-06, "loss": 2.802512512207031, "step": 655900 }, { "epoch": 0.7915513954864074, "learning_rate": 7.3912228784099875e-06, "loss": 2.8014016723632813, "step": 656000 }, { "epoch": 0.7916720588088901, "learning_rate": 7.390819042942249e-06, "loss": 2.8237478637695315, "step": 656100 }, { "epoch": 0.7917927221313728, "learning_rate": 7.390415207474511e-06, "loss": 2.8255386352539062, "step": 656200 }, { "epoch": 0.7919133854538555, "learning_rate": 7.390011372006773e-06, "loss": 2.79927734375, "step": 656300 }, { "epoch": 0.7920340487763382, "learning_rate": 7.389607536539034e-06, "loss": 2.7872320556640626, "step": 656400 }, { "epoch": 0.7921547120988208, "learning_rate": 7.389203701071296e-06, "loss": 2.7966079711914062, "step": 656500 }, { "epoch": 0.7922753754213036, "learning_rate": 7.388799865603557e-06, "loss": 2.8005999755859374, "step": 656600 }, { "epoch": 0.7923960387437862, "learning_rate": 7.388396030135818e-06, "loss": 2.7729583740234376, "step": 656700 }, { "epoch": 0.7925167020662689, "learning_rate": 7.38799219466808e-06, "loss": 2.788101806640625, "step": 656800 }, { "epoch": 0.7926373653887516, "learning_rate": 7.387588359200342e-06, "loss": 2.818209533691406, "step": 656900 }, { "epoch": 0.7927580287112342, "learning_rate": 7.387184523732603e-06, "loss": 2.7764602661132813, "step": 657000 }, { "epoch": 0.792878692033717, "learning_rate": 7.386780688264865e-06, "loss": 2.783212890625, "step": 657100 }, { "epoch": 0.7929993553561996, "learning_rate": 7.386376852797127e-06, "loss": 2.802919921875, "step": 657200 }, { "epoch": 0.7931200186786823, "learning_rate": 7.385973017329389e-06, "loss": 2.82133544921875, "step": 657300 }, { "epoch": 0.793240682001165, "learning_rate": 7.385569181861649e-06, "loss": 2.771608581542969, "step": 657400 }, { "epoch": 0.7933613453236477, "learning_rate": 7.385165346393911e-06, "loss": 2.792261962890625, "step": 657500 }, { "epoch": 0.7934820086461304, "learning_rate": 7.3847615109261724e-06, "loss": 2.7808551025390624, "step": 657600 }, { "epoch": 0.793602671968613, "learning_rate": 7.384357675458434e-06, "loss": 2.7785824584960936, "step": 657700 }, { "epoch": 0.7937233352910957, "learning_rate": 7.383953839990696e-06, "loss": 2.7540673828125, "step": 657800 }, { "epoch": 0.7938439986135785, "learning_rate": 7.383550004522958e-06, "loss": 2.778395080566406, "step": 657900 }, { "epoch": 0.7939646619360611, "learning_rate": 7.3831461690552195e-06, "loss": 2.7874209594726564, "step": 658000 }, { "epoch": 0.7940853252585438, "learning_rate": 7.3827423335874815e-06, "loss": 2.82052490234375, "step": 658100 }, { "epoch": 0.7942059885810264, "learning_rate": 7.382338498119742e-06, "loss": 2.7886251831054687, "step": 658200 }, { "epoch": 0.7943266519035092, "learning_rate": 7.381934662652004e-06, "loss": 2.8138217163085937, "step": 658300 }, { "epoch": 0.7944473152259919, "learning_rate": 7.381530827184266e-06, "loss": 2.7949624633789063, "step": 658400 }, { "epoch": 0.7945679785484745, "learning_rate": 7.381126991716528e-06, "loss": 2.7925430297851563, "step": 658500 }, { "epoch": 0.7946886418709572, "learning_rate": 7.380723156248789e-06, "loss": 2.7645278930664063, "step": 658600 }, { "epoch": 0.79480930519344, "learning_rate": 7.380319320781051e-06, "loss": 2.806607971191406, "step": 658700 }, { "epoch": 0.7949299685159226, "learning_rate": 7.379915485313313e-06, "loss": 2.790441589355469, "step": 658800 }, { "epoch": 0.7950506318384053, "learning_rate": 7.379511649845574e-06, "loss": 2.795, "step": 658900 }, { "epoch": 0.7951712951608879, "learning_rate": 7.379107814377836e-06, "loss": 2.809898681640625, "step": 659000 }, { "epoch": 0.7952919584833706, "learning_rate": 7.378703978910097e-06, "loss": 2.7773202514648436, "step": 659100 }, { "epoch": 0.7954126218058534, "learning_rate": 7.378300143442358e-06, "loss": 2.7560894775390623, "step": 659200 }, { "epoch": 0.795533285128336, "learning_rate": 7.37789630797462e-06, "loss": 2.773792724609375, "step": 659300 }, { "epoch": 0.7956539484508187, "learning_rate": 7.377492472506882e-06, "loss": 2.7895248413085936, "step": 659400 }, { "epoch": 0.7957746117733013, "learning_rate": 7.377088637039143e-06, "loss": 2.7947698974609376, "step": 659500 }, { "epoch": 0.7958952750957841, "learning_rate": 7.376684801571405e-06, "loss": 2.7723992919921874, "step": 659600 }, { "epoch": 0.7960159384182668, "learning_rate": 7.376280966103667e-06, "loss": 2.7925439453125, "step": 659700 }, { "epoch": 0.7961366017407494, "learning_rate": 7.375877130635929e-06, "loss": 2.807578125, "step": 659800 }, { "epoch": 0.7962572650632321, "learning_rate": 7.3754732951681896e-06, "loss": 2.782637023925781, "step": 659900 }, { "epoch": 0.7963779283857148, "learning_rate": 7.3750694597004515e-06, "loss": 2.7776123046875, "step": 660000 }, { "epoch": 0.7964985917081975, "learning_rate": 7.374665624232713e-06, "loss": 2.789456787109375, "step": 660100 }, { "epoch": 0.7966192550306802, "learning_rate": 7.374261788764975e-06, "loss": 2.791808776855469, "step": 660200 }, { "epoch": 0.7967399183531628, "learning_rate": 7.373857953297237e-06, "loss": 2.7873214721679687, "step": 660300 }, { "epoch": 0.7968605816756456, "learning_rate": 7.373454117829499e-06, "loss": 2.751332092285156, "step": 660400 }, { "epoch": 0.7969812449981282, "learning_rate": 7.37305028236176e-06, "loss": 2.786790771484375, "step": 660500 }, { "epoch": 0.7971019083206109, "learning_rate": 7.372646446894022e-06, "loss": 2.7691900634765627, "step": 660600 }, { "epoch": 0.7972225716430936, "learning_rate": 7.372242611426282e-06, "loss": 2.773759765625, "step": 660700 }, { "epoch": 0.7973432349655762, "learning_rate": 7.371838775958544e-06, "loss": 2.795589599609375, "step": 660800 }, { "epoch": 0.797463898288059, "learning_rate": 7.371434940490806e-06, "loss": 2.792037353515625, "step": 660900 }, { "epoch": 0.7975845616105416, "learning_rate": 7.371031105023068e-06, "loss": 2.7888421630859375, "step": 661000 }, { "epoch": 0.7977052249330243, "learning_rate": 7.370627269555329e-06, "loss": 2.8155197143554687, "step": 661100 }, { "epoch": 0.797825888255507, "learning_rate": 7.370223434087591e-06, "loss": 2.8025848388671877, "step": 661200 }, { "epoch": 0.7979465515779897, "learning_rate": 7.369819598619853e-06, "loss": 2.7878948974609377, "step": 661300 }, { "epoch": 0.7980672149004724, "learning_rate": 7.369415763152114e-06, "loss": 2.7930889892578126, "step": 661400 }, { "epoch": 0.798187878222955, "learning_rate": 7.369011927684375e-06, "loss": 2.79222900390625, "step": 661500 }, { "epoch": 0.7983085415454377, "learning_rate": 7.368608092216637e-06, "loss": 2.787877197265625, "step": 661600 }, { "epoch": 0.7984292048679205, "learning_rate": 7.3682042567488985e-06, "loss": 2.7590106201171873, "step": 661700 }, { "epoch": 0.7985498681904031, "learning_rate": 7.3678004212811605e-06, "loss": 2.769784240722656, "step": 661800 }, { "epoch": 0.7986705315128858, "learning_rate": 7.3673965858134224e-06, "loss": 2.7575341796875, "step": 661900 }, { "epoch": 0.7987911948353684, "learning_rate": 7.3669927503456836e-06, "loss": 2.8153366088867187, "step": 662000 }, { "epoch": 0.7989118581578512, "learning_rate": 7.3665889148779456e-06, "loss": 2.7815582275390627, "step": 662100 }, { "epoch": 0.7990325214803339, "learning_rate": 7.3661850794102075e-06, "loss": 2.8085784912109375, "step": 662200 }, { "epoch": 0.7991531848028165, "learning_rate": 7.365781243942468e-06, "loss": 2.7746963500976562, "step": 662300 }, { "epoch": 0.7992738481252992, "learning_rate": 7.36537740847473e-06, "loss": 2.803014221191406, "step": 662400 }, { "epoch": 0.7993945114477818, "learning_rate": 7.364973573006992e-06, "loss": 2.785816955566406, "step": 662500 }, { "epoch": 0.7995151747702646, "learning_rate": 7.364569737539253e-06, "loss": 2.8019845581054685, "step": 662600 }, { "epoch": 0.7996358380927473, "learning_rate": 7.364165902071515e-06, "loss": 2.7981805419921875, "step": 662700 }, { "epoch": 0.7997565014152299, "learning_rate": 7.363762066603777e-06, "loss": 2.801832275390625, "step": 662800 }, { "epoch": 0.7998771647377126, "learning_rate": 7.363358231136039e-06, "loss": 2.7599334716796875, "step": 662900 }, { "epoch": 0.7999978280601953, "learning_rate": 7.3629543956683e-06, "loss": 2.7765902709960937, "step": 663000 }, { "epoch": 0.800118491382678, "learning_rate": 7.362550560200561e-06, "loss": 2.7803604125976564, "step": 663100 }, { "epoch": 0.8002391547051607, "learning_rate": 7.362146724732822e-06, "loss": 2.805971984863281, "step": 663200 }, { "epoch": 0.8003598180276433, "learning_rate": 7.361742889265084e-06, "loss": 2.7982293701171876, "step": 663300 }, { "epoch": 0.8004804813501261, "learning_rate": 7.361339053797346e-06, "loss": 2.752122497558594, "step": 663400 }, { "epoch": 0.8006011446726087, "learning_rate": 7.360935218329608e-06, "loss": 2.759324951171875, "step": 663500 }, { "epoch": 0.8007218079950914, "learning_rate": 7.360531382861869e-06, "loss": 2.7706671142578125, "step": 663600 }, { "epoch": 0.8008424713175741, "learning_rate": 7.360127547394131e-06, "loss": 2.779388732910156, "step": 663700 }, { "epoch": 0.8009631346400568, "learning_rate": 7.359723711926393e-06, "loss": 2.7845867919921874, "step": 663800 }, { "epoch": 0.8010837979625395, "learning_rate": 7.3593198764586545e-06, "loss": 2.797130126953125, "step": 663900 }, { "epoch": 0.8012044612850222, "learning_rate": 7.358916040990916e-06, "loss": 2.783852233886719, "step": 664000 }, { "epoch": 0.8013251246075048, "learning_rate": 7.358512205523178e-06, "loss": 2.786119079589844, "step": 664100 }, { "epoch": 0.8014457879299876, "learning_rate": 7.358108370055439e-06, "loss": 2.767880859375, "step": 664200 }, { "epoch": 0.8015664512524702, "learning_rate": 7.357704534587701e-06, "loss": 2.794988098144531, "step": 664300 }, { "epoch": 0.8016871145749529, "learning_rate": 7.357300699119963e-06, "loss": 2.758273010253906, "step": 664400 }, { "epoch": 0.8018077778974356, "learning_rate": 7.356896863652224e-06, "loss": 2.791065673828125, "step": 664500 }, { "epoch": 0.8019284412199182, "learning_rate": 7.356493028184486e-06, "loss": 2.78525634765625, "step": 664600 }, { "epoch": 0.802049104542401, "learning_rate": 7.356089192716748e-06, "loss": 2.7733160400390626, "step": 664700 }, { "epoch": 0.8021697678648836, "learning_rate": 7.355685357249008e-06, "loss": 2.7771453857421875, "step": 664800 }, { "epoch": 0.8022904311873663, "learning_rate": 7.35528152178127e-06, "loss": 2.766620788574219, "step": 664900 }, { "epoch": 0.802411094509849, "learning_rate": 7.354877686313532e-06, "loss": 2.791540222167969, "step": 665000 }, { "epoch": 0.8025317578323317, "learning_rate": 7.354473850845793e-06, "loss": 2.7797222900390626, "step": 665100 }, { "epoch": 0.8026524211548144, "learning_rate": 7.354070015378055e-06, "loss": 2.7765823364257813, "step": 665200 }, { "epoch": 0.802773084477297, "learning_rate": 7.353666179910317e-06, "loss": 2.7628494262695313, "step": 665300 }, { "epoch": 0.8028937477997797, "learning_rate": 7.353262344442579e-06, "loss": 2.789728088378906, "step": 665400 }, { "epoch": 0.8030144111222625, "learning_rate": 7.35285850897484e-06, "loss": 2.764951171875, "step": 665500 }, { "epoch": 0.8031350744447451, "learning_rate": 7.352454673507101e-06, "loss": 2.7846725463867186, "step": 665600 }, { "epoch": 0.8032557377672278, "learning_rate": 7.3520508380393625e-06, "loss": 2.8048196411132813, "step": 665700 }, { "epoch": 0.8033764010897104, "learning_rate": 7.3516470025716245e-06, "loss": 2.7994088745117187, "step": 665800 }, { "epoch": 0.8034970644121932, "learning_rate": 7.3512431671038865e-06, "loss": 2.772532958984375, "step": 665900 }, { "epoch": 0.8036177277346759, "learning_rate": 7.3508393316361485e-06, "loss": 2.7886767578125, "step": 666000 }, { "epoch": 0.8037383910571585, "learning_rate": 7.35043549616841e-06, "loss": 2.805261535644531, "step": 666100 }, { "epoch": 0.8038590543796412, "learning_rate": 7.350031660700672e-06, "loss": 2.777310485839844, "step": 666200 }, { "epoch": 0.8039797177021238, "learning_rate": 7.3496278252329336e-06, "loss": 2.80323974609375, "step": 666300 }, { "epoch": 0.8041003810246066, "learning_rate": 7.349223989765194e-06, "loss": 2.7863595581054685, "step": 666400 }, { "epoch": 0.8042210443470893, "learning_rate": 7.348820154297456e-06, "loss": 2.7771896362304687, "step": 666500 }, { "epoch": 0.8043417076695719, "learning_rate": 7.348416318829718e-06, "loss": 2.7987991333007813, "step": 666600 }, { "epoch": 0.8044623709920546, "learning_rate": 7.348012483361979e-06, "loss": 2.7728643798828125, "step": 666700 }, { "epoch": 0.8045830343145373, "learning_rate": 7.347608647894241e-06, "loss": 2.8204156494140626, "step": 666800 }, { "epoch": 0.80470369763702, "learning_rate": 7.347204812426503e-06, "loss": 2.7827682495117188, "step": 666900 }, { "epoch": 0.8048243609595027, "learning_rate": 7.346800976958765e-06, "loss": 2.770790710449219, "step": 667000 }, { "epoch": 0.8049450242819853, "learning_rate": 7.346397141491026e-06, "loss": 2.807127685546875, "step": 667100 }, { "epoch": 0.8050656876044681, "learning_rate": 7.345993306023287e-06, "loss": 2.774967041015625, "step": 667200 }, { "epoch": 0.8051863509269507, "learning_rate": 7.345589470555548e-06, "loss": 2.772124938964844, "step": 667300 }, { "epoch": 0.8053070142494334, "learning_rate": 7.34518563508781e-06, "loss": 2.804805908203125, "step": 667400 }, { "epoch": 0.8054276775719161, "learning_rate": 7.344781799620072e-06, "loss": 2.7840206909179686, "step": 667500 }, { "epoch": 0.8055483408943988, "learning_rate": 7.344377964152334e-06, "loss": 2.7858447265625, "step": 667600 }, { "epoch": 0.8056690042168815, "learning_rate": 7.343974128684595e-06, "loss": 2.792890930175781, "step": 667700 }, { "epoch": 0.8057896675393641, "learning_rate": 7.343570293216857e-06, "loss": 2.7870553588867186, "step": 667800 }, { "epoch": 0.8059103308618468, "learning_rate": 7.343166457749119e-06, "loss": 2.798052978515625, "step": 667900 }, { "epoch": 0.8060309941843296, "learning_rate": 7.34276262228138e-06, "loss": 2.7840646362304686, "step": 668000 }, { "epoch": 0.8061516575068122, "learning_rate": 7.342358786813642e-06, "loss": 2.7588845825195314, "step": 668100 }, { "epoch": 0.8062723208292949, "learning_rate": 7.341954951345904e-06, "loss": 2.7744430541992187, "step": 668200 }, { "epoch": 0.8063929841517775, "learning_rate": 7.341551115878165e-06, "loss": 2.7746337890625, "step": 668300 }, { "epoch": 0.8065136474742602, "learning_rate": 7.341147280410427e-06, "loss": 2.7823443603515625, "step": 668400 }, { "epoch": 0.806634310796743, "learning_rate": 7.340743444942689e-06, "loss": 2.7789727783203126, "step": 668500 }, { "epoch": 0.8067549741192256, "learning_rate": 7.34033960947495e-06, "loss": 2.798805847167969, "step": 668600 }, { "epoch": 0.8068756374417083, "learning_rate": 7.339935774007212e-06, "loss": 2.782273864746094, "step": 668700 }, { "epoch": 0.8069963007641909, "learning_rate": 7.339531938539473e-06, "loss": 2.767358703613281, "step": 668800 }, { "epoch": 0.8071169640866737, "learning_rate": 7.339128103071734e-06, "loss": 2.775126953125, "step": 668900 }, { "epoch": 0.8072376274091564, "learning_rate": 7.338724267603996e-06, "loss": 2.785374755859375, "step": 669000 }, { "epoch": 0.807358290731639, "learning_rate": 7.338320432136258e-06, "loss": 2.773117980957031, "step": 669100 }, { "epoch": 0.8074789540541217, "learning_rate": 7.337916596668519e-06, "loss": 2.79136474609375, "step": 669200 }, { "epoch": 0.8075996173766045, "learning_rate": 7.337512761200781e-06, "loss": 2.75295654296875, "step": 669300 }, { "epoch": 0.8077202806990871, "learning_rate": 7.337108925733043e-06, "loss": 2.7753939819335938, "step": 669400 }, { "epoch": 0.8078409440215698, "learning_rate": 7.336705090265305e-06, "loss": 2.7691995239257814, "step": 669500 }, { "epoch": 0.8079616073440524, "learning_rate": 7.336301254797566e-06, "loss": 2.77121337890625, "step": 669600 }, { "epoch": 0.8080822706665352, "learning_rate": 7.335897419329827e-06, "loss": 2.805318603515625, "step": 669700 }, { "epoch": 0.8082029339890179, "learning_rate": 7.3354935838620886e-06, "loss": 2.758067932128906, "step": 669800 }, { "epoch": 0.8083235973115005, "learning_rate": 7.3350897483943505e-06, "loss": 2.7659542846679686, "step": 669900 }, { "epoch": 0.8084442606339832, "learning_rate": 7.3346859129266125e-06, "loss": 2.7943734741210937, "step": 670000 }, { "epoch": 0.8085649239564658, "learning_rate": 7.3342820774588745e-06, "loss": 2.7637985229492186, "step": 670100 }, { "epoch": 0.8086855872789486, "learning_rate": 7.333878241991136e-06, "loss": 2.7870721435546875, "step": 670200 }, { "epoch": 0.8088062506014313, "learning_rate": 7.333474406523398e-06, "loss": 2.791502685546875, "step": 670300 }, { "epoch": 0.8089269139239139, "learning_rate": 7.33307057105566e-06, "loss": 2.770005187988281, "step": 670400 }, { "epoch": 0.8090475772463966, "learning_rate": 7.33266673558792e-06, "loss": 2.7822671508789063, "step": 670500 }, { "epoch": 0.8091682405688793, "learning_rate": 7.332262900120182e-06, "loss": 2.7513616943359374, "step": 670600 }, { "epoch": 0.809288903891362, "learning_rate": 7.331859064652444e-06, "loss": 2.7921597290039064, "step": 670700 }, { "epoch": 0.8094095672138447, "learning_rate": 7.331455229184705e-06, "loss": 2.775643615722656, "step": 670800 }, { "epoch": 0.8095302305363273, "learning_rate": 7.331051393716967e-06, "loss": 2.7852047729492186, "step": 670900 }, { "epoch": 0.8096508938588101, "learning_rate": 7.330647558249229e-06, "loss": 2.772471618652344, "step": 671000 }, { "epoch": 0.8097715571812927, "learning_rate": 7.33024372278149e-06, "loss": 2.7878985595703125, "step": 671100 }, { "epoch": 0.8098922205037754, "learning_rate": 7.329839887313752e-06, "loss": 2.7733609008789064, "step": 671200 }, { "epoch": 0.8100128838262581, "learning_rate": 7.329436051846013e-06, "loss": 2.7803582763671875, "step": 671300 }, { "epoch": 0.8101335471487408, "learning_rate": 7.329032216378274e-06, "loss": 2.7941995239257813, "step": 671400 }, { "epoch": 0.8102542104712235, "learning_rate": 7.328628380910536e-06, "loss": 2.7581256103515623, "step": 671500 }, { "epoch": 0.8103748737937061, "learning_rate": 7.328224545442798e-06, "loss": 2.7770376586914063, "step": 671600 }, { "epoch": 0.8104955371161888, "learning_rate": 7.3278207099750594e-06, "loss": 2.764063720703125, "step": 671700 }, { "epoch": 0.8106162004386716, "learning_rate": 7.3274168745073214e-06, "loss": 2.7906890869140626, "step": 671800 }, { "epoch": 0.8107368637611542, "learning_rate": 7.327013039039583e-06, "loss": 2.7944598388671875, "step": 671900 }, { "epoch": 0.8108575270836369, "learning_rate": 7.326609203571845e-06, "loss": 2.762570495605469, "step": 672000 }, { "epoch": 0.8109781904061195, "learning_rate": 7.326205368104106e-06, "loss": 2.779108581542969, "step": 672100 }, { "epoch": 0.8110988537286022, "learning_rate": 7.325801532636368e-06, "loss": 2.782147216796875, "step": 672200 }, { "epoch": 0.811219517051085, "learning_rate": 7.325397697168629e-06, "loss": 2.779765319824219, "step": 672300 }, { "epoch": 0.8113401803735676, "learning_rate": 7.324993861700891e-06, "loss": 2.7478057861328127, "step": 672400 }, { "epoch": 0.8114608436960503, "learning_rate": 7.324590026233153e-06, "loss": 2.7575408935546877, "step": 672500 }, { "epoch": 0.8115815070185329, "learning_rate": 7.324186190765415e-06, "loss": 2.774888610839844, "step": 672600 }, { "epoch": 0.8117021703410157, "learning_rate": 7.323782355297676e-06, "loss": 2.770577392578125, "step": 672700 }, { "epoch": 0.8118228336634984, "learning_rate": 7.323378519829938e-06, "loss": 2.7907574462890623, "step": 672800 }, { "epoch": 0.811943496985981, "learning_rate": 7.322974684362198e-06, "loss": 2.792117004394531, "step": 672900 }, { "epoch": 0.8120641603084637, "learning_rate": 7.32257084889446e-06, "loss": 2.7660174560546875, "step": 673000 }, { "epoch": 0.8121848236309464, "learning_rate": 7.322167013426722e-06, "loss": 2.77701416015625, "step": 673100 }, { "epoch": 0.8123054869534291, "learning_rate": 7.321763177958984e-06, "loss": 2.7650604248046875, "step": 673200 }, { "epoch": 0.8124261502759118, "learning_rate": 7.321359342491245e-06, "loss": 2.7854238891601564, "step": 673300 }, { "epoch": 0.8125468135983944, "learning_rate": 7.320955507023507e-06, "loss": 2.776844482421875, "step": 673400 }, { "epoch": 0.8126674769208772, "learning_rate": 7.320551671555769e-06, "loss": 2.782826232910156, "step": 673500 }, { "epoch": 0.8127881402433598, "learning_rate": 7.32014783608803e-06, "loss": 2.7471697998046873, "step": 673600 }, { "epoch": 0.8129088035658425, "learning_rate": 7.3197440006202915e-06, "loss": 2.7987896728515627, "step": 673700 }, { "epoch": 0.8130294668883252, "learning_rate": 7.3193401651525535e-06, "loss": 2.7811871337890626, "step": 673800 }, { "epoch": 0.8131501302108078, "learning_rate": 7.318936329684815e-06, "loss": 2.7738702392578123, "step": 673900 }, { "epoch": 0.8132707935332906, "learning_rate": 7.3185324942170766e-06, "loss": 2.7958404541015627, "step": 674000 }, { "epoch": 0.8133914568557732, "learning_rate": 7.3181286587493386e-06, "loss": 2.8123013305664064, "step": 674100 }, { "epoch": 0.8135121201782559, "learning_rate": 7.3177248232816e-06, "loss": 2.7953521728515627, "step": 674200 }, { "epoch": 0.8136327835007386, "learning_rate": 7.317320987813862e-06, "loss": 2.7777886962890626, "step": 674300 }, { "epoch": 0.8137534468232213, "learning_rate": 7.316917152346124e-06, "loss": 2.7687893676757813, "step": 674400 }, { "epoch": 0.813874110145704, "learning_rate": 7.316513316878386e-06, "loss": 2.7885232543945313, "step": 674500 }, { "epoch": 0.8139947734681867, "learning_rate": 7.316109481410646e-06, "loss": 2.785223083496094, "step": 674600 }, { "epoch": 0.8141154367906693, "learning_rate": 7.315705645942908e-06, "loss": 2.78183349609375, "step": 674700 }, { "epoch": 0.8142361001131521, "learning_rate": 7.315301810475169e-06, "loss": 2.75867919921875, "step": 674800 }, { "epoch": 0.8143567634356347, "learning_rate": 7.314897975007431e-06, "loss": 2.7710635375976564, "step": 674900 }, { "epoch": 0.8144774267581174, "learning_rate": 7.314494139539693e-06, "loss": 2.7757638549804686, "step": 675000 }, { "epoch": 0.8145980900806001, "learning_rate": 7.314090304071955e-06, "loss": 2.797603759765625, "step": 675100 }, { "epoch": 0.8147187534030828, "learning_rate": 7.313686468604216e-06, "loss": 2.765887451171875, "step": 675200 }, { "epoch": 0.8148394167255655, "learning_rate": 7.313282633136478e-06, "loss": 2.7624163818359375, "step": 675300 }, { "epoch": 0.8149600800480481, "learning_rate": 7.312878797668738e-06, "loss": 2.788194580078125, "step": 675400 }, { "epoch": 0.8150807433705308, "learning_rate": 7.312474962201e-06, "loss": 2.798177490234375, "step": 675500 }, { "epoch": 0.8152014066930136, "learning_rate": 7.312071126733262e-06, "loss": 2.7722097778320314, "step": 675600 }, { "epoch": 0.8153220700154962, "learning_rate": 7.311667291265524e-06, "loss": 2.779398193359375, "step": 675700 }, { "epoch": 0.8154427333379789, "learning_rate": 7.3112634557977855e-06, "loss": 2.781210632324219, "step": 675800 }, { "epoch": 0.8155633966604615, "learning_rate": 7.3108596203300475e-06, "loss": 2.77276123046875, "step": 675900 }, { "epoch": 0.8156840599829442, "learning_rate": 7.3104557848623094e-06, "loss": 2.7947283935546876, "step": 676000 }, { "epoch": 0.815804723305427, "learning_rate": 7.310051949394571e-06, "loss": 2.80211669921875, "step": 676100 }, { "epoch": 0.8159253866279096, "learning_rate": 7.309648113926832e-06, "loss": 2.784278564453125, "step": 676200 }, { "epoch": 0.8160460499503923, "learning_rate": 7.309244278459094e-06, "loss": 2.790855712890625, "step": 676300 }, { "epoch": 0.8161667132728749, "learning_rate": 7.308840442991355e-06, "loss": 2.7782666015625, "step": 676400 }, { "epoch": 0.8162873765953577, "learning_rate": 7.308436607523617e-06, "loss": 2.77833984375, "step": 676500 }, { "epoch": 0.8164080399178404, "learning_rate": 7.308032772055879e-06, "loss": 2.7788742065429686, "step": 676600 }, { "epoch": 0.816528703240323, "learning_rate": 7.30762893658814e-06, "loss": 2.7719540405273437, "step": 676700 }, { "epoch": 0.8166493665628057, "learning_rate": 7.307225101120402e-06, "loss": 2.787636413574219, "step": 676800 }, { "epoch": 0.8167700298852884, "learning_rate": 7.306821265652664e-06, "loss": 2.789268798828125, "step": 676900 }, { "epoch": 0.8168906932077711, "learning_rate": 7.306417430184924e-06, "loss": 2.782451171875, "step": 677000 }, { "epoch": 0.8170113565302538, "learning_rate": 7.306013594717186e-06, "loss": 2.7727215576171873, "step": 677100 }, { "epoch": 0.8171320198527364, "learning_rate": 7.305609759249448e-06, "loss": 2.7946551513671873, "step": 677200 }, { "epoch": 0.8172526831752192, "learning_rate": 7.305205923781709e-06, "loss": 2.7975909423828127, "step": 677300 }, { "epoch": 0.8173733464977018, "learning_rate": 7.304802088313971e-06, "loss": 2.765296630859375, "step": 677400 }, { "epoch": 0.8174940098201845, "learning_rate": 7.304398252846233e-06, "loss": 2.796300964355469, "step": 677500 }, { "epoch": 0.8176146731426672, "learning_rate": 7.303994417378495e-06, "loss": 2.76763671875, "step": 677600 }, { "epoch": 0.8177353364651498, "learning_rate": 7.303590581910756e-06, "loss": 2.774588623046875, "step": 677700 }, { "epoch": 0.8178559997876326, "learning_rate": 7.3031867464430175e-06, "loss": 2.7680130004882812, "step": 677800 }, { "epoch": 0.8179766631101152, "learning_rate": 7.302782910975279e-06, "loss": 2.780946960449219, "step": 677900 }, { "epoch": 0.8180973264325979, "learning_rate": 7.302379075507541e-06, "loss": 2.7843597412109373, "step": 678000 }, { "epoch": 0.8182179897550806, "learning_rate": 7.301975240039803e-06, "loss": 2.762198791503906, "step": 678100 }, { "epoch": 0.8183386530775633, "learning_rate": 7.301571404572065e-06, "loss": 2.7904241943359374, "step": 678200 }, { "epoch": 0.818459316400046, "learning_rate": 7.301167569104326e-06, "loss": 2.7629043579101564, "step": 678300 }, { "epoch": 0.8185799797225286, "learning_rate": 7.300763733636588e-06, "loss": 2.7684771728515627, "step": 678400 }, { "epoch": 0.8187006430450113, "learning_rate": 7.30035989816885e-06, "loss": 2.7525875854492186, "step": 678500 }, { "epoch": 0.8188213063674941, "learning_rate": 7.29995606270111e-06, "loss": 2.78022216796875, "step": 678600 }, { "epoch": 0.8189419696899767, "learning_rate": 7.299552227233372e-06, "loss": 2.770039367675781, "step": 678700 }, { "epoch": 0.8190626330124594, "learning_rate": 7.299148391765634e-06, "loss": 2.7813906860351563, "step": 678800 }, { "epoch": 0.819183296334942, "learning_rate": 7.298744556297895e-06, "loss": 2.768718566894531, "step": 678900 }, { "epoch": 0.8193039596574248, "learning_rate": 7.298340720830157e-06, "loss": 2.750425109863281, "step": 679000 }, { "epoch": 0.8194246229799075, "learning_rate": 7.297936885362419e-06, "loss": 2.7760751342773435, "step": 679100 }, { "epoch": 0.8195452863023901, "learning_rate": 7.29753304989468e-06, "loss": 2.747894592285156, "step": 679200 }, { "epoch": 0.8196659496248728, "learning_rate": 7.297129214426942e-06, "loss": 2.771839904785156, "step": 679300 }, { "epoch": 0.8197866129473554, "learning_rate": 7.296725378959204e-06, "loss": 2.7960140991210936, "step": 679400 }, { "epoch": 0.8199072762698382, "learning_rate": 7.2963215434914644e-06, "loss": 2.776028747558594, "step": 679500 }, { "epoch": 0.8200279395923209, "learning_rate": 7.295917708023726e-06, "loss": 2.7511846923828127, "step": 679600 }, { "epoch": 0.8201486029148035, "learning_rate": 7.295513872555988e-06, "loss": 2.7819943237304687, "step": 679700 }, { "epoch": 0.8202692662372862, "learning_rate": 7.2951100370882495e-06, "loss": 2.747019958496094, "step": 679800 }, { "epoch": 0.820389929559769, "learning_rate": 7.2947062016205115e-06, "loss": 2.774222717285156, "step": 679900 }, { "epoch": 0.8205105928822516, "learning_rate": 7.2943023661527735e-06, "loss": 2.7718215942382813, "step": 680000 }, { "epoch": 0.8206312562047343, "learning_rate": 7.2938985306850355e-06, "loss": 2.780849609375, "step": 680100 }, { "epoch": 0.8207519195272169, "learning_rate": 7.293494695217297e-06, "loss": 2.783356018066406, "step": 680200 }, { "epoch": 0.8208725828496997, "learning_rate": 7.293090859749558e-06, "loss": 2.7759130859375, "step": 680300 }, { "epoch": 0.8209932461721824, "learning_rate": 7.292687024281819e-06, "loss": 2.776283874511719, "step": 680400 }, { "epoch": 0.821113909494665, "learning_rate": 7.292283188814081e-06, "loss": 2.7642578125, "step": 680500 }, { "epoch": 0.8212345728171477, "learning_rate": 7.291879353346343e-06, "loss": 2.7832626342773437, "step": 680600 }, { "epoch": 0.8213552361396304, "learning_rate": 7.291475517878605e-06, "loss": 2.7746176147460937, "step": 680700 }, { "epoch": 0.8214758994621131, "learning_rate": 7.291071682410866e-06, "loss": 2.7747976684570315, "step": 680800 }, { "epoch": 0.8215965627845958, "learning_rate": 7.290667846943128e-06, "loss": 2.7911410522460938, "step": 680900 }, { "epoch": 0.8217172261070784, "learning_rate": 7.29026401147539e-06, "loss": 2.772505798339844, "step": 681000 }, { "epoch": 0.8218378894295612, "learning_rate": 7.28986017600765e-06, "loss": 2.781540832519531, "step": 681100 }, { "epoch": 0.8219585527520438, "learning_rate": 7.289456340539912e-06, "loss": 2.750919189453125, "step": 681200 }, { "epoch": 0.8220792160745265, "learning_rate": 7.289052505072174e-06, "loss": 2.764035949707031, "step": 681300 }, { "epoch": 0.8221998793970092, "learning_rate": 7.288648669604435e-06, "loss": 2.798994445800781, "step": 681400 }, { "epoch": 0.8223205427194918, "learning_rate": 7.288244834136697e-06, "loss": 2.778087463378906, "step": 681500 }, { "epoch": 0.8224412060419746, "learning_rate": 7.287840998668959e-06, "loss": 2.770902404785156, "step": 681600 }, { "epoch": 0.8225618693644572, "learning_rate": 7.287437163201221e-06, "loss": 2.7659957885742186, "step": 681700 }, { "epoch": 0.8226825326869399, "learning_rate": 7.287033327733482e-06, "loss": 2.754152526855469, "step": 681800 }, { "epoch": 0.8228031960094226, "learning_rate": 7.2866294922657435e-06, "loss": 2.794879150390625, "step": 681900 }, { "epoch": 0.8229238593319053, "learning_rate": 7.286225656798005e-06, "loss": 2.791917419433594, "step": 682000 }, { "epoch": 0.823044522654388, "learning_rate": 7.285821821330267e-06, "loss": 2.798742370605469, "step": 682100 }, { "epoch": 0.8231651859768706, "learning_rate": 7.285417985862529e-06, "loss": 2.7911911010742188, "step": 682200 }, { "epoch": 0.8232858492993533, "learning_rate": 7.285014150394791e-06, "loss": 2.726761474609375, "step": 682300 }, { "epoch": 0.8234065126218361, "learning_rate": 7.284610314927052e-06, "loss": 2.76898681640625, "step": 682400 }, { "epoch": 0.8235271759443187, "learning_rate": 7.284206479459314e-06, "loss": 2.7621563720703124, "step": 682500 }, { "epoch": 0.8236478392668014, "learning_rate": 7.283802643991576e-06, "loss": 2.7733587646484374, "step": 682600 }, { "epoch": 0.823768502589284, "learning_rate": 7.283398808523836e-06, "loss": 2.793271484375, "step": 682700 }, { "epoch": 0.8238891659117668, "learning_rate": 7.282994973056098e-06, "loss": 2.76546630859375, "step": 682800 }, { "epoch": 0.8240098292342495, "learning_rate": 7.28259113758836e-06, "loss": 2.7817333984375, "step": 682900 }, { "epoch": 0.8241304925567321, "learning_rate": 7.282187302120621e-06, "loss": 2.7622714233398438, "step": 683000 }, { "epoch": 0.8242511558792148, "learning_rate": 7.281783466652883e-06, "loss": 2.765032958984375, "step": 683100 }, { "epoch": 0.8243718192016974, "learning_rate": 7.281379631185145e-06, "loss": 2.75868408203125, "step": 683200 }, { "epoch": 0.8244924825241802, "learning_rate": 7.280975795717406e-06, "loss": 2.7622296142578127, "step": 683300 }, { "epoch": 0.8246131458466629, "learning_rate": 7.280571960249668e-06, "loss": 2.76447021484375, "step": 683400 }, { "epoch": 0.8247338091691455, "learning_rate": 7.280168124781929e-06, "loss": 2.7963937377929686, "step": 683500 }, { "epoch": 0.8248544724916282, "learning_rate": 7.2797642893141905e-06, "loss": 2.785882873535156, "step": 683600 }, { "epoch": 0.8249751358141109, "learning_rate": 7.2793604538464524e-06, "loss": 2.7596749877929687, "step": 683700 }, { "epoch": 0.8250957991365936, "learning_rate": 7.2789566183787144e-06, "loss": 2.7607269287109375, "step": 683800 }, { "epoch": 0.8252164624590763, "learning_rate": 7.2785527829109756e-06, "loss": 2.767558898925781, "step": 683900 }, { "epoch": 0.8253371257815589, "learning_rate": 7.2781489474432375e-06, "loss": 2.746151123046875, "step": 684000 }, { "epoch": 0.8254577891040417, "learning_rate": 7.2777451119754995e-06, "loss": 2.785746765136719, "step": 684100 }, { "epoch": 0.8255784524265243, "learning_rate": 7.2773412765077615e-06, "loss": 2.772562255859375, "step": 684200 }, { "epoch": 0.825699115749007, "learning_rate": 7.276937441040022e-06, "loss": 2.7555859375, "step": 684300 }, { "epoch": 0.8258197790714897, "learning_rate": 7.276533605572284e-06, "loss": 2.7792007446289064, "step": 684400 }, { "epoch": 0.8259404423939724, "learning_rate": 7.276129770104545e-06, "loss": 2.759610900878906, "step": 684500 }, { "epoch": 0.8260611057164551, "learning_rate": 7.275725934636807e-06, "loss": 2.7839810180664064, "step": 684600 }, { "epoch": 0.8261817690389378, "learning_rate": 7.275322099169069e-06, "loss": 2.765096435546875, "step": 684700 }, { "epoch": 0.8263024323614204, "learning_rate": 7.274918263701331e-06, "loss": 2.7779061889648435, "step": 684800 }, { "epoch": 0.8264230956839032, "learning_rate": 7.274514428233592e-06, "loss": 2.796318359375, "step": 684900 }, { "epoch": 0.8265437590063858, "learning_rate": 7.274110592765854e-06, "loss": 2.8043829345703126, "step": 685000 }, { "epoch": 0.8266644223288685, "learning_rate": 7.273706757298116e-06, "loss": 2.764012756347656, "step": 685100 }, { "epoch": 0.8267850856513512, "learning_rate": 7.273302921830376e-06, "loss": 2.7973806762695315, "step": 685200 }, { "epoch": 0.8269057489738338, "learning_rate": 7.272899086362638e-06, "loss": 2.747877502441406, "step": 685300 }, { "epoch": 0.8270264122963166, "learning_rate": 7.2724952508949e-06, "loss": 2.727659912109375, "step": 685400 }, { "epoch": 0.8271470756187992, "learning_rate": 7.272091415427161e-06, "loss": 2.770906677246094, "step": 685500 }, { "epoch": 0.8272677389412819, "learning_rate": 7.271687579959423e-06, "loss": 2.765697326660156, "step": 685600 }, { "epoch": 0.8273884022637646, "learning_rate": 7.271283744491685e-06, "loss": 2.761227722167969, "step": 685700 }, { "epoch": 0.8275090655862473, "learning_rate": 7.2708799090239465e-06, "loss": 2.779718322753906, "step": 685800 }, { "epoch": 0.82762972890873, "learning_rate": 7.2704760735562084e-06, "loss": 2.74761962890625, "step": 685900 }, { "epoch": 0.8277503922312126, "learning_rate": 7.2700722380884696e-06, "loss": 2.758592529296875, "step": 686000 }, { "epoch": 0.8278710555536953, "learning_rate": 7.269668402620731e-06, "loss": 2.766251220703125, "step": 686100 }, { "epoch": 0.8279917188761781, "learning_rate": 7.269264567152993e-06, "loss": 2.7486810302734375, "step": 686200 }, { "epoch": 0.8281123821986607, "learning_rate": 7.268860731685255e-06, "loss": 2.7468301391601564, "step": 686300 }, { "epoch": 0.8282330455211434, "learning_rate": 7.268456896217516e-06, "loss": 2.783356018066406, "step": 686400 }, { "epoch": 0.828353708843626, "learning_rate": 7.268053060749778e-06, "loss": 2.796214904785156, "step": 686500 }, { "epoch": 0.8284743721661088, "learning_rate": 7.26764922528204e-06, "loss": 2.7551763916015624, "step": 686600 }, { "epoch": 0.8285950354885915, "learning_rate": 7.267245389814302e-06, "loss": 2.7310626220703127, "step": 686700 }, { "epoch": 0.8287156988110741, "learning_rate": 7.266841554346562e-06, "loss": 2.788240966796875, "step": 686800 }, { "epoch": 0.8288363621335568, "learning_rate": 7.266437718878824e-06, "loss": 2.7726473999023438, "step": 686900 }, { "epoch": 0.8289570254560394, "learning_rate": 7.266033883411085e-06, "loss": 2.7804150390625, "step": 687000 }, { "epoch": 0.8290776887785222, "learning_rate": 7.265630047943347e-06, "loss": 2.73583984375, "step": 687100 }, { "epoch": 0.8291983521010049, "learning_rate": 7.265226212475609e-06, "loss": 2.7614453125, "step": 687200 }, { "epoch": 0.8293190154234875, "learning_rate": 7.264822377007871e-06, "loss": 2.776871643066406, "step": 687300 }, { "epoch": 0.8294396787459702, "learning_rate": 7.264418541540132e-06, "loss": 2.7650790405273438, "step": 687400 }, { "epoch": 0.8295603420684529, "learning_rate": 7.264014706072394e-06, "loss": 2.7622006225585936, "step": 687500 }, { "epoch": 0.8296810053909356, "learning_rate": 7.2636108706046545e-06, "loss": 2.74801025390625, "step": 687600 }, { "epoch": 0.8298016687134183, "learning_rate": 7.2632070351369165e-06, "loss": 2.7588674926757815, "step": 687700 }, { "epoch": 0.8299223320359009, "learning_rate": 7.2628031996691785e-06, "loss": 2.7784210205078126, "step": 687800 }, { "epoch": 0.8300429953583837, "learning_rate": 7.2623993642014405e-06, "loss": 2.760014953613281, "step": 687900 }, { "epoch": 0.8301636586808663, "learning_rate": 7.261995528733702e-06, "loss": 2.766098937988281, "step": 688000 }, { "epoch": 0.830284322003349, "learning_rate": 7.261591693265964e-06, "loss": 2.7400997924804686, "step": 688100 }, { "epoch": 0.8304049853258317, "learning_rate": 7.2611878577982256e-06, "loss": 2.7693490600585937, "step": 688200 }, { "epoch": 0.8305256486483144, "learning_rate": 7.260784022330487e-06, "loss": 2.7861932373046874, "step": 688300 }, { "epoch": 0.8306463119707971, "learning_rate": 7.260380186862748e-06, "loss": 2.780870361328125, "step": 688400 }, { "epoch": 0.8307669752932797, "learning_rate": 7.25997635139501e-06, "loss": 2.762931213378906, "step": 688500 }, { "epoch": 0.8308876386157624, "learning_rate": 7.259572515927271e-06, "loss": 2.76712890625, "step": 688600 }, { "epoch": 0.8310083019382452, "learning_rate": 7.259168680459533e-06, "loss": 2.739679260253906, "step": 688700 }, { "epoch": 0.8311289652607278, "learning_rate": 7.258764844991795e-06, "loss": 2.770452575683594, "step": 688800 }, { "epoch": 0.8312496285832105, "learning_rate": 7.258361009524056e-06, "loss": 2.7772784423828125, "step": 688900 }, { "epoch": 0.8313702919056931, "learning_rate": 7.257957174056318e-06, "loss": 2.7580340576171873, "step": 689000 }, { "epoch": 0.8314909552281758, "learning_rate": 7.25755333858858e-06, "loss": 2.7548779296875, "step": 689100 }, { "epoch": 0.8316116185506586, "learning_rate": 7.25714950312084e-06, "loss": 2.7769586181640626, "step": 689200 }, { "epoch": 0.8317322818731412, "learning_rate": 7.256745667653102e-06, "loss": 2.7747686767578124, "step": 689300 }, { "epoch": 0.8318529451956239, "learning_rate": 7.256341832185364e-06, "loss": 2.7806280517578124, "step": 689400 }, { "epoch": 0.8319736085181065, "learning_rate": 7.255937996717625e-06, "loss": 2.7483615112304687, "step": 689500 }, { "epoch": 0.8320942718405893, "learning_rate": 7.255534161249887e-06, "loss": 2.766712951660156, "step": 689600 }, { "epoch": 0.832214935163072, "learning_rate": 7.255130325782149e-06, "loss": 2.7647628784179688, "step": 689700 }, { "epoch": 0.8323355984855546, "learning_rate": 7.254726490314411e-06, "loss": 2.779339599609375, "step": 689800 }, { "epoch": 0.8324562618080373, "learning_rate": 7.2543226548466725e-06, "loss": 2.734499816894531, "step": 689900 }, { "epoch": 0.8325769251305201, "learning_rate": 7.2539188193789345e-06, "loss": 2.7614596557617186, "step": 690000 }, { "epoch": 0.8326975884530027, "learning_rate": 7.253514983911195e-06, "loss": 2.7762570190429687, "step": 690100 }, { "epoch": 0.8328182517754854, "learning_rate": 7.253111148443457e-06, "loss": 2.7788519287109374, "step": 690200 }, { "epoch": 0.832938915097968, "learning_rate": 7.252707312975719e-06, "loss": 2.7794393920898437, "step": 690300 }, { "epoch": 0.8330595784204508, "learning_rate": 7.252303477507981e-06, "loss": 2.744797668457031, "step": 690400 }, { "epoch": 0.8331802417429335, "learning_rate": 7.251899642040242e-06, "loss": 2.7352310180664063, "step": 690500 }, { "epoch": 0.8333009050654161, "learning_rate": 7.251495806572504e-06, "loss": 2.760634765625, "step": 690600 }, { "epoch": 0.8334215683878988, "learning_rate": 7.251091971104766e-06, "loss": 2.747817077636719, "step": 690700 }, { "epoch": 0.8335422317103814, "learning_rate": 7.250688135637027e-06, "loss": 2.737945556640625, "step": 690800 }, { "epoch": 0.8336628950328642, "learning_rate": 7.250284300169288e-06, "loss": 2.768433837890625, "step": 690900 }, { "epoch": 0.8337835583553469, "learning_rate": 7.24988046470155e-06, "loss": 2.74574951171875, "step": 691000 }, { "epoch": 0.8339042216778295, "learning_rate": 7.249476629233811e-06, "loss": 2.7629129028320314, "step": 691100 }, { "epoch": 0.8340248850003122, "learning_rate": 7.249072793766073e-06, "loss": 2.746793518066406, "step": 691200 }, { "epoch": 0.8341455483227949, "learning_rate": 7.248668958298335e-06, "loss": 2.739273681640625, "step": 691300 }, { "epoch": 0.8342662116452776, "learning_rate": 7.248265122830596e-06, "loss": 2.781951904296875, "step": 691400 }, { "epoch": 0.8343868749677603, "learning_rate": 7.247861287362858e-06, "loss": 2.759024963378906, "step": 691500 }, { "epoch": 0.8345075382902429, "learning_rate": 7.24745745189512e-06, "loss": 2.77873291015625, "step": 691600 }, { "epoch": 0.8346282016127257, "learning_rate": 7.2470536164273806e-06, "loss": 2.7770071411132813, "step": 691700 }, { "epoch": 0.8347488649352083, "learning_rate": 7.2466497809596425e-06, "loss": 2.7521490478515624, "step": 691800 }, { "epoch": 0.834869528257691, "learning_rate": 7.2462459454919045e-06, "loss": 2.770146484375, "step": 691900 }, { "epoch": 0.8349901915801737, "learning_rate": 7.245842110024166e-06, "loss": 2.755367431640625, "step": 692000 }, { "epoch": 0.8351108549026564, "learning_rate": 7.245438274556428e-06, "loss": 2.7622604370117188, "step": 692100 }, { "epoch": 0.8352315182251391, "learning_rate": 7.24503443908869e-06, "loss": 2.76739990234375, "step": 692200 }, { "epoch": 0.8353521815476217, "learning_rate": 7.244630603620952e-06, "loss": 2.769892578125, "step": 692300 }, { "epoch": 0.8354728448701044, "learning_rate": 7.244226768153213e-06, "loss": 2.7444207763671873, "step": 692400 }, { "epoch": 0.8355935081925872, "learning_rate": 7.243822932685474e-06, "loss": 2.767644958496094, "step": 692500 }, { "epoch": 0.8357141715150698, "learning_rate": 7.243419097217735e-06, "loss": 2.753415222167969, "step": 692600 }, { "epoch": 0.8358348348375525, "learning_rate": 7.243015261749997e-06, "loss": 2.757127380371094, "step": 692700 }, { "epoch": 0.8359554981600351, "learning_rate": 7.242611426282259e-06, "loss": 2.7736105346679687, "step": 692800 }, { "epoch": 0.8360761614825178, "learning_rate": 7.242207590814521e-06, "loss": 2.7389935302734374, "step": 692900 }, { "epoch": 0.8361968248050006, "learning_rate": 7.241803755346782e-06, "loss": 2.7779116821289063, "step": 693000 }, { "epoch": 0.8363174881274832, "learning_rate": 7.241399919879044e-06, "loss": 2.75095703125, "step": 693100 }, { "epoch": 0.8364381514499659, "learning_rate": 7.240996084411306e-06, "loss": 2.772707214355469, "step": 693200 }, { "epoch": 0.8365588147724485, "learning_rate": 7.240592248943566e-06, "loss": 2.7717205810546877, "step": 693300 }, { "epoch": 0.8366794780949313, "learning_rate": 7.240188413475828e-06, "loss": 2.783363037109375, "step": 693400 }, { "epoch": 0.836800141417414, "learning_rate": 7.23978457800809e-06, "loss": 2.769794921875, "step": 693500 }, { "epoch": 0.8369208047398966, "learning_rate": 7.2393807425403514e-06, "loss": 2.737657470703125, "step": 693600 }, { "epoch": 0.8370414680623793, "learning_rate": 7.2389769070726134e-06, "loss": 2.770452880859375, "step": 693700 }, { "epoch": 0.837162131384862, "learning_rate": 7.238573071604875e-06, "loss": 2.74417236328125, "step": 693800 }, { "epoch": 0.8372827947073447, "learning_rate": 7.2381692361371365e-06, "loss": 2.7591851806640624, "step": 693900 }, { "epoch": 0.8374034580298274, "learning_rate": 7.2377654006693985e-06, "loss": 2.7601513671875, "step": 694000 }, { "epoch": 0.83752412135231, "learning_rate": 7.23736156520166e-06, "loss": 2.7459622192382813, "step": 694100 }, { "epoch": 0.8376447846747928, "learning_rate": 7.236957729733921e-06, "loss": 2.7640350341796873, "step": 694200 }, { "epoch": 0.8377654479972754, "learning_rate": 7.236553894266183e-06, "loss": 2.762540283203125, "step": 694300 }, { "epoch": 0.8378861113197581, "learning_rate": 7.236150058798445e-06, "loss": 2.7619268798828127, "step": 694400 }, { "epoch": 0.8380067746422408, "learning_rate": 7.235746223330706e-06, "loss": 2.7208523559570312, "step": 694500 }, { "epoch": 0.8381274379647234, "learning_rate": 7.235342387862968e-06, "loss": 2.736491394042969, "step": 694600 }, { "epoch": 0.8382481012872062, "learning_rate": 7.23493855239523e-06, "loss": 2.7519732666015626, "step": 694700 }, { "epoch": 0.8383687646096888, "learning_rate": 7.234534716927492e-06, "loss": 2.7600112915039063, "step": 694800 }, { "epoch": 0.8384894279321715, "learning_rate": 7.234130881459753e-06, "loss": 2.77838134765625, "step": 694900 }, { "epoch": 0.8386100912546542, "learning_rate": 7.233727045992014e-06, "loss": 2.778692626953125, "step": 695000 }, { "epoch": 0.8387307545771369, "learning_rate": 7.233323210524275e-06, "loss": 2.767226257324219, "step": 695100 }, { "epoch": 0.8388514178996196, "learning_rate": 7.232919375056537e-06, "loss": 2.7683566284179686, "step": 695200 }, { "epoch": 0.8389720812221023, "learning_rate": 7.232515539588799e-06, "loss": 2.7708123779296874, "step": 695300 }, { "epoch": 0.8390927445445849, "learning_rate": 7.232111704121061e-06, "loss": 2.755225830078125, "step": 695400 }, { "epoch": 0.8392134078670677, "learning_rate": 7.231707868653322e-06, "loss": 2.7623663330078125, "step": 695500 }, { "epoch": 0.8393340711895503, "learning_rate": 7.231304033185584e-06, "loss": 2.7495608520507813, "step": 695600 }, { "epoch": 0.839454734512033, "learning_rate": 7.230900197717846e-06, "loss": 2.754932556152344, "step": 695700 }, { "epoch": 0.8395753978345157, "learning_rate": 7.230496362250107e-06, "loss": 2.7537255859375, "step": 695800 }, { "epoch": 0.8396960611569984, "learning_rate": 7.2300925267823686e-06, "loss": 2.754486389160156, "step": 695900 }, { "epoch": 0.8398167244794811, "learning_rate": 7.2296886913146306e-06, "loss": 2.7523419189453127, "step": 696000 }, { "epoch": 0.8399373878019637, "learning_rate": 7.229284855846892e-06, "loss": 2.745189208984375, "step": 696100 }, { "epoch": 0.8400580511244464, "learning_rate": 7.228881020379154e-06, "loss": 2.7585690307617186, "step": 696200 }, { "epoch": 0.8401787144469292, "learning_rate": 7.228477184911416e-06, "loss": 2.757199401855469, "step": 696300 }, { "epoch": 0.8402993777694118, "learning_rate": 7.228073349443678e-06, "loss": 2.7604180908203126, "step": 696400 }, { "epoch": 0.8404200410918945, "learning_rate": 7.227669513975939e-06, "loss": 2.7483511352539063, "step": 696500 }, { "epoch": 0.8405407044143771, "learning_rate": 7.2272656785082e-06, "loss": 2.7624032592773435, "step": 696600 }, { "epoch": 0.8406613677368598, "learning_rate": 7.226861843040461e-06, "loss": 2.764954833984375, "step": 696700 }, { "epoch": 0.8407820310593426, "learning_rate": 7.226458007572723e-06, "loss": 2.7384982299804688, "step": 696800 }, { "epoch": 0.8409026943818252, "learning_rate": 7.226054172104985e-06, "loss": 2.7461196899414064, "step": 696900 }, { "epoch": 0.8410233577043079, "learning_rate": 7.225650336637247e-06, "loss": 2.73990966796875, "step": 697000 }, { "epoch": 0.8411440210267905, "learning_rate": 7.225246501169508e-06, "loss": 2.7417037963867186, "step": 697100 }, { "epoch": 0.8412646843492733, "learning_rate": 7.22484266570177e-06, "loss": 2.754837951660156, "step": 697200 }, { "epoch": 0.841385347671756, "learning_rate": 7.224438830234032e-06, "loss": 2.7644775390625, "step": 697300 }, { "epoch": 0.8415060109942386, "learning_rate": 7.224034994766292e-06, "loss": 2.7673019409179687, "step": 697400 }, { "epoch": 0.8416266743167213, "learning_rate": 7.223631159298554e-06, "loss": 2.7481979370117187, "step": 697500 }, { "epoch": 0.841747337639204, "learning_rate": 7.223227323830816e-06, "loss": 2.7859262084960936, "step": 697600 }, { "epoch": 0.8418680009616867, "learning_rate": 7.2228234883630775e-06, "loss": 2.7625445556640624, "step": 697700 }, { "epoch": 0.8419886642841694, "learning_rate": 7.2224196528953395e-06, "loss": 2.764498291015625, "step": 697800 }, { "epoch": 0.842109327606652, "learning_rate": 7.2220158174276014e-06, "loss": 2.747264404296875, "step": 697900 }, { "epoch": 0.8422299909291348, "learning_rate": 7.221611981959863e-06, "loss": 2.776311340332031, "step": 698000 }, { "epoch": 0.8423506542516174, "learning_rate": 7.2212081464921246e-06, "loss": 2.7646533203125, "step": 698100 }, { "epoch": 0.8424713175741001, "learning_rate": 7.220804311024386e-06, "loss": 2.7593475341796876, "step": 698200 }, { "epoch": 0.8425919808965828, "learning_rate": 7.220400475556647e-06, "loss": 2.742789611816406, "step": 698300 }, { "epoch": 0.8427126442190654, "learning_rate": 7.219996640088909e-06, "loss": 2.7323455810546875, "step": 698400 }, { "epoch": 0.8428333075415482, "learning_rate": 7.219592804621171e-06, "loss": 2.7811355590820312, "step": 698500 }, { "epoch": 0.8429539708640308, "learning_rate": 7.219188969153432e-06, "loss": 2.7867587280273436, "step": 698600 }, { "epoch": 0.8430746341865135, "learning_rate": 7.218785133685694e-06, "loss": 2.7540383911132813, "step": 698700 }, { "epoch": 0.8431952975089962, "learning_rate": 7.218381298217956e-06, "loss": 2.73100830078125, "step": 698800 }, { "epoch": 0.8433159608314789, "learning_rate": 7.217977462750218e-06, "loss": 2.7559234619140627, "step": 698900 }, { "epoch": 0.8434366241539616, "learning_rate": 7.217573627282478e-06, "loss": 2.7618115234375, "step": 699000 }, { "epoch": 0.8435572874764442, "learning_rate": 7.21716979181474e-06, "loss": 2.746187744140625, "step": 699100 }, { "epoch": 0.8436779507989269, "learning_rate": 7.216765956347001e-06, "loss": 2.7446331787109375, "step": 699200 }, { "epoch": 0.8437986141214097, "learning_rate": 7.216362120879263e-06, "loss": 2.7656594848632814, "step": 699300 }, { "epoch": 0.8439192774438923, "learning_rate": 7.215958285411525e-06, "loss": 2.7403350830078126, "step": 699400 }, { "epoch": 0.844039940766375, "learning_rate": 7.215554449943787e-06, "loss": 2.753825988769531, "step": 699500 }, { "epoch": 0.8441606040888576, "learning_rate": 7.215150614476048e-06, "loss": 2.739991455078125, "step": 699600 }, { "epoch": 0.8442812674113404, "learning_rate": 7.21474677900831e-06, "loss": 2.7475155639648436, "step": 699700 }, { "epoch": 0.8444019307338231, "learning_rate": 7.214342943540571e-06, "loss": 2.75184326171875, "step": 699800 }, { "epoch": 0.8445225940563057, "learning_rate": 7.213939108072833e-06, "loss": 2.735565490722656, "step": 699900 }, { "epoch": 0.8446432573787884, "learning_rate": 7.213535272605095e-06, "loss": 2.769859619140625, "step": 700000 }, { "epoch": 0.844763920701271, "learning_rate": 7.213131437137357e-06, "loss": 2.774072570800781, "step": 700100 }, { "epoch": 0.8448845840237538, "learning_rate": 7.212727601669618e-06, "loss": 2.7508477783203125, "step": 700200 }, { "epoch": 0.8450052473462365, "learning_rate": 7.21232376620188e-06, "loss": 2.7312185668945315, "step": 700300 }, { "epoch": 0.8451259106687191, "learning_rate": 7.211919930734142e-06, "loss": 2.72595947265625, "step": 700400 }, { "epoch": 0.8452465739912018, "learning_rate": 7.211516095266403e-06, "loss": 2.761361083984375, "step": 700500 }, { "epoch": 0.8453672373136846, "learning_rate": 7.211112259798665e-06, "loss": 2.7568505859375, "step": 700600 }, { "epoch": 0.8454879006361672, "learning_rate": 7.210708424330926e-06, "loss": 2.7646929931640627, "step": 700700 }, { "epoch": 0.8456085639586499, "learning_rate": 7.210304588863187e-06, "loss": 2.741496887207031, "step": 700800 }, { "epoch": 0.8457292272811325, "learning_rate": 7.209900753395449e-06, "loss": 2.72297119140625, "step": 700900 }, { "epoch": 0.8458498906036153, "learning_rate": 7.209496917927711e-06, "loss": 2.752399597167969, "step": 701000 }, { "epoch": 0.845970553926098, "learning_rate": 7.209093082459972e-06, "loss": 2.7268942260742186, "step": 701100 }, { "epoch": 0.8460912172485806, "learning_rate": 7.208689246992234e-06, "loss": 2.761585693359375, "step": 701200 }, { "epoch": 0.8462118805710633, "learning_rate": 7.208285411524496e-06, "loss": 2.763692626953125, "step": 701300 }, { "epoch": 0.846332543893546, "learning_rate": 7.207881576056758e-06, "loss": 2.759352111816406, "step": 701400 }, { "epoch": 0.8464532072160287, "learning_rate": 7.207477740589018e-06, "loss": 2.7340435791015625, "step": 701500 }, { "epoch": 0.8465738705385114, "learning_rate": 7.20707390512128e-06, "loss": 2.771798400878906, "step": 701600 }, { "epoch": 0.846694533860994, "learning_rate": 7.2066700696535415e-06, "loss": 2.7612728881835937, "step": 701700 }, { "epoch": 0.8468151971834768, "learning_rate": 7.2062662341858035e-06, "loss": 2.742584228515625, "step": 701800 }, { "epoch": 0.8469358605059594, "learning_rate": 7.2058623987180655e-06, "loss": 2.735779113769531, "step": 701900 }, { "epoch": 0.8470565238284421, "learning_rate": 7.2054585632503275e-06, "loss": 2.717684020996094, "step": 702000 }, { "epoch": 0.8471771871509248, "learning_rate": 7.205054727782589e-06, "loss": 2.7524249267578127, "step": 702100 }, { "epoch": 0.8472978504734074, "learning_rate": 7.204650892314851e-06, "loss": 2.7912030029296875, "step": 702200 }, { "epoch": 0.8474185137958902, "learning_rate": 7.204247056847111e-06, "loss": 2.7568463134765624, "step": 702300 }, { "epoch": 0.8475391771183728, "learning_rate": 7.203843221379373e-06, "loss": 2.742562255859375, "step": 702400 }, { "epoch": 0.8476598404408555, "learning_rate": 7.203439385911635e-06, "loss": 2.7338986206054687, "step": 702500 }, { "epoch": 0.8477805037633382, "learning_rate": 7.203035550443897e-06, "loss": 2.7584689331054686, "step": 702600 }, { "epoch": 0.8479011670858209, "learning_rate": 7.202631714976158e-06, "loss": 2.761337890625, "step": 702700 }, { "epoch": 0.8480218304083036, "learning_rate": 7.20222787950842e-06, "loss": 2.7570785522460937, "step": 702800 }, { "epoch": 0.8481424937307862, "learning_rate": 7.201824044040682e-06, "loss": 2.759461669921875, "step": 702900 }, { "epoch": 0.8482631570532689, "learning_rate": 7.201420208572943e-06, "loss": 2.740189208984375, "step": 703000 }, { "epoch": 0.8483838203757517, "learning_rate": 7.201016373105204e-06, "loss": 2.7350228881835936, "step": 703100 }, { "epoch": 0.8485044836982343, "learning_rate": 7.200612537637466e-06, "loss": 2.747209167480469, "step": 703200 }, { "epoch": 0.848625147020717, "learning_rate": 7.200208702169727e-06, "loss": 2.770213928222656, "step": 703300 }, { "epoch": 0.8487458103431996, "learning_rate": 7.199804866701989e-06, "loss": 2.7480010986328125, "step": 703400 }, { "epoch": 0.8488664736656824, "learning_rate": 7.199401031234251e-06, "loss": 2.729515380859375, "step": 703500 }, { "epoch": 0.8489871369881651, "learning_rate": 7.198997195766512e-06, "loss": 2.7514968872070313, "step": 703600 }, { "epoch": 0.8491078003106477, "learning_rate": 7.198593360298774e-06, "loss": 2.787181396484375, "step": 703700 }, { "epoch": 0.8492284636331304, "learning_rate": 7.198189524831036e-06, "loss": 2.7567489624023436, "step": 703800 }, { "epoch": 0.849349126955613, "learning_rate": 7.197785689363297e-06, "loss": 2.7393313598632814, "step": 703900 }, { "epoch": 0.8494697902780958, "learning_rate": 7.197381853895559e-06, "loss": 2.7720135498046874, "step": 704000 }, { "epoch": 0.8495904536005785, "learning_rate": 7.196978018427821e-06, "loss": 2.76645751953125, "step": 704100 }, { "epoch": 0.8497111169230611, "learning_rate": 7.196574182960082e-06, "loss": 2.7568350219726563, "step": 704200 }, { "epoch": 0.8498317802455438, "learning_rate": 7.196170347492344e-06, "loss": 2.754114685058594, "step": 704300 }, { "epoch": 0.8499524435680265, "learning_rate": 7.195766512024606e-06, "loss": 2.7828915405273436, "step": 704400 }, { "epoch": 0.8500731068905092, "learning_rate": 7.195362676556868e-06, "loss": 2.76895751953125, "step": 704500 }, { "epoch": 0.8501937702129919, "learning_rate": 7.194958841089129e-06, "loss": 2.7466351318359377, "step": 704600 }, { "epoch": 0.8503144335354745, "learning_rate": 7.19455500562139e-06, "loss": 2.754508361816406, "step": 704700 }, { "epoch": 0.8504350968579573, "learning_rate": 7.194151170153651e-06, "loss": 2.7450051879882813, "step": 704800 }, { "epoch": 0.8505557601804399, "learning_rate": 7.193747334685913e-06, "loss": 2.7456875610351563, "step": 704900 }, { "epoch": 0.8506764235029226, "learning_rate": 7.193343499218175e-06, "loss": 2.779808349609375, "step": 705000 }, { "epoch": 0.8507970868254053, "learning_rate": 7.192939663750437e-06, "loss": 2.7399258422851562, "step": 705100 }, { "epoch": 0.850917750147888, "learning_rate": 7.192535828282698e-06, "loss": 2.7727099609375, "step": 705200 }, { "epoch": 0.8510384134703707, "learning_rate": 7.19213199281496e-06, "loss": 2.7663116455078125, "step": 705300 }, { "epoch": 0.8511590767928533, "learning_rate": 7.191728157347222e-06, "loss": 2.7588116455078127, "step": 705400 }, { "epoch": 0.851279740115336, "learning_rate": 7.191324321879483e-06, "loss": 2.7287109375, "step": 705500 }, { "epoch": 0.8514004034378188, "learning_rate": 7.1909204864117444e-06, "loss": 2.728892822265625, "step": 705600 }, { "epoch": 0.8515210667603014, "learning_rate": 7.1905166509440064e-06, "loss": 2.7715408325195314, "step": 705700 }, { "epoch": 0.8516417300827841, "learning_rate": 7.1901128154762676e-06, "loss": 2.739892883300781, "step": 705800 }, { "epoch": 0.8517623934052668, "learning_rate": 7.1897089800085295e-06, "loss": 2.750996398925781, "step": 705900 }, { "epoch": 0.8518830567277494, "learning_rate": 7.1893051445407915e-06, "loss": 2.738392333984375, "step": 706000 }, { "epoch": 0.8520037200502322, "learning_rate": 7.188901309073053e-06, "loss": 2.75764892578125, "step": 706100 }, { "epoch": 0.8521243833727148, "learning_rate": 7.188497473605315e-06, "loss": 2.7510452270507812, "step": 706200 }, { "epoch": 0.8522450466951975, "learning_rate": 7.188093638137577e-06, "loss": 2.7574835205078125, "step": 706300 }, { "epoch": 0.8523657100176802, "learning_rate": 7.187689802669837e-06, "loss": 2.7572174072265625, "step": 706400 }, { "epoch": 0.8524863733401629, "learning_rate": 7.187285967202099e-06, "loss": 2.7706378173828123, "step": 706500 }, { "epoch": 0.8526070366626456, "learning_rate": 7.186882131734361e-06, "loss": 2.7622296142578127, "step": 706600 }, { "epoch": 0.8527276999851282, "learning_rate": 7.186478296266622e-06, "loss": 2.74099365234375, "step": 706700 }, { "epoch": 0.8528483633076109, "learning_rate": 7.186074460798884e-06, "loss": 2.720220031738281, "step": 706800 }, { "epoch": 0.8529690266300937, "learning_rate": 7.185670625331146e-06, "loss": 2.75215576171875, "step": 706900 }, { "epoch": 0.8530896899525763, "learning_rate": 7.185266789863408e-06, "loss": 2.7263839721679686, "step": 707000 }, { "epoch": 0.853210353275059, "learning_rate": 7.184862954395669e-06, "loss": 2.7559783935546873, "step": 707100 }, { "epoch": 0.8533310165975416, "learning_rate": 7.18445911892793e-06, "loss": 2.7144232177734375, "step": 707200 }, { "epoch": 0.8534516799200244, "learning_rate": 7.184055283460191e-06, "loss": 2.773271179199219, "step": 707300 }, { "epoch": 0.8535723432425071, "learning_rate": 7.183651447992453e-06, "loss": 2.7693255615234373, "step": 707400 }, { "epoch": 0.8536930065649897, "learning_rate": 7.183247612524715e-06, "loss": 2.7593157958984373, "step": 707500 }, { "epoch": 0.8538136698874724, "learning_rate": 7.182843777056977e-06, "loss": 2.7662057495117187, "step": 707600 }, { "epoch": 0.853934333209955, "learning_rate": 7.1824399415892385e-06, "loss": 2.7554592895507812, "step": 707700 }, { "epoch": 0.8540549965324378, "learning_rate": 7.1820361061215004e-06, "loss": 2.7663064575195313, "step": 707800 }, { "epoch": 0.8541756598549205, "learning_rate": 7.181632270653762e-06, "loss": 2.722821044921875, "step": 707900 }, { "epoch": 0.8542963231774031, "learning_rate": 7.181228435186023e-06, "loss": 2.745648193359375, "step": 708000 }, { "epoch": 0.8544169864998858, "learning_rate": 7.180824599718285e-06, "loss": 2.73657958984375, "step": 708100 }, { "epoch": 0.8545376498223685, "learning_rate": 7.180420764250547e-06, "loss": 2.7559326171875, "step": 708200 }, { "epoch": 0.8546583131448512, "learning_rate": 7.180016928782808e-06, "loss": 2.7323992919921873, "step": 708300 }, { "epoch": 0.8547789764673339, "learning_rate": 7.17961309331507e-06, "loss": 2.7835382080078124, "step": 708400 }, { "epoch": 0.8548996397898165, "learning_rate": 7.179209257847332e-06, "loss": 2.7665277099609376, "step": 708500 }, { "epoch": 0.8550203031122993, "learning_rate": 7.178805422379593e-06, "loss": 2.7825445556640624, "step": 708600 }, { "epoch": 0.8551409664347819, "learning_rate": 7.178401586911855e-06, "loss": 2.7248361206054685, "step": 708700 }, { "epoch": 0.8552616297572646, "learning_rate": 7.177997751444116e-06, "loss": 2.74733154296875, "step": 708800 }, { "epoch": 0.8553822930797473, "learning_rate": 7.177593915976377e-06, "loss": 2.759459228515625, "step": 708900 }, { "epoch": 0.85550295640223, "learning_rate": 7.177190080508639e-06, "loss": 2.7485617065429686, "step": 709000 }, { "epoch": 0.8556236197247127, "learning_rate": 7.176786245040901e-06, "loss": 2.7674832153320312, "step": 709100 }, { "epoch": 0.8557442830471953, "learning_rate": 7.176382409573162e-06, "loss": 2.725174865722656, "step": 709200 }, { "epoch": 0.855864946369678, "learning_rate": 7.175978574105424e-06, "loss": 2.7582058715820312, "step": 709300 }, { "epoch": 0.8559856096921608, "learning_rate": 7.175574738637686e-06, "loss": 2.7534060668945313, "step": 709400 }, { "epoch": 0.8561062730146434, "learning_rate": 7.175170903169948e-06, "loss": 2.7385955810546876, "step": 709500 }, { "epoch": 0.8562269363371261, "learning_rate": 7.1747670677022085e-06, "loss": 2.7787591552734376, "step": 709600 }, { "epoch": 0.8563475996596087, "learning_rate": 7.1743632322344705e-06, "loss": 2.75330078125, "step": 709700 }, { "epoch": 0.8564682629820914, "learning_rate": 7.173959396766732e-06, "loss": 2.742421875, "step": 709800 }, { "epoch": 0.8565889263045742, "learning_rate": 7.173555561298994e-06, "loss": 2.73435546875, "step": 709900 }, { "epoch": 0.8567095896270568, "learning_rate": 7.173151725831256e-06, "loss": 2.749805603027344, "step": 710000 }, { "epoch": 0.8568302529495395, "learning_rate": 7.1727478903635176e-06, "loss": 2.7488973999023436, "step": 710100 }, { "epoch": 0.8569509162720221, "learning_rate": 7.172344054895779e-06, "loss": 2.748739929199219, "step": 710200 }, { "epoch": 0.8570715795945049, "learning_rate": 7.171940219428041e-06, "loss": 2.734100036621094, "step": 710300 }, { "epoch": 0.8571922429169876, "learning_rate": 7.171536383960303e-06, "loss": 2.745453186035156, "step": 710400 }, { "epoch": 0.8573129062394702, "learning_rate": 7.171132548492563e-06, "loss": 2.7523568725585936, "step": 710500 }, { "epoch": 0.8574335695619529, "learning_rate": 7.170728713024825e-06, "loss": 2.7299957275390625, "step": 710600 }, { "epoch": 0.8575542328844357, "learning_rate": 7.170324877557087e-06, "loss": 2.75388671875, "step": 710700 }, { "epoch": 0.8576748962069183, "learning_rate": 7.169921042089348e-06, "loss": 2.738289794921875, "step": 710800 }, { "epoch": 0.857795559529401, "learning_rate": 7.16951720662161e-06, "loss": 2.7618887329101565, "step": 710900 }, { "epoch": 0.8579162228518836, "learning_rate": 7.169113371153872e-06, "loss": 2.7549127197265624, "step": 711000 }, { "epoch": 0.8580368861743664, "learning_rate": 7.168709535686134e-06, "loss": 2.7405996704101563, "step": 711100 }, { "epoch": 0.8581575494968491, "learning_rate": 7.168305700218395e-06, "loss": 2.7535833740234374, "step": 711200 }, { "epoch": 0.8582782128193317, "learning_rate": 7.167901864750656e-06, "loss": 2.711210021972656, "step": 711300 }, { "epoch": 0.8583988761418144, "learning_rate": 7.167498029282917e-06, "loss": 2.7226312255859373, "step": 711400 }, { "epoch": 0.858519539464297, "learning_rate": 7.167094193815179e-06, "loss": 2.7308953857421874, "step": 711500 }, { "epoch": 0.8586402027867798, "learning_rate": 7.166690358347441e-06, "loss": 2.7484173583984375, "step": 711600 }, { "epoch": 0.8587608661092625, "learning_rate": 7.166286522879703e-06, "loss": 2.7637481689453125, "step": 711700 }, { "epoch": 0.8588815294317451, "learning_rate": 7.1658826874119645e-06, "loss": 2.7276507568359376, "step": 711800 }, { "epoch": 0.8590021927542278, "learning_rate": 7.1654788519442265e-06, "loss": 2.711622619628906, "step": 711900 }, { "epoch": 0.8591228560767105, "learning_rate": 7.1650750164764885e-06, "loss": 2.7432424926757815, "step": 712000 }, { "epoch": 0.8592435193991932, "learning_rate": 7.164671181008749e-06, "loss": 2.742309265136719, "step": 712100 }, { "epoch": 0.8593641827216759, "learning_rate": 7.164267345541011e-06, "loss": 2.733612060546875, "step": 712200 }, { "epoch": 0.8594848460441585, "learning_rate": 7.163863510073273e-06, "loss": 2.7543075561523436, "step": 712300 }, { "epoch": 0.8596055093666413, "learning_rate": 7.163459674605534e-06, "loss": 2.7235186767578123, "step": 712400 }, { "epoch": 0.8597261726891239, "learning_rate": 7.163055839137796e-06, "loss": 2.7509991455078127, "step": 712500 }, { "epoch": 0.8598468360116066, "learning_rate": 7.162652003670058e-06, "loss": 2.74455322265625, "step": 712600 }, { "epoch": 0.8599674993340893, "learning_rate": 7.162248168202319e-06, "loss": 2.749991149902344, "step": 712700 }, { "epoch": 0.860088162656572, "learning_rate": 7.161844332734581e-06, "loss": 2.744374084472656, "step": 712800 }, { "epoch": 0.8602088259790547, "learning_rate": 7.161440497266842e-06, "loss": 2.751786804199219, "step": 712900 }, { "epoch": 0.8603294893015373, "learning_rate": 7.161036661799103e-06, "loss": 2.744775695800781, "step": 713000 }, { "epoch": 0.86045015262402, "learning_rate": 7.160632826331365e-06, "loss": 2.731753234863281, "step": 713100 }, { "epoch": 0.8605708159465028, "learning_rate": 7.160228990863627e-06, "loss": 2.7628961181640626, "step": 713200 }, { "epoch": 0.8606914792689854, "learning_rate": 7.159825155395888e-06, "loss": 2.749023742675781, "step": 713300 }, { "epoch": 0.8608121425914681, "learning_rate": 7.15942131992815e-06, "loss": 2.745763244628906, "step": 713400 }, { "epoch": 0.8609328059139507, "learning_rate": 7.159017484460412e-06, "loss": 2.763033142089844, "step": 713500 }, { "epoch": 0.8610534692364334, "learning_rate": 7.158613648992674e-06, "loss": 2.7456985473632813, "step": 713600 }, { "epoch": 0.8611741325589162, "learning_rate": 7.1582098135249345e-06, "loss": 2.746715087890625, "step": 713700 }, { "epoch": 0.8612947958813988, "learning_rate": 7.1578059780571965e-06, "loss": 2.774205322265625, "step": 713800 }, { "epoch": 0.8614154592038815, "learning_rate": 7.157402142589458e-06, "loss": 2.7615338134765626, "step": 713900 }, { "epoch": 0.8615361225263641, "learning_rate": 7.15699830712172e-06, "loss": 2.7474932861328125, "step": 714000 }, { "epoch": 0.8616567858488469, "learning_rate": 7.156594471653982e-06, "loss": 2.7298092651367187, "step": 714100 }, { "epoch": 0.8617774491713296, "learning_rate": 7.156190636186244e-06, "loss": 2.7619708251953123, "step": 714200 }, { "epoch": 0.8618981124938122, "learning_rate": 7.155786800718505e-06, "loss": 2.7335028076171874, "step": 714300 }, { "epoch": 0.8620187758162949, "learning_rate": 7.155382965250767e-06, "loss": 2.757335205078125, "step": 714400 }, { "epoch": 0.8621394391387776, "learning_rate": 7.154979129783027e-06, "loss": 2.7551504516601564, "step": 714500 }, { "epoch": 0.8622601024612603, "learning_rate": 7.154575294315289e-06, "loss": 2.7472378540039064, "step": 714600 }, { "epoch": 0.862380765783743, "learning_rate": 7.154171458847551e-06, "loss": 2.7425286865234373, "step": 714700 }, { "epoch": 0.8625014291062256, "learning_rate": 7.153767623379813e-06, "loss": 2.7385983276367187, "step": 714800 }, { "epoch": 0.8626220924287084, "learning_rate": 7.153363787912074e-06, "loss": 2.7679537963867187, "step": 714900 }, { "epoch": 0.862742755751191, "learning_rate": 7.152959952444336e-06, "loss": 2.7354312133789063, "step": 715000 }, { "epoch": 0.8628634190736737, "learning_rate": 7.152556116976598e-06, "loss": 2.74020263671875, "step": 715100 }, { "epoch": 0.8629840823961564, "learning_rate": 7.152152281508859e-06, "loss": 2.741080627441406, "step": 715200 }, { "epoch": 0.863104745718639, "learning_rate": 7.15174844604112e-06, "loss": 2.7262567138671874, "step": 715300 }, { "epoch": 0.8632254090411218, "learning_rate": 7.151344610573382e-06, "loss": 2.755650634765625, "step": 715400 }, { "epoch": 0.8633460723636044, "learning_rate": 7.1509407751056434e-06, "loss": 2.7160546875, "step": 715500 }, { "epoch": 0.8634667356860871, "learning_rate": 7.150536939637905e-06, "loss": 2.7647164916992186, "step": 715600 }, { "epoch": 0.8635873990085698, "learning_rate": 7.150133104170167e-06, "loss": 2.7508428955078124, "step": 715700 }, { "epoch": 0.8637080623310525, "learning_rate": 7.1497292687024285e-06, "loss": 2.7408526611328123, "step": 715800 }, { "epoch": 0.8638287256535352, "learning_rate": 7.1493254332346905e-06, "loss": 2.7365994262695312, "step": 715900 }, { "epoch": 0.8639493889760179, "learning_rate": 7.1489215977669525e-06, "loss": 2.765014343261719, "step": 716000 }, { "epoch": 0.8640700522985005, "learning_rate": 7.1485177622992145e-06, "loss": 2.745838928222656, "step": 716100 }, { "epoch": 0.8641907156209833, "learning_rate": 7.148113926831475e-06, "loss": 2.7431427001953126, "step": 716200 }, { "epoch": 0.8643113789434659, "learning_rate": 7.147710091363737e-06, "loss": 2.7446990966796876, "step": 716300 }, { "epoch": 0.8644320422659486, "learning_rate": 7.147306255895998e-06, "loss": 2.7468972778320313, "step": 716400 }, { "epoch": 0.8645527055884313, "learning_rate": 7.14690242042826e-06, "loss": 2.7713021850585937, "step": 716500 }, { "epoch": 0.864673368910914, "learning_rate": 7.146498584960522e-06, "loss": 2.74315185546875, "step": 716600 }, { "epoch": 0.8647940322333967, "learning_rate": 7.146094749492784e-06, "loss": 2.757685241699219, "step": 716700 }, { "epoch": 0.8649146955558793, "learning_rate": 7.145690914025045e-06, "loss": 2.74128173828125, "step": 716800 }, { "epoch": 0.865035358878362, "learning_rate": 7.145287078557307e-06, "loss": 2.7546420288085938, "step": 716900 }, { "epoch": 0.8651560222008448, "learning_rate": 7.144883243089567e-06, "loss": 2.770912780761719, "step": 717000 }, { "epoch": 0.8652766855233274, "learning_rate": 7.144479407621829e-06, "loss": 2.746339111328125, "step": 717100 }, { "epoch": 0.8653973488458101, "learning_rate": 7.144075572154091e-06, "loss": 2.737349548339844, "step": 717200 }, { "epoch": 0.8655180121682927, "learning_rate": 7.143671736686353e-06, "loss": 2.7293496704101563, "step": 717300 }, { "epoch": 0.8656386754907754, "learning_rate": 7.143267901218614e-06, "loss": 2.7399862670898436, "step": 717400 }, { "epoch": 0.8657593388132582, "learning_rate": 7.142864065750876e-06, "loss": 2.734954528808594, "step": 717500 }, { "epoch": 0.8658800021357408, "learning_rate": 7.142460230283138e-06, "loss": 2.7651708984375, "step": 717600 }, { "epoch": 0.8660006654582235, "learning_rate": 7.1420563948153994e-06, "loss": 2.7267083740234375, "step": 717700 }, { "epoch": 0.8661213287807061, "learning_rate": 7.1416525593476606e-06, "loss": 2.7249285888671877, "step": 717800 }, { "epoch": 0.8662419921031889, "learning_rate": 7.1412487238799225e-06, "loss": 2.7328753662109375, "step": 717900 }, { "epoch": 0.8663626554256716, "learning_rate": 7.140844888412184e-06, "loss": 2.734349670410156, "step": 718000 }, { "epoch": 0.8664833187481542, "learning_rate": 7.140441052944446e-06, "loss": 2.7516940307617186, "step": 718100 }, { "epoch": 0.8666039820706369, "learning_rate": 7.140037217476708e-06, "loss": 2.7468798828125, "step": 718200 }, { "epoch": 0.8667246453931196, "learning_rate": 7.139633382008969e-06, "loss": 2.74196044921875, "step": 718300 }, { "epoch": 0.8668453087156023, "learning_rate": 7.139229546541231e-06, "loss": 2.747171630859375, "step": 718400 }, { "epoch": 0.866965972038085, "learning_rate": 7.138825711073493e-06, "loss": 2.7543389892578123, "step": 718500 }, { "epoch": 0.8670866353605676, "learning_rate": 7.138421875605753e-06, "loss": 2.7472442626953124, "step": 718600 }, { "epoch": 0.8672072986830504, "learning_rate": 7.138018040138015e-06, "loss": 2.71944091796875, "step": 718700 }, { "epoch": 0.867327962005533, "learning_rate": 7.137614204670277e-06, "loss": 2.750362548828125, "step": 718800 }, { "epoch": 0.8674486253280157, "learning_rate": 7.137210369202538e-06, "loss": 2.734419860839844, "step": 718900 }, { "epoch": 0.8675692886504984, "learning_rate": 7.1368065337348e-06, "loss": 2.7601531982421874, "step": 719000 }, { "epoch": 0.867689951972981, "learning_rate": 7.136402698267062e-06, "loss": 2.7632586669921877, "step": 719100 }, { "epoch": 0.8678106152954638, "learning_rate": 7.135998862799324e-06, "loss": 2.755637512207031, "step": 719200 }, { "epoch": 0.8679312786179464, "learning_rate": 7.135595027331585e-06, "loss": 2.7303326416015623, "step": 719300 }, { "epoch": 0.8680519419404291, "learning_rate": 7.135191191863846e-06, "loss": 2.7492831420898436, "step": 719400 }, { "epoch": 0.8681726052629118, "learning_rate": 7.1347873563961075e-06, "loss": 2.75053955078125, "step": 719500 }, { "epoch": 0.8682932685853945, "learning_rate": 7.1343835209283695e-06, "loss": 2.7334869384765623, "step": 719600 }, { "epoch": 0.8684139319078772, "learning_rate": 7.1339796854606315e-06, "loss": 2.751102294921875, "step": 719700 }, { "epoch": 0.8685345952303598, "learning_rate": 7.1335758499928934e-06, "loss": 2.7191317749023436, "step": 719800 }, { "epoch": 0.8686552585528425, "learning_rate": 7.1331720145251546e-06, "loss": 2.7013043212890624, "step": 719900 }, { "epoch": 0.8687759218753253, "learning_rate": 7.1327681790574166e-06, "loss": 2.7597579956054688, "step": 720000 }, { "epoch": 0.8688965851978079, "learning_rate": 7.1323643435896785e-06, "loss": 2.7323822021484374, "step": 720100 }, { "epoch": 0.8690172485202906, "learning_rate": 7.131960508121939e-06, "loss": 2.7413070678710936, "step": 720200 }, { "epoch": 0.8691379118427732, "learning_rate": 7.131556672654201e-06, "loss": 2.73740234375, "step": 720300 }, { "epoch": 0.869258575165256, "learning_rate": 7.131152837186463e-06, "loss": 2.731237487792969, "step": 720400 }, { "epoch": 0.8693792384877387, "learning_rate": 7.130749001718724e-06, "loss": 2.7377325439453126, "step": 720500 }, { "epoch": 0.8694999018102213, "learning_rate": 7.130345166250986e-06, "loss": 2.75404296875, "step": 720600 }, { "epoch": 0.869620565132704, "learning_rate": 7.129941330783248e-06, "loss": 2.741457214355469, "step": 720700 }, { "epoch": 0.8697412284551866, "learning_rate": 7.129537495315509e-06, "loss": 2.7357058715820313, "step": 720800 }, { "epoch": 0.8698618917776694, "learning_rate": 7.129133659847771e-06, "loss": 2.762898254394531, "step": 720900 }, { "epoch": 0.8699825551001521, "learning_rate": 7.128729824380033e-06, "loss": 2.727400207519531, "step": 721000 }, { "epoch": 0.8701032184226347, "learning_rate": 7.128325988912293e-06, "loss": 2.7526950073242187, "step": 721100 }, { "epoch": 0.8702238817451174, "learning_rate": 7.127922153444555e-06, "loss": 2.7293804931640624, "step": 721200 }, { "epoch": 0.8703445450676002, "learning_rate": 7.127518317976817e-06, "loss": 2.7467416381835936, "step": 721300 }, { "epoch": 0.8704652083900828, "learning_rate": 7.127114482509078e-06, "loss": 2.731553039550781, "step": 721400 }, { "epoch": 0.8705858717125655, "learning_rate": 7.12671064704134e-06, "loss": 2.720465087890625, "step": 721500 }, { "epoch": 0.8707065350350481, "learning_rate": 7.126306811573602e-06, "loss": 2.74106201171875, "step": 721600 }, { "epoch": 0.8708271983575309, "learning_rate": 7.125902976105864e-06, "loss": 2.7291665649414063, "step": 721700 }, { "epoch": 0.8709478616800136, "learning_rate": 7.1254991406381255e-06, "loss": 2.7402203369140623, "step": 721800 }, { "epoch": 0.8710685250024962, "learning_rate": 7.125095305170387e-06, "loss": 2.7421701049804685, "step": 721900 }, { "epoch": 0.8711891883249789, "learning_rate": 7.124691469702648e-06, "loss": 2.726976318359375, "step": 722000 }, { "epoch": 0.8713098516474616, "learning_rate": 7.12428763423491e-06, "loss": 2.7228878784179686, "step": 722100 }, { "epoch": 0.8714305149699443, "learning_rate": 7.123883798767172e-06, "loss": 2.74001953125, "step": 722200 }, { "epoch": 0.871551178292427, "learning_rate": 7.123479963299434e-06, "loss": 2.730009765625, "step": 722300 }, { "epoch": 0.8716718416149096, "learning_rate": 7.123076127831695e-06, "loss": 2.7399935913085938, "step": 722400 }, { "epoch": 0.8717925049373924, "learning_rate": 7.122672292363957e-06, "loss": 2.7469906616210937, "step": 722500 }, { "epoch": 0.871913168259875, "learning_rate": 7.122268456896219e-06, "loss": 2.7371044921875, "step": 722600 }, { "epoch": 0.8720338315823577, "learning_rate": 7.121864621428479e-06, "loss": 2.751040344238281, "step": 722700 }, { "epoch": 0.8721544949048404, "learning_rate": 7.121460785960741e-06, "loss": 2.7153976440429686, "step": 722800 }, { "epoch": 0.872275158227323, "learning_rate": 7.121056950493003e-06, "loss": 2.7663784790039063, "step": 722900 }, { "epoch": 0.8723958215498058, "learning_rate": 7.120653115025264e-06, "loss": 2.7534466552734376, "step": 723000 }, { "epoch": 0.8725164848722884, "learning_rate": 7.120249279557526e-06, "loss": 2.7529193115234376, "step": 723100 }, { "epoch": 0.8726371481947711, "learning_rate": 7.119845444089788e-06, "loss": 2.7304791259765624, "step": 723200 }, { "epoch": 0.8727578115172538, "learning_rate": 7.119441608622049e-06, "loss": 2.738200378417969, "step": 723300 }, { "epoch": 0.8728784748397365, "learning_rate": 7.119037773154311e-06, "loss": 2.7223223876953124, "step": 723400 }, { "epoch": 0.8729991381622192, "learning_rate": 7.118633937686572e-06, "loss": 2.7443331909179687, "step": 723500 }, { "epoch": 0.8731198014847018, "learning_rate": 7.1182301022188335e-06, "loss": 2.7387176513671876, "step": 723600 }, { "epoch": 0.8732404648071845, "learning_rate": 7.1178262667510955e-06, "loss": 2.751534729003906, "step": 723700 }, { "epoch": 0.8733611281296673, "learning_rate": 7.1174224312833575e-06, "loss": 2.7623245239257814, "step": 723800 }, { "epoch": 0.8734817914521499, "learning_rate": 7.117018595815619e-06, "loss": 2.7401214599609376, "step": 723900 }, { "epoch": 0.8736024547746326, "learning_rate": 7.116614760347881e-06, "loss": 2.7233721923828127, "step": 724000 }, { "epoch": 0.8737231180971152, "learning_rate": 7.116210924880143e-06, "loss": 2.742966613769531, "step": 724100 }, { "epoch": 0.873843781419598, "learning_rate": 7.1158070894124046e-06, "loss": 2.7220977783203124, "step": 724200 }, { "epoch": 0.8739644447420807, "learning_rate": 7.115403253944665e-06, "loss": 2.722117614746094, "step": 724300 }, { "epoch": 0.8740851080645633, "learning_rate": 7.114999418476927e-06, "loss": 2.722786560058594, "step": 724400 }, { "epoch": 0.874205771387046, "learning_rate": 7.114595583009188e-06, "loss": 2.7380490112304687, "step": 724500 }, { "epoch": 0.8743264347095286, "learning_rate": 7.11419174754145e-06, "loss": 2.718147888183594, "step": 724600 }, { "epoch": 0.8744470980320114, "learning_rate": 7.113787912073712e-06, "loss": 2.7039804077148437, "step": 724700 }, { "epoch": 0.8745677613544941, "learning_rate": 7.113384076605974e-06, "loss": 2.7432684326171874, "step": 724800 }, { "epoch": 0.8746884246769767, "learning_rate": 7.112980241138235e-06, "loss": 2.751463623046875, "step": 724900 }, { "epoch": 0.8748090879994594, "learning_rate": 7.112576405670497e-06, "loss": 2.7284161376953127, "step": 725000 }, { "epoch": 0.8749297513219421, "learning_rate": 7.112172570202757e-06, "loss": 2.7394534301757814, "step": 725100 }, { "epoch": 0.8750504146444248, "learning_rate": 7.111768734735019e-06, "loss": 2.7583248901367186, "step": 725200 }, { "epoch": 0.8751710779669075, "learning_rate": 7.111364899267281e-06, "loss": 2.7719354248046875, "step": 725300 }, { "epoch": 0.8752917412893901, "learning_rate": 7.110961063799543e-06, "loss": 2.7420037841796874, "step": 725400 }, { "epoch": 0.8754124046118729, "learning_rate": 7.110557228331804e-06, "loss": 2.7500125122070314, "step": 725500 }, { "epoch": 0.8755330679343555, "learning_rate": 7.110153392864066e-06, "loss": 2.747250671386719, "step": 725600 }, { "epoch": 0.8756537312568382, "learning_rate": 7.109749557396328e-06, "loss": 2.7216561889648436, "step": 725700 }, { "epoch": 0.8757743945793209, "learning_rate": 7.10934572192859e-06, "loss": 2.710088195800781, "step": 725800 }, { "epoch": 0.8758950579018036, "learning_rate": 7.1089418864608515e-06, "loss": 2.769359436035156, "step": 725900 }, { "epoch": 0.8760157212242863, "learning_rate": 7.108538050993113e-06, "loss": 2.7085470581054687, "step": 726000 }, { "epoch": 0.8761363845467689, "learning_rate": 7.108134215525374e-06, "loss": 2.757945861816406, "step": 726100 }, { "epoch": 0.8762570478692516, "learning_rate": 7.107730380057636e-06, "loss": 2.7416485595703124, "step": 726200 }, { "epoch": 0.8763777111917344, "learning_rate": 7.107326544589898e-06, "loss": 2.748413391113281, "step": 726300 }, { "epoch": 0.876498374514217, "learning_rate": 7.10692270912216e-06, "loss": 2.7397756958007813, "step": 726400 }, { "epoch": 0.8766190378366997, "learning_rate": 7.106518873654421e-06, "loss": 2.7575885009765626, "step": 726500 }, { "epoch": 0.8767397011591824, "learning_rate": 7.106115038186683e-06, "loss": 2.7148733520507813, "step": 726600 }, { "epoch": 0.876860364481665, "learning_rate": 7.105711202718945e-06, "loss": 2.7477838134765626, "step": 726700 }, { "epoch": 0.8769810278041478, "learning_rate": 7.105307367251205e-06, "loss": 2.7526788330078125, "step": 726800 }, { "epoch": 0.8771016911266304, "learning_rate": 7.104903531783467e-06, "loss": 2.718369140625, "step": 726900 }, { "epoch": 0.8772223544491131, "learning_rate": 7.104499696315729e-06, "loss": 2.7524481201171875, "step": 727000 }, { "epoch": 0.8773430177715958, "learning_rate": 7.10409586084799e-06, "loss": 2.7475070190429687, "step": 727100 }, { "epoch": 0.8774636810940785, "learning_rate": 7.103692025380252e-06, "loss": 2.7298004150390627, "step": 727200 }, { "epoch": 0.8775843444165612, "learning_rate": 7.103288189912514e-06, "loss": 2.7433599853515624, "step": 727300 }, { "epoch": 0.8777050077390438, "learning_rate": 7.102884354444775e-06, "loss": 2.7073684692382813, "step": 727400 }, { "epoch": 0.8778256710615265, "learning_rate": 7.102480518977037e-06, "loss": 2.7142562866210938, "step": 727500 }, { "epoch": 0.8779463343840093, "learning_rate": 7.102076683509298e-06, "loss": 2.7750311279296875, "step": 727600 }, { "epoch": 0.8780669977064919, "learning_rate": 7.1016728480415596e-06, "loss": 2.7266168212890625, "step": 727700 }, { "epoch": 0.8781876610289746, "learning_rate": 7.1012690125738215e-06, "loss": 2.7208056640625, "step": 727800 }, { "epoch": 0.8783083243514572, "learning_rate": 7.1008651771060835e-06, "loss": 2.7392486572265624, "step": 727900 }, { "epoch": 0.87842898767394, "learning_rate": 7.100461341638345e-06, "loss": 2.762337951660156, "step": 728000 }, { "epoch": 0.8785496509964227, "learning_rate": 7.100057506170607e-06, "loss": 2.722068176269531, "step": 728100 }, { "epoch": 0.8786703143189053, "learning_rate": 7.099653670702869e-06, "loss": 2.73170654296875, "step": 728200 }, { "epoch": 0.878790977641388, "learning_rate": 7.099249835235131e-06, "loss": 2.7332476806640624, "step": 728300 }, { "epoch": 0.8789116409638706, "learning_rate": 7.098845999767391e-06, "loss": 2.738536376953125, "step": 728400 }, { "epoch": 0.8790323042863534, "learning_rate": 7.098442164299653e-06, "loss": 2.7710955810546873, "step": 728500 }, { "epoch": 0.8791529676088361, "learning_rate": 7.098038328831914e-06, "loss": 2.735881652832031, "step": 728600 }, { "epoch": 0.8792736309313187, "learning_rate": 7.097634493364176e-06, "loss": 2.7565213012695313, "step": 728700 }, { "epoch": 0.8793942942538014, "learning_rate": 7.097230657896438e-06, "loss": 2.73095947265625, "step": 728800 }, { "epoch": 0.8795149575762841, "learning_rate": 7.0968268224287e-06, "loss": 2.7409622192382814, "step": 728900 }, { "epoch": 0.8796356208987668, "learning_rate": 7.096422986960961e-06, "loss": 2.740140075683594, "step": 729000 }, { "epoch": 0.8797562842212495, "learning_rate": 7.096019151493223e-06, "loss": 2.7190701293945314, "step": 729100 }, { "epoch": 0.8798769475437321, "learning_rate": 7.095615316025483e-06, "loss": 2.7191653442382813, "step": 729200 }, { "epoch": 0.8799976108662149, "learning_rate": 7.095211480557745e-06, "loss": 2.7350674438476563, "step": 729300 }, { "epoch": 0.8801182741886975, "learning_rate": 7.094807645090007e-06, "loss": 2.7357754516601562, "step": 729400 }, { "epoch": 0.8802389375111802, "learning_rate": 7.094403809622269e-06, "loss": 2.7274420166015627, "step": 729500 }, { "epoch": 0.8803596008336629, "learning_rate": 7.0939999741545304e-06, "loss": 2.738597412109375, "step": 729600 }, { "epoch": 0.8804802641561456, "learning_rate": 7.0935961386867924e-06, "loss": 2.7043511962890623, "step": 729700 }, { "epoch": 0.8806009274786283, "learning_rate": 7.093192303219054e-06, "loss": 2.740457763671875, "step": 729800 }, { "epoch": 0.8807215908011109, "learning_rate": 7.0927884677513155e-06, "loss": 2.736832580566406, "step": 729900 }, { "epoch": 0.8808422541235936, "learning_rate": 7.092384632283577e-06, "loss": 2.729727478027344, "step": 730000 }, { "epoch": 0.8809629174460764, "learning_rate": 7.091980796815839e-06, "loss": 2.7417007446289063, "step": 730100 }, { "epoch": 0.881083580768559, "learning_rate": 7.0915769613481e-06, "loss": 2.720724792480469, "step": 730200 }, { "epoch": 0.8812042440910417, "learning_rate": 7.091173125880362e-06, "loss": 2.7023855590820314, "step": 730300 }, { "epoch": 0.8813249074135243, "learning_rate": 7.090769290412624e-06, "loss": 2.7165963745117185, "step": 730400 }, { "epoch": 0.881445570736007, "learning_rate": 7.090365454944885e-06, "loss": 2.7342123413085937, "step": 730500 }, { "epoch": 0.8815662340584898, "learning_rate": 7.089961619477147e-06, "loss": 2.7447747802734375, "step": 730600 }, { "epoch": 0.8816868973809724, "learning_rate": 7.089557784009409e-06, "loss": 2.7240731811523435, "step": 730700 }, { "epoch": 0.8818075607034551, "learning_rate": 7.089153948541671e-06, "loss": 2.751165466308594, "step": 730800 }, { "epoch": 0.8819282240259377, "learning_rate": 7.088750113073931e-06, "loss": 2.7319085693359373, "step": 730900 }, { "epoch": 0.8820488873484205, "learning_rate": 7.088346277606193e-06, "loss": 2.727286071777344, "step": 731000 }, { "epoch": 0.8821695506709032, "learning_rate": 7.087942442138454e-06, "loss": 2.7234710693359374, "step": 731100 }, { "epoch": 0.8822902139933858, "learning_rate": 7.087538606670716e-06, "loss": 2.713250732421875, "step": 731200 }, { "epoch": 0.8824108773158685, "learning_rate": 7.087134771202978e-06, "loss": 2.7090606689453125, "step": 731300 }, { "epoch": 0.8825315406383512, "learning_rate": 7.08673093573524e-06, "loss": 2.739396667480469, "step": 731400 }, { "epoch": 0.8826522039608339, "learning_rate": 7.086327100267501e-06, "loss": 2.742340393066406, "step": 731500 }, { "epoch": 0.8827728672833166, "learning_rate": 7.085923264799763e-06, "loss": 2.715809326171875, "step": 731600 }, { "epoch": 0.8828935306057992, "learning_rate": 7.085519429332024e-06, "loss": 2.74200439453125, "step": 731700 }, { "epoch": 0.883014193928282, "learning_rate": 7.085115593864286e-06, "loss": 2.745321044921875, "step": 731800 }, { "epoch": 0.8831348572507647, "learning_rate": 7.0847117583965476e-06, "loss": 2.738373107910156, "step": 731900 }, { "epoch": 0.8832555205732473, "learning_rate": 7.0843079229288096e-06, "loss": 2.7407760620117188, "step": 732000 }, { "epoch": 0.88337618389573, "learning_rate": 7.083904087461071e-06, "loss": 2.7285922241210936, "step": 732100 }, { "epoch": 0.8834968472182126, "learning_rate": 7.083500251993333e-06, "loss": 2.712127380371094, "step": 732200 }, { "epoch": 0.8836175105406954, "learning_rate": 7.083096416525595e-06, "loss": 2.7188595581054686, "step": 732300 }, { "epoch": 0.8837381738631781, "learning_rate": 7.082692581057856e-06, "loss": 2.745901794433594, "step": 732400 }, { "epoch": 0.8838588371856607, "learning_rate": 7.082288745590117e-06, "loss": 2.733869934082031, "step": 732500 }, { "epoch": 0.8839795005081434, "learning_rate": 7.081884910122379e-06, "loss": 2.7473135375976563, "step": 732600 }, { "epoch": 0.8841001638306261, "learning_rate": 7.08148107465464e-06, "loss": 2.7492916870117186, "step": 732700 }, { "epoch": 0.8842208271531088, "learning_rate": 7.081077239186902e-06, "loss": 2.7530865478515625, "step": 732800 }, { "epoch": 0.8843414904755915, "learning_rate": 7.080673403719164e-06, "loss": 2.750387878417969, "step": 732900 }, { "epoch": 0.8844621537980741, "learning_rate": 7.080269568251425e-06, "loss": 2.7354171752929686, "step": 733000 }, { "epoch": 0.8845828171205569, "learning_rate": 7.079865732783687e-06, "loss": 2.7391607666015627, "step": 733100 }, { "epoch": 0.8847034804430395, "learning_rate": 7.079461897315949e-06, "loss": 2.7047134399414063, "step": 733200 }, { "epoch": 0.8848241437655222, "learning_rate": 7.079058061848209e-06, "loss": 2.7133523559570314, "step": 733300 }, { "epoch": 0.8849448070880049, "learning_rate": 7.078654226380471e-06, "loss": 2.7188739013671874, "step": 733400 }, { "epoch": 0.8850654704104876, "learning_rate": 7.078250390912733e-06, "loss": 2.73158203125, "step": 733500 }, { "epoch": 0.8851861337329703, "learning_rate": 7.0778465554449945e-06, "loss": 2.714430236816406, "step": 733600 }, { "epoch": 0.8853067970554529, "learning_rate": 7.0774427199772565e-06, "loss": 2.7335888671875, "step": 733700 }, { "epoch": 0.8854274603779356, "learning_rate": 7.0770388845095185e-06, "loss": 2.7512872314453123, "step": 733800 }, { "epoch": 0.8855481237004184, "learning_rate": 7.0766350490417804e-06, "loss": 2.7435076904296873, "step": 733900 }, { "epoch": 0.885668787022901, "learning_rate": 7.076231213574042e-06, "loss": 2.737284851074219, "step": 734000 }, { "epoch": 0.8857894503453837, "learning_rate": 7.075827378106303e-06, "loss": 2.7308883666992188, "step": 734100 }, { "epoch": 0.8859101136678663, "learning_rate": 7.075423542638564e-06, "loss": 2.7234097290039063, "step": 734200 }, { "epoch": 0.886030776990349, "learning_rate": 7.075019707170826e-06, "loss": 2.745239562988281, "step": 734300 }, { "epoch": 0.8861514403128318, "learning_rate": 7.074615871703088e-06, "loss": 2.716042785644531, "step": 734400 }, { "epoch": 0.8862721036353144, "learning_rate": 7.07421203623535e-06, "loss": 2.755118713378906, "step": 734500 }, { "epoch": 0.8863927669577971, "learning_rate": 7.073808200767611e-06, "loss": 2.7056069946289063, "step": 734600 }, { "epoch": 0.8865134302802797, "learning_rate": 7.073404365299873e-06, "loss": 2.748909912109375, "step": 734700 }, { "epoch": 0.8866340936027625, "learning_rate": 7.073000529832135e-06, "loss": 2.744024353027344, "step": 734800 }, { "epoch": 0.8867547569252452, "learning_rate": 7.072596694364395e-06, "loss": 2.741895751953125, "step": 734900 }, { "epoch": 0.8868754202477278, "learning_rate": 7.072192858896657e-06, "loss": 2.7386053466796874, "step": 735000 }, { "epoch": 0.8869960835702105, "learning_rate": 7.071789023428919e-06, "loss": 2.7415911865234377, "step": 735100 }, { "epoch": 0.8871167468926932, "learning_rate": 7.07138518796118e-06, "loss": 2.71133544921875, "step": 735200 }, { "epoch": 0.8872374102151759, "learning_rate": 7.070981352493442e-06, "loss": 2.7137249755859374, "step": 735300 }, { "epoch": 0.8873580735376586, "learning_rate": 7.070577517025704e-06, "loss": 2.7215786743164063, "step": 735400 }, { "epoch": 0.8874787368601412, "learning_rate": 7.070173681557965e-06, "loss": 2.7454568481445314, "step": 735500 }, { "epoch": 0.887599400182624, "learning_rate": 7.069769846090227e-06, "loss": 2.7191583251953126, "step": 735600 }, { "epoch": 0.8877200635051066, "learning_rate": 7.0693660106224885e-06, "loss": 2.705452880859375, "step": 735700 }, { "epoch": 0.8878407268275893, "learning_rate": 7.06896217515475e-06, "loss": 2.7064398193359374, "step": 735800 }, { "epoch": 0.887961390150072, "learning_rate": 7.068558339687012e-06, "loss": 2.718194580078125, "step": 735900 }, { "epoch": 0.8880820534725546, "learning_rate": 7.068154504219274e-06, "loss": 2.7307830810546876, "step": 736000 }, { "epoch": 0.8882027167950374, "learning_rate": 7.067750668751535e-06, "loss": 2.7309039306640623, "step": 736100 }, { "epoch": 0.88832338011752, "learning_rate": 7.067346833283797e-06, "loss": 2.7098562622070315, "step": 736200 }, { "epoch": 0.8884440434400027, "learning_rate": 7.066942997816059e-06, "loss": 2.7430569458007814, "step": 736300 }, { "epoch": 0.8885647067624854, "learning_rate": 7.066539162348321e-06, "loss": 2.748873291015625, "step": 736400 }, { "epoch": 0.8886853700849681, "learning_rate": 7.066135326880582e-06, "loss": 2.720919494628906, "step": 736500 }, { "epoch": 0.8888060334074508, "learning_rate": 7.065731491412843e-06, "loss": 2.7128076171875, "step": 736600 }, { "epoch": 0.8889266967299335, "learning_rate": 7.065327655945104e-06, "loss": 2.7215841674804686, "step": 736700 }, { "epoch": 0.8890473600524161, "learning_rate": 7.064923820477366e-06, "loss": 2.7322537231445314, "step": 736800 }, { "epoch": 0.8891680233748989, "learning_rate": 7.064519985009628e-06, "loss": 2.693781433105469, "step": 736900 }, { "epoch": 0.8892886866973815, "learning_rate": 7.06411614954189e-06, "loss": 2.724798583984375, "step": 737000 }, { "epoch": 0.8894093500198642, "learning_rate": 7.063712314074151e-06, "loss": 2.7303778076171876, "step": 737100 }, { "epoch": 0.8895300133423469, "learning_rate": 7.063308478606413e-06, "loss": 2.7336956787109377, "step": 737200 }, { "epoch": 0.8896506766648296, "learning_rate": 7.062904643138675e-06, "loss": 2.733870544433594, "step": 737300 }, { "epoch": 0.8897713399873123, "learning_rate": 7.0625008076709354e-06, "loss": 2.719818115234375, "step": 737400 }, { "epoch": 0.8898920033097949, "learning_rate": 7.062096972203197e-06, "loss": 2.7107363891601564, "step": 737500 }, { "epoch": 0.8900126666322776, "learning_rate": 7.061693136735459e-06, "loss": 2.7413232421875, "step": 737600 }, { "epoch": 0.8901333299547604, "learning_rate": 7.0612893012677205e-06, "loss": 2.710152282714844, "step": 737700 }, { "epoch": 0.890253993277243, "learning_rate": 7.0608854657999825e-06, "loss": 2.7378070068359377, "step": 737800 }, { "epoch": 0.8903746565997257, "learning_rate": 7.0604816303322445e-06, "loss": 2.749425354003906, "step": 737900 }, { "epoch": 0.8904953199222083, "learning_rate": 7.0600777948645065e-06, "loss": 2.708382263183594, "step": 738000 }, { "epoch": 0.890615983244691, "learning_rate": 7.059673959396768e-06, "loss": 2.7359039306640627, "step": 738100 }, { "epoch": 0.8907366465671738, "learning_rate": 7.059270123929029e-06, "loss": 2.7318234252929687, "step": 738200 }, { "epoch": 0.8908573098896564, "learning_rate": 7.05886628846129e-06, "loss": 2.715947570800781, "step": 738300 }, { "epoch": 0.8909779732121391, "learning_rate": 7.058462452993552e-06, "loss": 2.7302822875976562, "step": 738400 }, { "epoch": 0.8910986365346217, "learning_rate": 7.058058617525814e-06, "loss": 2.7540798950195313, "step": 738500 }, { "epoch": 0.8912192998571045, "learning_rate": 7.057654782058076e-06, "loss": 2.7022030639648436, "step": 738600 }, { "epoch": 0.8913399631795872, "learning_rate": 7.057250946590337e-06, "loss": 2.73271484375, "step": 738700 }, { "epoch": 0.8914606265020698, "learning_rate": 7.056847111122599e-06, "loss": 2.725824279785156, "step": 738800 }, { "epoch": 0.8915812898245525, "learning_rate": 7.056443275654861e-06, "loss": 2.7351751708984375, "step": 738900 }, { "epoch": 0.8917019531470352, "learning_rate": 7.056039440187121e-06, "loss": 2.7426071166992188, "step": 739000 }, { "epoch": 0.8918226164695179, "learning_rate": 7.055635604719383e-06, "loss": 2.7087799072265626, "step": 739100 }, { "epoch": 0.8919432797920006, "learning_rate": 7.055231769251645e-06, "loss": 2.7549200439453125, "step": 739200 }, { "epoch": 0.8920639431144832, "learning_rate": 7.054827933783906e-06, "loss": 2.7025405883789064, "step": 739300 }, { "epoch": 0.892184606436966, "learning_rate": 7.054424098316168e-06, "loss": 2.71512451171875, "step": 739400 }, { "epoch": 0.8923052697594486, "learning_rate": 7.05402026284843e-06, "loss": 2.7437033081054687, "step": 739500 }, { "epoch": 0.8924259330819313, "learning_rate": 7.0536164273806914e-06, "loss": 2.7225714111328125, "step": 739600 }, { "epoch": 0.892546596404414, "learning_rate": 7.053212591912953e-06, "loss": 2.733736877441406, "step": 739700 }, { "epoch": 0.8926672597268966, "learning_rate": 7.0528087564452145e-06, "loss": 2.7534173583984374, "step": 739800 }, { "epoch": 0.8927879230493794, "learning_rate": 7.052404920977476e-06, "loss": 2.734855041503906, "step": 739900 }, { "epoch": 0.892908586371862, "learning_rate": 7.052001085509738e-06, "loss": 2.740697021484375, "step": 740000 }, { "epoch": 0.8930292496943447, "learning_rate": 7.051597250042e-06, "loss": 2.7092889404296874, "step": 740100 }, { "epoch": 0.8931499130168274, "learning_rate": 7.051193414574261e-06, "loss": 2.7255520629882812, "step": 740200 }, { "epoch": 0.8932705763393101, "learning_rate": 7.050789579106523e-06, "loss": 2.7272430419921876, "step": 740300 }, { "epoch": 0.8933912396617928, "learning_rate": 7.050385743638785e-06, "loss": 2.73778076171875, "step": 740400 }, { "epoch": 0.8935119029842754, "learning_rate": 7.049981908171047e-06, "loss": 2.7084820556640623, "step": 740500 }, { "epoch": 0.8936325663067581, "learning_rate": 7.049578072703307e-06, "loss": 2.709866638183594, "step": 740600 }, { "epoch": 0.8937532296292409, "learning_rate": 7.049174237235569e-06, "loss": 2.732705383300781, "step": 740700 }, { "epoch": 0.8938738929517235, "learning_rate": 7.04877040176783e-06, "loss": 2.735065612792969, "step": 740800 }, { "epoch": 0.8939945562742062, "learning_rate": 7.048366566300092e-06, "loss": 2.7316400146484376, "step": 740900 }, { "epoch": 0.8941152195966888, "learning_rate": 7.047962730832354e-06, "loss": 2.7328036499023436, "step": 741000 }, { "epoch": 0.8942358829191716, "learning_rate": 7.047558895364616e-06, "loss": 2.717243347167969, "step": 741100 }, { "epoch": 0.8943565462416543, "learning_rate": 7.047155059896877e-06, "loss": 2.748670654296875, "step": 741200 }, { "epoch": 0.8944772095641369, "learning_rate": 7.046751224429139e-06, "loss": 2.730111389160156, "step": 741300 }, { "epoch": 0.8945978728866196, "learning_rate": 7.046347388961401e-06, "loss": 2.7375213623046877, "step": 741400 }, { "epoch": 0.8947185362091022, "learning_rate": 7.0459435534936615e-06, "loss": 2.7348736572265624, "step": 741500 }, { "epoch": 0.894839199531585, "learning_rate": 7.0455397180259234e-06, "loss": 2.7266830444335937, "step": 741600 }, { "epoch": 0.8949598628540677, "learning_rate": 7.0451358825581854e-06, "loss": 2.7210342407226564, "step": 741700 }, { "epoch": 0.8950805261765503, "learning_rate": 7.0447320470904466e-06, "loss": 2.712923583984375, "step": 741800 }, { "epoch": 0.895201189499033, "learning_rate": 7.0443282116227086e-06, "loss": 2.7168063354492187, "step": 741900 }, { "epoch": 0.8953218528215158, "learning_rate": 7.0439243761549705e-06, "loss": 2.745323486328125, "step": 742000 }, { "epoch": 0.8954425161439984, "learning_rate": 7.043520540687232e-06, "loss": 2.729361572265625, "step": 742100 }, { "epoch": 0.8955631794664811, "learning_rate": 7.043116705219494e-06, "loss": 2.7249334716796874, "step": 742200 }, { "epoch": 0.8956838427889637, "learning_rate": 7.042712869751755e-06, "loss": 2.7297906494140625, "step": 742300 }, { "epoch": 0.8958045061114465, "learning_rate": 7.042309034284016e-06, "loss": 2.7410064697265626, "step": 742400 }, { "epoch": 0.8959251694339292, "learning_rate": 7.041905198816278e-06, "loss": 2.7229266357421875, "step": 742500 }, { "epoch": 0.8960458327564118, "learning_rate": 7.04150136334854e-06, "loss": 2.7508108520507815, "step": 742600 }, { "epoch": 0.8961664960788945, "learning_rate": 7.041097527880801e-06, "loss": 2.7371334838867187, "step": 742700 }, { "epoch": 0.8962871594013772, "learning_rate": 7.040693692413063e-06, "loss": 2.7199612426757813, "step": 742800 }, { "epoch": 0.8964078227238599, "learning_rate": 7.040289856945325e-06, "loss": 2.7309439086914065, "step": 742900 }, { "epoch": 0.8965284860463426, "learning_rate": 7.039886021477587e-06, "loss": 2.7434942626953127, "step": 743000 }, { "epoch": 0.8966491493688252, "learning_rate": 7.039482186009847e-06, "loss": 2.715146179199219, "step": 743100 }, { "epoch": 0.896769812691308, "learning_rate": 7.039078350542109e-06, "loss": 2.704852294921875, "step": 743200 }, { "epoch": 0.8968904760137906, "learning_rate": 7.03867451507437e-06, "loss": 2.725163879394531, "step": 743300 }, { "epoch": 0.8970111393362733, "learning_rate": 7.038270679606632e-06, "loss": 2.723072509765625, "step": 743400 }, { "epoch": 0.897131802658756, "learning_rate": 7.037866844138894e-06, "loss": 2.6917718505859374, "step": 743500 }, { "epoch": 0.8972524659812386, "learning_rate": 7.037463008671156e-06, "loss": 2.7169619750976564, "step": 743600 }, { "epoch": 0.8973731293037214, "learning_rate": 7.0370591732034175e-06, "loss": 2.7150286865234374, "step": 743700 }, { "epoch": 0.897493792626204, "learning_rate": 7.0366553377356794e-06, "loss": 2.719017333984375, "step": 743800 }, { "epoch": 0.8976144559486867, "learning_rate": 7.03625150226794e-06, "loss": 2.723973693847656, "step": 743900 }, { "epoch": 0.8977351192711694, "learning_rate": 7.035847666800202e-06, "loss": 2.6832806396484377, "step": 744000 }, { "epoch": 0.8978557825936521, "learning_rate": 7.035443831332464e-06, "loss": 2.721883544921875, "step": 744100 }, { "epoch": 0.8979764459161348, "learning_rate": 7.035039995864726e-06, "loss": 2.7390142822265626, "step": 744200 }, { "epoch": 0.8980971092386174, "learning_rate": 7.034636160396987e-06, "loss": 2.7354367065429686, "step": 744300 }, { "epoch": 0.8982177725611001, "learning_rate": 7.034232324929249e-06, "loss": 2.715270690917969, "step": 744400 }, { "epoch": 0.8983384358835829, "learning_rate": 7.033828489461511e-06, "loss": 2.7241973876953125, "step": 744500 }, { "epoch": 0.8984590992060655, "learning_rate": 7.033424653993772e-06, "loss": 2.7295037841796876, "step": 744600 }, { "epoch": 0.8985797625285482, "learning_rate": 7.033020818526033e-06, "loss": 2.7467135620117187, "step": 744700 }, { "epoch": 0.8987004258510308, "learning_rate": 7.032616983058295e-06, "loss": 2.7325469970703127, "step": 744800 }, { "epoch": 0.8988210891735136, "learning_rate": 7.032213147590556e-06, "loss": 2.725127868652344, "step": 744900 }, { "epoch": 0.8989417524959963, "learning_rate": 7.031809312122818e-06, "loss": 2.7171371459960936, "step": 745000 }, { "epoch": 0.8990624158184789, "learning_rate": 7.03140547665508e-06, "loss": 2.7441476440429686, "step": 745100 }, { "epoch": 0.8991830791409616, "learning_rate": 7.031001641187341e-06, "loss": 2.718975830078125, "step": 745200 }, { "epoch": 0.8993037424634442, "learning_rate": 7.030597805719603e-06, "loss": 2.742962646484375, "step": 745300 }, { "epoch": 0.899424405785927, "learning_rate": 7.030193970251865e-06, "loss": 2.7156326293945314, "step": 745400 }, { "epoch": 0.8995450691084097, "learning_rate": 7.0297901347841255e-06, "loss": 2.701527404785156, "step": 745500 }, { "epoch": 0.8996657324308923, "learning_rate": 7.0293862993163875e-06, "loss": 2.713634033203125, "step": 745600 }, { "epoch": 0.899786395753375, "learning_rate": 7.0289824638486495e-06, "loss": 2.730815124511719, "step": 745700 }, { "epoch": 0.8999070590758577, "learning_rate": 7.028578628380911e-06, "loss": 2.730887756347656, "step": 745800 }, { "epoch": 0.9000277223983404, "learning_rate": 7.028174792913173e-06, "loss": 2.724427490234375, "step": 745900 }, { "epoch": 0.9001483857208231, "learning_rate": 7.027770957445435e-06, "loss": 2.725099792480469, "step": 746000 }, { "epoch": 0.9002690490433057, "learning_rate": 7.0273671219776966e-06, "loss": 2.7605023193359375, "step": 746100 }, { "epoch": 0.9003897123657885, "learning_rate": 7.026963286509958e-06, "loss": 2.7150143432617186, "step": 746200 }, { "epoch": 0.9005103756882711, "learning_rate": 7.02655945104222e-06, "loss": 2.7164682006835936, "step": 746300 }, { "epoch": 0.9006310390107538, "learning_rate": 7.02615561557448e-06, "loss": 2.729403381347656, "step": 746400 }, { "epoch": 0.9007517023332365, "learning_rate": 7.025751780106742e-06, "loss": 2.7280404663085935, "step": 746500 }, { "epoch": 0.9008723656557192, "learning_rate": 7.025347944639004e-06, "loss": 2.7270477294921873, "step": 746600 }, { "epoch": 0.9009930289782019, "learning_rate": 7.024944109171266e-06, "loss": 2.717498474121094, "step": 746700 }, { "epoch": 0.9011136923006845, "learning_rate": 7.024540273703527e-06, "loss": 2.7400689697265626, "step": 746800 }, { "epoch": 0.9012343556231672, "learning_rate": 7.024136438235789e-06, "loss": 2.732668151855469, "step": 746900 }, { "epoch": 0.90135501894565, "learning_rate": 7.023732602768051e-06, "loss": 2.715328369140625, "step": 747000 }, { "epoch": 0.9014756822681326, "learning_rate": 7.023328767300312e-06, "loss": 2.7237518310546873, "step": 747100 }, { "epoch": 0.9015963455906153, "learning_rate": 7.022924931832573e-06, "loss": 2.706340026855469, "step": 747200 }, { "epoch": 0.901717008913098, "learning_rate": 7.022521096364835e-06, "loss": 2.72986572265625, "step": 747300 }, { "epoch": 0.9018376722355806, "learning_rate": 7.022117260897096e-06, "loss": 2.745135498046875, "step": 747400 }, { "epoch": 0.9019583355580634, "learning_rate": 7.021713425429358e-06, "loss": 2.7311337280273436, "step": 747500 }, { "epoch": 0.902078998880546, "learning_rate": 7.02130958996162e-06, "loss": 2.7418359375, "step": 747600 }, { "epoch": 0.9021996622030287, "learning_rate": 7.0209057544938815e-06, "loss": 2.703841247558594, "step": 747700 }, { "epoch": 0.9023203255255114, "learning_rate": 7.0205019190261435e-06, "loss": 2.718524169921875, "step": 747800 }, { "epoch": 0.9024409888479941, "learning_rate": 7.0200980835584055e-06, "loss": 2.731907958984375, "step": 747900 }, { "epoch": 0.9025616521704768, "learning_rate": 7.019694248090666e-06, "loss": 2.71821044921875, "step": 748000 }, { "epoch": 0.9026823154929594, "learning_rate": 7.019290412622928e-06, "loss": 2.7228350830078125, "step": 748100 }, { "epoch": 0.9028029788154421, "learning_rate": 7.01888657715519e-06, "loss": 2.723360900878906, "step": 748200 }, { "epoch": 0.9029236421379249, "learning_rate": 7.018482741687451e-06, "loss": 2.7175689697265626, "step": 748300 }, { "epoch": 0.9030443054604075, "learning_rate": 7.018078906219713e-06, "loss": 2.7196163940429687, "step": 748400 }, { "epoch": 0.9031649687828902, "learning_rate": 7.017675070751975e-06, "loss": 2.7180010986328127, "step": 748500 }, { "epoch": 0.9032856321053728, "learning_rate": 7.017271235284237e-06, "loss": 2.7507080078125, "step": 748600 }, { "epoch": 0.9034062954278556, "learning_rate": 7.016867399816498e-06, "loss": 2.7238140869140626, "step": 748700 }, { "epoch": 0.9035269587503383, "learning_rate": 7.016463564348759e-06, "loss": 2.7220233154296873, "step": 748800 }, { "epoch": 0.9036476220728209, "learning_rate": 7.01605972888102e-06, "loss": 2.7368045043945313, "step": 748900 }, { "epoch": 0.9037682853953036, "learning_rate": 7.015655893413282e-06, "loss": 2.7221585083007813, "step": 749000 }, { "epoch": 0.9038889487177862, "learning_rate": 7.015252057945544e-06, "loss": 2.712857360839844, "step": 749100 }, { "epoch": 0.904009612040269, "learning_rate": 7.014848222477806e-06, "loss": 2.731495056152344, "step": 749200 }, { "epoch": 0.9041302753627517, "learning_rate": 7.014444387010067e-06, "loss": 2.6801251220703124, "step": 749300 }, { "epoch": 0.9042509386852343, "learning_rate": 7.014040551542329e-06, "loss": 2.708482360839844, "step": 749400 }, { "epoch": 0.904371602007717, "learning_rate": 7.013636716074591e-06, "loss": 2.7209231567382814, "step": 749500 }, { "epoch": 0.9044922653301997, "learning_rate": 7.0132328806068516e-06, "loss": 2.7037344360351563, "step": 749600 }, { "epoch": 0.9046129286526824, "learning_rate": 7.0128290451391135e-06, "loss": 2.7255047607421874, "step": 749700 }, { "epoch": 0.9047335919751651, "learning_rate": 7.0124252096713755e-06, "loss": 2.7201861572265624, "step": 749800 }, { "epoch": 0.9048542552976477, "learning_rate": 7.012021374203637e-06, "loss": 2.7334674072265623, "step": 749900 }, { "epoch": 0.9049749186201305, "learning_rate": 7.011617538735899e-06, "loss": 2.701701354980469, "step": 750000 }, { "epoch": 0.9050955819426131, "learning_rate": 7.011213703268161e-06, "loss": 2.7371160888671877, "step": 750100 }, { "epoch": 0.9052162452650958, "learning_rate": 7.010809867800422e-06, "loss": 2.7254638671875, "step": 750200 }, { "epoch": 0.9053369085875785, "learning_rate": 7.010406032332684e-06, "loss": 2.713075866699219, "step": 750300 }, { "epoch": 0.9054575719100612, "learning_rate": 7.010002196864945e-06, "loss": 2.7333999633789063, "step": 750400 }, { "epoch": 0.9055782352325439, "learning_rate": 7.009598361397206e-06, "loss": 2.716353759765625, "step": 750500 }, { "epoch": 0.9056988985550265, "learning_rate": 7.009194525929468e-06, "loss": 2.7203439331054686, "step": 750600 }, { "epoch": 0.9058195618775092, "learning_rate": 7.00879069046173e-06, "loss": 2.738988952636719, "step": 750700 }, { "epoch": 0.905940225199992, "learning_rate": 7.008386854993991e-06, "loss": 2.7409710693359375, "step": 750800 }, { "epoch": 0.9060608885224746, "learning_rate": 7.007983019526253e-06, "loss": 2.719257507324219, "step": 750900 }, { "epoch": 0.9061815518449573, "learning_rate": 7.007579184058515e-06, "loss": 2.732732238769531, "step": 751000 }, { "epoch": 0.9063022151674399, "learning_rate": 7.007175348590777e-06, "loss": 2.740428466796875, "step": 751100 }, { "epoch": 0.9064228784899226, "learning_rate": 7.006771513123037e-06, "loss": 2.703509521484375, "step": 751200 }, { "epoch": 0.9065435418124054, "learning_rate": 7.006367677655299e-06, "loss": 2.7348568725585936, "step": 751300 }, { "epoch": 0.906664205134888, "learning_rate": 7.0059638421875605e-06, "loss": 2.6957693481445313, "step": 751400 }, { "epoch": 0.9067848684573707, "learning_rate": 7.0055600067198224e-06, "loss": 2.7042010498046873, "step": 751500 }, { "epoch": 0.9069055317798533, "learning_rate": 7.0051561712520844e-06, "loss": 2.7228546142578125, "step": 751600 }, { "epoch": 0.9070261951023361, "learning_rate": 7.004752335784346e-06, "loss": 2.7252740478515625, "step": 751700 }, { "epoch": 0.9071468584248188, "learning_rate": 7.0043485003166075e-06, "loss": 2.7023776245117186, "step": 751800 }, { "epoch": 0.9072675217473014, "learning_rate": 7.0039446648488695e-06, "loss": 2.7013726806640626, "step": 751900 }, { "epoch": 0.9073881850697841, "learning_rate": 7.0035408293811315e-06, "loss": 2.7249407958984375, "step": 752000 }, { "epoch": 0.9075088483922668, "learning_rate": 7.003136993913392e-06, "loss": 2.7058734130859374, "step": 752100 }, { "epoch": 0.9076295117147495, "learning_rate": 7.002733158445654e-06, "loss": 2.739010009765625, "step": 752200 }, { "epoch": 0.9077501750372322, "learning_rate": 7.002329322977916e-06, "loss": 2.7271142578125, "step": 752300 }, { "epoch": 0.9078708383597148, "learning_rate": 7.001925487510177e-06, "loss": 2.6901339721679687, "step": 752400 }, { "epoch": 0.9079915016821976, "learning_rate": 7.001521652042439e-06, "loss": 2.7174810791015624, "step": 752500 }, { "epoch": 0.9081121650046803, "learning_rate": 7.001117816574701e-06, "loss": 2.7409039306640626, "step": 752600 }, { "epoch": 0.9082328283271629, "learning_rate": 7.000713981106963e-06, "loss": 2.7397201538085936, "step": 752700 }, { "epoch": 0.9083534916496456, "learning_rate": 7.000310145639224e-06, "loss": 2.710599365234375, "step": 752800 }, { "epoch": 0.9084741549721282, "learning_rate": 6.999906310171485e-06, "loss": 2.7264013671875, "step": 752900 }, { "epoch": 0.908594818294611, "learning_rate": 6.999502474703746e-06, "loss": 2.7216943359375, "step": 753000 }, { "epoch": 0.9087154816170937, "learning_rate": 6.999098639236008e-06, "loss": 2.7107843017578124, "step": 753100 }, { "epoch": 0.9088361449395763, "learning_rate": 6.99869480376827e-06, "loss": 2.7430291748046876, "step": 753200 }, { "epoch": 0.908956808262059, "learning_rate": 6.998290968300532e-06, "loss": 2.735186767578125, "step": 753300 }, { "epoch": 0.9090774715845417, "learning_rate": 6.997887132832793e-06, "loss": 2.7256546020507812, "step": 753400 }, { "epoch": 0.9091981349070244, "learning_rate": 6.997483297365055e-06, "loss": 2.719635314941406, "step": 753500 }, { "epoch": 0.9093187982295071, "learning_rate": 6.997079461897317e-06, "loss": 2.724583740234375, "step": 753600 }, { "epoch": 0.9094394615519897, "learning_rate": 6.996675626429578e-06, "loss": 2.70271484375, "step": 753700 }, { "epoch": 0.9095601248744725, "learning_rate": 6.9962717909618396e-06, "loss": 2.7515304565429686, "step": 753800 }, { "epoch": 0.9096807881969551, "learning_rate": 6.9958679554941016e-06, "loss": 2.7265185546875, "step": 753900 }, { "epoch": 0.9098014515194378, "learning_rate": 6.995464120026363e-06, "loss": 2.7119000244140623, "step": 754000 }, { "epoch": 0.9099221148419205, "learning_rate": 6.995060284558625e-06, "loss": 2.728374328613281, "step": 754100 }, { "epoch": 0.9100427781644032, "learning_rate": 6.994656449090887e-06, "loss": 2.7213119506835937, "step": 754200 }, { "epoch": 0.9101634414868859, "learning_rate": 6.994252613623148e-06, "loss": 2.7191763305664063, "step": 754300 }, { "epoch": 0.9102841048093685, "learning_rate": 6.99384877815541e-06, "loss": 2.6843630981445314, "step": 754400 }, { "epoch": 0.9104047681318512, "learning_rate": 6.993444942687671e-06, "loss": 2.726817932128906, "step": 754500 }, { "epoch": 0.910525431454334, "learning_rate": 6.993041107219932e-06, "loss": 2.7228076171875, "step": 754600 }, { "epoch": 0.9106460947768166, "learning_rate": 6.992637271752194e-06, "loss": 2.7332470703125, "step": 754700 }, { "epoch": 0.9107667580992993, "learning_rate": 6.992233436284456e-06, "loss": 2.704501037597656, "step": 754800 }, { "epoch": 0.9108874214217819, "learning_rate": 6.991829600816717e-06, "loss": 2.7262496948242188, "step": 754900 }, { "epoch": 0.9110080847442646, "learning_rate": 6.991425765348979e-06, "loss": 2.7435516357421874, "step": 755000 }, { "epoch": 0.9111287480667474, "learning_rate": 6.991021929881241e-06, "loss": 2.7228741455078125, "step": 755100 }, { "epoch": 0.91124941138923, "learning_rate": 6.990618094413503e-06, "loss": 2.7264419555664063, "step": 755200 }, { "epoch": 0.9113700747117127, "learning_rate": 6.990214258945763e-06, "loss": 2.714402770996094, "step": 755300 }, { "epoch": 0.9114907380341953, "learning_rate": 6.989810423478025e-06, "loss": 2.7024462890625, "step": 755400 }, { "epoch": 0.9116114013566781, "learning_rate": 6.9894065880102865e-06, "loss": 2.7157928466796877, "step": 755500 }, { "epoch": 0.9117320646791608, "learning_rate": 6.9890027525425485e-06, "loss": 2.7170587158203126, "step": 755600 }, { "epoch": 0.9118527280016434, "learning_rate": 6.9885989170748105e-06, "loss": 2.7023019409179687, "step": 755700 }, { "epoch": 0.9119733913241261, "learning_rate": 6.9881950816070724e-06, "loss": 2.7180850219726564, "step": 755800 }, { "epoch": 0.9120940546466088, "learning_rate": 6.987791246139334e-06, "loss": 2.7026437377929686, "step": 755900 }, { "epoch": 0.9122147179690915, "learning_rate": 6.9873874106715956e-06, "loss": 2.7044512939453127, "step": 756000 }, { "epoch": 0.9123353812915742, "learning_rate": 6.986983575203856e-06, "loss": 2.7101593017578125, "step": 756100 }, { "epoch": 0.9124560446140568, "learning_rate": 6.986579739736118e-06, "loss": 2.7351699829101563, "step": 756200 }, { "epoch": 0.9125767079365396, "learning_rate": 6.98617590426838e-06, "loss": 2.7282696533203126, "step": 756300 }, { "epoch": 0.9126973712590222, "learning_rate": 6.985772068800642e-06, "loss": 2.717259521484375, "step": 756400 }, { "epoch": 0.9128180345815049, "learning_rate": 6.985368233332903e-06, "loss": 2.699613342285156, "step": 756500 }, { "epoch": 0.9129386979039876, "learning_rate": 6.984964397865165e-06, "loss": 2.714638977050781, "step": 756600 }, { "epoch": 0.9130593612264702, "learning_rate": 6.984560562397427e-06, "loss": 2.717453918457031, "step": 756700 }, { "epoch": 0.913180024548953, "learning_rate": 6.984156726929688e-06, "loss": 2.7215951538085936, "step": 756800 }, { "epoch": 0.9133006878714356, "learning_rate": 6.98375289146195e-06, "loss": 2.694805908203125, "step": 756900 }, { "epoch": 0.9134213511939183, "learning_rate": 6.983349055994211e-06, "loss": 2.718033752441406, "step": 757000 }, { "epoch": 0.913542014516401, "learning_rate": 6.982945220526472e-06, "loss": 2.712441711425781, "step": 757100 }, { "epoch": 0.9136626778388837, "learning_rate": 6.982541385058734e-06, "loss": 2.7206649780273438, "step": 757200 }, { "epoch": 0.9137833411613664, "learning_rate": 6.982137549590996e-06, "loss": 2.7138796997070314, "step": 757300 }, { "epoch": 0.913904004483849, "learning_rate": 6.981733714123257e-06, "loss": 2.7164752197265627, "step": 757400 }, { "epoch": 0.9140246678063317, "learning_rate": 6.981329878655519e-06, "loss": 2.7090032958984374, "step": 757500 }, { "epoch": 0.9141453311288145, "learning_rate": 6.980926043187781e-06, "loss": 2.702010498046875, "step": 757600 }, { "epoch": 0.9142659944512971, "learning_rate": 6.980522207720043e-06, "loss": 2.7365997314453123, "step": 757700 }, { "epoch": 0.9143866577737798, "learning_rate": 6.980118372252304e-06, "loss": 2.725452880859375, "step": 757800 }, { "epoch": 0.9145073210962625, "learning_rate": 6.979714536784566e-06, "loss": 2.7137100219726564, "step": 757900 }, { "epoch": 0.9146279844187452, "learning_rate": 6.979310701316827e-06, "loss": 2.7367401123046875, "step": 758000 }, { "epoch": 0.9147486477412279, "learning_rate": 6.978906865849089e-06, "loss": 2.7375335693359375, "step": 758100 }, { "epoch": 0.9148693110637105, "learning_rate": 6.978503030381351e-06, "loss": 2.7440301513671876, "step": 758200 }, { "epoch": 0.9149899743861932, "learning_rate": 6.978099194913613e-06, "loss": 2.7281399536132813, "step": 758300 }, { "epoch": 0.915110637708676, "learning_rate": 6.977695359445874e-06, "loss": 2.7083004760742186, "step": 758400 }, { "epoch": 0.9152313010311586, "learning_rate": 6.977291523978136e-06, "loss": 2.7087408447265626, "step": 758500 }, { "epoch": 0.9153519643536413, "learning_rate": 6.976887688510396e-06, "loss": 2.685780029296875, "step": 758600 }, { "epoch": 0.9154726276761239, "learning_rate": 6.976483853042658e-06, "loss": 2.6974197387695313, "step": 758700 }, { "epoch": 0.9155932909986066, "learning_rate": 6.97608001757492e-06, "loss": 2.717125244140625, "step": 758800 }, { "epoch": 0.9157139543210894, "learning_rate": 6.975676182107182e-06, "loss": 2.710915222167969, "step": 758900 }, { "epoch": 0.915834617643572, "learning_rate": 6.975272346639443e-06, "loss": 2.696430969238281, "step": 759000 }, { "epoch": 0.9159552809660547, "learning_rate": 6.974868511171705e-06, "loss": 2.723599853515625, "step": 759100 }, { "epoch": 0.9160759442885373, "learning_rate": 6.974464675703967e-06, "loss": 2.696347961425781, "step": 759200 }, { "epoch": 0.9161966076110201, "learning_rate": 6.974060840236228e-06, "loss": 2.704950866699219, "step": 759300 }, { "epoch": 0.9163172709335028, "learning_rate": 6.973657004768489e-06, "loss": 2.72002685546875, "step": 759400 }, { "epoch": 0.9164379342559854, "learning_rate": 6.973253169300751e-06, "loss": 2.7140692138671874, "step": 759500 }, { "epoch": 0.9165585975784681, "learning_rate": 6.9728493338330125e-06, "loss": 2.710602111816406, "step": 759600 }, { "epoch": 0.9166792609009508, "learning_rate": 6.9724454983652745e-06, "loss": 2.6868490600585937, "step": 759700 }, { "epoch": 0.9167999242234335, "learning_rate": 6.9720416628975365e-06, "loss": 2.6989642333984376, "step": 759800 }, { "epoch": 0.9169205875459162, "learning_rate": 6.971637827429798e-06, "loss": 2.721639404296875, "step": 759900 }, { "epoch": 0.9170412508683988, "learning_rate": 6.97123399196206e-06, "loss": 2.714097595214844, "step": 760000 }, { "epoch": 0.9171619141908816, "learning_rate": 6.970830156494322e-06, "loss": 2.7013153076171874, "step": 760100 }, { "epoch": 0.9172825775133642, "learning_rate": 6.970426321026582e-06, "loss": 2.708526916503906, "step": 760200 }, { "epoch": 0.9174032408358469, "learning_rate": 6.970022485558844e-06, "loss": 2.725055847167969, "step": 760300 }, { "epoch": 0.9175239041583296, "learning_rate": 6.969618650091106e-06, "loss": 2.7046444702148436, "step": 760400 }, { "epoch": 0.9176445674808122, "learning_rate": 6.969214814623367e-06, "loss": 2.7154812622070312, "step": 760500 }, { "epoch": 0.917765230803295, "learning_rate": 6.968810979155629e-06, "loss": 2.723992919921875, "step": 760600 }, { "epoch": 0.9178858941257776, "learning_rate": 6.968407143687891e-06, "loss": 2.7231289672851564, "step": 760700 }, { "epoch": 0.9180065574482603, "learning_rate": 6.968003308220153e-06, "loss": 2.7140087890625, "step": 760800 }, { "epoch": 0.918127220770743, "learning_rate": 6.967599472752414e-06, "loss": 2.7221444702148436, "step": 760900 }, { "epoch": 0.9182478840932257, "learning_rate": 6.967195637284675e-06, "loss": 2.742440490722656, "step": 761000 }, { "epoch": 0.9183685474157084, "learning_rate": 6.966791801816936e-06, "loss": 2.70039306640625, "step": 761100 }, { "epoch": 0.918489210738191, "learning_rate": 6.966387966349198e-06, "loss": 2.6976992797851564, "step": 761200 }, { "epoch": 0.9186098740606737, "learning_rate": 6.96598413088146e-06, "loss": 2.716680603027344, "step": 761300 }, { "epoch": 0.9187305373831565, "learning_rate": 6.965580295413722e-06, "loss": 2.719371643066406, "step": 761400 }, { "epoch": 0.9188512007056391, "learning_rate": 6.965176459945983e-06, "loss": 2.7075543212890625, "step": 761500 }, { "epoch": 0.9189718640281218, "learning_rate": 6.964772624478245e-06, "loss": 2.7399853515625, "step": 761600 }, { "epoch": 0.9190925273506044, "learning_rate": 6.964368789010507e-06, "loss": 2.6807687377929685, "step": 761700 }, { "epoch": 0.9192131906730872, "learning_rate": 6.9639649535427685e-06, "loss": 2.706905517578125, "step": 761800 }, { "epoch": 0.9193338539955699, "learning_rate": 6.96356111807503e-06, "loss": 2.7048809814453123, "step": 761900 }, { "epoch": 0.9194545173180525, "learning_rate": 6.963157282607292e-06, "loss": 2.69527587890625, "step": 762000 }, { "epoch": 0.9195751806405352, "learning_rate": 6.962753447139553e-06, "loss": 2.685765686035156, "step": 762100 }, { "epoch": 0.9196958439630178, "learning_rate": 6.962349611671815e-06, "loss": 2.726064453125, "step": 762200 }, { "epoch": 0.9198165072855006, "learning_rate": 6.961945776204077e-06, "loss": 2.7296441650390624, "step": 762300 }, { "epoch": 0.9199371706079833, "learning_rate": 6.961541940736338e-06, "loss": 2.681319580078125, "step": 762400 }, { "epoch": 0.9200578339304659, "learning_rate": 6.9611381052686e-06, "loss": 2.6966326904296873, "step": 762500 }, { "epoch": 0.9201784972529486, "learning_rate": 6.960734269800862e-06, "loss": 2.704101867675781, "step": 762600 }, { "epoch": 0.9202991605754313, "learning_rate": 6.960330434333122e-06, "loss": 2.7356027221679686, "step": 762700 }, { "epoch": 0.920419823897914, "learning_rate": 6.959926598865384e-06, "loss": 2.7033782958984376, "step": 762800 }, { "epoch": 0.9205404872203967, "learning_rate": 6.959522763397646e-06, "loss": 2.7299237060546875, "step": 762900 }, { "epoch": 0.9206611505428793, "learning_rate": 6.959118927929907e-06, "loss": 2.6986846923828125, "step": 763000 }, { "epoch": 0.9207818138653621, "learning_rate": 6.958715092462169e-06, "loss": 2.6819708251953127, "step": 763100 }, { "epoch": 0.9209024771878448, "learning_rate": 6.958311256994431e-06, "loss": 2.7112496948242186, "step": 763200 }, { "epoch": 0.9210231405103274, "learning_rate": 6.957907421526693e-06, "loss": 2.707572326660156, "step": 763300 }, { "epoch": 0.9211438038328101, "learning_rate": 6.957503586058954e-06, "loss": 2.7444638061523436, "step": 763400 }, { "epoch": 0.9212644671552928, "learning_rate": 6.9570997505912154e-06, "loss": 2.721355285644531, "step": 763500 }, { "epoch": 0.9213851304777755, "learning_rate": 6.956695915123477e-06, "loss": 2.7093276977539062, "step": 763600 }, { "epoch": 0.9215057938002582, "learning_rate": 6.9562920796557386e-06, "loss": 2.7083489990234373, "step": 763700 }, { "epoch": 0.9216264571227408, "learning_rate": 6.9558882441880005e-06, "loss": 2.753251037597656, "step": 763800 }, { "epoch": 0.9217471204452236, "learning_rate": 6.9554844087202625e-06, "loss": 2.7183648681640626, "step": 763900 }, { "epoch": 0.9218677837677062, "learning_rate": 6.955080573252524e-06, "loss": 2.7290078735351564, "step": 764000 }, { "epoch": 0.9219884470901889, "learning_rate": 6.954676737784786e-06, "loss": 2.72128173828125, "step": 764100 }, { "epoch": 0.9221091104126716, "learning_rate": 6.954272902317048e-06, "loss": 2.7131747436523437, "step": 764200 }, { "epoch": 0.9222297737351542, "learning_rate": 6.953869066849308e-06, "loss": 2.714777526855469, "step": 764300 }, { "epoch": 0.922350437057637, "learning_rate": 6.95346523138157e-06, "loss": 2.6997210693359377, "step": 764400 }, { "epoch": 0.9224711003801196, "learning_rate": 6.953061395913832e-06, "loss": 2.7271597290039065, "step": 764500 }, { "epoch": 0.9225917637026023, "learning_rate": 6.952657560446093e-06, "loss": 2.745616149902344, "step": 764600 }, { "epoch": 0.922712427025085, "learning_rate": 6.952253724978355e-06, "loss": 2.6939227294921877, "step": 764700 }, { "epoch": 0.9228330903475677, "learning_rate": 6.951849889510617e-06, "loss": 2.704753723144531, "step": 764800 }, { "epoch": 0.9229537536700504, "learning_rate": 6.951446054042878e-06, "loss": 2.7193789672851563, "step": 764900 }, { "epoch": 0.923074416992533, "learning_rate": 6.95104221857514e-06, "loss": 2.6972140502929687, "step": 765000 }, { "epoch": 0.9231950803150157, "learning_rate": 6.950638383107401e-06, "loss": 2.7116754150390623, "step": 765100 }, { "epoch": 0.9233157436374985, "learning_rate": 6.950234547639662e-06, "loss": 2.696826171875, "step": 765200 }, { "epoch": 0.9234364069599811, "learning_rate": 6.949830712171924e-06, "loss": 2.6825689697265624, "step": 765300 }, { "epoch": 0.9235570702824638, "learning_rate": 6.949426876704186e-06, "loss": 2.733409118652344, "step": 765400 }, { "epoch": 0.9236777336049464, "learning_rate": 6.9490230412364475e-06, "loss": 2.7111666870117186, "step": 765500 }, { "epoch": 0.9237983969274292, "learning_rate": 6.9486192057687095e-06, "loss": 2.7072442626953124, "step": 765600 }, { "epoch": 0.9239190602499119, "learning_rate": 6.9482153703009714e-06, "loss": 2.7210903930664063, "step": 765700 }, { "epoch": 0.9240397235723945, "learning_rate": 6.947811534833233e-06, "loss": 2.716011962890625, "step": 765800 }, { "epoch": 0.9241603868948772, "learning_rate": 6.947407699365494e-06, "loss": 2.7110159301757815, "step": 765900 }, { "epoch": 0.9242810502173598, "learning_rate": 6.947003863897756e-06, "loss": 2.699219055175781, "step": 766000 }, { "epoch": 0.9244017135398426, "learning_rate": 6.946600028430017e-06, "loss": 2.7015451049804686, "step": 766100 }, { "epoch": 0.9245223768623253, "learning_rate": 6.946196192962279e-06, "loss": 2.699013977050781, "step": 766200 }, { "epoch": 0.9246430401848079, "learning_rate": 6.945792357494541e-06, "loss": 2.6999081420898436, "step": 766300 }, { "epoch": 0.9247637035072906, "learning_rate": 6.945388522026803e-06, "loss": 2.71362060546875, "step": 766400 }, { "epoch": 0.9248843668297733, "learning_rate": 6.944984686559064e-06, "loss": 2.7305923461914063, "step": 766500 }, { "epoch": 0.925005030152256, "learning_rate": 6.944580851091326e-06, "loss": 2.715047607421875, "step": 766600 }, { "epoch": 0.9251256934747387, "learning_rate": 6.944177015623586e-06, "loss": 2.708504333496094, "step": 766700 }, { "epoch": 0.9252463567972213, "learning_rate": 6.943773180155848e-06, "loss": 2.7337991333007814, "step": 766800 }, { "epoch": 0.9253670201197041, "learning_rate": 6.94336934468811e-06, "loss": 2.710657043457031, "step": 766900 }, { "epoch": 0.9254876834421867, "learning_rate": 6.942965509220372e-06, "loss": 2.7390896606445314, "step": 767000 }, { "epoch": 0.9256083467646694, "learning_rate": 6.942561673752633e-06, "loss": 2.7206436157226563, "step": 767100 }, { "epoch": 0.9257290100871521, "learning_rate": 6.942157838284895e-06, "loss": 2.7318191528320312, "step": 767200 }, { "epoch": 0.9258496734096348, "learning_rate": 6.941754002817157e-06, "loss": 2.7278036499023437, "step": 767300 }, { "epoch": 0.9259703367321175, "learning_rate": 6.941350167349419e-06, "loss": 2.6993109130859376, "step": 767400 }, { "epoch": 0.9260910000546001, "learning_rate": 6.94094633188168e-06, "loss": 2.72431884765625, "step": 767500 }, { "epoch": 0.9262116633770828, "learning_rate": 6.9405424964139415e-06, "loss": 2.7293734741210938, "step": 767600 }, { "epoch": 0.9263323266995656, "learning_rate": 6.940138660946203e-06, "loss": 2.726324462890625, "step": 767700 }, { "epoch": 0.9264529900220482, "learning_rate": 6.939734825478465e-06, "loss": 2.7142318725585937, "step": 767800 }, { "epoch": 0.9265736533445309, "learning_rate": 6.939330990010727e-06, "loss": 2.6950982666015624, "step": 767900 }, { "epoch": 0.9266943166670136, "learning_rate": 6.9389271545429886e-06, "loss": 2.725982666015625, "step": 768000 }, { "epoch": 0.9268149799894962, "learning_rate": 6.93852331907525e-06, "loss": 2.7130923461914063, "step": 768100 }, { "epoch": 0.926935643311979, "learning_rate": 6.938119483607512e-06, "loss": 2.704115295410156, "step": 768200 }, { "epoch": 0.9270563066344616, "learning_rate": 6.937715648139774e-06, "loss": 2.7048297119140625, "step": 768300 }, { "epoch": 0.9271769699569443, "learning_rate": 6.937311812672034e-06, "loss": 2.689481506347656, "step": 768400 }, { "epoch": 0.927297633279427, "learning_rate": 6.936907977204296e-06, "loss": 2.7060397338867186, "step": 768500 }, { "epoch": 0.9274182966019097, "learning_rate": 6.936504141736558e-06, "loss": 2.7118771362304686, "step": 768600 }, { "epoch": 0.9275389599243924, "learning_rate": 6.936100306268819e-06, "loss": 2.7096142578125, "step": 768700 }, { "epoch": 0.927659623246875, "learning_rate": 6.935696470801081e-06, "loss": 2.6985372924804687, "step": 768800 }, { "epoch": 0.9277802865693577, "learning_rate": 6.935292635333343e-06, "loss": 2.72333984375, "step": 768900 }, { "epoch": 0.9279009498918405, "learning_rate": 6.934888799865604e-06, "loss": 2.717132873535156, "step": 769000 }, { "epoch": 0.9280216132143231, "learning_rate": 6.934484964397866e-06, "loss": 2.696222839355469, "step": 769100 }, { "epoch": 0.9281422765368058, "learning_rate": 6.934081128930127e-06, "loss": 2.71998779296875, "step": 769200 }, { "epoch": 0.9282629398592884, "learning_rate": 6.933677293462388e-06, "loss": 2.746978454589844, "step": 769300 }, { "epoch": 0.9283836031817712, "learning_rate": 6.93327345799465e-06, "loss": 2.7055157470703124, "step": 769400 }, { "epoch": 0.9285042665042539, "learning_rate": 6.932869622526912e-06, "loss": 2.7084616088867186, "step": 769500 }, { "epoch": 0.9286249298267365, "learning_rate": 6.9324657870591735e-06, "loss": 2.7281369018554686, "step": 769600 }, { "epoch": 0.9287455931492192, "learning_rate": 6.9320619515914355e-06, "loss": 2.70949462890625, "step": 769700 }, { "epoch": 0.9288662564717018, "learning_rate": 6.9316581161236975e-06, "loss": 2.7162203979492188, "step": 769800 }, { "epoch": 0.9289869197941846, "learning_rate": 6.9312542806559595e-06, "loss": 2.714763488769531, "step": 769900 }, { "epoch": 0.9291075831166673, "learning_rate": 6.93085044518822e-06, "loss": 2.704931335449219, "step": 770000 }, { "epoch": 0.9292282464391499, "learning_rate": 6.930446609720482e-06, "loss": 2.73090087890625, "step": 770100 }, { "epoch": 0.9293489097616326, "learning_rate": 6.930042774252743e-06, "loss": 2.69136962890625, "step": 770200 }, { "epoch": 0.9294695730841153, "learning_rate": 6.929638938785005e-06, "loss": 2.708759765625, "step": 770300 }, { "epoch": 0.929590236406598, "learning_rate": 6.929235103317267e-06, "loss": 2.7128842163085936, "step": 770400 }, { "epoch": 0.9297108997290807, "learning_rate": 6.928831267849529e-06, "loss": 2.7096026611328123, "step": 770500 }, { "epoch": 0.9298315630515633, "learning_rate": 6.92842743238179e-06, "loss": 2.7300595092773436, "step": 770600 }, { "epoch": 0.9299522263740461, "learning_rate": 6.928023596914052e-06, "loss": 2.718547668457031, "step": 770700 }, { "epoch": 0.9300728896965287, "learning_rate": 6.927619761446312e-06, "loss": 2.70151123046875, "step": 770800 }, { "epoch": 0.9301935530190114, "learning_rate": 6.927215925978574e-06, "loss": 2.713346252441406, "step": 770900 }, { "epoch": 0.9303142163414941, "learning_rate": 6.926812090510836e-06, "loss": 2.7114483642578127, "step": 771000 }, { "epoch": 0.9304348796639768, "learning_rate": 6.926408255043098e-06, "loss": 2.7203155517578126, "step": 771100 }, { "epoch": 0.9305555429864595, "learning_rate": 6.926004419575359e-06, "loss": 2.6935879516601564, "step": 771200 }, { "epoch": 0.9306762063089421, "learning_rate": 6.925600584107621e-06, "loss": 2.699639892578125, "step": 771300 }, { "epoch": 0.9307968696314248, "learning_rate": 6.925196748639883e-06, "loss": 2.69577880859375, "step": 771400 }, { "epoch": 0.9309175329539076, "learning_rate": 6.924792913172144e-06, "loss": 2.7279010009765625, "step": 771500 }, { "epoch": 0.9310381962763902, "learning_rate": 6.9243890777044055e-06, "loss": 2.6930416870117186, "step": 771600 }, { "epoch": 0.9311588595988729, "learning_rate": 6.9239852422366675e-06, "loss": 2.7251531982421877, "step": 771700 }, { "epoch": 0.9312795229213555, "learning_rate": 6.923581406768929e-06, "loss": 2.6980877685546876, "step": 771800 }, { "epoch": 0.9314001862438382, "learning_rate": 6.923177571301191e-06, "loss": 2.7033090209960937, "step": 771900 }, { "epoch": 0.931520849566321, "learning_rate": 6.922773735833453e-06, "loss": 2.722109375, "step": 772000 }, { "epoch": 0.9316415128888036, "learning_rate": 6.922369900365714e-06, "loss": 2.7122137451171877, "step": 772100 }, { "epoch": 0.9317621762112863, "learning_rate": 6.921966064897976e-06, "loss": 2.6771124267578124, "step": 772200 }, { "epoch": 0.9318828395337689, "learning_rate": 6.921562229430238e-06, "loss": 2.7164907836914063, "step": 772300 }, { "epoch": 0.9320035028562517, "learning_rate": 6.9211583939625e-06, "loss": 2.7073919677734377, "step": 772400 }, { "epoch": 0.9321241661787344, "learning_rate": 6.92075455849476e-06, "loss": 2.7518569946289064, "step": 772500 }, { "epoch": 0.932244829501217, "learning_rate": 6.920350723027022e-06, "loss": 2.7145254516601565, "step": 772600 }, { "epoch": 0.9323654928236997, "learning_rate": 6.919946887559283e-06, "loss": 2.7332952880859374, "step": 772700 }, { "epoch": 0.9324861561461824, "learning_rate": 6.919543052091545e-06, "loss": 2.686192932128906, "step": 772800 }, { "epoch": 0.9326068194686651, "learning_rate": 6.919139216623807e-06, "loss": 2.695884094238281, "step": 772900 }, { "epoch": 0.9327274827911478, "learning_rate": 6.918735381156069e-06, "loss": 2.7109515380859377, "step": 773000 }, { "epoch": 0.9328481461136304, "learning_rate": 6.91833154568833e-06, "loss": 2.7053292846679686, "step": 773100 }, { "epoch": 0.9329688094361132, "learning_rate": 6.917927710220592e-06, "loss": 2.728251953125, "step": 773200 }, { "epoch": 0.9330894727585959, "learning_rate": 6.9175238747528525e-06, "loss": 2.6773690795898437, "step": 773300 }, { "epoch": 0.9332101360810785, "learning_rate": 6.9171200392851144e-06, "loss": 2.7007586669921877, "step": 773400 }, { "epoch": 0.9333307994035612, "learning_rate": 6.916716203817376e-06, "loss": 2.706307067871094, "step": 773500 }, { "epoch": 0.9334514627260438, "learning_rate": 6.916312368349638e-06, "loss": 2.693376159667969, "step": 773600 }, { "epoch": 0.9335721260485266, "learning_rate": 6.9159085328818995e-06, "loss": 2.7099908447265624, "step": 773700 }, { "epoch": 0.9336927893710093, "learning_rate": 6.9155046974141615e-06, "loss": 2.6912216186523437, "step": 773800 }, { "epoch": 0.9338134526934919, "learning_rate": 6.9151008619464235e-06, "loss": 2.7100604248046873, "step": 773900 }, { "epoch": 0.9339341160159746, "learning_rate": 6.914697026478685e-06, "loss": 2.68709228515625, "step": 774000 }, { "epoch": 0.9340547793384573, "learning_rate": 6.914293191010946e-06, "loss": 2.684173889160156, "step": 774100 }, { "epoch": 0.93417544266094, "learning_rate": 6.913889355543208e-06, "loss": 2.6919992065429685, "step": 774200 }, { "epoch": 0.9342961059834227, "learning_rate": 6.913485520075469e-06, "loss": 2.72694580078125, "step": 774300 }, { "epoch": 0.9344167693059053, "learning_rate": 6.913081684607731e-06, "loss": 2.72618896484375, "step": 774400 }, { "epoch": 0.9345374326283881, "learning_rate": 6.912677849139993e-06, "loss": 2.7042236328125, "step": 774500 }, { "epoch": 0.9346580959508707, "learning_rate": 6.912274013672254e-06, "loss": 2.72306396484375, "step": 774600 }, { "epoch": 0.9347787592733534, "learning_rate": 6.911870178204516e-06, "loss": 2.7018829345703126, "step": 774700 }, { "epoch": 0.9348994225958361, "learning_rate": 6.911466342736778e-06, "loss": 2.6873052978515624, "step": 774800 }, { "epoch": 0.9350200859183188, "learning_rate": 6.911062507269038e-06, "loss": 2.7239227294921875, "step": 774900 }, { "epoch": 0.9351407492408015, "learning_rate": 6.9106586718013e-06, "loss": 2.708006591796875, "step": 775000 }, { "epoch": 0.9352614125632841, "learning_rate": 6.910254836333562e-06, "loss": 2.728523864746094, "step": 775100 }, { "epoch": 0.9353820758857668, "learning_rate": 6.909851000865823e-06, "loss": 2.7073623657226564, "step": 775200 }, { "epoch": 0.9355027392082496, "learning_rate": 6.909447165398085e-06, "loss": 2.698633117675781, "step": 775300 }, { "epoch": 0.9356234025307322, "learning_rate": 6.909043329930347e-06, "loss": 2.6993307495117187, "step": 775400 }, { "epoch": 0.9357440658532149, "learning_rate": 6.908639494462609e-06, "loss": 2.6809100341796874, "step": 775500 }, { "epoch": 0.9358647291756975, "learning_rate": 6.9082356589948704e-06, "loss": 2.726416015625, "step": 775600 }, { "epoch": 0.9359853924981802, "learning_rate": 6.9078318235271316e-06, "loss": 2.7061093139648436, "step": 775700 }, { "epoch": 0.936106055820663, "learning_rate": 6.907427988059393e-06, "loss": 2.7084561157226563, "step": 775800 }, { "epoch": 0.9362267191431456, "learning_rate": 6.907024152591655e-06, "loss": 2.698969421386719, "step": 775900 }, { "epoch": 0.9363473824656283, "learning_rate": 6.906620317123917e-06, "loss": 2.697595520019531, "step": 776000 }, { "epoch": 0.9364680457881109, "learning_rate": 6.906216481656179e-06, "loss": 2.7139797973632813, "step": 776100 }, { "epoch": 0.9365887091105937, "learning_rate": 6.90581264618844e-06, "loss": 2.691824645996094, "step": 776200 }, { "epoch": 0.9367093724330764, "learning_rate": 6.905408810720702e-06, "loss": 2.6998385620117187, "step": 776300 }, { "epoch": 0.936830035755559, "learning_rate": 6.905004975252964e-06, "loss": 2.6876129150390624, "step": 776400 }, { "epoch": 0.9369506990780417, "learning_rate": 6.904601139785224e-06, "loss": 2.69812255859375, "step": 776500 }, { "epoch": 0.9370713624005244, "learning_rate": 6.904197304317486e-06, "loss": 2.6965487670898436, "step": 776600 }, { "epoch": 0.9371920257230071, "learning_rate": 6.903793468849748e-06, "loss": 2.687722473144531, "step": 776700 }, { "epoch": 0.9373126890454898, "learning_rate": 6.903389633382009e-06, "loss": 2.674696350097656, "step": 776800 }, { "epoch": 0.9374333523679724, "learning_rate": 6.902985797914271e-06, "loss": 2.703077697753906, "step": 776900 }, { "epoch": 0.9375540156904552, "learning_rate": 6.902581962446533e-06, "loss": 2.7088275146484375, "step": 777000 }, { "epoch": 0.9376746790129378, "learning_rate": 6.902178126978794e-06, "loss": 2.7058575439453123, "step": 777100 }, { "epoch": 0.9377953423354205, "learning_rate": 6.901774291511056e-06, "loss": 2.6725701904296875, "step": 777200 }, { "epoch": 0.9379160056579032, "learning_rate": 6.901370456043318e-06, "loss": 2.6719586181640627, "step": 777300 }, { "epoch": 0.9380366689803858, "learning_rate": 6.9009666205755785e-06, "loss": 2.7048577880859375, "step": 777400 }, { "epoch": 0.9381573323028686, "learning_rate": 6.9005627851078405e-06, "loss": 2.6799310302734374, "step": 777500 }, { "epoch": 0.9382779956253512, "learning_rate": 6.9001589496401025e-06, "loss": 2.7246563720703123, "step": 777600 }, { "epoch": 0.9383986589478339, "learning_rate": 6.899755114172364e-06, "loss": 2.704770812988281, "step": 777700 }, { "epoch": 0.9385193222703166, "learning_rate": 6.8993512787046256e-06, "loss": 2.7322308349609377, "step": 777800 }, { "epoch": 0.9386399855927993, "learning_rate": 6.8989474432368876e-06, "loss": 2.71516357421875, "step": 777900 }, { "epoch": 0.938760648915282, "learning_rate": 6.8985436077691495e-06, "loss": 2.709796142578125, "step": 778000 }, { "epoch": 0.9388813122377646, "learning_rate": 6.898139772301411e-06, "loss": 2.697861633300781, "step": 778100 }, { "epoch": 0.9390019755602473, "learning_rate": 6.897735936833672e-06, "loss": 2.6971392822265625, "step": 778200 }, { "epoch": 0.9391226388827301, "learning_rate": 6.897332101365933e-06, "loss": 2.698938903808594, "step": 778300 }, { "epoch": 0.9392433022052127, "learning_rate": 6.896928265898195e-06, "loss": 2.689117126464844, "step": 778400 }, { "epoch": 0.9393639655276954, "learning_rate": 6.896524430430457e-06, "loss": 2.65630859375, "step": 778500 }, { "epoch": 0.9394846288501781, "learning_rate": 6.896120594962719e-06, "loss": 2.686415710449219, "step": 778600 }, { "epoch": 0.9396052921726608, "learning_rate": 6.89571675949498e-06, "loss": 2.7130313110351563, "step": 778700 }, { "epoch": 0.9397259554951435, "learning_rate": 6.895312924027242e-06, "loss": 2.6894622802734376, "step": 778800 }, { "epoch": 0.9398466188176261, "learning_rate": 6.894909088559504e-06, "loss": 2.7211837768554688, "step": 778900 }, { "epoch": 0.9399672821401088, "learning_rate": 6.894505253091764e-06, "loss": 2.6654296875, "step": 779000 }, { "epoch": 0.9400879454625916, "learning_rate": 6.894101417624026e-06, "loss": 2.71796875, "step": 779100 }, { "epoch": 0.9402086087850742, "learning_rate": 6.893697582156288e-06, "loss": 2.6913458251953126, "step": 779200 }, { "epoch": 0.9403292721075569, "learning_rate": 6.893293746688549e-06, "loss": 2.711322021484375, "step": 779300 }, { "epoch": 0.9404499354300395, "learning_rate": 6.892889911220811e-06, "loss": 2.6974050903320315, "step": 779400 }, { "epoch": 0.9405705987525222, "learning_rate": 6.892486075753073e-06, "loss": 2.695054931640625, "step": 779500 }, { "epoch": 0.940691262075005, "learning_rate": 6.8920822402853345e-06, "loss": 2.681632385253906, "step": 779600 }, { "epoch": 0.9408119253974876, "learning_rate": 6.8916784048175965e-06, "loss": 2.7084234619140624, "step": 779700 }, { "epoch": 0.9409325887199703, "learning_rate": 6.891274569349858e-06, "loss": 2.7164697265625, "step": 779800 }, { "epoch": 0.9410532520424529, "learning_rate": 6.890870733882119e-06, "loss": 2.72239013671875, "step": 779900 }, { "epoch": 0.9411739153649357, "learning_rate": 6.890466898414381e-06, "loss": 2.6979470825195313, "step": 780000 }, { "epoch": 0.9412945786874184, "learning_rate": 6.890063062946643e-06, "loss": 2.6883090209960936, "step": 780100 }, { "epoch": 0.941415242009901, "learning_rate": 6.889659227478904e-06, "loss": 2.700802917480469, "step": 780200 }, { "epoch": 0.9415359053323837, "learning_rate": 6.889255392011166e-06, "loss": 2.723611145019531, "step": 780300 }, { "epoch": 0.9416565686548664, "learning_rate": 6.888851556543428e-06, "loss": 2.684306640625, "step": 780400 }, { "epoch": 0.9417772319773491, "learning_rate": 6.88844772107569e-06, "loss": 2.687012939453125, "step": 780500 }, { "epoch": 0.9418978952998318, "learning_rate": 6.88804388560795e-06, "loss": 2.686885986328125, "step": 780600 }, { "epoch": 0.9420185586223144, "learning_rate": 6.887640050140212e-06, "loss": 2.690635070800781, "step": 780700 }, { "epoch": 0.9421392219447972, "learning_rate": 6.887236214672473e-06, "loss": 2.6944476318359376, "step": 780800 }, { "epoch": 0.9422598852672798, "learning_rate": 6.886832379204735e-06, "loss": 2.712443542480469, "step": 780900 }, { "epoch": 0.9423805485897625, "learning_rate": 6.886428543736997e-06, "loss": 2.718123474121094, "step": 781000 }, { "epoch": 0.9425012119122452, "learning_rate": 6.886024708269259e-06, "loss": 2.6832315063476564, "step": 781100 }, { "epoch": 0.9426218752347278, "learning_rate": 6.88562087280152e-06, "loss": 2.7331011962890623, "step": 781200 }, { "epoch": 0.9427425385572106, "learning_rate": 6.885217037333782e-06, "loss": 2.699590759277344, "step": 781300 }, { "epoch": 0.9428632018796932, "learning_rate": 6.8848132018660425e-06, "loss": 2.701646728515625, "step": 781400 }, { "epoch": 0.9429838652021759, "learning_rate": 6.8844093663983045e-06, "loss": 2.707436828613281, "step": 781500 }, { "epoch": 0.9431045285246586, "learning_rate": 6.8840055309305665e-06, "loss": 2.6986178588867187, "step": 781600 }, { "epoch": 0.9432251918471413, "learning_rate": 6.8836016954628285e-06, "loss": 2.705647277832031, "step": 781700 }, { "epoch": 0.943345855169624, "learning_rate": 6.88319785999509e-06, "loss": 2.6955316162109373, "step": 781800 }, { "epoch": 0.9434665184921066, "learning_rate": 6.882794024527352e-06, "loss": 2.6958181762695315, "step": 781900 }, { "epoch": 0.9435871818145893, "learning_rate": 6.882390189059614e-06, "loss": 2.709802551269531, "step": 782000 }, { "epoch": 0.9437078451370721, "learning_rate": 6.8819863535918756e-06, "loss": 2.712794189453125, "step": 782100 }, { "epoch": 0.9438285084595547, "learning_rate": 6.881582518124136e-06, "loss": 2.677330322265625, "step": 782200 }, { "epoch": 0.9439491717820374, "learning_rate": 6.881178682656398e-06, "loss": 2.6943588256835938, "step": 782300 }, { "epoch": 0.94406983510452, "learning_rate": 6.880774847188659e-06, "loss": 2.6779534912109373, "step": 782400 }, { "epoch": 0.9441904984270028, "learning_rate": 6.880371011720921e-06, "loss": 2.7140399169921876, "step": 782500 }, { "epoch": 0.9443111617494855, "learning_rate": 6.879967176253183e-06, "loss": 2.688753662109375, "step": 782600 }, { "epoch": 0.9444318250719681, "learning_rate": 6.879563340785445e-06, "loss": 2.692589111328125, "step": 782700 }, { "epoch": 0.9445524883944508, "learning_rate": 6.879159505317706e-06, "loss": 2.695231628417969, "step": 782800 }, { "epoch": 0.9446731517169334, "learning_rate": 6.878755669849968e-06, "loss": 2.708210754394531, "step": 782900 }, { "epoch": 0.9447938150394162, "learning_rate": 6.87835183438223e-06, "loss": 2.7206710815429687, "step": 783000 }, { "epoch": 0.9449144783618989, "learning_rate": 6.87794799891449e-06, "loss": 2.7077731323242187, "step": 783100 }, { "epoch": 0.9450351416843815, "learning_rate": 6.877544163446752e-06, "loss": 2.6877816772460936, "step": 783200 }, { "epoch": 0.9451558050068642, "learning_rate": 6.877140327979014e-06, "loss": 2.7060867309570313, "step": 783300 }, { "epoch": 0.9452764683293469, "learning_rate": 6.876736492511275e-06, "loss": 2.691536560058594, "step": 783400 }, { "epoch": 0.9453971316518296, "learning_rate": 6.876332657043537e-06, "loss": 2.679559326171875, "step": 783500 }, { "epoch": 0.9455177949743123, "learning_rate": 6.875928821575799e-06, "loss": 2.6865939331054687, "step": 783600 }, { "epoch": 0.9456384582967949, "learning_rate": 6.8755249861080605e-06, "loss": 2.716458435058594, "step": 783700 }, { "epoch": 0.9457591216192777, "learning_rate": 6.8751211506403225e-06, "loss": 2.689589538574219, "step": 783800 }, { "epoch": 0.9458797849417604, "learning_rate": 6.874717315172584e-06, "loss": 2.691872863769531, "step": 783900 }, { "epoch": 0.946000448264243, "learning_rate": 6.874313479704845e-06, "loss": 2.698790283203125, "step": 784000 }, { "epoch": 0.9461211115867257, "learning_rate": 6.873909644237107e-06, "loss": 2.7061041259765624, "step": 784100 }, { "epoch": 0.9462417749092084, "learning_rate": 6.873505808769369e-06, "loss": 2.7147872924804686, "step": 784200 }, { "epoch": 0.9463624382316911, "learning_rate": 6.87310197330163e-06, "loss": 2.7183792114257814, "step": 784300 }, { "epoch": 0.9464831015541738, "learning_rate": 6.872698137833892e-06, "loss": 2.6941510009765626, "step": 784400 }, { "epoch": 0.9466037648766564, "learning_rate": 6.872294302366154e-06, "loss": 2.69320556640625, "step": 784500 }, { "epoch": 0.9467244281991392, "learning_rate": 6.871890466898416e-06, "loss": 2.688454895019531, "step": 784600 }, { "epoch": 0.9468450915216218, "learning_rate": 6.871486631430676e-06, "loss": 2.6960821533203125, "step": 784700 }, { "epoch": 0.9469657548441045, "learning_rate": 6.871082795962938e-06, "loss": 2.7080783081054687, "step": 784800 }, { "epoch": 0.9470864181665872, "learning_rate": 6.870678960495199e-06, "loss": 2.6997640991210936, "step": 784900 }, { "epoch": 0.9472070814890698, "learning_rate": 6.870275125027461e-06, "loss": 2.698119812011719, "step": 785000 }, { "epoch": 0.9473277448115526, "learning_rate": 6.869871289559723e-06, "loss": 2.6856170654296876, "step": 785100 }, { "epoch": 0.9474484081340352, "learning_rate": 6.869467454091985e-06, "loss": 2.6706402587890623, "step": 785200 }, { "epoch": 0.9475690714565179, "learning_rate": 6.869063618624246e-06, "loss": 2.6903500366210937, "step": 785300 }, { "epoch": 0.9476897347790006, "learning_rate": 6.868659783156508e-06, "loss": 2.6869570922851564, "step": 785400 }, { "epoch": 0.9478103981014833, "learning_rate": 6.8682559476887686e-06, "loss": 2.6905816650390624, "step": 785500 }, { "epoch": 0.947931061423966, "learning_rate": 6.8678521122210306e-06, "loss": 2.6731591796875, "step": 785600 }, { "epoch": 0.9480517247464486, "learning_rate": 6.8674482767532925e-06, "loss": 2.6994927978515624, "step": 785700 }, { "epoch": 0.9481723880689313, "learning_rate": 6.8670444412855545e-06, "loss": 2.6779379272460937, "step": 785800 }, { "epoch": 0.9482930513914141, "learning_rate": 6.866640605817816e-06, "loss": 2.68255126953125, "step": 785900 }, { "epoch": 0.9484137147138967, "learning_rate": 6.866236770350078e-06, "loss": 2.6855838012695314, "step": 786000 }, { "epoch": 0.9485343780363794, "learning_rate": 6.86583293488234e-06, "loss": 2.6961398315429688, "step": 786100 }, { "epoch": 0.948655041358862, "learning_rate": 6.865429099414601e-06, "loss": 2.6921310424804688, "step": 786200 }, { "epoch": 0.9487757046813448, "learning_rate": 6.865025263946862e-06, "loss": 2.7065447998046874, "step": 786300 }, { "epoch": 0.9488963680038275, "learning_rate": 6.864621428479124e-06, "loss": 2.6985897827148437, "step": 786400 }, { "epoch": 0.9490170313263101, "learning_rate": 6.864217593011385e-06, "loss": 2.6831744384765623, "step": 786500 }, { "epoch": 0.9491376946487928, "learning_rate": 6.863813757543647e-06, "loss": 2.693229064941406, "step": 786600 }, { "epoch": 0.9492583579712754, "learning_rate": 6.863409922075909e-06, "loss": 2.7117425537109376, "step": 786700 }, { "epoch": 0.9493790212937582, "learning_rate": 6.86300608660817e-06, "loss": 2.697349853515625, "step": 786800 }, { "epoch": 0.9494996846162409, "learning_rate": 6.862602251140432e-06, "loss": 2.6667523193359375, "step": 786900 }, { "epoch": 0.9496203479387235, "learning_rate": 6.862198415672694e-06, "loss": 2.6829205322265626, "step": 787000 }, { "epoch": 0.9497410112612062, "learning_rate": 6.861794580204954e-06, "loss": 2.701283264160156, "step": 787100 }, { "epoch": 0.9498616745836889, "learning_rate": 6.861390744737216e-06, "loss": 2.7187347412109375, "step": 787200 }, { "epoch": 0.9499823379061716, "learning_rate": 6.860986909269478e-06, "loss": 2.695077209472656, "step": 787300 }, { "epoch": 0.9501030012286543, "learning_rate": 6.8605830738017395e-06, "loss": 2.6848077392578125, "step": 787400 }, { "epoch": 0.9502236645511369, "learning_rate": 6.8601792383340014e-06, "loss": 2.71979736328125, "step": 787500 }, { "epoch": 0.9503443278736197, "learning_rate": 6.8597754028662634e-06, "loss": 2.687115478515625, "step": 787600 }, { "epoch": 0.9504649911961023, "learning_rate": 6.859371567398525e-06, "loss": 2.678658142089844, "step": 787700 }, { "epoch": 0.950585654518585, "learning_rate": 6.8589677319307865e-06, "loss": 2.6731732177734373, "step": 787800 }, { "epoch": 0.9507063178410677, "learning_rate": 6.8585638964630485e-06, "loss": 2.699960021972656, "step": 787900 }, { "epoch": 0.9508269811635504, "learning_rate": 6.858160060995309e-06, "loss": 2.71200927734375, "step": 788000 }, { "epoch": 0.9509476444860331, "learning_rate": 6.857756225527571e-06, "loss": 2.6778497314453125, "step": 788100 }, { "epoch": 0.9510683078085157, "learning_rate": 6.857352390059833e-06, "loss": 2.679437255859375, "step": 788200 }, { "epoch": 0.9511889711309984, "learning_rate": 6.856948554592095e-06, "loss": 2.69108154296875, "step": 788300 }, { "epoch": 0.9513096344534812, "learning_rate": 6.856544719124356e-06, "loss": 2.6952084350585936, "step": 788400 }, { "epoch": 0.9514302977759638, "learning_rate": 6.856140883656618e-06, "loss": 2.685252685546875, "step": 788500 }, { "epoch": 0.9515509610984465, "learning_rate": 6.85573704818888e-06, "loss": 2.708140869140625, "step": 788600 }, { "epoch": 0.9516716244209291, "learning_rate": 6.855333212721141e-06, "loss": 2.7034957885742186, "step": 788700 }, { "epoch": 0.9517922877434118, "learning_rate": 6.854929377253402e-06, "loss": 2.705916748046875, "step": 788800 }, { "epoch": 0.9519129510658946, "learning_rate": 6.854525541785664e-06, "loss": 2.6758883666992186, "step": 788900 }, { "epoch": 0.9520336143883772, "learning_rate": 6.854121706317925e-06, "loss": 2.725309143066406, "step": 789000 }, { "epoch": 0.9521542777108599, "learning_rate": 6.853717870850187e-06, "loss": 2.680340576171875, "step": 789100 }, { "epoch": 0.9522749410333426, "learning_rate": 6.853314035382449e-06, "loss": 2.71977783203125, "step": 789200 }, { "epoch": 0.9523956043558253, "learning_rate": 6.85291019991471e-06, "loss": 2.6834921264648437, "step": 789300 }, { "epoch": 0.952516267678308, "learning_rate": 6.852506364446972e-06, "loss": 2.6977169799804686, "step": 789400 }, { "epoch": 0.9526369310007906, "learning_rate": 6.852102528979234e-06, "loss": 2.713534240722656, "step": 789500 }, { "epoch": 0.9527575943232733, "learning_rate": 6.851698693511495e-06, "loss": 2.7157223510742186, "step": 789600 }, { "epoch": 0.9528782576457561, "learning_rate": 6.851294858043757e-06, "loss": 2.712982482910156, "step": 789700 }, { "epoch": 0.9529989209682387, "learning_rate": 6.8508910225760186e-06, "loss": 2.7126171875, "step": 789800 }, { "epoch": 0.9531195842907214, "learning_rate": 6.85048718710828e-06, "loss": 2.6991302490234377, "step": 789900 }, { "epoch": 0.953240247613204, "learning_rate": 6.850083351640542e-06, "loss": 2.672728271484375, "step": 790000 }, { "epoch": 0.9533609109356868, "learning_rate": 6.849679516172804e-06, "loss": 2.6914654541015626, "step": 790100 }, { "epoch": 0.9534815742581695, "learning_rate": 6.849275680705066e-06, "loss": 2.705994873046875, "step": 790200 }, { "epoch": 0.9536022375806521, "learning_rate": 6.848871845237327e-06, "loss": 2.69797119140625, "step": 790300 }, { "epoch": 0.9537229009031348, "learning_rate": 6.848468009769588e-06, "loss": 2.7130682373046877, "step": 790400 }, { "epoch": 0.9538435642256174, "learning_rate": 6.848064174301849e-06, "loss": 2.674532470703125, "step": 790500 }, { "epoch": 0.9539642275481002, "learning_rate": 6.847660338834111e-06, "loss": 2.7007791137695314, "step": 790600 }, { "epoch": 0.9540848908705829, "learning_rate": 6.847256503366373e-06, "loss": 2.6982965087890625, "step": 790700 }, { "epoch": 0.9542055541930655, "learning_rate": 6.846852667898635e-06, "loss": 2.67190185546875, "step": 790800 }, { "epoch": 0.9543262175155482, "learning_rate": 6.846448832430896e-06, "loss": 2.6917459106445314, "step": 790900 }, { "epoch": 0.9544468808380309, "learning_rate": 6.846044996963158e-06, "loss": 2.6997036743164062, "step": 791000 }, { "epoch": 0.9545675441605136, "learning_rate": 6.84564116149542e-06, "loss": 2.704617614746094, "step": 791100 }, { "epoch": 0.9546882074829963, "learning_rate": 6.84523732602768e-06, "loss": 2.704593505859375, "step": 791200 }, { "epoch": 0.9548088708054789, "learning_rate": 6.844833490559942e-06, "loss": 2.6877423095703126, "step": 791300 }, { "epoch": 0.9549295341279617, "learning_rate": 6.844429655092204e-06, "loss": 2.6890524291992186, "step": 791400 }, { "epoch": 0.9550501974504443, "learning_rate": 6.8440258196244655e-06, "loss": 2.694490966796875, "step": 791500 }, { "epoch": 0.955170860772927, "learning_rate": 6.8436219841567275e-06, "loss": 2.709522399902344, "step": 791600 }, { "epoch": 0.9552915240954097, "learning_rate": 6.8432181486889895e-06, "loss": 2.706404724121094, "step": 791700 }, { "epoch": 0.9554121874178924, "learning_rate": 6.842814313221251e-06, "loss": 2.688263244628906, "step": 791800 }, { "epoch": 0.9555328507403751, "learning_rate": 6.842410477753513e-06, "loss": 2.6859906005859373, "step": 791900 }, { "epoch": 0.9556535140628577, "learning_rate": 6.842006642285774e-06, "loss": 2.6879788208007813, "step": 792000 }, { "epoch": 0.9557741773853404, "learning_rate": 6.841602806818035e-06, "loss": 2.68304443359375, "step": 792100 }, { "epoch": 0.9558948407078232, "learning_rate": 6.841198971350297e-06, "loss": 2.711295166015625, "step": 792200 }, { "epoch": 0.9560155040303058, "learning_rate": 6.840795135882559e-06, "loss": 2.7052120971679687, "step": 792300 }, { "epoch": 0.9561361673527885, "learning_rate": 6.84039130041482e-06, "loss": 2.7207632446289063, "step": 792400 }, { "epoch": 0.9562568306752711, "learning_rate": 6.839987464947082e-06, "loss": 2.6743267822265624, "step": 792500 }, { "epoch": 0.9563774939977538, "learning_rate": 6.839583629479344e-06, "loss": 2.6836273193359377, "step": 792600 }, { "epoch": 0.9564981573202366, "learning_rate": 6.839179794011606e-06, "loss": 2.7048394775390623, "step": 792700 }, { "epoch": 0.9566188206427192, "learning_rate": 6.838775958543867e-06, "loss": 2.7131442260742187, "step": 792800 }, { "epoch": 0.9567394839652019, "learning_rate": 6.838372123076128e-06, "loss": 2.7153109741210937, "step": 792900 }, { "epoch": 0.9568601472876845, "learning_rate": 6.837968287608389e-06, "loss": 2.6718734741210937, "step": 793000 }, { "epoch": 0.9569808106101673, "learning_rate": 6.837564452140651e-06, "loss": 2.695150146484375, "step": 793100 }, { "epoch": 0.95710147393265, "learning_rate": 6.837160616672913e-06, "loss": 2.709000549316406, "step": 793200 }, { "epoch": 0.9572221372551326, "learning_rate": 6.836756781205175e-06, "loss": 2.700020446777344, "step": 793300 }, { "epoch": 0.9573428005776153, "learning_rate": 6.836352945737436e-06, "loss": 2.7089523315429687, "step": 793400 }, { "epoch": 0.957463463900098, "learning_rate": 6.835949110269698e-06, "loss": 2.707245178222656, "step": 793500 }, { "epoch": 0.9575841272225807, "learning_rate": 6.83554527480196e-06, "loss": 2.679405517578125, "step": 793600 }, { "epoch": 0.9577047905450634, "learning_rate": 6.835141439334221e-06, "loss": 2.685549621582031, "step": 793700 }, { "epoch": 0.957825453867546, "learning_rate": 6.834737603866483e-06, "loss": 2.6958978271484373, "step": 793800 }, { "epoch": 0.9579461171900288, "learning_rate": 6.834333768398745e-06, "loss": 2.6856509399414064, "step": 793900 }, { "epoch": 0.9580667805125115, "learning_rate": 6.833929932931006e-06, "loss": 2.701844482421875, "step": 794000 }, { "epoch": 0.9581874438349941, "learning_rate": 6.833526097463268e-06, "loss": 2.7029852294921874, "step": 794100 }, { "epoch": 0.9583081071574768, "learning_rate": 6.83312226199553e-06, "loss": 2.6582180786132814, "step": 794200 }, { "epoch": 0.9584287704799594, "learning_rate": 6.832718426527792e-06, "loss": 2.701297607421875, "step": 794300 }, { "epoch": 0.9585494338024422, "learning_rate": 6.832314591060053e-06, "loss": 2.6823431396484376, "step": 794400 }, { "epoch": 0.9586700971249249, "learning_rate": 6.831910755592314e-06, "loss": 2.6907440185546876, "step": 794500 }, { "epoch": 0.9587907604474075, "learning_rate": 6.831506920124575e-06, "loss": 2.6905303955078126, "step": 794600 }, { "epoch": 0.9589114237698902, "learning_rate": 6.831103084656837e-06, "loss": 2.6836862182617187, "step": 794700 }, { "epoch": 0.9590320870923729, "learning_rate": 6.830699249189099e-06, "loss": 2.682628479003906, "step": 794800 }, { "epoch": 0.9591527504148556, "learning_rate": 6.830295413721361e-06, "loss": 2.670255432128906, "step": 794900 }, { "epoch": 0.9592734137373383, "learning_rate": 6.829891578253622e-06, "loss": 2.6966766357421874, "step": 795000 }, { "epoch": 0.9593940770598209, "learning_rate": 6.829487742785884e-06, "loss": 2.694981689453125, "step": 795100 }, { "epoch": 0.9595147403823037, "learning_rate": 6.829083907318146e-06, "loss": 2.7091305541992186, "step": 795200 }, { "epoch": 0.9596354037047863, "learning_rate": 6.8286800718504064e-06, "loss": 2.6809722900390627, "step": 795300 }, { "epoch": 0.959756067027269, "learning_rate": 6.828276236382668e-06, "loss": 2.7010037231445314, "step": 795400 }, { "epoch": 0.9598767303497517, "learning_rate": 6.82787240091493e-06, "loss": 2.685649108886719, "step": 795500 }, { "epoch": 0.9599973936722344, "learning_rate": 6.8274685654471915e-06, "loss": 2.6855316162109375, "step": 795600 }, { "epoch": 0.9601180569947171, "learning_rate": 6.8270647299794535e-06, "loss": 2.691778259277344, "step": 795700 }, { "epoch": 0.9602387203171997, "learning_rate": 6.8266608945117155e-06, "loss": 2.7441671752929686, "step": 795800 }, { "epoch": 0.9603593836396824, "learning_rate": 6.826257059043977e-06, "loss": 2.6926171875, "step": 795900 }, { "epoch": 0.9604800469621652, "learning_rate": 6.825853223576239e-06, "loss": 2.6957366943359373, "step": 796000 }, { "epoch": 0.9606007102846478, "learning_rate": 6.8254493881085e-06, "loss": 2.6825436401367186, "step": 796100 }, { "epoch": 0.9607213736071305, "learning_rate": 6.825045552640761e-06, "loss": 2.6730517578125, "step": 796200 }, { "epoch": 0.9608420369296131, "learning_rate": 6.824641717173023e-06, "loss": 2.6876568603515625, "step": 796300 }, { "epoch": 0.9609627002520958, "learning_rate": 6.824237881705285e-06, "loss": 2.6995730590820313, "step": 796400 }, { "epoch": 0.9610833635745786, "learning_rate": 6.823834046237546e-06, "loss": 2.699891357421875, "step": 796500 }, { "epoch": 0.9612040268970612, "learning_rate": 6.823430210769808e-06, "loss": 2.678602294921875, "step": 796600 }, { "epoch": 0.9613246902195439, "learning_rate": 6.82302637530207e-06, "loss": 2.690196228027344, "step": 796700 }, { "epoch": 0.9614453535420265, "learning_rate": 6.822622539834332e-06, "loss": 2.6925125122070312, "step": 796800 }, { "epoch": 0.9615660168645093, "learning_rate": 6.822218704366592e-06, "loss": 2.7001583862304686, "step": 796900 }, { "epoch": 0.961686680186992, "learning_rate": 6.821814868898854e-06, "loss": 2.7129946899414064, "step": 797000 }, { "epoch": 0.9618073435094746, "learning_rate": 6.821411033431115e-06, "loss": 2.6820724487304686, "step": 797100 }, { "epoch": 0.9619280068319573, "learning_rate": 6.821007197963377e-06, "loss": 2.71345703125, "step": 797200 }, { "epoch": 0.96204867015444, "learning_rate": 6.820603362495639e-06, "loss": 2.7013079833984377, "step": 797300 }, { "epoch": 0.9621693334769227, "learning_rate": 6.820199527027901e-06, "loss": 2.7034817504882813, "step": 797400 }, { "epoch": 0.9622899967994054, "learning_rate": 6.8197956915601624e-06, "loss": 2.6788226318359376, "step": 797500 }, { "epoch": 0.962410660121888, "learning_rate": 6.819391856092424e-06, "loss": 2.68404541015625, "step": 797600 }, { "epoch": 0.9625313234443708, "learning_rate": 6.818988020624685e-06, "loss": 2.6818505859375, "step": 797700 }, { "epoch": 0.9626519867668534, "learning_rate": 6.818584185156947e-06, "loss": 2.708017578125, "step": 797800 }, { "epoch": 0.9627726500893361, "learning_rate": 6.818180349689209e-06, "loss": 2.6850454711914065, "step": 797900 }, { "epoch": 0.9628933134118188, "learning_rate": 6.817776514221471e-06, "loss": 2.67915283203125, "step": 798000 }, { "epoch": 0.9630139767343014, "learning_rate": 6.817372678753732e-06, "loss": 2.70856201171875, "step": 798100 }, { "epoch": 0.9631346400567842, "learning_rate": 6.816968843285994e-06, "loss": 2.714721374511719, "step": 798200 }, { "epoch": 0.9632553033792668, "learning_rate": 6.816565007818256e-06, "loss": 2.71268310546875, "step": 798300 }, { "epoch": 0.9633759667017495, "learning_rate": 6.816161172350517e-06, "loss": 2.677989501953125, "step": 798400 }, { "epoch": 0.9634966300242322, "learning_rate": 6.815757336882779e-06, "loss": 2.6910800170898437, "step": 798500 }, { "epoch": 0.9636172933467149, "learning_rate": 6.81535350141504e-06, "loss": 2.694371337890625, "step": 798600 }, { "epoch": 0.9637379566691976, "learning_rate": 6.814949665947301e-06, "loss": 2.6851123046875, "step": 798700 }, { "epoch": 0.9638586199916802, "learning_rate": 6.814545830479563e-06, "loss": 2.7044406127929688, "step": 798800 }, { "epoch": 0.9639792833141629, "learning_rate": 6.814141995011825e-06, "loss": 2.6898077392578124, "step": 798900 }, { "epoch": 0.9640999466366457, "learning_rate": 6.813738159544086e-06, "loss": 2.7004083251953124, "step": 799000 }, { "epoch": 0.9642206099591283, "learning_rate": 6.813334324076348e-06, "loss": 2.6879046630859373, "step": 799100 }, { "epoch": 0.964341273281611, "learning_rate": 6.81293048860861e-06, "loss": 2.6848663330078124, "step": 799200 }, { "epoch": 0.9644619366040937, "learning_rate": 6.812526653140872e-06, "loss": 2.6838946533203125, "step": 799300 }, { "epoch": 0.9645825999265764, "learning_rate": 6.8121228176731325e-06, "loss": 2.7106149291992185, "step": 799400 }, { "epoch": 0.9647032632490591, "learning_rate": 6.8117189822053944e-06, "loss": 2.6894512939453126, "step": 799500 }, { "epoch": 0.9648239265715417, "learning_rate": 6.811315146737656e-06, "loss": 2.7079510498046875, "step": 799600 }, { "epoch": 0.9649445898940244, "learning_rate": 6.8109113112699176e-06, "loss": 2.695456237792969, "step": 799700 }, { "epoch": 0.9650652532165072, "learning_rate": 6.8105074758021796e-06, "loss": 2.6870162963867186, "step": 799800 }, { "epoch": 0.9651859165389898, "learning_rate": 6.8101036403344415e-06, "loss": 2.7064361572265625, "step": 799900 }, { "epoch": 0.9653065798614725, "learning_rate": 6.809699804866703e-06, "loss": 2.707325134277344, "step": 800000 }, { "epoch": 0.9654272431839551, "learning_rate": 6.809295969398965e-06, "loss": 2.6884579467773437, "step": 800100 }, { "epoch": 0.9655479065064378, "learning_rate": 6.808892133931225e-06, "loss": 2.6800570678710938, "step": 800200 }, { "epoch": 0.9656685698289206, "learning_rate": 6.808488298463487e-06, "loss": 2.706690673828125, "step": 800300 }, { "epoch": 0.9657892331514032, "learning_rate": 6.808084462995749e-06, "loss": 2.6865118408203124, "step": 800400 }, { "epoch": 0.9659098964738859, "learning_rate": 6.807680627528011e-06, "loss": 2.686295166015625, "step": 800500 }, { "epoch": 0.9660305597963685, "learning_rate": 6.807276792060272e-06, "loss": 2.711240539550781, "step": 800600 }, { "epoch": 0.9661512231188513, "learning_rate": 6.806872956592534e-06, "loss": 2.694505310058594, "step": 800700 }, { "epoch": 0.966271886441334, "learning_rate": 6.806469121124796e-06, "loss": 2.6965765380859374, "step": 800800 }, { "epoch": 0.9663925497638166, "learning_rate": 6.806065285657057e-06, "loss": 2.6807980346679687, "step": 800900 }, { "epoch": 0.9665132130862993, "learning_rate": 6.805661450189318e-06, "loss": 2.709455871582031, "step": 801000 }, { "epoch": 0.966633876408782, "learning_rate": 6.80525761472158e-06, "loss": 2.6670916748046873, "step": 801100 }, { "epoch": 0.9667545397312647, "learning_rate": 6.804853779253841e-06, "loss": 2.6991848754882812, "step": 801200 }, { "epoch": 0.9668752030537474, "learning_rate": 6.804449943786103e-06, "loss": 2.6755157470703126, "step": 801300 }, { "epoch": 0.96699586637623, "learning_rate": 6.804046108318365e-06, "loss": 2.6537326049804686, "step": 801400 }, { "epoch": 0.9671165296987128, "learning_rate": 6.8036422728506265e-06, "loss": 2.6764602661132812, "step": 801500 }, { "epoch": 0.9672371930211954, "learning_rate": 6.8032384373828885e-06, "loss": 2.6886260986328123, "step": 801600 }, { "epoch": 0.9673578563436781, "learning_rate": 6.8028346019151504e-06, "loss": 2.6860256958007813, "step": 801700 }, { "epoch": 0.9674785196661608, "learning_rate": 6.802430766447411e-06, "loss": 2.6928305053710937, "step": 801800 }, { "epoch": 0.9675991829886434, "learning_rate": 6.802026930979673e-06, "loss": 2.703335876464844, "step": 801900 }, { "epoch": 0.9677198463111262, "learning_rate": 6.801623095511935e-06, "loss": 2.6712432861328126, "step": 802000 }, { "epoch": 0.9678405096336088, "learning_rate": 6.801219260044196e-06, "loss": 2.6686746215820314, "step": 802100 }, { "epoch": 0.9679611729560915, "learning_rate": 6.800815424576458e-06, "loss": 2.701936950683594, "step": 802200 }, { "epoch": 0.9680818362785742, "learning_rate": 6.80041158910872e-06, "loss": 2.7050506591796877, "step": 802300 }, { "epoch": 0.9682024996010569, "learning_rate": 6.800007753640982e-06, "loss": 2.67053955078125, "step": 802400 }, { "epoch": 0.9683231629235396, "learning_rate": 6.799603918173243e-06, "loss": 2.6807672119140626, "step": 802500 }, { "epoch": 0.9684438262460222, "learning_rate": 6.799200082705504e-06, "loss": 2.6952532958984374, "step": 802600 }, { "epoch": 0.9685644895685049, "learning_rate": 6.798796247237765e-06, "loss": 2.690641174316406, "step": 802700 }, { "epoch": 0.9686851528909877, "learning_rate": 6.798392411770027e-06, "loss": 2.69266845703125, "step": 802800 }, { "epoch": 0.9688058162134703, "learning_rate": 6.797988576302289e-06, "loss": 2.6992703247070313, "step": 802900 }, { "epoch": 0.968926479535953, "learning_rate": 6.797584740834551e-06, "loss": 2.6943588256835938, "step": 803000 }, { "epoch": 0.9690471428584356, "learning_rate": 6.797180905366812e-06, "loss": 2.6907293701171877, "step": 803100 }, { "epoch": 0.9691678061809184, "learning_rate": 6.796777069899074e-06, "loss": 2.688797912597656, "step": 803200 }, { "epoch": 0.9692884695034011, "learning_rate": 6.796373234431336e-06, "loss": 2.66757080078125, "step": 803300 }, { "epoch": 0.9694091328258837, "learning_rate": 6.795969398963597e-06, "loss": 2.707461242675781, "step": 803400 }, { "epoch": 0.9695297961483664, "learning_rate": 6.7955655634958585e-06, "loss": 2.679440612792969, "step": 803500 }, { "epoch": 0.969650459470849, "learning_rate": 6.7951617280281205e-06, "loss": 2.7043743896484376, "step": 803600 }, { "epoch": 0.9697711227933318, "learning_rate": 6.794757892560382e-06, "loss": 2.66918212890625, "step": 803700 }, { "epoch": 0.9698917861158145, "learning_rate": 6.794354057092644e-06, "loss": 2.717323913574219, "step": 803800 }, { "epoch": 0.9700124494382971, "learning_rate": 6.793950221624906e-06, "loss": 2.6916580200195312, "step": 803900 }, { "epoch": 0.9701331127607798, "learning_rate": 6.793546386157167e-06, "loss": 2.715509338378906, "step": 804000 }, { "epoch": 0.9702537760832625, "learning_rate": 6.793142550689429e-06, "loss": 2.6739166259765623, "step": 804100 }, { "epoch": 0.9703744394057452, "learning_rate": 6.792738715221691e-06, "loss": 2.6808645629882815, "step": 804200 }, { "epoch": 0.9704951027282279, "learning_rate": 6.792334879753951e-06, "loss": 2.6978271484375, "step": 804300 }, { "epoch": 0.9706157660507105, "learning_rate": 6.791931044286213e-06, "loss": 2.6868878173828126, "step": 804400 }, { "epoch": 0.9707364293731933, "learning_rate": 6.791527208818475e-06, "loss": 2.6900100708007812, "step": 804500 }, { "epoch": 0.970857092695676, "learning_rate": 6.791123373350736e-06, "loss": 2.683175354003906, "step": 804600 }, { "epoch": 0.9709777560181586, "learning_rate": 6.790719537882998e-06, "loss": 2.678918762207031, "step": 804700 }, { "epoch": 0.9710984193406413, "learning_rate": 6.79031570241526e-06, "loss": 2.681148681640625, "step": 804800 }, { "epoch": 0.971219082663124, "learning_rate": 6.789911866947522e-06, "loss": 2.69580078125, "step": 804900 }, { "epoch": 0.9713397459856067, "learning_rate": 6.789508031479783e-06, "loss": 2.710692138671875, "step": 805000 }, { "epoch": 0.9714604093080894, "learning_rate": 6.789104196012044e-06, "loss": 2.6963760375976564, "step": 805100 }, { "epoch": 0.971581072630572, "learning_rate": 6.7887003605443054e-06, "loss": 2.682347717285156, "step": 805200 }, { "epoch": 0.9717017359530548, "learning_rate": 6.788296525076567e-06, "loss": 2.6771612548828125, "step": 805300 }, { "epoch": 0.9718223992755374, "learning_rate": 6.787892689608829e-06, "loss": 2.678078308105469, "step": 805400 }, { "epoch": 0.9719430625980201, "learning_rate": 6.787488854141091e-06, "loss": 2.7187554931640623, "step": 805500 }, { "epoch": 0.9720637259205028, "learning_rate": 6.7870850186733525e-06, "loss": 2.700899963378906, "step": 805600 }, { "epoch": 0.9721843892429854, "learning_rate": 6.7866811832056145e-06, "loss": 2.7239028930664064, "step": 805700 }, { "epoch": 0.9723050525654682, "learning_rate": 6.7862773477378765e-06, "loss": 2.6747686767578127, "step": 805800 }, { "epoch": 0.9724257158879508, "learning_rate": 6.785873512270137e-06, "loss": 2.6927474975585937, "step": 805900 }, { "epoch": 0.9725463792104335, "learning_rate": 6.785469676802399e-06, "loss": 2.6647125244140626, "step": 806000 }, { "epoch": 0.9726670425329162, "learning_rate": 6.785065841334661e-06, "loss": 2.69884521484375, "step": 806100 }, { "epoch": 0.9727877058553989, "learning_rate": 6.784662005866922e-06, "loss": 2.677520446777344, "step": 806200 }, { "epoch": 0.9729083691778816, "learning_rate": 6.784258170399184e-06, "loss": 2.6768572998046873, "step": 806300 }, { "epoch": 0.9730290325003642, "learning_rate": 6.783854334931446e-06, "loss": 2.6970257568359375, "step": 806400 }, { "epoch": 0.9731496958228469, "learning_rate": 6.783450499463707e-06, "loss": 2.677064208984375, "step": 806500 }, { "epoch": 0.9732703591453297, "learning_rate": 6.783046663995969e-06, "loss": 2.664015197753906, "step": 806600 }, { "epoch": 0.9733910224678123, "learning_rate": 6.78264282852823e-06, "loss": 2.679351806640625, "step": 806700 }, { "epoch": 0.973511685790295, "learning_rate": 6.782238993060491e-06, "loss": 2.6948031616210937, "step": 806800 }, { "epoch": 0.9736323491127776, "learning_rate": 6.781835157592753e-06, "loss": 2.689730224609375, "step": 806900 }, { "epoch": 0.9737530124352604, "learning_rate": 6.781431322125015e-06, "loss": 2.6557235717773438, "step": 807000 }, { "epoch": 0.9738736757577431, "learning_rate": 6.781027486657276e-06, "loss": 2.670332336425781, "step": 807100 }, { "epoch": 0.9739943390802257, "learning_rate": 6.780623651189538e-06, "loss": 2.6936911010742186, "step": 807200 }, { "epoch": 0.9741150024027084, "learning_rate": 6.7802198157218e-06, "loss": 2.6822003173828124, "step": 807300 }, { "epoch": 0.974235665725191, "learning_rate": 6.779815980254062e-06, "loss": 2.6780514526367187, "step": 807400 }, { "epoch": 0.9743563290476738, "learning_rate": 6.7794121447863226e-06, "loss": 2.703970947265625, "step": 807500 }, { "epoch": 0.9744769923701565, "learning_rate": 6.7790083093185845e-06, "loss": 2.6939382934570313, "step": 807600 }, { "epoch": 0.9745976556926391, "learning_rate": 6.778604473850846e-06, "loss": 2.671354064941406, "step": 807700 }, { "epoch": 0.9747183190151218, "learning_rate": 6.778200638383108e-06, "loss": 2.689676513671875, "step": 807800 }, { "epoch": 0.9748389823376045, "learning_rate": 6.77779680291537e-06, "loss": 2.7074505615234377, "step": 807900 }, { "epoch": 0.9749596456600872, "learning_rate": 6.777392967447632e-06, "loss": 2.700010986328125, "step": 808000 }, { "epoch": 0.9750803089825699, "learning_rate": 6.776989131979893e-06, "loss": 2.6849871826171876, "step": 808100 }, { "epoch": 0.9752009723050525, "learning_rate": 6.776585296512155e-06, "loss": 2.7095816040039065, "step": 808200 }, { "epoch": 0.9753216356275353, "learning_rate": 6.776181461044417e-06, "loss": 2.670193786621094, "step": 808300 }, { "epoch": 0.9754422989500179, "learning_rate": 6.775777625576677e-06, "loss": 2.711287536621094, "step": 808400 }, { "epoch": 0.9755629622725006, "learning_rate": 6.775373790108939e-06, "loss": 2.6967694091796877, "step": 808500 }, { "epoch": 0.9756836255949833, "learning_rate": 6.774969954641201e-06, "loss": 2.6963327026367185, "step": 808600 }, { "epoch": 0.975804288917466, "learning_rate": 6.774566119173462e-06, "loss": 2.6876171875, "step": 808700 }, { "epoch": 0.9759249522399487, "learning_rate": 6.774162283705724e-06, "loss": 2.6921600341796874, "step": 808800 }, { "epoch": 0.9760456155624313, "learning_rate": 6.773758448237986e-06, "loss": 2.6753268432617188, "step": 808900 }, { "epoch": 0.976166278884914, "learning_rate": 6.773354612770248e-06, "loss": 2.688093566894531, "step": 809000 }, { "epoch": 0.9762869422073968, "learning_rate": 6.772950777302509e-06, "loss": 2.6751287841796874, "step": 809100 }, { "epoch": 0.9764076055298794, "learning_rate": 6.77254694183477e-06, "loss": 2.6506143188476563, "step": 809200 }, { "epoch": 0.9765282688523621, "learning_rate": 6.7721431063670315e-06, "loss": 2.6773471069335937, "step": 809300 }, { "epoch": 0.9766489321748447, "learning_rate": 6.7717392708992934e-06, "loss": 2.6791110229492188, "step": 809400 }, { "epoch": 0.9767695954973274, "learning_rate": 6.7713354354315554e-06, "loss": 2.671355895996094, "step": 809500 }, { "epoch": 0.9768902588198102, "learning_rate": 6.770931599963817e-06, "loss": 2.6950555419921876, "step": 809600 }, { "epoch": 0.9770109221422928, "learning_rate": 6.7705277644960785e-06, "loss": 2.6874758911132814, "step": 809700 }, { "epoch": 0.9771315854647755, "learning_rate": 6.7701239290283405e-06, "loss": 2.6821771240234376, "step": 809800 }, { "epoch": 0.9772522487872582, "learning_rate": 6.7697200935606025e-06, "loss": 2.6739187622070313, "step": 809900 }, { "epoch": 0.9773729121097409, "learning_rate": 6.769316258092863e-06, "loss": 2.6828009033203126, "step": 810000 }, { "epoch": 0.9774935754322236, "learning_rate": 6.768912422625125e-06, "loss": 2.6938296508789064, "step": 810100 }, { "epoch": 0.9776142387547062, "learning_rate": 6.768508587157387e-06, "loss": 2.6793634033203126, "step": 810200 }, { "epoch": 0.9777349020771889, "learning_rate": 6.768104751689648e-06, "loss": 2.6675564575195314, "step": 810300 }, { "epoch": 0.9778555653996717, "learning_rate": 6.76770091622191e-06, "loss": 2.6702450561523436, "step": 810400 }, { "epoch": 0.9779762287221543, "learning_rate": 6.767297080754172e-06, "loss": 2.6727130126953127, "step": 810500 }, { "epoch": 0.978096892044637, "learning_rate": 6.766893245286433e-06, "loss": 2.7010467529296873, "step": 810600 }, { "epoch": 0.9782175553671196, "learning_rate": 6.766489409818695e-06, "loss": 2.7036837768554687, "step": 810700 }, { "epoch": 0.9783382186896024, "learning_rate": 6.766085574350956e-06, "loss": 2.7078302001953123, "step": 810800 }, { "epoch": 0.9784588820120851, "learning_rate": 6.765681738883217e-06, "loss": 2.663199462890625, "step": 810900 }, { "epoch": 0.9785795453345677, "learning_rate": 6.765277903415479e-06, "loss": 2.6508743286132814, "step": 811000 }, { "epoch": 0.9787002086570504, "learning_rate": 6.764874067947741e-06, "loss": 2.6925048828125, "step": 811100 }, { "epoch": 0.978820871979533, "learning_rate": 6.764470232480002e-06, "loss": 2.688280029296875, "step": 811200 }, { "epoch": 0.9789415353020158, "learning_rate": 6.764066397012264e-06, "loss": 2.6898269653320312, "step": 811300 }, { "epoch": 0.9790621986244985, "learning_rate": 6.763662561544526e-06, "loss": 2.7011874389648436, "step": 811400 }, { "epoch": 0.9791828619469811, "learning_rate": 6.763258726076788e-06, "loss": 2.7097824096679686, "step": 811500 }, { "epoch": 0.9793035252694638, "learning_rate": 6.762854890609049e-06, "loss": 2.6825701904296877, "step": 811600 }, { "epoch": 0.9794241885919465, "learning_rate": 6.7624510551413106e-06, "loss": 2.6860009765625, "step": 811700 }, { "epoch": 0.9795448519144292, "learning_rate": 6.762047219673572e-06, "loss": 2.6980886840820313, "step": 811800 }, { "epoch": 0.9796655152369119, "learning_rate": 6.761643384205834e-06, "loss": 2.6894317626953126, "step": 811900 }, { "epoch": 0.9797861785593945, "learning_rate": 6.761239548738096e-06, "loss": 2.682275695800781, "step": 812000 }, { "epoch": 0.9799068418818773, "learning_rate": 6.760835713270358e-06, "loss": 2.671392517089844, "step": 812100 }, { "epoch": 0.9800275052043599, "learning_rate": 6.760431877802619e-06, "loss": 2.67977294921875, "step": 812200 }, { "epoch": 0.9801481685268426, "learning_rate": 6.760028042334881e-06, "loss": 2.683537902832031, "step": 812300 }, { "epoch": 0.9802688318493253, "learning_rate": 6.759624206867141e-06, "loss": 2.6908953857421873, "step": 812400 }, { "epoch": 0.980389495171808, "learning_rate": 6.759220371399403e-06, "loss": 2.695611572265625, "step": 812500 }, { "epoch": 0.9805101584942907, "learning_rate": 6.758816535931665e-06, "loss": 2.660994567871094, "step": 812600 }, { "epoch": 0.9806308218167733, "learning_rate": 6.758412700463927e-06, "loss": 2.6747811889648436, "step": 812700 }, { "epoch": 0.980751485139256, "learning_rate": 6.758008864996188e-06, "loss": 2.6699423217773437, "step": 812800 }, { "epoch": 0.9808721484617388, "learning_rate": 6.75760502952845e-06, "loss": 2.6848773193359374, "step": 812900 }, { "epoch": 0.9809928117842214, "learning_rate": 6.757201194060712e-06, "loss": 2.7114273071289063, "step": 813000 }, { "epoch": 0.9811134751067041, "learning_rate": 6.756797358592973e-06, "loss": 2.681495361328125, "step": 813100 }, { "epoch": 0.9812341384291867, "learning_rate": 6.756393523125235e-06, "loss": 2.65793212890625, "step": 813200 }, { "epoch": 0.9813548017516694, "learning_rate": 6.755989687657496e-06, "loss": 2.69505859375, "step": 813300 }, { "epoch": 0.9814754650741522, "learning_rate": 6.7555858521897575e-06, "loss": 2.683656005859375, "step": 813400 }, { "epoch": 0.9815961283966348, "learning_rate": 6.7551820167220195e-06, "loss": 2.665914306640625, "step": 813500 }, { "epoch": 0.9817167917191175, "learning_rate": 6.7547781812542815e-06, "loss": 2.718000793457031, "step": 813600 }, { "epoch": 0.9818374550416001, "learning_rate": 6.754374345786543e-06, "loss": 2.684240417480469, "step": 813700 }, { "epoch": 0.9819581183640829, "learning_rate": 6.753970510318805e-06, "loss": 2.68198486328125, "step": 813800 }, { "epoch": 0.9820787816865656, "learning_rate": 6.7535666748510666e-06, "loss": 2.656136779785156, "step": 813900 }, { "epoch": 0.9821994450090482, "learning_rate": 6.7531628393833285e-06, "loss": 2.6939166259765623, "step": 814000 }, { "epoch": 0.9823201083315309, "learning_rate": 6.752759003915589e-06, "loss": 2.67964111328125, "step": 814100 }, { "epoch": 0.9824407716540136, "learning_rate": 6.752355168447851e-06, "loss": 2.69299560546875, "step": 814200 }, { "epoch": 0.9825614349764963, "learning_rate": 6.751951332980112e-06, "loss": 2.70552490234375, "step": 814300 }, { "epoch": 0.982682098298979, "learning_rate": 6.751547497512374e-06, "loss": 2.6740325927734374, "step": 814400 }, { "epoch": 0.9828027616214616, "learning_rate": 6.751143662044636e-06, "loss": 2.6805450439453127, "step": 814500 }, { "epoch": 0.9829234249439444, "learning_rate": 6.750739826576898e-06, "loss": 2.6954055786132813, "step": 814600 }, { "epoch": 0.983044088266427, "learning_rate": 6.750335991109159e-06, "loss": 2.681743469238281, "step": 814700 }, { "epoch": 0.9831647515889097, "learning_rate": 6.749932155641421e-06, "loss": 2.656484375, "step": 814800 }, { "epoch": 0.9832854149113924, "learning_rate": 6.749528320173681e-06, "loss": 2.6701669311523437, "step": 814900 }, { "epoch": 0.983406078233875, "learning_rate": 6.749124484705943e-06, "loss": 2.666640319824219, "step": 815000 }, { "epoch": 0.9835267415563578, "learning_rate": 6.748720649238205e-06, "loss": 2.680677795410156, "step": 815100 }, { "epoch": 0.9836474048788405, "learning_rate": 6.748316813770467e-06, "loss": 2.667122497558594, "step": 815200 }, { "epoch": 0.9837680682013231, "learning_rate": 6.747912978302728e-06, "loss": 2.677156677246094, "step": 815300 }, { "epoch": 0.9838887315238058, "learning_rate": 6.74750914283499e-06, "loss": 2.674298095703125, "step": 815400 }, { "epoch": 0.9840093948462885, "learning_rate": 6.747105307367252e-06, "loss": 2.6642822265625, "step": 815500 }, { "epoch": 0.9841300581687712, "learning_rate": 6.7467014718995135e-06, "loss": 2.679352111816406, "step": 815600 }, { "epoch": 0.9842507214912539, "learning_rate": 6.746297636431775e-06, "loss": 2.699165954589844, "step": 815700 }, { "epoch": 0.9843713848137365, "learning_rate": 6.745893800964037e-06, "loss": 2.6945315551757814, "step": 815800 }, { "epoch": 0.9844920481362193, "learning_rate": 6.745489965496298e-06, "loss": 2.6596005249023436, "step": 815900 }, { "epoch": 0.9846127114587019, "learning_rate": 6.74508613002856e-06, "loss": 2.658267822265625, "step": 816000 }, { "epoch": 0.9847333747811846, "learning_rate": 6.744682294560822e-06, "loss": 2.68552490234375, "step": 816100 }, { "epoch": 0.9848540381036673, "learning_rate": 6.744278459093083e-06, "loss": 2.6624905395507814, "step": 816200 }, { "epoch": 0.98497470142615, "learning_rate": 6.743874623625345e-06, "loss": 2.70736572265625, "step": 816300 }, { "epoch": 0.9850953647486327, "learning_rate": 6.743470788157607e-06, "loss": 2.6846636962890624, "step": 816400 }, { "epoch": 0.9852160280711153, "learning_rate": 6.743066952689867e-06, "loss": 2.6894381713867186, "step": 816500 }, { "epoch": 0.985336691393598, "learning_rate": 6.742663117222129e-06, "loss": 2.6659359741210937, "step": 816600 }, { "epoch": 0.9854573547160808, "learning_rate": 6.742259281754391e-06, "loss": 2.679892578125, "step": 816700 }, { "epoch": 0.9855780180385634, "learning_rate": 6.741855446286652e-06, "loss": 2.6737411499023436, "step": 816800 }, { "epoch": 0.9856986813610461, "learning_rate": 6.741451610818914e-06, "loss": 2.672438659667969, "step": 816900 }, { "epoch": 0.9858193446835287, "learning_rate": 6.741047775351176e-06, "loss": 2.674625244140625, "step": 817000 }, { "epoch": 0.9859400080060114, "learning_rate": 6.740643939883438e-06, "loss": 2.655400695800781, "step": 817100 }, { "epoch": 0.9860606713284942, "learning_rate": 6.740240104415699e-06, "loss": 2.6880364990234376, "step": 817200 }, { "epoch": 0.9861813346509768, "learning_rate": 6.73983626894796e-06, "loss": 2.6675970458984377, "step": 817300 }, { "epoch": 0.9863019979734595, "learning_rate": 6.7394324334802215e-06, "loss": 2.6784149169921876, "step": 817400 }, { "epoch": 0.9864226612959421, "learning_rate": 6.7390285980124835e-06, "loss": 2.646031494140625, "step": 817500 }, { "epoch": 0.9865433246184249, "learning_rate": 6.7386247625447455e-06, "loss": 2.6934979248046873, "step": 817600 }, { "epoch": 0.9866639879409076, "learning_rate": 6.7382209270770075e-06, "loss": 2.6654037475585937, "step": 817700 }, { "epoch": 0.9867846512633902, "learning_rate": 6.737817091609269e-06, "loss": 2.6561181640625, "step": 817800 }, { "epoch": 0.9869053145858729, "learning_rate": 6.737413256141531e-06, "loss": 2.674538269042969, "step": 817900 }, { "epoch": 0.9870259779083556, "learning_rate": 6.737009420673793e-06, "loss": 2.6939398193359376, "step": 818000 }, { "epoch": 0.9871466412308383, "learning_rate": 6.736605585206053e-06, "loss": 2.6833050537109373, "step": 818100 }, { "epoch": 0.987267304553321, "learning_rate": 6.736201749738315e-06, "loss": 2.6685162353515626, "step": 818200 }, { "epoch": 0.9873879678758036, "learning_rate": 6.735797914270577e-06, "loss": 2.6538433837890625, "step": 818300 }, { "epoch": 0.9875086311982864, "learning_rate": 6.735394078802838e-06, "loss": 2.6761468505859374, "step": 818400 }, { "epoch": 0.987629294520769, "learning_rate": 6.7349902433351e-06, "loss": 2.6830453491210937, "step": 818500 }, { "epoch": 0.9877499578432517, "learning_rate": 6.734586407867362e-06, "loss": 2.6938226318359373, "step": 818600 }, { "epoch": 0.9878706211657344, "learning_rate": 6.734182572399623e-06, "loss": 2.683275146484375, "step": 818700 }, { "epoch": 0.987991284488217, "learning_rate": 6.733778736931885e-06, "loss": 2.6771585083007814, "step": 818800 }, { "epoch": 0.9881119478106998, "learning_rate": 6.733374901464147e-06, "loss": 2.714053039550781, "step": 818900 }, { "epoch": 0.9882326111331824, "learning_rate": 6.732971065996407e-06, "loss": 2.6686859130859375, "step": 819000 }, { "epoch": 0.9883532744556651, "learning_rate": 6.732567230528669e-06, "loss": 2.6474444580078127, "step": 819100 }, { "epoch": 0.9884739377781478, "learning_rate": 6.732163395060931e-06, "loss": 2.6603457641601564, "step": 819200 }, { "epoch": 0.9885946011006305, "learning_rate": 6.7317595595931924e-06, "loss": 2.676976623535156, "step": 819300 }, { "epoch": 0.9887152644231132, "learning_rate": 6.731355724125454e-06, "loss": 2.6678286743164064, "step": 819400 }, { "epoch": 0.9888359277455958, "learning_rate": 6.730951888657716e-06, "loss": 2.682550354003906, "step": 819500 }, { "epoch": 0.9889565910680785, "learning_rate": 6.730548053189978e-06, "loss": 2.6728720092773437, "step": 819600 }, { "epoch": 0.9890772543905613, "learning_rate": 6.7301442177222395e-06, "loss": 2.7108804321289064, "step": 819700 }, { "epoch": 0.9891979177130439, "learning_rate": 6.729740382254501e-06, "loss": 2.6983132934570313, "step": 819800 }, { "epoch": 0.9893185810355266, "learning_rate": 6.729336546786762e-06, "loss": 2.671525573730469, "step": 819900 }, { "epoch": 0.9894392443580093, "learning_rate": 6.728932711319024e-06, "loss": 2.705901794433594, "step": 820000 }, { "epoch": 0.989559907680492, "learning_rate": 6.728528875851286e-06, "loss": 2.692937316894531, "step": 820100 }, { "epoch": 0.9896805710029747, "learning_rate": 6.728125040383548e-06, "loss": 2.7091128540039064, "step": 820200 }, { "epoch": 0.9898012343254573, "learning_rate": 6.727721204915809e-06, "loss": 2.667628173828125, "step": 820300 }, { "epoch": 0.98992189764794, "learning_rate": 6.727317369448071e-06, "loss": 2.648557434082031, "step": 820400 }, { "epoch": 0.9900425609704228, "learning_rate": 6.726913533980333e-06, "loss": 2.6960568237304687, "step": 820500 }, { "epoch": 0.9901632242929054, "learning_rate": 6.726509698512593e-06, "loss": 2.6807672119140626, "step": 820600 }, { "epoch": 0.9902838876153881, "learning_rate": 6.726105863044855e-06, "loss": 2.636048583984375, "step": 820700 }, { "epoch": 0.9904045509378707, "learning_rate": 6.725702027577117e-06, "loss": 2.665213623046875, "step": 820800 }, { "epoch": 0.9905252142603534, "learning_rate": 6.725298192109378e-06, "loss": 2.6850955200195314, "step": 820900 }, { "epoch": 0.9906458775828362, "learning_rate": 6.72489435664164e-06, "loss": 2.672674255371094, "step": 821000 }, { "epoch": 0.9907665409053188, "learning_rate": 6.724490521173902e-06, "loss": 2.697420349121094, "step": 821100 }, { "epoch": 0.9908872042278015, "learning_rate": 6.724086685706163e-06, "loss": 2.686748352050781, "step": 821200 }, { "epoch": 0.9910078675502841, "learning_rate": 6.723682850238425e-06, "loss": 2.6724563598632813, "step": 821300 }, { "epoch": 0.9911285308727669, "learning_rate": 6.7232790147706864e-06, "loss": 2.6566036987304686, "step": 821400 }, { "epoch": 0.9912491941952496, "learning_rate": 6.722875179302948e-06, "loss": 2.6710250854492186, "step": 821500 }, { "epoch": 0.9913698575177322, "learning_rate": 6.7224713438352096e-06, "loss": 2.6614364624023437, "step": 821600 }, { "epoch": 0.9914905208402149, "learning_rate": 6.7220675083674715e-06, "loss": 2.6621102905273437, "step": 821700 }, { "epoch": 0.9916111841626976, "learning_rate": 6.721663672899733e-06, "loss": 2.669195251464844, "step": 821800 }, { "epoch": 0.9917318474851803, "learning_rate": 6.721259837431995e-06, "loss": 2.668642578125, "step": 821900 }, { "epoch": 0.991852510807663, "learning_rate": 6.720856001964257e-06, "loss": 2.676502990722656, "step": 822000 }, { "epoch": 0.9919731741301456, "learning_rate": 6.720452166496519e-06, "loss": 2.6948666381835937, "step": 822100 }, { "epoch": 0.9920938374526284, "learning_rate": 6.720048331028779e-06, "loss": 2.6849105834960936, "step": 822200 }, { "epoch": 0.992214500775111, "learning_rate": 6.719644495561041e-06, "loss": 2.690841064453125, "step": 822300 }, { "epoch": 0.9923351640975937, "learning_rate": 6.719240660093302e-06, "loss": 2.650257568359375, "step": 822400 }, { "epoch": 0.9924558274200764, "learning_rate": 6.718836824625564e-06, "loss": 2.6702978515625, "step": 822500 }, { "epoch": 0.992576490742559, "learning_rate": 6.718432989157826e-06, "loss": 2.6630850219726563, "step": 822600 }, { "epoch": 0.9926971540650418, "learning_rate": 6.718029153690088e-06, "loss": 2.666379089355469, "step": 822700 }, { "epoch": 0.9928178173875244, "learning_rate": 6.717625318222349e-06, "loss": 2.6946063232421875, "step": 822800 }, { "epoch": 0.9929384807100071, "learning_rate": 6.717221482754611e-06, "loss": 2.6902044677734374, "step": 822900 }, { "epoch": 0.9930591440324898, "learning_rate": 6.716817647286871e-06, "loss": 2.6733328247070314, "step": 823000 }, { "epoch": 0.9931798073549725, "learning_rate": 6.716413811819133e-06, "loss": 2.6891790771484376, "step": 823100 }, { "epoch": 0.9933004706774552, "learning_rate": 6.716009976351395e-06, "loss": 2.681728515625, "step": 823200 }, { "epoch": 0.9934211339999378, "learning_rate": 6.715606140883657e-06, "loss": 2.6626651000976564, "step": 823300 }, { "epoch": 0.9935417973224205, "learning_rate": 6.7152023054159185e-06, "loss": 2.6870901489257815, "step": 823400 }, { "epoch": 0.9936624606449033, "learning_rate": 6.7147984699481805e-06, "loss": 2.681002197265625, "step": 823500 }, { "epoch": 0.9937831239673859, "learning_rate": 6.7143946344804424e-06, "loss": 2.6660977172851563, "step": 823600 }, { "epoch": 0.9939037872898686, "learning_rate": 6.713990799012704e-06, "loss": 2.6880914306640626, "step": 823700 }, { "epoch": 0.9940244506123512, "learning_rate": 6.7135869635449656e-06, "loss": 2.6761395263671877, "step": 823800 }, { "epoch": 0.994145113934834, "learning_rate": 6.713183128077227e-06, "loss": 2.671181945800781, "step": 823900 }, { "epoch": 0.9942657772573167, "learning_rate": 6.712779292609488e-06, "loss": 2.67576171875, "step": 824000 }, { "epoch": 0.9943864405797993, "learning_rate": 6.71237545714175e-06, "loss": 2.668782958984375, "step": 824100 }, { "epoch": 0.994507103902282, "learning_rate": 6.711971621674012e-06, "loss": 2.6599774169921875, "step": 824200 }, { "epoch": 0.9946277672247646, "learning_rate": 6.711567786206274e-06, "loss": 2.653553466796875, "step": 824300 }, { "epoch": 0.9947484305472474, "learning_rate": 6.711163950738535e-06, "loss": 2.645980224609375, "step": 824400 }, { "epoch": 0.9948690938697301, "learning_rate": 6.710760115270797e-06, "loss": 2.683380432128906, "step": 824500 }, { "epoch": 0.9949897571922127, "learning_rate": 6.710356279803059e-06, "loss": 2.682442626953125, "step": 824600 }, { "epoch": 0.9951104205146954, "learning_rate": 6.709952444335319e-06, "loss": 2.657414855957031, "step": 824700 }, { "epoch": 0.9952310838371781, "learning_rate": 6.709548608867581e-06, "loss": 2.660740966796875, "step": 824800 }, { "epoch": 0.9953517471596608, "learning_rate": 6.709144773399843e-06, "loss": 2.67637939453125, "step": 824900 }, { "epoch": 0.9954724104821435, "learning_rate": 6.708740937932104e-06, "loss": 2.6584527587890623, "step": 825000 }, { "epoch": 0.9955930738046261, "learning_rate": 6.708337102464366e-06, "loss": 2.675741882324219, "step": 825100 }, { "epoch": 0.9957137371271089, "learning_rate": 6.707933266996628e-06, "loss": 2.6681900024414062, "step": 825200 }, { "epoch": 0.9958344004495916, "learning_rate": 6.707529431528889e-06, "loss": 2.6534722900390624, "step": 825300 }, { "epoch": 0.9959550637720742, "learning_rate": 6.707125596061151e-06, "loss": 2.6840509033203124, "step": 825400 }, { "epoch": 0.9960757270945569, "learning_rate": 6.7067217605934125e-06, "loss": 2.678610534667969, "step": 825500 }, { "epoch": 0.9961963904170396, "learning_rate": 6.706317925125674e-06, "loss": 2.65917236328125, "step": 825600 }, { "epoch": 0.9963170537395223, "learning_rate": 6.705914089657936e-06, "loss": 2.6591110229492188, "step": 825700 }, { "epoch": 0.996437717062005, "learning_rate": 6.705510254190198e-06, "loss": 2.682529296875, "step": 825800 }, { "epoch": 0.9965583803844876, "learning_rate": 6.705106418722459e-06, "loss": 2.6839044189453123, "step": 825900 }, { "epoch": 0.9966790437069704, "learning_rate": 6.704702583254721e-06, "loss": 2.6751528930664064, "step": 826000 }, { "epoch": 0.996799707029453, "learning_rate": 6.704298747786983e-06, "loss": 2.670529479980469, "step": 826100 }, { "epoch": 0.9969203703519357, "learning_rate": 6.703894912319245e-06, "loss": 2.650093688964844, "step": 826200 }, { "epoch": 0.9970410336744184, "learning_rate": 6.703491076851505e-06, "loss": 2.662044677734375, "step": 826300 }, { "epoch": 0.997161696996901, "learning_rate": 6.703087241383767e-06, "loss": 2.6854217529296873, "step": 826400 }, { "epoch": 0.9972823603193838, "learning_rate": 6.702683405916028e-06, "loss": 2.696641845703125, "step": 826500 }, { "epoch": 0.9974030236418664, "learning_rate": 6.70227957044829e-06, "loss": 2.6746514892578124, "step": 826600 }, { "epoch": 0.9975236869643491, "learning_rate": 6.701875734980552e-06, "loss": 2.68685546875, "step": 826700 }, { "epoch": 0.9976443502868318, "learning_rate": 6.701471899512814e-06, "loss": 2.6613497924804688, "step": 826800 }, { "epoch": 0.9977650136093145, "learning_rate": 6.701068064045075e-06, "loss": 2.6856564331054686, "step": 826900 }, { "epoch": 0.9978856769317972, "learning_rate": 6.700664228577337e-06, "loss": 2.673701171875, "step": 827000 }, { "epoch": 0.9980063402542798, "learning_rate": 6.700260393109597e-06, "loss": 2.6949124145507812, "step": 827100 }, { "epoch": 0.9981270035767625, "learning_rate": 6.699856557641859e-06, "loss": 2.6727285766601563, "step": 827200 }, { "epoch": 0.9982476668992453, "learning_rate": 6.699452722174121e-06, "loss": 2.668210144042969, "step": 827300 }, { "epoch": 0.9983683302217279, "learning_rate": 6.699048886706383e-06, "loss": 2.6980914306640624, "step": 827400 }, { "epoch": 0.9984889935442106, "learning_rate": 6.6986450512386445e-06, "loss": 2.703157958984375, "step": 827500 }, { "epoch": 0.9986096568666932, "learning_rate": 6.6982412157709065e-06, "loss": 2.6848297119140625, "step": 827600 }, { "epoch": 0.998730320189176, "learning_rate": 6.6978373803031685e-06, "loss": 2.6548025512695315, "step": 827700 }, { "epoch": 0.9988509835116587, "learning_rate": 6.69743354483543e-06, "loss": 2.7009893798828126, "step": 827800 }, { "epoch": 0.9989716468341413, "learning_rate": 6.697029709367691e-06, "loss": 2.6848382568359375, "step": 827900 }, { "epoch": 0.999092310156624, "learning_rate": 6.696625873899953e-06, "loss": 2.656058654785156, "step": 828000 }, { "epoch": 0.9992129734791066, "learning_rate": 6.696222038432214e-06, "loss": 2.672911376953125, "step": 828100 }, { "epoch": 0.9993336368015894, "learning_rate": 6.695818202964476e-06, "loss": 2.6661865234375, "step": 828200 }, { "epoch": 0.9994543001240721, "learning_rate": 6.695414367496738e-06, "loss": 2.6962744140625, "step": 828300 }, { "epoch": 0.9995749634465547, "learning_rate": 6.695010532028999e-06, "loss": 2.6639312744140624, "step": 828400 }, { "epoch": 0.9996956267690374, "learning_rate": 6.694606696561261e-06, "loss": 2.6883038330078124, "step": 828500 }, { "epoch": 0.9998162900915201, "learning_rate": 6.694202861093523e-06, "loss": 2.6783151245117187, "step": 828600 }, { "epoch": 0.9999369534140028, "learning_rate": 6.693799025625785e-06, "loss": 2.670914611816406, "step": 828700 }, { "epoch": 1.0000579183947917, "learning_rate": 6.693395190158045e-06, "loss": 2.642450866699219, "step": 828800 }, { "epoch": 1.0001785817172744, "learning_rate": 6.692991354690307e-06, "loss": 2.664066162109375, "step": 828900 }, { "epoch": 1.000299245039757, "learning_rate": 6.692587519222568e-06, "loss": 2.672530517578125, "step": 829000 }, { "epoch": 1.0004199083622398, "learning_rate": 6.69218368375483e-06, "loss": 2.656075439453125, "step": 829100 }, { "epoch": 1.0005405716847224, "learning_rate": 6.691779848287092e-06, "loss": 2.6617922973632813, "step": 829200 }, { "epoch": 1.000661235007205, "learning_rate": 6.691376012819354e-06, "loss": 2.6811477661132814, "step": 829300 }, { "epoch": 1.000781898329688, "learning_rate": 6.690972177351615e-06, "loss": 2.656368408203125, "step": 829400 }, { "epoch": 1.0009025616521705, "learning_rate": 6.690568341883877e-06, "loss": 2.687430419921875, "step": 829500 }, { "epoch": 1.0010232249746531, "learning_rate": 6.690164506416138e-06, "loss": 2.668204040527344, "step": 829600 }, { "epoch": 1.0011438882971357, "learning_rate": 6.6897606709484e-06, "loss": 2.6946099853515624, "step": 829700 }, { "epoch": 1.0012645516196186, "learning_rate": 6.689356835480662e-06, "loss": 2.6431613159179688, "step": 829800 }, { "epoch": 1.0013852149421012, "learning_rate": 6.688953000012924e-06, "loss": 2.658269348144531, "step": 829900 }, { "epoch": 1.0015058782645838, "learning_rate": 6.688549164545185e-06, "loss": 2.665915832519531, "step": 830000 }, { "epoch": 1.0016265415870667, "learning_rate": 6.688145329077447e-06, "loss": 2.6680718994140626, "step": 830100 }, { "epoch": 1.0017472049095493, "learning_rate": 6.687741493609709e-06, "loss": 2.6460205078125, "step": 830200 }, { "epoch": 1.0018678682320319, "learning_rate": 6.68733765814197e-06, "loss": 2.665745849609375, "step": 830300 }, { "epoch": 1.0019885315545147, "learning_rate": 6.686933822674231e-06, "loss": 2.670310363769531, "step": 830400 }, { "epoch": 1.0021091948769973, "learning_rate": 6.686529987206493e-06, "loss": 2.6609701538085937, "step": 830500 }, { "epoch": 1.00222985819948, "learning_rate": 6.686126151738754e-06, "loss": 2.68549560546875, "step": 830600 }, { "epoch": 1.0023505215219626, "learning_rate": 6.685722316271016e-06, "loss": 2.6621697998046874, "step": 830700 }, { "epoch": 1.0024711848444454, "learning_rate": 6.685318480803278e-06, "loss": 2.6637542724609373, "step": 830800 }, { "epoch": 1.002591848166928, "learning_rate": 6.684914645335539e-06, "loss": 2.6727145385742186, "step": 830900 }, { "epoch": 1.0027125114894107, "learning_rate": 6.684510809867801e-06, "loss": 2.670887451171875, "step": 831000 }, { "epoch": 1.0028331748118935, "learning_rate": 6.684106974400063e-06, "loss": 2.6645999145507813, "step": 831100 }, { "epoch": 1.002953838134376, "learning_rate": 6.6837031389323235e-06, "loss": 2.6778253173828124, "step": 831200 }, { "epoch": 1.0030745014568587, "learning_rate": 6.6832993034645854e-06, "loss": 2.653314514160156, "step": 831300 }, { "epoch": 1.0031951647793416, "learning_rate": 6.682895467996847e-06, "loss": 2.669618835449219, "step": 831400 }, { "epoch": 1.0033158281018242, "learning_rate": 6.6824916325291086e-06, "loss": 2.6839334106445314, "step": 831500 }, { "epoch": 1.0034364914243068, "learning_rate": 6.6820877970613705e-06, "loss": 2.6693310546875, "step": 831600 }, { "epoch": 1.0035571547467894, "learning_rate": 6.6816839615936325e-06, "loss": 2.65457275390625, "step": 831700 }, { "epoch": 1.0036778180692723, "learning_rate": 6.6812801261258945e-06, "loss": 2.6749365234375, "step": 831800 }, { "epoch": 1.0037984813917549, "learning_rate": 6.680876290658156e-06, "loss": 2.6946420288085937, "step": 831900 }, { "epoch": 1.0039191447142375, "learning_rate": 6.680472455190417e-06, "loss": 2.6551580810546875, "step": 832000 }, { "epoch": 1.0040398080367203, "learning_rate": 6.680068619722678e-06, "loss": 2.6457122802734374, "step": 832100 }, { "epoch": 1.004160471359203, "learning_rate": 6.67966478425494e-06, "loss": 2.6547357177734376, "step": 832200 }, { "epoch": 1.0042811346816856, "learning_rate": 6.679260948787202e-06, "loss": 2.6392483520507812, "step": 832300 }, { "epoch": 1.0044017980041684, "learning_rate": 6.678857113319464e-06, "loss": 2.671790771484375, "step": 832400 }, { "epoch": 1.004522461326651, "learning_rate": 6.678453277851725e-06, "loss": 2.688953857421875, "step": 832500 }, { "epoch": 1.0046431246491336, "learning_rate": 6.678049442383987e-06, "loss": 2.669514465332031, "step": 832600 }, { "epoch": 1.0047637879716165, "learning_rate": 6.677645606916249e-06, "loss": 2.667991943359375, "step": 832700 }, { "epoch": 1.004884451294099, "learning_rate": 6.677241771448509e-06, "loss": 2.6686502075195313, "step": 832800 }, { "epoch": 1.0050051146165817, "learning_rate": 6.676837935980771e-06, "loss": 2.6730770874023437, "step": 832900 }, { "epoch": 1.0051257779390643, "learning_rate": 6.676434100513033e-06, "loss": 2.6629248046875, "step": 833000 }, { "epoch": 1.0052464412615472, "learning_rate": 6.676030265045294e-06, "loss": 2.6706048583984376, "step": 833100 }, { "epoch": 1.0053671045840298, "learning_rate": 6.675626429577556e-06, "loss": 2.6712841796875, "step": 833200 }, { "epoch": 1.0054877679065124, "learning_rate": 6.675222594109818e-06, "loss": 2.6916168212890623, "step": 833300 }, { "epoch": 1.0056084312289952, "learning_rate": 6.6748187586420794e-06, "loss": 2.6764617919921876, "step": 833400 }, { "epoch": 1.0057290945514779, "learning_rate": 6.6744149231743414e-06, "loss": 2.6857620239257813, "step": 833500 }, { "epoch": 1.0058497578739605, "learning_rate": 6.6740110877066026e-06, "loss": 2.69642333984375, "step": 833600 }, { "epoch": 1.0059704211964433, "learning_rate": 6.673607252238864e-06, "loss": 2.669405212402344, "step": 833700 }, { "epoch": 1.006091084518926, "learning_rate": 6.673203416771126e-06, "loss": 2.67684814453125, "step": 833800 }, { "epoch": 1.0062117478414085, "learning_rate": 6.672799581303388e-06, "loss": 2.694349365234375, "step": 833900 }, { "epoch": 1.0063324111638912, "learning_rate": 6.672395745835649e-06, "loss": 2.652376708984375, "step": 834000 }, { "epoch": 1.006453074486374, "learning_rate": 6.671991910367911e-06, "loss": 2.6683200073242186, "step": 834100 }, { "epoch": 1.0065737378088566, "learning_rate": 6.671588074900173e-06, "loss": 2.673197937011719, "step": 834200 }, { "epoch": 1.0066944011313392, "learning_rate": 6.671184239432435e-06, "loss": 2.6989065551757814, "step": 834300 }, { "epoch": 1.006815064453822, "learning_rate": 6.670780403964696e-06, "loss": 2.6509268188476565, "step": 834400 }, { "epoch": 1.0069357277763047, "learning_rate": 6.670376568496957e-06, "loss": 2.634881896972656, "step": 834500 }, { "epoch": 1.0070563910987873, "learning_rate": 6.669972733029218e-06, "loss": 2.6676651000976563, "step": 834600 }, { "epoch": 1.0071770544212701, "learning_rate": 6.66956889756148e-06, "loss": 2.648936767578125, "step": 834700 }, { "epoch": 1.0072977177437528, "learning_rate": 6.669165062093742e-06, "loss": 2.6786160278320312, "step": 834800 }, { "epoch": 1.0074183810662354, "learning_rate": 6.668761226626004e-06, "loss": 2.66345703125, "step": 834900 }, { "epoch": 1.007539044388718, "learning_rate": 6.668357391158265e-06, "loss": 2.6724398803710936, "step": 835000 }, { "epoch": 1.0076597077112008, "learning_rate": 6.667953555690527e-06, "loss": 2.675732421875, "step": 835100 }, { "epoch": 1.0077803710336835, "learning_rate": 6.667549720222789e-06, "loss": 2.6875408935546874, "step": 835200 }, { "epoch": 1.007901034356166, "learning_rate": 6.6671458847550495e-06, "loss": 2.664395751953125, "step": 835300 }, { "epoch": 1.008021697678649, "learning_rate": 6.6667420492873115e-06, "loss": 2.669517822265625, "step": 835400 }, { "epoch": 1.0081423610011315, "learning_rate": 6.6663382138195735e-06, "loss": 2.679656677246094, "step": 835500 }, { "epoch": 1.0082630243236141, "learning_rate": 6.665934378351835e-06, "loss": 2.650309753417969, "step": 835600 }, { "epoch": 1.008383687646097, "learning_rate": 6.6655305428840966e-06, "loss": 2.6916583251953123, "step": 835700 }, { "epoch": 1.0085043509685796, "learning_rate": 6.6651267074163586e-06, "loss": 2.6457611083984376, "step": 835800 }, { "epoch": 1.0086250142910622, "learning_rate": 6.66472287194862e-06, "loss": 2.6728253173828125, "step": 835900 }, { "epoch": 1.0087456776135448, "learning_rate": 6.664319036480882e-06, "loss": 2.6713372802734376, "step": 836000 }, { "epoch": 1.0088663409360277, "learning_rate": 6.663915201013143e-06, "loss": 2.6735125732421876, "step": 836100 }, { "epoch": 1.0089870042585103, "learning_rate": 6.663511365545404e-06, "loss": 2.681324462890625, "step": 836200 }, { "epoch": 1.009107667580993, "learning_rate": 6.663107530077666e-06, "loss": 2.650556640625, "step": 836300 }, { "epoch": 1.0092283309034757, "learning_rate": 6.662703694609928e-06, "loss": 2.670698547363281, "step": 836400 }, { "epoch": 1.0093489942259584, "learning_rate": 6.662299859142189e-06, "loss": 2.671199951171875, "step": 836500 }, { "epoch": 1.009469657548441, "learning_rate": 6.661896023674451e-06, "loss": 2.6779010009765627, "step": 836600 }, { "epoch": 1.0095903208709238, "learning_rate": 6.661492188206713e-06, "loss": 2.6741632080078124, "step": 836700 }, { "epoch": 1.0097109841934064, "learning_rate": 6.661088352738975e-06, "loss": 2.66322998046875, "step": 836800 }, { "epoch": 1.009831647515889, "learning_rate": 6.660684517271235e-06, "loss": 2.667527160644531, "step": 836900 }, { "epoch": 1.0099523108383717, "learning_rate": 6.660280681803497e-06, "loss": 2.671894226074219, "step": 837000 }, { "epoch": 1.0100729741608545, "learning_rate": 6.659876846335758e-06, "loss": 2.670956726074219, "step": 837100 }, { "epoch": 1.0101936374833371, "learning_rate": 6.65947301086802e-06, "loss": 2.6606573486328124, "step": 837200 }, { "epoch": 1.0103143008058197, "learning_rate": 6.659069175400282e-06, "loss": 2.6768124389648436, "step": 837300 }, { "epoch": 1.0104349641283026, "learning_rate": 6.658665339932544e-06, "loss": 2.6502520751953127, "step": 837400 }, { "epoch": 1.0105556274507852, "learning_rate": 6.6582615044648055e-06, "loss": 2.665366516113281, "step": 837500 }, { "epoch": 1.0106762907732678, "learning_rate": 6.6578576689970675e-06, "loss": 2.6486215209960937, "step": 837600 }, { "epoch": 1.0107969540957507, "learning_rate": 6.657453833529328e-06, "loss": 2.6668106079101563, "step": 837700 }, { "epoch": 1.0109176174182333, "learning_rate": 6.65704999806159e-06, "loss": 2.6575384521484375, "step": 837800 }, { "epoch": 1.0110382807407159, "learning_rate": 6.656646162593852e-06, "loss": 2.6694976806640627, "step": 837900 }, { "epoch": 1.0111589440631987, "learning_rate": 6.656242327126114e-06, "loss": 2.671161804199219, "step": 838000 }, { "epoch": 1.0112796073856813, "learning_rate": 6.655838491658375e-06, "loss": 2.66253173828125, "step": 838100 }, { "epoch": 1.011400270708164, "learning_rate": 6.655434656190637e-06, "loss": 2.6559109497070312, "step": 838200 }, { "epoch": 1.0115209340306466, "learning_rate": 6.655030820722899e-06, "loss": 2.6654876708984374, "step": 838300 }, { "epoch": 1.0116415973531294, "learning_rate": 6.654626985255161e-06, "loss": 2.661060791015625, "step": 838400 }, { "epoch": 1.011762260675612, "learning_rate": 6.654223149787421e-06, "loss": 2.67801513671875, "step": 838500 }, { "epoch": 1.0118829239980947, "learning_rate": 6.653819314319683e-06, "loss": 2.6741067504882814, "step": 838600 }, { "epoch": 1.0120035873205775, "learning_rate": 6.653415478851944e-06, "loss": 2.6697662353515623, "step": 838700 }, { "epoch": 1.01212425064306, "learning_rate": 6.653011643384206e-06, "loss": 2.6659414672851565, "step": 838800 }, { "epoch": 1.0122449139655427, "learning_rate": 6.652607807916468e-06, "loss": 2.661806640625, "step": 838900 }, { "epoch": 1.0123655772880256, "learning_rate": 6.65220397244873e-06, "loss": 2.6762405395507813, "step": 839000 }, { "epoch": 1.0124862406105082, "learning_rate": 6.651800136980991e-06, "loss": 2.6752886962890625, "step": 839100 }, { "epoch": 1.0126069039329908, "learning_rate": 6.651396301513253e-06, "loss": 2.664350891113281, "step": 839200 }, { "epoch": 1.0127275672554734, "learning_rate": 6.650992466045515e-06, "loss": 2.6602581787109374, "step": 839300 }, { "epoch": 1.0128482305779563, "learning_rate": 6.6505886305777755e-06, "loss": 2.6652041625976564, "step": 839400 }, { "epoch": 1.0129688939004389, "learning_rate": 6.6501847951100375e-06, "loss": 2.6705694580078125, "step": 839500 }, { "epoch": 1.0130895572229215, "learning_rate": 6.6497809596422995e-06, "loss": 2.664001159667969, "step": 839600 }, { "epoch": 1.0132102205454043, "learning_rate": 6.649377124174561e-06, "loss": 2.6558001708984373, "step": 839700 }, { "epoch": 1.013330883867887, "learning_rate": 6.648973288706823e-06, "loss": 2.660788879394531, "step": 839800 }, { "epoch": 1.0134515471903696, "learning_rate": 6.648569453239085e-06, "loss": 2.665801696777344, "step": 839900 }, { "epoch": 1.0135722105128524, "learning_rate": 6.648165617771346e-06, "loss": 2.6536279296875, "step": 840000 }, { "epoch": 1.013692873835335, "learning_rate": 6.647761782303608e-06, "loss": 2.64593994140625, "step": 840100 }, { "epoch": 1.0138135371578176, "learning_rate": 6.647357946835869e-06, "loss": 2.6660198974609375, "step": 840200 }, { "epoch": 1.0139342004803003, "learning_rate": 6.64695411136813e-06, "loss": 2.6681332397460937, "step": 840300 }, { "epoch": 1.014054863802783, "learning_rate": 6.646550275900392e-06, "loss": 2.6684912109375, "step": 840400 }, { "epoch": 1.0141755271252657, "learning_rate": 6.646146440432654e-06, "loss": 2.669108581542969, "step": 840500 }, { "epoch": 1.0142961904477483, "learning_rate": 6.645742604964915e-06, "loss": 2.6840383911132815, "step": 840600 }, { "epoch": 1.0144168537702312, "learning_rate": 6.645338769497177e-06, "loss": 2.691567077636719, "step": 840700 }, { "epoch": 1.0145375170927138, "learning_rate": 6.644934934029439e-06, "loss": 2.6614700317382813, "step": 840800 }, { "epoch": 1.0146581804151964, "learning_rate": 6.644531098561701e-06, "loss": 2.6920761108398437, "step": 840900 }, { "epoch": 1.0147788437376792, "learning_rate": 6.644127263093961e-06, "loss": 2.6617111206054687, "step": 841000 }, { "epoch": 1.0148995070601619, "learning_rate": 6.643723427626223e-06, "loss": 2.6799588012695312, "step": 841100 }, { "epoch": 1.0150201703826445, "learning_rate": 6.6433195921584844e-06, "loss": 2.6266168212890624, "step": 841200 }, { "epoch": 1.015140833705127, "learning_rate": 6.642915756690746e-06, "loss": 2.701055908203125, "step": 841300 }, { "epoch": 1.01526149702761, "learning_rate": 6.642511921223008e-06, "loss": 2.6607894897460938, "step": 841400 }, { "epoch": 1.0153821603500925, "learning_rate": 6.64210808575527e-06, "loss": 2.638602600097656, "step": 841500 }, { "epoch": 1.0155028236725752, "learning_rate": 6.6417042502875315e-06, "loss": 2.6609042358398436, "step": 841600 }, { "epoch": 1.015623486995058, "learning_rate": 6.6413004148197935e-06, "loss": 2.671781005859375, "step": 841700 }, { "epoch": 1.0157441503175406, "learning_rate": 6.640896579352054e-06, "loss": 2.664034423828125, "step": 841800 }, { "epoch": 1.0158648136400232, "learning_rate": 6.640492743884316e-06, "loss": 2.6587152099609375, "step": 841900 }, { "epoch": 1.015985476962506, "learning_rate": 6.640088908416578e-06, "loss": 2.673206481933594, "step": 842000 }, { "epoch": 1.0161061402849887, "learning_rate": 6.63968507294884e-06, "loss": 2.662435302734375, "step": 842100 }, { "epoch": 1.0162268036074713, "learning_rate": 6.639281237481101e-06, "loss": 2.6557958984375, "step": 842200 }, { "epoch": 1.016347466929954, "learning_rate": 6.638877402013363e-06, "loss": 2.6544424438476564, "step": 842300 }, { "epoch": 1.0164681302524368, "learning_rate": 6.638473566545625e-06, "loss": 2.6642086791992186, "step": 842400 }, { "epoch": 1.0165887935749194, "learning_rate": 6.638069731077886e-06, "loss": 2.655965576171875, "step": 842500 }, { "epoch": 1.016709456897402, "learning_rate": 6.637665895610147e-06, "loss": 2.6639285278320313, "step": 842600 }, { "epoch": 1.0168301202198848, "learning_rate": 6.637262060142409e-06, "loss": 2.660499267578125, "step": 842700 }, { "epoch": 1.0169507835423675, "learning_rate": 6.63685822467467e-06, "loss": 2.657254943847656, "step": 842800 }, { "epoch": 1.01707144686485, "learning_rate": 6.636454389206932e-06, "loss": 2.670887756347656, "step": 842900 }, { "epoch": 1.017192110187333, "learning_rate": 6.636050553739194e-06, "loss": 2.657173767089844, "step": 843000 }, { "epoch": 1.0173127735098155, "learning_rate": 6.635646718271455e-06, "loss": 2.654862365722656, "step": 843100 }, { "epoch": 1.0174334368322981, "learning_rate": 6.635242882803717e-06, "loss": 2.6756695556640624, "step": 843200 }, { "epoch": 1.017554100154781, "learning_rate": 6.634839047335979e-06, "loss": 2.6746527099609376, "step": 843300 }, { "epoch": 1.0176747634772636, "learning_rate": 6.6344352118682396e-06, "loss": 2.66942138671875, "step": 843400 }, { "epoch": 1.0177954267997462, "learning_rate": 6.6340313764005016e-06, "loss": 2.676083679199219, "step": 843500 }, { "epoch": 1.0179160901222288, "learning_rate": 6.6336275409327635e-06, "loss": 2.6710162353515625, "step": 843600 }, { "epoch": 1.0180367534447117, "learning_rate": 6.633223705465025e-06, "loss": 2.66753173828125, "step": 843700 }, { "epoch": 1.0181574167671943, "learning_rate": 6.632819869997287e-06, "loss": 2.660012512207031, "step": 843800 }, { "epoch": 1.018278080089677, "learning_rate": 6.632416034529549e-06, "loss": 2.643835144042969, "step": 843900 }, { "epoch": 1.0183987434121597, "learning_rate": 6.632012199061811e-06, "loss": 2.6691470336914063, "step": 844000 }, { "epoch": 1.0185194067346424, "learning_rate": 6.631608363594072e-06, "loss": 2.698969421386719, "step": 844100 }, { "epoch": 1.018640070057125, "learning_rate": 6.631204528126334e-06, "loss": 2.644516906738281, "step": 844200 }, { "epoch": 1.0187607333796078, "learning_rate": 6.630800692658594e-06, "loss": 2.63013671875, "step": 844300 }, { "epoch": 1.0188813967020904, "learning_rate": 6.630396857190856e-06, "loss": 2.67343994140625, "step": 844400 }, { "epoch": 1.019002060024573, "learning_rate": 6.629993021723118e-06, "loss": 2.6569744873046877, "step": 844500 }, { "epoch": 1.0191227233470557, "learning_rate": 6.62958918625538e-06, "loss": 2.6643170166015624, "step": 844600 }, { "epoch": 1.0192433866695385, "learning_rate": 6.629185350787641e-06, "loss": 2.6886367797851562, "step": 844700 }, { "epoch": 1.0193640499920211, "learning_rate": 6.628781515319903e-06, "loss": 2.6861776733398437, "step": 844800 }, { "epoch": 1.0194847133145037, "learning_rate": 6.628377679852165e-06, "loss": 2.6629437255859374, "step": 844900 }, { "epoch": 1.0196053766369866, "learning_rate": 6.627973844384426e-06, "loss": 2.6712942504882813, "step": 845000 }, { "epoch": 1.0197260399594692, "learning_rate": 6.627570008916687e-06, "loss": 2.6819091796875, "step": 845100 }, { "epoch": 1.0198467032819518, "learning_rate": 6.627166173448949e-06, "loss": 2.6625592041015627, "step": 845200 }, { "epoch": 1.0199673666044347, "learning_rate": 6.6267623379812105e-06, "loss": 2.6553729248046873, "step": 845300 }, { "epoch": 1.0200880299269173, "learning_rate": 6.6263585025134724e-06, "loss": 2.6611422729492187, "step": 845400 }, { "epoch": 1.0202086932494, "learning_rate": 6.6259546670457344e-06, "loss": 2.6362686157226562, "step": 845500 }, { "epoch": 1.0203293565718825, "learning_rate": 6.6255508315779956e-06, "loss": 2.654532165527344, "step": 845600 }, { "epoch": 1.0204500198943653, "learning_rate": 6.6251469961102575e-06, "loss": 2.6682080078125, "step": 845700 }, { "epoch": 1.020570683216848, "learning_rate": 6.6247431606425195e-06, "loss": 2.6667340087890623, "step": 845800 }, { "epoch": 1.0206913465393306, "learning_rate": 6.62433932517478e-06, "loss": 2.6703524780273438, "step": 845900 }, { "epoch": 1.0208120098618134, "learning_rate": 6.623935489707042e-06, "loss": 2.6463165283203125, "step": 846000 }, { "epoch": 1.020932673184296, "learning_rate": 6.623531654239304e-06, "loss": 2.6798980712890623, "step": 846100 }, { "epoch": 1.0210533365067787, "learning_rate": 6.623127818771565e-06, "loss": 2.6738818359375, "step": 846200 }, { "epoch": 1.0211739998292615, "learning_rate": 6.622723983303827e-06, "loss": 2.66275390625, "step": 846300 }, { "epoch": 1.021294663151744, "learning_rate": 6.622320147836089e-06, "loss": 2.6870220947265624, "step": 846400 }, { "epoch": 1.0214153264742267, "learning_rate": 6.621916312368351e-06, "loss": 2.6608245849609373, "step": 846500 }, { "epoch": 1.0215359897967093, "learning_rate": 6.621512476900612e-06, "loss": 2.687867431640625, "step": 846600 }, { "epoch": 1.0216566531191922, "learning_rate": 6.621108641432873e-06, "loss": 2.663904113769531, "step": 846700 }, { "epoch": 1.0217773164416748, "learning_rate": 6.620704805965134e-06, "loss": 2.6595773315429687, "step": 846800 }, { "epoch": 1.0218979797641574, "learning_rate": 6.620300970497396e-06, "loss": 2.64540283203125, "step": 846900 }, { "epoch": 1.0220186430866403, "learning_rate": 6.619897135029658e-06, "loss": 2.6698724365234376, "step": 847000 }, { "epoch": 1.0221393064091229, "learning_rate": 6.61949329956192e-06, "loss": 2.685932312011719, "step": 847100 }, { "epoch": 1.0222599697316055, "learning_rate": 6.619089464094181e-06, "loss": 2.666602783203125, "step": 847200 }, { "epoch": 1.0223806330540883, "learning_rate": 6.618685628626443e-06, "loss": 2.660416564941406, "step": 847300 }, { "epoch": 1.022501296376571, "learning_rate": 6.618281793158705e-06, "loss": 2.654067077636719, "step": 847400 }, { "epoch": 1.0226219596990536, "learning_rate": 6.617877957690966e-06, "loss": 2.6481011962890624, "step": 847500 }, { "epoch": 1.0227426230215362, "learning_rate": 6.617474122223228e-06, "loss": 2.657057800292969, "step": 847600 }, { "epoch": 1.022863286344019, "learning_rate": 6.6170702867554896e-06, "loss": 2.6477362060546876, "step": 847700 }, { "epoch": 1.0229839496665016, "learning_rate": 6.616666451287751e-06, "loss": 2.6805355834960936, "step": 847800 }, { "epoch": 1.0231046129889843, "learning_rate": 6.616262615820013e-06, "loss": 2.680877380371094, "step": 847900 }, { "epoch": 1.023225276311467, "learning_rate": 6.615858780352275e-06, "loss": 2.670315856933594, "step": 848000 }, { "epoch": 1.0233459396339497, "learning_rate": 6.615454944884536e-06, "loss": 2.6568426513671874, "step": 848100 }, { "epoch": 1.0234666029564323, "learning_rate": 6.615051109416798e-06, "loss": 2.6580429077148438, "step": 848200 }, { "epoch": 1.0235872662789152, "learning_rate": 6.614647273949059e-06, "loss": 2.661504211425781, "step": 848300 }, { "epoch": 1.0237079296013978, "learning_rate": 6.61424343848132e-06, "loss": 2.672857360839844, "step": 848400 }, { "epoch": 1.0238285929238804, "learning_rate": 6.613839603013582e-06, "loss": 2.6788214111328124, "step": 848500 }, { "epoch": 1.0239492562463632, "learning_rate": 6.613435767545844e-06, "loss": 2.6561856079101562, "step": 848600 }, { "epoch": 1.0240699195688459, "learning_rate": 6.613031932078105e-06, "loss": 2.6525918579101564, "step": 848700 }, { "epoch": 1.0241905828913285, "learning_rate": 6.612628096610367e-06, "loss": 2.67130859375, "step": 848800 }, { "epoch": 1.024311246213811, "learning_rate": 6.612224261142629e-06, "loss": 2.6575555419921875, "step": 848900 }, { "epoch": 1.024431909536294, "learning_rate": 6.611820425674891e-06, "loss": 2.67512939453125, "step": 849000 }, { "epoch": 1.0245525728587765, "learning_rate": 6.611416590207151e-06, "loss": 2.691391906738281, "step": 849100 }, { "epoch": 1.0246732361812592, "learning_rate": 6.611012754739413e-06, "loss": 2.6630853271484374, "step": 849200 }, { "epoch": 1.024793899503742, "learning_rate": 6.6106089192716745e-06, "loss": 2.6648638916015623, "step": 849300 }, { "epoch": 1.0249145628262246, "learning_rate": 6.6102050838039365e-06, "loss": 2.670361328125, "step": 849400 }, { "epoch": 1.0250352261487072, "learning_rate": 6.6098012483361985e-06, "loss": 2.6736968994140624, "step": 849500 }, { "epoch": 1.02515588947119, "learning_rate": 6.6093974128684605e-06, "loss": 2.648916015625, "step": 849600 }, { "epoch": 1.0252765527936727, "learning_rate": 6.608993577400722e-06, "loss": 2.641554260253906, "step": 849700 }, { "epoch": 1.0253972161161553, "learning_rate": 6.608589741932984e-06, "loss": 2.636549987792969, "step": 849800 }, { "epoch": 1.025517879438638, "learning_rate": 6.6081859064652456e-06, "loss": 2.6548391723632814, "step": 849900 }, { "epoch": 1.0256385427611208, "learning_rate": 6.607782070997506e-06, "loss": 2.6585733032226564, "step": 850000 }, { "epoch": 1.0257592060836034, "learning_rate": 6.607378235529768e-06, "loss": 2.6834512329101563, "step": 850100 }, { "epoch": 1.025879869406086, "learning_rate": 6.60697440006203e-06, "loss": 2.6477862548828126, "step": 850200 }, { "epoch": 1.0260005327285688, "learning_rate": 6.606570564594291e-06, "loss": 2.6616439819335938, "step": 850300 }, { "epoch": 1.0261211960510515, "learning_rate": 6.606166729126553e-06, "loss": 2.6444451904296873, "step": 850400 }, { "epoch": 1.026241859373534, "learning_rate": 6.605762893658815e-06, "loss": 2.666917419433594, "step": 850500 }, { "epoch": 1.026362522696017, "learning_rate": 6.605359058191077e-06, "loss": 2.67349365234375, "step": 850600 }, { "epoch": 1.0264831860184995, "learning_rate": 6.604955222723338e-06, "loss": 2.6393853759765626, "step": 850700 }, { "epoch": 1.0266038493409821, "learning_rate": 6.604551387255599e-06, "loss": 2.6858316040039063, "step": 850800 }, { "epoch": 1.0267245126634648, "learning_rate": 6.60414755178786e-06, "loss": 2.6504391479492186, "step": 850900 }, { "epoch": 1.0268451759859476, "learning_rate": 6.603743716320122e-06, "loss": 2.64663330078125, "step": 851000 }, { "epoch": 1.0269658393084302, "learning_rate": 6.603339880852384e-06, "loss": 2.6510772705078125, "step": 851100 }, { "epoch": 1.0270865026309128, "learning_rate": 6.602936045384646e-06, "loss": 2.636679992675781, "step": 851200 }, { "epoch": 1.0272071659533957, "learning_rate": 6.602532209916907e-06, "loss": 2.6563824462890624, "step": 851300 }, { "epoch": 1.0273278292758783, "learning_rate": 6.602128374449169e-06, "loss": 2.65275146484375, "step": 851400 }, { "epoch": 1.027448492598361, "learning_rate": 6.601724538981431e-06, "loss": 2.66157470703125, "step": 851500 }, { "epoch": 1.0275691559208437, "learning_rate": 6.601320703513692e-06, "loss": 2.6549887084960937, "step": 851600 }, { "epoch": 1.0276898192433264, "learning_rate": 6.600916868045954e-06, "loss": 2.675226135253906, "step": 851700 }, { "epoch": 1.027810482565809, "learning_rate": 6.600513032578215e-06, "loss": 2.640070495605469, "step": 851800 }, { "epoch": 1.0279311458882916, "learning_rate": 6.600109197110477e-06, "loss": 2.6607135009765623, "step": 851900 }, { "epoch": 1.0280518092107744, "learning_rate": 6.599705361642739e-06, "loss": 2.636357421875, "step": 852000 }, { "epoch": 1.028172472533257, "learning_rate": 6.599301526175001e-06, "loss": 2.641199645996094, "step": 852100 }, { "epoch": 1.0282931358557397, "learning_rate": 6.598897690707262e-06, "loss": 2.657536926269531, "step": 852200 }, { "epoch": 1.0284137991782225, "learning_rate": 6.598493855239524e-06, "loss": 2.6468405151367187, "step": 852300 }, { "epoch": 1.0285344625007051, "learning_rate": 6.598090019771784e-06, "loss": 2.6573443603515625, "step": 852400 }, { "epoch": 1.0286551258231877, "learning_rate": 6.597686184304046e-06, "loss": 2.685948486328125, "step": 852500 }, { "epoch": 1.0287757891456706, "learning_rate": 6.597282348836308e-06, "loss": 2.6307864379882813, "step": 852600 }, { "epoch": 1.0288964524681532, "learning_rate": 6.59687851336857e-06, "loss": 2.6891790771484376, "step": 852700 }, { "epoch": 1.0290171157906358, "learning_rate": 6.596474677900831e-06, "loss": 2.6423190307617186, "step": 852800 }, { "epoch": 1.0291377791131187, "learning_rate": 6.596070842433093e-06, "loss": 2.62477294921875, "step": 852900 }, { "epoch": 1.0292584424356013, "learning_rate": 6.595667006965355e-06, "loss": 2.6624185180664064, "step": 853000 }, { "epoch": 1.029379105758084, "learning_rate": 6.595263171497617e-06, "loss": 2.67115478515625, "step": 853100 }, { "epoch": 1.0294997690805665, "learning_rate": 6.5948593360298774e-06, "loss": 2.6584716796875, "step": 853200 }, { "epoch": 1.0296204324030493, "learning_rate": 6.594455500562139e-06, "loss": 2.689708557128906, "step": 853300 }, { "epoch": 1.029741095725532, "learning_rate": 6.5940516650944006e-06, "loss": 2.6736416625976562, "step": 853400 }, { "epoch": 1.0298617590480146, "learning_rate": 6.5936478296266625e-06, "loss": 2.6801522827148436, "step": 853500 }, { "epoch": 1.0299824223704974, "learning_rate": 6.5932439941589245e-06, "loss": 2.669095764160156, "step": 853600 }, { "epoch": 1.03010308569298, "learning_rate": 6.5928401586911865e-06, "loss": 2.672066955566406, "step": 853700 }, { "epoch": 1.0302237490154627, "learning_rate": 6.592436323223448e-06, "loss": 2.649106750488281, "step": 853800 }, { "epoch": 1.0303444123379455, "learning_rate": 6.59203248775571e-06, "loss": 2.665860595703125, "step": 853900 }, { "epoch": 1.030465075660428, "learning_rate": 6.59162865228797e-06, "loss": 2.628764953613281, "step": 854000 }, { "epoch": 1.0305857389829107, "learning_rate": 6.591224816820232e-06, "loss": 2.6653570556640624, "step": 854100 }, { "epoch": 1.0307064023053933, "learning_rate": 6.590820981352494e-06, "loss": 2.655375671386719, "step": 854200 }, { "epoch": 1.0308270656278762, "learning_rate": 6.590417145884756e-06, "loss": 2.669874572753906, "step": 854300 }, { "epoch": 1.0309477289503588, "learning_rate": 6.590013310417017e-06, "loss": 2.654976806640625, "step": 854400 }, { "epoch": 1.0310683922728414, "learning_rate": 6.589609474949279e-06, "loss": 2.684794616699219, "step": 854500 }, { "epoch": 1.0311890555953243, "learning_rate": 6.589205639481541e-06, "loss": 2.65213134765625, "step": 854600 }, { "epoch": 1.0313097189178069, "learning_rate": 6.588801804013802e-06, "loss": 2.6710015869140626, "step": 854700 }, { "epoch": 1.0314303822402895, "learning_rate": 6.588397968546064e-06, "loss": 2.6651321411132813, "step": 854800 }, { "epoch": 1.0315510455627723, "learning_rate": 6.587994133078325e-06, "loss": 2.686104736328125, "step": 854900 }, { "epoch": 1.031671708885255, "learning_rate": 6.587590297610586e-06, "loss": 2.660299072265625, "step": 855000 }, { "epoch": 1.0317923722077376, "learning_rate": 6.587186462142848e-06, "loss": 2.65587890625, "step": 855100 }, { "epoch": 1.0319130355302202, "learning_rate": 6.58678262667511e-06, "loss": 2.653806457519531, "step": 855200 }, { "epoch": 1.032033698852703, "learning_rate": 6.5863787912073714e-06, "loss": 2.639870910644531, "step": 855300 }, { "epoch": 1.0321543621751856, "learning_rate": 6.5859749557396334e-06, "loss": 2.6648077392578124, "step": 855400 }, { "epoch": 1.0322750254976683, "learning_rate": 6.585571120271895e-06, "loss": 2.6432940673828127, "step": 855500 }, { "epoch": 1.032395688820151, "learning_rate": 6.585167284804157e-06, "loss": 2.6633099365234374, "step": 855600 }, { "epoch": 1.0325163521426337, "learning_rate": 6.584763449336418e-06, "loss": 2.6723321533203124, "step": 855700 }, { "epoch": 1.0326370154651163, "learning_rate": 6.58435961386868e-06, "loss": 2.6634262084960936, "step": 855800 }, { "epoch": 1.0327576787875992, "learning_rate": 6.583955778400941e-06, "loss": 2.645987243652344, "step": 855900 }, { "epoch": 1.0328783421100818, "learning_rate": 6.583551942933203e-06, "loss": 2.6544680786132813, "step": 856000 }, { "epoch": 1.0329990054325644, "learning_rate": 6.583148107465465e-06, "loss": 2.63458984375, "step": 856100 }, { "epoch": 1.033119668755047, "learning_rate": 6.582744271997727e-06, "loss": 2.6761883544921874, "step": 856200 }, { "epoch": 1.0332403320775299, "learning_rate": 6.582340436529988e-06, "loss": 2.665079345703125, "step": 856300 }, { "epoch": 1.0333609954000125, "learning_rate": 6.58193660106225e-06, "loss": 2.687864990234375, "step": 856400 }, { "epoch": 1.033481658722495, "learning_rate": 6.58153276559451e-06, "loss": 2.6806842041015626, "step": 856500 }, { "epoch": 1.033602322044978, "learning_rate": 6.581128930126772e-06, "loss": 2.6934719848632813, "step": 856600 }, { "epoch": 1.0337229853674605, "learning_rate": 6.580725094659034e-06, "loss": 2.646905822753906, "step": 856700 }, { "epoch": 1.0338436486899432, "learning_rate": 6.580321259191296e-06, "loss": 2.6504745483398438, "step": 856800 }, { "epoch": 1.033964312012426, "learning_rate": 6.579917423723557e-06, "loss": 2.677440490722656, "step": 856900 }, { "epoch": 1.0340849753349086, "learning_rate": 6.579513588255819e-06, "loss": 2.6621365356445312, "step": 857000 }, { "epoch": 1.0342056386573912, "learning_rate": 6.579109752788081e-06, "loss": 2.660322570800781, "step": 857100 }, { "epoch": 1.034326301979874, "learning_rate": 6.578705917320342e-06, "loss": 2.6694549560546874, "step": 857200 }, { "epoch": 1.0344469653023567, "learning_rate": 6.5783020818526035e-06, "loss": 2.6505975341796875, "step": 857300 }, { "epoch": 1.0345676286248393, "learning_rate": 6.5778982463848655e-06, "loss": 2.629649658203125, "step": 857400 }, { "epoch": 1.034688291947322, "learning_rate": 6.577494410917127e-06, "loss": 2.650999755859375, "step": 857500 }, { "epoch": 1.0348089552698048, "learning_rate": 6.5770905754493886e-06, "loss": 2.6468011474609376, "step": 857600 }, { "epoch": 1.0349296185922874, "learning_rate": 6.5766867399816506e-06, "loss": 2.662148742675781, "step": 857700 }, { "epoch": 1.03505028191477, "learning_rate": 6.576282904513912e-06, "loss": 2.654186096191406, "step": 857800 }, { "epoch": 1.0351709452372528, "learning_rate": 6.575879069046174e-06, "loss": 2.6556997680664063, "step": 857900 }, { "epoch": 1.0352916085597355, "learning_rate": 6.575475233578436e-06, "loss": 2.6523202514648436, "step": 858000 }, { "epoch": 1.035412271882218, "learning_rate": 6.575071398110696e-06, "loss": 2.6602276611328124, "step": 858100 }, { "epoch": 1.0355329352047007, "learning_rate": 6.574667562642958e-06, "loss": 2.645975341796875, "step": 858200 }, { "epoch": 1.0356535985271835, "learning_rate": 6.57426372717522e-06, "loss": 2.6490289306640626, "step": 858300 }, { "epoch": 1.0357742618496661, "learning_rate": 6.573859891707481e-06, "loss": 2.6418307495117186, "step": 858400 }, { "epoch": 1.0358949251721488, "learning_rate": 6.573456056239743e-06, "loss": 2.6403173828125, "step": 858500 }, { "epoch": 1.0360155884946316, "learning_rate": 6.573052220772005e-06, "loss": 2.6551242065429688, "step": 858600 }, { "epoch": 1.0361362518171142, "learning_rate": 6.572648385304267e-06, "loss": 2.661435546875, "step": 858700 }, { "epoch": 1.0362569151395968, "learning_rate": 6.572244549836528e-06, "loss": 2.6435809326171875, "step": 858800 }, { "epoch": 1.0363775784620797, "learning_rate": 6.571840714368789e-06, "loss": 2.6443072509765626, "step": 858900 }, { "epoch": 1.0364982417845623, "learning_rate": 6.57143687890105e-06, "loss": 2.6608346557617186, "step": 859000 }, { "epoch": 1.036618905107045, "learning_rate": 6.571033043433312e-06, "loss": 2.675945129394531, "step": 859100 }, { "epoch": 1.0367395684295277, "learning_rate": 6.570629207965574e-06, "loss": 2.6627679443359376, "step": 859200 }, { "epoch": 1.0368602317520104, "learning_rate": 6.570225372497836e-06, "loss": 2.649039611816406, "step": 859300 }, { "epoch": 1.036980895074493, "learning_rate": 6.5698215370300975e-06, "loss": 2.6746310424804687, "step": 859400 }, { "epoch": 1.0371015583969756, "learning_rate": 6.5694177015623595e-06, "loss": 2.6650421142578127, "step": 859500 }, { "epoch": 1.0372222217194584, "learning_rate": 6.5690138660946214e-06, "loss": 2.6862005615234374, "step": 859600 }, { "epoch": 1.037342885041941, "learning_rate": 6.5686100306268826e-06, "loss": 2.6595944213867186, "step": 859700 }, { "epoch": 1.0374635483644237, "learning_rate": 6.568206195159144e-06, "loss": 2.650043640136719, "step": 859800 }, { "epoch": 1.0375842116869065, "learning_rate": 6.567802359691406e-06, "loss": 2.6377102661132814, "step": 859900 }, { "epoch": 1.0377048750093891, "learning_rate": 6.567398524223667e-06, "loss": 2.6747036743164063, "step": 860000 }, { "epoch": 1.0378255383318717, "learning_rate": 6.566994688755929e-06, "loss": 2.6581015014648437, "step": 860100 }, { "epoch": 1.0379462016543546, "learning_rate": 6.566590853288191e-06, "loss": 2.65966552734375, "step": 860200 }, { "epoch": 1.0380668649768372, "learning_rate": 6.566187017820452e-06, "loss": 2.666154479980469, "step": 860300 }, { "epoch": 1.0381875282993198, "learning_rate": 6.565783182352714e-06, "loss": 2.65571044921875, "step": 860400 }, { "epoch": 1.0383081916218024, "learning_rate": 6.565379346884976e-06, "loss": 2.6635250854492187, "step": 860500 }, { "epoch": 1.0384288549442853, "learning_rate": 6.564975511417236e-06, "loss": 2.645590515136719, "step": 860600 }, { "epoch": 1.038549518266768, "learning_rate": 6.564571675949498e-06, "loss": 2.6616973876953125, "step": 860700 }, { "epoch": 1.0386701815892505, "learning_rate": 6.56416784048176e-06, "loss": 2.6690750122070312, "step": 860800 }, { "epoch": 1.0387908449117333, "learning_rate": 6.563764005014021e-06, "loss": 2.6457373046875, "step": 860900 }, { "epoch": 1.038911508234216, "learning_rate": 6.563360169546283e-06, "loss": 2.6602078247070313, "step": 861000 }, { "epoch": 1.0390321715566986, "learning_rate": 6.562956334078545e-06, "loss": 2.6707504272460936, "step": 861100 }, { "epoch": 1.0391528348791814, "learning_rate": 6.562552498610807e-06, "loss": 2.646268310546875, "step": 861200 }, { "epoch": 1.039273498201664, "learning_rate": 6.562148663143068e-06, "loss": 2.6717535400390626, "step": 861300 }, { "epoch": 1.0393941615241467, "learning_rate": 6.5617448276753295e-06, "loss": 2.644560546875, "step": 861400 }, { "epoch": 1.0395148248466293, "learning_rate": 6.561340992207591e-06, "loss": 2.6601791381835938, "step": 861500 }, { "epoch": 1.039635488169112, "learning_rate": 6.560937156739853e-06, "loss": 2.63201171875, "step": 861600 }, { "epoch": 1.0397561514915947, "learning_rate": 6.560533321272115e-06, "loss": 2.6256149291992186, "step": 861700 }, { "epoch": 1.0398768148140773, "learning_rate": 6.560129485804377e-06, "loss": 2.656178283691406, "step": 861800 }, { "epoch": 1.0399974781365602, "learning_rate": 6.559725650336638e-06, "loss": 2.6676565551757814, "step": 861900 }, { "epoch": 1.0401181414590428, "learning_rate": 6.5593218148689e-06, "loss": 2.670790100097656, "step": 862000 }, { "epoch": 1.0402388047815254, "learning_rate": 6.558917979401162e-06, "loss": 2.6625601196289064, "step": 862100 }, { "epoch": 1.0403594681040083, "learning_rate": 6.558514143933422e-06, "loss": 2.63179443359375, "step": 862200 }, { "epoch": 1.0404801314264909, "learning_rate": 6.558110308465684e-06, "loss": 2.669542236328125, "step": 862300 }, { "epoch": 1.0406007947489735, "learning_rate": 6.557706472997946e-06, "loss": 2.682248840332031, "step": 862400 }, { "epoch": 1.0407214580714563, "learning_rate": 6.557302637530207e-06, "loss": 2.670917663574219, "step": 862500 }, { "epoch": 1.040842121393939, "learning_rate": 6.556898802062469e-06, "loss": 2.662626953125, "step": 862600 }, { "epoch": 1.0409627847164216, "learning_rate": 6.556494966594731e-06, "loss": 2.646322937011719, "step": 862700 }, { "epoch": 1.0410834480389042, "learning_rate": 6.556091131126992e-06, "loss": 2.6600152587890626, "step": 862800 }, { "epoch": 1.041204111361387, "learning_rate": 6.555687295659254e-06, "loss": 2.6633270263671873, "step": 862900 }, { "epoch": 1.0413247746838696, "learning_rate": 6.555283460191515e-06, "loss": 2.658177490234375, "step": 863000 }, { "epoch": 1.0414454380063523, "learning_rate": 6.5548796247237764e-06, "loss": 2.64822265625, "step": 863100 }, { "epoch": 1.041566101328835, "learning_rate": 6.554475789256038e-06, "loss": 2.629946594238281, "step": 863200 }, { "epoch": 1.0416867646513177, "learning_rate": 6.5540719537883e-06, "loss": 2.6696182250976563, "step": 863300 }, { "epoch": 1.0418074279738003, "learning_rate": 6.5536681183205615e-06, "loss": 2.6381912231445312, "step": 863400 }, { "epoch": 1.041928091296283, "learning_rate": 6.5532642828528235e-06, "loss": 2.6217132568359376, "step": 863500 }, { "epoch": 1.0420487546187658, "learning_rate": 6.5528604473850855e-06, "loss": 2.6428948974609376, "step": 863600 }, { "epoch": 1.0421694179412484, "learning_rate": 6.5524566119173475e-06, "loss": 2.653642578125, "step": 863700 }, { "epoch": 1.042290081263731, "learning_rate": 6.552052776449608e-06, "loss": 2.647142028808594, "step": 863800 }, { "epoch": 1.0424107445862139, "learning_rate": 6.55164894098187e-06, "loss": 2.650415344238281, "step": 863900 }, { "epoch": 1.0425314079086965, "learning_rate": 6.551245105514131e-06, "loss": 2.6517449951171876, "step": 864000 }, { "epoch": 1.042652071231179, "learning_rate": 6.550841270046393e-06, "loss": 2.679823913574219, "step": 864100 }, { "epoch": 1.042772734553662, "learning_rate": 6.550437434578655e-06, "loss": 2.6401962280273437, "step": 864200 }, { "epoch": 1.0428933978761445, "learning_rate": 6.550033599110917e-06, "loss": 2.638868408203125, "step": 864300 }, { "epoch": 1.0430140611986272, "learning_rate": 6.549629763643178e-06, "loss": 2.657568054199219, "step": 864400 }, { "epoch": 1.04313472452111, "learning_rate": 6.54922592817544e-06, "loss": 2.664769592285156, "step": 864500 }, { "epoch": 1.0432553878435926, "learning_rate": 6.5488220927077e-06, "loss": 2.6384393310546876, "step": 864600 }, { "epoch": 1.0433760511660752, "learning_rate": 6.548418257239962e-06, "loss": 2.6465411376953125, "step": 864700 }, { "epoch": 1.0434967144885579, "learning_rate": 6.548014421772224e-06, "loss": 2.66962158203125, "step": 864800 }, { "epoch": 1.0436173778110407, "learning_rate": 6.547610586304486e-06, "loss": 2.6625872802734376, "step": 864900 }, { "epoch": 1.0437380411335233, "learning_rate": 6.547206750836747e-06, "loss": 2.6427951049804688, "step": 865000 }, { "epoch": 1.043858704456006, "learning_rate": 6.546802915369009e-06, "loss": 2.6510223388671874, "step": 865100 }, { "epoch": 1.0439793677784888, "learning_rate": 6.546399079901271e-06, "loss": 2.62669921875, "step": 865200 }, { "epoch": 1.0441000311009714, "learning_rate": 6.545995244433533e-06, "loss": 2.661985168457031, "step": 865300 }, { "epoch": 1.044220694423454, "learning_rate": 6.545591408965794e-06, "loss": 2.6588861083984376, "step": 865400 }, { "epoch": 1.0443413577459368, "learning_rate": 6.5451875734980555e-06, "loss": 2.62440673828125, "step": 865500 }, { "epoch": 1.0444620210684195, "learning_rate": 6.544783738030317e-06, "loss": 2.670568542480469, "step": 865600 }, { "epoch": 1.044582684390902, "learning_rate": 6.544379902562579e-06, "loss": 2.639734191894531, "step": 865700 }, { "epoch": 1.0447033477133847, "learning_rate": 6.543976067094841e-06, "loss": 2.6616775512695314, "step": 865800 }, { "epoch": 1.0448240110358675, "learning_rate": 6.543572231627103e-06, "loss": 2.6679861450195315, "step": 865900 }, { "epoch": 1.0449446743583501, "learning_rate": 6.543168396159364e-06, "loss": 2.6500689697265627, "step": 866000 }, { "epoch": 1.0450653376808328, "learning_rate": 6.542764560691626e-06, "loss": 2.6400405883789064, "step": 866100 }, { "epoch": 1.0451860010033156, "learning_rate": 6.542360725223888e-06, "loss": 2.6446298217773436, "step": 866200 }, { "epoch": 1.0453066643257982, "learning_rate": 6.541956889756148e-06, "loss": 2.6448324584960936, "step": 866300 }, { "epoch": 1.0454273276482808, "learning_rate": 6.54155305428841e-06, "loss": 2.635065002441406, "step": 866400 }, { "epoch": 1.0455479909707637, "learning_rate": 6.541149218820672e-06, "loss": 2.639224853515625, "step": 866500 }, { "epoch": 1.0456686542932463, "learning_rate": 6.540745383352933e-06, "loss": 2.6287567138671877, "step": 866600 }, { "epoch": 1.045789317615729, "learning_rate": 6.540341547885195e-06, "loss": 2.6558935546875, "step": 866700 }, { "epoch": 1.0459099809382115, "learning_rate": 6.539937712417457e-06, "loss": 2.6529446411132813, "step": 866800 }, { "epoch": 1.0460306442606944, "learning_rate": 6.539533876949718e-06, "loss": 2.6300665283203126, "step": 866900 }, { "epoch": 1.046151307583177, "learning_rate": 6.53913004148198e-06, "loss": 2.642272644042969, "step": 867000 }, { "epoch": 1.0462719709056596, "learning_rate": 6.538726206014241e-06, "loss": 2.64414794921875, "step": 867100 }, { "epoch": 1.0463926342281424, "learning_rate": 6.5383223705465025e-06, "loss": 2.6574798583984376, "step": 867200 }, { "epoch": 1.046513297550625, "learning_rate": 6.5379185350787644e-06, "loss": 2.6605404663085936, "step": 867300 }, { "epoch": 1.0466339608731077, "learning_rate": 6.5375146996110264e-06, "loss": 2.6691802978515624, "step": 867400 }, { "epoch": 1.0467546241955905, "learning_rate": 6.5371108641432876e-06, "loss": 2.66790771484375, "step": 867500 }, { "epoch": 1.0468752875180731, "learning_rate": 6.5367070286755495e-06, "loss": 2.655499267578125, "step": 867600 }, { "epoch": 1.0469959508405557, "learning_rate": 6.5363031932078115e-06, "loss": 2.644698486328125, "step": 867700 }, { "epoch": 1.0471166141630386, "learning_rate": 6.5358993577400735e-06, "loss": 2.634197998046875, "step": 867800 }, { "epoch": 1.0472372774855212, "learning_rate": 6.535495522272334e-06, "loss": 2.63038330078125, "step": 867900 }, { "epoch": 1.0473579408080038, "learning_rate": 6.535091686804596e-06, "loss": 2.684940185546875, "step": 868000 }, { "epoch": 1.0474786041304864, "learning_rate": 6.534687851336857e-06, "loss": 2.6191342163085936, "step": 868100 }, { "epoch": 1.0475992674529693, "learning_rate": 6.534284015869119e-06, "loss": 2.6336541748046876, "step": 868200 }, { "epoch": 1.047719930775452, "learning_rate": 6.533880180401381e-06, "loss": 2.635486755371094, "step": 868300 }, { "epoch": 1.0478405940979345, "learning_rate": 6.533476344933643e-06, "loss": 2.652287902832031, "step": 868400 }, { "epoch": 1.0479612574204173, "learning_rate": 6.533072509465904e-06, "loss": 2.6567562866210936, "step": 868500 }, { "epoch": 1.0480819207429, "learning_rate": 6.532668673998166e-06, "loss": 2.6486111450195313, "step": 868600 }, { "epoch": 1.0482025840653826, "learning_rate": 6.532264838530426e-06, "loss": 2.667272033691406, "step": 868700 }, { "epoch": 1.0483232473878652, "learning_rate": 6.531861003062688e-06, "loss": 2.6466082763671874, "step": 868800 }, { "epoch": 1.048443910710348, "learning_rate": 6.53145716759495e-06, "loss": 2.65130859375, "step": 868900 }, { "epoch": 1.0485645740328307, "learning_rate": 6.531053332127212e-06, "loss": 2.6867575073242187, "step": 869000 }, { "epoch": 1.0486852373553133, "learning_rate": 6.530649496659473e-06, "loss": 2.6360244750976562, "step": 869100 }, { "epoch": 1.048805900677796, "learning_rate": 6.530245661191735e-06, "loss": 2.6693984985351564, "step": 869200 }, { "epoch": 1.0489265640002787, "learning_rate": 6.529841825723997e-06, "loss": 2.634560546875, "step": 869300 }, { "epoch": 1.0490472273227613, "learning_rate": 6.5294379902562585e-06, "loss": 2.6696878051757813, "step": 869400 }, { "epoch": 1.0491678906452442, "learning_rate": 6.52903415478852e-06, "loss": 2.6768203735351563, "step": 869500 }, { "epoch": 1.0492885539677268, "learning_rate": 6.5286303193207816e-06, "loss": 2.6672378540039063, "step": 869600 }, { "epoch": 1.0494092172902094, "learning_rate": 6.528226483853043e-06, "loss": 2.6537704467773438, "step": 869700 }, { "epoch": 1.0495298806126923, "learning_rate": 6.527822648385305e-06, "loss": 2.638013916015625, "step": 869800 }, { "epoch": 1.0496505439351749, "learning_rate": 6.527418812917567e-06, "loss": 2.6613079833984377, "step": 869900 }, { "epoch": 1.0497712072576575, "learning_rate": 6.527014977449828e-06, "loss": 2.6682989501953127, "step": 870000 }, { "epoch": 1.04989187058014, "learning_rate": 6.52661114198209e-06, "loss": 2.6600079345703125, "step": 870100 }, { "epoch": 1.050012533902623, "learning_rate": 6.526207306514352e-06, "loss": 2.622137451171875, "step": 870200 }, { "epoch": 1.0501331972251056, "learning_rate": 6.525803471046614e-06, "loss": 2.6603347778320314, "step": 870300 }, { "epoch": 1.0502538605475882, "learning_rate": 6.525399635578874e-06, "loss": 2.6478982543945313, "step": 870400 }, { "epoch": 1.050374523870071, "learning_rate": 6.524995800111136e-06, "loss": 2.6451791381835936, "step": 870500 }, { "epoch": 1.0504951871925536, "learning_rate": 6.524591964643397e-06, "loss": 2.66137451171875, "step": 870600 }, { "epoch": 1.0506158505150363, "learning_rate": 6.524188129175659e-06, "loss": 2.627479248046875, "step": 870700 }, { "epoch": 1.050736513837519, "learning_rate": 6.523784293707921e-06, "loss": 2.636741943359375, "step": 870800 }, { "epoch": 1.0508571771600017, "learning_rate": 6.523380458240183e-06, "loss": 2.633809814453125, "step": 870900 }, { "epoch": 1.0509778404824843, "learning_rate": 6.522976622772444e-06, "loss": 2.6297537231445314, "step": 871000 }, { "epoch": 1.051098503804967, "learning_rate": 6.522572787304706e-06, "loss": 2.6521612548828126, "step": 871100 }, { "epoch": 1.0512191671274498, "learning_rate": 6.5221689518369665e-06, "loss": 2.649369812011719, "step": 871200 }, { "epoch": 1.0513398304499324, "learning_rate": 6.5217651163692285e-06, "loss": 2.6526748657226564, "step": 871300 }, { "epoch": 1.051460493772415, "learning_rate": 6.5213612809014905e-06, "loss": 2.652823791503906, "step": 871400 }, { "epoch": 1.0515811570948979, "learning_rate": 6.5209574454337525e-06, "loss": 2.6173504638671874, "step": 871500 }, { "epoch": 1.0517018204173805, "learning_rate": 6.520553609966014e-06, "loss": 2.641896057128906, "step": 871600 }, { "epoch": 1.051822483739863, "learning_rate": 6.520149774498276e-06, "loss": 2.654942932128906, "step": 871700 }, { "epoch": 1.051943147062346, "learning_rate": 6.5197459390305376e-06, "loss": 2.6803555297851562, "step": 871800 }, { "epoch": 1.0520638103848285, "learning_rate": 6.519342103562799e-06, "loss": 2.6399136352539063, "step": 871900 }, { "epoch": 1.0521844737073112, "learning_rate": 6.51893826809506e-06, "loss": 2.663939208984375, "step": 872000 }, { "epoch": 1.0523051370297938, "learning_rate": 6.518534432627322e-06, "loss": 2.6471939086914062, "step": 872100 }, { "epoch": 1.0524258003522766, "learning_rate": 6.518130597159583e-06, "loss": 2.653969421386719, "step": 872200 }, { "epoch": 1.0525464636747592, "learning_rate": 6.517726761691845e-06, "loss": 2.655210266113281, "step": 872300 }, { "epoch": 1.0526671269972419, "learning_rate": 6.517322926224107e-06, "loss": 2.651669616699219, "step": 872400 }, { "epoch": 1.0527877903197247, "learning_rate": 6.516919090756368e-06, "loss": 2.6597576904296876, "step": 872500 }, { "epoch": 1.0529084536422073, "learning_rate": 6.51651525528863e-06, "loss": 2.6276895141601564, "step": 872600 }, { "epoch": 1.05302911696469, "learning_rate": 6.516111419820892e-06, "loss": 2.64956787109375, "step": 872700 }, { "epoch": 1.0531497802871728, "learning_rate": 6.515707584353152e-06, "loss": 2.666306457519531, "step": 872800 }, { "epoch": 1.0532704436096554, "learning_rate": 6.515303748885414e-06, "loss": 2.64918701171875, "step": 872900 }, { "epoch": 1.053391106932138, "learning_rate": 6.514899913417676e-06, "loss": 2.6624520874023436, "step": 873000 }, { "epoch": 1.0535117702546208, "learning_rate": 6.514496077949937e-06, "loss": 2.6900738525390624, "step": 873100 }, { "epoch": 1.0536324335771035, "learning_rate": 6.514092242482199e-06, "loss": 2.6566534423828125, "step": 873200 }, { "epoch": 1.053753096899586, "learning_rate": 6.513688407014461e-06, "loss": 2.6597393798828124, "step": 873300 }, { "epoch": 1.0538737602220687, "learning_rate": 6.513284571546723e-06, "loss": 2.669294738769531, "step": 873400 }, { "epoch": 1.0539944235445515, "learning_rate": 6.5128807360789845e-06, "loss": 2.656913146972656, "step": 873500 }, { "epoch": 1.0541150868670341, "learning_rate": 6.512476900611246e-06, "loss": 2.6480670166015625, "step": 873600 }, { "epoch": 1.0542357501895168, "learning_rate": 6.512073065143507e-06, "loss": 2.638843994140625, "step": 873700 }, { "epoch": 1.0543564135119996, "learning_rate": 6.511669229675769e-06, "loss": 2.6424380493164064, "step": 873800 }, { "epoch": 1.0544770768344822, "learning_rate": 6.511265394208031e-06, "loss": 2.649330749511719, "step": 873900 }, { "epoch": 1.0545977401569648, "learning_rate": 6.510861558740293e-06, "loss": 2.64460693359375, "step": 874000 }, { "epoch": 1.0547184034794475, "learning_rate": 6.510457723272554e-06, "loss": 2.6370303344726564, "step": 874100 }, { "epoch": 1.0548390668019303, "learning_rate": 6.510053887804816e-06, "loss": 2.6430368041992187, "step": 874200 }, { "epoch": 1.054959730124413, "learning_rate": 6.509650052337078e-06, "loss": 2.6361294555664063, "step": 874300 }, { "epoch": 1.0550803934468955, "learning_rate": 6.509246216869338e-06, "loss": 2.6367388916015626, "step": 874400 }, { "epoch": 1.0552010567693784, "learning_rate": 6.5088423814016e-06, "loss": 2.6838363647460937, "step": 874500 }, { "epoch": 1.055321720091861, "learning_rate": 6.508438545933862e-06, "loss": 2.651902770996094, "step": 874600 }, { "epoch": 1.0554423834143436, "learning_rate": 6.508034710466123e-06, "loss": 2.6423126220703126, "step": 874700 }, { "epoch": 1.0555630467368264, "learning_rate": 6.507630874998385e-06, "loss": 2.6539730834960937, "step": 874800 }, { "epoch": 1.055683710059309, "learning_rate": 6.507227039530647e-06, "loss": 2.640503234863281, "step": 874900 }, { "epoch": 1.0558043733817917, "learning_rate": 6.506823204062908e-06, "loss": 2.634710693359375, "step": 875000 }, { "epoch": 1.0559250367042745, "learning_rate": 6.50641936859517e-06, "loss": 2.643280029296875, "step": 875100 }, { "epoch": 1.0560457000267571, "learning_rate": 6.506015533127432e-06, "loss": 2.6501611328125, "step": 875200 }, { "epoch": 1.0561663633492397, "learning_rate": 6.5056116976596925e-06, "loss": 2.663890380859375, "step": 875300 }, { "epoch": 1.0562870266717224, "learning_rate": 6.5052078621919545e-06, "loss": 2.6770596313476562, "step": 875400 }, { "epoch": 1.0564076899942052, "learning_rate": 6.5048040267242165e-06, "loss": 2.6340203857421876, "step": 875500 }, { "epoch": 1.0565283533166878, "learning_rate": 6.504400191256478e-06, "loss": 2.6636456298828124, "step": 875600 }, { "epoch": 1.0566490166391704, "learning_rate": 6.50399635578874e-06, "loss": 2.659063720703125, "step": 875700 }, { "epoch": 1.0567696799616533, "learning_rate": 6.503592520321002e-06, "loss": 2.6462841796875, "step": 875800 }, { "epoch": 1.056890343284136, "learning_rate": 6.503188684853264e-06, "loss": 2.6172760009765623, "step": 875900 }, { "epoch": 1.0570110066066185, "learning_rate": 6.502784849385525e-06, "loss": 2.6403009033203126, "step": 876000 }, { "epoch": 1.0571316699291013, "learning_rate": 6.502381013917786e-06, "loss": 2.6411068725585936, "step": 876100 }, { "epoch": 1.057252333251584, "learning_rate": 6.501977178450047e-06, "loss": 2.6441680908203127, "step": 876200 }, { "epoch": 1.0573729965740666, "learning_rate": 6.501573342982309e-06, "loss": 2.6424749755859374, "step": 876300 }, { "epoch": 1.0574936598965492, "learning_rate": 6.501169507514571e-06, "loss": 2.667469177246094, "step": 876400 }, { "epoch": 1.057614323219032, "learning_rate": 6.500765672046833e-06, "loss": 2.6395587158203124, "step": 876500 }, { "epoch": 1.0577349865415147, "learning_rate": 6.500361836579094e-06, "loss": 2.65869384765625, "step": 876600 }, { "epoch": 1.0578556498639973, "learning_rate": 6.499958001111356e-06, "loss": 2.639866943359375, "step": 876700 }, { "epoch": 1.05797631318648, "learning_rate": 6.499554165643618e-06, "loss": 2.6665859985351563, "step": 876800 }, { "epoch": 1.0580969765089627, "learning_rate": 6.499150330175878e-06, "loss": 2.65236083984375, "step": 876900 }, { "epoch": 1.0582176398314453, "learning_rate": 6.49874649470814e-06, "loss": 2.636356201171875, "step": 877000 }, { "epoch": 1.0583383031539282, "learning_rate": 6.498342659240402e-06, "loss": 2.647286682128906, "step": 877100 }, { "epoch": 1.0584589664764108, "learning_rate": 6.4979388237726634e-06, "loss": 2.637803649902344, "step": 877200 }, { "epoch": 1.0585796297988934, "learning_rate": 6.497534988304925e-06, "loss": 2.6235931396484373, "step": 877300 }, { "epoch": 1.058700293121376, "learning_rate": 6.497131152837187e-06, "loss": 2.6467010498046877, "step": 877400 }, { "epoch": 1.0588209564438589, "learning_rate": 6.4967273173694485e-06, "loss": 2.635309753417969, "step": 877500 }, { "epoch": 1.0589416197663415, "learning_rate": 6.4963234819017105e-06, "loss": 2.653896484375, "step": 877600 }, { "epoch": 1.059062283088824, "learning_rate": 6.495919646433972e-06, "loss": 2.6448355102539063, "step": 877700 }, { "epoch": 1.059182946411307, "learning_rate": 6.495515810966233e-06, "loss": 2.6443988037109376, "step": 877800 }, { "epoch": 1.0593036097337896, "learning_rate": 6.495111975498495e-06, "loss": 2.638658447265625, "step": 877900 }, { "epoch": 1.0594242730562722, "learning_rate": 6.494708140030757e-06, "loss": 2.632471618652344, "step": 878000 }, { "epoch": 1.059544936378755, "learning_rate": 6.494304304563018e-06, "loss": 2.6594668579101564, "step": 878100 }, { "epoch": 1.0596655997012376, "learning_rate": 6.49390046909528e-06, "loss": 2.6462420654296874, "step": 878200 }, { "epoch": 1.0597862630237203, "learning_rate": 6.493496633627542e-06, "loss": 2.6353359985351563, "step": 878300 }, { "epoch": 1.059906926346203, "learning_rate": 6.493092798159804e-06, "loss": 2.6366400146484374, "step": 878400 }, { "epoch": 1.0600275896686857, "learning_rate": 6.492688962692064e-06, "loss": 2.638136901855469, "step": 878500 }, { "epoch": 1.0601482529911683, "learning_rate": 6.492285127224326e-06, "loss": 2.6423611450195312, "step": 878600 }, { "epoch": 1.060268916313651, "learning_rate": 6.491881291756587e-06, "loss": 2.635270690917969, "step": 878700 }, { "epoch": 1.0603895796361338, "learning_rate": 6.491477456288849e-06, "loss": 2.6418325805664065, "step": 878800 }, { "epoch": 1.0605102429586164, "learning_rate": 6.491073620821111e-06, "loss": 2.638446044921875, "step": 878900 }, { "epoch": 1.060630906281099, "learning_rate": 6.490669785353373e-06, "loss": 2.655639953613281, "step": 879000 }, { "epoch": 1.0607515696035819, "learning_rate": 6.490265949885634e-06, "loss": 2.634552307128906, "step": 879100 }, { "epoch": 1.0608722329260645, "learning_rate": 6.489862114417896e-06, "loss": 2.6522967529296877, "step": 879200 }, { "epoch": 1.060992896248547, "learning_rate": 6.489458278950157e-06, "loss": 2.618765869140625, "step": 879300 }, { "epoch": 1.06111355957103, "learning_rate": 6.489054443482419e-06, "loss": 2.647611389160156, "step": 879400 }, { "epoch": 1.0612342228935125, "learning_rate": 6.4886506080146806e-06, "loss": 2.650621337890625, "step": 879500 }, { "epoch": 1.0613548862159952, "learning_rate": 6.4882467725469425e-06, "loss": 2.6269134521484374, "step": 879600 }, { "epoch": 1.0614755495384778, "learning_rate": 6.487842937079204e-06, "loss": 2.629508361816406, "step": 879700 }, { "epoch": 1.0615962128609606, "learning_rate": 6.487439101611466e-06, "loss": 2.659398193359375, "step": 879800 }, { "epoch": 1.0617168761834432, "learning_rate": 6.487035266143728e-06, "loss": 2.635176696777344, "step": 879900 }, { "epoch": 1.0618375395059259, "learning_rate": 6.48663143067599e-06, "loss": 2.6163616943359376, "step": 880000 }, { "epoch": 1.0619582028284087, "learning_rate": 6.48622759520825e-06, "loss": 2.63012451171875, "step": 880100 }, { "epoch": 1.0620788661508913, "learning_rate": 6.485823759740512e-06, "loss": 2.6600299072265625, "step": 880200 }, { "epoch": 1.062199529473374, "learning_rate": 6.485419924272773e-06, "loss": 2.6344097900390624, "step": 880300 }, { "epoch": 1.0623201927958568, "learning_rate": 6.485016088805035e-06, "loss": 2.6282809448242186, "step": 880400 }, { "epoch": 1.0624408561183394, "learning_rate": 6.484612253337297e-06, "loss": 2.6318341064453126, "step": 880500 }, { "epoch": 1.062561519440822, "learning_rate": 6.484208417869559e-06, "loss": 2.631944274902344, "step": 880600 }, { "epoch": 1.0626821827633046, "learning_rate": 6.48380458240182e-06, "loss": 2.6311083984375, "step": 880700 }, { "epoch": 1.0628028460857875, "learning_rate": 6.483400746934082e-06, "loss": 2.627524719238281, "step": 880800 }, { "epoch": 1.06292350940827, "learning_rate": 6.482996911466344e-06, "loss": 2.6353680419921877, "step": 880900 }, { "epoch": 1.0630441727307527, "learning_rate": 6.482593075998604e-06, "loss": 2.6402127075195314, "step": 881000 }, { "epoch": 1.0631648360532355, "learning_rate": 6.482189240530866e-06, "loss": 2.6592147827148436, "step": 881100 }, { "epoch": 1.0632854993757181, "learning_rate": 6.481785405063128e-06, "loss": 2.6514044189453125, "step": 881200 }, { "epoch": 1.0634061626982008, "learning_rate": 6.4813815695953895e-06, "loss": 2.6612539672851563, "step": 881300 }, { "epoch": 1.0635268260206836, "learning_rate": 6.4809777341276515e-06, "loss": 2.6413665771484376, "step": 881400 }, { "epoch": 1.0636474893431662, "learning_rate": 6.4805738986599134e-06, "loss": 2.6527398681640624, "step": 881500 }, { "epoch": 1.0637681526656488, "learning_rate": 6.4801700631921746e-06, "loss": 2.6395611572265625, "step": 881600 }, { "epoch": 1.0638888159881315, "learning_rate": 6.4797662277244366e-06, "loss": 2.6543719482421877, "step": 881700 }, { "epoch": 1.0640094793106143, "learning_rate": 6.479362392256698e-06, "loss": 2.6532766723632815, "step": 881800 }, { "epoch": 1.064130142633097, "learning_rate": 6.478958556788959e-06, "loss": 2.644970703125, "step": 881900 }, { "epoch": 1.0642508059555795, "learning_rate": 6.478554721321221e-06, "loss": 2.6310113525390624, "step": 882000 }, { "epoch": 1.0643714692780624, "learning_rate": 6.478150885853483e-06, "loss": 2.646475830078125, "step": 882100 }, { "epoch": 1.064492132600545, "learning_rate": 6.477747050385744e-06, "loss": 2.6392251586914064, "step": 882200 }, { "epoch": 1.0646127959230276, "learning_rate": 6.477343214918006e-06, "loss": 2.632973327636719, "step": 882300 }, { "epoch": 1.0647334592455104, "learning_rate": 6.476939379450268e-06, "loss": 2.643004150390625, "step": 882400 }, { "epoch": 1.064854122567993, "learning_rate": 6.47653554398253e-06, "loss": 2.6370010375976562, "step": 882500 }, { "epoch": 1.0649747858904757, "learning_rate": 6.47613170851479e-06, "loss": 2.631103820800781, "step": 882600 }, { "epoch": 1.0650954492129583, "learning_rate": 6.475727873047052e-06, "loss": 2.654682922363281, "step": 882700 }, { "epoch": 1.0652161125354411, "learning_rate": 6.475324037579313e-06, "loss": 2.6401748657226562, "step": 882800 }, { "epoch": 1.0653367758579237, "learning_rate": 6.474920202111575e-06, "loss": 2.612066345214844, "step": 882900 }, { "epoch": 1.0654574391804064, "learning_rate": 6.474516366643837e-06, "loss": 2.638851318359375, "step": 883000 }, { "epoch": 1.0655781025028892, "learning_rate": 6.474112531176099e-06, "loss": 2.6507623291015623, "step": 883100 }, { "epoch": 1.0656987658253718, "learning_rate": 6.47370869570836e-06, "loss": 2.6301788330078124, "step": 883200 }, { "epoch": 1.0658194291478544, "learning_rate": 6.473304860240622e-06, "loss": 2.6457891845703125, "step": 883300 }, { "epoch": 1.0659400924703373, "learning_rate": 6.472901024772883e-06, "loss": 2.6394549560546876, "step": 883400 }, { "epoch": 1.06606075579282, "learning_rate": 6.472497189305145e-06, "loss": 2.6400970458984374, "step": 883500 }, { "epoch": 1.0661814191153025, "learning_rate": 6.472093353837407e-06, "loss": 2.6297116088867187, "step": 883600 }, { "epoch": 1.0663020824377853, "learning_rate": 6.471689518369669e-06, "loss": 2.641482238769531, "step": 883700 }, { "epoch": 1.066422745760268, "learning_rate": 6.47128568290193e-06, "loss": 2.656490478515625, "step": 883800 }, { "epoch": 1.0665434090827506, "learning_rate": 6.470881847434192e-06, "loss": 2.6502761840820312, "step": 883900 }, { "epoch": 1.0666640724052332, "learning_rate": 6.470478011966454e-06, "loss": 2.661435241699219, "step": 884000 }, { "epoch": 1.066784735727716, "learning_rate": 6.470074176498715e-06, "loss": 2.633891296386719, "step": 884100 }, { "epoch": 1.0669053990501987, "learning_rate": 6.469670341030976e-06, "loss": 2.631265869140625, "step": 884200 }, { "epoch": 1.0670260623726813, "learning_rate": 6.469266505563238e-06, "loss": 2.650437316894531, "step": 884300 }, { "epoch": 1.0671467256951641, "learning_rate": 6.468862670095499e-06, "loss": 2.65962646484375, "step": 884400 }, { "epoch": 1.0672673890176467, "learning_rate": 6.468458834627761e-06, "loss": 2.664656677246094, "step": 884500 }, { "epoch": 1.0673880523401293, "learning_rate": 6.468054999160023e-06, "loss": 2.6083563232421874, "step": 884600 }, { "epoch": 1.067508715662612, "learning_rate": 6.467651163692284e-06, "loss": 2.640457763671875, "step": 884700 }, { "epoch": 1.0676293789850948, "learning_rate": 6.467247328224546e-06, "loss": 2.6536019897460936, "step": 884800 }, { "epoch": 1.0677500423075774, "learning_rate": 6.466843492756808e-06, "loss": 2.6478558349609376, "step": 884900 }, { "epoch": 1.06787070563006, "learning_rate": 6.466439657289068e-06, "loss": 2.6457040405273435, "step": 885000 }, { "epoch": 1.0679913689525429, "learning_rate": 6.46603582182133e-06, "loss": 2.6360858154296873, "step": 885100 }, { "epoch": 1.0681120322750255, "learning_rate": 6.465631986353592e-06, "loss": 2.65676025390625, "step": 885200 }, { "epoch": 1.068232695597508, "learning_rate": 6.4652281508858535e-06, "loss": 2.627732849121094, "step": 885300 }, { "epoch": 1.068353358919991, "learning_rate": 6.4648243154181155e-06, "loss": 2.662294616699219, "step": 885400 }, { "epoch": 1.0684740222424736, "learning_rate": 6.4644204799503775e-06, "loss": 2.663579406738281, "step": 885500 }, { "epoch": 1.0685946855649562, "learning_rate": 6.4640166444826395e-06, "loss": 2.64373291015625, "step": 885600 }, { "epoch": 1.068715348887439, "learning_rate": 6.463612809014901e-06, "loss": 2.6116558837890627, "step": 885700 }, { "epoch": 1.0688360122099216, "learning_rate": 6.463208973547163e-06, "loss": 2.6323678588867185, "step": 885800 }, { "epoch": 1.0689566755324043, "learning_rate": 6.462805138079423e-06, "loss": 2.632845458984375, "step": 885900 }, { "epoch": 1.0690773388548869, "learning_rate": 6.462401302611685e-06, "loss": 2.6381539916992187, "step": 886000 }, { "epoch": 1.0691980021773697, "learning_rate": 6.461997467143947e-06, "loss": 2.6230538940429686, "step": 886100 }, { "epoch": 1.0693186654998523, "learning_rate": 6.461593631676209e-06, "loss": 2.6435015869140623, "step": 886200 }, { "epoch": 1.069439328822335, "learning_rate": 6.46118979620847e-06, "loss": 2.6438534545898436, "step": 886300 }, { "epoch": 1.0695599921448178, "learning_rate": 6.460785960740732e-06, "loss": 2.629372863769531, "step": 886400 }, { "epoch": 1.0696806554673004, "learning_rate": 6.460382125272994e-06, "loss": 2.6683529663085936, "step": 886500 }, { "epoch": 1.069801318789783, "learning_rate": 6.459978289805255e-06, "loss": 2.6277926635742186, "step": 886600 }, { "epoch": 1.0699219821122659, "learning_rate": 6.459574454337516e-06, "loss": 2.658510437011719, "step": 886700 }, { "epoch": 1.0700426454347485, "learning_rate": 6.459170618869778e-06, "loss": 2.6456097412109374, "step": 886800 }, { "epoch": 1.070163308757231, "learning_rate": 6.458766783402039e-06, "loss": 2.6299624633789063, "step": 886900 }, { "epoch": 1.0702839720797137, "learning_rate": 6.458362947934301e-06, "loss": 2.6340560913085938, "step": 887000 }, { "epoch": 1.0704046354021965, "learning_rate": 6.457959112466563e-06, "loss": 2.653772888183594, "step": 887100 }, { "epoch": 1.0705252987246792, "learning_rate": 6.457555276998824e-06, "loss": 2.6311886596679686, "step": 887200 }, { "epoch": 1.0706459620471618, "learning_rate": 6.457151441531086e-06, "loss": 2.64567138671875, "step": 887300 }, { "epoch": 1.0707666253696446, "learning_rate": 6.456747606063348e-06, "loss": 2.643294677734375, "step": 887400 }, { "epoch": 1.0708872886921272, "learning_rate": 6.456343770595609e-06, "loss": 2.657909240722656, "step": 887500 }, { "epoch": 1.0710079520146099, "learning_rate": 6.455939935127871e-06, "loss": 2.6499017333984374, "step": 887600 }, { "epoch": 1.0711286153370927, "learning_rate": 6.455536099660133e-06, "loss": 2.6537051391601563, "step": 887700 }, { "epoch": 1.0712492786595753, "learning_rate": 6.455132264192394e-06, "loss": 2.61180908203125, "step": 887800 }, { "epoch": 1.071369941982058, "learning_rate": 6.454728428724656e-06, "loss": 2.6348248291015626, "step": 887900 }, { "epoch": 1.0714906053045405, "learning_rate": 6.454324593256918e-06, "loss": 2.6328720092773437, "step": 888000 }, { "epoch": 1.0716112686270234, "learning_rate": 6.45392075778918e-06, "loss": 2.65102783203125, "step": 888100 }, { "epoch": 1.071731931949506, "learning_rate": 6.453516922321441e-06, "loss": 2.640761413574219, "step": 888200 }, { "epoch": 1.0718525952719886, "learning_rate": 6.453113086853702e-06, "loss": 2.637531433105469, "step": 888300 }, { "epoch": 1.0719732585944715, "learning_rate": 6.452709251385963e-06, "loss": 2.6259759521484374, "step": 888400 }, { "epoch": 1.072093921916954, "learning_rate": 6.452305415918225e-06, "loss": 2.6354632568359375, "step": 888500 }, { "epoch": 1.0722145852394367, "learning_rate": 6.451901580450487e-06, "loss": 2.64031005859375, "step": 888600 }, { "epoch": 1.0723352485619195, "learning_rate": 6.451497744982749e-06, "loss": 2.646226806640625, "step": 888700 }, { "epoch": 1.0724559118844021, "learning_rate": 6.45109390951501e-06, "loss": 2.6430267333984374, "step": 888800 }, { "epoch": 1.0725765752068848, "learning_rate": 6.450690074047272e-06, "loss": 2.6310321044921876, "step": 888900 }, { "epoch": 1.0726972385293676, "learning_rate": 6.450286238579534e-06, "loss": 2.6230279541015626, "step": 889000 }, { "epoch": 1.0728179018518502, "learning_rate": 6.4498824031117945e-06, "loss": 2.6269216918945313, "step": 889100 }, { "epoch": 1.0729385651743328, "learning_rate": 6.4494785676440564e-06, "loss": 2.63637939453125, "step": 889200 }, { "epoch": 1.0730592284968155, "learning_rate": 6.449074732176318e-06, "loss": 2.620826416015625, "step": 889300 }, { "epoch": 1.0731798918192983, "learning_rate": 6.4486708967085796e-06, "loss": 2.630079345703125, "step": 889400 }, { "epoch": 1.073300555141781, "learning_rate": 6.4482670612408415e-06, "loss": 2.6315579223632812, "step": 889500 }, { "epoch": 1.0734212184642635, "learning_rate": 6.4478632257731035e-06, "loss": 2.6428268432617186, "step": 889600 }, { "epoch": 1.0735418817867464, "learning_rate": 6.447459390305365e-06, "loss": 2.629938659667969, "step": 889700 }, { "epoch": 1.073662545109229, "learning_rate": 6.447055554837627e-06, "loss": 2.640897521972656, "step": 889800 }, { "epoch": 1.0737832084317116, "learning_rate": 6.446651719369888e-06, "loss": 2.654442138671875, "step": 889900 }, { "epoch": 1.0739038717541942, "learning_rate": 6.446247883902149e-06, "loss": 2.64361572265625, "step": 890000 }, { "epoch": 1.074024535076677, "learning_rate": 6.445844048434411e-06, "loss": 2.659996337890625, "step": 890100 }, { "epoch": 1.0741451983991597, "learning_rate": 6.445440212966673e-06, "loss": 2.6445443725585935, "step": 890200 }, { "epoch": 1.0742658617216423, "learning_rate": 6.445036377498934e-06, "loss": 2.653118896484375, "step": 890300 }, { "epoch": 1.0743865250441251, "learning_rate": 6.444632542031196e-06, "loss": 2.6253460693359374, "step": 890400 }, { "epoch": 1.0745071883666077, "learning_rate": 6.444228706563458e-06, "loss": 2.6407986450195313, "step": 890500 }, { "epoch": 1.0746278516890904, "learning_rate": 6.44382487109572e-06, "loss": 2.6272076416015624, "step": 890600 }, { "epoch": 1.0747485150115732, "learning_rate": 6.443421035627981e-06, "loss": 2.6365667724609376, "step": 890700 }, { "epoch": 1.0748691783340558, "learning_rate": 6.443017200160242e-06, "loss": 2.6430850219726563, "step": 890800 }, { "epoch": 1.0749898416565384, "learning_rate": 6.442613364692503e-06, "loss": 2.646309814453125, "step": 890900 }, { "epoch": 1.0751105049790213, "learning_rate": 6.442209529224765e-06, "loss": 2.6549716186523438, "step": 891000 }, { "epoch": 1.075231168301504, "learning_rate": 6.441805693757027e-06, "loss": 2.627316589355469, "step": 891100 }, { "epoch": 1.0753518316239865, "learning_rate": 6.441401858289289e-06, "loss": 2.6275958251953124, "step": 891200 }, { "epoch": 1.0754724949464691, "learning_rate": 6.4409980228215504e-06, "loss": 2.636075134277344, "step": 891300 }, { "epoch": 1.075593158268952, "learning_rate": 6.4405941873538124e-06, "loss": 2.6519879150390624, "step": 891400 }, { "epoch": 1.0757138215914346, "learning_rate": 6.440190351886074e-06, "loss": 2.6578109741210936, "step": 891500 }, { "epoch": 1.0758344849139172, "learning_rate": 6.439786516418335e-06, "loss": 2.6388949584960937, "step": 891600 }, { "epoch": 1.0759551482364, "learning_rate": 6.439382680950597e-06, "loss": 2.640879821777344, "step": 891700 }, { "epoch": 1.0760758115588827, "learning_rate": 6.438978845482859e-06, "loss": 2.6707919311523436, "step": 891800 }, { "epoch": 1.0761964748813653, "learning_rate": 6.43857501001512e-06, "loss": 2.662308349609375, "step": 891900 }, { "epoch": 1.0763171382038481, "learning_rate": 6.438171174547382e-06, "loss": 2.625604553222656, "step": 892000 }, { "epoch": 1.0764378015263307, "learning_rate": 6.437767339079644e-06, "loss": 2.612235412597656, "step": 892100 }, { "epoch": 1.0765584648488133, "learning_rate": 6.437363503611905e-06, "loss": 2.6279949951171875, "step": 892200 }, { "epoch": 1.076679128171296, "learning_rate": 6.436959668144167e-06, "loss": 2.6381768798828125, "step": 892300 }, { "epoch": 1.0767997914937788, "learning_rate": 6.436555832676428e-06, "loss": 2.6264773559570314, "step": 892400 }, { "epoch": 1.0769204548162614, "learning_rate": 6.436151997208689e-06, "loss": 2.639454345703125, "step": 892500 }, { "epoch": 1.077041118138744, "learning_rate": 6.435748161740951e-06, "loss": 2.635142822265625, "step": 892600 }, { "epoch": 1.0771617814612269, "learning_rate": 6.435344326273213e-06, "loss": 2.6622186279296876, "step": 892700 }, { "epoch": 1.0772824447837095, "learning_rate": 6.434940490805474e-06, "loss": 2.6349383544921876, "step": 892800 }, { "epoch": 1.077403108106192, "learning_rate": 6.434536655337736e-06, "loss": 2.6307919311523436, "step": 892900 }, { "epoch": 1.077523771428675, "learning_rate": 6.434132819869998e-06, "loss": 2.624693603515625, "step": 893000 }, { "epoch": 1.0776444347511576, "learning_rate": 6.43372898440226e-06, "loss": 2.6222994995117186, "step": 893100 }, { "epoch": 1.0777650980736402, "learning_rate": 6.4333251489345205e-06, "loss": 2.6278341674804686, "step": 893200 }, { "epoch": 1.0778857613961228, "learning_rate": 6.4329213134667825e-06, "loss": 2.650948181152344, "step": 893300 }, { "epoch": 1.0780064247186056, "learning_rate": 6.432517477999044e-06, "loss": 2.6318792724609374, "step": 893400 }, { "epoch": 1.0781270880410883, "learning_rate": 6.432113642531306e-06, "loss": 2.625208435058594, "step": 893500 }, { "epoch": 1.0782477513635709, "learning_rate": 6.4317098070635676e-06, "loss": 2.6423345947265626, "step": 893600 }, { "epoch": 1.0783684146860537, "learning_rate": 6.4313059715958296e-06, "loss": 2.638625183105469, "step": 893700 }, { "epoch": 1.0784890780085363, "learning_rate": 6.430902136128091e-06, "loss": 2.6456680297851562, "step": 893800 }, { "epoch": 1.078609741331019, "learning_rate": 6.430498300660353e-06, "loss": 2.6427630615234374, "step": 893900 }, { "epoch": 1.0787304046535018, "learning_rate": 6.430094465192613e-06, "loss": 2.6382305908203123, "step": 894000 }, { "epoch": 1.0788510679759844, "learning_rate": 6.429690629724875e-06, "loss": 2.636536865234375, "step": 894100 }, { "epoch": 1.078971731298467, "learning_rate": 6.429286794257137e-06, "loss": 2.655084533691406, "step": 894200 }, { "epoch": 1.0790923946209499, "learning_rate": 6.428882958789399e-06, "loss": 2.63655029296875, "step": 894300 }, { "epoch": 1.0792130579434325, "learning_rate": 6.42847912332166e-06, "loss": 2.604456787109375, "step": 894400 }, { "epoch": 1.079333721265915, "learning_rate": 6.428075287853922e-06, "loss": 2.6357681274414064, "step": 894500 }, { "epoch": 1.0794543845883977, "learning_rate": 6.427671452386184e-06, "loss": 2.643572998046875, "step": 894600 }, { "epoch": 1.0795750479108805, "learning_rate": 6.427267616918446e-06, "loss": 2.651817626953125, "step": 894700 }, { "epoch": 1.0796957112333632, "learning_rate": 6.426863781450706e-06, "loss": 2.6598492431640626, "step": 894800 }, { "epoch": 1.0798163745558458, "learning_rate": 6.426459945982968e-06, "loss": 2.6216156005859377, "step": 894900 }, { "epoch": 1.0799370378783286, "learning_rate": 6.426056110515229e-06, "loss": 2.6192745971679687, "step": 895000 }, { "epoch": 1.0800577012008112, "learning_rate": 6.425652275047491e-06, "loss": 2.6343624877929686, "step": 895100 }, { "epoch": 1.0801783645232939, "learning_rate": 6.425248439579753e-06, "loss": 2.632033386230469, "step": 895200 }, { "epoch": 1.0802990278457765, "learning_rate": 6.424844604112015e-06, "loss": 2.6425872802734376, "step": 895300 }, { "epoch": 1.0804196911682593, "learning_rate": 6.4244407686442765e-06, "loss": 2.6324725341796875, "step": 895400 }, { "epoch": 1.080540354490742, "learning_rate": 6.4240369331765385e-06, "loss": 2.624013671875, "step": 895500 }, { "epoch": 1.0806610178132245, "learning_rate": 6.4236330977088004e-06, "loss": 2.6364117431640626, "step": 895600 }, { "epoch": 1.0807816811357074, "learning_rate": 6.423229262241061e-06, "loss": 2.622001953125, "step": 895700 }, { "epoch": 1.08090234445819, "learning_rate": 6.422825426773323e-06, "loss": 2.62449462890625, "step": 895800 }, { "epoch": 1.0810230077806726, "learning_rate": 6.422421591305585e-06, "loss": 2.647921142578125, "step": 895900 }, { "epoch": 1.0811436711031555, "learning_rate": 6.422017755837846e-06, "loss": 2.643070068359375, "step": 896000 }, { "epoch": 1.081264334425638, "learning_rate": 6.421613920370108e-06, "loss": 2.646632080078125, "step": 896100 }, { "epoch": 1.0813849977481207, "learning_rate": 6.42121008490237e-06, "loss": 2.6206454467773437, "step": 896200 }, { "epoch": 1.0815056610706035, "learning_rate": 6.420806249434631e-06, "loss": 2.6289306640625, "step": 896300 }, { "epoch": 1.0816263243930861, "learning_rate": 6.420402413966893e-06, "loss": 2.6060665893554686, "step": 896400 }, { "epoch": 1.0817469877155688, "learning_rate": 6.419998578499154e-06, "loss": 2.6314297485351563, "step": 896500 }, { "epoch": 1.0818676510380514, "learning_rate": 6.419594743031415e-06, "loss": 2.619541015625, "step": 896600 }, { "epoch": 1.0819883143605342, "learning_rate": 6.419190907563677e-06, "loss": 2.6072732543945314, "step": 896700 }, { "epoch": 1.0821089776830168, "learning_rate": 6.418787072095939e-06, "loss": 2.6565682983398435, "step": 896800 }, { "epoch": 1.0822296410054995, "learning_rate": 6.4183832366282e-06, "loss": 2.6453872680664063, "step": 896900 }, { "epoch": 1.0823503043279823, "learning_rate": 6.417979401160462e-06, "loss": 2.6278091430664063, "step": 897000 }, { "epoch": 1.082470967650465, "learning_rate": 6.417575565692724e-06, "loss": 2.64855712890625, "step": 897100 }, { "epoch": 1.0825916309729475, "learning_rate": 6.417171730224986e-06, "loss": 2.6149783325195313, "step": 897200 }, { "epoch": 1.0827122942954304, "learning_rate": 6.4167678947572465e-06, "loss": 2.641558837890625, "step": 897300 }, { "epoch": 1.082832957617913, "learning_rate": 6.4163640592895085e-06, "loss": 2.6469281005859373, "step": 897400 }, { "epoch": 1.0829536209403956, "learning_rate": 6.41596022382177e-06, "loss": 2.629913024902344, "step": 897500 }, { "epoch": 1.0830742842628782, "learning_rate": 6.415556388354032e-06, "loss": 2.6114385986328124, "step": 897600 }, { "epoch": 1.083194947585361, "learning_rate": 6.415152552886294e-06, "loss": 2.6301785278320313, "step": 897700 }, { "epoch": 1.0833156109078437, "learning_rate": 6.414748717418556e-06, "loss": 2.647728271484375, "step": 897800 }, { "epoch": 1.0834362742303263, "learning_rate": 6.414344881950817e-06, "loss": 2.640047607421875, "step": 897900 }, { "epoch": 1.0835569375528091, "learning_rate": 6.413941046483079e-06, "loss": 2.6385787963867187, "step": 898000 }, { "epoch": 1.0836776008752917, "learning_rate": 6.413537211015339e-06, "loss": 2.633290100097656, "step": 898100 }, { "epoch": 1.0837982641977744, "learning_rate": 6.413133375547601e-06, "loss": 2.665039367675781, "step": 898200 }, { "epoch": 1.0839189275202572, "learning_rate": 6.412729540079863e-06, "loss": 2.6211578369140627, "step": 898300 }, { "epoch": 1.0840395908427398, "learning_rate": 6.412325704612125e-06, "loss": 2.6343563842773436, "step": 898400 }, { "epoch": 1.0841602541652224, "learning_rate": 6.411921869144386e-06, "loss": 2.656985168457031, "step": 898500 }, { "epoch": 1.084280917487705, "learning_rate": 6.411518033676648e-06, "loss": 2.6350607299804687, "step": 898600 }, { "epoch": 1.084401580810188, "learning_rate": 6.41111419820891e-06, "loss": 2.630096740722656, "step": 898700 }, { "epoch": 1.0845222441326705, "learning_rate": 6.410710362741171e-06, "loss": 2.6660140991210937, "step": 898800 }, { "epoch": 1.0846429074551531, "learning_rate": 6.410306527273432e-06, "loss": 2.6578469848632813, "step": 898900 }, { "epoch": 1.084763570777636, "learning_rate": 6.409902691805694e-06, "loss": 2.628138122558594, "step": 899000 }, { "epoch": 1.0848842341001186, "learning_rate": 6.4094988563379554e-06, "loss": 2.6377447509765624, "step": 899100 }, { "epoch": 1.0850048974226012, "learning_rate": 6.409095020870217e-06, "loss": 2.633472595214844, "step": 899200 }, { "epoch": 1.085125560745084, "learning_rate": 6.408691185402479e-06, "loss": 2.640217590332031, "step": 899300 }, { "epoch": 1.0852462240675667, "learning_rate": 6.4082873499347405e-06, "loss": 2.6380740356445314, "step": 899400 }, { "epoch": 1.0853668873900493, "learning_rate": 6.4078835144670025e-06, "loss": 2.6351754760742185, "step": 899500 }, { "epoch": 1.0854875507125321, "learning_rate": 6.4074796789992645e-06, "loss": 2.63486328125, "step": 899600 }, { "epoch": 1.0856082140350147, "learning_rate": 6.407075843531525e-06, "loss": 2.622944030761719, "step": 899700 }, { "epoch": 1.0857288773574973, "learning_rate": 6.406672008063787e-06, "loss": 2.6412396240234375, "step": 899800 }, { "epoch": 1.08584954067998, "learning_rate": 6.406268172596049e-06, "loss": 2.6474014282226563, "step": 899900 }, { "epoch": 1.0859702040024628, "learning_rate": 6.40586433712831e-06, "loss": 2.625941162109375, "step": 900000 }, { "epoch": 1.0860908673249454, "learning_rate": 6.405460501660572e-06, "loss": 2.6224224853515623, "step": 900100 }, { "epoch": 1.086211530647428, "learning_rate": 6.405056666192834e-06, "loss": 2.6442691040039064, "step": 900200 }, { "epoch": 1.0863321939699109, "learning_rate": 6.404652830725096e-06, "loss": 2.663260192871094, "step": 900300 }, { "epoch": 1.0864528572923935, "learning_rate": 6.404248995257357e-06, "loss": 2.6250640869140627, "step": 900400 }, { "epoch": 1.086573520614876, "learning_rate": 6.403845159789618e-06, "loss": 2.627490234375, "step": 900500 }, { "epoch": 1.0866941839373587, "learning_rate": 6.403441324321879e-06, "loss": 2.64927734375, "step": 900600 }, { "epoch": 1.0868148472598416, "learning_rate": 6.403037488854141e-06, "loss": 2.6276925659179686, "step": 900700 }, { "epoch": 1.0869355105823242, "learning_rate": 6.402633653386403e-06, "loss": 2.6348397827148435, "step": 900800 }, { "epoch": 1.0870561739048068, "learning_rate": 6.402229817918665e-06, "loss": 2.6190704345703124, "step": 900900 }, { "epoch": 1.0871768372272896, "learning_rate": 6.401825982450926e-06, "loss": 2.639576416015625, "step": 901000 }, { "epoch": 1.0872975005497723, "learning_rate": 6.401422146983188e-06, "loss": 2.6186724853515626, "step": 901100 }, { "epoch": 1.0874181638722549, "learning_rate": 6.40101831151545e-06, "loss": 2.634073486328125, "step": 901200 }, { "epoch": 1.0875388271947377, "learning_rate": 6.400614476047711e-06, "loss": 2.6529754638671874, "step": 901300 }, { "epoch": 1.0876594905172203, "learning_rate": 6.4002106405799726e-06, "loss": 2.6316290283203125, "step": 901400 }, { "epoch": 1.087780153839703, "learning_rate": 6.3998068051122345e-06, "loss": 2.6493212890625, "step": 901500 }, { "epoch": 1.0879008171621858, "learning_rate": 6.399402969644496e-06, "loss": 2.6346371459960936, "step": 901600 }, { "epoch": 1.0880214804846684, "learning_rate": 6.398999134176758e-06, "loss": 2.598580627441406, "step": 901700 }, { "epoch": 1.088142143807151, "learning_rate": 6.39859529870902e-06, "loss": 2.615245361328125, "step": 901800 }, { "epoch": 1.0882628071296336, "learning_rate": 6.398191463241281e-06, "loss": 2.6423220825195313, "step": 901900 }, { "epoch": 1.0883834704521165, "learning_rate": 6.397787627773543e-06, "loss": 2.628992614746094, "step": 902000 }, { "epoch": 1.088504133774599, "learning_rate": 6.397383792305805e-06, "loss": 2.600397033691406, "step": 902100 }, { "epoch": 1.0886247970970817, "learning_rate": 6.396979956838065e-06, "loss": 2.6216082763671875, "step": 902200 }, { "epoch": 1.0887454604195645, "learning_rate": 6.396576121370327e-06, "loss": 2.6081747436523437, "step": 902300 }, { "epoch": 1.0888661237420472, "learning_rate": 6.396172285902589e-06, "loss": 2.633494567871094, "step": 902400 }, { "epoch": 1.0889867870645298, "learning_rate": 6.39576845043485e-06, "loss": 2.63342529296875, "step": 902500 }, { "epoch": 1.0891074503870126, "learning_rate": 6.395364614967112e-06, "loss": 2.6232778930664065, "step": 902600 }, { "epoch": 1.0892281137094952, "learning_rate": 6.394960779499374e-06, "loss": 2.6272543334960936, "step": 902700 }, { "epoch": 1.0893487770319779, "learning_rate": 6.394556944031636e-06, "loss": 2.628411865234375, "step": 902800 }, { "epoch": 1.0894694403544605, "learning_rate": 6.394153108563897e-06, "loss": 2.6402325439453125, "step": 902900 }, { "epoch": 1.0895901036769433, "learning_rate": 6.393749273096158e-06, "loss": 2.6524313354492186, "step": 903000 }, { "epoch": 1.089710766999426, "learning_rate": 6.3933454376284195e-06, "loss": 2.6346249389648437, "step": 903100 }, { "epoch": 1.0898314303219085, "learning_rate": 6.3929416021606815e-06, "loss": 2.6294720458984373, "step": 903200 }, { "epoch": 1.0899520936443914, "learning_rate": 6.3925377666929434e-06, "loss": 2.6317105102539062, "step": 903300 }, { "epoch": 1.090072756966874, "learning_rate": 6.3921339312252054e-06, "loss": 2.6270391845703127, "step": 903400 }, { "epoch": 1.0901934202893566, "learning_rate": 6.3917300957574666e-06, "loss": 2.643330383300781, "step": 903500 }, { "epoch": 1.0903140836118395, "learning_rate": 6.3913262602897285e-06, "loss": 2.6662933349609377, "step": 903600 }, { "epoch": 1.090434746934322, "learning_rate": 6.3909224248219905e-06, "loss": 2.6595465087890626, "step": 903700 }, { "epoch": 1.0905554102568047, "learning_rate": 6.390518589354251e-06, "loss": 2.6440975952148436, "step": 903800 }, { "epoch": 1.0906760735792873, "learning_rate": 6.390114753886513e-06, "loss": 2.6326480102539063, "step": 903900 }, { "epoch": 1.0907967369017701, "learning_rate": 6.389710918418775e-06, "loss": 2.615062255859375, "step": 904000 }, { "epoch": 1.0909174002242528, "learning_rate": 6.389307082951036e-06, "loss": 2.636004638671875, "step": 904100 }, { "epoch": 1.0910380635467354, "learning_rate": 6.388903247483298e-06, "loss": 2.6280532836914063, "step": 904200 }, { "epoch": 1.0911587268692182, "learning_rate": 6.38849941201556e-06, "loss": 2.6171563720703124, "step": 904300 }, { "epoch": 1.0912793901917008, "learning_rate": 6.388095576547821e-06, "loss": 2.65656005859375, "step": 904400 }, { "epoch": 1.0914000535141835, "learning_rate": 6.387691741080083e-06, "loss": 2.636783447265625, "step": 904500 }, { "epoch": 1.0915207168366663, "learning_rate": 6.387287905612344e-06, "loss": 2.6137969970703123, "step": 904600 }, { "epoch": 1.091641380159149, "learning_rate": 6.386884070144605e-06, "loss": 2.6490817260742188, "step": 904700 }, { "epoch": 1.0917620434816315, "learning_rate": 6.386480234676867e-06, "loss": 2.625990295410156, "step": 904800 }, { "epoch": 1.0918827068041144, "learning_rate": 6.386076399209129e-06, "loss": 2.627452697753906, "step": 904900 }, { "epoch": 1.092003370126597, "learning_rate": 6.38567256374139e-06, "loss": 2.6320062255859376, "step": 905000 }, { "epoch": 1.0921240334490796, "learning_rate": 6.385268728273652e-06, "loss": 2.643699951171875, "step": 905100 }, { "epoch": 1.0922446967715622, "learning_rate": 6.384864892805914e-06, "loss": 2.6024966430664063, "step": 905200 }, { "epoch": 1.092365360094045, "learning_rate": 6.384461057338176e-06, "loss": 2.6427511596679687, "step": 905300 }, { "epoch": 1.0924860234165277, "learning_rate": 6.384057221870437e-06, "loss": 2.6289407348632814, "step": 905400 }, { "epoch": 1.0926066867390103, "learning_rate": 6.383653386402699e-06, "loss": 2.6255368041992186, "step": 905500 }, { "epoch": 1.0927273500614931, "learning_rate": 6.38324955093496e-06, "loss": 2.663836669921875, "step": 905600 }, { "epoch": 1.0928480133839757, "learning_rate": 6.382845715467222e-06, "loss": 2.6104107666015626, "step": 905700 }, { "epoch": 1.0929686767064584, "learning_rate": 6.382441879999484e-06, "loss": 2.6613980102539063, "step": 905800 }, { "epoch": 1.093089340028941, "learning_rate": 6.382038044531746e-06, "loss": 2.62904541015625, "step": 905900 }, { "epoch": 1.0932100033514238, "learning_rate": 6.381634209064007e-06, "loss": 2.6252215576171873, "step": 906000 }, { "epoch": 1.0933306666739064, "learning_rate": 6.381230373596269e-06, "loss": 2.623293762207031, "step": 906100 }, { "epoch": 1.093451329996389, "learning_rate": 6.380826538128531e-06, "loss": 2.629317626953125, "step": 906200 }, { "epoch": 1.093571993318872, "learning_rate": 6.380422702660791e-06, "loss": 2.6269345092773437, "step": 906300 }, { "epoch": 1.0936926566413545, "learning_rate": 6.380018867193053e-06, "loss": 2.621573791503906, "step": 906400 }, { "epoch": 1.0938133199638371, "learning_rate": 6.379615031725315e-06, "loss": 2.6295599365234374, "step": 906500 }, { "epoch": 1.09393398328632, "learning_rate": 6.379211196257576e-06, "loss": 2.619825439453125, "step": 906600 }, { "epoch": 1.0940546466088026, "learning_rate": 6.378807360789838e-06, "loss": 2.6546810913085936, "step": 906700 }, { "epoch": 1.0941753099312852, "learning_rate": 6.3784035253221e-06, "loss": 2.624448547363281, "step": 906800 }, { "epoch": 1.094295973253768, "learning_rate": 6.377999689854361e-06, "loss": 2.626952819824219, "step": 906900 }, { "epoch": 1.0944166365762507, "learning_rate": 6.377595854386623e-06, "loss": 2.624078369140625, "step": 907000 }, { "epoch": 1.0945372998987333, "learning_rate": 6.377192018918884e-06, "loss": 2.6605288696289064, "step": 907100 }, { "epoch": 1.094657963221216, "learning_rate": 6.3767881834511455e-06, "loss": 2.6306988525390627, "step": 907200 }, { "epoch": 1.0947786265436987, "learning_rate": 6.3763843479834075e-06, "loss": 2.6422216796875, "step": 907300 }, { "epoch": 1.0948992898661813, "learning_rate": 6.3759805125156695e-06, "loss": 2.638782958984375, "step": 907400 }, { "epoch": 1.095019953188664, "learning_rate": 6.375576677047931e-06, "loss": 2.611625061035156, "step": 907500 }, { "epoch": 1.0951406165111468, "learning_rate": 6.375172841580193e-06, "loss": 2.6213568115234374, "step": 907600 }, { "epoch": 1.0952612798336294, "learning_rate": 6.374769006112455e-06, "loss": 2.624462890625, "step": 907700 }, { "epoch": 1.095381943156112, "learning_rate": 6.3743651706447166e-06, "loss": 2.6072543334960936, "step": 907800 }, { "epoch": 1.0955026064785949, "learning_rate": 6.373961335176977e-06, "loss": 2.631005859375, "step": 907900 }, { "epoch": 1.0956232698010775, "learning_rate": 6.373557499709239e-06, "loss": 2.66450439453125, "step": 908000 }, { "epoch": 1.09574393312356, "learning_rate": 6.3731536642415e-06, "loss": 2.609915771484375, "step": 908100 }, { "epoch": 1.095864596446043, "learning_rate": 6.372749828773762e-06, "loss": 2.636405334472656, "step": 908200 }, { "epoch": 1.0959852597685256, "learning_rate": 6.372345993306024e-06, "loss": 2.615126953125, "step": 908300 }, { "epoch": 1.0961059230910082, "learning_rate": 6.371942157838286e-06, "loss": 2.6286636352539063, "step": 908400 }, { "epoch": 1.0962265864134908, "learning_rate": 6.371538322370547e-06, "loss": 2.6300164794921876, "step": 908500 }, { "epoch": 1.0963472497359736, "learning_rate": 6.371134486902809e-06, "loss": 2.6305575561523438, "step": 908600 }, { "epoch": 1.0964679130584563, "learning_rate": 6.370730651435069e-06, "loss": 2.6325006103515625, "step": 908700 }, { "epoch": 1.0965885763809389, "learning_rate": 6.370326815967331e-06, "loss": 2.647330017089844, "step": 908800 }, { "epoch": 1.0967092397034217, "learning_rate": 6.369922980499593e-06, "loss": 2.615975341796875, "step": 908900 }, { "epoch": 1.0968299030259043, "learning_rate": 6.369519145031855e-06, "loss": 2.6406732177734376, "step": 909000 }, { "epoch": 1.096950566348387, "learning_rate": 6.369115309564116e-06, "loss": 2.629495849609375, "step": 909100 }, { "epoch": 1.0970712296708696, "learning_rate": 6.368711474096378e-06, "loss": 2.625262451171875, "step": 909200 }, { "epoch": 1.0971918929933524, "learning_rate": 6.36830763862864e-06, "loss": 2.6298431396484374, "step": 909300 }, { "epoch": 1.097312556315835, "learning_rate": 6.367903803160902e-06, "loss": 2.647391357421875, "step": 909400 }, { "epoch": 1.0974332196383176, "learning_rate": 6.367499967693163e-06, "loss": 2.6330197143554686, "step": 909500 }, { "epoch": 1.0975538829608005, "learning_rate": 6.367096132225425e-06, "loss": 2.634104919433594, "step": 909600 }, { "epoch": 1.097674546283283, "learning_rate": 6.366692296757686e-06, "loss": 2.638111267089844, "step": 909700 }, { "epoch": 1.0977952096057657, "learning_rate": 6.366288461289948e-06, "loss": 2.652773742675781, "step": 909800 }, { "epoch": 1.0979158729282485, "learning_rate": 6.36588462582221e-06, "loss": 2.5806503295898438, "step": 909900 }, { "epoch": 1.0980365362507312, "learning_rate": 6.365480790354472e-06, "loss": 2.6431948852539064, "step": 910000 }, { "epoch": 1.0981571995732138, "learning_rate": 6.365076954886733e-06, "loss": 2.631023254394531, "step": 910100 }, { "epoch": 1.0982778628956966, "learning_rate": 6.364673119418995e-06, "loss": 2.6102178955078124, "step": 910200 }, { "epoch": 1.0983985262181792, "learning_rate": 6.364269283951255e-06, "loss": 2.628664855957031, "step": 910300 }, { "epoch": 1.0985191895406619, "learning_rate": 6.363865448483517e-06, "loss": 2.645428466796875, "step": 910400 }, { "epoch": 1.0986398528631445, "learning_rate": 6.363461613015779e-06, "loss": 2.6269952392578126, "step": 910500 }, { "epoch": 1.0987605161856273, "learning_rate": 6.363057777548041e-06, "loss": 2.626833190917969, "step": 910600 }, { "epoch": 1.09888117950811, "learning_rate": 6.362653942080302e-06, "loss": 2.6228125, "step": 910700 }, { "epoch": 1.0990018428305925, "learning_rate": 6.362250106612564e-06, "loss": 2.643116455078125, "step": 910800 }, { "epoch": 1.0991225061530754, "learning_rate": 6.361846271144826e-06, "loss": 2.624383544921875, "step": 910900 }, { "epoch": 1.099243169475558, "learning_rate": 6.361442435677087e-06, "loss": 2.6385623168945314, "step": 911000 }, { "epoch": 1.0993638327980406, "learning_rate": 6.361038600209349e-06, "loss": 2.631291809082031, "step": 911100 }, { "epoch": 1.0994844961205232, "learning_rate": 6.36063476474161e-06, "loss": 2.6435806274414064, "step": 911200 }, { "epoch": 1.099605159443006, "learning_rate": 6.3602309292738716e-06, "loss": 2.65498779296875, "step": 911300 }, { "epoch": 1.0997258227654887, "learning_rate": 6.3598270938061335e-06, "loss": 2.608807373046875, "step": 911400 }, { "epoch": 1.0998464860879713, "learning_rate": 6.3594232583383955e-06, "loss": 2.651078186035156, "step": 911500 }, { "epoch": 1.0999671494104541, "learning_rate": 6.359019422870657e-06, "loss": 2.6397415161132813, "step": 911600 }, { "epoch": 1.1000878127329368, "learning_rate": 6.358615587402919e-06, "loss": 2.64026123046875, "step": 911700 }, { "epoch": 1.1002084760554194, "learning_rate": 6.358211751935181e-06, "loss": 2.626869812011719, "step": 911800 }, { "epoch": 1.1003291393779022, "learning_rate": 6.357807916467443e-06, "loss": 2.6310769653320314, "step": 911900 }, { "epoch": 1.1004498027003848, "learning_rate": 6.357404080999703e-06, "loss": 2.64161865234375, "step": 912000 }, { "epoch": 1.1005704660228675, "learning_rate": 6.357000245531965e-06, "loss": 2.6233575439453123, "step": 912100 }, { "epoch": 1.1006911293453503, "learning_rate": 6.356596410064226e-06, "loss": 2.6364474487304688, "step": 912200 }, { "epoch": 1.100811792667833, "learning_rate": 6.356192574596488e-06, "loss": 2.6344451904296875, "step": 912300 }, { "epoch": 1.1009324559903155, "learning_rate": 6.35578873912875e-06, "loss": 2.641507263183594, "step": 912400 }, { "epoch": 1.1010531193127981, "learning_rate": 6.355384903661012e-06, "loss": 2.6531829833984375, "step": 912500 }, { "epoch": 1.101173782635281, "learning_rate": 6.354981068193273e-06, "loss": 2.6111309814453123, "step": 912600 }, { "epoch": 1.1012944459577636, "learning_rate": 6.354577232725535e-06, "loss": 2.610431823730469, "step": 912700 }, { "epoch": 1.1014151092802462, "learning_rate": 6.354173397257795e-06, "loss": 2.628868408203125, "step": 912800 }, { "epoch": 1.101535772602729, "learning_rate": 6.353769561790057e-06, "loss": 2.6261962890625, "step": 912900 }, { "epoch": 1.1016564359252117, "learning_rate": 6.353365726322319e-06, "loss": 2.5855657958984377, "step": 913000 }, { "epoch": 1.1017770992476943, "learning_rate": 6.352961890854581e-06, "loss": 2.634139099121094, "step": 913100 }, { "epoch": 1.1018977625701771, "learning_rate": 6.3525580553868424e-06, "loss": 2.64853515625, "step": 913200 }, { "epoch": 1.1020184258926597, "learning_rate": 6.3521542199191044e-06, "loss": 2.6388104248046873, "step": 913300 }, { "epoch": 1.1021390892151424, "learning_rate": 6.351750384451366e-06, "loss": 2.624087219238281, "step": 913400 }, { "epoch": 1.1022597525376252, "learning_rate": 6.3513465489836275e-06, "loss": 2.5903549194335938, "step": 913500 }, { "epoch": 1.1023804158601078, "learning_rate": 6.350942713515889e-06, "loss": 2.6605758666992188, "step": 913600 }, { "epoch": 1.1025010791825904, "learning_rate": 6.350538878048151e-06, "loss": 2.627177429199219, "step": 913700 }, { "epoch": 1.102621742505073, "learning_rate": 6.350135042580412e-06, "loss": 2.613186950683594, "step": 913800 }, { "epoch": 1.102742405827556, "learning_rate": 6.349731207112674e-06, "loss": 2.6338821411132813, "step": 913900 }, { "epoch": 1.1028630691500385, "learning_rate": 6.349327371644936e-06, "loss": 2.6157537841796876, "step": 914000 }, { "epoch": 1.1029837324725211, "learning_rate": 6.348923536177197e-06, "loss": 2.6165045166015624, "step": 914100 }, { "epoch": 1.103104395795004, "learning_rate": 6.348519700709459e-06, "loss": 2.654710388183594, "step": 914200 }, { "epoch": 1.1032250591174866, "learning_rate": 6.348115865241721e-06, "loss": 2.6470526123046874, "step": 914300 }, { "epoch": 1.1033457224399692, "learning_rate": 6.347712029773981e-06, "loss": 2.611097717285156, "step": 914400 }, { "epoch": 1.1034663857624518, "learning_rate": 6.347308194306243e-06, "loss": 2.6148687744140626, "step": 914500 }, { "epoch": 1.1035870490849347, "learning_rate": 6.346904358838505e-06, "loss": 2.6276422119140626, "step": 914600 }, { "epoch": 1.1037077124074173, "learning_rate": 6.346500523370766e-06, "loss": 2.6582366943359377, "step": 914700 }, { "epoch": 1.1038283757299, "learning_rate": 6.346096687903028e-06, "loss": 2.6402099609375, "step": 914800 }, { "epoch": 1.1039490390523827, "learning_rate": 6.34569285243529e-06, "loss": 2.6111935424804686, "step": 914900 }, { "epoch": 1.1040697023748653, "learning_rate": 6.345289016967552e-06, "loss": 2.6616815185546874, "step": 915000 }, { "epoch": 1.104190365697348, "learning_rate": 6.344885181499813e-06, "loss": 2.638768310546875, "step": 915100 }, { "epoch": 1.1043110290198308, "learning_rate": 6.3444813460320745e-06, "loss": 2.63294189453125, "step": 915200 }, { "epoch": 1.1044316923423134, "learning_rate": 6.344077510564336e-06, "loss": 2.6204733276367187, "step": 915300 }, { "epoch": 1.104552355664796, "learning_rate": 6.343673675096598e-06, "loss": 2.5981491088867186, "step": 915400 }, { "epoch": 1.1046730189872789, "learning_rate": 6.3432698396288596e-06, "loss": 2.616934814453125, "step": 915500 }, { "epoch": 1.1047936823097615, "learning_rate": 6.3428660041611216e-06, "loss": 2.6304580688476564, "step": 915600 }, { "epoch": 1.104914345632244, "learning_rate": 6.342462168693383e-06, "loss": 2.6375592041015623, "step": 915700 }, { "epoch": 1.1050350089547267, "learning_rate": 6.342058333225645e-06, "loss": 2.60246826171875, "step": 915800 }, { "epoch": 1.1051556722772096, "learning_rate": 6.341654497757907e-06, "loss": 2.6113128662109375, "step": 915900 }, { "epoch": 1.1052763355996922, "learning_rate": 6.341250662290167e-06, "loss": 2.629444580078125, "step": 916000 }, { "epoch": 1.1053969989221748, "learning_rate": 6.340846826822429e-06, "loss": 2.618221435546875, "step": 916100 }, { "epoch": 1.1055176622446576, "learning_rate": 6.340442991354691e-06, "loss": 2.620465087890625, "step": 916200 }, { "epoch": 1.1056383255671403, "learning_rate": 6.340039155886952e-06, "loss": 2.627161560058594, "step": 916300 }, { "epoch": 1.1057589888896229, "learning_rate": 6.339635320419214e-06, "loss": 2.62619873046875, "step": 916400 }, { "epoch": 1.1058796522121055, "learning_rate": 6.339231484951476e-06, "loss": 2.6389199829101564, "step": 916500 }, { "epoch": 1.1060003155345883, "learning_rate": 6.338827649483737e-06, "loss": 2.64522216796875, "step": 916600 }, { "epoch": 1.106120978857071, "learning_rate": 6.338423814015999e-06, "loss": 2.6253857421875, "step": 916700 }, { "epoch": 1.1062416421795536, "learning_rate": 6.338019978548261e-06, "loss": 2.62248046875, "step": 916800 }, { "epoch": 1.1063623055020364, "learning_rate": 6.337616143080521e-06, "loss": 2.599301452636719, "step": 916900 }, { "epoch": 1.106482968824519, "learning_rate": 6.337212307612783e-06, "loss": 2.637653503417969, "step": 917000 }, { "epoch": 1.1066036321470016, "learning_rate": 6.336808472145045e-06, "loss": 2.614382019042969, "step": 917100 }, { "epoch": 1.1067242954694845, "learning_rate": 6.3364046366773065e-06, "loss": 2.641138000488281, "step": 917200 }, { "epoch": 1.106844958791967, "learning_rate": 6.3360008012095685e-06, "loss": 2.635864562988281, "step": 917300 }, { "epoch": 1.1069656221144497, "learning_rate": 6.3355969657418305e-06, "loss": 2.6546807861328126, "step": 917400 }, { "epoch": 1.1070862854369325, "learning_rate": 6.3351931302740924e-06, "loss": 2.6222711181640626, "step": 917500 }, { "epoch": 1.1072069487594152, "learning_rate": 6.3347892948063536e-06, "loss": 2.6131341552734373, "step": 917600 }, { "epoch": 1.1073276120818978, "learning_rate": 6.334385459338615e-06, "loss": 2.638657531738281, "step": 917700 }, { "epoch": 1.1074482754043804, "learning_rate": 6.333981623870876e-06, "loss": 2.6017019653320315, "step": 917800 }, { "epoch": 1.1075689387268632, "learning_rate": 6.333577788403138e-06, "loss": 2.619889831542969, "step": 917900 }, { "epoch": 1.1076896020493459, "learning_rate": 6.3331739529354e-06, "loss": 2.6416650390625, "step": 918000 }, { "epoch": 1.1078102653718285, "learning_rate": 6.332770117467662e-06, "loss": 2.638194274902344, "step": 918100 }, { "epoch": 1.1079309286943113, "learning_rate": 6.332366281999923e-06, "loss": 2.624028625488281, "step": 918200 }, { "epoch": 1.108051592016794, "learning_rate": 6.331962446532185e-06, "loss": 2.6409161376953123, "step": 918300 }, { "epoch": 1.1081722553392765, "learning_rate": 6.331558611064447e-06, "loss": 2.639848327636719, "step": 918400 }, { "epoch": 1.1082929186617594, "learning_rate": 6.331154775596707e-06, "loss": 2.62400634765625, "step": 918500 }, { "epoch": 1.108413581984242, "learning_rate": 6.330750940128969e-06, "loss": 2.63901123046875, "step": 918600 }, { "epoch": 1.1085342453067246, "learning_rate": 6.330347104661231e-06, "loss": 2.626859436035156, "step": 918700 }, { "epoch": 1.1086549086292075, "learning_rate": 6.329943269193492e-06, "loss": 2.623662414550781, "step": 918800 }, { "epoch": 1.10877557195169, "learning_rate": 6.329539433725754e-06, "loss": 2.635798034667969, "step": 918900 }, { "epoch": 1.1088962352741727, "learning_rate": 6.329135598258016e-06, "loss": 2.6163040161132813, "step": 919000 }, { "epoch": 1.1090168985966553, "learning_rate": 6.328731762790277e-06, "loss": 2.607804870605469, "step": 919100 }, { "epoch": 1.1091375619191381, "learning_rate": 6.328327927322539e-06, "loss": 2.63783447265625, "step": 919200 }, { "epoch": 1.1092582252416208, "learning_rate": 6.3279240918548005e-06, "loss": 2.62074462890625, "step": 919300 }, { "epoch": 1.1093788885641034, "learning_rate": 6.327520256387062e-06, "loss": 2.6211761474609374, "step": 919400 }, { "epoch": 1.1094995518865862, "learning_rate": 6.327116420919324e-06, "loss": 2.6251516723632813, "step": 919500 }, { "epoch": 1.1096202152090688, "learning_rate": 6.326712585451586e-06, "loss": 2.6259335327148436, "step": 919600 }, { "epoch": 1.1097408785315515, "learning_rate": 6.326308749983847e-06, "loss": 2.614272155761719, "step": 919700 }, { "epoch": 1.109861541854034, "learning_rate": 6.325904914516109e-06, "loss": 2.6137469482421873, "step": 919800 }, { "epoch": 1.109982205176517, "learning_rate": 6.325501079048371e-06, "loss": 2.6214724731445314, "step": 919900 }, { "epoch": 1.1101028684989995, "learning_rate": 6.325097243580633e-06, "loss": 2.61711181640625, "step": 920000 }, { "epoch": 1.1102235318214821, "learning_rate": 6.324693408112893e-06, "loss": 2.6019158935546876, "step": 920100 }, { "epoch": 1.110344195143965, "learning_rate": 6.324289572645155e-06, "loss": 2.616114501953125, "step": 920200 }, { "epoch": 1.1104648584664476, "learning_rate": 6.323885737177416e-06, "loss": 2.6538766479492186, "step": 920300 }, { "epoch": 1.1105855217889302, "learning_rate": 6.323481901709678e-06, "loss": 2.633577880859375, "step": 920400 }, { "epoch": 1.110706185111413, "learning_rate": 6.32307806624194e-06, "loss": 2.6151300048828126, "step": 920500 }, { "epoch": 1.1108268484338957, "learning_rate": 6.322674230774202e-06, "loss": 2.6362548828125, "step": 920600 }, { "epoch": 1.1109475117563783, "learning_rate": 6.322270395306463e-06, "loss": 2.621695251464844, "step": 920700 }, { "epoch": 1.1110681750788611, "learning_rate": 6.321866559838725e-06, "loss": 2.6443441772460936, "step": 920800 }, { "epoch": 1.1111888384013437, "learning_rate": 6.3214627243709854e-06, "loss": 2.6037799072265626, "step": 920900 }, { "epoch": 1.1113095017238264, "learning_rate": 6.3210588889032474e-06, "loss": 2.6152114868164062, "step": 921000 }, { "epoch": 1.111430165046309, "learning_rate": 6.320655053435509e-06, "loss": 2.598189697265625, "step": 921100 }, { "epoch": 1.1115508283687918, "learning_rate": 6.320251217967771e-06, "loss": 2.6343179321289063, "step": 921200 }, { "epoch": 1.1116714916912744, "learning_rate": 6.3198473825000325e-06, "loss": 2.605723571777344, "step": 921300 }, { "epoch": 1.111792155013757, "learning_rate": 6.3194435470322945e-06, "loss": 2.63184814453125, "step": 921400 }, { "epoch": 1.11191281833624, "learning_rate": 6.3190397115645565e-06, "loss": 2.614848937988281, "step": 921500 }, { "epoch": 1.1120334816587225, "learning_rate": 6.3186358760968185e-06, "loss": 2.6201519775390625, "step": 921600 }, { "epoch": 1.1121541449812051, "learning_rate": 6.31823204062908e-06, "loss": 2.663558349609375, "step": 921700 }, { "epoch": 1.1122748083036877, "learning_rate": 6.317828205161341e-06, "loss": 2.628737487792969, "step": 921800 }, { "epoch": 1.1123954716261706, "learning_rate": 6.317424369693602e-06, "loss": 2.6429544067382813, "step": 921900 }, { "epoch": 1.1125161349486532, "learning_rate": 6.317020534225864e-06, "loss": 2.6483218383789064, "step": 922000 }, { "epoch": 1.1126367982711358, "learning_rate": 6.316616698758126e-06, "loss": 2.616400146484375, "step": 922100 }, { "epoch": 1.1127574615936187, "learning_rate": 6.316212863290388e-06, "loss": 2.612984619140625, "step": 922200 }, { "epoch": 1.1128781249161013, "learning_rate": 6.315809027822649e-06, "loss": 2.616000061035156, "step": 922300 }, { "epoch": 1.112998788238584, "learning_rate": 6.315405192354911e-06, "loss": 2.630919189453125, "step": 922400 }, { "epoch": 1.1131194515610667, "learning_rate": 6.315001356887173e-06, "loss": 2.629457702636719, "step": 922500 }, { "epoch": 1.1132401148835493, "learning_rate": 6.314597521419433e-06, "loss": 2.633494873046875, "step": 922600 }, { "epoch": 1.113360778206032, "learning_rate": 6.314193685951695e-06, "loss": 2.623704528808594, "step": 922700 }, { "epoch": 1.1134814415285148, "learning_rate": 6.313789850483957e-06, "loss": 2.6036337280273436, "step": 922800 }, { "epoch": 1.1136021048509974, "learning_rate": 6.313386015016218e-06, "loss": 2.6144027709960938, "step": 922900 }, { "epoch": 1.11372276817348, "learning_rate": 6.31298217954848e-06, "loss": 2.618819580078125, "step": 923000 }, { "epoch": 1.1138434314959627, "learning_rate": 6.312578344080742e-06, "loss": 2.6154534912109373, "step": 923100 }, { "epoch": 1.1139640948184455, "learning_rate": 6.312174508613003e-06, "loss": 2.615621337890625, "step": 923200 }, { "epoch": 1.114084758140928, "learning_rate": 6.311770673145265e-06, "loss": 2.628072509765625, "step": 923300 }, { "epoch": 1.1142054214634107, "learning_rate": 6.3113668376775265e-06, "loss": 2.62260009765625, "step": 923400 }, { "epoch": 1.1143260847858936, "learning_rate": 6.310963002209788e-06, "loss": 2.6353564453125, "step": 923500 }, { "epoch": 1.1144467481083762, "learning_rate": 6.31055916674205e-06, "loss": 2.5998666381835935, "step": 923600 }, { "epoch": 1.1145674114308588, "learning_rate": 6.310155331274312e-06, "loss": 2.632518615722656, "step": 923700 }, { "epoch": 1.1146880747533416, "learning_rate": 6.309751495806573e-06, "loss": 2.6251422119140626, "step": 923800 }, { "epoch": 1.1148087380758243, "learning_rate": 6.309347660338835e-06, "loss": 2.6342901611328124, "step": 923900 }, { "epoch": 1.1149294013983069, "learning_rate": 6.308943824871097e-06, "loss": 2.603799133300781, "step": 924000 }, { "epoch": 1.1150500647207897, "learning_rate": 6.308539989403359e-06, "loss": 2.622663879394531, "step": 924100 }, { "epoch": 1.1151707280432723, "learning_rate": 6.308136153935619e-06, "loss": 2.6107131958007814, "step": 924200 }, { "epoch": 1.115291391365755, "learning_rate": 6.307732318467881e-06, "loss": 2.612198486328125, "step": 924300 }, { "epoch": 1.1154120546882376, "learning_rate": 6.307328483000142e-06, "loss": 2.6293988037109375, "step": 924400 }, { "epoch": 1.1155327180107204, "learning_rate": 6.306924647532404e-06, "loss": 2.6243661499023436, "step": 924500 }, { "epoch": 1.115653381333203, "learning_rate": 6.306520812064666e-06, "loss": 2.6502545166015623, "step": 924600 }, { "epoch": 1.1157740446556856, "learning_rate": 6.306116976596928e-06, "loss": 2.64490966796875, "step": 924700 }, { "epoch": 1.1158947079781685, "learning_rate": 6.305713141129189e-06, "loss": 2.594893493652344, "step": 924800 }, { "epoch": 1.116015371300651, "learning_rate": 6.305309305661451e-06, "loss": 2.614312744140625, "step": 924900 }, { "epoch": 1.1161360346231337, "learning_rate": 6.3049054701937115e-06, "loss": 2.609169616699219, "step": 925000 }, { "epoch": 1.1162566979456163, "learning_rate": 6.3045016347259735e-06, "loss": 2.6168475341796875, "step": 925100 }, { "epoch": 1.1163773612680992, "learning_rate": 6.3040977992582354e-06, "loss": 2.5950408935546876, "step": 925200 }, { "epoch": 1.1164980245905818, "learning_rate": 6.3036939637904974e-06, "loss": 2.6377642822265623, "step": 925300 }, { "epoch": 1.1166186879130644, "learning_rate": 6.3032901283227586e-06, "loss": 2.62218017578125, "step": 925400 }, { "epoch": 1.1167393512355472, "learning_rate": 6.3028862928550205e-06, "loss": 2.6217724609375, "step": 925500 }, { "epoch": 1.1168600145580299, "learning_rate": 6.3024824573872825e-06, "loss": 2.6039788818359373, "step": 925600 }, { "epoch": 1.1169806778805125, "learning_rate": 6.302078621919544e-06, "loss": 2.6134164428710935, "step": 925700 }, { "epoch": 1.1171013412029953, "learning_rate": 6.301674786451805e-06, "loss": 2.6209442138671877, "step": 925800 }, { "epoch": 1.117222004525478, "learning_rate": 6.301270950984067e-06, "loss": 2.6269094848632815, "step": 925900 }, { "epoch": 1.1173426678479605, "learning_rate": 6.300867115516328e-06, "loss": 2.617669982910156, "step": 926000 }, { "epoch": 1.1174633311704434, "learning_rate": 6.30046328004859e-06, "loss": 2.622481384277344, "step": 926100 }, { "epoch": 1.117583994492926, "learning_rate": 6.300059444580852e-06, "loss": 2.631622314453125, "step": 926200 }, { "epoch": 1.1177046578154086, "learning_rate": 6.299655609113113e-06, "loss": 2.626204833984375, "step": 926300 }, { "epoch": 1.1178253211378912, "learning_rate": 6.299251773645375e-06, "loss": 2.629308166503906, "step": 926400 }, { "epoch": 1.117945984460374, "learning_rate": 6.298847938177637e-06, "loss": 2.607415771484375, "step": 926500 }, { "epoch": 1.1180666477828567, "learning_rate": 6.298444102709899e-06, "loss": 2.630994873046875, "step": 926600 }, { "epoch": 1.1181873111053393, "learning_rate": 6.298040267242159e-06, "loss": 2.5943280029296876, "step": 926700 }, { "epoch": 1.1183079744278221, "learning_rate": 6.297636431774421e-06, "loss": 2.6235720825195314, "step": 926800 }, { "epoch": 1.1184286377503048, "learning_rate": 6.297232596306682e-06, "loss": 2.5875115966796876, "step": 926900 }, { "epoch": 1.1185493010727874, "learning_rate": 6.296828760838944e-06, "loss": 2.631506042480469, "step": 927000 }, { "epoch": 1.1186699643952702, "learning_rate": 6.296424925371206e-06, "loss": 2.604935302734375, "step": 927100 }, { "epoch": 1.1187906277177528, "learning_rate": 6.296021089903468e-06, "loss": 2.6028903198242186, "step": 927200 }, { "epoch": 1.1189112910402355, "learning_rate": 6.2956172544357295e-06, "loss": 2.6494415283203123, "step": 927300 }, { "epoch": 1.119031954362718, "learning_rate": 6.2952134189679914e-06, "loss": 2.5939511108398436, "step": 927400 }, { "epoch": 1.119152617685201, "learning_rate": 6.294809583500252e-06, "loss": 2.6268084716796873, "step": 927500 }, { "epoch": 1.1192732810076835, "learning_rate": 6.294405748032514e-06, "loss": 2.613397521972656, "step": 927600 }, { "epoch": 1.1193939443301661, "learning_rate": 6.294001912564776e-06, "loss": 2.6268756103515627, "step": 927700 }, { "epoch": 1.119514607652649, "learning_rate": 6.293598077097038e-06, "loss": 2.6097637939453127, "step": 927800 }, { "epoch": 1.1196352709751316, "learning_rate": 6.293194241629299e-06, "loss": 2.6174581909179686, "step": 927900 }, { "epoch": 1.1197559342976142, "learning_rate": 6.292790406161561e-06, "loss": 2.6251385498046873, "step": 928000 }, { "epoch": 1.119876597620097, "learning_rate": 6.292386570693823e-06, "loss": 2.621623229980469, "step": 928100 }, { "epoch": 1.1199972609425797, "learning_rate": 6.291982735226084e-06, "loss": 2.6113571166992187, "step": 928200 }, { "epoch": 1.1201179242650623, "learning_rate": 6.291578899758345e-06, "loss": 2.6311880493164064, "step": 928300 }, { "epoch": 1.120238587587545, "learning_rate": 6.291175064290607e-06, "loss": 2.6203793334960936, "step": 928400 }, { "epoch": 1.1203592509100277, "learning_rate": 6.290771228822868e-06, "loss": 2.6047735595703125, "step": 928500 }, { "epoch": 1.1204799142325104, "learning_rate": 6.29036739335513e-06, "loss": 2.6524578857421877, "step": 928600 }, { "epoch": 1.120600577554993, "learning_rate": 6.289963557887392e-06, "loss": 2.6032177734375, "step": 928700 }, { "epoch": 1.1207212408774758, "learning_rate": 6.289559722419653e-06, "loss": 2.6334072875976564, "step": 928800 }, { "epoch": 1.1208419041999584, "learning_rate": 6.289155886951915e-06, "loss": 2.6086444091796874, "step": 928900 }, { "epoch": 1.120962567522441, "learning_rate": 6.288752051484177e-06, "loss": 2.588970031738281, "step": 929000 }, { "epoch": 1.121083230844924, "learning_rate": 6.2883482160164375e-06, "loss": 2.60943603515625, "step": 929100 }, { "epoch": 1.1212038941674065, "learning_rate": 6.2879443805486995e-06, "loss": 2.618482666015625, "step": 929200 }, { "epoch": 1.1213245574898891, "learning_rate": 6.2875405450809615e-06, "loss": 2.6223764038085937, "step": 929300 }, { "epoch": 1.121445220812372, "learning_rate": 6.287136709613223e-06, "loss": 2.6269989013671875, "step": 929400 }, { "epoch": 1.1215658841348546, "learning_rate": 6.286732874145485e-06, "loss": 2.6029052734375, "step": 929500 }, { "epoch": 1.1216865474573372, "learning_rate": 6.286329038677747e-06, "loss": 2.6298321533203124, "step": 929600 }, { "epoch": 1.1218072107798198, "learning_rate": 6.2859252032100086e-06, "loss": 2.64248779296875, "step": 929700 }, { "epoch": 1.1219278741023027, "learning_rate": 6.28552136774227e-06, "loss": 2.6314566040039065, "step": 929800 }, { "epoch": 1.1220485374247853, "learning_rate": 6.285117532274531e-06, "loss": 2.623665771484375, "step": 929900 }, { "epoch": 1.122169200747268, "learning_rate": 6.284713696806792e-06, "loss": 2.648373718261719, "step": 930000 }, { "epoch": 1.1222898640697507, "learning_rate": 6.284309861339054e-06, "loss": 2.6323306274414064, "step": 930100 }, { "epoch": 1.1224105273922333, "learning_rate": 6.283906025871316e-06, "loss": 2.6171710205078127, "step": 930200 }, { "epoch": 1.122531190714716, "learning_rate": 6.283502190403578e-06, "loss": 2.6217340087890624, "step": 930300 }, { "epoch": 1.1226518540371986, "learning_rate": 6.283098354935839e-06, "loss": 2.594351806640625, "step": 930400 }, { "epoch": 1.1227725173596814, "learning_rate": 6.282694519468101e-06, "loss": 2.6213192749023437, "step": 930500 }, { "epoch": 1.122893180682164, "learning_rate": 6.282290684000363e-06, "loss": 2.6161907958984374, "step": 930600 }, { "epoch": 1.1230138440046467, "learning_rate": 6.281886848532623e-06, "loss": 2.6039700317382812, "step": 930700 }, { "epoch": 1.1231345073271295, "learning_rate": 6.281483013064885e-06, "loss": 2.6187612915039065, "step": 930800 }, { "epoch": 1.1232551706496121, "learning_rate": 6.281079177597147e-06, "loss": 2.6220416259765624, "step": 930900 }, { "epoch": 1.1233758339720947, "learning_rate": 6.280675342129408e-06, "loss": 2.615478210449219, "step": 931000 }, { "epoch": 1.1234964972945776, "learning_rate": 6.28027150666167e-06, "loss": 2.60112548828125, "step": 931100 }, { "epoch": 1.1236171606170602, "learning_rate": 6.279867671193932e-06, "loss": 2.6547198486328125, "step": 931200 }, { "epoch": 1.1237378239395428, "learning_rate": 6.2794638357261935e-06, "loss": 2.632742614746094, "step": 931300 }, { "epoch": 1.1238584872620256, "learning_rate": 6.2790600002584555e-06, "loss": 2.6175326538085937, "step": 931400 }, { "epoch": 1.1239791505845083, "learning_rate": 6.278656164790717e-06, "loss": 2.61483154296875, "step": 931500 }, { "epoch": 1.1240998139069909, "learning_rate": 6.278252329322978e-06, "loss": 2.603729553222656, "step": 931600 }, { "epoch": 1.1242204772294735, "learning_rate": 6.27784849385524e-06, "loss": 2.6125112915039064, "step": 931700 }, { "epoch": 1.1243411405519563, "learning_rate": 6.277444658387502e-06, "loss": 2.6084246826171875, "step": 931800 }, { "epoch": 1.124461803874439, "learning_rate": 6.277040822919763e-06, "loss": 2.612613525390625, "step": 931900 }, { "epoch": 1.1245824671969216, "learning_rate": 6.276636987452025e-06, "loss": 2.629849548339844, "step": 932000 }, { "epoch": 1.1247031305194044, "learning_rate": 6.276233151984287e-06, "loss": 2.6373214721679688, "step": 932100 }, { "epoch": 1.124823793841887, "learning_rate": 6.275829316516549e-06, "loss": 2.62805419921875, "step": 932200 }, { "epoch": 1.1249444571643696, "learning_rate": 6.27542548104881e-06, "loss": 2.598486022949219, "step": 932300 }, { "epoch": 1.1250651204868523, "learning_rate": 6.275021645581071e-06, "loss": 2.6379318237304688, "step": 932400 }, { "epoch": 1.125185783809335, "learning_rate": 6.274617810113332e-06, "loss": 2.6169586181640625, "step": 932500 }, { "epoch": 1.1253064471318177, "learning_rate": 6.274213974645594e-06, "loss": 2.6373910522460937, "step": 932600 }, { "epoch": 1.1254271104543005, "learning_rate": 6.273810139177856e-06, "loss": 2.599747619628906, "step": 932700 }, { "epoch": 1.1255477737767832, "learning_rate": 6.273406303710118e-06, "loss": 2.6338839721679688, "step": 932800 }, { "epoch": 1.1256684370992658, "learning_rate": 6.273002468242379e-06, "loss": 2.6351577758789064, "step": 932900 }, { "epoch": 1.1257891004217484, "learning_rate": 6.272598632774641e-06, "loss": 2.5821319580078126, "step": 933000 }, { "epoch": 1.1259097637442312, "learning_rate": 6.272194797306903e-06, "loss": 2.618014221191406, "step": 933100 }, { "epoch": 1.1260304270667139, "learning_rate": 6.2717909618391635e-06, "loss": 2.63196044921875, "step": 933200 }, { "epoch": 1.1261510903891965, "learning_rate": 6.2713871263714255e-06, "loss": 2.626383972167969, "step": 933300 }, { "epoch": 1.1262717537116793, "learning_rate": 6.2709832909036875e-06, "loss": 2.624905700683594, "step": 933400 }, { "epoch": 1.126392417034162, "learning_rate": 6.270579455435949e-06, "loss": 2.5933685302734375, "step": 933500 }, { "epoch": 1.1265130803566445, "learning_rate": 6.270175619968211e-06, "loss": 2.614072570800781, "step": 933600 }, { "epoch": 1.1266337436791272, "learning_rate": 6.269771784500473e-06, "loss": 2.6289352416992187, "step": 933700 }, { "epoch": 1.12675440700161, "learning_rate": 6.269367949032734e-06, "loss": 2.606445007324219, "step": 933800 }, { "epoch": 1.1268750703240926, "learning_rate": 6.268964113564996e-06, "loss": 2.616314697265625, "step": 933900 }, { "epoch": 1.1269957336465752, "learning_rate": 6.268560278097257e-06, "loss": 2.599975891113281, "step": 934000 }, { "epoch": 1.127116396969058, "learning_rate": 6.268156442629518e-06, "loss": 2.6374356079101564, "step": 934100 }, { "epoch": 1.1272370602915407, "learning_rate": 6.26775260716178e-06, "loss": 2.6217596435546877, "step": 934200 }, { "epoch": 1.1273577236140233, "learning_rate": 6.267348771694042e-06, "loss": 2.6271783447265626, "step": 934300 }, { "epoch": 1.1274783869365061, "learning_rate": 6.266944936226303e-06, "loss": 2.6368289184570313, "step": 934400 }, { "epoch": 1.1275990502589888, "learning_rate": 6.266541100758565e-06, "loss": 2.6348910522460938, "step": 934500 }, { "epoch": 1.1277197135814714, "learning_rate": 6.266137265290827e-06, "loss": 2.646974792480469, "step": 934600 }, { "epoch": 1.1278403769039542, "learning_rate": 6.265733429823089e-06, "loss": 2.6231350708007812, "step": 934700 }, { "epoch": 1.1279610402264368, "learning_rate": 6.265329594355349e-06, "loss": 2.6051885986328127, "step": 934800 }, { "epoch": 1.1280817035489195, "learning_rate": 6.264925758887611e-06, "loss": 2.63467041015625, "step": 934900 }, { "epoch": 1.128202366871402, "learning_rate": 6.2645219234198725e-06, "loss": 2.635914001464844, "step": 935000 }, { "epoch": 1.128323030193885, "learning_rate": 6.2641180879521344e-06, "loss": 2.6149423217773435, "step": 935100 }, { "epoch": 1.1284436935163675, "learning_rate": 6.263714252484396e-06, "loss": 2.5852597045898436, "step": 935200 }, { "epoch": 1.1285643568388501, "learning_rate": 6.263310417016658e-06, "loss": 2.6139410400390624, "step": 935300 }, { "epoch": 1.128685020161333, "learning_rate": 6.2629065815489195e-06, "loss": 2.610517883300781, "step": 935400 }, { "epoch": 1.1288056834838156, "learning_rate": 6.2625027460811815e-06, "loss": 2.6214556884765625, "step": 935500 }, { "epoch": 1.1289263468062982, "learning_rate": 6.262098910613442e-06, "loss": 2.638338623046875, "step": 935600 }, { "epoch": 1.1290470101287808, "learning_rate": 6.261695075145704e-06, "loss": 2.61470703125, "step": 935700 }, { "epoch": 1.1291676734512637, "learning_rate": 6.261291239677966e-06, "loss": 2.6242041015625, "step": 935800 }, { "epoch": 1.1292883367737463, "learning_rate": 6.260887404210228e-06, "loss": 2.5793386840820314, "step": 935900 }, { "epoch": 1.129409000096229, "learning_rate": 6.260483568742489e-06, "loss": 2.6430029296875, "step": 936000 }, { "epoch": 1.1295296634187117, "learning_rate": 6.260079733274751e-06, "loss": 2.6267239379882814, "step": 936100 }, { "epoch": 1.1296503267411944, "learning_rate": 6.259675897807013e-06, "loss": 2.6037213134765627, "step": 936200 }, { "epoch": 1.129770990063677, "learning_rate": 6.259272062339275e-06, "loss": 2.5900140380859376, "step": 936300 }, { "epoch": 1.1298916533861598, "learning_rate": 6.258868226871535e-06, "loss": 2.5999432373046876, "step": 936400 }, { "epoch": 1.1300123167086424, "learning_rate": 6.258464391403797e-06, "loss": 2.5986273193359377, "step": 936500 }, { "epoch": 1.130132980031125, "learning_rate": 6.258060555936058e-06, "loss": 2.6146206665039062, "step": 936600 }, { "epoch": 1.130253643353608, "learning_rate": 6.25765672046832e-06, "loss": 2.629852294921875, "step": 936700 }, { "epoch": 1.1303743066760905, "learning_rate": 6.257252885000582e-06, "loss": 2.6136505126953127, "step": 936800 }, { "epoch": 1.1304949699985731, "learning_rate": 6.256849049532844e-06, "loss": 2.6186517333984374, "step": 936900 }, { "epoch": 1.1306156333210557, "learning_rate": 6.256445214065105e-06, "loss": 2.617464599609375, "step": 937000 }, { "epoch": 1.1307362966435386, "learning_rate": 6.256041378597367e-06, "loss": 2.6281915283203126, "step": 937100 }, { "epoch": 1.1308569599660212, "learning_rate": 6.255637543129629e-06, "loss": 2.613961486816406, "step": 937200 }, { "epoch": 1.1309776232885038, "learning_rate": 6.25523370766189e-06, "loss": 2.6067169189453123, "step": 937300 }, { "epoch": 1.1310982866109867, "learning_rate": 6.2548298721941516e-06, "loss": 2.6028924560546876, "step": 937400 }, { "epoch": 1.1312189499334693, "learning_rate": 6.2544260367264135e-06, "loss": 2.607696838378906, "step": 937500 }, { "epoch": 1.131339613255952, "learning_rate": 6.254022201258675e-06, "loss": 2.624076232910156, "step": 937600 }, { "epoch": 1.1314602765784345, "learning_rate": 6.253618365790937e-06, "loss": 2.623883056640625, "step": 937700 }, { "epoch": 1.1315809399009173, "learning_rate": 6.253214530323199e-06, "loss": 2.621484680175781, "step": 937800 }, { "epoch": 1.1317016032234, "learning_rate": 6.25281069485546e-06, "loss": 2.60453125, "step": 937900 }, { "epoch": 1.1318222665458828, "learning_rate": 6.252406859387722e-06, "loss": 2.6245297241210936, "step": 938000 }, { "epoch": 1.1319429298683654, "learning_rate": 6.252003023919983e-06, "loss": 2.625582275390625, "step": 938100 }, { "epoch": 1.132063593190848, "learning_rate": 6.251599188452244e-06, "loss": 2.63792236328125, "step": 938200 }, { "epoch": 1.1321842565133307, "learning_rate": 6.251195352984506e-06, "loss": 2.593336181640625, "step": 938300 }, { "epoch": 1.1323049198358135, "learning_rate": 6.250791517516768e-06, "loss": 2.6023223876953123, "step": 938400 }, { "epoch": 1.1324255831582961, "learning_rate": 6.250387682049029e-06, "loss": 2.5944082641601565, "step": 938500 }, { "epoch": 1.1325462464807787, "learning_rate": 6.249983846581291e-06, "loss": 2.598961181640625, "step": 938600 }, { "epoch": 1.1326669098032616, "learning_rate": 6.249580011113553e-06, "loss": 2.631778564453125, "step": 938700 }, { "epoch": 1.1327875731257442, "learning_rate": 6.249176175645815e-06, "loss": 2.604162292480469, "step": 938800 }, { "epoch": 1.1329082364482268, "learning_rate": 6.248772340178075e-06, "loss": 2.6188223266601565, "step": 938900 }, { "epoch": 1.1330288997707094, "learning_rate": 6.248368504710337e-06, "loss": 2.625703125, "step": 939000 }, { "epoch": 1.1331495630931923, "learning_rate": 6.2479646692425985e-06, "loss": 2.6207144165039065, "step": 939100 }, { "epoch": 1.1332702264156749, "learning_rate": 6.2475608337748605e-06, "loss": 2.6054571533203124, "step": 939200 }, { "epoch": 1.1333908897381575, "learning_rate": 6.2471569983071225e-06, "loss": 2.6353729248046873, "step": 939300 }, { "epoch": 1.1335115530606403, "learning_rate": 6.2467531628393844e-06, "loss": 2.596302185058594, "step": 939400 }, { "epoch": 1.133632216383123, "learning_rate": 6.2463493273716456e-06, "loss": 2.606475524902344, "step": 939500 }, { "epoch": 1.1337528797056056, "learning_rate": 6.2459454919039076e-06, "loss": 2.5988934326171873, "step": 939600 }, { "epoch": 1.1338735430280884, "learning_rate": 6.245541656436168e-06, "loss": 2.612318115234375, "step": 939700 }, { "epoch": 1.133994206350571, "learning_rate": 6.24513782096843e-06, "loss": 2.636504821777344, "step": 939800 }, { "epoch": 1.1341148696730536, "learning_rate": 6.244733985500692e-06, "loss": 2.6001861572265623, "step": 939900 }, { "epoch": 1.1342355329955365, "learning_rate": 6.244330150032954e-06, "loss": 2.594765319824219, "step": 940000 }, { "epoch": 1.134356196318019, "learning_rate": 6.243926314565215e-06, "loss": 2.617511901855469, "step": 940100 }, { "epoch": 1.1344768596405017, "learning_rate": 6.243522479097477e-06, "loss": 2.61108642578125, "step": 940200 }, { "epoch": 1.1345975229629843, "learning_rate": 6.243118643629739e-06, "loss": 2.6141842651367186, "step": 940300 }, { "epoch": 1.1347181862854672, "learning_rate": 6.242714808162e-06, "loss": 2.640875244140625, "step": 940400 }, { "epoch": 1.1348388496079498, "learning_rate": 6.242310972694261e-06, "loss": 2.629657897949219, "step": 940500 }, { "epoch": 1.1349595129304324, "learning_rate": 6.241907137226523e-06, "loss": 2.588307189941406, "step": 940600 }, { "epoch": 1.1350801762529152, "learning_rate": 6.241503301758784e-06, "loss": 2.5940234375, "step": 940700 }, { "epoch": 1.1352008395753979, "learning_rate": 6.241099466291046e-06, "loss": 2.6365170288085937, "step": 940800 }, { "epoch": 1.1353215028978805, "learning_rate": 6.240695630823308e-06, "loss": 2.6187786865234375, "step": 940900 }, { "epoch": 1.135442166220363, "learning_rate": 6.240291795355569e-06, "loss": 2.6286370849609373, "step": 941000 }, { "epoch": 1.135562829542846, "learning_rate": 6.239887959887831e-06, "loss": 2.6029263305664063, "step": 941100 }, { "epoch": 1.1356834928653285, "learning_rate": 6.239484124420093e-06, "loss": 2.6267413330078124, "step": 941200 }, { "epoch": 1.1358041561878112, "learning_rate": 6.239080288952354e-06, "loss": 2.6064321899414065, "step": 941300 }, { "epoch": 1.135924819510294, "learning_rate": 6.238676453484616e-06, "loss": 2.6161233520507814, "step": 941400 }, { "epoch": 1.1360454828327766, "learning_rate": 6.238272618016878e-06, "loss": 2.6594473266601564, "step": 941500 }, { "epoch": 1.1361661461552592, "learning_rate": 6.237868782549139e-06, "loss": 2.635657958984375, "step": 941600 }, { "epoch": 1.136286809477742, "learning_rate": 6.237464947081401e-06, "loss": 2.6091436767578124, "step": 941700 }, { "epoch": 1.1364074728002247, "learning_rate": 6.237061111613663e-06, "loss": 2.6426156616210936, "step": 941800 }, { "epoch": 1.1365281361227073, "learning_rate": 6.236657276145925e-06, "loss": 2.610916748046875, "step": 941900 }, { "epoch": 1.1366487994451901, "learning_rate": 6.236253440678186e-06, "loss": 2.612365417480469, "step": 942000 }, { "epoch": 1.1367694627676728, "learning_rate": 6.235849605210448e-06, "loss": 2.620144958496094, "step": 942100 }, { "epoch": 1.1368901260901554, "learning_rate": 6.235445769742708e-06, "loss": 2.6269573974609375, "step": 942200 }, { "epoch": 1.137010789412638, "learning_rate": 6.23504193427497e-06, "loss": 2.604497985839844, "step": 942300 }, { "epoch": 1.1371314527351208, "learning_rate": 6.234638098807232e-06, "loss": 2.6113055419921873, "step": 942400 }, { "epoch": 1.1372521160576035, "learning_rate": 6.234234263339494e-06, "loss": 2.6067401123046876, "step": 942500 }, { "epoch": 1.137372779380086, "learning_rate": 6.233830427871755e-06, "loss": 2.595289306640625, "step": 942600 }, { "epoch": 1.137493442702569, "learning_rate": 6.233426592404017e-06, "loss": 2.622913513183594, "step": 942700 }, { "epoch": 1.1376141060250515, "learning_rate": 6.233022756936279e-06, "loss": 2.635110168457031, "step": 942800 }, { "epoch": 1.1377347693475341, "learning_rate": 6.23261892146854e-06, "loss": 2.634896240234375, "step": 942900 }, { "epoch": 1.1378554326700168, "learning_rate": 6.232215086000801e-06, "loss": 2.6030059814453126, "step": 943000 }, { "epoch": 1.1379760959924996, "learning_rate": 6.231811250533063e-06, "loss": 2.6297747802734377, "step": 943100 }, { "epoch": 1.1380967593149822, "learning_rate": 6.2314074150653245e-06, "loss": 2.5927593994140623, "step": 943200 }, { "epoch": 1.138217422637465, "learning_rate": 6.2310035795975865e-06, "loss": 2.6345748901367188, "step": 943300 }, { "epoch": 1.1383380859599477, "learning_rate": 6.2305997441298485e-06, "loss": 2.6164886474609377, "step": 943400 }, { "epoch": 1.1384587492824303, "learning_rate": 6.23019590866211e-06, "loss": 2.6260995483398437, "step": 943500 }, { "epoch": 1.138579412604913, "learning_rate": 6.229792073194372e-06, "loss": 2.5948248291015625, "step": 943600 }, { "epoch": 1.1387000759273957, "learning_rate": 6.229388237726634e-06, "loss": 2.6124539184570312, "step": 943700 }, { "epoch": 1.1388207392498784, "learning_rate": 6.228984402258894e-06, "loss": 2.6130096435546877, "step": 943800 }, { "epoch": 1.138941402572361, "learning_rate": 6.228580566791156e-06, "loss": 2.6143069458007813, "step": 943900 }, { "epoch": 1.1390620658948438, "learning_rate": 6.228176731323418e-06, "loss": 2.6088702392578127, "step": 944000 }, { "epoch": 1.1391827292173264, "learning_rate": 6.227772895855679e-06, "loss": 2.615647277832031, "step": 944100 }, { "epoch": 1.139303392539809, "learning_rate": 6.227369060387941e-06, "loss": 2.629200439453125, "step": 944200 }, { "epoch": 1.1394240558622917, "learning_rate": 6.226965224920203e-06, "loss": 2.6127114868164063, "step": 944300 }, { "epoch": 1.1395447191847745, "learning_rate": 6.226561389452465e-06, "loss": 2.60292724609375, "step": 944400 }, { "epoch": 1.1396653825072571, "learning_rate": 6.226157553984726e-06, "loss": 2.63016357421875, "step": 944500 }, { "epoch": 1.1397860458297397, "learning_rate": 6.225753718516987e-06, "loss": 2.6047271728515624, "step": 944600 }, { "epoch": 1.1399067091522226, "learning_rate": 6.225349883049248e-06, "loss": 2.6140899658203125, "step": 944700 }, { "epoch": 1.1400273724747052, "learning_rate": 6.22494604758151e-06, "loss": 2.613972473144531, "step": 944800 }, { "epoch": 1.1401480357971878, "learning_rate": 6.224542212113772e-06, "loss": 2.5908935546875, "step": 944900 }, { "epoch": 1.1402686991196707, "learning_rate": 6.224138376646034e-06, "loss": 2.6209951782226564, "step": 945000 }, { "epoch": 1.1403893624421533, "learning_rate": 6.223734541178295e-06, "loss": 2.6047869873046876, "step": 945100 }, { "epoch": 1.140510025764636, "learning_rate": 6.223330705710557e-06, "loss": 2.592830810546875, "step": 945200 }, { "epoch": 1.1406306890871187, "learning_rate": 6.222926870242819e-06, "loss": 2.6129556274414063, "step": 945300 }, { "epoch": 1.1407513524096013, "learning_rate": 6.22252303477508e-06, "loss": 2.594706726074219, "step": 945400 }, { "epoch": 1.140872015732084, "learning_rate": 6.222119199307342e-06, "loss": 2.5724871826171873, "step": 945500 }, { "epoch": 1.1409926790545666, "learning_rate": 6.221715363839604e-06, "loss": 2.6203207397460937, "step": 945600 }, { "epoch": 1.1411133423770494, "learning_rate": 6.221311528371865e-06, "loss": 2.6257400512695312, "step": 945700 }, { "epoch": 1.141234005699532, "learning_rate": 6.220907692904127e-06, "loss": 2.6282992553710938, "step": 945800 }, { "epoch": 1.1413546690220147, "learning_rate": 6.220503857436389e-06, "loss": 2.617237243652344, "step": 945900 }, { "epoch": 1.1414753323444975, "learning_rate": 6.22010002196865e-06, "loss": 2.6210662841796877, "step": 946000 }, { "epoch": 1.1415959956669801, "learning_rate": 6.219696186500912e-06, "loss": 2.618955078125, "step": 946100 }, { "epoch": 1.1417166589894627, "learning_rate": 6.219292351033173e-06, "loss": 2.570051574707031, "step": 946200 }, { "epoch": 1.1418373223119453, "learning_rate": 6.218888515565434e-06, "loss": 2.6150445556640625, "step": 946300 }, { "epoch": 1.1419579856344282, "learning_rate": 6.218484680097696e-06, "loss": 2.610651550292969, "step": 946400 }, { "epoch": 1.1420786489569108, "learning_rate": 6.218080844629958e-06, "loss": 2.5864691162109374, "step": 946500 }, { "epoch": 1.1421993122793934, "learning_rate": 6.217677009162219e-06, "loss": 2.63109130859375, "step": 946600 }, { "epoch": 1.1423199756018763, "learning_rate": 6.217273173694481e-06, "loss": 2.59879150390625, "step": 946700 }, { "epoch": 1.1424406389243589, "learning_rate": 6.216869338226743e-06, "loss": 2.6015185546875, "step": 946800 }, { "epoch": 1.1425613022468415, "learning_rate": 6.216465502759005e-06, "loss": 2.622770080566406, "step": 946900 }, { "epoch": 1.1426819655693243, "learning_rate": 6.2160616672912655e-06, "loss": 2.6356069946289065, "step": 947000 }, { "epoch": 1.142802628891807, "learning_rate": 6.2156578318235274e-06, "loss": 2.626424560546875, "step": 947100 }, { "epoch": 1.1429232922142896, "learning_rate": 6.2152539963557886e-06, "loss": 2.6052490234375, "step": 947200 }, { "epoch": 1.1430439555367724, "learning_rate": 6.2148501608880506e-06, "loss": 2.5885882568359375, "step": 947300 }, { "epoch": 1.143164618859255, "learning_rate": 6.2144463254203125e-06, "loss": 2.6020327758789064, "step": 947400 }, { "epoch": 1.1432852821817376, "learning_rate": 6.2140424899525745e-06, "loss": 2.6133953857421877, "step": 947500 }, { "epoch": 1.1434059455042203, "learning_rate": 6.213638654484836e-06, "loss": 2.6125137329101564, "step": 947600 }, { "epoch": 1.143526608826703, "learning_rate": 6.213234819017098e-06, "loss": 2.6151809692382812, "step": 947700 }, { "epoch": 1.1436472721491857, "learning_rate": 6.21283098354936e-06, "loss": 2.6079888916015626, "step": 947800 }, { "epoch": 1.1437679354716683, "learning_rate": 6.21242714808162e-06, "loss": 2.6306951904296874, "step": 947900 }, { "epoch": 1.1438885987941512, "learning_rate": 6.212023312613882e-06, "loss": 2.6356436157226564, "step": 948000 }, { "epoch": 1.1440092621166338, "learning_rate": 6.211619477146144e-06, "loss": 2.6355154418945315, "step": 948100 }, { "epoch": 1.1441299254391164, "learning_rate": 6.211215641678405e-06, "loss": 2.6309628295898437, "step": 948200 }, { "epoch": 1.144250588761599, "learning_rate": 6.210811806210667e-06, "loss": 2.6163394165039064, "step": 948300 }, { "epoch": 1.1443712520840819, "learning_rate": 6.210407970742929e-06, "loss": 2.641640625, "step": 948400 }, { "epoch": 1.1444919154065645, "learning_rate": 6.21000413527519e-06, "loss": 2.6174142456054685, "step": 948500 }, { "epoch": 1.1446125787290473, "learning_rate": 6.209600299807452e-06, "loss": 2.611031188964844, "step": 948600 }, { "epoch": 1.14473324205153, "learning_rate": 6.209196464339713e-06, "loss": 2.590994567871094, "step": 948700 }, { "epoch": 1.1448539053740125, "learning_rate": 6.208792628871974e-06, "loss": 2.5961676025390625, "step": 948800 }, { "epoch": 1.1449745686964952, "learning_rate": 6.208388793404236e-06, "loss": 2.6135299682617186, "step": 948900 }, { "epoch": 1.145095232018978, "learning_rate": 6.207984957936498e-06, "loss": 2.620563659667969, "step": 949000 }, { "epoch": 1.1452158953414606, "learning_rate": 6.2075811224687595e-06, "loss": 2.6126742553710938, "step": 949100 }, { "epoch": 1.1453365586639432, "learning_rate": 6.2071772870010214e-06, "loss": 2.616917724609375, "step": 949200 }, { "epoch": 1.145457221986426, "learning_rate": 6.2067734515332834e-06, "loss": 2.5921734619140624, "step": 949300 }, { "epoch": 1.1455778853089087, "learning_rate": 6.206369616065545e-06, "loss": 2.6025921630859377, "step": 949400 }, { "epoch": 1.1456985486313913, "learning_rate": 6.205965780597806e-06, "loss": 2.611419677734375, "step": 949500 }, { "epoch": 1.145819211953874, "learning_rate": 6.205561945130068e-06, "loss": 2.6084991455078126, "step": 949600 }, { "epoch": 1.1459398752763568, "learning_rate": 6.205158109662329e-06, "loss": 2.614696350097656, "step": 949700 }, { "epoch": 1.1460605385988394, "learning_rate": 6.204754274194591e-06, "loss": 2.6101699829101563, "step": 949800 }, { "epoch": 1.146181201921322, "learning_rate": 6.204350438726853e-06, "loss": 2.600971374511719, "step": 949900 }, { "epoch": 1.1463018652438048, "learning_rate": 6.203946603259115e-06, "loss": 2.6160879516601563, "step": 950000 }, { "epoch": 1.1464225285662875, "learning_rate": 6.203542767791376e-06, "loss": 2.6071121215820314, "step": 950100 }, { "epoch": 1.14654319188877, "learning_rate": 6.203138932323638e-06, "loss": 2.612298889160156, "step": 950200 }, { "epoch": 1.146663855211253, "learning_rate": 6.202735096855898e-06, "loss": 2.622821960449219, "step": 950300 }, { "epoch": 1.1467845185337355, "learning_rate": 6.20233126138816e-06, "loss": 2.6132998657226563, "step": 950400 }, { "epoch": 1.1469051818562181, "learning_rate": 6.201927425920422e-06, "loss": 2.619720153808594, "step": 950500 }, { "epoch": 1.147025845178701, "learning_rate": 6.201523590452684e-06, "loss": 2.6135708618164064, "step": 950600 }, { "epoch": 1.1471465085011836, "learning_rate": 6.201119754984945e-06, "loss": 2.6075100708007812, "step": 950700 }, { "epoch": 1.1472671718236662, "learning_rate": 6.200715919517207e-06, "loss": 2.6029238891601563, "step": 950800 }, { "epoch": 1.1473878351461488, "learning_rate": 6.200312084049469e-06, "loss": 2.5948748779296875, "step": 950900 }, { "epoch": 1.1475084984686317, "learning_rate": 6.199908248581731e-06, "loss": 2.6129000854492186, "step": 951000 }, { "epoch": 1.1476291617911143, "learning_rate": 6.1995044131139915e-06, "loss": 2.6263623046875, "step": 951100 }, { "epoch": 1.147749825113597, "learning_rate": 6.1991005776462535e-06, "loss": 2.6212701416015625, "step": 951200 }, { "epoch": 1.1478704884360798, "learning_rate": 6.198696742178515e-06, "loss": 2.610265197753906, "step": 951300 }, { "epoch": 1.1479911517585624, "learning_rate": 6.198292906710777e-06, "loss": 2.609844055175781, "step": 951400 }, { "epoch": 1.148111815081045, "learning_rate": 6.1978890712430386e-06, "loss": 2.598408203125, "step": 951500 }, { "epoch": 1.1482324784035276, "learning_rate": 6.1974852357753006e-06, "loss": 2.6211373901367185, "step": 951600 }, { "epoch": 1.1483531417260104, "learning_rate": 6.197081400307562e-06, "loss": 2.608787841796875, "step": 951700 }, { "epoch": 1.148473805048493, "learning_rate": 6.196677564839824e-06, "loss": 2.6135687255859374, "step": 951800 }, { "epoch": 1.1485944683709757, "learning_rate": 6.196273729372084e-06, "loss": 2.610379333496094, "step": 951900 }, { "epoch": 1.1487151316934585, "learning_rate": 6.195869893904346e-06, "loss": 2.621862487792969, "step": 952000 }, { "epoch": 1.1488357950159411, "learning_rate": 6.195466058436608e-06, "loss": 2.6043603515625, "step": 952100 }, { "epoch": 1.1489564583384237, "learning_rate": 6.19506222296887e-06, "loss": 2.605713195800781, "step": 952200 }, { "epoch": 1.1490771216609066, "learning_rate": 6.194658387501131e-06, "loss": 2.6134152221679687, "step": 952300 }, { "epoch": 1.1491977849833892, "learning_rate": 6.194254552033393e-06, "loss": 2.6090911865234374, "step": 952400 }, { "epoch": 1.1493184483058718, "learning_rate": 6.193850716565655e-06, "loss": 2.5746710205078127, "step": 952500 }, { "epoch": 1.1494391116283547, "learning_rate": 6.193446881097916e-06, "loss": 2.5977328491210936, "step": 952600 }, { "epoch": 1.1495597749508373, "learning_rate": 6.193043045630178e-06, "loss": 2.5947311401367186, "step": 952700 }, { "epoch": 1.14968043827332, "learning_rate": 6.192639210162439e-06, "loss": 2.61755126953125, "step": 952800 }, { "epoch": 1.1498011015958025, "learning_rate": 6.1922353746947e-06, "loss": 2.6275177001953125, "step": 952900 }, { "epoch": 1.1499217649182853, "learning_rate": 6.191831539226962e-06, "loss": 2.6163043212890624, "step": 953000 }, { "epoch": 1.150042428240768, "learning_rate": 6.191427703759224e-06, "loss": 2.600805358886719, "step": 953100 }, { "epoch": 1.1501630915632506, "learning_rate": 6.1910238682914855e-06, "loss": 2.6172439575195314, "step": 953200 }, { "epoch": 1.1502837548857334, "learning_rate": 6.1906200328237475e-06, "loss": 2.572999267578125, "step": 953300 }, { "epoch": 1.150404418208216, "learning_rate": 6.1902161973560095e-06, "loss": 2.6003271484375, "step": 953400 }, { "epoch": 1.1505250815306987, "learning_rate": 6.1898123618882714e-06, "loss": 2.601137390136719, "step": 953500 }, { "epoch": 1.1506457448531813, "learning_rate": 6.189408526420532e-06, "loss": 2.597591552734375, "step": 953600 }, { "epoch": 1.1507664081756641, "learning_rate": 6.189004690952794e-06, "loss": 2.6115380859375, "step": 953700 }, { "epoch": 1.1508870714981467, "learning_rate": 6.188600855485055e-06, "loss": 2.6453726196289065, "step": 953800 }, { "epoch": 1.1510077348206296, "learning_rate": 6.188197020017317e-06, "loss": 2.6158111572265623, "step": 953900 }, { "epoch": 1.1511283981431122, "learning_rate": 6.187793184549579e-06, "loss": 2.6071786499023437, "step": 954000 }, { "epoch": 1.1512490614655948, "learning_rate": 6.187389349081841e-06, "loss": 2.6331689453125, "step": 954100 }, { "epoch": 1.1513697247880774, "learning_rate": 6.186985513614102e-06, "loss": 2.5931686401367187, "step": 954200 }, { "epoch": 1.1514903881105603, "learning_rate": 6.186581678146364e-06, "loss": 2.5924911499023438, "step": 954300 }, { "epoch": 1.1516110514330429, "learning_rate": 6.186177842678624e-06, "loss": 2.5925198364257813, "step": 954400 }, { "epoch": 1.1517317147555255, "learning_rate": 6.185774007210886e-06, "loss": 2.5948883056640626, "step": 954500 }, { "epoch": 1.1518523780780083, "learning_rate": 6.185370171743148e-06, "loss": 2.615431823730469, "step": 954600 }, { "epoch": 1.151973041400491, "learning_rate": 6.18496633627541e-06, "loss": 2.594769287109375, "step": 954700 }, { "epoch": 1.1520937047229736, "learning_rate": 6.184562500807671e-06, "loss": 2.61339111328125, "step": 954800 }, { "epoch": 1.1522143680454562, "learning_rate": 6.184158665339933e-06, "loss": 2.57939453125, "step": 954900 }, { "epoch": 1.152335031367939, "learning_rate": 6.183754829872195e-06, "loss": 2.6062380981445314, "step": 955000 }, { "epoch": 1.1524556946904216, "learning_rate": 6.183350994404456e-06, "loss": 2.606298828125, "step": 955100 }, { "epoch": 1.1525763580129043, "learning_rate": 6.1829471589367175e-06, "loss": 2.6189120483398436, "step": 955200 }, { "epoch": 1.152697021335387, "learning_rate": 6.1825433234689795e-06, "loss": 2.6288970947265624, "step": 955300 }, { "epoch": 1.1528176846578697, "learning_rate": 6.182139488001241e-06, "loss": 2.595953369140625, "step": 955400 }, { "epoch": 1.1529383479803523, "learning_rate": 6.181735652533503e-06, "loss": 2.6176409912109375, "step": 955500 }, { "epoch": 1.1530590113028352, "learning_rate": 6.181331817065765e-06, "loss": 2.5911419677734373, "step": 955600 }, { "epoch": 1.1531796746253178, "learning_rate": 6.180927981598026e-06, "loss": 2.6102890014648437, "step": 955700 }, { "epoch": 1.1533003379478004, "learning_rate": 6.180524146130288e-06, "loss": 2.6307781982421874, "step": 955800 }, { "epoch": 1.1534210012702832, "learning_rate": 6.18012031066255e-06, "loss": 2.6189004516601564, "step": 955900 }, { "epoch": 1.1535416645927659, "learning_rate": 6.17971647519481e-06, "loss": 2.6112127685546875, "step": 956000 }, { "epoch": 1.1536623279152485, "learning_rate": 6.179312639727072e-06, "loss": 2.6311395263671873, "step": 956100 }, { "epoch": 1.153782991237731, "learning_rate": 6.178908804259334e-06, "loss": 2.616090087890625, "step": 956200 }, { "epoch": 1.153903654560214, "learning_rate": 6.178504968791595e-06, "loss": 2.6078436279296877, "step": 956300 }, { "epoch": 1.1540243178826965, "learning_rate": 6.178101133323857e-06, "loss": 2.6079721069335937, "step": 956400 }, { "epoch": 1.1541449812051792, "learning_rate": 6.177697297856119e-06, "loss": 2.604311828613281, "step": 956500 }, { "epoch": 1.154265644527662, "learning_rate": 6.177293462388381e-06, "loss": 2.609208068847656, "step": 956600 }, { "epoch": 1.1543863078501446, "learning_rate": 6.176889626920642e-06, "loss": 2.6453726196289065, "step": 956700 }, { "epoch": 1.1545069711726272, "learning_rate": 6.176485791452903e-06, "loss": 2.5969448852539063, "step": 956800 }, { "epoch": 1.1546276344951099, "learning_rate": 6.1760819559851644e-06, "loss": 2.592884826660156, "step": 956900 }, { "epoch": 1.1547482978175927, "learning_rate": 6.1756781205174264e-06, "loss": 2.592471923828125, "step": 957000 }, { "epoch": 1.1548689611400753, "learning_rate": 6.175274285049688e-06, "loss": 2.601288146972656, "step": 957100 }, { "epoch": 1.154989624462558, "learning_rate": 6.17487044958195e-06, "loss": 2.580452880859375, "step": 957200 }, { "epoch": 1.1551102877850408, "learning_rate": 6.1744666141142115e-06, "loss": 2.5903970336914064, "step": 957300 }, { "epoch": 1.1552309511075234, "learning_rate": 6.1740627786464735e-06, "loss": 2.6013613891601564, "step": 957400 }, { "epoch": 1.155351614430006, "learning_rate": 6.1736589431787355e-06, "loss": 2.6290484619140626, "step": 957500 }, { "epoch": 1.1554722777524888, "learning_rate": 6.173255107710997e-06, "loss": 2.621641845703125, "step": 957600 }, { "epoch": 1.1555929410749715, "learning_rate": 6.172851272243258e-06, "loss": 2.6319915771484377, "step": 957700 }, { "epoch": 1.155713604397454, "learning_rate": 6.17244743677552e-06, "loss": 2.5975958251953126, "step": 957800 }, { "epoch": 1.155834267719937, "learning_rate": 6.172043601307781e-06, "loss": 2.597547912597656, "step": 957900 }, { "epoch": 1.1559549310424195, "learning_rate": 6.171639765840043e-06, "loss": 2.6237063598632813, "step": 958000 }, { "epoch": 1.1560755943649021, "learning_rate": 6.171235930372305e-06, "loss": 2.6117950439453126, "step": 958100 }, { "epoch": 1.1561962576873848, "learning_rate": 6.170832094904566e-06, "loss": 2.6011172485351564, "step": 958200 }, { "epoch": 1.1563169210098676, "learning_rate": 6.170428259436828e-06, "loss": 2.62639892578125, "step": 958300 }, { "epoch": 1.1564375843323502, "learning_rate": 6.17002442396909e-06, "loss": 2.6082333374023436, "step": 958400 }, { "epoch": 1.1565582476548328, "learning_rate": 6.16962058850135e-06, "loss": 2.6206024169921873, "step": 958500 }, { "epoch": 1.1566789109773157, "learning_rate": 6.169216753033612e-06, "loss": 2.6056253051757814, "step": 958600 }, { "epoch": 1.1567995742997983, "learning_rate": 6.168812917565874e-06, "loss": 2.60398193359375, "step": 958700 }, { "epoch": 1.156920237622281, "learning_rate": 6.168409082098135e-06, "loss": 2.604681396484375, "step": 958800 }, { "epoch": 1.1570409009447635, "learning_rate": 6.168005246630397e-06, "loss": 2.6162469482421873, "step": 958900 }, { "epoch": 1.1571615642672464, "learning_rate": 6.167601411162659e-06, "loss": 2.595830383300781, "step": 959000 }, { "epoch": 1.157282227589729, "learning_rate": 6.167197575694921e-06, "loss": 2.597062683105469, "step": 959100 }, { "epoch": 1.1574028909122118, "learning_rate": 6.166793740227182e-06, "loss": 2.5934072875976564, "step": 959200 }, { "epoch": 1.1575235542346944, "learning_rate": 6.1663899047594436e-06, "loss": 2.609781494140625, "step": 959300 }, { "epoch": 1.157644217557177, "learning_rate": 6.165986069291705e-06, "loss": 2.5913409423828124, "step": 959400 }, { "epoch": 1.1577648808796597, "learning_rate": 6.165582233823967e-06, "loss": 2.6227017211914063, "step": 959500 }, { "epoch": 1.1578855442021425, "learning_rate": 6.165178398356229e-06, "loss": 2.58590087890625, "step": 959600 }, { "epoch": 1.1580062075246251, "learning_rate": 6.164774562888491e-06, "loss": 2.6155465698242186, "step": 959700 }, { "epoch": 1.1581268708471077, "learning_rate": 6.164370727420752e-06, "loss": 2.6292559814453127, "step": 959800 }, { "epoch": 1.1582475341695906, "learning_rate": 6.163966891953014e-06, "loss": 2.599437255859375, "step": 959900 }, { "epoch": 1.1583681974920732, "learning_rate": 6.163563056485276e-06, "loss": 2.61607666015625, "step": 960000 }, { "epoch": 1.1584888608145558, "learning_rate": 6.163159221017536e-06, "loss": 2.6151837158203124, "step": 960100 }, { "epoch": 1.1586095241370384, "learning_rate": 6.162755385549798e-06, "loss": 2.6048468017578124, "step": 960200 }, { "epoch": 1.1587301874595213, "learning_rate": 6.16235155008206e-06, "loss": 2.628770446777344, "step": 960300 }, { "epoch": 1.158850850782004, "learning_rate": 6.161947714614321e-06, "loss": 2.6127337646484374, "step": 960400 }, { "epoch": 1.1589715141044865, "learning_rate": 6.161543879146583e-06, "loss": 2.63024169921875, "step": 960500 }, { "epoch": 1.1590921774269694, "learning_rate": 6.161140043678845e-06, "loss": 2.6300665283203126, "step": 960600 }, { "epoch": 1.159212840749452, "learning_rate": 6.160736208211106e-06, "loss": 2.6107553100585936, "step": 960700 }, { "epoch": 1.1593335040719346, "learning_rate": 6.160332372743368e-06, "loss": 2.6173858642578125, "step": 960800 }, { "epoch": 1.1594541673944174, "learning_rate": 6.159928537275629e-06, "loss": 2.602850036621094, "step": 960900 }, { "epoch": 1.1595748307169, "learning_rate": 6.1595247018078905e-06, "loss": 2.6033099365234373, "step": 961000 }, { "epoch": 1.1596954940393827, "learning_rate": 6.1591208663401525e-06, "loss": 2.5956048583984375, "step": 961100 }, { "epoch": 1.1598161573618655, "learning_rate": 6.1587170308724144e-06, "loss": 2.5980123901367187, "step": 961200 }, { "epoch": 1.1599368206843481, "learning_rate": 6.158313195404676e-06, "loss": 2.617196044921875, "step": 961300 }, { "epoch": 1.1600574840068307, "learning_rate": 6.1579093599369376e-06, "loss": 2.6059469604492187, "step": 961400 }, { "epoch": 1.1601781473293133, "learning_rate": 6.1575055244691995e-06, "loss": 2.5931747436523436, "step": 961500 }, { "epoch": 1.1602988106517962, "learning_rate": 6.1571016890014615e-06, "loss": 2.626947326660156, "step": 961600 }, { "epoch": 1.1604194739742788, "learning_rate": 6.156697853533722e-06, "loss": 2.625688171386719, "step": 961700 }, { "epoch": 1.1605401372967614, "learning_rate": 6.156294018065984e-06, "loss": 2.613464050292969, "step": 961800 }, { "epoch": 1.1606608006192443, "learning_rate": 6.155890182598245e-06, "loss": 2.602183532714844, "step": 961900 }, { "epoch": 1.1607814639417269, "learning_rate": 6.155486347130507e-06, "loss": 2.6049429321289064, "step": 962000 }, { "epoch": 1.1609021272642095, "learning_rate": 6.155082511662769e-06, "loss": 2.571180419921875, "step": 962100 }, { "epoch": 1.161022790586692, "learning_rate": 6.154678676195031e-06, "loss": 2.6022393798828123, "step": 962200 }, { "epoch": 1.161143453909175, "learning_rate": 6.154274840727292e-06, "loss": 2.6092828369140624, "step": 962300 }, { "epoch": 1.1612641172316576, "learning_rate": 6.153871005259554e-06, "loss": 2.5968841552734374, "step": 962400 }, { "epoch": 1.1613847805541402, "learning_rate": 6.153467169791816e-06, "loss": 2.612817687988281, "step": 962500 }, { "epoch": 1.161505443876623, "learning_rate": 6.153063334324076e-06, "loss": 2.57997802734375, "step": 962600 }, { "epoch": 1.1616261071991056, "learning_rate": 6.152659498856338e-06, "loss": 2.60719970703125, "step": 962700 }, { "epoch": 1.1617467705215883, "learning_rate": 6.1522556633886e-06, "loss": 2.5909368896484377, "step": 962800 }, { "epoch": 1.161867433844071, "learning_rate": 6.151851827920861e-06, "loss": 2.5975152587890626, "step": 962900 }, { "epoch": 1.1619880971665537, "learning_rate": 6.151447992453123e-06, "loss": 2.615958251953125, "step": 963000 }, { "epoch": 1.1621087604890363, "learning_rate": 6.151044156985385e-06, "loss": 2.576460266113281, "step": 963100 }, { "epoch": 1.1622294238115192, "learning_rate": 6.1506403215176465e-06, "loss": 2.5760159301757812, "step": 963200 }, { "epoch": 1.1623500871340018, "learning_rate": 6.1502364860499085e-06, "loss": 2.5960430908203125, "step": 963300 }, { "epoch": 1.1624707504564844, "learning_rate": 6.14983265058217e-06, "loss": 2.5937631225585935, "step": 963400 }, { "epoch": 1.162591413778967, "learning_rate": 6.149428815114431e-06, "loss": 2.564389343261719, "step": 963500 }, { "epoch": 1.1627120771014499, "learning_rate": 6.149024979646693e-06, "loss": 2.59315185546875, "step": 963600 }, { "epoch": 1.1628327404239325, "learning_rate": 6.148621144178955e-06, "loss": 2.5984536743164064, "step": 963700 }, { "epoch": 1.162953403746415, "learning_rate": 6.148217308711216e-06, "loss": 2.6191778564453125, "step": 963800 }, { "epoch": 1.163074067068898, "learning_rate": 6.147813473243478e-06, "loss": 2.60344970703125, "step": 963900 }, { "epoch": 1.1631947303913805, "learning_rate": 6.14740963777574e-06, "loss": 2.5846658325195313, "step": 964000 }, { "epoch": 1.1633153937138632, "learning_rate": 6.147005802308002e-06, "loss": 2.5946170043945314, "step": 964100 }, { "epoch": 1.1634360570363458, "learning_rate": 6.146601966840262e-06, "loss": 2.6010617065429686, "step": 964200 }, { "epoch": 1.1635567203588286, "learning_rate": 6.146198131372524e-06, "loss": 2.6177658081054687, "step": 964300 }, { "epoch": 1.1636773836813112, "learning_rate": 6.145794295904785e-06, "loss": 2.58694580078125, "step": 964400 }, { "epoch": 1.163798047003794, "learning_rate": 6.145390460437047e-06, "loss": 2.580343933105469, "step": 964500 }, { "epoch": 1.1639187103262767, "learning_rate": 6.144986624969309e-06, "loss": 2.5937454223632814, "step": 964600 }, { "epoch": 1.1640393736487593, "learning_rate": 6.144582789501571e-06, "loss": 2.604034423828125, "step": 964700 }, { "epoch": 1.164160036971242, "learning_rate": 6.144178954033832e-06, "loss": 2.5897412109375, "step": 964800 }, { "epoch": 1.1642807002937248, "learning_rate": 6.143775118566094e-06, "loss": 2.571217346191406, "step": 964900 }, { "epoch": 1.1644013636162074, "learning_rate": 6.1433712830983545e-06, "loss": 2.611466979980469, "step": 965000 }, { "epoch": 1.16452202693869, "learning_rate": 6.1429674476306165e-06, "loss": 2.5981204223632814, "step": 965100 }, { "epoch": 1.1646426902611728, "learning_rate": 6.1425636121628785e-06, "loss": 2.619578857421875, "step": 965200 }, { "epoch": 1.1647633535836555, "learning_rate": 6.1421597766951405e-06, "loss": 2.5722427368164062, "step": 965300 }, { "epoch": 1.164884016906138, "learning_rate": 6.141755941227402e-06, "loss": 2.5968865966796875, "step": 965400 }, { "epoch": 1.1650046802286207, "learning_rate": 6.141352105759664e-06, "loss": 2.6245123291015626, "step": 965500 }, { "epoch": 1.1651253435511035, "learning_rate": 6.140948270291926e-06, "loss": 2.5684393310546874, "step": 965600 }, { "epoch": 1.1652460068735861, "learning_rate": 6.1405444348241876e-06, "loss": 2.5872454833984375, "step": 965700 }, { "epoch": 1.1653666701960688, "learning_rate": 6.140140599356448e-06, "loss": 2.583257751464844, "step": 965800 }, { "epoch": 1.1654873335185516, "learning_rate": 6.13973676388871e-06, "loss": 2.5694143676757815, "step": 965900 }, { "epoch": 1.1656079968410342, "learning_rate": 6.139332928420971e-06, "loss": 2.6079248046875, "step": 966000 }, { "epoch": 1.1657286601635168, "learning_rate": 6.138929092953233e-06, "loss": 2.6125823974609377, "step": 966100 }, { "epoch": 1.1658493234859997, "learning_rate": 6.138525257485495e-06, "loss": 2.6124822998046877, "step": 966200 }, { "epoch": 1.1659699868084823, "learning_rate": 6.138121422017757e-06, "loss": 2.5991586303710936, "step": 966300 }, { "epoch": 1.166090650130965, "learning_rate": 6.137717586550018e-06, "loss": 2.6045751953125, "step": 966400 }, { "epoch": 1.1662113134534478, "learning_rate": 6.13731375108228e-06, "loss": 2.5966873168945312, "step": 966500 }, { "epoch": 1.1663319767759304, "learning_rate": 6.13690991561454e-06, "loss": 2.6005987548828124, "step": 966600 }, { "epoch": 1.166452640098413, "learning_rate": 6.136506080146802e-06, "loss": 2.608534851074219, "step": 966700 }, { "epoch": 1.1665733034208956, "learning_rate": 6.136102244679064e-06, "loss": 2.597913818359375, "step": 966800 }, { "epoch": 1.1666939667433784, "learning_rate": 6.135698409211326e-06, "loss": 2.5938482666015625, "step": 966900 }, { "epoch": 1.166814630065861, "learning_rate": 6.135294573743587e-06, "loss": 2.618718566894531, "step": 967000 }, { "epoch": 1.1669352933883437, "learning_rate": 6.134890738275849e-06, "loss": 2.5790841674804685, "step": 967100 }, { "epoch": 1.1670559567108265, "learning_rate": 6.134486902808111e-06, "loss": 2.5889413452148435, "step": 967200 }, { "epoch": 1.1671766200333091, "learning_rate": 6.1340830673403725e-06, "loss": 2.607156066894531, "step": 967300 }, { "epoch": 1.1672972833557917, "learning_rate": 6.133679231872634e-06, "loss": 2.606257019042969, "step": 967400 }, { "epoch": 1.1674179466782744, "learning_rate": 6.133275396404896e-06, "loss": 2.5843264770507814, "step": 967500 }, { "epoch": 1.1675386100007572, "learning_rate": 6.132871560937157e-06, "loss": 2.581515197753906, "step": 967600 }, { "epoch": 1.1676592733232398, "learning_rate": 6.132467725469419e-06, "loss": 2.610942077636719, "step": 967700 }, { "epoch": 1.1677799366457224, "learning_rate": 6.132063890001681e-06, "loss": 2.595484619140625, "step": 967800 }, { "epoch": 1.1679005999682053, "learning_rate": 6.131660054533942e-06, "loss": 2.6037118530273435, "step": 967900 }, { "epoch": 1.168021263290688, "learning_rate": 6.131256219066204e-06, "loss": 2.6062527465820313, "step": 968000 }, { "epoch": 1.1681419266131705, "learning_rate": 6.130852383598466e-06, "loss": 2.6002743530273436, "step": 968100 }, { "epoch": 1.1682625899356534, "learning_rate": 6.130448548130728e-06, "loss": 2.6064212036132814, "step": 968200 }, { "epoch": 1.168383253258136, "learning_rate": 6.130044712662988e-06, "loss": 2.597742919921875, "step": 968300 }, { "epoch": 1.1685039165806186, "learning_rate": 6.12964087719525e-06, "loss": 2.603427734375, "step": 968400 }, { "epoch": 1.1686245799031014, "learning_rate": 6.129237041727511e-06, "loss": 2.5983599853515624, "step": 968500 }, { "epoch": 1.168745243225584, "learning_rate": 6.128833206259773e-06, "loss": 2.5899981689453124, "step": 968600 }, { "epoch": 1.1688659065480667, "learning_rate": 6.128429370792035e-06, "loss": 2.6104367065429686, "step": 968700 }, { "epoch": 1.1689865698705493, "learning_rate": 6.128025535324297e-06, "loss": 2.591802062988281, "step": 968800 }, { "epoch": 1.1691072331930321, "learning_rate": 6.127621699856558e-06, "loss": 2.6269415283203124, "step": 968900 }, { "epoch": 1.1692278965155147, "learning_rate": 6.12721786438882e-06, "loss": 2.6107693481445313, "step": 969000 }, { "epoch": 1.1693485598379973, "learning_rate": 6.1268140289210806e-06, "loss": 2.592244873046875, "step": 969100 }, { "epoch": 1.1694692231604802, "learning_rate": 6.1264101934533426e-06, "loss": 2.5835595703125, "step": 969200 }, { "epoch": 1.1695898864829628, "learning_rate": 6.1260063579856045e-06, "loss": 2.5968057250976564, "step": 969300 }, { "epoch": 1.1697105498054454, "learning_rate": 6.1256025225178665e-06, "loss": 2.5983236694335936, "step": 969400 }, { "epoch": 1.169831213127928, "learning_rate": 6.125198687050128e-06, "loss": 2.614699401855469, "step": 969500 }, { "epoch": 1.1699518764504109, "learning_rate": 6.12479485158239e-06, "loss": 2.5903466796875, "step": 969600 }, { "epoch": 1.1700725397728935, "learning_rate": 6.124391016114652e-06, "loss": 2.636473388671875, "step": 969700 }, { "epoch": 1.1701932030953763, "learning_rate": 6.123987180646913e-06, "loss": 2.591294250488281, "step": 969800 }, { "epoch": 1.170313866417859, "learning_rate": 6.123583345179174e-06, "loss": 2.6016812133789062, "step": 969900 }, { "epoch": 1.1704345297403416, "learning_rate": 6.123179509711436e-06, "loss": 2.6125543212890623, "step": 970000 }, { "epoch": 1.1705551930628242, "learning_rate": 6.122775674243697e-06, "loss": 2.6065374755859376, "step": 970100 }, { "epoch": 1.170675856385307, "learning_rate": 6.122371838775959e-06, "loss": 2.5975701904296873, "step": 970200 }, { "epoch": 1.1707965197077896, "learning_rate": 6.121968003308221e-06, "loss": 2.597145690917969, "step": 970300 }, { "epoch": 1.1709171830302723, "learning_rate": 6.121564167840482e-06, "loss": 2.597004089355469, "step": 970400 }, { "epoch": 1.171037846352755, "learning_rate": 6.121160332372744e-06, "loss": 2.6181301879882812, "step": 970500 }, { "epoch": 1.1711585096752377, "learning_rate": 6.120756496905006e-06, "loss": 2.5806201171875, "step": 970600 }, { "epoch": 1.1712791729977203, "learning_rate": 6.120352661437266e-06, "loss": 2.5732327270507813, "step": 970700 }, { "epoch": 1.171399836320203, "learning_rate": 6.119948825969528e-06, "loss": 2.588171081542969, "step": 970800 }, { "epoch": 1.1715204996426858, "learning_rate": 6.11954499050179e-06, "loss": 2.5915231323242187, "step": 970900 }, { "epoch": 1.1716411629651684, "learning_rate": 6.1191411550340515e-06, "loss": 2.606606140136719, "step": 971000 }, { "epoch": 1.171761826287651, "learning_rate": 6.1187373195663134e-06, "loss": 2.594422607421875, "step": 971100 }, { "epoch": 1.1718824896101339, "learning_rate": 6.1183334840985754e-06, "loss": 2.6180487060546875, "step": 971200 }, { "epoch": 1.1720031529326165, "learning_rate": 6.117929648630837e-06, "loss": 2.6240243530273437, "step": 971300 }, { "epoch": 1.172123816255099, "learning_rate": 6.1175258131630985e-06, "loss": 2.616488342285156, "step": 971400 }, { "epoch": 1.172244479577582, "learning_rate": 6.11712197769536e-06, "loss": 2.599603271484375, "step": 971500 }, { "epoch": 1.1723651429000645, "learning_rate": 6.116718142227621e-06, "loss": 2.5942929077148436, "step": 971600 }, { "epoch": 1.1724858062225472, "learning_rate": 6.116314306759883e-06, "loss": 2.592612609863281, "step": 971700 }, { "epoch": 1.17260646954503, "learning_rate": 6.115910471292145e-06, "loss": 2.608624267578125, "step": 971800 }, { "epoch": 1.1727271328675126, "learning_rate": 6.115506635824407e-06, "loss": 2.6028536987304687, "step": 971900 }, { "epoch": 1.1728477961899952, "learning_rate": 6.115102800356668e-06, "loss": 2.57473876953125, "step": 972000 }, { "epoch": 1.1729684595124779, "learning_rate": 6.11469896488893e-06, "loss": 2.576666259765625, "step": 972100 }, { "epoch": 1.1730891228349607, "learning_rate": 6.114295129421192e-06, "loss": 2.592965087890625, "step": 972200 }, { "epoch": 1.1732097861574433, "learning_rate": 6.113891293953452e-06, "loss": 2.594486083984375, "step": 972300 }, { "epoch": 1.173330449479926, "learning_rate": 6.113487458485714e-06, "loss": 2.6021405029296876, "step": 972400 }, { "epoch": 1.1734511128024088, "learning_rate": 6.113083623017976e-06, "loss": 2.6069635009765624, "step": 972500 }, { "epoch": 1.1735717761248914, "learning_rate": 6.112679787550237e-06, "loss": 2.5913131713867186, "step": 972600 }, { "epoch": 1.173692439447374, "learning_rate": 6.112275952082499e-06, "loss": 2.5781884765625, "step": 972700 }, { "epoch": 1.1738131027698566, "learning_rate": 6.111872116614761e-06, "loss": 2.5997573852539064, "step": 972800 }, { "epoch": 1.1739337660923395, "learning_rate": 6.111468281147022e-06, "loss": 2.602791442871094, "step": 972900 }, { "epoch": 1.174054429414822, "learning_rate": 6.111064445679284e-06, "loss": 2.5773501586914063, "step": 973000 }, { "epoch": 1.1741750927373047, "learning_rate": 6.110660610211546e-06, "loss": 2.5909423828125, "step": 973100 }, { "epoch": 1.1742957560597875, "learning_rate": 6.110256774743807e-06, "loss": 2.5998834228515624, "step": 973200 }, { "epoch": 1.1744164193822701, "learning_rate": 6.109852939276069e-06, "loss": 2.592122802734375, "step": 973300 }, { "epoch": 1.1745370827047528, "learning_rate": 6.1094491038083306e-06, "loss": 2.5871722412109377, "step": 973400 }, { "epoch": 1.1746577460272356, "learning_rate": 6.109045268340592e-06, "loss": 2.611591491699219, "step": 973500 }, { "epoch": 1.1747784093497182, "learning_rate": 6.108641432872854e-06, "loss": 2.604677429199219, "step": 973600 }, { "epoch": 1.1748990726722008, "learning_rate": 6.108237597405116e-06, "loss": 2.5988088989257814, "step": 973700 }, { "epoch": 1.1750197359946837, "learning_rate": 6.107833761937378e-06, "loss": 2.58959716796875, "step": 973800 }, { "epoch": 1.1751403993171663, "learning_rate": 6.107429926469639e-06, "loss": 2.60385009765625, "step": 973900 }, { "epoch": 1.175261062639649, "learning_rate": 6.1070260910019e-06, "loss": 2.5829022216796873, "step": 974000 }, { "epoch": 1.1753817259621315, "learning_rate": 6.106622255534161e-06, "loss": 2.615972595214844, "step": 974100 }, { "epoch": 1.1755023892846144, "learning_rate": 6.106218420066423e-06, "loss": 2.5916778564453127, "step": 974200 }, { "epoch": 1.175623052607097, "learning_rate": 6.105814584598685e-06, "loss": 2.6110943603515624, "step": 974300 }, { "epoch": 1.1757437159295796, "learning_rate": 6.105410749130947e-06, "loss": 2.6056671142578125, "step": 974400 }, { "epoch": 1.1758643792520624, "learning_rate": 6.105006913663208e-06, "loss": 2.5961822509765624, "step": 974500 }, { "epoch": 1.175985042574545, "learning_rate": 6.10460307819547e-06, "loss": 2.6264227294921874, "step": 974600 }, { "epoch": 1.1761057058970277, "learning_rate": 6.104199242727732e-06, "loss": 2.590207214355469, "step": 974700 }, { "epoch": 1.1762263692195103, "learning_rate": 6.103795407259992e-06, "loss": 2.580292053222656, "step": 974800 }, { "epoch": 1.1763470325419931, "learning_rate": 6.103391571792254e-06, "loss": 2.603485412597656, "step": 974900 }, { "epoch": 1.1764676958644757, "learning_rate": 6.102987736324516e-06, "loss": 2.6332916259765624, "step": 975000 }, { "epoch": 1.1765883591869586, "learning_rate": 6.1025839008567775e-06, "loss": 2.58498046875, "step": 975100 }, { "epoch": 1.1767090225094412, "learning_rate": 6.1021800653890395e-06, "loss": 2.603824462890625, "step": 975200 }, { "epoch": 1.1768296858319238, "learning_rate": 6.1017762299213015e-06, "loss": 2.6032049560546877, "step": 975300 }, { "epoch": 1.1769503491544064, "learning_rate": 6.101372394453563e-06, "loss": 2.581085205078125, "step": 975400 }, { "epoch": 1.1770710124768893, "learning_rate": 6.100968558985825e-06, "loss": 2.599595947265625, "step": 975500 }, { "epoch": 1.177191675799372, "learning_rate": 6.100564723518086e-06, "loss": 2.579244384765625, "step": 975600 }, { "epoch": 1.1773123391218545, "learning_rate": 6.100160888050347e-06, "loss": 2.570328674316406, "step": 975700 }, { "epoch": 1.1774330024443374, "learning_rate": 6.099757052582609e-06, "loss": 2.601065368652344, "step": 975800 }, { "epoch": 1.17755366576682, "learning_rate": 6.099353217114871e-06, "loss": 2.596960144042969, "step": 975900 }, { "epoch": 1.1776743290893026, "learning_rate": 6.098949381647132e-06, "loss": 2.5835009765625, "step": 976000 }, { "epoch": 1.1777949924117852, "learning_rate": 6.098545546179394e-06, "loss": 2.565362548828125, "step": 976100 }, { "epoch": 1.177915655734268, "learning_rate": 6.098141710711656e-06, "loss": 2.6015194702148436, "step": 976200 }, { "epoch": 1.1780363190567507, "learning_rate": 6.097737875243918e-06, "loss": 2.589146728515625, "step": 976300 }, { "epoch": 1.1781569823792333, "learning_rate": 6.097334039776178e-06, "loss": 2.582178039550781, "step": 976400 }, { "epoch": 1.1782776457017161, "learning_rate": 6.09693020430844e-06, "loss": 2.5743618774414063, "step": 976500 }, { "epoch": 1.1783983090241987, "learning_rate": 6.096526368840701e-06, "loss": 2.5747439575195314, "step": 976600 }, { "epoch": 1.1785189723466813, "learning_rate": 6.096122533372963e-06, "loss": 2.599559020996094, "step": 976700 }, { "epoch": 1.1786396356691642, "learning_rate": 6.095718697905225e-06, "loss": 2.6225466918945313, "step": 976800 }, { "epoch": 1.1787602989916468, "learning_rate": 6.095314862437487e-06, "loss": 2.6300787353515624, "step": 976900 }, { "epoch": 1.1788809623141294, "learning_rate": 6.094911026969748e-06, "loss": 2.610126953125, "step": 977000 }, { "epoch": 1.1790016256366123, "learning_rate": 6.09450719150201e-06, "loss": 2.587339172363281, "step": 977100 }, { "epoch": 1.1791222889590949, "learning_rate": 6.094103356034271e-06, "loss": 2.6041104125976564, "step": 977200 }, { "epoch": 1.1792429522815775, "learning_rate": 6.093699520566533e-06, "loss": 2.5947113037109375, "step": 977300 }, { "epoch": 1.1793636156040601, "learning_rate": 6.093295685098795e-06, "loss": 2.5954348754882814, "step": 977400 }, { "epoch": 1.179484278926543, "learning_rate": 6.092891849631057e-06, "loss": 2.6100494384765627, "step": 977500 }, { "epoch": 1.1796049422490256, "learning_rate": 6.092488014163318e-06, "loss": 2.5916104125976562, "step": 977600 }, { "epoch": 1.1797256055715082, "learning_rate": 6.09208417869558e-06, "loss": 2.586148376464844, "step": 977700 }, { "epoch": 1.179846268893991, "learning_rate": 6.091680343227842e-06, "loss": 2.574223937988281, "step": 977800 }, { "epoch": 1.1799669322164736, "learning_rate": 6.091276507760104e-06, "loss": 2.5928005981445312, "step": 977900 }, { "epoch": 1.1800875955389563, "learning_rate": 6.090872672292365e-06, "loss": 2.6233489990234373, "step": 978000 }, { "epoch": 1.1802082588614389, "learning_rate": 6.090468836824626e-06, "loss": 2.6063607788085936, "step": 978100 }, { "epoch": 1.1803289221839217, "learning_rate": 6.090065001356887e-06, "loss": 2.597544860839844, "step": 978200 }, { "epoch": 1.1804495855064043, "learning_rate": 6.089661165889149e-06, "loss": 2.6014981079101562, "step": 978300 }, { "epoch": 1.180570248828887, "learning_rate": 6.089257330421411e-06, "loss": 2.5859390258789063, "step": 978400 }, { "epoch": 1.1806909121513698, "learning_rate": 6.088853494953673e-06, "loss": 2.59175537109375, "step": 978500 }, { "epoch": 1.1808115754738524, "learning_rate": 6.088449659485934e-06, "loss": 2.63207275390625, "step": 978600 }, { "epoch": 1.180932238796335, "learning_rate": 6.088045824018196e-06, "loss": 2.58492431640625, "step": 978700 }, { "epoch": 1.1810529021188179, "learning_rate": 6.087641988550458e-06, "loss": 2.5941448974609376, "step": 978800 }, { "epoch": 1.1811735654413005, "learning_rate": 6.0872381530827184e-06, "loss": 2.5975421142578123, "step": 978900 }, { "epoch": 1.181294228763783, "learning_rate": 6.08683431761498e-06, "loss": 2.585941162109375, "step": 979000 }, { "epoch": 1.181414892086266, "learning_rate": 6.086430482147242e-06, "loss": 2.5682357788085937, "step": 979100 }, { "epoch": 1.1815355554087486, "learning_rate": 6.0860266466795035e-06, "loss": 2.6013369750976563, "step": 979200 }, { "epoch": 1.1816562187312312, "learning_rate": 6.0856228112117655e-06, "loss": 2.5646978759765626, "step": 979300 }, { "epoch": 1.1817768820537138, "learning_rate": 6.0852189757440275e-06, "loss": 2.6018975830078124, "step": 979400 }, { "epoch": 1.1818975453761966, "learning_rate": 6.084815140276289e-06, "loss": 2.595281982421875, "step": 979500 }, { "epoch": 1.1820182086986792, "learning_rate": 6.084411304808551e-06, "loss": 2.60206298828125, "step": 979600 }, { "epoch": 1.1821388720211619, "learning_rate": 6.084007469340812e-06, "loss": 2.5950027465820313, "step": 979700 }, { "epoch": 1.1822595353436447, "learning_rate": 6.083603633873073e-06, "loss": 2.5825759887695314, "step": 979800 }, { "epoch": 1.1823801986661273, "learning_rate": 6.083199798405335e-06, "loss": 2.617801513671875, "step": 979900 }, { "epoch": 1.18250086198861, "learning_rate": 6.082795962937597e-06, "loss": 2.6138485717773436, "step": 980000 }, { "epoch": 1.1826215253110925, "learning_rate": 6.082392127469858e-06, "loss": 2.592586669921875, "step": 980100 }, { "epoch": 1.1827421886335754, "learning_rate": 6.08198829200212e-06, "loss": 2.585135803222656, "step": 980200 }, { "epoch": 1.182862851956058, "learning_rate": 6.081584456534382e-06, "loss": 2.629750061035156, "step": 980300 }, { "epoch": 1.1829835152785408, "learning_rate": 6.081180621066644e-06, "loss": 2.5939315795898437, "step": 980400 }, { "epoch": 1.1831041786010235, "learning_rate": 6.080776785598904e-06, "loss": 2.617914123535156, "step": 980500 }, { "epoch": 1.183224841923506, "learning_rate": 6.080372950131166e-06, "loss": 2.5924609375, "step": 980600 }, { "epoch": 1.1833455052459887, "learning_rate": 6.079969114663427e-06, "loss": 2.620184326171875, "step": 980700 }, { "epoch": 1.1834661685684715, "learning_rate": 6.079565279195689e-06, "loss": 2.6176577758789064, "step": 980800 }, { "epoch": 1.1835868318909541, "learning_rate": 6.079161443727951e-06, "loss": 2.60630859375, "step": 980900 }, { "epoch": 1.1837074952134368, "learning_rate": 6.078757608260213e-06, "loss": 2.6123992919921877, "step": 981000 }, { "epoch": 1.1838281585359196, "learning_rate": 6.078353772792474e-06, "loss": 2.579404602050781, "step": 981100 }, { "epoch": 1.1839488218584022, "learning_rate": 6.077949937324736e-06, "loss": 2.5910165405273435, "step": 981200 }, { "epoch": 1.1840694851808848, "learning_rate": 6.077546101856997e-06, "loss": 2.5846823120117186, "step": 981300 }, { "epoch": 1.1841901485033675, "learning_rate": 6.077142266389259e-06, "loss": 2.614487609863281, "step": 981400 }, { "epoch": 1.1843108118258503, "learning_rate": 6.076738430921521e-06, "loss": 2.58438232421875, "step": 981500 }, { "epoch": 1.184431475148333, "learning_rate": 6.076334595453783e-06, "loss": 2.605773620605469, "step": 981600 }, { "epoch": 1.1845521384708155, "learning_rate": 6.075930759986044e-06, "loss": 2.5952593994140627, "step": 981700 }, { "epoch": 1.1846728017932984, "learning_rate": 6.075526924518306e-06, "loss": 2.5849530029296877, "step": 981800 }, { "epoch": 1.184793465115781, "learning_rate": 6.075123089050568e-06, "loss": 2.5910150146484376, "step": 981900 }, { "epoch": 1.1849141284382636, "learning_rate": 6.074719253582829e-06, "loss": 2.576096496582031, "step": 982000 }, { "epoch": 1.1850347917607464, "learning_rate": 6.07431541811509e-06, "loss": 2.6080093383789062, "step": 982100 }, { "epoch": 1.185155455083229, "learning_rate": 6.073911582647352e-06, "loss": 2.6047940063476562, "step": 982200 }, { "epoch": 1.1852761184057117, "learning_rate": 6.073507747179613e-06, "loss": 2.6149285888671874, "step": 982300 }, { "epoch": 1.1853967817281945, "learning_rate": 6.073103911711875e-06, "loss": 2.58296630859375, "step": 982400 }, { "epoch": 1.1855174450506771, "learning_rate": 6.072700076244137e-06, "loss": 2.573744201660156, "step": 982500 }, { "epoch": 1.1856381083731597, "learning_rate": 6.072296240776398e-06, "loss": 2.5759396362304687, "step": 982600 }, { "epoch": 1.1857587716956424, "learning_rate": 6.07189240530866e-06, "loss": 2.5933792114257814, "step": 982700 }, { "epoch": 1.1858794350181252, "learning_rate": 6.071488569840922e-06, "loss": 2.6140484619140625, "step": 982800 }, { "epoch": 1.1860000983406078, "learning_rate": 6.0710847343731825e-06, "loss": 2.5783963012695312, "step": 982900 }, { "epoch": 1.1861207616630904, "learning_rate": 6.0706808989054445e-06, "loss": 2.597664794921875, "step": 983000 }, { "epoch": 1.1862414249855733, "learning_rate": 6.0702770634377064e-06, "loss": 2.560101318359375, "step": 983100 }, { "epoch": 1.186362088308056, "learning_rate": 6.069873227969968e-06, "loss": 2.608586730957031, "step": 983200 }, { "epoch": 1.1864827516305385, "learning_rate": 6.0694693925022296e-06, "loss": 2.5867044067382814, "step": 983300 }, { "epoch": 1.1866034149530211, "learning_rate": 6.0690655570344915e-06, "loss": 2.569785461425781, "step": 983400 }, { "epoch": 1.186724078275504, "learning_rate": 6.0686617215667535e-06, "loss": 2.598089294433594, "step": 983500 }, { "epoch": 1.1868447415979866, "learning_rate": 6.068257886099015e-06, "loss": 2.598568115234375, "step": 983600 }, { "epoch": 1.1869654049204692, "learning_rate": 6.067854050631277e-06, "loss": 2.608358154296875, "step": 983700 }, { "epoch": 1.187086068242952, "learning_rate": 6.067450215163537e-06, "loss": 2.6020941162109374, "step": 983800 }, { "epoch": 1.1872067315654347, "learning_rate": 6.067046379695799e-06, "loss": 2.5930218505859375, "step": 983900 }, { "epoch": 1.1873273948879173, "learning_rate": 6.066642544228061e-06, "loss": 2.634434814453125, "step": 984000 }, { "epoch": 1.1874480582104001, "learning_rate": 6.066238708760323e-06, "loss": 2.5946343994140624, "step": 984100 }, { "epoch": 1.1875687215328827, "learning_rate": 6.065834873292584e-06, "loss": 2.5793441772460937, "step": 984200 }, { "epoch": 1.1876893848553653, "learning_rate": 6.065431037824846e-06, "loss": 2.6008465576171873, "step": 984300 }, { "epoch": 1.1878100481778482, "learning_rate": 6.065027202357108e-06, "loss": 2.5900091552734374, "step": 984400 }, { "epoch": 1.1879307115003308, "learning_rate": 6.064623366889369e-06, "loss": 2.6016241455078126, "step": 984500 }, { "epoch": 1.1880513748228134, "learning_rate": 6.06421953142163e-06, "loss": 2.59624267578125, "step": 984600 }, { "epoch": 1.188172038145296, "learning_rate": 6.063815695953892e-06, "loss": 2.585549621582031, "step": 984700 }, { "epoch": 1.1882927014677789, "learning_rate": 6.063411860486153e-06, "loss": 2.5818902587890626, "step": 984800 }, { "epoch": 1.1884133647902615, "learning_rate": 6.063008025018415e-06, "loss": 2.587596435546875, "step": 984900 }, { "epoch": 1.1885340281127441, "learning_rate": 6.062604189550677e-06, "loss": 2.6011721801757814, "step": 985000 }, { "epoch": 1.188654691435227, "learning_rate": 6.0622003540829385e-06, "loss": 2.5860760498046873, "step": 985100 }, { "epoch": 1.1887753547577096, "learning_rate": 6.0617965186152005e-06, "loss": 2.5945028686523437, "step": 985200 }, { "epoch": 1.1888960180801922, "learning_rate": 6.0613926831474624e-06, "loss": 2.586225891113281, "step": 985300 }, { "epoch": 1.1890166814026748, "learning_rate": 6.060988847679723e-06, "loss": 2.58639404296875, "step": 985400 }, { "epoch": 1.1891373447251576, "learning_rate": 6.060585012211985e-06, "loss": 2.589744873046875, "step": 985500 }, { "epoch": 1.1892580080476403, "learning_rate": 6.060181176744247e-06, "loss": 2.611219482421875, "step": 985600 }, { "epoch": 1.189378671370123, "learning_rate": 6.059777341276508e-06, "loss": 2.6014892578125, "step": 985700 }, { "epoch": 1.1894993346926057, "learning_rate": 6.05937350580877e-06, "loss": 2.6130850219726565, "step": 985800 }, { "epoch": 1.1896199980150883, "learning_rate": 6.058969670341032e-06, "loss": 2.6030126953125, "step": 985900 }, { "epoch": 1.189740661337571, "learning_rate": 6.058565834873294e-06, "loss": 2.5568995666503906, "step": 986000 }, { "epoch": 1.1898613246600538, "learning_rate": 6.058161999405555e-06, "loss": 2.5992047119140627, "step": 986100 }, { "epoch": 1.1899819879825364, "learning_rate": 6.057758163937816e-06, "loss": 2.614365539550781, "step": 986200 }, { "epoch": 1.190102651305019, "learning_rate": 6.057354328470077e-06, "loss": 2.561944885253906, "step": 986300 }, { "epoch": 1.1902233146275019, "learning_rate": 6.056950493002339e-06, "loss": 2.591408386230469, "step": 986400 }, { "epoch": 1.1903439779499845, "learning_rate": 6.056546657534601e-06, "loss": 2.5944464111328127, "step": 986500 }, { "epoch": 1.190464641272467, "learning_rate": 6.056142822066863e-06, "loss": 2.594496154785156, "step": 986600 }, { "epoch": 1.1905853045949497, "learning_rate": 6.055738986599124e-06, "loss": 2.602533264160156, "step": 986700 }, { "epoch": 1.1907059679174326, "learning_rate": 6.055335151131386e-06, "loss": 2.6103643798828124, "step": 986800 }, { "epoch": 1.1908266312399152, "learning_rate": 6.054931315663648e-06, "loss": 2.596690979003906, "step": 986900 }, { "epoch": 1.1909472945623978, "learning_rate": 6.0545274801959085e-06, "loss": 2.597983093261719, "step": 987000 }, { "epoch": 1.1910679578848806, "learning_rate": 6.0541236447281705e-06, "loss": 2.6055035400390625, "step": 987100 }, { "epoch": 1.1911886212073632, "learning_rate": 6.0537198092604325e-06, "loss": 2.5853179931640624, "step": 987200 }, { "epoch": 1.1913092845298459, "learning_rate": 6.053315973792694e-06, "loss": 2.5890655517578125, "step": 987300 }, { "epoch": 1.1914299478523287, "learning_rate": 6.052912138324956e-06, "loss": 2.604725036621094, "step": 987400 }, { "epoch": 1.1915506111748113, "learning_rate": 6.052508302857218e-06, "loss": 2.6311273193359375, "step": 987500 }, { "epoch": 1.191671274497294, "learning_rate": 6.052104467389479e-06, "loss": 2.593239440917969, "step": 987600 }, { "epoch": 1.1917919378197768, "learning_rate": 6.051700631921741e-06, "loss": 2.5910223388671874, "step": 987700 }, { "epoch": 1.1919126011422594, "learning_rate": 6.051296796454002e-06, "loss": 2.585469970703125, "step": 987800 }, { "epoch": 1.192033264464742, "learning_rate": 6.050892960986263e-06, "loss": 2.600281982421875, "step": 987900 }, { "epoch": 1.1921539277872246, "learning_rate": 6.050489125518525e-06, "loss": 2.5974420166015624, "step": 988000 }, { "epoch": 1.1922745911097075, "learning_rate": 6.050085290050787e-06, "loss": 2.5980303955078123, "step": 988100 }, { "epoch": 1.19239525443219, "learning_rate": 6.049681454583048e-06, "loss": 2.612778625488281, "step": 988200 }, { "epoch": 1.1925159177546727, "learning_rate": 6.04927761911531e-06, "loss": 2.589386291503906, "step": 988300 }, { "epoch": 1.1926365810771555, "learning_rate": 6.048873783647572e-06, "loss": 2.6068988037109375, "step": 988400 }, { "epoch": 1.1927572443996382, "learning_rate": 6.048469948179834e-06, "loss": 2.5870852661132813, "step": 988500 }, { "epoch": 1.1928779077221208, "learning_rate": 6.048066112712095e-06, "loss": 2.5838912963867187, "step": 988600 }, { "epoch": 1.1929985710446034, "learning_rate": 6.047662277244356e-06, "loss": 2.5863116455078123, "step": 988700 }, { "epoch": 1.1931192343670862, "learning_rate": 6.047258441776617e-06, "loss": 2.6013247680664064, "step": 988800 }, { "epoch": 1.1932398976895688, "learning_rate": 6.046854606308879e-06, "loss": 2.6056527709960937, "step": 988900 }, { "epoch": 1.1933605610120515, "learning_rate": 6.046450770841141e-06, "loss": 2.60065185546875, "step": 989000 }, { "epoch": 1.1934812243345343, "learning_rate": 6.046046935373403e-06, "loss": 2.582217102050781, "step": 989100 }, { "epoch": 1.193601887657017, "learning_rate": 6.0456430999056645e-06, "loss": 2.599864196777344, "step": 989200 }, { "epoch": 1.1937225509794995, "learning_rate": 6.0452392644379265e-06, "loss": 2.567310791015625, "step": 989300 }, { "epoch": 1.1938432143019824, "learning_rate": 6.0448354289701885e-06, "loss": 2.61168701171875, "step": 989400 }, { "epoch": 1.193963877624465, "learning_rate": 6.044431593502449e-06, "loss": 2.5996624755859377, "step": 989500 }, { "epoch": 1.1940845409469476, "learning_rate": 6.044027758034711e-06, "loss": 2.578859558105469, "step": 989600 }, { "epoch": 1.1942052042694304, "learning_rate": 6.043623922566973e-06, "loss": 2.6084259033203123, "step": 989700 }, { "epoch": 1.194325867591913, "learning_rate": 6.043220087099234e-06, "loss": 2.6022723388671873, "step": 989800 }, { "epoch": 1.1944465309143957, "learning_rate": 6.042816251631496e-06, "loss": 2.587525634765625, "step": 989900 }, { "epoch": 1.1945671942368783, "learning_rate": 6.042412416163758e-06, "loss": 2.5719009399414063, "step": 990000 }, { "epoch": 1.1946878575593611, "learning_rate": 6.042008580696019e-06, "loss": 2.572001647949219, "step": 990100 }, { "epoch": 1.1948085208818437, "learning_rate": 6.041604745228281e-06, "loss": 2.6108160400390625, "step": 990200 }, { "epoch": 1.1949291842043264, "learning_rate": 6.041200909760542e-06, "loss": 2.5733282470703127, "step": 990300 }, { "epoch": 1.1950498475268092, "learning_rate": 6.040797074292803e-06, "loss": 2.5819952392578127, "step": 990400 }, { "epoch": 1.1951705108492918, "learning_rate": 6.040393238825065e-06, "loss": 2.584156188964844, "step": 990500 }, { "epoch": 1.1952911741717744, "learning_rate": 6.039989403357327e-06, "loss": 2.6094500732421877, "step": 990600 }, { "epoch": 1.195411837494257, "learning_rate": 6.039585567889588e-06, "loss": 2.6129571533203126, "step": 990700 }, { "epoch": 1.19553250081674, "learning_rate": 6.03918173242185e-06, "loss": 2.582649841308594, "step": 990800 }, { "epoch": 1.1956531641392225, "learning_rate": 6.038777896954112e-06, "loss": 2.598116760253906, "step": 990900 }, { "epoch": 1.1957738274617054, "learning_rate": 6.038374061486374e-06, "loss": 2.593816833496094, "step": 991000 }, { "epoch": 1.195894490784188, "learning_rate": 6.0379702260186345e-06, "loss": 2.576995544433594, "step": 991100 }, { "epoch": 1.1960151541066706, "learning_rate": 6.0375663905508965e-06, "loss": 2.5823880004882813, "step": 991200 }, { "epoch": 1.1961358174291532, "learning_rate": 6.037162555083158e-06, "loss": 2.5965460205078124, "step": 991300 }, { "epoch": 1.196256480751636, "learning_rate": 6.03675871961542e-06, "loss": 2.5929864501953124, "step": 991400 }, { "epoch": 1.1963771440741187, "learning_rate": 6.036354884147682e-06, "loss": 2.586373291015625, "step": 991500 }, { "epoch": 1.1964978073966013, "learning_rate": 6.035951048679944e-06, "loss": 2.5966171264648437, "step": 991600 }, { "epoch": 1.1966184707190841, "learning_rate": 6.035547213212205e-06, "loss": 2.599550476074219, "step": 991700 }, { "epoch": 1.1967391340415667, "learning_rate": 6.035143377744467e-06, "loss": 2.5896014404296874, "step": 991800 }, { "epoch": 1.1968597973640493, "learning_rate": 6.034739542276727e-06, "loss": 2.584306335449219, "step": 991900 }, { "epoch": 1.196980460686532, "learning_rate": 6.034335706808989e-06, "loss": 2.5980401611328126, "step": 992000 }, { "epoch": 1.1971011240090148, "learning_rate": 6.033931871341251e-06, "loss": 2.6080865478515625, "step": 992100 }, { "epoch": 1.1972217873314974, "learning_rate": 6.033528035873513e-06, "loss": 2.6064727783203123, "step": 992200 }, { "epoch": 1.19734245065398, "learning_rate": 6.033124200405774e-06, "loss": 2.5954489135742187, "step": 992300 }, { "epoch": 1.1974631139764629, "learning_rate": 6.032720364938036e-06, "loss": 2.610365295410156, "step": 992400 }, { "epoch": 1.1975837772989455, "learning_rate": 6.032316529470298e-06, "loss": 2.5940728759765626, "step": 992500 }, { "epoch": 1.1977044406214281, "learning_rate": 6.03191269400256e-06, "loss": 2.570939636230469, "step": 992600 }, { "epoch": 1.197825103943911, "learning_rate": 6.03150885853482e-06, "loss": 2.584353332519531, "step": 992700 }, { "epoch": 1.1979457672663936, "learning_rate": 6.031105023067082e-06, "loss": 2.598033752441406, "step": 992800 }, { "epoch": 1.1980664305888762, "learning_rate": 6.0307011875993435e-06, "loss": 2.5762176513671875, "step": 992900 }, { "epoch": 1.198187093911359, "learning_rate": 6.0302973521316054e-06, "loss": 2.589976806640625, "step": 993000 }, { "epoch": 1.1983077572338416, "learning_rate": 6.029893516663867e-06, "loss": 2.5842959594726564, "step": 993100 }, { "epoch": 1.1984284205563243, "learning_rate": 6.029489681196129e-06, "loss": 2.579898681640625, "step": 993200 }, { "epoch": 1.1985490838788069, "learning_rate": 6.0290858457283905e-06, "loss": 2.5633245849609376, "step": 993300 }, { "epoch": 1.1986697472012897, "learning_rate": 6.0286820102606525e-06, "loss": 2.586378479003906, "step": 993400 }, { "epoch": 1.1987904105237723, "learning_rate": 6.0282781747929145e-06, "loss": 2.612513427734375, "step": 993500 }, { "epoch": 1.198911073846255, "learning_rate": 6.027874339325175e-06, "loss": 2.608420104980469, "step": 993600 }, { "epoch": 1.1990317371687378, "learning_rate": 6.027470503857437e-06, "loss": 2.6017852783203126, "step": 993700 }, { "epoch": 1.1991524004912204, "learning_rate": 6.027066668389699e-06, "loss": 2.6116604614257812, "step": 993800 }, { "epoch": 1.199273063813703, "learning_rate": 6.02666283292196e-06, "loss": 2.5727294921875, "step": 993900 }, { "epoch": 1.1993937271361856, "learning_rate": 6.026258997454222e-06, "loss": 2.5887985229492188, "step": 994000 }, { "epoch": 1.1995143904586685, "learning_rate": 6.025855161986484e-06, "loss": 2.571607971191406, "step": 994100 }, { "epoch": 1.199635053781151, "learning_rate": 6.025451326518745e-06, "loss": 2.5867340087890627, "step": 994200 }, { "epoch": 1.1997557171036337, "learning_rate": 6.025047491051007e-06, "loss": 2.5858209228515623, "step": 994300 }, { "epoch": 1.1998763804261166, "learning_rate": 6.024643655583268e-06, "loss": 2.5972613525390624, "step": 994400 }, { "epoch": 1.1999970437485992, "learning_rate": 6.024239820115529e-06, "loss": 2.5819223022460935, "step": 994500 }, { "epoch": 1.2001177070710818, "learning_rate": 6.023835984647791e-06, "loss": 2.590470275878906, "step": 994600 }, { "epoch": 1.2002383703935646, "learning_rate": 6.023432149180053e-06, "loss": 2.5792547607421876, "step": 994700 }, { "epoch": 1.2003590337160472, "learning_rate": 6.023028313712314e-06, "loss": 2.581932373046875, "step": 994800 }, { "epoch": 1.2004796970385299, "learning_rate": 6.022624478244576e-06, "loss": 2.58543701171875, "step": 994900 }, { "epoch": 1.2006003603610127, "learning_rate": 6.022220642776838e-06, "loss": 2.588716735839844, "step": 995000 }, { "epoch": 1.2007210236834953, "learning_rate": 6.0218168073091e-06, "loss": 2.565452880859375, "step": 995100 }, { "epoch": 1.200841687005978, "learning_rate": 6.021412971841361e-06, "loss": 2.5673287963867186, "step": 995200 }, { "epoch": 1.2009623503284605, "learning_rate": 6.0210091363736226e-06, "loss": 2.5934765625, "step": 995300 }, { "epoch": 1.2010830136509434, "learning_rate": 6.020605300905884e-06, "loss": 2.592362060546875, "step": 995400 }, { "epoch": 1.201203676973426, "learning_rate": 6.020201465438146e-06, "loss": 2.58357177734375, "step": 995500 }, { "epoch": 1.2013243402959086, "learning_rate": 6.019797629970408e-06, "loss": 2.558121795654297, "step": 995600 }, { "epoch": 1.2014450036183915, "learning_rate": 6.01939379450267e-06, "loss": 2.5753555297851562, "step": 995700 }, { "epoch": 1.201565666940874, "learning_rate": 6.018989959034931e-06, "loss": 2.591250305175781, "step": 995800 }, { "epoch": 1.2016863302633567, "learning_rate": 6.018586123567193e-06, "loss": 2.5973391723632813, "step": 995900 }, { "epoch": 1.2018069935858393, "learning_rate": 6.018182288099453e-06, "loss": 2.570903625488281, "step": 996000 }, { "epoch": 1.2019276569083222, "learning_rate": 6.017778452631715e-06, "loss": 2.592829284667969, "step": 996100 }, { "epoch": 1.2020483202308048, "learning_rate": 6.017374617163977e-06, "loss": 2.583069152832031, "step": 996200 }, { "epoch": 1.2021689835532876, "learning_rate": 6.016970781696239e-06, "loss": 2.6080181884765623, "step": 996300 }, { "epoch": 1.2022896468757702, "learning_rate": 6.0165669462285e-06, "loss": 2.5774530029296874, "step": 996400 }, { "epoch": 1.2024103101982528, "learning_rate": 6.016163110760762e-06, "loss": 2.583879089355469, "step": 996500 }, { "epoch": 1.2025309735207355, "learning_rate": 6.015759275293024e-06, "loss": 2.613372802734375, "step": 996600 }, { "epoch": 1.2026516368432183, "learning_rate": 6.015355439825285e-06, "loss": 2.5959820556640625, "step": 996700 }, { "epoch": 1.202772300165701, "learning_rate": 6.014951604357546e-06, "loss": 2.6047817993164064, "step": 996800 }, { "epoch": 1.2028929634881835, "learning_rate": 6.014547768889808e-06, "loss": 2.5873379516601562, "step": 996900 }, { "epoch": 1.2030136268106664, "learning_rate": 6.0141439334220695e-06, "loss": 2.583349304199219, "step": 997000 }, { "epoch": 1.203134290133149, "learning_rate": 6.0137400979543315e-06, "loss": 2.60281982421875, "step": 997100 }, { "epoch": 1.2032549534556316, "learning_rate": 6.0133362624865935e-06, "loss": 2.60412353515625, "step": 997200 }, { "epoch": 1.2033756167781142, "learning_rate": 6.012932427018855e-06, "loss": 2.609312744140625, "step": 997300 }, { "epoch": 1.203496280100597, "learning_rate": 6.0125285915511166e-06, "loss": 2.5763665771484376, "step": 997400 }, { "epoch": 1.2036169434230797, "learning_rate": 6.0121247560833786e-06, "loss": 2.5854180908203124, "step": 997500 }, { "epoch": 1.2037376067455623, "learning_rate": 6.011720920615639e-06, "loss": 2.5799942016601562, "step": 997600 }, { "epoch": 1.2038582700680451, "learning_rate": 6.011317085147901e-06, "loss": 2.5823712158203125, "step": 997700 }, { "epoch": 1.2039789333905278, "learning_rate": 6.010913249680163e-06, "loss": 2.6094265747070313, "step": 997800 }, { "epoch": 1.2040995967130104, "learning_rate": 6.010509414212424e-06, "loss": 2.5981106567382812, "step": 997900 }, { "epoch": 1.2042202600354932, "learning_rate": 6.010105578744686e-06, "loss": 2.5972219848632814, "step": 998000 }, { "epoch": 1.2043409233579758, "learning_rate": 6.009701743276948e-06, "loss": 2.580426025390625, "step": 998100 }, { "epoch": 1.2044615866804584, "learning_rate": 6.00929790780921e-06, "loss": 2.585313720703125, "step": 998200 }, { "epoch": 1.2045822500029413, "learning_rate": 6.008894072341471e-06, "loss": 2.5883139038085936, "step": 998300 }, { "epoch": 1.204702913325424, "learning_rate": 6.008490236873732e-06, "loss": 2.5722528076171876, "step": 998400 }, { "epoch": 1.2048235766479065, "learning_rate": 6.008086401405993e-06, "loss": 2.581435241699219, "step": 998500 }, { "epoch": 1.2049442399703891, "learning_rate": 6.007682565938255e-06, "loss": 2.5993505859375, "step": 998600 }, { "epoch": 1.205064903292872, "learning_rate": 6.007278730470517e-06, "loss": 2.5977325439453125, "step": 998700 }, { "epoch": 1.2051855666153546, "learning_rate": 6.006874895002779e-06, "loss": 2.593480529785156, "step": 998800 }, { "epoch": 1.2053062299378372, "learning_rate": 6.00647105953504e-06, "loss": 2.5599436950683594, "step": 998900 }, { "epoch": 1.20542689326032, "learning_rate": 6.006067224067302e-06, "loss": 2.5618231201171877, "step": 999000 }, { "epoch": 1.2055475565828027, "learning_rate": 6.005663388599564e-06, "loss": 2.574082946777344, "step": 999100 }, { "epoch": 1.2056682199052853, "learning_rate": 6.0052595531318255e-06, "loss": 2.5980935668945313, "step": 999200 }, { "epoch": 1.205788883227768, "learning_rate": 6.004855717664087e-06, "loss": 2.587355651855469, "step": 999300 }, { "epoch": 1.2059095465502507, "learning_rate": 6.004451882196349e-06, "loss": 2.616277160644531, "step": 999400 }, { "epoch": 1.2060302098727333, "learning_rate": 6.00404804672861e-06, "loss": 2.572906188964844, "step": 999500 }, { "epoch": 1.206150873195216, "learning_rate": 6.003644211260872e-06, "loss": 2.6047576904296874, "step": 999600 }, { "epoch": 1.2062715365176988, "learning_rate": 6.003240375793134e-06, "loss": 2.590765075683594, "step": 999700 }, { "epoch": 1.2063921998401814, "learning_rate": 6.002836540325395e-06, "loss": 2.5794024658203125, "step": 999800 }, { "epoch": 1.206512863162664, "learning_rate": 6.002432704857657e-06, "loss": 2.599256591796875, "step": 999900 }, { "epoch": 1.2066335264851469, "learning_rate": 6.002028869389919e-06, "loss": 2.59798583984375, "step": 1000000 }, { "epoch": 1.2067541898076295, "learning_rate": 6.001625033922179e-06, "loss": 2.6022021484375, "step": 1000100 }, { "epoch": 1.2068748531301121, "learning_rate": 6.001221198454441e-06, "loss": 2.589915466308594, "step": 1000200 }, { "epoch": 1.206995516452595, "learning_rate": 6.000817362986703e-06, "loss": 2.5835858154296876, "step": 1000300 }, { "epoch": 1.2071161797750776, "learning_rate": 6.000413527518964e-06, "loss": 2.575775146484375, "step": 1000400 }, { "epoch": 1.2072368430975602, "learning_rate": 6.000009692051226e-06, "loss": 2.6158401489257814, "step": 1000500 }, { "epoch": 1.2073575064200428, "learning_rate": 5.999605856583488e-06, "loss": 2.5703643798828124, "step": 1000600 }, { "epoch": 1.2074781697425256, "learning_rate": 5.99920202111575e-06, "loss": 2.592787780761719, "step": 1000700 }, { "epoch": 1.2075988330650083, "learning_rate": 5.998798185648011e-06, "loss": 2.5765673828125, "step": 1000800 }, { "epoch": 1.2077194963874909, "learning_rate": 5.998394350180272e-06, "loss": 2.590276794433594, "step": 1000900 }, { "epoch": 1.2078401597099737, "learning_rate": 5.9979905147125335e-06, "loss": 2.5952838134765623, "step": 1001000 }, { "epoch": 1.2079608230324563, "learning_rate": 5.9975866792447955e-06, "loss": 2.5840444946289063, "step": 1001100 }, { "epoch": 1.208081486354939, "learning_rate": 5.9971828437770575e-06, "loss": 2.596746826171875, "step": 1001200 }, { "epoch": 1.2082021496774216, "learning_rate": 5.9967790083093195e-06, "loss": 2.5952243041992187, "step": 1001300 }, { "epoch": 1.2083228129999044, "learning_rate": 5.996375172841581e-06, "loss": 2.5795797729492187, "step": 1001400 }, { "epoch": 1.208443476322387, "learning_rate": 5.995971337373843e-06, "loss": 2.597052001953125, "step": 1001500 }, { "epoch": 1.2085641396448699, "learning_rate": 5.995567501906105e-06, "loss": 2.60904296875, "step": 1001600 }, { "epoch": 1.2086848029673525, "learning_rate": 5.995163666438365e-06, "loss": 2.58393310546875, "step": 1001700 }, { "epoch": 1.208805466289835, "learning_rate": 5.994759830970627e-06, "loss": 2.5913775634765623, "step": 1001800 }, { "epoch": 1.2089261296123177, "learning_rate": 5.994355995502889e-06, "loss": 2.595897216796875, "step": 1001900 }, { "epoch": 1.2090467929348006, "learning_rate": 5.99395216003515e-06, "loss": 2.6027267456054686, "step": 1002000 }, { "epoch": 1.2091674562572832, "learning_rate": 5.993548324567412e-06, "loss": 2.612747802734375, "step": 1002100 }, { "epoch": 1.2092881195797658, "learning_rate": 5.993144489099674e-06, "loss": 2.5940789794921875, "step": 1002200 }, { "epoch": 1.2094087829022486, "learning_rate": 5.992740653631935e-06, "loss": 2.5752850341796876, "step": 1002300 }, { "epoch": 1.2095294462247312, "learning_rate": 5.992336818164197e-06, "loss": 2.6042990112304687, "step": 1002400 }, { "epoch": 1.2096501095472139, "learning_rate": 5.991932982696458e-06, "loss": 2.559644927978516, "step": 1002500 }, { "epoch": 1.2097707728696965, "learning_rate": 5.991529147228719e-06, "loss": 2.5772573852539065, "step": 1002600 }, { "epoch": 1.2098914361921793, "learning_rate": 5.991125311760981e-06, "loss": 2.59503662109375, "step": 1002700 }, { "epoch": 1.210012099514662, "learning_rate": 5.990721476293243e-06, "loss": 2.56747802734375, "step": 1002800 }, { "epoch": 1.2101327628371445, "learning_rate": 5.9903176408255044e-06, "loss": 2.587383117675781, "step": 1002900 }, { "epoch": 1.2102534261596274, "learning_rate": 5.989913805357766e-06, "loss": 2.56919677734375, "step": 1003000 }, { "epoch": 1.21037408948211, "learning_rate": 5.989509969890028e-06, "loss": 2.571070251464844, "step": 1003100 }, { "epoch": 1.2104947528045926, "learning_rate": 5.98910613442229e-06, "loss": 2.5983941650390623, "step": 1003200 }, { "epoch": 1.2106154161270755, "learning_rate": 5.988702298954551e-06, "loss": 2.5665203857421877, "step": 1003300 }, { "epoch": 1.210736079449558, "learning_rate": 5.988298463486813e-06, "loss": 2.5752337646484373, "step": 1003400 }, { "epoch": 1.2108567427720407, "learning_rate": 5.987894628019074e-06, "loss": 2.597101745605469, "step": 1003500 }, { "epoch": 1.2109774060945235, "learning_rate": 5.987490792551336e-06, "loss": 2.5678146362304686, "step": 1003600 }, { "epoch": 1.2110980694170062, "learning_rate": 5.987086957083598e-06, "loss": 2.587971496582031, "step": 1003700 }, { "epoch": 1.2112187327394888, "learning_rate": 5.98668312161586e-06, "loss": 2.575755615234375, "step": 1003800 }, { "epoch": 1.2113393960619714, "learning_rate": 5.986279286148121e-06, "loss": 2.602939453125, "step": 1003900 }, { "epoch": 1.2114600593844542, "learning_rate": 5.985875450680383e-06, "loss": 2.5862451171875, "step": 1004000 }, { "epoch": 1.2115807227069368, "learning_rate": 5.985471615212645e-06, "loss": 2.5769580078125, "step": 1004100 }, { "epoch": 1.2117013860294195, "learning_rate": 5.985067779744905e-06, "loss": 2.598065185546875, "step": 1004200 }, { "epoch": 1.2118220493519023, "learning_rate": 5.984663944277167e-06, "loss": 2.5922921752929686, "step": 1004300 }, { "epoch": 1.211942712674385, "learning_rate": 5.984260108809429e-06, "loss": 2.609633483886719, "step": 1004400 }, { "epoch": 1.2120633759968675, "learning_rate": 5.98385627334169e-06, "loss": 2.572191162109375, "step": 1004500 }, { "epoch": 1.2121840393193501, "learning_rate": 5.983452437873952e-06, "loss": 2.5856863403320314, "step": 1004600 }, { "epoch": 1.212304702641833, "learning_rate": 5.983048602406214e-06, "loss": 2.5694955444335936, "step": 1004700 }, { "epoch": 1.2124253659643156, "learning_rate": 5.982644766938475e-06, "loss": 2.585050048828125, "step": 1004800 }, { "epoch": 1.2125460292867982, "learning_rate": 5.982240931470737e-06, "loss": 2.578052978515625, "step": 1004900 }, { "epoch": 1.212666692609281, "learning_rate": 5.9818370960029984e-06, "loss": 2.602294616699219, "step": 1005000 }, { "epoch": 1.2127873559317637, "learning_rate": 5.9814332605352596e-06, "loss": 2.5659774780273437, "step": 1005100 }, { "epoch": 1.2129080192542463, "learning_rate": 5.9810294250675216e-06, "loss": 2.5814544677734377, "step": 1005200 }, { "epoch": 1.2130286825767291, "learning_rate": 5.9806255895997835e-06, "loss": 2.5862973022460936, "step": 1005300 }, { "epoch": 1.2131493458992118, "learning_rate": 5.980221754132045e-06, "loss": 2.5864639282226562, "step": 1005400 }, { "epoch": 1.2132700092216944, "learning_rate": 5.979817918664307e-06, "loss": 2.589774475097656, "step": 1005500 }, { "epoch": 1.2133906725441772, "learning_rate": 5.979414083196569e-06, "loss": 2.5846380615234374, "step": 1005600 }, { "epoch": 1.2135113358666598, "learning_rate": 5.979010247728831e-06, "loss": 2.5954940795898436, "step": 1005700 }, { "epoch": 1.2136319991891424, "learning_rate": 5.978606412261091e-06, "loss": 2.573484191894531, "step": 1005800 }, { "epoch": 1.213752662511625, "learning_rate": 5.978202576793353e-06, "loss": 2.56675537109375, "step": 1005900 }, { "epoch": 1.213873325834108, "learning_rate": 5.977798741325614e-06, "loss": 2.586187744140625, "step": 1006000 }, { "epoch": 1.2139939891565905, "learning_rate": 5.977394905857876e-06, "loss": 2.609754943847656, "step": 1006100 }, { "epoch": 1.2141146524790731, "learning_rate": 5.976991070390138e-06, "loss": 2.5754776000976562, "step": 1006200 }, { "epoch": 1.214235315801556, "learning_rate": 5.9765872349224e-06, "loss": 2.6030758666992186, "step": 1006300 }, { "epoch": 1.2143559791240386, "learning_rate": 5.976183399454661e-06, "loss": 2.5884164428710936, "step": 1006400 }, { "epoch": 1.2144766424465212, "learning_rate": 5.975779563986923e-06, "loss": 2.583922119140625, "step": 1006500 }, { "epoch": 1.2145973057690038, "learning_rate": 5.975375728519183e-06, "loss": 2.5984136962890627, "step": 1006600 }, { "epoch": 1.2147179690914867, "learning_rate": 5.974971893051445e-06, "loss": 2.5869134521484374, "step": 1006700 }, { "epoch": 1.2148386324139693, "learning_rate": 5.974568057583707e-06, "loss": 2.5631427001953124, "step": 1006800 }, { "epoch": 1.2149592957364521, "learning_rate": 5.974164222115969e-06, "loss": 2.5816754150390624, "step": 1006900 }, { "epoch": 1.2150799590589347, "learning_rate": 5.9737603866482305e-06, "loss": 2.60897216796875, "step": 1007000 }, { "epoch": 1.2152006223814174, "learning_rate": 5.9733565511804924e-06, "loss": 2.5888934326171875, "step": 1007100 }, { "epoch": 1.2153212857039, "learning_rate": 5.9729527157127544e-06, "loss": 2.5836041259765623, "step": 1007200 }, { "epoch": 1.2154419490263828, "learning_rate": 5.972548880245016e-06, "loss": 2.5792245483398437, "step": 1007300 }, { "epoch": 1.2155626123488654, "learning_rate": 5.972145044777277e-06, "loss": 2.588428955078125, "step": 1007400 }, { "epoch": 1.215683275671348, "learning_rate": 5.971741209309539e-06, "loss": 2.5893218994140623, "step": 1007500 }, { "epoch": 1.2158039389938309, "learning_rate": 5.9713373738418e-06, "loss": 2.5528416442871094, "step": 1007600 }, { "epoch": 1.2159246023163135, "learning_rate": 5.970933538374062e-06, "loss": 2.5735791015625, "step": 1007700 }, { "epoch": 1.2160452656387961, "learning_rate": 5.970529702906324e-06, "loss": 2.5943756103515625, "step": 1007800 }, { "epoch": 1.2161659289612787, "learning_rate": 5.970125867438586e-06, "loss": 2.591111755371094, "step": 1007900 }, { "epoch": 1.2162865922837616, "learning_rate": 5.969722031970847e-06, "loss": 2.5735943603515623, "step": 1008000 }, { "epoch": 1.2164072556062442, "learning_rate": 5.969318196503109e-06, "loss": 2.585079345703125, "step": 1008100 }, { "epoch": 1.2165279189287268, "learning_rate": 5.968914361035369e-06, "loss": 2.6075390625, "step": 1008200 }, { "epoch": 1.2166485822512096, "learning_rate": 5.968510525567631e-06, "loss": 2.621576232910156, "step": 1008300 }, { "epoch": 1.2167692455736923, "learning_rate": 5.968106690099893e-06, "loss": 2.5724636840820314, "step": 1008400 }, { "epoch": 1.2168899088961749, "learning_rate": 5.967702854632155e-06, "loss": 2.576777038574219, "step": 1008500 }, { "epoch": 1.2170105722186577, "learning_rate": 5.967299019164416e-06, "loss": 2.546286926269531, "step": 1008600 }, { "epoch": 1.2171312355411403, "learning_rate": 5.966895183696678e-06, "loss": 2.5573577880859375, "step": 1008700 }, { "epoch": 1.217251898863623, "learning_rate": 5.96649134822894e-06, "loss": 2.5928268432617188, "step": 1008800 }, { "epoch": 1.2173725621861058, "learning_rate": 5.966087512761201e-06, "loss": 2.580580749511719, "step": 1008900 }, { "epoch": 1.2174932255085884, "learning_rate": 5.965683677293463e-06, "loss": 2.5976266479492187, "step": 1009000 }, { "epoch": 1.217613888831071, "learning_rate": 5.9652798418257245e-06, "loss": 2.5956884765625, "step": 1009100 }, { "epoch": 1.2177345521535536, "learning_rate": 5.964876006357986e-06, "loss": 2.5858905029296877, "step": 1009200 }, { "epoch": 1.2178552154760365, "learning_rate": 5.964472170890248e-06, "loss": 2.580829772949219, "step": 1009300 }, { "epoch": 1.217975878798519, "learning_rate": 5.9640683354225096e-06, "loss": 2.5541380310058592, "step": 1009400 }, { "epoch": 1.2180965421210017, "learning_rate": 5.963664499954771e-06, "loss": 2.586528625488281, "step": 1009500 }, { "epoch": 1.2182172054434846, "learning_rate": 5.963260664487033e-06, "loss": 2.588980407714844, "step": 1009600 }, { "epoch": 1.2183378687659672, "learning_rate": 5.962856829019295e-06, "loss": 2.580602111816406, "step": 1009700 }, { "epoch": 1.2184585320884498, "learning_rate": 5.962452993551557e-06, "loss": 2.595520324707031, "step": 1009800 }, { "epoch": 1.2185791954109324, "learning_rate": 5.962049158083817e-06, "loss": 2.599153747558594, "step": 1009900 }, { "epoch": 1.2186998587334152, "learning_rate": 5.961645322616079e-06, "loss": 2.595789489746094, "step": 1010000 }, { "epoch": 1.2188205220558979, "learning_rate": 5.96124148714834e-06, "loss": 2.590914001464844, "step": 1010100 }, { "epoch": 1.2189411853783805, "learning_rate": 5.960837651680602e-06, "loss": 2.564967041015625, "step": 1010200 }, { "epoch": 1.2190618487008633, "learning_rate": 5.960433816212864e-06, "loss": 2.5766860961914064, "step": 1010300 }, { "epoch": 1.219182512023346, "learning_rate": 5.960029980745126e-06, "loss": 2.5953353881835937, "step": 1010400 }, { "epoch": 1.2193031753458285, "learning_rate": 5.959626145277387e-06, "loss": 2.5832659912109377, "step": 1010500 }, { "epoch": 1.2194238386683114, "learning_rate": 5.959222309809649e-06, "loss": 2.5967367553710936, "step": 1010600 }, { "epoch": 1.219544501990794, "learning_rate": 5.958818474341909e-06, "loss": 2.5883367919921874, "step": 1010700 }, { "epoch": 1.2196651653132766, "learning_rate": 5.958414638874171e-06, "loss": 2.6250155639648436, "step": 1010800 }, { "epoch": 1.2197858286357595, "learning_rate": 5.958010803406433e-06, "loss": 2.6105307006835936, "step": 1010900 }, { "epoch": 1.219906491958242, "learning_rate": 5.957606967938695e-06, "loss": 2.576982421875, "step": 1011000 }, { "epoch": 1.2200271552807247, "learning_rate": 5.9572031324709565e-06, "loss": 2.5608700561523436, "step": 1011100 }, { "epoch": 1.2201478186032073, "learning_rate": 5.9567992970032185e-06, "loss": 2.5698013305664062, "step": 1011200 }, { "epoch": 1.2202684819256902, "learning_rate": 5.9563954615354805e-06, "loss": 2.6145455932617185, "step": 1011300 }, { "epoch": 1.2203891452481728, "learning_rate": 5.955991626067742e-06, "loss": 2.584559020996094, "step": 1011400 }, { "epoch": 1.2205098085706554, "learning_rate": 5.955587790600003e-06, "loss": 2.5740216064453123, "step": 1011500 }, { "epoch": 1.2206304718931382, "learning_rate": 5.955183955132265e-06, "loss": 2.5667410278320313, "step": 1011600 }, { "epoch": 1.2207511352156208, "learning_rate": 5.954780119664526e-06, "loss": 2.5802813720703126, "step": 1011700 }, { "epoch": 1.2208717985381035, "learning_rate": 5.954376284196788e-06, "loss": 2.5989065551757813, "step": 1011800 }, { "epoch": 1.220992461860586, "learning_rate": 5.95397244872905e-06, "loss": 2.599371032714844, "step": 1011900 }, { "epoch": 1.221113125183069, "learning_rate": 5.953568613261311e-06, "loss": 2.5724163818359376, "step": 1012000 }, { "epoch": 1.2212337885055515, "learning_rate": 5.953164777793573e-06, "loss": 2.5798876953125, "step": 1012100 }, { "epoch": 1.2213544518280344, "learning_rate": 5.952760942325835e-06, "loss": 2.5983615112304688, "step": 1012200 }, { "epoch": 1.221475115150517, "learning_rate": 5.952357106858095e-06, "loss": 2.57089599609375, "step": 1012300 }, { "epoch": 1.2215957784729996, "learning_rate": 5.951953271390357e-06, "loss": 2.6121051025390627, "step": 1012400 }, { "epoch": 1.2217164417954822, "learning_rate": 5.951549435922619e-06, "loss": 2.5913189697265624, "step": 1012500 }, { "epoch": 1.221837105117965, "learning_rate": 5.95114560045488e-06, "loss": 2.600299987792969, "step": 1012600 }, { "epoch": 1.2219577684404477, "learning_rate": 5.950741764987142e-06, "loss": 2.5685894775390623, "step": 1012700 }, { "epoch": 1.2220784317629303, "learning_rate": 5.950337929519404e-06, "loss": 2.5668499755859373, "step": 1012800 }, { "epoch": 1.2221990950854131, "learning_rate": 5.949934094051666e-06, "loss": 2.559784240722656, "step": 1012900 }, { "epoch": 1.2223197584078958, "learning_rate": 5.949530258583927e-06, "loss": 2.5756576538085936, "step": 1013000 }, { "epoch": 1.2224404217303784, "learning_rate": 5.9491264231161885e-06, "loss": 2.580562744140625, "step": 1013100 }, { "epoch": 1.222561085052861, "learning_rate": 5.94872258764845e-06, "loss": 2.5990469360351565, "step": 1013200 }, { "epoch": 1.2226817483753438, "learning_rate": 5.948318752180712e-06, "loss": 2.5695321655273435, "step": 1013300 }, { "epoch": 1.2228024116978264, "learning_rate": 5.947914916712974e-06, "loss": 2.5985983276367186, "step": 1013400 }, { "epoch": 1.222923075020309, "learning_rate": 5.947511081245236e-06, "loss": 2.5753765869140626, "step": 1013500 }, { "epoch": 1.223043738342792, "learning_rate": 5.947107245777497e-06, "loss": 2.5859478759765624, "step": 1013600 }, { "epoch": 1.2231644016652745, "learning_rate": 5.946703410309759e-06, "loss": 2.58534912109375, "step": 1013700 }, { "epoch": 1.2232850649877571, "learning_rate": 5.946299574842021e-06, "loss": 2.6025048828125, "step": 1013800 }, { "epoch": 1.22340572831024, "learning_rate": 5.945895739374281e-06, "loss": 2.5716546630859374, "step": 1013900 }, { "epoch": 1.2235263916327226, "learning_rate": 5.945491903906543e-06, "loss": 2.560941162109375, "step": 1014000 }, { "epoch": 1.2236470549552052, "learning_rate": 5.945088068438805e-06, "loss": 2.591849670410156, "step": 1014100 }, { "epoch": 1.223767718277688, "learning_rate": 5.944684232971066e-06, "loss": 2.5894015502929686, "step": 1014200 }, { "epoch": 1.2238883816001707, "learning_rate": 5.944280397503328e-06, "loss": 2.574870300292969, "step": 1014300 }, { "epoch": 1.2240090449226533, "learning_rate": 5.94387656203559e-06, "loss": 2.58961669921875, "step": 1014400 }, { "epoch": 1.224129708245136, "learning_rate": 5.943472726567851e-06, "loss": 2.6025775146484373, "step": 1014500 }, { "epoch": 1.2242503715676187, "learning_rate": 5.943068891100113e-06, "loss": 2.5637252807617186, "step": 1014600 }, { "epoch": 1.2243710348901014, "learning_rate": 5.942665055632375e-06, "loss": 2.5855807495117187, "step": 1014700 }, { "epoch": 1.224491698212584, "learning_rate": 5.9422612201646355e-06, "loss": 2.5637493896484376, "step": 1014800 }, { "epoch": 1.2246123615350668, "learning_rate": 5.9418573846968974e-06, "loss": 2.5867684936523436, "step": 1014900 }, { "epoch": 1.2247330248575494, "learning_rate": 5.941453549229159e-06, "loss": 2.5871240234375, "step": 1015000 }, { "epoch": 1.224853688180032, "learning_rate": 5.9410497137614206e-06, "loss": 2.5829156494140624, "step": 1015100 }, { "epoch": 1.2249743515025147, "learning_rate": 5.9406458782936825e-06, "loss": 2.593664245605469, "step": 1015200 }, { "epoch": 1.2250950148249975, "learning_rate": 5.9402420428259445e-06, "loss": 2.5732464599609375, "step": 1015300 }, { "epoch": 1.2252156781474801, "learning_rate": 5.9398382073582065e-06, "loss": 2.6002023315429685, "step": 1015400 }, { "epoch": 1.2253363414699627, "learning_rate": 5.939434371890468e-06, "loss": 2.5985226440429687, "step": 1015500 }, { "epoch": 1.2254570047924456, "learning_rate": 5.939030536422729e-06, "loss": 2.563104248046875, "step": 1015600 }, { "epoch": 1.2255776681149282, "learning_rate": 5.93862670095499e-06, "loss": 2.6057861328125, "step": 1015700 }, { "epoch": 1.2256983314374108, "learning_rate": 5.938222865487252e-06, "loss": 2.5816726684570312, "step": 1015800 }, { "epoch": 1.2258189947598936, "learning_rate": 5.937819030019514e-06, "loss": 2.580680236816406, "step": 1015900 }, { "epoch": 1.2259396580823763, "learning_rate": 5.937415194551776e-06, "loss": 2.560596618652344, "step": 1016000 }, { "epoch": 1.2260603214048589, "learning_rate": 5.937011359084037e-06, "loss": 2.5748028564453125, "step": 1016100 }, { "epoch": 1.2261809847273417, "learning_rate": 5.936607523616299e-06, "loss": 2.5657992553710938, "step": 1016200 }, { "epoch": 1.2263016480498243, "learning_rate": 5.936203688148561e-06, "loss": 2.5578631591796874, "step": 1016300 }, { "epoch": 1.226422311372307, "learning_rate": 5.935799852680821e-06, "loss": 2.5620596313476565, "step": 1016400 }, { "epoch": 1.2265429746947896, "learning_rate": 5.935396017213083e-06, "loss": 2.584797668457031, "step": 1016500 }, { "epoch": 1.2266636380172724, "learning_rate": 5.934992181745345e-06, "loss": 2.5792633056640626, "step": 1016600 }, { "epoch": 1.226784301339755, "learning_rate": 5.934588346277606e-06, "loss": 2.597567443847656, "step": 1016700 }, { "epoch": 1.2269049646622376, "learning_rate": 5.934184510809868e-06, "loss": 2.5470050048828123, "step": 1016800 }, { "epoch": 1.2270256279847205, "learning_rate": 5.93378067534213e-06, "loss": 2.560993347167969, "step": 1016900 }, { "epoch": 1.227146291307203, "learning_rate": 5.9333768398743914e-06, "loss": 2.596288146972656, "step": 1017000 }, { "epoch": 1.2272669546296857, "learning_rate": 5.932973004406653e-06, "loss": 2.6184005737304688, "step": 1017100 }, { "epoch": 1.2273876179521686, "learning_rate": 5.9325691689389146e-06, "loss": 2.6032421875, "step": 1017200 }, { "epoch": 1.2275082812746512, "learning_rate": 5.932165333471176e-06, "loss": 2.5805453491210937, "step": 1017300 }, { "epoch": 1.2276289445971338, "learning_rate": 5.931761498003438e-06, "loss": 2.588258972167969, "step": 1017400 }, { "epoch": 1.2277496079196166, "learning_rate": 5.9313576625357e-06, "loss": 2.6049960327148436, "step": 1017500 }, { "epoch": 1.2278702712420992, "learning_rate": 5.930953827067961e-06, "loss": 2.5819232177734377, "step": 1017600 }, { "epoch": 1.2279909345645819, "learning_rate": 5.930549991600223e-06, "loss": 2.545513153076172, "step": 1017700 }, { "epoch": 1.2281115978870645, "learning_rate": 5.930146156132485e-06, "loss": 2.5869342041015626, "step": 1017800 }, { "epoch": 1.2282322612095473, "learning_rate": 5.929742320664747e-06, "loss": 2.582342529296875, "step": 1017900 }, { "epoch": 1.22835292453203, "learning_rate": 5.929338485197007e-06, "loss": 2.587716064453125, "step": 1018000 }, { "epoch": 1.2284735878545125, "learning_rate": 5.928934649729269e-06, "loss": 2.5404266357421874, "step": 1018100 }, { "epoch": 1.2285942511769954, "learning_rate": 5.92853081426153e-06, "loss": 2.5661883544921875, "step": 1018200 }, { "epoch": 1.228714914499478, "learning_rate": 5.928126978793792e-06, "loss": 2.5905621337890623, "step": 1018300 }, { "epoch": 1.2288355778219606, "learning_rate": 5.927723143326054e-06, "loss": 2.5755108642578124, "step": 1018400 }, { "epoch": 1.2289562411444432, "learning_rate": 5.927319307858316e-06, "loss": 2.56387451171875, "step": 1018500 }, { "epoch": 1.229076904466926, "learning_rate": 5.926915472390577e-06, "loss": 2.5725115966796874, "step": 1018600 }, { "epoch": 1.2291975677894087, "learning_rate": 5.926511636922839e-06, "loss": 2.558067169189453, "step": 1018700 }, { "epoch": 1.2293182311118913, "learning_rate": 5.9261078014550995e-06, "loss": 2.5850933837890624, "step": 1018800 }, { "epoch": 1.2294388944343742, "learning_rate": 5.9257039659873615e-06, "loss": 2.598403015136719, "step": 1018900 }, { "epoch": 1.2295595577568568, "learning_rate": 5.9253001305196235e-06, "loss": 2.589814453125, "step": 1019000 }, { "epoch": 1.2296802210793394, "learning_rate": 5.9248962950518854e-06, "loss": 2.5627410888671873, "step": 1019100 }, { "epoch": 1.2298008844018222, "learning_rate": 5.924492459584147e-06, "loss": 2.5807815551757813, "step": 1019200 }, { "epoch": 1.2299215477243048, "learning_rate": 5.9240886241164086e-06, "loss": 2.5710955810546876, "step": 1019300 }, { "epoch": 1.2300422110467875, "learning_rate": 5.9236847886486705e-06, "loss": 2.5698678588867185, "step": 1019400 }, { "epoch": 1.2301628743692703, "learning_rate": 5.923280953180932e-06, "loss": 2.564097595214844, "step": 1019500 }, { "epoch": 1.230283537691753, "learning_rate": 5.922877117713194e-06, "loss": 2.5924981689453124, "step": 1019600 }, { "epoch": 1.2304042010142355, "learning_rate": 5.922473282245455e-06, "loss": 2.57291748046875, "step": 1019700 }, { "epoch": 1.2305248643367181, "learning_rate": 5.922069446777716e-06, "loss": 2.5727304077148436, "step": 1019800 }, { "epoch": 1.230645527659201, "learning_rate": 5.921665611309978e-06, "loss": 2.5788339233398436, "step": 1019900 }, { "epoch": 1.2307661909816836, "learning_rate": 5.92126177584224e-06, "loss": 2.5874810791015626, "step": 1020000 }, { "epoch": 1.2308868543041662, "learning_rate": 5.920857940374501e-06, "loss": 2.5760073852539063, "step": 1020100 }, { "epoch": 1.231007517626649, "learning_rate": 5.920454104906763e-06, "loss": 2.587437744140625, "step": 1020200 }, { "epoch": 1.2311281809491317, "learning_rate": 5.920050269439025e-06, "loss": 2.5756292724609375, "step": 1020300 }, { "epoch": 1.2312488442716143, "learning_rate": 5.919646433971287e-06, "loss": 2.589193115234375, "step": 1020400 }, { "epoch": 1.231369507594097, "learning_rate": 5.919242598503547e-06, "loss": 2.562017822265625, "step": 1020500 }, { "epoch": 1.2314901709165798, "learning_rate": 5.918838763035809e-06, "loss": 2.5798434448242187, "step": 1020600 }, { "epoch": 1.2316108342390624, "learning_rate": 5.91843492756807e-06, "loss": 2.5695706176757813, "step": 1020700 }, { "epoch": 1.231731497561545, "learning_rate": 5.918031092100332e-06, "loss": 2.5691094970703126, "step": 1020800 }, { "epoch": 1.2318521608840278, "learning_rate": 5.917627256632594e-06, "loss": 2.5695654296875, "step": 1020900 }, { "epoch": 1.2319728242065104, "learning_rate": 5.917223421164856e-06, "loss": 2.5628091430664064, "step": 1021000 }, { "epoch": 1.232093487528993, "learning_rate": 5.9168195856971175e-06, "loss": 2.58782470703125, "step": 1021100 }, { "epoch": 1.232214150851476, "learning_rate": 5.9164157502293795e-06, "loss": 2.6009478759765625, "step": 1021200 }, { "epoch": 1.2323348141739585, "learning_rate": 5.91601191476164e-06, "loss": 2.5747552490234376, "step": 1021300 }, { "epoch": 1.2324554774964411, "learning_rate": 5.915608079293902e-06, "loss": 2.5673068237304686, "step": 1021400 }, { "epoch": 1.232576140818924, "learning_rate": 5.915204243826164e-06, "loss": 2.590911865234375, "step": 1021500 }, { "epoch": 1.2326968041414066, "learning_rate": 5.914800408358426e-06, "loss": 2.57565185546875, "step": 1021600 }, { "epoch": 1.2328174674638892, "learning_rate": 5.914396572890687e-06, "loss": 2.563990478515625, "step": 1021700 }, { "epoch": 1.2329381307863718, "learning_rate": 5.913992737422949e-06, "loss": 2.5801165771484373, "step": 1021800 }, { "epoch": 1.2330587941088547, "learning_rate": 5.913588901955211e-06, "loss": 2.57489990234375, "step": 1021900 }, { "epoch": 1.2331794574313373, "learning_rate": 5.913185066487473e-06, "loss": 2.5673898315429686, "step": 1022000 }, { "epoch": 1.23330012075382, "learning_rate": 5.912781231019733e-06, "loss": 2.5683993530273437, "step": 1022100 }, { "epoch": 1.2334207840763027, "learning_rate": 5.912377395551995e-06, "loss": 2.5726885986328125, "step": 1022200 }, { "epoch": 1.2335414473987854, "learning_rate": 5.911973560084256e-06, "loss": 2.5826580810546873, "step": 1022300 }, { "epoch": 1.233662110721268, "learning_rate": 5.911569724616518e-06, "loss": 2.5695654296875, "step": 1022400 }, { "epoch": 1.2337827740437508, "learning_rate": 5.91116588914878e-06, "loss": 2.5981793212890625, "step": 1022500 }, { "epoch": 1.2339034373662334, "learning_rate": 5.910762053681042e-06, "loss": 2.6036337280273436, "step": 1022600 }, { "epoch": 1.234024100688716, "learning_rate": 5.910358218213303e-06, "loss": 2.5956201171875, "step": 1022700 }, { "epoch": 1.2341447640111989, "learning_rate": 5.909954382745565e-06, "loss": 2.591326904296875, "step": 1022800 }, { "epoch": 1.2342654273336815, "learning_rate": 5.9095505472778255e-06, "loss": 2.5851556396484376, "step": 1022900 }, { "epoch": 1.2343860906561641, "learning_rate": 5.9091467118100875e-06, "loss": 2.569710693359375, "step": 1023000 }, { "epoch": 1.2345067539786467, "learning_rate": 5.9087428763423495e-06, "loss": 2.5506663513183594, "step": 1023100 }, { "epoch": 1.2346274173011296, "learning_rate": 5.9083390408746115e-06, "loss": 2.5703115844726563, "step": 1023200 }, { "epoch": 1.2347480806236122, "learning_rate": 5.907935205406873e-06, "loss": 2.5755209350585937, "step": 1023300 }, { "epoch": 1.2348687439460948, "learning_rate": 5.907531369939135e-06, "loss": 2.5782376098632813, "step": 1023400 }, { "epoch": 1.2349894072685776, "learning_rate": 5.907127534471397e-06, "loss": 2.573221435546875, "step": 1023500 }, { "epoch": 1.2351100705910603, "learning_rate": 5.906723699003658e-06, "loss": 2.5700628662109377, "step": 1023600 }, { "epoch": 1.2352307339135429, "learning_rate": 5.906319863535919e-06, "loss": 2.5920675659179686, "step": 1023700 }, { "epoch": 1.2353513972360255, "learning_rate": 5.905916028068181e-06, "loss": 2.5798291015625, "step": 1023800 }, { "epoch": 1.2354720605585083, "learning_rate": 5.905512192600442e-06, "loss": 2.5943057250976564, "step": 1023900 }, { "epoch": 1.235592723880991, "learning_rate": 5.905108357132704e-06, "loss": 2.5800274658203124, "step": 1024000 }, { "epoch": 1.2357133872034736, "learning_rate": 5.904704521664966e-06, "loss": 2.5889321899414064, "step": 1024100 }, { "epoch": 1.2358340505259564, "learning_rate": 5.904300686197227e-06, "loss": 2.564385986328125, "step": 1024200 }, { "epoch": 1.235954713848439, "learning_rate": 5.903896850729489e-06, "loss": 2.6105340576171874, "step": 1024300 }, { "epoch": 1.2360753771709216, "learning_rate": 5.903493015261751e-06, "loss": 2.5809716796875, "step": 1024400 }, { "epoch": 1.2361960404934045, "learning_rate": 5.903089179794013e-06, "loss": 2.5610528564453126, "step": 1024500 }, { "epoch": 1.236316703815887, "learning_rate": 5.902685344326273e-06, "loss": 2.594942932128906, "step": 1024600 }, { "epoch": 1.2364373671383697, "learning_rate": 5.902281508858535e-06, "loss": 2.576158142089844, "step": 1024700 }, { "epoch": 1.2365580304608526, "learning_rate": 5.9018776733907964e-06, "loss": 2.5567692565917968, "step": 1024800 }, { "epoch": 1.2366786937833352, "learning_rate": 5.901473837923058e-06, "loss": 2.549102325439453, "step": 1024900 }, { "epoch": 1.2367993571058178, "learning_rate": 5.90107000245532e-06, "loss": 2.5981866455078126, "step": 1025000 }, { "epoch": 1.2369200204283004, "learning_rate": 5.900666166987582e-06, "loss": 2.5764703369140625, "step": 1025100 }, { "epoch": 1.2370406837507832, "learning_rate": 5.9002623315198435e-06, "loss": 2.588198547363281, "step": 1025200 }, { "epoch": 1.2371613470732659, "learning_rate": 5.8998584960521055e-06, "loss": 2.6126971435546875, "step": 1025300 }, { "epoch": 1.2372820103957485, "learning_rate": 5.899454660584366e-06, "loss": 2.5732321166992187, "step": 1025400 }, { "epoch": 1.2374026737182313, "learning_rate": 5.899050825116628e-06, "loss": 2.5666802978515624, "step": 1025500 }, { "epoch": 1.237523337040714, "learning_rate": 5.89864698964889e-06, "loss": 2.5667520141601563, "step": 1025600 }, { "epoch": 1.2376440003631966, "learning_rate": 5.898243154181152e-06, "loss": 2.5740420532226564, "step": 1025700 }, { "epoch": 1.2377646636856792, "learning_rate": 5.897839318713413e-06, "loss": 2.5834451293945313, "step": 1025800 }, { "epoch": 1.237885327008162, "learning_rate": 5.897435483245675e-06, "loss": 2.59651611328125, "step": 1025900 }, { "epoch": 1.2380059903306446, "learning_rate": 5.897031647777937e-06, "loss": 2.5785757446289064, "step": 1026000 }, { "epoch": 1.2381266536531272, "learning_rate": 5.896627812310198e-06, "loss": 2.57478271484375, "step": 1026100 }, { "epoch": 1.23824731697561, "learning_rate": 5.896223976842459e-06, "loss": 2.5710128784179687, "step": 1026200 }, { "epoch": 1.2383679802980927, "learning_rate": 5.895820141374721e-06, "loss": 2.5934182739257814, "step": 1026300 }, { "epoch": 1.2384886436205753, "learning_rate": 5.895416305906982e-06, "loss": 2.57549560546875, "step": 1026400 }, { "epoch": 1.2386093069430582, "learning_rate": 5.895012470439244e-06, "loss": 2.5815325927734376, "step": 1026500 }, { "epoch": 1.2387299702655408, "learning_rate": 5.894608634971506e-06, "loss": 2.5846102905273436, "step": 1026600 }, { "epoch": 1.2388506335880234, "learning_rate": 5.894204799503767e-06, "loss": 2.581850280761719, "step": 1026700 }, { "epoch": 1.2389712969105062, "learning_rate": 5.893800964036029e-06, "loss": 2.5762557983398438, "step": 1026800 }, { "epoch": 1.2390919602329888, "learning_rate": 5.893397128568291e-06, "loss": 2.552881774902344, "step": 1026900 }, { "epoch": 1.2392126235554715, "learning_rate": 5.8929932931005516e-06, "loss": 2.5915011596679687, "step": 1027000 }, { "epoch": 1.239333286877954, "learning_rate": 5.8925894576328136e-06, "loss": 2.5776803588867185, "step": 1027100 }, { "epoch": 1.239453950200437, "learning_rate": 5.8921856221650755e-06, "loss": 2.5636300659179687, "step": 1027200 }, { "epoch": 1.2395746135229195, "learning_rate": 5.891781786697337e-06, "loss": 2.5549781799316404, "step": 1027300 }, { "epoch": 1.2396952768454021, "learning_rate": 5.891377951229599e-06, "loss": 2.6003350830078125, "step": 1027400 }, { "epoch": 1.239815940167885, "learning_rate": 5.890974115761861e-06, "loss": 2.602364807128906, "step": 1027500 }, { "epoch": 1.2399366034903676, "learning_rate": 5.890570280294123e-06, "loss": 2.587572021484375, "step": 1027600 }, { "epoch": 1.2400572668128502, "learning_rate": 5.890166444826384e-06, "loss": 2.5666159057617186, "step": 1027700 }, { "epoch": 1.240177930135333, "learning_rate": 5.889762609358645e-06, "loss": 2.5734954833984376, "step": 1027800 }, { "epoch": 1.2402985934578157, "learning_rate": 5.889358773890906e-06, "loss": 2.579728698730469, "step": 1027900 }, { "epoch": 1.2404192567802983, "learning_rate": 5.888954938423168e-06, "loss": 2.581354675292969, "step": 1028000 }, { "epoch": 1.2405399201027811, "learning_rate": 5.88855110295543e-06, "loss": 2.5821795654296875, "step": 1028100 }, { "epoch": 1.2406605834252638, "learning_rate": 5.888147267487692e-06, "loss": 2.576739501953125, "step": 1028200 }, { "epoch": 1.2407812467477464, "learning_rate": 5.887743432019953e-06, "loss": 2.5585662841796877, "step": 1028300 }, { "epoch": 1.240901910070229, "learning_rate": 5.887339596552215e-06, "loss": 2.565641174316406, "step": 1028400 }, { "epoch": 1.2410225733927118, "learning_rate": 5.886935761084477e-06, "loss": 2.5601046752929686, "step": 1028500 }, { "epoch": 1.2411432367151944, "learning_rate": 5.886531925616737e-06, "loss": 2.5611080932617187, "step": 1028600 }, { "epoch": 1.241263900037677, "learning_rate": 5.886128090148999e-06, "loss": 2.5803659057617185, "step": 1028700 }, { "epoch": 1.24138456336016, "learning_rate": 5.885724254681261e-06, "loss": 2.5764834594726564, "step": 1028800 }, { "epoch": 1.2415052266826425, "learning_rate": 5.8853204192135225e-06, "loss": 2.5672332763671877, "step": 1028900 }, { "epoch": 1.2416258900051251, "learning_rate": 5.8849165837457844e-06, "loss": 2.6005902099609375, "step": 1029000 }, { "epoch": 1.2417465533276077, "learning_rate": 5.8845127482780464e-06, "loss": 2.572349853515625, "step": 1029100 }, { "epoch": 1.2418672166500906, "learning_rate": 5.8841089128103076e-06, "loss": 2.579498596191406, "step": 1029200 }, { "epoch": 1.2419878799725732, "learning_rate": 5.8837050773425695e-06, "loss": 2.558224639892578, "step": 1029300 }, { "epoch": 1.2421085432950558, "learning_rate": 5.883301241874831e-06, "loss": 2.5915542602539063, "step": 1029400 }, { "epoch": 1.2422292066175387, "learning_rate": 5.882897406407092e-06, "loss": 2.5669259643554687, "step": 1029500 }, { "epoch": 1.2423498699400213, "learning_rate": 5.882493570939354e-06, "loss": 2.5986865234375, "step": 1029600 }, { "epoch": 1.242470533262504, "learning_rate": 5.882089735471616e-06, "loss": 2.5906521606445314, "step": 1029700 }, { "epoch": 1.2425911965849867, "learning_rate": 5.881685900003877e-06, "loss": 2.5731011962890626, "step": 1029800 }, { "epoch": 1.2427118599074694, "learning_rate": 5.881282064536139e-06, "loss": 2.573765869140625, "step": 1029900 }, { "epoch": 1.242832523229952, "learning_rate": 5.880878229068401e-06, "loss": 2.5928689575195314, "step": 1030000 }, { "epoch": 1.2429531865524348, "learning_rate": 5.880474393600663e-06, "loss": 2.5732913208007813, "step": 1030100 }, { "epoch": 1.2430738498749174, "learning_rate": 5.880070558132924e-06, "loss": 2.57040283203125, "step": 1030200 }, { "epoch": 1.2431945131974, "learning_rate": 5.879666722665185e-06, "loss": 2.5650543212890624, "step": 1030300 }, { "epoch": 1.2433151765198827, "learning_rate": 5.879262887197446e-06, "loss": 2.5589169311523436, "step": 1030400 }, { "epoch": 1.2434358398423655, "learning_rate": 5.878859051729708e-06, "loss": 2.564941711425781, "step": 1030500 }, { "epoch": 1.2435565031648481, "learning_rate": 5.87845521626197e-06, "loss": 2.57875244140625, "step": 1030600 }, { "epoch": 1.2436771664873307, "learning_rate": 5.878051380794232e-06, "loss": 2.5807293701171874, "step": 1030700 }, { "epoch": 1.2437978298098136, "learning_rate": 5.877647545326493e-06, "loss": 2.5875729370117186, "step": 1030800 }, { "epoch": 1.2439184931322962, "learning_rate": 5.877243709858755e-06, "loss": 2.586211853027344, "step": 1030900 }, { "epoch": 1.2440391564547788, "learning_rate": 5.876839874391017e-06, "loss": 2.5505551147460936, "step": 1031000 }, { "epoch": 1.2441598197772614, "learning_rate": 5.876436038923278e-06, "loss": 2.5652499389648438, "step": 1031100 }, { "epoch": 1.2442804830997443, "learning_rate": 5.87603220345554e-06, "loss": 2.5610516357421873, "step": 1031200 }, { "epoch": 1.2444011464222269, "learning_rate": 5.8756283679878016e-06, "loss": 2.5752438354492186, "step": 1031300 }, { "epoch": 1.2445218097447095, "learning_rate": 5.875224532520063e-06, "loss": 2.580528564453125, "step": 1031400 }, { "epoch": 1.2446424730671923, "learning_rate": 5.874820697052325e-06, "loss": 2.576431884765625, "step": 1031500 }, { "epoch": 1.244763136389675, "learning_rate": 5.874416861584587e-06, "loss": 2.59281982421875, "step": 1031600 }, { "epoch": 1.2448837997121576, "learning_rate": 5.874013026116848e-06, "loss": 2.5754684448242187, "step": 1031700 }, { "epoch": 1.2450044630346404, "learning_rate": 5.87360919064911e-06, "loss": 2.5601904296875, "step": 1031800 }, { "epoch": 1.245125126357123, "learning_rate": 5.873205355181371e-06, "loss": 2.574876708984375, "step": 1031900 }, { "epoch": 1.2452457896796056, "learning_rate": 5.872801519713632e-06, "loss": 2.589632873535156, "step": 1032000 }, { "epoch": 1.2453664530020885, "learning_rate": 5.872397684245894e-06, "loss": 2.582591247558594, "step": 1032100 }, { "epoch": 1.245487116324571, "learning_rate": 5.871993848778156e-06, "loss": 2.621709289550781, "step": 1032200 }, { "epoch": 1.2456077796470537, "learning_rate": 5.871590013310417e-06, "loss": 2.5934747314453124, "step": 1032300 }, { "epoch": 1.2457284429695363, "learning_rate": 5.871186177842679e-06, "loss": 2.545093994140625, "step": 1032400 }, { "epoch": 1.2458491062920192, "learning_rate": 5.870782342374941e-06, "loss": 2.556499481201172, "step": 1032500 }, { "epoch": 1.2459697696145018, "learning_rate": 5.870378506907203e-06, "loss": 2.5697467041015627, "step": 1032600 }, { "epoch": 1.2460904329369844, "learning_rate": 5.869974671439463e-06, "loss": 2.574124450683594, "step": 1032700 }, { "epoch": 1.2462110962594672, "learning_rate": 5.869570835971725e-06, "loss": 2.5778768920898436, "step": 1032800 }, { "epoch": 1.2463317595819499, "learning_rate": 5.8691670005039865e-06, "loss": 2.563542785644531, "step": 1032900 }, { "epoch": 1.2464524229044325, "learning_rate": 5.8687631650362485e-06, "loss": 2.54975830078125, "step": 1033000 }, { "epoch": 1.2465730862269153, "learning_rate": 5.8683593295685105e-06, "loss": 2.5907241821289064, "step": 1033100 }, { "epoch": 1.246693749549398, "learning_rate": 5.8679554941007725e-06, "loss": 2.6201617431640627, "step": 1033200 }, { "epoch": 1.2468144128718806, "learning_rate": 5.867551658633034e-06, "loss": 2.5735848999023436, "step": 1033300 }, { "epoch": 1.2469350761943634, "learning_rate": 5.867147823165296e-06, "loss": 2.5545513916015623, "step": 1033400 }, { "epoch": 1.247055739516846, "learning_rate": 5.866743987697556e-06, "loss": 2.5682077026367187, "step": 1033500 }, { "epoch": 1.2471764028393286, "learning_rate": 5.866340152229818e-06, "loss": 2.5855557250976564, "step": 1033600 }, { "epoch": 1.2472970661618112, "learning_rate": 5.86593631676208e-06, "loss": 2.6001824951171875, "step": 1033700 }, { "epoch": 1.247417729484294, "learning_rate": 5.865532481294342e-06, "loss": 2.5750567626953127, "step": 1033800 }, { "epoch": 1.2475383928067767, "learning_rate": 5.865128645826603e-06, "loss": 2.5685150146484377, "step": 1033900 }, { "epoch": 1.2476590561292593, "learning_rate": 5.864724810358865e-06, "loss": 2.56471435546875, "step": 1034000 }, { "epoch": 1.2477797194517422, "learning_rate": 5.864320974891127e-06, "loss": 2.568558654785156, "step": 1034100 }, { "epoch": 1.2479003827742248, "learning_rate": 5.863917139423388e-06, "loss": 2.5705447387695313, "step": 1034200 }, { "epoch": 1.2480210460967074, "learning_rate": 5.863513303955649e-06, "loss": 2.597641906738281, "step": 1034300 }, { "epoch": 1.24814170941919, "learning_rate": 5.863109468487911e-06, "loss": 2.585174865722656, "step": 1034400 }, { "epoch": 1.2482623727416728, "learning_rate": 5.862705633020172e-06, "loss": 2.5941226196289064, "step": 1034500 }, { "epoch": 1.2483830360641555, "learning_rate": 5.862301797552434e-06, "loss": 2.563055419921875, "step": 1034600 }, { "epoch": 1.248503699386638, "learning_rate": 5.861897962084696e-06, "loss": 2.5504881286621095, "step": 1034700 }, { "epoch": 1.248624362709121, "learning_rate": 5.861494126616957e-06, "loss": 2.583792419433594, "step": 1034800 }, { "epoch": 1.2487450260316035, "learning_rate": 5.861090291149219e-06, "loss": 2.5734686279296874, "step": 1034900 }, { "epoch": 1.2488656893540862, "learning_rate": 5.860686455681481e-06, "loss": 2.5820986938476564, "step": 1035000 }, { "epoch": 1.248986352676569, "learning_rate": 5.860282620213743e-06, "loss": 2.5769342041015624, "step": 1035100 }, { "epoch": 1.2491070159990516, "learning_rate": 5.859878784746004e-06, "loss": 2.5595770263671875, "step": 1035200 }, { "epoch": 1.2492276793215342, "learning_rate": 5.859474949278266e-06, "loss": 2.568662109375, "step": 1035300 }, { "epoch": 1.249348342644017, "learning_rate": 5.859071113810527e-06, "loss": 2.587207946777344, "step": 1035400 }, { "epoch": 1.2494690059664997, "learning_rate": 5.858667278342789e-06, "loss": 2.5830438232421873, "step": 1035500 }, { "epoch": 1.2495896692889823, "learning_rate": 5.858263442875051e-06, "loss": 2.5693045043945313, "step": 1035600 }, { "epoch": 1.249710332611465, "learning_rate": 5.857859607407313e-06, "loss": 2.6058050537109376, "step": 1035700 }, { "epoch": 1.2498309959339478, "learning_rate": 5.857455771939574e-06, "loss": 2.5602716064453124, "step": 1035800 }, { "epoch": 1.2499516592564304, "learning_rate": 5.857051936471836e-06, "loss": 2.596555480957031, "step": 1035900 }, { "epoch": 1.250072322578913, "learning_rate": 5.856648101004096e-06, "loss": 2.5707138061523436, "step": 1036000 }, { "epoch": 1.2501929859013958, "learning_rate": 5.856244265536358e-06, "loss": 2.5623870849609376, "step": 1036100 }, { "epoch": 1.2503136492238784, "learning_rate": 5.85584043006862e-06, "loss": 2.583456726074219, "step": 1036200 }, { "epoch": 1.250434312546361, "learning_rate": 5.855436594600882e-06, "loss": 2.591029052734375, "step": 1036300 }, { "epoch": 1.2505549758688437, "learning_rate": 5.855032759133143e-06, "loss": 2.566769714355469, "step": 1036400 }, { "epoch": 1.2506756391913265, "learning_rate": 5.854628923665405e-06, "loss": 2.543016815185547, "step": 1036500 }, { "epoch": 1.2507963025138091, "learning_rate": 5.854225088197667e-06, "loss": 2.57762939453125, "step": 1036600 }, { "epoch": 1.250916965836292, "learning_rate": 5.853821252729929e-06, "loss": 2.5715655517578124, "step": 1036700 }, { "epoch": 1.2510376291587746, "learning_rate": 5.8534174172621894e-06, "loss": 2.5758673095703126, "step": 1036800 }, { "epoch": 1.2511582924812572, "learning_rate": 5.853013581794451e-06, "loss": 2.5595013427734377, "step": 1036900 }, { "epoch": 1.2512789558037398, "learning_rate": 5.8526097463267125e-06, "loss": 2.5726904296875, "step": 1037000 }, { "epoch": 1.2513996191262227, "learning_rate": 5.8522059108589745e-06, "loss": 2.5846438598632813, "step": 1037100 }, { "epoch": 1.2515202824487053, "learning_rate": 5.8518020753912365e-06, "loss": 2.594224548339844, "step": 1037200 }, { "epoch": 1.251640945771188, "learning_rate": 5.8513982399234985e-06, "loss": 2.558871612548828, "step": 1037300 }, { "epoch": 1.2517616090936707, "learning_rate": 5.85099440445576e-06, "loss": 2.5607635498046877, "step": 1037400 }, { "epoch": 1.2518822724161534, "learning_rate": 5.850590568988022e-06, "loss": 2.574246826171875, "step": 1037500 }, { "epoch": 1.252002935738636, "learning_rate": 5.850186733520282e-06, "loss": 2.577664489746094, "step": 1037600 }, { "epoch": 1.2521235990611186, "learning_rate": 5.849782898052544e-06, "loss": 2.5578302001953124, "step": 1037700 }, { "epoch": 1.2522442623836014, "learning_rate": 5.849379062584806e-06, "loss": 2.597474365234375, "step": 1037800 }, { "epoch": 1.252364925706084, "learning_rate": 5.848975227117068e-06, "loss": 2.5837051391601564, "step": 1037900 }, { "epoch": 1.2524855890285667, "learning_rate": 5.848571391649329e-06, "loss": 2.5668695068359373, "step": 1038000 }, { "epoch": 1.2526062523510495, "learning_rate": 5.848167556181591e-06, "loss": 2.587239990234375, "step": 1038100 }, { "epoch": 1.2527269156735321, "learning_rate": 5.847763720713853e-06, "loss": 2.599979248046875, "step": 1038200 }, { "epoch": 1.2528475789960147, "learning_rate": 5.847359885246114e-06, "loss": 2.5660751342773436, "step": 1038300 }, { "epoch": 1.2529682423184973, "learning_rate": 5.846956049778375e-06, "loss": 2.587227478027344, "step": 1038400 }, { "epoch": 1.2530889056409802, "learning_rate": 5.846552214310637e-06, "loss": 2.5789007568359374, "step": 1038500 }, { "epoch": 1.2532095689634628, "learning_rate": 5.846148378842898e-06, "loss": 2.5445977783203126, "step": 1038600 }, { "epoch": 1.2533302322859456, "learning_rate": 5.84574454337516e-06, "loss": 2.568819580078125, "step": 1038700 }, { "epoch": 1.2534508956084283, "learning_rate": 5.845340707907422e-06, "loss": 2.558331298828125, "step": 1038800 }, { "epoch": 1.2535715589309109, "learning_rate": 5.8449368724396834e-06, "loss": 2.5463351440429687, "step": 1038900 }, { "epoch": 1.2536922222533935, "learning_rate": 5.844533036971945e-06, "loss": 2.5758547973632813, "step": 1039000 }, { "epoch": 1.2538128855758763, "learning_rate": 5.844129201504207e-06, "loss": 2.5461572265625, "step": 1039100 }, { "epoch": 1.253933548898359, "learning_rate": 5.843725366036468e-06, "loss": 2.56326904296875, "step": 1039200 }, { "epoch": 1.2540542122208416, "learning_rate": 5.84332153056873e-06, "loss": 2.588012390136719, "step": 1039300 }, { "epoch": 1.2541748755433244, "learning_rate": 5.842917695100992e-06, "loss": 2.5572355651855467, "step": 1039400 }, { "epoch": 1.254295538865807, "learning_rate": 5.842513859633253e-06, "loss": 2.568190002441406, "step": 1039500 }, { "epoch": 1.2544162021882896, "learning_rate": 5.842110024165515e-06, "loss": 2.592143859863281, "step": 1039600 }, { "epoch": 1.2545368655107723, "learning_rate": 5.841706188697777e-06, "loss": 2.549272003173828, "step": 1039700 }, { "epoch": 1.254657528833255, "learning_rate": 5.841302353230039e-06, "loss": 2.574932861328125, "step": 1039800 }, { "epoch": 1.2547781921557377, "learning_rate": 5.8408985177623e-06, "loss": 2.5745065307617185, "step": 1039900 }, { "epoch": 1.2548988554782206, "learning_rate": 5.840494682294562e-06, "loss": 2.56103515625, "step": 1040000 }, { "epoch": 1.2550195188007032, "learning_rate": 5.840090846826822e-06, "loss": 2.579889221191406, "step": 1040100 }, { "epoch": 1.2551401821231858, "learning_rate": 5.839687011359084e-06, "loss": 2.579327392578125, "step": 1040200 }, { "epoch": 1.2552608454456684, "learning_rate": 5.839283175891346e-06, "loss": 2.5527342224121092, "step": 1040300 }, { "epoch": 1.255381508768151, "learning_rate": 5.838879340423608e-06, "loss": 2.596138916015625, "step": 1040400 }, { "epoch": 1.2555021720906339, "learning_rate": 5.838475504955869e-06, "loss": 2.5911737060546876, "step": 1040500 }, { "epoch": 1.2556228354131165, "learning_rate": 5.838071669488131e-06, "loss": 2.5611236572265623, "step": 1040600 }, { "epoch": 1.2557434987355993, "learning_rate": 5.837667834020393e-06, "loss": 2.566156311035156, "step": 1040700 }, { "epoch": 1.255864162058082, "learning_rate": 5.837263998552654e-06, "loss": 2.5952987670898438, "step": 1040800 }, { "epoch": 1.2559848253805646, "learning_rate": 5.8368601630849155e-06, "loss": 2.551419525146484, "step": 1040900 }, { "epoch": 1.2561054887030472, "learning_rate": 5.8364563276171774e-06, "loss": 2.572667236328125, "step": 1041000 }, { "epoch": 1.25622615202553, "learning_rate": 5.836052492149439e-06, "loss": 2.572947692871094, "step": 1041100 }, { "epoch": 1.2563468153480126, "learning_rate": 5.8356486566817006e-06, "loss": 2.5575129699707033, "step": 1041200 }, { "epoch": 1.2564674786704952, "learning_rate": 5.8352448212139625e-06, "loss": 2.5748681640625, "step": 1041300 }, { "epoch": 1.256588141992978, "learning_rate": 5.834840985746224e-06, "loss": 2.560294494628906, "step": 1041400 }, { "epoch": 1.2567088053154607, "learning_rate": 5.834437150278486e-06, "loss": 2.55714599609375, "step": 1041500 }, { "epoch": 1.2568294686379433, "learning_rate": 5.834033314810748e-06, "loss": 2.57648681640625, "step": 1041600 }, { "epoch": 1.256950131960426, "learning_rate": 5.833629479343008e-06, "loss": 2.5673541259765624, "step": 1041700 }, { "epoch": 1.2570707952829088, "learning_rate": 5.83322564387527e-06, "loss": 2.568960876464844, "step": 1041800 }, { "epoch": 1.2571914586053914, "learning_rate": 5.832821808407532e-06, "loss": 2.5853561401367187, "step": 1041900 }, { "epoch": 1.2573121219278742, "learning_rate": 5.832417972939793e-06, "loss": 2.5669482421875, "step": 1042000 }, { "epoch": 1.2574327852503568, "learning_rate": 5.832014137472055e-06, "loss": 2.5595216369628906, "step": 1042100 }, { "epoch": 1.2575534485728395, "learning_rate": 5.831610302004317e-06, "loss": 2.5805340576171876, "step": 1042200 }, { "epoch": 1.257674111895322, "learning_rate": 5.831206466536579e-06, "loss": 2.5711489868164064, "step": 1042300 }, { "epoch": 1.257794775217805, "learning_rate": 5.83080263106884e-06, "loss": 2.5572767639160157, "step": 1042400 }, { "epoch": 1.2579154385402875, "learning_rate": 5.830398795601101e-06, "loss": 2.5785198974609376, "step": 1042500 }, { "epoch": 1.2580361018627702, "learning_rate": 5.829994960133362e-06, "loss": 2.5753274536132813, "step": 1042600 }, { "epoch": 1.258156765185253, "learning_rate": 5.829591124665624e-06, "loss": 2.5832473754882814, "step": 1042700 }, { "epoch": 1.2582774285077356, "learning_rate": 5.829187289197886e-06, "loss": 2.599949951171875, "step": 1042800 }, { "epoch": 1.2583980918302182, "learning_rate": 5.828783453730148e-06, "loss": 2.5667071533203125, "step": 1042900 }, { "epoch": 1.2585187551527008, "learning_rate": 5.8283796182624095e-06, "loss": 2.578252258300781, "step": 1043000 }, { "epoch": 1.2586394184751837, "learning_rate": 5.8279757827946715e-06, "loss": 2.5676617431640625, "step": 1043100 }, { "epoch": 1.2587600817976663, "learning_rate": 5.8275719473269334e-06, "loss": 2.5668255615234377, "step": 1043200 }, { "epoch": 1.258880745120149, "learning_rate": 5.827168111859194e-06, "loss": 2.5734417724609373, "step": 1043300 }, { "epoch": 1.2590014084426318, "learning_rate": 5.826764276391456e-06, "loss": 2.58758544921875, "step": 1043400 }, { "epoch": 1.2591220717651144, "learning_rate": 5.826360440923718e-06, "loss": 2.5515184020996093, "step": 1043500 }, { "epoch": 1.259242735087597, "learning_rate": 5.825956605455979e-06, "loss": 2.5863912963867186, "step": 1043600 }, { "epoch": 1.2593633984100796, "learning_rate": 5.825552769988241e-06, "loss": 2.602530517578125, "step": 1043700 }, { "epoch": 1.2594840617325624, "learning_rate": 5.825148934520503e-06, "loss": 2.56224609375, "step": 1043800 }, { "epoch": 1.259604725055045, "learning_rate": 5.824745099052764e-06, "loss": 2.566282958984375, "step": 1043900 }, { "epoch": 1.259725388377528, "learning_rate": 5.824341263585026e-06, "loss": 2.5586337280273437, "step": 1044000 }, { "epoch": 1.2598460517000105, "learning_rate": 5.823937428117287e-06, "loss": 2.5770416259765625, "step": 1044100 }, { "epoch": 1.2599667150224931, "learning_rate": 5.823533592649548e-06, "loss": 2.5624826049804685, "step": 1044200 }, { "epoch": 1.2600873783449758, "learning_rate": 5.82312975718181e-06, "loss": 2.5693930053710936, "step": 1044300 }, { "epoch": 1.2602080416674586, "learning_rate": 5.822725921714072e-06, "loss": 2.559861145019531, "step": 1044400 }, { "epoch": 1.2603287049899412, "learning_rate": 5.822322086246333e-06, "loss": 2.5824551391601562, "step": 1044500 }, { "epoch": 1.2604493683124238, "learning_rate": 5.821918250778595e-06, "loss": 2.5706631469726564, "step": 1044600 }, { "epoch": 1.2605700316349067, "learning_rate": 5.821514415310857e-06, "loss": 2.5882855224609376, "step": 1044700 }, { "epoch": 1.2606906949573893, "learning_rate": 5.821110579843119e-06, "loss": 2.5681967163085937, "step": 1044800 }, { "epoch": 1.260811358279872, "learning_rate": 5.82070674437538e-06, "loss": 2.582435302734375, "step": 1044900 }, { "epoch": 1.2609320216023545, "learning_rate": 5.8203029089076415e-06, "loss": 2.563717956542969, "step": 1045000 }, { "epoch": 1.2610526849248374, "learning_rate": 5.819899073439903e-06, "loss": 2.580516662597656, "step": 1045100 }, { "epoch": 1.26117334824732, "learning_rate": 5.819495237972165e-06, "loss": 2.5960311889648438, "step": 1045200 }, { "epoch": 1.2612940115698028, "learning_rate": 5.819091402504427e-06, "loss": 2.5681396484375, "step": 1045300 }, { "epoch": 1.2614146748922854, "learning_rate": 5.818687567036689e-06, "loss": 2.594945068359375, "step": 1045400 }, { "epoch": 1.261535338214768, "learning_rate": 5.81828373156895e-06, "loss": 2.5506358337402344, "step": 1045500 }, { "epoch": 1.2616560015372507, "learning_rate": 5.817879896101212e-06, "loss": 2.567978820800781, "step": 1045600 }, { "epoch": 1.2617766648597333, "learning_rate": 5.817476060633474e-06, "loss": 2.5766732788085935, "step": 1045700 }, { "epoch": 1.2618973281822161, "learning_rate": 5.817072225165734e-06, "loss": 2.5903799438476565, "step": 1045800 }, { "epoch": 1.2620179915046987, "learning_rate": 5.816668389697996e-06, "loss": 2.5868280029296873, "step": 1045900 }, { "epoch": 1.2621386548271816, "learning_rate": 5.816264554230258e-06, "loss": 2.575748291015625, "step": 1046000 }, { "epoch": 1.2622593181496642, "learning_rate": 5.815860718762519e-06, "loss": 2.570953369140625, "step": 1046100 }, { "epoch": 1.2623799814721468, "learning_rate": 5.815456883294781e-06, "loss": 2.5654083251953126, "step": 1046200 }, { "epoch": 1.2625006447946294, "learning_rate": 5.815053047827043e-06, "loss": 2.5715380859375, "step": 1046300 }, { "epoch": 1.2626213081171123, "learning_rate": 5.814649212359304e-06, "loss": 2.5648822021484374, "step": 1046400 }, { "epoch": 1.2627419714395949, "learning_rate": 5.814245376891566e-06, "loss": 2.6002157592773436, "step": 1046500 }, { "epoch": 1.2628626347620775, "learning_rate": 5.813841541423827e-06, "loss": 2.572633056640625, "step": 1046600 }, { "epoch": 1.2629832980845603, "learning_rate": 5.813437705956088e-06, "loss": 2.5572698974609374, "step": 1046700 }, { "epoch": 1.263103961407043, "learning_rate": 5.81303387048835e-06, "loss": 2.6045068359375, "step": 1046800 }, { "epoch": 1.2632246247295256, "learning_rate": 5.812630035020612e-06, "loss": 2.5719094848632813, "step": 1046900 }, { "epoch": 1.2633452880520082, "learning_rate": 5.8122261995528735e-06, "loss": 2.5525851440429688, "step": 1047000 }, { "epoch": 1.263465951374491, "learning_rate": 5.8118223640851355e-06, "loss": 2.5376155090332033, "step": 1047100 }, { "epoch": 1.2635866146969736, "learning_rate": 5.8114185286173975e-06, "loss": 2.5826641845703127, "step": 1047200 }, { "epoch": 1.2637072780194565, "learning_rate": 5.8110146931496595e-06, "loss": 2.5798080444335936, "step": 1047300 }, { "epoch": 1.263827941341939, "learning_rate": 5.81061085768192e-06, "loss": 2.570467529296875, "step": 1047400 }, { "epoch": 1.2639486046644217, "learning_rate": 5.810207022214182e-06, "loss": 2.5662887573242186, "step": 1047500 }, { "epoch": 1.2640692679869043, "learning_rate": 5.809803186746443e-06, "loss": 2.565897216796875, "step": 1047600 }, { "epoch": 1.2641899313093872, "learning_rate": 5.809399351278705e-06, "loss": 2.5679266357421877, "step": 1047700 }, { "epoch": 1.2643105946318698, "learning_rate": 5.808995515810967e-06, "loss": 2.5770849609375, "step": 1047800 }, { "epoch": 1.2644312579543524, "learning_rate": 5.808591680343229e-06, "loss": 2.5737969970703123, "step": 1047900 }, { "epoch": 1.2645519212768352, "learning_rate": 5.80818784487549e-06, "loss": 2.5527923583984373, "step": 1048000 }, { "epoch": 1.2646725845993179, "learning_rate": 5.807784009407752e-06, "loss": 2.55347900390625, "step": 1048100 }, { "epoch": 1.2647932479218005, "learning_rate": 5.807380173940012e-06, "loss": 2.5807199096679687, "step": 1048200 }, { "epoch": 1.264913911244283, "learning_rate": 5.806976338472274e-06, "loss": 2.5715792846679686, "step": 1048300 }, { "epoch": 1.265034574566766, "learning_rate": 5.806572503004536e-06, "loss": 2.5426239013671874, "step": 1048400 }, { "epoch": 1.2651552378892486, "learning_rate": 5.806168667536798e-06, "loss": 2.5632785034179686, "step": 1048500 }, { "epoch": 1.2652759012117312, "learning_rate": 5.805764832069059e-06, "loss": 2.5482701110839843, "step": 1048600 }, { "epoch": 1.265396564534214, "learning_rate": 5.805360996601321e-06, "loss": 2.5684127807617188, "step": 1048700 }, { "epoch": 1.2655172278566966, "learning_rate": 5.804957161133583e-06, "loss": 2.5684884643554686, "step": 1048800 }, { "epoch": 1.2656378911791792, "learning_rate": 5.804553325665845e-06, "loss": 2.566876220703125, "step": 1048900 }, { "epoch": 1.2657585545016619, "learning_rate": 5.8041494901981055e-06, "loss": 2.5852456665039063, "step": 1049000 }, { "epoch": 1.2658792178241447, "learning_rate": 5.8037456547303675e-06, "loss": 2.588509826660156, "step": 1049100 }, { "epoch": 1.2659998811466273, "learning_rate": 5.803341819262629e-06, "loss": 2.567655029296875, "step": 1049200 }, { "epoch": 1.2661205444691102, "learning_rate": 5.802937983794891e-06, "loss": 2.5710595703125, "step": 1049300 }, { "epoch": 1.2662412077915928, "learning_rate": 5.802534148327153e-06, "loss": 2.5742071533203124, "step": 1049400 }, { "epoch": 1.2663618711140754, "learning_rate": 5.802130312859415e-06, "loss": 2.5638412475585937, "step": 1049500 }, { "epoch": 1.266482534436558, "learning_rate": 5.801726477391676e-06, "loss": 2.5666043090820314, "step": 1049600 }, { "epoch": 1.2666031977590408, "learning_rate": 5.801322641923938e-06, "loss": 2.5615045166015626, "step": 1049700 }, { "epoch": 1.2667238610815235, "learning_rate": 5.800918806456198e-06, "loss": 2.5477508544921874, "step": 1049800 }, { "epoch": 1.266844524404006, "learning_rate": 5.80051497098846e-06, "loss": 2.5550091552734373, "step": 1049900 }, { "epoch": 1.266965187726489, "learning_rate": 5.800111135520722e-06, "loss": 2.5598252868652343, "step": 1050000 }, { "epoch": 1.2670858510489715, "learning_rate": 5.799707300052984e-06, "loss": 2.5904910278320314, "step": 1050100 }, { "epoch": 1.2672065143714542, "learning_rate": 5.799303464585245e-06, "loss": 2.579670715332031, "step": 1050200 }, { "epoch": 1.2673271776939368, "learning_rate": 5.798899629117507e-06, "loss": 2.567712707519531, "step": 1050300 }, { "epoch": 1.2674478410164196, "learning_rate": 5.798495793649769e-06, "loss": 2.535228424072266, "step": 1050400 }, { "epoch": 1.2675685043389022, "learning_rate": 5.79809195818203e-06, "loss": 2.53361083984375, "step": 1050500 }, { "epoch": 1.267689167661385, "learning_rate": 5.797688122714292e-06, "loss": 2.555097808837891, "step": 1050600 }, { "epoch": 1.2678098309838677, "learning_rate": 5.797284287246553e-06, "loss": 2.61226806640625, "step": 1050700 }, { "epoch": 1.2679304943063503, "learning_rate": 5.7968804517788145e-06, "loss": 2.557561492919922, "step": 1050800 }, { "epoch": 1.268051157628833, "learning_rate": 5.7964766163110764e-06, "loss": 2.572508544921875, "step": 1050900 }, { "epoch": 1.2681718209513155, "learning_rate": 5.796072780843338e-06, "loss": 2.5503976440429685, "step": 1051000 }, { "epoch": 1.2682924842737984, "learning_rate": 5.7956689453755996e-06, "loss": 2.577437438964844, "step": 1051100 }, { "epoch": 1.268413147596281, "learning_rate": 5.7952651099078615e-06, "loss": 2.585007629394531, "step": 1051200 }, { "epoch": 1.2685338109187638, "learning_rate": 5.7948612744401235e-06, "loss": 2.5570498657226564, "step": 1051300 }, { "epoch": 1.2686544742412464, "learning_rate": 5.7944574389723855e-06, "loss": 2.549856414794922, "step": 1051400 }, { "epoch": 1.268775137563729, "learning_rate": 5.794053603504646e-06, "loss": 2.5612060546875, "step": 1051500 }, { "epoch": 1.2688958008862117, "learning_rate": 5.793649768036908e-06, "loss": 2.5823623657226564, "step": 1051600 }, { "epoch": 1.2690164642086945, "learning_rate": 5.793245932569169e-06, "loss": 2.564066162109375, "step": 1051700 }, { "epoch": 1.2691371275311771, "learning_rate": 5.792842097101431e-06, "loss": 2.5370460510253907, "step": 1051800 }, { "epoch": 1.2692577908536598, "learning_rate": 5.792438261633693e-06, "loss": 2.5731805419921874, "step": 1051900 }, { "epoch": 1.2693784541761426, "learning_rate": 5.792034426165955e-06, "loss": 2.569635925292969, "step": 1052000 }, { "epoch": 1.2694991174986252, "learning_rate": 5.791630590698216e-06, "loss": 2.5796600341796876, "step": 1052100 }, { "epoch": 1.2696197808211078, "learning_rate": 5.791226755230478e-06, "loss": 2.5479315185546874, "step": 1052200 }, { "epoch": 1.2697404441435904, "learning_rate": 5.790822919762738e-06, "loss": 2.5370407104492188, "step": 1052300 }, { "epoch": 1.2698611074660733, "learning_rate": 5.790419084295e-06, "loss": 2.57031982421875, "step": 1052400 }, { "epoch": 1.269981770788556, "learning_rate": 5.790015248827262e-06, "loss": 2.5549562072753904, "step": 1052500 }, { "epoch": 1.2701024341110387, "learning_rate": 5.789611413359524e-06, "loss": 2.556454772949219, "step": 1052600 }, { "epoch": 1.2702230974335214, "learning_rate": 5.789207577891785e-06, "loss": 2.594930419921875, "step": 1052700 }, { "epoch": 1.270343760756004, "learning_rate": 5.788803742424047e-06, "loss": 2.568536376953125, "step": 1052800 }, { "epoch": 1.2704644240784866, "learning_rate": 5.788399906956309e-06, "loss": 2.5380924987792968, "step": 1052900 }, { "epoch": 1.2705850874009694, "learning_rate": 5.7879960714885704e-06, "loss": 2.569491271972656, "step": 1053000 }, { "epoch": 1.270705750723452, "learning_rate": 5.787592236020832e-06, "loss": 2.5981890869140627, "step": 1053100 }, { "epoch": 1.2708264140459347, "learning_rate": 5.7871884005530936e-06, "loss": 2.5724761962890623, "step": 1053200 }, { "epoch": 1.2709470773684175, "learning_rate": 5.786784565085355e-06, "loss": 2.585411376953125, "step": 1053300 }, { "epoch": 1.2710677406909001, "learning_rate": 5.786380729617617e-06, "loss": 2.569372253417969, "step": 1053400 }, { "epoch": 1.2711884040133827, "learning_rate": 5.785976894149879e-06, "loss": 2.568519287109375, "step": 1053500 }, { "epoch": 1.2713090673358654, "learning_rate": 5.78557305868214e-06, "loss": 2.5698727416992186, "step": 1053600 }, { "epoch": 1.2714297306583482, "learning_rate": 5.785169223214402e-06, "loss": 2.573182373046875, "step": 1053700 }, { "epoch": 1.2715503939808308, "learning_rate": 5.784765387746664e-06, "loss": 2.5712936401367186, "step": 1053800 }, { "epoch": 1.2716710573033134, "learning_rate": 5.784361552278924e-06, "loss": 2.56056396484375, "step": 1053900 }, { "epoch": 1.2717917206257963, "learning_rate": 5.783957716811186e-06, "loss": 2.5686865234375, "step": 1054000 }, { "epoch": 1.2719123839482789, "learning_rate": 5.783553881343448e-06, "loss": 2.56764892578125, "step": 1054100 }, { "epoch": 1.2720330472707615, "learning_rate": 5.783150045875709e-06, "loss": 2.569968566894531, "step": 1054200 }, { "epoch": 1.2721537105932441, "learning_rate": 5.782746210407971e-06, "loss": 2.5856781005859375, "step": 1054300 }, { "epoch": 1.272274373915727, "learning_rate": 5.782342374940233e-06, "loss": 2.59735595703125, "step": 1054400 }, { "epoch": 1.2723950372382096, "learning_rate": 5.781938539472495e-06, "loss": 2.5440476989746093, "step": 1054500 }, { "epoch": 1.2725157005606924, "learning_rate": 5.781534704004756e-06, "loss": 2.550745849609375, "step": 1054600 }, { "epoch": 1.272636363883175, "learning_rate": 5.781130868537017e-06, "loss": 2.5621047973632813, "step": 1054700 }, { "epoch": 1.2727570272056576, "learning_rate": 5.7807270330692785e-06, "loss": 2.536368408203125, "step": 1054800 }, { "epoch": 1.2728776905281403, "learning_rate": 5.7803231976015405e-06, "loss": 2.556578826904297, "step": 1054900 }, { "epoch": 1.272998353850623, "learning_rate": 5.7799193621338025e-06, "loss": 2.5786892700195314, "step": 1055000 }, { "epoch": 1.2731190171731057, "learning_rate": 5.7795155266660645e-06, "loss": 2.557273406982422, "step": 1055100 }, { "epoch": 1.2732396804955883, "learning_rate": 5.779111691198326e-06, "loss": 2.5400360107421873, "step": 1055200 }, { "epoch": 1.2733603438180712, "learning_rate": 5.7787078557305876e-06, "loss": 2.5722689819335938, "step": 1055300 }, { "epoch": 1.2734810071405538, "learning_rate": 5.7783040202628496e-06, "loss": 2.56533447265625, "step": 1055400 }, { "epoch": 1.2736016704630364, "learning_rate": 5.777900184795111e-06, "loss": 2.5580982971191406, "step": 1055500 }, { "epoch": 1.273722333785519, "learning_rate": 5.777496349327372e-06, "loss": 2.561065368652344, "step": 1055600 }, { "epoch": 1.2738429971080019, "learning_rate": 5.777092513859634e-06, "loss": 2.5576995849609374, "step": 1055700 }, { "epoch": 1.2739636604304845, "learning_rate": 5.776688678391895e-06, "loss": 2.5469732666015625, "step": 1055800 }, { "epoch": 1.2740843237529673, "learning_rate": 5.776284842924157e-06, "loss": 2.5799710083007814, "step": 1055900 }, { "epoch": 1.27420498707545, "learning_rate": 5.775881007456419e-06, "loss": 2.559992218017578, "step": 1056000 }, { "epoch": 1.2743256503979326, "learning_rate": 5.77547717198868e-06, "loss": 2.5662469482421875, "step": 1056100 }, { "epoch": 1.2744463137204152, "learning_rate": 5.775073336520942e-06, "loss": 2.571158752441406, "step": 1056200 }, { "epoch": 1.2745669770428978, "learning_rate": 5.774669501053204e-06, "loss": 2.6025189208984374, "step": 1056300 }, { "epoch": 1.2746876403653806, "learning_rate": 5.774265665585464e-06, "loss": 2.5607113647460937, "step": 1056400 }, { "epoch": 1.2748083036878632, "learning_rate": 5.773861830117726e-06, "loss": 2.5779083251953123, "step": 1056500 }, { "epoch": 1.274928967010346, "learning_rate": 5.773457994649988e-06, "loss": 2.5684283447265623, "step": 1056600 }, { "epoch": 1.2750496303328287, "learning_rate": 5.773054159182249e-06, "loss": 2.5857723999023436, "step": 1056700 }, { "epoch": 1.2751702936553113, "learning_rate": 5.772650323714511e-06, "loss": 2.5965121459960936, "step": 1056800 }, { "epoch": 1.275290956977794, "learning_rate": 5.772246488246773e-06, "loss": 2.564411315917969, "step": 1056900 }, { "epoch": 1.2754116203002768, "learning_rate": 5.771842652779035e-06, "loss": 2.5603018188476563, "step": 1057000 }, { "epoch": 1.2755322836227594, "learning_rate": 5.7714388173112965e-06, "loss": 2.568869934082031, "step": 1057100 }, { "epoch": 1.275652946945242, "learning_rate": 5.771034981843558e-06, "loss": 2.563714599609375, "step": 1057200 }, { "epoch": 1.2757736102677248, "learning_rate": 5.770631146375819e-06, "loss": 2.600260925292969, "step": 1057300 }, { "epoch": 1.2758942735902075, "learning_rate": 5.770227310908081e-06, "loss": 2.5845391845703123, "step": 1057400 }, { "epoch": 1.27601493691269, "learning_rate": 5.769823475440343e-06, "loss": 2.612668151855469, "step": 1057500 }, { "epoch": 1.2761356002351727, "learning_rate": 5.769419639972605e-06, "loss": 2.5550888061523436, "step": 1057600 }, { "epoch": 1.2762562635576555, "learning_rate": 5.769015804504866e-06, "loss": 2.5805123901367186, "step": 1057700 }, { "epoch": 1.2763769268801382, "learning_rate": 5.768611969037128e-06, "loss": 2.5468353271484374, "step": 1057800 }, { "epoch": 1.276497590202621, "learning_rate": 5.76820813356939e-06, "loss": 2.560993957519531, "step": 1057900 }, { "epoch": 1.2766182535251036, "learning_rate": 5.76780429810165e-06, "loss": 2.5818890380859374, "step": 1058000 }, { "epoch": 1.2767389168475862, "learning_rate": 5.767400462633912e-06, "loss": 2.5716351318359374, "step": 1058100 }, { "epoch": 1.2768595801700688, "learning_rate": 5.766996627166174e-06, "loss": 2.56001953125, "step": 1058200 }, { "epoch": 1.2769802434925517, "learning_rate": 5.766592791698435e-06, "loss": 2.5451560974121095, "step": 1058300 }, { "epoch": 1.2771009068150343, "learning_rate": 5.766188956230697e-06, "loss": 2.557428283691406, "step": 1058400 }, { "epoch": 1.277221570137517, "learning_rate": 5.765785120762959e-06, "loss": 2.5728353881835937, "step": 1058500 }, { "epoch": 1.2773422334599998, "learning_rate": 5.76538128529522e-06, "loss": 2.5648834228515627, "step": 1058600 }, { "epoch": 1.2774628967824824, "learning_rate": 5.764977449827482e-06, "loss": 2.550722198486328, "step": 1058700 }, { "epoch": 1.277583560104965, "learning_rate": 5.764573614359743e-06, "loss": 2.5790328979492188, "step": 1058800 }, { "epoch": 1.2777042234274476, "learning_rate": 5.7641697788920045e-06, "loss": 2.59083984375, "step": 1058900 }, { "epoch": 1.2778248867499304, "learning_rate": 5.7637659434242665e-06, "loss": 2.5551251220703124, "step": 1059000 }, { "epoch": 1.277945550072413, "learning_rate": 5.7633621079565285e-06, "loss": 2.557292022705078, "step": 1059100 }, { "epoch": 1.2780662133948957, "learning_rate": 5.76295827248879e-06, "loss": 2.5758602905273436, "step": 1059200 }, { "epoch": 1.2781868767173785, "learning_rate": 5.762554437021052e-06, "loss": 2.5541937255859377, "step": 1059300 }, { "epoch": 1.2783075400398611, "learning_rate": 5.762150601553314e-06, "loss": 2.569230041503906, "step": 1059400 }, { "epoch": 1.2784282033623438, "learning_rate": 5.761746766085576e-06, "loss": 2.5681753540039063, "step": 1059500 }, { "epoch": 1.2785488666848264, "learning_rate": 5.761342930617836e-06, "loss": 2.5560311889648437, "step": 1059600 }, { "epoch": 1.2786695300073092, "learning_rate": 5.760939095150098e-06, "loss": 2.5376213073730467, "step": 1059700 }, { "epoch": 1.2787901933297918, "learning_rate": 5.760535259682359e-06, "loss": 2.5720645141601564, "step": 1059800 }, { "epoch": 1.2789108566522747, "learning_rate": 5.760131424214621e-06, "loss": 2.5809100341796873, "step": 1059900 }, { "epoch": 1.2790315199747573, "learning_rate": 5.759727588746883e-06, "loss": 2.5565611267089845, "step": 1060000 }, { "epoch": 1.27915218329724, "learning_rate": 5.759323753279145e-06, "loss": 2.5783151245117186, "step": 1060100 }, { "epoch": 1.2792728466197225, "learning_rate": 5.758919917811406e-06, "loss": 2.5846847534179687, "step": 1060200 }, { "epoch": 1.2793935099422054, "learning_rate": 5.758516082343668e-06, "loss": 2.5525732421875, "step": 1060300 }, { "epoch": 1.279514173264688, "learning_rate": 5.75811224687593e-06, "loss": 2.566367492675781, "step": 1060400 }, { "epoch": 1.2796348365871706, "learning_rate": 5.75770841140819e-06, "loss": 2.556011047363281, "step": 1060500 }, { "epoch": 1.2797554999096534, "learning_rate": 5.757304575940452e-06, "loss": 2.5716131591796874, "step": 1060600 }, { "epoch": 1.279876163232136, "learning_rate": 5.756900740472714e-06, "loss": 2.5614089965820312, "step": 1060700 }, { "epoch": 1.2799968265546187, "learning_rate": 5.7564969050049754e-06, "loss": 2.5550132751464845, "step": 1060800 }, { "epoch": 1.2801174898771013, "learning_rate": 5.756093069537237e-06, "loss": 2.5752438354492186, "step": 1060900 }, { "epoch": 1.2802381531995841, "learning_rate": 5.755689234069499e-06, "loss": 2.5896044921875, "step": 1061000 }, { "epoch": 1.2803588165220667, "learning_rate": 5.7552853986017605e-06, "loss": 2.5766567993164062, "step": 1061100 }, { "epoch": 1.2804794798445496, "learning_rate": 5.7548815631340225e-06, "loss": 2.572611999511719, "step": 1061200 }, { "epoch": 1.2806001431670322, "learning_rate": 5.754477727666284e-06, "loss": 2.552986602783203, "step": 1061300 }, { "epoch": 1.2807208064895148, "learning_rate": 5.754073892198545e-06, "loss": 2.54095458984375, "step": 1061400 }, { "epoch": 1.2808414698119974, "learning_rate": 5.753670056730807e-06, "loss": 2.5676239013671873, "step": 1061500 }, { "epoch": 1.28096213313448, "learning_rate": 5.753266221263069e-06, "loss": 2.584542236328125, "step": 1061600 }, { "epoch": 1.2810827964569629, "learning_rate": 5.75286238579533e-06, "loss": 2.5452488708496093, "step": 1061700 }, { "epoch": 1.2812034597794455, "learning_rate": 5.752458550327592e-06, "loss": 2.5710400390625, "step": 1061800 }, { "epoch": 1.2813241231019283, "learning_rate": 5.752054714859854e-06, "loss": 2.5766561889648436, "step": 1061900 }, { "epoch": 1.281444786424411, "learning_rate": 5.751650879392116e-06, "loss": 2.5691851806640624, "step": 1062000 }, { "epoch": 1.2815654497468936, "learning_rate": 5.751247043924376e-06, "loss": 2.5588929748535154, "step": 1062100 }, { "epoch": 1.2816861130693762, "learning_rate": 5.750843208456638e-06, "loss": 2.572515563964844, "step": 1062200 }, { "epoch": 1.281806776391859, "learning_rate": 5.750439372988899e-06, "loss": 2.5831304931640626, "step": 1062300 }, { "epoch": 1.2819274397143416, "learning_rate": 5.750035537521161e-06, "loss": 2.56316650390625, "step": 1062400 }, { "epoch": 1.2820481030368243, "learning_rate": 5.749631702053423e-06, "loss": 2.5732247924804685, "step": 1062500 }, { "epoch": 1.282168766359307, "learning_rate": 5.749227866585685e-06, "loss": 2.578920593261719, "step": 1062600 }, { "epoch": 1.2822894296817897, "learning_rate": 5.748824031117946e-06, "loss": 2.5488459777832033, "step": 1062700 }, { "epoch": 1.2824100930042723, "learning_rate": 5.748420195650208e-06, "loss": 2.531918487548828, "step": 1062800 }, { "epoch": 1.282530756326755, "learning_rate": 5.748016360182469e-06, "loss": 2.5452000427246095, "step": 1062900 }, { "epoch": 1.2826514196492378, "learning_rate": 5.7476125247147306e-06, "loss": 2.590989074707031, "step": 1063000 }, { "epoch": 1.2827720829717204, "learning_rate": 5.7472086892469926e-06, "loss": 2.5761761474609375, "step": 1063100 }, { "epoch": 1.2828927462942032, "learning_rate": 5.7468048537792545e-06, "loss": 2.5633584594726564, "step": 1063200 }, { "epoch": 1.2830134096166859, "learning_rate": 5.746401018311516e-06, "loss": 2.5879742431640627, "step": 1063300 }, { "epoch": 1.2831340729391685, "learning_rate": 5.745997182843778e-06, "loss": 2.5834161376953126, "step": 1063400 }, { "epoch": 1.283254736261651, "learning_rate": 5.74559334737604e-06, "loss": 2.5686849975585937, "step": 1063500 }, { "epoch": 1.283375399584134, "learning_rate": 5.745189511908302e-06, "loss": 2.5474403381347654, "step": 1063600 }, { "epoch": 1.2834960629066166, "learning_rate": 5.744785676440562e-06, "loss": 2.5628985595703124, "step": 1063700 }, { "epoch": 1.2836167262290992, "learning_rate": 5.744381840972824e-06, "loss": 2.5808154296875, "step": 1063800 }, { "epoch": 1.283737389551582, "learning_rate": 5.743978005505085e-06, "loss": 2.5481298828125, "step": 1063900 }, { "epoch": 1.2838580528740646, "learning_rate": 5.743574170037347e-06, "loss": 2.550398406982422, "step": 1064000 }, { "epoch": 1.2839787161965472, "learning_rate": 5.743170334569609e-06, "loss": 2.58307373046875, "step": 1064100 }, { "epoch": 1.2840993795190299, "learning_rate": 5.742766499101871e-06, "loss": 2.558725128173828, "step": 1064200 }, { "epoch": 1.2842200428415127, "learning_rate": 5.742362663634132e-06, "loss": 2.566438903808594, "step": 1064300 }, { "epoch": 1.2843407061639953, "learning_rate": 5.741958828166394e-06, "loss": 2.5614688110351564, "step": 1064400 }, { "epoch": 1.284461369486478, "learning_rate": 5.741554992698654e-06, "loss": 2.580118408203125, "step": 1064500 }, { "epoch": 1.2845820328089608, "learning_rate": 5.741151157230916e-06, "loss": 2.518922119140625, "step": 1064600 }, { "epoch": 1.2847026961314434, "learning_rate": 5.740747321763178e-06, "loss": 2.5234242248535157, "step": 1064700 }, { "epoch": 1.284823359453926, "learning_rate": 5.74034348629544e-06, "loss": 2.554583740234375, "step": 1064800 }, { "epoch": 1.2849440227764086, "learning_rate": 5.7399396508277015e-06, "loss": 2.5418217468261717, "step": 1064900 }, { "epoch": 1.2850646860988915, "learning_rate": 5.7395358153599634e-06, "loss": 2.555255126953125, "step": 1065000 }, { "epoch": 1.285185349421374, "learning_rate": 5.7391319798922254e-06, "loss": 2.566322937011719, "step": 1065100 }, { "epoch": 1.285306012743857, "learning_rate": 5.7387281444244866e-06, "loss": 2.5675616455078125, "step": 1065200 }, { "epoch": 1.2854266760663395, "learning_rate": 5.738324308956748e-06, "loss": 2.587442626953125, "step": 1065300 }, { "epoch": 1.2855473393888222, "learning_rate": 5.73792047348901e-06, "loss": 2.5432745361328126, "step": 1065400 }, { "epoch": 1.2856680027113048, "learning_rate": 5.737516638021271e-06, "loss": 2.6105636596679687, "step": 1065500 }, { "epoch": 1.2857886660337876, "learning_rate": 5.737112802553533e-06, "loss": 2.5709567260742188, "step": 1065600 }, { "epoch": 1.2859093293562702, "learning_rate": 5.736708967085795e-06, "loss": 2.553116760253906, "step": 1065700 }, { "epoch": 1.2860299926787528, "learning_rate": 5.736305131618056e-06, "loss": 2.5733798217773436, "step": 1065800 }, { "epoch": 1.2861506560012357, "learning_rate": 5.735901296150318e-06, "loss": 2.5795733642578127, "step": 1065900 }, { "epoch": 1.2862713193237183, "learning_rate": 5.73549746068258e-06, "loss": 2.569671630859375, "step": 1066000 }, { "epoch": 1.286391982646201, "learning_rate": 5.735093625214842e-06, "loss": 2.5714996337890623, "step": 1066100 }, { "epoch": 1.2865126459686835, "learning_rate": 5.734689789747102e-06, "loss": 2.5437638854980467, "step": 1066200 }, { "epoch": 1.2866333092911664, "learning_rate": 5.734285954279364e-06, "loss": 2.5781430053710936, "step": 1066300 }, { "epoch": 1.286753972613649, "learning_rate": 5.733882118811625e-06, "loss": 2.5656924438476563, "step": 1066400 }, { "epoch": 1.2868746359361318, "learning_rate": 5.733478283343887e-06, "loss": 2.561823425292969, "step": 1066500 }, { "epoch": 1.2869952992586144, "learning_rate": 5.733074447876149e-06, "loss": 2.5484901428222657, "step": 1066600 }, { "epoch": 1.287115962581097, "learning_rate": 5.732670612408411e-06, "loss": 2.576094665527344, "step": 1066700 }, { "epoch": 1.2872366259035797, "learning_rate": 5.732266776940672e-06, "loss": 2.559752655029297, "step": 1066800 }, { "epoch": 1.2873572892260623, "learning_rate": 5.731862941472934e-06, "loss": 2.5487550354003905, "step": 1066900 }, { "epoch": 1.2874779525485451, "learning_rate": 5.731459106005195e-06, "loss": 2.5548167419433594, "step": 1067000 }, { "epoch": 1.2875986158710278, "learning_rate": 5.731055270537457e-06, "loss": 2.551944580078125, "step": 1067100 }, { "epoch": 1.2877192791935106, "learning_rate": 5.730651435069719e-06, "loss": 2.5724807739257813, "step": 1067200 }, { "epoch": 1.2878399425159932, "learning_rate": 5.7302475996019806e-06, "loss": 2.567180480957031, "step": 1067300 }, { "epoch": 1.2879606058384758, "learning_rate": 5.729843764134242e-06, "loss": 2.5373809814453123, "step": 1067400 }, { "epoch": 1.2880812691609584, "learning_rate": 5.729439928666504e-06, "loss": 2.57637451171875, "step": 1067500 }, { "epoch": 1.2882019324834413, "learning_rate": 5.729036093198766e-06, "loss": 2.5580543518066405, "step": 1067600 }, { "epoch": 1.288322595805924, "learning_rate": 5.728632257731027e-06, "loss": 2.5691632080078124, "step": 1067700 }, { "epoch": 1.2884432591284065, "learning_rate": 5.728228422263288e-06, "loss": 2.548158721923828, "step": 1067800 }, { "epoch": 1.2885639224508894, "learning_rate": 5.72782458679555e-06, "loss": 2.576643981933594, "step": 1067900 }, { "epoch": 1.288684585773372, "learning_rate": 5.727420751327811e-06, "loss": 2.5428759765625, "step": 1068000 }, { "epoch": 1.2888052490958546, "learning_rate": 5.727016915860073e-06, "loss": 2.599731140136719, "step": 1068100 }, { "epoch": 1.2889259124183372, "learning_rate": 5.726613080392335e-06, "loss": 2.556876525878906, "step": 1068200 }, { "epoch": 1.28904657574082, "learning_rate": 5.726209244924596e-06, "loss": 2.587457580566406, "step": 1068300 }, { "epoch": 1.2891672390633027, "learning_rate": 5.725805409456858e-06, "loss": 2.552674102783203, "step": 1068400 }, { "epoch": 1.2892879023857855, "learning_rate": 5.72540157398912e-06, "loss": 2.591832275390625, "step": 1068500 }, { "epoch": 1.2894085657082681, "learning_rate": 5.72499773852138e-06, "loss": 2.5634576416015626, "step": 1068600 }, { "epoch": 1.2895292290307507, "learning_rate": 5.724593903053642e-06, "loss": 2.570126647949219, "step": 1068700 }, { "epoch": 1.2896498923532334, "learning_rate": 5.724190067585904e-06, "loss": 2.560044860839844, "step": 1068800 }, { "epoch": 1.2897705556757162, "learning_rate": 5.7237862321181655e-06, "loss": 2.571834716796875, "step": 1068900 }, { "epoch": 1.2898912189981988, "learning_rate": 5.7233823966504275e-06, "loss": 2.5402340698242187, "step": 1069000 }, { "epoch": 1.2900118823206814, "learning_rate": 5.7229785611826895e-06, "loss": 2.549904479980469, "step": 1069100 }, { "epoch": 1.2901325456431643, "learning_rate": 5.7225747257149515e-06, "loss": 2.572348327636719, "step": 1069200 }, { "epoch": 1.2902532089656469, "learning_rate": 5.722170890247213e-06, "loss": 2.5435331726074217, "step": 1069300 }, { "epoch": 1.2903738722881295, "learning_rate": 5.721767054779474e-06, "loss": 2.545818176269531, "step": 1069400 }, { "epoch": 1.2904945356106121, "learning_rate": 5.721363219311735e-06, "loss": 2.547497100830078, "step": 1069500 }, { "epoch": 1.290615198933095, "learning_rate": 5.720959383843997e-06, "loss": 2.5607470703125, "step": 1069600 }, { "epoch": 1.2907358622555776, "learning_rate": 5.720555548376259e-06, "loss": 2.5784597778320313, "step": 1069700 }, { "epoch": 1.2908565255780602, "learning_rate": 5.720151712908521e-06, "loss": 2.5686798095703125, "step": 1069800 }, { "epoch": 1.290977188900543, "learning_rate": 5.719747877440782e-06, "loss": 2.543323669433594, "step": 1069900 }, { "epoch": 1.2910978522230256, "learning_rate": 5.719344041973044e-06, "loss": 2.5609805297851564, "step": 1070000 }, { "epoch": 1.2912185155455083, "learning_rate": 5.718940206505306e-06, "loss": 2.552744903564453, "step": 1070100 }, { "epoch": 1.2913391788679909, "learning_rate": 5.718536371037566e-06, "loss": 2.5709603881835936, "step": 1070200 }, { "epoch": 1.2914598421904737, "learning_rate": 5.718132535569828e-06, "loss": 2.5835577392578126, "step": 1070300 }, { "epoch": 1.2915805055129563, "learning_rate": 5.71772870010209e-06, "loss": 2.5645071411132814, "step": 1070400 }, { "epoch": 1.2917011688354392, "learning_rate": 5.717324864634351e-06, "loss": 2.5696170043945314, "step": 1070500 }, { "epoch": 1.2918218321579218, "learning_rate": 5.716921029166613e-06, "loss": 2.547554779052734, "step": 1070600 }, { "epoch": 1.2919424954804044, "learning_rate": 5.716517193698875e-06, "loss": 2.585484619140625, "step": 1070700 }, { "epoch": 1.292063158802887, "learning_rate": 5.716113358231136e-06, "loss": 2.555486297607422, "step": 1070800 }, { "epoch": 1.2921838221253699, "learning_rate": 5.715709522763398e-06, "loss": 2.57549072265625, "step": 1070900 }, { "epoch": 1.2923044854478525, "learning_rate": 5.71530568729566e-06, "loss": 2.5507638549804685, "step": 1071000 }, { "epoch": 1.292425148770335, "learning_rate": 5.714901851827921e-06, "loss": 2.5483453369140623, "step": 1071100 }, { "epoch": 1.292545812092818, "learning_rate": 5.714498016360183e-06, "loss": 2.5437164306640625, "step": 1071200 }, { "epoch": 1.2926664754153006, "learning_rate": 5.714094180892445e-06, "loss": 2.564595031738281, "step": 1071300 }, { "epoch": 1.2927871387377832, "learning_rate": 5.713690345424706e-06, "loss": 2.5612966918945315, "step": 1071400 }, { "epoch": 1.2929078020602658, "learning_rate": 5.713286509956968e-06, "loss": 2.5790475463867186, "step": 1071500 }, { "epoch": 1.2930284653827486, "learning_rate": 5.71288267448923e-06, "loss": 2.57418212890625, "step": 1071600 }, { "epoch": 1.2931491287052312, "learning_rate": 5.712478839021492e-06, "loss": 2.562730407714844, "step": 1071700 }, { "epoch": 1.293269792027714, "learning_rate": 5.712075003553753e-06, "loss": 2.5531463623046875, "step": 1071800 }, { "epoch": 1.2933904553501967, "learning_rate": 5.711671168086014e-06, "loss": 2.573019714355469, "step": 1071900 }, { "epoch": 1.2935111186726793, "learning_rate": 5.711267332618275e-06, "loss": 2.550948028564453, "step": 1072000 }, { "epoch": 1.293631781995162, "learning_rate": 5.710863497150537e-06, "loss": 2.5481849670410157, "step": 1072100 }, { "epoch": 1.2937524453176446, "learning_rate": 5.710459661682799e-06, "loss": 2.558854522705078, "step": 1072200 }, { "epoch": 1.2938731086401274, "learning_rate": 5.710055826215061e-06, "loss": 2.5768341064453124, "step": 1072300 }, { "epoch": 1.29399377196261, "learning_rate": 5.709651990747322e-06, "loss": 2.558857116699219, "step": 1072400 }, { "epoch": 1.2941144352850928, "learning_rate": 5.709248155279584e-06, "loss": 2.5751193237304686, "step": 1072500 }, { "epoch": 1.2942350986075755, "learning_rate": 5.708844319811846e-06, "loss": 2.5529911804199217, "step": 1072600 }, { "epoch": 1.294355761930058, "learning_rate": 5.7084404843441065e-06, "loss": 2.537860107421875, "step": 1072700 }, { "epoch": 1.2944764252525407, "learning_rate": 5.7080366488763684e-06, "loss": 2.5528521728515625, "step": 1072800 }, { "epoch": 1.2945970885750235, "learning_rate": 5.70763281340863e-06, "loss": 2.5616796875, "step": 1072900 }, { "epoch": 1.2947177518975062, "learning_rate": 5.7072289779408916e-06, "loss": 2.575154113769531, "step": 1073000 }, { "epoch": 1.2948384152199888, "learning_rate": 5.7068251424731535e-06, "loss": 2.5478135681152345, "step": 1073100 }, { "epoch": 1.2949590785424716, "learning_rate": 5.7064213070054155e-06, "loss": 2.5480221557617186, "step": 1073200 }, { "epoch": 1.2950797418649542, "learning_rate": 5.706017471537677e-06, "loss": 2.5483644104003904, "step": 1073300 }, { "epoch": 1.2952004051874368, "learning_rate": 5.705613636069939e-06, "loss": 2.5572575378417968, "step": 1073400 }, { "epoch": 1.2953210685099195, "learning_rate": 5.7052098006022e-06, "loss": 2.57109375, "step": 1073500 }, { "epoch": 1.2954417318324023, "learning_rate": 5.704805965134461e-06, "loss": 2.544468994140625, "step": 1073600 }, { "epoch": 1.295562395154885, "learning_rate": 5.704402129666723e-06, "loss": 2.5571324157714845, "step": 1073700 }, { "epoch": 1.2956830584773678, "learning_rate": 5.703998294198985e-06, "loss": 2.562124938964844, "step": 1073800 }, { "epoch": 1.2958037217998504, "learning_rate": 5.703594458731246e-06, "loss": 2.5403550720214843, "step": 1073900 }, { "epoch": 1.295924385122333, "learning_rate": 5.703190623263508e-06, "loss": 2.5583157348632812, "step": 1074000 }, { "epoch": 1.2960450484448156, "learning_rate": 5.70278678779577e-06, "loss": 2.557883605957031, "step": 1074100 }, { "epoch": 1.2961657117672984, "learning_rate": 5.702382952328032e-06, "loss": 2.580538330078125, "step": 1074200 }, { "epoch": 1.296286375089781, "learning_rate": 5.701979116860292e-06, "loss": 2.5554876708984375, "step": 1074300 }, { "epoch": 1.2964070384122637, "learning_rate": 5.701575281392554e-06, "loss": 2.5284158325195314, "step": 1074400 }, { "epoch": 1.2965277017347465, "learning_rate": 5.701171445924815e-06, "loss": 2.5654351806640623, "step": 1074500 }, { "epoch": 1.2966483650572291, "learning_rate": 5.700767610457077e-06, "loss": 2.529309844970703, "step": 1074600 }, { "epoch": 1.2967690283797118, "learning_rate": 5.700363774989339e-06, "loss": 2.5478102111816407, "step": 1074700 }, { "epoch": 1.2968896917021944, "learning_rate": 5.699959939521601e-06, "loss": 2.5755880737304686, "step": 1074800 }, { "epoch": 1.2970103550246772, "learning_rate": 5.6995561040538624e-06, "loss": 2.5428585815429687, "step": 1074900 }, { "epoch": 1.2971310183471598, "learning_rate": 5.699152268586124e-06, "loss": 2.5693829345703123, "step": 1075000 }, { "epoch": 1.2972516816696427, "learning_rate": 5.698748433118385e-06, "loss": 2.5984619140625, "step": 1075100 }, { "epoch": 1.2973723449921253, "learning_rate": 5.698344597650647e-06, "loss": 2.5767330932617187, "step": 1075200 }, { "epoch": 1.297493008314608, "learning_rate": 5.697940762182909e-06, "loss": 2.551782531738281, "step": 1075300 }, { "epoch": 1.2976136716370905, "learning_rate": 5.697536926715171e-06, "loss": 2.5466358947753904, "step": 1075400 }, { "epoch": 1.2977343349595731, "learning_rate": 5.697133091247432e-06, "loss": 2.5726046752929688, "step": 1075500 }, { "epoch": 1.297854998282056, "learning_rate": 5.696729255779694e-06, "loss": 2.555053405761719, "step": 1075600 }, { "epoch": 1.2979756616045386, "learning_rate": 5.696325420311956e-06, "loss": 2.549324188232422, "step": 1075700 }, { "epoch": 1.2980963249270214, "learning_rate": 5.695921584844217e-06, "loss": 2.5777041625976564, "step": 1075800 }, { "epoch": 1.298216988249504, "learning_rate": 5.695517749376479e-06, "loss": 2.545119323730469, "step": 1075900 }, { "epoch": 1.2983376515719867, "learning_rate": 5.69511391390874e-06, "loss": 2.5495535278320314, "step": 1076000 }, { "epoch": 1.2984583148944693, "learning_rate": 5.694710078441001e-06, "loss": 2.527934265136719, "step": 1076100 }, { "epoch": 1.2985789782169521, "learning_rate": 5.694306242973263e-06, "loss": 2.563862609863281, "step": 1076200 }, { "epoch": 1.2986996415394347, "learning_rate": 5.693902407505525e-06, "loss": 2.5605523681640623, "step": 1076300 }, { "epoch": 1.2988203048619174, "learning_rate": 5.693498572037786e-06, "loss": 2.5723776245117187, "step": 1076400 }, { "epoch": 1.2989409681844002, "learning_rate": 5.693094736570048e-06, "loss": 2.5519410705566408, "step": 1076500 }, { "epoch": 1.2990616315068828, "learning_rate": 5.69269090110231e-06, "loss": 2.533247528076172, "step": 1076600 }, { "epoch": 1.2991822948293654, "learning_rate": 5.692287065634572e-06, "loss": 2.5607833862304688, "step": 1076700 }, { "epoch": 1.299302958151848, "learning_rate": 5.6918832301668325e-06, "loss": 2.5675018310546873, "step": 1076800 }, { "epoch": 1.2994236214743309, "learning_rate": 5.6914793946990945e-06, "loss": 2.54861083984375, "step": 1076900 }, { "epoch": 1.2995442847968135, "learning_rate": 5.691075559231356e-06, "loss": 2.5647958374023436, "step": 1077000 }, { "epoch": 1.2996649481192963, "learning_rate": 5.690671723763618e-06, "loss": 2.563851623535156, "step": 1077100 }, { "epoch": 1.299785611441779, "learning_rate": 5.6902678882958796e-06, "loss": 2.554442138671875, "step": 1077200 }, { "epoch": 1.2999062747642616, "learning_rate": 5.6898640528281415e-06, "loss": 2.528411407470703, "step": 1077300 }, { "epoch": 1.3000269380867442, "learning_rate": 5.689460217360403e-06, "loss": 2.55521240234375, "step": 1077400 }, { "epoch": 1.3001476014092268, "learning_rate": 5.689056381892665e-06, "loss": 2.561631164550781, "step": 1077500 }, { "epoch": 1.3002682647317096, "learning_rate": 5.688652546424925e-06, "loss": 2.5279383850097656, "step": 1077600 }, { "epoch": 1.3003889280541923, "learning_rate": 5.688248710957187e-06, "loss": 2.5612149047851562, "step": 1077700 }, { "epoch": 1.300509591376675, "learning_rate": 5.687844875489449e-06, "loss": 2.5401556396484377, "step": 1077800 }, { "epoch": 1.3006302546991577, "learning_rate": 5.687441040021711e-06, "loss": 2.5457058715820313, "step": 1077900 }, { "epoch": 1.3007509180216403, "learning_rate": 5.687037204553972e-06, "loss": 2.5478578186035157, "step": 1078000 }, { "epoch": 1.300871581344123, "learning_rate": 5.686633369086234e-06, "loss": 2.569681396484375, "step": 1078100 }, { "epoch": 1.3009922446666058, "learning_rate": 5.686229533618496e-06, "loss": 2.544952850341797, "step": 1078200 }, { "epoch": 1.3011129079890884, "learning_rate": 5.685825698150758e-06, "loss": 2.520896759033203, "step": 1078300 }, { "epoch": 1.301233571311571, "learning_rate": 5.685421862683018e-06, "loss": 2.5551826477050783, "step": 1078400 }, { "epoch": 1.3013542346340539, "learning_rate": 5.68501802721528e-06, "loss": 2.5633694458007814, "step": 1078500 }, { "epoch": 1.3014748979565365, "learning_rate": 5.684614191747541e-06, "loss": 2.559736480712891, "step": 1078600 }, { "epoch": 1.301595561279019, "learning_rate": 5.684210356279803e-06, "loss": 2.5636862182617186, "step": 1078700 }, { "epoch": 1.3017162246015017, "learning_rate": 5.683806520812065e-06, "loss": 2.566939697265625, "step": 1078800 }, { "epoch": 1.3018368879239846, "learning_rate": 5.683402685344327e-06, "loss": 2.562860107421875, "step": 1078900 }, { "epoch": 1.3019575512464672, "learning_rate": 5.6829988498765885e-06, "loss": 2.5673727416992187, "step": 1079000 }, { "epoch": 1.30207821456895, "learning_rate": 5.6825950144088505e-06, "loss": 2.547724609375, "step": 1079100 }, { "epoch": 1.3021988778914326, "learning_rate": 5.682191178941111e-06, "loss": 2.5616259765625, "step": 1079200 }, { "epoch": 1.3023195412139152, "learning_rate": 5.681787343473373e-06, "loss": 2.552498626708984, "step": 1079300 }, { "epoch": 1.3024402045363979, "learning_rate": 5.681383508005635e-06, "loss": 2.5539315795898436, "step": 1079400 }, { "epoch": 1.3025608678588807, "learning_rate": 5.680979672537897e-06, "loss": 2.558233184814453, "step": 1079500 }, { "epoch": 1.3026815311813633, "learning_rate": 5.680575837070158e-06, "loss": 2.5554573059082033, "step": 1079600 }, { "epoch": 1.302802194503846, "learning_rate": 5.68017200160242e-06, "loss": 2.55929931640625, "step": 1079700 }, { "epoch": 1.3029228578263288, "learning_rate": 5.679768166134682e-06, "loss": 2.5748501586914063, "step": 1079800 }, { "epoch": 1.3030435211488114, "learning_rate": 5.679364330666943e-06, "loss": 2.551691436767578, "step": 1079900 }, { "epoch": 1.303164184471294, "learning_rate": 5.678960495199204e-06, "loss": 2.568845520019531, "step": 1080000 }, { "epoch": 1.3032848477937766, "learning_rate": 5.678556659731466e-06, "loss": 2.5456669616699217, "step": 1080100 }, { "epoch": 1.3034055111162595, "learning_rate": 5.678152824263727e-06, "loss": 2.564297790527344, "step": 1080200 }, { "epoch": 1.303526174438742, "learning_rate": 5.677748988795989e-06, "loss": 2.5552436828613283, "step": 1080300 }, { "epoch": 1.303646837761225, "learning_rate": 5.677345153328251e-06, "loss": 2.5716400146484375, "step": 1080400 }, { "epoch": 1.3037675010837075, "learning_rate": 5.676941317860512e-06, "loss": 2.5487734985351564, "step": 1080500 }, { "epoch": 1.3038881644061902, "learning_rate": 5.676537482392774e-06, "loss": 2.579068603515625, "step": 1080600 }, { "epoch": 1.3040088277286728, "learning_rate": 5.676133646925036e-06, "loss": 2.539351501464844, "step": 1080700 }, { "epoch": 1.3041294910511554, "learning_rate": 5.6757298114572965e-06, "loss": 2.5471832275390627, "step": 1080800 }, { "epoch": 1.3042501543736382, "learning_rate": 5.6753259759895585e-06, "loss": 2.5655126953125, "step": 1080900 }, { "epoch": 1.3043708176961208, "learning_rate": 5.6749221405218205e-06, "loss": 2.5562057495117188, "step": 1081000 }, { "epoch": 1.3044914810186037, "learning_rate": 5.674518305054082e-06, "loss": 2.538668975830078, "step": 1081100 }, { "epoch": 1.3046121443410863, "learning_rate": 5.674114469586344e-06, "loss": 2.565599060058594, "step": 1081200 }, { "epoch": 1.304732807663569, "learning_rate": 5.673710634118606e-06, "loss": 2.532515869140625, "step": 1081300 }, { "epoch": 1.3048534709860515, "learning_rate": 5.673306798650868e-06, "loss": 2.545681610107422, "step": 1081400 }, { "epoch": 1.3049741343085344, "learning_rate": 5.672902963183129e-06, "loss": 2.5640603637695314, "step": 1081500 }, { "epoch": 1.305094797631017, "learning_rate": 5.672499127715391e-06, "loss": 2.5631985473632812, "step": 1081600 }, { "epoch": 1.3052154609534996, "learning_rate": 5.672095292247651e-06, "loss": 2.560586242675781, "step": 1081700 }, { "epoch": 1.3053361242759824, "learning_rate": 5.671691456779913e-06, "loss": 2.5590782165527344, "step": 1081800 }, { "epoch": 1.305456787598465, "learning_rate": 5.671287621312175e-06, "loss": 2.5574191284179686, "step": 1081900 }, { "epoch": 1.3055774509209477, "learning_rate": 5.670883785844437e-06, "loss": 2.5618389892578124, "step": 1082000 }, { "epoch": 1.3056981142434303, "learning_rate": 5.670479950376698e-06, "loss": 2.553639373779297, "step": 1082100 }, { "epoch": 1.3058187775659131, "learning_rate": 5.67007611490896e-06, "loss": 2.5474623107910155, "step": 1082200 }, { "epoch": 1.3059394408883958, "learning_rate": 5.669672279441222e-06, "loss": 2.5589149475097654, "step": 1082300 }, { "epoch": 1.3060601042108786, "learning_rate": 5.669268443973483e-06, "loss": 2.5695513916015624, "step": 1082400 }, { "epoch": 1.3061807675333612, "learning_rate": 5.668864608505744e-06, "loss": 2.55406982421875, "step": 1082500 }, { "epoch": 1.3063014308558438, "learning_rate": 5.668460773038006e-06, "loss": 2.571086120605469, "step": 1082600 }, { "epoch": 1.3064220941783264, "learning_rate": 5.6680569375702674e-06, "loss": 2.567100830078125, "step": 1082700 }, { "epoch": 1.306542757500809, "learning_rate": 5.667653102102529e-06, "loss": 2.5550115966796874, "step": 1082800 }, { "epoch": 1.306663420823292, "learning_rate": 5.667249266634791e-06, "loss": 2.559858856201172, "step": 1082900 }, { "epoch": 1.3067840841457745, "learning_rate": 5.6668454311670525e-06, "loss": 2.5568592834472654, "step": 1083000 }, { "epoch": 1.3069047474682574, "learning_rate": 5.6664415956993145e-06, "loss": 2.5518763732910155, "step": 1083100 }, { "epoch": 1.30702541079074, "learning_rate": 5.6660377602315765e-06, "loss": 2.5424790954589844, "step": 1083200 }, { "epoch": 1.3071460741132226, "learning_rate": 5.665633924763837e-06, "loss": 2.5493783569335937, "step": 1083300 }, { "epoch": 1.3072667374357052, "learning_rate": 5.665230089296099e-06, "loss": 2.564657897949219, "step": 1083400 }, { "epoch": 1.307387400758188, "learning_rate": 5.664826253828361e-06, "loss": 2.540216827392578, "step": 1083500 }, { "epoch": 1.3075080640806707, "learning_rate": 5.664422418360622e-06, "loss": 2.580692138671875, "step": 1083600 }, { "epoch": 1.3076287274031533, "learning_rate": 5.664018582892884e-06, "loss": 2.5573179626464846, "step": 1083700 }, { "epoch": 1.3077493907256361, "learning_rate": 5.663614747425146e-06, "loss": 2.5459149169921873, "step": 1083800 }, { "epoch": 1.3078700540481187, "learning_rate": 5.663210911957408e-06, "loss": 2.57718994140625, "step": 1083900 }, { "epoch": 1.3079907173706014, "learning_rate": 5.662807076489669e-06, "loss": 2.5540150451660155, "step": 1084000 }, { "epoch": 1.308111380693084, "learning_rate": 5.66240324102193e-06, "loss": 2.5655563354492186, "step": 1084100 }, { "epoch": 1.3082320440155668, "learning_rate": 5.661999405554191e-06, "loss": 2.5618603515625, "step": 1084200 }, { "epoch": 1.3083527073380494, "learning_rate": 5.661595570086453e-06, "loss": 2.5724896240234374, "step": 1084300 }, { "epoch": 1.3084733706605323, "learning_rate": 5.661191734618715e-06, "loss": 2.5675119018554686, "step": 1084400 }, { "epoch": 1.3085940339830149, "learning_rate": 5.660787899150977e-06, "loss": 2.583421325683594, "step": 1084500 }, { "epoch": 1.3087146973054975, "learning_rate": 5.660384063683238e-06, "loss": 2.5471957397460936, "step": 1084600 }, { "epoch": 1.3088353606279801, "learning_rate": 5.6599802282155e-06, "loss": 2.5583419799804688, "step": 1084700 }, { "epoch": 1.308956023950463, "learning_rate": 5.659576392747762e-06, "loss": 2.5591046142578127, "step": 1084800 }, { "epoch": 1.3090766872729456, "learning_rate": 5.6591725572800226e-06, "loss": 2.528092498779297, "step": 1084900 }, { "epoch": 1.3091973505954282, "learning_rate": 5.6587687218122846e-06, "loss": 2.5642849731445314, "step": 1085000 }, { "epoch": 1.309318013917911, "learning_rate": 5.6583648863445465e-06, "loss": 2.5520613098144533, "step": 1085100 }, { "epoch": 1.3094386772403936, "learning_rate": 5.657961050876808e-06, "loss": 2.5574952697753908, "step": 1085200 }, { "epoch": 1.3095593405628763, "learning_rate": 5.65755721540907e-06, "loss": 2.560263366699219, "step": 1085300 }, { "epoch": 1.3096800038853589, "learning_rate": 5.657153379941332e-06, "loss": 2.528867492675781, "step": 1085400 }, { "epoch": 1.3098006672078417, "learning_rate": 5.656749544473593e-06, "loss": 2.572273864746094, "step": 1085500 }, { "epoch": 1.3099213305303243, "learning_rate": 5.656345709005855e-06, "loss": 2.5547529602050782, "step": 1085600 }, { "epoch": 1.3100419938528072, "learning_rate": 5.655941873538116e-06, "loss": 2.5502593994140623, "step": 1085700 }, { "epoch": 1.3101626571752898, "learning_rate": 5.655538038070377e-06, "loss": 2.5494180297851563, "step": 1085800 }, { "epoch": 1.3102833204977724, "learning_rate": 5.655134202602639e-06, "loss": 2.5913336181640627, "step": 1085900 }, { "epoch": 1.310403983820255, "learning_rate": 5.654730367134901e-06, "loss": 2.542246856689453, "step": 1086000 }, { "epoch": 1.3105246471427376, "learning_rate": 5.654326531667162e-06, "loss": 2.5640823364257814, "step": 1086100 }, { "epoch": 1.3106453104652205, "learning_rate": 5.653922696199424e-06, "loss": 2.541390228271484, "step": 1086200 }, { "epoch": 1.310765973787703, "learning_rate": 5.653518860731686e-06, "loss": 2.5229527282714845, "step": 1086300 }, { "epoch": 1.310886637110186, "learning_rate": 5.653115025263948e-06, "loss": 2.5556539916992187, "step": 1086400 }, { "epoch": 1.3110073004326686, "learning_rate": 5.652711189796209e-06, "loss": 2.5516934204101562, "step": 1086500 }, { "epoch": 1.3111279637551512, "learning_rate": 5.65230735432847e-06, "loss": 2.5812203979492185, "step": 1086600 }, { "epoch": 1.3112486270776338, "learning_rate": 5.6519035188607315e-06, "loss": 2.5420291137695314, "step": 1086700 }, { "epoch": 1.3113692904001166, "learning_rate": 5.6514996833929935e-06, "loss": 2.564453125, "step": 1086800 }, { "epoch": 1.3114899537225992, "learning_rate": 5.6510958479252554e-06, "loss": 2.5485185241699218, "step": 1086900 }, { "epoch": 1.3116106170450819, "learning_rate": 5.6506920124575174e-06, "loss": 2.546965789794922, "step": 1087000 }, { "epoch": 1.3117312803675647, "learning_rate": 5.6502881769897786e-06, "loss": 2.5937686157226563, "step": 1087100 }, { "epoch": 1.3118519436900473, "learning_rate": 5.6498843415220405e-06, "loss": 2.55890869140625, "step": 1087200 }, { "epoch": 1.31197260701253, "learning_rate": 5.6494805060543025e-06, "loss": 2.5580935668945313, "step": 1087300 }, { "epoch": 1.3120932703350126, "learning_rate": 5.649076670586563e-06, "loss": 2.5532290649414064, "step": 1087400 }, { "epoch": 1.3122139336574954, "learning_rate": 5.648672835118825e-06, "loss": 2.6002740478515625, "step": 1087500 }, { "epoch": 1.312334596979978, "learning_rate": 5.648268999651087e-06, "loss": 2.5522976684570313, "step": 1087600 }, { "epoch": 1.3124552603024608, "learning_rate": 5.647865164183348e-06, "loss": 2.5383283996582033, "step": 1087700 }, { "epoch": 1.3125759236249435, "learning_rate": 5.64746132871561e-06, "loss": 2.564009094238281, "step": 1087800 }, { "epoch": 1.312696586947426, "learning_rate": 5.647057493247872e-06, "loss": 2.5509564208984377, "step": 1087900 }, { "epoch": 1.3128172502699087, "learning_rate": 5.646653657780133e-06, "loss": 2.546455841064453, "step": 1088000 }, { "epoch": 1.3129379135923915, "learning_rate": 5.646249822312395e-06, "loss": 2.578446044921875, "step": 1088100 }, { "epoch": 1.3130585769148742, "learning_rate": 5.645845986844656e-06, "loss": 2.5432528686523437, "step": 1088200 }, { "epoch": 1.3131792402373568, "learning_rate": 5.645442151376917e-06, "loss": 2.54797607421875, "step": 1088300 }, { "epoch": 1.3132999035598396, "learning_rate": 5.645038315909179e-06, "loss": 2.5499722290039064, "step": 1088400 }, { "epoch": 1.3134205668823222, "learning_rate": 5.644634480441441e-06, "loss": 2.5820773315429686, "step": 1088500 }, { "epoch": 1.3135412302048048, "learning_rate": 5.644230644973702e-06, "loss": 2.557436218261719, "step": 1088600 }, { "epoch": 1.3136618935272875, "learning_rate": 5.643826809505964e-06, "loss": 2.531993865966797, "step": 1088700 }, { "epoch": 1.3137825568497703, "learning_rate": 5.643422974038226e-06, "loss": 2.548395538330078, "step": 1088800 }, { "epoch": 1.313903220172253, "learning_rate": 5.643019138570488e-06, "loss": 2.5650006103515626, "step": 1088900 }, { "epoch": 1.3140238834947355, "learning_rate": 5.642615303102749e-06, "loss": 2.549491119384766, "step": 1089000 }, { "epoch": 1.3141445468172184, "learning_rate": 5.642211467635011e-06, "loss": 2.5621163940429685, "step": 1089100 }, { "epoch": 1.314265210139701, "learning_rate": 5.641807632167272e-06, "loss": 2.5524127197265627, "step": 1089200 }, { "epoch": 1.3143858734621836, "learning_rate": 5.641403796699534e-06, "loss": 2.552733154296875, "step": 1089300 }, { "epoch": 1.3145065367846662, "learning_rate": 5.640999961231796e-06, "loss": 2.5571690368652344, "step": 1089400 }, { "epoch": 1.314627200107149, "learning_rate": 5.640596125764058e-06, "loss": 2.557180938720703, "step": 1089500 }, { "epoch": 1.3147478634296317, "learning_rate": 5.640192290296319e-06, "loss": 2.545235443115234, "step": 1089600 }, { "epoch": 1.3148685267521145, "learning_rate": 5.639788454828581e-06, "loss": 2.556837615966797, "step": 1089700 }, { "epoch": 1.3149891900745971, "learning_rate": 5.639384619360841e-06, "loss": 2.564802551269531, "step": 1089800 }, { "epoch": 1.3151098533970798, "learning_rate": 5.638980783893103e-06, "loss": 2.54810791015625, "step": 1089900 }, { "epoch": 1.3152305167195624, "learning_rate": 5.638576948425365e-06, "loss": 2.5523988342285158, "step": 1090000 }, { "epoch": 1.3153511800420452, "learning_rate": 5.638173112957627e-06, "loss": 2.547243804931641, "step": 1090100 }, { "epoch": 1.3154718433645278, "learning_rate": 5.637769277489888e-06, "loss": 2.5449708557128905, "step": 1090200 }, { "epoch": 1.3155925066870104, "learning_rate": 5.63736544202215e-06, "loss": 2.5492681884765624, "step": 1090300 }, { "epoch": 1.3157131700094933, "learning_rate": 5.636961606554412e-06, "loss": 2.5551344299316407, "step": 1090400 }, { "epoch": 1.315833833331976, "learning_rate": 5.636557771086673e-06, "loss": 2.558866271972656, "step": 1090500 }, { "epoch": 1.3159544966544585, "learning_rate": 5.636153935618934e-06, "loss": 2.5590481567382812, "step": 1090600 }, { "epoch": 1.3160751599769411, "learning_rate": 5.635750100151196e-06, "loss": 2.5398660278320313, "step": 1090700 }, { "epoch": 1.316195823299424, "learning_rate": 5.6353462646834575e-06, "loss": 2.547239990234375, "step": 1090800 }, { "epoch": 1.3163164866219066, "learning_rate": 5.6349424292157195e-06, "loss": 2.5362362670898437, "step": 1090900 }, { "epoch": 1.3164371499443894, "learning_rate": 5.6345385937479815e-06, "loss": 2.5718505859375, "step": 1091000 }, { "epoch": 1.316557813266872, "learning_rate": 5.634134758280243e-06, "loss": 2.545814971923828, "step": 1091100 }, { "epoch": 1.3166784765893547, "learning_rate": 5.633730922812505e-06, "loss": 2.543257598876953, "step": 1091200 }, { "epoch": 1.3167991399118373, "learning_rate": 5.633327087344767e-06, "loss": 2.5517544555664062, "step": 1091300 }, { "epoch": 1.31691980323432, "learning_rate": 5.6329232518770286e-06, "loss": 2.5599684143066406, "step": 1091400 }, { "epoch": 1.3170404665568027, "learning_rate": 5.632519416409289e-06, "loss": 2.5563931274414062, "step": 1091500 }, { "epoch": 1.3171611298792854, "learning_rate": 5.632115580941551e-06, "loss": 2.5631723022460937, "step": 1091600 }, { "epoch": 1.3172817932017682, "learning_rate": 5.631711745473812e-06, "loss": 2.554298858642578, "step": 1091700 }, { "epoch": 1.3174024565242508, "learning_rate": 5.631307910006074e-06, "loss": 2.548472900390625, "step": 1091800 }, { "epoch": 1.3175231198467334, "learning_rate": 5.630904074538336e-06, "loss": 2.5481982421875, "step": 1091900 }, { "epoch": 1.317643783169216, "learning_rate": 5.630500239070598e-06, "loss": 2.5821990966796875, "step": 1092000 }, { "epoch": 1.3177644464916989, "learning_rate": 5.630096403602859e-06, "loss": 2.5599241638183594, "step": 1092100 }, { "epoch": 1.3178851098141815, "learning_rate": 5.629692568135121e-06, "loss": 2.557892608642578, "step": 1092200 }, { "epoch": 1.3180057731366641, "learning_rate": 5.629288732667381e-06, "loss": 2.5427142333984376, "step": 1092300 }, { "epoch": 1.318126436459147, "learning_rate": 5.628884897199643e-06, "loss": 2.5726004028320313, "step": 1092400 }, { "epoch": 1.3182470997816296, "learning_rate": 5.628481061731905e-06, "loss": 2.526109466552734, "step": 1092500 }, { "epoch": 1.3183677631041122, "learning_rate": 5.628077226264167e-06, "loss": 2.555214538574219, "step": 1092600 }, { "epoch": 1.3184884264265948, "learning_rate": 5.627673390796428e-06, "loss": 2.548678436279297, "step": 1092700 }, { "epoch": 1.3186090897490776, "learning_rate": 5.62726955532869e-06, "loss": 2.563157958984375, "step": 1092800 }, { "epoch": 1.3187297530715603, "learning_rate": 5.626865719860952e-06, "loss": 2.568973388671875, "step": 1092900 }, { "epoch": 1.318850416394043, "learning_rate": 5.626461884393214e-06, "loss": 2.563741455078125, "step": 1093000 }, { "epoch": 1.3189710797165257, "learning_rate": 5.626058048925475e-06, "loss": 2.5436399841308592, "step": 1093100 }, { "epoch": 1.3190917430390083, "learning_rate": 5.625654213457737e-06, "loss": 2.5446818542480467, "step": 1093200 }, { "epoch": 1.319212406361491, "learning_rate": 5.625250377989998e-06, "loss": 2.5535826110839843, "step": 1093300 }, { "epoch": 1.3193330696839738, "learning_rate": 5.62484654252226e-06, "loss": 2.560447998046875, "step": 1093400 }, { "epoch": 1.3194537330064564, "learning_rate": 5.624442707054522e-06, "loss": 2.5264585876464842, "step": 1093500 }, { "epoch": 1.319574396328939, "learning_rate": 5.624038871586784e-06, "loss": 2.5848626708984375, "step": 1093600 }, { "epoch": 1.3196950596514219, "learning_rate": 5.623635036119045e-06, "loss": 2.51069580078125, "step": 1093700 }, { "epoch": 1.3198157229739045, "learning_rate": 5.623231200651307e-06, "loss": 2.5292427062988283, "step": 1093800 }, { "epoch": 1.319936386296387, "learning_rate": 5.622827365183567e-06, "loss": 2.540599822998047, "step": 1093900 }, { "epoch": 1.3200570496188697, "learning_rate": 5.622423529715829e-06, "loss": 2.531332550048828, "step": 1094000 }, { "epoch": 1.3201777129413526, "learning_rate": 5.622019694248091e-06, "loss": 2.5718896484375, "step": 1094100 }, { "epoch": 1.3202983762638352, "learning_rate": 5.621615858780353e-06, "loss": 2.5285743713378905, "step": 1094200 }, { "epoch": 1.3204190395863178, "learning_rate": 5.621212023312614e-06, "loss": 2.540790710449219, "step": 1094300 }, { "epoch": 1.3205397029088006, "learning_rate": 5.620808187844876e-06, "loss": 2.5675534057617186, "step": 1094400 }, { "epoch": 1.3206603662312832, "learning_rate": 5.620404352377138e-06, "loss": 2.5689932250976564, "step": 1094500 }, { "epoch": 1.3207810295537659, "learning_rate": 5.620000516909399e-06, "loss": 2.5678839111328124, "step": 1094600 }, { "epoch": 1.3209016928762485, "learning_rate": 5.6195966814416604e-06, "loss": 2.525592803955078, "step": 1094700 }, { "epoch": 1.3210223561987313, "learning_rate": 5.619192845973922e-06, "loss": 2.536093292236328, "step": 1094800 }, { "epoch": 1.321143019521214, "learning_rate": 5.6187890105061835e-06, "loss": 2.531951904296875, "step": 1094900 }, { "epoch": 1.3212636828436968, "learning_rate": 5.6183851750384455e-06, "loss": 2.549217529296875, "step": 1095000 }, { "epoch": 1.3213843461661794, "learning_rate": 5.6179813395707075e-06, "loss": 2.5671871948242186, "step": 1095100 }, { "epoch": 1.321505009488662, "learning_rate": 5.617577504102969e-06, "loss": 2.549984130859375, "step": 1095200 }, { "epoch": 1.3216256728111446, "learning_rate": 5.617173668635231e-06, "loss": 2.578207702636719, "step": 1095300 }, { "epoch": 1.3217463361336275, "learning_rate": 5.616769833167493e-06, "loss": 2.5482972717285155, "step": 1095400 }, { "epoch": 1.32186699945611, "learning_rate": 5.616365997699753e-06, "loss": 2.56985107421875, "step": 1095500 }, { "epoch": 1.3219876627785927, "learning_rate": 5.615962162232015e-06, "loss": 2.5251898193359374, "step": 1095600 }, { "epoch": 1.3221083261010755, "learning_rate": 5.615558326764277e-06, "loss": 2.571219482421875, "step": 1095700 }, { "epoch": 1.3222289894235582, "learning_rate": 5.615154491296538e-06, "loss": 2.5448883056640623, "step": 1095800 }, { "epoch": 1.3223496527460408, "learning_rate": 5.6147506558288e-06, "loss": 2.5816171264648435, "step": 1095900 }, { "epoch": 1.3224703160685234, "learning_rate": 5.614346820361062e-06, "loss": 2.5545326232910157, "step": 1096000 }, { "epoch": 1.3225909793910062, "learning_rate": 5.613942984893324e-06, "loss": 2.5394633483886717, "step": 1096100 }, { "epoch": 1.3227116427134888, "learning_rate": 5.613539149425585e-06, "loss": 2.5617611694335936, "step": 1096200 }, { "epoch": 1.3228323060359717, "learning_rate": 5.613135313957846e-06, "loss": 2.552193145751953, "step": 1096300 }, { "epoch": 1.3229529693584543, "learning_rate": 5.612731478490107e-06, "loss": 2.573558654785156, "step": 1096400 }, { "epoch": 1.323073632680937, "learning_rate": 5.612327643022369e-06, "loss": 2.548691864013672, "step": 1096500 }, { "epoch": 1.3231942960034195, "learning_rate": 5.611923807554631e-06, "loss": 2.556333465576172, "step": 1096600 }, { "epoch": 1.3233149593259022, "learning_rate": 5.611519972086893e-06, "loss": 2.557570495605469, "step": 1096700 }, { "epoch": 1.323435622648385, "learning_rate": 5.6111161366191544e-06, "loss": 2.5304598999023438, "step": 1096800 }, { "epoch": 1.3235562859708676, "learning_rate": 5.610712301151416e-06, "loss": 2.538854217529297, "step": 1096900 }, { "epoch": 1.3236769492933504, "learning_rate": 5.610308465683678e-06, "loss": 2.5557981872558595, "step": 1097000 }, { "epoch": 1.323797612615833, "learning_rate": 5.6099046302159395e-06, "loss": 2.5919873046875, "step": 1097100 }, { "epoch": 1.3239182759383157, "learning_rate": 5.609500794748201e-06, "loss": 2.548035430908203, "step": 1097200 }, { "epoch": 1.3240389392607983, "learning_rate": 5.609096959280463e-06, "loss": 2.5592530822753905, "step": 1097300 }, { "epoch": 1.3241596025832811, "learning_rate": 5.608693123812724e-06, "loss": 2.5602960205078125, "step": 1097400 }, { "epoch": 1.3242802659057638, "learning_rate": 5.608289288344986e-06, "loss": 2.5626220703125, "step": 1097500 }, { "epoch": 1.3244009292282464, "learning_rate": 5.607885452877248e-06, "loss": 2.568172607421875, "step": 1097600 }, { "epoch": 1.3245215925507292, "learning_rate": 5.607481617409509e-06, "loss": 2.539080047607422, "step": 1097700 }, { "epoch": 1.3246422558732118, "learning_rate": 5.607077781941771e-06, "loss": 2.5737991333007812, "step": 1097800 }, { "epoch": 1.3247629191956944, "learning_rate": 5.606673946474033e-06, "loss": 2.5636407470703126, "step": 1097900 }, { "epoch": 1.324883582518177, "learning_rate": 5.606270111006293e-06, "loss": 2.588065490722656, "step": 1098000 }, { "epoch": 1.32500424584066, "learning_rate": 5.605866275538555e-06, "loss": 2.5616497802734375, "step": 1098100 }, { "epoch": 1.3251249091631425, "learning_rate": 5.605462440070817e-06, "loss": 2.5295286560058594, "step": 1098200 }, { "epoch": 1.3252455724856254, "learning_rate": 5.605058604603078e-06, "loss": 2.561962890625, "step": 1098300 }, { "epoch": 1.325366235808108, "learning_rate": 5.60465476913534e-06, "loss": 2.5497976684570314, "step": 1098400 }, { "epoch": 1.3254868991305906, "learning_rate": 5.604250933667602e-06, "loss": 2.531443328857422, "step": 1098500 }, { "epoch": 1.3256075624530732, "learning_rate": 5.603847098199864e-06, "loss": 2.5258460998535157, "step": 1098600 }, { "epoch": 1.325728225775556, "learning_rate": 5.603443262732125e-06, "loss": 2.534833984375, "step": 1098700 }, { "epoch": 1.3258488890980387, "learning_rate": 5.6030394272643865e-06, "loss": 2.54765625, "step": 1098800 }, { "epoch": 1.3259695524205213, "learning_rate": 5.602635591796648e-06, "loss": 2.5570518493652346, "step": 1098900 }, { "epoch": 1.3260902157430041, "learning_rate": 5.60223175632891e-06, "loss": 2.55595947265625, "step": 1099000 }, { "epoch": 1.3262108790654867, "learning_rate": 5.6018279208611716e-06, "loss": 2.5565721130371095, "step": 1099100 }, { "epoch": 1.3263315423879694, "learning_rate": 5.6014240853934335e-06, "loss": 2.5457611083984375, "step": 1099200 }, { "epoch": 1.326452205710452, "learning_rate": 5.601020249925695e-06, "loss": 2.5532040405273437, "step": 1099300 }, { "epoch": 1.3265728690329348, "learning_rate": 5.600616414457957e-06, "loss": 2.5629067993164063, "step": 1099400 }, { "epoch": 1.3266935323554174, "learning_rate": 5.600212578990219e-06, "loss": 2.5379881286621093, "step": 1099500 }, { "epoch": 1.3268141956779, "learning_rate": 5.599808743522479e-06, "loss": 2.537314758300781, "step": 1099600 }, { "epoch": 1.3269348590003829, "learning_rate": 5.599404908054741e-06, "loss": 2.5620794677734375, "step": 1099700 }, { "epoch": 1.3270555223228655, "learning_rate": 5.599001072587003e-06, "loss": 2.5501333618164064, "step": 1099800 }, { "epoch": 1.3271761856453481, "learning_rate": 5.598597237119264e-06, "loss": 2.5552029418945312, "step": 1099900 }, { "epoch": 1.3272968489678307, "learning_rate": 5.598193401651526e-06, "loss": 2.5722857666015626, "step": 1100000 }, { "epoch": 1.3274175122903136, "learning_rate": 5.597789566183788e-06, "loss": 2.558529510498047, "step": 1100100 }, { "epoch": 1.3275381756127962, "learning_rate": 5.597385730716049e-06, "loss": 2.5483737182617188, "step": 1100200 }, { "epoch": 1.327658838935279, "learning_rate": 5.596981895248311e-06, "loss": 2.546100311279297, "step": 1100300 }, { "epoch": 1.3277795022577616, "learning_rate": 5.596578059780572e-06, "loss": 2.560460510253906, "step": 1100400 }, { "epoch": 1.3279001655802443, "learning_rate": 5.596174224312833e-06, "loss": 2.5154901123046876, "step": 1100500 }, { "epoch": 1.3280208289027269, "learning_rate": 5.595770388845095e-06, "loss": 2.5458868408203124, "step": 1100600 }, { "epoch": 1.3281414922252097, "learning_rate": 5.595366553377357e-06, "loss": 2.591527404785156, "step": 1100700 }, { "epoch": 1.3282621555476923, "learning_rate": 5.5949627179096185e-06, "loss": 2.520142364501953, "step": 1100800 }, { "epoch": 1.328382818870175, "learning_rate": 5.5945588824418805e-06, "loss": 2.545812072753906, "step": 1100900 }, { "epoch": 1.3285034821926578, "learning_rate": 5.5941550469741425e-06, "loss": 2.5501750183105467, "step": 1101000 }, { "epoch": 1.3286241455151404, "learning_rate": 5.5937512115064044e-06, "loss": 2.566391906738281, "step": 1101100 }, { "epoch": 1.328744808837623, "learning_rate": 5.593347376038665e-06, "loss": 2.544314270019531, "step": 1101200 }, { "epoch": 1.3288654721601056, "learning_rate": 5.592943540570927e-06, "loss": 2.5687075805664064, "step": 1101300 }, { "epoch": 1.3289861354825885, "learning_rate": 5.592539705103188e-06, "loss": 2.550492248535156, "step": 1101400 }, { "epoch": 1.329106798805071, "learning_rate": 5.59213586963545e-06, "loss": 2.531156311035156, "step": 1101500 }, { "epoch": 1.329227462127554, "learning_rate": 5.591732034167712e-06, "loss": 2.5406690979003907, "step": 1101600 }, { "epoch": 1.3293481254500366, "learning_rate": 5.591328198699974e-06, "loss": 2.553549041748047, "step": 1101700 }, { "epoch": 1.3294687887725192, "learning_rate": 5.590924363232235e-06, "loss": 2.5383856201171877, "step": 1101800 }, { "epoch": 1.3295894520950018, "learning_rate": 5.590520527764497e-06, "loss": 2.534021301269531, "step": 1101900 }, { "epoch": 1.3297101154174844, "learning_rate": 5.590116692296759e-06, "loss": 2.5559762573242186, "step": 1102000 }, { "epoch": 1.3298307787399672, "learning_rate": 5.589712856829019e-06, "loss": 2.562913513183594, "step": 1102100 }, { "epoch": 1.3299514420624499, "learning_rate": 5.589309021361281e-06, "loss": 2.567188415527344, "step": 1102200 }, { "epoch": 1.3300721053849327, "learning_rate": 5.588905185893543e-06, "loss": 2.5673507690429687, "step": 1102300 }, { "epoch": 1.3301927687074153, "learning_rate": 5.588501350425804e-06, "loss": 2.5720660400390627, "step": 1102400 }, { "epoch": 1.330313432029898, "learning_rate": 5.588097514958066e-06, "loss": 2.5451704406738282, "step": 1102500 }, { "epoch": 1.3304340953523806, "learning_rate": 5.587693679490328e-06, "loss": 2.523310089111328, "step": 1102600 }, { "epoch": 1.3305547586748634, "learning_rate": 5.587289844022589e-06, "loss": 2.5665054321289062, "step": 1102700 }, { "epoch": 1.330675421997346, "learning_rate": 5.586886008554851e-06, "loss": 2.555083465576172, "step": 1102800 }, { "epoch": 1.3307960853198286, "learning_rate": 5.5864821730871125e-06, "loss": 2.5476727294921875, "step": 1102900 }, { "epoch": 1.3309167486423115, "learning_rate": 5.586078337619374e-06, "loss": 2.544009246826172, "step": 1103000 }, { "epoch": 1.331037411964794, "learning_rate": 5.585674502151636e-06, "loss": 2.5580372619628906, "step": 1103100 }, { "epoch": 1.3311580752872767, "learning_rate": 5.585270666683898e-06, "loss": 2.5509762573242187, "step": 1103200 }, { "epoch": 1.3312787386097593, "learning_rate": 5.584866831216159e-06, "loss": 2.531029052734375, "step": 1103300 }, { "epoch": 1.3313994019322422, "learning_rate": 5.584462995748421e-06, "loss": 2.532251739501953, "step": 1103400 }, { "epoch": 1.3315200652547248, "learning_rate": 5.584059160280683e-06, "loss": 2.526808013916016, "step": 1103500 }, { "epoch": 1.3316407285772076, "learning_rate": 5.583655324812945e-06, "loss": 2.5696011352539063, "step": 1103600 }, { "epoch": 1.3317613918996902, "learning_rate": 5.583251489345205e-06, "loss": 2.5467625427246094, "step": 1103700 }, { "epoch": 1.3318820552221728, "learning_rate": 5.582847653877467e-06, "loss": 2.5390606689453126, "step": 1103800 }, { "epoch": 1.3320027185446555, "learning_rate": 5.582443818409728e-06, "loss": 2.5460989379882815, "step": 1103900 }, { "epoch": 1.3321233818671383, "learning_rate": 5.58203998294199e-06, "loss": 2.5491815185546876, "step": 1104000 }, { "epoch": 1.332244045189621, "learning_rate": 5.581636147474252e-06, "loss": 2.565324401855469, "step": 1104100 }, { "epoch": 1.3323647085121035, "learning_rate": 5.581232312006514e-06, "loss": 2.5465452575683596, "step": 1104200 }, { "epoch": 1.3324853718345864, "learning_rate": 5.580828476538775e-06, "loss": 2.5407928466796874, "step": 1104300 }, { "epoch": 1.332606035157069, "learning_rate": 5.580424641071037e-06, "loss": 2.5520751953125, "step": 1104400 }, { "epoch": 1.3327266984795516, "learning_rate": 5.5800208056032974e-06, "loss": 2.5536123657226564, "step": 1104500 }, { "epoch": 1.3328473618020342, "learning_rate": 5.579616970135559e-06, "loss": 2.558126983642578, "step": 1104600 }, { "epoch": 1.332968025124517, "learning_rate": 5.579213134667821e-06, "loss": 2.556645965576172, "step": 1104700 }, { "epoch": 1.3330886884469997, "learning_rate": 5.578809299200083e-06, "loss": 2.55730712890625, "step": 1104800 }, { "epoch": 1.3332093517694823, "learning_rate": 5.5784054637323445e-06, "loss": 2.565129699707031, "step": 1104900 }, { "epoch": 1.3333300150919651, "learning_rate": 5.5780016282646065e-06, "loss": 2.5498501586914064, "step": 1105000 }, { "epoch": 1.3334506784144478, "learning_rate": 5.5775977927968685e-06, "loss": 2.524735870361328, "step": 1105100 }, { "epoch": 1.3335713417369304, "learning_rate": 5.5771939573291305e-06, "loss": 2.5469429016113283, "step": 1105200 }, { "epoch": 1.333692005059413, "learning_rate": 5.576790121861391e-06, "loss": 2.551446533203125, "step": 1105300 }, { "epoch": 1.3338126683818958, "learning_rate": 5.576386286393653e-06, "loss": 2.5767608642578126, "step": 1105400 }, { "epoch": 1.3339333317043784, "learning_rate": 5.575982450925914e-06, "loss": 2.537062225341797, "step": 1105500 }, { "epoch": 1.3340539950268613, "learning_rate": 5.575578615458176e-06, "loss": 2.5685470581054686, "step": 1105600 }, { "epoch": 1.334174658349344, "learning_rate": 5.575174779990438e-06, "loss": 2.5610369873046874, "step": 1105700 }, { "epoch": 1.3342953216718265, "learning_rate": 5.5747709445227e-06, "loss": 2.553358459472656, "step": 1105800 }, { "epoch": 1.3344159849943091, "learning_rate": 5.574367109054961e-06, "loss": 2.544271697998047, "step": 1105900 }, { "epoch": 1.334536648316792, "learning_rate": 5.573963273587223e-06, "loss": 2.5805044555664063, "step": 1106000 }, { "epoch": 1.3346573116392746, "learning_rate": 5.573559438119483e-06, "loss": 2.543824005126953, "step": 1106100 }, { "epoch": 1.3347779749617572, "learning_rate": 5.573155602651745e-06, "loss": 2.543515319824219, "step": 1106200 }, { "epoch": 1.33489863828424, "learning_rate": 5.572751767184007e-06, "loss": 2.563873596191406, "step": 1106300 }, { "epoch": 1.3350193016067227, "learning_rate": 5.572347931716269e-06, "loss": 2.547380218505859, "step": 1106400 }, { "epoch": 1.3351399649292053, "learning_rate": 5.57194409624853e-06, "loss": 2.5344598388671873, "step": 1106500 }, { "epoch": 1.335260628251688, "learning_rate": 5.571540260780792e-06, "loss": 2.551089172363281, "step": 1106600 }, { "epoch": 1.3353812915741707, "learning_rate": 5.571136425313054e-06, "loss": 2.538284912109375, "step": 1106700 }, { "epoch": 1.3355019548966534, "learning_rate": 5.570732589845315e-06, "loss": 2.5220738220214844, "step": 1106800 }, { "epoch": 1.3356226182191362, "learning_rate": 5.570328754377577e-06, "loss": 2.536118469238281, "step": 1106900 }, { "epoch": 1.3357432815416188, "learning_rate": 5.5699249189098385e-06, "loss": 2.544111328125, "step": 1107000 }, { "epoch": 1.3358639448641014, "learning_rate": 5.5695210834421e-06, "loss": 2.545118408203125, "step": 1107100 }, { "epoch": 1.335984608186584, "learning_rate": 5.569117247974362e-06, "loss": 2.544485321044922, "step": 1107200 }, { "epoch": 1.3361052715090667, "learning_rate": 5.568713412506624e-06, "loss": 2.5573468017578125, "step": 1107300 }, { "epoch": 1.3362259348315495, "learning_rate": 5.568309577038885e-06, "loss": 2.5518424987792967, "step": 1107400 }, { "epoch": 1.3363465981540321, "learning_rate": 5.567905741571147e-06, "loss": 2.5286859130859374, "step": 1107500 }, { "epoch": 1.336467261476515, "learning_rate": 5.567501906103409e-06, "loss": 2.552254180908203, "step": 1107600 }, { "epoch": 1.3365879247989976, "learning_rate": 5.567098070635671e-06, "loss": 2.527863006591797, "step": 1107700 }, { "epoch": 1.3367085881214802, "learning_rate": 5.566694235167931e-06, "loss": 2.581435546875, "step": 1107800 }, { "epoch": 1.3368292514439628, "learning_rate": 5.566290399700193e-06, "loss": 2.5337763977050782, "step": 1107900 }, { "epoch": 1.3369499147664456, "learning_rate": 5.565886564232454e-06, "loss": 2.5375352478027344, "step": 1108000 }, { "epoch": 1.3370705780889283, "learning_rate": 5.565482728764716e-06, "loss": 2.5547279357910155, "step": 1108100 }, { "epoch": 1.3371912414114109, "learning_rate": 5.565078893296978e-06, "loss": 2.5512933349609375, "step": 1108200 }, { "epoch": 1.3373119047338937, "learning_rate": 5.56467505782924e-06, "loss": 2.566394958496094, "step": 1108300 }, { "epoch": 1.3374325680563763, "learning_rate": 5.564271222361501e-06, "loss": 2.531109619140625, "step": 1108400 }, { "epoch": 1.337553231378859, "learning_rate": 5.563867386893763e-06, "loss": 2.5505714416503906, "step": 1108500 }, { "epoch": 1.3376738947013416, "learning_rate": 5.5634635514260235e-06, "loss": 2.5428646850585936, "step": 1108600 }, { "epoch": 1.3377945580238244, "learning_rate": 5.5630597159582855e-06, "loss": 2.5584429931640624, "step": 1108700 }, { "epoch": 1.337915221346307, "learning_rate": 5.5626558804905474e-06, "loss": 2.5633999633789064, "step": 1108800 }, { "epoch": 1.3380358846687899, "learning_rate": 5.562252045022809e-06, "loss": 2.544799499511719, "step": 1108900 }, { "epoch": 1.3381565479912725, "learning_rate": 5.5618482095550706e-06, "loss": 2.553006286621094, "step": 1109000 }, { "epoch": 1.338277211313755, "learning_rate": 5.5614443740873325e-06, "loss": 2.539281005859375, "step": 1109100 }, { "epoch": 1.3383978746362377, "learning_rate": 5.5610405386195945e-06, "loss": 2.5367686462402346, "step": 1109200 }, { "epoch": 1.3385185379587206, "learning_rate": 5.560636703151856e-06, "loss": 2.550974884033203, "step": 1109300 }, { "epoch": 1.3386392012812032, "learning_rate": 5.560232867684117e-06, "loss": 2.532545471191406, "step": 1109400 }, { "epoch": 1.3387598646036858, "learning_rate": 5.559829032216379e-06, "loss": 2.5664520263671875, "step": 1109500 }, { "epoch": 1.3388805279261686, "learning_rate": 5.55942519674864e-06, "loss": 2.545825958251953, "step": 1109600 }, { "epoch": 1.3390011912486512, "learning_rate": 5.559021361280902e-06, "loss": 2.554263458251953, "step": 1109700 }, { "epoch": 1.3391218545711339, "learning_rate": 5.558617525813164e-06, "loss": 2.5776568603515626, "step": 1109800 }, { "epoch": 1.3392425178936165, "learning_rate": 5.558213690345425e-06, "loss": 2.5451824951171873, "step": 1109900 }, { "epoch": 1.3393631812160993, "learning_rate": 5.557809854877687e-06, "loss": 2.5513790893554686, "step": 1110000 }, { "epoch": 1.339483844538582, "learning_rate": 5.557406019409949e-06, "loss": 2.5632119750976563, "step": 1110100 }, { "epoch": 1.3396045078610646, "learning_rate": 5.557002183942209e-06, "loss": 2.5362506103515625, "step": 1110200 }, { "epoch": 1.3397251711835474, "learning_rate": 5.556598348474471e-06, "loss": 2.5444961547851563, "step": 1110300 }, { "epoch": 1.33984583450603, "learning_rate": 5.556194513006733e-06, "loss": 2.542674713134766, "step": 1110400 }, { "epoch": 1.3399664978285126, "learning_rate": 5.555790677538994e-06, "loss": 2.5368896484375, "step": 1110500 }, { "epoch": 1.3400871611509952, "learning_rate": 5.555386842071256e-06, "loss": 2.5381095886230467, "step": 1110600 }, { "epoch": 1.340207824473478, "learning_rate": 5.554983006603518e-06, "loss": 2.570368347167969, "step": 1110700 }, { "epoch": 1.3403284877959607, "learning_rate": 5.55457917113578e-06, "loss": 2.5426971435546877, "step": 1110800 }, { "epoch": 1.3404491511184435, "learning_rate": 5.5541753356680414e-06, "loss": 2.5433203125, "step": 1110900 }, { "epoch": 1.3405698144409262, "learning_rate": 5.553771500200303e-06, "loss": 2.552196197509766, "step": 1111000 }, { "epoch": 1.3406904777634088, "learning_rate": 5.553367664732564e-06, "loss": 2.558595886230469, "step": 1111100 }, { "epoch": 1.3408111410858914, "learning_rate": 5.552963829264826e-06, "loss": 2.5352072143554687, "step": 1111200 }, { "epoch": 1.3409318044083742, "learning_rate": 5.552559993797088e-06, "loss": 2.5393373107910158, "step": 1111300 }, { "epoch": 1.3410524677308568, "learning_rate": 5.55215615832935e-06, "loss": 2.5393157958984376, "step": 1111400 }, { "epoch": 1.3411731310533395, "learning_rate": 5.551752322861611e-06, "loss": 2.560013732910156, "step": 1111500 }, { "epoch": 1.3412937943758223, "learning_rate": 5.551348487393873e-06, "loss": 2.5662612915039062, "step": 1111600 }, { "epoch": 1.341414457698305, "learning_rate": 5.550944651926135e-06, "loss": 2.562915954589844, "step": 1111700 }, { "epoch": 1.3415351210207875, "learning_rate": 5.550540816458396e-06, "loss": 2.5793841552734373, "step": 1111800 }, { "epoch": 1.3416557843432702, "learning_rate": 5.550136980990657e-06, "loss": 2.52924072265625, "step": 1111900 }, { "epoch": 1.341776447665753, "learning_rate": 5.549733145522919e-06, "loss": 2.5424267578125, "step": 1112000 }, { "epoch": 1.3418971109882356, "learning_rate": 5.54932931005518e-06, "loss": 2.5436204528808593, "step": 1112100 }, { "epoch": 1.3420177743107184, "learning_rate": 5.548925474587442e-06, "loss": 2.568104248046875, "step": 1112200 }, { "epoch": 1.342138437633201, "learning_rate": 5.548521639119704e-06, "loss": 2.5462519836425783, "step": 1112300 }, { "epoch": 1.3422591009556837, "learning_rate": 5.548117803651965e-06, "loss": 2.5653836059570314, "step": 1112400 }, { "epoch": 1.3423797642781663, "learning_rate": 5.547713968184227e-06, "loss": 2.5654010009765624, "step": 1112500 }, { "epoch": 1.342500427600649, "learning_rate": 5.547310132716489e-06, "loss": 2.5203120422363283, "step": 1112600 }, { "epoch": 1.3426210909231318, "learning_rate": 5.5469062972487495e-06, "loss": 2.5490574645996094, "step": 1112700 }, { "epoch": 1.3427417542456144, "learning_rate": 5.5465024617810115e-06, "loss": 2.5530996704101563, "step": 1112800 }, { "epoch": 1.3428624175680972, "learning_rate": 5.5460986263132735e-06, "loss": 2.5294068908691405, "step": 1112900 }, { "epoch": 1.3429830808905798, "learning_rate": 5.545694790845535e-06, "loss": 2.5257037353515623, "step": 1113000 }, { "epoch": 1.3431037442130624, "learning_rate": 5.545290955377797e-06, "loss": 2.5374824523925783, "step": 1113100 }, { "epoch": 1.343224407535545, "learning_rate": 5.5448871199100586e-06, "loss": 2.5647607421875, "step": 1113200 }, { "epoch": 1.343345070858028, "learning_rate": 5.5444832844423206e-06, "loss": 2.5425067138671875, "step": 1113300 }, { "epoch": 1.3434657341805105, "learning_rate": 5.544079448974582e-06, "loss": 2.5473709106445312, "step": 1113400 }, { "epoch": 1.3435863975029931, "learning_rate": 5.543675613506843e-06, "loss": 2.5528302001953125, "step": 1113500 }, { "epoch": 1.343707060825476, "learning_rate": 5.543271778039104e-06, "loss": 2.5511744689941405, "step": 1113600 }, { "epoch": 1.3438277241479586, "learning_rate": 5.542867942571366e-06, "loss": 2.5588954162597655, "step": 1113700 }, { "epoch": 1.3439483874704412, "learning_rate": 5.542464107103628e-06, "loss": 2.5709823608398437, "step": 1113800 }, { "epoch": 1.3440690507929238, "learning_rate": 5.54206027163589e-06, "loss": 2.520937652587891, "step": 1113900 }, { "epoch": 1.3441897141154067, "learning_rate": 5.541656436168151e-06, "loss": 2.5643429565429687, "step": 1114000 }, { "epoch": 1.3443103774378893, "learning_rate": 5.541252600700413e-06, "loss": 2.538648681640625, "step": 1114100 }, { "epoch": 1.3444310407603721, "learning_rate": 5.540848765232675e-06, "loss": 2.5552252197265624, "step": 1114200 }, { "epoch": 1.3445517040828547, "learning_rate": 5.540444929764935e-06, "loss": 2.5260163879394533, "step": 1114300 }, { "epoch": 1.3446723674053374, "learning_rate": 5.540041094297197e-06, "loss": 2.5730535888671877, "step": 1114400 }, { "epoch": 1.34479303072782, "learning_rate": 5.539637258829459e-06, "loss": 2.5388166809082033, "step": 1114500 }, { "epoch": 1.3449136940503028, "learning_rate": 5.53923342336172e-06, "loss": 2.548509063720703, "step": 1114600 }, { "epoch": 1.3450343573727854, "learning_rate": 5.538829587893982e-06, "loss": 2.556884002685547, "step": 1114700 }, { "epoch": 1.345155020695268, "learning_rate": 5.538425752426244e-06, "loss": 2.56817138671875, "step": 1114800 }, { "epoch": 1.3452756840177509, "learning_rate": 5.5380219169585055e-06, "loss": 2.542788543701172, "step": 1114900 }, { "epoch": 1.3453963473402335, "learning_rate": 5.5376180814907675e-06, "loss": 2.5268318176269533, "step": 1115000 }, { "epoch": 1.3455170106627161, "learning_rate": 5.537214246023029e-06, "loss": 2.5365203857421874, "step": 1115100 }, { "epoch": 1.3456376739851987, "learning_rate": 5.53681041055529e-06, "loss": 2.5440408325195314, "step": 1115200 }, { "epoch": 1.3457583373076816, "learning_rate": 5.536406575087552e-06, "loss": 2.5360037231445314, "step": 1115300 }, { "epoch": 1.3458790006301642, "learning_rate": 5.536002739619814e-06, "loss": 2.552440185546875, "step": 1115400 }, { "epoch": 1.3459996639526468, "learning_rate": 5.535598904152075e-06, "loss": 2.5482569885253907, "step": 1115500 }, { "epoch": 1.3461203272751296, "learning_rate": 5.535195068684337e-06, "loss": 2.5366925048828124, "step": 1115600 }, { "epoch": 1.3462409905976123, "learning_rate": 5.534791233216599e-06, "loss": 2.553275909423828, "step": 1115700 }, { "epoch": 1.3463616539200949, "learning_rate": 5.534387397748861e-06, "loss": 2.5405120849609375, "step": 1115800 }, { "epoch": 1.3464823172425775, "learning_rate": 5.533983562281121e-06, "loss": 2.559019775390625, "step": 1115900 }, { "epoch": 1.3466029805650603, "learning_rate": 5.533579726813383e-06, "loss": 2.5397959899902345, "step": 1116000 }, { "epoch": 1.346723643887543, "learning_rate": 5.533175891345644e-06, "loss": 2.564012145996094, "step": 1116100 }, { "epoch": 1.3468443072100258, "learning_rate": 5.532772055877906e-06, "loss": 2.568498229980469, "step": 1116200 }, { "epoch": 1.3469649705325084, "learning_rate": 5.532368220410168e-06, "loss": 2.539281921386719, "step": 1116300 }, { "epoch": 1.347085633854991, "learning_rate": 5.53196438494243e-06, "loss": 2.5360700988769533, "step": 1116400 }, { "epoch": 1.3472062971774736, "learning_rate": 5.531560549474691e-06, "loss": 2.5370738220214846, "step": 1116500 }, { "epoch": 1.3473269604999565, "learning_rate": 5.531156714006953e-06, "loss": 2.528697052001953, "step": 1116600 }, { "epoch": 1.347447623822439, "learning_rate": 5.5307528785392136e-06, "loss": 2.5465025329589843, "step": 1116700 }, { "epoch": 1.3475682871449217, "learning_rate": 5.5303490430714755e-06, "loss": 2.5547276306152344, "step": 1116800 }, { "epoch": 1.3476889504674046, "learning_rate": 5.5299452076037375e-06, "loss": 2.529321746826172, "step": 1116900 }, { "epoch": 1.3478096137898872, "learning_rate": 5.5295413721359995e-06, "loss": 2.5452752685546876, "step": 1117000 }, { "epoch": 1.3479302771123698, "learning_rate": 5.529137536668261e-06, "loss": 2.5387448120117186, "step": 1117100 }, { "epoch": 1.3480509404348524, "learning_rate": 5.528733701200523e-06, "loss": 2.5606134033203123, "step": 1117200 }, { "epoch": 1.3481716037573352, "learning_rate": 5.528329865732785e-06, "loss": 2.555478210449219, "step": 1117300 }, { "epoch": 1.3482922670798179, "learning_rate": 5.527926030265046e-06, "loss": 2.5426573181152343, "step": 1117400 }, { "epoch": 1.3484129304023007, "learning_rate": 5.527522194797308e-06, "loss": 2.537702789306641, "step": 1117500 }, { "epoch": 1.3485335937247833, "learning_rate": 5.527118359329569e-06, "loss": 2.519753265380859, "step": 1117600 }, { "epoch": 1.348654257047266, "learning_rate": 5.52671452386183e-06, "loss": 2.548219757080078, "step": 1117700 }, { "epoch": 1.3487749203697486, "learning_rate": 5.526310688394092e-06, "loss": 2.5285653686523437, "step": 1117800 }, { "epoch": 1.3488955836922312, "learning_rate": 5.525906852926354e-06, "loss": 2.5342941284179688, "step": 1117900 }, { "epoch": 1.349016247014714, "learning_rate": 5.525503017458615e-06, "loss": 2.543271026611328, "step": 1118000 }, { "epoch": 1.3491369103371966, "learning_rate": 5.525099181990877e-06, "loss": 2.542471160888672, "step": 1118100 }, { "epoch": 1.3492575736596795, "learning_rate": 5.524695346523139e-06, "loss": 2.5599664306640624, "step": 1118200 }, { "epoch": 1.349378236982162, "learning_rate": 5.524291511055401e-06, "loss": 2.540577239990234, "step": 1118300 }, { "epoch": 1.3494989003046447, "learning_rate": 5.523887675587661e-06, "loss": 2.562897033691406, "step": 1118400 }, { "epoch": 1.3496195636271273, "learning_rate": 5.523483840119923e-06, "loss": 2.5509907531738283, "step": 1118500 }, { "epoch": 1.3497402269496102, "learning_rate": 5.5230800046521844e-06, "loss": 2.518310852050781, "step": 1118600 }, { "epoch": 1.3498608902720928, "learning_rate": 5.5226761691844464e-06, "loss": 2.5283380126953126, "step": 1118700 }, { "epoch": 1.3499815535945754, "learning_rate": 5.522272333716708e-06, "loss": 2.516519317626953, "step": 1118800 }, { "epoch": 1.3501022169170582, "learning_rate": 5.52186849824897e-06, "loss": 2.531022186279297, "step": 1118900 }, { "epoch": 1.3502228802395408, "learning_rate": 5.5214646627812315e-06, "loss": 2.544434814453125, "step": 1119000 }, { "epoch": 1.3503435435620235, "learning_rate": 5.5210608273134935e-06, "loss": 2.5300628662109377, "step": 1119100 }, { "epoch": 1.350464206884506, "learning_rate": 5.520656991845754e-06, "loss": 2.541341552734375, "step": 1119200 }, { "epoch": 1.350584870206989, "learning_rate": 5.520253156378016e-06, "loss": 2.5481666564941405, "step": 1119300 }, { "epoch": 1.3507055335294715, "learning_rate": 5.519849320910278e-06, "loss": 2.5577674865722657, "step": 1119400 }, { "epoch": 1.3508261968519544, "learning_rate": 5.51944548544254e-06, "loss": 2.523116149902344, "step": 1119500 }, { "epoch": 1.350946860174437, "learning_rate": 5.519041649974801e-06, "loss": 2.5553318786621095, "step": 1119600 }, { "epoch": 1.3510675234969196, "learning_rate": 5.518637814507063e-06, "loss": 2.532977752685547, "step": 1119700 }, { "epoch": 1.3511881868194022, "learning_rate": 5.518233979039325e-06, "loss": 2.529518890380859, "step": 1119800 }, { "epoch": 1.351308850141885, "learning_rate": 5.517830143571587e-06, "loss": 2.5464796447753906, "step": 1119900 }, { "epoch": 1.3514295134643677, "learning_rate": 5.517426308103847e-06, "loss": 2.56077392578125, "step": 1120000 }, { "epoch": 1.3515501767868503, "learning_rate": 5.517022472636109e-06, "loss": 2.5559896850585937, "step": 1120100 }, { "epoch": 1.3516708401093331, "learning_rate": 5.51661863716837e-06, "loss": 2.553842010498047, "step": 1120200 }, { "epoch": 1.3517915034318158, "learning_rate": 5.516214801700632e-06, "loss": 2.539685821533203, "step": 1120300 }, { "epoch": 1.3519121667542984, "learning_rate": 5.515810966232894e-06, "loss": 2.5438690185546875, "step": 1120400 }, { "epoch": 1.352032830076781, "learning_rate": 5.515407130765156e-06, "loss": 2.551146240234375, "step": 1120500 }, { "epoch": 1.3521534933992638, "learning_rate": 5.515003295297417e-06, "loss": 2.549216613769531, "step": 1120600 }, { "epoch": 1.3522741567217464, "learning_rate": 5.514599459829679e-06, "loss": 2.557922668457031, "step": 1120700 }, { "epoch": 1.352394820044229, "learning_rate": 5.51419562436194e-06, "loss": 2.50784423828125, "step": 1120800 }, { "epoch": 1.352515483366712, "learning_rate": 5.5137917888942016e-06, "loss": 2.5332676696777345, "step": 1120900 }, { "epoch": 1.3526361466891945, "learning_rate": 5.5133879534264636e-06, "loss": 2.5473388671875, "step": 1121000 }, { "epoch": 1.3527568100116771, "learning_rate": 5.5129841179587255e-06, "loss": 2.530411834716797, "step": 1121100 }, { "epoch": 1.3528774733341598, "learning_rate": 5.512580282490987e-06, "loss": 2.5281857299804686, "step": 1121200 }, { "epoch": 1.3529981366566426, "learning_rate": 5.512176447023249e-06, "loss": 2.551186370849609, "step": 1121300 }, { "epoch": 1.3531187999791252, "learning_rate": 5.511772611555511e-06, "loss": 2.546246337890625, "step": 1121400 }, { "epoch": 1.353239463301608, "learning_rate": 5.511368776087772e-06, "loss": 2.538327941894531, "step": 1121500 }, { "epoch": 1.3533601266240907, "learning_rate": 5.510964940620033e-06, "loss": 2.5449867248535156, "step": 1121600 }, { "epoch": 1.3534807899465733, "learning_rate": 5.510561105152295e-06, "loss": 2.542418212890625, "step": 1121700 }, { "epoch": 1.353601453269056, "learning_rate": 5.510157269684556e-06, "loss": 2.5215194702148436, "step": 1121800 }, { "epoch": 1.3537221165915387, "learning_rate": 5.509753434216818e-06, "loss": 2.5416180419921877, "step": 1121900 }, { "epoch": 1.3538427799140214, "learning_rate": 5.50934959874908e-06, "loss": 2.549102783203125, "step": 1122000 }, { "epoch": 1.353963443236504, "learning_rate": 5.508945763281341e-06, "loss": 2.5342994689941407, "step": 1122100 }, { "epoch": 1.3540841065589868, "learning_rate": 5.508541927813603e-06, "loss": 2.565973815917969, "step": 1122200 }, { "epoch": 1.3542047698814694, "learning_rate": 5.508138092345865e-06, "loss": 2.5185502624511718, "step": 1122300 }, { "epoch": 1.354325433203952, "learning_rate": 5.507734256878127e-06, "loss": 2.541664276123047, "step": 1122400 }, { "epoch": 1.3544460965264347, "learning_rate": 5.507330421410387e-06, "loss": 2.5332521057128905, "step": 1122500 }, { "epoch": 1.3545667598489175, "learning_rate": 5.506926585942649e-06, "loss": 2.554490509033203, "step": 1122600 }, { "epoch": 1.3546874231714001, "learning_rate": 5.5065227504749105e-06, "loss": 2.5597517395019533, "step": 1122700 }, { "epoch": 1.354808086493883, "learning_rate": 5.5061189150071725e-06, "loss": 2.5603933715820313, "step": 1122800 }, { "epoch": 1.3549287498163656, "learning_rate": 5.5057150795394344e-06, "loss": 2.5392439270019533, "step": 1122900 }, { "epoch": 1.3550494131388482, "learning_rate": 5.5053112440716964e-06, "loss": 2.5406544494628904, "step": 1123000 }, { "epoch": 1.3551700764613308, "learning_rate": 5.5049074086039576e-06, "loss": 2.5196127319335937, "step": 1123100 }, { "epoch": 1.3552907397838134, "learning_rate": 5.5045035731362195e-06, "loss": 2.5542462158203123, "step": 1123200 }, { "epoch": 1.3554114031062963, "learning_rate": 5.50409973766848e-06, "loss": 2.5477435302734377, "step": 1123300 }, { "epoch": 1.3555320664287789, "learning_rate": 5.503695902200742e-06, "loss": 2.5206947326660156, "step": 1123400 }, { "epoch": 1.3556527297512617, "learning_rate": 5.503292066733004e-06, "loss": 2.535978088378906, "step": 1123500 }, { "epoch": 1.3557733930737443, "learning_rate": 5.502888231265266e-06, "loss": 2.5170506286621093, "step": 1123600 }, { "epoch": 1.355894056396227, "learning_rate": 5.502484395797527e-06, "loss": 2.537860107421875, "step": 1123700 }, { "epoch": 1.3560147197187096, "learning_rate": 5.502080560329789e-06, "loss": 2.5277445983886717, "step": 1123800 }, { "epoch": 1.3561353830411924, "learning_rate": 5.501676724862051e-06, "loss": 2.545663299560547, "step": 1123900 }, { "epoch": 1.356256046363675, "learning_rate": 5.501272889394312e-06, "loss": 2.5464501953125, "step": 1124000 }, { "epoch": 1.3563767096861576, "learning_rate": 5.500869053926573e-06, "loss": 2.53087646484375, "step": 1124100 }, { "epoch": 1.3564973730086405, "learning_rate": 5.500465218458835e-06, "loss": 2.528291778564453, "step": 1124200 }, { "epoch": 1.356618036331123, "learning_rate": 5.500061382991096e-06, "loss": 2.556417999267578, "step": 1124300 }, { "epoch": 1.3567386996536057, "learning_rate": 5.499657547523358e-06, "loss": 2.5463137817382813, "step": 1124400 }, { "epoch": 1.3568593629760883, "learning_rate": 5.49925371205562e-06, "loss": 2.5528323364257814, "step": 1124500 }, { "epoch": 1.3569800262985712, "learning_rate": 5.498849876587881e-06, "loss": 2.5476618957519532, "step": 1124600 }, { "epoch": 1.3571006896210538, "learning_rate": 5.498446041120143e-06, "loss": 2.532095489501953, "step": 1124700 }, { "epoch": 1.3572213529435366, "learning_rate": 5.498042205652405e-06, "loss": 2.5468052673339843, "step": 1124800 }, { "epoch": 1.3573420162660192, "learning_rate": 5.497638370184666e-06, "loss": 2.5427659606933593, "step": 1124900 }, { "epoch": 1.3574626795885019, "learning_rate": 5.497234534716928e-06, "loss": 2.5309274291992185, "step": 1125000 }, { "epoch": 1.3575833429109845, "learning_rate": 5.49683069924919e-06, "loss": 2.525297088623047, "step": 1125100 }, { "epoch": 1.3577040062334673, "learning_rate": 5.496426863781451e-06, "loss": 2.5114067077636717, "step": 1125200 }, { "epoch": 1.35782466955595, "learning_rate": 5.496023028313713e-06, "loss": 2.511322784423828, "step": 1125300 }, { "epoch": 1.3579453328784326, "learning_rate": 5.495619192845975e-06, "loss": 2.5488937377929686, "step": 1125400 }, { "epoch": 1.3580659962009154, "learning_rate": 5.495215357378237e-06, "loss": 2.5407017517089843, "step": 1125500 }, { "epoch": 1.358186659523398, "learning_rate": 5.494811521910498e-06, "loss": 2.568465576171875, "step": 1125600 }, { "epoch": 1.3583073228458806, "learning_rate": 5.494407686442759e-06, "loss": 2.545077056884766, "step": 1125700 }, { "epoch": 1.3584279861683632, "learning_rate": 5.49400385097502e-06, "loss": 2.5211495971679687, "step": 1125800 }, { "epoch": 1.358548649490846, "learning_rate": 5.493600015507282e-06, "loss": 2.5613250732421875, "step": 1125900 }, { "epoch": 1.3586693128133287, "learning_rate": 5.493196180039544e-06, "loss": 2.5317626953125, "step": 1126000 }, { "epoch": 1.3587899761358113, "learning_rate": 5.492792344571806e-06, "loss": 2.5492181396484375, "step": 1126100 }, { "epoch": 1.3589106394582942, "learning_rate": 5.492388509104067e-06, "loss": 2.521556701660156, "step": 1126200 }, { "epoch": 1.3590313027807768, "learning_rate": 5.491984673636329e-06, "loss": 2.5345832824707033, "step": 1126300 }, { "epoch": 1.3591519661032594, "learning_rate": 5.491580838168591e-06, "loss": 2.5059523010253906, "step": 1126400 }, { "epoch": 1.359272629425742, "learning_rate": 5.491177002700851e-06, "loss": 2.5525477600097655, "step": 1126500 }, { "epoch": 1.3593932927482248, "learning_rate": 5.490773167233113e-06, "loss": 2.536240692138672, "step": 1126600 }, { "epoch": 1.3595139560707075, "learning_rate": 5.490369331765375e-06, "loss": 2.547270965576172, "step": 1126700 }, { "epoch": 1.3596346193931903, "learning_rate": 5.4899654962976365e-06, "loss": 2.5382621765136717, "step": 1126800 }, { "epoch": 1.359755282715673, "learning_rate": 5.4895616608298985e-06, "loss": 2.5084226989746092, "step": 1126900 }, { "epoch": 1.3598759460381555, "learning_rate": 5.4891578253621605e-06, "loss": 2.5537115478515626, "step": 1127000 }, { "epoch": 1.3599966093606382, "learning_rate": 5.488753989894422e-06, "loss": 2.529862518310547, "step": 1127100 }, { "epoch": 1.360117272683121, "learning_rate": 5.488350154426684e-06, "loss": 2.5425225830078126, "step": 1127200 }, { "epoch": 1.3602379360056036, "learning_rate": 5.487946318958946e-06, "loss": 2.546363983154297, "step": 1127300 }, { "epoch": 1.3603585993280862, "learning_rate": 5.487542483491206e-06, "loss": 2.555062255859375, "step": 1127400 }, { "epoch": 1.360479262650569, "learning_rate": 5.487138648023468e-06, "loss": 2.536742401123047, "step": 1127500 }, { "epoch": 1.3605999259730517, "learning_rate": 5.48673481255573e-06, "loss": 2.5172850036621095, "step": 1127600 }, { "epoch": 1.3607205892955343, "learning_rate": 5.486330977087991e-06, "loss": 2.548764343261719, "step": 1127700 }, { "epoch": 1.360841252618017, "learning_rate": 5.485927141620253e-06, "loss": 2.5186814880371093, "step": 1127800 }, { "epoch": 1.3609619159404998, "learning_rate": 5.485523306152515e-06, "loss": 2.5488526916503904, "step": 1127900 }, { "epoch": 1.3610825792629824, "learning_rate": 5.485119470684777e-06, "loss": 2.5373512268066407, "step": 1128000 }, { "epoch": 1.3612032425854652, "learning_rate": 5.484715635217038e-06, "loss": 2.5273744201660158, "step": 1128100 }, { "epoch": 1.3613239059079478, "learning_rate": 5.484311799749299e-06, "loss": 2.566933898925781, "step": 1128200 }, { "epoch": 1.3614445692304304, "learning_rate": 5.48390796428156e-06, "loss": 2.5179644775390626, "step": 1128300 }, { "epoch": 1.361565232552913, "learning_rate": 5.483504128813822e-06, "loss": 2.5089340209960938, "step": 1128400 }, { "epoch": 1.3616858958753957, "learning_rate": 5.483100293346084e-06, "loss": 2.522506103515625, "step": 1128500 }, { "epoch": 1.3618065591978785, "learning_rate": 5.482696457878346e-06, "loss": 2.5125848388671876, "step": 1128600 }, { "epoch": 1.3619272225203611, "learning_rate": 5.482292622410607e-06, "loss": 2.549005584716797, "step": 1128700 }, { "epoch": 1.362047885842844, "learning_rate": 5.481888786942869e-06, "loss": 2.5461631774902345, "step": 1128800 }, { "epoch": 1.3621685491653266, "learning_rate": 5.481484951475131e-06, "loss": 2.5144801330566406, "step": 1128900 }, { "epoch": 1.3622892124878092, "learning_rate": 5.481081116007392e-06, "loss": 2.546425018310547, "step": 1129000 }, { "epoch": 1.3624098758102918, "learning_rate": 5.480677280539654e-06, "loss": 2.5235301208496095, "step": 1129100 }, { "epoch": 1.3625305391327747, "learning_rate": 5.480273445071916e-06, "loss": 2.54118408203125, "step": 1129200 }, { "epoch": 1.3626512024552573, "learning_rate": 5.479869609604177e-06, "loss": 2.5247308349609376, "step": 1129300 }, { "epoch": 1.36277186577774, "learning_rate": 5.479465774136439e-06, "loss": 2.55634765625, "step": 1129400 }, { "epoch": 1.3628925291002227, "learning_rate": 5.479061938668701e-06, "loss": 2.546397399902344, "step": 1129500 }, { "epoch": 1.3630131924227054, "learning_rate": 5.478658103200962e-06, "loss": 2.543706512451172, "step": 1129600 }, { "epoch": 1.363133855745188, "learning_rate": 5.478254267733224e-06, "loss": 2.5261944580078124, "step": 1129700 }, { "epoch": 1.3632545190676706, "learning_rate": 5.477850432265485e-06, "loss": 2.515106506347656, "step": 1129800 }, { "epoch": 1.3633751823901534, "learning_rate": 5.477446596797746e-06, "loss": 2.542965850830078, "step": 1129900 }, { "epoch": 1.363495845712636, "learning_rate": 5.477042761330008e-06, "loss": 2.537078399658203, "step": 1130000 }, { "epoch": 1.3636165090351189, "learning_rate": 5.47663892586227e-06, "loss": 2.5330560302734373, "step": 1130100 }, { "epoch": 1.3637371723576015, "learning_rate": 5.476235090394531e-06, "loss": 2.5538006591796876, "step": 1130200 }, { "epoch": 1.3638578356800841, "learning_rate": 5.475831254926793e-06, "loss": 2.5284684753417968, "step": 1130300 }, { "epoch": 1.3639784990025667, "learning_rate": 5.475427419459055e-06, "loss": 2.5340118408203125, "step": 1130400 }, { "epoch": 1.3640991623250496, "learning_rate": 5.475023583991317e-06, "loss": 2.5498179626464843, "step": 1130500 }, { "epoch": 1.3642198256475322, "learning_rate": 5.4746197485235775e-06, "loss": 2.5415298461914064, "step": 1130600 }, { "epoch": 1.3643404889700148, "learning_rate": 5.4742159130558394e-06, "loss": 2.552894744873047, "step": 1130700 }, { "epoch": 1.3644611522924976, "learning_rate": 5.4738120775881006e-06, "loss": 2.5367230224609374, "step": 1130800 }, { "epoch": 1.3645818156149803, "learning_rate": 5.4734082421203626e-06, "loss": 2.53853515625, "step": 1130900 }, { "epoch": 1.3647024789374629, "learning_rate": 5.4730044066526245e-06, "loss": 2.5517034912109375, "step": 1131000 }, { "epoch": 1.3648231422599455, "learning_rate": 5.4726005711848865e-06, "loss": 2.52247802734375, "step": 1131100 }, { "epoch": 1.3649438055824283, "learning_rate": 5.472196735717148e-06, "loss": 2.5470062255859376, "step": 1131200 }, { "epoch": 1.365064468904911, "learning_rate": 5.47179290024941e-06, "loss": 2.544286651611328, "step": 1131300 }, { "epoch": 1.3651851322273936, "learning_rate": 5.47138906478167e-06, "loss": 2.526001281738281, "step": 1131400 }, { "epoch": 1.3653057955498764, "learning_rate": 5.470985229313932e-06, "loss": 2.526212158203125, "step": 1131500 }, { "epoch": 1.365426458872359, "learning_rate": 5.470581393846194e-06, "loss": 2.543825988769531, "step": 1131600 }, { "epoch": 1.3655471221948416, "learning_rate": 5.470177558378456e-06, "loss": 2.5256793212890627, "step": 1131700 }, { "epoch": 1.3656677855173243, "learning_rate": 5.469773722910717e-06, "loss": 2.5456607055664064, "step": 1131800 }, { "epoch": 1.365788448839807, "learning_rate": 5.469369887442979e-06, "loss": 2.565182800292969, "step": 1131900 }, { "epoch": 1.3659091121622897, "learning_rate": 5.468966051975241e-06, "loss": 2.5345989990234377, "step": 1132000 }, { "epoch": 1.3660297754847726, "learning_rate": 5.468562216507502e-06, "loss": 2.5519664001464846, "step": 1132100 }, { "epoch": 1.3661504388072552, "learning_rate": 5.468158381039763e-06, "loss": 2.5582870483398437, "step": 1132200 }, { "epoch": 1.3662711021297378, "learning_rate": 5.467754545572025e-06, "loss": 2.5398123168945315, "step": 1132300 }, { "epoch": 1.3663917654522204, "learning_rate": 5.467350710104286e-06, "loss": 2.5418060302734373, "step": 1132400 }, { "epoch": 1.3665124287747032, "learning_rate": 5.466946874636548e-06, "loss": 2.5375169372558593, "step": 1132500 }, { "epoch": 1.3666330920971859, "learning_rate": 5.46654303916881e-06, "loss": 2.5345640563964844, "step": 1132600 }, { "epoch": 1.3667537554196685, "learning_rate": 5.4661392037010715e-06, "loss": 2.5095263671875, "step": 1132700 }, { "epoch": 1.3668744187421513, "learning_rate": 5.4657353682333334e-06, "loss": 2.544271240234375, "step": 1132800 }, { "epoch": 1.366995082064634, "learning_rate": 5.4653315327655954e-06, "loss": 2.558857269287109, "step": 1132900 }, { "epoch": 1.3671157453871166, "learning_rate": 5.464927697297857e-06, "loss": 2.5289830017089843, "step": 1133000 }, { "epoch": 1.3672364087095992, "learning_rate": 5.464523861830118e-06, "loss": 2.5395074462890626, "step": 1133100 }, { "epoch": 1.367357072032082, "learning_rate": 5.46412002636238e-06, "loss": 2.5412644958496093, "step": 1133200 }, { "epoch": 1.3674777353545646, "learning_rate": 5.463716190894641e-06, "loss": 2.552389373779297, "step": 1133300 }, { "epoch": 1.3675983986770475, "learning_rate": 5.463312355426903e-06, "loss": 2.528237762451172, "step": 1133400 }, { "epoch": 1.36771906199953, "learning_rate": 5.462908519959165e-06, "loss": 2.52712158203125, "step": 1133500 }, { "epoch": 1.3678397253220127, "learning_rate": 5.462504684491427e-06, "loss": 2.527351989746094, "step": 1133600 }, { "epoch": 1.3679603886444953, "learning_rate": 5.462100849023688e-06, "loss": 2.520762634277344, "step": 1133700 }, { "epoch": 1.368081051966978, "learning_rate": 5.46169701355595e-06, "loss": 2.5224348449707032, "step": 1133800 }, { "epoch": 1.3682017152894608, "learning_rate": 5.46129317808821e-06, "loss": 2.5395237731933595, "step": 1133900 }, { "epoch": 1.3683223786119434, "learning_rate": 5.460889342620472e-06, "loss": 2.523396759033203, "step": 1134000 }, { "epoch": 1.3684430419344262, "learning_rate": 5.460485507152734e-06, "loss": 2.5361149597167967, "step": 1134100 }, { "epoch": 1.3685637052569088, "learning_rate": 5.460081671684996e-06, "loss": 2.5270977783203126, "step": 1134200 }, { "epoch": 1.3686843685793915, "learning_rate": 5.459677836217257e-06, "loss": 2.5597315979003907, "step": 1134300 }, { "epoch": 1.368805031901874, "learning_rate": 5.459274000749519e-06, "loss": 2.5261296081542968, "step": 1134400 }, { "epoch": 1.368925695224357, "learning_rate": 5.458870165281781e-06, "loss": 2.5534066772460937, "step": 1134500 }, { "epoch": 1.3690463585468395, "learning_rate": 5.458466329814043e-06, "loss": 2.524967041015625, "step": 1134600 }, { "epoch": 1.3691670218693222, "learning_rate": 5.4580624943463035e-06, "loss": 2.5324061584472655, "step": 1134700 }, { "epoch": 1.369287685191805, "learning_rate": 5.4576586588785655e-06, "loss": 2.5290873718261717, "step": 1134800 }, { "epoch": 1.3694083485142876, "learning_rate": 5.457254823410827e-06, "loss": 2.534931182861328, "step": 1134900 }, { "epoch": 1.3695290118367702, "learning_rate": 5.456850987943089e-06, "loss": 2.538076171875, "step": 1135000 }, { "epoch": 1.3696496751592528, "learning_rate": 5.4564471524753506e-06, "loss": 2.5237281799316404, "step": 1135100 }, { "epoch": 1.3697703384817357, "learning_rate": 5.4560433170076125e-06, "loss": 2.538491516113281, "step": 1135200 }, { "epoch": 1.3698910018042183, "learning_rate": 5.455639481539874e-06, "loss": 2.536091156005859, "step": 1135300 }, { "epoch": 1.3700116651267011, "learning_rate": 5.455235646072136e-06, "loss": 2.542910919189453, "step": 1135400 }, { "epoch": 1.3701323284491838, "learning_rate": 5.454831810604396e-06, "loss": 2.5501914978027345, "step": 1135500 }, { "epoch": 1.3702529917716664, "learning_rate": 5.454427975136658e-06, "loss": 2.5471392822265626, "step": 1135600 }, { "epoch": 1.370373655094149, "learning_rate": 5.45402413966892e-06, "loss": 2.5583735656738282, "step": 1135700 }, { "epoch": 1.3704943184166318, "learning_rate": 5.453620304201182e-06, "loss": 2.5479974365234375, "step": 1135800 }, { "epoch": 1.3706149817391144, "learning_rate": 5.453216468733443e-06, "loss": 2.532686462402344, "step": 1135900 }, { "epoch": 1.370735645061597, "learning_rate": 5.452812633265705e-06, "loss": 2.5161082458496096, "step": 1136000 }, { "epoch": 1.37085630838408, "learning_rate": 5.452408797797967e-06, "loss": 2.5332286071777346, "step": 1136100 }, { "epoch": 1.3709769717065625, "learning_rate": 5.452004962330228e-06, "loss": 2.513297576904297, "step": 1136200 }, { "epoch": 1.3710976350290451, "learning_rate": 5.451601126862489e-06, "loss": 2.5305491638183595, "step": 1136300 }, { "epoch": 1.3712182983515278, "learning_rate": 5.451197291394751e-06, "loss": 2.5382089233398437, "step": 1136400 }, { "epoch": 1.3713389616740106, "learning_rate": 5.450793455927012e-06, "loss": 2.542510528564453, "step": 1136500 }, { "epoch": 1.3714596249964932, "learning_rate": 5.450389620459274e-06, "loss": 2.5426008605957033, "step": 1136600 }, { "epoch": 1.3715802883189758, "learning_rate": 5.449985784991536e-06, "loss": 2.5103395080566404, "step": 1136700 }, { "epoch": 1.3717009516414587, "learning_rate": 5.4495819495237975e-06, "loss": 2.546983642578125, "step": 1136800 }, { "epoch": 1.3718216149639413, "learning_rate": 5.4491781140560595e-06, "loss": 2.5199876403808594, "step": 1136900 }, { "epoch": 1.371942278286424, "learning_rate": 5.4487742785883215e-06, "loss": 2.5389828491210937, "step": 1137000 }, { "epoch": 1.3720629416089065, "learning_rate": 5.448370443120582e-06, "loss": 2.519501953125, "step": 1137100 }, { "epoch": 1.3721836049313894, "learning_rate": 5.447966607652844e-06, "loss": 2.5643328857421874, "step": 1137200 }, { "epoch": 1.372304268253872, "learning_rate": 5.447562772185106e-06, "loss": 2.5271170043945315, "step": 1137300 }, { "epoch": 1.3724249315763548, "learning_rate": 5.447158936717367e-06, "loss": 2.517020416259766, "step": 1137400 }, { "epoch": 1.3725455948988374, "learning_rate": 5.446755101249629e-06, "loss": 2.569444580078125, "step": 1137500 }, { "epoch": 1.37266625822132, "learning_rate": 5.446351265781891e-06, "loss": 2.5404542541503905, "step": 1137600 }, { "epoch": 1.3727869215438027, "learning_rate": 5.445947430314153e-06, "loss": 2.5718399047851563, "step": 1137700 }, { "epoch": 1.3729075848662855, "learning_rate": 5.445543594846414e-06, "loss": 2.5461988830566407, "step": 1137800 }, { "epoch": 1.3730282481887681, "learning_rate": 5.445139759378676e-06, "loss": 2.548560791015625, "step": 1137900 }, { "epoch": 1.3731489115112507, "learning_rate": 5.444735923910936e-06, "loss": 2.54360595703125, "step": 1138000 }, { "epoch": 1.3732695748337336, "learning_rate": 5.444332088443198e-06, "loss": 2.5419076538085936, "step": 1138100 }, { "epoch": 1.3733902381562162, "learning_rate": 5.44392825297546e-06, "loss": 2.552976531982422, "step": 1138200 }, { "epoch": 1.3735109014786988, "learning_rate": 5.443524417507722e-06, "loss": 2.52674072265625, "step": 1138300 }, { "epoch": 1.3736315648011814, "learning_rate": 5.443120582039983e-06, "loss": 2.543697509765625, "step": 1138400 }, { "epoch": 1.3737522281236643, "learning_rate": 5.442716746572245e-06, "loss": 2.5015023803710936, "step": 1138500 }, { "epoch": 1.3738728914461469, "learning_rate": 5.442312911104507e-06, "loss": 2.5388385009765626, "step": 1138600 }, { "epoch": 1.3739935547686297, "learning_rate": 5.441909075636768e-06, "loss": 2.5495433044433593, "step": 1138700 }, { "epoch": 1.3741142180911123, "learning_rate": 5.4415052401690295e-06, "loss": 2.535744323730469, "step": 1138800 }, { "epoch": 1.374234881413595, "learning_rate": 5.4411014047012915e-06, "loss": 2.5505636596679686, "step": 1138900 }, { "epoch": 1.3743555447360776, "learning_rate": 5.440697569233553e-06, "loss": 2.544205780029297, "step": 1139000 }, { "epoch": 1.3744762080585602, "learning_rate": 5.440293733765815e-06, "loss": 2.541745147705078, "step": 1139100 }, { "epoch": 1.374596871381043, "learning_rate": 5.439889898298077e-06, "loss": 2.5528407287597656, "step": 1139200 }, { "epoch": 1.3747175347035256, "learning_rate": 5.439486062830338e-06, "loss": 2.5194491577148437, "step": 1139300 }, { "epoch": 1.3748381980260085, "learning_rate": 5.4390822273626e-06, "loss": 2.523556671142578, "step": 1139400 }, { "epoch": 1.374958861348491, "learning_rate": 5.438678391894862e-06, "loss": 2.52521728515625, "step": 1139500 }, { "epoch": 1.3750795246709737, "learning_rate": 5.438274556427122e-06, "loss": 2.512046203613281, "step": 1139600 }, { "epoch": 1.3752001879934563, "learning_rate": 5.437870720959384e-06, "loss": 2.541837463378906, "step": 1139700 }, { "epoch": 1.3753208513159392, "learning_rate": 5.437466885491646e-06, "loss": 2.525388488769531, "step": 1139800 }, { "epoch": 1.3754415146384218, "learning_rate": 5.437063050023907e-06, "loss": 2.545591125488281, "step": 1139900 }, { "epoch": 1.3755621779609044, "learning_rate": 5.436659214556169e-06, "loss": 2.52818603515625, "step": 1140000 }, { "epoch": 1.3756828412833872, "learning_rate": 5.436255379088431e-06, "loss": 2.515214691162109, "step": 1140100 }, { "epoch": 1.3758035046058699, "learning_rate": 5.435851543620693e-06, "loss": 2.545337982177734, "step": 1140200 }, { "epoch": 1.3759241679283525, "learning_rate": 5.435447708152954e-06, "loss": 2.541880798339844, "step": 1140300 }, { "epoch": 1.376044831250835, "learning_rate": 5.435043872685215e-06, "loss": 2.5188539123535154, "step": 1140400 }, { "epoch": 1.376165494573318, "learning_rate": 5.4346400372174764e-06, "loss": 2.5112628173828124, "step": 1140500 }, { "epoch": 1.3762861578958006, "learning_rate": 5.4342362017497384e-06, "loss": 2.524778137207031, "step": 1140600 }, { "epoch": 1.3764068212182834, "learning_rate": 5.433832366282e-06, "loss": 2.543590240478516, "step": 1140700 }, { "epoch": 1.376527484540766, "learning_rate": 5.433428530814262e-06, "loss": 2.5368023681640626, "step": 1140800 }, { "epoch": 1.3766481478632486, "learning_rate": 5.4330246953465235e-06, "loss": 2.5154937744140624, "step": 1140900 }, { "epoch": 1.3767688111857312, "learning_rate": 5.4326208598787855e-06, "loss": 2.513436584472656, "step": 1141000 }, { "epoch": 1.376889474508214, "learning_rate": 5.4322170244110475e-06, "loss": 2.503190765380859, "step": 1141100 }, { "epoch": 1.3770101378306967, "learning_rate": 5.431813188943308e-06, "loss": 2.557327880859375, "step": 1141200 }, { "epoch": 1.3771308011531793, "learning_rate": 5.43140935347557e-06, "loss": 2.5278384399414064, "step": 1141300 }, { "epoch": 1.3772514644756622, "learning_rate": 5.431005518007832e-06, "loss": 2.5263067626953126, "step": 1141400 }, { "epoch": 1.3773721277981448, "learning_rate": 5.430601682540093e-06, "loss": 2.5221929931640625, "step": 1141500 }, { "epoch": 1.3774927911206274, "learning_rate": 5.430197847072355e-06, "loss": 2.544229278564453, "step": 1141600 }, { "epoch": 1.37761345444311, "learning_rate": 5.429794011604617e-06, "loss": 2.554261016845703, "step": 1141700 }, { "epoch": 1.3777341177655928, "learning_rate": 5.429390176136878e-06, "loss": 2.5323876953125, "step": 1141800 }, { "epoch": 1.3778547810880755, "learning_rate": 5.42898634066914e-06, "loss": 2.528624725341797, "step": 1141900 }, { "epoch": 1.377975444410558, "learning_rate": 5.428582505201401e-06, "loss": 2.5226971435546877, "step": 1142000 }, { "epoch": 1.378096107733041, "learning_rate": 5.428178669733662e-06, "loss": 2.5477256774902344, "step": 1142100 }, { "epoch": 1.3782167710555235, "learning_rate": 5.427774834265924e-06, "loss": 2.5299638366699218, "step": 1142200 }, { "epoch": 1.3783374343780062, "learning_rate": 5.427370998798186e-06, "loss": 2.5363206481933593, "step": 1142300 }, { "epoch": 1.3784580977004888, "learning_rate": 5.426967163330447e-06, "loss": 2.547471923828125, "step": 1142400 }, { "epoch": 1.3785787610229716, "learning_rate": 5.426563327862709e-06, "loss": 2.514842834472656, "step": 1142500 }, { "epoch": 1.3786994243454542, "learning_rate": 5.426159492394971e-06, "loss": 2.5372265625, "step": 1142600 }, { "epoch": 1.378820087667937, "learning_rate": 5.425755656927233e-06, "loss": 2.515281219482422, "step": 1142700 }, { "epoch": 1.3789407509904197, "learning_rate": 5.425351821459494e-06, "loss": 2.511183013916016, "step": 1142800 }, { "epoch": 1.3790614143129023, "learning_rate": 5.4249479859917556e-06, "loss": 2.5355906677246094, "step": 1142900 }, { "epoch": 1.379182077635385, "learning_rate": 5.424544150524017e-06, "loss": 2.5508056640625, "step": 1143000 }, { "epoch": 1.3793027409578678, "learning_rate": 5.424140315056279e-06, "loss": 2.541520080566406, "step": 1143100 }, { "epoch": 1.3794234042803504, "learning_rate": 5.423736479588541e-06, "loss": 2.5150335693359374, "step": 1143200 }, { "epoch": 1.379544067602833, "learning_rate": 5.423332644120803e-06, "loss": 2.5438296508789064, "step": 1143300 }, { "epoch": 1.3796647309253158, "learning_rate": 5.422928808653064e-06, "loss": 2.5094369506835936, "step": 1143400 }, { "epoch": 1.3797853942477984, "learning_rate": 5.422524973185326e-06, "loss": 2.5541021728515627, "step": 1143500 }, { "epoch": 1.379906057570281, "learning_rate": 5.422121137717588e-06, "loss": 2.5475660705566407, "step": 1143600 }, { "epoch": 1.3800267208927637, "learning_rate": 5.421717302249848e-06, "loss": 2.5314952087402345, "step": 1143700 }, { "epoch": 1.3801473842152465, "learning_rate": 5.42131346678211e-06, "loss": 2.5375489807128906, "step": 1143800 }, { "epoch": 1.3802680475377291, "learning_rate": 5.420909631314372e-06, "loss": 2.521672668457031, "step": 1143900 }, { "epoch": 1.380388710860212, "learning_rate": 5.420505795846633e-06, "loss": 2.535904846191406, "step": 1144000 }, { "epoch": 1.3805093741826946, "learning_rate": 5.420101960378895e-06, "loss": 2.531316680908203, "step": 1144100 }, { "epoch": 1.3806300375051772, "learning_rate": 5.419698124911157e-06, "loss": 2.5353948974609377, "step": 1144200 }, { "epoch": 1.3807507008276598, "learning_rate": 5.419294289443418e-06, "loss": 2.5233360290527345, "step": 1144300 }, { "epoch": 1.3808713641501424, "learning_rate": 5.41889045397568e-06, "loss": 2.5406507873535156, "step": 1144400 }, { "epoch": 1.3809920274726253, "learning_rate": 5.418486618507941e-06, "loss": 2.552934417724609, "step": 1144500 }, { "epoch": 1.381112690795108, "learning_rate": 5.4180827830402025e-06, "loss": 2.548315124511719, "step": 1144600 }, { "epoch": 1.3812333541175907, "learning_rate": 5.4176789475724645e-06, "loss": 2.543492431640625, "step": 1144700 }, { "epoch": 1.3813540174400734, "learning_rate": 5.4172751121047264e-06, "loss": 2.555675048828125, "step": 1144800 }, { "epoch": 1.381474680762556, "learning_rate": 5.416871276636988e-06, "loss": 2.527588195800781, "step": 1144900 }, { "epoch": 1.3815953440850386, "learning_rate": 5.4164674411692496e-06, "loss": 2.5472946166992188, "step": 1145000 }, { "epoch": 1.3817160074075214, "learning_rate": 5.4160636057015115e-06, "loss": 2.5301190185546876, "step": 1145100 }, { "epoch": 1.381836670730004, "learning_rate": 5.4156597702337735e-06, "loss": 2.5367149353027343, "step": 1145200 }, { "epoch": 1.3819573340524867, "learning_rate": 5.415255934766034e-06, "loss": 2.5438656616210937, "step": 1145300 }, { "epoch": 1.3820779973749695, "learning_rate": 5.414852099298296e-06, "loss": 2.532565460205078, "step": 1145400 }, { "epoch": 1.3821986606974521, "learning_rate": 5.414448263830557e-06, "loss": 2.521920471191406, "step": 1145500 }, { "epoch": 1.3823193240199347, "learning_rate": 5.414044428362819e-06, "loss": 2.5297177124023436, "step": 1145600 }, { "epoch": 1.3824399873424174, "learning_rate": 5.413640592895081e-06, "loss": 2.5246351623535155, "step": 1145700 }, { "epoch": 1.3825606506649002, "learning_rate": 5.413236757427343e-06, "loss": 2.5591070556640627, "step": 1145800 }, { "epoch": 1.3826813139873828, "learning_rate": 5.412832921959604e-06, "loss": 2.5358404541015624, "step": 1145900 }, { "epoch": 1.3828019773098656, "learning_rate": 5.412429086491866e-06, "loss": 2.526722106933594, "step": 1146000 }, { "epoch": 1.3829226406323483, "learning_rate": 5.412025251024126e-06, "loss": 2.511173095703125, "step": 1146100 }, { "epoch": 1.3830433039548309, "learning_rate": 5.411621415556388e-06, "loss": 2.5481590270996093, "step": 1146200 }, { "epoch": 1.3831639672773135, "learning_rate": 5.41121758008865e-06, "loss": 2.545981140136719, "step": 1146300 }, { "epoch": 1.3832846305997963, "learning_rate": 5.410813744620912e-06, "loss": 2.525196990966797, "step": 1146400 }, { "epoch": 1.383405293922279, "learning_rate": 5.410409909153173e-06, "loss": 2.559201507568359, "step": 1146500 }, { "epoch": 1.3835259572447616, "learning_rate": 5.410006073685435e-06, "loss": 2.5289569091796875, "step": 1146600 }, { "epoch": 1.3836466205672444, "learning_rate": 5.409602238217697e-06, "loss": 2.526231231689453, "step": 1146700 }, { "epoch": 1.383767283889727, "learning_rate": 5.4091984027499585e-06, "loss": 2.536224670410156, "step": 1146800 }, { "epoch": 1.3838879472122096, "learning_rate": 5.40879456728222e-06, "loss": 2.52229736328125, "step": 1146900 }, { "epoch": 1.3840086105346923, "learning_rate": 5.408390731814482e-06, "loss": 2.515036315917969, "step": 1147000 }, { "epoch": 1.384129273857175, "learning_rate": 5.407986896346743e-06, "loss": 2.520436248779297, "step": 1147100 }, { "epoch": 1.3842499371796577, "learning_rate": 5.407583060879005e-06, "loss": 2.506478729248047, "step": 1147200 }, { "epoch": 1.3843706005021403, "learning_rate": 5.407179225411267e-06, "loss": 2.537923126220703, "step": 1147300 }, { "epoch": 1.3844912638246232, "learning_rate": 5.406775389943528e-06, "loss": 2.514120635986328, "step": 1147400 }, { "epoch": 1.3846119271471058, "learning_rate": 5.40637155447579e-06, "loss": 2.538255462646484, "step": 1147500 }, { "epoch": 1.3847325904695884, "learning_rate": 5.405967719008052e-06, "loss": 2.558655090332031, "step": 1147600 }, { "epoch": 1.384853253792071, "learning_rate": 5.405563883540312e-06, "loss": 2.533682403564453, "step": 1147700 }, { "epoch": 1.3849739171145539, "learning_rate": 5.405160048072574e-06, "loss": 2.5453860473632814, "step": 1147800 }, { "epoch": 1.3850945804370365, "learning_rate": 5.404756212604836e-06, "loss": 2.52238037109375, "step": 1147900 }, { "epoch": 1.3852152437595193, "learning_rate": 5.404352377137097e-06, "loss": 2.5367420959472655, "step": 1148000 }, { "epoch": 1.385335907082002, "learning_rate": 5.403948541669359e-06, "loss": 2.5412278747558594, "step": 1148100 }, { "epoch": 1.3854565704044846, "learning_rate": 5.403544706201621e-06, "loss": 2.5077024841308595, "step": 1148200 }, { "epoch": 1.3855772337269672, "learning_rate": 5.403140870733883e-06, "loss": 2.5063795471191406, "step": 1148300 }, { "epoch": 1.38569789704945, "learning_rate": 5.402737035266144e-06, "loss": 2.5242520141601563, "step": 1148400 }, { "epoch": 1.3858185603719326, "learning_rate": 5.402333199798406e-06, "loss": 2.535416717529297, "step": 1148500 }, { "epoch": 1.3859392236944152, "learning_rate": 5.4019293643306665e-06, "loss": 2.5348394775390624, "step": 1148600 }, { "epoch": 1.386059887016898, "learning_rate": 5.4015255288629285e-06, "loss": 2.5310186767578124, "step": 1148700 }, { "epoch": 1.3861805503393807, "learning_rate": 5.4011216933951905e-06, "loss": 2.5209614562988283, "step": 1148800 }, { "epoch": 1.3863012136618633, "learning_rate": 5.4007178579274525e-06, "loss": 2.5188616943359374, "step": 1148900 }, { "epoch": 1.386421876984346, "learning_rate": 5.400314022459714e-06, "loss": 2.5145919799804686, "step": 1149000 }, { "epoch": 1.3865425403068288, "learning_rate": 5.399910186991976e-06, "loss": 2.5039500427246093, "step": 1149100 }, { "epoch": 1.3866632036293114, "learning_rate": 5.399506351524238e-06, "loss": 2.5271942138671877, "step": 1149200 }, { "epoch": 1.3867838669517942, "learning_rate": 5.3991025160564996e-06, "loss": 2.520858154296875, "step": 1149300 }, { "epoch": 1.3869045302742768, "learning_rate": 5.39869868058876e-06, "loss": 2.526811370849609, "step": 1149400 }, { "epoch": 1.3870251935967595, "learning_rate": 5.398294845121022e-06, "loss": 2.5180397033691406, "step": 1149500 }, { "epoch": 1.387145856919242, "learning_rate": 5.397891009653283e-06, "loss": 2.5278610229492187, "step": 1149600 }, { "epoch": 1.3872665202417247, "learning_rate": 5.397487174185545e-06, "loss": 2.543345184326172, "step": 1149700 }, { "epoch": 1.3873871835642075, "learning_rate": 5.397083338717807e-06, "loss": 2.524442596435547, "step": 1149800 }, { "epoch": 1.3875078468866902, "learning_rate": 5.396679503250069e-06, "loss": 2.5227981567382813, "step": 1149900 }, { "epoch": 1.387628510209173, "learning_rate": 5.39627566778233e-06, "loss": 2.5310043334960937, "step": 1150000 }, { "epoch": 1.3877491735316556, "learning_rate": 5.395871832314592e-06, "loss": 2.517650909423828, "step": 1150100 }, { "epoch": 1.3878698368541382, "learning_rate": 5.395467996846852e-06, "loss": 2.524495086669922, "step": 1150200 }, { "epoch": 1.3879905001766208, "learning_rate": 5.395064161379114e-06, "loss": 2.5102299499511718, "step": 1150300 }, { "epoch": 1.3881111634991037, "learning_rate": 5.394660325911376e-06, "loss": 2.5394557189941405, "step": 1150400 }, { "epoch": 1.3882318268215863, "learning_rate": 5.394256490443638e-06, "loss": 2.5404037475585937, "step": 1150500 }, { "epoch": 1.388352490144069, "learning_rate": 5.393852654975899e-06, "loss": 2.525884094238281, "step": 1150600 }, { "epoch": 1.3884731534665518, "learning_rate": 5.393448819508161e-06, "loss": 2.5312400817871095, "step": 1150700 }, { "epoch": 1.3885938167890344, "learning_rate": 5.393044984040423e-06, "loss": 2.516312255859375, "step": 1150800 }, { "epoch": 1.388714480111517, "learning_rate": 5.3926411485726845e-06, "loss": 2.5113238525390624, "step": 1150900 }, { "epoch": 1.3888351434339996, "learning_rate": 5.392237313104946e-06, "loss": 2.5285166931152343, "step": 1151000 }, { "epoch": 1.3889558067564824, "learning_rate": 5.391833477637208e-06, "loss": 2.5104353332519533, "step": 1151100 }, { "epoch": 1.389076470078965, "learning_rate": 5.391429642169469e-06, "loss": 2.548168182373047, "step": 1151200 }, { "epoch": 1.389197133401448, "learning_rate": 5.391025806701731e-06, "loss": 2.524268798828125, "step": 1151300 }, { "epoch": 1.3893177967239305, "learning_rate": 5.390621971233993e-06, "loss": 2.525360870361328, "step": 1151400 }, { "epoch": 1.3894384600464131, "learning_rate": 5.390218135766254e-06, "loss": 2.529053192138672, "step": 1151500 }, { "epoch": 1.3895591233688958, "learning_rate": 5.389814300298516e-06, "loss": 2.514293975830078, "step": 1151600 }, { "epoch": 1.3896797866913786, "learning_rate": 5.389410464830778e-06, "loss": 2.5168475341796874, "step": 1151700 }, { "epoch": 1.3898004500138612, "learning_rate": 5.389006629363038e-06, "loss": 2.5484770202636717, "step": 1151800 }, { "epoch": 1.3899211133363438, "learning_rate": 5.3886027938953e-06, "loss": 2.5428106689453127, "step": 1151900 }, { "epoch": 1.3900417766588267, "learning_rate": 5.388198958427562e-06, "loss": 2.5350466918945314, "step": 1152000 }, { "epoch": 1.3901624399813093, "learning_rate": 5.387795122959823e-06, "loss": 2.540474853515625, "step": 1152100 }, { "epoch": 1.390283103303792, "learning_rate": 5.387391287492085e-06, "loss": 2.5336659240722654, "step": 1152200 }, { "epoch": 1.3904037666262745, "learning_rate": 5.386987452024347e-06, "loss": 2.5053668212890625, "step": 1152300 }, { "epoch": 1.3905244299487574, "learning_rate": 5.386583616556609e-06, "loss": 2.5222811889648438, "step": 1152400 }, { "epoch": 1.39064509327124, "learning_rate": 5.38617978108887e-06, "loss": 2.5426150512695314, "step": 1152500 }, { "epoch": 1.3907657565937226, "learning_rate": 5.3857759456211314e-06, "loss": 2.5417770385742187, "step": 1152600 }, { "epoch": 1.3908864199162054, "learning_rate": 5.3853721101533926e-06, "loss": 2.5155413818359373, "step": 1152700 }, { "epoch": 1.391007083238688, "learning_rate": 5.3849682746856545e-06, "loss": 2.5267010498046876, "step": 1152800 }, { "epoch": 1.3911277465611707, "learning_rate": 5.3845644392179165e-06, "loss": 2.53987548828125, "step": 1152900 }, { "epoch": 1.3912484098836533, "learning_rate": 5.3841606037501785e-06, "loss": 2.5038192749023436, "step": 1153000 }, { "epoch": 1.3913690732061361, "learning_rate": 5.38375676828244e-06, "loss": 2.5173573303222656, "step": 1153100 }, { "epoch": 1.3914897365286187, "learning_rate": 5.383352932814702e-06, "loss": 2.5479449462890624, "step": 1153200 }, { "epoch": 1.3916103998511016, "learning_rate": 5.382949097346964e-06, "loss": 2.5450289916992186, "step": 1153300 }, { "epoch": 1.3917310631735842, "learning_rate": 5.382545261879225e-06, "loss": 2.5209263610839843, "step": 1153400 }, { "epoch": 1.3918517264960668, "learning_rate": 5.382141426411486e-06, "loss": 2.532440185546875, "step": 1153500 }, { "epoch": 1.3919723898185494, "learning_rate": 5.381737590943748e-06, "loss": 2.5346116638183593, "step": 1153600 }, { "epoch": 1.3920930531410323, "learning_rate": 5.381333755476009e-06, "loss": 2.5527911376953125, "step": 1153700 }, { "epoch": 1.3922137164635149, "learning_rate": 5.380929920008271e-06, "loss": 2.5223353576660155, "step": 1153800 }, { "epoch": 1.3923343797859975, "learning_rate": 5.380526084540533e-06, "loss": 2.5422930908203125, "step": 1153900 }, { "epoch": 1.3924550431084803, "learning_rate": 5.380122249072794e-06, "loss": 2.536565704345703, "step": 1154000 }, { "epoch": 1.392575706430963, "learning_rate": 5.379718413605056e-06, "loss": 2.5293238830566405, "step": 1154100 }, { "epoch": 1.3926963697534456, "learning_rate": 5.379314578137318e-06, "loss": 2.517669982910156, "step": 1154200 }, { "epoch": 1.3928170330759282, "learning_rate": 5.378910742669578e-06, "loss": 2.5376908874511717, "step": 1154300 }, { "epoch": 1.392937696398411, "learning_rate": 5.37850690720184e-06, "loss": 2.519211730957031, "step": 1154400 }, { "epoch": 1.3930583597208936, "learning_rate": 5.378103071734102e-06, "loss": 2.515825653076172, "step": 1154500 }, { "epoch": 1.3931790230433765, "learning_rate": 5.3776992362663635e-06, "loss": 2.50259765625, "step": 1154600 }, { "epoch": 1.393299686365859, "learning_rate": 5.3772954007986254e-06, "loss": 2.540410614013672, "step": 1154700 }, { "epoch": 1.3934203496883417, "learning_rate": 5.376891565330887e-06, "loss": 2.5407919311523437, "step": 1154800 }, { "epoch": 1.3935410130108243, "learning_rate": 5.376487729863149e-06, "loss": 2.5305557250976562, "step": 1154900 }, { "epoch": 1.393661676333307, "learning_rate": 5.3760838943954105e-06, "loss": 2.548468017578125, "step": 1155000 }, { "epoch": 1.3937823396557898, "learning_rate": 5.375680058927672e-06, "loss": 2.522960357666016, "step": 1155100 }, { "epoch": 1.3939030029782724, "learning_rate": 5.375276223459933e-06, "loss": 2.501831817626953, "step": 1155200 }, { "epoch": 1.3940236663007552, "learning_rate": 5.374872387992195e-06, "loss": 2.5268960571289063, "step": 1155300 }, { "epoch": 1.3941443296232379, "learning_rate": 5.374468552524457e-06, "loss": 2.5192189025878906, "step": 1155400 }, { "epoch": 1.3942649929457205, "learning_rate": 5.374064717056719e-06, "loss": 2.529515380859375, "step": 1155500 }, { "epoch": 1.394385656268203, "learning_rate": 5.37366088158898e-06, "loss": 2.5204197692871095, "step": 1155600 }, { "epoch": 1.394506319590686, "learning_rate": 5.373257046121242e-06, "loss": 2.5188369750976562, "step": 1155700 }, { "epoch": 1.3946269829131686, "learning_rate": 5.372853210653504e-06, "loss": 2.525248718261719, "step": 1155800 }, { "epoch": 1.3947476462356512, "learning_rate": 5.372449375185764e-06, "loss": 2.526294860839844, "step": 1155900 }, { "epoch": 1.394868309558134, "learning_rate": 5.372045539718026e-06, "loss": 2.5375067138671876, "step": 1156000 }, { "epoch": 1.3949889728806166, "learning_rate": 5.371641704250288e-06, "loss": 2.5332675170898438, "step": 1156100 }, { "epoch": 1.3951096362030992, "learning_rate": 5.371237868782549e-06, "loss": 2.537090606689453, "step": 1156200 }, { "epoch": 1.3952302995255819, "learning_rate": 5.370834033314811e-06, "loss": 2.558913269042969, "step": 1156300 }, { "epoch": 1.3953509628480647, "learning_rate": 5.370430197847073e-06, "loss": 2.524530334472656, "step": 1156400 }, { "epoch": 1.3954716261705473, "learning_rate": 5.370026362379334e-06, "loss": 2.5485736083984376, "step": 1156500 }, { "epoch": 1.3955922894930302, "learning_rate": 5.369622526911596e-06, "loss": 2.513768768310547, "step": 1156600 }, { "epoch": 1.3957129528155128, "learning_rate": 5.3692186914438575e-06, "loss": 2.5433958435058592, "step": 1156700 }, { "epoch": 1.3958336161379954, "learning_rate": 5.368814855976119e-06, "loss": 2.5310513305664064, "step": 1156800 }, { "epoch": 1.395954279460478, "learning_rate": 5.368411020508381e-06, "loss": 2.5147918701171874, "step": 1156900 }, { "epoch": 1.3960749427829608, "learning_rate": 5.3680071850406426e-06, "loss": 2.5007318115234374, "step": 1157000 }, { "epoch": 1.3961956061054435, "learning_rate": 5.367603349572904e-06, "loss": 2.4964634704589845, "step": 1157100 }, { "epoch": 1.396316269427926, "learning_rate": 5.367199514105166e-06, "loss": 2.52902099609375, "step": 1157200 }, { "epoch": 1.396436932750409, "learning_rate": 5.366795678637428e-06, "loss": 2.5327960205078126, "step": 1157300 }, { "epoch": 1.3965575960728915, "learning_rate": 5.36639184316969e-06, "loss": 2.5491595458984375, "step": 1157400 }, { "epoch": 1.3966782593953742, "learning_rate": 5.36598800770195e-06, "loss": 2.5082083129882813, "step": 1157500 }, { "epoch": 1.3967989227178568, "learning_rate": 5.365584172234212e-06, "loss": 2.527851257324219, "step": 1157600 }, { "epoch": 1.3969195860403396, "learning_rate": 5.365180336766473e-06, "loss": 2.5149134826660156, "step": 1157700 }, { "epoch": 1.3970402493628222, "learning_rate": 5.364776501298735e-06, "loss": 2.5126251220703124, "step": 1157800 }, { "epoch": 1.3971609126853048, "learning_rate": 5.364372665830997e-06, "loss": 2.544752502441406, "step": 1157900 }, { "epoch": 1.3972815760077877, "learning_rate": 5.363968830363259e-06, "loss": 2.5350587463378904, "step": 1158000 }, { "epoch": 1.3974022393302703, "learning_rate": 5.36356499489552e-06, "loss": 2.5590748596191406, "step": 1158100 }, { "epoch": 1.397522902652753, "learning_rate": 5.363161159427782e-06, "loss": 2.5559420776367188, "step": 1158200 }, { "epoch": 1.3976435659752355, "learning_rate": 5.362757323960044e-06, "loss": 2.529595947265625, "step": 1158300 }, { "epoch": 1.3977642292977184, "learning_rate": 5.362353488492304e-06, "loss": 2.5079887390136717, "step": 1158400 }, { "epoch": 1.397884892620201, "learning_rate": 5.361949653024566e-06, "loss": 2.5299317932128904, "step": 1158500 }, { "epoch": 1.3980055559426838, "learning_rate": 5.361545817556828e-06, "loss": 2.512842102050781, "step": 1158600 }, { "epoch": 1.3981262192651664, "learning_rate": 5.3611419820890895e-06, "loss": 2.522920684814453, "step": 1158700 }, { "epoch": 1.398246882587649, "learning_rate": 5.3607381466213515e-06, "loss": 2.5416461181640626, "step": 1158800 }, { "epoch": 1.3983675459101317, "learning_rate": 5.3603343111536135e-06, "loss": 2.5171159362792968, "step": 1158900 }, { "epoch": 1.3984882092326145, "learning_rate": 5.359930475685875e-06, "loss": 2.5356214904785155, "step": 1159000 }, { "epoch": 1.3986088725550971, "learning_rate": 5.3595266402181366e-06, "loss": 2.553128204345703, "step": 1159100 }, { "epoch": 1.3987295358775798, "learning_rate": 5.359122804750398e-06, "loss": 2.5284690856933594, "step": 1159200 }, { "epoch": 1.3988501992000626, "learning_rate": 5.358718969282659e-06, "loss": 2.533741455078125, "step": 1159300 }, { "epoch": 1.3989708625225452, "learning_rate": 5.358315133814921e-06, "loss": 2.538132781982422, "step": 1159400 }, { "epoch": 1.3990915258450278, "learning_rate": 5.357911298347183e-06, "loss": 2.5424543762207032, "step": 1159500 }, { "epoch": 1.3992121891675104, "learning_rate": 5.357507462879444e-06, "loss": 2.530656433105469, "step": 1159600 }, { "epoch": 1.3993328524899933, "learning_rate": 5.357103627411706e-06, "loss": 2.5603302001953123, "step": 1159700 }, { "epoch": 1.399453515812476, "learning_rate": 5.356699791943968e-06, "loss": 2.5319927978515624, "step": 1159800 }, { "epoch": 1.3995741791349587, "learning_rate": 5.35629595647623e-06, "loss": 2.5034555053710936, "step": 1159900 }, { "epoch": 1.3996948424574414, "learning_rate": 5.35589212100849e-06, "loss": 2.514970550537109, "step": 1160000 }, { "epoch": 1.399815505779924, "learning_rate": 5.355488285540752e-06, "loss": 2.5374066162109377, "step": 1160100 }, { "epoch": 1.3999361691024066, "learning_rate": 5.355084450073013e-06, "loss": 2.5162548828125, "step": 1160200 }, { "epoch": 1.4000568324248892, "learning_rate": 5.354680614605275e-06, "loss": 2.5328367614746092, "step": 1160300 }, { "epoch": 1.400177495747372, "learning_rate": 5.354276779137537e-06, "loss": 2.5114682006835936, "step": 1160400 }, { "epoch": 1.4002981590698547, "learning_rate": 5.353872943669799e-06, "loss": 2.5257301330566406, "step": 1160500 }, { "epoch": 1.4004188223923375, "learning_rate": 5.35346910820206e-06, "loss": 2.517378845214844, "step": 1160600 }, { "epoch": 1.4005394857148201, "learning_rate": 5.353065272734322e-06, "loss": 2.526616973876953, "step": 1160700 }, { "epoch": 1.4006601490373027, "learning_rate": 5.352661437266583e-06, "loss": 2.501219482421875, "step": 1160800 }, { "epoch": 1.4007808123597854, "learning_rate": 5.352257601798845e-06, "loss": 2.525074768066406, "step": 1160900 }, { "epoch": 1.4009014756822682, "learning_rate": 5.351853766331107e-06, "loss": 2.527352752685547, "step": 1161000 }, { "epoch": 1.4010221390047508, "learning_rate": 5.351449930863369e-06, "loss": 2.522322540283203, "step": 1161100 }, { "epoch": 1.4011428023272334, "learning_rate": 5.35104609539563e-06, "loss": 2.5293170166015626, "step": 1161200 }, { "epoch": 1.4012634656497163, "learning_rate": 5.350642259927892e-06, "loss": 2.5101971435546875, "step": 1161300 }, { "epoch": 1.4013841289721989, "learning_rate": 5.350238424460154e-06, "loss": 2.5312689208984374, "step": 1161400 }, { "epoch": 1.4015047922946815, "learning_rate": 5.349834588992416e-06, "loss": 2.525313262939453, "step": 1161500 }, { "epoch": 1.4016254556171641, "learning_rate": 5.349430753524676e-06, "loss": 2.504325714111328, "step": 1161600 }, { "epoch": 1.401746118939647, "learning_rate": 5.349026918056938e-06, "loss": 2.527008361816406, "step": 1161700 }, { "epoch": 1.4018667822621296, "learning_rate": 5.348623082589199e-06, "loss": 2.5374960327148437, "step": 1161800 }, { "epoch": 1.4019874455846124, "learning_rate": 5.348219247121461e-06, "loss": 2.504452362060547, "step": 1161900 }, { "epoch": 1.402108108907095, "learning_rate": 5.347815411653723e-06, "loss": 2.5293487548828124, "step": 1162000 }, { "epoch": 1.4022287722295776, "learning_rate": 5.347411576185985e-06, "loss": 2.5311820983886717, "step": 1162100 }, { "epoch": 1.4023494355520603, "learning_rate": 5.347007740718246e-06, "loss": 2.5464816284179688, "step": 1162200 }, { "epoch": 1.402470098874543, "learning_rate": 5.346603905250508e-06, "loss": 2.5383920288085937, "step": 1162300 }, { "epoch": 1.4025907621970257, "learning_rate": 5.3462000697827684e-06, "loss": 2.518330383300781, "step": 1162400 }, { "epoch": 1.4027114255195083, "learning_rate": 5.34579623431503e-06, "loss": 2.5109617614746096, "step": 1162500 }, { "epoch": 1.4028320888419912, "learning_rate": 5.345392398847292e-06, "loss": 2.5294297790527343, "step": 1162600 }, { "epoch": 1.4029527521644738, "learning_rate": 5.3449885633795535e-06, "loss": 2.5041775512695312, "step": 1162700 }, { "epoch": 1.4030734154869564, "learning_rate": 5.3445847279118155e-06, "loss": 2.5252777099609376, "step": 1162800 }, { "epoch": 1.403194078809439, "learning_rate": 5.3441808924440775e-06, "loss": 2.5284730529785158, "step": 1162900 }, { "epoch": 1.4033147421319219, "learning_rate": 5.3437770569763395e-06, "loss": 2.5078106689453126, "step": 1163000 }, { "epoch": 1.4034354054544045, "learning_rate": 5.343373221508601e-06, "loss": 2.524599914550781, "step": 1163100 }, { "epoch": 1.403556068776887, "learning_rate": 5.342969386040862e-06, "loss": 2.519031829833984, "step": 1163200 }, { "epoch": 1.40367673209937, "learning_rate": 5.342565550573123e-06, "loss": 2.5417274475097655, "step": 1163300 }, { "epoch": 1.4037973954218526, "learning_rate": 5.342161715105385e-06, "loss": 2.5243467712402343, "step": 1163400 }, { "epoch": 1.4039180587443352, "learning_rate": 5.341757879637647e-06, "loss": 2.5327435302734376, "step": 1163500 }, { "epoch": 1.4040387220668178, "learning_rate": 5.341354044169909e-06, "loss": 2.548556365966797, "step": 1163600 }, { "epoch": 1.4041593853893006, "learning_rate": 5.34095020870217e-06, "loss": 2.5231605529785157, "step": 1163700 }, { "epoch": 1.4042800487117832, "learning_rate": 5.340546373234432e-06, "loss": 2.5467616271972657, "step": 1163800 }, { "epoch": 1.404400712034266, "learning_rate": 5.340142537766694e-06, "loss": 2.5349995422363283, "step": 1163900 }, { "epoch": 1.4045213753567487, "learning_rate": 5.339738702298956e-06, "loss": 2.5416165161132813, "step": 1164000 }, { "epoch": 1.4046420386792313, "learning_rate": 5.339334866831216e-06, "loss": 2.555613250732422, "step": 1164100 }, { "epoch": 1.404762702001714, "learning_rate": 5.338931031363478e-06, "loss": 2.5507179260253907, "step": 1164200 }, { "epoch": 1.4048833653241968, "learning_rate": 5.338527195895739e-06, "loss": 2.518742980957031, "step": 1164300 }, { "epoch": 1.4050040286466794, "learning_rate": 5.338123360428001e-06, "loss": 2.5378271484375, "step": 1164400 }, { "epoch": 1.405124691969162, "learning_rate": 5.337719524960263e-06, "loss": 2.5492860412597658, "step": 1164500 }, { "epoch": 1.4052453552916448, "learning_rate": 5.337315689492525e-06, "loss": 2.5339918518066407, "step": 1164600 }, { "epoch": 1.4053660186141275, "learning_rate": 5.336911854024786e-06, "loss": 2.5202320861816405, "step": 1164700 }, { "epoch": 1.40548668193661, "learning_rate": 5.336508018557048e-06, "loss": 2.536990051269531, "step": 1164800 }, { "epoch": 1.4056073452590927, "learning_rate": 5.336104183089309e-06, "loss": 2.5307986450195314, "step": 1164900 }, { "epoch": 1.4057280085815755, "learning_rate": 5.335700347621571e-06, "loss": 2.51799560546875, "step": 1165000 }, { "epoch": 1.4058486719040582, "learning_rate": 5.335296512153833e-06, "loss": 2.4824591064453125, "step": 1165100 }, { "epoch": 1.405969335226541, "learning_rate": 5.334892676686095e-06, "loss": 2.528423156738281, "step": 1165200 }, { "epoch": 1.4060899985490236, "learning_rate": 5.334488841218356e-06, "loss": 2.523019256591797, "step": 1165300 }, { "epoch": 1.4062106618715062, "learning_rate": 5.334085005750618e-06, "loss": 2.5061917114257812, "step": 1165400 }, { "epoch": 1.4063313251939888, "learning_rate": 5.33368117028288e-06, "loss": 2.5214743041992187, "step": 1165500 }, { "epoch": 1.4064519885164715, "learning_rate": 5.333277334815141e-06, "loss": 2.514373016357422, "step": 1165600 }, { "epoch": 1.4065726518389543, "learning_rate": 5.332873499347402e-06, "loss": 2.527446441650391, "step": 1165700 }, { "epoch": 1.406693315161437, "learning_rate": 5.332469663879664e-06, "loss": 2.5306793212890626, "step": 1165800 }, { "epoch": 1.4068139784839198, "learning_rate": 5.332065828411925e-06, "loss": 2.543943176269531, "step": 1165900 }, { "epoch": 1.4069346418064024, "learning_rate": 5.331661992944187e-06, "loss": 2.497627410888672, "step": 1166000 }, { "epoch": 1.407055305128885, "learning_rate": 5.331258157476449e-06, "loss": 2.5326826477050783, "step": 1166100 }, { "epoch": 1.4071759684513676, "learning_rate": 5.33085432200871e-06, "loss": 2.546064758300781, "step": 1166200 }, { "epoch": 1.4072966317738504, "learning_rate": 5.330450486540972e-06, "loss": 2.5347969055175783, "step": 1166300 }, { "epoch": 1.407417295096333, "learning_rate": 5.330046651073234e-06, "loss": 2.4998410034179686, "step": 1166400 }, { "epoch": 1.4075379584188157, "learning_rate": 5.3296428156054945e-06, "loss": 2.506375732421875, "step": 1166500 }, { "epoch": 1.4076586217412985, "learning_rate": 5.3292389801377565e-06, "loss": 2.5538101196289062, "step": 1166600 }, { "epoch": 1.4077792850637811, "learning_rate": 5.3288351446700184e-06, "loss": 2.539752655029297, "step": 1166700 }, { "epoch": 1.4078999483862638, "learning_rate": 5.3284313092022796e-06, "loss": 2.5409153747558593, "step": 1166800 }, { "epoch": 1.4080206117087464, "learning_rate": 5.3280274737345416e-06, "loss": 2.532998352050781, "step": 1166900 }, { "epoch": 1.4081412750312292, "learning_rate": 5.3276236382668035e-06, "loss": 2.522267608642578, "step": 1167000 }, { "epoch": 1.4082619383537118, "learning_rate": 5.3272198027990655e-06, "loss": 2.538083343505859, "step": 1167100 }, { "epoch": 1.4083826016761947, "learning_rate": 5.326815967331327e-06, "loss": 2.534817810058594, "step": 1167200 }, { "epoch": 1.4085032649986773, "learning_rate": 5.326412131863588e-06, "loss": 2.5263417053222654, "step": 1167300 }, { "epoch": 1.40862392832116, "learning_rate": 5.326008296395849e-06, "loss": 2.5242796325683594, "step": 1167400 }, { "epoch": 1.4087445916436425, "learning_rate": 5.325604460928111e-06, "loss": 2.520794677734375, "step": 1167500 }, { "epoch": 1.4088652549661254, "learning_rate": 5.325200625460373e-06, "loss": 2.5296324157714842, "step": 1167600 }, { "epoch": 1.408985918288608, "learning_rate": 5.324796789992635e-06, "loss": 2.5498541259765624, "step": 1167700 }, { "epoch": 1.4091065816110906, "learning_rate": 5.324392954524896e-06, "loss": 2.5320205688476562, "step": 1167800 }, { "epoch": 1.4092272449335734, "learning_rate": 5.323989119057158e-06, "loss": 2.4994305419921874, "step": 1167900 }, { "epoch": 1.409347908256056, "learning_rate": 5.32358528358942e-06, "loss": 2.5307270812988283, "step": 1168000 }, { "epoch": 1.4094685715785387, "learning_rate": 5.32318144812168e-06, "loss": 2.521178741455078, "step": 1168100 }, { "epoch": 1.4095892349010213, "learning_rate": 5.322777612653942e-06, "loss": 2.5218637084960935, "step": 1168200 }, { "epoch": 1.4097098982235041, "learning_rate": 5.322373777186204e-06, "loss": 2.5243072509765625, "step": 1168300 }, { "epoch": 1.4098305615459867, "learning_rate": 5.321969941718465e-06, "loss": 2.521416015625, "step": 1168400 }, { "epoch": 1.4099512248684694, "learning_rate": 5.321566106250727e-06, "loss": 2.509865417480469, "step": 1168500 }, { "epoch": 1.4100718881909522, "learning_rate": 5.321162270782989e-06, "loss": 2.5004331970214846, "step": 1168600 }, { "epoch": 1.4101925515134348, "learning_rate": 5.3207584353152505e-06, "loss": 2.5292984008789063, "step": 1168700 }, { "epoch": 1.4103132148359174, "learning_rate": 5.3203545998475124e-06, "loss": 2.530578308105469, "step": 1168800 }, { "epoch": 1.4104338781584, "learning_rate": 5.3199507643797744e-06, "loss": 2.507088317871094, "step": 1168900 }, { "epoch": 1.4105545414808829, "learning_rate": 5.319546928912035e-06, "loss": 2.533651580810547, "step": 1169000 }, { "epoch": 1.4106752048033655, "learning_rate": 5.319143093444297e-06, "loss": 2.5255030822753906, "step": 1169100 }, { "epoch": 1.4107958681258483, "learning_rate": 5.318739257976559e-06, "loss": 2.514783477783203, "step": 1169200 }, { "epoch": 1.410916531448331, "learning_rate": 5.31833542250882e-06, "loss": 2.5285873413085938, "step": 1169300 }, { "epoch": 1.4110371947708136, "learning_rate": 5.317931587041082e-06, "loss": 2.5338548278808593, "step": 1169400 }, { "epoch": 1.4111578580932962, "learning_rate": 5.317527751573344e-06, "loss": 2.521170349121094, "step": 1169500 }, { "epoch": 1.411278521415779, "learning_rate": 5.317123916105606e-06, "loss": 2.534537658691406, "step": 1169600 }, { "epoch": 1.4113991847382616, "learning_rate": 5.316720080637867e-06, "loss": 2.5158317565917967, "step": 1169700 }, { "epoch": 1.4115198480607443, "learning_rate": 5.316316245170128e-06, "loss": 2.541536560058594, "step": 1169800 }, { "epoch": 1.411640511383227, "learning_rate": 5.315912409702389e-06, "loss": 2.522380828857422, "step": 1169900 }, { "epoch": 1.4117611747057097, "learning_rate": 5.315508574234651e-06, "loss": 2.5299261474609374, "step": 1170000 }, { "epoch": 1.4118818380281923, "learning_rate": 5.315104738766913e-06, "loss": 2.5320588684082033, "step": 1170100 }, { "epoch": 1.412002501350675, "learning_rate": 5.314700903299175e-06, "loss": 2.559404296875, "step": 1170200 }, { "epoch": 1.4121231646731578, "learning_rate": 5.314297067831436e-06, "loss": 2.5230703735351563, "step": 1170300 }, { "epoch": 1.4122438279956404, "learning_rate": 5.313893232363698e-06, "loss": 2.5283079528808594, "step": 1170400 }, { "epoch": 1.4123644913181232, "learning_rate": 5.31348939689596e-06, "loss": 2.5464971923828124, "step": 1170500 }, { "epoch": 1.4124851546406059, "learning_rate": 5.3130855614282205e-06, "loss": 2.509877014160156, "step": 1170600 }, { "epoch": 1.4126058179630885, "learning_rate": 5.3126817259604825e-06, "loss": 2.55656494140625, "step": 1170700 }, { "epoch": 1.412726481285571, "learning_rate": 5.3122778904927445e-06, "loss": 2.516932373046875, "step": 1170800 }, { "epoch": 1.4128471446080537, "learning_rate": 5.311874055025006e-06, "loss": 2.5367945861816406, "step": 1170900 }, { "epoch": 1.4129678079305366, "learning_rate": 5.311470219557268e-06, "loss": 2.5154734802246095, "step": 1171000 }, { "epoch": 1.4130884712530192, "learning_rate": 5.3110663840895296e-06, "loss": 2.5442793273925783, "step": 1171100 }, { "epoch": 1.413209134575502, "learning_rate": 5.310662548621791e-06, "loss": 2.5405728149414064, "step": 1171200 }, { "epoch": 1.4133297978979846, "learning_rate": 5.310258713154053e-06, "loss": 2.5354786682128907, "step": 1171300 }, { "epoch": 1.4134504612204672, "learning_rate": 5.309854877686314e-06, "loss": 2.508446044921875, "step": 1171400 }, { "epoch": 1.4135711245429499, "learning_rate": 5.309451042218575e-06, "loss": 2.5253297424316408, "step": 1171500 }, { "epoch": 1.4136917878654327, "learning_rate": 5.309047206750837e-06, "loss": 2.519353332519531, "step": 1171600 }, { "epoch": 1.4138124511879153, "learning_rate": 5.308643371283099e-06, "loss": 2.5326625061035157, "step": 1171700 }, { "epoch": 1.413933114510398, "learning_rate": 5.30823953581536e-06, "loss": 2.537689514160156, "step": 1171800 }, { "epoch": 1.4140537778328808, "learning_rate": 5.307835700347622e-06, "loss": 2.5306640625, "step": 1171900 }, { "epoch": 1.4141744411553634, "learning_rate": 5.307431864879884e-06, "loss": 2.5064462280273436, "step": 1172000 }, { "epoch": 1.414295104477846, "learning_rate": 5.307028029412146e-06, "loss": 2.5550685119628906, "step": 1172100 }, { "epoch": 1.4144157678003286, "learning_rate": 5.306624193944406e-06, "loss": 2.540696868896484, "step": 1172200 }, { "epoch": 1.4145364311228115, "learning_rate": 5.306220358476668e-06, "loss": 2.535694274902344, "step": 1172300 }, { "epoch": 1.414657094445294, "learning_rate": 5.305816523008929e-06, "loss": 2.501470489501953, "step": 1172400 }, { "epoch": 1.414777757767777, "learning_rate": 5.305412687541191e-06, "loss": 2.536958770751953, "step": 1172500 }, { "epoch": 1.4148984210902595, "learning_rate": 5.305008852073453e-06, "loss": 2.543249053955078, "step": 1172600 }, { "epoch": 1.4150190844127422, "learning_rate": 5.304605016605715e-06, "loss": 2.5457803344726564, "step": 1172700 }, { "epoch": 1.4151397477352248, "learning_rate": 5.3042011811379765e-06, "loss": 2.5296952819824217, "step": 1172800 }, { "epoch": 1.4152604110577076, "learning_rate": 5.3037973456702385e-06, "loss": 2.5137675476074217, "step": 1172900 }, { "epoch": 1.4153810743801902, "learning_rate": 5.303393510202499e-06, "loss": 2.5406423950195314, "step": 1173000 }, { "epoch": 1.4155017377026728, "learning_rate": 5.302989674734761e-06, "loss": 2.5111117553710938, "step": 1173100 }, { "epoch": 1.4156224010251557, "learning_rate": 5.302585839267023e-06, "loss": 2.5053753662109375, "step": 1173200 }, { "epoch": 1.4157430643476383, "learning_rate": 5.302182003799285e-06, "loss": 2.5099421691894532, "step": 1173300 }, { "epoch": 1.415863727670121, "learning_rate": 5.301778168331546e-06, "loss": 2.5102908325195314, "step": 1173400 }, { "epoch": 1.4159843909926035, "learning_rate": 5.301374332863808e-06, "loss": 2.521959075927734, "step": 1173500 }, { "epoch": 1.4161050543150864, "learning_rate": 5.30097049739607e-06, "loss": 2.5302801513671875, "step": 1173600 }, { "epoch": 1.416225717637569, "learning_rate": 5.300566661928331e-06, "loss": 2.5039552307128905, "step": 1173700 }, { "epoch": 1.4163463809600516, "learning_rate": 5.300162826460593e-06, "loss": 2.543558807373047, "step": 1173800 }, { "epoch": 1.4164670442825344, "learning_rate": 5.299758990992854e-06, "loss": 2.505576324462891, "step": 1173900 }, { "epoch": 1.416587707605017, "learning_rate": 5.299355155525115e-06, "loss": 2.5199949645996096, "step": 1174000 }, { "epoch": 1.4167083709274997, "learning_rate": 5.298951320057377e-06, "loss": 2.5271839904785156, "step": 1174100 }, { "epoch": 1.4168290342499823, "learning_rate": 5.298547484589639e-06, "loss": 2.508608856201172, "step": 1174200 }, { "epoch": 1.4169496975724651, "learning_rate": 5.2981436491219e-06, "loss": 2.535255126953125, "step": 1174300 }, { "epoch": 1.4170703608949478, "learning_rate": 5.297739813654162e-06, "loss": 2.5217626953125, "step": 1174400 }, { "epoch": 1.4171910242174306, "learning_rate": 5.297335978186424e-06, "loss": 2.524913024902344, "step": 1174500 }, { "epoch": 1.4173116875399132, "learning_rate": 5.296932142718686e-06, "loss": 2.5258953857421873, "step": 1174600 }, { "epoch": 1.4174323508623958, "learning_rate": 5.2965283072509465e-06, "loss": 2.518159942626953, "step": 1174700 }, { "epoch": 1.4175530141848784, "learning_rate": 5.2961244717832085e-06, "loss": 2.519479064941406, "step": 1174800 }, { "epoch": 1.4176736775073613, "learning_rate": 5.29572063631547e-06, "loss": 2.5236888122558594, "step": 1174900 }, { "epoch": 1.417794340829844, "learning_rate": 5.295316800847732e-06, "loss": 2.5191413879394533, "step": 1175000 }, { "epoch": 1.4179150041523265, "learning_rate": 5.294912965379994e-06, "loss": 2.5005584716796876, "step": 1175100 }, { "epoch": 1.4180356674748094, "learning_rate": 5.294509129912256e-06, "loss": 2.5301025390625, "step": 1175200 }, { "epoch": 1.418156330797292, "learning_rate": 5.294105294444517e-06, "loss": 2.5259991455078126, "step": 1175300 }, { "epoch": 1.4182769941197746, "learning_rate": 5.293701458976779e-06, "loss": 2.5405296325683593, "step": 1175400 }, { "epoch": 1.4183976574422572, "learning_rate": 5.293297623509039e-06, "loss": 2.523783874511719, "step": 1175500 }, { "epoch": 1.41851832076474, "learning_rate": 5.292893788041301e-06, "loss": 2.5218270874023436, "step": 1175600 }, { "epoch": 1.4186389840872227, "learning_rate": 5.292489952573563e-06, "loss": 2.5293077087402343, "step": 1175700 }, { "epoch": 1.4187596474097055, "learning_rate": 5.292086117105825e-06, "loss": 2.5207342529296874, "step": 1175800 }, { "epoch": 1.4188803107321881, "learning_rate": 5.291682281638086e-06, "loss": 2.5407981872558594, "step": 1175900 }, { "epoch": 1.4190009740546707, "learning_rate": 5.291278446170348e-06, "loss": 2.511616058349609, "step": 1176000 }, { "epoch": 1.4191216373771534, "learning_rate": 5.29087461070261e-06, "loss": 2.5266380310058594, "step": 1176100 }, { "epoch": 1.419242300699636, "learning_rate": 5.290470775234872e-06, "loss": 2.525465545654297, "step": 1176200 }, { "epoch": 1.4193629640221188, "learning_rate": 5.290066939767132e-06, "loss": 2.5541586303710937, "step": 1176300 }, { "epoch": 1.4194836273446014, "learning_rate": 5.289663104299394e-06, "loss": 2.54840576171875, "step": 1176400 }, { "epoch": 1.4196042906670843, "learning_rate": 5.2892592688316554e-06, "loss": 2.546369934082031, "step": 1176500 }, { "epoch": 1.4197249539895669, "learning_rate": 5.2888554333639174e-06, "loss": 2.5057167053222655, "step": 1176600 }, { "epoch": 1.4198456173120495, "learning_rate": 5.288451597896179e-06, "loss": 2.507357635498047, "step": 1176700 }, { "epoch": 1.4199662806345321, "learning_rate": 5.288047762428441e-06, "loss": 2.5331056213378904, "step": 1176800 }, { "epoch": 1.420086943957015, "learning_rate": 5.2876439269607025e-06, "loss": 2.517766418457031, "step": 1176900 }, { "epoch": 1.4202076072794976, "learning_rate": 5.2872400914929645e-06, "loss": 2.5404248046875, "step": 1177000 }, { "epoch": 1.4203282706019802, "learning_rate": 5.286836256025225e-06, "loss": 2.52800048828125, "step": 1177100 }, { "epoch": 1.420448933924463, "learning_rate": 5.286432420557487e-06, "loss": 2.5342413330078126, "step": 1177200 }, { "epoch": 1.4205695972469456, "learning_rate": 5.286028585089749e-06, "loss": 2.5276341247558594, "step": 1177300 }, { "epoch": 1.4206902605694283, "learning_rate": 5.285624749622011e-06, "loss": 2.5067901611328125, "step": 1177400 }, { "epoch": 1.4208109238919109, "learning_rate": 5.285220914154272e-06, "loss": 2.502242126464844, "step": 1177500 }, { "epoch": 1.4209315872143937, "learning_rate": 5.284817078686534e-06, "loss": 2.5420289611816407, "step": 1177600 }, { "epoch": 1.4210522505368763, "learning_rate": 5.284413243218796e-06, "loss": 2.49966064453125, "step": 1177700 }, { "epoch": 1.4211729138593592, "learning_rate": 5.284009407751057e-06, "loss": 2.5150996398925782, "step": 1177800 }, { "epoch": 1.4212935771818418, "learning_rate": 5.283605572283318e-06, "loss": 2.5301731872558593, "step": 1177900 }, { "epoch": 1.4214142405043244, "learning_rate": 5.28320173681558e-06, "loss": 2.497679443359375, "step": 1178000 }, { "epoch": 1.421534903826807, "learning_rate": 5.282797901347841e-06, "loss": 2.509929351806641, "step": 1178100 }, { "epoch": 1.4216555671492899, "learning_rate": 5.282394065880103e-06, "loss": 2.539256744384766, "step": 1178200 }, { "epoch": 1.4217762304717725, "learning_rate": 5.281990230412365e-06, "loss": 2.5278584289550783, "step": 1178300 }, { "epoch": 1.421896893794255, "learning_rate": 5.281586394944626e-06, "loss": 2.524861602783203, "step": 1178400 }, { "epoch": 1.422017557116738, "learning_rate": 5.281182559476888e-06, "loss": 2.480113220214844, "step": 1178500 }, { "epoch": 1.4221382204392206, "learning_rate": 5.28077872400915e-06, "loss": 2.544309387207031, "step": 1178600 }, { "epoch": 1.4222588837617032, "learning_rate": 5.280374888541411e-06, "loss": 2.535814208984375, "step": 1178700 }, { "epoch": 1.4223795470841858, "learning_rate": 5.2799710530736726e-06, "loss": 2.5385902404785154, "step": 1178800 }, { "epoch": 1.4225002104066686, "learning_rate": 5.2795672176059346e-06, "loss": 2.532223968505859, "step": 1178900 }, { "epoch": 1.4226208737291512, "learning_rate": 5.279163382138196e-06, "loss": 2.5055055236816406, "step": 1179000 }, { "epoch": 1.4227415370516339, "learning_rate": 5.278759546670458e-06, "loss": 2.513731689453125, "step": 1179100 }, { "epoch": 1.4228622003741167, "learning_rate": 5.27835571120272e-06, "loss": 2.51498779296875, "step": 1179200 }, { "epoch": 1.4229828636965993, "learning_rate": 5.277951875734982e-06, "loss": 2.527681579589844, "step": 1179300 }, { "epoch": 1.423103527019082, "learning_rate": 5.277548040267243e-06, "loss": 2.5101751708984374, "step": 1179400 }, { "epoch": 1.4232241903415646, "learning_rate": 5.277144204799505e-06, "loss": 2.502488098144531, "step": 1179500 }, { "epoch": 1.4233448536640474, "learning_rate": 5.276740369331765e-06, "loss": 2.5214805603027344, "step": 1179600 }, { "epoch": 1.42346551698653, "learning_rate": 5.276336533864027e-06, "loss": 2.551748046875, "step": 1179700 }, { "epoch": 1.4235861803090128, "learning_rate": 5.275932698396289e-06, "loss": 2.5047723388671876, "step": 1179800 }, { "epoch": 1.4237068436314955, "learning_rate": 5.275528862928551e-06, "loss": 2.5215580749511717, "step": 1179900 }, { "epoch": 1.423827506953978, "learning_rate": 5.275125027460812e-06, "loss": 2.5310897827148438, "step": 1180000 }, { "epoch": 1.4239481702764607, "learning_rate": 5.274721191993074e-06, "loss": 2.509042053222656, "step": 1180100 }, { "epoch": 1.4240688335989435, "learning_rate": 5.274317356525336e-06, "loss": 2.518959503173828, "step": 1180200 }, { "epoch": 1.4241894969214262, "learning_rate": 5.273913521057597e-06, "loss": 2.5275245666503907, "step": 1180300 }, { "epoch": 1.4243101602439088, "learning_rate": 5.273509685589858e-06, "loss": 2.5281500244140624, "step": 1180400 }, { "epoch": 1.4244308235663916, "learning_rate": 5.27310585012212e-06, "loss": 2.529039306640625, "step": 1180500 }, { "epoch": 1.4245514868888742, "learning_rate": 5.2727020146543815e-06, "loss": 2.5048399353027344, "step": 1180600 }, { "epoch": 1.4246721502113568, "learning_rate": 5.2722981791866435e-06, "loss": 2.5271836853027345, "step": 1180700 }, { "epoch": 1.4247928135338395, "learning_rate": 5.2718943437189054e-06, "loss": 2.552171325683594, "step": 1180800 }, { "epoch": 1.4249134768563223, "learning_rate": 5.271490508251167e-06, "loss": 2.523907012939453, "step": 1180900 }, { "epoch": 1.425034140178805, "learning_rate": 5.2710866727834286e-06, "loss": 2.5101190185546876, "step": 1181000 }, { "epoch": 1.4251548035012878, "learning_rate": 5.2706828373156905e-06, "loss": 2.497663879394531, "step": 1181100 }, { "epoch": 1.4252754668237704, "learning_rate": 5.270279001847951e-06, "loss": 2.4954246520996093, "step": 1181200 }, { "epoch": 1.425396130146253, "learning_rate": 5.269875166380213e-06, "loss": 2.5303314208984373, "step": 1181300 }, { "epoch": 1.4255167934687356, "learning_rate": 5.269471330912475e-06, "loss": 2.538251953125, "step": 1181400 }, { "epoch": 1.4256374567912182, "learning_rate": 5.269067495444736e-06, "loss": 2.528745574951172, "step": 1181500 }, { "epoch": 1.425758120113701, "learning_rate": 5.268663659976998e-06, "loss": 2.514451141357422, "step": 1181600 }, { "epoch": 1.4258787834361837, "learning_rate": 5.26825982450926e-06, "loss": 2.511627655029297, "step": 1181700 }, { "epoch": 1.4259994467586665, "learning_rate": 5.267855989041522e-06, "loss": 2.5115321350097655, "step": 1181800 }, { "epoch": 1.4261201100811491, "learning_rate": 5.267452153573783e-06, "loss": 2.515756072998047, "step": 1181900 }, { "epoch": 1.4262407734036318, "learning_rate": 5.267048318106044e-06, "loss": 2.517303161621094, "step": 1182000 }, { "epoch": 1.4263614367261144, "learning_rate": 5.266644482638305e-06, "loss": 2.513849182128906, "step": 1182100 }, { "epoch": 1.4264821000485972, "learning_rate": 5.266240647170567e-06, "loss": 2.516558837890625, "step": 1182200 }, { "epoch": 1.4266027633710798, "learning_rate": 5.265836811702829e-06, "loss": 2.521468200683594, "step": 1182300 }, { "epoch": 1.4267234266935624, "learning_rate": 5.265432976235091e-06, "loss": 2.5201365661621096, "step": 1182400 }, { "epoch": 1.4268440900160453, "learning_rate": 5.265029140767352e-06, "loss": 2.5117031860351564, "step": 1182500 }, { "epoch": 1.426964753338528, "learning_rate": 5.264625305299614e-06, "loss": 2.504752349853516, "step": 1182600 }, { "epoch": 1.4270854166610105, "learning_rate": 5.264221469831876e-06, "loss": 2.52435546875, "step": 1182700 }, { "epoch": 1.4272060799834931, "learning_rate": 5.263817634364137e-06, "loss": 2.5029248046875, "step": 1182800 }, { "epoch": 1.427326743305976, "learning_rate": 5.263413798896399e-06, "loss": 2.5516253662109376, "step": 1182900 }, { "epoch": 1.4274474066284586, "learning_rate": 5.263009963428661e-06, "loss": 2.5366822814941408, "step": 1183000 }, { "epoch": 1.4275680699509414, "learning_rate": 5.262606127960922e-06, "loss": 2.565203857421875, "step": 1183100 }, { "epoch": 1.427688733273424, "learning_rate": 5.262202292493184e-06, "loss": 2.5041885375976562, "step": 1183200 }, { "epoch": 1.4278093965959067, "learning_rate": 5.261798457025446e-06, "loss": 2.5242350769042967, "step": 1183300 }, { "epoch": 1.4279300599183893, "learning_rate": 5.261394621557707e-06, "loss": 2.535106353759766, "step": 1183400 }, { "epoch": 1.4280507232408721, "learning_rate": 5.260990786089969e-06, "loss": 2.5230218505859376, "step": 1183500 }, { "epoch": 1.4281713865633547, "learning_rate": 5.26058695062223e-06, "loss": 2.5490704345703126, "step": 1183600 }, { "epoch": 1.4282920498858374, "learning_rate": 5.260183115154491e-06, "loss": 2.5148988342285157, "step": 1183700 }, { "epoch": 1.4284127132083202, "learning_rate": 5.259779279686753e-06, "loss": 2.520804901123047, "step": 1183800 }, { "epoch": 1.4285333765308028, "learning_rate": 5.259375444219015e-06, "loss": 2.5126226806640624, "step": 1183900 }, { "epoch": 1.4286540398532854, "learning_rate": 5.258971608751276e-06, "loss": 2.5404922485351564, "step": 1184000 }, { "epoch": 1.428774703175768, "learning_rate": 5.258567773283538e-06, "loss": 2.5202091979980468, "step": 1184100 }, { "epoch": 1.4288953664982509, "learning_rate": 5.2581639378158e-06, "loss": 2.490377655029297, "step": 1184200 }, { "epoch": 1.4290160298207335, "learning_rate": 5.257760102348062e-06, "loss": 2.498743438720703, "step": 1184300 }, { "epoch": 1.4291366931432163, "learning_rate": 5.257356266880323e-06, "loss": 2.5190382385253907, "step": 1184400 }, { "epoch": 1.429257356465699, "learning_rate": 5.256952431412584e-06, "loss": 2.5319972229003906, "step": 1184500 }, { "epoch": 1.4293780197881816, "learning_rate": 5.2565485959448455e-06, "loss": 2.518631591796875, "step": 1184600 }, { "epoch": 1.4294986831106642, "learning_rate": 5.2561447604771075e-06, "loss": 2.5322415161132814, "step": 1184700 }, { "epoch": 1.4296193464331468, "learning_rate": 5.2557409250093695e-06, "loss": 2.5306826782226564, "step": 1184800 }, { "epoch": 1.4297400097556296, "learning_rate": 5.2553370895416315e-06, "loss": 2.512464599609375, "step": 1184900 }, { "epoch": 1.4298606730781123, "learning_rate": 5.254933254073893e-06, "loss": 2.5313055419921877, "step": 1185000 }, { "epoch": 1.429981336400595, "learning_rate": 5.254529418606155e-06, "loss": 2.5221665954589843, "step": 1185100 }, { "epoch": 1.4301019997230777, "learning_rate": 5.254125583138417e-06, "loss": 2.5071699523925783, "step": 1185200 }, { "epoch": 1.4302226630455603, "learning_rate": 5.253721747670677e-06, "loss": 2.527986602783203, "step": 1185300 }, { "epoch": 1.430343326368043, "learning_rate": 5.253317912202939e-06, "loss": 2.5122004699707032, "step": 1185400 }, { "epoch": 1.4304639896905258, "learning_rate": 5.252914076735201e-06, "loss": 2.538983917236328, "step": 1185500 }, { "epoch": 1.4305846530130084, "learning_rate": 5.252510241267462e-06, "loss": 2.5173683166503906, "step": 1185600 }, { "epoch": 1.430705316335491, "learning_rate": 5.252106405799724e-06, "loss": 2.552755584716797, "step": 1185700 }, { "epoch": 1.4308259796579739, "learning_rate": 5.251702570331986e-06, "loss": 2.529195098876953, "step": 1185800 }, { "epoch": 1.4309466429804565, "learning_rate": 5.251298734864247e-06, "loss": 2.5218898010253907, "step": 1185900 }, { "epoch": 1.431067306302939, "learning_rate": 5.250894899396509e-06, "loss": 2.525093231201172, "step": 1186000 }, { "epoch": 1.4311879696254217, "learning_rate": 5.25049106392877e-06, "loss": 2.5383856201171877, "step": 1186100 }, { "epoch": 1.4313086329479046, "learning_rate": 5.250087228461031e-06, "loss": 2.5314039611816406, "step": 1186200 }, { "epoch": 1.4314292962703872, "learning_rate": 5.249683392993293e-06, "loss": 2.4924638366699217, "step": 1186300 }, { "epoch": 1.43154995959287, "learning_rate": 5.249279557525555e-06, "loss": 2.536219177246094, "step": 1186400 }, { "epoch": 1.4316706229153526, "learning_rate": 5.2488757220578164e-06, "loss": 2.5276788330078124, "step": 1186500 }, { "epoch": 1.4317912862378352, "learning_rate": 5.248471886590078e-06, "loss": 2.5296067810058593, "step": 1186600 }, { "epoch": 1.4319119495603179, "learning_rate": 5.24806805112234e-06, "loss": 2.517186279296875, "step": 1186700 }, { "epoch": 1.4320326128828005, "learning_rate": 5.247664215654602e-06, "loss": 2.5235728454589843, "step": 1186800 }, { "epoch": 1.4321532762052833, "learning_rate": 5.247260380186863e-06, "loss": 2.5346087646484374, "step": 1186900 }, { "epoch": 1.432273939527766, "learning_rate": 5.246856544719125e-06, "loss": 2.5227279663085938, "step": 1187000 }, { "epoch": 1.4323946028502488, "learning_rate": 5.246452709251386e-06, "loss": 2.519272918701172, "step": 1187100 }, { "epoch": 1.4325152661727314, "learning_rate": 5.246048873783648e-06, "loss": 2.513446960449219, "step": 1187200 }, { "epoch": 1.432635929495214, "learning_rate": 5.24564503831591e-06, "loss": 2.5123175048828124, "step": 1187300 }, { "epoch": 1.4327565928176966, "learning_rate": 5.245241202848172e-06, "loss": 2.5181674194335937, "step": 1187400 }, { "epoch": 1.4328772561401795, "learning_rate": 5.244837367380433e-06, "loss": 2.5282806396484374, "step": 1187500 }, { "epoch": 1.432997919462662, "learning_rate": 5.244433531912695e-06, "loss": 2.4888241577148436, "step": 1187600 }, { "epoch": 1.4331185827851447, "learning_rate": 5.244029696444955e-06, "loss": 2.5139111328125, "step": 1187700 }, { "epoch": 1.4332392461076275, "learning_rate": 5.243625860977217e-06, "loss": 2.5249339294433595, "step": 1187800 }, { "epoch": 1.4333599094301102, "learning_rate": 5.243222025509479e-06, "loss": 2.507424621582031, "step": 1187900 }, { "epoch": 1.4334805727525928, "learning_rate": 5.242818190041741e-06, "loss": 2.505626983642578, "step": 1188000 }, { "epoch": 1.4336012360750754, "learning_rate": 5.242414354574002e-06, "loss": 2.5139060974121095, "step": 1188100 }, { "epoch": 1.4337218993975582, "learning_rate": 5.242010519106264e-06, "loss": 2.5125198364257812, "step": 1188200 }, { "epoch": 1.4338425627200408, "learning_rate": 5.241606683638526e-06, "loss": 2.5062831115722655, "step": 1188300 }, { "epoch": 1.4339632260425237, "learning_rate": 5.241202848170787e-06, "loss": 2.5251246643066407, "step": 1188400 }, { "epoch": 1.4340838893650063, "learning_rate": 5.2407990127030485e-06, "loss": 2.5405316162109375, "step": 1188500 }, { "epoch": 1.434204552687489, "learning_rate": 5.2403951772353104e-06, "loss": 2.4922221374511717, "step": 1188600 }, { "epoch": 1.4343252160099715, "learning_rate": 5.2399913417675716e-06, "loss": 2.5183558654785156, "step": 1188700 }, { "epoch": 1.4344458793324544, "learning_rate": 5.2395875062998336e-06, "loss": 2.515214691162109, "step": 1188800 }, { "epoch": 1.434566542654937, "learning_rate": 5.2391836708320955e-06, "loss": 2.5064765930175783, "step": 1188900 }, { "epoch": 1.4346872059774196, "learning_rate": 5.238779835364357e-06, "loss": 2.5147283935546874, "step": 1189000 }, { "epoch": 1.4348078692999024, "learning_rate": 5.238375999896619e-06, "loss": 2.51111572265625, "step": 1189100 }, { "epoch": 1.434928532622385, "learning_rate": 5.237972164428881e-06, "loss": 2.532339782714844, "step": 1189200 }, { "epoch": 1.4350491959448677, "learning_rate": 5.237568328961143e-06, "loss": 2.5452557373046876, "step": 1189300 }, { "epoch": 1.4351698592673503, "learning_rate": 5.237164493493403e-06, "loss": 2.535574645996094, "step": 1189400 }, { "epoch": 1.4352905225898331, "learning_rate": 5.236760658025665e-06, "loss": 2.5082249450683594, "step": 1189500 }, { "epoch": 1.4354111859123158, "learning_rate": 5.236356822557926e-06, "loss": 2.5051364135742187, "step": 1189600 }, { "epoch": 1.4355318492347986, "learning_rate": 5.235952987090188e-06, "loss": 2.5193327331542967, "step": 1189700 }, { "epoch": 1.4356525125572812, "learning_rate": 5.23554915162245e-06, "loss": 2.533246612548828, "step": 1189800 }, { "epoch": 1.4357731758797638, "learning_rate": 5.235145316154712e-06, "loss": 2.5396965026855467, "step": 1189900 }, { "epoch": 1.4358938392022464, "learning_rate": 5.234741480686973e-06, "loss": 2.508358154296875, "step": 1190000 }, { "epoch": 1.436014502524729, "learning_rate": 5.234337645219235e-06, "loss": 2.5252581787109376, "step": 1190100 }, { "epoch": 1.436135165847212, "learning_rate": 5.233933809751495e-06, "loss": 2.51241455078125, "step": 1190200 }, { "epoch": 1.4362558291696945, "learning_rate": 5.233529974283757e-06, "loss": 2.5246627807617186, "step": 1190300 }, { "epoch": 1.4363764924921774, "learning_rate": 5.233126138816019e-06, "loss": 2.523518524169922, "step": 1190400 }, { "epoch": 1.43649715581466, "learning_rate": 5.232722303348281e-06, "loss": 2.5173191833496094, "step": 1190500 }, { "epoch": 1.4366178191371426, "learning_rate": 5.2323184678805425e-06, "loss": 2.516549072265625, "step": 1190600 }, { "epoch": 1.4367384824596252, "learning_rate": 5.2319146324128044e-06, "loss": 2.523076477050781, "step": 1190700 }, { "epoch": 1.436859145782108, "learning_rate": 5.2315107969450664e-06, "loss": 2.518424377441406, "step": 1190800 }, { "epoch": 1.4369798091045907, "learning_rate": 5.231106961477328e-06, "loss": 2.5306346130371096, "step": 1190900 }, { "epoch": 1.4371004724270733, "learning_rate": 5.230703126009589e-06, "loss": 2.534179382324219, "step": 1191000 }, { "epoch": 1.4372211357495561, "learning_rate": 5.230299290541851e-06, "loss": 2.5444851684570313, "step": 1191100 }, { "epoch": 1.4373417990720387, "learning_rate": 5.229895455074112e-06, "loss": 2.516419677734375, "step": 1191200 }, { "epoch": 1.4374624623945214, "learning_rate": 5.229491619606374e-06, "loss": 2.528853302001953, "step": 1191300 }, { "epoch": 1.437583125717004, "learning_rate": 5.229087784138636e-06, "loss": 2.5317533874511717, "step": 1191400 }, { "epoch": 1.4377037890394868, "learning_rate": 5.228683948670898e-06, "loss": 2.5186932373046873, "step": 1191500 }, { "epoch": 1.4378244523619694, "learning_rate": 5.228280113203159e-06, "loss": 2.528907928466797, "step": 1191600 }, { "epoch": 1.4379451156844523, "learning_rate": 5.227876277735421e-06, "loss": 2.5317727661132814, "step": 1191700 }, { "epoch": 1.4380657790069349, "learning_rate": 5.227472442267681e-06, "loss": 2.5165318298339843, "step": 1191800 }, { "epoch": 1.4381864423294175, "learning_rate": 5.227068606799943e-06, "loss": 2.4890036010742187, "step": 1191900 }, { "epoch": 1.4383071056519001, "learning_rate": 5.226664771332205e-06, "loss": 2.524722137451172, "step": 1192000 }, { "epoch": 1.4384277689743827, "learning_rate": 5.226260935864467e-06, "loss": 2.5253208923339843, "step": 1192100 }, { "epoch": 1.4385484322968656, "learning_rate": 5.225857100396728e-06, "loss": 2.505312957763672, "step": 1192200 }, { "epoch": 1.4386690956193482, "learning_rate": 5.22545326492899e-06, "loss": 2.514775695800781, "step": 1192300 }, { "epoch": 1.438789758941831, "learning_rate": 5.225049429461252e-06, "loss": 2.5136781311035157, "step": 1192400 }, { "epoch": 1.4389104222643136, "learning_rate": 5.224645593993513e-06, "loss": 2.526367950439453, "step": 1192500 }, { "epoch": 1.4390310855867963, "learning_rate": 5.2242417585257745e-06, "loss": 2.5105220031738282, "step": 1192600 }, { "epoch": 1.4391517489092789, "learning_rate": 5.2238379230580365e-06, "loss": 2.4971743774414064, "step": 1192700 }, { "epoch": 1.4392724122317617, "learning_rate": 5.223434087590298e-06, "loss": 2.5240325927734375, "step": 1192800 }, { "epoch": 1.4393930755542443, "learning_rate": 5.22303025212256e-06, "loss": 2.5125328063964845, "step": 1192900 }, { "epoch": 1.439513738876727, "learning_rate": 5.2226264166548216e-06, "loss": 2.5212832641601564, "step": 1193000 }, { "epoch": 1.4396344021992098, "learning_rate": 5.222222581187083e-06, "loss": 2.510792236328125, "step": 1193100 }, { "epoch": 1.4397550655216924, "learning_rate": 5.221818745719345e-06, "loss": 2.479328460693359, "step": 1193200 }, { "epoch": 1.439875728844175, "learning_rate": 5.221414910251607e-06, "loss": 2.5101918029785155, "step": 1193300 }, { "epoch": 1.4399963921666576, "learning_rate": 5.221011074783867e-06, "loss": 2.5160589599609375, "step": 1193400 }, { "epoch": 1.4401170554891405, "learning_rate": 5.220607239316129e-06, "loss": 2.507454681396484, "step": 1193500 }, { "epoch": 1.440237718811623, "learning_rate": 5.220203403848391e-06, "loss": 2.509287872314453, "step": 1193600 }, { "epoch": 1.440358382134106, "learning_rate": 5.219799568380652e-06, "loss": 2.5202265930175782, "step": 1193700 }, { "epoch": 1.4404790454565886, "learning_rate": 5.219395732912914e-06, "loss": 2.525673675537109, "step": 1193800 }, { "epoch": 1.4405997087790712, "learning_rate": 5.218991897445176e-06, "loss": 2.530961151123047, "step": 1193900 }, { "epoch": 1.4407203721015538, "learning_rate": 5.218588061977438e-06, "loss": 2.5242579650878905, "step": 1194000 }, { "epoch": 1.4408410354240366, "learning_rate": 5.218184226509699e-06, "loss": 2.486059112548828, "step": 1194100 }, { "epoch": 1.4409616987465192, "learning_rate": 5.217780391041961e-06, "loss": 2.536277160644531, "step": 1194200 }, { "epoch": 1.4410823620690019, "learning_rate": 5.217376555574221e-06, "loss": 2.5148846435546877, "step": 1194300 }, { "epoch": 1.4412030253914847, "learning_rate": 5.216972720106483e-06, "loss": 2.5185835266113283, "step": 1194400 }, { "epoch": 1.4413236887139673, "learning_rate": 5.216568884638745e-06, "loss": 2.5191632080078126, "step": 1194500 }, { "epoch": 1.44144435203645, "learning_rate": 5.216165049171007e-06, "loss": 2.5047372436523436, "step": 1194600 }, { "epoch": 1.4415650153589326, "learning_rate": 5.2157612137032685e-06, "loss": 2.526259002685547, "step": 1194700 }, { "epoch": 1.4416856786814154, "learning_rate": 5.2153573782355305e-06, "loss": 2.519425048828125, "step": 1194800 }, { "epoch": 1.441806342003898, "learning_rate": 5.2149535427677925e-06, "loss": 2.529441070556641, "step": 1194900 }, { "epoch": 1.4419270053263809, "learning_rate": 5.214549707300054e-06, "loss": 2.5284193420410155, "step": 1195000 }, { "epoch": 1.4420476686488635, "learning_rate": 5.214145871832315e-06, "loss": 2.525818176269531, "step": 1195100 }, { "epoch": 1.442168331971346, "learning_rate": 5.213742036364577e-06, "loss": 2.495961151123047, "step": 1195200 }, { "epoch": 1.4422889952938287, "learning_rate": 5.213338200896838e-06, "loss": 2.5538490295410154, "step": 1195300 }, { "epoch": 1.4424096586163113, "learning_rate": 5.2129343654291e-06, "loss": 2.507427062988281, "step": 1195400 }, { "epoch": 1.4425303219387942, "learning_rate": 5.212530529961362e-06, "loss": 2.5080491638183595, "step": 1195500 }, { "epoch": 1.4426509852612768, "learning_rate": 5.212126694493623e-06, "loss": 2.5181280517578126, "step": 1195600 }, { "epoch": 1.4427716485837596, "learning_rate": 5.211722859025885e-06, "loss": 2.5350054931640624, "step": 1195700 }, { "epoch": 1.4428923119062422, "learning_rate": 5.211319023558147e-06, "loss": 2.504360809326172, "step": 1195800 }, { "epoch": 1.4430129752287248, "learning_rate": 5.210915188090407e-06, "loss": 2.5091680908203124, "step": 1195900 }, { "epoch": 1.4431336385512075, "learning_rate": 5.210511352622669e-06, "loss": 2.5447418212890627, "step": 1196000 }, { "epoch": 1.4432543018736903, "learning_rate": 5.210107517154931e-06, "loss": 2.533300323486328, "step": 1196100 }, { "epoch": 1.443374965196173, "learning_rate": 5.209703681687192e-06, "loss": 2.5360038757324217, "step": 1196200 }, { "epoch": 1.4434956285186555, "learning_rate": 5.209299846219454e-06, "loss": 2.522806854248047, "step": 1196300 }, { "epoch": 1.4436162918411384, "learning_rate": 5.208896010751716e-06, "loss": 2.5091925048828125, "step": 1196400 }, { "epoch": 1.443736955163621, "learning_rate": 5.208492175283978e-06, "loss": 2.5319508361816405, "step": 1196500 }, { "epoch": 1.4438576184861036, "learning_rate": 5.208088339816239e-06, "loss": 2.5220703125, "step": 1196600 }, { "epoch": 1.4439782818085862, "learning_rate": 5.2076845043485005e-06, "loss": 2.529867706298828, "step": 1196700 }, { "epoch": 1.444098945131069, "learning_rate": 5.207280668880762e-06, "loss": 2.514643096923828, "step": 1196800 }, { "epoch": 1.4442196084535517, "learning_rate": 5.206876833413024e-06, "loss": 2.510701904296875, "step": 1196900 }, { "epoch": 1.4443402717760345, "learning_rate": 5.206472997945286e-06, "loss": 2.50802490234375, "step": 1197000 }, { "epoch": 1.4444609350985171, "learning_rate": 5.206069162477548e-06, "loss": 2.4950006103515623, "step": 1197100 }, { "epoch": 1.4445815984209998, "learning_rate": 5.205665327009809e-06, "loss": 2.5193797302246095, "step": 1197200 }, { "epoch": 1.4447022617434824, "learning_rate": 5.205261491542071e-06, "loss": 2.540937805175781, "step": 1197300 }, { "epoch": 1.444822925065965, "learning_rate": 5.204857656074333e-06, "loss": 2.5470611572265627, "step": 1197400 }, { "epoch": 1.4449435883884478, "learning_rate": 5.204453820606593e-06, "loss": 2.5152882385253905, "step": 1197500 }, { "epoch": 1.4450642517109304, "learning_rate": 5.204049985138855e-06, "loss": 2.526672058105469, "step": 1197600 }, { "epoch": 1.4451849150334133, "learning_rate": 5.203646149671117e-06, "loss": 2.5112065124511718, "step": 1197700 }, { "epoch": 1.445305578355896, "learning_rate": 5.203242314203378e-06, "loss": 2.535656280517578, "step": 1197800 }, { "epoch": 1.4454262416783785, "learning_rate": 5.20283847873564e-06, "loss": 2.5271482849121094, "step": 1197900 }, { "epoch": 1.4455469050008611, "learning_rate": 5.202434643267902e-06, "loss": 2.513130340576172, "step": 1198000 }, { "epoch": 1.445667568323344, "learning_rate": 5.202030807800163e-06, "loss": 2.509256134033203, "step": 1198100 }, { "epoch": 1.4457882316458266, "learning_rate": 5.201626972332425e-06, "loss": 2.528433990478516, "step": 1198200 }, { "epoch": 1.4459088949683092, "learning_rate": 5.201223136864686e-06, "loss": 2.536367645263672, "step": 1198300 }, { "epoch": 1.446029558290792, "learning_rate": 5.2008193013969474e-06, "loss": 2.523226013183594, "step": 1198400 }, { "epoch": 1.4461502216132747, "learning_rate": 5.2004154659292094e-06, "loss": 2.520672607421875, "step": 1198500 }, { "epoch": 1.4462708849357573, "learning_rate": 5.200011630461471e-06, "loss": 2.5307615661621092, "step": 1198600 }, { "epoch": 1.44639154825824, "learning_rate": 5.1996077949937325e-06, "loss": 2.5072557067871095, "step": 1198700 }, { "epoch": 1.4465122115807227, "learning_rate": 5.1992039595259945e-06, "loss": 2.5211672973632813, "step": 1198800 }, { "epoch": 1.4466328749032054, "learning_rate": 5.1988001240582565e-06, "loss": 2.5063325500488283, "step": 1198900 }, { "epoch": 1.4467535382256882, "learning_rate": 5.1983962885905185e-06, "loss": 2.520632629394531, "step": 1199000 }, { "epoch": 1.4468742015481708, "learning_rate": 5.197992453122779e-06, "loss": 2.512787322998047, "step": 1199100 }, { "epoch": 1.4469948648706534, "learning_rate": 5.197588617655041e-06, "loss": 2.5062521362304686, "step": 1199200 }, { "epoch": 1.447115528193136, "learning_rate": 5.197184782187302e-06, "loss": 2.531629943847656, "step": 1199300 }, { "epoch": 1.4472361915156189, "learning_rate": 5.196780946719564e-06, "loss": 2.51687255859375, "step": 1199400 }, { "epoch": 1.4473568548381015, "learning_rate": 5.196377111251826e-06, "loss": 2.4846339416503906, "step": 1199500 }, { "epoch": 1.4474775181605841, "learning_rate": 5.195973275784088e-06, "loss": 2.5144526672363283, "step": 1199600 }, { "epoch": 1.447598181483067, "learning_rate": 5.195569440316349e-06, "loss": 2.538743743896484, "step": 1199700 }, { "epoch": 1.4477188448055496, "learning_rate": 5.195165604848611e-06, "loss": 2.5094529724121095, "step": 1199800 }, { "epoch": 1.4478395081280322, "learning_rate": 5.194761769380873e-06, "loss": 2.5028358459472657, "step": 1199900 }, { "epoch": 1.4479601714505148, "learning_rate": 5.194357933913133e-06, "loss": 2.5161358642578127, "step": 1200000 }, { "epoch": 1.4480808347729976, "learning_rate": 5.193954098445395e-06, "loss": 2.5075839233398436, "step": 1200100 }, { "epoch": 1.4482014980954803, "learning_rate": 5.193550262977657e-06, "loss": 2.530966491699219, "step": 1200200 }, { "epoch": 1.448322161417963, "learning_rate": 5.193146427509918e-06, "loss": 2.5082525634765624, "step": 1200300 }, { "epoch": 1.4484428247404457, "learning_rate": 5.19274259204218e-06, "loss": 2.51498291015625, "step": 1200400 }, { "epoch": 1.4485634880629283, "learning_rate": 5.192338756574442e-06, "loss": 2.5330262756347657, "step": 1200500 }, { "epoch": 1.448684151385411, "learning_rate": 5.1919349211067034e-06, "loss": 2.5419366455078123, "step": 1200600 }, { "epoch": 1.4488048147078936, "learning_rate": 5.191531085638965e-06, "loss": 2.521240539550781, "step": 1200700 }, { "epoch": 1.4489254780303764, "learning_rate": 5.1911272501712266e-06, "loss": 2.5266842651367187, "step": 1200800 }, { "epoch": 1.449046141352859, "learning_rate": 5.190723414703488e-06, "loss": 2.520174102783203, "step": 1200900 }, { "epoch": 1.4491668046753419, "learning_rate": 5.19031957923575e-06, "loss": 2.494157257080078, "step": 1201000 }, { "epoch": 1.4492874679978245, "learning_rate": 5.189915743768012e-06, "loss": 2.499616241455078, "step": 1201100 }, { "epoch": 1.449408131320307, "learning_rate": 5.189511908300273e-06, "loss": 2.512931671142578, "step": 1201200 }, { "epoch": 1.4495287946427897, "learning_rate": 5.189108072832535e-06, "loss": 2.51753173828125, "step": 1201300 }, { "epoch": 1.4496494579652726, "learning_rate": 5.188704237364797e-06, "loss": 2.496304931640625, "step": 1201400 }, { "epoch": 1.4497701212877552, "learning_rate": 5.188300401897059e-06, "loss": 2.4873695373535156, "step": 1201500 }, { "epoch": 1.4498907846102378, "learning_rate": 5.187896566429319e-06, "loss": 2.503267822265625, "step": 1201600 }, { "epoch": 1.4500114479327206, "learning_rate": 5.187492730961581e-06, "loss": 2.5383729553222656, "step": 1201700 }, { "epoch": 1.4501321112552032, "learning_rate": 5.187088895493842e-06, "loss": 2.5011251831054686, "step": 1201800 }, { "epoch": 1.4502527745776859, "learning_rate": 5.186685060026104e-06, "loss": 2.5101560974121093, "step": 1201900 }, { "epoch": 1.4503734379001685, "learning_rate": 5.186281224558366e-06, "loss": 2.482931823730469, "step": 1202000 }, { "epoch": 1.4504941012226513, "learning_rate": 5.185877389090628e-06, "loss": 2.491637725830078, "step": 1202100 }, { "epoch": 1.450614764545134, "learning_rate": 5.185473553622889e-06, "loss": 2.513232421875, "step": 1202200 }, { "epoch": 1.4507354278676168, "learning_rate": 5.185069718155151e-06, "loss": 2.5372891235351562, "step": 1202300 }, { "epoch": 1.4508560911900994, "learning_rate": 5.1846658826874115e-06, "loss": 2.537087097167969, "step": 1202400 }, { "epoch": 1.450976754512582, "learning_rate": 5.1842620472196735e-06, "loss": 2.5318475341796876, "step": 1202500 }, { "epoch": 1.4510974178350646, "learning_rate": 5.1838582117519355e-06, "loss": 2.511898651123047, "step": 1202600 }, { "epoch": 1.4512180811575475, "learning_rate": 5.1834543762841974e-06, "loss": 2.4908018493652344, "step": 1202700 }, { "epoch": 1.45133874448003, "learning_rate": 5.183050540816459e-06, "loss": 2.4919192504882814, "step": 1202800 }, { "epoch": 1.4514594078025127, "learning_rate": 5.1826467053487206e-06, "loss": 2.5306358337402344, "step": 1202900 }, { "epoch": 1.4515800711249955, "learning_rate": 5.1822428698809825e-06, "loss": 2.502747344970703, "step": 1203000 }, { "epoch": 1.4517007344474782, "learning_rate": 5.181839034413244e-06, "loss": 2.5040859985351562, "step": 1203100 }, { "epoch": 1.4518213977699608, "learning_rate": 5.181435198945505e-06, "loss": 2.5205438232421873, "step": 1203200 }, { "epoch": 1.4519420610924434, "learning_rate": 5.181031363477767e-06, "loss": 2.5176116943359377, "step": 1203300 }, { "epoch": 1.4520627244149262, "learning_rate": 5.180627528010028e-06, "loss": 2.4954856872558593, "step": 1203400 }, { "epoch": 1.4521833877374088, "learning_rate": 5.18022369254229e-06, "loss": 2.528822479248047, "step": 1203500 }, { "epoch": 1.4523040510598915, "learning_rate": 5.179819857074552e-06, "loss": 2.5194132995605467, "step": 1203600 }, { "epoch": 1.4524247143823743, "learning_rate": 5.179416021606813e-06, "loss": 2.5130326843261717, "step": 1203700 }, { "epoch": 1.452545377704857, "learning_rate": 5.179012186139075e-06, "loss": 2.534657287597656, "step": 1203800 }, { "epoch": 1.4526660410273395, "learning_rate": 5.178608350671337e-06, "loss": 2.517678680419922, "step": 1203900 }, { "epoch": 1.4527867043498222, "learning_rate": 5.178204515203597e-06, "loss": 2.5060520935058594, "step": 1204000 }, { "epoch": 1.452907367672305, "learning_rate": 5.177800679735859e-06, "loss": 2.4985975646972656, "step": 1204100 }, { "epoch": 1.4530280309947876, "learning_rate": 5.177396844268121e-06, "loss": 2.5389794921875, "step": 1204200 }, { "epoch": 1.4531486943172705, "learning_rate": 5.176993008800382e-06, "loss": 2.5280720520019533, "step": 1204300 }, { "epoch": 1.453269357639753, "learning_rate": 5.176589173332644e-06, "loss": 2.5130303955078124, "step": 1204400 }, { "epoch": 1.4533900209622357, "learning_rate": 5.176185337864906e-06, "loss": 2.524222564697266, "step": 1204500 }, { "epoch": 1.4535106842847183, "learning_rate": 5.175781502397168e-06, "loss": 2.5192576599121095, "step": 1204600 }, { "epoch": 1.4536313476072011, "learning_rate": 5.1753776669294295e-06, "loss": 2.5239466857910156, "step": 1204700 }, { "epoch": 1.4537520109296838, "learning_rate": 5.1749738314616915e-06, "loss": 2.5057557678222655, "step": 1204800 }, { "epoch": 1.4538726742521664, "learning_rate": 5.174569995993952e-06, "loss": 2.5040252685546873, "step": 1204900 }, { "epoch": 1.4539933375746492, "learning_rate": 5.174166160526214e-06, "loss": 2.512290191650391, "step": 1205000 }, { "epoch": 1.4541140008971318, "learning_rate": 5.173762325058476e-06, "loss": 2.5383128356933593, "step": 1205100 }, { "epoch": 1.4542346642196144, "learning_rate": 5.173358489590738e-06, "loss": 2.497091064453125, "step": 1205200 }, { "epoch": 1.454355327542097, "learning_rate": 5.172954654122999e-06, "loss": 2.497685546875, "step": 1205300 }, { "epoch": 1.45447599086458, "learning_rate": 5.172550818655261e-06, "loss": 2.5060916137695313, "step": 1205400 }, { "epoch": 1.4545966541870625, "learning_rate": 5.172146983187523e-06, "loss": 2.544850616455078, "step": 1205500 }, { "epoch": 1.4547173175095454, "learning_rate": 5.171743147719785e-06, "loss": 2.514679718017578, "step": 1205600 }, { "epoch": 1.454837980832028, "learning_rate": 5.171339312252045e-06, "loss": 2.5219882202148436, "step": 1205700 }, { "epoch": 1.4549586441545106, "learning_rate": 5.170935476784307e-06, "loss": 2.530722351074219, "step": 1205800 }, { "epoch": 1.4550793074769932, "learning_rate": 5.170531641316568e-06, "loss": 2.499063262939453, "step": 1205900 }, { "epoch": 1.4551999707994758, "learning_rate": 5.17012780584883e-06, "loss": 2.5107072448730468, "step": 1206000 }, { "epoch": 1.4553206341219587, "learning_rate": 5.169723970381092e-06, "loss": 2.5146240234375, "step": 1206100 }, { "epoch": 1.4554412974444413, "learning_rate": 5.169320134913354e-06, "loss": 2.5213967895507814, "step": 1206200 }, { "epoch": 1.4555619607669241, "learning_rate": 5.168916299445615e-06, "loss": 2.5153244018554686, "step": 1206300 }, { "epoch": 1.4556826240894067, "learning_rate": 5.168512463977877e-06, "loss": 2.535375061035156, "step": 1206400 }, { "epoch": 1.4558032874118894, "learning_rate": 5.1681086285101375e-06, "loss": 2.5199327087402343, "step": 1206500 }, { "epoch": 1.455923950734372, "learning_rate": 5.1677047930423995e-06, "loss": 2.4992494201660156, "step": 1206600 }, { "epoch": 1.4560446140568548, "learning_rate": 5.1673009575746615e-06, "loss": 2.5044898986816406, "step": 1206700 }, { "epoch": 1.4561652773793374, "learning_rate": 5.1668971221069235e-06, "loss": 2.514717559814453, "step": 1206800 }, { "epoch": 1.45628594070182, "learning_rate": 5.166493286639185e-06, "loss": 2.5060073852539064, "step": 1206900 }, { "epoch": 1.4564066040243029, "learning_rate": 5.166089451171447e-06, "loss": 2.519663543701172, "step": 1207000 }, { "epoch": 1.4565272673467855, "learning_rate": 5.165685615703709e-06, "loss": 2.5106797790527344, "step": 1207100 }, { "epoch": 1.4566479306692681, "learning_rate": 5.16528178023597e-06, "loss": 2.5200196838378908, "step": 1207200 }, { "epoch": 1.4567685939917507, "learning_rate": 5.164877944768231e-06, "loss": 2.5124777221679686, "step": 1207300 }, { "epoch": 1.4568892573142336, "learning_rate": 5.164474109300493e-06, "loss": 2.497633056640625, "step": 1207400 }, { "epoch": 1.4570099206367162, "learning_rate": 5.164070273832754e-06, "loss": 2.5003645324707033, "step": 1207500 }, { "epoch": 1.457130583959199, "learning_rate": 5.163666438365016e-06, "loss": 2.5106475830078123, "step": 1207600 }, { "epoch": 1.4572512472816816, "learning_rate": 5.163262602897278e-06, "loss": 2.5219630432128906, "step": 1207700 }, { "epoch": 1.4573719106041643, "learning_rate": 5.162858767429539e-06, "loss": 2.513583068847656, "step": 1207800 }, { "epoch": 1.4574925739266469, "learning_rate": 5.162454931961801e-06, "loss": 2.5399256896972657, "step": 1207900 }, { "epoch": 1.4576132372491297, "learning_rate": 5.162051096494063e-06, "loss": 2.521140441894531, "step": 1208000 }, { "epoch": 1.4577339005716123, "learning_rate": 5.161647261026323e-06, "loss": 2.5300897216796874, "step": 1208100 }, { "epoch": 1.457854563894095, "learning_rate": 5.161243425558585e-06, "loss": 2.516402587890625, "step": 1208200 }, { "epoch": 1.4579752272165778, "learning_rate": 5.160839590090847e-06, "loss": 2.523581085205078, "step": 1208300 }, { "epoch": 1.4580958905390604, "learning_rate": 5.160435754623108e-06, "loss": 2.512251892089844, "step": 1208400 }, { "epoch": 1.458216553861543, "learning_rate": 5.16003191915537e-06, "loss": 2.5247647094726564, "step": 1208500 }, { "epoch": 1.4583372171840256, "learning_rate": 5.159628083687632e-06, "loss": 2.497182159423828, "step": 1208600 }, { "epoch": 1.4584578805065085, "learning_rate": 5.159224248219894e-06, "loss": 2.488153991699219, "step": 1208700 }, { "epoch": 1.458578543828991, "learning_rate": 5.1588204127521555e-06, "loss": 2.4831451416015624, "step": 1208800 }, { "epoch": 1.4586992071514737, "learning_rate": 5.158416577284417e-06, "loss": 2.5211444091796875, "step": 1208900 }, { "epoch": 1.4588198704739566, "learning_rate": 5.158012741816678e-06, "loss": 2.5040000915527343, "step": 1209000 }, { "epoch": 1.4589405337964392, "learning_rate": 5.15760890634894e-06, "loss": 2.5097808837890625, "step": 1209100 }, { "epoch": 1.4590611971189218, "learning_rate": 5.157205070881202e-06, "loss": 2.527263946533203, "step": 1209200 }, { "epoch": 1.4591818604414044, "learning_rate": 5.156801235413464e-06, "loss": 2.5314891052246096, "step": 1209300 }, { "epoch": 1.4593025237638872, "learning_rate": 5.156397399945725e-06, "loss": 2.5144993591308595, "step": 1209400 }, { "epoch": 1.4594231870863699, "learning_rate": 5.155993564477987e-06, "loss": 2.5105191040039063, "step": 1209500 }, { "epoch": 1.4595438504088527, "learning_rate": 5.155589729010249e-06, "loss": 2.5011140441894533, "step": 1209600 }, { "epoch": 1.4596645137313353, "learning_rate": 5.15518589354251e-06, "loss": 2.5316900634765624, "step": 1209700 }, { "epoch": 1.459785177053818, "learning_rate": 5.154782058074771e-06, "loss": 2.5214683532714846, "step": 1209800 }, { "epoch": 1.4599058403763006, "learning_rate": 5.154378222607033e-06, "loss": 2.5210426330566404, "step": 1209900 }, { "epoch": 1.4600265036987834, "learning_rate": 5.153974387139294e-06, "loss": 2.5225978088378906, "step": 1210000 }, { "epoch": 1.460147167021266, "learning_rate": 5.153570551671556e-06, "loss": 2.517728576660156, "step": 1210100 }, { "epoch": 1.4602678303437486, "learning_rate": 5.153166716203818e-06, "loss": 2.4979704284667967, "step": 1210200 }, { "epoch": 1.4603884936662315, "learning_rate": 5.152762880736079e-06, "loss": 2.5374636840820313, "step": 1210300 }, { "epoch": 1.460509156988714, "learning_rate": 5.152359045268341e-06, "loss": 2.5173497009277344, "step": 1210400 }, { "epoch": 1.4606298203111967, "learning_rate": 5.151955209800603e-06, "loss": 2.530989227294922, "step": 1210500 }, { "epoch": 1.4607504836336793, "learning_rate": 5.1515513743328636e-06, "loss": 2.52003662109375, "step": 1210600 }, { "epoch": 1.4608711469561622, "learning_rate": 5.1511475388651255e-06, "loss": 2.529652862548828, "step": 1210700 }, { "epoch": 1.4609918102786448, "learning_rate": 5.1507437033973875e-06, "loss": 2.5127267456054687, "step": 1210800 }, { "epoch": 1.4611124736011276, "learning_rate": 5.150339867929649e-06, "loss": 2.5316123962402344, "step": 1210900 }, { "epoch": 1.4612331369236102, "learning_rate": 5.149936032461911e-06, "loss": 2.4850004577636717, "step": 1211000 }, { "epoch": 1.4613538002460928, "learning_rate": 5.149532196994173e-06, "loss": 2.520555419921875, "step": 1211100 }, { "epoch": 1.4614744635685755, "learning_rate": 5.149128361526435e-06, "loss": 2.490012969970703, "step": 1211200 }, { "epoch": 1.461595126891058, "learning_rate": 5.148724526058696e-06, "loss": 2.5086984252929687, "step": 1211300 }, { "epoch": 1.461715790213541, "learning_rate": 5.148320690590957e-06, "loss": 2.51083984375, "step": 1211400 }, { "epoch": 1.4618364535360235, "learning_rate": 5.147916855123218e-06, "loss": 2.5364830017089846, "step": 1211500 }, { "epoch": 1.4619571168585064, "learning_rate": 5.14751301965548e-06, "loss": 2.5092477416992187, "step": 1211600 }, { "epoch": 1.462077780180989, "learning_rate": 5.147109184187742e-06, "loss": 2.5168267822265626, "step": 1211700 }, { "epoch": 1.4621984435034716, "learning_rate": 5.146705348720004e-06, "loss": 2.5163925170898436, "step": 1211800 }, { "epoch": 1.4623191068259542, "learning_rate": 5.146301513252265e-06, "loss": 2.5135226440429688, "step": 1211900 }, { "epoch": 1.462439770148437, "learning_rate": 5.145897677784527e-06, "loss": 2.5085934448242186, "step": 1212000 }, { "epoch": 1.4625604334709197, "learning_rate": 5.145493842316789e-06, "loss": 2.4988722229003906, "step": 1212100 }, { "epoch": 1.4626810967934023, "learning_rate": 5.145090006849049e-06, "loss": 2.5151759338378907, "step": 1212200 }, { "epoch": 1.4628017601158851, "learning_rate": 5.144686171381311e-06, "loss": 2.520643615722656, "step": 1212300 }, { "epoch": 1.4629224234383678, "learning_rate": 5.144282335913573e-06, "loss": 2.501903839111328, "step": 1212400 }, { "epoch": 1.4630430867608504, "learning_rate": 5.1438785004458345e-06, "loss": 2.534810333251953, "step": 1212500 }, { "epoch": 1.463163750083333, "learning_rate": 5.1434746649780964e-06, "loss": 2.518227386474609, "step": 1212600 }, { "epoch": 1.4632844134058158, "learning_rate": 5.143070829510358e-06, "loss": 2.534706268310547, "step": 1212700 }, { "epoch": 1.4634050767282984, "learning_rate": 5.1426669940426196e-06, "loss": 2.5122134399414064, "step": 1212800 }, { "epoch": 1.4635257400507813, "learning_rate": 5.1422631585748815e-06, "loss": 2.5008580017089845, "step": 1212900 }, { "epoch": 1.463646403373264, "learning_rate": 5.141859323107143e-06, "loss": 2.479510498046875, "step": 1213000 }, { "epoch": 1.4637670666957465, "learning_rate": 5.141455487639404e-06, "loss": 2.5129989624023437, "step": 1213100 }, { "epoch": 1.4638877300182291, "learning_rate": 5.141051652171666e-06, "loss": 2.502744140625, "step": 1213200 }, { "epoch": 1.464008393340712, "learning_rate": 5.140647816703928e-06, "loss": 2.502563934326172, "step": 1213300 }, { "epoch": 1.4641290566631946, "learning_rate": 5.140243981236189e-06, "loss": 2.5332655334472656, "step": 1213400 }, { "epoch": 1.4642497199856772, "learning_rate": 5.139840145768451e-06, "loss": 2.513109588623047, "step": 1213500 }, { "epoch": 1.46437038330816, "learning_rate": 5.139436310300713e-06, "loss": 2.5085710144042968, "step": 1213600 }, { "epoch": 1.4644910466306427, "learning_rate": 5.139032474832975e-06, "loss": 2.5255035400390624, "step": 1213700 }, { "epoch": 1.4646117099531253, "learning_rate": 5.138628639365235e-06, "loss": 2.518119049072266, "step": 1213800 }, { "epoch": 1.464732373275608, "learning_rate": 5.138224803897497e-06, "loss": 2.518134765625, "step": 1213900 }, { "epoch": 1.4648530365980907, "learning_rate": 5.137820968429758e-06, "loss": 2.5108023071289063, "step": 1214000 }, { "epoch": 1.4649736999205734, "learning_rate": 5.13741713296202e-06, "loss": 2.5060684204101564, "step": 1214100 }, { "epoch": 1.465094363243056, "learning_rate": 5.137013297494282e-06, "loss": 2.4858744812011717, "step": 1214200 }, { "epoch": 1.4652150265655388, "learning_rate": 5.136609462026544e-06, "loss": 2.502616424560547, "step": 1214300 }, { "epoch": 1.4653356898880214, "learning_rate": 5.136205626558805e-06, "loss": 2.508589019775391, "step": 1214400 }, { "epoch": 1.465456353210504, "learning_rate": 5.135801791091067e-06, "loss": 2.508871765136719, "step": 1214500 }, { "epoch": 1.4655770165329867, "learning_rate": 5.135397955623328e-06, "loss": 2.5108998107910154, "step": 1214600 }, { "epoch": 1.4656976798554695, "learning_rate": 5.13499412015559e-06, "loss": 2.512197265625, "step": 1214700 }, { "epoch": 1.4658183431779521, "learning_rate": 5.134590284687852e-06, "loss": 2.516071624755859, "step": 1214800 }, { "epoch": 1.465939006500435, "learning_rate": 5.1341864492201136e-06, "loss": 2.5182762145996094, "step": 1214900 }, { "epoch": 1.4660596698229176, "learning_rate": 5.133782613752375e-06, "loss": 2.512656707763672, "step": 1215000 }, { "epoch": 1.4661803331454002, "learning_rate": 5.133378778284637e-06, "loss": 2.506121826171875, "step": 1215100 }, { "epoch": 1.4663009964678828, "learning_rate": 5.132974942816899e-06, "loss": 2.5115426635742186, "step": 1215200 }, { "epoch": 1.4664216597903657, "learning_rate": 5.13257110734916e-06, "loss": 2.5212641906738282, "step": 1215300 }, { "epoch": 1.4665423231128483, "learning_rate": 5.132167271881422e-06, "loss": 2.4980767822265624, "step": 1215400 }, { "epoch": 1.4666629864353309, "learning_rate": 5.131763436413683e-06, "loss": 2.501182098388672, "step": 1215500 }, { "epoch": 1.4667836497578137, "learning_rate": 5.131359600945944e-06, "loss": 2.506073760986328, "step": 1215600 }, { "epoch": 1.4669043130802963, "learning_rate": 5.130955765478206e-06, "loss": 2.5305329895019533, "step": 1215700 }, { "epoch": 1.467024976402779, "learning_rate": 5.130551930010468e-06, "loss": 2.5369279479980467, "step": 1215800 }, { "epoch": 1.4671456397252616, "learning_rate": 5.130148094542729e-06, "loss": 2.507620849609375, "step": 1215900 }, { "epoch": 1.4672663030477444, "learning_rate": 5.129744259074991e-06, "loss": 2.5046260070800783, "step": 1216000 }, { "epoch": 1.467386966370227, "learning_rate": 5.129340423607253e-06, "loss": 2.524696960449219, "step": 1216100 }, { "epoch": 1.4675076296927099, "learning_rate": 5.128936588139515e-06, "loss": 2.519131927490234, "step": 1216200 }, { "epoch": 1.4676282930151925, "learning_rate": 5.128532752671775e-06, "loss": 2.511677551269531, "step": 1216300 }, { "epoch": 1.467748956337675, "learning_rate": 5.128128917204037e-06, "loss": 2.5116929626464843, "step": 1216400 }, { "epoch": 1.4678696196601577, "learning_rate": 5.1277250817362985e-06, "loss": 2.48597412109375, "step": 1216500 }, { "epoch": 1.4679902829826403, "learning_rate": 5.1273212462685605e-06, "loss": 2.5214527893066405, "step": 1216600 }, { "epoch": 1.4681109463051232, "learning_rate": 5.1269174108008225e-06, "loss": 2.5295433044433593, "step": 1216700 }, { "epoch": 1.4682316096276058, "learning_rate": 5.1265135753330845e-06, "loss": 2.5203038024902344, "step": 1216800 }, { "epoch": 1.4683522729500886, "learning_rate": 5.126109739865346e-06, "loss": 2.513870849609375, "step": 1216900 }, { "epoch": 1.4684729362725712, "learning_rate": 5.1257059043976076e-06, "loss": 2.5091233825683594, "step": 1217000 }, { "epoch": 1.4685935995950539, "learning_rate": 5.125302068929868e-06, "loss": 2.5137152099609374, "step": 1217100 }, { "epoch": 1.4687142629175365, "learning_rate": 5.12489823346213e-06, "loss": 2.5327073669433595, "step": 1217200 }, { "epoch": 1.4688349262400193, "learning_rate": 5.124494397994392e-06, "loss": 2.519366455078125, "step": 1217300 }, { "epoch": 1.468955589562502, "learning_rate": 5.124090562526654e-06, "loss": 2.503278350830078, "step": 1217400 }, { "epoch": 1.4690762528849846, "learning_rate": 5.123686727058915e-06, "loss": 2.5213177490234373, "step": 1217500 }, { "epoch": 1.4691969162074674, "learning_rate": 5.123282891591177e-06, "loss": 2.5083021545410156, "step": 1217600 }, { "epoch": 1.46931757952995, "learning_rate": 5.122879056123439e-06, "loss": 2.5063630676269533, "step": 1217700 }, { "epoch": 1.4694382428524326, "learning_rate": 5.1224752206557e-06, "loss": 2.5306968688964844, "step": 1217800 }, { "epoch": 1.4695589061749152, "learning_rate": 5.122071385187961e-06, "loss": 2.5030757141113282, "step": 1217900 }, { "epoch": 1.469679569497398, "learning_rate": 5.121667549720223e-06, "loss": 2.5111961364746094, "step": 1218000 }, { "epoch": 1.4698002328198807, "learning_rate": 5.121263714252484e-06, "loss": 2.520974426269531, "step": 1218100 }, { "epoch": 1.4699208961423635, "learning_rate": 5.120859878784746e-06, "loss": 2.5002490234375, "step": 1218200 }, { "epoch": 1.4700415594648462, "learning_rate": 5.120456043317008e-06, "loss": 2.5193536376953123, "step": 1218300 }, { "epoch": 1.4701622227873288, "learning_rate": 5.120052207849269e-06, "loss": 2.5082568359375, "step": 1218400 }, { "epoch": 1.4702828861098114, "learning_rate": 5.119648372381531e-06, "loss": 2.5162335205078126, "step": 1218500 }, { "epoch": 1.4704035494322942, "learning_rate": 5.119244536913793e-06, "loss": 2.504585418701172, "step": 1218600 }, { "epoch": 1.4705242127547768, "learning_rate": 5.118840701446054e-06, "loss": 2.5277786254882812, "step": 1218700 }, { "epoch": 1.4706448760772595, "learning_rate": 5.118436865978316e-06, "loss": 2.529365997314453, "step": 1218800 }, { "epoch": 1.4707655393997423, "learning_rate": 5.118033030510578e-06, "loss": 2.5191641235351563, "step": 1218900 }, { "epoch": 1.470886202722225, "learning_rate": 5.117629195042839e-06, "loss": 2.5099887084960937, "step": 1219000 }, { "epoch": 1.4710068660447075, "learning_rate": 5.117225359575101e-06, "loss": 2.5102998352050783, "step": 1219100 }, { "epoch": 1.4711275293671902, "learning_rate": 5.116821524107363e-06, "loss": 2.480766143798828, "step": 1219200 }, { "epoch": 1.471248192689673, "learning_rate": 5.116417688639625e-06, "loss": 2.5045120239257814, "step": 1219300 }, { "epoch": 1.4713688560121556, "learning_rate": 5.116013853171886e-06, "loss": 2.512132568359375, "step": 1219400 }, { "epoch": 1.4714895193346382, "learning_rate": 5.115610017704147e-06, "loss": 2.5169422912597654, "step": 1219500 }, { "epoch": 1.471610182657121, "learning_rate": 5.115206182236408e-06, "loss": 2.503670196533203, "step": 1219600 }, { "epoch": 1.4717308459796037, "learning_rate": 5.11480234676867e-06, "loss": 2.483851318359375, "step": 1219700 }, { "epoch": 1.4718515093020863, "learning_rate": 5.114398511300932e-06, "loss": 2.513017272949219, "step": 1219800 }, { "epoch": 1.471972172624569, "learning_rate": 5.113994675833194e-06, "loss": 2.5199758911132815, "step": 1219900 }, { "epoch": 1.4720928359470518, "learning_rate": 5.113590840365455e-06, "loss": 2.5207261657714843, "step": 1220000 }, { "epoch": 1.4722134992695344, "learning_rate": 5.113187004897717e-06, "loss": 2.5247052001953123, "step": 1220100 }, { "epoch": 1.4723341625920172, "learning_rate": 5.112783169429979e-06, "loss": 2.5034053039550783, "step": 1220200 }, { "epoch": 1.4724548259144998, "learning_rate": 5.112379333962241e-06, "loss": 2.504244689941406, "step": 1220300 }, { "epoch": 1.4725754892369824, "learning_rate": 5.111975498494501e-06, "loss": 2.5043174743652346, "step": 1220400 }, { "epoch": 1.472696152559465, "learning_rate": 5.111571663026763e-06, "loss": 2.494320983886719, "step": 1220500 }, { "epoch": 1.472816815881948, "learning_rate": 5.1111678275590245e-06, "loss": 2.5179519653320312, "step": 1220600 }, { "epoch": 1.4729374792044305, "learning_rate": 5.1107639920912865e-06, "loss": 2.5282049560546875, "step": 1220700 }, { "epoch": 1.4730581425269131, "learning_rate": 5.1103601566235485e-06, "loss": 2.4935308837890626, "step": 1220800 }, { "epoch": 1.473178805849396, "learning_rate": 5.1099563211558105e-06, "loss": 2.4888771057128904, "step": 1220900 }, { "epoch": 1.4732994691718786, "learning_rate": 5.109552485688072e-06, "loss": 2.5108766174316406, "step": 1221000 }, { "epoch": 1.4734201324943612, "learning_rate": 5.109148650220334e-06, "loss": 2.528196258544922, "step": 1221100 }, { "epoch": 1.4735407958168438, "learning_rate": 5.108744814752594e-06, "loss": 2.510536346435547, "step": 1221200 }, { "epoch": 1.4736614591393267, "learning_rate": 5.108340979284856e-06, "loss": 2.5335646057128907, "step": 1221300 }, { "epoch": 1.4737821224618093, "learning_rate": 5.107937143817118e-06, "loss": 2.4973103332519533, "step": 1221400 }, { "epoch": 1.4739027857842921, "learning_rate": 5.10753330834938e-06, "loss": 2.4932461547851563, "step": 1221500 }, { "epoch": 1.4740234491067747, "learning_rate": 5.107129472881641e-06, "loss": 2.515633392333984, "step": 1221600 }, { "epoch": 1.4741441124292574, "learning_rate": 5.106725637413903e-06, "loss": 2.5004881286621092, "step": 1221700 }, { "epoch": 1.47426477575174, "learning_rate": 5.106321801946165e-06, "loss": 2.497386016845703, "step": 1221800 }, { "epoch": 1.4743854390742226, "learning_rate": 5.105917966478426e-06, "loss": 2.485274200439453, "step": 1221900 }, { "epoch": 1.4745061023967054, "learning_rate": 5.105514131010687e-06, "loss": 2.5173263549804688, "step": 1222000 }, { "epoch": 1.474626765719188, "learning_rate": 5.105110295542949e-06, "loss": 2.498865509033203, "step": 1222100 }, { "epoch": 1.4747474290416709, "learning_rate": 5.10470646007521e-06, "loss": 2.4987611389160156, "step": 1222200 }, { "epoch": 1.4748680923641535, "learning_rate": 5.104302624607472e-06, "loss": 2.51845947265625, "step": 1222300 }, { "epoch": 1.4749887556866361, "learning_rate": 5.103898789139734e-06, "loss": 2.484233703613281, "step": 1222400 }, { "epoch": 1.4751094190091187, "learning_rate": 5.1034949536719954e-06, "loss": 2.5125245666503906, "step": 1222500 }, { "epoch": 1.4752300823316016, "learning_rate": 5.103091118204257e-06, "loss": 2.5074996948242188, "step": 1222600 }, { "epoch": 1.4753507456540842, "learning_rate": 5.102687282736519e-06, "loss": 2.516853790283203, "step": 1222700 }, { "epoch": 1.4754714089765668, "learning_rate": 5.10228344726878e-06, "loss": 2.5137060546875, "step": 1222800 }, { "epoch": 1.4755920722990497, "learning_rate": 5.101879611801042e-06, "loss": 2.5256826782226565, "step": 1222900 }, { "epoch": 1.4757127356215323, "learning_rate": 5.101475776333304e-06, "loss": 2.523046875, "step": 1223000 }, { "epoch": 1.4758333989440149, "learning_rate": 5.101071940865565e-06, "loss": 2.4916677856445313, "step": 1223100 }, { "epoch": 1.4759540622664975, "learning_rate": 5.100668105397827e-06, "loss": 2.49484619140625, "step": 1223200 }, { "epoch": 1.4760747255889803, "learning_rate": 5.100264269930089e-06, "loss": 2.499745330810547, "step": 1223300 }, { "epoch": 1.476195388911463, "learning_rate": 5.099860434462351e-06, "loss": 2.496640625, "step": 1223400 }, { "epoch": 1.4763160522339458, "learning_rate": 5.099456598994612e-06, "loss": 2.5066346740722656, "step": 1223500 }, { "epoch": 1.4764367155564284, "learning_rate": 5.099052763526873e-06, "loss": 2.472238006591797, "step": 1223600 }, { "epoch": 1.476557378878911, "learning_rate": 5.098648928059134e-06, "loss": 2.5083102416992187, "step": 1223700 }, { "epoch": 1.4766780422013936, "learning_rate": 5.098245092591396e-06, "loss": 2.528791961669922, "step": 1223800 }, { "epoch": 1.4767987055238765, "learning_rate": 5.097841257123658e-06, "loss": 2.510968780517578, "step": 1223900 }, { "epoch": 1.476919368846359, "learning_rate": 5.09743742165592e-06, "loss": 2.5229656982421873, "step": 1224000 }, { "epoch": 1.4770400321688417, "learning_rate": 5.097033586188181e-06, "loss": 2.4792845153808596, "step": 1224100 }, { "epoch": 1.4771606954913246, "learning_rate": 5.096629750720443e-06, "loss": 2.50885986328125, "step": 1224200 }, { "epoch": 1.4772813588138072, "learning_rate": 5.096225915252705e-06, "loss": 2.523955535888672, "step": 1224300 }, { "epoch": 1.4774020221362898, "learning_rate": 5.0958220797849655e-06, "loss": 2.531979522705078, "step": 1224400 }, { "epoch": 1.4775226854587724, "learning_rate": 5.0954182443172275e-06, "loss": 2.5067124938964844, "step": 1224500 }, { "epoch": 1.4776433487812553, "learning_rate": 5.0950144088494894e-06, "loss": 2.511300506591797, "step": 1224600 }, { "epoch": 1.4777640121037379, "learning_rate": 5.0946105733817506e-06, "loss": 2.513871765136719, "step": 1224700 }, { "epoch": 1.4778846754262205, "learning_rate": 5.0942067379140126e-06, "loss": 2.4859768676757814, "step": 1224800 }, { "epoch": 1.4780053387487033, "learning_rate": 5.0938029024462745e-06, "loss": 2.495927276611328, "step": 1224900 }, { "epoch": 1.478126002071186, "learning_rate": 5.093399066978536e-06, "loss": 2.503600311279297, "step": 1225000 }, { "epoch": 1.4782466653936686, "learning_rate": 5.092995231510798e-06, "loss": 2.5155311584472657, "step": 1225100 }, { "epoch": 1.4783673287161512, "learning_rate": 5.09259139604306e-06, "loss": 2.495145263671875, "step": 1225200 }, { "epoch": 1.478487992038634, "learning_rate": 5.09218756057532e-06, "loss": 2.5112640380859377, "step": 1225300 }, { "epoch": 1.4786086553611166, "learning_rate": 5.091783725107582e-06, "loss": 2.5092402648925782, "step": 1225400 }, { "epoch": 1.4787293186835995, "learning_rate": 5.091379889639844e-06, "loss": 2.503142852783203, "step": 1225500 }, { "epoch": 1.478849982006082, "learning_rate": 5.090976054172105e-06, "loss": 2.4955999755859377, "step": 1225600 }, { "epoch": 1.4789706453285647, "learning_rate": 5.090572218704367e-06, "loss": 2.539633026123047, "step": 1225700 }, { "epoch": 1.4790913086510473, "learning_rate": 5.090168383236629e-06, "loss": 2.524288330078125, "step": 1225800 }, { "epoch": 1.4792119719735302, "learning_rate": 5.089764547768891e-06, "loss": 2.506470031738281, "step": 1225900 }, { "epoch": 1.4793326352960128, "learning_rate": 5.089360712301152e-06, "loss": 2.5009576416015626, "step": 1226000 }, { "epoch": 1.4794532986184954, "learning_rate": 5.088956876833413e-06, "loss": 2.5163253784179687, "step": 1226100 }, { "epoch": 1.4795739619409782, "learning_rate": 5.088553041365674e-06, "loss": 2.5016293334960937, "step": 1226200 }, { "epoch": 1.4796946252634608, "learning_rate": 5.088149205897936e-06, "loss": 2.5031715393066407, "step": 1226300 }, { "epoch": 1.4798152885859435, "learning_rate": 5.087745370430198e-06, "loss": 2.4962274169921876, "step": 1226400 }, { "epoch": 1.479935951908426, "learning_rate": 5.08734153496246e-06, "loss": 2.5024508666992187, "step": 1226500 }, { "epoch": 1.480056615230909, "learning_rate": 5.0869376994947215e-06, "loss": 2.492612762451172, "step": 1226600 }, { "epoch": 1.4801772785533915, "learning_rate": 5.0865338640269834e-06, "loss": 2.5136407470703124, "step": 1226700 }, { "epoch": 1.4802979418758744, "learning_rate": 5.0861300285592454e-06, "loss": 2.507638244628906, "step": 1226800 }, { "epoch": 1.480418605198357, "learning_rate": 5.085726193091506e-06, "loss": 2.5208786010742186, "step": 1226900 }, { "epoch": 1.4805392685208396, "learning_rate": 5.085322357623768e-06, "loss": 2.4790194702148436, "step": 1227000 }, { "epoch": 1.4806599318433222, "learning_rate": 5.08491852215603e-06, "loss": 2.5019302368164062, "step": 1227100 }, { "epoch": 1.4807805951658048, "learning_rate": 5.084514686688291e-06, "loss": 2.5131657409667967, "step": 1227200 }, { "epoch": 1.4809012584882877, "learning_rate": 5.084110851220553e-06, "loss": 2.4889060974121096, "step": 1227300 }, { "epoch": 1.4810219218107703, "learning_rate": 5.083707015752815e-06, "loss": 2.5026963806152343, "step": 1227400 }, { "epoch": 1.4811425851332531, "learning_rate": 5.083303180285076e-06, "loss": 2.5002378845214843, "step": 1227500 }, { "epoch": 1.4812632484557358, "learning_rate": 5.082899344817338e-06, "loss": 2.513252410888672, "step": 1227600 }, { "epoch": 1.4813839117782184, "learning_rate": 5.082495509349599e-06, "loss": 2.505531005859375, "step": 1227700 }, { "epoch": 1.481504575100701, "learning_rate": 5.08209167388186e-06, "loss": 2.5214138793945313, "step": 1227800 }, { "epoch": 1.4816252384231838, "learning_rate": 5.081687838414122e-06, "loss": 2.5047735595703124, "step": 1227900 }, { "epoch": 1.4817459017456664, "learning_rate": 5.081284002946384e-06, "loss": 2.5013504028320312, "step": 1228000 }, { "epoch": 1.481866565068149, "learning_rate": 5.080880167478645e-06, "loss": 2.5119464111328127, "step": 1228100 }, { "epoch": 1.481987228390632, "learning_rate": 5.080476332010907e-06, "loss": 2.4887345886230468, "step": 1228200 }, { "epoch": 1.4821078917131145, "learning_rate": 5.080072496543169e-06, "loss": 2.520163269042969, "step": 1228300 }, { "epoch": 1.4822285550355971, "learning_rate": 5.079668661075431e-06, "loss": 2.5074234008789062, "step": 1228400 }, { "epoch": 1.4823492183580798, "learning_rate": 5.0792648256076915e-06, "loss": 2.516098937988281, "step": 1228500 }, { "epoch": 1.4824698816805626, "learning_rate": 5.0788609901399535e-06, "loss": 2.5143911743164065, "step": 1228600 }, { "epoch": 1.4825905450030452, "learning_rate": 5.078457154672215e-06, "loss": 2.5081756591796873, "step": 1228700 }, { "epoch": 1.482711208325528, "learning_rate": 5.078053319204477e-06, "loss": 2.495474853515625, "step": 1228800 }, { "epoch": 1.4828318716480107, "learning_rate": 5.077649483736739e-06, "loss": 2.504680328369141, "step": 1228900 }, { "epoch": 1.4829525349704933, "learning_rate": 5.0772456482690006e-06, "loss": 2.5292999267578127, "step": 1229000 }, { "epoch": 1.483073198292976, "learning_rate": 5.076841812801262e-06, "loss": 2.5181292724609374, "step": 1229100 }, { "epoch": 1.4831938616154587, "learning_rate": 5.076437977333524e-06, "loss": 2.4993862915039062, "step": 1229200 }, { "epoch": 1.4833145249379414, "learning_rate": 5.076034141865784e-06, "loss": 2.5067477416992188, "step": 1229300 }, { "epoch": 1.483435188260424, "learning_rate": 5.075630306398046e-06, "loss": 2.5284080505371094, "step": 1229400 }, { "epoch": 1.4835558515829068, "learning_rate": 5.075226470930308e-06, "loss": 2.5317233276367186, "step": 1229500 }, { "epoch": 1.4836765149053894, "learning_rate": 5.07482263546257e-06, "loss": 2.520333709716797, "step": 1229600 }, { "epoch": 1.483797178227872, "learning_rate": 5.074418799994831e-06, "loss": 2.48560302734375, "step": 1229700 }, { "epoch": 1.4839178415503547, "learning_rate": 5.074014964527093e-06, "loss": 2.4945091247558593, "step": 1229800 }, { "epoch": 1.4840385048728375, "learning_rate": 5.073611129059355e-06, "loss": 2.516612091064453, "step": 1229900 }, { "epoch": 1.4841591681953201, "learning_rate": 5.073207293591616e-06, "loss": 2.498449249267578, "step": 1230000 }, { "epoch": 1.4842798315178027, "learning_rate": 5.072803458123877e-06, "loss": 2.5093031311035157, "step": 1230100 }, { "epoch": 1.4844004948402856, "learning_rate": 5.072399622656139e-06, "loss": 2.511419677734375, "step": 1230200 }, { "epoch": 1.4845211581627682, "learning_rate": 5.0719957871884e-06, "loss": 2.519235076904297, "step": 1230300 }, { "epoch": 1.4846418214852508, "learning_rate": 5.071591951720662e-06, "loss": 2.5127415466308594, "step": 1230400 }, { "epoch": 1.4847624848077334, "learning_rate": 5.071188116252924e-06, "loss": 2.4952952575683596, "step": 1230500 }, { "epoch": 1.4848831481302163, "learning_rate": 5.0707842807851855e-06, "loss": 2.4984344482421874, "step": 1230600 }, { "epoch": 1.4850038114526989, "learning_rate": 5.0703804453174475e-06, "loss": 2.5249986267089843, "step": 1230700 }, { "epoch": 1.4851244747751817, "learning_rate": 5.0699766098497095e-06, "loss": 2.5324212646484376, "step": 1230800 }, { "epoch": 1.4852451380976643, "learning_rate": 5.0695727743819715e-06, "loss": 2.4994656372070314, "step": 1230900 }, { "epoch": 1.485365801420147, "learning_rate": 5.069168938914232e-06, "loss": 2.5104295349121095, "step": 1231000 }, { "epoch": 1.4854864647426296, "learning_rate": 5.068765103446494e-06, "loss": 2.487687072753906, "step": 1231100 }, { "epoch": 1.4856071280651124, "learning_rate": 5.068361267978755e-06, "loss": 2.49460693359375, "step": 1231200 }, { "epoch": 1.485727791387595, "learning_rate": 5.067957432511017e-06, "loss": 2.499996795654297, "step": 1231300 }, { "epoch": 1.4858484547100776, "learning_rate": 5.067553597043279e-06, "loss": 2.5138140869140626, "step": 1231400 }, { "epoch": 1.4859691180325605, "learning_rate": 5.067149761575541e-06, "loss": 2.504788513183594, "step": 1231500 }, { "epoch": 1.486089781355043, "learning_rate": 5.066745926107802e-06, "loss": 2.4957034301757814, "step": 1231600 }, { "epoch": 1.4862104446775257, "learning_rate": 5.066342090640064e-06, "loss": 2.514872283935547, "step": 1231700 }, { "epoch": 1.4863311080000083, "learning_rate": 5.065938255172324e-06, "loss": 2.507959442138672, "step": 1231800 }, { "epoch": 1.4864517713224912, "learning_rate": 5.065534419704586e-06, "loss": 2.487789306640625, "step": 1231900 }, { "epoch": 1.4865724346449738, "learning_rate": 5.065130584236848e-06, "loss": 2.5112171936035157, "step": 1232000 }, { "epoch": 1.4866930979674566, "learning_rate": 5.06472674876911e-06, "loss": 2.5091734313964844, "step": 1232100 }, { "epoch": 1.4868137612899393, "learning_rate": 5.064322913301371e-06, "loss": 2.4988185119628907, "step": 1232200 }, { "epoch": 1.4869344246124219, "learning_rate": 5.063919077833633e-06, "loss": 2.4950767517089845, "step": 1232300 }, { "epoch": 1.4870550879349045, "learning_rate": 5.063515242365895e-06, "loss": 2.5324436950683595, "step": 1232400 }, { "epoch": 1.487175751257387, "learning_rate": 5.063111406898157e-06, "loss": 2.5270782470703126, "step": 1232500 }, { "epoch": 1.48729641457987, "learning_rate": 5.0627075714304175e-06, "loss": 2.478857421875, "step": 1232600 }, { "epoch": 1.4874170779023526, "learning_rate": 5.0623037359626795e-06, "loss": 2.4874867248535155, "step": 1232700 }, { "epoch": 1.4875377412248354, "learning_rate": 5.061899900494941e-06, "loss": 2.5047451782226564, "step": 1232800 }, { "epoch": 1.487658404547318, "learning_rate": 5.061496065027203e-06, "loss": 2.4920872497558593, "step": 1232900 }, { "epoch": 1.4877790678698006, "learning_rate": 5.061092229559465e-06, "loss": 2.516678466796875, "step": 1233000 }, { "epoch": 1.4878997311922832, "learning_rate": 5.060688394091727e-06, "loss": 2.534964599609375, "step": 1233100 }, { "epoch": 1.488020394514766, "learning_rate": 5.060284558623988e-06, "loss": 2.4930741882324217, "step": 1233200 }, { "epoch": 1.4881410578372487, "learning_rate": 5.05988072315625e-06, "loss": 2.5094786071777344, "step": 1233300 }, { "epoch": 1.4882617211597313, "learning_rate": 5.05947688768851e-06, "loss": 2.4979066467285156, "step": 1233400 }, { "epoch": 1.4883823844822142, "learning_rate": 5.059073052220772e-06, "loss": 2.523238220214844, "step": 1233500 }, { "epoch": 1.4885030478046968, "learning_rate": 5.058669216753034e-06, "loss": 2.5056251525878905, "step": 1233600 }, { "epoch": 1.4886237111271794, "learning_rate": 5.058265381285296e-06, "loss": 2.5083335876464843, "step": 1233700 }, { "epoch": 1.488744374449662, "learning_rate": 5.057861545817557e-06, "loss": 2.506604766845703, "step": 1233800 }, { "epoch": 1.4888650377721449, "learning_rate": 5.057457710349819e-06, "loss": 2.498243408203125, "step": 1233900 }, { "epoch": 1.4889857010946275, "learning_rate": 5.057053874882081e-06, "loss": 2.538086395263672, "step": 1234000 }, { "epoch": 1.4891063644171103, "learning_rate": 5.056650039414342e-06, "loss": 2.509546661376953, "step": 1234100 }, { "epoch": 1.489227027739593, "learning_rate": 5.056246203946603e-06, "loss": 2.504397430419922, "step": 1234200 }, { "epoch": 1.4893476910620755, "learning_rate": 5.055842368478865e-06, "loss": 2.522916564941406, "step": 1234300 }, { "epoch": 1.4894683543845582, "learning_rate": 5.0554385330111264e-06, "loss": 2.520760345458984, "step": 1234400 }, { "epoch": 1.489589017707041, "learning_rate": 5.0550346975433884e-06, "loss": 2.4952825927734374, "step": 1234500 }, { "epoch": 1.4897096810295236, "learning_rate": 5.05463086207565e-06, "loss": 2.5086622619628907, "step": 1234600 }, { "epoch": 1.4898303443520062, "learning_rate": 5.0542270266079115e-06, "loss": 2.4956578063964843, "step": 1234700 }, { "epoch": 1.489951007674489, "learning_rate": 5.0538231911401735e-06, "loss": 2.480840148925781, "step": 1234800 }, { "epoch": 1.4900716709969717, "learning_rate": 5.0534193556724355e-06, "loss": 2.4940371704101563, "step": 1234900 }, { "epoch": 1.4901923343194543, "learning_rate": 5.053015520204696e-06, "loss": 2.5431732177734374, "step": 1235000 }, { "epoch": 1.490312997641937, "learning_rate": 5.052611684736958e-06, "loss": 2.502003021240234, "step": 1235100 }, { "epoch": 1.4904336609644198, "learning_rate": 5.05220784926922e-06, "loss": 2.5098077392578126, "step": 1235200 }, { "epoch": 1.4905543242869024, "learning_rate": 5.051804013801481e-06, "loss": 2.5191685485839845, "step": 1235300 }, { "epoch": 1.490674987609385, "learning_rate": 5.051400178333743e-06, "loss": 2.518188018798828, "step": 1235400 }, { "epoch": 1.4907956509318678, "learning_rate": 5.050996342866005e-06, "loss": 2.497204132080078, "step": 1235500 }, { "epoch": 1.4909163142543504, "learning_rate": 5.050592507398267e-06, "loss": 2.4791336059570312, "step": 1235600 }, { "epoch": 1.491036977576833, "learning_rate": 5.050188671930528e-06, "loss": 2.492056121826172, "step": 1235700 }, { "epoch": 1.4911576408993157, "learning_rate": 5.04978483646279e-06, "loss": 2.5029461669921873, "step": 1235800 }, { "epoch": 1.4912783042217985, "learning_rate": 5.04938100099505e-06, "loss": 2.5011993408203126, "step": 1235900 }, { "epoch": 1.4913989675442811, "learning_rate": 5.048977165527312e-06, "loss": 2.482007598876953, "step": 1236000 }, { "epoch": 1.491519630866764, "learning_rate": 5.048573330059574e-06, "loss": 2.5033558654785155, "step": 1236100 }, { "epoch": 1.4916402941892466, "learning_rate": 5.048169494591836e-06, "loss": 2.5042074584960936, "step": 1236200 }, { "epoch": 1.4917609575117292, "learning_rate": 5.047765659124097e-06, "loss": 2.483251037597656, "step": 1236300 }, { "epoch": 1.4918816208342118, "learning_rate": 5.047361823656359e-06, "loss": 2.505323028564453, "step": 1236400 }, { "epoch": 1.4920022841566947, "learning_rate": 5.046957988188621e-06, "loss": 2.5104856872558594, "step": 1236500 }, { "epoch": 1.4921229474791773, "learning_rate": 5.0465541527208824e-06, "loss": 2.5133212280273436, "step": 1236600 }, { "epoch": 1.49224361080166, "learning_rate": 5.0461503172531436e-06, "loss": 2.491993713378906, "step": 1236700 }, { "epoch": 1.4923642741241427, "learning_rate": 5.0457464817854056e-06, "loss": 2.5100425720214843, "step": 1236800 }, { "epoch": 1.4924849374466254, "learning_rate": 5.045342646317667e-06, "loss": 2.4889756774902345, "step": 1236900 }, { "epoch": 1.492605600769108, "learning_rate": 5.044938810849929e-06, "loss": 2.502107696533203, "step": 1237000 }, { "epoch": 1.4927262640915906, "learning_rate": 5.044534975382191e-06, "loss": 2.511322479248047, "step": 1237100 }, { "epoch": 1.4928469274140734, "learning_rate": 5.044131139914452e-06, "loss": 2.501515655517578, "step": 1237200 }, { "epoch": 1.492967590736556, "learning_rate": 5.043727304446714e-06, "loss": 2.496554107666016, "step": 1237300 }, { "epoch": 1.4930882540590389, "learning_rate": 5.043323468978976e-06, "loss": 2.5351727294921873, "step": 1237400 }, { "epoch": 1.4932089173815215, "learning_rate": 5.042919633511236e-06, "loss": 2.507554931640625, "step": 1237500 }, { "epoch": 1.4933295807040041, "learning_rate": 5.042515798043498e-06, "loss": 2.5122499084472656, "step": 1237600 }, { "epoch": 1.4934502440264867, "learning_rate": 5.04211196257576e-06, "loss": 2.5135847473144532, "step": 1237700 }, { "epoch": 1.4935709073489694, "learning_rate": 5.041708127108021e-06, "loss": 2.525479278564453, "step": 1237800 }, { "epoch": 1.4936915706714522, "learning_rate": 5.041304291640283e-06, "loss": 2.493652038574219, "step": 1237900 }, { "epoch": 1.4938122339939348, "learning_rate": 5.040900456172545e-06, "loss": 2.4987205505371093, "step": 1238000 }, { "epoch": 1.4939328973164177, "learning_rate": 5.040496620704807e-06, "loss": 2.5083509826660157, "step": 1238100 }, { "epoch": 1.4940535606389003, "learning_rate": 5.040092785237068e-06, "loss": 2.4933653259277344, "step": 1238200 }, { "epoch": 1.4941742239613829, "learning_rate": 5.039688949769329e-06, "loss": 2.5171026611328124, "step": 1238300 }, { "epoch": 1.4942948872838655, "learning_rate": 5.0392851143015905e-06, "loss": 2.489144134521484, "step": 1238400 }, { "epoch": 1.4944155506063483, "learning_rate": 5.0388812788338525e-06, "loss": 2.4918963623046877, "step": 1238500 }, { "epoch": 1.494536213928831, "learning_rate": 5.0384774433661145e-06, "loss": 2.522034454345703, "step": 1238600 }, { "epoch": 1.4946568772513136, "learning_rate": 5.0380736078983764e-06, "loss": 2.5165144348144532, "step": 1238700 }, { "epoch": 1.4947775405737964, "learning_rate": 5.037669772430638e-06, "loss": 2.486369934082031, "step": 1238800 }, { "epoch": 1.494898203896279, "learning_rate": 5.0372659369628996e-06, "loss": 2.5161273193359377, "step": 1238900 }, { "epoch": 1.4950188672187616, "learning_rate": 5.0368621014951615e-06, "loss": 2.490640869140625, "step": 1239000 }, { "epoch": 1.4951395305412443, "learning_rate": 5.036458266027422e-06, "loss": 2.512001800537109, "step": 1239100 }, { "epoch": 1.495260193863727, "learning_rate": 5.036054430559684e-06, "loss": 2.522768096923828, "step": 1239200 }, { "epoch": 1.4953808571862097, "learning_rate": 5.035650595091946e-06, "loss": 2.4894984436035155, "step": 1239300 }, { "epoch": 1.4955015205086926, "learning_rate": 5.035246759624207e-06, "loss": 2.505165710449219, "step": 1239400 }, { "epoch": 1.4956221838311752, "learning_rate": 5.034842924156469e-06, "loss": 2.4938673400878906, "step": 1239500 }, { "epoch": 1.4957428471536578, "learning_rate": 5.034439088688731e-06, "loss": 2.4932318115234375, "step": 1239600 }, { "epoch": 1.4958635104761404, "learning_rate": 5.034035253220992e-06, "loss": 2.5093820190429685, "step": 1239700 }, { "epoch": 1.4959841737986233, "learning_rate": 5.033631417753254e-06, "loss": 2.5175271606445313, "step": 1239800 }, { "epoch": 1.4961048371211059, "learning_rate": 5.033227582285515e-06, "loss": 2.4872279357910156, "step": 1239900 }, { "epoch": 1.4962255004435885, "learning_rate": 5.032823746817776e-06, "loss": 2.5161679077148436, "step": 1240000 }, { "epoch": 1.4963461637660713, "learning_rate": 5.032419911350038e-06, "loss": 2.5048822021484374, "step": 1240100 }, { "epoch": 1.496466827088554, "learning_rate": 5.0320160758823e-06, "loss": 2.49961669921875, "step": 1240200 }, { "epoch": 1.4965874904110366, "learning_rate": 5.031612240414561e-06, "loss": 2.5100254821777344, "step": 1240300 }, { "epoch": 1.4967081537335192, "learning_rate": 5.031208404946823e-06, "loss": 2.4978070068359375, "step": 1240400 }, { "epoch": 1.496828817056002, "learning_rate": 5.030804569479085e-06, "loss": 2.4935145568847656, "step": 1240500 }, { "epoch": 1.4969494803784846, "learning_rate": 5.030400734011347e-06, "loss": 2.5285713195800783, "step": 1240600 }, { "epoch": 1.4970701437009672, "learning_rate": 5.0299968985436085e-06, "loss": 2.527998199462891, "step": 1240700 }, { "epoch": 1.49719080702345, "learning_rate": 5.02959306307587e-06, "loss": 2.5172918701171874, "step": 1240800 }, { "epoch": 1.4973114703459327, "learning_rate": 5.029189227608131e-06, "loss": 2.503282165527344, "step": 1240900 }, { "epoch": 1.4974321336684153, "learning_rate": 5.028785392140393e-06, "loss": 2.486165313720703, "step": 1241000 }, { "epoch": 1.497552796990898, "learning_rate": 5.028381556672655e-06, "loss": 2.4879579162597656, "step": 1241100 }, { "epoch": 1.4976734603133808, "learning_rate": 5.027977721204917e-06, "loss": 2.4919474792480467, "step": 1241200 }, { "epoch": 1.4977941236358634, "learning_rate": 5.027573885737178e-06, "loss": 2.515879669189453, "step": 1241300 }, { "epoch": 1.4979147869583462, "learning_rate": 5.02717005026944e-06, "loss": 2.517036590576172, "step": 1241400 }, { "epoch": 1.4980354502808289, "learning_rate": 5.026766214801702e-06, "loss": 2.519919128417969, "step": 1241500 }, { "epoch": 1.4981561136033115, "learning_rate": 5.026362379333962e-06, "loss": 2.4938168334960937, "step": 1241600 }, { "epoch": 1.498276776925794, "learning_rate": 5.025958543866224e-06, "loss": 2.4914508056640625, "step": 1241700 }, { "epoch": 1.498397440248277, "learning_rate": 5.025554708398486e-06, "loss": 2.4903190612792967, "step": 1241800 }, { "epoch": 1.4985181035707595, "learning_rate": 5.025150872930747e-06, "loss": 2.5073460388183593, "step": 1241900 }, { "epoch": 1.4986387668932422, "learning_rate": 5.024747037463009e-06, "loss": 2.501581115722656, "step": 1242000 }, { "epoch": 1.498759430215725, "learning_rate": 5.024343201995271e-06, "loss": 2.5057942199707033, "step": 1242100 }, { "epoch": 1.4988800935382076, "learning_rate": 5.023939366527532e-06, "loss": 2.5122047424316407, "step": 1242200 }, { "epoch": 1.4990007568606902, "learning_rate": 5.023535531059794e-06, "loss": 2.5282000732421874, "step": 1242300 }, { "epoch": 1.4991214201831728, "learning_rate": 5.023131695592055e-06, "loss": 2.4890040588378906, "step": 1242400 }, { "epoch": 1.4992420835056557, "learning_rate": 5.0227278601243165e-06, "loss": 2.4866087341308596, "step": 1242500 }, { "epoch": 1.4993627468281383, "learning_rate": 5.0223240246565785e-06, "loss": 2.5167454528808593, "step": 1242600 }, { "epoch": 1.4994834101506211, "learning_rate": 5.0219201891888405e-06, "loss": 2.510386962890625, "step": 1242700 }, { "epoch": 1.4996040734731038, "learning_rate": 5.021516353721102e-06, "loss": 2.503909454345703, "step": 1242800 }, { "epoch": 1.4997247367955864, "learning_rate": 5.021112518253364e-06, "loss": 2.514920959472656, "step": 1242900 }, { "epoch": 1.499845400118069, "learning_rate": 5.020708682785626e-06, "loss": 2.493968048095703, "step": 1243000 }, { "epoch": 1.4999660634405516, "learning_rate": 5.020304847317888e-06, "loss": 2.4973204040527346, "step": 1243100 }, { "epoch": 1.5000867267630345, "learning_rate": 5.019901011850148e-06, "loss": 2.5042758178710938, "step": 1243200 }, { "epoch": 1.500207390085517, "learning_rate": 5.01949717638241e-06, "loss": 2.4976905822753905, "step": 1243300 }, { "epoch": 1.500328053408, "learning_rate": 5.019093340914671e-06, "loss": 2.5179104614257812, "step": 1243400 }, { "epoch": 1.5004487167304825, "learning_rate": 5.018689505446933e-06, "loss": 2.498954162597656, "step": 1243500 }, { "epoch": 1.5005693800529651, "learning_rate": 5.018285669979195e-06, "loss": 2.4830584716796875, "step": 1243600 }, { "epoch": 1.5006900433754478, "learning_rate": 5.017881834511457e-06, "loss": 2.505063781738281, "step": 1243700 }, { "epoch": 1.5008107066979304, "learning_rate": 5.017477999043718e-06, "loss": 2.5048257446289064, "step": 1243800 }, { "epoch": 1.5009313700204132, "learning_rate": 5.01707416357598e-06, "loss": 2.4940745544433596, "step": 1243900 }, { "epoch": 1.501052033342896, "learning_rate": 5.01667032810824e-06, "loss": 2.499711761474609, "step": 1244000 }, { "epoch": 1.5011726966653787, "learning_rate": 5.016266492640502e-06, "loss": 2.505697479248047, "step": 1244100 }, { "epoch": 1.5012933599878613, "learning_rate": 5.015862657172764e-06, "loss": 2.5040908813476563, "step": 1244200 }, { "epoch": 1.501414023310344, "learning_rate": 5.015458821705026e-06, "loss": 2.5219766235351564, "step": 1244300 }, { "epoch": 1.5015346866328265, "learning_rate": 5.0150549862372874e-06, "loss": 2.5024447631835938, "step": 1244400 }, { "epoch": 1.5016553499553094, "learning_rate": 5.014651150769549e-06, "loss": 2.4958230590820314, "step": 1244500 }, { "epoch": 1.501776013277792, "learning_rate": 5.014247315301811e-06, "loss": 2.481914520263672, "step": 1244600 }, { "epoch": 1.5018966766002748, "learning_rate": 5.0138434798340725e-06, "loss": 2.5093251037597657, "step": 1244700 }, { "epoch": 1.5020173399227574, "learning_rate": 5.013439644366334e-06, "loss": 2.476928253173828, "step": 1244800 }, { "epoch": 1.50213800324524, "learning_rate": 5.013035808898596e-06, "loss": 2.5095875549316404, "step": 1244900 }, { "epoch": 1.5022586665677227, "learning_rate": 5.012631973430857e-06, "loss": 2.498838348388672, "step": 1245000 }, { "epoch": 1.5023793298902053, "learning_rate": 5.012228137963119e-06, "loss": 2.4929710388183595, "step": 1245100 }, { "epoch": 1.5024999932126881, "learning_rate": 5.011824302495381e-06, "loss": 2.478050079345703, "step": 1245200 }, { "epoch": 1.5026206565351707, "learning_rate": 5.011420467027642e-06, "loss": 2.4850579833984376, "step": 1245300 }, { "epoch": 1.5027413198576536, "learning_rate": 5.011016631559904e-06, "loss": 2.4889154052734375, "step": 1245400 }, { "epoch": 1.5028619831801362, "learning_rate": 5.010612796092166e-06, "loss": 2.496114044189453, "step": 1245500 }, { "epoch": 1.5029826465026188, "learning_rate": 5.010208960624426e-06, "loss": 2.5219406127929687, "step": 1245600 }, { "epoch": 1.5031033098251014, "learning_rate": 5.009805125156688e-06, "loss": 2.508932342529297, "step": 1245700 }, { "epoch": 1.5032239731475843, "learning_rate": 5.00940128968895e-06, "loss": 2.516162567138672, "step": 1245800 }, { "epoch": 1.5033446364700669, "learning_rate": 5.008997454221211e-06, "loss": 2.5290354919433593, "step": 1245900 }, { "epoch": 1.5034652997925497, "learning_rate": 5.008593618753473e-06, "loss": 2.4786366271972655, "step": 1246000 }, { "epoch": 1.5035859631150323, "learning_rate": 5.008189783285735e-06, "loss": 2.456603240966797, "step": 1246100 }, { "epoch": 1.503706626437515, "learning_rate": 5.007785947817997e-06, "loss": 2.479251708984375, "step": 1246200 }, { "epoch": 1.5038272897599976, "learning_rate": 5.007382112350258e-06, "loss": 2.5060044860839845, "step": 1246300 }, { "epoch": 1.5039479530824802, "learning_rate": 5.00697827688252e-06, "loss": 2.510154113769531, "step": 1246400 }, { "epoch": 1.504068616404963, "learning_rate": 5.006574441414781e-06, "loss": 2.530317687988281, "step": 1246500 }, { "epoch": 1.5041892797274456, "learning_rate": 5.0061706059470426e-06, "loss": 2.5029278564453126, "step": 1246600 }, { "epoch": 1.5043099430499285, "learning_rate": 5.0057667704793046e-06, "loss": 2.5045599365234374, "step": 1246700 }, { "epoch": 1.504430606372411, "learning_rate": 5.0053629350115665e-06, "loss": 2.4961837768554687, "step": 1246800 }, { "epoch": 1.5045512696948937, "learning_rate": 5.004959099543828e-06, "loss": 2.4957057189941407, "step": 1246900 }, { "epoch": 1.5046719330173763, "learning_rate": 5.00455526407609e-06, "loss": 2.4791133117675783, "step": 1247000 }, { "epoch": 1.504792596339859, "learning_rate": 5.004151428608352e-06, "loss": 2.5010308837890625, "step": 1247100 }, { "epoch": 1.5049132596623418, "learning_rate": 5.003747593140614e-06, "loss": 2.4874658203125, "step": 1247200 }, { "epoch": 1.5050339229848246, "learning_rate": 5.003343757672874e-06, "loss": 2.490304718017578, "step": 1247300 }, { "epoch": 1.5051545863073073, "learning_rate": 5.002939922205136e-06, "loss": 2.5132891845703127, "step": 1247400 }, { "epoch": 1.5052752496297899, "learning_rate": 5.002536086737397e-06, "loss": 2.5209030151367187, "step": 1247500 }, { "epoch": 1.5053959129522725, "learning_rate": 5.002132251269659e-06, "loss": 2.5124871826171873, "step": 1247600 }, { "epoch": 1.505516576274755, "learning_rate": 5.001728415801921e-06, "loss": 2.5272447204589845, "step": 1247700 }, { "epoch": 1.505637239597238, "learning_rate": 5.001324580334183e-06, "loss": 2.495961456298828, "step": 1247800 }, { "epoch": 1.5057579029197206, "learning_rate": 5.000920744866444e-06, "loss": 2.4812995910644533, "step": 1247900 }, { "epoch": 1.5058785662422034, "learning_rate": 5.000516909398706e-06, "loss": 2.4943507385253905, "step": 1248000 }, { "epoch": 1.505999229564686, "learning_rate": 5.000113073930966e-06, "loss": 2.504942626953125, "step": 1248100 }, { "epoch": 1.5061198928871686, "learning_rate": 4.999709238463229e-06, "loss": 2.508363952636719, "step": 1248200 }, { "epoch": 1.5062405562096512, "learning_rate": 4.99930540299549e-06, "loss": 2.4741485595703123, "step": 1248300 }, { "epoch": 1.5063612195321339, "learning_rate": 4.998901567527752e-06, "loss": 2.514406280517578, "step": 1248400 }, { "epoch": 1.5064818828546167, "learning_rate": 4.9984977320600135e-06, "loss": 2.485940246582031, "step": 1248500 }, { "epoch": 1.5066025461770993, "learning_rate": 4.9980938965922754e-06, "loss": 2.513775634765625, "step": 1248600 }, { "epoch": 1.5067232094995822, "learning_rate": 4.997690061124537e-06, "loss": 2.4846946716308596, "step": 1248700 }, { "epoch": 1.5068438728220648, "learning_rate": 4.9972862256567986e-06, "loss": 2.495525054931641, "step": 1248800 }, { "epoch": 1.5069645361445474, "learning_rate": 4.99688239018906e-06, "loss": 2.4903050231933594, "step": 1248900 }, { "epoch": 1.50708519946703, "learning_rate": 4.996478554721322e-06, "loss": 2.505094299316406, "step": 1249000 }, { "epoch": 1.5072058627895126, "learning_rate": 4.996074719253583e-06, "loss": 2.5096560668945314, "step": 1249100 }, { "epoch": 1.5073265261119955, "learning_rate": 4.995670883785845e-06, "loss": 2.5015322875976564, "step": 1249200 }, { "epoch": 1.5074471894344783, "learning_rate": 4.995267048318107e-06, "loss": 2.5048759460449217, "step": 1249300 }, { "epoch": 1.507567852756961, "learning_rate": 4.994863212850368e-06, "loss": 2.521825256347656, "step": 1249400 }, { "epoch": 1.5076885160794435, "learning_rate": 4.994459377382629e-06, "loss": 2.480241394042969, "step": 1249500 }, { "epoch": 1.5078091794019262, "learning_rate": 4.994055541914891e-06, "loss": 2.506925048828125, "step": 1249600 }, { "epoch": 1.5079298427244088, "learning_rate": 4.993651706447153e-06, "loss": 2.508273162841797, "step": 1249700 }, { "epoch": 1.5080505060468916, "learning_rate": 4.993247870979415e-06, "loss": 2.5184339904785156, "step": 1249800 }, { "epoch": 1.5081711693693742, "learning_rate": 4.992844035511676e-06, "loss": 2.503973083496094, "step": 1249900 }, { "epoch": 1.508291832691857, "learning_rate": 4.992440200043937e-06, "loss": 2.4907530212402342, "step": 1250000 }, { "epoch": 1.5084124960143397, "learning_rate": 4.992036364576199e-06, "loss": 2.491641082763672, "step": 1250100 }, { "epoch": 1.5085331593368223, "learning_rate": 4.991632529108461e-06, "loss": 2.517403869628906, "step": 1250200 }, { "epoch": 1.508653822659305, "learning_rate": 4.991228693640722e-06, "loss": 2.5087905883789063, "step": 1250300 }, { "epoch": 1.5087744859817875, "learning_rate": 4.990824858172984e-06, "loss": 2.499723358154297, "step": 1250400 }, { "epoch": 1.5088951493042704, "learning_rate": 4.9904210227052455e-06, "loss": 2.5018006896972658, "step": 1250500 }, { "epoch": 1.509015812626753, "learning_rate": 4.9900171872375075e-06, "loss": 2.5035487365722657, "step": 1250600 }, { "epoch": 1.5091364759492358, "learning_rate": 4.989613351769769e-06, "loss": 2.4880825805664064, "step": 1250700 }, { "epoch": 1.5092571392717185, "learning_rate": 4.989209516302031e-06, "loss": 2.4991664123535156, "step": 1250800 }, { "epoch": 1.509377802594201, "learning_rate": 4.9888056808342926e-06, "loss": 2.5218592834472657, "step": 1250900 }, { "epoch": 1.5094984659166837, "learning_rate": 4.988401845366554e-06, "loss": 2.5079896545410154, "step": 1251000 }, { "epoch": 1.5096191292391665, "learning_rate": 4.987998009898816e-06, "loss": 2.5111083984375, "step": 1251100 }, { "epoch": 1.5097397925616491, "learning_rate": 4.987594174431077e-06, "loss": 2.504441986083984, "step": 1251200 }, { "epoch": 1.509860455884132, "learning_rate": 4.987190338963339e-06, "loss": 2.505370788574219, "step": 1251300 }, { "epoch": 1.5099811192066146, "learning_rate": 4.9867865034956e-06, "loss": 2.5053141784667967, "step": 1251400 }, { "epoch": 1.5101017825290972, "learning_rate": 4.986382668027862e-06, "loss": 2.504780731201172, "step": 1251500 }, { "epoch": 1.5102224458515798, "learning_rate": 4.985978832560123e-06, "loss": 2.5327699279785154, "step": 1251600 }, { "epoch": 1.5103431091740624, "learning_rate": 4.985574997092385e-06, "loss": 2.5163504028320314, "step": 1251700 }, { "epoch": 1.5104637724965453, "learning_rate": 4.985171161624647e-06, "loss": 2.5124050903320314, "step": 1251800 }, { "epoch": 1.510584435819028, "learning_rate": 4.984767326156908e-06, "loss": 2.5198600769042967, "step": 1251900 }, { "epoch": 1.5107050991415107, "learning_rate": 4.984363490689169e-06, "loss": 2.515691223144531, "step": 1252000 }, { "epoch": 1.5108257624639934, "learning_rate": 4.983959655221431e-06, "loss": 2.503421173095703, "step": 1252100 }, { "epoch": 1.510946425786476, "learning_rate": 4.983555819753693e-06, "loss": 2.50197265625, "step": 1252200 }, { "epoch": 1.5110670891089586, "learning_rate": 4.983151984285955e-06, "loss": 2.5019767761230467, "step": 1252300 }, { "epoch": 1.5111877524314412, "learning_rate": 4.982748148818216e-06, "loss": 2.5022467041015624, "step": 1252400 }, { "epoch": 1.511308415753924, "learning_rate": 4.9823443133504775e-06, "loss": 2.540264892578125, "step": 1252500 }, { "epoch": 1.511429079076407, "learning_rate": 4.9819404778827395e-06, "loss": 2.46491455078125, "step": 1252600 }, { "epoch": 1.5115497423988895, "learning_rate": 4.9815366424150015e-06, "loss": 2.509041595458984, "step": 1252700 }, { "epoch": 1.5116704057213721, "learning_rate": 4.981132806947263e-06, "loss": 2.4909294128417967, "step": 1252800 }, { "epoch": 1.5117910690438547, "learning_rate": 4.980728971479525e-06, "loss": 2.498636932373047, "step": 1252900 }, { "epoch": 1.5119117323663374, "learning_rate": 4.980325136011786e-06, "loss": 2.487220916748047, "step": 1253000 }, { "epoch": 1.5120323956888202, "learning_rate": 4.979921300544048e-06, "loss": 2.506031799316406, "step": 1253100 }, { "epoch": 1.5121530590113028, "learning_rate": 4.979517465076309e-06, "loss": 2.5182179260253905, "step": 1253200 }, { "epoch": 1.5122737223337857, "learning_rate": 4.979113629608571e-06, "loss": 2.508070373535156, "step": 1253300 }, { "epoch": 1.5123943856562683, "learning_rate": 4.978709794140833e-06, "loss": 2.5083682250976564, "step": 1253400 }, { "epoch": 1.5125150489787509, "learning_rate": 4.978305958673094e-06, "loss": 2.5073524475097657, "step": 1253500 }, { "epoch": 1.5126357123012335, "learning_rate": 4.977902123205355e-06, "loss": 2.48991943359375, "step": 1253600 }, { "epoch": 1.5127563756237161, "learning_rate": 4.977498287737617e-06, "loss": 2.4831303405761718, "step": 1253700 }, { "epoch": 1.512877038946199, "learning_rate": 4.977094452269879e-06, "loss": 2.4915975952148437, "step": 1253800 }, { "epoch": 1.5129977022686816, "learning_rate": 4.97669061680214e-06, "loss": 2.5110015869140625, "step": 1253900 }, { "epoch": 1.5131183655911644, "learning_rate": 4.976286781334402e-06, "loss": 2.4872471618652345, "step": 1254000 }, { "epoch": 1.513239028913647, "learning_rate": 4.975882945866663e-06, "loss": 2.4923442077636717, "step": 1254100 }, { "epoch": 1.5133596922361296, "learning_rate": 4.975479110398925e-06, "loss": 2.5147799682617187, "step": 1254200 }, { "epoch": 1.5134803555586123, "learning_rate": 4.975075274931187e-06, "loss": 2.498591003417969, "step": 1254300 }, { "epoch": 1.5136010188810949, "learning_rate": 4.974671439463448e-06, "loss": 2.495019836425781, "step": 1254400 }, { "epoch": 1.5137216822035777, "learning_rate": 4.9742676039957095e-06, "loss": 2.5056549072265626, "step": 1254500 }, { "epoch": 1.5138423455260606, "learning_rate": 4.9738637685279715e-06, "loss": 2.5043685913085936, "step": 1254600 }, { "epoch": 1.5139630088485432, "learning_rate": 4.9734599330602335e-06, "loss": 2.498760223388672, "step": 1254700 }, { "epoch": 1.5140836721710258, "learning_rate": 4.973056097592495e-06, "loss": 2.49300537109375, "step": 1254800 }, { "epoch": 1.5142043354935084, "learning_rate": 4.972652262124757e-06, "loss": 2.510650177001953, "step": 1254900 }, { "epoch": 1.514324998815991, "learning_rate": 4.972248426657018e-06, "loss": 2.502952117919922, "step": 1255000 }, { "epoch": 1.5144456621384739, "learning_rate": 4.97184459118928e-06, "loss": 2.4819631958007813, "step": 1255100 }, { "epoch": 1.5145663254609565, "learning_rate": 4.971440755721541e-06, "loss": 2.4986769104003907, "step": 1255200 }, { "epoch": 1.5146869887834393, "learning_rate": 4.971036920253803e-06, "loss": 2.5241822814941406, "step": 1255300 }, { "epoch": 1.514807652105922, "learning_rate": 4.970633084786065e-06, "loss": 2.49258544921875, "step": 1255400 }, { "epoch": 1.5149283154284046, "learning_rate": 4.970229249318326e-06, "loss": 2.5216075134277345, "step": 1255500 }, { "epoch": 1.5150489787508872, "learning_rate": 4.969825413850587e-06, "loss": 2.5072703552246094, "step": 1255600 }, { "epoch": 1.5151696420733698, "learning_rate": 4.969421578382849e-06, "loss": 2.5038958740234376, "step": 1255700 }, { "epoch": 1.5152903053958526, "learning_rate": 4.969017742915111e-06, "loss": 2.513155212402344, "step": 1255800 }, { "epoch": 1.5154109687183352, "learning_rate": 4.968613907447373e-06, "loss": 2.4956251525878907, "step": 1255900 }, { "epoch": 1.515531632040818, "learning_rate": 4.968210071979634e-06, "loss": 2.475455017089844, "step": 1256000 }, { "epoch": 1.5156522953633007, "learning_rate": 4.967806236511895e-06, "loss": 2.499633026123047, "step": 1256100 }, { "epoch": 1.5157729586857833, "learning_rate": 4.967402401044157e-06, "loss": 2.524277648925781, "step": 1256200 }, { "epoch": 1.515893622008266, "learning_rate": 4.966998565576419e-06, "loss": 2.5090199279785157, "step": 1256300 }, { "epoch": 1.5160142853307488, "learning_rate": 4.966594730108681e-06, "loss": 2.5019264221191406, "step": 1256400 }, { "epoch": 1.5161349486532314, "learning_rate": 4.966190894640942e-06, "loss": 2.4963441467285157, "step": 1256500 }, { "epoch": 1.5162556119757142, "learning_rate": 4.9657870591732035e-06, "loss": 2.5006689453125, "step": 1256600 }, { "epoch": 1.5163762752981969, "learning_rate": 4.9653832237054655e-06, "loss": 2.4663587951660157, "step": 1256700 }, { "epoch": 1.5164969386206795, "learning_rate": 4.9649793882377275e-06, "loss": 2.5285458374023437, "step": 1256800 }, { "epoch": 1.516617601943162, "learning_rate": 4.964575552769989e-06, "loss": 2.479286956787109, "step": 1256900 }, { "epoch": 1.5167382652656447, "learning_rate": 4.964171717302251e-06, "loss": 2.483115386962891, "step": 1257000 }, { "epoch": 1.5168589285881275, "learning_rate": 4.963767881834512e-06, "loss": 2.506791229248047, "step": 1257100 }, { "epoch": 1.5169795919106102, "learning_rate": 4.963364046366774e-06, "loss": 2.51179443359375, "step": 1257200 }, { "epoch": 1.517100255233093, "learning_rate": 4.962960210899035e-06, "loss": 2.5006072998046873, "step": 1257300 }, { "epoch": 1.5172209185555756, "learning_rate": 4.962556375431297e-06, "loss": 2.4865963745117186, "step": 1257400 }, { "epoch": 1.5173415818780582, "learning_rate": 4.962152539963558e-06, "loss": 2.4936256408691406, "step": 1257500 }, { "epoch": 1.5174622452005408, "learning_rate": 4.96174870449582e-06, "loss": 2.482147216796875, "step": 1257600 }, { "epoch": 1.5175829085230235, "learning_rate": 4.961344869028081e-06, "loss": 2.511552429199219, "step": 1257700 }, { "epoch": 1.5177035718455063, "learning_rate": 4.960941033560343e-06, "loss": 2.493197021484375, "step": 1257800 }, { "epoch": 1.5178242351679891, "learning_rate": 4.960537198092605e-06, "loss": 2.503356475830078, "step": 1257900 }, { "epoch": 1.5179448984904718, "learning_rate": 4.960133362624866e-06, "loss": 2.4973771667480467, "step": 1258000 }, { "epoch": 1.5180655618129544, "learning_rate": 4.959729527157127e-06, "loss": 2.508619842529297, "step": 1258100 }, { "epoch": 1.518186225135437, "learning_rate": 4.959325691689389e-06, "loss": 2.4992433166503907, "step": 1258200 }, { "epoch": 1.5183068884579196, "learning_rate": 4.958921856221651e-06, "loss": 2.488017730712891, "step": 1258300 }, { "epoch": 1.5184275517804025, "learning_rate": 4.958518020753913e-06, "loss": 2.5247393798828126, "step": 1258400 }, { "epoch": 1.518548215102885, "learning_rate": 4.9581141852861744e-06, "loss": 2.5193846130371096, "step": 1258500 }, { "epoch": 1.518668878425368, "learning_rate": 4.9577103498184356e-06, "loss": 2.4923619079589843, "step": 1258600 }, { "epoch": 1.5187895417478505, "learning_rate": 4.9573065143506976e-06, "loss": 2.473033447265625, "step": 1258700 }, { "epoch": 1.5189102050703331, "learning_rate": 4.9569026788829595e-06, "loss": 2.5267633056640624, "step": 1258800 }, { "epoch": 1.5190308683928158, "learning_rate": 4.956498843415221e-06, "loss": 2.5028028869628907, "step": 1258900 }, { "epoch": 1.5191515317152984, "learning_rate": 4.956095007947483e-06, "loss": 2.494523773193359, "step": 1259000 }, { "epoch": 1.5192721950377812, "learning_rate": 4.955691172479744e-06, "loss": 2.4759115600585937, "step": 1259100 }, { "epoch": 1.5193928583602638, "learning_rate": 4.955287337012006e-06, "loss": 2.490714874267578, "step": 1259200 }, { "epoch": 1.5195135216827467, "learning_rate": 4.954883501544267e-06, "loss": 2.511391448974609, "step": 1259300 }, { "epoch": 1.5196341850052293, "learning_rate": 4.954479666076529e-06, "loss": 2.516277618408203, "step": 1259400 }, { "epoch": 1.519754848327712, "learning_rate": 4.954075830608791e-06, "loss": 2.495000457763672, "step": 1259500 }, { "epoch": 1.5198755116501945, "learning_rate": 4.953671995141052e-06, "loss": 2.507640838623047, "step": 1259600 }, { "epoch": 1.5199961749726771, "learning_rate": 4.953268159673313e-06, "loss": 2.502115936279297, "step": 1259700 }, { "epoch": 1.52011683829516, "learning_rate": 4.952864324205575e-06, "loss": 2.504664001464844, "step": 1259800 }, { "epoch": 1.5202375016176428, "learning_rate": 4.952460488737837e-06, "loss": 2.502618865966797, "step": 1259900 }, { "epoch": 1.5203581649401254, "learning_rate": 4.952056653270098e-06, "loss": 2.515913391113281, "step": 1260000 }, { "epoch": 1.520478828262608, "learning_rate": 4.95165281780236e-06, "loss": 2.501436767578125, "step": 1260100 }, { "epoch": 1.5205994915850907, "learning_rate": 4.951248982334621e-06, "loss": 2.5137599182128905, "step": 1260200 }, { "epoch": 1.5207201549075733, "learning_rate": 4.950845146866883e-06, "loss": 2.4839523315429686, "step": 1260300 }, { "epoch": 1.5208408182300561, "learning_rate": 4.950441311399145e-06, "loss": 2.497104034423828, "step": 1260400 }, { "epoch": 1.5209614815525387, "learning_rate": 4.9500374759314065e-06, "loss": 2.4790647888183592, "step": 1260500 }, { "epoch": 1.5210821448750216, "learning_rate": 4.949633640463668e-06, "loss": 2.4978982543945314, "step": 1260600 }, { "epoch": 1.5212028081975042, "learning_rate": 4.94922980499593e-06, "loss": 2.510958557128906, "step": 1260700 }, { "epoch": 1.5213234715199868, "learning_rate": 4.9488259695281916e-06, "loss": 2.478349151611328, "step": 1260800 }, { "epoch": 1.5214441348424694, "learning_rate": 4.948422134060453e-06, "loss": 2.478140411376953, "step": 1260900 }, { "epoch": 1.521564798164952, "learning_rate": 4.948018298592715e-06, "loss": 2.4931462097167967, "step": 1261000 }, { "epoch": 1.5216854614874349, "learning_rate": 4.947614463124976e-06, "loss": 2.4874253845214844, "step": 1261100 }, { "epoch": 1.5218061248099177, "learning_rate": 4.947210627657238e-06, "loss": 2.5197190856933593, "step": 1261200 }, { "epoch": 1.5219267881324003, "learning_rate": 4.9468067921895e-06, "loss": 2.496465148925781, "step": 1261300 }, { "epoch": 1.522047451454883, "learning_rate": 4.946402956721761e-06, "loss": 2.5206982421875, "step": 1261400 }, { "epoch": 1.5221681147773656, "learning_rate": 4.945999121254023e-06, "loss": 2.4950201416015627, "step": 1261500 }, { "epoch": 1.5222887780998482, "learning_rate": 4.945595285786284e-06, "loss": 2.5215470886230467, "step": 1261600 }, { "epoch": 1.522409441422331, "learning_rate": 4.945191450318546e-06, "loss": 2.482709503173828, "step": 1261700 }, { "epoch": 1.5225301047448137, "learning_rate": 4.944787614850807e-06, "loss": 2.51508056640625, "step": 1261800 }, { "epoch": 1.5226507680672965, "learning_rate": 4.944383779383069e-06, "loss": 2.490886535644531, "step": 1261900 }, { "epoch": 1.522771431389779, "learning_rate": 4.943979943915331e-06, "loss": 2.4970457458496096, "step": 1262000 }, { "epoch": 1.5228920947122617, "learning_rate": 4.943576108447592e-06, "loss": 2.48311767578125, "step": 1262100 }, { "epoch": 1.5230127580347443, "learning_rate": 4.943172272979853e-06, "loss": 2.4736036682128906, "step": 1262200 }, { "epoch": 1.523133421357227, "learning_rate": 4.942768437512115e-06, "loss": 2.492945556640625, "step": 1262300 }, { "epoch": 1.5232540846797098, "learning_rate": 4.942364602044377e-06, "loss": 2.5140692138671876, "step": 1262400 }, { "epoch": 1.5233747480021924, "learning_rate": 4.941960766576639e-06, "loss": 2.5048146057128906, "step": 1262500 }, { "epoch": 1.5234954113246753, "learning_rate": 4.9415569311089005e-06, "loss": 2.467792816162109, "step": 1262600 }, { "epoch": 1.5236160746471579, "learning_rate": 4.941153095641162e-06, "loss": 2.493288726806641, "step": 1262700 }, { "epoch": 1.5237367379696405, "learning_rate": 4.940749260173424e-06, "loss": 2.5156640625, "step": 1262800 }, { "epoch": 1.523857401292123, "learning_rate": 4.9403454247056856e-06, "loss": 2.499612579345703, "step": 1262900 }, { "epoch": 1.5239780646146057, "learning_rate": 4.939941589237947e-06, "loss": 2.5001460266113282, "step": 1263000 }, { "epoch": 1.5240987279370886, "learning_rate": 4.939537753770209e-06, "loss": 2.492778625488281, "step": 1263100 }, { "epoch": 1.5242193912595714, "learning_rate": 4.93913391830247e-06, "loss": 2.464641876220703, "step": 1263200 }, { "epoch": 1.524340054582054, "learning_rate": 4.938730082834732e-06, "loss": 2.52235107421875, "step": 1263300 }, { "epoch": 1.5244607179045366, "learning_rate": 4.938326247366993e-06, "loss": 2.498807067871094, "step": 1263400 }, { "epoch": 1.5245813812270192, "learning_rate": 4.937922411899255e-06, "loss": 2.506631317138672, "step": 1263500 }, { "epoch": 1.5247020445495019, "learning_rate": 4.937518576431516e-06, "loss": 2.4973110961914062, "step": 1263600 }, { "epoch": 1.5248227078719847, "learning_rate": 4.937114740963778e-06, "loss": 2.488217010498047, "step": 1263700 }, { "epoch": 1.5249433711944673, "learning_rate": 4.936710905496039e-06, "loss": 2.4897781372070313, "step": 1263800 }, { "epoch": 1.5250640345169502, "learning_rate": 4.936307070028301e-06, "loss": 2.4966464233398438, "step": 1263900 }, { "epoch": 1.5251846978394328, "learning_rate": 4.935903234560563e-06, "loss": 2.510386199951172, "step": 1264000 }, { "epoch": 1.5253053611619154, "learning_rate": 4.935499399092824e-06, "loss": 2.4591111755371093, "step": 1264100 }, { "epoch": 1.525426024484398, "learning_rate": 4.935095563625085e-06, "loss": 2.508783416748047, "step": 1264200 }, { "epoch": 1.5255466878068806, "learning_rate": 4.934691728157347e-06, "loss": 2.484203033447266, "step": 1264300 }, { "epoch": 1.5256673511293635, "learning_rate": 4.934287892689609e-06, "loss": 2.5295028686523438, "step": 1264400 }, { "epoch": 1.525788014451846, "learning_rate": 4.933884057221871e-06, "loss": 2.4786090087890624, "step": 1264500 }, { "epoch": 1.525908677774329, "learning_rate": 4.9334802217541325e-06, "loss": 2.471028289794922, "step": 1264600 }, { "epoch": 1.5260293410968115, "learning_rate": 4.933076386286394e-06, "loss": 2.4932720947265623, "step": 1264700 }, { "epoch": 1.5261500044192942, "learning_rate": 4.932672550818656e-06, "loss": 2.5257246398925783, "step": 1264800 }, { "epoch": 1.5262706677417768, "learning_rate": 4.932268715350918e-06, "loss": 2.521259613037109, "step": 1264900 }, { "epoch": 1.5263913310642594, "learning_rate": 4.931864879883179e-06, "loss": 2.505758514404297, "step": 1265000 }, { "epoch": 1.5265119943867422, "learning_rate": 4.931461044415441e-06, "loss": 2.5220736694335937, "step": 1265100 }, { "epoch": 1.526632657709225, "learning_rate": 4.931057208947702e-06, "loss": 2.499950714111328, "step": 1265200 }, { "epoch": 1.5267533210317077, "learning_rate": 4.930653373479964e-06, "loss": 2.486841125488281, "step": 1265300 }, { "epoch": 1.5268739843541903, "learning_rate": 4.930249538012225e-06, "loss": 2.494021453857422, "step": 1265400 }, { "epoch": 1.526994647676673, "learning_rate": 4.929845702544487e-06, "loss": 2.4964601135253908, "step": 1265500 }, { "epoch": 1.5271153109991555, "learning_rate": 4.929441867076749e-06, "loss": 2.491347351074219, "step": 1265600 }, { "epoch": 1.5272359743216384, "learning_rate": 4.92903803160901e-06, "loss": 2.4759317016601563, "step": 1265700 }, { "epoch": 1.527356637644121, "learning_rate": 4.928634196141271e-06, "loss": 2.4940977478027344, "step": 1265800 }, { "epoch": 1.5274773009666038, "learning_rate": 4.928230360673533e-06, "loss": 2.488236999511719, "step": 1265900 }, { "epoch": 1.5275979642890865, "learning_rate": 4.927826525205795e-06, "loss": 2.5212356567382814, "step": 1266000 }, { "epoch": 1.527718627611569, "learning_rate": 4.927422689738056e-06, "loss": 2.49386474609375, "step": 1266100 }, { "epoch": 1.5278392909340517, "learning_rate": 4.927018854270318e-06, "loss": 2.4843673706054688, "step": 1266200 }, { "epoch": 1.5279599542565343, "learning_rate": 4.926615018802579e-06, "loss": 2.5056588745117185, "step": 1266300 }, { "epoch": 1.5280806175790171, "learning_rate": 4.926211183334841e-06, "loss": 2.5065557861328127, "step": 1266400 }, { "epoch": 1.5282012809015, "learning_rate": 4.925807347867103e-06, "loss": 2.5133482360839845, "step": 1266500 }, { "epoch": 1.5283219442239826, "learning_rate": 4.9254035123993645e-06, "loss": 2.4776075744628905, "step": 1266600 }, { "epoch": 1.5284426075464652, "learning_rate": 4.924999676931626e-06, "loss": 2.5062843322753907, "step": 1266700 }, { "epoch": 1.5285632708689478, "learning_rate": 4.924595841463888e-06, "loss": 2.498094482421875, "step": 1266800 }, { "epoch": 1.5286839341914304, "learning_rate": 4.92419200599615e-06, "loss": 2.490184783935547, "step": 1266900 }, { "epoch": 1.5288045975139133, "learning_rate": 4.923788170528412e-06, "loss": 2.5261842346191408, "step": 1267000 }, { "epoch": 1.528925260836396, "learning_rate": 4.923384335060673e-06, "loss": 2.490358428955078, "step": 1267100 }, { "epoch": 1.5290459241588787, "learning_rate": 4.922980499592934e-06, "loss": 2.4920895385742186, "step": 1267200 }, { "epoch": 1.5291665874813614, "learning_rate": 4.922576664125196e-06, "loss": 2.478072204589844, "step": 1267300 }, { "epoch": 1.529287250803844, "learning_rate": 4.922172828657458e-06, "loss": 2.496929931640625, "step": 1267400 }, { "epoch": 1.5294079141263266, "learning_rate": 4.921768993189719e-06, "loss": 2.5247433471679686, "step": 1267500 }, { "epoch": 1.5295285774488092, "learning_rate": 4.921365157721981e-06, "loss": 2.5051370239257813, "step": 1267600 }, { "epoch": 1.529649240771292, "learning_rate": 4.920961322254242e-06, "loss": 2.4944419860839844, "step": 1267700 }, { "epoch": 1.5297699040937747, "learning_rate": 4.920557486786504e-06, "loss": 2.4880572509765626, "step": 1267800 }, { "epoch": 1.5298905674162575, "learning_rate": 4.920153651318765e-06, "loss": 2.4950572204589845, "step": 1267900 }, { "epoch": 1.5300112307387401, "learning_rate": 4.919749815851027e-06, "loss": 2.476168212890625, "step": 1268000 }, { "epoch": 1.5301318940612227, "learning_rate": 4.919345980383289e-06, "loss": 2.520692901611328, "step": 1268100 }, { "epoch": 1.5302525573837054, "learning_rate": 4.91894214491555e-06, "loss": 2.4981739807128904, "step": 1268200 }, { "epoch": 1.530373220706188, "learning_rate": 4.9185383094478114e-06, "loss": 2.501212463378906, "step": 1268300 }, { "epoch": 1.5304938840286708, "learning_rate": 4.9181344739800734e-06, "loss": 2.508450927734375, "step": 1268400 }, { "epoch": 1.5306145473511537, "learning_rate": 4.917730638512335e-06, "loss": 2.5141781616210936, "step": 1268500 }, { "epoch": 1.5307352106736363, "learning_rate": 4.917326803044597e-06, "loss": 2.514648895263672, "step": 1268600 }, { "epoch": 1.5308558739961189, "learning_rate": 4.9169229675768585e-06, "loss": 2.500474090576172, "step": 1268700 }, { "epoch": 1.5309765373186015, "learning_rate": 4.91651913210912e-06, "loss": 2.471097717285156, "step": 1268800 }, { "epoch": 1.5310972006410841, "learning_rate": 4.916115296641382e-06, "loss": 2.504252624511719, "step": 1268900 }, { "epoch": 1.531217863963567, "learning_rate": 4.915711461173644e-06, "loss": 2.4852951049804686, "step": 1269000 }, { "epoch": 1.5313385272860496, "learning_rate": 4.915307625705905e-06, "loss": 2.5086244201660155, "step": 1269100 }, { "epoch": 1.5314591906085324, "learning_rate": 4.914903790238167e-06, "loss": 2.5006398010253905, "step": 1269200 }, { "epoch": 1.531579853931015, "learning_rate": 4.914499954770428e-06, "loss": 2.519963836669922, "step": 1269300 }, { "epoch": 1.5317005172534977, "learning_rate": 4.91409611930269e-06, "loss": 2.503531188964844, "step": 1269400 }, { "epoch": 1.5318211805759803, "learning_rate": 4.913692283834951e-06, "loss": 2.50108154296875, "step": 1269500 }, { "epoch": 1.5319418438984629, "learning_rate": 4.913288448367213e-06, "loss": 2.5104620361328127, "step": 1269600 }, { "epoch": 1.5320625072209457, "learning_rate": 4.912884612899474e-06, "loss": 2.479481506347656, "step": 1269700 }, { "epoch": 1.5321831705434283, "learning_rate": 4.912480777431736e-06, "loss": 2.492684631347656, "step": 1269800 }, { "epoch": 1.5323038338659112, "learning_rate": 4.912076941963997e-06, "loss": 2.49889892578125, "step": 1269900 }, { "epoch": 1.5324244971883938, "learning_rate": 4.911673106496259e-06, "loss": 2.5017967224121094, "step": 1270000 }, { "epoch": 1.5325451605108764, "learning_rate": 4.911269271028521e-06, "loss": 2.4946246337890625, "step": 1270100 }, { "epoch": 1.532665823833359, "learning_rate": 4.910865435560782e-06, "loss": 2.5016018676757814, "step": 1270200 }, { "epoch": 1.5327864871558416, "learning_rate": 4.9104616000930435e-06, "loss": 2.503359527587891, "step": 1270300 }, { "epoch": 1.5329071504783245, "learning_rate": 4.9100577646253055e-06, "loss": 2.477905578613281, "step": 1270400 }, { "epoch": 1.5330278138008073, "learning_rate": 4.9096539291575674e-06, "loss": 2.492481994628906, "step": 1270500 }, { "epoch": 1.53314847712329, "learning_rate": 4.909250093689829e-06, "loss": 2.4863298034667967, "step": 1270600 }, { "epoch": 1.5332691404457726, "learning_rate": 4.9088462582220906e-06, "loss": 2.5362232971191405, "step": 1270700 }, { "epoch": 1.5333898037682552, "learning_rate": 4.908442422754352e-06, "loss": 2.4946139526367186, "step": 1270800 }, { "epoch": 1.5335104670907378, "learning_rate": 4.908038587286614e-06, "loss": 2.512339782714844, "step": 1270900 }, { "epoch": 1.5336311304132206, "learning_rate": 4.907634751818876e-06, "loss": 2.485450897216797, "step": 1271000 }, { "epoch": 1.5337517937357033, "learning_rate": 4.907230916351137e-06, "loss": 2.489241485595703, "step": 1271100 }, { "epoch": 1.533872457058186, "learning_rate": 4.906827080883399e-06, "loss": 2.491172180175781, "step": 1271200 }, { "epoch": 1.5339931203806687, "learning_rate": 4.90642324541566e-06, "loss": 2.4795710754394533, "step": 1271300 }, { "epoch": 1.5341137837031513, "learning_rate": 4.906019409947922e-06, "loss": 2.5133438110351562, "step": 1271400 }, { "epoch": 1.534234447025634, "learning_rate": 4.905615574480184e-06, "loss": 2.5099113464355467, "step": 1271500 }, { "epoch": 1.5343551103481166, "learning_rate": 4.905211739012445e-06, "loss": 2.495746765136719, "step": 1271600 }, { "epoch": 1.5344757736705994, "learning_rate": 4.904807903544707e-06, "loss": 2.49112548828125, "step": 1271700 }, { "epoch": 1.5345964369930822, "learning_rate": 4.904404068076968e-06, "loss": 2.526094970703125, "step": 1271800 }, { "epoch": 1.5347171003155649, "learning_rate": 4.90400023260923e-06, "loss": 2.470639495849609, "step": 1271900 }, { "epoch": 1.5348377636380475, "learning_rate": 4.903596397141491e-06, "loss": 2.4787496948242187, "step": 1272000 }, { "epoch": 1.53495842696053, "learning_rate": 4.903192561673753e-06, "loss": 2.505934143066406, "step": 1272100 }, { "epoch": 1.5350790902830127, "learning_rate": 4.902788726206014e-06, "loss": 2.4963117980957032, "step": 1272200 }, { "epoch": 1.5351997536054955, "learning_rate": 4.902384890738276e-06, "loss": 2.501928253173828, "step": 1272300 }, { "epoch": 1.5353204169279782, "learning_rate": 4.9019810552705375e-06, "loss": 2.49388916015625, "step": 1272400 }, { "epoch": 1.535441080250461, "learning_rate": 4.9015772198027995e-06, "loss": 2.5115786743164064, "step": 1272500 }, { "epoch": 1.5355617435729436, "learning_rate": 4.9011733843350614e-06, "loss": 2.4738200378417967, "step": 1272600 }, { "epoch": 1.5356824068954262, "learning_rate": 4.900769548867323e-06, "loss": 2.490639953613281, "step": 1272700 }, { "epoch": 1.5358030702179089, "learning_rate": 4.900365713399584e-06, "loss": 2.4849415588378907, "step": 1272800 }, { "epoch": 1.5359237335403915, "learning_rate": 4.899961877931846e-06, "loss": 2.504975128173828, "step": 1272900 }, { "epoch": 1.5360443968628743, "learning_rate": 4.899558042464108e-06, "loss": 2.494933776855469, "step": 1273000 }, { "epoch": 1.536165060185357, "learning_rate": 4.89915420699637e-06, "loss": 2.4872257995605467, "step": 1273100 }, { "epoch": 1.5362857235078398, "learning_rate": 4.898750371528631e-06, "loss": 2.4830500793457033, "step": 1273200 }, { "epoch": 1.5364063868303224, "learning_rate": 4.898346536060892e-06, "loss": 2.4937767028808593, "step": 1273300 }, { "epoch": 1.536527050152805, "learning_rate": 4.897942700593154e-06, "loss": 2.51667724609375, "step": 1273400 }, { "epoch": 1.5366477134752876, "learning_rate": 4.897538865125416e-06, "loss": 2.487054443359375, "step": 1273500 }, { "epoch": 1.5367683767977702, "learning_rate": 4.897135029657677e-06, "loss": 2.4494760131835935, "step": 1273600 }, { "epoch": 1.536889040120253, "learning_rate": 4.896731194189939e-06, "loss": 2.4998457336425783, "step": 1273700 }, { "epoch": 1.537009703442736, "learning_rate": 4.8963273587222e-06, "loss": 2.4891983032226563, "step": 1273800 }, { "epoch": 1.5371303667652185, "learning_rate": 4.895923523254462e-06, "loss": 2.504297332763672, "step": 1273900 }, { "epoch": 1.5372510300877011, "learning_rate": 4.895519687786723e-06, "loss": 2.4706036376953127, "step": 1274000 }, { "epoch": 1.5373716934101838, "learning_rate": 4.895115852318985e-06, "loss": 2.4996441650390624, "step": 1274100 }, { "epoch": 1.5374923567326664, "learning_rate": 4.894712016851247e-06, "loss": 2.512734222412109, "step": 1274200 }, { "epoch": 1.5376130200551492, "learning_rate": 4.894308181383508e-06, "loss": 2.49600830078125, "step": 1274300 }, { "epoch": 1.5377336833776318, "learning_rate": 4.8939043459157695e-06, "loss": 2.493125305175781, "step": 1274400 }, { "epoch": 1.5378543467001147, "learning_rate": 4.8935005104480315e-06, "loss": 2.502684783935547, "step": 1274500 }, { "epoch": 1.5379750100225973, "learning_rate": 4.8930966749802935e-06, "loss": 2.4830972290039064, "step": 1274600 }, { "epoch": 1.53809567334508, "learning_rate": 4.892692839512555e-06, "loss": 2.497491912841797, "step": 1274700 }, { "epoch": 1.5382163366675625, "learning_rate": 4.892289004044817e-06, "loss": 2.510290222167969, "step": 1274800 }, { "epoch": 1.5383369999900451, "learning_rate": 4.891885168577078e-06, "loss": 2.4742919921875, "step": 1274900 }, { "epoch": 1.538457663312528, "learning_rate": 4.89148133310934e-06, "loss": 2.465642395019531, "step": 1275000 }, { "epoch": 1.5385783266350106, "learning_rate": 4.891077497641602e-06, "loss": 2.525157928466797, "step": 1275100 }, { "epoch": 1.5386989899574934, "learning_rate": 4.890673662173863e-06, "loss": 2.4683770751953125, "step": 1275200 }, { "epoch": 1.538819653279976, "learning_rate": 4.890269826706124e-06, "loss": 2.4745701599121093, "step": 1275300 }, { "epoch": 1.5389403166024587, "learning_rate": 4.889865991238386e-06, "loss": 2.5008009338378905, "step": 1275400 }, { "epoch": 1.5390609799249413, "learning_rate": 4.889462155770648e-06, "loss": 2.509388122558594, "step": 1275500 }, { "epoch": 1.539181643247424, "learning_rate": 4.889058320302909e-06, "loss": 2.510572967529297, "step": 1275600 }, { "epoch": 1.5393023065699067, "learning_rate": 4.888654484835171e-06, "loss": 2.4816107177734374, "step": 1275700 }, { "epoch": 1.5394229698923896, "learning_rate": 4.888250649367432e-06, "loss": 2.4791824340820314, "step": 1275800 }, { "epoch": 1.5395436332148722, "learning_rate": 4.887846813899694e-06, "loss": 2.485747833251953, "step": 1275900 }, { "epoch": 1.5396642965373548, "learning_rate": 4.887442978431955e-06, "loss": 2.4998855590820312, "step": 1276000 }, { "epoch": 1.5397849598598374, "learning_rate": 4.887039142964217e-06, "loss": 2.482968597412109, "step": 1276100 }, { "epoch": 1.53990562318232, "learning_rate": 4.886635307496479e-06, "loss": 2.490679168701172, "step": 1276200 }, { "epoch": 1.5400262865048029, "learning_rate": 4.88623147202874e-06, "loss": 2.5017303466796874, "step": 1276300 }, { "epoch": 1.5401469498272855, "learning_rate": 4.8858276365610015e-06, "loss": 2.4943505859375, "step": 1276400 }, { "epoch": 1.5402676131497683, "learning_rate": 4.8854238010932635e-06, "loss": 2.503603210449219, "step": 1276500 }, { "epoch": 1.540388276472251, "learning_rate": 4.8850199656255255e-06, "loss": 2.511887969970703, "step": 1276600 }, { "epoch": 1.5405089397947336, "learning_rate": 4.8846161301577875e-06, "loss": 2.4848533630371095, "step": 1276700 }, { "epoch": 1.5406296031172162, "learning_rate": 4.884212294690049e-06, "loss": 2.491715393066406, "step": 1276800 }, { "epoch": 1.5407502664396988, "learning_rate": 4.88380845922231e-06, "loss": 2.4861207580566407, "step": 1276900 }, { "epoch": 1.5408709297621817, "learning_rate": 4.883404623754572e-06, "loss": 2.4942701721191405, "step": 1277000 }, { "epoch": 1.5409915930846645, "learning_rate": 4.883000788286834e-06, "loss": 2.490106201171875, "step": 1277100 }, { "epoch": 1.541112256407147, "learning_rate": 4.882596952819096e-06, "loss": 2.521964416503906, "step": 1277200 }, { "epoch": 1.5412329197296297, "learning_rate": 4.882193117351357e-06, "loss": 2.4999134826660154, "step": 1277300 }, { "epoch": 1.5413535830521123, "learning_rate": 4.881789281883618e-06, "loss": 2.478329620361328, "step": 1277400 }, { "epoch": 1.541474246374595, "learning_rate": 4.88138544641588e-06, "loss": 2.470705261230469, "step": 1277500 }, { "epoch": 1.5415949096970778, "learning_rate": 4.880981610948142e-06, "loss": 2.491669921875, "step": 1277600 }, { "epoch": 1.5417155730195604, "learning_rate": 4.880577775480403e-06, "loss": 2.4831935119628907, "step": 1277700 }, { "epoch": 1.5418362363420433, "learning_rate": 4.880173940012665e-06, "loss": 2.484986114501953, "step": 1277800 }, { "epoch": 1.5419568996645259, "learning_rate": 4.879770104544926e-06, "loss": 2.466482696533203, "step": 1277900 }, { "epoch": 1.5420775629870085, "learning_rate": 4.879366269077188e-06, "loss": 2.4870391845703126, "step": 1278000 }, { "epoch": 1.542198226309491, "learning_rate": 4.878962433609449e-06, "loss": 2.5046762084960936, "step": 1278100 }, { "epoch": 1.5423188896319737, "learning_rate": 4.878558598141711e-06, "loss": 2.473502197265625, "step": 1278200 }, { "epoch": 1.5424395529544566, "learning_rate": 4.878154762673972e-06, "loss": 2.4899411010742187, "step": 1278300 }, { "epoch": 1.5425602162769392, "learning_rate": 4.877750927206234e-06, "loss": 2.4817185974121094, "step": 1278400 }, { "epoch": 1.542680879599422, "learning_rate": 4.8773470917384955e-06, "loss": 2.504886474609375, "step": 1278500 }, { "epoch": 1.5428015429219046, "learning_rate": 4.8769432562707575e-06, "loss": 2.4926078796386717, "step": 1278600 }, { "epoch": 1.5429222062443873, "learning_rate": 4.8765394208030195e-06, "loss": 2.473824005126953, "step": 1278700 }, { "epoch": 1.5430428695668699, "learning_rate": 4.876135585335281e-06, "loss": 2.492126770019531, "step": 1278800 }, { "epoch": 1.5431635328893525, "learning_rate": 4.875731749867542e-06, "loss": 2.487310485839844, "step": 1278900 }, { "epoch": 1.5432841962118353, "learning_rate": 4.875327914399804e-06, "loss": 2.483846893310547, "step": 1279000 }, { "epoch": 1.5434048595343182, "learning_rate": 4.874924078932066e-06, "loss": 2.513008728027344, "step": 1279100 }, { "epoch": 1.5435255228568008, "learning_rate": 4.874520243464328e-06, "loss": 2.4894818115234374, "step": 1279200 }, { "epoch": 1.5436461861792834, "learning_rate": 4.874116407996589e-06, "loss": 2.488683776855469, "step": 1279300 }, { "epoch": 1.543766849501766, "learning_rate": 4.87371257252885e-06, "loss": 2.4831585693359375, "step": 1279400 }, { "epoch": 1.5438875128242486, "learning_rate": 4.873308737061112e-06, "loss": 2.5100038146972654, "step": 1279500 }, { "epoch": 1.5440081761467315, "learning_rate": 4.872904901593374e-06, "loss": 2.489293518066406, "step": 1279600 }, { "epoch": 1.544128839469214, "learning_rate": 4.872501066125635e-06, "loss": 2.4731791687011717, "step": 1279700 }, { "epoch": 1.544249502791697, "learning_rate": 4.872097230657897e-06, "loss": 2.495472717285156, "step": 1279800 }, { "epoch": 1.5443701661141795, "learning_rate": 4.871693395190158e-06, "loss": 2.4950267028808595, "step": 1279900 }, { "epoch": 1.5444908294366622, "learning_rate": 4.87128955972242e-06, "loss": 2.4808035278320313, "step": 1280000 }, { "epoch": 1.5446114927591448, "learning_rate": 4.870885724254681e-06, "loss": 2.5013883972167967, "step": 1280100 }, { "epoch": 1.5447321560816274, "learning_rate": 4.870481888786943e-06, "loss": 2.5162371826171874, "step": 1280200 }, { "epoch": 1.5448528194041102, "learning_rate": 4.870078053319205e-06, "loss": 2.495941467285156, "step": 1280300 }, { "epoch": 1.5449734827265929, "learning_rate": 4.8696742178514664e-06, "loss": 2.4955091857910157, "step": 1280400 }, { "epoch": 1.5450941460490757, "learning_rate": 4.8692703823837276e-06, "loss": 2.5183981323242186, "step": 1280500 }, { "epoch": 1.5452148093715583, "learning_rate": 4.8688665469159895e-06, "loss": 2.4973443603515624, "step": 1280600 }, { "epoch": 1.545335472694041, "learning_rate": 4.8684627114482515e-06, "loss": 2.4754148864746095, "step": 1280700 }, { "epoch": 1.5454561360165235, "learning_rate": 4.868058875980513e-06, "loss": 2.494956817626953, "step": 1280800 }, { "epoch": 1.5455767993390062, "learning_rate": 4.867655040512775e-06, "loss": 2.476497802734375, "step": 1280900 }, { "epoch": 1.545697462661489, "learning_rate": 4.867251205045036e-06, "loss": 2.4869453430175783, "step": 1281000 }, { "epoch": 1.5458181259839718, "learning_rate": 4.866847369577298e-06, "loss": 2.498490905761719, "step": 1281100 }, { "epoch": 1.5459387893064545, "learning_rate": 4.86644353410956e-06, "loss": 2.484394073486328, "step": 1281200 }, { "epoch": 1.546059452628937, "learning_rate": 4.866039698641821e-06, "loss": 2.5114259338378906, "step": 1281300 }, { "epoch": 1.5461801159514197, "learning_rate": 4.865635863174082e-06, "loss": 2.5152876281738283, "step": 1281400 }, { "epoch": 1.5463007792739023, "learning_rate": 4.865232027706344e-06, "loss": 2.471036376953125, "step": 1281500 }, { "epoch": 1.5464214425963851, "learning_rate": 4.864828192238606e-06, "loss": 2.512162780761719, "step": 1281600 }, { "epoch": 1.5465421059188678, "learning_rate": 4.864424356770868e-06, "loss": 2.471495361328125, "step": 1281700 }, { "epoch": 1.5466627692413506, "learning_rate": 4.864020521303129e-06, "loss": 2.47367919921875, "step": 1281800 }, { "epoch": 1.5467834325638332, "learning_rate": 4.86361668583539e-06, "loss": 2.4885997009277343, "step": 1281900 }, { "epoch": 1.5469040958863158, "learning_rate": 4.863212850367652e-06, "loss": 2.52360107421875, "step": 1282000 }, { "epoch": 1.5470247592087985, "learning_rate": 4.862809014899914e-06, "loss": 2.469508056640625, "step": 1282100 }, { "epoch": 1.547145422531281, "learning_rate": 4.862405179432175e-06, "loss": 2.505250244140625, "step": 1282200 }, { "epoch": 1.547266085853764, "learning_rate": 4.862001343964437e-06, "loss": 2.497932891845703, "step": 1282300 }, { "epoch": 1.5473867491762467, "learning_rate": 4.8615975084966985e-06, "loss": 2.4672491455078127, "step": 1282400 }, { "epoch": 1.5475074124987294, "learning_rate": 4.8611936730289604e-06, "loss": 2.4977867126464846, "step": 1282500 }, { "epoch": 1.547628075821212, "learning_rate": 4.8607898375612216e-06, "loss": 2.4934132385253904, "step": 1282600 }, { "epoch": 1.5477487391436946, "learning_rate": 4.8603860020934836e-06, "loss": 2.4748603820800783, "step": 1282700 }, { "epoch": 1.5478694024661772, "learning_rate": 4.8599821666257455e-06, "loss": 2.482781982421875, "step": 1282800 }, { "epoch": 1.54799006578866, "learning_rate": 4.859578331158007e-06, "loss": 2.486691741943359, "step": 1282900 }, { "epoch": 1.5481107291111427, "learning_rate": 4.859174495690268e-06, "loss": 2.5049197387695314, "step": 1283000 }, { "epoch": 1.5482313924336255, "learning_rate": 4.85877066022253e-06, "loss": 2.497084503173828, "step": 1283100 }, { "epoch": 1.5483520557561081, "learning_rate": 4.858366824754792e-06, "loss": 2.5364466857910157, "step": 1283200 }, { "epoch": 1.5484727190785907, "learning_rate": 4.857962989287054e-06, "loss": 2.479705810546875, "step": 1283300 }, { "epoch": 1.5485933824010734, "learning_rate": 4.857559153819315e-06, "loss": 2.480856170654297, "step": 1283400 }, { "epoch": 1.548714045723556, "learning_rate": 4.857155318351576e-06, "loss": 2.4902203369140623, "step": 1283500 }, { "epoch": 1.5488347090460388, "learning_rate": 4.856751482883838e-06, "loss": 2.509990692138672, "step": 1283600 }, { "epoch": 1.5489553723685214, "learning_rate": 4.8563476474161e-06, "loss": 2.5245315551757814, "step": 1283700 }, { "epoch": 1.5490760356910043, "learning_rate": 4.855943811948361e-06, "loss": 2.4905108642578124, "step": 1283800 }, { "epoch": 1.5491966990134869, "learning_rate": 4.855539976480623e-06, "loss": 2.5090266418457032, "step": 1283900 }, { "epoch": 1.5493173623359695, "learning_rate": 4.855136141012884e-06, "loss": 2.5103741455078126, "step": 1284000 }, { "epoch": 1.5494380256584521, "learning_rate": 4.854732305545146e-06, "loss": 2.486162567138672, "step": 1284100 }, { "epoch": 1.5495586889809347, "learning_rate": 4.854328470077407e-06, "loss": 2.4844219970703123, "step": 1284200 }, { "epoch": 1.5496793523034176, "learning_rate": 4.853924634609669e-06, "loss": 2.5007374572753904, "step": 1284300 }, { "epoch": 1.5498000156259004, "learning_rate": 4.8535207991419305e-06, "loss": 2.485745544433594, "step": 1284400 }, { "epoch": 1.549920678948383, "learning_rate": 4.8531169636741925e-06, "loss": 2.4710319519042967, "step": 1284500 }, { "epoch": 1.5500413422708657, "learning_rate": 4.852713128206454e-06, "loss": 2.47193359375, "step": 1284600 }, { "epoch": 1.5501620055933483, "learning_rate": 4.852309292738716e-06, "loss": 2.4685400390625, "step": 1284700 }, { "epoch": 1.5502826689158309, "learning_rate": 4.8519054572709776e-06, "loss": 2.5064039611816407, "step": 1284800 }, { "epoch": 1.5504033322383137, "learning_rate": 4.851501621803239e-06, "loss": 2.510008544921875, "step": 1284900 }, { "epoch": 1.5505239955607963, "learning_rate": 4.8510977863355e-06, "loss": 2.4669850158691404, "step": 1285000 }, { "epoch": 1.5506446588832792, "learning_rate": 4.850693950867762e-06, "loss": 2.4734013366699217, "step": 1285100 }, { "epoch": 1.5507653222057618, "learning_rate": 4.850290115400024e-06, "loss": 2.451685028076172, "step": 1285200 }, { "epoch": 1.5508859855282444, "learning_rate": 4.849886279932286e-06, "loss": 2.4794322204589845, "step": 1285300 }, { "epoch": 1.551006648850727, "learning_rate": 4.849482444464547e-06, "loss": 2.475877532958984, "step": 1285400 }, { "epoch": 1.5511273121732096, "learning_rate": 4.849078608996808e-06, "loss": 2.5111024475097654, "step": 1285500 }, { "epoch": 1.5512479754956925, "learning_rate": 4.84867477352907e-06, "loss": 2.5000679016113283, "step": 1285600 }, { "epoch": 1.551368638818175, "learning_rate": 4.848270938061332e-06, "loss": 2.494967346191406, "step": 1285700 }, { "epoch": 1.551489302140658, "learning_rate": 4.847867102593593e-06, "loss": 2.4951148986816407, "step": 1285800 }, { "epoch": 1.5516099654631406, "learning_rate": 4.847463267125855e-06, "loss": 2.5058241271972657, "step": 1285900 }, { "epoch": 1.5517306287856232, "learning_rate": 4.847059431658116e-06, "loss": 2.5017852783203125, "step": 1286000 }, { "epoch": 1.5518512921081058, "learning_rate": 4.846655596190378e-06, "loss": 2.52650146484375, "step": 1286100 }, { "epoch": 1.5519719554305884, "learning_rate": 4.846251760722639e-06, "loss": 2.491796112060547, "step": 1286200 }, { "epoch": 1.5520926187530713, "learning_rate": 4.845847925254901e-06, "loss": 2.5005458068847655, "step": 1286300 }, { "epoch": 1.552213282075554, "learning_rate": 4.845444089787163e-06, "loss": 2.492237854003906, "step": 1286400 }, { "epoch": 1.5523339453980367, "learning_rate": 4.8450402543194245e-06, "loss": 2.508478698730469, "step": 1286500 }, { "epoch": 1.5524546087205193, "learning_rate": 4.844636418851686e-06, "loss": 2.4992601013183595, "step": 1286600 }, { "epoch": 1.552575272043002, "learning_rate": 4.844232583383948e-06, "loss": 2.503543701171875, "step": 1286700 }, { "epoch": 1.5526959353654846, "learning_rate": 4.84382874791621e-06, "loss": 2.4955265808105467, "step": 1286800 }, { "epoch": 1.5528165986879674, "learning_rate": 4.843424912448471e-06, "loss": 2.496526641845703, "step": 1286900 }, { "epoch": 1.55293726201045, "learning_rate": 4.843021076980733e-06, "loss": 2.4752268981933594, "step": 1287000 }, { "epoch": 1.5530579253329329, "learning_rate": 4.842617241512994e-06, "loss": 2.482548828125, "step": 1287100 }, { "epoch": 1.5531785886554155, "learning_rate": 4.842213406045256e-06, "loss": 2.493888244628906, "step": 1287200 }, { "epoch": 1.553299251977898, "learning_rate": 4.841809570577518e-06, "loss": 2.5061935424804687, "step": 1287300 }, { "epoch": 1.5534199153003807, "learning_rate": 4.841405735109779e-06, "loss": 2.48722900390625, "step": 1287400 }, { "epoch": 1.5535405786228633, "learning_rate": 4.84100189964204e-06, "loss": 2.5087750244140623, "step": 1287500 }, { "epoch": 1.5536612419453462, "learning_rate": 4.840598064174302e-06, "loss": 2.499090118408203, "step": 1287600 }, { "epoch": 1.553781905267829, "learning_rate": 4.840194228706564e-06, "loss": 2.5012722778320313, "step": 1287700 }, { "epoch": 1.5539025685903116, "learning_rate": 4.839790393238826e-06, "loss": 2.4933676147460937, "step": 1287800 }, { "epoch": 1.5540232319127942, "learning_rate": 4.839386557771087e-06, "loss": 2.4971049499511717, "step": 1287900 }, { "epoch": 1.5541438952352769, "learning_rate": 4.838982722303348e-06, "loss": 2.5187940979003907, "step": 1288000 }, { "epoch": 1.5542645585577595, "learning_rate": 4.83857888683561e-06, "loss": 2.492769927978516, "step": 1288100 }, { "epoch": 1.5543852218802423, "learning_rate": 4.838175051367872e-06, "loss": 2.5119874572753904, "step": 1288200 }, { "epoch": 1.554505885202725, "learning_rate": 4.837771215900133e-06, "loss": 2.4833729553222654, "step": 1288300 }, { "epoch": 1.5546265485252078, "learning_rate": 4.837367380432395e-06, "loss": 2.488302459716797, "step": 1288400 }, { "epoch": 1.5547472118476904, "learning_rate": 4.8369635449646565e-06, "loss": 2.4874697875976564, "step": 1288500 }, { "epoch": 1.554867875170173, "learning_rate": 4.8365597094969185e-06, "loss": 2.527047882080078, "step": 1288600 }, { "epoch": 1.5549885384926556, "learning_rate": 4.83615587402918e-06, "loss": 2.483091125488281, "step": 1288700 }, { "epoch": 1.5551092018151382, "learning_rate": 4.835752038561442e-06, "loss": 2.4821568298339844, "step": 1288800 }, { "epoch": 1.555229865137621, "learning_rate": 4.835348203093704e-06, "loss": 2.4824281311035157, "step": 1288900 }, { "epoch": 1.5553505284601037, "learning_rate": 4.834944367625965e-06, "loss": 2.5178341674804687, "step": 1289000 }, { "epoch": 1.5554711917825865, "learning_rate": 4.834540532158226e-06, "loss": 2.495120849609375, "step": 1289100 }, { "epoch": 1.5555918551050691, "learning_rate": 4.834136696690488e-06, "loss": 2.4892762756347655, "step": 1289200 }, { "epoch": 1.5557125184275518, "learning_rate": 4.83373286122275e-06, "loss": 2.505875701904297, "step": 1289300 }, { "epoch": 1.5558331817500344, "learning_rate": 4.833329025755012e-06, "loss": 2.527782135009766, "step": 1289400 }, { "epoch": 1.555953845072517, "learning_rate": 4.832925190287273e-06, "loss": 2.508526153564453, "step": 1289500 }, { "epoch": 1.5560745083949998, "learning_rate": 4.832521354819534e-06, "loss": 2.490819549560547, "step": 1289600 }, { "epoch": 1.5561951717174827, "learning_rate": 4.832117519351796e-06, "loss": 2.507454833984375, "step": 1289700 }, { "epoch": 1.5563158350399653, "learning_rate": 4.831713683884058e-06, "loss": 2.481700897216797, "step": 1289800 }, { "epoch": 1.556436498362448, "learning_rate": 4.831309848416319e-06, "loss": 2.4889068603515625, "step": 1289900 }, { "epoch": 1.5565571616849305, "learning_rate": 4.830906012948581e-06, "loss": 2.504069519042969, "step": 1290000 }, { "epoch": 1.5566778250074131, "learning_rate": 4.830502177480842e-06, "loss": 2.4819195556640623, "step": 1290100 }, { "epoch": 1.556798488329896, "learning_rate": 4.830098342013104e-06, "loss": 2.461143341064453, "step": 1290200 }, { "epoch": 1.5569191516523786, "learning_rate": 4.8296945065453654e-06, "loss": 2.50377197265625, "step": 1290300 }, { "epoch": 1.5570398149748614, "learning_rate": 4.829290671077627e-06, "loss": 2.4872027587890626, "step": 1290400 }, { "epoch": 1.557160478297344, "learning_rate": 4.8288868356098885e-06, "loss": 2.4742364501953125, "step": 1290500 }, { "epoch": 1.5572811416198267, "learning_rate": 4.8284830001421505e-06, "loss": 2.4860600280761718, "step": 1290600 }, { "epoch": 1.5574018049423093, "learning_rate": 4.828079164674412e-06, "loss": 2.4985385131835938, "step": 1290700 }, { "epoch": 1.557522468264792, "learning_rate": 4.827675329206674e-06, "loss": 2.4971551513671875, "step": 1290800 }, { "epoch": 1.5576431315872747, "learning_rate": 4.827271493738936e-06, "loss": 2.506203918457031, "step": 1290900 }, { "epoch": 1.5577637949097574, "learning_rate": 4.826867658271197e-06, "loss": 2.4966578674316406, "step": 1291000 }, { "epoch": 1.5578844582322402, "learning_rate": 4.826463822803458e-06, "loss": 2.4831614685058594, "step": 1291100 }, { "epoch": 1.5580051215547228, "learning_rate": 4.82605998733572e-06, "loss": 2.4873939514160157, "step": 1291200 }, { "epoch": 1.5581257848772054, "learning_rate": 4.825656151867982e-06, "loss": 2.50049072265625, "step": 1291300 }, { "epoch": 1.558246448199688, "learning_rate": 4.825252316400244e-06, "loss": 2.5235997009277344, "step": 1291400 }, { "epoch": 1.5583671115221707, "learning_rate": 4.824848480932505e-06, "loss": 2.506730194091797, "step": 1291500 }, { "epoch": 1.5584877748446535, "learning_rate": 4.824444645464766e-06, "loss": 2.5087101745605467, "step": 1291600 }, { "epoch": 1.5586084381671363, "learning_rate": 4.824040809997028e-06, "loss": 2.494837646484375, "step": 1291700 }, { "epoch": 1.558729101489619, "learning_rate": 4.82363697452929e-06, "loss": 2.4703643798828123, "step": 1291800 }, { "epoch": 1.5588497648121016, "learning_rate": 4.823233139061551e-06, "loss": 2.5067344665527345, "step": 1291900 }, { "epoch": 1.5589704281345842, "learning_rate": 4.822829303593813e-06, "loss": 2.496518859863281, "step": 1292000 }, { "epoch": 1.5590910914570668, "learning_rate": 4.822425468126074e-06, "loss": 2.4858609008789063, "step": 1292100 }, { "epoch": 1.5592117547795497, "learning_rate": 4.822021632658336e-06, "loss": 2.4956239318847655, "step": 1292200 }, { "epoch": 1.5593324181020323, "learning_rate": 4.821617797190598e-06, "loss": 2.489368133544922, "step": 1292300 }, { "epoch": 1.559453081424515, "learning_rate": 4.8212139617228594e-06, "loss": 2.4867340087890626, "step": 1292400 }, { "epoch": 1.5595737447469977, "learning_rate": 4.820810126255121e-06, "loss": 2.5095257568359375, "step": 1292500 }, { "epoch": 1.5596944080694803, "learning_rate": 4.8204062907873825e-06, "loss": 2.4930714416503905, "step": 1292600 }, { "epoch": 1.559815071391963, "learning_rate": 4.8200024553196445e-06, "loss": 2.4683055114746093, "step": 1292700 }, { "epoch": 1.5599357347144456, "learning_rate": 4.819598619851906e-06, "loss": 2.503040771484375, "step": 1292800 }, { "epoch": 1.5600563980369284, "learning_rate": 4.819194784384168e-06, "loss": 2.483470764160156, "step": 1292900 }, { "epoch": 1.5601770613594113, "learning_rate": 4.818790948916429e-06, "loss": 2.518343811035156, "step": 1293000 }, { "epoch": 1.5602977246818939, "learning_rate": 4.818387113448691e-06, "loss": 2.5004786682128906, "step": 1293100 }, { "epoch": 1.5604183880043765, "learning_rate": 4.817983277980952e-06, "loss": 2.519151306152344, "step": 1293200 }, { "epoch": 1.560539051326859, "learning_rate": 4.817579442513214e-06, "loss": 2.4939671325683594, "step": 1293300 }, { "epoch": 1.5606597146493417, "learning_rate": 4.817175607045476e-06, "loss": 2.5092654418945313, "step": 1293400 }, { "epoch": 1.5607803779718246, "learning_rate": 4.816771771577737e-06, "loss": 2.4817291259765626, "step": 1293500 }, { "epoch": 1.5609010412943072, "learning_rate": 4.816367936109998e-06, "loss": 2.4903054809570313, "step": 1293600 }, { "epoch": 1.56102170461679, "learning_rate": 4.81596410064226e-06, "loss": 2.496546630859375, "step": 1293700 }, { "epoch": 1.5611423679392726, "learning_rate": 4.815560265174522e-06, "loss": 2.500053253173828, "step": 1293800 }, { "epoch": 1.5612630312617553, "learning_rate": 4.815156429706784e-06, "loss": 2.503920440673828, "step": 1293900 }, { "epoch": 1.5613836945842379, "learning_rate": 4.814752594239045e-06, "loss": 2.4830067443847654, "step": 1294000 }, { "epoch": 1.5615043579067205, "learning_rate": 4.814348758771306e-06, "loss": 2.4840164184570312, "step": 1294100 }, { "epoch": 1.5616250212292033, "learning_rate": 4.813944923303568e-06, "loss": 2.4787086486816405, "step": 1294200 }, { "epoch": 1.561745684551686, "learning_rate": 4.81354108783583e-06, "loss": 2.467271575927734, "step": 1294300 }, { "epoch": 1.5618663478741688, "learning_rate": 4.8131372523680915e-06, "loss": 2.4945167541503905, "step": 1294400 }, { "epoch": 1.5619870111966514, "learning_rate": 4.8127334169003534e-06, "loss": 2.4854335021972656, "step": 1294500 }, { "epoch": 1.562107674519134, "learning_rate": 4.8123295814326146e-06, "loss": 2.4844146728515626, "step": 1294600 }, { "epoch": 1.5622283378416166, "learning_rate": 4.8119257459648766e-06, "loss": 2.4772152709960937, "step": 1294700 }, { "epoch": 1.5623490011640992, "learning_rate": 4.811521910497138e-06, "loss": 2.4626080322265627, "step": 1294800 }, { "epoch": 1.562469664486582, "learning_rate": 4.8111180750294e-06, "loss": 2.458376922607422, "step": 1294900 }, { "epoch": 1.562590327809065, "learning_rate": 4.810714239561662e-06, "loss": 2.4800489807128905, "step": 1295000 }, { "epoch": 1.5627109911315475, "learning_rate": 4.810310404093923e-06, "loss": 2.4690049743652343, "step": 1295100 }, { "epoch": 1.5628316544540302, "learning_rate": 4.809906568626184e-06, "loss": 2.492634582519531, "step": 1295200 }, { "epoch": 1.5629523177765128, "learning_rate": 4.809502733158446e-06, "loss": 2.4935426330566406, "step": 1295300 }, { "epoch": 1.5630729810989954, "learning_rate": 4.809098897690708e-06, "loss": 2.493988342285156, "step": 1295400 }, { "epoch": 1.5631936444214782, "learning_rate": 4.808695062222969e-06, "loss": 2.4882797241210937, "step": 1295500 }, { "epoch": 1.5633143077439609, "learning_rate": 4.808291226755231e-06, "loss": 2.4788926696777343, "step": 1295600 }, { "epoch": 1.5634349710664437, "learning_rate": 4.807887391287492e-06, "loss": 2.498726654052734, "step": 1295700 }, { "epoch": 1.5635556343889263, "learning_rate": 4.807483555819754e-06, "loss": 2.4894017028808593, "step": 1295800 }, { "epoch": 1.563676297711409, "learning_rate": 4.807079720352016e-06, "loss": 2.4674617004394532, "step": 1295900 }, { "epoch": 1.5637969610338915, "learning_rate": 4.806675884884277e-06, "loss": 2.4902517700195315, "step": 1296000 }, { "epoch": 1.5639176243563742, "learning_rate": 4.806272049416538e-06, "loss": 2.500845947265625, "step": 1296100 }, { "epoch": 1.564038287678857, "learning_rate": 4.8058682139488e-06, "loss": 2.4694509887695313, "step": 1296200 }, { "epoch": 1.5641589510013396, "learning_rate": 4.805464378481062e-06, "loss": 2.480707244873047, "step": 1296300 }, { "epoch": 1.5642796143238225, "learning_rate": 4.8050605430133235e-06, "loss": 2.5159693908691407, "step": 1296400 }, { "epoch": 1.564400277646305, "learning_rate": 4.8046567075455855e-06, "loss": 2.48404541015625, "step": 1296500 }, { "epoch": 1.5645209409687877, "learning_rate": 4.804252872077847e-06, "loss": 2.4932516479492186, "step": 1296600 }, { "epoch": 1.5646416042912703, "learning_rate": 4.803849036610109e-06, "loss": 2.4845626831054686, "step": 1296700 }, { "epoch": 1.564762267613753, "learning_rate": 4.80344520114237e-06, "loss": 2.4749407958984375, "step": 1296800 }, { "epoch": 1.5648829309362358, "learning_rate": 4.803041365674632e-06, "loss": 2.519895324707031, "step": 1296900 }, { "epoch": 1.5650035942587186, "learning_rate": 4.802637530206894e-06, "loss": 2.5034494018554687, "step": 1297000 }, { "epoch": 1.5651242575812012, "learning_rate": 4.802233694739155e-06, "loss": 2.519830322265625, "step": 1297100 }, { "epoch": 1.5652449209036838, "learning_rate": 4.801829859271417e-06, "loss": 2.49449462890625, "step": 1297200 }, { "epoch": 1.5653655842261665, "learning_rate": 4.801426023803678e-06, "loss": 2.495801544189453, "step": 1297300 }, { "epoch": 1.565486247548649, "learning_rate": 4.80102218833594e-06, "loss": 2.499811706542969, "step": 1297400 }, { "epoch": 1.565606910871132, "learning_rate": 4.800618352868202e-06, "loss": 2.484560699462891, "step": 1297500 }, { "epoch": 1.5657275741936145, "learning_rate": 4.800214517400463e-06, "loss": 2.5110719299316404, "step": 1297600 }, { "epoch": 1.5658482375160974, "learning_rate": 4.799810681932724e-06, "loss": 2.4862757873535157, "step": 1297700 }, { "epoch": 1.56596890083858, "learning_rate": 4.799406846464986e-06, "loss": 2.4623451232910156, "step": 1297800 }, { "epoch": 1.5660895641610626, "learning_rate": 4.799003010997248e-06, "loss": 2.4928382873535155, "step": 1297900 }, { "epoch": 1.5662102274835452, "learning_rate": 4.79859917552951e-06, "loss": 2.5068634033203123, "step": 1298000 }, { "epoch": 1.5663308908060278, "learning_rate": 4.798195340061771e-06, "loss": 2.497688903808594, "step": 1298100 }, { "epoch": 1.5664515541285107, "learning_rate": 4.797791504594032e-06, "loss": 2.47777587890625, "step": 1298200 }, { "epoch": 1.5665722174509935, "learning_rate": 4.797387669126294e-06, "loss": 2.5249870300292967, "step": 1298300 }, { "epoch": 1.5666928807734761, "learning_rate": 4.796983833658556e-06, "loss": 2.479043273925781, "step": 1298400 }, { "epoch": 1.5668135440959587, "learning_rate": 4.7965799981908175e-06, "loss": 2.4992320251464846, "step": 1298500 }, { "epoch": 1.5669342074184414, "learning_rate": 4.7961761627230795e-06, "loss": 2.487056884765625, "step": 1298600 }, { "epoch": 1.567054870740924, "learning_rate": 4.795772327255341e-06, "loss": 2.5318035888671875, "step": 1298700 }, { "epoch": 1.5671755340634068, "learning_rate": 4.795368491787603e-06, "loss": 2.4855906677246096, "step": 1298800 }, { "epoch": 1.5672961973858894, "learning_rate": 4.794964656319864e-06, "loss": 2.5251705932617186, "step": 1298900 }, { "epoch": 1.5674168607083723, "learning_rate": 4.794560820852126e-06, "loss": 2.471475372314453, "step": 1299000 }, { "epoch": 1.567537524030855, "learning_rate": 4.794156985384387e-06, "loss": 2.4795718383789063, "step": 1299100 }, { "epoch": 1.5676581873533375, "learning_rate": 4.793753149916649e-06, "loss": 2.492736358642578, "step": 1299200 }, { "epoch": 1.5677788506758201, "learning_rate": 4.79334931444891e-06, "loss": 2.5007968139648438, "step": 1299300 }, { "epoch": 1.5678995139983027, "learning_rate": 4.792945478981172e-06, "loss": 2.514300537109375, "step": 1299400 }, { "epoch": 1.5680201773207856, "learning_rate": 4.792541643513434e-06, "loss": 2.518082580566406, "step": 1299500 }, { "epoch": 1.5681408406432682, "learning_rate": 4.792137808045695e-06, "loss": 2.4864649963378906, "step": 1299600 }, { "epoch": 1.568261503965751, "learning_rate": 4.791733972577956e-06, "loss": 2.4756707763671875, "step": 1299700 }, { "epoch": 1.5683821672882337, "learning_rate": 4.791330137110218e-06, "loss": 2.502603302001953, "step": 1299800 }, { "epoch": 1.5685028306107163, "learning_rate": 4.79092630164248e-06, "loss": 2.4991522216796875, "step": 1299900 }, { "epoch": 1.5686234939331989, "learning_rate": 4.790522466174742e-06, "loss": 2.522489013671875, "step": 1300000 }, { "epoch": 1.5687441572556815, "learning_rate": 4.790118630707003e-06, "loss": 2.4936741638183593, "step": 1300100 }, { "epoch": 1.5688648205781643, "learning_rate": 4.789714795239264e-06, "loss": 2.465619659423828, "step": 1300200 }, { "epoch": 1.5689854839006472, "learning_rate": 4.789310959771526e-06, "loss": 2.4884965515136717, "step": 1300300 }, { "epoch": 1.5691061472231298, "learning_rate": 4.788907124303788e-06, "loss": 2.4830145263671874, "step": 1300400 }, { "epoch": 1.5692268105456124, "learning_rate": 4.7885032888360495e-06, "loss": 2.4942976379394532, "step": 1300500 }, { "epoch": 1.569347473868095, "learning_rate": 4.7880994533683115e-06, "loss": 2.476404113769531, "step": 1300600 }, { "epoch": 1.5694681371905777, "learning_rate": 4.787695617900573e-06, "loss": 2.4983192443847657, "step": 1300700 }, { "epoch": 1.5695888005130605, "learning_rate": 4.787291782432835e-06, "loss": 2.4745579528808594, "step": 1300800 }, { "epoch": 1.569709463835543, "learning_rate": 4.786887946965096e-06, "loss": 2.497147216796875, "step": 1300900 }, { "epoch": 1.569830127158026, "learning_rate": 4.786484111497358e-06, "loss": 2.485861968994141, "step": 1301000 }, { "epoch": 1.5699507904805086, "learning_rate": 4.78608027602962e-06, "loss": 2.4858160400390625, "step": 1301100 }, { "epoch": 1.5700714538029912, "learning_rate": 4.785676440561881e-06, "loss": 2.468569030761719, "step": 1301200 }, { "epoch": 1.5701921171254738, "learning_rate": 4.785272605094142e-06, "loss": 2.478039093017578, "step": 1301300 }, { "epoch": 1.5703127804479564, "learning_rate": 4.784868769626404e-06, "loss": 2.5068844604492186, "step": 1301400 }, { "epoch": 1.5704334437704393, "learning_rate": 4.784464934158666e-06, "loss": 2.485091094970703, "step": 1301500 }, { "epoch": 1.5705541070929219, "learning_rate": 4.784061098690927e-06, "loss": 2.4979966735839843, "step": 1301600 }, { "epoch": 1.5706747704154047, "learning_rate": 4.783657263223189e-06, "loss": 2.486697540283203, "step": 1301700 }, { "epoch": 1.5707954337378873, "learning_rate": 4.78325342775545e-06, "loss": 2.4980197143554688, "step": 1301800 }, { "epoch": 1.57091609706037, "learning_rate": 4.782849592287712e-06, "loss": 2.476601257324219, "step": 1301900 }, { "epoch": 1.5710367603828526, "learning_rate": 4.782445756819974e-06, "loss": 2.4745738220214846, "step": 1302000 }, { "epoch": 1.5711574237053352, "learning_rate": 4.782041921352235e-06, "loss": 2.4834947204589843, "step": 1302100 }, { "epoch": 1.571278087027818, "learning_rate": 4.7816380858844964e-06, "loss": 2.4702853393554687, "step": 1302200 }, { "epoch": 1.5713987503503009, "learning_rate": 4.7812342504167584e-06, "loss": 2.490994873046875, "step": 1302300 }, { "epoch": 1.5715194136727835, "learning_rate": 4.78083041494902e-06, "loss": 2.484151611328125, "step": 1302400 }, { "epoch": 1.571640076995266, "learning_rate": 4.780426579481282e-06, "loss": 2.478956298828125, "step": 1302500 }, { "epoch": 1.5717607403177487, "learning_rate": 4.7800227440135435e-06, "loss": 2.478139190673828, "step": 1302600 }, { "epoch": 1.5718814036402313, "learning_rate": 4.779618908545805e-06, "loss": 2.5013690185546875, "step": 1302700 }, { "epoch": 1.5720020669627142, "learning_rate": 4.779215073078067e-06, "loss": 2.516806640625, "step": 1302800 }, { "epoch": 1.5721227302851968, "learning_rate": 4.778811237610329e-06, "loss": 2.4840707397460937, "step": 1302900 }, { "epoch": 1.5722433936076796, "learning_rate": 4.77840740214259e-06, "loss": 2.478809356689453, "step": 1303000 }, { "epoch": 1.5723640569301622, "learning_rate": 4.778003566674852e-06, "loss": 2.4760699462890625, "step": 1303100 }, { "epoch": 1.5724847202526449, "learning_rate": 4.777599731207113e-06, "loss": 2.4807530212402344, "step": 1303200 }, { "epoch": 1.5726053835751275, "learning_rate": 4.777195895739375e-06, "loss": 2.4868890380859376, "step": 1303300 }, { "epoch": 1.57272604689761, "learning_rate": 4.776792060271636e-06, "loss": 2.4582373046875, "step": 1303400 }, { "epoch": 1.572846710220093, "learning_rate": 4.776388224803898e-06, "loss": 2.486864471435547, "step": 1303500 }, { "epoch": 1.5729673735425758, "learning_rate": 4.77598438933616e-06, "loss": 2.501076202392578, "step": 1303600 }, { "epoch": 1.5730880368650584, "learning_rate": 4.775580553868421e-06, "loss": 2.4883758544921877, "step": 1303700 }, { "epoch": 1.573208700187541, "learning_rate": 4.775176718400682e-06, "loss": 2.4989630126953126, "step": 1303800 }, { "epoch": 1.5733293635100236, "learning_rate": 4.774772882932944e-06, "loss": 2.4825009155273436, "step": 1303900 }, { "epoch": 1.5734500268325062, "learning_rate": 4.774369047465206e-06, "loss": 2.4950155639648437, "step": 1304000 }, { "epoch": 1.573570690154989, "learning_rate": 4.773965211997468e-06, "loss": 2.47664306640625, "step": 1304100 }, { "epoch": 1.5736913534774717, "learning_rate": 4.773561376529729e-06, "loss": 2.4919509887695312, "step": 1304200 }, { "epoch": 1.5738120167999545, "learning_rate": 4.7731575410619905e-06, "loss": 2.4824203491210937, "step": 1304300 }, { "epoch": 1.5739326801224371, "learning_rate": 4.7727537055942524e-06, "loss": 2.4802700805664064, "step": 1304400 }, { "epoch": 1.5740533434449198, "learning_rate": 4.772349870126514e-06, "loss": 2.495985870361328, "step": 1304500 }, { "epoch": 1.5741740067674024, "learning_rate": 4.7719460346587756e-06, "loss": 2.480468292236328, "step": 1304600 }, { "epoch": 1.574294670089885, "learning_rate": 4.7715421991910375e-06, "loss": 2.4768365478515624, "step": 1304700 }, { "epoch": 1.5744153334123678, "learning_rate": 4.771138363723299e-06, "loss": 2.4744886779785156, "step": 1304800 }, { "epoch": 1.5745359967348505, "learning_rate": 4.770734528255561e-06, "loss": 2.467033233642578, "step": 1304900 }, { "epoch": 1.5746566600573333, "learning_rate": 4.770330692787822e-06, "loss": 2.453777008056641, "step": 1305000 }, { "epoch": 1.574777323379816, "learning_rate": 4.769926857320084e-06, "loss": 2.486405029296875, "step": 1305100 }, { "epoch": 1.5748979867022985, "learning_rate": 4.769523021852345e-06, "loss": 2.492919464111328, "step": 1305200 }, { "epoch": 1.5750186500247811, "learning_rate": 4.769119186384607e-06, "loss": 2.4959840393066406, "step": 1305300 }, { "epoch": 1.5751393133472638, "learning_rate": 4.768715350916868e-06, "loss": 2.457718963623047, "step": 1305400 }, { "epoch": 1.5752599766697466, "learning_rate": 4.76831151544913e-06, "loss": 2.514455108642578, "step": 1305500 }, { "epoch": 1.5753806399922294, "learning_rate": 4.767907679981392e-06, "loss": 2.4950917053222654, "step": 1305600 }, { "epoch": 1.575501303314712, "learning_rate": 4.767503844513653e-06, "loss": 2.5004608154296877, "step": 1305700 }, { "epoch": 1.5756219666371947, "learning_rate": 4.767100009045914e-06, "loss": 2.4870223999023438, "step": 1305800 }, { "epoch": 1.5757426299596773, "learning_rate": 4.766696173578176e-06, "loss": 2.4674641418457033, "step": 1305900 }, { "epoch": 1.57586329328216, "learning_rate": 4.766292338110438e-06, "loss": 2.4826116943359375, "step": 1306000 }, { "epoch": 1.5759839566046427, "learning_rate": 4.7658885026427e-06, "loss": 2.4883058166503904, "step": 1306100 }, { "epoch": 1.5761046199271254, "learning_rate": 4.765484667174961e-06, "loss": 2.502519989013672, "step": 1306200 }, { "epoch": 1.5762252832496082, "learning_rate": 4.7650808317072225e-06, "loss": 2.470694122314453, "step": 1306300 }, { "epoch": 1.5763459465720908, "learning_rate": 4.7646769962394845e-06, "loss": 2.470022735595703, "step": 1306400 }, { "epoch": 1.5764666098945734, "learning_rate": 4.7642731607717464e-06, "loss": 2.5018101501464844, "step": 1306500 }, { "epoch": 1.576587273217056, "learning_rate": 4.763869325304008e-06, "loss": 2.482169952392578, "step": 1306600 }, { "epoch": 1.5767079365395387, "learning_rate": 4.7634654898362696e-06, "loss": 2.4930996704101562, "step": 1306700 }, { "epoch": 1.5768285998620215, "learning_rate": 4.763061654368531e-06, "loss": 2.4769300842285156, "step": 1306800 }, { "epoch": 1.5769492631845041, "learning_rate": 4.762657818900793e-06, "loss": 2.487672882080078, "step": 1306900 }, { "epoch": 1.577069926506987, "learning_rate": 4.762253983433054e-06, "loss": 2.4732957458496094, "step": 1307000 }, { "epoch": 1.5771905898294696, "learning_rate": 4.761850147965316e-06, "loss": 2.491026611328125, "step": 1307100 }, { "epoch": 1.5773112531519522, "learning_rate": 4.761446312497578e-06, "loss": 2.4783497619628907, "step": 1307200 }, { "epoch": 1.5774319164744348, "learning_rate": 4.761042477029839e-06, "loss": 2.466732940673828, "step": 1307300 }, { "epoch": 1.5775525797969174, "learning_rate": 4.7606386415621e-06, "loss": 2.4972349548339845, "step": 1307400 }, { "epoch": 1.5776732431194003, "learning_rate": 4.760234806094362e-06, "loss": 2.5099920654296874, "step": 1307500 }, { "epoch": 1.577793906441883, "learning_rate": 4.759830970626624e-06, "loss": 2.511222686767578, "step": 1307600 }, { "epoch": 1.5779145697643657, "learning_rate": 4.759427135158885e-06, "loss": 2.5008280944824217, "step": 1307700 }, { "epoch": 1.5780352330868483, "learning_rate": 4.759023299691147e-06, "loss": 2.4862129211425783, "step": 1307800 }, { "epoch": 1.578155896409331, "learning_rate": 4.758619464223408e-06, "loss": 2.4999934387207032, "step": 1307900 }, { "epoch": 1.5782765597318136, "learning_rate": 4.75821562875567e-06, "loss": 2.480204772949219, "step": 1308000 }, { "epoch": 1.5783972230542964, "learning_rate": 4.757811793287932e-06, "loss": 2.5119952392578124, "step": 1308100 }, { "epoch": 1.578517886376779, "learning_rate": 4.757407957820193e-06, "loss": 2.4691461181640624, "step": 1308200 }, { "epoch": 1.5786385496992619, "learning_rate": 4.7570041223524545e-06, "loss": 2.5146853637695314, "step": 1308300 }, { "epoch": 1.5787592130217445, "learning_rate": 4.7566002868847165e-06, "loss": 2.4672242736816408, "step": 1308400 }, { "epoch": 1.578879876344227, "learning_rate": 4.7561964514169785e-06, "loss": 2.4822038269042968, "step": 1308500 }, { "epoch": 1.5790005396667097, "learning_rate": 4.7557926159492404e-06, "loss": 2.5003575134277343, "step": 1308600 }, { "epoch": 1.5791212029891923, "learning_rate": 4.755388780481502e-06, "loss": 2.4667286682128906, "step": 1308700 }, { "epoch": 1.5792418663116752, "learning_rate": 4.754984945013763e-06, "loss": 2.4774609375, "step": 1308800 }, { "epoch": 1.579362529634158, "learning_rate": 4.754581109546025e-06, "loss": 2.497012023925781, "step": 1308900 }, { "epoch": 1.5794831929566406, "learning_rate": 4.754177274078287e-06, "loss": 2.4769026184082032, "step": 1309000 }, { "epoch": 1.5796038562791233, "learning_rate": 4.753773438610548e-06, "loss": 2.487294921875, "step": 1309100 }, { "epoch": 1.5797245196016059, "learning_rate": 4.75336960314281e-06, "loss": 2.4854949951171874, "step": 1309200 }, { "epoch": 1.5798451829240885, "learning_rate": 4.752965767675071e-06, "loss": 2.5015892028808593, "step": 1309300 }, { "epoch": 1.5799658462465713, "learning_rate": 4.752561932207333e-06, "loss": 2.463655548095703, "step": 1309400 }, { "epoch": 1.580086509569054, "learning_rate": 4.752158096739594e-06, "loss": 2.50898681640625, "step": 1309500 }, { "epoch": 1.5802071728915368, "learning_rate": 4.751754261271856e-06, "loss": 2.5018312072753908, "step": 1309600 }, { "epoch": 1.5803278362140194, "learning_rate": 4.751350425804118e-06, "loss": 2.4674314880371093, "step": 1309700 }, { "epoch": 1.580448499536502, "learning_rate": 4.750946590336379e-06, "loss": 2.465292663574219, "step": 1309800 }, { "epoch": 1.5805691628589846, "learning_rate": 4.75054275486864e-06, "loss": 2.4894503784179687, "step": 1309900 }, { "epoch": 1.5806898261814673, "learning_rate": 4.750138919400902e-06, "loss": 2.4969850158691407, "step": 1310000 }, { "epoch": 1.58081048950395, "learning_rate": 4.749735083933164e-06, "loss": 2.492653503417969, "step": 1310100 }, { "epoch": 1.5809311528264327, "learning_rate": 4.749331248465425e-06, "loss": 2.4929913330078124, "step": 1310200 }, { "epoch": 1.5810518161489155, "learning_rate": 4.748927412997687e-06, "loss": 2.502466583251953, "step": 1310300 }, { "epoch": 1.5811724794713982, "learning_rate": 4.7485235775299485e-06, "loss": 2.508766784667969, "step": 1310400 }, { "epoch": 1.5812931427938808, "learning_rate": 4.7481197420622105e-06, "loss": 2.486037139892578, "step": 1310500 }, { "epoch": 1.5814138061163634, "learning_rate": 4.7477159065944725e-06, "loss": 2.4763427734375, "step": 1310600 }, { "epoch": 1.581534469438846, "learning_rate": 4.747312071126734e-06, "loss": 2.4891143798828126, "step": 1310700 }, { "epoch": 1.5816551327613289, "learning_rate": 4.746908235658995e-06, "loss": 2.4884848022460937, "step": 1310800 }, { "epoch": 1.5817757960838117, "learning_rate": 4.746504400191257e-06, "loss": 2.4882908630371094, "step": 1310900 }, { "epoch": 1.5818964594062943, "learning_rate": 4.746100564723519e-06, "loss": 2.49232666015625, "step": 1311000 }, { "epoch": 1.582017122728777, "learning_rate": 4.74569672925578e-06, "loss": 2.4970518493652345, "step": 1311100 }, { "epoch": 1.5821377860512595, "learning_rate": 4.745292893788042e-06, "loss": 2.483328094482422, "step": 1311200 }, { "epoch": 1.5822584493737422, "learning_rate": 4.744889058320303e-06, "loss": 2.492342224121094, "step": 1311300 }, { "epoch": 1.582379112696225, "learning_rate": 4.744485222852565e-06, "loss": 2.481565246582031, "step": 1311400 }, { "epoch": 1.5824997760187076, "learning_rate": 4.744081387384826e-06, "loss": 2.5098486328125, "step": 1311500 }, { "epoch": 1.5826204393411905, "learning_rate": 4.743677551917088e-06, "loss": 2.4661634826660155, "step": 1311600 }, { "epoch": 1.582741102663673, "learning_rate": 4.74327371644935e-06, "loss": 2.468213653564453, "step": 1311700 }, { "epoch": 1.5828617659861557, "learning_rate": 4.742869880981611e-06, "loss": 2.4763145446777344, "step": 1311800 }, { "epoch": 1.5829824293086383, "learning_rate": 4.742466045513872e-06, "loss": 2.4894059753417968, "step": 1311900 }, { "epoch": 1.583103092631121, "learning_rate": 4.742062210046134e-06, "loss": 2.4743466186523437, "step": 1312000 }, { "epoch": 1.5832237559536038, "learning_rate": 4.741658374578396e-06, "loss": 2.508129119873047, "step": 1312100 }, { "epoch": 1.5833444192760864, "learning_rate": 4.741254539110658e-06, "loss": 2.486743621826172, "step": 1312200 }, { "epoch": 1.5834650825985692, "learning_rate": 4.740850703642919e-06, "loss": 2.485398406982422, "step": 1312300 }, { "epoch": 1.5835857459210518, "learning_rate": 4.7404468681751805e-06, "loss": 2.4887986755371094, "step": 1312400 }, { "epoch": 1.5837064092435345, "learning_rate": 4.7400430327074425e-06, "loss": 2.510254211425781, "step": 1312500 }, { "epoch": 1.583827072566017, "learning_rate": 4.7396391972397045e-06, "loss": 2.4738973999023437, "step": 1312600 }, { "epoch": 1.5839477358884997, "learning_rate": 4.7392353617719665e-06, "loss": 2.4943731689453124, "step": 1312700 }, { "epoch": 1.5840683992109825, "learning_rate": 4.738831526304228e-06, "loss": 2.4924087524414062, "step": 1312800 }, { "epoch": 1.5841890625334654, "learning_rate": 4.738427690836489e-06, "loss": 2.4893370056152344, "step": 1312900 }, { "epoch": 1.584309725855948, "learning_rate": 4.738023855368751e-06, "loss": 2.478648681640625, "step": 1313000 }, { "epoch": 1.5844303891784306, "learning_rate": 4.737620019901013e-06, "loss": 2.482362823486328, "step": 1313100 }, { "epoch": 1.5845510525009132, "learning_rate": 4.737216184433274e-06, "loss": 2.484036865234375, "step": 1313200 }, { "epoch": 1.5846717158233958, "learning_rate": 4.736812348965536e-06, "loss": 2.467196807861328, "step": 1313300 }, { "epoch": 1.5847923791458787, "learning_rate": 4.736408513497797e-06, "loss": 2.4950935363769533, "step": 1313400 }, { "epoch": 1.5849130424683613, "learning_rate": 4.736004678030059e-06, "loss": 2.477924041748047, "step": 1313500 }, { "epoch": 1.5850337057908441, "learning_rate": 4.73560084256232e-06, "loss": 2.4532650756835936, "step": 1313600 }, { "epoch": 1.5851543691133267, "learning_rate": 4.735197007094582e-06, "loss": 2.475425567626953, "step": 1313700 }, { "epoch": 1.5852750324358094, "learning_rate": 4.734793171626843e-06, "loss": 2.480509948730469, "step": 1313800 }, { "epoch": 1.585395695758292, "learning_rate": 4.734389336159105e-06, "loss": 2.506562042236328, "step": 1313900 }, { "epoch": 1.5855163590807746, "learning_rate": 4.733985500691366e-06, "loss": 2.4789799499511718, "step": 1314000 }, { "epoch": 1.5856370224032574, "learning_rate": 4.733581665223628e-06, "loss": 2.4759426879882813, "step": 1314100 }, { "epoch": 1.5857576857257403, "learning_rate": 4.73317782975589e-06, "loss": 2.4822401428222656, "step": 1314200 }, { "epoch": 1.585878349048223, "learning_rate": 4.7327739942881514e-06, "loss": 2.4846347045898436, "step": 1314300 }, { "epoch": 1.5859990123707055, "learning_rate": 4.7323701588204126e-06, "loss": 2.485579376220703, "step": 1314400 }, { "epoch": 1.5861196756931881, "learning_rate": 4.7319663233526745e-06, "loss": 2.480632781982422, "step": 1314500 }, { "epoch": 1.5862403390156707, "learning_rate": 4.7315624878849365e-06, "loss": 2.4921504211425782, "step": 1314600 }, { "epoch": 1.5863610023381536, "learning_rate": 4.7311586524171985e-06, "loss": 2.503255157470703, "step": 1314700 }, { "epoch": 1.5864816656606362, "learning_rate": 4.73075481694946e-06, "loss": 2.490328826904297, "step": 1314800 }, { "epoch": 1.586602328983119, "learning_rate": 4.730350981481721e-06, "loss": 2.494554901123047, "step": 1314900 }, { "epoch": 1.5867229923056017, "learning_rate": 4.729947146013983e-06, "loss": 2.486561737060547, "step": 1315000 }, { "epoch": 1.5868436556280843, "learning_rate": 4.729543310546245e-06, "loss": 2.4749609375, "step": 1315100 }, { "epoch": 1.5869643189505669, "learning_rate": 4.729139475078506e-06, "loss": 2.488589630126953, "step": 1315200 }, { "epoch": 1.5870849822730495, "learning_rate": 4.728735639610768e-06, "loss": 2.494328918457031, "step": 1315300 }, { "epoch": 1.5872056455955323, "learning_rate": 4.728331804143029e-06, "loss": 2.4634030151367186, "step": 1315400 }, { "epoch": 1.587326308918015, "learning_rate": 4.727927968675291e-06, "loss": 2.492626190185547, "step": 1315500 }, { "epoch": 1.5874469722404978, "learning_rate": 4.727524133207552e-06, "loss": 2.4955938720703124, "step": 1315600 }, { "epoch": 1.5875676355629804, "learning_rate": 4.727120297739814e-06, "loss": 2.4825962829589843, "step": 1315700 }, { "epoch": 1.587688298885463, "learning_rate": 4.726716462272076e-06, "loss": 2.480782775878906, "step": 1315800 }, { "epoch": 1.5878089622079457, "learning_rate": 4.726312626804337e-06, "loss": 2.501911468505859, "step": 1315900 }, { "epoch": 1.5879296255304283, "learning_rate": 4.725908791336598e-06, "loss": 2.487579803466797, "step": 1316000 }, { "epoch": 1.588050288852911, "learning_rate": 4.72550495586886e-06, "loss": 2.4711598205566405, "step": 1316100 }, { "epoch": 1.588170952175394, "learning_rate": 4.725101120401122e-06, "loss": 2.474344940185547, "step": 1316200 }, { "epoch": 1.5882916154978766, "learning_rate": 4.7246972849333835e-06, "loss": 2.483650360107422, "step": 1316300 }, { "epoch": 1.5884122788203592, "learning_rate": 4.7242934494656454e-06, "loss": 2.467224578857422, "step": 1316400 }, { "epoch": 1.5885329421428418, "learning_rate": 4.7238896139979066e-06, "loss": 2.499525451660156, "step": 1316500 }, { "epoch": 1.5886536054653244, "learning_rate": 4.7234857785301686e-06, "loss": 2.4925282287597654, "step": 1316600 }, { "epoch": 1.5887742687878073, "learning_rate": 4.7230819430624305e-06, "loss": 2.465801544189453, "step": 1316700 }, { "epoch": 1.5888949321102899, "learning_rate": 4.722678107594692e-06, "loss": 2.476316375732422, "step": 1316800 }, { "epoch": 1.5890155954327727, "learning_rate": 4.722274272126953e-06, "loss": 2.506589202880859, "step": 1316900 }, { "epoch": 1.5891362587552553, "learning_rate": 4.721870436659215e-06, "loss": 2.485592498779297, "step": 1317000 }, { "epoch": 1.589256922077738, "learning_rate": 4.721466601191477e-06, "loss": 2.4808280944824217, "step": 1317100 }, { "epoch": 1.5893775854002206, "learning_rate": 4.721062765723738e-06, "loss": 2.483267059326172, "step": 1317200 }, { "epoch": 1.5894982487227032, "learning_rate": 4.720658930256e-06, "loss": 2.4795916748046873, "step": 1317300 }, { "epoch": 1.589618912045186, "learning_rate": 4.720255094788261e-06, "loss": 2.486819305419922, "step": 1317400 }, { "epoch": 1.5897395753676686, "learning_rate": 4.719851259320523e-06, "loss": 2.4979019165039062, "step": 1317500 }, { "epoch": 1.5898602386901515, "learning_rate": 4.719447423852784e-06, "loss": 2.490516815185547, "step": 1317600 }, { "epoch": 1.589980902012634, "learning_rate": 4.719043588385046e-06, "loss": 2.477955322265625, "step": 1317700 }, { "epoch": 1.5901015653351167, "learning_rate": 4.718639752917308e-06, "loss": 2.4813108825683594, "step": 1317800 }, { "epoch": 1.5902222286575993, "learning_rate": 4.718235917449569e-06, "loss": 2.4961639404296876, "step": 1317900 }, { "epoch": 1.590342891980082, "learning_rate": 4.717832081981831e-06, "loss": 2.4720068359375, "step": 1318000 }, { "epoch": 1.5904635553025648, "learning_rate": 4.717428246514092e-06, "loss": 2.4958074951171874, "step": 1318100 }, { "epoch": 1.5905842186250476, "learning_rate": 4.717024411046354e-06, "loss": 2.495394592285156, "step": 1318200 }, { "epoch": 1.5907048819475302, "learning_rate": 4.716620575578616e-06, "loss": 2.4821183776855467, "step": 1318300 }, { "epoch": 1.5908255452700129, "learning_rate": 4.7162167401108775e-06, "loss": 2.4919020080566407, "step": 1318400 }, { "epoch": 1.5909462085924955, "learning_rate": 4.715812904643139e-06, "loss": 2.4886123657226564, "step": 1318500 }, { "epoch": 1.591066871914978, "learning_rate": 4.715409069175401e-06, "loss": 2.489624328613281, "step": 1318600 }, { "epoch": 1.591187535237461, "learning_rate": 4.7150052337076626e-06, "loss": 2.4746290588378907, "step": 1318700 }, { "epoch": 1.5913081985599435, "learning_rate": 4.7146013982399245e-06, "loss": 2.482211456298828, "step": 1318800 }, { "epoch": 1.5914288618824264, "learning_rate": 4.714197562772186e-06, "loss": 2.491684875488281, "step": 1318900 }, { "epoch": 1.591549525204909, "learning_rate": 4.713793727304447e-06, "loss": 2.4859992980957033, "step": 1319000 }, { "epoch": 1.5916701885273916, "learning_rate": 4.713389891836709e-06, "loss": 2.4731826782226562, "step": 1319100 }, { "epoch": 1.5917908518498742, "learning_rate": 4.712986056368971e-06, "loss": 2.4957232666015625, "step": 1319200 }, { "epoch": 1.5919115151723569, "learning_rate": 4.712582220901232e-06, "loss": 2.472841796875, "step": 1319300 }, { "epoch": 1.5920321784948397, "learning_rate": 4.712178385433494e-06, "loss": 2.4942955017089843, "step": 1319400 }, { "epoch": 1.5921528418173225, "learning_rate": 4.711774549965755e-06, "loss": 2.477366180419922, "step": 1319500 }, { "epoch": 1.5922735051398051, "learning_rate": 4.711370714498017e-06, "loss": 2.4824209594726563, "step": 1319600 }, { "epoch": 1.5923941684622878, "learning_rate": 4.710966879030278e-06, "loss": 2.4597161865234374, "step": 1319700 }, { "epoch": 1.5925148317847704, "learning_rate": 4.71056304356254e-06, "loss": 2.4798155212402344, "step": 1319800 }, { "epoch": 1.592635495107253, "learning_rate": 4.710159208094801e-06, "loss": 2.485237579345703, "step": 1319900 }, { "epoch": 1.5927561584297358, "learning_rate": 4.709755372627063e-06, "loss": 2.4803074645996093, "step": 1320000 }, { "epoch": 1.5928768217522185, "learning_rate": 4.709351537159324e-06, "loss": 2.491943664550781, "step": 1320100 }, { "epoch": 1.5929974850747013, "learning_rate": 4.708947701691586e-06, "loss": 2.4495420837402344, "step": 1320200 }, { "epoch": 1.593118148397184, "learning_rate": 4.708543866223848e-06, "loss": 2.489132995605469, "step": 1320300 }, { "epoch": 1.5932388117196665, "learning_rate": 4.7081400307561095e-06, "loss": 2.4823489379882813, "step": 1320400 }, { "epoch": 1.5933594750421491, "learning_rate": 4.707736195288371e-06, "loss": 2.4812666320800782, "step": 1320500 }, { "epoch": 1.5934801383646318, "learning_rate": 4.707332359820633e-06, "loss": 2.449899444580078, "step": 1320600 }, { "epoch": 1.5936008016871146, "learning_rate": 4.706928524352895e-06, "loss": 2.4887124633789064, "step": 1320700 }, { "epoch": 1.5937214650095972, "learning_rate": 4.7065246888851566e-06, "loss": 2.4819883728027343, "step": 1320800 }, { "epoch": 1.59384212833208, "learning_rate": 4.706120853417418e-06, "loss": 2.4676173400878905, "step": 1320900 }, { "epoch": 1.5939627916545627, "learning_rate": 4.705717017949679e-06, "loss": 2.46509765625, "step": 1321000 }, { "epoch": 1.5940834549770453, "learning_rate": 4.705313182481941e-06, "loss": 2.4910633850097654, "step": 1321100 }, { "epoch": 1.594204118299528, "learning_rate": 4.704909347014203e-06, "loss": 2.478822021484375, "step": 1321200 }, { "epoch": 1.5943247816220105, "learning_rate": 4.704505511546464e-06, "loss": 2.5087265014648437, "step": 1321300 }, { "epoch": 1.5944454449444934, "learning_rate": 4.704101676078726e-06, "loss": 2.48540771484375, "step": 1321400 }, { "epoch": 1.5945661082669762, "learning_rate": 4.703697840610987e-06, "loss": 2.4872967529296877, "step": 1321500 }, { "epoch": 1.5946867715894588, "learning_rate": 4.703294005143249e-06, "loss": 2.489857482910156, "step": 1321600 }, { "epoch": 1.5948074349119414, "learning_rate": 4.70289016967551e-06, "loss": 2.47532470703125, "step": 1321700 }, { "epoch": 1.594928098234424, "learning_rate": 4.702486334207772e-06, "loss": 2.4825398254394533, "step": 1321800 }, { "epoch": 1.5950487615569067, "learning_rate": 4.702082498740034e-06, "loss": 2.4630465698242188, "step": 1321900 }, { "epoch": 1.5951694248793895, "learning_rate": 4.701678663272295e-06, "loss": 2.4877670288085936, "step": 1322000 }, { "epoch": 1.5952900882018721, "learning_rate": 4.701274827804556e-06, "loss": 2.4734732055664064, "step": 1322100 }, { "epoch": 1.595410751524355, "learning_rate": 4.700870992336818e-06, "loss": 2.4853163146972657, "step": 1322200 }, { "epoch": 1.5955314148468376, "learning_rate": 4.70046715686908e-06, "loss": 2.503781585693359, "step": 1322300 }, { "epoch": 1.5956520781693202, "learning_rate": 4.7000633214013415e-06, "loss": 2.4846157836914062, "step": 1322400 }, { "epoch": 1.5957727414918028, "learning_rate": 4.6996594859336035e-06, "loss": 2.467218322753906, "step": 1322500 }, { "epoch": 1.5958934048142854, "learning_rate": 4.699255650465865e-06, "loss": 2.4742332458496095, "step": 1322600 }, { "epoch": 1.5960140681367683, "learning_rate": 4.698851814998127e-06, "loss": 2.458972930908203, "step": 1322700 }, { "epoch": 1.5961347314592509, "learning_rate": 4.698447979530389e-06, "loss": 2.500885772705078, "step": 1322800 }, { "epoch": 1.5962553947817337, "learning_rate": 4.69804414406265e-06, "loss": 2.4745663452148436, "step": 1322900 }, { "epoch": 1.5963760581042163, "learning_rate": 4.697640308594911e-06, "loss": 2.4746961975097657, "step": 1323000 }, { "epoch": 1.596496721426699, "learning_rate": 4.697236473127173e-06, "loss": 2.4930267333984375, "step": 1323100 }, { "epoch": 1.5966173847491816, "learning_rate": 4.696832637659435e-06, "loss": 2.4974876403808595, "step": 1323200 }, { "epoch": 1.5967380480716642, "learning_rate": 4.696428802191697e-06, "loss": 2.5147642517089843, "step": 1323300 }, { "epoch": 1.596858711394147, "learning_rate": 4.696024966723958e-06, "loss": 2.469839782714844, "step": 1323400 }, { "epoch": 1.5969793747166299, "learning_rate": 4.695621131256219e-06, "loss": 2.490037841796875, "step": 1323500 }, { "epoch": 1.5971000380391125, "learning_rate": 4.695217295788481e-06, "loss": 2.496373596191406, "step": 1323600 }, { "epoch": 1.597220701361595, "learning_rate": 4.694813460320743e-06, "loss": 2.4754478454589846, "step": 1323700 }, { "epoch": 1.5973413646840777, "learning_rate": 4.694409624853004e-06, "loss": 2.4788473510742186, "step": 1323800 }, { "epoch": 1.5974620280065603, "learning_rate": 4.694005789385266e-06, "loss": 2.4807778930664064, "step": 1323900 }, { "epoch": 1.5975826913290432, "learning_rate": 4.693601953917527e-06, "loss": 2.4829502868652344, "step": 1324000 }, { "epoch": 1.5977033546515258, "learning_rate": 4.693198118449789e-06, "loss": 2.485155487060547, "step": 1324100 }, { "epoch": 1.5978240179740086, "learning_rate": 4.69279428298205e-06, "loss": 2.4713031005859376, "step": 1324200 }, { "epoch": 1.5979446812964913, "learning_rate": 4.692390447514312e-06, "loss": 2.4773114013671873, "step": 1324300 }, { "epoch": 1.5980653446189739, "learning_rate": 4.691986612046574e-06, "loss": 2.476884460449219, "step": 1324400 }, { "epoch": 1.5981860079414565, "learning_rate": 4.6915827765788355e-06, "loss": 2.4827618408203125, "step": 1324500 }, { "epoch": 1.598306671263939, "learning_rate": 4.691178941111097e-06, "loss": 2.4937565612792967, "step": 1324600 }, { "epoch": 1.598427334586422, "learning_rate": 4.690775105643359e-06, "loss": 2.4694673156738283, "step": 1324700 }, { "epoch": 1.5985479979089048, "learning_rate": 4.690371270175621e-06, "loss": 2.4951556396484373, "step": 1324800 }, { "epoch": 1.5986686612313874, "learning_rate": 4.689967434707883e-06, "loss": 2.492273406982422, "step": 1324900 }, { "epoch": 1.59878932455387, "learning_rate": 4.689563599240144e-06, "loss": 2.492819519042969, "step": 1325000 }, { "epoch": 1.5989099878763526, "learning_rate": 4.689159763772405e-06, "loss": 2.482206268310547, "step": 1325100 }, { "epoch": 1.5990306511988353, "learning_rate": 4.688755928304667e-06, "loss": 2.4840602111816406, "step": 1325200 }, { "epoch": 1.599151314521318, "learning_rate": 4.688352092836929e-06, "loss": 2.5006507873535155, "step": 1325300 }, { "epoch": 1.5992719778438007, "learning_rate": 4.68794825736919e-06, "loss": 2.4827621459960936, "step": 1325400 }, { "epoch": 1.5993926411662835, "learning_rate": 4.687544421901452e-06, "loss": 2.4851394653320313, "step": 1325500 }, { "epoch": 1.5995133044887662, "learning_rate": 4.687140586433713e-06, "loss": 2.482163848876953, "step": 1325600 }, { "epoch": 1.5996339678112488, "learning_rate": 4.686736750965975e-06, "loss": 2.461800231933594, "step": 1325700 }, { "epoch": 1.5997546311337314, "learning_rate": 4.686332915498236e-06, "loss": 2.49234130859375, "step": 1325800 }, { "epoch": 1.599875294456214, "learning_rate": 4.685929080030498e-06, "loss": 2.451399078369141, "step": 1325900 }, { "epoch": 1.5999959577786969, "learning_rate": 4.685525244562759e-06, "loss": 2.477674560546875, "step": 1326000 }, { "epoch": 1.6001166211011795, "learning_rate": 4.685121409095021e-06, "loss": 2.502746124267578, "step": 1326100 }, { "epoch": 1.6002372844236623, "learning_rate": 4.6847175736272824e-06, "loss": 2.468070373535156, "step": 1326200 }, { "epoch": 1.600357947746145, "learning_rate": 4.6843137381595444e-06, "loss": 2.4855694580078125, "step": 1326300 }, { "epoch": 1.6004786110686275, "learning_rate": 4.683909902691806e-06, "loss": 2.482741241455078, "step": 1326400 }, { "epoch": 1.6005992743911102, "learning_rate": 4.6835060672240675e-06, "loss": 2.4381887817382815, "step": 1326500 }, { "epoch": 1.6007199377135928, "learning_rate": 4.683102231756329e-06, "loss": 2.4840191650390624, "step": 1326600 }, { "epoch": 1.6008406010360756, "learning_rate": 4.682698396288591e-06, "loss": 2.47251220703125, "step": 1326700 }, { "epoch": 1.6009612643585585, "learning_rate": 4.682294560820853e-06, "loss": 2.4952821350097656, "step": 1326800 }, { "epoch": 1.601081927681041, "learning_rate": 4.681890725353115e-06, "loss": 2.4805776977539065, "step": 1326900 }, { "epoch": 1.6012025910035237, "learning_rate": 4.681486889885376e-06, "loss": 2.5114862060546876, "step": 1327000 }, { "epoch": 1.6013232543260063, "learning_rate": 4.681083054417637e-06, "loss": 2.4758123779296874, "step": 1327100 }, { "epoch": 1.601443917648489, "learning_rate": 4.680679218949899e-06, "loss": 2.4616441345214843, "step": 1327200 }, { "epoch": 1.6015645809709718, "learning_rate": 4.680275383482161e-06, "loss": 2.4995819091796876, "step": 1327300 }, { "epoch": 1.6016852442934544, "learning_rate": 4.679871548014422e-06, "loss": 2.472781982421875, "step": 1327400 }, { "epoch": 1.6018059076159372, "learning_rate": 4.679467712546684e-06, "loss": 2.4741531372070313, "step": 1327500 }, { "epoch": 1.6019265709384198, "learning_rate": 4.679063877078945e-06, "loss": 2.4909361267089842, "step": 1327600 }, { "epoch": 1.6020472342609025, "learning_rate": 4.678660041611207e-06, "loss": 2.4854171752929686, "step": 1327700 }, { "epoch": 1.602167897583385, "learning_rate": 4.678256206143468e-06, "loss": 2.476807861328125, "step": 1327800 }, { "epoch": 1.6022885609058677, "learning_rate": 4.67785237067573e-06, "loss": 2.4651229858398436, "step": 1327900 }, { "epoch": 1.6024092242283505, "learning_rate": 4.677448535207992e-06, "loss": 2.4918089294433594, "step": 1328000 }, { "epoch": 1.6025298875508331, "learning_rate": 4.677044699740253e-06, "loss": 2.4819184875488283, "step": 1328100 }, { "epoch": 1.602650550873316, "learning_rate": 4.676640864272515e-06, "loss": 2.486383361816406, "step": 1328200 }, { "epoch": 1.6027712141957986, "learning_rate": 4.6762370288047765e-06, "loss": 2.508489685058594, "step": 1328300 }, { "epoch": 1.6028918775182812, "learning_rate": 4.6758331933370384e-06, "loss": 2.4889569091796875, "step": 1328400 }, { "epoch": 1.6030125408407638, "learning_rate": 4.6754293578692996e-06, "loss": 2.449759521484375, "step": 1328500 }, { "epoch": 1.6031332041632465, "learning_rate": 4.6750255224015616e-06, "loss": 2.466775207519531, "step": 1328600 }, { "epoch": 1.6032538674857293, "learning_rate": 4.674621686933823e-06, "loss": 2.468641815185547, "step": 1328700 }, { "epoch": 1.6033745308082121, "learning_rate": 4.674217851466085e-06, "loss": 2.473136444091797, "step": 1328800 }, { "epoch": 1.6034951941306947, "learning_rate": 4.673814015998347e-06, "loss": 2.492147674560547, "step": 1328900 }, { "epoch": 1.6036158574531774, "learning_rate": 4.673410180530608e-06, "loss": 2.4844970703125, "step": 1329000 }, { "epoch": 1.60373652077566, "learning_rate": 4.673006345062869e-06, "loss": 2.4635166931152344, "step": 1329100 }, { "epoch": 1.6038571840981426, "learning_rate": 4.672602509595131e-06, "loss": 2.4699769592285157, "step": 1329200 }, { "epoch": 1.6039778474206254, "learning_rate": 4.672198674127393e-06, "loss": 2.475087127685547, "step": 1329300 }, { "epoch": 1.604098510743108, "learning_rate": 4.671794838659655e-06, "loss": 2.493582763671875, "step": 1329400 }, { "epoch": 1.604219174065591, "learning_rate": 4.671391003191916e-06, "loss": 2.5036927795410158, "step": 1329500 }, { "epoch": 1.6043398373880735, "learning_rate": 4.670987167724177e-06, "loss": 2.4913821411132813, "step": 1329600 }, { "epoch": 1.6044605007105561, "learning_rate": 4.670583332256439e-06, "loss": 2.4646734619140624, "step": 1329700 }, { "epoch": 1.6045811640330387, "learning_rate": 4.670179496788701e-06, "loss": 2.4478323364257815, "step": 1329800 }, { "epoch": 1.6047018273555214, "learning_rate": 4.669775661320962e-06, "loss": 2.471640625, "step": 1329900 }, { "epoch": 1.6048224906780042, "learning_rate": 4.669371825853224e-06, "loss": 2.494401092529297, "step": 1330000 }, { "epoch": 1.604943154000487, "learning_rate": 4.668967990385485e-06, "loss": 2.486509246826172, "step": 1330100 }, { "epoch": 1.6050638173229697, "learning_rate": 4.668564154917747e-06, "loss": 2.4869511413574217, "step": 1330200 }, { "epoch": 1.6051844806454523, "learning_rate": 4.6681603194500085e-06, "loss": 2.481401824951172, "step": 1330300 }, { "epoch": 1.6053051439679349, "learning_rate": 4.6677564839822705e-06, "loss": 2.4715750122070315, "step": 1330400 }, { "epoch": 1.6054258072904175, "learning_rate": 4.6673526485145324e-06, "loss": 2.4754148864746095, "step": 1330500 }, { "epoch": 1.6055464706129003, "learning_rate": 4.666948813046794e-06, "loss": 2.4661207580566407, "step": 1330600 }, { "epoch": 1.605667133935383, "learning_rate": 4.666544977579055e-06, "loss": 2.4961781311035156, "step": 1330700 }, { "epoch": 1.6057877972578658, "learning_rate": 4.666141142111317e-06, "loss": 2.442690582275391, "step": 1330800 }, { "epoch": 1.6059084605803484, "learning_rate": 4.665737306643579e-06, "loss": 2.475660552978516, "step": 1330900 }, { "epoch": 1.606029123902831, "learning_rate": 4.66533347117584e-06, "loss": 2.460635223388672, "step": 1331000 }, { "epoch": 1.6061497872253137, "learning_rate": 4.664929635708102e-06, "loss": 2.4756103515625, "step": 1331100 }, { "epoch": 1.6062704505477963, "learning_rate": 4.664525800240363e-06, "loss": 2.4915736389160155, "step": 1331200 }, { "epoch": 1.606391113870279, "learning_rate": 4.664121964772625e-06, "loss": 2.4546018981933595, "step": 1331300 }, { "epoch": 1.6065117771927617, "learning_rate": 4.663718129304887e-06, "loss": 2.4912640380859377, "step": 1331400 }, { "epoch": 1.6066324405152446, "learning_rate": 4.663314293837148e-06, "loss": 2.4548785400390627, "step": 1331500 }, { "epoch": 1.6067531038377272, "learning_rate": 4.662910458369409e-06, "loss": 2.468985900878906, "step": 1331600 }, { "epoch": 1.6068737671602098, "learning_rate": 4.662506622901671e-06, "loss": 2.476146392822266, "step": 1331700 }, { "epoch": 1.6069944304826924, "learning_rate": 4.662102787433933e-06, "loss": 2.500005340576172, "step": 1331800 }, { "epoch": 1.607115093805175, "learning_rate": 4.661698951966194e-06, "loss": 2.497659454345703, "step": 1331900 }, { "epoch": 1.6072357571276579, "learning_rate": 4.661295116498456e-06, "loss": 2.466940460205078, "step": 1332000 }, { "epoch": 1.6073564204501407, "learning_rate": 4.660891281030717e-06, "loss": 2.462948760986328, "step": 1332100 }, { "epoch": 1.6074770837726233, "learning_rate": 4.660487445562979e-06, "loss": 2.460507354736328, "step": 1332200 }, { "epoch": 1.607597747095106, "learning_rate": 4.6600836100952405e-06, "loss": 2.4705410766601563, "step": 1332300 }, { "epoch": 1.6077184104175886, "learning_rate": 4.6596797746275025e-06, "loss": 2.498499450683594, "step": 1332400 }, { "epoch": 1.6078390737400712, "learning_rate": 4.6592759391597645e-06, "loss": 2.4596737670898436, "step": 1332500 }, { "epoch": 1.607959737062554, "learning_rate": 4.658872103692026e-06, "loss": 2.4819847106933595, "step": 1332600 }, { "epoch": 1.6080804003850366, "learning_rate": 4.658468268224287e-06, "loss": 2.467987365722656, "step": 1332700 }, { "epoch": 1.6082010637075195, "learning_rate": 4.658064432756549e-06, "loss": 2.4522361755371094, "step": 1332800 }, { "epoch": 1.608321727030002, "learning_rate": 4.657660597288811e-06, "loss": 2.4654525756835937, "step": 1332900 }, { "epoch": 1.6084423903524847, "learning_rate": 4.657256761821073e-06, "loss": 2.477743682861328, "step": 1333000 }, { "epoch": 1.6085630536749673, "learning_rate": 4.656852926353334e-06, "loss": 2.4844454956054687, "step": 1333100 }, { "epoch": 1.60868371699745, "learning_rate": 4.656449090885595e-06, "loss": 2.478776397705078, "step": 1333200 }, { "epoch": 1.6088043803199328, "learning_rate": 4.656045255417857e-06, "loss": 2.4983198547363283, "step": 1333300 }, { "epoch": 1.6089250436424154, "learning_rate": 4.655641419950119e-06, "loss": 2.4891426086425783, "step": 1333400 }, { "epoch": 1.6090457069648982, "learning_rate": 4.655237584482381e-06, "loss": 2.4880694580078124, "step": 1333500 }, { "epoch": 1.6091663702873809, "learning_rate": 4.654833749014642e-06, "loss": 2.4804078674316408, "step": 1333600 }, { "epoch": 1.6092870336098635, "learning_rate": 4.654429913546903e-06, "loss": 2.4697230529785155, "step": 1333700 }, { "epoch": 1.609407696932346, "learning_rate": 4.654026078079165e-06, "loss": 2.480632476806641, "step": 1333800 }, { "epoch": 1.6095283602548287, "learning_rate": 4.653622242611427e-06, "loss": 2.4839405822753906, "step": 1333900 }, { "epoch": 1.6096490235773115, "learning_rate": 4.653218407143688e-06, "loss": 2.506086578369141, "step": 1334000 }, { "epoch": 1.6097696868997944, "learning_rate": 4.65281457167595e-06, "loss": 2.4627748107910157, "step": 1334100 }, { "epoch": 1.609890350222277, "learning_rate": 4.652410736208211e-06, "loss": 2.4703707885742188, "step": 1334200 }, { "epoch": 1.6100110135447596, "learning_rate": 4.652006900740473e-06, "loss": 2.4850419616699218, "step": 1334300 }, { "epoch": 1.6101316768672422, "learning_rate": 4.6516030652727345e-06, "loss": 2.4925381469726564, "step": 1334400 }, { "epoch": 1.6102523401897249, "learning_rate": 4.6511992298049965e-06, "loss": 2.4979881286621093, "step": 1334500 }, { "epoch": 1.6103730035122077, "learning_rate": 4.650795394337258e-06, "loss": 2.4880215454101564, "step": 1334600 }, { "epoch": 1.6104936668346903, "learning_rate": 4.65039155886952e-06, "loss": 2.488802185058594, "step": 1334700 }, { "epoch": 1.6106143301571731, "learning_rate": 4.649987723401781e-06, "loss": 2.4757539367675783, "step": 1334800 }, { "epoch": 1.6107349934796558, "learning_rate": 4.649583887934043e-06, "loss": 2.485830841064453, "step": 1334900 }, { "epoch": 1.6108556568021384, "learning_rate": 4.649180052466305e-06, "loss": 2.4726023864746094, "step": 1335000 }, { "epoch": 1.610976320124621, "learning_rate": 4.648776216998566e-06, "loss": 2.496085357666016, "step": 1335100 }, { "epoch": 1.6110969834471036, "learning_rate": 4.648372381530827e-06, "loss": 2.488614501953125, "step": 1335200 }, { "epoch": 1.6112176467695865, "learning_rate": 4.647968546063089e-06, "loss": 2.452526092529297, "step": 1335300 }, { "epoch": 1.6113383100920693, "learning_rate": 4.647564710595351e-06, "loss": 2.482330780029297, "step": 1335400 }, { "epoch": 1.611458973414552, "learning_rate": 4.647160875127613e-06, "loss": 2.4984141540527345, "step": 1335500 }, { "epoch": 1.6115796367370345, "learning_rate": 4.646757039659874e-06, "loss": 2.4693016052246093, "step": 1335600 }, { "epoch": 1.6117003000595171, "learning_rate": 4.646353204192135e-06, "loss": 2.5184971618652345, "step": 1335700 }, { "epoch": 1.6118209633819998, "learning_rate": 4.645949368724397e-06, "loss": 2.502175140380859, "step": 1335800 }, { "epoch": 1.6119416267044826, "learning_rate": 4.645545533256659e-06, "loss": 2.464921722412109, "step": 1335900 }, { "epoch": 1.6120622900269652, "learning_rate": 4.64514169778892e-06, "loss": 2.4836489868164064, "step": 1336000 }, { "epoch": 1.612182953349448, "learning_rate": 4.644737862321182e-06, "loss": 2.4775431823730467, "step": 1336100 }, { "epoch": 1.6123036166719307, "learning_rate": 4.644334026853443e-06, "loss": 2.458690338134766, "step": 1336200 }, { "epoch": 1.6124242799944133, "learning_rate": 4.643930191385705e-06, "loss": 2.4876167297363283, "step": 1336300 }, { "epoch": 1.612544943316896, "learning_rate": 4.6435263559179665e-06, "loss": 2.4846336364746096, "step": 1336400 }, { "epoch": 1.6126656066393785, "learning_rate": 4.6431225204502285e-06, "loss": 2.4818585205078123, "step": 1336500 }, { "epoch": 1.6127862699618614, "learning_rate": 4.6427186849824905e-06, "loss": 2.450847473144531, "step": 1336600 }, { "epoch": 1.612906933284344, "learning_rate": 4.642314849514752e-06, "loss": 2.5033013916015623, "step": 1336700 }, { "epoch": 1.6130275966068268, "learning_rate": 4.641911014047013e-06, "loss": 2.445030517578125, "step": 1336800 }, { "epoch": 1.6131482599293094, "learning_rate": 4.641507178579275e-06, "loss": 2.481977081298828, "step": 1336900 }, { "epoch": 1.613268923251792, "learning_rate": 4.641103343111537e-06, "loss": 2.464147491455078, "step": 1337000 }, { "epoch": 1.6133895865742747, "learning_rate": 4.640699507643798e-06, "loss": 2.462839813232422, "step": 1337100 }, { "epoch": 1.6135102498967573, "learning_rate": 4.64029567217606e-06, "loss": 2.495924377441406, "step": 1337200 }, { "epoch": 1.6136309132192401, "learning_rate": 4.639891836708321e-06, "loss": 2.4739813232421874, "step": 1337300 }, { "epoch": 1.613751576541723, "learning_rate": 4.639488001240583e-06, "loss": 2.4749078369140625, "step": 1337400 }, { "epoch": 1.6138722398642056, "learning_rate": 4.639084165772845e-06, "loss": 2.484411315917969, "step": 1337500 }, { "epoch": 1.6139929031866882, "learning_rate": 4.638680330305106e-06, "loss": 2.4607611083984375, "step": 1337600 }, { "epoch": 1.6141135665091708, "learning_rate": 4.638276494837367e-06, "loss": 2.4721469116210937, "step": 1337700 }, { "epoch": 1.6142342298316534, "learning_rate": 4.637872659369629e-06, "loss": 2.4580729675292967, "step": 1337800 }, { "epoch": 1.6143548931541363, "learning_rate": 4.637468823901891e-06, "loss": 2.469931335449219, "step": 1337900 }, { "epoch": 1.614475556476619, "learning_rate": 4.637064988434152e-06, "loss": 2.478954620361328, "step": 1338000 }, { "epoch": 1.6145962197991017, "learning_rate": 4.636661152966414e-06, "loss": 2.4615013122558596, "step": 1338100 }, { "epoch": 1.6147168831215843, "learning_rate": 4.6362573174986754e-06, "loss": 2.4997906494140625, "step": 1338200 }, { "epoch": 1.614837546444067, "learning_rate": 4.6358534820309374e-06, "loss": 2.492159729003906, "step": 1338300 }, { "epoch": 1.6149582097665496, "learning_rate": 4.635449646563199e-06, "loss": 2.453917236328125, "step": 1338400 }, { "epoch": 1.6150788730890322, "learning_rate": 4.6350458110954605e-06, "loss": 2.4803921508789064, "step": 1338500 }, { "epoch": 1.615199536411515, "learning_rate": 4.6346419756277225e-06, "loss": 2.5034730529785154, "step": 1338600 }, { "epoch": 1.6153201997339977, "learning_rate": 4.634238140159984e-06, "loss": 2.471212158203125, "step": 1338700 }, { "epoch": 1.6154408630564805, "learning_rate": 4.633834304692246e-06, "loss": 2.474709320068359, "step": 1338800 }, { "epoch": 1.615561526378963, "learning_rate": 4.633430469224507e-06, "loss": 2.4579681396484374, "step": 1338900 }, { "epoch": 1.6156821897014457, "learning_rate": 4.633026633756769e-06, "loss": 2.4665153503417967, "step": 1339000 }, { "epoch": 1.6158028530239283, "learning_rate": 4.632622798289031e-06, "loss": 2.47658203125, "step": 1339100 }, { "epoch": 1.615923516346411, "learning_rate": 4.632218962821292e-06, "loss": 2.4895248413085938, "step": 1339200 }, { "epoch": 1.6160441796688938, "learning_rate": 4.631815127353553e-06, "loss": 2.4520672607421874, "step": 1339300 }, { "epoch": 1.6161648429913766, "learning_rate": 4.631411291885815e-06, "loss": 2.4893263244628905, "step": 1339400 }, { "epoch": 1.6162855063138593, "learning_rate": 4.631007456418077e-06, "loss": 2.4765673828125, "step": 1339500 }, { "epoch": 1.6164061696363419, "learning_rate": 4.630603620950339e-06, "loss": 2.514773254394531, "step": 1339600 }, { "epoch": 1.6165268329588245, "learning_rate": 4.6301997854826e-06, "loss": 2.4892013549804686, "step": 1339700 }, { "epoch": 1.616647496281307, "learning_rate": 4.629795950014861e-06, "loss": 2.4738946533203126, "step": 1339800 }, { "epoch": 1.61676815960379, "learning_rate": 4.629392114547123e-06, "loss": 2.477846832275391, "step": 1339900 }, { "epoch": 1.6168888229262726, "learning_rate": 4.628988279079385e-06, "loss": 2.4709628295898436, "step": 1340000 }, { "epoch": 1.6170094862487554, "learning_rate": 4.628584443611646e-06, "loss": 2.4647666931152346, "step": 1340100 }, { "epoch": 1.617130149571238, "learning_rate": 4.628180608143908e-06, "loss": 2.4744708251953127, "step": 1340200 }, { "epoch": 1.6172508128937206, "learning_rate": 4.6277767726761695e-06, "loss": 2.485861358642578, "step": 1340300 }, { "epoch": 1.6173714762162033, "learning_rate": 4.6273729372084314e-06, "loss": 2.4594912719726563, "step": 1340400 }, { "epoch": 1.6174921395386859, "learning_rate": 4.6269691017406926e-06, "loss": 2.467772979736328, "step": 1340500 }, { "epoch": 1.6176128028611687, "learning_rate": 4.6265652662729546e-06, "loss": 2.4864251708984373, "step": 1340600 }, { "epoch": 1.6177334661836515, "learning_rate": 4.626161430805216e-06, "loss": 2.4875755310058594, "step": 1340700 }, { "epoch": 1.6178541295061342, "learning_rate": 4.625757595337478e-06, "loss": 2.4820785522460938, "step": 1340800 }, { "epoch": 1.6179747928286168, "learning_rate": 4.625353759869739e-06, "loss": 2.455258331298828, "step": 1340900 }, { "epoch": 1.6180954561510994, "learning_rate": 4.624949924402001e-06, "loss": 2.4995684814453125, "step": 1341000 }, { "epoch": 1.618216119473582, "learning_rate": 4.624546088934263e-06, "loss": 2.468287353515625, "step": 1341100 }, { "epoch": 1.6183367827960649, "learning_rate": 4.624142253466524e-06, "loss": 2.5107264709472656, "step": 1341200 }, { "epoch": 1.6184574461185475, "learning_rate": 4.623738417998785e-06, "loss": 2.479676513671875, "step": 1341300 }, { "epoch": 1.6185781094410303, "learning_rate": 4.623334582531047e-06, "loss": 2.4533331298828127, "step": 1341400 }, { "epoch": 1.618698772763513, "learning_rate": 4.622930747063309e-06, "loss": 2.478677978515625, "step": 1341500 }, { "epoch": 1.6188194360859955, "learning_rate": 4.622526911595571e-06, "loss": 2.4984754943847656, "step": 1341600 }, { "epoch": 1.6189400994084782, "learning_rate": 4.622123076127832e-06, "loss": 2.452758483886719, "step": 1341700 }, { "epoch": 1.6190607627309608, "learning_rate": 4.621719240660093e-06, "loss": 2.4806674194335936, "step": 1341800 }, { "epoch": 1.6191814260534436, "learning_rate": 4.621315405192355e-06, "loss": 2.5032530212402344, "step": 1341900 }, { "epoch": 1.6193020893759262, "learning_rate": 4.620911569724617e-06, "loss": 2.457622833251953, "step": 1342000 }, { "epoch": 1.619422752698409, "learning_rate": 4.620507734256878e-06, "loss": 2.476728515625, "step": 1342100 }, { "epoch": 1.6195434160208917, "learning_rate": 4.62010389878914e-06, "loss": 2.494589538574219, "step": 1342200 }, { "epoch": 1.6196640793433743, "learning_rate": 4.6197000633214015e-06, "loss": 2.482898406982422, "step": 1342300 }, { "epoch": 1.619784742665857, "learning_rate": 4.6192962278536635e-06, "loss": 2.490411682128906, "step": 1342400 }, { "epoch": 1.6199054059883395, "learning_rate": 4.618892392385925e-06, "loss": 2.4731596374511717, "step": 1342500 }, { "epoch": 1.6200260693108224, "learning_rate": 4.618488556918187e-06, "loss": 2.449543762207031, "step": 1342600 }, { "epoch": 1.6201467326333052, "learning_rate": 4.6180847214504486e-06, "loss": 2.4698297119140626, "step": 1342700 }, { "epoch": 1.6202673959557878, "learning_rate": 4.61768088598271e-06, "loss": 2.4729818725585937, "step": 1342800 }, { "epoch": 1.6203880592782705, "learning_rate": 4.617277050514971e-06, "loss": 2.478349609375, "step": 1342900 }, { "epoch": 1.620508722600753, "learning_rate": 4.616873215047233e-06, "loss": 2.4403419494628906, "step": 1343000 }, { "epoch": 1.6206293859232357, "learning_rate": 4.616469379579495e-06, "loss": 2.465090026855469, "step": 1343100 }, { "epoch": 1.6207500492457185, "learning_rate": 4.616065544111756e-06, "loss": 2.501513671875, "step": 1343200 }, { "epoch": 1.6208707125682011, "learning_rate": 4.615661708644018e-06, "loss": 2.4574830627441404, "step": 1343300 }, { "epoch": 1.620991375890684, "learning_rate": 4.615257873176279e-06, "loss": 2.4341796875, "step": 1343400 }, { "epoch": 1.6211120392131666, "learning_rate": 4.614854037708541e-06, "loss": 2.484800109863281, "step": 1343500 }, { "epoch": 1.6212327025356492, "learning_rate": 4.614450202240803e-06, "loss": 2.4624757385253906, "step": 1343600 }, { "epoch": 1.6213533658581318, "learning_rate": 4.614046366773064e-06, "loss": 2.497986297607422, "step": 1343700 }, { "epoch": 1.6214740291806145, "learning_rate": 4.613642531305325e-06, "loss": 2.4814385986328125, "step": 1343800 }, { "epoch": 1.6215946925030973, "learning_rate": 4.613238695837587e-06, "loss": 2.461953125, "step": 1343900 }, { "epoch": 1.62171535582558, "learning_rate": 4.612834860369849e-06, "loss": 2.4741194152832033, "step": 1344000 }, { "epoch": 1.6218360191480627, "learning_rate": 4.612431024902111e-06, "loss": 2.4716090393066406, "step": 1344100 }, { "epoch": 1.6219566824705454, "learning_rate": 4.612027189434372e-06, "loss": 2.4493089294433594, "step": 1344200 }, { "epoch": 1.622077345793028, "learning_rate": 4.6116233539666335e-06, "loss": 2.476542663574219, "step": 1344300 }, { "epoch": 1.6221980091155106, "learning_rate": 4.6112195184988955e-06, "loss": 2.48642578125, "step": 1344400 }, { "epoch": 1.6223186724379934, "learning_rate": 4.6108156830311575e-06, "loss": 2.4834468078613283, "step": 1344500 }, { "epoch": 1.622439335760476, "learning_rate": 4.610411847563419e-06, "loss": 2.482260437011719, "step": 1344600 }, { "epoch": 1.622559999082959, "learning_rate": 4.610008012095681e-06, "loss": 2.4862548828125, "step": 1344700 }, { "epoch": 1.6226806624054415, "learning_rate": 4.609604176627942e-06, "loss": 2.478199462890625, "step": 1344800 }, { "epoch": 1.6228013257279241, "learning_rate": 4.609200341160204e-06, "loss": 2.4793101501464845, "step": 1344900 }, { "epoch": 1.6229219890504067, "learning_rate": 4.608796505692465e-06, "loss": 2.479522399902344, "step": 1345000 }, { "epoch": 1.6230426523728894, "learning_rate": 4.608392670224727e-06, "loss": 2.478718719482422, "step": 1345100 }, { "epoch": 1.6231633156953722, "learning_rate": 4.607988834756989e-06, "loss": 2.4723391723632813, "step": 1345200 }, { "epoch": 1.6232839790178548, "learning_rate": 4.60758499928925e-06, "loss": 2.4673841857910155, "step": 1345300 }, { "epoch": 1.6234046423403377, "learning_rate": 4.607181163821511e-06, "loss": 2.4767579650878906, "step": 1345400 }, { "epoch": 1.6235253056628203, "learning_rate": 4.606777328353773e-06, "loss": 2.478737640380859, "step": 1345500 }, { "epoch": 1.623645968985303, "learning_rate": 4.606373492886035e-06, "loss": 2.46771728515625, "step": 1345600 }, { "epoch": 1.6237666323077855, "learning_rate": 4.605969657418296e-06, "loss": 2.486679992675781, "step": 1345700 }, { "epoch": 1.6238872956302681, "learning_rate": 4.605565821950558e-06, "loss": 2.4651634216308596, "step": 1345800 }, { "epoch": 1.624007958952751, "learning_rate": 4.605161986482819e-06, "loss": 2.473048095703125, "step": 1345900 }, { "epoch": 1.6241286222752338, "learning_rate": 4.604758151015081e-06, "loss": 2.494051055908203, "step": 1346000 }, { "epoch": 1.6242492855977164, "learning_rate": 4.604354315547343e-06, "loss": 2.473269348144531, "step": 1346100 }, { "epoch": 1.624369948920199, "learning_rate": 4.603950480079604e-06, "loss": 2.474651031494141, "step": 1346200 }, { "epoch": 1.6244906122426817, "learning_rate": 4.6035466446118655e-06, "loss": 2.4666934204101563, "step": 1346300 }, { "epoch": 1.6246112755651643, "learning_rate": 4.6031428091441275e-06, "loss": 2.498213348388672, "step": 1346400 }, { "epoch": 1.624731938887647, "learning_rate": 4.6027389736763895e-06, "loss": 2.464181671142578, "step": 1346500 }, { "epoch": 1.6248526022101297, "learning_rate": 4.602335138208651e-06, "loss": 2.465073699951172, "step": 1346600 }, { "epoch": 1.6249732655326126, "learning_rate": 4.601931302740913e-06, "loss": 2.4678744506835937, "step": 1346700 }, { "epoch": 1.6250939288550952, "learning_rate": 4.601527467273174e-06, "loss": 2.483049774169922, "step": 1346800 }, { "epoch": 1.6252145921775778, "learning_rate": 4.601123631805436e-06, "loss": 2.4828387451171876, "step": 1346900 }, { "epoch": 1.6253352555000604, "learning_rate": 4.600719796337697e-06, "loss": 2.4956260681152345, "step": 1347000 }, { "epoch": 1.625455918822543, "learning_rate": 4.600315960869959e-06, "loss": 2.4601194763183596, "step": 1347100 }, { "epoch": 1.6255765821450259, "learning_rate": 4.599912125402221e-06, "loss": 2.4692430114746093, "step": 1347200 }, { "epoch": 1.6256972454675085, "learning_rate": 4.599508289934482e-06, "loss": 2.4658853149414064, "step": 1347300 }, { "epoch": 1.6258179087899913, "learning_rate": 4.599104454466743e-06, "loss": 2.473587646484375, "step": 1347400 }, { "epoch": 1.625938572112474, "learning_rate": 4.598700618999005e-06, "loss": 2.478220977783203, "step": 1347500 }, { "epoch": 1.6260592354349566, "learning_rate": 4.598296783531267e-06, "loss": 2.4680186462402345, "step": 1347600 }, { "epoch": 1.6261798987574392, "learning_rate": 4.597892948063529e-06, "loss": 2.489205169677734, "step": 1347700 }, { "epoch": 1.6263005620799218, "learning_rate": 4.59748911259579e-06, "loss": 2.4951402282714845, "step": 1347800 }, { "epoch": 1.6264212254024046, "learning_rate": 4.597085277128051e-06, "loss": 2.4655917358398436, "step": 1347900 }, { "epoch": 1.6265418887248875, "learning_rate": 4.596681441660313e-06, "loss": 2.4573081970214843, "step": 1348000 }, { "epoch": 1.62666255204737, "learning_rate": 4.596277606192575e-06, "loss": 2.4938966369628908, "step": 1348100 }, { "epoch": 1.6267832153698527, "learning_rate": 4.5958737707248364e-06, "loss": 2.4695472717285156, "step": 1348200 }, { "epoch": 1.6269038786923353, "learning_rate": 4.595469935257098e-06, "loss": 2.4630340576171874, "step": 1348300 }, { "epoch": 1.627024542014818, "learning_rate": 4.5950660997893595e-06, "loss": 2.472473602294922, "step": 1348400 }, { "epoch": 1.6271452053373008, "learning_rate": 4.5946622643216215e-06, "loss": 2.4808290100097654, "step": 1348500 }, { "epoch": 1.6272658686597834, "learning_rate": 4.594258428853883e-06, "loss": 2.4586251831054686, "step": 1348600 }, { "epoch": 1.6273865319822662, "learning_rate": 4.593854593386145e-06, "loss": 2.456665802001953, "step": 1348700 }, { "epoch": 1.6275071953047489, "learning_rate": 4.593450757918407e-06, "loss": 2.485398406982422, "step": 1348800 }, { "epoch": 1.6276278586272315, "learning_rate": 4.593046922450668e-06, "loss": 2.474917144775391, "step": 1348900 }, { "epoch": 1.627748521949714, "learning_rate": 4.59264308698293e-06, "loss": 2.4662030029296873, "step": 1349000 }, { "epoch": 1.6278691852721967, "learning_rate": 4.592239251515191e-06, "loss": 2.4690765380859374, "step": 1349100 }, { "epoch": 1.6279898485946795, "learning_rate": 4.591835416047453e-06, "loss": 2.4450090026855467, "step": 1349200 }, { "epoch": 1.6281105119171622, "learning_rate": 4.591431580579714e-06, "loss": 2.4721798706054687, "step": 1349300 }, { "epoch": 1.628231175239645, "learning_rate": 4.591027745111976e-06, "loss": 2.4612733459472658, "step": 1349400 }, { "epoch": 1.6283518385621276, "learning_rate": 4.590623909644237e-06, "loss": 2.511497039794922, "step": 1349500 }, { "epoch": 1.6284725018846102, "learning_rate": 4.590220074176499e-06, "loss": 2.4646278381347657, "step": 1349600 }, { "epoch": 1.6285931652070929, "learning_rate": 4.589816238708761e-06, "loss": 2.480207824707031, "step": 1349700 }, { "epoch": 1.6287138285295757, "learning_rate": 4.589412403241022e-06, "loss": 2.455616912841797, "step": 1349800 }, { "epoch": 1.6288344918520583, "learning_rate": 4.589008567773283e-06, "loss": 2.4802957153320313, "step": 1349900 }, { "epoch": 1.6289551551745411, "learning_rate": 4.588604732305545e-06, "loss": 2.473652648925781, "step": 1350000 }, { "epoch": 1.6290758184970238, "learning_rate": 4.588200896837807e-06, "loss": 2.453141784667969, "step": 1350100 }, { "epoch": 1.6291964818195064, "learning_rate": 4.587797061370069e-06, "loss": 2.4850303649902346, "step": 1350200 }, { "epoch": 1.629317145141989, "learning_rate": 4.5873932259023304e-06, "loss": 2.493749542236328, "step": 1350300 }, { "epoch": 1.6294378084644716, "learning_rate": 4.5869893904345916e-06, "loss": 2.4764578247070315, "step": 1350400 }, { "epoch": 1.6295584717869545, "learning_rate": 4.5865855549668535e-06, "loss": 2.4940440368652346, "step": 1350500 }, { "epoch": 1.629679135109437, "learning_rate": 4.5861817194991155e-06, "loss": 2.4663764953613283, "step": 1350600 }, { "epoch": 1.62979979843192, "learning_rate": 4.585777884031377e-06, "loss": 2.4781283569335937, "step": 1350700 }, { "epoch": 1.6299204617544025, "learning_rate": 4.585374048563639e-06, "loss": 2.4729794311523436, "step": 1350800 }, { "epoch": 1.6300411250768851, "learning_rate": 4.5849702130959e-06, "loss": 2.451063385009766, "step": 1350900 }, { "epoch": 1.6301617883993678, "learning_rate": 4.584566377628162e-06, "loss": 2.481503143310547, "step": 1351000 }, { "epoch": 1.6302824517218504, "learning_rate": 4.584162542160423e-06, "loss": 2.471859130859375, "step": 1351100 }, { "epoch": 1.6304031150443332, "learning_rate": 4.583758706692685e-06, "loss": 2.468668670654297, "step": 1351200 }, { "epoch": 1.630523778366816, "learning_rate": 4.583354871224947e-06, "loss": 2.454839172363281, "step": 1351300 }, { "epoch": 1.6306444416892987, "learning_rate": 4.582951035757208e-06, "loss": 2.434528350830078, "step": 1351400 }, { "epoch": 1.6307651050117813, "learning_rate": 4.582547200289469e-06, "loss": 2.4975848388671875, "step": 1351500 }, { "epoch": 1.630885768334264, "learning_rate": 4.582143364821731e-06, "loss": 2.4635879516601564, "step": 1351600 }, { "epoch": 1.6310064316567465, "learning_rate": 4.581739529353993e-06, "loss": 2.4778233337402344, "step": 1351700 }, { "epoch": 1.6311270949792294, "learning_rate": 4.581335693886254e-06, "loss": 2.4802020263671873, "step": 1351800 }, { "epoch": 1.631247758301712, "learning_rate": 4.580931858418516e-06, "loss": 2.4867247009277342, "step": 1351900 }, { "epoch": 1.6313684216241948, "learning_rate": 4.580528022950777e-06, "loss": 2.479614715576172, "step": 1352000 }, { "epoch": 1.6314890849466774, "learning_rate": 4.580124187483039e-06, "loss": 2.478025207519531, "step": 1352100 }, { "epoch": 1.63160974826916, "learning_rate": 4.579720352015301e-06, "loss": 2.4756283569335937, "step": 1352200 }, { "epoch": 1.6317304115916427, "learning_rate": 4.5793165165475625e-06, "loss": 2.45906494140625, "step": 1352300 }, { "epoch": 1.6318510749141253, "learning_rate": 4.578912681079824e-06, "loss": 2.451182556152344, "step": 1352400 }, { "epoch": 1.6319717382366081, "learning_rate": 4.5785088456120856e-06, "loss": 2.482854766845703, "step": 1352500 }, { "epoch": 1.6320924015590907, "learning_rate": 4.5781050101443476e-06, "loss": 2.4642498779296873, "step": 1352600 }, { "epoch": 1.6322130648815736, "learning_rate": 4.577701174676609e-06, "loss": 2.459043426513672, "step": 1352700 }, { "epoch": 1.6323337282040562, "learning_rate": 4.577297339208871e-06, "loss": 2.479403381347656, "step": 1352800 }, { "epoch": 1.6324543915265388, "learning_rate": 4.576893503741132e-06, "loss": 2.467975616455078, "step": 1352900 }, { "epoch": 1.6325750548490214, "learning_rate": 4.576489668273394e-06, "loss": 2.442451629638672, "step": 1353000 }, { "epoch": 1.632695718171504, "learning_rate": 4.576085832805655e-06, "loss": 2.4595050048828124, "step": 1353100 }, { "epoch": 1.632816381493987, "learning_rate": 4.575681997337917e-06, "loss": 2.466865234375, "step": 1353200 }, { "epoch": 1.6329370448164697, "learning_rate": 4.575278161870179e-06, "loss": 2.466330871582031, "step": 1353300 }, { "epoch": 1.6330577081389523, "learning_rate": 4.57487432640244e-06, "loss": 2.4714285278320314, "step": 1353400 }, { "epoch": 1.633178371461435, "learning_rate": 4.574470490934701e-06, "loss": 2.4611207580566408, "step": 1353500 }, { "epoch": 1.6332990347839176, "learning_rate": 4.574066655466963e-06, "loss": 2.460946044921875, "step": 1353600 }, { "epoch": 1.6334196981064002, "learning_rate": 4.573662819999225e-06, "loss": 2.468314361572266, "step": 1353700 }, { "epoch": 1.633540361428883, "learning_rate": 4.573258984531487e-06, "loss": 2.4924333190917967, "step": 1353800 }, { "epoch": 1.6336610247513657, "learning_rate": 4.572855149063748e-06, "loss": 2.4492831420898438, "step": 1353900 }, { "epoch": 1.6337816880738485, "learning_rate": 4.572451313596009e-06, "loss": 2.4650617980957032, "step": 1354000 }, { "epoch": 1.633902351396331, "learning_rate": 4.572047478128271e-06, "loss": 2.4615737915039064, "step": 1354100 }, { "epoch": 1.6340230147188137, "learning_rate": 4.571643642660533e-06, "loss": 2.4509506225585938, "step": 1354200 }, { "epoch": 1.6341436780412963, "learning_rate": 4.571239807192795e-06, "loss": 2.470705261230469, "step": 1354300 }, { "epoch": 1.634264341363779, "learning_rate": 4.5708359717250565e-06, "loss": 2.4743777465820314, "step": 1354400 }, { "epoch": 1.6343850046862618, "learning_rate": 4.570432136257318e-06, "loss": 2.468365020751953, "step": 1354500 }, { "epoch": 1.6345056680087444, "learning_rate": 4.57002830078958e-06, "loss": 2.4847335815429688, "step": 1354600 }, { "epoch": 1.6346263313312273, "learning_rate": 4.5696244653218416e-06, "loss": 2.4766184997558596, "step": 1354700 }, { "epoch": 1.6347469946537099, "learning_rate": 4.569220629854103e-06, "loss": 2.449567413330078, "step": 1354800 }, { "epoch": 1.6348676579761925, "learning_rate": 4.568816794386365e-06, "loss": 2.454022979736328, "step": 1354900 }, { "epoch": 1.634988321298675, "learning_rate": 4.568412958918626e-06, "loss": 2.469773712158203, "step": 1355000 }, { "epoch": 1.635108984621158, "learning_rate": 4.568009123450888e-06, "loss": 2.4884512329101565, "step": 1355100 }, { "epoch": 1.6352296479436406, "learning_rate": 4.567605287983149e-06, "loss": 2.4619256591796876, "step": 1355200 }, { "epoch": 1.6353503112661234, "learning_rate": 4.567201452515411e-06, "loss": 2.4810409545898438, "step": 1355300 }, { "epoch": 1.635470974588606, "learning_rate": 4.566797617047672e-06, "loss": 2.445900573730469, "step": 1355400 }, { "epoch": 1.6355916379110886, "learning_rate": 4.566393781579934e-06, "loss": 2.475582275390625, "step": 1355500 }, { "epoch": 1.6357123012335713, "learning_rate": 4.565989946112195e-06, "loss": 2.461498107910156, "step": 1355600 }, { "epoch": 1.6358329645560539, "learning_rate": 4.565586110644457e-06, "loss": 2.4722581481933594, "step": 1355700 }, { "epoch": 1.6359536278785367, "learning_rate": 4.565182275176719e-06, "loss": 2.480615234375, "step": 1355800 }, { "epoch": 1.6360742912010193, "learning_rate": 4.56477843970898e-06, "loss": 2.467054901123047, "step": 1355900 }, { "epoch": 1.6361949545235022, "learning_rate": 4.564374604241241e-06, "loss": 2.4867703247070314, "step": 1356000 }, { "epoch": 1.6363156178459848, "learning_rate": 4.563970768773503e-06, "loss": 2.4764749145507814, "step": 1356100 }, { "epoch": 1.6364362811684674, "learning_rate": 4.563566933305765e-06, "loss": 2.450303192138672, "step": 1356200 }, { "epoch": 1.63655694449095, "learning_rate": 4.563163097838027e-06, "loss": 2.4884889221191404, "step": 1356300 }, { "epoch": 1.6366776078134326, "learning_rate": 4.5627592623702885e-06, "loss": 2.4785797119140627, "step": 1356400 }, { "epoch": 1.6367982711359155, "learning_rate": 4.56235542690255e-06, "loss": 2.4652415466308595, "step": 1356500 }, { "epoch": 1.6369189344583983, "learning_rate": 4.561951591434812e-06, "loss": 2.4887936401367186, "step": 1356600 }, { "epoch": 1.637039597780881, "learning_rate": 4.561547755967074e-06, "loss": 2.4530368041992188, "step": 1356700 }, { "epoch": 1.6371602611033635, "learning_rate": 4.561143920499335e-06, "loss": 2.444749755859375, "step": 1356800 }, { "epoch": 1.6372809244258462, "learning_rate": 4.560740085031597e-06, "loss": 2.4861489868164064, "step": 1356900 }, { "epoch": 1.6374015877483288, "learning_rate": 4.560336249563858e-06, "loss": 2.462698211669922, "step": 1357000 }, { "epoch": 1.6375222510708116, "learning_rate": 4.55993241409612e-06, "loss": 2.4856913757324217, "step": 1357100 }, { "epoch": 1.6376429143932942, "learning_rate": 4.559528578628381e-06, "loss": 2.492112121582031, "step": 1357200 }, { "epoch": 1.637763577715777, "learning_rate": 4.559124743160643e-06, "loss": 2.498299102783203, "step": 1357300 }, { "epoch": 1.6378842410382597, "learning_rate": 4.558720907692905e-06, "loss": 2.4783880615234377, "step": 1357400 }, { "epoch": 1.6380049043607423, "learning_rate": 4.558317072225166e-06, "loss": 2.478171539306641, "step": 1357500 }, { "epoch": 1.638125567683225, "learning_rate": 4.557913236757427e-06, "loss": 2.490445861816406, "step": 1357600 }, { "epoch": 1.6382462310057075, "learning_rate": 4.557509401289689e-06, "loss": 2.470553436279297, "step": 1357700 }, { "epoch": 1.6383668943281904, "learning_rate": 4.557105565821951e-06, "loss": 2.4615333557128904, "step": 1357800 }, { "epoch": 1.638487557650673, "learning_rate": 4.556701730354212e-06, "loss": 2.4806288146972655, "step": 1357900 }, { "epoch": 1.6386082209731558, "learning_rate": 4.556297894886474e-06, "loss": 2.483037414550781, "step": 1358000 }, { "epoch": 1.6387288842956385, "learning_rate": 4.555894059418735e-06, "loss": 2.459839630126953, "step": 1358100 }, { "epoch": 1.638849547618121, "learning_rate": 4.555490223950997e-06, "loss": 2.467914886474609, "step": 1358200 }, { "epoch": 1.6389702109406037, "learning_rate": 4.555086388483259e-06, "loss": 2.4485504150390627, "step": 1358300 }, { "epoch": 1.6390908742630863, "learning_rate": 4.5546825530155205e-06, "loss": 2.4638412475585936, "step": 1358400 }, { "epoch": 1.6392115375855691, "learning_rate": 4.554278717547782e-06, "loss": 2.4665782165527346, "step": 1358500 }, { "epoch": 1.639332200908052, "learning_rate": 4.553874882080044e-06, "loss": 2.470439910888672, "step": 1358600 }, { "epoch": 1.6394528642305346, "learning_rate": 4.553471046612306e-06, "loss": 2.485830993652344, "step": 1358700 }, { "epoch": 1.6395735275530172, "learning_rate": 4.553067211144567e-06, "loss": 2.457258758544922, "step": 1358800 }, { "epoch": 1.6396941908754998, "learning_rate": 4.552663375676829e-06, "loss": 2.4975535583496096, "step": 1358900 }, { "epoch": 1.6398148541979825, "learning_rate": 4.55225954020909e-06, "loss": 2.438640594482422, "step": 1359000 }, { "epoch": 1.6399355175204653, "learning_rate": 4.551855704741352e-06, "loss": 2.472989044189453, "step": 1359100 }, { "epoch": 1.640056180842948, "learning_rate": 4.551451869273614e-06, "loss": 2.468262481689453, "step": 1359200 }, { "epoch": 1.6401768441654307, "learning_rate": 4.551048033805875e-06, "loss": 2.4617079162597655, "step": 1359300 }, { "epoch": 1.6402975074879134, "learning_rate": 4.550644198338137e-06, "loss": 2.461578674316406, "step": 1359400 }, { "epoch": 1.640418170810396, "learning_rate": 4.550240362870398e-06, "loss": 2.450206451416016, "step": 1359500 }, { "epoch": 1.6405388341328786, "learning_rate": 4.54983652740266e-06, "loss": 2.481649932861328, "step": 1359600 }, { "epoch": 1.6406594974553612, "learning_rate": 4.549432691934921e-06, "loss": 2.4764138793945314, "step": 1359700 }, { "epoch": 1.640780160777844, "learning_rate": 4.549028856467183e-06, "loss": 2.4688595581054686, "step": 1359800 }, { "epoch": 1.6409008241003267, "learning_rate": 4.548625020999445e-06, "loss": 2.4755819702148436, "step": 1359900 }, { "epoch": 1.6410214874228095, "learning_rate": 4.548221185531706e-06, "loss": 2.500893249511719, "step": 1360000 }, { "epoch": 1.6411421507452921, "learning_rate": 4.5478173500639674e-06, "loss": 2.484452209472656, "step": 1360100 }, { "epoch": 1.6412628140677747, "learning_rate": 4.5474135145962294e-06, "loss": 2.4625787353515625, "step": 1360200 }, { "epoch": 1.6413834773902574, "learning_rate": 4.547009679128491e-06, "loss": 2.4740582275390626, "step": 1360300 }, { "epoch": 1.6415041407127402, "learning_rate": 4.546605843660753e-06, "loss": 2.490404510498047, "step": 1360400 }, { "epoch": 1.6416248040352228, "learning_rate": 4.5462020081930145e-06, "loss": 2.496380157470703, "step": 1360500 }, { "epoch": 1.6417454673577057, "learning_rate": 4.545798172725276e-06, "loss": 2.4991917419433594, "step": 1360600 }, { "epoch": 1.6418661306801883, "learning_rate": 4.545394337257538e-06, "loss": 2.48985595703125, "step": 1360700 }, { "epoch": 1.641986794002671, "learning_rate": 4.5449905017898e-06, "loss": 2.4625506591796875, "step": 1360800 }, { "epoch": 1.6421074573251535, "learning_rate": 4.544586666322061e-06, "loss": 2.461519470214844, "step": 1360900 }, { "epoch": 1.6422281206476361, "learning_rate": 4.544182830854323e-06, "loss": 2.4520610046386717, "step": 1361000 }, { "epoch": 1.642348783970119, "learning_rate": 4.543778995386584e-06, "loss": 2.4817878723144533, "step": 1361100 }, { "epoch": 1.6424694472926016, "learning_rate": 4.543375159918846e-06, "loss": 2.482324676513672, "step": 1361200 }, { "epoch": 1.6425901106150844, "learning_rate": 4.542971324451107e-06, "loss": 2.473248291015625, "step": 1361300 }, { "epoch": 1.642710773937567, "learning_rate": 4.542567488983369e-06, "loss": 2.456426239013672, "step": 1361400 }, { "epoch": 1.6428314372600497, "learning_rate": 4.54216365351563e-06, "loss": 2.452054138183594, "step": 1361500 }, { "epoch": 1.6429521005825323, "learning_rate": 4.541759818047892e-06, "loss": 2.4788528442382813, "step": 1361600 }, { "epoch": 1.6430727639050149, "learning_rate": 4.541355982580153e-06, "loss": 2.461927642822266, "step": 1361700 }, { "epoch": 1.6431934272274977, "learning_rate": 4.540952147112415e-06, "loss": 2.4682998657226562, "step": 1361800 }, { "epoch": 1.6433140905499806, "learning_rate": 4.540548311644677e-06, "loss": 2.476809539794922, "step": 1361900 }, { "epoch": 1.6434347538724632, "learning_rate": 4.540144476176938e-06, "loss": 2.471063995361328, "step": 1362000 }, { "epoch": 1.6435554171949458, "learning_rate": 4.5397406407091995e-06, "loss": 2.473854217529297, "step": 1362100 }, { "epoch": 1.6436760805174284, "learning_rate": 4.5393368052414615e-06, "loss": 2.492947692871094, "step": 1362200 }, { "epoch": 1.643796743839911, "learning_rate": 4.5389329697737234e-06, "loss": 2.483004455566406, "step": 1362300 }, { "epoch": 1.6439174071623939, "learning_rate": 4.538529134305985e-06, "loss": 2.468908386230469, "step": 1362400 }, { "epoch": 1.6440380704848765, "learning_rate": 4.5381252988382466e-06, "loss": 2.5021315002441407, "step": 1362500 }, { "epoch": 1.6441587338073593, "learning_rate": 4.537721463370508e-06, "loss": 2.4733958435058594, "step": 1362600 }, { "epoch": 1.644279397129842, "learning_rate": 4.53731762790277e-06, "loss": 2.4928799438476563, "step": 1362700 }, { "epoch": 1.6444000604523246, "learning_rate": 4.536913792435032e-06, "loss": 2.497883758544922, "step": 1362800 }, { "epoch": 1.6445207237748072, "learning_rate": 4.536509956967293e-06, "loss": 2.474143371582031, "step": 1362900 }, { "epoch": 1.6446413870972898, "learning_rate": 4.536106121499555e-06, "loss": 2.4722158813476565, "step": 1363000 }, { "epoch": 1.6447620504197726, "learning_rate": 4.535702286031816e-06, "loss": 2.4874588012695313, "step": 1363100 }, { "epoch": 1.6448827137422553, "learning_rate": 4.535298450564078e-06, "loss": 2.4724530029296874, "step": 1363200 }, { "epoch": 1.645003377064738, "learning_rate": 4.534894615096339e-06, "loss": 2.469423370361328, "step": 1363300 }, { "epoch": 1.6451240403872207, "learning_rate": 4.534490779628601e-06, "loss": 2.4916119384765625, "step": 1363400 }, { "epoch": 1.6452447037097033, "learning_rate": 4.534086944160863e-06, "loss": 2.4659136962890624, "step": 1363500 }, { "epoch": 1.645365367032186, "learning_rate": 4.533683108693124e-06, "loss": 2.4749269104003906, "step": 1363600 }, { "epoch": 1.6454860303546686, "learning_rate": 4.533279273225385e-06, "loss": 2.4670068359375, "step": 1363700 }, { "epoch": 1.6456066936771514, "learning_rate": 4.532875437757647e-06, "loss": 2.491898956298828, "step": 1363800 }, { "epoch": 1.6457273569996342, "learning_rate": 4.532471602289909e-06, "loss": 2.464698944091797, "step": 1363900 }, { "epoch": 1.6458480203221169, "learning_rate": 4.53206776682217e-06, "loss": 2.461997375488281, "step": 1364000 }, { "epoch": 1.6459686836445995, "learning_rate": 4.531663931354432e-06, "loss": 2.4821620178222656, "step": 1364100 }, { "epoch": 1.646089346967082, "learning_rate": 4.5312600958866935e-06, "loss": 2.4810377502441407, "step": 1364200 }, { "epoch": 1.6462100102895647, "learning_rate": 4.5308562604189555e-06, "loss": 2.4836695861816405, "step": 1364300 }, { "epoch": 1.6463306736120475, "learning_rate": 4.5304524249512174e-06, "loss": 2.4751632690429686, "step": 1364400 }, { "epoch": 1.6464513369345302, "learning_rate": 4.530048589483479e-06, "loss": 2.493041687011719, "step": 1364500 }, { "epoch": 1.646572000257013, "learning_rate": 4.52964475401574e-06, "loss": 2.4741810607910155, "step": 1364600 }, { "epoch": 1.6466926635794956, "learning_rate": 4.529240918548002e-06, "loss": 2.4540060424804686, "step": 1364700 }, { "epoch": 1.6468133269019782, "learning_rate": 4.528837083080264e-06, "loss": 2.4701202392578123, "step": 1364800 }, { "epoch": 1.6469339902244609, "learning_rate": 4.528433247612526e-06, "loss": 2.476046142578125, "step": 1364900 }, { "epoch": 1.6470546535469435, "learning_rate": 4.528029412144787e-06, "loss": 2.4923326110839845, "step": 1365000 }, { "epoch": 1.6471753168694263, "learning_rate": 4.527625576677048e-06, "loss": 2.4799876403808594, "step": 1365100 }, { "epoch": 1.647295980191909, "learning_rate": 4.52722174120931e-06, "loss": 2.4739524841308596, "step": 1365200 }, { "epoch": 1.6474166435143918, "learning_rate": 4.526817905741572e-06, "loss": 2.4444305419921877, "step": 1365300 }, { "epoch": 1.6475373068368744, "learning_rate": 4.526414070273833e-06, "loss": 2.4628390502929687, "step": 1365400 }, { "epoch": 1.647657970159357, "learning_rate": 4.526010234806095e-06, "loss": 2.467962646484375, "step": 1365500 }, { "epoch": 1.6477786334818396, "learning_rate": 4.525606399338356e-06, "loss": 2.4864773559570312, "step": 1365600 }, { "epoch": 1.6478992968043225, "learning_rate": 4.525202563870618e-06, "loss": 2.495503692626953, "step": 1365700 }, { "epoch": 1.648019960126805, "learning_rate": 4.524798728402879e-06, "loss": 2.498335876464844, "step": 1365800 }, { "epoch": 1.648140623449288, "learning_rate": 4.524394892935141e-06, "loss": 2.4566305541992186, "step": 1365900 }, { "epoch": 1.6482612867717705, "learning_rate": 4.523991057467403e-06, "loss": 2.4690480041503906, "step": 1366000 }, { "epoch": 1.6483819500942531, "learning_rate": 4.523587221999664e-06, "loss": 2.4690928649902344, "step": 1366100 }, { "epoch": 1.6485026134167358, "learning_rate": 4.5231833865319255e-06, "loss": 2.4577711486816405, "step": 1366200 }, { "epoch": 1.6486232767392184, "learning_rate": 4.5227795510641875e-06, "loss": 2.455832824707031, "step": 1366300 }, { "epoch": 1.6487439400617012, "learning_rate": 4.5223757155964495e-06, "loss": 2.4749290466308596, "step": 1366400 }, { "epoch": 1.6488646033841838, "learning_rate": 4.521971880128711e-06, "loss": 2.457893981933594, "step": 1366500 }, { "epoch": 1.6489852667066667, "learning_rate": 4.521568044660973e-06, "loss": 2.4566741943359376, "step": 1366600 }, { "epoch": 1.6491059300291493, "learning_rate": 4.521164209193234e-06, "loss": 2.458365173339844, "step": 1366700 }, { "epoch": 1.649226593351632, "learning_rate": 4.520760373725496e-06, "loss": 2.461436462402344, "step": 1366800 }, { "epoch": 1.6493472566741145, "learning_rate": 4.520356538257758e-06, "loss": 2.477538299560547, "step": 1366900 }, { "epoch": 1.6494679199965971, "learning_rate": 4.519952702790019e-06, "loss": 2.4476223754882813, "step": 1367000 }, { "epoch": 1.64958858331908, "learning_rate": 4.51954886732228e-06, "loss": 2.487091522216797, "step": 1367100 }, { "epoch": 1.6497092466415628, "learning_rate": 4.519145031854542e-06, "loss": 2.4638829040527344, "step": 1367200 }, { "epoch": 1.6498299099640454, "learning_rate": 4.518741196386804e-06, "loss": 2.459974670410156, "step": 1367300 }, { "epoch": 1.649950573286528, "learning_rate": 4.518337360919065e-06, "loss": 2.4725733947753907, "step": 1367400 }, { "epoch": 1.6500712366090107, "learning_rate": 4.517933525451327e-06, "loss": 2.4658718872070313, "step": 1367500 }, { "epoch": 1.6501918999314933, "learning_rate": 4.517529689983588e-06, "loss": 2.4750889587402343, "step": 1367600 }, { "epoch": 1.6503125632539761, "learning_rate": 4.51712585451585e-06, "loss": 2.481510009765625, "step": 1367700 }, { "epoch": 1.6504332265764587, "learning_rate": 4.516722019048111e-06, "loss": 2.4698858642578125, "step": 1367800 }, { "epoch": 1.6505538898989416, "learning_rate": 4.516318183580373e-06, "loss": 2.4797601318359375, "step": 1367900 }, { "epoch": 1.6506745532214242, "learning_rate": 4.515914348112635e-06, "loss": 2.4688043212890625, "step": 1368000 }, { "epoch": 1.6507952165439068, "learning_rate": 4.515510512644896e-06, "loss": 2.47051025390625, "step": 1368100 }, { "epoch": 1.6509158798663894, "learning_rate": 4.5151066771771575e-06, "loss": 2.4642379760742186, "step": 1368200 }, { "epoch": 1.651036543188872, "learning_rate": 4.5147028417094195e-06, "loss": 2.498116912841797, "step": 1368300 }, { "epoch": 1.651157206511355, "learning_rate": 4.5142990062416815e-06, "loss": 2.4751194763183593, "step": 1368400 }, { "epoch": 1.6512778698338375, "learning_rate": 4.5138951707739435e-06, "loss": 2.467332000732422, "step": 1368500 }, { "epoch": 1.6513985331563203, "learning_rate": 4.513491335306205e-06, "loss": 2.455491180419922, "step": 1368600 }, { "epoch": 1.651519196478803, "learning_rate": 4.513087499838466e-06, "loss": 2.4566806030273436, "step": 1368700 }, { "epoch": 1.6516398598012856, "learning_rate": 4.512683664370728e-06, "loss": 2.4556953430175783, "step": 1368800 }, { "epoch": 1.6517605231237682, "learning_rate": 4.51227982890299e-06, "loss": 2.4691468811035158, "step": 1368900 }, { "epoch": 1.6518811864462508, "learning_rate": 4.511875993435251e-06, "loss": 2.4716041564941404, "step": 1369000 }, { "epoch": 1.6520018497687337, "learning_rate": 4.511472157967513e-06, "loss": 2.4782780456542968, "step": 1369100 }, { "epoch": 1.6521225130912165, "learning_rate": 4.511068322499774e-06, "loss": 2.463293151855469, "step": 1369200 }, { "epoch": 1.652243176413699, "learning_rate": 4.510664487032036e-06, "loss": 2.466751708984375, "step": 1369300 }, { "epoch": 1.6523638397361817, "learning_rate": 4.510260651564298e-06, "loss": 2.4490260314941406, "step": 1369400 }, { "epoch": 1.6524845030586643, "learning_rate": 4.509856816096559e-06, "loss": 2.4754518127441405, "step": 1369500 }, { "epoch": 1.652605166381147, "learning_rate": 4.509452980628821e-06, "loss": 2.4825340270996095, "step": 1369600 }, { "epoch": 1.6527258297036298, "learning_rate": 4.509049145161082e-06, "loss": 2.4768670654296874, "step": 1369700 }, { "epoch": 1.6528464930261124, "learning_rate": 4.508645309693344e-06, "loss": 2.4574053955078123, "step": 1369800 }, { "epoch": 1.6529671563485953, "learning_rate": 4.508241474225605e-06, "loss": 2.4962359619140626, "step": 1369900 }, { "epoch": 1.6530878196710779, "learning_rate": 4.507837638757867e-06, "loss": 2.4606761169433593, "step": 1370000 }, { "epoch": 1.6532084829935605, "learning_rate": 4.507433803290128e-06, "loss": 2.461589813232422, "step": 1370100 }, { "epoch": 1.653329146316043, "learning_rate": 4.50702996782239e-06, "loss": 2.478772735595703, "step": 1370200 }, { "epoch": 1.6534498096385257, "learning_rate": 4.5066261323546515e-06, "loss": 2.4648951721191406, "step": 1370300 }, { "epoch": 1.6535704729610086, "learning_rate": 4.5062222968869135e-06, "loss": 2.456135101318359, "step": 1370400 }, { "epoch": 1.6536911362834912, "learning_rate": 4.5058184614191755e-06, "loss": 2.469218902587891, "step": 1370500 }, { "epoch": 1.653811799605974, "learning_rate": 4.505414625951437e-06, "loss": 2.477667236328125, "step": 1370600 }, { "epoch": 1.6539324629284566, "learning_rate": 4.505010790483698e-06, "loss": 2.4726158142089845, "step": 1370700 }, { "epoch": 1.6540531262509393, "learning_rate": 4.50460695501596e-06, "loss": 2.4568724060058593, "step": 1370800 }, { "epoch": 1.6541737895734219, "learning_rate": 4.504203119548222e-06, "loss": 2.489882354736328, "step": 1370900 }, { "epoch": 1.6542944528959047, "learning_rate": 4.503799284080484e-06, "loss": 2.4584913635253907, "step": 1371000 }, { "epoch": 1.6544151162183873, "learning_rate": 4.503395448612745e-06, "loss": 2.4570439147949217, "step": 1371100 }, { "epoch": 1.6545357795408702, "learning_rate": 4.502991613145006e-06, "loss": 2.4810182189941408, "step": 1371200 }, { "epoch": 1.6546564428633528, "learning_rate": 4.502587777677268e-06, "loss": 2.4724961853027345, "step": 1371300 }, { "epoch": 1.6547771061858354, "learning_rate": 4.50218394220953e-06, "loss": 2.447090301513672, "step": 1371400 }, { "epoch": 1.654897769508318, "learning_rate": 4.501780106741791e-06, "loss": 2.479362030029297, "step": 1371500 }, { "epoch": 1.6550184328308006, "learning_rate": 4.501376271274053e-06, "loss": 2.4753318786621095, "step": 1371600 }, { "epoch": 1.6551390961532835, "learning_rate": 4.500972435806314e-06, "loss": 2.4645730590820314, "step": 1371700 }, { "epoch": 1.655259759475766, "learning_rate": 4.500568600338576e-06, "loss": 2.4738157653808592, "step": 1371800 }, { "epoch": 1.655380422798249, "learning_rate": 4.500164764870837e-06, "loss": 2.4681263732910157, "step": 1371900 }, { "epoch": 1.6555010861207315, "learning_rate": 4.499760929403099e-06, "loss": 2.484277801513672, "step": 1372000 }, { "epoch": 1.6556217494432142, "learning_rate": 4.499357093935361e-06, "loss": 2.4690170288085938, "step": 1372100 }, { "epoch": 1.6557424127656968, "learning_rate": 4.4989532584676224e-06, "loss": 2.4742860412597656, "step": 1372200 }, { "epoch": 1.6558630760881794, "learning_rate": 4.4985494229998836e-06, "loss": 2.4741227722167967, "step": 1372300 }, { "epoch": 1.6559837394106622, "learning_rate": 4.4981455875321455e-06, "loss": 2.4868104553222654, "step": 1372400 }, { "epoch": 1.656104402733145, "learning_rate": 4.4977417520644075e-06, "loss": 2.498457336425781, "step": 1372500 }, { "epoch": 1.6562250660556277, "learning_rate": 4.497337916596669e-06, "loss": 2.4635101318359376, "step": 1372600 }, { "epoch": 1.6563457293781103, "learning_rate": 4.496934081128931e-06, "loss": 2.4658837890625, "step": 1372700 }, { "epoch": 1.656466392700593, "learning_rate": 4.496530245661192e-06, "loss": 2.4698606872558595, "step": 1372800 }, { "epoch": 1.6565870560230755, "learning_rate": 4.496126410193454e-06, "loss": 2.4600930786132813, "step": 1372900 }, { "epoch": 1.6567077193455584, "learning_rate": 4.495722574725716e-06, "loss": 2.4708863830566408, "step": 1373000 }, { "epoch": 1.656828382668041, "learning_rate": 4.495318739257977e-06, "loss": 2.4736056518554688, "step": 1373100 }, { "epoch": 1.6569490459905238, "learning_rate": 4.494914903790238e-06, "loss": 2.45256103515625, "step": 1373200 }, { "epoch": 1.6570697093130065, "learning_rate": 4.4945110683225e-06, "loss": 2.4663119506835938, "step": 1373300 }, { "epoch": 1.657190372635489, "learning_rate": 4.494107232854762e-06, "loss": 2.4748834228515624, "step": 1373400 }, { "epoch": 1.6573110359579717, "learning_rate": 4.493703397387023e-06, "loss": 2.4780036926269533, "step": 1373500 }, { "epoch": 1.6574316992804543, "learning_rate": 4.493299561919285e-06, "loss": 2.4790908813476564, "step": 1373600 }, { "epoch": 1.6575523626029371, "learning_rate": 4.492895726451546e-06, "loss": 2.4694453430175782, "step": 1373700 }, { "epoch": 1.6576730259254198, "learning_rate": 4.492491890983808e-06, "loss": 2.4641786193847657, "step": 1373800 }, { "epoch": 1.6577936892479026, "learning_rate": 4.492088055516069e-06, "loss": 2.446552429199219, "step": 1373900 }, { "epoch": 1.6579143525703852, "learning_rate": 4.491684220048331e-06, "loss": 2.4324974060058593, "step": 1374000 }, { "epoch": 1.6580350158928678, "learning_rate": 4.491280384580593e-06, "loss": 2.469823913574219, "step": 1374100 }, { "epoch": 1.6581556792153505, "learning_rate": 4.4908765491128545e-06, "loss": 2.450864105224609, "step": 1374200 }, { "epoch": 1.658276342537833, "learning_rate": 4.490472713645116e-06, "loss": 2.4863951110839846, "step": 1374300 }, { "epoch": 1.658397005860316, "learning_rate": 4.4900688781773776e-06, "loss": 2.4925080871582033, "step": 1374400 }, { "epoch": 1.6585176691827987, "learning_rate": 4.4896650427096396e-06, "loss": 2.48117919921875, "step": 1374500 }, { "epoch": 1.6586383325052814, "learning_rate": 4.4892612072419015e-06, "loss": 2.4775074768066405, "step": 1374600 }, { "epoch": 1.658758995827764, "learning_rate": 4.488857371774163e-06, "loss": 2.481750793457031, "step": 1374700 }, { "epoch": 1.6588796591502466, "learning_rate": 4.488453536306424e-06, "loss": 2.4626896667480467, "step": 1374800 }, { "epoch": 1.6590003224727292, "learning_rate": 4.488049700838686e-06, "loss": 2.473968200683594, "step": 1374900 }, { "epoch": 1.659120985795212, "learning_rate": 4.487645865370948e-06, "loss": 2.469404754638672, "step": 1375000 }, { "epoch": 1.6592416491176947, "learning_rate": 4.48724202990321e-06, "loss": 2.463692932128906, "step": 1375100 }, { "epoch": 1.6593623124401775, "learning_rate": 4.486838194435471e-06, "loss": 2.473457489013672, "step": 1375200 }, { "epoch": 1.6594829757626601, "learning_rate": 4.486434358967732e-06, "loss": 2.4702146911621092, "step": 1375300 }, { "epoch": 1.6596036390851427, "learning_rate": 4.486030523499994e-06, "loss": 2.4710870361328126, "step": 1375400 }, { "epoch": 1.6597243024076254, "learning_rate": 4.485626688032256e-06, "loss": 2.47525390625, "step": 1375500 }, { "epoch": 1.659844965730108, "learning_rate": 4.485222852564517e-06, "loss": 2.45270263671875, "step": 1375600 }, { "epoch": 1.6599656290525908, "learning_rate": 4.484819017096779e-06, "loss": 2.4669754028320314, "step": 1375700 }, { "epoch": 1.6600862923750737, "learning_rate": 4.48441518162904e-06, "loss": 2.4955403137207033, "step": 1375800 }, { "epoch": 1.6602069556975563, "learning_rate": 4.484011346161302e-06, "loss": 2.471352081298828, "step": 1375900 }, { "epoch": 1.660327619020039, "learning_rate": 4.483607510693563e-06, "loss": 2.458121032714844, "step": 1376000 }, { "epoch": 1.6604482823425215, "learning_rate": 4.483203675225825e-06, "loss": 2.4799844360351564, "step": 1376100 }, { "epoch": 1.6605689456650041, "learning_rate": 4.4827998397580865e-06, "loss": 2.464932556152344, "step": 1376200 }, { "epoch": 1.660689608987487, "learning_rate": 4.4823960042903485e-06, "loss": 2.4488975524902346, "step": 1376300 }, { "epoch": 1.6608102723099696, "learning_rate": 4.48199216882261e-06, "loss": 2.4607386779785156, "step": 1376400 }, { "epoch": 1.6609309356324524, "learning_rate": 4.481588333354872e-06, "loss": 2.4745028686523436, "step": 1376500 }, { "epoch": 1.661051598954935, "learning_rate": 4.4811844978871336e-06, "loss": 2.4561862182617187, "step": 1376600 }, { "epoch": 1.6611722622774177, "learning_rate": 4.480780662419395e-06, "loss": 2.4465568542480467, "step": 1376700 }, { "epoch": 1.6612929255999003, "learning_rate": 4.480376826951656e-06, "loss": 2.4865676879882814, "step": 1376800 }, { "epoch": 1.661413588922383, "learning_rate": 4.479972991483918e-06, "loss": 2.4628556823730468, "step": 1376900 }, { "epoch": 1.6615342522448657, "learning_rate": 4.47956915601618e-06, "loss": 2.4651304626464845, "step": 1377000 }, { "epoch": 1.6616549155673483, "learning_rate": 4.479165320548442e-06, "loss": 2.488120422363281, "step": 1377100 }, { "epoch": 1.6617755788898312, "learning_rate": 4.478761485080703e-06, "loss": 2.449748840332031, "step": 1377200 }, { "epoch": 1.6618962422123138, "learning_rate": 4.478357649612964e-06, "loss": 2.479856262207031, "step": 1377300 }, { "epoch": 1.6620169055347964, "learning_rate": 4.477953814145226e-06, "loss": 2.46491455078125, "step": 1377400 }, { "epoch": 1.662137568857279, "learning_rate": 4.477549978677488e-06, "loss": 2.466708068847656, "step": 1377500 }, { "epoch": 1.6622582321797617, "learning_rate": 4.477146143209749e-06, "loss": 2.475411834716797, "step": 1377600 }, { "epoch": 1.6623788955022445, "learning_rate": 4.476742307742011e-06, "loss": 2.4799368286132815, "step": 1377700 }, { "epoch": 1.6624995588247273, "learning_rate": 4.476338472274272e-06, "loss": 2.456706085205078, "step": 1377800 }, { "epoch": 1.66262022214721, "learning_rate": 4.475934636806534e-06, "loss": 2.4951220703125, "step": 1377900 }, { "epoch": 1.6627408854696926, "learning_rate": 4.475530801338795e-06, "loss": 2.4477389526367186, "step": 1378000 }, { "epoch": 1.6628615487921752, "learning_rate": 4.475126965871057e-06, "loss": 2.4961155700683593, "step": 1378100 }, { "epoch": 1.6629822121146578, "learning_rate": 4.474723130403319e-06, "loss": 2.442541046142578, "step": 1378200 }, { "epoch": 1.6631028754371406, "learning_rate": 4.4743192949355805e-06, "loss": 2.4577732849121094, "step": 1378300 }, { "epoch": 1.6632235387596233, "learning_rate": 4.473915459467842e-06, "loss": 2.4821942138671873, "step": 1378400 }, { "epoch": 1.663344202082106, "learning_rate": 4.473511624000104e-06, "loss": 2.495380096435547, "step": 1378500 }, { "epoch": 1.6634648654045887, "learning_rate": 4.473107788532366e-06, "loss": 2.479944305419922, "step": 1378600 }, { "epoch": 1.6635855287270713, "learning_rate": 4.472703953064627e-06, "loss": 2.4627447509765625, "step": 1378700 }, { "epoch": 1.663706192049554, "learning_rate": 4.472300117596889e-06, "loss": 2.465126190185547, "step": 1378800 }, { "epoch": 1.6638268553720366, "learning_rate": 4.47189628212915e-06, "loss": 2.4766361999511717, "step": 1378900 }, { "epoch": 1.6639475186945194, "learning_rate": 4.471492446661412e-06, "loss": 2.4650128173828123, "step": 1379000 }, { "epoch": 1.664068182017002, "learning_rate": 4.471088611193674e-06, "loss": 2.449069366455078, "step": 1379100 }, { "epoch": 1.6641888453394849, "learning_rate": 4.470684775725935e-06, "loss": 2.447931823730469, "step": 1379200 }, { "epoch": 1.6643095086619675, "learning_rate": 4.470280940258196e-06, "loss": 2.453088836669922, "step": 1379300 }, { "epoch": 1.66443017198445, "learning_rate": 4.469877104790458e-06, "loss": 2.484203643798828, "step": 1379400 }, { "epoch": 1.6645508353069327, "learning_rate": 4.46947326932272e-06, "loss": 2.4518917846679686, "step": 1379500 }, { "epoch": 1.6646714986294153, "learning_rate": 4.469069433854982e-06, "loss": 2.4757989501953124, "step": 1379600 }, { "epoch": 1.6647921619518982, "learning_rate": 4.468665598387243e-06, "loss": 2.4663847351074217, "step": 1379700 }, { "epoch": 1.664912825274381, "learning_rate": 4.468261762919504e-06, "loss": 2.4736982727050782, "step": 1379800 }, { "epoch": 1.6650334885968636, "learning_rate": 4.467857927451766e-06, "loss": 2.4627943420410157, "step": 1379900 }, { "epoch": 1.6651541519193462, "learning_rate": 4.467454091984028e-06, "loss": 2.4501295471191407, "step": 1380000 }, { "epoch": 1.6652748152418289, "learning_rate": 4.467050256516289e-06, "loss": 2.500682525634766, "step": 1380100 }, { "epoch": 1.6653954785643115, "learning_rate": 4.466646421048551e-06, "loss": 2.475130615234375, "step": 1380200 }, { "epoch": 1.6655161418867943, "learning_rate": 4.4662425855808125e-06, "loss": 2.465468444824219, "step": 1380300 }, { "epoch": 1.665636805209277, "learning_rate": 4.4658387501130745e-06, "loss": 2.4557926940917967, "step": 1380400 }, { "epoch": 1.6657574685317598, "learning_rate": 4.465434914645336e-06, "loss": 2.478487548828125, "step": 1380500 }, { "epoch": 1.6658781318542424, "learning_rate": 4.465031079177598e-06, "loss": 2.4742662048339845, "step": 1380600 }, { "epoch": 1.665998795176725, "learning_rate": 4.46462724370986e-06, "loss": 2.4878741455078126, "step": 1380700 }, { "epoch": 1.6661194584992076, "learning_rate": 4.464223408242121e-06, "loss": 2.4796702575683596, "step": 1380800 }, { "epoch": 1.6662401218216902, "learning_rate": 4.463819572774382e-06, "loss": 2.4819097900390625, "step": 1380900 }, { "epoch": 1.666360785144173, "learning_rate": 4.463415737306644e-06, "loss": 2.4551126098632814, "step": 1381000 }, { "epoch": 1.666481448466656, "learning_rate": 4.463011901838906e-06, "loss": 2.464055480957031, "step": 1381100 }, { "epoch": 1.6666021117891385, "learning_rate": 4.462608066371168e-06, "loss": 2.4793580627441405, "step": 1381200 }, { "epoch": 1.6667227751116211, "learning_rate": 4.462204230903429e-06, "loss": 2.4510130310058593, "step": 1381300 }, { "epoch": 1.6668434384341038, "learning_rate": 4.46180039543569e-06, "loss": 2.481181335449219, "step": 1381400 }, { "epoch": 1.6669641017565864, "learning_rate": 4.461396559967952e-06, "loss": 2.48408935546875, "step": 1381500 }, { "epoch": 1.6670847650790692, "learning_rate": 4.460992724500214e-06, "loss": 2.4522019958496095, "step": 1381600 }, { "epoch": 1.6672054284015518, "learning_rate": 4.460588889032475e-06, "loss": 2.458484649658203, "step": 1381700 }, { "epoch": 1.6673260917240347, "learning_rate": 4.460185053564737e-06, "loss": 2.477429962158203, "step": 1381800 }, { "epoch": 1.6674467550465173, "learning_rate": 4.459781218096998e-06, "loss": 2.445456237792969, "step": 1381900 }, { "epoch": 1.667567418369, "learning_rate": 4.45937738262926e-06, "loss": 2.4605722045898437, "step": 1382000 }, { "epoch": 1.6676880816914825, "learning_rate": 4.458973547161521e-06, "loss": 2.4588888549804686, "step": 1382100 }, { "epoch": 1.6678087450139651, "learning_rate": 4.458569711693783e-06, "loss": 2.466283874511719, "step": 1382200 }, { "epoch": 1.667929408336448, "learning_rate": 4.4581658762260445e-06, "loss": 2.466041717529297, "step": 1382300 }, { "epoch": 1.6680500716589306, "learning_rate": 4.4577620407583065e-06, "loss": 2.4501683044433595, "step": 1382400 }, { "epoch": 1.6681707349814134, "learning_rate": 4.457358205290568e-06, "loss": 2.458643798828125, "step": 1382500 }, { "epoch": 1.668291398303896, "learning_rate": 4.45695436982283e-06, "loss": 2.473623046875, "step": 1382600 }, { "epoch": 1.6684120616263787, "learning_rate": 4.456550534355092e-06, "loss": 2.4491839599609375, "step": 1382700 }, { "epoch": 1.6685327249488613, "learning_rate": 4.456146698887353e-06, "loss": 2.458401947021484, "step": 1382800 }, { "epoch": 1.668653388271344, "learning_rate": 4.455742863419614e-06, "loss": 2.473976898193359, "step": 1382900 }, { "epoch": 1.6687740515938267, "learning_rate": 4.455339027951876e-06, "loss": 2.4823435974121093, "step": 1383000 }, { "epoch": 1.6688947149163096, "learning_rate": 4.454935192484138e-06, "loss": 2.484225616455078, "step": 1383100 }, { "epoch": 1.6690153782387922, "learning_rate": 4.4545313570164e-06, "loss": 2.468769073486328, "step": 1383200 }, { "epoch": 1.6691360415612748, "learning_rate": 4.454127521548661e-06, "loss": 2.4350425720214846, "step": 1383300 }, { "epoch": 1.6692567048837574, "learning_rate": 4.453723686080922e-06, "loss": 2.4393353271484375, "step": 1383400 }, { "epoch": 1.66937736820624, "learning_rate": 4.453319850613184e-06, "loss": 2.463369140625, "step": 1383500 }, { "epoch": 1.669498031528723, "learning_rate": 4.452916015145446e-06, "loss": 2.484258117675781, "step": 1383600 }, { "epoch": 1.6696186948512055, "learning_rate": 4.452512179677707e-06, "loss": 2.4845201110839845, "step": 1383700 }, { "epoch": 1.6697393581736883, "learning_rate": 4.452108344209969e-06, "loss": 2.4574160766601563, "step": 1383800 }, { "epoch": 1.669860021496171, "learning_rate": 4.45170450874223e-06, "loss": 2.4946279907226563, "step": 1383900 }, { "epoch": 1.6699806848186536, "learning_rate": 4.451300673274492e-06, "loss": 2.4562940979003907, "step": 1384000 }, { "epoch": 1.6701013481411362, "learning_rate": 4.4508968378067534e-06, "loss": 2.46593017578125, "step": 1384100 }, { "epoch": 1.6702220114636188, "learning_rate": 4.4504930023390154e-06, "loss": 2.4888099670410155, "step": 1384200 }, { "epoch": 1.6703426747861017, "learning_rate": 4.450089166871277e-06, "loss": 2.4846092224121095, "step": 1384300 }, { "epoch": 1.6704633381085843, "learning_rate": 4.4496853314035385e-06, "loss": 2.4670835876464845, "step": 1384400 }, { "epoch": 1.6705840014310671, "learning_rate": 4.4492814959358e-06, "loss": 2.4592851257324218, "step": 1384500 }, { "epoch": 1.6707046647535497, "learning_rate": 4.448877660468062e-06, "loss": 2.487588653564453, "step": 1384600 }, { "epoch": 1.6708253280760323, "learning_rate": 4.448473825000324e-06, "loss": 2.463221435546875, "step": 1384700 }, { "epoch": 1.670945991398515, "learning_rate": 4.448069989532585e-06, "loss": 2.464902191162109, "step": 1384800 }, { "epoch": 1.6710666547209976, "learning_rate": 4.447666154064847e-06, "loss": 2.4620550537109374, "step": 1384900 }, { "epoch": 1.6711873180434804, "learning_rate": 4.447262318597108e-06, "loss": 2.476096496582031, "step": 1385000 }, { "epoch": 1.6713079813659633, "learning_rate": 4.44685848312937e-06, "loss": 2.4545353698730468, "step": 1385100 }, { "epoch": 1.6714286446884459, "learning_rate": 4.446454647661632e-06, "loss": 2.4767335510253905, "step": 1385200 }, { "epoch": 1.6715493080109285, "learning_rate": 4.446050812193893e-06, "loss": 2.478337860107422, "step": 1385300 }, { "epoch": 1.671669971333411, "learning_rate": 4.445646976726154e-06, "loss": 2.480748596191406, "step": 1385400 }, { "epoch": 1.6717906346558937, "learning_rate": 4.445243141258416e-06, "loss": 2.4541049194335938, "step": 1385500 }, { "epoch": 1.6719112979783766, "learning_rate": 4.444839305790678e-06, "loss": 2.458035583496094, "step": 1385600 }, { "epoch": 1.6720319613008592, "learning_rate": 4.44443547032294e-06, "loss": 2.456343536376953, "step": 1385700 }, { "epoch": 1.672152624623342, "learning_rate": 4.444031634855201e-06, "loss": 2.478015899658203, "step": 1385800 }, { "epoch": 1.6722732879458246, "learning_rate": 4.443627799387462e-06, "loss": 2.4858282470703124, "step": 1385900 }, { "epoch": 1.6723939512683073, "learning_rate": 4.443223963919724e-06, "loss": 2.4588685607910157, "step": 1386000 }, { "epoch": 1.6725146145907899, "learning_rate": 4.442820128451986e-06, "loss": 2.475159912109375, "step": 1386100 }, { "epoch": 1.6726352779132725, "learning_rate": 4.4424162929842475e-06, "loss": 2.4777655029296874, "step": 1386200 }, { "epoch": 1.6727559412357553, "learning_rate": 4.4420124575165094e-06, "loss": 2.4776095581054687, "step": 1386300 }, { "epoch": 1.6728766045582382, "learning_rate": 4.4416086220487706e-06, "loss": 2.4771051025390625, "step": 1386400 }, { "epoch": 1.6729972678807208, "learning_rate": 4.4412047865810326e-06, "loss": 2.48466552734375, "step": 1386500 }, { "epoch": 1.6731179312032034, "learning_rate": 4.440800951113294e-06, "loss": 2.4623587036132815, "step": 1386600 }, { "epoch": 1.673238594525686, "learning_rate": 4.440397115645556e-06, "loss": 2.4731495666503904, "step": 1386700 }, { "epoch": 1.6733592578481686, "learning_rate": 4.439993280177818e-06, "loss": 2.47348876953125, "step": 1386800 }, { "epoch": 1.6734799211706515, "learning_rate": 4.439589444710079e-06, "loss": 2.4795867919921877, "step": 1386900 }, { "epoch": 1.673600584493134, "learning_rate": 4.43918560924234e-06, "loss": 2.4425840759277344, "step": 1387000 }, { "epoch": 1.673721247815617, "learning_rate": 4.438781773774602e-06, "loss": 2.48661376953125, "step": 1387100 }, { "epoch": 1.6738419111380995, "learning_rate": 4.438377938306864e-06, "loss": 2.4575343322753906, "step": 1387200 }, { "epoch": 1.6739625744605822, "learning_rate": 4.437974102839125e-06, "loss": 2.4490838623046876, "step": 1387300 }, { "epoch": 1.6740832377830648, "learning_rate": 4.437570267371387e-06, "loss": 2.4651968383789065, "step": 1387400 }, { "epoch": 1.6742039011055474, "learning_rate": 4.437166431903648e-06, "loss": 2.479906005859375, "step": 1387500 }, { "epoch": 1.6743245644280302, "learning_rate": 4.43676259643591e-06, "loss": 2.4602421569824218, "step": 1387600 }, { "epoch": 1.6744452277505129, "learning_rate": 4.436358760968172e-06, "loss": 2.45675048828125, "step": 1387700 }, { "epoch": 1.6745658910729957, "learning_rate": 4.435954925500433e-06, "loss": 2.4619287109375, "step": 1387800 }, { "epoch": 1.6746865543954783, "learning_rate": 4.435551090032694e-06, "loss": 2.457548828125, "step": 1387900 }, { "epoch": 1.674807217717961, "learning_rate": 4.435147254564956e-06, "loss": 2.4470362854003906, "step": 1388000 }, { "epoch": 1.6749278810404435, "learning_rate": 4.434743419097218e-06, "loss": 2.4731016540527344, "step": 1388100 }, { "epoch": 1.6750485443629262, "learning_rate": 4.4343395836294795e-06, "loss": 2.483837890625, "step": 1388200 }, { "epoch": 1.675169207685409, "learning_rate": 4.4339357481617415e-06, "loss": 2.4598509216308595, "step": 1388300 }, { "epoch": 1.6752898710078918, "learning_rate": 4.433531912694003e-06, "loss": 2.4671316528320313, "step": 1388400 }, { "epoch": 1.6754105343303745, "learning_rate": 4.433128077226265e-06, "loss": 2.4934080505371092, "step": 1388500 }, { "epoch": 1.675531197652857, "learning_rate": 4.432724241758526e-06, "loss": 2.4457192993164063, "step": 1388600 }, { "epoch": 1.6756518609753397, "learning_rate": 4.432320406290788e-06, "loss": 2.445237121582031, "step": 1388700 }, { "epoch": 1.6757725242978223, "learning_rate": 4.43191657082305e-06, "loss": 2.4608953857421874, "step": 1388800 }, { "epoch": 1.6758931876203051, "learning_rate": 4.431512735355311e-06, "loss": 2.4664845275878906, "step": 1388900 }, { "epoch": 1.6760138509427878, "learning_rate": 4.431108899887572e-06, "loss": 2.4362159729003907, "step": 1389000 }, { "epoch": 1.6761345142652706, "learning_rate": 4.430705064419834e-06, "loss": 2.4471453857421874, "step": 1389100 }, { "epoch": 1.6762551775877532, "learning_rate": 4.430301228952096e-06, "loss": 2.448023681640625, "step": 1389200 }, { "epoch": 1.6763758409102358, "learning_rate": 4.429897393484358e-06, "loss": 2.457105865478516, "step": 1389300 }, { "epoch": 1.6764965042327185, "learning_rate": 4.429493558016619e-06, "loss": 2.480714874267578, "step": 1389400 }, { "epoch": 1.676617167555201, "learning_rate": 4.42908972254888e-06, "loss": 2.4588471984863283, "step": 1389500 }, { "epoch": 1.676737830877684, "learning_rate": 4.428685887081142e-06, "loss": 2.465537109375, "step": 1389600 }, { "epoch": 1.6768584942001665, "learning_rate": 4.428282051613404e-06, "loss": 2.4619181823730467, "step": 1389700 }, { "epoch": 1.6769791575226494, "learning_rate": 4.427878216145665e-06, "loss": 2.4536256408691406, "step": 1389800 }, { "epoch": 1.677099820845132, "learning_rate": 4.427474380677927e-06, "loss": 2.465886993408203, "step": 1389900 }, { "epoch": 1.6772204841676146, "learning_rate": 4.427070545210188e-06, "loss": 2.4463427734375, "step": 1390000 }, { "epoch": 1.6773411474900972, "learning_rate": 4.42666670974245e-06, "loss": 2.450686187744141, "step": 1390100 }, { "epoch": 1.6774618108125798, "learning_rate": 4.426262874274712e-06, "loss": 2.461154327392578, "step": 1390200 }, { "epoch": 1.6775824741350627, "learning_rate": 4.4258590388069735e-06, "loss": 2.4668653869628905, "step": 1390300 }, { "epoch": 1.6777031374575455, "learning_rate": 4.4254552033392355e-06, "loss": 2.475655822753906, "step": 1390400 }, { "epoch": 1.6778238007800281, "learning_rate": 4.425051367871497e-06, "loss": 2.4754368591308595, "step": 1390500 }, { "epoch": 1.6779444641025107, "learning_rate": 4.424647532403759e-06, "loss": 2.457433319091797, "step": 1390600 }, { "epoch": 1.6780651274249934, "learning_rate": 4.42424369693602e-06, "loss": 2.4543472290039063, "step": 1390700 }, { "epoch": 1.678185790747476, "learning_rate": 4.423839861468282e-06, "loss": 2.4584310913085936, "step": 1390800 }, { "epoch": 1.6783064540699588, "learning_rate": 4.423436026000543e-06, "loss": 2.4614189147949217, "step": 1390900 }, { "epoch": 1.6784271173924414, "learning_rate": 4.423032190532805e-06, "loss": 2.446219635009766, "step": 1391000 }, { "epoch": 1.6785477807149243, "learning_rate": 4.422628355065066e-06, "loss": 2.4569085693359374, "step": 1391100 }, { "epoch": 1.678668444037407, "learning_rate": 4.422224519597328e-06, "loss": 2.4581407165527343, "step": 1391200 }, { "epoch": 1.6787891073598895, "learning_rate": 4.42182068412959e-06, "loss": 2.487965393066406, "step": 1391300 }, { "epoch": 1.6789097706823721, "learning_rate": 4.421416848661851e-06, "loss": 2.464552917480469, "step": 1391400 }, { "epoch": 1.6790304340048547, "learning_rate": 4.421013013194112e-06, "loss": 2.4598316955566406, "step": 1391500 }, { "epoch": 1.6791510973273376, "learning_rate": 4.420609177726374e-06, "loss": 2.454126434326172, "step": 1391600 }, { "epoch": 1.6792717606498204, "learning_rate": 4.420205342258636e-06, "loss": 2.4896473693847656, "step": 1391700 }, { "epoch": 1.679392423972303, "learning_rate": 4.419801506790898e-06, "loss": 2.460379943847656, "step": 1391800 }, { "epoch": 1.6795130872947857, "learning_rate": 4.419397671323159e-06, "loss": 2.4553897094726564, "step": 1391900 }, { "epoch": 1.6796337506172683, "learning_rate": 4.41899383585542e-06, "loss": 2.4520887756347656, "step": 1392000 }, { "epoch": 1.679754413939751, "learning_rate": 4.418590000387682e-06, "loss": 2.462191619873047, "step": 1392100 }, { "epoch": 1.6798750772622337, "learning_rate": 4.418186164919944e-06, "loss": 2.438992462158203, "step": 1392200 }, { "epoch": 1.6799957405847163, "learning_rate": 4.4177823294522055e-06, "loss": 2.4806806945800783, "step": 1392300 }, { "epoch": 1.6801164039071992, "learning_rate": 4.4173784939844675e-06, "loss": 2.4518058776855467, "step": 1392400 }, { "epoch": 1.6802370672296818, "learning_rate": 4.416974658516729e-06, "loss": 2.4553253173828127, "step": 1392500 }, { "epoch": 1.6803577305521644, "learning_rate": 4.416570823048991e-06, "loss": 2.489476623535156, "step": 1392600 }, { "epoch": 1.680478393874647, "learning_rate": 4.416166987581252e-06, "loss": 2.4934953308105468, "step": 1392700 }, { "epoch": 1.6805990571971297, "learning_rate": 4.415763152113514e-06, "loss": 2.471820526123047, "step": 1392800 }, { "epoch": 1.6807197205196125, "learning_rate": 4.415359316645776e-06, "loss": 2.4687420654296877, "step": 1392900 }, { "epoch": 1.680840383842095, "learning_rate": 4.414955481178037e-06, "loss": 2.483216094970703, "step": 1393000 }, { "epoch": 1.680961047164578, "learning_rate": 4.414551645710298e-06, "loss": 2.460579376220703, "step": 1393100 }, { "epoch": 1.6810817104870606, "learning_rate": 4.41414781024256e-06, "loss": 2.462721862792969, "step": 1393200 }, { "epoch": 1.6812023738095432, "learning_rate": 4.413743974774822e-06, "loss": 2.4665589904785157, "step": 1393300 }, { "epoch": 1.6813230371320258, "learning_rate": 4.413340139307083e-06, "loss": 2.470220184326172, "step": 1393400 }, { "epoch": 1.6814437004545084, "learning_rate": 4.412936303839345e-06, "loss": 2.446187286376953, "step": 1393500 }, { "epoch": 1.6815643637769913, "learning_rate": 4.412532468371606e-06, "loss": 2.4705905151367187, "step": 1393600 }, { "epoch": 1.681685027099474, "learning_rate": 4.412128632903868e-06, "loss": 2.448405914306641, "step": 1393700 }, { "epoch": 1.6818056904219567, "learning_rate": 4.41172479743613e-06, "loss": 2.445928192138672, "step": 1393800 }, { "epoch": 1.6819263537444393, "learning_rate": 4.411320961968391e-06, "loss": 2.473443603515625, "step": 1393900 }, { "epoch": 1.682047017066922, "learning_rate": 4.4109171265006524e-06, "loss": 2.4558607482910157, "step": 1394000 }, { "epoch": 1.6821676803894046, "learning_rate": 4.410513291032914e-06, "loss": 2.4691119384765625, "step": 1394100 }, { "epoch": 1.6822883437118874, "learning_rate": 4.410109455565176e-06, "loss": 2.464374542236328, "step": 1394200 }, { "epoch": 1.68240900703437, "learning_rate": 4.4097056200974375e-06, "loss": 2.4458343505859377, "step": 1394300 }, { "epoch": 1.6825296703568529, "learning_rate": 4.4093017846296995e-06, "loss": 2.4560084533691406, "step": 1394400 }, { "epoch": 1.6826503336793355, "learning_rate": 4.408897949161961e-06, "loss": 2.4618040466308595, "step": 1394500 }, { "epoch": 1.682770997001818, "learning_rate": 4.408494113694223e-06, "loss": 2.480364227294922, "step": 1394600 }, { "epoch": 1.6828916603243007, "learning_rate": 4.408090278226484e-06, "loss": 2.47927978515625, "step": 1394700 }, { "epoch": 1.6830123236467833, "learning_rate": 4.407686442758746e-06, "loss": 2.4614947509765623, "step": 1394800 }, { "epoch": 1.6831329869692662, "learning_rate": 4.407282607291008e-06, "loss": 2.4584312438964844, "step": 1394900 }, { "epoch": 1.6832536502917488, "learning_rate": 4.406878771823269e-06, "loss": 2.4560162353515627, "step": 1395000 }, { "epoch": 1.6833743136142316, "learning_rate": 4.406474936355531e-06, "loss": 2.449065856933594, "step": 1395100 }, { "epoch": 1.6834949769367142, "learning_rate": 4.406071100887792e-06, "loss": 2.4886903381347656, "step": 1395200 }, { "epoch": 1.6836156402591969, "learning_rate": 4.405667265420054e-06, "loss": 2.463245391845703, "step": 1395300 }, { "epoch": 1.6837363035816795, "learning_rate": 4.405263429952316e-06, "loss": 2.4609638977050783, "step": 1395400 }, { "epoch": 1.683856966904162, "learning_rate": 4.404859594484577e-06, "loss": 2.475473175048828, "step": 1395500 }, { "epoch": 1.683977630226645, "learning_rate": 4.404455759016838e-06, "loss": 2.4585006713867186, "step": 1395600 }, { "epoch": 1.6840982935491278, "learning_rate": 4.4040519235491e-06, "loss": 2.4606040954589843, "step": 1395700 }, { "epoch": 1.6842189568716104, "learning_rate": 4.403648088081362e-06, "loss": 2.420870056152344, "step": 1395800 }, { "epoch": 1.684339620194093, "learning_rate": 4.403244252613624e-06, "loss": 2.4587893676757813, "step": 1395900 }, { "epoch": 1.6844602835165756, "learning_rate": 4.402840417145885e-06, "loss": 2.4496273803710937, "step": 1396000 }, { "epoch": 1.6845809468390582, "learning_rate": 4.4024365816781464e-06, "loss": 2.4368252563476562, "step": 1396100 }, { "epoch": 1.684701610161541, "learning_rate": 4.4020327462104084e-06, "loss": 2.448835754394531, "step": 1396200 }, { "epoch": 1.6848222734840237, "learning_rate": 4.40162891074267e-06, "loss": 2.4647027587890626, "step": 1396300 }, { "epoch": 1.6849429368065065, "learning_rate": 4.4012250752749315e-06, "loss": 2.4583055114746095, "step": 1396400 }, { "epoch": 1.6850636001289891, "learning_rate": 4.4008212398071935e-06, "loss": 2.44340576171875, "step": 1396500 }, { "epoch": 1.6851842634514718, "learning_rate": 4.400417404339455e-06, "loss": 2.483348083496094, "step": 1396600 }, { "epoch": 1.6853049267739544, "learning_rate": 4.400013568871717e-06, "loss": 2.4516058349609375, "step": 1396700 }, { "epoch": 1.685425590096437, "learning_rate": 4.399609733403978e-06, "loss": 2.465727996826172, "step": 1396800 }, { "epoch": 1.6855462534189198, "learning_rate": 4.39920589793624e-06, "loss": 2.464395751953125, "step": 1396900 }, { "epoch": 1.6856669167414027, "learning_rate": 4.398802062468501e-06, "loss": 2.4505078125, "step": 1397000 }, { "epoch": 1.6857875800638853, "learning_rate": 4.398398227000763e-06, "loss": 2.4930596923828126, "step": 1397100 }, { "epoch": 1.685908243386368, "learning_rate": 4.397994391533024e-06, "loss": 2.479439697265625, "step": 1397200 }, { "epoch": 1.6860289067088505, "learning_rate": 4.397590556065286e-06, "loss": 2.4530633544921874, "step": 1397300 }, { "epoch": 1.6861495700313331, "learning_rate": 4.397186720597548e-06, "loss": 2.463265686035156, "step": 1397400 }, { "epoch": 1.686270233353816, "learning_rate": 4.396782885129809e-06, "loss": 2.4830577087402346, "step": 1397500 }, { "epoch": 1.6863908966762986, "learning_rate": 4.39637904966207e-06, "loss": 2.4566581726074217, "step": 1397600 }, { "epoch": 1.6865115599987814, "learning_rate": 4.395975214194332e-06, "loss": 2.430181121826172, "step": 1397700 }, { "epoch": 1.686632223321264, "learning_rate": 4.395571378726594e-06, "loss": 2.465390625, "step": 1397800 }, { "epoch": 1.6867528866437467, "learning_rate": 4.395167543258856e-06, "loss": 2.4810916137695314, "step": 1397900 }, { "epoch": 1.6868735499662293, "learning_rate": 4.394763707791117e-06, "loss": 2.4603997802734376, "step": 1398000 }, { "epoch": 1.686994213288712, "learning_rate": 4.3943598723233785e-06, "loss": 2.4577330017089842, "step": 1398100 }, { "epoch": 1.6871148766111947, "learning_rate": 4.3939560368556405e-06, "loss": 2.4507075500488282, "step": 1398200 }, { "epoch": 1.6872355399336774, "learning_rate": 4.3935522013879024e-06, "loss": 2.4536297607421873, "step": 1398300 }, { "epoch": 1.6873562032561602, "learning_rate": 4.3931483659201636e-06, "loss": 2.4801397705078125, "step": 1398400 }, { "epoch": 1.6874768665786428, "learning_rate": 4.3927445304524256e-06, "loss": 2.452580871582031, "step": 1398500 }, { "epoch": 1.6875975299011254, "learning_rate": 4.392340694984687e-06, "loss": 2.4656135559082033, "step": 1398600 }, { "epoch": 1.687718193223608, "learning_rate": 4.391936859516949e-06, "loss": 2.4578207397460936, "step": 1398700 }, { "epoch": 1.6878388565460907, "learning_rate": 4.39153302404921e-06, "loss": 2.5017176818847657, "step": 1398800 }, { "epoch": 1.6879595198685735, "learning_rate": 4.391129188581472e-06, "loss": 2.473213653564453, "step": 1398900 }, { "epoch": 1.6880801831910563, "learning_rate": 4.390725353113734e-06, "loss": 2.461872863769531, "step": 1399000 }, { "epoch": 1.688200846513539, "learning_rate": 4.390321517645995e-06, "loss": 2.465686798095703, "step": 1399100 }, { "epoch": 1.6883215098360216, "learning_rate": 4.389917682178256e-06, "loss": 2.479508361816406, "step": 1399200 }, { "epoch": 1.6884421731585042, "learning_rate": 4.389513846710518e-06, "loss": 2.45537841796875, "step": 1399300 }, { "epoch": 1.6885628364809868, "learning_rate": 4.38911001124278e-06, "loss": 2.4718687438964846, "step": 1399400 }, { "epoch": 1.6886834998034697, "learning_rate": 4.388706175775041e-06, "loss": 2.4497109985351564, "step": 1399500 }, { "epoch": 1.6888041631259523, "learning_rate": 4.388302340307303e-06, "loss": 2.461878204345703, "step": 1399600 }, { "epoch": 1.6889248264484351, "learning_rate": 4.387898504839564e-06, "loss": 2.438685302734375, "step": 1399700 }, { "epoch": 1.6890454897709177, "learning_rate": 4.387494669371826e-06, "loss": 2.466356201171875, "step": 1399800 }, { "epoch": 1.6891661530934003, "learning_rate": 4.387090833904088e-06, "loss": 2.468499755859375, "step": 1399900 }, { "epoch": 1.689286816415883, "learning_rate": 4.386686998436349e-06, "loss": 2.4583189392089846, "step": 1400000 }, { "epoch": 1.6894074797383656, "learning_rate": 4.3862831629686105e-06, "loss": 2.4525515747070314, "step": 1400100 }, { "epoch": 1.6895281430608484, "learning_rate": 4.3858793275008725e-06, "loss": 2.452608947753906, "step": 1400200 }, { "epoch": 1.689648806383331, "learning_rate": 4.3854754920331345e-06, "loss": 2.4757337951660157, "step": 1400300 }, { "epoch": 1.6897694697058139, "learning_rate": 4.3850716565653964e-06, "loss": 2.4790827941894533, "step": 1400400 }, { "epoch": 1.6898901330282965, "learning_rate": 4.384667821097658e-06, "loss": 2.467046661376953, "step": 1400500 }, { "epoch": 1.690010796350779, "learning_rate": 4.384263985629919e-06, "loss": 2.4514959716796874, "step": 1400600 }, { "epoch": 1.6901314596732617, "learning_rate": 4.383860150162181e-06, "loss": 2.4538592529296874, "step": 1400700 }, { "epoch": 1.6902521229957443, "learning_rate": 4.383456314694443e-06, "loss": 2.4567420959472654, "step": 1400800 }, { "epoch": 1.6903727863182272, "learning_rate": 4.383052479226704e-06, "loss": 2.4553919982910157, "step": 1400900 }, { "epoch": 1.69049344964071, "learning_rate": 4.382648643758966e-06, "loss": 2.466982727050781, "step": 1401000 }, { "epoch": 1.6906141129631926, "learning_rate": 4.382244808291227e-06, "loss": 2.4730332946777343, "step": 1401100 }, { "epoch": 1.6907347762856753, "learning_rate": 4.381840972823489e-06, "loss": 2.4661363220214843, "step": 1401200 }, { "epoch": 1.6908554396081579, "learning_rate": 4.38143713735575e-06, "loss": 2.4718408203125, "step": 1401300 }, { "epoch": 1.6909761029306405, "learning_rate": 4.381033301888012e-06, "loss": 2.474401397705078, "step": 1401400 }, { "epoch": 1.6910967662531233, "learning_rate": 4.380629466420274e-06, "loss": 2.4631619262695312, "step": 1401500 }, { "epoch": 1.691217429575606, "learning_rate": 4.380225630952535e-06, "loss": 2.4401202392578125, "step": 1401600 }, { "epoch": 1.6913380928980888, "learning_rate": 4.379821795484796e-06, "loss": 2.457394561767578, "step": 1401700 }, { "epoch": 1.6914587562205714, "learning_rate": 4.379417960017058e-06, "loss": 2.4679698181152343, "step": 1401800 }, { "epoch": 1.691579419543054, "learning_rate": 4.37901412454932e-06, "loss": 2.4760700988769533, "step": 1401900 }, { "epoch": 1.6917000828655366, "learning_rate": 4.378610289081581e-06, "loss": 2.4792486572265626, "step": 1402000 }, { "epoch": 1.6918207461880193, "learning_rate": 4.378206453613843e-06, "loss": 2.453805694580078, "step": 1402100 }, { "epoch": 1.691941409510502, "learning_rate": 4.3778026181461045e-06, "loss": 2.4498031616210936, "step": 1402200 }, { "epoch": 1.692062072832985, "learning_rate": 4.3773987826783665e-06, "loss": 2.4638067626953126, "step": 1402300 }, { "epoch": 1.6921827361554675, "learning_rate": 4.3769949472106285e-06, "loss": 2.445967559814453, "step": 1402400 }, { "epoch": 1.6923033994779502, "learning_rate": 4.37659111174289e-06, "loss": 2.46228271484375, "step": 1402500 }, { "epoch": 1.6924240628004328, "learning_rate": 4.376187276275151e-06, "loss": 2.4427813720703124, "step": 1402600 }, { "epoch": 1.6925447261229154, "learning_rate": 4.375783440807413e-06, "loss": 2.4835569763183596, "step": 1402700 }, { "epoch": 1.6926653894453982, "learning_rate": 4.375379605339675e-06, "loss": 2.468610382080078, "step": 1402800 }, { "epoch": 1.6927860527678809, "learning_rate": 4.374975769871936e-06, "loss": 2.4701429748535157, "step": 1402900 }, { "epoch": 1.6929067160903637, "learning_rate": 4.374571934404198e-06, "loss": 2.450090179443359, "step": 1403000 }, { "epoch": 1.6930273794128463, "learning_rate": 4.374168098936459e-06, "loss": 2.4562777709960937, "step": 1403100 }, { "epoch": 1.693148042735329, "learning_rate": 4.373764263468721e-06, "loss": 2.458932342529297, "step": 1403200 }, { "epoch": 1.6932687060578115, "learning_rate": 4.373360428000982e-06, "loss": 2.485481872558594, "step": 1403300 }, { "epoch": 1.6933893693802942, "learning_rate": 4.372956592533244e-06, "loss": 2.4747605895996094, "step": 1403400 }, { "epoch": 1.693510032702777, "learning_rate": 4.372552757065506e-06, "loss": 2.4976995849609374, "step": 1403500 }, { "epoch": 1.6936306960252596, "learning_rate": 4.372148921597767e-06, "loss": 2.4692288208007813, "step": 1403600 }, { "epoch": 1.6937513593477425, "learning_rate": 4.371745086130028e-06, "loss": 2.458132019042969, "step": 1403700 }, { "epoch": 1.693872022670225, "learning_rate": 4.37134125066229e-06, "loss": 2.428267059326172, "step": 1403800 }, { "epoch": 1.6939926859927077, "learning_rate": 4.370937415194552e-06, "loss": 2.4794351196289064, "step": 1403900 }, { "epoch": 1.6941133493151903, "learning_rate": 4.370533579726814e-06, "loss": 2.4842929077148437, "step": 1404000 }, { "epoch": 1.694234012637673, "learning_rate": 4.370129744259075e-06, "loss": 2.4840151977539064, "step": 1404100 }, { "epoch": 1.6943546759601558, "learning_rate": 4.3697259087913365e-06, "loss": 2.4604727172851564, "step": 1404200 }, { "epoch": 1.6944753392826386, "learning_rate": 4.3693220733235985e-06, "loss": 2.4813131713867187, "step": 1404300 }, { "epoch": 1.6945960026051212, "learning_rate": 4.3689182378558605e-06, "loss": 2.461470031738281, "step": 1404400 }, { "epoch": 1.6947166659276038, "learning_rate": 4.368514402388122e-06, "loss": 2.4640316772460937, "step": 1404500 }, { "epoch": 1.6948373292500865, "learning_rate": 4.368110566920384e-06, "loss": 2.4519200134277344, "step": 1404600 }, { "epoch": 1.694957992572569, "learning_rate": 4.367706731452645e-06, "loss": 2.4764363098144533, "step": 1404700 }, { "epoch": 1.695078655895052, "learning_rate": 4.367302895984907e-06, "loss": 2.472412872314453, "step": 1404800 }, { "epoch": 1.6951993192175345, "learning_rate": 4.366899060517168e-06, "loss": 2.450214691162109, "step": 1404900 }, { "epoch": 1.6953199825400174, "learning_rate": 4.36649522504943e-06, "loss": 2.456734619140625, "step": 1405000 }, { "epoch": 1.6954406458625, "learning_rate": 4.366091389581692e-06, "loss": 2.4596844482421876, "step": 1405100 }, { "epoch": 1.6955613091849826, "learning_rate": 4.365687554113953e-06, "loss": 2.466045684814453, "step": 1405200 }, { "epoch": 1.6956819725074652, "learning_rate": 4.365283718646215e-06, "loss": 2.433414306640625, "step": 1405300 }, { "epoch": 1.6958026358299478, "learning_rate": 4.364879883178476e-06, "loss": 2.4607008361816405, "step": 1405400 }, { "epoch": 1.6959232991524307, "learning_rate": 4.364476047710738e-06, "loss": 2.4564469909667968, "step": 1405500 }, { "epoch": 1.6960439624749133, "learning_rate": 4.364072212242999e-06, "loss": 2.464841613769531, "step": 1405600 }, { "epoch": 1.6961646257973961, "learning_rate": 4.363668376775261e-06, "loss": 2.4714401245117186, "step": 1405700 }, { "epoch": 1.6962852891198787, "learning_rate": 4.363264541307522e-06, "loss": 2.4442265319824217, "step": 1405800 }, { "epoch": 1.6964059524423614, "learning_rate": 4.362860705839784e-06, "loss": 2.449453887939453, "step": 1405900 }, { "epoch": 1.696526615764844, "learning_rate": 4.362456870372046e-06, "loss": 2.4542808532714844, "step": 1406000 }, { "epoch": 1.6966472790873266, "learning_rate": 4.3620530349043074e-06, "loss": 2.455785827636719, "step": 1406100 }, { "epoch": 1.6967679424098094, "learning_rate": 4.3616491994365686e-06, "loss": 2.464772186279297, "step": 1406200 }, { "epoch": 1.6968886057322923, "learning_rate": 4.3612453639688305e-06, "loss": 2.464488983154297, "step": 1406300 }, { "epoch": 1.697009269054775, "learning_rate": 4.3608415285010925e-06, "loss": 2.4620938110351562, "step": 1406400 }, { "epoch": 1.6971299323772575, "learning_rate": 4.3604376930333545e-06, "loss": 2.458221740722656, "step": 1406500 }, { "epoch": 1.6972505956997401, "learning_rate": 4.360033857565616e-06, "loss": 2.455583038330078, "step": 1406600 }, { "epoch": 1.6973712590222227, "learning_rate": 4.359630022097877e-06, "loss": 2.4736761474609374, "step": 1406700 }, { "epoch": 1.6974919223447056, "learning_rate": 4.359226186630139e-06, "loss": 2.4783731079101563, "step": 1406800 }, { "epoch": 1.6976125856671882, "learning_rate": 4.358822351162401e-06, "loss": 2.450773010253906, "step": 1406900 }, { "epoch": 1.697733248989671, "learning_rate": 4.358418515694662e-06, "loss": 2.4793646240234377, "step": 1407000 }, { "epoch": 1.6978539123121537, "learning_rate": 4.358014680226924e-06, "loss": 2.4690301513671873, "step": 1407100 }, { "epoch": 1.6979745756346363, "learning_rate": 4.357610844759185e-06, "loss": 2.4714353942871092, "step": 1407200 }, { "epoch": 1.698095238957119, "learning_rate": 4.357207009291447e-06, "loss": 2.501964874267578, "step": 1407300 }, { "epoch": 1.6982159022796015, "learning_rate": 4.356803173823708e-06, "loss": 2.438695526123047, "step": 1407400 }, { "epoch": 1.6983365656020843, "learning_rate": 4.35639933835597e-06, "loss": 2.4966688537597657, "step": 1407500 }, { "epoch": 1.6984572289245672, "learning_rate": 4.355995502888232e-06, "loss": 2.4650816345214843, "step": 1407600 }, { "epoch": 1.6985778922470498, "learning_rate": 4.355591667420493e-06, "loss": 2.44453857421875, "step": 1407700 }, { "epoch": 1.6986985555695324, "learning_rate": 4.355187831952754e-06, "loss": 2.471200408935547, "step": 1407800 }, { "epoch": 1.698819218892015, "learning_rate": 4.354783996485016e-06, "loss": 2.482058563232422, "step": 1407900 }, { "epoch": 1.6989398822144977, "learning_rate": 4.354380161017278e-06, "loss": 2.437109069824219, "step": 1408000 }, { "epoch": 1.6990605455369805, "learning_rate": 4.3539763255495394e-06, "loss": 2.4645094299316406, "step": 1408100 }, { "epoch": 1.699181208859463, "learning_rate": 4.3535724900818014e-06, "loss": 2.475280303955078, "step": 1408200 }, { "epoch": 1.699301872181946, "learning_rate": 4.3531686546140626e-06, "loss": 2.4509788513183595, "step": 1408300 }, { "epoch": 1.6994225355044286, "learning_rate": 4.3527648191463246e-06, "loss": 2.4662579345703124, "step": 1408400 }, { "epoch": 1.6995431988269112, "learning_rate": 4.3523609836785865e-06, "loss": 2.441392059326172, "step": 1408500 }, { "epoch": 1.6996638621493938, "learning_rate": 4.351957148210848e-06, "loss": 2.4626072692871093, "step": 1408600 }, { "epoch": 1.6997845254718764, "learning_rate": 4.351553312743109e-06, "loss": 2.4467083740234377, "step": 1408700 }, { "epoch": 1.6999051887943593, "learning_rate": 4.351149477275371e-06, "loss": 2.4677279663085936, "step": 1408800 }, { "epoch": 1.7000258521168419, "learning_rate": 4.350745641807633e-06, "loss": 2.4731320190429686, "step": 1408900 }, { "epoch": 1.7001465154393247, "learning_rate": 4.350341806339894e-06, "loss": 2.484238586425781, "step": 1409000 }, { "epoch": 1.7002671787618073, "learning_rate": 4.349937970872156e-06, "loss": 2.441298370361328, "step": 1409100 }, { "epoch": 1.70038784208429, "learning_rate": 4.349534135404417e-06, "loss": 2.465948181152344, "step": 1409200 }, { "epoch": 1.7005085054067726, "learning_rate": 4.349130299936679e-06, "loss": 2.469999084472656, "step": 1409300 }, { "epoch": 1.7006291687292552, "learning_rate": 4.34872646446894e-06, "loss": 2.4759788513183594, "step": 1409400 }, { "epoch": 1.700749832051738, "learning_rate": 4.348322629001202e-06, "loss": 2.4665151977539064, "step": 1409500 }, { "epoch": 1.7008704953742209, "learning_rate": 4.347918793533464e-06, "loss": 2.455044860839844, "step": 1409600 }, { "epoch": 1.7009911586967035, "learning_rate": 4.347514958065725e-06, "loss": 2.467832336425781, "step": 1409700 }, { "epoch": 1.701111822019186, "learning_rate": 4.347111122597986e-06, "loss": 2.4712158203125, "step": 1409800 }, { "epoch": 1.7012324853416687, "learning_rate": 4.346707287130248e-06, "loss": 2.453932037353516, "step": 1409900 }, { "epoch": 1.7013531486641513, "learning_rate": 4.34630345166251e-06, "loss": 2.45540771484375, "step": 1410000 }, { "epoch": 1.7014738119866342, "learning_rate": 4.345899616194772e-06, "loss": 2.458579864501953, "step": 1410100 }, { "epoch": 1.7015944753091168, "learning_rate": 4.3454957807270335e-06, "loss": 2.4388238525390626, "step": 1410200 }, { "epoch": 1.7017151386315996, "learning_rate": 4.345091945259295e-06, "loss": 2.456751251220703, "step": 1410300 }, { "epoch": 1.7018358019540822, "learning_rate": 4.3446881097915566e-06, "loss": 2.4554119873046876, "step": 1410400 }, { "epoch": 1.7019564652765649, "learning_rate": 4.3442842743238186e-06, "loss": 2.457088623046875, "step": 1410500 }, { "epoch": 1.7020771285990475, "learning_rate": 4.3438804388560805e-06, "loss": 2.4772413635253905, "step": 1410600 }, { "epoch": 1.70219779192153, "learning_rate": 4.343476603388342e-06, "loss": 2.473338623046875, "step": 1410700 }, { "epoch": 1.702318455244013, "learning_rate": 4.343072767920603e-06, "loss": 2.4616160583496094, "step": 1410800 }, { "epoch": 1.7024391185664955, "learning_rate": 4.342668932452865e-06, "loss": 2.4676397705078124, "step": 1410900 }, { "epoch": 1.7025597818889784, "learning_rate": 4.342265096985127e-06, "loss": 2.470564270019531, "step": 1411000 }, { "epoch": 1.702680445211461, "learning_rate": 4.341861261517388e-06, "loss": 2.4685205078125, "step": 1411100 }, { "epoch": 1.7028011085339436, "learning_rate": 4.34145742604965e-06, "loss": 2.4673414611816407, "step": 1411200 }, { "epoch": 1.7029217718564262, "learning_rate": 4.341053590581911e-06, "loss": 2.4548431396484376, "step": 1411300 }, { "epoch": 1.7030424351789089, "learning_rate": 4.340649755114173e-06, "loss": 2.4871726989746095, "step": 1411400 }, { "epoch": 1.7031630985013917, "learning_rate": 4.340245919646434e-06, "loss": 2.4894456481933593, "step": 1411500 }, { "epoch": 1.7032837618238745, "learning_rate": 4.339842084178696e-06, "loss": 2.4542724609375, "step": 1411600 }, { "epoch": 1.7034044251463571, "learning_rate": 4.339438248710957e-06, "loss": 2.451200408935547, "step": 1411700 }, { "epoch": 1.7035250884688398, "learning_rate": 4.339034413243219e-06, "loss": 2.4472979736328124, "step": 1411800 }, { "epoch": 1.7036457517913224, "learning_rate": 4.33863057777548e-06, "loss": 2.4624197387695315, "step": 1411900 }, { "epoch": 1.703766415113805, "learning_rate": 4.338226742307742e-06, "loss": 2.491749725341797, "step": 1412000 }, { "epoch": 1.7038870784362878, "learning_rate": 4.337822906840004e-06, "loss": 2.4598040771484375, "step": 1412100 }, { "epoch": 1.7040077417587705, "learning_rate": 4.3374190713722655e-06, "loss": 2.4880625915527346, "step": 1412200 }, { "epoch": 1.7041284050812533, "learning_rate": 4.337015235904527e-06, "loss": 2.444446258544922, "step": 1412300 }, { "epoch": 1.704249068403736, "learning_rate": 4.336611400436789e-06, "loss": 2.4549832153320312, "step": 1412400 }, { "epoch": 1.7043697317262185, "learning_rate": 4.336207564969051e-06, "loss": 2.4626263427734374, "step": 1412500 }, { "epoch": 1.7044903950487011, "learning_rate": 4.3358037295013126e-06, "loss": 2.4819610595703123, "step": 1412600 }, { "epoch": 1.7046110583711838, "learning_rate": 4.335399894033574e-06, "loss": 2.4537721252441407, "step": 1412700 }, { "epoch": 1.7047317216936666, "learning_rate": 4.334996058565835e-06, "loss": 2.4726519775390625, "step": 1412800 }, { "epoch": 1.7048523850161494, "learning_rate": 4.334592223098097e-06, "loss": 2.4701947021484374, "step": 1412900 }, { "epoch": 1.704973048338632, "learning_rate": 4.334188387630359e-06, "loss": 2.470902862548828, "step": 1413000 }, { "epoch": 1.7050937116611147, "learning_rate": 4.33378455216262e-06, "loss": 2.4569938659667967, "step": 1413100 }, { "epoch": 1.7052143749835973, "learning_rate": 4.333380716694882e-06, "loss": 2.4627903747558593, "step": 1413200 }, { "epoch": 1.70533503830608, "learning_rate": 4.332976881227143e-06, "loss": 2.455294647216797, "step": 1413300 }, { "epoch": 1.7054557016285627, "learning_rate": 4.332573045759405e-06, "loss": 2.4603334045410157, "step": 1413400 }, { "epoch": 1.7055763649510454, "learning_rate": 4.332169210291666e-06, "loss": 2.4516616821289063, "step": 1413500 }, { "epoch": 1.7056970282735282, "learning_rate": 4.331765374823928e-06, "loss": 2.4321900939941408, "step": 1413600 }, { "epoch": 1.7058176915960108, "learning_rate": 4.33136153935619e-06, "loss": 2.4454345703125, "step": 1413700 }, { "epoch": 1.7059383549184934, "learning_rate": 4.330957703888451e-06, "loss": 2.4652023315429688, "step": 1413800 }, { "epoch": 1.706059018240976, "learning_rate": 4.330553868420712e-06, "loss": 2.4711558532714846, "step": 1413900 }, { "epoch": 1.7061796815634587, "learning_rate": 4.330150032952974e-06, "loss": 2.437969055175781, "step": 1414000 }, { "epoch": 1.7063003448859415, "learning_rate": 4.329746197485236e-06, "loss": 2.4366909790039064, "step": 1414100 }, { "epoch": 1.7064210082084241, "learning_rate": 4.3293423620174975e-06, "loss": 2.451346130371094, "step": 1414200 }, { "epoch": 1.706541671530907, "learning_rate": 4.3289385265497595e-06, "loss": 2.478682098388672, "step": 1414300 }, { "epoch": 1.7066623348533896, "learning_rate": 4.328534691082021e-06, "loss": 2.4691178894042967, "step": 1414400 }, { "epoch": 1.7067829981758722, "learning_rate": 4.328130855614283e-06, "loss": 2.446663513183594, "step": 1414500 }, { "epoch": 1.7069036614983548, "learning_rate": 4.327727020146545e-06, "loss": 2.459270172119141, "step": 1414600 }, { "epoch": 1.7070243248208374, "learning_rate": 4.327323184678806e-06, "loss": 2.436489715576172, "step": 1414700 }, { "epoch": 1.7071449881433203, "learning_rate": 4.326919349211067e-06, "loss": 2.462583312988281, "step": 1414800 }, { "epoch": 1.7072656514658031, "learning_rate": 4.326515513743329e-06, "loss": 2.459047546386719, "step": 1414900 }, { "epoch": 1.7073863147882857, "learning_rate": 4.326111678275591e-06, "loss": 2.463664093017578, "step": 1415000 }, { "epoch": 1.7075069781107683, "learning_rate": 4.325707842807852e-06, "loss": 2.4808535766601563, "step": 1415100 }, { "epoch": 1.707627641433251, "learning_rate": 4.325304007340114e-06, "loss": 2.4479106140136717, "step": 1415200 }, { "epoch": 1.7077483047557336, "learning_rate": 4.324900171872375e-06, "loss": 2.4819049072265624, "step": 1415300 }, { "epoch": 1.7078689680782164, "learning_rate": 4.324496336404637e-06, "loss": 2.470409698486328, "step": 1415400 }, { "epoch": 1.707989631400699, "learning_rate": 4.324092500936898e-06, "loss": 2.433829498291016, "step": 1415500 }, { "epoch": 1.7081102947231819, "learning_rate": 4.32368866546916e-06, "loss": 2.4444879150390624, "step": 1415600 }, { "epoch": 1.7082309580456645, "learning_rate": 4.323284830001422e-06, "loss": 2.4295417785644533, "step": 1415700 }, { "epoch": 1.708351621368147, "learning_rate": 4.322880994533683e-06, "loss": 2.4523170471191404, "step": 1415800 }, { "epoch": 1.7084722846906297, "learning_rate": 4.322477159065945e-06, "loss": 2.474806213378906, "step": 1415900 }, { "epoch": 1.7085929480131123, "learning_rate": 4.322073323598206e-06, "loss": 2.469368438720703, "step": 1416000 }, { "epoch": 1.7087136113355952, "learning_rate": 4.321669488130468e-06, "loss": 2.459792175292969, "step": 1416100 }, { "epoch": 1.7088342746580778, "learning_rate": 4.32126565266273e-06, "loss": 2.445548400878906, "step": 1416200 }, { "epoch": 1.7089549379805606, "learning_rate": 4.3208618171949915e-06, "loss": 2.4435745239257813, "step": 1416300 }, { "epoch": 1.7090756013030433, "learning_rate": 4.320457981727253e-06, "loss": 2.458118743896484, "step": 1416400 }, { "epoch": 1.7091962646255259, "learning_rate": 4.320054146259515e-06, "loss": 2.456534881591797, "step": 1416500 }, { "epoch": 1.7093169279480085, "learning_rate": 4.319650310791777e-06, "loss": 2.4609698486328124, "step": 1416600 }, { "epoch": 1.709437591270491, "learning_rate": 4.319246475324039e-06, "loss": 2.4616392517089842, "step": 1416700 }, { "epoch": 1.709558254592974, "learning_rate": 4.3188426398563e-06, "loss": 2.422191314697266, "step": 1416800 }, { "epoch": 1.7096789179154568, "learning_rate": 4.318438804388561e-06, "loss": 2.454493408203125, "step": 1416900 }, { "epoch": 1.7097995812379394, "learning_rate": 4.318034968920823e-06, "loss": 2.447174835205078, "step": 1417000 }, { "epoch": 1.709920244560422, "learning_rate": 4.317631133453085e-06, "loss": 2.4383949279785155, "step": 1417100 }, { "epoch": 1.7100409078829046, "learning_rate": 4.317227297985346e-06, "loss": 2.4776010131835937, "step": 1417200 }, { "epoch": 1.7101615712053873, "learning_rate": 4.316823462517608e-06, "loss": 2.466388702392578, "step": 1417300 }, { "epoch": 1.71028223452787, "learning_rate": 4.316419627049869e-06, "loss": 2.4596275329589843, "step": 1417400 }, { "epoch": 1.7104028978503527, "learning_rate": 4.316015791582131e-06, "loss": 2.4605792236328123, "step": 1417500 }, { "epoch": 1.7105235611728355, "learning_rate": 4.315611956114392e-06, "loss": 2.4601641845703126, "step": 1417600 }, { "epoch": 1.7106442244953182, "learning_rate": 4.315208120646654e-06, "loss": 2.4415464782714844, "step": 1417700 }, { "epoch": 1.7107648878178008, "learning_rate": 4.314804285178915e-06, "loss": 2.48698974609375, "step": 1417800 }, { "epoch": 1.7108855511402834, "learning_rate": 4.314400449711177e-06, "loss": 2.463195495605469, "step": 1417900 }, { "epoch": 1.711006214462766, "learning_rate": 4.3139966142434384e-06, "loss": 2.4646261596679686, "step": 1418000 }, { "epoch": 1.7111268777852489, "learning_rate": 4.3135927787757004e-06, "loss": 2.467511749267578, "step": 1418100 }, { "epoch": 1.7112475411077317, "learning_rate": 4.313188943307962e-06, "loss": 2.4798793029785156, "step": 1418200 }, { "epoch": 1.7113682044302143, "learning_rate": 4.3127851078402235e-06, "loss": 2.4632102966308596, "step": 1418300 }, { "epoch": 1.711488867752697, "learning_rate": 4.312381272372485e-06, "loss": 2.470011901855469, "step": 1418400 }, { "epoch": 1.7116095310751795, "learning_rate": 4.311977436904747e-06, "loss": 2.4684402465820314, "step": 1418500 }, { "epoch": 1.7117301943976622, "learning_rate": 4.311573601437009e-06, "loss": 2.4637428283691407, "step": 1418600 }, { "epoch": 1.711850857720145, "learning_rate": 4.311169765969271e-06, "loss": 2.467489471435547, "step": 1418700 }, { "epoch": 1.7119715210426276, "learning_rate": 4.310765930501532e-06, "loss": 2.4601332092285157, "step": 1418800 }, { "epoch": 1.7120921843651105, "learning_rate": 4.310362095033793e-06, "loss": 2.464981689453125, "step": 1418900 }, { "epoch": 1.712212847687593, "learning_rate": 4.309958259566055e-06, "loss": 2.448725128173828, "step": 1419000 }, { "epoch": 1.7123335110100757, "learning_rate": 4.309554424098317e-06, "loss": 2.444896545410156, "step": 1419100 }, { "epoch": 1.7124541743325583, "learning_rate": 4.309150588630578e-06, "loss": 2.4303547668457033, "step": 1419200 }, { "epoch": 1.712574837655041, "learning_rate": 4.30874675316284e-06, "loss": 2.466103363037109, "step": 1419300 }, { "epoch": 1.7126955009775238, "learning_rate": 4.308342917695101e-06, "loss": 2.4640544128417967, "step": 1419400 }, { "epoch": 1.7128161643000064, "learning_rate": 4.307939082227363e-06, "loss": 2.451612091064453, "step": 1419500 }, { "epoch": 1.7129368276224892, "learning_rate": 4.307535246759624e-06, "loss": 2.4525608825683594, "step": 1419600 }, { "epoch": 1.7130574909449718, "learning_rate": 4.307131411291886e-06, "loss": 2.4877891540527344, "step": 1419700 }, { "epoch": 1.7131781542674545, "learning_rate": 4.306727575824148e-06, "loss": 2.4579913330078127, "step": 1419800 }, { "epoch": 1.713298817589937, "learning_rate": 4.306323740356409e-06, "loss": 2.459757537841797, "step": 1419900 }, { "epoch": 1.7134194809124197, "learning_rate": 4.3059199048886705e-06, "loss": 2.4444737243652344, "step": 1420000 }, { "epoch": 1.7135401442349025, "learning_rate": 4.3055160694209325e-06, "loss": 2.4524473571777343, "step": 1420100 }, { "epoch": 1.7136608075573854, "learning_rate": 4.3051122339531944e-06, "loss": 2.464228057861328, "step": 1420200 }, { "epoch": 1.713781470879868, "learning_rate": 4.3047083984854556e-06, "loss": 2.4811366271972655, "step": 1420300 }, { "epoch": 1.7139021342023506, "learning_rate": 4.3043045630177176e-06, "loss": 2.451967468261719, "step": 1420400 }, { "epoch": 1.7140227975248332, "learning_rate": 4.303900727549979e-06, "loss": 2.462845458984375, "step": 1420500 }, { "epoch": 1.7141434608473158, "learning_rate": 4.303496892082241e-06, "loss": 2.4755812072753907, "step": 1420600 }, { "epoch": 1.7142641241697987, "learning_rate": 4.303093056614503e-06, "loss": 2.450179138183594, "step": 1420700 }, { "epoch": 1.7143847874922813, "learning_rate": 4.302689221146764e-06, "loss": 2.4842546081542967, "step": 1420800 }, { "epoch": 1.7145054508147641, "learning_rate": 4.302285385679025e-06, "loss": 2.466470031738281, "step": 1420900 }, { "epoch": 1.7146261141372467, "learning_rate": 4.301881550211287e-06, "loss": 2.467266845703125, "step": 1421000 }, { "epoch": 1.7147467774597294, "learning_rate": 4.301477714743549e-06, "loss": 2.444649200439453, "step": 1421100 }, { "epoch": 1.714867440782212, "learning_rate": 4.301073879275811e-06, "loss": 2.4763519287109377, "step": 1421200 }, { "epoch": 1.7149881041046946, "learning_rate": 4.300670043808072e-06, "loss": 2.4585527038574218, "step": 1421300 }, { "epoch": 1.7151087674271774, "learning_rate": 4.300266208340333e-06, "loss": 2.4603370666503905, "step": 1421400 }, { "epoch": 1.71522943074966, "learning_rate": 4.299862372872595e-06, "loss": 2.4484291076660156, "step": 1421500 }, { "epoch": 1.715350094072143, "learning_rate": 4.299458537404857e-06, "loss": 2.452178649902344, "step": 1421600 }, { "epoch": 1.7154707573946255, "learning_rate": 4.299054701937118e-06, "loss": 2.488423309326172, "step": 1421700 }, { "epoch": 1.7155914207171081, "learning_rate": 4.29865086646938e-06, "loss": 2.4568458557128907, "step": 1421800 }, { "epoch": 1.7157120840395907, "learning_rate": 4.298247031001641e-06, "loss": 2.439658966064453, "step": 1421900 }, { "epoch": 1.7158327473620734, "learning_rate": 4.297843195533903e-06, "loss": 2.4648223876953126, "step": 1422000 }, { "epoch": 1.7159534106845562, "learning_rate": 4.2974393600661645e-06, "loss": 2.4898831176757814, "step": 1422100 }, { "epoch": 1.716074074007039, "learning_rate": 4.2970355245984265e-06, "loss": 2.4667161560058593, "step": 1422200 }, { "epoch": 1.7161947373295217, "learning_rate": 4.2966316891306884e-06, "loss": 2.458739471435547, "step": 1422300 }, { "epoch": 1.7163154006520043, "learning_rate": 4.29622785366295e-06, "loss": 2.4643434143066405, "step": 1422400 }, { "epoch": 1.716436063974487, "learning_rate": 4.295824018195211e-06, "loss": 2.4526416015625, "step": 1422500 }, { "epoch": 1.7165567272969695, "learning_rate": 4.295420182727473e-06, "loss": 2.429936981201172, "step": 1422600 }, { "epoch": 1.7166773906194523, "learning_rate": 4.295016347259735e-06, "loss": 2.464150085449219, "step": 1422700 }, { "epoch": 1.716798053941935, "learning_rate": 4.294612511791996e-06, "loss": 2.4368011474609377, "step": 1422800 }, { "epoch": 1.7169187172644178, "learning_rate": 4.294208676324258e-06, "loss": 2.46609130859375, "step": 1422900 }, { "epoch": 1.7170393805869004, "learning_rate": 4.293804840856519e-06, "loss": 2.471466064453125, "step": 1423000 }, { "epoch": 1.717160043909383, "learning_rate": 4.293401005388781e-06, "loss": 2.433087921142578, "step": 1423100 }, { "epoch": 1.7172807072318657, "learning_rate": 4.292997169921043e-06, "loss": 2.446916198730469, "step": 1423200 }, { "epoch": 1.7174013705543483, "learning_rate": 4.292593334453304e-06, "loss": 2.490755767822266, "step": 1423300 }, { "epoch": 1.7175220338768311, "learning_rate": 4.292189498985565e-06, "loss": 2.4397178649902345, "step": 1423400 }, { "epoch": 1.717642697199314, "learning_rate": 4.291785663517827e-06, "loss": 2.441786346435547, "step": 1423500 }, { "epoch": 1.7177633605217966, "learning_rate": 4.291381828050089e-06, "loss": 2.431874237060547, "step": 1423600 }, { "epoch": 1.7178840238442792, "learning_rate": 4.29097799258235e-06, "loss": 2.470860900878906, "step": 1423700 }, { "epoch": 1.7180046871667618, "learning_rate": 4.290574157114612e-06, "loss": 2.4493307495117187, "step": 1423800 }, { "epoch": 1.7181253504892444, "learning_rate": 4.290170321646873e-06, "loss": 2.4689399719238283, "step": 1423900 }, { "epoch": 1.7182460138117273, "learning_rate": 4.289766486179135e-06, "loss": 2.468946075439453, "step": 1424000 }, { "epoch": 1.7183666771342099, "learning_rate": 4.2893626507113965e-06, "loss": 2.463990020751953, "step": 1424100 }, { "epoch": 1.7184873404566927, "learning_rate": 4.2889588152436585e-06, "loss": 2.43838134765625, "step": 1424200 }, { "epoch": 1.7186080037791753, "learning_rate": 4.2885549797759205e-06, "loss": 2.483845062255859, "step": 1424300 }, { "epoch": 1.718728667101658, "learning_rate": 4.288151144308182e-06, "loss": 2.454181365966797, "step": 1424400 }, { "epoch": 1.7188493304241406, "learning_rate": 4.287747308840443e-06, "loss": 2.448061218261719, "step": 1424500 }, { "epoch": 1.7189699937466232, "learning_rate": 4.287343473372705e-06, "loss": 2.4392051696777344, "step": 1424600 }, { "epoch": 1.719090657069106, "learning_rate": 4.286939637904967e-06, "loss": 2.447232208251953, "step": 1424700 }, { "epoch": 1.7192113203915886, "learning_rate": 4.286535802437229e-06, "loss": 2.468992919921875, "step": 1424800 }, { "epoch": 1.7193319837140715, "learning_rate": 4.28613196696949e-06, "loss": 2.435649871826172, "step": 1424900 }, { "epoch": 1.719452647036554, "learning_rate": 4.285728131501751e-06, "loss": 2.4349163818359374, "step": 1425000 }, { "epoch": 1.7195733103590367, "learning_rate": 4.285324296034013e-06, "loss": 2.4513786315917967, "step": 1425100 }, { "epoch": 1.7196939736815193, "learning_rate": 4.284920460566275e-06, "loss": 2.452004241943359, "step": 1425200 }, { "epoch": 1.719814637004002, "learning_rate": 4.284516625098536e-06, "loss": 2.4682057189941404, "step": 1425300 }, { "epoch": 1.7199353003264848, "learning_rate": 4.284112789630798e-06, "loss": 2.459585876464844, "step": 1425400 }, { "epoch": 1.7200559636489676, "learning_rate": 4.283708954163059e-06, "loss": 2.4439155578613283, "step": 1425500 }, { "epoch": 1.7201766269714502, "learning_rate": 4.283305118695321e-06, "loss": 2.4548130798339844, "step": 1425600 }, { "epoch": 1.7202972902939329, "learning_rate": 4.282901283227582e-06, "loss": 2.4804095458984374, "step": 1425700 }, { "epoch": 1.7204179536164155, "learning_rate": 4.282497447759844e-06, "loss": 2.4513093566894533, "step": 1425800 }, { "epoch": 1.720538616938898, "learning_rate": 4.282093612292106e-06, "loss": 2.4447430419921874, "step": 1425900 }, { "epoch": 1.720659280261381, "learning_rate": 4.281689776824367e-06, "loss": 2.4592250061035155, "step": 1426000 }, { "epoch": 1.7207799435838635, "learning_rate": 4.281285941356629e-06, "loss": 2.4734060668945315, "step": 1426100 }, { "epoch": 1.7209006069063464, "learning_rate": 4.2808821058888905e-06, "loss": 2.4483033752441408, "step": 1426200 }, { "epoch": 1.721021270228829, "learning_rate": 4.2804782704211525e-06, "loss": 2.4560675048828124, "step": 1426300 }, { "epoch": 1.7211419335513116, "learning_rate": 4.280074434953414e-06, "loss": 2.45740234375, "step": 1426400 }, { "epoch": 1.7212625968737942, "learning_rate": 4.279670599485676e-06, "loss": 2.480850830078125, "step": 1426500 }, { "epoch": 1.7213832601962769, "learning_rate": 4.279266764017937e-06, "loss": 2.4785345458984374, "step": 1426600 }, { "epoch": 1.7215039235187597, "learning_rate": 4.278862928550199e-06, "loss": 2.4621124267578125, "step": 1426700 }, { "epoch": 1.7216245868412423, "learning_rate": 4.278459093082461e-06, "loss": 2.454661560058594, "step": 1426800 }, { "epoch": 1.7217452501637251, "learning_rate": 4.278055257614722e-06, "loss": 2.4434617614746093, "step": 1426900 }, { "epoch": 1.7218659134862078, "learning_rate": 4.277651422146983e-06, "loss": 2.462125091552734, "step": 1427000 }, { "epoch": 1.7219865768086904, "learning_rate": 4.277247586679245e-06, "loss": 2.428485565185547, "step": 1427100 }, { "epoch": 1.722107240131173, "learning_rate": 4.276843751211507e-06, "loss": 2.4575985717773436, "step": 1427200 }, { "epoch": 1.7222279034536556, "learning_rate": 4.276439915743769e-06, "loss": 2.4635618591308592, "step": 1427300 }, { "epoch": 1.7223485667761385, "learning_rate": 4.27603608027603e-06, "loss": 2.451738128662109, "step": 1427400 }, { "epoch": 1.7224692300986213, "learning_rate": 4.275632244808291e-06, "loss": 2.439983215332031, "step": 1427500 }, { "epoch": 1.722589893421104, "learning_rate": 4.275228409340553e-06, "loss": 2.4679270935058595, "step": 1427600 }, { "epoch": 1.7227105567435865, "learning_rate": 4.274824573872815e-06, "loss": 2.445944061279297, "step": 1427700 }, { "epoch": 1.7228312200660691, "learning_rate": 4.274420738405076e-06, "loss": 2.466095275878906, "step": 1427800 }, { "epoch": 1.7229518833885518, "learning_rate": 4.274016902937338e-06, "loss": 2.4360365295410156, "step": 1427900 }, { "epoch": 1.7230725467110346, "learning_rate": 4.273613067469599e-06, "loss": 2.4559567260742186, "step": 1428000 }, { "epoch": 1.7231932100335172, "learning_rate": 4.273209232001861e-06, "loss": 2.4446986389160155, "step": 1428100 }, { "epoch": 1.723313873356, "learning_rate": 4.2728053965341225e-06, "loss": 2.464984588623047, "step": 1428200 }, { "epoch": 1.7234345366784827, "learning_rate": 4.2724015610663845e-06, "loss": 2.4413130187988283, "step": 1428300 }, { "epoch": 1.7235552000009653, "learning_rate": 4.2719977255986465e-06, "loss": 2.4900750732421875, "step": 1428400 }, { "epoch": 1.723675863323448, "learning_rate": 4.271593890130908e-06, "loss": 2.4506466674804686, "step": 1428500 }, { "epoch": 1.7237965266459305, "learning_rate": 4.271190054663169e-06, "loss": 2.454071807861328, "step": 1428600 }, { "epoch": 1.7239171899684134, "learning_rate": 4.270786219195431e-06, "loss": 2.459359130859375, "step": 1428700 }, { "epoch": 1.7240378532908962, "learning_rate": 4.270382383727693e-06, "loss": 2.448263702392578, "step": 1428800 }, { "epoch": 1.7241585166133788, "learning_rate": 4.269978548259954e-06, "loss": 2.472448272705078, "step": 1428900 }, { "epoch": 1.7242791799358614, "learning_rate": 4.269574712792216e-06, "loss": 2.4514315795898436, "step": 1429000 }, { "epoch": 1.724399843258344, "learning_rate": 4.269170877324477e-06, "loss": 2.452711639404297, "step": 1429100 }, { "epoch": 1.7245205065808267, "learning_rate": 4.268767041856739e-06, "loss": 2.4689509582519533, "step": 1429200 }, { "epoch": 1.7246411699033095, "learning_rate": 4.268363206389001e-06, "loss": 2.443165130615234, "step": 1429300 }, { "epoch": 1.7247618332257921, "learning_rate": 4.267959370921262e-06, "loss": 2.4795712280273436, "step": 1429400 }, { "epoch": 1.724882496548275, "learning_rate": 4.267555535453523e-06, "loss": 2.4581544494628904, "step": 1429500 }, { "epoch": 1.7250031598707576, "learning_rate": 4.267151699985785e-06, "loss": 2.4733956909179686, "step": 1429600 }, { "epoch": 1.7251238231932402, "learning_rate": 4.266747864518047e-06, "loss": 2.4782472229003907, "step": 1429700 }, { "epoch": 1.7252444865157228, "learning_rate": 4.266344029050308e-06, "loss": 2.447456970214844, "step": 1429800 }, { "epoch": 1.7253651498382054, "learning_rate": 4.26594019358257e-06, "loss": 2.4431700134277343, "step": 1429900 }, { "epoch": 1.7254858131606883, "learning_rate": 4.2655363581148314e-06, "loss": 2.4718313598632813, "step": 1430000 }, { "epoch": 1.725606476483171, "learning_rate": 4.2651325226470934e-06, "loss": 2.454475860595703, "step": 1430100 }, { "epoch": 1.7257271398056537, "learning_rate": 4.2647286871793546e-06, "loss": 2.478595886230469, "step": 1430200 }, { "epoch": 1.7258478031281363, "learning_rate": 4.2643248517116165e-06, "loss": 2.469319305419922, "step": 1430300 }, { "epoch": 1.725968466450619, "learning_rate": 4.2639210162438785e-06, "loss": 2.4608973693847656, "step": 1430400 }, { "epoch": 1.7260891297731016, "learning_rate": 4.26351718077614e-06, "loss": 2.4300265502929688, "step": 1430500 }, { "epoch": 1.7262097930955842, "learning_rate": 4.263113345308401e-06, "loss": 2.480887451171875, "step": 1430600 }, { "epoch": 1.726330456418067, "learning_rate": 4.262709509840663e-06, "loss": 2.4691848754882812, "step": 1430700 }, { "epoch": 1.7264511197405499, "learning_rate": 4.262305674372925e-06, "loss": 2.4447784423828125, "step": 1430800 }, { "epoch": 1.7265717830630325, "learning_rate": 4.261901838905187e-06, "loss": 2.4314222717285157, "step": 1430900 }, { "epoch": 1.7266924463855151, "learning_rate": 4.261498003437448e-06, "loss": 2.466854248046875, "step": 1431000 }, { "epoch": 1.7268131097079977, "learning_rate": 4.261094167969709e-06, "loss": 2.4472724914550783, "step": 1431100 }, { "epoch": 1.7269337730304803, "learning_rate": 4.260690332501971e-06, "loss": 2.4680690002441406, "step": 1431200 }, { "epoch": 1.7270544363529632, "learning_rate": 4.260286497034233e-06, "loss": 2.4413320922851565, "step": 1431300 }, { "epoch": 1.7271750996754458, "learning_rate": 4.259882661566495e-06, "loss": 2.435862579345703, "step": 1431400 }, { "epoch": 1.7272957629979286, "learning_rate": 4.259478826098756e-06, "loss": 2.5009164428710937, "step": 1431500 }, { "epoch": 1.7274164263204113, "learning_rate": 4.259074990631017e-06, "loss": 2.4416905212402344, "step": 1431600 }, { "epoch": 1.7275370896428939, "learning_rate": 4.258671155163279e-06, "loss": 2.442776947021484, "step": 1431700 }, { "epoch": 1.7276577529653765, "learning_rate": 4.258267319695541e-06, "loss": 2.4487429809570314, "step": 1431800 }, { "epoch": 1.727778416287859, "learning_rate": 4.257863484227802e-06, "loss": 2.433859100341797, "step": 1431900 }, { "epoch": 1.727899079610342, "learning_rate": 4.257459648760064e-06, "loss": 2.4479495239257814, "step": 1432000 }, { "epoch": 1.7280197429328246, "learning_rate": 4.2570558132923255e-06, "loss": 2.452184600830078, "step": 1432100 }, { "epoch": 1.7281404062553074, "learning_rate": 4.2566519778245874e-06, "loss": 2.4425032043457033, "step": 1432200 }, { "epoch": 1.72826106957779, "learning_rate": 4.2562481423568486e-06, "loss": 2.4715644836425783, "step": 1432300 }, { "epoch": 1.7283817329002726, "learning_rate": 4.2558443068891106e-06, "loss": 2.4621253967285157, "step": 1432400 }, { "epoch": 1.7285023962227553, "learning_rate": 4.255440471421372e-06, "loss": 2.462028045654297, "step": 1432500 }, { "epoch": 1.7286230595452379, "learning_rate": 4.255036635953634e-06, "loss": 2.440351867675781, "step": 1432600 }, { "epoch": 1.7287437228677207, "learning_rate": 4.254632800485895e-06, "loss": 2.4510243225097654, "step": 1432700 }, { "epoch": 1.7288643861902036, "learning_rate": 4.254228965018157e-06, "loss": 2.474739532470703, "step": 1432800 }, { "epoch": 1.7289850495126862, "learning_rate": 4.253825129550419e-06, "loss": 2.443905944824219, "step": 1432900 }, { "epoch": 1.7291057128351688, "learning_rate": 4.25342129408268e-06, "loss": 2.456468505859375, "step": 1433000 }, { "epoch": 1.7292263761576514, "learning_rate": 4.253017458614941e-06, "loss": 2.4440863037109377, "step": 1433100 }, { "epoch": 1.729347039480134, "learning_rate": 4.252613623147203e-06, "loss": 2.446444549560547, "step": 1433200 }, { "epoch": 1.7294677028026169, "learning_rate": 4.252209787679465e-06, "loss": 2.4649726867675783, "step": 1433300 }, { "epoch": 1.7295883661250995, "learning_rate": 4.251805952211727e-06, "loss": 2.4503271484375, "step": 1433400 }, { "epoch": 1.7297090294475823, "learning_rate": 4.251402116743988e-06, "loss": 2.4614553833007813, "step": 1433500 }, { "epoch": 1.729829692770065, "learning_rate": 4.250998281276249e-06, "loss": 2.459522247314453, "step": 1433600 }, { "epoch": 1.7299503560925475, "learning_rate": 4.250594445808511e-06, "loss": 2.450545349121094, "step": 1433700 }, { "epoch": 1.7300710194150302, "learning_rate": 4.250190610340773e-06, "loss": 2.462236022949219, "step": 1433800 }, { "epoch": 1.7301916827375128, "learning_rate": 4.249786774873034e-06, "loss": 2.443225860595703, "step": 1433900 }, { "epoch": 1.7303123460599956, "learning_rate": 4.249382939405296e-06, "loss": 2.4578517150878905, "step": 1434000 }, { "epoch": 1.7304330093824785, "learning_rate": 4.2489791039375575e-06, "loss": 2.4503306579589843, "step": 1434100 }, { "epoch": 1.730553672704961, "learning_rate": 4.2485752684698195e-06, "loss": 2.443765106201172, "step": 1434200 }, { "epoch": 1.7306743360274437, "learning_rate": 4.248171433002081e-06, "loss": 2.4336207580566405, "step": 1434300 }, { "epoch": 1.7307949993499263, "learning_rate": 4.247767597534343e-06, "loss": 2.432628631591797, "step": 1434400 }, { "epoch": 1.730915662672409, "learning_rate": 4.2473637620666046e-06, "loss": 2.4393489074707033, "step": 1434500 }, { "epoch": 1.7310363259948918, "learning_rate": 4.246959926598866e-06, "loss": 2.468385925292969, "step": 1434600 }, { "epoch": 1.7311569893173744, "learning_rate": 4.246556091131127e-06, "loss": 2.437866668701172, "step": 1434700 }, { "epoch": 1.7312776526398572, "learning_rate": 4.246152255663389e-06, "loss": 2.452320861816406, "step": 1434800 }, { "epoch": 1.7313983159623398, "learning_rate": 4.245748420195651e-06, "loss": 2.432740020751953, "step": 1434900 }, { "epoch": 1.7315189792848225, "learning_rate": 4.245344584727912e-06, "loss": 2.4324163818359374, "step": 1435000 }, { "epoch": 1.731639642607305, "learning_rate": 4.244940749260174e-06, "loss": 2.446977233886719, "step": 1435100 }, { "epoch": 1.7317603059297877, "learning_rate": 4.244536913792435e-06, "loss": 2.4590632629394533, "step": 1435200 }, { "epoch": 1.7318809692522705, "learning_rate": 4.244133078324697e-06, "loss": 2.4502879333496095, "step": 1435300 }, { "epoch": 1.7320016325747531, "learning_rate": 4.243729242856959e-06, "loss": 2.4432020568847657, "step": 1435400 }, { "epoch": 1.732122295897236, "learning_rate": 4.24332540738922e-06, "loss": 2.470781707763672, "step": 1435500 }, { "epoch": 1.7322429592197186, "learning_rate": 4.242921571921481e-06, "loss": 2.4372621154785157, "step": 1435600 }, { "epoch": 1.7323636225422012, "learning_rate": 4.242517736453743e-06, "loss": 2.475233612060547, "step": 1435700 }, { "epoch": 1.7324842858646838, "learning_rate": 4.242113900986005e-06, "loss": 2.4657159423828126, "step": 1435800 }, { "epoch": 1.7326049491871665, "learning_rate": 4.241710065518266e-06, "loss": 2.4398989868164063, "step": 1435900 }, { "epoch": 1.7327256125096493, "learning_rate": 4.241306230050528e-06, "loss": 2.4546075439453126, "step": 1436000 }, { "epoch": 1.7328462758321321, "learning_rate": 4.2409023945827895e-06, "loss": 2.445654296875, "step": 1436100 }, { "epoch": 1.7329669391546147, "learning_rate": 4.2404985591150515e-06, "loss": 2.4454295349121096, "step": 1436200 }, { "epoch": 1.7330876024770974, "learning_rate": 4.2400947236473135e-06, "loss": 2.4538336181640625, "step": 1436300 }, { "epoch": 1.73320826579958, "learning_rate": 4.239690888179575e-06, "loss": 2.444945526123047, "step": 1436400 }, { "epoch": 1.7333289291220626, "learning_rate": 4.239287052711837e-06, "loss": 2.4484303283691404, "step": 1436500 }, { "epoch": 1.7334495924445454, "learning_rate": 4.238883217244098e-06, "loss": 2.467781677246094, "step": 1436600 }, { "epoch": 1.733570255767028, "learning_rate": 4.23847938177636e-06, "loss": 2.465759582519531, "step": 1436700 }, { "epoch": 1.733690919089511, "learning_rate": 4.238075546308621e-06, "loss": 2.4197264099121094, "step": 1436800 }, { "epoch": 1.7338115824119935, "learning_rate": 4.237671710840883e-06, "loss": 2.4449977111816406, "step": 1436900 }, { "epoch": 1.7339322457344761, "learning_rate": 4.237267875373145e-06, "loss": 2.4348851013183594, "step": 1437000 }, { "epoch": 1.7340529090569587, "learning_rate": 4.236864039905406e-06, "loss": 2.4533042907714844, "step": 1437100 }, { "epoch": 1.7341735723794414, "learning_rate": 4.236460204437667e-06, "loss": 2.4522474670410155, "step": 1437200 }, { "epoch": 1.7342942357019242, "learning_rate": 4.236056368969929e-06, "loss": 2.4613592529296877, "step": 1437300 }, { "epoch": 1.7344148990244068, "learning_rate": 4.235652533502191e-06, "loss": 2.453077697753906, "step": 1437400 }, { "epoch": 1.7345355623468897, "learning_rate": 4.235248698034452e-06, "loss": 2.4586087036132813, "step": 1437500 }, { "epoch": 1.7346562256693723, "learning_rate": 4.234844862566714e-06, "loss": 2.467371826171875, "step": 1437600 }, { "epoch": 1.734776888991855, "learning_rate": 4.234441027098975e-06, "loss": 2.435484619140625, "step": 1437700 }, { "epoch": 1.7348975523143375, "learning_rate": 4.234037191631237e-06, "loss": 2.4632489013671877, "step": 1437800 }, { "epoch": 1.7350182156368201, "learning_rate": 4.233633356163499e-06, "loss": 2.449290008544922, "step": 1437900 }, { "epoch": 1.735138878959303, "learning_rate": 4.23322952069576e-06, "loss": 2.4657278442382813, "step": 1438000 }, { "epoch": 1.7352595422817858, "learning_rate": 4.2328256852280215e-06, "loss": 2.4549249267578124, "step": 1438100 }, { "epoch": 1.7353802056042684, "learning_rate": 4.2324218497602835e-06, "loss": 2.4353955078125, "step": 1438200 }, { "epoch": 1.735500868926751, "learning_rate": 4.2320180142925455e-06, "loss": 2.439647216796875, "step": 1438300 }, { "epoch": 1.7356215322492337, "learning_rate": 4.231614178824807e-06, "loss": 2.437421875, "step": 1438400 }, { "epoch": 1.7357421955717163, "learning_rate": 4.231210343357069e-06, "loss": 2.4548655700683595, "step": 1438500 }, { "epoch": 1.7358628588941991, "learning_rate": 4.23080650788933e-06, "loss": 2.4668727111816406, "step": 1438600 }, { "epoch": 1.7359835222166817, "learning_rate": 4.230402672421592e-06, "loss": 2.4446701049804687, "step": 1438700 }, { "epoch": 1.7361041855391646, "learning_rate": 4.229998836953853e-06, "loss": 2.4357965087890623, "step": 1438800 }, { "epoch": 1.7362248488616472, "learning_rate": 4.229595001486115e-06, "loss": 2.4571324157714844, "step": 1438900 }, { "epoch": 1.7363455121841298, "learning_rate": 4.229191166018377e-06, "loss": 2.4273306274414064, "step": 1439000 }, { "epoch": 1.7364661755066124, "learning_rate": 4.228787330550638e-06, "loss": 2.475333709716797, "step": 1439100 }, { "epoch": 1.736586838829095, "learning_rate": 4.228383495082899e-06, "loss": 2.467706604003906, "step": 1439200 }, { "epoch": 1.7367075021515779, "learning_rate": 4.227979659615161e-06, "loss": 2.4377597045898436, "step": 1439300 }, { "epoch": 1.7368281654740607, "learning_rate": 4.227575824147423e-06, "loss": 2.4659104919433594, "step": 1439400 }, { "epoch": 1.7369488287965433, "learning_rate": 4.227171988679685e-06, "loss": 2.4269261169433594, "step": 1439500 }, { "epoch": 1.737069492119026, "learning_rate": 4.226768153211946e-06, "loss": 2.442207946777344, "step": 1439600 }, { "epoch": 1.7371901554415086, "learning_rate": 4.226364317744207e-06, "loss": 2.465635986328125, "step": 1439700 }, { "epoch": 1.7373108187639912, "learning_rate": 4.225960482276469e-06, "loss": 2.4350180053710937, "step": 1439800 }, { "epoch": 1.737431482086474, "learning_rate": 4.225556646808731e-06, "loss": 2.467001647949219, "step": 1439900 }, { "epoch": 1.7375521454089566, "learning_rate": 4.225152811340992e-06, "loss": 2.4444731140136717, "step": 1440000 }, { "epoch": 1.7376728087314395, "learning_rate": 4.224748975873254e-06, "loss": 2.4577627563476563, "step": 1440100 }, { "epoch": 1.737793472053922, "learning_rate": 4.2243451404055155e-06, "loss": 2.462845458984375, "step": 1440200 }, { "epoch": 1.7379141353764047, "learning_rate": 4.2239413049377775e-06, "loss": 2.4442007446289065, "step": 1440300 }, { "epoch": 1.7380347986988873, "learning_rate": 4.223537469470039e-06, "loss": 2.462033233642578, "step": 1440400 }, { "epoch": 1.73815546202137, "learning_rate": 4.223133634002301e-06, "loss": 2.459739532470703, "step": 1440500 }, { "epoch": 1.7382761253438528, "learning_rate": 4.222729798534563e-06, "loss": 2.4627882385253907, "step": 1440600 }, { "epoch": 1.7383967886663354, "learning_rate": 4.222325963066824e-06, "loss": 2.443592224121094, "step": 1440700 }, { "epoch": 1.7385174519888182, "learning_rate": 4.221922127599085e-06, "loss": 2.4532792663574217, "step": 1440800 }, { "epoch": 1.7386381153113009, "learning_rate": 4.221518292131347e-06, "loss": 2.4413302612304686, "step": 1440900 }, { "epoch": 1.7387587786337835, "learning_rate": 4.221114456663609e-06, "loss": 2.455344543457031, "step": 1441000 }, { "epoch": 1.738879441956266, "learning_rate": 4.22071062119587e-06, "loss": 2.4666375732421875, "step": 1441100 }, { "epoch": 1.7390001052787487, "learning_rate": 4.220306785728132e-06, "loss": 2.4354661560058593, "step": 1441200 }, { "epoch": 1.7391207686012315, "learning_rate": 4.219902950260393e-06, "loss": 2.4674713134765627, "step": 1441300 }, { "epoch": 1.7392414319237144, "learning_rate": 4.219499114792655e-06, "loss": 2.4577735900878905, "step": 1441400 }, { "epoch": 1.739362095246197, "learning_rate": 4.219095279324917e-06, "loss": 2.4473828125, "step": 1441500 }, { "epoch": 1.7394827585686796, "learning_rate": 4.218691443857178e-06, "loss": 2.469359893798828, "step": 1441600 }, { "epoch": 1.7396034218911622, "learning_rate": 4.218287608389439e-06, "loss": 2.454875793457031, "step": 1441700 }, { "epoch": 1.7397240852136449, "learning_rate": 4.217883772921701e-06, "loss": 2.4695123291015624, "step": 1441800 }, { "epoch": 1.7398447485361277, "learning_rate": 4.217479937453963e-06, "loss": 2.4799656677246094, "step": 1441900 }, { "epoch": 1.7399654118586103, "learning_rate": 4.217076101986225e-06, "loss": 2.440011291503906, "step": 1442000 }, { "epoch": 1.7400860751810932, "learning_rate": 4.2166722665184864e-06, "loss": 2.4556094360351564, "step": 1442100 }, { "epoch": 1.7402067385035758, "learning_rate": 4.2162684310507476e-06, "loss": 2.4658436584472656, "step": 1442200 }, { "epoch": 1.7403274018260584, "learning_rate": 4.2158645955830095e-06, "loss": 2.456149444580078, "step": 1442300 }, { "epoch": 1.740448065148541, "learning_rate": 4.2154607601152715e-06, "loss": 2.465057373046875, "step": 1442400 }, { "epoch": 1.7405687284710236, "learning_rate": 4.215056924647533e-06, "loss": 2.4474327087402346, "step": 1442500 }, { "epoch": 1.7406893917935065, "learning_rate": 4.214653089179795e-06, "loss": 2.4673283386230467, "step": 1442600 }, { "epoch": 1.740810055115989, "learning_rate": 4.214249253712056e-06, "loss": 2.4457264709472657, "step": 1442700 }, { "epoch": 1.740930718438472, "learning_rate": 4.213845418244318e-06, "loss": 2.444902191162109, "step": 1442800 }, { "epoch": 1.7410513817609545, "learning_rate": 4.213441582776579e-06, "loss": 2.446203308105469, "step": 1442900 }, { "epoch": 1.7411720450834371, "learning_rate": 4.213037747308841e-06, "loss": 2.4503912353515624, "step": 1443000 }, { "epoch": 1.7412927084059198, "learning_rate": 4.212633911841103e-06, "loss": 2.4440440368652343, "step": 1443100 }, { "epoch": 1.7414133717284024, "learning_rate": 4.212230076373364e-06, "loss": 2.4517253112792967, "step": 1443200 }, { "epoch": 1.7415340350508852, "learning_rate": 4.211826240905625e-06, "loss": 2.4473585510253906, "step": 1443300 }, { "epoch": 1.741654698373368, "learning_rate": 4.211422405437887e-06, "loss": 2.4535931396484374, "step": 1443400 }, { "epoch": 1.7417753616958507, "learning_rate": 4.211018569970149e-06, "loss": 2.483809814453125, "step": 1443500 }, { "epoch": 1.7418960250183333, "learning_rate": 4.21061473450241e-06, "loss": 2.456728668212891, "step": 1443600 }, { "epoch": 1.742016688340816, "learning_rate": 4.210210899034672e-06, "loss": 2.443207092285156, "step": 1443700 }, { "epoch": 1.7421373516632985, "learning_rate": 4.209807063566933e-06, "loss": 2.4241671752929688, "step": 1443800 }, { "epoch": 1.7422580149857814, "learning_rate": 4.209403228099195e-06, "loss": 2.4448361206054687, "step": 1443900 }, { "epoch": 1.742378678308264, "learning_rate": 4.208999392631457e-06, "loss": 2.4600344848632814, "step": 1444000 }, { "epoch": 1.7424993416307468, "learning_rate": 4.2085955571637185e-06, "loss": 2.4338880920410157, "step": 1444100 }, { "epoch": 1.7426200049532294, "learning_rate": 4.20819172169598e-06, "loss": 2.461671905517578, "step": 1444200 }, { "epoch": 1.742740668275712, "learning_rate": 4.2077878862282416e-06, "loss": 2.4627931213378904, "step": 1444300 }, { "epoch": 1.7428613315981947, "learning_rate": 4.2073840507605036e-06, "loss": 2.4557135009765627, "step": 1444400 }, { "epoch": 1.7429819949206773, "learning_rate": 4.206980215292765e-06, "loss": 2.4486178588867187, "step": 1444500 }, { "epoch": 1.7431026582431601, "learning_rate": 4.206576379825027e-06, "loss": 2.441414031982422, "step": 1444600 }, { "epoch": 1.743223321565643, "learning_rate": 4.206172544357288e-06, "loss": 2.481184234619141, "step": 1444700 }, { "epoch": 1.7433439848881256, "learning_rate": 4.20576870888955e-06, "loss": 2.47345458984375, "step": 1444800 }, { "epoch": 1.7434646482106082, "learning_rate": 4.205364873421811e-06, "loss": 2.4667037963867187, "step": 1444900 }, { "epoch": 1.7435853115330908, "learning_rate": 4.204961037954073e-06, "loss": 2.4250953674316404, "step": 1445000 }, { "epoch": 1.7437059748555734, "learning_rate": 4.204557202486335e-06, "loss": 2.455576171875, "step": 1445100 }, { "epoch": 1.7438266381780563, "learning_rate": 4.204153367018596e-06, "loss": 2.451578369140625, "step": 1445200 }, { "epoch": 1.743947301500539, "learning_rate": 4.203749531550857e-06, "loss": 2.440320587158203, "step": 1445300 }, { "epoch": 1.7440679648230217, "learning_rate": 4.203345696083119e-06, "loss": 2.438594970703125, "step": 1445400 }, { "epoch": 1.7441886281455043, "learning_rate": 4.202941860615381e-06, "loss": 2.456650848388672, "step": 1445500 }, { "epoch": 1.744309291467987, "learning_rate": 4.202538025147643e-06, "loss": 2.452764587402344, "step": 1445600 }, { "epoch": 1.7444299547904696, "learning_rate": 4.202134189679904e-06, "loss": 2.455768280029297, "step": 1445700 }, { "epoch": 1.7445506181129522, "learning_rate": 4.201730354212165e-06, "loss": 2.459086608886719, "step": 1445800 }, { "epoch": 1.744671281435435, "learning_rate": 4.201326518744427e-06, "loss": 2.471407470703125, "step": 1445900 }, { "epoch": 1.7447919447579177, "learning_rate": 4.200922683276689e-06, "loss": 2.475929412841797, "step": 1446000 }, { "epoch": 1.7449126080804005, "learning_rate": 4.2005188478089505e-06, "loss": 2.4512680053710936, "step": 1446100 }, { "epoch": 1.7450332714028831, "learning_rate": 4.2001150123412125e-06, "loss": 2.456535186767578, "step": 1446200 }, { "epoch": 1.7451539347253657, "learning_rate": 4.199711176873474e-06, "loss": 2.4477693176269533, "step": 1446300 }, { "epoch": 1.7452745980478483, "learning_rate": 4.199307341405736e-06, "loss": 2.4515032958984375, "step": 1446400 }, { "epoch": 1.745395261370331, "learning_rate": 4.1989035059379976e-06, "loss": 2.4402091979980467, "step": 1446500 }, { "epoch": 1.7455159246928138, "learning_rate": 4.198499670470259e-06, "loss": 2.447614898681641, "step": 1446600 }, { "epoch": 1.7456365880152966, "learning_rate": 4.198095835002521e-06, "loss": 2.4494503784179686, "step": 1446700 }, { "epoch": 1.7457572513377793, "learning_rate": 4.197691999534782e-06, "loss": 2.4573941040039062, "step": 1446800 }, { "epoch": 1.7458779146602619, "learning_rate": 4.197288164067044e-06, "loss": 2.4433990478515626, "step": 1446900 }, { "epoch": 1.7459985779827445, "learning_rate": 4.196884328599305e-06, "loss": 2.4418630981445313, "step": 1447000 }, { "epoch": 1.746119241305227, "learning_rate": 4.196480493131567e-06, "loss": 2.448921661376953, "step": 1447100 }, { "epoch": 1.74623990462771, "learning_rate": 4.196076657663828e-06, "loss": 2.4235121154785157, "step": 1447200 }, { "epoch": 1.7463605679501926, "learning_rate": 4.19567282219609e-06, "loss": 2.479075469970703, "step": 1447300 }, { "epoch": 1.7464812312726754, "learning_rate": 4.195268986728351e-06, "loss": 2.437937927246094, "step": 1447400 }, { "epoch": 1.746601894595158, "learning_rate": 4.194865151260613e-06, "loss": 2.4617457580566406, "step": 1447500 }, { "epoch": 1.7467225579176406, "learning_rate": 4.194461315792875e-06, "loss": 2.448914337158203, "step": 1447600 }, { "epoch": 1.7468432212401233, "learning_rate": 4.194057480325136e-06, "loss": 2.4513096618652344, "step": 1447700 }, { "epoch": 1.7469638845626059, "learning_rate": 4.193653644857397e-06, "loss": 2.462405090332031, "step": 1447800 }, { "epoch": 1.7470845478850887, "learning_rate": 4.193249809389659e-06, "loss": 2.453105773925781, "step": 1447900 }, { "epoch": 1.7472052112075713, "learning_rate": 4.192845973921921e-06, "loss": 2.4495468139648438, "step": 1448000 }, { "epoch": 1.7473258745300542, "learning_rate": 4.192442138454183e-06, "loss": 2.4301519775390625, "step": 1448100 }, { "epoch": 1.7474465378525368, "learning_rate": 4.1920383029864445e-06, "loss": 2.4436961364746095, "step": 1448200 }, { "epoch": 1.7475672011750194, "learning_rate": 4.191634467518706e-06, "loss": 2.4282196044921873, "step": 1448300 }, { "epoch": 1.747687864497502, "learning_rate": 4.191230632050968e-06, "loss": 2.4898001098632814, "step": 1448400 }, { "epoch": 1.7478085278199846, "learning_rate": 4.19082679658323e-06, "loss": 2.4553736877441406, "step": 1448500 }, { "epoch": 1.7479291911424675, "learning_rate": 4.190422961115491e-06, "loss": 2.453713226318359, "step": 1448600 }, { "epoch": 1.7480498544649503, "learning_rate": 4.190019125647753e-06, "loss": 2.4440901184082033, "step": 1448700 }, { "epoch": 1.748170517787433, "learning_rate": 4.189615290180014e-06, "loss": 2.4652606201171876, "step": 1448800 }, { "epoch": 1.7482911811099155, "learning_rate": 4.189211454712276e-06, "loss": 2.4759442138671877, "step": 1448900 }, { "epoch": 1.7484118444323982, "learning_rate": 4.188807619244537e-06, "loss": 2.445489959716797, "step": 1449000 }, { "epoch": 1.7485325077548808, "learning_rate": 4.188403783776799e-06, "loss": 2.4479779052734374, "step": 1449100 }, { "epoch": 1.7486531710773636, "learning_rate": 4.187999948309061e-06, "loss": 2.4417733764648437, "step": 1449200 }, { "epoch": 1.7487738343998462, "learning_rate": 4.187596112841322e-06, "loss": 2.428835754394531, "step": 1449300 }, { "epoch": 1.748894497722329, "learning_rate": 4.187192277373583e-06, "loss": 2.4607826232910157, "step": 1449400 }, { "epoch": 1.7490151610448117, "learning_rate": 4.186788441905845e-06, "loss": 2.4656610107421875, "step": 1449500 }, { "epoch": 1.7491358243672943, "learning_rate": 4.186384606438107e-06, "loss": 2.451822967529297, "step": 1449600 }, { "epoch": 1.749256487689777, "learning_rate": 4.185980770970368e-06, "loss": 2.4548960876464845, "step": 1449700 }, { "epoch": 1.7493771510122595, "learning_rate": 4.18557693550263e-06, "loss": 2.4443678283691406, "step": 1449800 }, { "epoch": 1.7494978143347424, "learning_rate": 4.185173100034891e-06, "loss": 2.4502694702148435, "step": 1449900 }, { "epoch": 1.7496184776572252, "learning_rate": 4.184769264567153e-06, "loss": 2.4719447326660156, "step": 1450000 }, { "epoch": 1.7497391409797078, "learning_rate": 4.184365429099415e-06, "loss": 2.451731872558594, "step": 1450100 }, { "epoch": 1.7498598043021905, "learning_rate": 4.1839615936316765e-06, "loss": 2.4688653564453125, "step": 1450200 }, { "epoch": 1.749980467624673, "learning_rate": 4.183557758163938e-06, "loss": 2.4577897644042968, "step": 1450300 }, { "epoch": 1.7501011309471557, "learning_rate": 4.1831539226962e-06, "loss": 2.44421875, "step": 1450400 }, { "epoch": 1.7502217942696385, "learning_rate": 4.182750087228462e-06, "loss": 2.4400479125976564, "step": 1450500 }, { "epoch": 1.7503424575921211, "learning_rate": 4.182346251760723e-06, "loss": 2.477150115966797, "step": 1450600 }, { "epoch": 1.750463120914604, "learning_rate": 4.181942416292985e-06, "loss": 2.448840789794922, "step": 1450700 }, { "epoch": 1.7505837842370866, "learning_rate": 4.181538580825246e-06, "loss": 2.433479461669922, "step": 1450800 }, { "epoch": 1.7507044475595692, "learning_rate": 4.181134745357508e-06, "loss": 2.4179742431640623, "step": 1450900 }, { "epoch": 1.7508251108820518, "learning_rate": 4.180730909889769e-06, "loss": 2.4387832641601563, "step": 1451000 }, { "epoch": 1.7509457742045345, "learning_rate": 4.180327074422031e-06, "loss": 2.4457302856445313, "step": 1451100 }, { "epoch": 1.7510664375270173, "learning_rate": 4.179923238954293e-06, "loss": 2.4592620849609377, "step": 1451200 }, { "epoch": 1.7511871008495, "learning_rate": 4.179519403486554e-06, "loss": 2.4624453735351564, "step": 1451300 }, { "epoch": 1.7513077641719828, "learning_rate": 4.179115568018815e-06, "loss": 2.4425189208984377, "step": 1451400 }, { "epoch": 1.7514284274944654, "learning_rate": 4.178711732551077e-06, "loss": 2.4546958923339846, "step": 1451500 }, { "epoch": 1.751549090816948, "learning_rate": 4.178307897083339e-06, "loss": 2.42515625, "step": 1451600 }, { "epoch": 1.7516697541394306, "learning_rate": 4.177904061615601e-06, "loss": 2.434808654785156, "step": 1451700 }, { "epoch": 1.7517904174619132, "learning_rate": 4.177500226147862e-06, "loss": 2.4510791015625, "step": 1451800 }, { "epoch": 1.751911080784396, "learning_rate": 4.1770963906801234e-06, "loss": 2.490755310058594, "step": 1451900 }, { "epoch": 1.752031744106879, "learning_rate": 4.176692555212385e-06, "loss": 2.4312457275390624, "step": 1452000 }, { "epoch": 1.7521524074293615, "learning_rate": 4.176288719744647e-06, "loss": 2.467334899902344, "step": 1452100 }, { "epoch": 1.7522730707518441, "learning_rate": 4.175884884276909e-06, "loss": 2.448651885986328, "step": 1452200 }, { "epoch": 1.7523937340743267, "learning_rate": 4.1754810488091705e-06, "loss": 2.4728089904785158, "step": 1452300 }, { "epoch": 1.7525143973968094, "learning_rate": 4.175077213341432e-06, "loss": 2.473879699707031, "step": 1452400 }, { "epoch": 1.7526350607192922, "learning_rate": 4.174673377873694e-06, "loss": 2.4316448974609375, "step": 1452500 }, { "epoch": 1.7527557240417748, "learning_rate": 4.174269542405956e-06, "loss": 2.483056640625, "step": 1452600 }, { "epoch": 1.7528763873642577, "learning_rate": 4.173865706938217e-06, "loss": 2.4408636474609375, "step": 1452700 }, { "epoch": 1.7529970506867403, "learning_rate": 4.173461871470479e-06, "loss": 2.4750164794921874, "step": 1452800 }, { "epoch": 1.753117714009223, "learning_rate": 4.17305803600274e-06, "loss": 2.4468647766113283, "step": 1452900 }, { "epoch": 1.7532383773317055, "learning_rate": 4.172654200535002e-06, "loss": 2.434295654296875, "step": 1453000 }, { "epoch": 1.7533590406541881, "learning_rate": 4.172250365067263e-06, "loss": 2.4388194274902344, "step": 1453100 }, { "epoch": 1.753479703976671, "learning_rate": 4.171846529599525e-06, "loss": 2.4358036804199217, "step": 1453200 }, { "epoch": 1.7536003672991536, "learning_rate": 4.171442694131786e-06, "loss": 2.447371520996094, "step": 1453300 }, { "epoch": 1.7537210306216364, "learning_rate": 4.171038858664048e-06, "loss": 2.4492727661132814, "step": 1453400 }, { "epoch": 1.753841693944119, "learning_rate": 4.170635023196309e-06, "loss": 2.450847625732422, "step": 1453500 }, { "epoch": 1.7539623572666017, "learning_rate": 4.170231187728571e-06, "loss": 2.4515321350097654, "step": 1453600 }, { "epoch": 1.7540830205890843, "learning_rate": 4.169827352260833e-06, "loss": 2.4363468933105468, "step": 1453700 }, { "epoch": 1.754203683911567, "learning_rate": 4.169423516793094e-06, "loss": 2.4602392578125, "step": 1453800 }, { "epoch": 1.7543243472340497, "learning_rate": 4.1690196813253555e-06, "loss": 2.457816314697266, "step": 1453900 }, { "epoch": 1.7544450105565326, "learning_rate": 4.1686158458576174e-06, "loss": 2.454054107666016, "step": 1454000 }, { "epoch": 1.7545656738790152, "learning_rate": 4.1682120103898794e-06, "loss": 2.4525804138183593, "step": 1454100 }, { "epoch": 1.7546863372014978, "learning_rate": 4.167808174922141e-06, "loss": 2.4516201782226563, "step": 1454200 }, { "epoch": 1.7548070005239804, "learning_rate": 4.1674043394544025e-06, "loss": 2.468533477783203, "step": 1454300 }, { "epoch": 1.754927663846463, "learning_rate": 4.167000503986664e-06, "loss": 2.452334289550781, "step": 1454400 }, { "epoch": 1.7550483271689459, "learning_rate": 4.166596668518926e-06, "loss": 2.459422607421875, "step": 1454500 }, { "epoch": 1.7551689904914285, "learning_rate": 4.166192833051188e-06, "loss": 2.4524635314941405, "step": 1454600 }, { "epoch": 1.7552896538139113, "learning_rate": 4.165788997583449e-06, "loss": 2.4446160888671873, "step": 1454700 }, { "epoch": 1.755410317136394, "learning_rate": 4.165385162115711e-06, "loss": 2.446081085205078, "step": 1454800 }, { "epoch": 1.7555309804588766, "learning_rate": 4.164981326647972e-06, "loss": 2.4387136840820314, "step": 1454900 }, { "epoch": 1.7556516437813592, "learning_rate": 4.164577491180234e-06, "loss": 2.433668365478516, "step": 1455000 }, { "epoch": 1.7557723071038418, "learning_rate": 4.164173655712495e-06, "loss": 2.4704574584960937, "step": 1455100 }, { "epoch": 1.7558929704263246, "learning_rate": 4.163769820244757e-06, "loss": 2.4603402709960935, "step": 1455200 }, { "epoch": 1.7560136337488075, "learning_rate": 4.163365984777019e-06, "loss": 2.4610307312011717, "step": 1455300 }, { "epoch": 1.75613429707129, "learning_rate": 4.16296214930928e-06, "loss": 2.4322174072265623, "step": 1455400 }, { "epoch": 1.7562549603937727, "learning_rate": 4.162558313841541e-06, "loss": 2.4803703308105467, "step": 1455500 }, { "epoch": 1.7563756237162553, "learning_rate": 4.162154478373803e-06, "loss": 2.430511779785156, "step": 1455600 }, { "epoch": 1.756496287038738, "learning_rate": 4.161750642906065e-06, "loss": 2.4179145812988283, "step": 1455700 }, { "epoch": 1.7566169503612208, "learning_rate": 4.161346807438326e-06, "loss": 2.4296246337890626, "step": 1455800 }, { "epoch": 1.7567376136837034, "learning_rate": 4.160942971970588e-06, "loss": 2.477928009033203, "step": 1455900 }, { "epoch": 1.7568582770061862, "learning_rate": 4.1605391365028495e-06, "loss": 2.4436122131347657, "step": 1456000 }, { "epoch": 1.7569789403286689, "learning_rate": 4.1601353010351115e-06, "loss": 2.460650634765625, "step": 1456100 }, { "epoch": 1.7570996036511515, "learning_rate": 4.1597314655673734e-06, "loss": 2.4588714599609376, "step": 1456200 }, { "epoch": 1.757220266973634, "learning_rate": 4.1593276300996346e-06, "loss": 2.4743116760253905, "step": 1456300 }, { "epoch": 1.7573409302961167, "learning_rate": 4.158923794631896e-06, "loss": 2.444996032714844, "step": 1456400 }, { "epoch": 1.7574615936185995, "learning_rate": 4.158519959164158e-06, "loss": 2.4540472412109375, "step": 1456500 }, { "epoch": 1.7575822569410822, "learning_rate": 4.15811612369642e-06, "loss": 2.433010711669922, "step": 1456600 }, { "epoch": 1.757702920263565, "learning_rate": 4.157712288228681e-06, "loss": 2.450936737060547, "step": 1456700 }, { "epoch": 1.7578235835860476, "learning_rate": 4.157308452760943e-06, "loss": 2.4614334106445312, "step": 1456800 }, { "epoch": 1.7579442469085302, "learning_rate": 4.156904617293204e-06, "loss": 2.444671630859375, "step": 1456900 }, { "epoch": 1.7580649102310129, "learning_rate": 4.156500781825466e-06, "loss": 2.4537840270996094, "step": 1457000 }, { "epoch": 1.7581855735534955, "learning_rate": 4.156096946357728e-06, "loss": 2.4519993591308595, "step": 1457100 }, { "epoch": 1.7583062368759783, "learning_rate": 4.155693110889989e-06, "loss": 2.425428466796875, "step": 1457200 }, { "epoch": 1.7584269001984612, "learning_rate": 4.155289275422251e-06, "loss": 2.471696319580078, "step": 1457300 }, { "epoch": 1.7585475635209438, "learning_rate": 4.154885439954512e-06, "loss": 2.4697917175292967, "step": 1457400 }, { "epoch": 1.7586682268434264, "learning_rate": 4.154481604486774e-06, "loss": 2.451402282714844, "step": 1457500 }, { "epoch": 1.758788890165909, "learning_rate": 4.154077769019035e-06, "loss": 2.4486643981933596, "step": 1457600 }, { "epoch": 1.7589095534883916, "learning_rate": 4.153673933551297e-06, "loss": 2.4387135314941406, "step": 1457700 }, { "epoch": 1.7590302168108745, "learning_rate": 4.153270098083559e-06, "loss": 2.4580349731445312, "step": 1457800 }, { "epoch": 1.759150880133357, "learning_rate": 4.15286626261582e-06, "loss": 2.4669180297851563, "step": 1457900 }, { "epoch": 1.75927154345584, "learning_rate": 4.1524624271480815e-06, "loss": 2.467898712158203, "step": 1458000 }, { "epoch": 1.7593922067783225, "learning_rate": 4.1520585916803435e-06, "loss": 2.449137725830078, "step": 1458100 }, { "epoch": 1.7595128701008051, "learning_rate": 4.1516547562126055e-06, "loss": 2.4529379272460936, "step": 1458200 }, { "epoch": 1.7596335334232878, "learning_rate": 4.151250920744867e-06, "loss": 2.459619903564453, "step": 1458300 }, { "epoch": 1.7597541967457704, "learning_rate": 4.150847085277129e-06, "loss": 2.4203117370605467, "step": 1458400 }, { "epoch": 1.7598748600682532, "learning_rate": 4.15044324980939e-06, "loss": 2.447078857421875, "step": 1458500 }, { "epoch": 1.7599955233907358, "learning_rate": 4.150039414341652e-06, "loss": 2.4451129150390627, "step": 1458600 }, { "epoch": 1.7601161867132187, "learning_rate": 4.149635578873914e-06, "loss": 2.4610499572753906, "step": 1458700 }, { "epoch": 1.7602368500357013, "learning_rate": 4.149231743406175e-06, "loss": 2.446664276123047, "step": 1458800 }, { "epoch": 1.760357513358184, "learning_rate": 4.148827907938436e-06, "loss": 2.4385853576660157, "step": 1458900 }, { "epoch": 1.7604781766806665, "learning_rate": 4.148424072470698e-06, "loss": 2.4368209838867188, "step": 1459000 }, { "epoch": 1.7605988400031494, "learning_rate": 4.14802023700296e-06, "loss": 2.445052185058594, "step": 1459100 }, { "epoch": 1.760719503325632, "learning_rate": 4.147616401535221e-06, "loss": 2.4588088989257812, "step": 1459200 }, { "epoch": 1.7608401666481148, "learning_rate": 4.147212566067483e-06, "loss": 2.443124542236328, "step": 1459300 }, { "epoch": 1.7609608299705974, "learning_rate": 4.146808730599744e-06, "loss": 2.4564892578125, "step": 1459400 }, { "epoch": 1.76108149329308, "learning_rate": 4.146404895132006e-06, "loss": 2.4475897216796874, "step": 1459500 }, { "epoch": 1.7612021566155627, "learning_rate": 4.146001059664267e-06, "loss": 2.450835723876953, "step": 1459600 }, { "epoch": 1.7613228199380453, "learning_rate": 4.145597224196529e-06, "loss": 2.449481201171875, "step": 1459700 }, { "epoch": 1.7614434832605281, "learning_rate": 4.145193388728791e-06, "loss": 2.452776336669922, "step": 1459800 }, { "epoch": 1.7615641465830107, "learning_rate": 4.144789553261052e-06, "loss": 2.463035888671875, "step": 1459900 }, { "epoch": 1.7616848099054936, "learning_rate": 4.1443857177933135e-06, "loss": 2.4576077270507812, "step": 1460000 }, { "epoch": 1.7618054732279762, "learning_rate": 4.1439818823255755e-06, "loss": 2.451501770019531, "step": 1460100 }, { "epoch": 1.7619261365504588, "learning_rate": 4.1435780468578375e-06, "loss": 2.4637498474121093, "step": 1460200 }, { "epoch": 1.7620467998729414, "learning_rate": 4.1431742113900995e-06, "loss": 2.455750732421875, "step": 1460300 }, { "epoch": 1.762167463195424, "learning_rate": 4.142770375922361e-06, "loss": 2.447948760986328, "step": 1460400 }, { "epoch": 1.762288126517907, "learning_rate": 4.142366540454622e-06, "loss": 2.460954437255859, "step": 1460500 }, { "epoch": 1.7624087898403897, "learning_rate": 4.141962704986884e-06, "loss": 2.445069580078125, "step": 1460600 }, { "epoch": 1.7625294531628724, "learning_rate": 4.141558869519146e-06, "loss": 2.4260377502441406, "step": 1460700 }, { "epoch": 1.762650116485355, "learning_rate": 4.141155034051407e-06, "loss": 2.4652005004882813, "step": 1460800 }, { "epoch": 1.7627707798078376, "learning_rate": 4.140751198583669e-06, "loss": 2.4501487731933596, "step": 1460900 }, { "epoch": 1.7628914431303202, "learning_rate": 4.14034736311593e-06, "loss": 2.464688568115234, "step": 1461000 }, { "epoch": 1.763012106452803, "learning_rate": 4.139943527648192e-06, "loss": 2.4588011169433592, "step": 1461100 }, { "epoch": 1.7631327697752857, "learning_rate": 4.139539692180453e-06, "loss": 2.443406677246094, "step": 1461200 }, { "epoch": 1.7632534330977685, "learning_rate": 4.139135856712715e-06, "loss": 2.444646911621094, "step": 1461300 }, { "epoch": 1.7633740964202511, "learning_rate": 4.138732021244977e-06, "loss": 2.467859191894531, "step": 1461400 }, { "epoch": 1.7634947597427337, "learning_rate": 4.138328185777238e-06, "loss": 2.4532330322265623, "step": 1461500 }, { "epoch": 1.7636154230652163, "learning_rate": 4.137924350309499e-06, "loss": 2.4431317138671873, "step": 1461600 }, { "epoch": 1.763736086387699, "learning_rate": 4.137520514841761e-06, "loss": 2.4391690063476563, "step": 1461700 }, { "epoch": 1.7638567497101818, "learning_rate": 4.137116679374023e-06, "loss": 2.4641044616699217, "step": 1461800 }, { "epoch": 1.7639774130326644, "learning_rate": 4.136712843906284e-06, "loss": 2.4569664001464844, "step": 1461900 }, { "epoch": 1.7640980763551473, "learning_rate": 4.136309008438546e-06, "loss": 2.468247528076172, "step": 1462000 }, { "epoch": 1.7642187396776299, "learning_rate": 4.1359051729708075e-06, "loss": 2.444638366699219, "step": 1462100 }, { "epoch": 1.7643394030001125, "learning_rate": 4.1355013375030695e-06, "loss": 2.4491552734375, "step": 1462200 }, { "epoch": 1.764460066322595, "learning_rate": 4.1350975020353315e-06, "loss": 2.448392333984375, "step": 1462300 }, { "epoch": 1.7645807296450777, "learning_rate": 4.134693666567593e-06, "loss": 2.460723419189453, "step": 1462400 }, { "epoch": 1.7647013929675606, "learning_rate": 4.134289831099854e-06, "loss": 2.4347523498535155, "step": 1462500 }, { "epoch": 1.7648220562900434, "learning_rate": 4.133885995632116e-06, "loss": 2.427534942626953, "step": 1462600 }, { "epoch": 1.764942719612526, "learning_rate": 4.133482160164378e-06, "loss": 2.4708685302734374, "step": 1462700 }, { "epoch": 1.7650633829350086, "learning_rate": 4.13307832469664e-06, "loss": 2.430387420654297, "step": 1462800 }, { "epoch": 1.7651840462574913, "learning_rate": 4.132674489228901e-06, "loss": 2.443386688232422, "step": 1462900 }, { "epoch": 1.7653047095799739, "learning_rate": 4.132270653761162e-06, "loss": 2.428345031738281, "step": 1463000 }, { "epoch": 1.7654253729024567, "learning_rate": 4.131866818293424e-06, "loss": 2.4434640502929685, "step": 1463100 }, { "epoch": 1.7655460362249393, "learning_rate": 4.131462982825686e-06, "loss": 2.4476438903808595, "step": 1463200 }, { "epoch": 1.7656666995474222, "learning_rate": 4.131059147357947e-06, "loss": 2.459664001464844, "step": 1463300 }, { "epoch": 1.7657873628699048, "learning_rate": 4.130655311890209e-06, "loss": 2.4667422485351564, "step": 1463400 }, { "epoch": 1.7659080261923874, "learning_rate": 4.13025147642247e-06, "loss": 2.440598449707031, "step": 1463500 }, { "epoch": 1.76602868951487, "learning_rate": 4.129847640954732e-06, "loss": 2.4464202880859376, "step": 1463600 }, { "epoch": 1.7661493528373526, "learning_rate": 4.129443805486993e-06, "loss": 2.4687269592285155, "step": 1463700 }, { "epoch": 1.7662700161598355, "learning_rate": 4.129039970019255e-06, "loss": 2.431986846923828, "step": 1463800 }, { "epoch": 1.766390679482318, "learning_rate": 4.128636134551517e-06, "loss": 2.467257080078125, "step": 1463900 }, { "epoch": 1.766511342804801, "learning_rate": 4.1282322990837784e-06, "loss": 2.4590220642089844, "step": 1464000 }, { "epoch": 1.7666320061272835, "learning_rate": 4.1278284636160396e-06, "loss": 2.440726318359375, "step": 1464100 }, { "epoch": 1.7667526694497662, "learning_rate": 4.1274246281483015e-06, "loss": 2.45483154296875, "step": 1464200 }, { "epoch": 1.7668733327722488, "learning_rate": 4.1270207926805635e-06, "loss": 2.449778594970703, "step": 1464300 }, { "epoch": 1.7669939960947316, "learning_rate": 4.126616957212825e-06, "loss": 2.463576202392578, "step": 1464400 }, { "epoch": 1.7671146594172142, "learning_rate": 4.126213121745087e-06, "loss": 2.43283447265625, "step": 1464500 }, { "epoch": 1.767235322739697, "learning_rate": 4.125809286277348e-06, "loss": 2.4355757141113283, "step": 1464600 }, { "epoch": 1.7673559860621797, "learning_rate": 4.12540545080961e-06, "loss": 2.412879638671875, "step": 1464700 }, { "epoch": 1.7674766493846623, "learning_rate": 4.125001615341872e-06, "loss": 2.4496116638183594, "step": 1464800 }, { "epoch": 1.767597312707145, "learning_rate": 4.124597779874133e-06, "loss": 2.44083740234375, "step": 1464900 }, { "epoch": 1.7677179760296275, "learning_rate": 4.124193944406394e-06, "loss": 2.4376150512695314, "step": 1465000 }, { "epoch": 1.7678386393521104, "learning_rate": 4.123790108938656e-06, "loss": 2.437028350830078, "step": 1465100 }, { "epoch": 1.767959302674593, "learning_rate": 4.123386273470918e-06, "loss": 2.439372863769531, "step": 1465200 }, { "epoch": 1.7680799659970758, "learning_rate": 4.122982438003179e-06, "loss": 2.417752532958984, "step": 1465300 }, { "epoch": 1.7682006293195585, "learning_rate": 4.122578602535441e-06, "loss": 2.446169738769531, "step": 1465400 }, { "epoch": 1.768321292642041, "learning_rate": 4.122174767067702e-06, "loss": 2.4505436706542967, "step": 1465500 }, { "epoch": 1.7684419559645237, "learning_rate": 4.121770931599964e-06, "loss": 2.4314443969726565, "step": 1465600 }, { "epoch": 1.7685626192870063, "learning_rate": 4.121367096132225e-06, "loss": 2.4680540466308596, "step": 1465700 }, { "epoch": 1.7686832826094891, "learning_rate": 4.120963260664487e-06, "loss": 2.438385772705078, "step": 1465800 }, { "epoch": 1.768803945931972, "learning_rate": 4.120559425196749e-06, "loss": 2.436359405517578, "step": 1465900 }, { "epoch": 1.7689246092544546, "learning_rate": 4.1201555897290104e-06, "loss": 2.4460289001464846, "step": 1466000 }, { "epoch": 1.7690452725769372, "learning_rate": 4.119751754261272e-06, "loss": 2.4411215209960937, "step": 1466100 }, { "epoch": 1.7691659358994198, "learning_rate": 4.1193479187935336e-06, "loss": 2.4489794921875, "step": 1466200 }, { "epoch": 1.7692865992219025, "learning_rate": 4.1189440833257956e-06, "loss": 2.4514697265625, "step": 1466300 }, { "epoch": 1.7694072625443853, "learning_rate": 4.1185402478580575e-06, "loss": 2.4672341918945313, "step": 1466400 }, { "epoch": 1.769527925866868, "learning_rate": 4.118136412390319e-06, "loss": 2.445034637451172, "step": 1466500 }, { "epoch": 1.7696485891893508, "learning_rate": 4.11773257692258e-06, "loss": 2.4446847534179685, "step": 1466600 }, { "epoch": 1.7697692525118334, "learning_rate": 4.117328741454842e-06, "loss": 2.446482849121094, "step": 1466700 }, { "epoch": 1.769889915834316, "learning_rate": 4.116924905987104e-06, "loss": 2.438362731933594, "step": 1466800 }, { "epoch": 1.7700105791567986, "learning_rate": 4.116521070519365e-06, "loss": 2.4596337890625, "step": 1466900 }, { "epoch": 1.7701312424792812, "learning_rate": 4.116117235051627e-06, "loss": 2.4314535522460936, "step": 1467000 }, { "epoch": 1.770251905801764, "learning_rate": 4.115713399583888e-06, "loss": 2.4454913330078125, "step": 1467100 }, { "epoch": 1.7703725691242467, "learning_rate": 4.11530956411615e-06, "loss": 2.442551574707031, "step": 1467200 }, { "epoch": 1.7704932324467295, "learning_rate": 4.114905728648412e-06, "loss": 2.442946319580078, "step": 1467300 }, { "epoch": 1.7706138957692121, "learning_rate": 4.114501893180673e-06, "loss": 2.4501022338867187, "step": 1467400 }, { "epoch": 1.7707345590916947, "learning_rate": 4.114098057712935e-06, "loss": 2.4660382080078125, "step": 1467500 }, { "epoch": 1.7708552224141774, "learning_rate": 4.113694222245196e-06, "loss": 2.4284402465820314, "step": 1467600 }, { "epoch": 1.77097588573666, "learning_rate": 4.113290386777458e-06, "loss": 2.4514839172363283, "step": 1467700 }, { "epoch": 1.7710965490591428, "learning_rate": 4.112886551309719e-06, "loss": 2.4544992065429687, "step": 1467800 }, { "epoch": 1.7712172123816257, "learning_rate": 4.112482715841981e-06, "loss": 2.4566616821289062, "step": 1467900 }, { "epoch": 1.7713378757041083, "learning_rate": 4.1120788803742425e-06, "loss": 2.452602996826172, "step": 1468000 }, { "epoch": 1.771458539026591, "learning_rate": 4.1116750449065045e-06, "loss": 2.424799041748047, "step": 1468100 }, { "epoch": 1.7715792023490735, "learning_rate": 4.111271209438766e-06, "loss": 2.434325714111328, "step": 1468200 }, { "epoch": 1.7716998656715561, "learning_rate": 4.1108673739710276e-06, "loss": 2.4505657958984375, "step": 1468300 }, { "epoch": 1.771820528994039, "learning_rate": 4.1104635385032896e-06, "loss": 2.4720184326171877, "step": 1468400 }, { "epoch": 1.7719411923165216, "learning_rate": 4.110059703035551e-06, "loss": 2.463412017822266, "step": 1468500 }, { "epoch": 1.7720618556390044, "learning_rate": 4.109655867567812e-06, "loss": 2.4302691650390624, "step": 1468600 }, { "epoch": 1.772182518961487, "learning_rate": 4.109252032100074e-06, "loss": 2.4206553649902345, "step": 1468700 }, { "epoch": 1.7723031822839697, "learning_rate": 4.108848196632336e-06, "loss": 2.4521266174316407, "step": 1468800 }, { "epoch": 1.7724238456064523, "learning_rate": 4.108444361164598e-06, "loss": 2.4323304748535155, "step": 1468900 }, { "epoch": 1.772544508928935, "learning_rate": 4.108040525696859e-06, "loss": 2.455699462890625, "step": 1469000 }, { "epoch": 1.7726651722514177, "learning_rate": 4.10763669022912e-06, "loss": 2.4421849060058594, "step": 1469100 }, { "epoch": 1.7727858355739003, "learning_rate": 4.107232854761382e-06, "loss": 2.44745361328125, "step": 1469200 }, { "epoch": 1.7729064988963832, "learning_rate": 4.106829019293644e-06, "loss": 2.461442565917969, "step": 1469300 }, { "epoch": 1.7730271622188658, "learning_rate": 4.106425183825905e-06, "loss": 2.418671417236328, "step": 1469400 }, { "epoch": 1.7731478255413484, "learning_rate": 4.106021348358167e-06, "loss": 2.466622772216797, "step": 1469500 }, { "epoch": 1.773268488863831, "learning_rate": 4.105617512890428e-06, "loss": 2.43514404296875, "step": 1469600 }, { "epoch": 1.7733891521863139, "learning_rate": 4.10521367742269e-06, "loss": 2.4455543518066407, "step": 1469700 }, { "epoch": 1.7735098155087965, "learning_rate": 4.104809841954951e-06, "loss": 2.447795104980469, "step": 1469800 }, { "epoch": 1.7736304788312793, "learning_rate": 4.104406006487213e-06, "loss": 2.440789794921875, "step": 1469900 }, { "epoch": 1.773751142153762, "learning_rate": 4.104002171019475e-06, "loss": 2.468470458984375, "step": 1470000 }, { "epoch": 1.7738718054762446, "learning_rate": 4.1035983355517365e-06, "loss": 2.458209228515625, "step": 1470100 }, { "epoch": 1.7739924687987272, "learning_rate": 4.103194500083998e-06, "loss": 2.465074462890625, "step": 1470200 }, { "epoch": 1.7741131321212098, "learning_rate": 4.10279066461626e-06, "loss": 2.410941314697266, "step": 1470300 }, { "epoch": 1.7742337954436926, "learning_rate": 4.102386829148522e-06, "loss": 2.4139781188964844, "step": 1470400 }, { "epoch": 1.7743544587661753, "learning_rate": 4.101982993680783e-06, "loss": 2.4285772705078124, "step": 1470500 }, { "epoch": 1.774475122088658, "learning_rate": 4.101579158213045e-06, "loss": 2.437086334228516, "step": 1470600 }, { "epoch": 1.7745957854111407, "learning_rate": 4.101175322745306e-06, "loss": 2.4464593505859376, "step": 1470700 }, { "epoch": 1.7747164487336233, "learning_rate": 4.100771487277568e-06, "loss": 2.4285321044921875, "step": 1470800 }, { "epoch": 1.774837112056106, "learning_rate": 4.10036765180983e-06, "loss": 2.4336944580078126, "step": 1470900 }, { "epoch": 1.7749577753785886, "learning_rate": 4.099963816342091e-06, "loss": 2.442796173095703, "step": 1471000 }, { "epoch": 1.7750784387010714, "learning_rate": 4.099559980874352e-06, "loss": 2.4499165344238283, "step": 1471100 }, { "epoch": 1.7751991020235542, "learning_rate": 4.099156145406614e-06, "loss": 2.4315362548828126, "step": 1471200 }, { "epoch": 1.7753197653460369, "learning_rate": 4.098752309938876e-06, "loss": 2.4376376342773436, "step": 1471300 }, { "epoch": 1.7754404286685195, "learning_rate": 4.098348474471137e-06, "loss": 2.470514678955078, "step": 1471400 }, { "epoch": 1.775561091991002, "learning_rate": 4.097944639003399e-06, "loss": 2.444256134033203, "step": 1471500 }, { "epoch": 1.7756817553134847, "learning_rate": 4.09754080353566e-06, "loss": 2.431909942626953, "step": 1471600 }, { "epoch": 1.7758024186359676, "learning_rate": 4.097136968067922e-06, "loss": 2.441253356933594, "step": 1471700 }, { "epoch": 1.7759230819584502, "learning_rate": 4.096733132600183e-06, "loss": 2.4611363220214844, "step": 1471800 }, { "epoch": 1.776043745280933, "learning_rate": 4.096329297132445e-06, "loss": 2.4391363525390624, "step": 1471900 }, { "epoch": 1.7761644086034156, "learning_rate": 4.095925461664707e-06, "loss": 2.453810119628906, "step": 1472000 }, { "epoch": 1.7762850719258982, "learning_rate": 4.0955216261969685e-06, "loss": 2.441637420654297, "step": 1472100 }, { "epoch": 1.7764057352483809, "learning_rate": 4.0951177907292305e-06, "loss": 2.4402096557617186, "step": 1472200 }, { "epoch": 1.7765263985708635, "learning_rate": 4.094713955261492e-06, "loss": 2.4597425842285157, "step": 1472300 }, { "epoch": 1.7766470618933463, "learning_rate": 4.094310119793754e-06, "loss": 2.460224456787109, "step": 1472400 }, { "epoch": 1.776767725215829, "learning_rate": 4.093906284326016e-06, "loss": 2.4163209533691408, "step": 1472500 }, { "epoch": 1.7768883885383118, "learning_rate": 4.093502448858277e-06, "loss": 2.431062774658203, "step": 1472600 }, { "epoch": 1.7770090518607944, "learning_rate": 4.093098613390538e-06, "loss": 2.4410572814941407, "step": 1472700 }, { "epoch": 1.777129715183277, "learning_rate": 4.0926947779228e-06, "loss": 2.4497132873535157, "step": 1472800 }, { "epoch": 1.7772503785057596, "learning_rate": 4.092290942455062e-06, "loss": 2.445642852783203, "step": 1472900 }, { "epoch": 1.7773710418282422, "learning_rate": 4.091887106987324e-06, "loss": 2.4700563049316404, "step": 1473000 }, { "epoch": 1.777491705150725, "learning_rate": 4.091483271519585e-06, "loss": 2.439924621582031, "step": 1473100 }, { "epoch": 1.777612368473208, "learning_rate": 4.091079436051846e-06, "loss": 2.462299499511719, "step": 1473200 }, { "epoch": 1.7777330317956905, "learning_rate": 4.090675600584108e-06, "loss": 2.4381756591796875, "step": 1473300 }, { "epoch": 1.7778536951181731, "learning_rate": 4.09027176511637e-06, "loss": 2.4550621032714846, "step": 1473400 }, { "epoch": 1.7779743584406558, "learning_rate": 4.089867929648631e-06, "loss": 2.4497694396972656, "step": 1473500 }, { "epoch": 1.7780950217631384, "learning_rate": 4.089464094180892e-06, "loss": 2.429407196044922, "step": 1473600 }, { "epoch": 1.7782156850856212, "learning_rate": 4.089060258713154e-06, "loss": 2.4519903564453127, "step": 1473700 }, { "epoch": 1.7783363484081038, "learning_rate": 4.088656423245416e-06, "loss": 2.421694641113281, "step": 1473800 }, { "epoch": 1.7784570117305867, "learning_rate": 4.088252587777677e-06, "loss": 2.440467529296875, "step": 1473900 }, { "epoch": 1.7785776750530693, "learning_rate": 4.087848752309939e-06, "loss": 2.4173023986816404, "step": 1474000 }, { "epoch": 1.778698338375552, "learning_rate": 4.0874449168422005e-06, "loss": 2.4512901306152344, "step": 1474100 }, { "epoch": 1.7788190016980345, "learning_rate": 4.0870410813744625e-06, "loss": 2.4586737060546877, "step": 1474200 }, { "epoch": 1.7789396650205171, "learning_rate": 4.086637245906724e-06, "loss": 2.4304995727539063, "step": 1474300 }, { "epoch": 1.779060328343, "learning_rate": 4.086233410438986e-06, "loss": 2.441702880859375, "step": 1474400 }, { "epoch": 1.7791809916654826, "learning_rate": 4.085829574971248e-06, "loss": 2.4795796203613283, "step": 1474500 }, { "epoch": 1.7793016549879654, "learning_rate": 4.085425739503509e-06, "loss": 2.4374685668945313, "step": 1474600 }, { "epoch": 1.779422318310448, "learning_rate": 4.08502190403577e-06, "loss": 2.4541680908203123, "step": 1474700 }, { "epoch": 1.7795429816329307, "learning_rate": 4.084618068568032e-06, "loss": 2.4333197021484376, "step": 1474800 }, { "epoch": 1.7796636449554133, "learning_rate": 4.084214233100294e-06, "loss": 2.4402581787109376, "step": 1474900 }, { "epoch": 1.7797843082778961, "learning_rate": 4.083810397632556e-06, "loss": 2.419512176513672, "step": 1475000 }, { "epoch": 1.7799049716003787, "learning_rate": 4.083406562164817e-06, "loss": 2.4570281982421873, "step": 1475100 }, { "epoch": 1.7800256349228616, "learning_rate": 4.083002726697078e-06, "loss": 2.432197723388672, "step": 1475200 }, { "epoch": 1.7801462982453442, "learning_rate": 4.08259889122934e-06, "loss": 2.4652835083007814, "step": 1475300 }, { "epoch": 1.7802669615678268, "learning_rate": 4.082195055761602e-06, "loss": 2.459890594482422, "step": 1475400 }, { "epoch": 1.7803876248903094, "learning_rate": 4.081791220293863e-06, "loss": 2.4474131774902346, "step": 1475500 }, { "epoch": 1.780508288212792, "learning_rate": 4.081387384826125e-06, "loss": 2.4203622436523435, "step": 1475600 }, { "epoch": 1.780628951535275, "learning_rate": 4.080983549358386e-06, "loss": 2.4511351013183593, "step": 1475700 }, { "epoch": 1.7807496148577575, "learning_rate": 4.080579713890648e-06, "loss": 2.449363098144531, "step": 1475800 }, { "epoch": 1.7808702781802404, "learning_rate": 4.0801758784229094e-06, "loss": 2.456115417480469, "step": 1475900 }, { "epoch": 1.780990941502723, "learning_rate": 4.0797720429551714e-06, "loss": 2.4520001220703125, "step": 1476000 }, { "epoch": 1.7811116048252056, "learning_rate": 4.079368207487433e-06, "loss": 2.4541670227050782, "step": 1476100 }, { "epoch": 1.7812322681476882, "learning_rate": 4.0789643720196945e-06, "loss": 2.4675193786621095, "step": 1476200 }, { "epoch": 1.7813529314701708, "learning_rate": 4.078560536551956e-06, "loss": 2.4519282531738282, "step": 1476300 }, { "epoch": 1.7814735947926537, "learning_rate": 4.078156701084218e-06, "loss": 2.4639512634277345, "step": 1476400 }, { "epoch": 1.7815942581151365, "learning_rate": 4.07775286561648e-06, "loss": 2.451590881347656, "step": 1476500 }, { "epoch": 1.7817149214376191, "learning_rate": 4.077349030148741e-06, "loss": 2.4177432250976563, "step": 1476600 }, { "epoch": 1.7818355847601017, "learning_rate": 4.076945194681003e-06, "loss": 2.43607666015625, "step": 1476700 }, { "epoch": 1.7819562480825843, "learning_rate": 4.076541359213264e-06, "loss": 2.4429547119140627, "step": 1476800 }, { "epoch": 1.782076911405067, "learning_rate": 4.076137523745526e-06, "loss": 2.427310333251953, "step": 1476900 }, { "epoch": 1.7821975747275498, "learning_rate": 4.075733688277788e-06, "loss": 2.464246826171875, "step": 1477000 }, { "epoch": 1.7823182380500324, "learning_rate": 4.075329852810049e-06, "loss": 2.460829010009766, "step": 1477100 }, { "epoch": 1.7824389013725153, "learning_rate": 4.07492601734231e-06, "loss": 2.4422120666503906, "step": 1477200 }, { "epoch": 1.7825595646949979, "learning_rate": 4.074522181874572e-06, "loss": 2.4311955261230467, "step": 1477300 }, { "epoch": 1.7826802280174805, "learning_rate": 4.074118346406834e-06, "loss": 2.446169891357422, "step": 1477400 }, { "epoch": 1.7828008913399631, "learning_rate": 4.073714510939096e-06, "loss": 2.430625457763672, "step": 1477500 }, { "epoch": 1.7829215546624457, "learning_rate": 4.073310675471357e-06, "loss": 2.463131866455078, "step": 1477600 }, { "epoch": 1.7830422179849286, "learning_rate": 4.072906840003618e-06, "loss": 2.4548138427734374, "step": 1477700 }, { "epoch": 1.7831628813074112, "learning_rate": 4.07250300453588e-06, "loss": 2.4171742248535155, "step": 1477800 }, { "epoch": 1.783283544629894, "learning_rate": 4.072099169068142e-06, "loss": 2.4571487426757814, "step": 1477900 }, { "epoch": 1.7834042079523766, "learning_rate": 4.0716953336004035e-06, "loss": 2.470812225341797, "step": 1478000 }, { "epoch": 1.7835248712748593, "learning_rate": 4.0712914981326654e-06, "loss": 2.430433349609375, "step": 1478100 }, { "epoch": 1.7836455345973419, "learning_rate": 4.0708876626649266e-06, "loss": 2.4514051818847657, "step": 1478200 }, { "epoch": 1.7837661979198245, "learning_rate": 4.0704838271971886e-06, "loss": 2.443433990478516, "step": 1478300 }, { "epoch": 1.7838868612423073, "learning_rate": 4.07007999172945e-06, "loss": 2.4463755798339846, "step": 1478400 }, { "epoch": 1.7840075245647902, "learning_rate": 4.069676156261712e-06, "loss": 2.449587707519531, "step": 1478500 }, { "epoch": 1.7841281878872728, "learning_rate": 4.069272320793974e-06, "loss": 2.4230192565917967, "step": 1478600 }, { "epoch": 1.7842488512097554, "learning_rate": 4.068868485326235e-06, "loss": 2.4410487365722657, "step": 1478700 }, { "epoch": 1.784369514532238, "learning_rate": 4.068464649858496e-06, "loss": 2.4228692626953126, "step": 1478800 }, { "epoch": 1.7844901778547206, "learning_rate": 4.068060814390758e-06, "loss": 2.4374931335449217, "step": 1478900 }, { "epoch": 1.7846108411772035, "learning_rate": 4.06765697892302e-06, "loss": 2.452794494628906, "step": 1479000 }, { "epoch": 1.784731504499686, "learning_rate": 4.067253143455281e-06, "loss": 2.4284796142578124, "step": 1479100 }, { "epoch": 1.784852167822169, "learning_rate": 4.066849307987543e-06, "loss": 2.472756042480469, "step": 1479200 }, { "epoch": 1.7849728311446516, "learning_rate": 4.066445472519804e-06, "loss": 2.4329374694824217, "step": 1479300 }, { "epoch": 1.7850934944671342, "learning_rate": 4.066041637052066e-06, "loss": 2.436883544921875, "step": 1479400 }, { "epoch": 1.7852141577896168, "learning_rate": 4.065637801584328e-06, "loss": 2.4880406188964845, "step": 1479500 }, { "epoch": 1.7853348211120994, "learning_rate": 4.065233966116589e-06, "loss": 2.4307728576660157, "step": 1479600 }, { "epoch": 1.7854554844345822, "learning_rate": 4.06483013064885e-06, "loss": 2.4555072021484374, "step": 1479700 }, { "epoch": 1.7855761477570649, "learning_rate": 4.064426295181112e-06, "loss": 2.428572540283203, "step": 1479800 }, { "epoch": 1.7856968110795477, "learning_rate": 4.064022459713374e-06, "loss": 2.463938446044922, "step": 1479900 }, { "epoch": 1.7858174744020303, "learning_rate": 4.0636186242456355e-06, "loss": 2.443628845214844, "step": 1480000 }, { "epoch": 1.785938137724513, "learning_rate": 4.0632147887778975e-06, "loss": 2.4234957885742188, "step": 1480100 }, { "epoch": 1.7860588010469955, "learning_rate": 4.062810953310159e-06, "loss": 2.414715576171875, "step": 1480200 }, { "epoch": 1.7861794643694784, "learning_rate": 4.062407117842421e-06, "loss": 2.439808197021484, "step": 1480300 }, { "epoch": 1.786300127691961, "learning_rate": 4.062003282374682e-06, "loss": 2.4130509948730468, "step": 1480400 }, { "epoch": 1.7864207910144438, "learning_rate": 4.061599446906944e-06, "loss": 2.460330352783203, "step": 1480500 }, { "epoch": 1.7865414543369265, "learning_rate": 4.061195611439206e-06, "loss": 2.443551483154297, "step": 1480600 }, { "epoch": 1.786662117659409, "learning_rate": 4.060791775971467e-06, "loss": 2.4398867797851564, "step": 1480700 }, { "epoch": 1.7867827809818917, "learning_rate": 4.060387940503728e-06, "loss": 2.4418585205078127, "step": 1480800 }, { "epoch": 1.7869034443043743, "learning_rate": 4.05998410503599e-06, "loss": 2.444200439453125, "step": 1480900 }, { "epoch": 1.7870241076268572, "learning_rate": 4.059580269568252e-06, "loss": 2.4234324645996095, "step": 1481000 }, { "epoch": 1.7871447709493398, "learning_rate": 4.059176434100514e-06, "loss": 2.4440199279785157, "step": 1481100 }, { "epoch": 1.7872654342718226, "learning_rate": 4.058772598632775e-06, "loss": 2.4684722900390623, "step": 1481200 }, { "epoch": 1.7873860975943052, "learning_rate": 4.058368763165036e-06, "loss": 2.4199287414550783, "step": 1481300 }, { "epoch": 1.7875067609167878, "learning_rate": 4.057964927697298e-06, "loss": 2.4388397216796873, "step": 1481400 }, { "epoch": 1.7876274242392705, "learning_rate": 4.05756109222956e-06, "loss": 2.477461242675781, "step": 1481500 }, { "epoch": 1.787748087561753, "learning_rate": 4.057157256761821e-06, "loss": 2.454827880859375, "step": 1481600 }, { "epoch": 1.787868750884236, "learning_rate": 4.056753421294083e-06, "loss": 2.4496153259277342, "step": 1481700 }, { "epoch": 1.7879894142067188, "learning_rate": 4.056349585826344e-06, "loss": 2.4492384338378907, "step": 1481800 }, { "epoch": 1.7881100775292014, "learning_rate": 4.055945750358606e-06, "loss": 2.4309458923339844, "step": 1481900 }, { "epoch": 1.788230740851684, "learning_rate": 4.0555419148908675e-06, "loss": 2.443880615234375, "step": 1482000 }, { "epoch": 1.7883514041741666, "learning_rate": 4.0551380794231295e-06, "loss": 2.4410671997070312, "step": 1482100 }, { "epoch": 1.7884720674966492, "learning_rate": 4.0547342439553915e-06, "loss": 2.4484846496582033, "step": 1482200 }, { "epoch": 1.788592730819132, "learning_rate": 4.054330408487653e-06, "loss": 2.432414093017578, "step": 1482300 }, { "epoch": 1.7887133941416147, "learning_rate": 4.053926573019914e-06, "loss": 2.473561248779297, "step": 1482400 }, { "epoch": 1.7888340574640975, "learning_rate": 4.053522737552176e-06, "loss": 2.456202087402344, "step": 1482500 }, { "epoch": 1.7889547207865801, "learning_rate": 4.053118902084438e-06, "loss": 2.439820556640625, "step": 1482600 }, { "epoch": 1.7890753841090627, "learning_rate": 4.052715066616699e-06, "loss": 2.44244140625, "step": 1482700 }, { "epoch": 1.7891960474315454, "learning_rate": 4.052311231148961e-06, "loss": 2.4489892578125, "step": 1482800 }, { "epoch": 1.789316710754028, "learning_rate": 4.051907395681222e-06, "loss": 2.442720642089844, "step": 1482900 }, { "epoch": 1.7894373740765108, "learning_rate": 4.051503560213484e-06, "loss": 2.4370933532714845, "step": 1483000 }, { "epoch": 1.7895580373989934, "learning_rate": 4.051099724745746e-06, "loss": 2.42745849609375, "step": 1483100 }, { "epoch": 1.7896787007214763, "learning_rate": 4.050695889278007e-06, "loss": 2.435312042236328, "step": 1483200 }, { "epoch": 1.789799364043959, "learning_rate": 4.050292053810268e-06, "loss": 2.4541554260253906, "step": 1483300 }, { "epoch": 1.7899200273664415, "learning_rate": 4.04988821834253e-06, "loss": 2.4509928894042967, "step": 1483400 }, { "epoch": 1.7900406906889241, "learning_rate": 4.049484382874792e-06, "loss": 2.441980285644531, "step": 1483500 }, { "epoch": 1.7901613540114067, "learning_rate": 4.049080547407054e-06, "loss": 2.444682159423828, "step": 1483600 }, { "epoch": 1.7902820173338896, "learning_rate": 4.048676711939315e-06, "loss": 2.438740692138672, "step": 1483700 }, { "epoch": 1.7904026806563724, "learning_rate": 4.048272876471576e-06, "loss": 2.420367431640625, "step": 1483800 }, { "epoch": 1.790523343978855, "learning_rate": 4.047869041003838e-06, "loss": 2.45123046875, "step": 1483900 }, { "epoch": 1.7906440073013377, "learning_rate": 4.0474652055361e-06, "loss": 2.455613861083984, "step": 1484000 }, { "epoch": 1.7907646706238203, "learning_rate": 4.0470613700683615e-06, "loss": 2.4184701538085935, "step": 1484100 }, { "epoch": 1.790885333946303, "learning_rate": 4.0466575346006235e-06, "loss": 2.427076568603516, "step": 1484200 }, { "epoch": 1.7910059972687857, "learning_rate": 4.046253699132885e-06, "loss": 2.42393798828125, "step": 1484300 }, { "epoch": 1.7911266605912683, "learning_rate": 4.045849863665147e-06, "loss": 2.412470397949219, "step": 1484400 }, { "epoch": 1.7912473239137512, "learning_rate": 4.045446028197408e-06, "loss": 2.449813232421875, "step": 1484500 }, { "epoch": 1.7913679872362338, "learning_rate": 4.04504219272967e-06, "loss": 2.426419372558594, "step": 1484600 }, { "epoch": 1.7914886505587164, "learning_rate": 4.044638357261932e-06, "loss": 2.449449462890625, "step": 1484700 }, { "epoch": 1.791609313881199, "learning_rate": 4.044234521794193e-06, "loss": 2.4399513244628905, "step": 1484800 }, { "epoch": 1.7917299772036817, "learning_rate": 4.043830686326454e-06, "loss": 2.438257751464844, "step": 1484900 }, { "epoch": 1.7918506405261645, "learning_rate": 4.043426850858716e-06, "loss": 2.4336563110351563, "step": 1485000 }, { "epoch": 1.7919713038486473, "learning_rate": 4.043023015390978e-06, "loss": 2.474126281738281, "step": 1485100 }, { "epoch": 1.79209196717113, "learning_rate": 4.042619179923239e-06, "loss": 2.4561924743652344, "step": 1485200 }, { "epoch": 1.7922126304936126, "learning_rate": 4.042215344455501e-06, "loss": 2.452283935546875, "step": 1485300 }, { "epoch": 1.7923332938160952, "learning_rate": 4.041811508987762e-06, "loss": 2.4481657409667967, "step": 1485400 }, { "epoch": 1.7924539571385778, "learning_rate": 4.041407673520024e-06, "loss": 2.4325321960449218, "step": 1485500 }, { "epoch": 1.7925746204610606, "learning_rate": 4.041003838052286e-06, "loss": 2.4358154296875, "step": 1485600 }, { "epoch": 1.7926952837835433, "learning_rate": 4.040600002584547e-06, "loss": 2.4327822875976564, "step": 1485700 }, { "epoch": 1.792815947106026, "learning_rate": 4.0401961671168084e-06, "loss": 2.4695173645019532, "step": 1485800 }, { "epoch": 1.7929366104285087, "learning_rate": 4.03979233164907e-06, "loss": 2.438540344238281, "step": 1485900 }, { "epoch": 1.7930572737509913, "learning_rate": 4.039388496181332e-06, "loss": 2.4265419006347657, "step": 1486000 }, { "epoch": 1.793177937073474, "learning_rate": 4.0389846607135935e-06, "loss": 2.448335723876953, "step": 1486100 }, { "epoch": 1.7932986003959566, "learning_rate": 4.0385808252458555e-06, "loss": 2.41044189453125, "step": 1486200 }, { "epoch": 1.7934192637184394, "learning_rate": 4.038176989778117e-06, "loss": 2.4757659912109373, "step": 1486300 }, { "epoch": 1.793539927040922, "learning_rate": 4.037773154310379e-06, "loss": 2.4439752197265623, "step": 1486400 }, { "epoch": 1.7936605903634049, "learning_rate": 4.03736931884264e-06, "loss": 2.4369607543945313, "step": 1486500 }, { "epoch": 1.7937812536858875, "learning_rate": 4.036965483374902e-06, "loss": 2.4653752136230467, "step": 1486600 }, { "epoch": 1.79390191700837, "learning_rate": 4.036561647907164e-06, "loss": 2.402820587158203, "step": 1486700 }, { "epoch": 1.7940225803308527, "learning_rate": 4.036157812439425e-06, "loss": 2.4385740661621096, "step": 1486800 }, { "epoch": 1.7941432436533353, "learning_rate": 4.035753976971686e-06, "loss": 2.4333233642578125, "step": 1486900 }, { "epoch": 1.7942639069758182, "learning_rate": 4.035350141503948e-06, "loss": 2.4367059326171874, "step": 1487000 }, { "epoch": 1.794384570298301, "learning_rate": 4.03494630603621e-06, "loss": 2.4577684020996093, "step": 1487100 }, { "epoch": 1.7945052336207836, "learning_rate": 4.034542470568472e-06, "loss": 2.418397216796875, "step": 1487200 }, { "epoch": 1.7946258969432662, "learning_rate": 4.034138635100733e-06, "loss": 2.4410604858398437, "step": 1487300 }, { "epoch": 1.7947465602657489, "learning_rate": 4.033734799632994e-06, "loss": 2.432870635986328, "step": 1487400 }, { "epoch": 1.7948672235882315, "learning_rate": 4.033330964165256e-06, "loss": 2.4271527099609376, "step": 1487500 }, { "epoch": 1.7949878869107143, "learning_rate": 4.032927128697518e-06, "loss": 2.461211700439453, "step": 1487600 }, { "epoch": 1.795108550233197, "learning_rate": 4.03252329322978e-06, "loss": 2.456731872558594, "step": 1487700 }, { "epoch": 1.7952292135556798, "learning_rate": 4.032119457762041e-06, "loss": 2.4550241088867186, "step": 1487800 }, { "epoch": 1.7953498768781624, "learning_rate": 4.0317156222943024e-06, "loss": 2.4530787658691406, "step": 1487900 }, { "epoch": 1.795470540200645, "learning_rate": 4.0313117868265644e-06, "loss": 2.4100550842285156, "step": 1488000 }, { "epoch": 1.7955912035231276, "learning_rate": 4.030907951358826e-06, "loss": 2.470788879394531, "step": 1488100 }, { "epoch": 1.7957118668456102, "learning_rate": 4.0305041158910875e-06, "loss": 2.4262008666992188, "step": 1488200 }, { "epoch": 1.795832530168093, "learning_rate": 4.0301002804233495e-06, "loss": 2.449014434814453, "step": 1488300 }, { "epoch": 1.7959531934905757, "learning_rate": 4.029696444955611e-06, "loss": 2.412223205566406, "step": 1488400 }, { "epoch": 1.7960738568130585, "learning_rate": 4.029292609487873e-06, "loss": 2.448611602783203, "step": 1488500 }, { "epoch": 1.7961945201355412, "learning_rate": 4.028888774020134e-06, "loss": 2.457666015625, "step": 1488600 }, { "epoch": 1.7963151834580238, "learning_rate": 4.028484938552396e-06, "loss": 2.4393418884277343, "step": 1488700 }, { "epoch": 1.7964358467805064, "learning_rate": 4.028081103084657e-06, "loss": 2.4238435363769533, "step": 1488800 }, { "epoch": 1.796556510102989, "learning_rate": 4.027677267616919e-06, "loss": 2.46796875, "step": 1488900 }, { "epoch": 1.7966771734254718, "learning_rate": 4.02727343214918e-06, "loss": 2.4470199584960937, "step": 1489000 }, { "epoch": 1.7967978367479547, "learning_rate": 4.026869596681442e-06, "loss": 2.4624639892578126, "step": 1489100 }, { "epoch": 1.7969185000704373, "learning_rate": 4.026465761213704e-06, "loss": 2.4500962829589845, "step": 1489200 }, { "epoch": 1.79703916339292, "learning_rate": 4.026061925745965e-06, "loss": 2.432452850341797, "step": 1489300 }, { "epoch": 1.7971598267154025, "learning_rate": 4.025658090278226e-06, "loss": 2.4400889587402346, "step": 1489400 }, { "epoch": 1.7972804900378851, "learning_rate": 4.025254254810488e-06, "loss": 2.4452178955078123, "step": 1489500 }, { "epoch": 1.797401153360368, "learning_rate": 4.02485041934275e-06, "loss": 2.422432403564453, "step": 1489600 }, { "epoch": 1.7975218166828506, "learning_rate": 4.024446583875012e-06, "loss": 2.423653564453125, "step": 1489700 }, { "epoch": 1.7976424800053334, "learning_rate": 4.024042748407273e-06, "loss": 2.4346359252929686, "step": 1489800 }, { "epoch": 1.797763143327816, "learning_rate": 4.0236389129395345e-06, "loss": 2.4591473388671874, "step": 1489900 }, { "epoch": 1.7978838066502987, "learning_rate": 4.0232350774717965e-06, "loss": 2.440771484375, "step": 1490000 }, { "epoch": 1.7980044699727813, "learning_rate": 4.0228312420040584e-06, "loss": 2.4459109497070313, "step": 1490100 }, { "epoch": 1.798125133295264, "learning_rate": 4.0224274065363196e-06, "loss": 2.419602813720703, "step": 1490200 }, { "epoch": 1.7982457966177468, "learning_rate": 4.0220235710685816e-06, "loss": 2.4186573791503907, "step": 1490300 }, { "epoch": 1.7983664599402296, "learning_rate": 4.021619735600843e-06, "loss": 2.441813201904297, "step": 1490400 }, { "epoch": 1.7984871232627122, "learning_rate": 4.021215900133105e-06, "loss": 2.441319580078125, "step": 1490500 }, { "epoch": 1.7986077865851948, "learning_rate": 4.020812064665366e-06, "loss": 2.443228759765625, "step": 1490600 }, { "epoch": 1.7987284499076774, "learning_rate": 4.020408229197628e-06, "loss": 2.4548379516601564, "step": 1490700 }, { "epoch": 1.79884911323016, "learning_rate": 4.02000439372989e-06, "loss": 2.439638214111328, "step": 1490800 }, { "epoch": 1.798969776552643, "learning_rate": 4.019600558262151e-06, "loss": 2.4658506774902342, "step": 1490900 }, { "epoch": 1.7990904398751255, "learning_rate": 4.019196722794412e-06, "loss": 2.4215089416503908, "step": 1491000 }, { "epoch": 1.7992111031976084, "learning_rate": 4.018792887326674e-06, "loss": 2.4440966796875, "step": 1491100 }, { "epoch": 1.799331766520091, "learning_rate": 4.018389051858936e-06, "loss": 2.4392521667480467, "step": 1491200 }, { "epoch": 1.7994524298425736, "learning_rate": 4.017985216391197e-06, "loss": 2.452306671142578, "step": 1491300 }, { "epoch": 1.7995730931650562, "learning_rate": 4.017581380923459e-06, "loss": 2.4492230224609375, "step": 1491400 }, { "epoch": 1.7996937564875388, "learning_rate": 4.01717754545572e-06, "loss": 2.4316148376464843, "step": 1491500 }, { "epoch": 1.7998144198100217, "learning_rate": 4.016773709987982e-06, "loss": 2.4485418701171877, "step": 1491600 }, { "epoch": 1.7999350831325043, "learning_rate": 4.016369874520244e-06, "loss": 2.4337579345703126, "step": 1491700 }, { "epoch": 1.8000557464549871, "learning_rate": 4.015966039052505e-06, "loss": 2.449376983642578, "step": 1491800 }, { "epoch": 1.8001764097774697, "learning_rate": 4.0155622035847665e-06, "loss": 2.456148681640625, "step": 1491900 }, { "epoch": 1.8002970730999523, "learning_rate": 4.0151583681170285e-06, "loss": 2.437828369140625, "step": 1492000 }, { "epoch": 1.800417736422435, "learning_rate": 4.0147545326492905e-06, "loss": 2.4222035217285156, "step": 1492100 }, { "epoch": 1.8005383997449176, "learning_rate": 4.014350697181552e-06, "loss": 2.46528076171875, "step": 1492200 }, { "epoch": 1.8006590630674004, "learning_rate": 4.013946861713814e-06, "loss": 2.4347821044921876, "step": 1492300 }, { "epoch": 1.8007797263898833, "learning_rate": 4.013543026246075e-06, "loss": 2.467193603515625, "step": 1492400 }, { "epoch": 1.8009003897123659, "learning_rate": 4.013139190778337e-06, "loss": 2.447551574707031, "step": 1492500 }, { "epoch": 1.8010210530348485, "learning_rate": 4.012735355310598e-06, "loss": 2.4286207580566406, "step": 1492600 }, { "epoch": 1.8011417163573311, "learning_rate": 4.01233151984286e-06, "loss": 2.4360748291015626, "step": 1492700 }, { "epoch": 1.8012623796798137, "learning_rate": 4.011927684375122e-06, "loss": 2.437998046875, "step": 1492800 }, { "epoch": 1.8013830430022966, "learning_rate": 4.011523848907383e-06, "loss": 2.4206011962890623, "step": 1492900 }, { "epoch": 1.8015037063247792, "learning_rate": 4.011120013439645e-06, "loss": 2.4279747009277344, "step": 1493000 }, { "epoch": 1.801624369647262, "learning_rate": 4.010716177971906e-06, "loss": 2.4271875, "step": 1493100 }, { "epoch": 1.8017450329697446, "learning_rate": 4.010312342504168e-06, "loss": 2.473305969238281, "step": 1493200 }, { "epoch": 1.8018656962922273, "learning_rate": 4.00990850703643e-06, "loss": 2.432032470703125, "step": 1493300 }, { "epoch": 1.8019863596147099, "learning_rate": 4.009504671568691e-06, "loss": 2.4484230041503907, "step": 1493400 }, { "epoch": 1.8021070229371925, "learning_rate": 4.009100836100952e-06, "loss": 2.4117039489746093, "step": 1493500 }, { "epoch": 1.8022276862596753, "learning_rate": 4.008697000633214e-06, "loss": 2.454134674072266, "step": 1493600 }, { "epoch": 1.802348349582158, "learning_rate": 4.008293165165476e-06, "loss": 2.431804656982422, "step": 1493700 }, { "epoch": 1.8024690129046408, "learning_rate": 4.007889329697737e-06, "loss": 2.449434509277344, "step": 1493800 }, { "epoch": 1.8025896762271234, "learning_rate": 4.007485494229999e-06, "loss": 2.4463958740234375, "step": 1493900 }, { "epoch": 1.802710339549606, "learning_rate": 4.0070816587622605e-06, "loss": 2.428277587890625, "step": 1494000 }, { "epoch": 1.8028310028720886, "learning_rate": 4.0066778232945225e-06, "loss": 2.460702362060547, "step": 1494100 }, { "epoch": 1.8029516661945713, "learning_rate": 4.0062739878267845e-06, "loss": 2.458220672607422, "step": 1494200 }, { "epoch": 1.803072329517054, "learning_rate": 4.005870152359046e-06, "loss": 2.447376708984375, "step": 1494300 }, { "epoch": 1.803192992839537, "learning_rate": 4.005466316891307e-06, "loss": 2.465398254394531, "step": 1494400 }, { "epoch": 1.8033136561620196, "learning_rate": 4.005062481423569e-06, "loss": 2.4286865234375, "step": 1494500 }, { "epoch": 1.8034343194845022, "learning_rate": 4.004658645955831e-06, "loss": 2.4485537719726564, "step": 1494600 }, { "epoch": 1.8035549828069848, "learning_rate": 4.004254810488092e-06, "loss": 2.445104217529297, "step": 1494700 }, { "epoch": 1.8036756461294674, "learning_rate": 4.003850975020354e-06, "loss": 2.4669953918457033, "step": 1494800 }, { "epoch": 1.8037963094519502, "learning_rate": 4.003447139552615e-06, "loss": 2.440146179199219, "step": 1494900 }, { "epoch": 1.8039169727744329, "learning_rate": 4.003043304084877e-06, "loss": 2.434589691162109, "step": 1495000 }, { "epoch": 1.8040376360969157, "learning_rate": 4.002639468617138e-06, "loss": 2.404609375, "step": 1495100 }, { "epoch": 1.8041582994193983, "learning_rate": 4.0022356331494e-06, "loss": 2.4470115661621095, "step": 1495200 }, { "epoch": 1.804278962741881, "learning_rate": 4.001831797681662e-06, "loss": 2.435902557373047, "step": 1495300 }, { "epoch": 1.8043996260643635, "learning_rate": 4.001427962213923e-06, "loss": 2.4333544921875, "step": 1495400 }, { "epoch": 1.8045202893868462, "learning_rate": 4.001024126746184e-06, "loss": 2.455183258056641, "step": 1495500 }, { "epoch": 1.804640952709329, "learning_rate": 4.000620291278446e-06, "loss": 2.4350660705566405, "step": 1495600 }, { "epoch": 1.8047616160318118, "learning_rate": 4.000216455810708e-06, "loss": 2.424752960205078, "step": 1495700 }, { "epoch": 1.8048822793542945, "learning_rate": 3.99981262034297e-06, "loss": 2.4690399169921875, "step": 1495800 }, { "epoch": 1.805002942676777, "learning_rate": 3.999408784875231e-06, "loss": 2.4252061462402343, "step": 1495900 }, { "epoch": 1.8051236059992597, "learning_rate": 3.9990049494074925e-06, "loss": 2.4506565856933595, "step": 1496000 }, { "epoch": 1.8052442693217423, "learning_rate": 3.9986011139397545e-06, "loss": 2.441711883544922, "step": 1496100 }, { "epoch": 1.8053649326442252, "learning_rate": 3.9981972784720165e-06, "loss": 2.423605194091797, "step": 1496200 }, { "epoch": 1.8054855959667078, "learning_rate": 3.997793443004278e-06, "loss": 2.433829650878906, "step": 1496300 }, { "epoch": 1.8056062592891906, "learning_rate": 3.99738960753654e-06, "loss": 2.433603515625, "step": 1496400 }, { "epoch": 1.8057269226116732, "learning_rate": 3.996985772068801e-06, "loss": 2.4210575866699218, "step": 1496500 }, { "epoch": 1.8058475859341558, "learning_rate": 3.996581936601063e-06, "loss": 2.440902099609375, "step": 1496600 }, { "epoch": 1.8059682492566385, "learning_rate": 3.996178101133324e-06, "loss": 2.4151844787597656, "step": 1496700 }, { "epoch": 1.806088912579121, "learning_rate": 3.995774265665586e-06, "loss": 2.4258380126953125, "step": 1496800 }, { "epoch": 1.806209575901604, "learning_rate": 3.995370430197848e-06, "loss": 2.4468537902832033, "step": 1496900 }, { "epoch": 1.8063302392240865, "learning_rate": 3.994966594730109e-06, "loss": 2.4398988342285155, "step": 1497000 }, { "epoch": 1.8064509025465694, "learning_rate": 3.99456275926237e-06, "loss": 2.3978668212890626, "step": 1497100 }, { "epoch": 1.806571565869052, "learning_rate": 3.994158923794632e-06, "loss": 2.383349609375, "step": 1497200 }, { "epoch": 1.8066922291915346, "learning_rate": 3.993755088326894e-06, "loss": 2.455831756591797, "step": 1497300 }, { "epoch": 1.8068128925140172, "learning_rate": 3.993351252859155e-06, "loss": 2.433951568603516, "step": 1497400 }, { "epoch": 1.8069335558364998, "learning_rate": 3.992947417391417e-06, "loss": 2.4583450317382813, "step": 1497500 }, { "epoch": 1.8070542191589827, "learning_rate": 3.992543581923678e-06, "loss": 2.4315861511230468, "step": 1497600 }, { "epoch": 1.8071748824814655, "learning_rate": 3.99213974645594e-06, "loss": 2.4421983337402344, "step": 1497700 }, { "epoch": 1.8072955458039481, "learning_rate": 3.991735910988202e-06, "loss": 2.4304388427734374, "step": 1497800 }, { "epoch": 1.8074162091264308, "learning_rate": 3.991332075520463e-06, "loss": 2.45116455078125, "step": 1497900 }, { "epoch": 1.8075368724489134, "learning_rate": 3.9909282400527246e-06, "loss": 2.4183502197265625, "step": 1498000 }, { "epoch": 1.807657535771396, "learning_rate": 3.9905244045849865e-06, "loss": 2.456245574951172, "step": 1498100 }, { "epoch": 1.8077781990938788, "learning_rate": 3.9901205691172485e-06, "loss": 2.4341172790527343, "step": 1498200 }, { "epoch": 1.8078988624163614, "learning_rate": 3.9897167336495105e-06, "loss": 2.439725189208984, "step": 1498300 }, { "epoch": 1.8080195257388443, "learning_rate": 3.989312898181772e-06, "loss": 2.4237327575683594, "step": 1498400 }, { "epoch": 1.808140189061327, "learning_rate": 3.988909062714033e-06, "loss": 2.452526092529297, "step": 1498500 }, { "epoch": 1.8082608523838095, "learning_rate": 3.988505227246295e-06, "loss": 2.4345109558105467, "step": 1498600 }, { "epoch": 1.8083815157062921, "learning_rate": 3.988101391778557e-06, "loss": 2.443062744140625, "step": 1498700 }, { "epoch": 1.8085021790287747, "learning_rate": 3.987697556310818e-06, "loss": 2.4268646240234375, "step": 1498800 }, { "epoch": 1.8086228423512576, "learning_rate": 3.98729372084308e-06, "loss": 2.4610797119140626, "step": 1498900 }, { "epoch": 1.8087435056737402, "learning_rate": 3.986889885375341e-06, "loss": 2.437807769775391, "step": 1499000 }, { "epoch": 1.808864168996223, "learning_rate": 3.986486049907603e-06, "loss": 2.4381358337402346, "step": 1499100 }, { "epoch": 1.8089848323187057, "learning_rate": 3.986082214439864e-06, "loss": 2.4575871276855468, "step": 1499200 }, { "epoch": 1.8091054956411883, "learning_rate": 3.985678378972126e-06, "loss": 2.411451416015625, "step": 1499300 }, { "epoch": 1.809226158963671, "learning_rate": 3.985274543504388e-06, "loss": 2.4277029418945313, "step": 1499400 }, { "epoch": 1.8093468222861535, "learning_rate": 3.984870708036649e-06, "loss": 2.4465122985839844, "step": 1499500 }, { "epoch": 1.8094674856086364, "learning_rate": 3.98446687256891e-06, "loss": 2.4505691528320312, "step": 1499600 }, { "epoch": 1.8095881489311192, "learning_rate": 3.984063037101172e-06, "loss": 2.458235321044922, "step": 1499700 }, { "epoch": 1.8097088122536018, "learning_rate": 3.983659201633434e-06, "loss": 2.4465072631835936, "step": 1499800 }, { "epoch": 1.8098294755760844, "learning_rate": 3.9832553661656954e-06, "loss": 2.4407891845703125, "step": 1499900 }, { "epoch": 1.809950138898567, "learning_rate": 3.9828515306979574e-06, "loss": 2.4512252807617188, "step": 1500000 }, { "epoch": 1.8100708022210497, "learning_rate": 3.9824476952302186e-06, "loss": 2.440477142333984, "step": 1500100 }, { "epoch": 1.8101914655435325, "learning_rate": 3.9820438597624805e-06, "loss": 2.446125793457031, "step": 1500200 }, { "epoch": 1.8103121288660151, "learning_rate": 3.9816400242947425e-06, "loss": 2.46240966796875, "step": 1500300 }, { "epoch": 1.810432792188498, "learning_rate": 3.981236188827004e-06, "loss": 2.444152069091797, "step": 1500400 }, { "epoch": 1.8105534555109806, "learning_rate": 3.980832353359265e-06, "loss": 2.4453382873535157, "step": 1500500 }, { "epoch": 1.8106741188334632, "learning_rate": 3.980428517891527e-06, "loss": 2.4274411010742187, "step": 1500600 }, { "epoch": 1.8107947821559458, "learning_rate": 3.980024682423789e-06, "loss": 2.421781311035156, "step": 1500700 }, { "epoch": 1.8109154454784284, "learning_rate": 3.97962084695605e-06, "loss": 2.417606201171875, "step": 1500800 }, { "epoch": 1.8110361088009113, "learning_rate": 3.979217011488312e-06, "loss": 2.4249525451660157, "step": 1500900 }, { "epoch": 1.811156772123394, "learning_rate": 3.978813176020573e-06, "loss": 2.4604278564453126, "step": 1501000 }, { "epoch": 1.8112774354458767, "learning_rate": 3.978409340552835e-06, "loss": 2.4451690673828126, "step": 1501100 }, { "epoch": 1.8113980987683593, "learning_rate": 3.978005505085096e-06, "loss": 2.433526611328125, "step": 1501200 }, { "epoch": 1.811518762090842, "learning_rate": 3.977601669617358e-06, "loss": 2.4227220153808595, "step": 1501300 }, { "epoch": 1.8116394254133246, "learning_rate": 3.97719783414962e-06, "loss": 2.416927947998047, "step": 1501400 }, { "epoch": 1.8117600887358074, "learning_rate": 3.976793998681881e-06, "loss": 2.42783935546875, "step": 1501500 }, { "epoch": 1.81188075205829, "learning_rate": 3.976390163214142e-06, "loss": 2.487997741699219, "step": 1501600 }, { "epoch": 1.8120014153807729, "learning_rate": 3.975986327746404e-06, "loss": 2.413171844482422, "step": 1501700 }, { "epoch": 1.8121220787032555, "learning_rate": 3.975582492278666e-06, "loss": 2.445463104248047, "step": 1501800 }, { "epoch": 1.812242742025738, "learning_rate": 3.975178656810928e-06, "loss": 2.4431448364257813, "step": 1501900 }, { "epoch": 1.8123634053482207, "learning_rate": 3.9747748213431895e-06, "loss": 2.4211129760742187, "step": 1502000 }, { "epoch": 1.8124840686707033, "learning_rate": 3.974370985875451e-06, "loss": 2.438428955078125, "step": 1502100 }, { "epoch": 1.8126047319931862, "learning_rate": 3.9739671504077126e-06, "loss": 2.444625244140625, "step": 1502200 }, { "epoch": 1.8127253953156688, "learning_rate": 3.9735633149399746e-06, "loss": 2.452695617675781, "step": 1502300 }, { "epoch": 1.8128460586381516, "learning_rate": 3.973159479472236e-06, "loss": 2.4182456970214843, "step": 1502400 }, { "epoch": 1.8129667219606342, "learning_rate": 3.972755644004498e-06, "loss": 2.430755920410156, "step": 1502500 }, { "epoch": 1.8130873852831169, "learning_rate": 3.972351808536759e-06, "loss": 2.4332095336914064, "step": 1502600 }, { "epoch": 1.8132080486055995, "learning_rate": 3.971947973069021e-06, "loss": 2.4171432495117187, "step": 1502700 }, { "epoch": 1.813328711928082, "learning_rate": 3.971544137601282e-06, "loss": 2.45822265625, "step": 1502800 }, { "epoch": 1.813449375250565, "learning_rate": 3.971140302133544e-06, "loss": 2.469623260498047, "step": 1502900 }, { "epoch": 1.8135700385730478, "learning_rate": 3.970736466665806e-06, "loss": 2.443805847167969, "step": 1503000 }, { "epoch": 1.8136907018955304, "learning_rate": 3.970332631198067e-06, "loss": 2.456459197998047, "step": 1503100 }, { "epoch": 1.813811365218013, "learning_rate": 3.969928795730329e-06, "loss": 2.431924133300781, "step": 1503200 }, { "epoch": 1.8139320285404956, "learning_rate": 3.96952496026259e-06, "loss": 2.4382290649414062, "step": 1503300 }, { "epoch": 1.8140526918629782, "learning_rate": 3.969121124794852e-06, "loss": 2.4424479675292967, "step": 1503400 }, { "epoch": 1.814173355185461, "learning_rate": 3.968717289327113e-06, "loss": 2.433910217285156, "step": 1503500 }, { "epoch": 1.8142940185079437, "learning_rate": 3.968313453859375e-06, "loss": 2.438394775390625, "step": 1503600 }, { "epoch": 1.8144146818304265, "learning_rate": 3.967909618391636e-06, "loss": 2.4146478271484373, "step": 1503700 }, { "epoch": 1.8145353451529092, "learning_rate": 3.967505782923898e-06, "loss": 2.4547515869140626, "step": 1503800 }, { "epoch": 1.8146560084753918, "learning_rate": 3.96710194745616e-06, "loss": 2.429498596191406, "step": 1503900 }, { "epoch": 1.8147766717978744, "learning_rate": 3.9666981119884215e-06, "loss": 2.4379693603515626, "step": 1504000 }, { "epoch": 1.814897335120357, "learning_rate": 3.966294276520683e-06, "loss": 2.450943603515625, "step": 1504100 }, { "epoch": 1.8150179984428398, "learning_rate": 3.965890441052945e-06, "loss": 2.45711181640625, "step": 1504200 }, { "epoch": 1.8151386617653225, "learning_rate": 3.965486605585207e-06, "loss": 2.4425759887695313, "step": 1504300 }, { "epoch": 1.8152593250878053, "learning_rate": 3.9650827701174686e-06, "loss": 2.446157989501953, "step": 1504400 }, { "epoch": 1.815379988410288, "learning_rate": 3.96467893464973e-06, "loss": 2.4348880004882814, "step": 1504500 }, { "epoch": 1.8155006517327705, "learning_rate": 3.964275099181991e-06, "loss": 2.431455383300781, "step": 1504600 }, { "epoch": 1.8156213150552531, "learning_rate": 3.963871263714253e-06, "loss": 2.429371795654297, "step": 1504700 }, { "epoch": 1.8157419783777358, "learning_rate": 3.963467428246515e-06, "loss": 2.4485710144042967, "step": 1504800 }, { "epoch": 1.8158626417002186, "learning_rate": 3.963063592778776e-06, "loss": 2.407504119873047, "step": 1504900 }, { "epoch": 1.8159833050227014, "learning_rate": 3.962659757311038e-06, "loss": 2.449900360107422, "step": 1505000 }, { "epoch": 1.816103968345184, "learning_rate": 3.962255921843299e-06, "loss": 2.437339324951172, "step": 1505100 }, { "epoch": 1.8162246316676667, "learning_rate": 3.961852086375561e-06, "loss": 2.4502767944335937, "step": 1505200 }, { "epoch": 1.8163452949901493, "learning_rate": 3.961448250907822e-06, "loss": 2.4534803771972657, "step": 1505300 }, { "epoch": 1.816465958312632, "learning_rate": 3.961044415440084e-06, "loss": 2.448143310546875, "step": 1505400 }, { "epoch": 1.8165866216351148, "learning_rate": 3.960640579972346e-06, "loss": 2.4213191223144532, "step": 1505500 }, { "epoch": 1.8167072849575974, "learning_rate": 3.960236744504607e-06, "loss": 2.451149597167969, "step": 1505600 }, { "epoch": 1.8168279482800802, "learning_rate": 3.959832909036868e-06, "loss": 2.441400909423828, "step": 1505700 }, { "epoch": 1.8169486116025628, "learning_rate": 3.95942907356913e-06, "loss": 2.429493255615234, "step": 1505800 }, { "epoch": 1.8170692749250454, "learning_rate": 3.959025238101392e-06, "loss": 2.433990936279297, "step": 1505900 }, { "epoch": 1.817189938247528, "learning_rate": 3.9586214026336535e-06, "loss": 2.4232562255859373, "step": 1506000 }, { "epoch": 1.8173106015700107, "learning_rate": 3.9582175671659155e-06, "loss": 2.4632618713378904, "step": 1506100 }, { "epoch": 1.8174312648924935, "learning_rate": 3.957813731698177e-06, "loss": 2.452120361328125, "step": 1506200 }, { "epoch": 1.8175519282149764, "learning_rate": 3.957409896230439e-06, "loss": 2.452930450439453, "step": 1506300 }, { "epoch": 1.817672591537459, "learning_rate": 3.957006060762701e-06, "loss": 2.41974609375, "step": 1506400 }, { "epoch": 1.8177932548599416, "learning_rate": 3.956602225294962e-06, "loss": 2.4555572509765624, "step": 1506500 }, { "epoch": 1.8179139181824242, "learning_rate": 3.956198389827223e-06, "loss": 2.475484619140625, "step": 1506600 }, { "epoch": 1.8180345815049068, "learning_rate": 3.955794554359485e-06, "loss": 2.458047332763672, "step": 1506700 }, { "epoch": 1.8181552448273897, "learning_rate": 3.955390718891747e-06, "loss": 2.430336456298828, "step": 1506800 }, { "epoch": 1.8182759081498723, "learning_rate": 3.954986883424008e-06, "loss": 2.448626708984375, "step": 1506900 }, { "epoch": 1.8183965714723551, "learning_rate": 3.95458304795627e-06, "loss": 2.4245892333984376, "step": 1507000 }, { "epoch": 1.8185172347948377, "learning_rate": 3.954179212488531e-06, "loss": 2.4188035583496093, "step": 1507100 }, { "epoch": 1.8186378981173204, "learning_rate": 3.953775377020793e-06, "loss": 2.4485484313964845, "step": 1507200 }, { "epoch": 1.818758561439803, "learning_rate": 3.953371541553054e-06, "loss": 2.4246173095703125, "step": 1507300 }, { "epoch": 1.8188792247622856, "learning_rate": 3.952967706085316e-06, "loss": 2.4410313415527343, "step": 1507400 }, { "epoch": 1.8189998880847684, "learning_rate": 3.952563870617578e-06, "loss": 2.45004638671875, "step": 1507500 }, { "epoch": 1.819120551407251, "learning_rate": 3.952160035149839e-06, "loss": 2.4391162109375, "step": 1507600 }, { "epoch": 1.8192412147297339, "learning_rate": 3.9517561996821004e-06, "loss": 2.412339324951172, "step": 1507700 }, { "epoch": 1.8193618780522165, "learning_rate": 3.951352364214362e-06, "loss": 2.4316546630859377, "step": 1507800 }, { "epoch": 1.8194825413746991, "learning_rate": 3.950948528746624e-06, "loss": 2.4748150634765627, "step": 1507900 }, { "epoch": 1.8196032046971817, "learning_rate": 3.950544693278886e-06, "loss": 2.4536952209472656, "step": 1508000 }, { "epoch": 1.8197238680196643, "learning_rate": 3.9501408578111475e-06, "loss": 2.425925598144531, "step": 1508100 }, { "epoch": 1.8198445313421472, "learning_rate": 3.949737022343409e-06, "loss": 2.430874938964844, "step": 1508200 }, { "epoch": 1.81996519466463, "learning_rate": 3.949333186875671e-06, "loss": 2.4326432800292968, "step": 1508300 }, { "epoch": 1.8200858579871126, "learning_rate": 3.948929351407933e-06, "loss": 2.4252772521972656, "step": 1508400 }, { "epoch": 1.8202065213095953, "learning_rate": 3.948525515940195e-06, "loss": 2.435092010498047, "step": 1508500 }, { "epoch": 1.8203271846320779, "learning_rate": 3.948121680472456e-06, "loss": 2.439889678955078, "step": 1508600 }, { "epoch": 1.8204478479545605, "learning_rate": 3.947717845004717e-06, "loss": 2.4541311645507813, "step": 1508700 }, { "epoch": 1.8205685112770433, "learning_rate": 3.947314009536979e-06, "loss": 2.4486366271972657, "step": 1508800 }, { "epoch": 1.820689174599526, "learning_rate": 3.946910174069241e-06, "loss": 2.4448204040527344, "step": 1508900 }, { "epoch": 1.8208098379220088, "learning_rate": 3.946506338601502e-06, "loss": 2.4382392883300783, "step": 1509000 }, { "epoch": 1.8209305012444914, "learning_rate": 3.946102503133764e-06, "loss": 2.43061279296875, "step": 1509100 }, { "epoch": 1.821051164566974, "learning_rate": 3.945698667666025e-06, "loss": 2.454139404296875, "step": 1509200 }, { "epoch": 1.8211718278894566, "learning_rate": 3.945294832198287e-06, "loss": 2.4395191955566404, "step": 1509300 }, { "epoch": 1.8212924912119393, "learning_rate": 3.944890996730548e-06, "loss": 2.4421484375, "step": 1509400 }, { "epoch": 1.821413154534422, "learning_rate": 3.94448716126281e-06, "loss": 2.4233822631835937, "step": 1509500 }, { "epoch": 1.8215338178569047, "learning_rate": 3.944083325795071e-06, "loss": 2.4356134033203123, "step": 1509600 }, { "epoch": 1.8216544811793876, "learning_rate": 3.943679490327333e-06, "loss": 2.462085876464844, "step": 1509700 }, { "epoch": 1.8217751445018702, "learning_rate": 3.9432756548595944e-06, "loss": 2.4459461975097656, "step": 1509800 }, { "epoch": 1.8218958078243528, "learning_rate": 3.942871819391856e-06, "loss": 2.4530152893066406, "step": 1509900 }, { "epoch": 1.8220164711468354, "learning_rate": 3.942467983924118e-06, "loss": 2.415724639892578, "step": 1510000 }, { "epoch": 1.822137134469318, "learning_rate": 3.9420641484563795e-06, "loss": 2.429998779296875, "step": 1510100 }, { "epoch": 1.8222577977918009, "learning_rate": 3.941660312988641e-06, "loss": 2.445496063232422, "step": 1510200 }, { "epoch": 1.8223784611142837, "learning_rate": 3.941256477520903e-06, "loss": 2.4363777160644533, "step": 1510300 }, { "epoch": 1.8224991244367663, "learning_rate": 3.940852642053165e-06, "loss": 2.438937225341797, "step": 1510400 }, { "epoch": 1.822619787759249, "learning_rate": 3.940448806585427e-06, "loss": 2.4312620544433594, "step": 1510500 }, { "epoch": 1.8227404510817315, "learning_rate": 3.940044971117688e-06, "loss": 2.426069793701172, "step": 1510600 }, { "epoch": 1.8228611144042142, "learning_rate": 3.939641135649949e-06, "loss": 2.4355003356933596, "step": 1510700 }, { "epoch": 1.822981777726697, "learning_rate": 3.939237300182211e-06, "loss": 2.409188232421875, "step": 1510800 }, { "epoch": 1.8231024410491796, "learning_rate": 3.938833464714473e-06, "loss": 2.4404220581054688, "step": 1510900 }, { "epoch": 1.8232231043716625, "learning_rate": 3.938429629246734e-06, "loss": 2.426763000488281, "step": 1511000 }, { "epoch": 1.823343767694145, "learning_rate": 3.938025793778996e-06, "loss": 2.4389617919921873, "step": 1511100 }, { "epoch": 1.8234644310166277, "learning_rate": 3.937621958311257e-06, "loss": 2.4424205017089844, "step": 1511200 }, { "epoch": 1.8235850943391103, "learning_rate": 3.937218122843519e-06, "loss": 2.4619186401367186, "step": 1511300 }, { "epoch": 1.823705757661593, "learning_rate": 3.93681428737578e-06, "loss": 2.42741943359375, "step": 1511400 }, { "epoch": 1.8238264209840758, "learning_rate": 3.936410451908042e-06, "loss": 2.4331817626953125, "step": 1511500 }, { "epoch": 1.8239470843065586, "learning_rate": 3.936006616440304e-06, "loss": 2.4318577575683595, "step": 1511600 }, { "epoch": 1.8240677476290412, "learning_rate": 3.935602780972565e-06, "loss": 2.4343991088867187, "step": 1511700 }, { "epoch": 1.8241884109515238, "learning_rate": 3.9351989455048265e-06, "loss": 2.435884704589844, "step": 1511800 }, { "epoch": 1.8243090742740065, "learning_rate": 3.9347951100370884e-06, "loss": 2.4445265197753905, "step": 1511900 }, { "epoch": 1.824429737596489, "learning_rate": 3.9343912745693504e-06, "loss": 2.4581871032714844, "step": 1512000 }, { "epoch": 1.824550400918972, "learning_rate": 3.9339874391016116e-06, "loss": 2.442604827880859, "step": 1512100 }, { "epoch": 1.8246710642414545, "learning_rate": 3.9335836036338735e-06, "loss": 2.449970245361328, "step": 1512200 }, { "epoch": 1.8247917275639374, "learning_rate": 3.933179768166135e-06, "loss": 2.462432403564453, "step": 1512300 }, { "epoch": 1.82491239088642, "learning_rate": 3.932775932698397e-06, "loss": 2.4469944763183595, "step": 1512400 }, { "epoch": 1.8250330542089026, "learning_rate": 3.932372097230659e-06, "loss": 2.414932861328125, "step": 1512500 }, { "epoch": 1.8251537175313852, "learning_rate": 3.93196826176292e-06, "loss": 2.4286648559570314, "step": 1512600 }, { "epoch": 1.8252743808538678, "learning_rate": 3.931564426295181e-06, "loss": 2.4364984130859373, "step": 1512700 }, { "epoch": 1.8253950441763507, "learning_rate": 3.931160590827443e-06, "loss": 2.4396290588378906, "step": 1512800 }, { "epoch": 1.8255157074988333, "learning_rate": 3.930756755359705e-06, "loss": 2.4330459594726563, "step": 1512900 }, { "epoch": 1.8256363708213161, "learning_rate": 3.930352919891966e-06, "loss": 2.430081787109375, "step": 1513000 }, { "epoch": 1.8257570341437988, "learning_rate": 3.929949084424228e-06, "loss": 2.415271759033203, "step": 1513100 }, { "epoch": 1.8258776974662814, "learning_rate": 3.929545248956489e-06, "loss": 2.4049627685546877, "step": 1513200 }, { "epoch": 1.825998360788764, "learning_rate": 3.929141413488751e-06, "loss": 2.4521798706054687, "step": 1513300 }, { "epoch": 1.8261190241112466, "learning_rate": 3.928737578021013e-06, "loss": 2.4036543273925783, "step": 1513400 }, { "epoch": 1.8262396874337294, "learning_rate": 3.928333742553274e-06, "loss": 2.440210418701172, "step": 1513500 }, { "epoch": 1.8263603507562123, "learning_rate": 3.927929907085536e-06, "loss": 2.4397232055664064, "step": 1513600 }, { "epoch": 1.826481014078695, "learning_rate": 3.927526071617797e-06, "loss": 2.458310089111328, "step": 1513700 }, { "epoch": 1.8266016774011775, "learning_rate": 3.927122236150059e-06, "loss": 2.4314115905761717, "step": 1513800 }, { "epoch": 1.8267223407236601, "learning_rate": 3.9267184006823205e-06, "loss": 2.4561085510253906, "step": 1513900 }, { "epoch": 1.8268430040461427, "learning_rate": 3.9263145652145825e-06, "loss": 2.4419073486328124, "step": 1514000 }, { "epoch": 1.8269636673686256, "learning_rate": 3.9259107297468444e-06, "loss": 2.4388191223144533, "step": 1514100 }, { "epoch": 1.8270843306911082, "learning_rate": 3.9255068942791056e-06, "loss": 2.4407298278808596, "step": 1514200 }, { "epoch": 1.827204994013591, "learning_rate": 3.925103058811367e-06, "loss": 2.4299867248535154, "step": 1514300 }, { "epoch": 1.8273256573360737, "learning_rate": 3.924699223343629e-06, "loss": 2.445773468017578, "step": 1514400 }, { "epoch": 1.8274463206585563, "learning_rate": 3.924295387875891e-06, "loss": 2.441481018066406, "step": 1514500 }, { "epoch": 1.827566983981039, "learning_rate": 3.923891552408152e-06, "loss": 2.4241104125976562, "step": 1514600 }, { "epoch": 1.8276876473035215, "learning_rate": 3.923487716940414e-06, "loss": 2.4439468383789062, "step": 1514700 }, { "epoch": 1.8278083106260044, "learning_rate": 3.923083881472675e-06, "loss": 2.4495762634277343, "step": 1514800 }, { "epoch": 1.827928973948487, "learning_rate": 3.922680046004937e-06, "loss": 2.429299621582031, "step": 1514900 }, { "epoch": 1.8280496372709698, "learning_rate": 3.922276210537199e-06, "loss": 2.4515673828125, "step": 1515000 }, { "epoch": 1.8281703005934524, "learning_rate": 3.92187237506946e-06, "loss": 2.405334930419922, "step": 1515100 }, { "epoch": 1.828290963915935, "learning_rate": 3.921468539601721e-06, "loss": 2.4328817749023437, "step": 1515200 }, { "epoch": 1.8284116272384177, "learning_rate": 3.921064704133983e-06, "loss": 2.441896667480469, "step": 1515300 }, { "epoch": 1.8285322905609003, "learning_rate": 3.920660868666245e-06, "loss": 2.419830627441406, "step": 1515400 }, { "epoch": 1.8286529538833831, "learning_rate": 3.920257033198506e-06, "loss": 2.452900695800781, "step": 1515500 }, { "epoch": 1.828773617205866, "learning_rate": 3.919853197730768e-06, "loss": 2.4555010986328125, "step": 1515600 }, { "epoch": 1.8288942805283486, "learning_rate": 3.919449362263029e-06, "loss": 2.440643310546875, "step": 1515700 }, { "epoch": 1.8290149438508312, "learning_rate": 3.919045526795291e-06, "loss": 2.415866241455078, "step": 1515800 }, { "epoch": 1.8291356071733138, "learning_rate": 3.9186416913275525e-06, "loss": 2.432717590332031, "step": 1515900 }, { "epoch": 1.8292562704957964, "learning_rate": 3.9182378558598145e-06, "loss": 2.4303440856933594, "step": 1516000 }, { "epoch": 1.8293769338182793, "learning_rate": 3.9178340203920765e-06, "loss": 2.432781524658203, "step": 1516100 }, { "epoch": 1.8294975971407619, "learning_rate": 3.917430184924338e-06, "loss": 2.4379171752929687, "step": 1516200 }, { "epoch": 1.8296182604632447, "learning_rate": 3.917026349456599e-06, "loss": 2.4584014892578123, "step": 1516300 }, { "epoch": 1.8297389237857273, "learning_rate": 3.916622513988861e-06, "loss": 2.4169081115722655, "step": 1516400 }, { "epoch": 1.82985958710821, "learning_rate": 3.916218678521123e-06, "loss": 2.430353546142578, "step": 1516500 }, { "epoch": 1.8299802504306926, "learning_rate": 3.915814843053385e-06, "loss": 2.417276153564453, "step": 1516600 }, { "epoch": 1.8301009137531752, "learning_rate": 3.915411007585646e-06, "loss": 2.4515301513671877, "step": 1516700 }, { "epoch": 1.830221577075658, "learning_rate": 3.915007172117907e-06, "loss": 2.455863800048828, "step": 1516800 }, { "epoch": 1.8303422403981409, "learning_rate": 3.914603336650169e-06, "loss": 2.447745361328125, "step": 1516900 }, { "epoch": 1.8304629037206235, "learning_rate": 3.914199501182431e-06, "loss": 2.4435270690917967, "step": 1517000 }, { "epoch": 1.830583567043106, "learning_rate": 3.913795665714692e-06, "loss": 2.4748558044433593, "step": 1517100 }, { "epoch": 1.8307042303655887, "learning_rate": 3.913391830246954e-06, "loss": 2.42590576171875, "step": 1517200 }, { "epoch": 1.8308248936880713, "learning_rate": 3.912987994779215e-06, "loss": 2.426390838623047, "step": 1517300 }, { "epoch": 1.8309455570105542, "learning_rate": 3.912584159311477e-06, "loss": 2.437372283935547, "step": 1517400 }, { "epoch": 1.8310662203330368, "learning_rate": 3.912180323843738e-06, "loss": 2.4542605590820314, "step": 1517500 }, { "epoch": 1.8311868836555196, "learning_rate": 3.911776488376e-06, "loss": 2.4601286315917967, "step": 1517600 }, { "epoch": 1.8313075469780022, "learning_rate": 3.911372652908262e-06, "loss": 2.425869598388672, "step": 1517700 }, { "epoch": 1.8314282103004849, "learning_rate": 3.910968817440523e-06, "loss": 2.4386003112792967, "step": 1517800 }, { "epoch": 1.8315488736229675, "learning_rate": 3.9105649819727845e-06, "loss": 2.446849670410156, "step": 1517900 }, { "epoch": 1.83166953694545, "learning_rate": 3.9101611465050465e-06, "loss": 2.422255401611328, "step": 1518000 }, { "epoch": 1.831790200267933, "learning_rate": 3.9097573110373085e-06, "loss": 2.4482814025878907, "step": 1518100 }, { "epoch": 1.8319108635904156, "learning_rate": 3.90935347556957e-06, "loss": 2.4656521606445314, "step": 1518200 }, { "epoch": 1.8320315269128984, "learning_rate": 3.908949640101832e-06, "loss": 2.434772186279297, "step": 1518300 }, { "epoch": 1.832152190235381, "learning_rate": 3.908545804634093e-06, "loss": 2.425520172119141, "step": 1518400 }, { "epoch": 1.8322728535578636, "learning_rate": 3.908141969166355e-06, "loss": 2.431307830810547, "step": 1518500 }, { "epoch": 1.8323935168803462, "learning_rate": 3.907738133698617e-06, "loss": 2.414031982421875, "step": 1518600 }, { "epoch": 1.8325141802028289, "learning_rate": 3.907334298230878e-06, "loss": 2.4515008544921875, "step": 1518700 }, { "epoch": 1.8326348435253117, "learning_rate": 3.906930462763139e-06, "loss": 2.447434997558594, "step": 1518800 }, { "epoch": 1.8327555068477945, "learning_rate": 3.906526627295401e-06, "loss": 2.4169984436035157, "step": 1518900 }, { "epoch": 1.8328761701702772, "learning_rate": 3.906122791827663e-06, "loss": 2.4269207763671874, "step": 1519000 }, { "epoch": 1.8329968334927598, "learning_rate": 3.905718956359925e-06, "loss": 2.4520474243164063, "step": 1519100 }, { "epoch": 1.8331174968152424, "learning_rate": 3.905315120892186e-06, "loss": 2.442113037109375, "step": 1519200 }, { "epoch": 1.833238160137725, "learning_rate": 3.904911285424447e-06, "loss": 2.4433575439453126, "step": 1519300 }, { "epoch": 1.8333588234602078, "learning_rate": 3.904507449956709e-06, "loss": 2.4325328063964844, "step": 1519400 }, { "epoch": 1.8334794867826905, "learning_rate": 3.904103614488971e-06, "loss": 2.4381495666503907, "step": 1519500 }, { "epoch": 1.8336001501051733, "learning_rate": 3.903699779021232e-06, "loss": 2.396145935058594, "step": 1519600 }, { "epoch": 1.833720813427656, "learning_rate": 3.903295943553494e-06, "loss": 2.439419708251953, "step": 1519700 }, { "epoch": 1.8338414767501385, "learning_rate": 3.902892108085755e-06, "loss": 2.4340467834472657, "step": 1519800 }, { "epoch": 1.8339621400726211, "learning_rate": 3.902488272618017e-06, "loss": 2.423734436035156, "step": 1519900 }, { "epoch": 1.8340828033951038, "learning_rate": 3.9020844371502785e-06, "loss": 2.4324220275878905, "step": 1520000 }, { "epoch": 1.8342034667175866, "learning_rate": 3.9016806016825405e-06, "loss": 2.435362548828125, "step": 1520100 }, { "epoch": 1.8343241300400692, "learning_rate": 3.9012767662148025e-06, "loss": 2.441719665527344, "step": 1520200 }, { "epoch": 1.834444793362552, "learning_rate": 3.900872930747064e-06, "loss": 2.4435214233398437, "step": 1520300 }, { "epoch": 1.8345654566850347, "learning_rate": 3.900469095279325e-06, "loss": 2.4358154296875, "step": 1520400 }, { "epoch": 1.8346861200075173, "learning_rate": 3.900065259811587e-06, "loss": 2.4471505737304686, "step": 1520500 }, { "epoch": 1.83480678333, "learning_rate": 3.899661424343849e-06, "loss": 2.411457977294922, "step": 1520600 }, { "epoch": 1.8349274466524825, "learning_rate": 3.89925758887611e-06, "loss": 2.4286845397949217, "step": 1520700 }, { "epoch": 1.8350481099749654, "learning_rate": 3.898853753408372e-06, "loss": 2.440804138183594, "step": 1520800 }, { "epoch": 1.8351687732974482, "learning_rate": 3.898449917940633e-06, "loss": 2.4121746826171875, "step": 1520900 }, { "epoch": 1.8352894366199308, "learning_rate": 3.898046082472895e-06, "loss": 2.4460121154785157, "step": 1521000 }, { "epoch": 1.8354100999424134, "learning_rate": 3.897642247005157e-06, "loss": 2.447772979736328, "step": 1521100 }, { "epoch": 1.835530763264896, "learning_rate": 3.897238411537418e-06, "loss": 2.4326100158691406, "step": 1521200 }, { "epoch": 1.8356514265873787, "learning_rate": 3.896834576069679e-06, "loss": 2.4658770751953125, "step": 1521300 }, { "epoch": 1.8357720899098615, "learning_rate": 3.896430740601941e-06, "loss": 2.47591064453125, "step": 1521400 }, { "epoch": 1.8358927532323441, "learning_rate": 3.896026905134203e-06, "loss": 2.4064598083496094, "step": 1521500 }, { "epoch": 1.836013416554827, "learning_rate": 3.895623069666464e-06, "loss": 2.42497802734375, "step": 1521600 }, { "epoch": 1.8361340798773096, "learning_rate": 3.895219234198726e-06, "loss": 2.4215696716308592, "step": 1521700 }, { "epoch": 1.8362547431997922, "learning_rate": 3.8948153987309874e-06, "loss": 2.4422434997558593, "step": 1521800 }, { "epoch": 1.8363754065222748, "learning_rate": 3.8944115632632494e-06, "loss": 2.4183169555664064, "step": 1521900 }, { "epoch": 1.8364960698447574, "learning_rate": 3.8940077277955106e-06, "loss": 2.431721649169922, "step": 1522000 }, { "epoch": 1.8366167331672403, "learning_rate": 3.8936038923277725e-06, "loss": 2.445034637451172, "step": 1522100 }, { "epoch": 1.8367373964897231, "learning_rate": 3.8932000568600345e-06, "loss": 2.443372344970703, "step": 1522200 }, { "epoch": 1.8368580598122057, "learning_rate": 3.892796221392296e-06, "loss": 2.435571746826172, "step": 1522300 }, { "epoch": 1.8369787231346884, "learning_rate": 3.892392385924557e-06, "loss": 2.435527801513672, "step": 1522400 }, { "epoch": 1.837099386457171, "learning_rate": 3.891988550456819e-06, "loss": 2.4288668823242188, "step": 1522500 }, { "epoch": 1.8372200497796536, "learning_rate": 3.891584714989081e-06, "loss": 2.447695465087891, "step": 1522600 }, { "epoch": 1.8373407131021364, "learning_rate": 3.891180879521343e-06, "loss": 2.4225978088378906, "step": 1522700 }, { "epoch": 1.837461376424619, "learning_rate": 3.890777044053604e-06, "loss": 2.458771209716797, "step": 1522800 }, { "epoch": 1.8375820397471019, "learning_rate": 3.890373208585865e-06, "loss": 2.425088195800781, "step": 1522900 }, { "epoch": 1.8377027030695845, "learning_rate": 3.889969373118127e-06, "loss": 2.4403509521484374, "step": 1523000 }, { "epoch": 1.8378233663920671, "learning_rate": 3.889565537650389e-06, "loss": 2.4405531311035156, "step": 1523100 }, { "epoch": 1.8379440297145497, "learning_rate": 3.88916170218265e-06, "loss": 2.436156921386719, "step": 1523200 }, { "epoch": 1.8380646930370323, "learning_rate": 3.888757866714912e-06, "loss": 2.4546138000488282, "step": 1523300 }, { "epoch": 1.8381853563595152, "learning_rate": 3.888354031247173e-06, "loss": 2.433369445800781, "step": 1523400 }, { "epoch": 1.8383060196819978, "learning_rate": 3.887950195779435e-06, "loss": 2.4189903259277346, "step": 1523500 }, { "epoch": 1.8384266830044806, "learning_rate": 3.887546360311696e-06, "loss": 2.459973907470703, "step": 1523600 }, { "epoch": 1.8385473463269633, "learning_rate": 3.887142524843958e-06, "loss": 2.4111207580566405, "step": 1523700 }, { "epoch": 1.8386680096494459, "learning_rate": 3.88673868937622e-06, "loss": 2.427070770263672, "step": 1523800 }, { "epoch": 1.8387886729719285, "learning_rate": 3.8863348539084815e-06, "loss": 2.410308380126953, "step": 1523900 }, { "epoch": 1.8389093362944111, "learning_rate": 3.8859310184407434e-06, "loss": 2.4229359436035156, "step": 1524000 }, { "epoch": 1.839029999616894, "learning_rate": 3.8855271829730046e-06, "loss": 2.44236328125, "step": 1524100 }, { "epoch": 1.8391506629393768, "learning_rate": 3.8851233475052666e-06, "loss": 2.442509765625, "step": 1524200 }, { "epoch": 1.8392713262618594, "learning_rate": 3.884719512037528e-06, "loss": 2.4513920593261718, "step": 1524300 }, { "epoch": 1.839391989584342, "learning_rate": 3.88431567656979e-06, "loss": 2.4694454956054686, "step": 1524400 }, { "epoch": 1.8395126529068246, "learning_rate": 3.883911841102051e-06, "loss": 2.4091468811035157, "step": 1524500 }, { "epoch": 1.8396333162293073, "learning_rate": 3.883508005634313e-06, "loss": 2.445056915283203, "step": 1524600 }, { "epoch": 1.83975397955179, "learning_rate": 3.883104170166575e-06, "loss": 2.434682159423828, "step": 1524700 }, { "epoch": 1.8398746428742727, "learning_rate": 3.882700334698836e-06, "loss": 2.4360482788085935, "step": 1524800 }, { "epoch": 1.8399953061967556, "learning_rate": 3.882296499231097e-06, "loss": 2.440980224609375, "step": 1524900 }, { "epoch": 1.8401159695192382, "learning_rate": 3.881892663763359e-06, "loss": 2.434378356933594, "step": 1525000 }, { "epoch": 1.8402366328417208, "learning_rate": 3.881488828295621e-06, "loss": 2.4361737060546873, "step": 1525100 }, { "epoch": 1.8403572961642034, "learning_rate": 3.881084992827883e-06, "loss": 2.4117195129394533, "step": 1525200 }, { "epoch": 1.840477959486686, "learning_rate": 3.880681157360144e-06, "loss": 2.4403730773925782, "step": 1525300 }, { "epoch": 1.8405986228091689, "learning_rate": 3.880277321892405e-06, "loss": 2.4405867004394532, "step": 1525400 }, { "epoch": 1.8407192861316515, "learning_rate": 3.879873486424667e-06, "loss": 2.4364666748046875, "step": 1525500 }, { "epoch": 1.8408399494541343, "learning_rate": 3.879469650956929e-06, "loss": 2.4301918029785154, "step": 1525600 }, { "epoch": 1.840960612776617, "learning_rate": 3.87906581548919e-06, "loss": 2.4266815185546875, "step": 1525700 }, { "epoch": 1.8410812760990996, "learning_rate": 3.878661980021452e-06, "loss": 2.4381034851074217, "step": 1525800 }, { "epoch": 1.8412019394215822, "learning_rate": 3.8782581445537135e-06, "loss": 2.441404266357422, "step": 1525900 }, { "epoch": 1.8413226027440648, "learning_rate": 3.8778543090859755e-06, "loss": 2.4522549438476564, "step": 1526000 }, { "epoch": 1.8414432660665476, "learning_rate": 3.877450473618237e-06, "loss": 2.4190022277832033, "step": 1526100 }, { "epoch": 1.8415639293890305, "learning_rate": 3.8770466381504986e-06, "loss": 2.4033636474609374, "step": 1526200 }, { "epoch": 1.841684592711513, "learning_rate": 3.8766428026827606e-06, "loss": 2.4296368408203124, "step": 1526300 }, { "epoch": 1.8418052560339957, "learning_rate": 3.876238967215022e-06, "loss": 2.4481402587890626, "step": 1526400 }, { "epoch": 1.8419259193564783, "learning_rate": 3.875835131747283e-06, "loss": 2.4129487609863283, "step": 1526500 }, { "epoch": 1.842046582678961, "learning_rate": 3.875431296279545e-06, "loss": 2.4258856201171874, "step": 1526600 }, { "epoch": 1.8421672460014438, "learning_rate": 3.875027460811807e-06, "loss": 2.4482972717285154, "step": 1526700 }, { "epoch": 1.8422879093239264, "learning_rate": 3.874623625344068e-06, "loss": 2.432389373779297, "step": 1526800 }, { "epoch": 1.8424085726464092, "learning_rate": 3.87421978987633e-06, "loss": 2.43484619140625, "step": 1526900 }, { "epoch": 1.8425292359688918, "learning_rate": 3.873815954408591e-06, "loss": 2.438068084716797, "step": 1527000 }, { "epoch": 1.8426498992913745, "learning_rate": 3.873412118940853e-06, "loss": 2.415796813964844, "step": 1527100 }, { "epoch": 1.842770562613857, "learning_rate": 3.873008283473115e-06, "loss": 2.4413774108886717, "step": 1527200 }, { "epoch": 1.8428912259363397, "learning_rate": 3.872604448005376e-06, "loss": 2.447018737792969, "step": 1527300 }, { "epoch": 1.8430118892588225, "learning_rate": 3.872200612537637e-06, "loss": 2.4570718383789063, "step": 1527400 }, { "epoch": 1.8431325525813054, "learning_rate": 3.871796777069899e-06, "loss": 2.4359164428710938, "step": 1527500 }, { "epoch": 1.843253215903788, "learning_rate": 3.871392941602161e-06, "loss": 2.4293060302734375, "step": 1527600 }, { "epoch": 1.8433738792262706, "learning_rate": 3.870989106134422e-06, "loss": 2.427010955810547, "step": 1527700 }, { "epoch": 1.8434945425487532, "learning_rate": 3.870585270666684e-06, "loss": 2.43305908203125, "step": 1527800 }, { "epoch": 1.8436152058712358, "learning_rate": 3.8701814351989455e-06, "loss": 2.446757507324219, "step": 1527900 }, { "epoch": 1.8437358691937187, "learning_rate": 3.8697775997312075e-06, "loss": 2.453741455078125, "step": 1528000 }, { "epoch": 1.8438565325162013, "learning_rate": 3.869373764263469e-06, "loss": 2.4387757873535154, "step": 1528100 }, { "epoch": 1.8439771958386841, "learning_rate": 3.868969928795731e-06, "loss": 2.4539259338378905, "step": 1528200 }, { "epoch": 1.8440978591611668, "learning_rate": 3.868566093327993e-06, "loss": 2.460515441894531, "step": 1528300 }, { "epoch": 1.8442185224836494, "learning_rate": 3.868162257860254e-06, "loss": 2.4494940185546876, "step": 1528400 }, { "epoch": 1.844339185806132, "learning_rate": 3.867758422392515e-06, "loss": 2.4275425720214843, "step": 1528500 }, { "epoch": 1.8444598491286146, "learning_rate": 3.867354586924777e-06, "loss": 2.422240905761719, "step": 1528600 }, { "epoch": 1.8445805124510974, "learning_rate": 3.866950751457039e-06, "loss": 2.438689880371094, "step": 1528700 }, { "epoch": 1.84470117577358, "learning_rate": 3.866546915989301e-06, "loss": 2.433879699707031, "step": 1528800 }, { "epoch": 1.844821839096063, "learning_rate": 3.866143080521562e-06, "loss": 2.442955322265625, "step": 1528900 }, { "epoch": 1.8449425024185455, "learning_rate": 3.865739245053823e-06, "loss": 2.4349676513671876, "step": 1529000 }, { "epoch": 1.8450631657410281, "learning_rate": 3.865335409586085e-06, "loss": 2.4517823791503908, "step": 1529100 }, { "epoch": 1.8451838290635107, "learning_rate": 3.864931574118347e-06, "loss": 2.425872497558594, "step": 1529200 }, { "epoch": 1.8453044923859934, "learning_rate": 3.864527738650608e-06, "loss": 2.4143937683105468, "step": 1529300 }, { "epoch": 1.8454251557084762, "learning_rate": 3.86412390318287e-06, "loss": 2.411795349121094, "step": 1529400 }, { "epoch": 1.845545819030959, "learning_rate": 3.863720067715131e-06, "loss": 2.4367417907714843, "step": 1529500 }, { "epoch": 1.8456664823534417, "learning_rate": 3.863316232247393e-06, "loss": 2.433227081298828, "step": 1529600 }, { "epoch": 1.8457871456759243, "learning_rate": 3.862912396779655e-06, "loss": 2.4423204040527344, "step": 1529700 }, { "epoch": 1.845907808998407, "learning_rate": 3.862508561311916e-06, "loss": 2.4214511108398438, "step": 1529800 }, { "epoch": 1.8460284723208895, "learning_rate": 3.8621047258441775e-06, "loss": 2.4250160217285157, "step": 1529900 }, { "epoch": 1.8461491356433724, "learning_rate": 3.8617008903764395e-06, "loss": 2.4355250549316407, "step": 1530000 }, { "epoch": 1.846269798965855, "learning_rate": 3.8612970549087015e-06, "loss": 2.4337890625, "step": 1530100 }, { "epoch": 1.8463904622883378, "learning_rate": 3.860893219440963e-06, "loss": 2.395427398681641, "step": 1530200 }, { "epoch": 1.8465111256108204, "learning_rate": 3.860489383973225e-06, "loss": 2.4467929077148436, "step": 1530300 }, { "epoch": 1.846631788933303, "learning_rate": 3.860085548505486e-06, "loss": 2.4502003479003904, "step": 1530400 }, { "epoch": 1.8467524522557857, "learning_rate": 3.859681713037748e-06, "loss": 2.4399615478515626, "step": 1530500 }, { "epoch": 1.8468731155782683, "learning_rate": 3.859277877570009e-06, "loss": 2.443051452636719, "step": 1530600 }, { "epoch": 1.8469937789007511, "learning_rate": 3.858874042102271e-06, "loss": 2.4341886901855467, "step": 1530700 }, { "epoch": 1.8471144422232337, "learning_rate": 3.858470206634533e-06, "loss": 2.433516845703125, "step": 1530800 }, { "epoch": 1.8472351055457166, "learning_rate": 3.858066371166794e-06, "loss": 2.4293563842773436, "step": 1530900 }, { "epoch": 1.8473557688681992, "learning_rate": 3.857662535699055e-06, "loss": 2.4233279418945313, "step": 1531000 }, { "epoch": 1.8474764321906818, "learning_rate": 3.857258700231317e-06, "loss": 2.450816345214844, "step": 1531100 }, { "epoch": 1.8475970955131644, "learning_rate": 3.856854864763579e-06, "loss": 2.4464646911621095, "step": 1531200 }, { "epoch": 1.847717758835647, "learning_rate": 3.856451029295841e-06, "loss": 2.449837341308594, "step": 1531300 }, { "epoch": 1.8478384221581299, "learning_rate": 3.856047193828102e-06, "loss": 2.4392755126953123, "step": 1531400 }, { "epoch": 1.8479590854806127, "learning_rate": 3.855643358360363e-06, "loss": 2.4488481140136718, "step": 1531500 }, { "epoch": 1.8480797488030953, "learning_rate": 3.855239522892625e-06, "loss": 2.4446311950683595, "step": 1531600 }, { "epoch": 1.848200412125578, "learning_rate": 3.854835687424887e-06, "loss": 2.445486297607422, "step": 1531700 }, { "epoch": 1.8483210754480606, "learning_rate": 3.854431851957148e-06, "loss": 2.4385520935058596, "step": 1531800 }, { "epoch": 1.8484417387705432, "learning_rate": 3.85402801648941e-06, "loss": 2.415585784912109, "step": 1531900 }, { "epoch": 1.848562402093026, "learning_rate": 3.8536241810216715e-06, "loss": 2.407978820800781, "step": 1532000 }, { "epoch": 1.8486830654155086, "learning_rate": 3.8532203455539335e-06, "loss": 2.4791651916503907, "step": 1532100 }, { "epoch": 1.8488037287379915, "learning_rate": 3.852816510086195e-06, "loss": 2.434897918701172, "step": 1532200 }, { "epoch": 1.848924392060474, "learning_rate": 3.852412674618457e-06, "loss": 2.4470733642578124, "step": 1532300 }, { "epoch": 1.8490450553829567, "learning_rate": 3.852008839150719e-06, "loss": 2.4445176696777344, "step": 1532400 }, { "epoch": 1.8491657187054393, "learning_rate": 3.85160500368298e-06, "loss": 2.4111807250976565, "step": 1532500 }, { "epoch": 1.849286382027922, "learning_rate": 3.851201168215241e-06, "loss": 2.4393743896484374, "step": 1532600 }, { "epoch": 1.8494070453504048, "learning_rate": 3.850797332747503e-06, "loss": 2.446663055419922, "step": 1532700 }, { "epoch": 1.8495277086728876, "learning_rate": 3.850393497279765e-06, "loss": 2.4288665771484377, "step": 1532800 }, { "epoch": 1.8496483719953702, "learning_rate": 3.849989661812026e-06, "loss": 2.4741468811035157, "step": 1532900 }, { "epoch": 1.8497690353178529, "learning_rate": 3.849585826344288e-06, "loss": 2.449058837890625, "step": 1533000 }, { "epoch": 1.8498896986403355, "learning_rate": 3.849181990876549e-06, "loss": 2.439684295654297, "step": 1533100 }, { "epoch": 1.850010361962818, "learning_rate": 3.848778155408811e-06, "loss": 2.4382150268554685, "step": 1533200 }, { "epoch": 1.850131025285301, "learning_rate": 3.848374319941073e-06, "loss": 2.4523927307128908, "step": 1533300 }, { "epoch": 1.8502516886077836, "learning_rate": 3.847970484473334e-06, "loss": 2.4375352478027343, "step": 1533400 }, { "epoch": 1.8503723519302664, "learning_rate": 3.847566649005595e-06, "loss": 2.4316917419433595, "step": 1533500 }, { "epoch": 1.850493015252749, "learning_rate": 3.847162813537857e-06, "loss": 2.448325347900391, "step": 1533600 }, { "epoch": 1.8506136785752316, "learning_rate": 3.846758978070119e-06, "loss": 2.42744384765625, "step": 1533700 }, { "epoch": 1.8507343418977142, "learning_rate": 3.8463551426023804e-06, "loss": 2.416489562988281, "step": 1533800 }, { "epoch": 1.8508550052201969, "learning_rate": 3.8459513071346424e-06, "loss": 2.4360618591308594, "step": 1533900 }, { "epoch": 1.8509756685426797, "learning_rate": 3.8455474716669036e-06, "loss": 2.433793182373047, "step": 1534000 }, { "epoch": 1.8510963318651623, "learning_rate": 3.8451436361991655e-06, "loss": 2.4101222229003905, "step": 1534100 }, { "epoch": 1.8512169951876452, "learning_rate": 3.8447398007314275e-06, "loss": 2.437945556640625, "step": 1534200 }, { "epoch": 1.8513376585101278, "learning_rate": 3.844335965263689e-06, "loss": 2.440096588134766, "step": 1534300 }, { "epoch": 1.8514583218326104, "learning_rate": 3.843932129795951e-06, "loss": 2.4385697937011717, "step": 1534400 }, { "epoch": 1.851578985155093, "learning_rate": 3.843528294328212e-06, "loss": 2.4238841247558596, "step": 1534500 }, { "epoch": 1.8516996484775756, "learning_rate": 3.843124458860474e-06, "loss": 2.4273951721191405, "step": 1534600 }, { "epoch": 1.8518203118000585, "learning_rate": 3.842720623392735e-06, "loss": 2.445664520263672, "step": 1534700 }, { "epoch": 1.8519409751225413, "learning_rate": 3.842316787924997e-06, "loss": 2.434568328857422, "step": 1534800 }, { "epoch": 1.852061638445024, "learning_rate": 3.841912952457259e-06, "loss": 2.465584716796875, "step": 1534900 }, { "epoch": 1.8521823017675065, "learning_rate": 3.84150911698952e-06, "loss": 2.4518557739257814, "step": 1535000 }, { "epoch": 1.8523029650899892, "learning_rate": 3.841105281521781e-06, "loss": 2.4441374206542967, "step": 1535100 }, { "epoch": 1.8524236284124718, "learning_rate": 3.840701446054043e-06, "loss": 2.422535705566406, "step": 1535200 }, { "epoch": 1.8525442917349546, "learning_rate": 3.840297610586305e-06, "loss": 2.440246124267578, "step": 1535300 }, { "epoch": 1.8526649550574372, "learning_rate": 3.839893775118566e-06, "loss": 2.424080352783203, "step": 1535400 }, { "epoch": 1.85278561837992, "learning_rate": 3.839489939650828e-06, "loss": 2.41131103515625, "step": 1535500 }, { "epoch": 1.8529062817024027, "learning_rate": 3.839086104183089e-06, "loss": 2.4357456970214844, "step": 1535600 }, { "epoch": 1.8530269450248853, "learning_rate": 3.838682268715351e-06, "loss": 2.4230564880371093, "step": 1535700 }, { "epoch": 1.853147608347368, "learning_rate": 3.838278433247613e-06, "loss": 2.4194383239746093, "step": 1535800 }, { "epoch": 1.8532682716698505, "learning_rate": 3.8378745977798745e-06, "loss": 2.4132379150390624, "step": 1535900 }, { "epoch": 1.8533889349923334, "learning_rate": 3.837470762312136e-06, "loss": 2.4179086303710937, "step": 1536000 }, { "epoch": 1.853509598314816, "learning_rate": 3.8370669268443976e-06, "loss": 2.423214111328125, "step": 1536100 }, { "epoch": 1.8536302616372988, "learning_rate": 3.8366630913766596e-06, "loss": 2.407090301513672, "step": 1536200 }, { "epoch": 1.8537509249597814, "learning_rate": 3.836259255908921e-06, "loss": 2.4330677795410156, "step": 1536300 }, { "epoch": 1.853871588282264, "learning_rate": 3.835855420441183e-06, "loss": 2.4128387451171873, "step": 1536400 }, { "epoch": 1.8539922516047467, "learning_rate": 3.835451584973444e-06, "loss": 2.4136085510253906, "step": 1536500 }, { "epoch": 1.8541129149272293, "learning_rate": 3.835047749505706e-06, "loss": 2.433245086669922, "step": 1536600 }, { "epoch": 1.8542335782497121, "learning_rate": 3.834643914037967e-06, "loss": 2.4649778747558595, "step": 1536700 }, { "epoch": 1.854354241572195, "learning_rate": 3.834240078570229e-06, "loss": 2.4465263366699217, "step": 1536800 }, { "epoch": 1.8544749048946776, "learning_rate": 3.833836243102491e-06, "loss": 2.411287536621094, "step": 1536900 }, { "epoch": 1.8545955682171602, "learning_rate": 3.833432407634752e-06, "loss": 2.4622203063964845, "step": 1537000 }, { "epoch": 1.8547162315396428, "learning_rate": 3.833028572167013e-06, "loss": 2.43156494140625, "step": 1537100 }, { "epoch": 1.8548368948621254, "learning_rate": 3.832624736699275e-06, "loss": 2.4224180603027343, "step": 1537200 }, { "epoch": 1.8549575581846083, "learning_rate": 3.832220901231537e-06, "loss": 2.428621368408203, "step": 1537300 }, { "epoch": 1.855078221507091, "learning_rate": 3.831817065763799e-06, "loss": 2.433116912841797, "step": 1537400 }, { "epoch": 1.8551988848295737, "learning_rate": 3.83141323029606e-06, "loss": 2.435688934326172, "step": 1537500 }, { "epoch": 1.8553195481520564, "learning_rate": 3.831009394828321e-06, "loss": 2.449479522705078, "step": 1537600 }, { "epoch": 1.855440211474539, "learning_rate": 3.830605559360583e-06, "loss": 2.4403662109375, "step": 1537700 }, { "epoch": 1.8555608747970216, "learning_rate": 3.830201723892845e-06, "loss": 2.4663819885253906, "step": 1537800 }, { "epoch": 1.8556815381195042, "learning_rate": 3.8297978884251065e-06, "loss": 2.4324407958984375, "step": 1537900 }, { "epoch": 1.855802201441987, "learning_rate": 3.8293940529573685e-06, "loss": 2.439719543457031, "step": 1538000 }, { "epoch": 1.8559228647644699, "learning_rate": 3.82899021748963e-06, "loss": 2.4348634338378905, "step": 1538100 }, { "epoch": 1.8560435280869525, "learning_rate": 3.828586382021892e-06, "loss": 2.437733154296875, "step": 1538200 }, { "epoch": 1.8561641914094351, "learning_rate": 3.828182546554153e-06, "loss": 2.4321116638183593, "step": 1538300 }, { "epoch": 1.8562848547319177, "learning_rate": 3.827778711086415e-06, "loss": 2.4485594177246095, "step": 1538400 }, { "epoch": 1.8564055180544003, "learning_rate": 3.827374875618677e-06, "loss": 2.4230528259277344, "step": 1538500 }, { "epoch": 1.8565261813768832, "learning_rate": 3.826971040150938e-06, "loss": 2.4325210571289064, "step": 1538600 }, { "epoch": 1.8566468446993658, "learning_rate": 3.826567204683199e-06, "loss": 2.432833557128906, "step": 1538700 }, { "epoch": 1.8567675080218486, "learning_rate": 3.826163369215461e-06, "loss": 2.4347990417480467, "step": 1538800 }, { "epoch": 1.8568881713443313, "learning_rate": 3.825759533747723e-06, "loss": 2.4265504455566407, "step": 1538900 }, { "epoch": 1.8570088346668139, "learning_rate": 3.825355698279984e-06, "loss": 2.427485046386719, "step": 1539000 }, { "epoch": 1.8571294979892965, "learning_rate": 3.824951862812246e-06, "loss": 2.4438655090332033, "step": 1539100 }, { "epoch": 1.8572501613117791, "learning_rate": 3.824548027344507e-06, "loss": 2.4398649597167967, "step": 1539200 }, { "epoch": 1.857370824634262, "learning_rate": 3.824144191876769e-06, "loss": 2.4294268798828127, "step": 1539300 }, { "epoch": 1.8574914879567446, "learning_rate": 3.823740356409031e-06, "loss": 2.4096937561035157, "step": 1539400 }, { "epoch": 1.8576121512792274, "learning_rate": 3.823336520941292e-06, "loss": 2.445700988769531, "step": 1539500 }, { "epoch": 1.85773281460171, "learning_rate": 3.822932685473553e-06, "loss": 2.4509342956542968, "step": 1539600 }, { "epoch": 1.8578534779241926, "learning_rate": 3.822528850005815e-06, "loss": 2.4344020080566406, "step": 1539700 }, { "epoch": 1.8579741412466753, "learning_rate": 3.822125014538077e-06, "loss": 2.414659881591797, "step": 1539800 }, { "epoch": 1.8580948045691579, "learning_rate": 3.821721179070339e-06, "loss": 2.4511769104003904, "step": 1539900 }, { "epoch": 1.8582154678916407, "learning_rate": 3.8213173436026005e-06, "loss": 2.435956573486328, "step": 1540000 }, { "epoch": 1.8583361312141236, "learning_rate": 3.820913508134862e-06, "loss": 2.4594677734375, "step": 1540100 }, { "epoch": 1.8584567945366062, "learning_rate": 3.820509672667124e-06, "loss": 2.4311769104003904, "step": 1540200 }, { "epoch": 1.8585774578590888, "learning_rate": 3.820105837199386e-06, "loss": 2.43041259765625, "step": 1540300 }, { "epoch": 1.8586981211815714, "learning_rate": 3.819702001731647e-06, "loss": 2.419527893066406, "step": 1540400 }, { "epoch": 1.858818784504054, "learning_rate": 3.819298166263909e-06, "loss": 2.4077330017089844, "step": 1540500 }, { "epoch": 1.8589394478265369, "learning_rate": 3.81889433079617e-06, "loss": 2.4416690063476563, "step": 1540600 }, { "epoch": 1.8590601111490195, "learning_rate": 3.818490495328432e-06, "loss": 2.4287315368652345, "step": 1540700 }, { "epoch": 1.8591807744715023, "learning_rate": 3.818086659860693e-06, "loss": 2.4428411865234376, "step": 1540800 }, { "epoch": 1.859301437793985, "learning_rate": 3.817682824392955e-06, "loss": 2.425250701904297, "step": 1540900 }, { "epoch": 1.8594221011164676, "learning_rate": 3.817278988925217e-06, "loss": 2.4255410766601564, "step": 1541000 }, { "epoch": 1.8595427644389502, "learning_rate": 3.816875153457478e-06, "loss": 2.4016070556640625, "step": 1541100 }, { "epoch": 1.8596634277614328, "learning_rate": 3.816471317989739e-06, "loss": 2.4362728881835936, "step": 1541200 }, { "epoch": 1.8597840910839156, "learning_rate": 3.816067482522001e-06, "loss": 2.4538368225097655, "step": 1541300 }, { "epoch": 1.8599047544063982, "learning_rate": 3.815663647054263e-06, "loss": 2.448605804443359, "step": 1541400 }, { "epoch": 1.860025417728881, "learning_rate": 3.815259811586524e-06, "loss": 2.444321594238281, "step": 1541500 }, { "epoch": 1.8601460810513637, "learning_rate": 3.814855976118786e-06, "loss": 2.415608673095703, "step": 1541600 }, { "epoch": 1.8602667443738463, "learning_rate": 3.814452140651048e-06, "loss": 2.4387806701660155, "step": 1541700 }, { "epoch": 1.860387407696329, "learning_rate": 3.8140483051833094e-06, "loss": 2.43407958984375, "step": 1541800 }, { "epoch": 1.8605080710188115, "learning_rate": 3.813644469715571e-06, "loss": 2.4451969909667968, "step": 1541900 }, { "epoch": 1.8606287343412944, "learning_rate": 3.8132406342478325e-06, "loss": 2.4316439819335938, "step": 1542000 }, { "epoch": 1.8607493976637772, "learning_rate": 3.812836798780094e-06, "loss": 2.440926208496094, "step": 1542100 }, { "epoch": 1.8608700609862598, "learning_rate": 3.8124329633123556e-06, "loss": 2.434532470703125, "step": 1542200 }, { "epoch": 1.8609907243087425, "learning_rate": 3.8120291278446176e-06, "loss": 2.44413330078125, "step": 1542300 }, { "epoch": 1.861111387631225, "learning_rate": 3.8116252923768787e-06, "loss": 2.442521820068359, "step": 1542400 }, { "epoch": 1.8612320509537077, "learning_rate": 3.8112214569091403e-06, "loss": 2.4295240783691407, "step": 1542500 }, { "epoch": 1.8613527142761905, "learning_rate": 3.8108176214414023e-06, "loss": 2.4453485107421873, "step": 1542600 }, { "epoch": 1.8614733775986732, "learning_rate": 3.810413785973664e-06, "loss": 2.455555419921875, "step": 1542700 }, { "epoch": 1.861594040921156, "learning_rate": 3.810009950505925e-06, "loss": 2.4276600646972657, "step": 1542800 }, { "epoch": 1.8617147042436386, "learning_rate": 3.809606115038187e-06, "loss": 2.4208302307128906, "step": 1542900 }, { "epoch": 1.8618353675661212, "learning_rate": 3.8092022795704485e-06, "loss": 2.4313417053222657, "step": 1543000 }, { "epoch": 1.8619560308886038, "learning_rate": 3.8087984441027105e-06, "loss": 2.433102874755859, "step": 1543100 }, { "epoch": 1.8620766942110865, "learning_rate": 3.8083946086349716e-06, "loss": 2.4556961059570312, "step": 1543200 }, { "epoch": 1.8621973575335693, "learning_rate": 3.807990773167233e-06, "loss": 2.430826416015625, "step": 1543300 }, { "epoch": 1.8623180208560521, "learning_rate": 3.807586937699495e-06, "loss": 2.424002838134766, "step": 1543400 }, { "epoch": 1.8624386841785348, "learning_rate": 3.8071831022317567e-06, "loss": 2.391703338623047, "step": 1543500 }, { "epoch": 1.8625593475010174, "learning_rate": 3.806779266764018e-06, "loss": 2.4129981994628906, "step": 1543600 }, { "epoch": 1.8626800108235, "learning_rate": 3.80637543129628e-06, "loss": 2.422019805908203, "step": 1543700 }, { "epoch": 1.8628006741459826, "learning_rate": 3.8059715958285414e-06, "loss": 2.4646145629882814, "step": 1543800 }, { "epoch": 1.8629213374684654, "learning_rate": 3.8055677603608034e-06, "loss": 2.4361920166015625, "step": 1543900 }, { "epoch": 1.863042000790948, "learning_rate": 3.8051639248930645e-06, "loss": 2.415410461425781, "step": 1544000 }, { "epoch": 1.863162664113431, "learning_rate": 3.804760089425326e-06, "loss": 2.442923889160156, "step": 1544100 }, { "epoch": 1.8632833274359135, "learning_rate": 3.804356253957588e-06, "loss": 2.4032984924316407, "step": 1544200 }, { "epoch": 1.8634039907583961, "learning_rate": 3.8039524184898496e-06, "loss": 2.4279776000976563, "step": 1544300 }, { "epoch": 1.8635246540808788, "learning_rate": 3.803548583022111e-06, "loss": 2.4292620849609374, "step": 1544400 }, { "epoch": 1.8636453174033614, "learning_rate": 3.8031447475543728e-06, "loss": 2.421059265136719, "step": 1544500 }, { "epoch": 1.8637659807258442, "learning_rate": 3.8027409120866343e-06, "loss": 2.408119812011719, "step": 1544600 }, { "epoch": 1.8638866440483268, "learning_rate": 3.802337076618896e-06, "loss": 2.428621368408203, "step": 1544700 }, { "epoch": 1.8640073073708097, "learning_rate": 3.801933241151158e-06, "loss": 2.414642028808594, "step": 1544800 }, { "epoch": 1.8641279706932923, "learning_rate": 3.801529405683419e-06, "loss": 2.4261123657226564, "step": 1544900 }, { "epoch": 1.864248634015775, "learning_rate": 3.8011255702156806e-06, "loss": 2.42587890625, "step": 1545000 }, { "epoch": 1.8643692973382575, "learning_rate": 3.8007217347479425e-06, "loss": 2.4347355651855467, "step": 1545100 }, { "epoch": 1.8644899606607401, "learning_rate": 3.800317899280204e-06, "loss": 2.418356475830078, "step": 1545200 }, { "epoch": 1.864610623983223, "learning_rate": 3.7999140638124652e-06, "loss": 2.4565005493164063, "step": 1545300 }, { "epoch": 1.8647312873057058, "learning_rate": 3.799510228344727e-06, "loss": 2.440034942626953, "step": 1545400 }, { "epoch": 1.8648519506281884, "learning_rate": 3.7991063928769888e-06, "loss": 2.4500006103515624, "step": 1545500 }, { "epoch": 1.864972613950671, "learning_rate": 3.7987025574092508e-06, "loss": 2.4277748107910155, "step": 1545600 }, { "epoch": 1.8650932772731537, "learning_rate": 3.798298721941512e-06, "loss": 2.441896667480469, "step": 1545700 }, { "epoch": 1.8652139405956363, "learning_rate": 3.7978948864737734e-06, "loss": 2.423558654785156, "step": 1545800 }, { "epoch": 1.8653346039181191, "learning_rate": 3.7974910510060354e-06, "loss": 2.462665252685547, "step": 1545900 }, { "epoch": 1.8654552672406017, "learning_rate": 3.797087215538297e-06, "loss": 2.427304382324219, "step": 1546000 }, { "epoch": 1.8655759305630846, "learning_rate": 3.796683380070558e-06, "loss": 2.4372886657714843, "step": 1546100 }, { "epoch": 1.8656965938855672, "learning_rate": 3.79627954460282e-06, "loss": 2.4091600036621093, "step": 1546200 }, { "epoch": 1.8658172572080498, "learning_rate": 3.7958757091350817e-06, "loss": 2.418689422607422, "step": 1546300 }, { "epoch": 1.8659379205305324, "learning_rate": 3.7954718736673436e-06, "loss": 2.4165403747558596, "step": 1546400 }, { "epoch": 1.866058583853015, "learning_rate": 3.7950680381996048e-06, "loss": 2.425578918457031, "step": 1546500 }, { "epoch": 1.8661792471754979, "learning_rate": 3.7946642027318663e-06, "loss": 2.4326771545410155, "step": 1546600 }, { "epoch": 1.8662999104979805, "learning_rate": 3.7942603672641283e-06, "loss": 2.409088134765625, "step": 1546700 }, { "epoch": 1.8664205738204633, "learning_rate": 3.79385653179639e-06, "loss": 2.415463104248047, "step": 1546800 }, { "epoch": 1.866541237142946, "learning_rate": 3.793452696328651e-06, "loss": 2.442599639892578, "step": 1546900 }, { "epoch": 1.8666619004654286, "learning_rate": 3.793048860860913e-06, "loss": 2.4232691955566406, "step": 1547000 }, { "epoch": 1.8667825637879112, "learning_rate": 3.7926450253931746e-06, "loss": 2.437453308105469, "step": 1547100 }, { "epoch": 1.8669032271103938, "learning_rate": 3.792241189925436e-06, "loss": 2.4517861938476564, "step": 1547200 }, { "epoch": 1.8670238904328766, "learning_rate": 3.7918373544576977e-06, "loss": 2.410336761474609, "step": 1547300 }, { "epoch": 1.8671445537553595, "learning_rate": 3.7914335189899592e-06, "loss": 2.4301332092285155, "step": 1547400 }, { "epoch": 1.867265217077842, "learning_rate": 3.791029683522221e-06, "loss": 2.4326821899414064, "step": 1547500 }, { "epoch": 1.8673858804003247, "learning_rate": 3.7906258480544828e-06, "loss": 2.4067156982421873, "step": 1547600 }, { "epoch": 1.8675065437228073, "learning_rate": 3.790222012586744e-06, "loss": 2.4319566345214843, "step": 1547700 }, { "epoch": 1.86762720704529, "learning_rate": 3.7898181771190055e-06, "loss": 2.4530101013183594, "step": 1547800 }, { "epoch": 1.8677478703677728, "learning_rate": 3.7894143416512675e-06, "loss": 2.443653564453125, "step": 1547900 }, { "epoch": 1.8678685336902554, "learning_rate": 3.789010506183529e-06, "loss": 2.4544223022460936, "step": 1548000 }, { "epoch": 1.8679891970127382, "learning_rate": 3.78860667071579e-06, "loss": 2.4382035827636717, "step": 1548100 }, { "epoch": 1.8681098603352209, "learning_rate": 3.788202835248052e-06, "loss": 2.4253166198730467, "step": 1548200 }, { "epoch": 1.8682305236577035, "learning_rate": 3.7877989997803137e-06, "loss": 2.4301332092285155, "step": 1548300 }, { "epoch": 1.868351186980186, "learning_rate": 3.7873951643125757e-06, "loss": 2.42890380859375, "step": 1548400 }, { "epoch": 1.8684718503026687, "learning_rate": 3.786991328844837e-06, "loss": 2.446513214111328, "step": 1548500 }, { "epoch": 1.8685925136251516, "learning_rate": 3.7865874933770984e-06, "loss": 2.418091583251953, "step": 1548600 }, { "epoch": 1.8687131769476344, "learning_rate": 3.7861836579093603e-06, "loss": 2.4452748107910156, "step": 1548700 }, { "epoch": 1.868833840270117, "learning_rate": 3.785779822441622e-06, "loss": 2.426166534423828, "step": 1548800 }, { "epoch": 1.8689545035925996, "learning_rate": 3.785375986973883e-06, "loss": 2.420709686279297, "step": 1548900 }, { "epoch": 1.8690751669150822, "learning_rate": 3.784972151506145e-06, "loss": 2.4196841430664064, "step": 1549000 }, { "epoch": 1.8691958302375649, "learning_rate": 3.7845683160384066e-06, "loss": 2.4382334899902345, "step": 1549100 }, { "epoch": 1.8693164935600477, "learning_rate": 3.7841644805706686e-06, "loss": 2.4091949462890625, "step": 1549200 }, { "epoch": 1.8694371568825303, "learning_rate": 3.7837606451029297e-06, "loss": 2.4393911743164063, "step": 1549300 }, { "epoch": 1.8695578202050132, "learning_rate": 3.7833568096351913e-06, "loss": 2.425936737060547, "step": 1549400 }, { "epoch": 1.8696784835274958, "learning_rate": 3.7829529741674532e-06, "loss": 2.4277310180664062, "step": 1549500 }, { "epoch": 1.8697991468499784, "learning_rate": 3.782549138699715e-06, "loss": 2.425767059326172, "step": 1549600 }, { "epoch": 1.869919810172461, "learning_rate": 3.7821453032319768e-06, "loss": 2.4371574401855467, "step": 1549700 }, { "epoch": 1.8700404734949436, "learning_rate": 3.781741467764238e-06, "loss": 2.4224652099609374, "step": 1549800 }, { "epoch": 1.8701611368174265, "learning_rate": 3.7813376322964995e-06, "loss": 2.418629608154297, "step": 1549900 }, { "epoch": 1.870281800139909, "learning_rate": 3.7809337968287615e-06, "loss": 2.453372802734375, "step": 1550000 }, { "epoch": 1.870402463462392, "learning_rate": 3.780529961361023e-06, "loss": 2.4275770568847657, "step": 1550100 }, { "epoch": 1.8705231267848745, "learning_rate": 3.780126125893284e-06, "loss": 2.4384429931640623, "step": 1550200 }, { "epoch": 1.8706437901073572, "learning_rate": 3.779722290425546e-06, "loss": 2.417184143066406, "step": 1550300 }, { "epoch": 1.8707644534298398, "learning_rate": 3.7793184549578077e-06, "loss": 2.4344207763671877, "step": 1550400 }, { "epoch": 1.8708851167523224, "learning_rate": 3.7789146194900693e-06, "loss": 2.450997772216797, "step": 1550500 }, { "epoch": 1.8710057800748052, "learning_rate": 3.778510784022331e-06, "loss": 2.448580017089844, "step": 1550600 }, { "epoch": 1.871126443397288, "learning_rate": 3.7781069485545924e-06, "loss": 2.4278533935546873, "step": 1550700 }, { "epoch": 1.8712471067197707, "learning_rate": 3.777703113086854e-06, "loss": 2.4341993713378907, "step": 1550800 }, { "epoch": 1.8713677700422533, "learning_rate": 3.777299277619116e-06, "loss": 2.433064727783203, "step": 1550900 }, { "epoch": 1.871488433364736, "learning_rate": 3.776895442151377e-06, "loss": 2.4439073181152344, "step": 1551000 }, { "epoch": 1.8716090966872185, "learning_rate": 3.7764916066836386e-06, "loss": 2.4058355712890624, "step": 1551100 }, { "epoch": 1.8717297600097014, "learning_rate": 3.7760877712159006e-06, "loss": 2.441944122314453, "step": 1551200 }, { "epoch": 1.871850423332184, "learning_rate": 3.775683935748162e-06, "loss": 2.410032196044922, "step": 1551300 }, { "epoch": 1.8719710866546668, "learning_rate": 3.7752801002804233e-06, "loss": 2.4230778503417967, "step": 1551400 }, { "epoch": 1.8720917499771494, "learning_rate": 3.7748762648126853e-06, "loss": 2.4226324462890627, "step": 1551500 }, { "epoch": 1.872212413299632, "learning_rate": 3.774472429344947e-06, "loss": 2.4253106689453126, "step": 1551600 }, { "epoch": 1.8723330766221147, "learning_rate": 3.774068593877209e-06, "loss": 2.450467529296875, "step": 1551700 }, { "epoch": 1.8724537399445973, "learning_rate": 3.77366475840947e-06, "loss": 2.4235055541992185, "step": 1551800 }, { "epoch": 1.8725744032670801, "learning_rate": 3.7732609229417315e-06, "loss": 2.4506488037109375, "step": 1551900 }, { "epoch": 1.8726950665895628, "learning_rate": 3.7728570874739935e-06, "loss": 2.4316146850585936, "step": 1552000 }, { "epoch": 1.8728157299120456, "learning_rate": 3.772453252006255e-06, "loss": 2.441747741699219, "step": 1552100 }, { "epoch": 1.8729363932345282, "learning_rate": 3.772049416538516e-06, "loss": 2.4307086181640627, "step": 1552200 }, { "epoch": 1.8730570565570108, "learning_rate": 3.771645581070778e-06, "loss": 2.444449920654297, "step": 1552300 }, { "epoch": 1.8731777198794934, "learning_rate": 3.7712417456030397e-06, "loss": 2.4407373046875, "step": 1552400 }, { "epoch": 1.873298383201976, "learning_rate": 3.7708379101353017e-06, "loss": 2.410560760498047, "step": 1552500 }, { "epoch": 1.873419046524459, "learning_rate": 3.770434074667563e-06, "loss": 2.4233416748046874, "step": 1552600 }, { "epoch": 1.8735397098469417, "learning_rate": 3.7700302391998244e-06, "loss": 2.425584259033203, "step": 1552700 }, { "epoch": 1.8736603731694244, "learning_rate": 3.7696264037320864e-06, "loss": 2.438157958984375, "step": 1552800 }, { "epoch": 1.873781036491907, "learning_rate": 3.769222568264348e-06, "loss": 2.431878662109375, "step": 1552900 }, { "epoch": 1.8739016998143896, "learning_rate": 3.768818732796609e-06, "loss": 2.453172454833984, "step": 1553000 }, { "epoch": 1.8740223631368722, "learning_rate": 3.768414897328871e-06, "loss": 2.425126953125, "step": 1553100 }, { "epoch": 1.874143026459355, "learning_rate": 3.7680110618611326e-06, "loss": 2.430608367919922, "step": 1553200 }, { "epoch": 1.8742636897818377, "learning_rate": 3.767607226393394e-06, "loss": 2.413636016845703, "step": 1553300 }, { "epoch": 1.8743843531043205, "learning_rate": 3.7672033909256557e-06, "loss": 2.4343472290039063, "step": 1553400 }, { "epoch": 1.8745050164268031, "learning_rate": 3.7667995554579173e-06, "loss": 2.4427311706542967, "step": 1553500 }, { "epoch": 1.8746256797492857, "learning_rate": 3.766395719990179e-06, "loss": 2.415516357421875, "step": 1553600 }, { "epoch": 1.8747463430717684, "learning_rate": 3.765991884522441e-06, "loss": 2.431519775390625, "step": 1553700 }, { "epoch": 1.874867006394251, "learning_rate": 3.765588049054702e-06, "loss": 2.4043743896484373, "step": 1553800 }, { "epoch": 1.8749876697167338, "learning_rate": 3.7651842135869635e-06, "loss": 2.424771423339844, "step": 1553900 }, { "epoch": 1.8751083330392166, "learning_rate": 3.7647803781192255e-06, "loss": 2.4331297302246093, "step": 1554000 }, { "epoch": 1.8752289963616993, "learning_rate": 3.764376542651487e-06, "loss": 2.4241961669921874, "step": 1554100 }, { "epoch": 1.8753496596841819, "learning_rate": 3.763972707183748e-06, "loss": 2.4267338562011718, "step": 1554200 }, { "epoch": 1.8754703230066645, "learning_rate": 3.76356887171601e-06, "loss": 2.4330400085449218, "step": 1554300 }, { "epoch": 1.8755909863291471, "learning_rate": 3.7631650362482717e-06, "loss": 2.437216339111328, "step": 1554400 }, { "epoch": 1.87571164965163, "learning_rate": 3.7627612007805337e-06, "loss": 2.4318540954589842, "step": 1554500 }, { "epoch": 1.8758323129741126, "learning_rate": 3.7623573653127953e-06, "loss": 2.3948455810546876, "step": 1554600 }, { "epoch": 1.8759529762965954, "learning_rate": 3.7619535298450564e-06, "loss": 2.4308384704589843, "step": 1554700 }, { "epoch": 1.876073639619078, "learning_rate": 3.7615496943773184e-06, "loss": 2.4128376770019533, "step": 1554800 }, { "epoch": 1.8761943029415606, "learning_rate": 3.76114585890958e-06, "loss": 2.452573089599609, "step": 1554900 }, { "epoch": 1.8763149662640433, "learning_rate": 3.760742023441842e-06, "loss": 2.434567108154297, "step": 1555000 }, { "epoch": 1.8764356295865259, "learning_rate": 3.760338187974103e-06, "loss": 2.443358154296875, "step": 1555100 }, { "epoch": 1.8765562929090087, "learning_rate": 3.7599343525063646e-06, "loss": 2.4372213745117186, "step": 1555200 }, { "epoch": 1.8766769562314913, "learning_rate": 3.7595305170386266e-06, "loss": 2.4215689086914063, "step": 1555300 }, { "epoch": 1.8767976195539742, "learning_rate": 3.759126681570888e-06, "loss": 2.4384951782226563, "step": 1555400 }, { "epoch": 1.8769182828764568, "learning_rate": 3.7587228461031493e-06, "loss": 2.4168487548828126, "step": 1555500 }, { "epoch": 1.8770389461989394, "learning_rate": 3.7583190106354113e-06, "loss": 2.424752502441406, "step": 1555600 }, { "epoch": 1.877159609521422, "learning_rate": 3.757915175167673e-06, "loss": 2.4167776489257813, "step": 1555700 }, { "epoch": 1.8772802728439046, "learning_rate": 3.757511339699935e-06, "loss": 2.413709716796875, "step": 1555800 }, { "epoch": 1.8774009361663875, "learning_rate": 3.757107504232196e-06, "loss": 2.4125717163085936, "step": 1555900 }, { "epoch": 1.8775215994888703, "learning_rate": 3.7567036687644575e-06, "loss": 2.4255216979980467, "step": 1556000 }, { "epoch": 1.877642262811353, "learning_rate": 3.7562998332967195e-06, "loss": 2.423836669921875, "step": 1556100 }, { "epoch": 1.8777629261338356, "learning_rate": 3.755895997828981e-06, "loss": 2.4287738037109374, "step": 1556200 }, { "epoch": 1.8778835894563182, "learning_rate": 3.7554921623612422e-06, "loss": 2.3971511840820314, "step": 1556300 }, { "epoch": 1.8780042527788008, "learning_rate": 3.755088326893504e-06, "loss": 2.403552703857422, "step": 1556400 }, { "epoch": 1.8781249161012836, "learning_rate": 3.7546844914257658e-06, "loss": 2.4150234985351564, "step": 1556500 }, { "epoch": 1.8782455794237662, "learning_rate": 3.7542806559580273e-06, "loss": 2.410536041259766, "step": 1556600 }, { "epoch": 1.878366242746249, "learning_rate": 3.753876820490289e-06, "loss": 2.427120361328125, "step": 1556700 }, { "epoch": 1.8784869060687317, "learning_rate": 3.7534729850225504e-06, "loss": 2.4364144897460935, "step": 1556800 }, { "epoch": 1.8786075693912143, "learning_rate": 3.753069149554812e-06, "loss": 2.4577102661132812, "step": 1556900 }, { "epoch": 1.878728232713697, "learning_rate": 3.752665314087074e-06, "loss": 2.4221795654296874, "step": 1557000 }, { "epoch": 1.8788488960361795, "learning_rate": 3.752261478619335e-06, "loss": 2.389821319580078, "step": 1557100 }, { "epoch": 1.8789695593586624, "learning_rate": 3.7518576431515967e-06, "loss": 2.451032257080078, "step": 1557200 }, { "epoch": 1.879090222681145, "learning_rate": 3.7514538076838587e-06, "loss": 2.474637298583984, "step": 1557300 }, { "epoch": 1.8792108860036278, "learning_rate": 3.75104997221612e-06, "loss": 2.4100798034667967, "step": 1557400 }, { "epoch": 1.8793315493261105, "learning_rate": 3.7506461367483813e-06, "loss": 2.4117852783203126, "step": 1557500 }, { "epoch": 1.879452212648593, "learning_rate": 3.7502423012806433e-06, "loss": 2.4501358032226563, "step": 1557600 }, { "epoch": 1.8795728759710757, "learning_rate": 3.749838465812905e-06, "loss": 2.4257936096191406, "step": 1557700 }, { "epoch": 1.8796935392935583, "learning_rate": 3.749434630345167e-06, "loss": 2.4201507568359375, "step": 1557800 }, { "epoch": 1.8798142026160412, "learning_rate": 3.749030794877428e-06, "loss": 2.425975036621094, "step": 1557900 }, { "epoch": 1.879934865938524, "learning_rate": 3.7486269594096896e-06, "loss": 2.4253814697265623, "step": 1558000 }, { "epoch": 1.8800555292610066, "learning_rate": 3.7482231239419515e-06, "loss": 2.43584228515625, "step": 1558100 }, { "epoch": 1.8801761925834892, "learning_rate": 3.747819288474213e-06, "loss": 2.437994079589844, "step": 1558200 }, { "epoch": 1.8802968559059718, "learning_rate": 3.7474154530064742e-06, "loss": 2.4415827941894532, "step": 1558300 }, { "epoch": 1.8804175192284545, "learning_rate": 3.7470116175387362e-06, "loss": 2.4247764587402343, "step": 1558400 }, { "epoch": 1.8805381825509373, "learning_rate": 3.7466077820709978e-06, "loss": 2.4308039855957033, "step": 1558500 }, { "epoch": 1.88065884587342, "learning_rate": 3.7462039466032598e-06, "loss": 2.426876220703125, "step": 1558600 }, { "epoch": 1.8807795091959028, "learning_rate": 3.745800111135521e-06, "loss": 2.4243751525878907, "step": 1558700 }, { "epoch": 1.8809001725183854, "learning_rate": 3.7453962756677825e-06, "loss": 2.4078070068359376, "step": 1558800 }, { "epoch": 1.881020835840868, "learning_rate": 3.7449924402000444e-06, "loss": 2.454630584716797, "step": 1558900 }, { "epoch": 1.8811414991633506, "learning_rate": 3.744588604732306e-06, "loss": 2.422115936279297, "step": 1559000 }, { "epoch": 1.8812621624858332, "learning_rate": 3.744184769264567e-06, "loss": 2.416592864990234, "step": 1559100 }, { "epoch": 1.881382825808316, "learning_rate": 3.743780933796829e-06, "loss": 2.437705078125, "step": 1559200 }, { "epoch": 1.881503489130799, "learning_rate": 3.7433770983290907e-06, "loss": 2.4580422973632814, "step": 1559300 }, { "epoch": 1.8816241524532815, "learning_rate": 3.7429732628613522e-06, "loss": 2.450306243896484, "step": 1559400 }, { "epoch": 1.8817448157757641, "learning_rate": 3.742569427393614e-06, "loss": 2.435895538330078, "step": 1559500 }, { "epoch": 1.8818654790982468, "learning_rate": 3.7421655919258754e-06, "loss": 2.4332000732421877, "step": 1559600 }, { "epoch": 1.8819861424207294, "learning_rate": 3.741761756458137e-06, "loss": 2.424968566894531, "step": 1559700 }, { "epoch": 1.8821068057432122, "learning_rate": 3.741357920990399e-06, "loss": 2.4195487976074217, "step": 1559800 }, { "epoch": 1.8822274690656948, "learning_rate": 3.7409540855226605e-06, "loss": 2.4091670227050783, "step": 1559900 }, { "epoch": 1.8823481323881777, "learning_rate": 3.7405502500549216e-06, "loss": 2.4093362426757814, "step": 1560000 }, { "epoch": 1.8824687957106603, "learning_rate": 3.7401464145871836e-06, "loss": 2.4105999755859373, "step": 1560100 }, { "epoch": 1.882589459033143, "learning_rate": 3.739742579119445e-06, "loss": 2.438915100097656, "step": 1560200 }, { "epoch": 1.8827101223556255, "learning_rate": 3.739338743651707e-06, "loss": 2.4320858764648436, "step": 1560300 }, { "epoch": 1.8828307856781081, "learning_rate": 3.7389349081839682e-06, "loss": 2.406113586425781, "step": 1560400 }, { "epoch": 1.882951449000591, "learning_rate": 3.73853107271623e-06, "loss": 2.437918243408203, "step": 1560500 }, { "epoch": 1.8830721123230736, "learning_rate": 3.738127237248492e-06, "loss": 2.456574249267578, "step": 1560600 }, { "epoch": 1.8831927756455564, "learning_rate": 3.7377234017807534e-06, "loss": 2.4254212951660157, "step": 1560700 }, { "epoch": 1.883313438968039, "learning_rate": 3.7373195663130145e-06, "loss": 2.42231201171875, "step": 1560800 }, { "epoch": 1.8834341022905217, "learning_rate": 3.7369157308452765e-06, "loss": 2.4165740966796876, "step": 1560900 }, { "epoch": 1.8835547656130043, "learning_rate": 3.736511895377538e-06, "loss": 2.4282830810546874, "step": 1561000 }, { "epoch": 1.883675428935487, "learning_rate": 3.7361080599098e-06, "loss": 2.4218695068359377, "step": 1561100 }, { "epoch": 1.8837960922579697, "learning_rate": 3.735704224442061e-06, "loss": 2.4148008728027346, "step": 1561200 }, { "epoch": 1.8839167555804526, "learning_rate": 3.7353003889743227e-06, "loss": 2.4454986572265627, "step": 1561300 }, { "epoch": 1.8840374189029352, "learning_rate": 3.7348965535065847e-06, "loss": 2.4534123229980467, "step": 1561400 }, { "epoch": 1.8841580822254178, "learning_rate": 3.7344927180388462e-06, "loss": 2.4405914306640626, "step": 1561500 }, { "epoch": 1.8842787455479004, "learning_rate": 3.7340888825711074e-06, "loss": 2.43791748046875, "step": 1561600 }, { "epoch": 1.884399408870383, "learning_rate": 3.7336850471033694e-06, "loss": 2.420409851074219, "step": 1561700 }, { "epoch": 1.8845200721928659, "learning_rate": 3.733281211635631e-06, "loss": 2.4100331115722655, "step": 1561800 }, { "epoch": 1.8846407355153485, "learning_rate": 3.732877376167893e-06, "loss": 2.4422364807128907, "step": 1561900 }, { "epoch": 1.8847613988378313, "learning_rate": 3.732473540700154e-06, "loss": 2.4489450073242187, "step": 1562000 }, { "epoch": 1.884882062160314, "learning_rate": 3.7320697052324156e-06, "loss": 2.3993124389648437, "step": 1562100 }, { "epoch": 1.8850027254827966, "learning_rate": 3.7316658697646776e-06, "loss": 2.404912109375, "step": 1562200 }, { "epoch": 1.8851233888052792, "learning_rate": 3.731262034296939e-06, "loss": 2.4007948303222655, "step": 1562300 }, { "epoch": 1.8852440521277618, "learning_rate": 3.7308581988292003e-06, "loss": 2.4361257934570313, "step": 1562400 }, { "epoch": 1.8853647154502446, "learning_rate": 3.7304543633614623e-06, "loss": 2.402272186279297, "step": 1562500 }, { "epoch": 1.8854853787727273, "learning_rate": 3.730050527893724e-06, "loss": 2.4448477172851564, "step": 1562600 }, { "epoch": 1.88560604209521, "learning_rate": 3.7296466924259854e-06, "loss": 2.409091796875, "step": 1562700 }, { "epoch": 1.8857267054176927, "learning_rate": 3.729242856958247e-06, "loss": 2.400624542236328, "step": 1562800 }, { "epoch": 1.8858473687401753, "learning_rate": 3.7288390214905085e-06, "loss": 2.411277618408203, "step": 1562900 }, { "epoch": 1.885968032062658, "learning_rate": 3.72843518602277e-06, "loss": 2.435188751220703, "step": 1563000 }, { "epoch": 1.8860886953851406, "learning_rate": 3.728031350555032e-06, "loss": 2.4248220825195315, "step": 1563100 }, { "epoch": 1.8862093587076234, "learning_rate": 3.727627515087293e-06, "loss": 2.4325621032714846, "step": 1563200 }, { "epoch": 1.8863300220301062, "learning_rate": 3.7272236796195547e-06, "loss": 2.4134271240234373, "step": 1563300 }, { "epoch": 1.8864506853525889, "learning_rate": 3.7268198441518167e-06, "loss": 2.431482696533203, "step": 1563400 }, { "epoch": 1.8865713486750715, "learning_rate": 3.7264160086840783e-06, "loss": 2.425517883300781, "step": 1563500 }, { "epoch": 1.886692011997554, "learning_rate": 3.7260121732163394e-06, "loss": 2.4033383178710936, "step": 1563600 }, { "epoch": 1.8868126753200367, "learning_rate": 3.7256083377486014e-06, "loss": 2.4297520446777345, "step": 1563700 }, { "epoch": 1.8869333386425196, "learning_rate": 3.725204502280863e-06, "loss": 2.4502745056152344, "step": 1563800 }, { "epoch": 1.8870540019650022, "learning_rate": 3.724800666813125e-06, "loss": 2.415736083984375, "step": 1563900 }, { "epoch": 1.887174665287485, "learning_rate": 3.724396831345386e-06, "loss": 2.4202505493164064, "step": 1564000 }, { "epoch": 1.8872953286099676, "learning_rate": 3.7239929958776476e-06, "loss": 2.4180508422851563, "step": 1564100 }, { "epoch": 1.8874159919324502, "learning_rate": 3.7235891604099096e-06, "loss": 2.3959349060058592, "step": 1564200 }, { "epoch": 1.8875366552549329, "learning_rate": 3.723185324942171e-06, "loss": 2.417259521484375, "step": 1564300 }, { "epoch": 1.8876573185774155, "learning_rate": 3.7227814894744323e-06, "loss": 2.4249505615234375, "step": 1564400 }, { "epoch": 1.8877779818998983, "learning_rate": 3.7223776540066943e-06, "loss": 2.426027984619141, "step": 1564500 }, { "epoch": 1.8878986452223812, "learning_rate": 3.721973818538956e-06, "loss": 2.4430467224121095, "step": 1564600 }, { "epoch": 1.8880193085448638, "learning_rate": 3.721569983071218e-06, "loss": 2.4281846618652345, "step": 1564700 }, { "epoch": 1.8881399718673464, "learning_rate": 3.721166147603479e-06, "loss": 2.4179255676269533, "step": 1564800 }, { "epoch": 1.888260635189829, "learning_rate": 3.7207623121357405e-06, "loss": 2.4398037719726564, "step": 1564900 }, { "epoch": 1.8883812985123116, "learning_rate": 3.7203584766680025e-06, "loss": 2.4080850219726564, "step": 1565000 }, { "epoch": 1.8885019618347945, "learning_rate": 3.719954641200264e-06, "loss": 2.4164476013183593, "step": 1565100 }, { "epoch": 1.888622625157277, "learning_rate": 3.7195508057325256e-06, "loss": 2.4079393005371093, "step": 1565200 }, { "epoch": 1.88874328847976, "learning_rate": 3.719146970264787e-06, "loss": 2.400249481201172, "step": 1565300 }, { "epoch": 1.8888639518022425, "learning_rate": 3.7187431347970487e-06, "loss": 2.4241552734375, "step": 1565400 }, { "epoch": 1.8889846151247252, "learning_rate": 3.7183392993293103e-06, "loss": 2.407884979248047, "step": 1565500 }, { "epoch": 1.8891052784472078, "learning_rate": 3.7179354638615723e-06, "loss": 2.459189453125, "step": 1565600 }, { "epoch": 1.8892259417696904, "learning_rate": 3.7175316283938334e-06, "loss": 2.4132649230957033, "step": 1565700 }, { "epoch": 1.8893466050921732, "learning_rate": 3.717127792926095e-06, "loss": 2.453031463623047, "step": 1565800 }, { "epoch": 1.8894672684146558, "learning_rate": 3.716723957458357e-06, "loss": 2.4391860961914062, "step": 1565900 }, { "epoch": 1.8895879317371387, "learning_rate": 3.7163201219906185e-06, "loss": 2.4242897033691406, "step": 1566000 }, { "epoch": 1.8897085950596213, "learning_rate": 3.7159162865228797e-06, "loss": 2.419852600097656, "step": 1566100 }, { "epoch": 1.889829258382104, "learning_rate": 3.7155124510551416e-06, "loss": 2.4351902770996094, "step": 1566200 }, { "epoch": 1.8899499217045865, "learning_rate": 3.715108615587403e-06, "loss": 2.422099609375, "step": 1566300 }, { "epoch": 1.8900705850270691, "learning_rate": 3.714704780119665e-06, "loss": 2.442519073486328, "step": 1566400 }, { "epoch": 1.890191248349552, "learning_rate": 3.7143009446519263e-06, "loss": 2.4271308898925783, "step": 1566500 }, { "epoch": 1.8903119116720348, "learning_rate": 3.713897109184188e-06, "loss": 2.4295428466796873, "step": 1566600 }, { "epoch": 1.8904325749945174, "learning_rate": 3.71349327371645e-06, "loss": 2.4437506103515627, "step": 1566700 }, { "epoch": 1.890553238317, "learning_rate": 3.7130894382487114e-06, "loss": 2.4198548889160154, "step": 1566800 }, { "epoch": 1.8906739016394827, "learning_rate": 3.7126856027809725e-06, "loss": 2.4493666076660157, "step": 1566900 }, { "epoch": 1.8907945649619653, "learning_rate": 3.7122817673132345e-06, "loss": 2.414295501708984, "step": 1567000 }, { "epoch": 1.8909152282844481, "learning_rate": 3.711877931845496e-06, "loss": 2.4057960510253906, "step": 1567100 }, { "epoch": 1.8910358916069308, "learning_rate": 3.711474096377758e-06, "loss": 2.438407135009766, "step": 1567200 }, { "epoch": 1.8911565549294136, "learning_rate": 3.711070260910019e-06, "loss": 2.3941461181640626, "step": 1567300 }, { "epoch": 1.8912772182518962, "learning_rate": 3.7106664254422808e-06, "loss": 2.39455078125, "step": 1567400 }, { "epoch": 1.8913978815743788, "learning_rate": 3.7102625899745427e-06, "loss": 2.4393763732910156, "step": 1567500 }, { "epoch": 1.8915185448968614, "learning_rate": 3.7098587545068043e-06, "loss": 2.4307321166992186, "step": 1567600 }, { "epoch": 1.891639208219344, "learning_rate": 3.7094549190390654e-06, "loss": 2.4507174682617188, "step": 1567700 }, { "epoch": 1.891759871541827, "learning_rate": 3.7090510835713274e-06, "loss": 2.4650228881835936, "step": 1567800 }, { "epoch": 1.8918805348643095, "learning_rate": 3.708647248103589e-06, "loss": 2.432243194580078, "step": 1567900 }, { "epoch": 1.8920011981867924, "learning_rate": 3.7082434126358505e-06, "loss": 2.446344909667969, "step": 1568000 }, { "epoch": 1.892121861509275, "learning_rate": 3.707839577168112e-06, "loss": 2.423443603515625, "step": 1568100 }, { "epoch": 1.8922425248317576, "learning_rate": 3.7074357417003737e-06, "loss": 2.4584426879882812, "step": 1568200 }, { "epoch": 1.8923631881542402, "learning_rate": 3.7070319062326352e-06, "loss": 2.4230189514160156, "step": 1568300 }, { "epoch": 1.892483851476723, "learning_rate": 3.706628070764897e-06, "loss": 2.4288296508789062, "step": 1568400 }, { "epoch": 1.8926045147992057, "learning_rate": 3.7062242352971583e-06, "loss": 2.4161892700195313, "step": 1568500 }, { "epoch": 1.8927251781216885, "learning_rate": 3.70582039982942e-06, "loss": 2.449143981933594, "step": 1568600 }, { "epoch": 1.8928458414441711, "learning_rate": 3.705416564361682e-06, "loss": 2.4286151123046875, "step": 1568700 }, { "epoch": 1.8929665047666537, "learning_rate": 3.7050127288939434e-06, "loss": 2.436674041748047, "step": 1568800 }, { "epoch": 1.8930871680891364, "learning_rate": 3.7046088934262046e-06, "loss": 2.4053553771972656, "step": 1568900 }, { "epoch": 1.893207831411619, "learning_rate": 3.7042050579584666e-06, "loss": 2.439009094238281, "step": 1569000 }, { "epoch": 1.8933284947341018, "learning_rate": 3.703801222490728e-06, "loss": 2.416606903076172, "step": 1569100 }, { "epoch": 1.8934491580565844, "learning_rate": 3.70339738702299e-06, "loss": 2.436351013183594, "step": 1569200 }, { "epoch": 1.8935698213790673, "learning_rate": 3.7029935515552512e-06, "loss": 2.4099591064453123, "step": 1569300 }, { "epoch": 1.8936904847015499, "learning_rate": 3.702589716087513e-06, "loss": 2.441964111328125, "step": 1569400 }, { "epoch": 1.8938111480240325, "learning_rate": 3.7021858806197748e-06, "loss": 2.426812744140625, "step": 1569500 }, { "epoch": 1.8939318113465151, "learning_rate": 3.7017820451520363e-06, "loss": 2.3962661743164064, "step": 1569600 }, { "epoch": 1.8940524746689977, "learning_rate": 3.7013782096842975e-06, "loss": 2.4379998779296876, "step": 1569700 }, { "epoch": 1.8941731379914806, "learning_rate": 3.7009743742165594e-06, "loss": 2.426189117431641, "step": 1569800 }, { "epoch": 1.8942938013139634, "learning_rate": 3.700570538748821e-06, "loss": 2.428040771484375, "step": 1569900 }, { "epoch": 1.894414464636446, "learning_rate": 3.700166703281083e-06, "loss": 2.4311447143554688, "step": 1570000 }, { "epoch": 1.8945351279589286, "learning_rate": 3.6997628678133445e-06, "loss": 2.4199754333496095, "step": 1570100 }, { "epoch": 1.8946557912814113, "learning_rate": 3.6993590323456057e-06, "loss": 2.4273805236816406, "step": 1570200 }, { "epoch": 1.8947764546038939, "learning_rate": 3.6989551968778677e-06, "loss": 2.4266708374023436, "step": 1570300 }, { "epoch": 1.8948971179263767, "learning_rate": 3.6985513614101292e-06, "loss": 2.4055516052246095, "step": 1570400 }, { "epoch": 1.8950177812488593, "learning_rate": 3.698147525942391e-06, "loss": 2.4175830078125, "step": 1570500 }, { "epoch": 1.8951384445713422, "learning_rate": 3.6977436904746523e-06, "loss": 2.4143589782714843, "step": 1570600 }, { "epoch": 1.8952591078938248, "learning_rate": 3.697339855006914e-06, "loss": 2.4404205322265624, "step": 1570700 }, { "epoch": 1.8953797712163074, "learning_rate": 3.696936019539176e-06, "loss": 2.436672821044922, "step": 1570800 }, { "epoch": 1.89550043453879, "learning_rate": 3.6965321840714374e-06, "loss": 2.4164134216308595, "step": 1570900 }, { "epoch": 1.8956210978612726, "learning_rate": 3.6961283486036986e-06, "loss": 2.4238603210449217, "step": 1571000 }, { "epoch": 1.8957417611837555, "learning_rate": 3.6957245131359606e-06, "loss": 2.4395082092285154, "step": 1571100 }, { "epoch": 1.895862424506238, "learning_rate": 3.695320677668222e-06, "loss": 2.4524774169921875, "step": 1571200 }, { "epoch": 1.895983087828721, "learning_rate": 3.6949168422004837e-06, "loss": 2.4284136962890623, "step": 1571300 }, { "epoch": 1.8961037511512036, "learning_rate": 3.6945130067327452e-06, "loss": 2.40754150390625, "step": 1571400 }, { "epoch": 1.8962244144736862, "learning_rate": 3.694109171265007e-06, "loss": 2.4050306701660156, "step": 1571500 }, { "epoch": 1.8963450777961688, "learning_rate": 3.6937053357972684e-06, "loss": 2.435812683105469, "step": 1571600 }, { "epoch": 1.8964657411186514, "learning_rate": 3.6933015003295303e-06, "loss": 2.4258653259277345, "step": 1571700 }, { "epoch": 1.8965864044411342, "learning_rate": 3.6928976648617915e-06, "loss": 2.4391009521484377, "step": 1571800 }, { "epoch": 1.896707067763617, "learning_rate": 3.692493829394053e-06, "loss": 2.405911407470703, "step": 1571900 }, { "epoch": 1.8968277310860997, "learning_rate": 3.692089993926315e-06, "loss": 2.418018493652344, "step": 1572000 }, { "epoch": 1.8969483944085823, "learning_rate": 3.6916861584585766e-06, "loss": 2.4179452514648436, "step": 1572100 }, { "epoch": 1.897069057731065, "learning_rate": 3.6912823229908377e-06, "loss": 2.4325799560546875, "step": 1572200 }, { "epoch": 1.8971897210535476, "learning_rate": 3.6908784875230997e-06, "loss": 2.408083648681641, "step": 1572300 }, { "epoch": 1.8973103843760304, "learning_rate": 3.6904746520553613e-06, "loss": 2.4161924743652343, "step": 1572400 }, { "epoch": 1.897431047698513, "learning_rate": 3.6900708165876232e-06, "loss": 2.4369967651367186, "step": 1572500 }, { "epoch": 1.8975517110209958, "learning_rate": 3.6896669811198844e-06, "loss": 2.422754364013672, "step": 1572600 }, { "epoch": 1.8976723743434785, "learning_rate": 3.689263145652146e-06, "loss": 2.4111231994628906, "step": 1572700 }, { "epoch": 1.897793037665961, "learning_rate": 3.688859310184408e-06, "loss": 2.4240591430664065, "step": 1572800 }, { "epoch": 1.8979137009884437, "learning_rate": 3.6884554747166695e-06, "loss": 2.4526141357421873, "step": 1572900 }, { "epoch": 1.8980343643109263, "learning_rate": 3.6880516392489306e-06, "loss": 2.4193165588378904, "step": 1573000 }, { "epoch": 1.8981550276334092, "learning_rate": 3.6876478037811926e-06, "loss": 2.414083251953125, "step": 1573100 }, { "epoch": 1.8982756909558918, "learning_rate": 3.687243968313454e-06, "loss": 2.4117660522460938, "step": 1573200 }, { "epoch": 1.8983963542783746, "learning_rate": 3.686840132845716e-06, "loss": 2.421522674560547, "step": 1573300 }, { "epoch": 1.8985170176008572, "learning_rate": 3.6864362973779773e-06, "loss": 2.417006378173828, "step": 1573400 }, { "epoch": 1.8986376809233398, "learning_rate": 3.686032461910239e-06, "loss": 2.442607574462891, "step": 1573500 }, { "epoch": 1.8987583442458225, "learning_rate": 3.685628626442501e-06, "loss": 2.427953796386719, "step": 1573600 }, { "epoch": 1.8988790075683053, "learning_rate": 3.6852247909747624e-06, "loss": 2.419419250488281, "step": 1573700 }, { "epoch": 1.898999670890788, "learning_rate": 3.6848209555070235e-06, "loss": 2.4092201232910155, "step": 1573800 }, { "epoch": 1.8991203342132708, "learning_rate": 3.6844171200392855e-06, "loss": 2.4336318969726562, "step": 1573900 }, { "epoch": 1.8992409975357534, "learning_rate": 3.684013284571547e-06, "loss": 2.4321319580078127, "step": 1574000 }, { "epoch": 1.899361660858236, "learning_rate": 3.6836094491038086e-06, "loss": 2.413782958984375, "step": 1574100 }, { "epoch": 1.8994823241807186, "learning_rate": 3.68320561363607e-06, "loss": 2.424707794189453, "step": 1574200 }, { "epoch": 1.8996029875032012, "learning_rate": 3.6828017781683317e-06, "loss": 2.434251556396484, "step": 1574300 }, { "epoch": 1.899723650825684, "learning_rate": 3.6823979427005933e-06, "loss": 2.423983612060547, "step": 1574400 }, { "epoch": 1.8998443141481667, "learning_rate": 3.6819941072328553e-06, "loss": 2.4284733581542968, "step": 1574500 }, { "epoch": 1.8999649774706495, "learning_rate": 3.6815902717651164e-06, "loss": 2.409667510986328, "step": 1574600 }, { "epoch": 1.9000856407931321, "learning_rate": 3.681186436297378e-06, "loss": 2.427321319580078, "step": 1574700 }, { "epoch": 1.9002063041156148, "learning_rate": 3.68078260082964e-06, "loss": 2.41212158203125, "step": 1574800 }, { "epoch": 1.9003269674380974, "learning_rate": 3.6803787653619015e-06, "loss": 2.4279049682617186, "step": 1574900 }, { "epoch": 1.90044763076058, "learning_rate": 3.6799749298941626e-06, "loss": 2.413191223144531, "step": 1575000 }, { "epoch": 1.9005682940830628, "learning_rate": 3.6795710944264246e-06, "loss": 2.420989685058594, "step": 1575100 }, { "epoch": 1.9006889574055457, "learning_rate": 3.679167258958686e-06, "loss": 2.4183294677734377, "step": 1575200 }, { "epoch": 1.9008096207280283, "learning_rate": 3.678763423490948e-06, "loss": 2.4124400329589846, "step": 1575300 }, { "epoch": 1.900930284050511, "learning_rate": 3.6783595880232097e-06, "loss": 2.4540203857421874, "step": 1575400 }, { "epoch": 1.9010509473729935, "learning_rate": 3.677955752555471e-06, "loss": 2.398612823486328, "step": 1575500 }, { "epoch": 1.9011716106954761, "learning_rate": 3.677551917087733e-06, "loss": 2.4194015502929687, "step": 1575600 }, { "epoch": 1.901292274017959, "learning_rate": 3.6771480816199944e-06, "loss": 2.4315232849121093, "step": 1575700 }, { "epoch": 1.9014129373404416, "learning_rate": 3.6767442461522564e-06, "loss": 2.4037828063964843, "step": 1575800 }, { "epoch": 1.9015336006629244, "learning_rate": 3.6763404106845175e-06, "loss": 2.4515728759765625, "step": 1575900 }, { "epoch": 1.901654263985407, "learning_rate": 3.675936575216779e-06, "loss": 2.4215884399414063, "step": 1576000 }, { "epoch": 1.9017749273078897, "learning_rate": 3.675532739749041e-06, "loss": 2.4087098693847655, "step": 1576100 }, { "epoch": 1.9018955906303723, "learning_rate": 3.6751289042813026e-06, "loss": 2.450660858154297, "step": 1576200 }, { "epoch": 1.902016253952855, "learning_rate": 3.6747250688135637e-06, "loss": 2.428350524902344, "step": 1576300 }, { "epoch": 1.9021369172753377, "learning_rate": 3.6743212333458257e-06, "loss": 2.4199369812011717, "step": 1576400 }, { "epoch": 1.9022575805978204, "learning_rate": 3.6739173978780873e-06, "loss": 2.4350885009765624, "step": 1576500 }, { "epoch": 1.9023782439203032, "learning_rate": 3.6735135624103493e-06, "loss": 2.4012078857421875, "step": 1576600 }, { "epoch": 1.9024989072427858, "learning_rate": 3.6731097269426104e-06, "loss": 2.4052882385253906, "step": 1576700 }, { "epoch": 1.9026195705652684, "learning_rate": 3.672705891474872e-06, "loss": 2.414615478515625, "step": 1576800 }, { "epoch": 1.902740233887751, "learning_rate": 3.672302056007134e-06, "loss": 2.4241656494140624, "step": 1576900 }, { "epoch": 1.9028608972102337, "learning_rate": 3.6718982205393955e-06, "loss": 2.4204646301269532, "step": 1577000 }, { "epoch": 1.9029815605327165, "learning_rate": 3.6714943850716566e-06, "loss": 2.405528564453125, "step": 1577100 }, { "epoch": 1.9031022238551993, "learning_rate": 3.6710905496039186e-06, "loss": 2.4409298706054687, "step": 1577200 }, { "epoch": 1.903222887177682, "learning_rate": 3.67068671413618e-06, "loss": 2.4305833435058593, "step": 1577300 }, { "epoch": 1.9033435505001646, "learning_rate": 3.6702828786684417e-06, "loss": 2.4205421447753905, "step": 1577400 }, { "epoch": 1.9034642138226472, "learning_rate": 3.6698790432007033e-06, "loss": 2.441993865966797, "step": 1577500 }, { "epoch": 1.9035848771451298, "learning_rate": 3.669475207732965e-06, "loss": 2.435485076904297, "step": 1577600 }, { "epoch": 1.9037055404676126, "learning_rate": 3.6690713722652264e-06, "loss": 2.4177476501464845, "step": 1577700 }, { "epoch": 1.9038262037900953, "learning_rate": 3.6686675367974884e-06, "loss": 2.4436772155761717, "step": 1577800 }, { "epoch": 1.903946867112578, "learning_rate": 3.6682637013297495e-06, "loss": 2.4352947998046877, "step": 1577900 }, { "epoch": 1.9040675304350607, "learning_rate": 3.667859865862011e-06, "loss": 2.4409330749511717, "step": 1578000 }, { "epoch": 1.9041881937575433, "learning_rate": 3.667456030394273e-06, "loss": 2.450980224609375, "step": 1578100 }, { "epoch": 1.904308857080026, "learning_rate": 3.6670521949265346e-06, "loss": 2.4048321533203123, "step": 1578200 }, { "epoch": 1.9044295204025086, "learning_rate": 3.6666483594587958e-06, "loss": 2.438008575439453, "step": 1578300 }, { "epoch": 1.9045501837249914, "learning_rate": 3.6662445239910578e-06, "loss": 2.4163548278808595, "step": 1578400 }, { "epoch": 1.904670847047474, "learning_rate": 3.6658406885233193e-06, "loss": 2.448316650390625, "step": 1578500 }, { "epoch": 1.9047915103699569, "learning_rate": 3.6654368530555813e-06, "loss": 2.4309396362304687, "step": 1578600 }, { "epoch": 1.9049121736924395, "learning_rate": 3.6650330175878424e-06, "loss": 2.4356510925292967, "step": 1578700 }, { "epoch": 1.905032837014922, "learning_rate": 3.664629182120104e-06, "loss": 2.4194717407226562, "step": 1578800 }, { "epoch": 1.9051535003374047, "learning_rate": 3.664225346652366e-06, "loss": 2.424374237060547, "step": 1578900 }, { "epoch": 1.9052741636598876, "learning_rate": 3.6638215111846275e-06, "loss": 2.434731292724609, "step": 1579000 }, { "epoch": 1.9053948269823702, "learning_rate": 3.6634176757168887e-06, "loss": 2.4073878479003907, "step": 1579100 }, { "epoch": 1.905515490304853, "learning_rate": 3.6630138402491506e-06, "loss": 2.4331129455566405, "step": 1579200 }, { "epoch": 1.9056361536273356, "learning_rate": 3.662610004781412e-06, "loss": 2.434634552001953, "step": 1579300 }, { "epoch": 1.9057568169498182, "learning_rate": 3.662206169313674e-06, "loss": 2.4207110595703125, "step": 1579400 }, { "epoch": 1.9058774802723009, "learning_rate": 3.6618023338459353e-06, "loss": 2.4272845458984373, "step": 1579500 }, { "epoch": 1.9059981435947835, "learning_rate": 3.661398498378197e-06, "loss": 2.42362548828125, "step": 1579600 }, { "epoch": 1.9061188069172663, "learning_rate": 3.660994662910459e-06, "loss": 2.4457431030273438, "step": 1579700 }, { "epoch": 1.906239470239749, "learning_rate": 3.6605908274427204e-06, "loss": 2.429814758300781, "step": 1579800 }, { "epoch": 1.9063601335622318, "learning_rate": 3.6601869919749816e-06, "loss": 2.4462539672851564, "step": 1579900 }, { "epoch": 1.9064807968847144, "learning_rate": 3.6597831565072435e-06, "loss": 2.422250518798828, "step": 1580000 }, { "epoch": 1.906601460207197, "learning_rate": 3.659379321039505e-06, "loss": 2.417603302001953, "step": 1580100 }, { "epoch": 1.9067221235296796, "learning_rate": 3.6589754855717667e-06, "loss": 2.385449981689453, "step": 1580200 }, { "epoch": 1.9068427868521622, "learning_rate": 3.6585716501040282e-06, "loss": 2.4212648010253908, "step": 1580300 }, { "epoch": 1.906963450174645, "learning_rate": 3.6581678146362898e-06, "loss": 2.4313221740722657, "step": 1580400 }, { "epoch": 1.907084113497128, "learning_rate": 3.6577639791685513e-06, "loss": 2.4174766540527344, "step": 1580500 }, { "epoch": 1.9072047768196105, "learning_rate": 3.6573601437008133e-06, "loss": 2.422402801513672, "step": 1580600 }, { "epoch": 1.9073254401420932, "learning_rate": 3.656956308233075e-06, "loss": 2.4154037475585937, "step": 1580700 }, { "epoch": 1.9074461034645758, "learning_rate": 3.656552472765336e-06, "loss": 2.4214710998535156, "step": 1580800 }, { "epoch": 1.9075667667870584, "learning_rate": 3.656148637297598e-06, "loss": 2.4040205383300783, "step": 1580900 }, { "epoch": 1.9076874301095412, "learning_rate": 3.6557448018298596e-06, "loss": 2.421287078857422, "step": 1581000 }, { "epoch": 1.9078080934320238, "learning_rate": 3.6553409663621215e-06, "loss": 2.4326492309570313, "step": 1581100 }, { "epoch": 1.9079287567545067, "learning_rate": 3.6549371308943827e-06, "loss": 2.4266400146484375, "step": 1581200 }, { "epoch": 1.9080494200769893, "learning_rate": 3.6545332954266442e-06, "loss": 2.411173858642578, "step": 1581300 }, { "epoch": 1.908170083399472, "learning_rate": 3.6541294599589062e-06, "loss": 2.4388372802734377, "step": 1581400 }, { "epoch": 1.9082907467219545, "learning_rate": 3.6537256244911678e-06, "loss": 2.413219146728516, "step": 1581500 }, { "epoch": 1.9084114100444372, "learning_rate": 3.653321789023429e-06, "loss": 2.407933807373047, "step": 1581600 }, { "epoch": 1.90853207336692, "learning_rate": 3.652917953555691e-06, "loss": 2.427490234375, "step": 1581700 }, { "epoch": 1.9086527366894026, "learning_rate": 3.6525141180879525e-06, "loss": 2.4356724548339845, "step": 1581800 }, { "epoch": 1.9087734000118854, "learning_rate": 3.6521102826202144e-06, "loss": 2.412606048583984, "step": 1581900 }, { "epoch": 1.908894063334368, "learning_rate": 3.6517064471524756e-06, "loss": 2.4075462341308596, "step": 1582000 }, { "epoch": 1.9090147266568507, "learning_rate": 3.651302611684737e-06, "loss": 2.425275421142578, "step": 1582100 }, { "epoch": 1.9091353899793333, "learning_rate": 3.650898776216999e-06, "loss": 2.4338409423828127, "step": 1582200 }, { "epoch": 1.909256053301816, "learning_rate": 3.6504949407492607e-06, "loss": 2.422117919921875, "step": 1582300 }, { "epoch": 1.9093767166242988, "learning_rate": 3.650091105281522e-06, "loss": 2.4227915954589845, "step": 1582400 }, { "epoch": 1.9094973799467816, "learning_rate": 3.6496872698137838e-06, "loss": 2.4643521118164062, "step": 1582500 }, { "epoch": 1.9096180432692642, "learning_rate": 3.6492834343460453e-06, "loss": 2.423326873779297, "step": 1582600 }, { "epoch": 1.9097387065917468, "learning_rate": 3.6488795988783073e-06, "loss": 2.4384028625488283, "step": 1582700 }, { "epoch": 1.9098593699142294, "learning_rate": 3.6484757634105685e-06, "loss": 2.4173715209960935, "step": 1582800 }, { "epoch": 1.909980033236712, "learning_rate": 3.64807192794283e-06, "loss": 2.4336399841308594, "step": 1582900 }, { "epoch": 1.910100696559195, "learning_rate": 3.647668092475092e-06, "loss": 2.42327880859375, "step": 1583000 }, { "epoch": 1.9102213598816775, "learning_rate": 3.6472642570073536e-06, "loss": 2.4063174438476564, "step": 1583100 }, { "epoch": 1.9103420232041604, "learning_rate": 3.6468604215396147e-06, "loss": 2.422912292480469, "step": 1583200 }, { "epoch": 1.910462686526643, "learning_rate": 3.6464565860718767e-06, "loss": 2.404812774658203, "step": 1583300 }, { "epoch": 1.9105833498491256, "learning_rate": 3.6460527506041382e-06, "loss": 2.4034770202636717, "step": 1583400 }, { "epoch": 1.9107040131716082, "learning_rate": 3.6456489151364e-06, "loss": 2.411757354736328, "step": 1583500 }, { "epoch": 1.9108246764940908, "learning_rate": 3.645245079668661e-06, "loss": 2.4379637145996096, "step": 1583600 }, { "epoch": 1.9109453398165737, "learning_rate": 3.644841244200923e-06, "loss": 2.458066253662109, "step": 1583700 }, { "epoch": 1.9110660031390563, "learning_rate": 3.6444374087331845e-06, "loss": 2.428444519042969, "step": 1583800 }, { "epoch": 1.9111866664615391, "learning_rate": 3.6440335732654465e-06, "loss": 2.4153701782226564, "step": 1583900 }, { "epoch": 1.9113073297840217, "learning_rate": 3.6436297377977076e-06, "loss": 2.428718719482422, "step": 1584000 }, { "epoch": 1.9114279931065044, "learning_rate": 3.643225902329969e-06, "loss": 2.4327073669433594, "step": 1584100 }, { "epoch": 1.911548656428987, "learning_rate": 3.642822066862231e-06, "loss": 2.412140350341797, "step": 1584200 }, { "epoch": 1.9116693197514698, "learning_rate": 3.6424182313944927e-06, "loss": 2.435455017089844, "step": 1584300 }, { "epoch": 1.9117899830739524, "learning_rate": 3.642014395926754e-06, "loss": 2.4358787536621094, "step": 1584400 }, { "epoch": 1.9119106463964353, "learning_rate": 3.641610560459016e-06, "loss": 2.421814727783203, "step": 1584500 }, { "epoch": 1.9120313097189179, "learning_rate": 3.6412067249912774e-06, "loss": 2.438079071044922, "step": 1584600 }, { "epoch": 1.9121519730414005, "learning_rate": 3.6408028895235394e-06, "loss": 2.407384338378906, "step": 1584700 }, { "epoch": 1.9122726363638831, "learning_rate": 3.6403990540558005e-06, "loss": 2.442793731689453, "step": 1584800 }, { "epoch": 1.9123932996863657, "learning_rate": 3.639995218588062e-06, "loss": 2.4254328918457033, "step": 1584900 }, { "epoch": 1.9125139630088486, "learning_rate": 3.639591383120324e-06, "loss": 2.388721923828125, "step": 1585000 }, { "epoch": 1.9126346263313312, "learning_rate": 3.6391875476525856e-06, "loss": 2.4393099975585937, "step": 1585100 }, { "epoch": 1.912755289653814, "learning_rate": 3.6387837121848467e-06, "loss": 2.4330076599121093, "step": 1585200 }, { "epoch": 1.9128759529762966, "learning_rate": 3.6383798767171087e-06, "loss": 2.4004869079589843, "step": 1585300 }, { "epoch": 1.9129966162987793, "learning_rate": 3.6379760412493703e-06, "loss": 2.420149841308594, "step": 1585400 }, { "epoch": 1.9131172796212619, "learning_rate": 3.6375722057816322e-06, "loss": 2.4152891540527346, "step": 1585500 }, { "epoch": 1.9132379429437445, "learning_rate": 3.637168370313894e-06, "loss": 2.401560974121094, "step": 1585600 }, { "epoch": 1.9133586062662273, "learning_rate": 3.636764534846155e-06, "loss": 2.420676574707031, "step": 1585700 }, { "epoch": 1.9134792695887102, "learning_rate": 3.636360699378417e-06, "loss": 2.431707763671875, "step": 1585800 }, { "epoch": 1.9135999329111928, "learning_rate": 3.6359568639106785e-06, "loss": 2.430321044921875, "step": 1585900 }, { "epoch": 1.9137205962336754, "learning_rate": 3.63555302844294e-06, "loss": 2.423315124511719, "step": 1586000 }, { "epoch": 1.913841259556158, "learning_rate": 3.6351491929752016e-06, "loss": 2.4391108703613282, "step": 1586100 }, { "epoch": 1.9139619228786406, "learning_rate": 3.634745357507463e-06, "loss": 2.433746032714844, "step": 1586200 }, { "epoch": 1.9140825862011235, "learning_rate": 3.6343415220397247e-06, "loss": 2.4113714599609377, "step": 1586300 }, { "epoch": 1.914203249523606, "learning_rate": 3.6339376865719867e-06, "loss": 2.4256044006347657, "step": 1586400 }, { "epoch": 1.914323912846089, "learning_rate": 3.633533851104248e-06, "loss": 2.435028839111328, "step": 1586500 }, { "epoch": 1.9144445761685716, "learning_rate": 3.6331300156365094e-06, "loss": 2.4214869689941407, "step": 1586600 }, { "epoch": 1.9145652394910542, "learning_rate": 3.6327261801687714e-06, "loss": 2.4222596740722655, "step": 1586700 }, { "epoch": 1.9146859028135368, "learning_rate": 3.632322344701033e-06, "loss": 2.43822998046875, "step": 1586800 }, { "epoch": 1.9148065661360194, "learning_rate": 3.631918509233294e-06, "loss": 2.432628936767578, "step": 1586900 }, { "epoch": 1.9149272294585022, "learning_rate": 3.631514673765556e-06, "loss": 2.416792144775391, "step": 1587000 }, { "epoch": 1.9150478927809849, "learning_rate": 3.6311108382978176e-06, "loss": 2.4469886779785157, "step": 1587100 }, { "epoch": 1.9151685561034677, "learning_rate": 3.6307070028300796e-06, "loss": 2.417222900390625, "step": 1587200 }, { "epoch": 1.9152892194259503, "learning_rate": 3.6303031673623407e-06, "loss": 2.4130038452148437, "step": 1587300 }, { "epoch": 1.915409882748433, "learning_rate": 3.6298993318946023e-06, "loss": 2.433729400634766, "step": 1587400 }, { "epoch": 1.9155305460709156, "learning_rate": 3.6294954964268643e-06, "loss": 2.4409617614746093, "step": 1587500 }, { "epoch": 1.9156512093933982, "learning_rate": 3.629091660959126e-06, "loss": 2.427817077636719, "step": 1587600 }, { "epoch": 1.915771872715881, "learning_rate": 3.628687825491387e-06, "loss": 2.4232247924804686, "step": 1587700 }, { "epoch": 1.9158925360383638, "learning_rate": 3.628283990023649e-06, "loss": 2.4376393127441407, "step": 1587800 }, { "epoch": 1.9160131993608465, "learning_rate": 3.6278801545559105e-06, "loss": 2.406996765136719, "step": 1587900 }, { "epoch": 1.916133862683329, "learning_rate": 3.6274763190881725e-06, "loss": 2.4223085021972657, "step": 1588000 }, { "epoch": 1.9162545260058117, "learning_rate": 3.6270724836204336e-06, "loss": 2.4393515014648437, "step": 1588100 }, { "epoch": 1.9163751893282943, "learning_rate": 3.626668648152695e-06, "loss": 2.413396911621094, "step": 1588200 }, { "epoch": 1.9164958526507772, "learning_rate": 3.626264812684957e-06, "loss": 2.434170684814453, "step": 1588300 }, { "epoch": 1.9166165159732598, "learning_rate": 3.6258609772172187e-06, "loss": 2.4190943908691405, "step": 1588400 }, { "epoch": 1.9167371792957426, "learning_rate": 3.62545714174948e-06, "loss": 2.4056124877929688, "step": 1588500 }, { "epoch": 1.9168578426182252, "learning_rate": 3.625053306281742e-06, "loss": 2.443455810546875, "step": 1588600 }, { "epoch": 1.9169785059407078, "learning_rate": 3.6246494708140034e-06, "loss": 2.426269989013672, "step": 1588700 }, { "epoch": 1.9170991692631905, "learning_rate": 3.624245635346265e-06, "loss": 2.43367919921875, "step": 1588800 }, { "epoch": 1.917219832585673, "learning_rate": 3.6238417998785265e-06, "loss": 2.4269363403320314, "step": 1588900 }, { "epoch": 1.917340495908156, "learning_rate": 3.623437964410788e-06, "loss": 2.398011016845703, "step": 1589000 }, { "epoch": 1.9174611592306385, "learning_rate": 3.6230341289430496e-06, "loss": 2.416480712890625, "step": 1589100 }, { "epoch": 1.9175818225531214, "learning_rate": 3.6226302934753116e-06, "loss": 2.416936340332031, "step": 1589200 }, { "epoch": 1.917702485875604, "learning_rate": 3.6222264580075728e-06, "loss": 2.427601165771484, "step": 1589300 }, { "epoch": 1.9178231491980866, "learning_rate": 3.6218226225398343e-06, "loss": 2.428177490234375, "step": 1589400 }, { "epoch": 1.9179438125205692, "learning_rate": 3.6214187870720963e-06, "loss": 2.4154129028320312, "step": 1589500 }, { "epoch": 1.918064475843052, "learning_rate": 3.621014951604358e-06, "loss": 2.4567715454101564, "step": 1589600 }, { "epoch": 1.9181851391655347, "learning_rate": 3.620611116136619e-06, "loss": 2.405514831542969, "step": 1589700 }, { "epoch": 1.9183058024880175, "learning_rate": 3.620207280668881e-06, "loss": 2.420873260498047, "step": 1589800 }, { "epoch": 1.9184264658105001, "learning_rate": 3.6198034452011425e-06, "loss": 2.4295286560058593, "step": 1589900 }, { "epoch": 1.9185471291329828, "learning_rate": 3.6193996097334045e-06, "loss": 2.437022399902344, "step": 1590000 }, { "epoch": 1.9186677924554654, "learning_rate": 3.6189957742656657e-06, "loss": 2.430570068359375, "step": 1590100 }, { "epoch": 1.918788455777948, "learning_rate": 3.6185919387979272e-06, "loss": 2.4238099670410156, "step": 1590200 }, { "epoch": 1.9189091191004308, "learning_rate": 3.618188103330189e-06, "loss": 2.4150489807128905, "step": 1590300 }, { "epoch": 1.9190297824229134, "learning_rate": 3.6177842678624508e-06, "loss": 2.4413169860839843, "step": 1590400 }, { "epoch": 1.9191504457453963, "learning_rate": 3.617380432394712e-06, "loss": 2.420645751953125, "step": 1590500 }, { "epoch": 1.919271109067879, "learning_rate": 3.616976596926974e-06, "loss": 2.431846008300781, "step": 1590600 }, { "epoch": 1.9193917723903615, "learning_rate": 3.6165727614592354e-06, "loss": 2.4368608093261717, "step": 1590700 }, { "epoch": 1.9195124357128441, "learning_rate": 3.6161689259914974e-06, "loss": 2.3857427978515626, "step": 1590800 }, { "epoch": 1.9196330990353268, "learning_rate": 3.615765090523759e-06, "loss": 2.4241493225097654, "step": 1590900 }, { "epoch": 1.9197537623578096, "learning_rate": 3.61536125505602e-06, "loss": 2.4438409423828125, "step": 1591000 }, { "epoch": 1.9198744256802924, "learning_rate": 3.614957419588282e-06, "loss": 2.4156170654296876, "step": 1591100 }, { "epoch": 1.919995089002775, "learning_rate": 3.6145535841205436e-06, "loss": 2.4054295349121095, "step": 1591200 }, { "epoch": 1.9201157523252577, "learning_rate": 3.6141497486528056e-06, "loss": 2.4380726623535156, "step": 1591300 }, { "epoch": 1.9202364156477403, "learning_rate": 3.6137459131850668e-06, "loss": 2.450131378173828, "step": 1591400 }, { "epoch": 1.920357078970223, "learning_rate": 3.6133420777173283e-06, "loss": 2.4246476745605468, "step": 1591500 }, { "epoch": 1.9204777422927057, "learning_rate": 3.6129382422495903e-06, "loss": 2.4192654418945314, "step": 1591600 }, { "epoch": 1.9205984056151884, "learning_rate": 3.612534406781852e-06, "loss": 2.4379702758789064, "step": 1591700 }, { "epoch": 1.9207190689376712, "learning_rate": 3.612130571314113e-06, "loss": 2.4342230224609374, "step": 1591800 }, { "epoch": 1.9208397322601538, "learning_rate": 3.611726735846375e-06, "loss": 2.4186988830566407, "step": 1591900 }, { "epoch": 1.9209603955826364, "learning_rate": 3.6113229003786365e-06, "loss": 2.424341735839844, "step": 1592000 }, { "epoch": 1.921081058905119, "learning_rate": 3.610919064910898e-06, "loss": 2.4216458129882814, "step": 1592100 }, { "epoch": 1.9212017222276017, "learning_rate": 3.6105152294431597e-06, "loss": 2.4226593017578124, "step": 1592200 }, { "epoch": 1.9213223855500845, "learning_rate": 3.6101113939754212e-06, "loss": 2.438141174316406, "step": 1592300 }, { "epoch": 1.9214430488725671, "learning_rate": 3.6097075585076828e-06, "loss": 2.4068785095214844, "step": 1592400 }, { "epoch": 1.92156371219505, "learning_rate": 3.6093037230399448e-06, "loss": 2.4048194885253906, "step": 1592500 }, { "epoch": 1.9216843755175326, "learning_rate": 3.608899887572206e-06, "loss": 2.4319613647460936, "step": 1592600 }, { "epoch": 1.9218050388400152, "learning_rate": 3.6084960521044675e-06, "loss": 2.4382470703125, "step": 1592700 }, { "epoch": 1.9219257021624978, "learning_rate": 3.6080922166367294e-06, "loss": 2.4172271728515624, "step": 1592800 }, { "epoch": 1.9220463654849804, "learning_rate": 3.607688381168991e-06, "loss": 2.422564697265625, "step": 1592900 }, { "epoch": 1.9221670288074633, "learning_rate": 3.607284545701252e-06, "loss": 2.4210670471191404, "step": 1593000 }, { "epoch": 1.922287692129946, "learning_rate": 3.606880710233514e-06, "loss": 2.4252278137207033, "step": 1593100 }, { "epoch": 1.9224083554524287, "learning_rate": 3.6064768747657757e-06, "loss": 2.4044461059570312, "step": 1593200 }, { "epoch": 1.9225290187749113, "learning_rate": 3.6060730392980377e-06, "loss": 2.4225529479980468, "step": 1593300 }, { "epoch": 1.922649682097394, "learning_rate": 3.605669203830299e-06, "loss": 2.4225572204589843, "step": 1593400 }, { "epoch": 1.9227703454198766, "learning_rate": 3.6052653683625604e-06, "loss": 2.422384948730469, "step": 1593500 }, { "epoch": 1.9228910087423594, "learning_rate": 3.6048615328948223e-06, "loss": 2.422252197265625, "step": 1593600 }, { "epoch": 1.923011672064842, "learning_rate": 3.604457697427084e-06, "loss": 2.423900451660156, "step": 1593700 }, { "epoch": 1.9231323353873249, "learning_rate": 3.604053861959345e-06, "loss": 2.396889343261719, "step": 1593800 }, { "epoch": 1.9232529987098075, "learning_rate": 3.603650026491607e-06, "loss": 2.4272836303710936, "step": 1593900 }, { "epoch": 1.92337366203229, "learning_rate": 3.6032461910238686e-06, "loss": 2.4379905700683593, "step": 1594000 }, { "epoch": 1.9234943253547727, "learning_rate": 3.6028423555561306e-06, "loss": 2.402771301269531, "step": 1594100 }, { "epoch": 1.9236149886772553, "learning_rate": 3.6024385200883917e-06, "loss": 2.4053240966796876, "step": 1594200 }, { "epoch": 1.9237356519997382, "learning_rate": 3.6020346846206532e-06, "loss": 2.422737579345703, "step": 1594300 }, { "epoch": 1.923856315322221, "learning_rate": 3.6016308491529152e-06, "loss": 2.4108404541015624, "step": 1594400 }, { "epoch": 1.9239769786447036, "learning_rate": 3.6012270136851768e-06, "loss": 2.4329454040527345, "step": 1594500 }, { "epoch": 1.9240976419671862, "learning_rate": 3.600823178217438e-06, "loss": 2.421120910644531, "step": 1594600 }, { "epoch": 1.9242183052896689, "learning_rate": 3.6004193427497e-06, "loss": 2.425576019287109, "step": 1594700 }, { "epoch": 1.9243389686121515, "learning_rate": 3.6000155072819615e-06, "loss": 2.4290708923339843, "step": 1594800 }, { "epoch": 1.9244596319346343, "learning_rate": 3.599611671814223e-06, "loss": 2.397962646484375, "step": 1594900 }, { "epoch": 1.924580295257117, "learning_rate": 3.5992078363464846e-06, "loss": 2.4360617065429686, "step": 1595000 }, { "epoch": 1.9247009585795998, "learning_rate": 3.598804000878746e-06, "loss": 2.436789093017578, "step": 1595100 }, { "epoch": 1.9248216219020824, "learning_rate": 3.5984001654110077e-06, "loss": 2.4117393493652344, "step": 1595200 }, { "epoch": 1.924942285224565, "learning_rate": 3.5979963299432697e-06, "loss": 2.4181227111816406, "step": 1595300 }, { "epoch": 1.9250629485470476, "learning_rate": 3.597592494475531e-06, "loss": 2.3899972534179685, "step": 1595400 }, { "epoch": 1.9251836118695302, "learning_rate": 3.5971886590077924e-06, "loss": 2.4308351135253905, "step": 1595500 }, { "epoch": 1.925304275192013, "learning_rate": 3.5967848235400544e-06, "loss": 2.411239013671875, "step": 1595600 }, { "epoch": 1.9254249385144957, "learning_rate": 3.596380988072316e-06, "loss": 2.4171470642089843, "step": 1595700 }, { "epoch": 1.9255456018369785, "learning_rate": 3.595977152604578e-06, "loss": 2.442044677734375, "step": 1595800 }, { "epoch": 1.9256662651594612, "learning_rate": 3.595573317136839e-06, "loss": 2.432189178466797, "step": 1595900 }, { "epoch": 1.9257869284819438, "learning_rate": 3.5951694816691006e-06, "loss": 2.433086242675781, "step": 1596000 }, { "epoch": 1.9259075918044264, "learning_rate": 3.5947656462013626e-06, "loss": 2.4228253173828125, "step": 1596100 }, { "epoch": 1.926028255126909, "learning_rate": 3.594361810733624e-06, "loss": 2.4106428527832033, "step": 1596200 }, { "epoch": 1.9261489184493918, "learning_rate": 3.5939579752658853e-06, "loss": 2.435897216796875, "step": 1596300 }, { "epoch": 1.9262695817718747, "learning_rate": 3.5935541397981473e-06, "loss": 2.4111676025390625, "step": 1596400 }, { "epoch": 1.9263902450943573, "learning_rate": 3.593150304330409e-06, "loss": 2.4183514404296873, "step": 1596500 }, { "epoch": 1.92651090841684, "learning_rate": 3.592746468862671e-06, "loss": 2.4250543212890623, "step": 1596600 }, { "epoch": 1.9266315717393225, "learning_rate": 3.592342633394932e-06, "loss": 2.4388864135742185, "step": 1596700 }, { "epoch": 1.9267522350618052, "learning_rate": 3.5919387979271935e-06, "loss": 2.433011322021484, "step": 1596800 }, { "epoch": 1.926872898384288, "learning_rate": 3.5915349624594555e-06, "loss": 2.4229110717773437, "step": 1596900 }, { "epoch": 1.9269935617067706, "learning_rate": 3.591131126991717e-06, "loss": 2.394922332763672, "step": 1597000 }, { "epoch": 1.9271142250292534, "learning_rate": 3.590727291523978e-06, "loss": 2.3987857055664064, "step": 1597100 }, { "epoch": 1.927234888351736, "learning_rate": 3.59032345605624e-06, "loss": 2.411601104736328, "step": 1597200 }, { "epoch": 1.9273555516742187, "learning_rate": 3.5899196205885017e-06, "loss": 2.394120178222656, "step": 1597300 }, { "epoch": 1.9274762149967013, "learning_rate": 3.5895157851207637e-06, "loss": 2.4169993591308594, "step": 1597400 }, { "epoch": 1.927596878319184, "learning_rate": 3.589111949653025e-06, "loss": 2.4218353271484374, "step": 1597500 }, { "epoch": 1.9277175416416668, "learning_rate": 3.5887081141852864e-06, "loss": 2.423897247314453, "step": 1597600 }, { "epoch": 1.9278382049641494, "learning_rate": 3.5883042787175484e-06, "loss": 2.422702178955078, "step": 1597700 }, { "epoch": 1.9279588682866322, "learning_rate": 3.58790044324981e-06, "loss": 2.42423828125, "step": 1597800 }, { "epoch": 1.9280795316091148, "learning_rate": 3.587496607782071e-06, "loss": 2.380113983154297, "step": 1597900 }, { "epoch": 1.9282001949315974, "learning_rate": 3.587092772314333e-06, "loss": 2.40243896484375, "step": 1598000 }, { "epoch": 1.92832085825408, "learning_rate": 3.5866889368465946e-06, "loss": 2.4405978393554686, "step": 1598100 }, { "epoch": 1.9284415215765627, "learning_rate": 3.586285101378856e-06, "loss": 2.438140869140625, "step": 1598200 }, { "epoch": 1.9285621848990455, "learning_rate": 3.5858812659111177e-06, "loss": 2.4164500427246094, "step": 1598300 }, { "epoch": 1.9286828482215284, "learning_rate": 3.5854774304433793e-06, "loss": 2.431685791015625, "step": 1598400 }, { "epoch": 1.928803511544011, "learning_rate": 3.585073594975641e-06, "loss": 2.409343719482422, "step": 1598500 }, { "epoch": 1.9289241748664936, "learning_rate": 3.584669759507903e-06, "loss": 2.4301138305664063, "step": 1598600 }, { "epoch": 1.9290448381889762, "learning_rate": 3.584265924040164e-06, "loss": 2.4108018493652343, "step": 1598700 }, { "epoch": 1.9291655015114588, "learning_rate": 3.5838620885724255e-06, "loss": 2.403242492675781, "step": 1598800 }, { "epoch": 1.9292861648339417, "learning_rate": 3.5834582531046875e-06, "loss": 2.4325936889648436, "step": 1598900 }, { "epoch": 1.9294068281564243, "learning_rate": 3.583054417636949e-06, "loss": 2.413758087158203, "step": 1599000 }, { "epoch": 1.9295274914789071, "learning_rate": 3.58265058216921e-06, "loss": 2.410030975341797, "step": 1599100 }, { "epoch": 1.9296481548013897, "learning_rate": 3.582246746701472e-06, "loss": 2.4190045166015626, "step": 1599200 }, { "epoch": 1.9297688181238724, "learning_rate": 3.5818429112337337e-06, "loss": 2.420889587402344, "step": 1599300 }, { "epoch": 1.929889481446355, "learning_rate": 3.5814390757659957e-06, "loss": 2.4270553588867188, "step": 1599400 }, { "epoch": 1.9300101447688376, "learning_rate": 3.581035240298257e-06, "loss": 2.421343994140625, "step": 1599500 }, { "epoch": 1.9301308080913204, "learning_rate": 3.5806314048305184e-06, "loss": 2.423128967285156, "step": 1599600 }, { "epoch": 1.9302514714138033, "learning_rate": 3.5802275693627804e-06, "loss": 2.426270751953125, "step": 1599700 }, { "epoch": 1.9303721347362859, "learning_rate": 3.579823733895042e-06, "loss": 2.430203552246094, "step": 1599800 }, { "epoch": 1.9304927980587685, "learning_rate": 3.579419898427303e-06, "loss": 2.426493377685547, "step": 1599900 }, { "epoch": 1.9306134613812511, "learning_rate": 3.579016062959565e-06, "loss": 2.431534423828125, "step": 1600000 }, { "epoch": 1.9307341247037337, "learning_rate": 3.5786122274918266e-06, "loss": 2.3973458862304686, "step": 1600100 }, { "epoch": 1.9308547880262166, "learning_rate": 3.5782083920240886e-06, "loss": 2.4122024536132813, "step": 1600200 }, { "epoch": 1.9309754513486992, "learning_rate": 3.5778045565563497e-06, "loss": 2.439319610595703, "step": 1600300 }, { "epoch": 1.931096114671182, "learning_rate": 3.5774007210886113e-06, "loss": 2.4317640686035156, "step": 1600400 }, { "epoch": 1.9312167779936646, "learning_rate": 3.5769968856208733e-06, "loss": 2.4225555419921876, "step": 1600500 }, { "epoch": 1.9313374413161473, "learning_rate": 3.576593050153135e-06, "loss": 2.4218617248535157, "step": 1600600 }, { "epoch": 1.9314581046386299, "learning_rate": 3.576189214685396e-06, "loss": 2.432065124511719, "step": 1600700 }, { "epoch": 1.9315787679611125, "learning_rate": 3.575785379217658e-06, "loss": 2.426555938720703, "step": 1600800 }, { "epoch": 1.9316994312835953, "learning_rate": 3.5753815437499195e-06, "loss": 2.393146820068359, "step": 1600900 }, { "epoch": 1.931820094606078, "learning_rate": 3.574977708282181e-06, "loss": 2.434642333984375, "step": 1601000 }, { "epoch": 1.9319407579285608, "learning_rate": 3.574573872814443e-06, "loss": 2.434586181640625, "step": 1601100 }, { "epoch": 1.9320614212510434, "learning_rate": 3.574170037346704e-06, "loss": 2.3988006591796873, "step": 1601200 }, { "epoch": 1.932182084573526, "learning_rate": 3.5737662018789658e-06, "loss": 2.427896270751953, "step": 1601300 }, { "epoch": 1.9323027478960086, "learning_rate": 3.5733623664112277e-06, "loss": 2.39855224609375, "step": 1601400 }, { "epoch": 1.9324234112184913, "learning_rate": 3.5729585309434893e-06, "loss": 2.4320849609375, "step": 1601500 }, { "epoch": 1.932544074540974, "learning_rate": 3.5725546954757504e-06, "loss": 2.4362290954589843, "step": 1601600 }, { "epoch": 1.932664737863457, "learning_rate": 3.5721508600080124e-06, "loss": 2.4153396606445314, "step": 1601700 }, { "epoch": 1.9327854011859396, "learning_rate": 3.571747024540274e-06, "loss": 2.436151428222656, "step": 1601800 }, { "epoch": 1.9329060645084222, "learning_rate": 3.571343189072536e-06, "loss": 2.4178416442871096, "step": 1601900 }, { "epoch": 1.9330267278309048, "learning_rate": 3.570939353604797e-06, "loss": 2.4139466857910157, "step": 1602000 }, { "epoch": 1.9331473911533874, "learning_rate": 3.5705355181370587e-06, "loss": 2.4217572021484375, "step": 1602100 }, { "epoch": 1.9332680544758702, "learning_rate": 3.5701316826693206e-06, "loss": 2.423597564697266, "step": 1602200 }, { "epoch": 1.9333887177983529, "learning_rate": 3.569727847201582e-06, "loss": 2.4293858337402345, "step": 1602300 }, { "epoch": 1.9335093811208357, "learning_rate": 3.5693240117338433e-06, "loss": 2.4376788330078125, "step": 1602400 }, { "epoch": 1.9336300444433183, "learning_rate": 3.5689201762661053e-06, "loss": 2.414608612060547, "step": 1602500 }, { "epoch": 1.933750707765801, "learning_rate": 3.568516340798367e-06, "loss": 2.407265472412109, "step": 1602600 }, { "epoch": 1.9338713710882836, "learning_rate": 3.568112505330629e-06, "loss": 2.4136399841308593, "step": 1602700 }, { "epoch": 1.9339920344107662, "learning_rate": 3.56770866986289e-06, "loss": 2.4241636657714842, "step": 1602800 }, { "epoch": 1.934112697733249, "learning_rate": 3.5673048343951516e-06, "loss": 2.4101461791992187, "step": 1602900 }, { "epoch": 1.9342333610557316, "learning_rate": 3.5669009989274135e-06, "loss": 2.4270143127441406, "step": 1603000 }, { "epoch": 1.9343540243782145, "learning_rate": 3.566497163459675e-06, "loss": 2.4473826599121096, "step": 1603100 }, { "epoch": 1.934474687700697, "learning_rate": 3.5660933279919362e-06, "loss": 2.4182804870605468, "step": 1603200 }, { "epoch": 1.9345953510231797, "learning_rate": 3.565689492524198e-06, "loss": 2.407869415283203, "step": 1603300 }, { "epoch": 1.9347160143456623, "learning_rate": 3.5652856570564598e-06, "loss": 2.3826725769042967, "step": 1603400 }, { "epoch": 1.934836677668145, "learning_rate": 3.5648818215887213e-06, "loss": 2.422551574707031, "step": 1603500 }, { "epoch": 1.9349573409906278, "learning_rate": 3.564477986120983e-06, "loss": 2.444138488769531, "step": 1603600 }, { "epoch": 1.9350780043131106, "learning_rate": 3.5640741506532444e-06, "loss": 2.4236199951171873, "step": 1603700 }, { "epoch": 1.9351986676355932, "learning_rate": 3.563670315185506e-06, "loss": 2.401583709716797, "step": 1603800 }, { "epoch": 1.9353193309580758, "learning_rate": 3.563266479717768e-06, "loss": 2.4070399475097655, "step": 1603900 }, { "epoch": 1.9354399942805585, "learning_rate": 3.562862644250029e-06, "loss": 2.4353907775878905, "step": 1604000 }, { "epoch": 1.935560657603041, "learning_rate": 3.5624588087822907e-06, "loss": 2.409843292236328, "step": 1604100 }, { "epoch": 1.935681320925524, "learning_rate": 3.5620549733145527e-06, "loss": 2.419228973388672, "step": 1604200 }, { "epoch": 1.9358019842480065, "learning_rate": 3.5616511378468142e-06, "loss": 2.430661163330078, "step": 1604300 }, { "epoch": 1.9359226475704894, "learning_rate": 3.5612473023790754e-06, "loss": 2.420035705566406, "step": 1604400 }, { "epoch": 1.936043310892972, "learning_rate": 3.5608434669113373e-06, "loss": 2.4079861450195312, "step": 1604500 }, { "epoch": 1.9361639742154546, "learning_rate": 3.560439631443599e-06, "loss": 2.4369320678710937, "step": 1604600 }, { "epoch": 1.9362846375379372, "learning_rate": 3.560035795975861e-06, "loss": 2.4101638793945312, "step": 1604700 }, { "epoch": 1.9364053008604198, "learning_rate": 3.559631960508122e-06, "loss": 2.440604553222656, "step": 1604800 }, { "epoch": 1.9365259641829027, "learning_rate": 3.5592281250403836e-06, "loss": 2.3891810607910156, "step": 1604900 }, { "epoch": 1.9366466275053855, "learning_rate": 3.5588242895726456e-06, "loss": 2.4261346435546876, "step": 1605000 }, { "epoch": 1.9367672908278681, "learning_rate": 3.558420454104907e-06, "loss": 2.423863983154297, "step": 1605100 }, { "epoch": 1.9368879541503508, "learning_rate": 3.5580166186371683e-06, "loss": 2.4382769775390627, "step": 1605200 }, { "epoch": 1.9370086174728334, "learning_rate": 3.5576127831694302e-06, "loss": 2.4293048095703127, "step": 1605300 }, { "epoch": 1.937129280795316, "learning_rate": 3.557208947701692e-06, "loss": 2.431893768310547, "step": 1605400 }, { "epoch": 1.9372499441177988, "learning_rate": 3.5568051122339538e-06, "loss": 2.4135479736328125, "step": 1605500 }, { "epoch": 1.9373706074402814, "learning_rate": 3.556401276766215e-06, "loss": 2.417539520263672, "step": 1605600 }, { "epoch": 1.9374912707627643, "learning_rate": 3.5559974412984765e-06, "loss": 2.423747863769531, "step": 1605700 }, { "epoch": 1.937611934085247, "learning_rate": 3.5555936058307385e-06, "loss": 2.4235499572753905, "step": 1605800 }, { "epoch": 1.9377325974077295, "learning_rate": 3.555189770363e-06, "loss": 2.414243621826172, "step": 1605900 }, { "epoch": 1.9378532607302121, "learning_rate": 3.554785934895261e-06, "loss": 2.4086624145507813, "step": 1606000 }, { "epoch": 1.9379739240526948, "learning_rate": 3.554382099427523e-06, "loss": 2.42684326171875, "step": 1606100 }, { "epoch": 1.9380945873751776, "learning_rate": 3.5539782639597847e-06, "loss": 2.404250183105469, "step": 1606200 }, { "epoch": 1.9382152506976602, "learning_rate": 3.5535744284920467e-06, "loss": 2.415589141845703, "step": 1606300 }, { "epoch": 1.938335914020143, "learning_rate": 3.5531705930243082e-06, "loss": 2.4194039916992187, "step": 1606400 }, { "epoch": 1.9384565773426257, "learning_rate": 3.5527667575565694e-06, "loss": 2.4377386474609377, "step": 1606500 }, { "epoch": 1.9385772406651083, "learning_rate": 3.5523629220888313e-06, "loss": 2.4236553955078124, "step": 1606600 }, { "epoch": 1.938697903987591, "learning_rate": 3.551959086621093e-06, "loss": 2.4094195556640625, "step": 1606700 }, { "epoch": 1.9388185673100735, "learning_rate": 3.5515552511533545e-06, "loss": 2.441317138671875, "step": 1606800 }, { "epoch": 1.9389392306325564, "learning_rate": 3.551151415685616e-06, "loss": 2.436989440917969, "step": 1606900 }, { "epoch": 1.9390598939550392, "learning_rate": 3.5507475802178776e-06, "loss": 2.4335765075683593, "step": 1607000 }, { "epoch": 1.9391805572775218, "learning_rate": 3.550343744750139e-06, "loss": 2.4046925354003905, "step": 1607100 }, { "epoch": 1.9393012206000044, "learning_rate": 3.549939909282401e-06, "loss": 2.422813720703125, "step": 1607200 }, { "epoch": 1.939421883922487, "learning_rate": 3.5495360738146623e-06, "loss": 2.408252410888672, "step": 1607300 }, { "epoch": 1.9395425472449697, "learning_rate": 3.549132238346924e-06, "loss": 2.428999786376953, "step": 1607400 }, { "epoch": 1.9396632105674525, "learning_rate": 3.548728402879186e-06, "loss": 2.4323661804199217, "step": 1607500 }, { "epoch": 1.9397838738899351, "learning_rate": 3.5483245674114474e-06, "loss": 2.440027618408203, "step": 1607600 }, { "epoch": 1.939904537212418, "learning_rate": 3.5479207319437085e-06, "loss": 2.3903375244140626, "step": 1607700 }, { "epoch": 1.9400252005349006, "learning_rate": 3.5475168964759705e-06, "loss": 2.414626007080078, "step": 1607800 }, { "epoch": 1.9401458638573832, "learning_rate": 3.547113061008232e-06, "loss": 2.424272155761719, "step": 1607900 }, { "epoch": 1.9402665271798658, "learning_rate": 3.546709225540494e-06, "loss": 2.4416825866699217, "step": 1608000 }, { "epoch": 1.9403871905023484, "learning_rate": 3.546305390072755e-06, "loss": 2.434188232421875, "step": 1608100 }, { "epoch": 1.9405078538248313, "learning_rate": 3.5459015546050167e-06, "loss": 2.436729278564453, "step": 1608200 }, { "epoch": 1.9406285171473139, "learning_rate": 3.5454977191372787e-06, "loss": 2.432928161621094, "step": 1608300 }, { "epoch": 1.9407491804697967, "learning_rate": 3.5450938836695403e-06, "loss": 2.409281005859375, "step": 1608400 }, { "epoch": 1.9408698437922793, "learning_rate": 3.5446900482018014e-06, "loss": 2.3983389282226564, "step": 1608500 }, { "epoch": 1.940990507114762, "learning_rate": 3.5442862127340634e-06, "loss": 2.4330313110351565, "step": 1608600 }, { "epoch": 1.9411111704372446, "learning_rate": 3.543882377266325e-06, "loss": 2.4254824829101564, "step": 1608700 }, { "epoch": 1.9412318337597272, "learning_rate": 3.543478541798587e-06, "loss": 2.403339691162109, "step": 1608800 }, { "epoch": 1.94135249708221, "learning_rate": 3.543074706330848e-06, "loss": 2.4204595947265624, "step": 1608900 }, { "epoch": 1.9414731604046929, "learning_rate": 3.5426708708631096e-06, "loss": 2.4276173400878904, "step": 1609000 }, { "epoch": 1.9415938237271755, "learning_rate": 3.5422670353953716e-06, "loss": 2.427928771972656, "step": 1609100 }, { "epoch": 1.941714487049658, "learning_rate": 3.541863199927633e-06, "loss": 2.4086907958984374, "step": 1609200 }, { "epoch": 1.9418351503721407, "learning_rate": 3.5414593644598943e-06, "loss": 2.4226849365234373, "step": 1609300 }, { "epoch": 1.9419558136946233, "learning_rate": 3.5410555289921563e-06, "loss": 2.428661041259766, "step": 1609400 }, { "epoch": 1.9420764770171062, "learning_rate": 3.540651693524418e-06, "loss": 2.435926513671875, "step": 1609500 }, { "epoch": 1.9421971403395888, "learning_rate": 3.5402478580566794e-06, "loss": 2.405259857177734, "step": 1609600 }, { "epoch": 1.9423178036620716, "learning_rate": 3.539844022588941e-06, "loss": 2.424833221435547, "step": 1609700 }, { "epoch": 1.9424384669845542, "learning_rate": 3.5394401871212025e-06, "loss": 2.4252549743652345, "step": 1609800 }, { "epoch": 1.9425591303070369, "learning_rate": 3.539036351653464e-06, "loss": 2.4189627075195315, "step": 1609900 }, { "epoch": 1.9426797936295195, "learning_rate": 3.538632516185726e-06, "loss": 2.3989044189453126, "step": 1610000 }, { "epoch": 1.942800456952002, "learning_rate": 3.538228680717987e-06, "loss": 2.4045069885253905, "step": 1610100 }, { "epoch": 1.942921120274485, "learning_rate": 3.5378248452502487e-06, "loss": 2.4167718505859375, "step": 1610200 }, { "epoch": 1.9430417835969678, "learning_rate": 3.5374210097825107e-06, "loss": 2.406746826171875, "step": 1610300 }, { "epoch": 1.9431624469194504, "learning_rate": 3.5370171743147723e-06, "loss": 2.4303823852539064, "step": 1610400 }, { "epoch": 1.943283110241933, "learning_rate": 3.5366133388470334e-06, "loss": 2.4138328552246096, "step": 1610500 }, { "epoch": 1.9434037735644156, "learning_rate": 3.5362095033792954e-06, "loss": 2.422849578857422, "step": 1610600 }, { "epoch": 1.9435244368868982, "learning_rate": 3.535805667911557e-06, "loss": 2.4341334533691406, "step": 1610700 }, { "epoch": 1.943645100209381, "learning_rate": 3.535401832443819e-06, "loss": 2.398470001220703, "step": 1610800 }, { "epoch": 1.9437657635318637, "learning_rate": 3.53499799697608e-06, "loss": 2.422085876464844, "step": 1610900 }, { "epoch": 1.9438864268543465, "learning_rate": 3.5345941615083416e-06, "loss": 2.395304412841797, "step": 1611000 }, { "epoch": 1.9440070901768292, "learning_rate": 3.5341903260406036e-06, "loss": 2.4162081909179687, "step": 1611100 }, { "epoch": 1.9441277534993118, "learning_rate": 3.533786490572865e-06, "loss": 2.429281768798828, "step": 1611200 }, { "epoch": 1.9442484168217944, "learning_rate": 3.533382655105127e-06, "loss": 2.4243704223632814, "step": 1611300 }, { "epoch": 1.944369080144277, "learning_rate": 3.5329788196373883e-06, "loss": 2.413815155029297, "step": 1611400 }, { "epoch": 1.9444897434667598, "learning_rate": 3.53257498416965e-06, "loss": 2.4306736755371094, "step": 1611500 }, { "epoch": 1.9446104067892425, "learning_rate": 3.532171148701912e-06, "loss": 2.4096054077148437, "step": 1611600 }, { "epoch": 1.9447310701117253, "learning_rate": 3.5317673132341734e-06, "loss": 2.3973731994628906, "step": 1611700 }, { "epoch": 1.944851733434208, "learning_rate": 3.5313634777664345e-06, "loss": 2.3995237731933594, "step": 1611800 }, { "epoch": 1.9449723967566905, "learning_rate": 3.5309596422986965e-06, "loss": 2.404203338623047, "step": 1611900 }, { "epoch": 1.9450930600791732, "learning_rate": 3.530555806830958e-06, "loss": 2.411386260986328, "step": 1612000 }, { "epoch": 1.9452137234016558, "learning_rate": 3.53015197136322e-06, "loss": 2.419000244140625, "step": 1612100 }, { "epoch": 1.9453343867241386, "learning_rate": 3.529748135895481e-06, "loss": 2.4260028076171873, "step": 1612200 }, { "epoch": 1.9454550500466214, "learning_rate": 3.5293443004277427e-06, "loss": 2.4103317260742188, "step": 1612300 }, { "epoch": 1.945575713369104, "learning_rate": 3.5289404649600047e-06, "loss": 2.3974725341796876, "step": 1612400 }, { "epoch": 1.9456963766915867, "learning_rate": 3.5285366294922663e-06, "loss": 2.4137922668457032, "step": 1612500 }, { "epoch": 1.9458170400140693, "learning_rate": 3.5281327940245274e-06, "loss": 2.4343568420410158, "step": 1612600 }, { "epoch": 1.945937703336552, "learning_rate": 3.5277289585567894e-06, "loss": 2.4370463562011717, "step": 1612700 }, { "epoch": 1.9460583666590348, "learning_rate": 3.527325123089051e-06, "loss": 2.441142120361328, "step": 1612800 }, { "epoch": 1.9461790299815174, "learning_rate": 3.5269212876213125e-06, "loss": 2.4007676696777343, "step": 1612900 }, { "epoch": 1.9462996933040002, "learning_rate": 3.526517452153574e-06, "loss": 2.4184449768066405, "step": 1613000 }, { "epoch": 1.9464203566264828, "learning_rate": 3.5261136166858356e-06, "loss": 2.4268310546875, "step": 1613100 }, { "epoch": 1.9465410199489654, "learning_rate": 3.525709781218097e-06, "loss": 2.4254530334472655, "step": 1613200 }, { "epoch": 1.946661683271448, "learning_rate": 3.525305945750359e-06, "loss": 2.437308807373047, "step": 1613300 }, { "epoch": 1.9467823465939307, "learning_rate": 3.5249021102826203e-06, "loss": 2.4225088500976564, "step": 1613400 }, { "epoch": 1.9469030099164135, "learning_rate": 3.524498274814882e-06, "loss": 2.4145997619628905, "step": 1613500 }, { "epoch": 1.9470236732388961, "learning_rate": 3.524094439347144e-06, "loss": 2.402438507080078, "step": 1613600 }, { "epoch": 1.947144336561379, "learning_rate": 3.5236906038794054e-06, "loss": 2.386249694824219, "step": 1613700 }, { "epoch": 1.9472649998838616, "learning_rate": 3.5232867684116666e-06, "loss": 2.423845062255859, "step": 1613800 }, { "epoch": 1.9473856632063442, "learning_rate": 3.5228829329439285e-06, "loss": 2.4504949951171877, "step": 1613900 }, { "epoch": 1.9475063265288268, "learning_rate": 3.52247909747619e-06, "loss": 2.406119689941406, "step": 1614000 }, { "epoch": 1.9476269898513094, "learning_rate": 3.522075262008452e-06, "loss": 2.383656311035156, "step": 1614100 }, { "epoch": 1.9477476531737923, "learning_rate": 3.5216714265407132e-06, "loss": 2.416601257324219, "step": 1614200 }, { "epoch": 1.9478683164962751, "learning_rate": 3.5212675910729748e-06, "loss": 2.413798980712891, "step": 1614300 }, { "epoch": 1.9479889798187577, "learning_rate": 3.5208637556052368e-06, "loss": 2.439547424316406, "step": 1614400 }, { "epoch": 1.9481096431412404, "learning_rate": 3.5204599201374983e-06, "loss": 2.406587677001953, "step": 1614500 }, { "epoch": 1.948230306463723, "learning_rate": 3.5200560846697595e-06, "loss": 2.41490966796875, "step": 1614600 }, { "epoch": 1.9483509697862056, "learning_rate": 3.5196522492020214e-06, "loss": 2.4030726623535155, "step": 1614700 }, { "epoch": 1.9484716331086884, "learning_rate": 3.519248413734283e-06, "loss": 2.422263336181641, "step": 1614800 }, { "epoch": 1.948592296431171, "learning_rate": 3.518844578266545e-06, "loss": 2.4052978515625, "step": 1614900 }, { "epoch": 1.9487129597536539, "learning_rate": 3.518440742798806e-06, "loss": 2.4284625244140625, "step": 1615000 }, { "epoch": 1.9488336230761365, "learning_rate": 3.5180369073310677e-06, "loss": 2.4285984802246094, "step": 1615100 }, { "epoch": 1.9489542863986191, "learning_rate": 3.5176330718633297e-06, "loss": 2.413594512939453, "step": 1615200 }, { "epoch": 1.9490749497211017, "learning_rate": 3.517229236395591e-06, "loss": 2.4073448181152344, "step": 1615300 }, { "epoch": 1.9491956130435844, "learning_rate": 3.5168254009278523e-06, "loss": 2.3936915588378906, "step": 1615400 }, { "epoch": 1.9493162763660672, "learning_rate": 3.5164215654601143e-06, "loss": 2.401528167724609, "step": 1615500 }, { "epoch": 1.94943693968855, "learning_rate": 3.516017729992376e-06, "loss": 2.395374298095703, "step": 1615600 }, { "epoch": 1.9495576030110326, "learning_rate": 3.5156138945246374e-06, "loss": 2.4242694091796877, "step": 1615700 }, { "epoch": 1.9496782663335153, "learning_rate": 3.515210059056899e-06, "loss": 2.4274533081054686, "step": 1615800 }, { "epoch": 1.9497989296559979, "learning_rate": 3.5148062235891606e-06, "loss": 2.445279083251953, "step": 1615900 }, { "epoch": 1.9499195929784805, "learning_rate": 3.514402388121422e-06, "loss": 2.4402560424804687, "step": 1616000 }, { "epoch": 1.9500402563009633, "learning_rate": 3.513998552653684e-06, "loss": 2.420258331298828, "step": 1616100 }, { "epoch": 1.950160919623446, "learning_rate": 3.5135947171859452e-06, "loss": 2.4143301391601564, "step": 1616200 }, { "epoch": 1.9502815829459288, "learning_rate": 3.513190881718207e-06, "loss": 2.4398028564453127, "step": 1616300 }, { "epoch": 1.9504022462684114, "learning_rate": 3.5127870462504688e-06, "loss": 2.405298767089844, "step": 1616400 }, { "epoch": 1.950522909590894, "learning_rate": 3.5123832107827303e-06, "loss": 2.4134271240234373, "step": 1616500 }, { "epoch": 1.9506435729133766, "learning_rate": 3.5119793753149923e-06, "loss": 2.420360107421875, "step": 1616600 }, { "epoch": 1.9507642362358593, "learning_rate": 3.5115755398472535e-06, "loss": 2.40943359375, "step": 1616700 }, { "epoch": 1.950884899558342, "learning_rate": 3.511171704379515e-06, "loss": 2.4332618713378906, "step": 1616800 }, { "epoch": 1.9510055628808247, "learning_rate": 3.510767868911777e-06, "loss": 2.4219984436035156, "step": 1616900 }, { "epoch": 1.9511262262033076, "learning_rate": 3.5103640334440386e-06, "loss": 2.424136047363281, "step": 1617000 }, { "epoch": 1.9512468895257902, "learning_rate": 3.5099601979762997e-06, "loss": 2.420889892578125, "step": 1617100 }, { "epoch": 1.9513675528482728, "learning_rate": 3.5095563625085617e-06, "loss": 2.4312590026855467, "step": 1617200 }, { "epoch": 1.9514882161707554, "learning_rate": 3.5091525270408232e-06, "loss": 2.417733459472656, "step": 1617300 }, { "epoch": 1.951608879493238, "learning_rate": 3.5087486915730852e-06, "loss": 2.3987168884277343, "step": 1617400 }, { "epoch": 1.9517295428157209, "learning_rate": 3.5083448561053464e-06, "loss": 2.4396864318847657, "step": 1617500 }, { "epoch": 1.9518502061382037, "learning_rate": 3.507941020637608e-06, "loss": 2.4332344055175783, "step": 1617600 }, { "epoch": 1.9519708694606863, "learning_rate": 3.50753718516987e-06, "loss": 2.410402526855469, "step": 1617700 }, { "epoch": 1.952091532783169, "learning_rate": 3.5071333497021315e-06, "loss": 2.40855712890625, "step": 1617800 }, { "epoch": 1.9522121961056516, "learning_rate": 3.5067295142343926e-06, "loss": 2.40724609375, "step": 1617900 }, { "epoch": 1.9523328594281342, "learning_rate": 3.5063256787666546e-06, "loss": 2.422146759033203, "step": 1618000 }, { "epoch": 1.952453522750617, "learning_rate": 3.505921843298916e-06, "loss": 2.422790832519531, "step": 1618100 }, { "epoch": 1.9525741860730996, "learning_rate": 3.505518007831178e-06, "loss": 2.4116229248046874, "step": 1618200 }, { "epoch": 1.9526948493955825, "learning_rate": 3.5051141723634393e-06, "loss": 2.400743408203125, "step": 1618300 }, { "epoch": 1.952815512718065, "learning_rate": 3.504710336895701e-06, "loss": 2.4224847412109374, "step": 1618400 }, { "epoch": 1.9529361760405477, "learning_rate": 3.504306501427963e-06, "loss": 2.4264427185058595, "step": 1618500 }, { "epoch": 1.9530568393630303, "learning_rate": 3.5039026659602244e-06, "loss": 2.3978916931152345, "step": 1618600 }, { "epoch": 1.953177502685513, "learning_rate": 3.5034988304924855e-06, "loss": 2.431426696777344, "step": 1618700 }, { "epoch": 1.9532981660079958, "learning_rate": 3.5030949950247475e-06, "loss": 2.421214904785156, "step": 1618800 }, { "epoch": 1.9534188293304784, "learning_rate": 3.502691159557009e-06, "loss": 2.4382035827636717, "step": 1618900 }, { "epoch": 1.9535394926529612, "learning_rate": 3.5022873240892706e-06, "loss": 2.3866120910644533, "step": 1619000 }, { "epoch": 1.9536601559754438, "learning_rate": 3.501883488621532e-06, "loss": 2.4174565124511718, "step": 1619100 }, { "epoch": 1.9537808192979265, "learning_rate": 3.5014796531537937e-06, "loss": 2.4216989135742186, "step": 1619200 }, { "epoch": 1.953901482620409, "learning_rate": 3.5010758176860553e-06, "loss": 2.4280902099609376, "step": 1619300 }, { "epoch": 1.9540221459428917, "learning_rate": 3.5006719822183172e-06, "loss": 2.4228538513183593, "step": 1619400 }, { "epoch": 1.9541428092653745, "learning_rate": 3.5002681467505784e-06, "loss": 2.4196649169921876, "step": 1619500 }, { "epoch": 1.9542634725878574, "learning_rate": 3.49986431128284e-06, "loss": 2.415563659667969, "step": 1619600 }, { "epoch": 1.95438413591034, "learning_rate": 3.499460475815102e-06, "loss": 2.4242726135253907, "step": 1619700 }, { "epoch": 1.9545047992328226, "learning_rate": 3.4990566403473635e-06, "loss": 2.427458953857422, "step": 1619800 }, { "epoch": 1.9546254625553052, "learning_rate": 3.4986528048796246e-06, "loss": 2.4001426696777344, "step": 1619900 }, { "epoch": 1.9547461258777878, "learning_rate": 3.4982489694118866e-06, "loss": 2.420757141113281, "step": 1620000 } ], "max_steps": 2486256, "num_train_epochs": 3, "total_flos": 12529054414800236544, "trial_name": null, "trial_params": null }