{ "best_metric": null, "best_model_checkpoint": null, "epoch": 1.9547461258777878, "global_step": 1620000, "is_hyper_param_search": false, "is_local_process_zero": true, "is_world_process_zero": true, "log_history": [ { "epoch": 0.00012066332248268406, "learning_rate": 1.0000000000000001e-07, "loss": 10.998963623046874, "step": 100 }, { "epoch": 0.00024132664496536813, "learning_rate": 2.0000000000000002e-07, "loss": 10.867801513671875, "step": 200 }, { "epoch": 0.0003619899674480522, "learning_rate": 3.0000000000000004e-07, "loss": 10.671025390625, "step": 300 }, { "epoch": 0.00048265328993073625, "learning_rate": 4.0000000000000003e-07, "loss": 10.47958740234375, "step": 400 }, { "epoch": 0.0006033166124134203, "learning_rate": 5.000000000000001e-07, "loss": 10.36065185546875, "step": 500 }, { "epoch": 0.0007239799348961044, "learning_rate": 6.000000000000001e-07, "loss": 10.27036865234375, "step": 600 }, { "epoch": 0.0008446432573787884, "learning_rate": 7.000000000000001e-07, "loss": 10.198671264648437, "step": 700 }, { "epoch": 0.0009653065798614725, "learning_rate": 8.000000000000001e-07, "loss": 10.139332275390625, "step": 800 }, { "epoch": 0.0010859699023441566, "learning_rate": 9.000000000000001e-07, "loss": 10.094085083007812, "step": 900 }, { "epoch": 0.0012066332248268407, "learning_rate": 1.0000000000000002e-06, "loss": 10.038567504882813, "step": 1000 }, { "epoch": 0.0013272965473095247, "learning_rate": 1.1e-06, "loss": 9.995147705078125, "step": 1100 }, { "epoch": 0.0014479598697922087, "learning_rate": 1.2000000000000002e-06, "loss": 9.927572021484375, "step": 1200 }, { "epoch": 0.0015686231922748927, "learning_rate": 1.3e-06, "loss": 9.875374755859376, "step": 1300 }, { "epoch": 0.0016892865147575768, "learning_rate": 1.4000000000000001e-06, "loss": 9.811220092773437, "step": 1400 }, { "epoch": 0.001809949837240261, "learning_rate": 1.5e-06, "loss": 9.74679931640625, "step": 1500 }, { "epoch": 0.001930613159722945, "learning_rate": 1.6000000000000001e-06, "loss": 9.663087768554687, "step": 1600 }, { "epoch": 0.002051276482205629, "learning_rate": 1.7000000000000002e-06, "loss": 9.591069946289062, "step": 1700 }, { "epoch": 0.0021719398046883133, "learning_rate": 1.8000000000000001e-06, "loss": 9.529061889648437, "step": 1800 }, { "epoch": 0.002292603127170997, "learning_rate": 1.9000000000000002e-06, "loss": 9.4752197265625, "step": 1900 }, { "epoch": 0.0024132664496536813, "learning_rate": 2.0000000000000003e-06, "loss": 9.4010302734375, "step": 2000 }, { "epoch": 0.002533929772136365, "learning_rate": 2.1000000000000002e-06, "loss": 9.35108642578125, "step": 2100 }, { "epoch": 0.0026545930946190494, "learning_rate": 2.2e-06, "loss": 9.2584326171875, "step": 2200 }, { "epoch": 0.002775256417101733, "learning_rate": 2.3000000000000004e-06, "loss": 9.214194946289062, "step": 2300 }, { "epoch": 0.0028959197395844174, "learning_rate": 2.4000000000000003e-06, "loss": 9.132109985351562, "step": 2400 }, { "epoch": 0.0030165830620671017, "learning_rate": 2.5e-06, "loss": 9.047922973632813, "step": 2500 }, { "epoch": 0.0031372463845497855, "learning_rate": 2.6e-06, "loss": 8.99282958984375, "step": 2600 }, { "epoch": 0.0032579097070324697, "learning_rate": 2.7000000000000004e-06, "loss": 8.95028076171875, "step": 2700 }, { "epoch": 0.0033785730295151535, "learning_rate": 2.8000000000000003e-06, "loss": 8.865433349609376, "step": 2800 }, { "epoch": 0.0034992363519978377, "learning_rate": 2.9e-06, "loss": 8.848460083007813, "step": 2900 }, { "epoch": 0.003619899674480522, "learning_rate": 3e-06, "loss": 8.786046752929687, "step": 3000 }, { "epoch": 0.003740562996963206, "learning_rate": 3.1000000000000004e-06, "loss": 8.73739501953125, "step": 3100 }, { "epoch": 0.00386122631944589, "learning_rate": 3.2000000000000003e-06, "loss": 8.654747924804688, "step": 3200 }, { "epoch": 0.003981889641928574, "learning_rate": 3.3000000000000006e-06, "loss": 8.638505859375, "step": 3300 }, { "epoch": 0.004102552964411258, "learning_rate": 3.4000000000000005e-06, "loss": 8.57900390625, "step": 3400 }, { "epoch": 0.004223216286893942, "learning_rate": 3.5e-06, "loss": 8.544164428710937, "step": 3500 }, { "epoch": 0.0043438796093766266, "learning_rate": 3.6000000000000003e-06, "loss": 8.50919189453125, "step": 3600 }, { "epoch": 0.00446454293185931, "learning_rate": 3.7e-06, "loss": 8.48513671875, "step": 3700 }, { "epoch": 0.004585206254341994, "learning_rate": 3.8000000000000005e-06, "loss": 8.434906005859375, "step": 3800 }, { "epoch": 0.004705869576824678, "learning_rate": 3.900000000000001e-06, "loss": 8.401183471679687, "step": 3900 }, { "epoch": 0.004826532899307363, "learning_rate": 4.000000000000001e-06, "loss": 8.37177001953125, "step": 4000 }, { "epoch": 0.0049471962217900465, "learning_rate": 4.1e-06, "loss": 8.339204711914062, "step": 4100 }, { "epoch": 0.00506785954427273, "learning_rate": 4.2000000000000004e-06, "loss": 8.3411181640625, "step": 4200 }, { "epoch": 0.005188522866755415, "learning_rate": 4.3e-06, "loss": 8.30220947265625, "step": 4300 }, { "epoch": 0.005309186189238099, "learning_rate": 4.4e-06, "loss": 8.303151245117187, "step": 4400 }, { "epoch": 0.0054298495117207825, "learning_rate": 4.5e-06, "loss": 8.252617797851563, "step": 4500 }, { "epoch": 0.005550512834203466, "learning_rate": 4.600000000000001e-06, "loss": 8.258956909179688, "step": 4600 }, { "epoch": 0.005671176156686151, "learning_rate": 4.7e-06, "loss": 8.244758911132813, "step": 4700 }, { "epoch": 0.005791839479168835, "learning_rate": 4.800000000000001e-06, "loss": 8.21389404296875, "step": 4800 }, { "epoch": 0.005912502801651519, "learning_rate": 4.9000000000000005e-06, "loss": 8.185855712890625, "step": 4900 }, { "epoch": 0.006033166124134203, "learning_rate": 5e-06, "loss": 8.198721923828124, "step": 5000 }, { "epoch": 0.006153829446616887, "learning_rate": 5.1e-06, "loss": 8.184302368164062, "step": 5100 }, { "epoch": 0.006274492769099571, "learning_rate": 5.2e-06, "loss": 8.141995849609375, "step": 5200 }, { "epoch": 0.006395156091582255, "learning_rate": 5.300000000000001e-06, "loss": 8.149254150390625, "step": 5300 }, { "epoch": 0.006515819414064939, "learning_rate": 5.400000000000001e-06, "loss": 8.134349365234375, "step": 5400 }, { "epoch": 0.006636482736547623, "learning_rate": 5.500000000000001e-06, "loss": 8.126637573242187, "step": 5500 }, { "epoch": 0.006757146059030307, "learning_rate": 5.600000000000001e-06, "loss": 8.11840087890625, "step": 5600 }, { "epoch": 0.006877809381512992, "learning_rate": 5.7e-06, "loss": 8.152865600585937, "step": 5700 }, { "epoch": 0.0069984727039956755, "learning_rate": 5.8e-06, "loss": 8.106795654296874, "step": 5800 }, { "epoch": 0.007119136026478359, "learning_rate": 5.9e-06, "loss": 8.087644653320313, "step": 5900 }, { "epoch": 0.007239799348961044, "learning_rate": 6e-06, "loss": 8.071045532226563, "step": 6000 }, { "epoch": 0.007360462671443728, "learning_rate": 6.1e-06, "loss": 8.07795654296875, "step": 6100 }, { "epoch": 0.007481125993926412, "learning_rate": 6.200000000000001e-06, "loss": 8.07419677734375, "step": 6200 }, { "epoch": 0.007601789316409095, "learning_rate": 6.300000000000001e-06, "loss": 8.054071655273438, "step": 6300 }, { "epoch": 0.00772245263889178, "learning_rate": 6.4000000000000006e-06, "loss": 8.069452514648438, "step": 6400 }, { "epoch": 0.007843115961374464, "learning_rate": 6.5000000000000004e-06, "loss": 8.062046508789063, "step": 6500 }, { "epoch": 0.007963779283857149, "learning_rate": 6.600000000000001e-06, "loss": 8.041135864257813, "step": 6600 }, { "epoch": 0.008084442606339831, "learning_rate": 6.700000000000001e-06, "loss": 8.0472509765625, "step": 6700 }, { "epoch": 0.008205105928822516, "learning_rate": 6.800000000000001e-06, "loss": 8.015521240234374, "step": 6800 }, { "epoch": 0.0083257692513052, "learning_rate": 6.9e-06, "loss": 7.99987060546875, "step": 6900 }, { "epoch": 0.008446432573787884, "learning_rate": 7e-06, "loss": 8.021083374023437, "step": 7000 }, { "epoch": 0.008567095896270568, "learning_rate": 7.100000000000001e-06, "loss": 8.009032592773437, "step": 7100 }, { "epoch": 0.008687759218753253, "learning_rate": 7.2000000000000005e-06, "loss": 7.98518798828125, "step": 7200 }, { "epoch": 0.008808422541235936, "learning_rate": 7.3e-06, "loss": 7.98792724609375, "step": 7300 }, { "epoch": 0.00892908586371862, "learning_rate": 7.4e-06, "loss": 7.98720703125, "step": 7400 }, { "epoch": 0.009049749186201304, "learning_rate": 7.500000000000001e-06, "loss": 7.946220092773437, "step": 7500 }, { "epoch": 0.009170412508683988, "learning_rate": 7.600000000000001e-06, "loss": 7.945390014648438, "step": 7600 }, { "epoch": 0.009291075831166673, "learning_rate": 7.7e-06, "loss": 7.98837158203125, "step": 7700 }, { "epoch": 0.009411739153649356, "learning_rate": 7.800000000000002e-06, "loss": 7.9614019775390625, "step": 7800 }, { "epoch": 0.00953240247613204, "learning_rate": 7.9e-06, "loss": 7.951765747070312, "step": 7900 }, { "epoch": 0.009653065798614725, "learning_rate": 8.000000000000001e-06, "loss": 7.924186401367187, "step": 8000 }, { "epoch": 0.009773729121097408, "learning_rate": 8.1e-06, "loss": 7.929385375976563, "step": 8100 }, { "epoch": 0.009894392443580093, "learning_rate": 8.2e-06, "loss": 7.926139526367187, "step": 8200 }, { "epoch": 0.010015055766062778, "learning_rate": 8.3e-06, "loss": 7.90500244140625, "step": 8300 }, { "epoch": 0.01013571908854546, "learning_rate": 8.400000000000001e-06, "loss": 7.927145385742188, "step": 8400 }, { "epoch": 0.010256382411028145, "learning_rate": 8.5e-06, "loss": 7.9099884033203125, "step": 8500 }, { "epoch": 0.01037704573351083, "learning_rate": 8.6e-06, "loss": 7.90431640625, "step": 8600 }, { "epoch": 0.010497709055993513, "learning_rate": 8.700000000000001e-06, "loss": 7.885325927734375, "step": 8700 }, { "epoch": 0.010618372378476197, "learning_rate": 8.8e-06, "loss": 7.895731201171875, "step": 8800 }, { "epoch": 0.01073903570095888, "learning_rate": 8.900000000000001e-06, "loss": 7.873722534179688, "step": 8900 }, { "epoch": 0.010859699023441565, "learning_rate": 9e-06, "loss": 7.867328491210937, "step": 9000 }, { "epoch": 0.01098036234592425, "learning_rate": 9.100000000000001e-06, "loss": 7.870953369140625, "step": 9100 }, { "epoch": 0.011101025668406933, "learning_rate": 9.200000000000002e-06, "loss": 7.89510498046875, "step": 9200 }, { "epoch": 0.011221688990889617, "learning_rate": 9.3e-06, "loss": 7.866868896484375, "step": 9300 }, { "epoch": 0.011342352313372302, "learning_rate": 9.4e-06, "loss": 7.843492431640625, "step": 9400 }, { "epoch": 0.011463015635854985, "learning_rate": 9.5e-06, "loss": 7.845059204101562, "step": 9500 }, { "epoch": 0.01158367895833767, "learning_rate": 9.600000000000001e-06, "loss": 7.835038452148438, "step": 9600 }, { "epoch": 0.011704342280820354, "learning_rate": 9.7e-06, "loss": 7.848790893554687, "step": 9700 }, { "epoch": 0.011825005603303037, "learning_rate": 9.800000000000001e-06, "loss": 7.842159423828125, "step": 9800 }, { "epoch": 0.011945668925785722, "learning_rate": 9.9e-06, "loss": 7.8275146484375, "step": 9900 }, { "epoch": 0.012066332248268407, "learning_rate": 1e-05, "loss": 7.826830444335937, "step": 10000 }, { "epoch": 0.01218699557075109, "learning_rate": 9.999596164532263e-06, "loss": 7.812598876953125, "step": 10100 }, { "epoch": 0.012307658893233774, "learning_rate": 9.999192329064525e-06, "loss": 7.807442626953125, "step": 10200 }, { "epoch": 0.012428322215716459, "learning_rate": 9.998788493596787e-06, "loss": 7.79939697265625, "step": 10300 }, { "epoch": 0.012548985538199142, "learning_rate": 9.998384658129047e-06, "loss": 7.804387817382812, "step": 10400 }, { "epoch": 0.012669648860681827, "learning_rate": 9.997980822661309e-06, "loss": 7.799457397460937, "step": 10500 }, { "epoch": 0.01279031218316451, "learning_rate": 9.99757698719357e-06, "loss": 7.800637817382812, "step": 10600 }, { "epoch": 0.012910975505647194, "learning_rate": 9.997173151725831e-06, "loss": 7.776885986328125, "step": 10700 }, { "epoch": 0.013031638828129879, "learning_rate": 9.996769316258093e-06, "loss": 7.790662231445313, "step": 10800 }, { "epoch": 0.013152302150612562, "learning_rate": 9.996365480790355e-06, "loss": 7.780765991210938, "step": 10900 }, { "epoch": 0.013272965473095246, "learning_rate": 9.995961645322617e-06, "loss": 7.776314697265625, "step": 11000 }, { "epoch": 0.013393628795577931, "learning_rate": 9.99555780985488e-06, "loss": 7.753301391601562, "step": 11100 }, { "epoch": 0.013514292118060614, "learning_rate": 9.995153974387141e-06, "loss": 7.774302368164062, "step": 11200 }, { "epoch": 0.013634955440543299, "learning_rate": 9.994750138919402e-06, "loss": 7.761792602539063, "step": 11300 }, { "epoch": 0.013755618763025983, "learning_rate": 9.994346303451663e-06, "loss": 7.756895751953125, "step": 11400 }, { "epoch": 0.013876282085508666, "learning_rate": 9.993942467983925e-06, "loss": 7.756287231445312, "step": 11500 }, { "epoch": 0.013996945407991351, "learning_rate": 9.993538632516186e-06, "loss": 7.74819580078125, "step": 11600 }, { "epoch": 0.014117608730474036, "learning_rate": 9.993134797048448e-06, "loss": 7.748518676757812, "step": 11700 }, { "epoch": 0.014238272052956719, "learning_rate": 9.99273096158071e-06, "loss": 7.73031005859375, "step": 11800 }, { "epoch": 0.014358935375439403, "learning_rate": 9.992327126112972e-06, "loss": 7.731920776367187, "step": 11900 }, { "epoch": 0.014479598697922088, "learning_rate": 9.991923290645234e-06, "loss": 7.719931030273438, "step": 12000 }, { "epoch": 0.014600262020404771, "learning_rate": 9.991519455177494e-06, "loss": 7.723886108398437, "step": 12100 }, { "epoch": 0.014720925342887456, "learning_rate": 9.991115619709756e-06, "loss": 7.706294555664062, "step": 12200 }, { "epoch": 0.014841588665370139, "learning_rate": 9.990711784242018e-06, "loss": 7.7386846923828125, "step": 12300 }, { "epoch": 0.014962251987852823, "learning_rate": 9.99030794877428e-06, "loss": 7.722437744140625, "step": 12400 }, { "epoch": 0.015082915310335508, "learning_rate": 9.989904113306542e-06, "loss": 7.702894287109375, "step": 12500 }, { "epoch": 0.01520357863281819, "learning_rate": 9.989500277838802e-06, "loss": 7.699403076171875, "step": 12600 }, { "epoch": 0.015324241955300875, "learning_rate": 9.989096442371064e-06, "loss": 7.70286865234375, "step": 12700 }, { "epoch": 0.01544490527778356, "learning_rate": 9.988692606903326e-06, "loss": 7.727252197265625, "step": 12800 }, { "epoch": 0.015565568600266243, "learning_rate": 9.988288771435586e-06, "loss": 7.681318969726562, "step": 12900 }, { "epoch": 0.015686231922748928, "learning_rate": 9.987884935967848e-06, "loss": 7.681355590820313, "step": 13000 }, { "epoch": 0.01580689524523161, "learning_rate": 9.98748110050011e-06, "loss": 7.669380493164063, "step": 13100 }, { "epoch": 0.015927558567714297, "learning_rate": 9.987077265032372e-06, "loss": 7.691492309570313, "step": 13200 }, { "epoch": 0.01604822189019698, "learning_rate": 9.986673429564634e-06, "loss": 7.735159301757813, "step": 13300 }, { "epoch": 0.016168885212679663, "learning_rate": 9.986269594096896e-06, "loss": 7.67091552734375, "step": 13400 }, { "epoch": 0.01628954853516235, "learning_rate": 9.985865758629157e-06, "loss": 7.673142700195313, "step": 13500 }, { "epoch": 0.016410211857645032, "learning_rate": 9.985461923161419e-06, "loss": 7.694071044921875, "step": 13600 }, { "epoch": 0.016530875180127715, "learning_rate": 9.98505808769368e-06, "loss": 7.685897216796875, "step": 13700 }, { "epoch": 0.0166515385026104, "learning_rate": 9.984654252225941e-06, "loss": 7.67085693359375, "step": 13800 }, { "epoch": 0.016772201825093085, "learning_rate": 9.984250416758203e-06, "loss": 7.652900390625, "step": 13900 }, { "epoch": 0.016892865147575768, "learning_rate": 9.983846581290465e-06, "loss": 7.666927490234375, "step": 14000 }, { "epoch": 0.017013528470058454, "learning_rate": 9.983442745822727e-06, "loss": 7.651405029296875, "step": 14100 }, { "epoch": 0.017134191792541137, "learning_rate": 9.983038910354989e-06, "loss": 7.638584594726563, "step": 14200 }, { "epoch": 0.01725485511502382, "learning_rate": 9.98263507488725e-06, "loss": 7.643876953125, "step": 14300 }, { "epoch": 0.017375518437506506, "learning_rate": 9.982231239419513e-06, "loss": 7.6271630859375, "step": 14400 }, { "epoch": 0.01749618175998919, "learning_rate": 9.981827403951773e-06, "loss": 7.63806884765625, "step": 14500 }, { "epoch": 0.017616845082471872, "learning_rate": 9.981423568484035e-06, "loss": 7.62742919921875, "step": 14600 }, { "epoch": 0.017737508404954555, "learning_rate": 9.981019733016295e-06, "loss": 7.642492065429687, "step": 14700 }, { "epoch": 0.01785817172743724, "learning_rate": 9.980615897548557e-06, "loss": 7.6192822265625, "step": 14800 }, { "epoch": 0.017978835049919924, "learning_rate": 9.98021206208082e-06, "loss": 7.607686157226563, "step": 14900 }, { "epoch": 0.018099498372402607, "learning_rate": 9.979808226613081e-06, "loss": 7.62489501953125, "step": 15000 }, { "epoch": 0.018220161694885294, "learning_rate": 9.979404391145343e-06, "loss": 7.608429565429687, "step": 15100 }, { "epoch": 0.018340825017367977, "learning_rate": 9.979000555677605e-06, "loss": 7.597339477539062, "step": 15200 }, { "epoch": 0.01846148833985066, "learning_rate": 9.978596720209867e-06, "loss": 7.593267211914062, "step": 15300 }, { "epoch": 0.018582151662333346, "learning_rate": 9.978192884742128e-06, "loss": 7.600186157226562, "step": 15400 }, { "epoch": 0.01870281498481603, "learning_rate": 9.97778904927439e-06, "loss": 7.575609130859375, "step": 15500 }, { "epoch": 0.018823478307298712, "learning_rate": 9.977385213806652e-06, "loss": 7.578140869140625, "step": 15600 }, { "epoch": 0.0189441416297814, "learning_rate": 9.976981378338912e-06, "loss": 7.588411865234375, "step": 15700 }, { "epoch": 0.01906480495226408, "learning_rate": 9.976577542871174e-06, "loss": 7.566851806640625, "step": 15800 }, { "epoch": 0.019185468274746764, "learning_rate": 9.976173707403436e-06, "loss": 7.549029541015625, "step": 15900 }, { "epoch": 0.01930613159722945, "learning_rate": 9.975769871935698e-06, "loss": 7.562918701171875, "step": 16000 }, { "epoch": 0.019426794919712134, "learning_rate": 9.97536603646796e-06, "loss": 7.537685546875, "step": 16100 }, { "epoch": 0.019547458242194816, "learning_rate": 9.97496220100022e-06, "loss": 7.517478637695312, "step": 16200 }, { "epoch": 0.019668121564677503, "learning_rate": 9.974558365532482e-06, "loss": 7.5180731201171875, "step": 16300 }, { "epoch": 0.019788784887160186, "learning_rate": 9.974154530064744e-06, "loss": 7.493146362304688, "step": 16400 }, { "epoch": 0.01990944820964287, "learning_rate": 9.973750694597006e-06, "loss": 7.484447021484375, "step": 16500 }, { "epoch": 0.020030111532125555, "learning_rate": 9.973346859129266e-06, "loss": 7.502681274414062, "step": 16600 }, { "epoch": 0.020150774854608238, "learning_rate": 9.972943023661528e-06, "loss": 7.45322998046875, "step": 16700 }, { "epoch": 0.02027143817709092, "learning_rate": 9.97253918819379e-06, "loss": 7.495328369140625, "step": 16800 }, { "epoch": 0.020392101499573607, "learning_rate": 9.972135352726052e-06, "loss": 7.466298828125, "step": 16900 }, { "epoch": 0.02051276482205629, "learning_rate": 9.971731517258312e-06, "loss": 7.4412060546875, "step": 17000 }, { "epoch": 0.020633428144538973, "learning_rate": 9.971327681790574e-06, "loss": 7.4665283203125, "step": 17100 }, { "epoch": 0.02075409146702166, "learning_rate": 9.970923846322836e-06, "loss": 7.432006225585938, "step": 17200 }, { "epoch": 0.020874754789504343, "learning_rate": 9.970520010855098e-06, "loss": 7.4205126953125, "step": 17300 }, { "epoch": 0.020995418111987026, "learning_rate": 9.97011617538736e-06, "loss": 7.412860107421875, "step": 17400 }, { "epoch": 0.021116081434469712, "learning_rate": 9.969712339919622e-06, "loss": 7.390285034179687, "step": 17500 }, { "epoch": 0.021236744756952395, "learning_rate": 9.969308504451883e-06, "loss": 7.388471069335938, "step": 17600 }, { "epoch": 0.021357408079435078, "learning_rate": 9.968904668984145e-06, "loss": 7.357642822265625, "step": 17700 }, { "epoch": 0.02147807140191776, "learning_rate": 9.968500833516405e-06, "loss": 7.374608154296875, "step": 17800 }, { "epoch": 0.021598734724400447, "learning_rate": 9.968096998048667e-06, "loss": 7.348936767578125, "step": 17900 }, { "epoch": 0.02171939804688313, "learning_rate": 9.967693162580929e-06, "loss": 7.326118774414063, "step": 18000 }, { "epoch": 0.021840061369365813, "learning_rate": 9.967289327113191e-06, "loss": 7.3109765625, "step": 18100 }, { "epoch": 0.0219607246918485, "learning_rate": 9.966885491645453e-06, "loss": 7.311011962890625, "step": 18200 }, { "epoch": 0.022081388014331182, "learning_rate": 9.966481656177715e-06, "loss": 7.274530029296875, "step": 18300 }, { "epoch": 0.022202051336813865, "learning_rate": 9.966077820709977e-06, "loss": 7.23897705078125, "step": 18400 }, { "epoch": 0.022322714659296552, "learning_rate": 9.965673985242237e-06, "loss": 7.2407861328125, "step": 18500 }, { "epoch": 0.022443377981779235, "learning_rate": 9.965270149774499e-06, "loss": 7.240975341796875, "step": 18600 }, { "epoch": 0.022564041304261918, "learning_rate": 9.964866314306761e-06, "loss": 7.222609252929687, "step": 18700 }, { "epoch": 0.022684704626744604, "learning_rate": 9.964462478839021e-06, "loss": 7.2113800048828125, "step": 18800 }, { "epoch": 0.022805367949227287, "learning_rate": 9.964058643371283e-06, "loss": 7.19686767578125, "step": 18900 }, { "epoch": 0.02292603127170997, "learning_rate": 9.963654807903545e-06, "loss": 7.1889306640625, "step": 19000 }, { "epoch": 0.023046694594192656, "learning_rate": 9.963250972435807e-06, "loss": 7.175922241210937, "step": 19100 }, { "epoch": 0.02316735791667534, "learning_rate": 9.96284713696807e-06, "loss": 7.178650512695312, "step": 19200 }, { "epoch": 0.023288021239158022, "learning_rate": 9.962443301500331e-06, "loss": 7.181878662109375, "step": 19300 }, { "epoch": 0.02340868456164071, "learning_rate": 9.962039466032592e-06, "loss": 7.137700805664062, "step": 19400 }, { "epoch": 0.02352934788412339, "learning_rate": 9.961635630564854e-06, "loss": 7.1376220703125, "step": 19500 }, { "epoch": 0.023650011206606075, "learning_rate": 9.961231795097116e-06, "loss": 7.112848510742188, "step": 19600 }, { "epoch": 0.02377067452908876, "learning_rate": 9.960827959629376e-06, "loss": 7.077623291015625, "step": 19700 }, { "epoch": 0.023891337851571444, "learning_rate": 9.960424124161638e-06, "loss": 7.10410888671875, "step": 19800 }, { "epoch": 0.024012001174054127, "learning_rate": 9.9600202886939e-06, "loss": 7.04318359375, "step": 19900 }, { "epoch": 0.024132664496536813, "learning_rate": 9.959616453226162e-06, "loss": 7.05190185546875, "step": 20000 }, { "epoch": 0.024253327819019496, "learning_rate": 9.959212617758424e-06, "loss": 7.062595825195313, "step": 20100 }, { "epoch": 0.02437399114150218, "learning_rate": 9.958808782290684e-06, "loss": 7.040302734375, "step": 20200 }, { "epoch": 0.024494654463984866, "learning_rate": 9.958404946822946e-06, "loss": 7.060929565429688, "step": 20300 }, { "epoch": 0.02461531778646755, "learning_rate": 9.958001111355208e-06, "loss": 7.056749267578125, "step": 20400 }, { "epoch": 0.02473598110895023, "learning_rate": 9.95759727588747e-06, "loss": 7.02091796875, "step": 20500 }, { "epoch": 0.024856644431432918, "learning_rate": 9.957193440419732e-06, "loss": 7.011871337890625, "step": 20600 }, { "epoch": 0.0249773077539156, "learning_rate": 9.956789604951992e-06, "loss": 7.002923583984375, "step": 20700 }, { "epoch": 0.025097971076398284, "learning_rate": 9.956385769484254e-06, "loss": 6.983974609375, "step": 20800 }, { "epoch": 0.025218634398880967, "learning_rate": 9.955981934016516e-06, "loss": 6.9759765625, "step": 20900 }, { "epoch": 0.025339297721363653, "learning_rate": 9.955578098548778e-06, "loss": 6.959908447265625, "step": 21000 }, { "epoch": 0.025459961043846336, "learning_rate": 9.955174263081039e-06, "loss": 6.96692626953125, "step": 21100 }, { "epoch": 0.02558062436632902, "learning_rate": 9.9547704276133e-06, "loss": 6.933953857421875, "step": 21200 }, { "epoch": 0.025701287688811705, "learning_rate": 9.954366592145562e-06, "loss": 6.96384033203125, "step": 21300 }, { "epoch": 0.02582195101129439, "learning_rate": 9.953962756677824e-06, "loss": 6.8951177978515625, "step": 21400 }, { "epoch": 0.02594261433377707, "learning_rate": 9.953558921210086e-06, "loss": 6.91238037109375, "step": 21500 }, { "epoch": 0.026063277656259758, "learning_rate": 9.953155085742347e-06, "loss": 6.896270141601563, "step": 21600 }, { "epoch": 0.02618394097874244, "learning_rate": 9.952751250274609e-06, "loss": 6.896909790039063, "step": 21700 }, { "epoch": 0.026304604301225123, "learning_rate": 9.95234741480687e-06, "loss": 6.881757202148438, "step": 21800 }, { "epoch": 0.02642526762370781, "learning_rate": 9.951943579339131e-06, "loss": 6.8531689453125, "step": 21900 }, { "epoch": 0.026545930946190493, "learning_rate": 9.951539743871393e-06, "loss": 6.872998046875, "step": 22000 }, { "epoch": 0.026666594268673176, "learning_rate": 9.951135908403655e-06, "loss": 6.854584350585937, "step": 22100 }, { "epoch": 0.026787257591155862, "learning_rate": 9.950732072935917e-06, "loss": 6.827476806640625, "step": 22200 }, { "epoch": 0.026907920913638545, "learning_rate": 9.950328237468179e-06, "loss": 6.831190185546875, "step": 22300 }, { "epoch": 0.027028584236121228, "learning_rate": 9.949924402000441e-06, "loss": 6.7924261474609375, "step": 22400 }, { "epoch": 0.027149247558603914, "learning_rate": 9.949520566532703e-06, "loss": 6.790482177734375, "step": 22500 }, { "epoch": 0.027269910881086597, "learning_rate": 9.949116731064963e-06, "loss": 6.803350219726562, "step": 22600 }, { "epoch": 0.02739057420356928, "learning_rate": 9.948712895597225e-06, "loss": 6.785421752929688, "step": 22700 }, { "epoch": 0.027511237526051967, "learning_rate": 9.948309060129485e-06, "loss": 6.777293701171875, "step": 22800 }, { "epoch": 0.02763190084853465, "learning_rate": 9.947905224661747e-06, "loss": 6.767362060546875, "step": 22900 }, { "epoch": 0.027752564171017333, "learning_rate": 9.94750138919401e-06, "loss": 6.742926025390625, "step": 23000 }, { "epoch": 0.02787322749350002, "learning_rate": 9.947097553726271e-06, "loss": 6.78175048828125, "step": 23100 }, { "epoch": 0.027993890815982702, "learning_rate": 9.946693718258533e-06, "loss": 6.729476318359375, "step": 23200 }, { "epoch": 0.028114554138465385, "learning_rate": 9.946289882790795e-06, "loss": 6.729383544921875, "step": 23300 }, { "epoch": 0.02823521746094807, "learning_rate": 9.945886047323057e-06, "loss": 6.723148193359375, "step": 23400 }, { "epoch": 0.028355880783430754, "learning_rate": 9.945482211855318e-06, "loss": 6.739766235351563, "step": 23500 }, { "epoch": 0.028476544105913437, "learning_rate": 9.94507837638758e-06, "loss": 6.685776977539063, "step": 23600 }, { "epoch": 0.028597207428396124, "learning_rate": 9.944674540919842e-06, "loss": 6.71983154296875, "step": 23700 }, { "epoch": 0.028717870750878807, "learning_rate": 9.944270705452102e-06, "loss": 6.673611450195312, "step": 23800 }, { "epoch": 0.02883853407336149, "learning_rate": 9.943866869984364e-06, "loss": 6.659153442382813, "step": 23900 }, { "epoch": 0.028959197395844176, "learning_rate": 9.943463034516626e-06, "loss": 6.669003295898437, "step": 24000 }, { "epoch": 0.02907986071832686, "learning_rate": 9.943059199048888e-06, "loss": 6.634718017578125, "step": 24100 }, { "epoch": 0.029200524040809542, "learning_rate": 9.94265536358115e-06, "loss": 6.655950317382812, "step": 24200 }, { "epoch": 0.029321187363292225, "learning_rate": 9.94225152811341e-06, "loss": 6.658018188476563, "step": 24300 }, { "epoch": 0.02944185068577491, "learning_rate": 9.941847692645672e-06, "loss": 6.616795654296875, "step": 24400 }, { "epoch": 0.029562514008257594, "learning_rate": 9.941443857177934e-06, "loss": 6.64441650390625, "step": 24500 }, { "epoch": 0.029683177330740277, "learning_rate": 9.941040021710196e-06, "loss": 6.600654907226563, "step": 24600 }, { "epoch": 0.029803840653222963, "learning_rate": 9.940636186242458e-06, "loss": 6.606512451171875, "step": 24700 }, { "epoch": 0.029924503975705646, "learning_rate": 9.940232350774718e-06, "loss": 6.615017700195312, "step": 24800 }, { "epoch": 0.03004516729818833, "learning_rate": 9.93982851530698e-06, "loss": 6.570202026367188, "step": 24900 }, { "epoch": 0.030165830620671016, "learning_rate": 9.939424679839242e-06, "loss": 6.583402099609375, "step": 25000 }, { "epoch": 0.0302864939431537, "learning_rate": 9.939020844371503e-06, "loss": 6.571268310546875, "step": 25100 }, { "epoch": 0.03040715726563638, "learning_rate": 9.938617008903765e-06, "loss": 6.569072265625, "step": 25200 }, { "epoch": 0.030527820588119068, "learning_rate": 9.938213173436027e-06, "loss": 6.567750244140625, "step": 25300 }, { "epoch": 0.03064848391060175, "learning_rate": 9.937809337968289e-06, "loss": 6.578480834960938, "step": 25400 }, { "epoch": 0.030769147233084434, "learning_rate": 9.93740550250055e-06, "loss": 6.548373413085938, "step": 25500 }, { "epoch": 0.03088981055556712, "learning_rate": 9.937001667032812e-06, "loss": 6.56265380859375, "step": 25600 }, { "epoch": 0.031010473878049803, "learning_rate": 9.936597831565073e-06, "loss": 6.53989501953125, "step": 25700 }, { "epoch": 0.031131137200532486, "learning_rate": 9.936193996097335e-06, "loss": 6.511539916992188, "step": 25800 }, { "epoch": 0.03125180052301517, "learning_rate": 9.935790160629597e-06, "loss": 6.52816650390625, "step": 25900 }, { "epoch": 0.031372463845497855, "learning_rate": 9.935386325161857e-06, "loss": 6.500388793945312, "step": 26000 }, { "epoch": 0.03149312716798054, "learning_rate": 9.934982489694119e-06, "loss": 6.523255004882812, "step": 26100 }, { "epoch": 0.03161379049046322, "learning_rate": 9.934578654226381e-06, "loss": 6.49367919921875, "step": 26200 }, { "epoch": 0.03173445381294591, "learning_rate": 9.934174818758643e-06, "loss": 6.478309326171875, "step": 26300 }, { "epoch": 0.031855117135428594, "learning_rate": 9.933770983290905e-06, "loss": 6.448147583007812, "step": 26400 }, { "epoch": 0.031975780457911274, "learning_rate": 9.933367147823167e-06, "loss": 6.495176391601563, "step": 26500 }, { "epoch": 0.03209644378039396, "learning_rate": 9.932963312355429e-06, "loss": 6.46186767578125, "step": 26600 }, { "epoch": 0.032217107102876646, "learning_rate": 9.93255947688769e-06, "loss": 6.471776123046875, "step": 26700 }, { "epoch": 0.032337770425359326, "learning_rate": 9.932155641419951e-06, "loss": 6.472383422851562, "step": 26800 }, { "epoch": 0.03245843374784201, "learning_rate": 9.931751805952211e-06, "loss": 6.4738720703125, "step": 26900 }, { "epoch": 0.0325790970703247, "learning_rate": 9.931347970484473e-06, "loss": 6.445848999023437, "step": 27000 }, { "epoch": 0.03269976039280738, "learning_rate": 9.930944135016735e-06, "loss": 6.462876586914063, "step": 27100 }, { "epoch": 0.032820423715290065, "learning_rate": 9.930540299548997e-06, "loss": 6.435804443359375, "step": 27200 }, { "epoch": 0.03294108703777275, "learning_rate": 9.93013646408126e-06, "loss": 6.43695068359375, "step": 27300 }, { "epoch": 0.03306175036025543, "learning_rate": 9.929732628613521e-06, "loss": 6.411896362304687, "step": 27400 }, { "epoch": 0.03318241368273812, "learning_rate": 9.929328793145783e-06, "loss": 6.4326409912109375, "step": 27500 }, { "epoch": 0.0333030770052208, "learning_rate": 9.928924957678044e-06, "loss": 6.415225830078125, "step": 27600 }, { "epoch": 0.03342374032770348, "learning_rate": 9.928521122210306e-06, "loss": 6.409244384765625, "step": 27700 }, { "epoch": 0.03354440365018617, "learning_rate": 9.928117286742568e-06, "loss": 6.386112060546875, "step": 27800 }, { "epoch": 0.033665066972668856, "learning_rate": 9.927713451274828e-06, "loss": 6.3937005615234375, "step": 27900 }, { "epoch": 0.033785730295151535, "learning_rate": 9.92730961580709e-06, "loss": 6.390086059570312, "step": 28000 }, { "epoch": 0.03390639361763422, "learning_rate": 9.926905780339352e-06, "loss": 6.386889038085937, "step": 28100 }, { "epoch": 0.03402705694011691, "learning_rate": 9.926501944871614e-06, "loss": 6.370198974609375, "step": 28200 }, { "epoch": 0.03414772026259959, "learning_rate": 9.926098109403876e-06, "loss": 6.3718328857421875, "step": 28300 }, { "epoch": 0.034268383585082274, "learning_rate": 9.925694273936136e-06, "loss": 6.381991577148438, "step": 28400 }, { "epoch": 0.03438904690756496, "learning_rate": 9.925290438468398e-06, "loss": 6.355091552734375, "step": 28500 }, { "epoch": 0.03450971023004764, "learning_rate": 9.92488660300066e-06, "loss": 6.332806396484375, "step": 28600 }, { "epoch": 0.034630373552530326, "learning_rate": 9.924482767532922e-06, "loss": 6.320509643554687, "step": 28700 }, { "epoch": 0.03475103687501301, "learning_rate": 9.924078932065182e-06, "loss": 6.34507080078125, "step": 28800 }, { "epoch": 0.03487170019749569, "learning_rate": 9.923675096597444e-06, "loss": 6.32692626953125, "step": 28900 }, { "epoch": 0.03499236351997838, "learning_rate": 9.923271261129706e-06, "loss": 6.352927856445312, "step": 29000 }, { "epoch": 0.03511302684246106, "learning_rate": 9.922867425661968e-06, "loss": 6.342001953125, "step": 29100 }, { "epoch": 0.035233690164943744, "learning_rate": 9.922463590194229e-06, "loss": 6.319302368164062, "step": 29200 }, { "epoch": 0.03535435348742643, "learning_rate": 9.92205975472649e-06, "loss": 6.307904052734375, "step": 29300 }, { "epoch": 0.03547501680990911, "learning_rate": 9.921655919258753e-06, "loss": 6.295087280273438, "step": 29400 }, { "epoch": 0.035595680132391797, "learning_rate": 9.921252083791015e-06, "loss": 6.290713500976563, "step": 29500 }, { "epoch": 0.03571634345487448, "learning_rate": 9.920848248323277e-06, "loss": 6.285931396484375, "step": 29600 }, { "epoch": 0.03583700677735716, "learning_rate": 9.920444412855539e-06, "loss": 6.309791870117188, "step": 29700 }, { "epoch": 0.03595767009983985, "learning_rate": 9.920040577387799e-06, "loss": 6.302537841796875, "step": 29800 }, { "epoch": 0.036078333422322535, "learning_rate": 9.91963674192006e-06, "loss": 6.308652954101563, "step": 29900 }, { "epoch": 0.036198996744805215, "learning_rate": 9.919232906452321e-06, "loss": 6.258733520507812, "step": 30000 }, { "epoch": 0.0363196600672879, "learning_rate": 9.918829070984583e-06, "loss": 6.288374633789062, "step": 30100 }, { "epoch": 0.03644032338977059, "learning_rate": 9.918425235516845e-06, "loss": 6.268796997070313, "step": 30200 }, { "epoch": 0.03656098671225327, "learning_rate": 9.918021400049107e-06, "loss": 6.256526489257812, "step": 30300 }, { "epoch": 0.03668165003473595, "learning_rate": 9.917617564581369e-06, "loss": 6.274508056640625, "step": 30400 }, { "epoch": 0.03680231335721864, "learning_rate": 9.917213729113631e-06, "loss": 6.27301025390625, "step": 30500 }, { "epoch": 0.03692297667970132, "learning_rate": 9.916809893645893e-06, "loss": 6.24278076171875, "step": 30600 }, { "epoch": 0.037043640002184006, "learning_rate": 9.916406058178153e-06, "loss": 6.2477734375, "step": 30700 }, { "epoch": 0.03716430332466669, "learning_rate": 9.916002222710415e-06, "loss": 6.243428955078125, "step": 30800 }, { "epoch": 0.03728496664714937, "learning_rate": 9.915598387242677e-06, "loss": 6.238870239257812, "step": 30900 }, { "epoch": 0.03740562996963206, "learning_rate": 9.915194551774938e-06, "loss": 6.225955810546875, "step": 31000 }, { "epoch": 0.037526293292114744, "learning_rate": 9.9147907163072e-06, "loss": 6.218800659179688, "step": 31100 }, { "epoch": 0.037646956614597424, "learning_rate": 9.914386880839461e-06, "loss": 6.21949462890625, "step": 31200 }, { "epoch": 0.03776761993708011, "learning_rate": 9.913983045371723e-06, "loss": 6.182770385742187, "step": 31300 }, { "epoch": 0.0378882832595628, "learning_rate": 9.913579209903985e-06, "loss": 6.196390991210937, "step": 31400 }, { "epoch": 0.038008946582045476, "learning_rate": 9.913175374436247e-06, "loss": 6.185361328125, "step": 31500 }, { "epoch": 0.03812960990452816, "learning_rate": 9.91277153896851e-06, "loss": 6.214140014648438, "step": 31600 }, { "epoch": 0.03825027322701085, "learning_rate": 9.91236770350077e-06, "loss": 6.208532104492187, "step": 31700 }, { "epoch": 0.03837093654949353, "learning_rate": 9.911963868033032e-06, "loss": 6.163168334960938, "step": 31800 }, { "epoch": 0.038491599871976215, "learning_rate": 9.911560032565292e-06, "loss": 6.170020751953125, "step": 31900 }, { "epoch": 0.0386122631944589, "learning_rate": 9.911156197097554e-06, "loss": 6.167660522460937, "step": 32000 }, { "epoch": 0.03873292651694158, "learning_rate": 9.910752361629816e-06, "loss": 6.15995361328125, "step": 32100 }, { "epoch": 0.03885358983942427, "learning_rate": 9.910348526162078e-06, "loss": 6.178750610351562, "step": 32200 }, { "epoch": 0.038974253161906953, "learning_rate": 9.90994469069434e-06, "loss": 6.160189208984375, "step": 32300 }, { "epoch": 0.03909491648438963, "learning_rate": 9.909540855226602e-06, "loss": 6.1517181396484375, "step": 32400 }, { "epoch": 0.03921557980687232, "learning_rate": 9.909137019758862e-06, "loss": 6.173123168945312, "step": 32500 }, { "epoch": 0.039336243129355006, "learning_rate": 9.908733184291124e-06, "loss": 6.134052124023437, "step": 32600 }, { "epoch": 0.039456906451837685, "learning_rate": 9.908329348823386e-06, "loss": 6.1498785400390625, "step": 32700 }, { "epoch": 0.03957756977432037, "learning_rate": 9.907925513355648e-06, "loss": 6.165042724609375, "step": 32800 }, { "epoch": 0.03969823309680306, "learning_rate": 9.907521677887908e-06, "loss": 6.1348779296875, "step": 32900 }, { "epoch": 0.03981889641928574, "learning_rate": 9.90711784242017e-06, "loss": 6.134515991210938, "step": 33000 }, { "epoch": 0.039939559741768424, "learning_rate": 9.906714006952432e-06, "loss": 6.169119873046875, "step": 33100 }, { "epoch": 0.04006022306425111, "learning_rate": 9.906310171484694e-06, "loss": 6.122115478515625, "step": 33200 }, { "epoch": 0.04018088638673379, "learning_rate": 9.905906336016955e-06, "loss": 6.1315069580078125, "step": 33300 }, { "epoch": 0.040301549709216476, "learning_rate": 9.905502500549217e-06, "loss": 6.11522216796875, "step": 33400 }, { "epoch": 0.04042221303169916, "learning_rate": 9.905098665081479e-06, "loss": 6.1282586669921875, "step": 33500 }, { "epoch": 0.04054287635418184, "learning_rate": 9.90469482961374e-06, "loss": 6.114356689453125, "step": 33600 }, { "epoch": 0.04066353967666453, "learning_rate": 9.904290994146003e-06, "loss": 6.118187255859375, "step": 33700 }, { "epoch": 0.040784202999147215, "learning_rate": 9.903887158678263e-06, "loss": 6.131346435546875, "step": 33800 }, { "epoch": 0.040904866321629894, "learning_rate": 9.903483323210525e-06, "loss": 6.07158447265625, "step": 33900 }, { "epoch": 0.04102552964411258, "learning_rate": 9.903079487742787e-06, "loss": 6.1041943359375, "step": 34000 }, { "epoch": 0.04114619296659527, "learning_rate": 9.902675652275047e-06, "loss": 6.083723754882812, "step": 34100 }, { "epoch": 0.04126685628907795, "learning_rate": 9.902271816807309e-06, "loss": 6.080000610351562, "step": 34200 }, { "epoch": 0.04138751961156063, "learning_rate": 9.901867981339571e-06, "loss": 6.075195922851562, "step": 34300 }, { "epoch": 0.04150818293404332, "learning_rate": 9.901464145871833e-06, "loss": 6.10289306640625, "step": 34400 }, { "epoch": 0.041628846256526, "learning_rate": 9.901060310404095e-06, "loss": 6.061969604492187, "step": 34500 }, { "epoch": 0.041749509579008685, "learning_rate": 9.900656474936357e-06, "loss": 6.068685302734375, "step": 34600 }, { "epoch": 0.04187017290149137, "learning_rate": 9.900252639468619e-06, "loss": 6.074742431640625, "step": 34700 }, { "epoch": 0.04199083622397405, "learning_rate": 9.89984880400088e-06, "loss": 6.040508422851563, "step": 34800 }, { "epoch": 0.04211149954645674, "learning_rate": 9.899444968533141e-06, "loss": 6.060413208007812, "step": 34900 }, { "epoch": 0.042232162868939424, "learning_rate": 9.899041133065402e-06, "loss": 6.077679443359375, "step": 35000 }, { "epoch": 0.042352826191422104, "learning_rate": 9.898637297597664e-06, "loss": 6.033153076171875, "step": 35100 }, { "epoch": 0.04247348951390479, "learning_rate": 9.898233462129926e-06, "loss": 6.03320556640625, "step": 35200 }, { "epoch": 0.04259415283638747, "learning_rate": 9.897829626662188e-06, "loss": 6.057587280273437, "step": 35300 }, { "epoch": 0.042714816158870156, "learning_rate": 9.89742579119445e-06, "loss": 6.067791748046875, "step": 35400 }, { "epoch": 0.04283547948135284, "learning_rate": 9.897021955726711e-06, "loss": 6.061552124023438, "step": 35500 }, { "epoch": 0.04295614280383552, "learning_rate": 9.896618120258973e-06, "loss": 6.047073974609375, "step": 35600 }, { "epoch": 0.04307680612631821, "learning_rate": 9.896214284791234e-06, "loss": 6.028131103515625, "step": 35700 }, { "epoch": 0.043197469448800895, "learning_rate": 9.895810449323496e-06, "loss": 6.0347705078125, "step": 35800 }, { "epoch": 0.043318132771283574, "learning_rate": 9.895406613855758e-06, "loss": 6.010587768554688, "step": 35900 }, { "epoch": 0.04343879609376626, "learning_rate": 9.895002778388018e-06, "loss": 6.03420166015625, "step": 36000 }, { "epoch": 0.04355945941624895, "learning_rate": 9.89459894292028e-06, "loss": 6.025477905273437, "step": 36100 }, { "epoch": 0.043680122738731626, "learning_rate": 9.894195107452542e-06, "loss": 6.012522583007812, "step": 36200 }, { "epoch": 0.04380078606121431, "learning_rate": 9.893791271984804e-06, "loss": 5.981051025390625, "step": 36300 }, { "epoch": 0.043921449383697, "learning_rate": 9.893387436517066e-06, "loss": 6.0163201904296875, "step": 36400 }, { "epoch": 0.04404211270617968, "learning_rate": 9.892983601049328e-06, "loss": 6.000119018554687, "step": 36500 }, { "epoch": 0.044162776028662365, "learning_rate": 9.892579765581588e-06, "loss": 6.0064239501953125, "step": 36600 }, { "epoch": 0.04428343935114505, "learning_rate": 9.89217593011385e-06, "loss": 5.995327758789062, "step": 36700 }, { "epoch": 0.04440410267362773, "learning_rate": 9.891772094646112e-06, "loss": 5.96276123046875, "step": 36800 }, { "epoch": 0.04452476599611042, "learning_rate": 9.891368259178372e-06, "loss": 5.97086181640625, "step": 36900 }, { "epoch": 0.044645429318593104, "learning_rate": 9.890964423710634e-06, "loss": 5.97990234375, "step": 37000 }, { "epoch": 0.04476609264107578, "learning_rate": 9.890560588242896e-06, "loss": 5.986522827148438, "step": 37100 }, { "epoch": 0.04488675596355847, "learning_rate": 9.890156752775158e-06, "loss": 6.0063623046875, "step": 37200 }, { "epoch": 0.045007419286041156, "learning_rate": 9.88975291730742e-06, "loss": 5.954756469726562, "step": 37300 }, { "epoch": 0.045128082608523835, "learning_rate": 9.88934908183968e-06, "loss": 5.989403076171875, "step": 37400 }, { "epoch": 0.04524874593100652, "learning_rate": 9.888945246371943e-06, "loss": 5.97143310546875, "step": 37500 }, { "epoch": 0.04536940925348921, "learning_rate": 9.888541410904205e-06, "loss": 5.985697021484375, "step": 37600 }, { "epoch": 0.04549007257597189, "learning_rate": 9.888137575436467e-06, "loss": 5.979300537109375, "step": 37700 }, { "epoch": 0.045610735898454574, "learning_rate": 9.887733739968729e-06, "loss": 5.945584106445312, "step": 37800 }, { "epoch": 0.04573139922093726, "learning_rate": 9.887329904500989e-06, "loss": 5.941597290039063, "step": 37900 }, { "epoch": 0.04585206254341994, "learning_rate": 9.886926069033251e-06, "loss": 5.938487548828125, "step": 38000 }, { "epoch": 0.045972725865902626, "learning_rate": 9.886522233565513e-06, "loss": 5.946324462890625, "step": 38100 }, { "epoch": 0.04609338918838531, "learning_rate": 9.886118398097773e-06, "loss": 5.954590454101562, "step": 38200 }, { "epoch": 0.04621405251086799, "learning_rate": 9.885714562630035e-06, "loss": 5.935897216796875, "step": 38300 }, { "epoch": 0.04633471583335068, "learning_rate": 9.885310727162297e-06, "loss": 5.946389770507812, "step": 38400 }, { "epoch": 0.046455379155833365, "learning_rate": 9.884906891694559e-06, "loss": 5.924605712890625, "step": 38500 }, { "epoch": 0.046576042478316045, "learning_rate": 9.884503056226821e-06, "loss": 5.8884765625, "step": 38600 }, { "epoch": 0.04669670580079873, "learning_rate": 9.884099220759083e-06, "loss": 5.920947875976562, "step": 38700 }, { "epoch": 0.04681736912328142, "learning_rate": 9.883695385291345e-06, "loss": 5.917391357421875, "step": 38800 }, { "epoch": 0.0469380324457641, "learning_rate": 9.883291549823605e-06, "loss": 5.922462768554688, "step": 38900 }, { "epoch": 0.04705869576824678, "learning_rate": 9.882887714355867e-06, "loss": 5.899052124023438, "step": 39000 }, { "epoch": 0.04717935909072947, "learning_rate": 9.882483878888128e-06, "loss": 5.926414184570312, "step": 39100 }, { "epoch": 0.04730002241321215, "learning_rate": 9.88208004342039e-06, "loss": 5.90779296875, "step": 39200 }, { "epoch": 0.047420685735694836, "learning_rate": 9.881676207952652e-06, "loss": 5.891823120117188, "step": 39300 }, { "epoch": 0.04754134905817752, "learning_rate": 9.881272372484914e-06, "loss": 5.90169189453125, "step": 39400 }, { "epoch": 0.0476620123806602, "learning_rate": 9.880868537017176e-06, "loss": 5.892493896484375, "step": 39500 }, { "epoch": 0.04778267570314289, "learning_rate": 9.880464701549438e-06, "loss": 5.870087890625, "step": 39600 }, { "epoch": 0.047903339025625574, "learning_rate": 9.8800608660817e-06, "loss": 5.886649780273437, "step": 39700 }, { "epoch": 0.048024002348108254, "learning_rate": 9.87965703061396e-06, "loss": 5.894774780273438, "step": 39800 }, { "epoch": 0.04814466567059094, "learning_rate": 9.879253195146222e-06, "loss": 5.86189208984375, "step": 39900 }, { "epoch": 0.048265328993073627, "learning_rate": 9.878849359678484e-06, "loss": 5.86906005859375, "step": 40000 }, { "epoch": 0.048385992315556306, "learning_rate": 9.878445524210744e-06, "loss": 5.907960815429687, "step": 40100 }, { "epoch": 0.04850665563803899, "learning_rate": 9.878041688743006e-06, "loss": 5.850534057617187, "step": 40200 }, { "epoch": 0.04862731896052168, "learning_rate": 9.877637853275268e-06, "loss": 5.88085693359375, "step": 40300 }, { "epoch": 0.04874798228300436, "learning_rate": 9.87723401780753e-06, "loss": 5.872523803710937, "step": 40400 }, { "epoch": 0.048868645605487045, "learning_rate": 9.876830182339792e-06, "loss": 5.859061889648437, "step": 40500 }, { "epoch": 0.04898930892796973, "learning_rate": 9.876426346872052e-06, "loss": 5.855042114257812, "step": 40600 }, { "epoch": 0.04910997225045241, "learning_rate": 9.876022511404314e-06, "loss": 5.862298583984375, "step": 40700 }, { "epoch": 0.0492306355729351, "learning_rate": 9.875618675936576e-06, "loss": 5.823678588867187, "step": 40800 }, { "epoch": 0.04935129889541778, "learning_rate": 9.875214840468838e-06, "loss": 5.839556884765625, "step": 40900 }, { "epoch": 0.04947196221790046, "learning_rate": 9.874811005001098e-06, "loss": 5.82404052734375, "step": 41000 }, { "epoch": 0.04959262554038315, "learning_rate": 9.87440716953336e-06, "loss": 5.824871215820313, "step": 41100 }, { "epoch": 0.049713288862865836, "learning_rate": 9.874003334065622e-06, "loss": 5.827488403320313, "step": 41200 }, { "epoch": 0.049833952185348515, "learning_rate": 9.873599498597884e-06, "loss": 5.848665771484375, "step": 41300 }, { "epoch": 0.0499546155078312, "learning_rate": 9.873195663130146e-06, "loss": 5.826472778320312, "step": 41400 }, { "epoch": 0.05007527883031389, "learning_rate": 9.872791827662407e-06, "loss": 5.829556274414062, "step": 41500 }, { "epoch": 0.05019594215279657, "learning_rate": 9.872387992194669e-06, "loss": 5.819097290039062, "step": 41600 }, { "epoch": 0.050316605475279254, "learning_rate": 9.87198415672693e-06, "loss": 5.812535400390625, "step": 41700 }, { "epoch": 0.05043726879776193, "learning_rate": 9.871580321259193e-06, "loss": 5.79991943359375, "step": 41800 }, { "epoch": 0.05055793212024462, "learning_rate": 9.871176485791455e-06, "loss": 5.77990234375, "step": 41900 }, { "epoch": 0.050678595442727306, "learning_rate": 9.870772650323715e-06, "loss": 5.809010009765625, "step": 42000 }, { "epoch": 0.050799258765209986, "learning_rate": 9.870368814855977e-06, "loss": 5.794039306640625, "step": 42100 }, { "epoch": 0.05091992208769267, "learning_rate": 9.869964979388239e-06, "loss": 5.773182373046875, "step": 42200 }, { "epoch": 0.05104058541017536, "learning_rate": 9.8695611439205e-06, "loss": 5.795257568359375, "step": 42300 }, { "epoch": 0.05116124873265804, "learning_rate": 9.869157308452761e-06, "loss": 5.828724975585938, "step": 42400 }, { "epoch": 0.051281912055140724, "learning_rate": 9.868753472985023e-06, "loss": 5.810231323242188, "step": 42500 }, { "epoch": 0.05140257537762341, "learning_rate": 9.868349637517285e-06, "loss": 5.766407470703125, "step": 42600 }, { "epoch": 0.05152323870010609, "learning_rate": 9.867945802049547e-06, "loss": 5.799169311523437, "step": 42700 }, { "epoch": 0.05164390202258878, "learning_rate": 9.867541966581809e-06, "loss": 5.8177978515625, "step": 42800 }, { "epoch": 0.05176456534507146, "learning_rate": 9.86713813111407e-06, "loss": 5.7826611328125, "step": 42900 }, { "epoch": 0.05188522866755414, "learning_rate": 9.866734295646331e-06, "loss": 5.781925659179688, "step": 43000 }, { "epoch": 0.05200589199003683, "learning_rate": 9.866330460178593e-06, "loss": 5.7845916748046875, "step": 43100 }, { "epoch": 0.052126555312519515, "learning_rate": 9.865926624710854e-06, "loss": 5.79017822265625, "step": 43200 }, { "epoch": 0.052247218635002195, "learning_rate": 9.865522789243116e-06, "loss": 5.769013061523437, "step": 43300 }, { "epoch": 0.05236788195748488, "learning_rate": 9.865118953775378e-06, "loss": 5.766888427734375, "step": 43400 }, { "epoch": 0.05248854527996757, "learning_rate": 9.86471511830764e-06, "loss": 5.764293212890625, "step": 43500 }, { "epoch": 0.05260920860245025, "learning_rate": 9.864311282839902e-06, "loss": 5.7430487060546875, "step": 43600 }, { "epoch": 0.05272987192493293, "learning_rate": 9.863907447372164e-06, "loss": 5.750333251953125, "step": 43700 }, { "epoch": 0.05285053524741562, "learning_rate": 9.863503611904426e-06, "loss": 5.78717529296875, "step": 43800 }, { "epoch": 0.0529711985698983, "learning_rate": 9.863099776436686e-06, "loss": 5.78459228515625, "step": 43900 }, { "epoch": 0.053091861892380986, "learning_rate": 9.862695940968948e-06, "loss": 5.7740380859375, "step": 44000 }, { "epoch": 0.05321252521486367, "learning_rate": 9.862292105501208e-06, "loss": 5.722774658203125, "step": 44100 }, { "epoch": 0.05333318853734635, "learning_rate": 9.86188827003347e-06, "loss": 5.745663452148437, "step": 44200 }, { "epoch": 0.05345385185982904, "learning_rate": 9.861484434565732e-06, "loss": 5.737649536132812, "step": 44300 }, { "epoch": 0.053574515182311724, "learning_rate": 9.861080599097994e-06, "loss": 5.747950439453125, "step": 44400 }, { "epoch": 0.053695178504794404, "learning_rate": 9.860676763630256e-06, "loss": 5.738473510742187, "step": 44500 }, { "epoch": 0.05381584182727709, "learning_rate": 9.860272928162518e-06, "loss": 5.716368408203125, "step": 44600 }, { "epoch": 0.05393650514975978, "learning_rate": 9.859869092694778e-06, "loss": 5.750637817382812, "step": 44700 }, { "epoch": 0.054057168472242456, "learning_rate": 9.85946525722704e-06, "loss": 5.746980590820312, "step": 44800 }, { "epoch": 0.05417783179472514, "learning_rate": 9.859061421759302e-06, "loss": 5.73247314453125, "step": 44900 }, { "epoch": 0.05429849511720783, "learning_rate": 9.858657586291564e-06, "loss": 5.742887573242188, "step": 45000 }, { "epoch": 0.05441915843969051, "learning_rate": 9.858253750823825e-06, "loss": 5.718990478515625, "step": 45100 }, { "epoch": 0.054539821762173195, "learning_rate": 9.857849915356087e-06, "loss": 5.700264282226563, "step": 45200 }, { "epoch": 0.05466048508465588, "learning_rate": 9.857446079888348e-06, "loss": 5.7020849609375, "step": 45300 }, { "epoch": 0.05478114840713856, "learning_rate": 9.85704224442061e-06, "loss": 5.697625732421875, "step": 45400 }, { "epoch": 0.05490181172962125, "learning_rate": 9.85663840895287e-06, "loss": 5.695245361328125, "step": 45500 }, { "epoch": 0.055022475052103934, "learning_rate": 9.856234573485133e-06, "loss": 5.713543090820313, "step": 45600 }, { "epoch": 0.05514313837458661, "learning_rate": 9.855830738017395e-06, "loss": 5.684797973632812, "step": 45700 }, { "epoch": 0.0552638016970693, "learning_rate": 9.855426902549657e-06, "loss": 5.691742553710937, "step": 45800 }, { "epoch": 0.055384465019551986, "learning_rate": 9.855023067081919e-06, "loss": 5.704517211914062, "step": 45900 }, { "epoch": 0.055505128342034665, "learning_rate": 9.854619231614179e-06, "loss": 5.6752166748046875, "step": 46000 }, { "epoch": 0.05562579166451735, "learning_rate": 9.854215396146441e-06, "loss": 5.681259765625, "step": 46100 }, { "epoch": 0.05574645498700004, "learning_rate": 9.853811560678703e-06, "loss": 5.696261596679688, "step": 46200 }, { "epoch": 0.05586711830948272, "learning_rate": 9.853407725210965e-06, "loss": 5.70001953125, "step": 46300 }, { "epoch": 0.055987781631965404, "learning_rate": 9.853003889743225e-06, "loss": 5.69338134765625, "step": 46400 }, { "epoch": 0.05610844495444809, "learning_rate": 9.852600054275487e-06, "loss": 5.696197509765625, "step": 46500 }, { "epoch": 0.05622910827693077, "learning_rate": 9.85219621880775e-06, "loss": 5.712601928710938, "step": 46600 }, { "epoch": 0.056349771599413456, "learning_rate": 9.851792383340011e-06, "loss": 5.650829467773438, "step": 46700 }, { "epoch": 0.05647043492189614, "learning_rate": 9.851388547872273e-06, "loss": 5.642108154296875, "step": 46800 }, { "epoch": 0.05659109824437882, "learning_rate": 9.850984712404535e-06, "loss": 5.658579711914062, "step": 46900 }, { "epoch": 0.05671176156686151, "learning_rate": 9.850580876936795e-06, "loss": 5.652801513671875, "step": 47000 }, { "epoch": 0.056832424889344195, "learning_rate": 9.850177041469057e-06, "loss": 5.683375854492187, "step": 47100 }, { "epoch": 0.056953088211826874, "learning_rate": 9.849773206001318e-06, "loss": 5.64796630859375, "step": 47200 }, { "epoch": 0.05707375153430956, "learning_rate": 9.84936937053358e-06, "loss": 5.649228515625, "step": 47300 }, { "epoch": 0.05719441485679225, "learning_rate": 9.848965535065842e-06, "loss": 5.65912841796875, "step": 47400 }, { "epoch": 0.05731507817927493, "learning_rate": 9.848561699598104e-06, "loss": 5.653483276367187, "step": 47500 }, { "epoch": 0.05743574150175761, "learning_rate": 9.848157864130366e-06, "loss": 5.6471826171875, "step": 47600 }, { "epoch": 0.0575564048242403, "learning_rate": 9.847754028662628e-06, "loss": 5.65800048828125, "step": 47700 }, { "epoch": 0.05767706814672298, "learning_rate": 9.84735019319489e-06, "loss": 5.6379833984375, "step": 47800 }, { "epoch": 0.057797731469205665, "learning_rate": 9.84694635772715e-06, "loss": 5.633699340820312, "step": 47900 }, { "epoch": 0.05791839479168835, "learning_rate": 9.846542522259412e-06, "loss": 5.66202392578125, "step": 48000 }, { "epoch": 0.05803905811417103, "learning_rate": 9.846138686791674e-06, "loss": 5.6377734375, "step": 48100 }, { "epoch": 0.05815972143665372, "learning_rate": 9.845734851323934e-06, "loss": 5.629166870117188, "step": 48200 }, { "epoch": 0.0582803847591364, "learning_rate": 9.845331015856196e-06, "loss": 5.624560546875, "step": 48300 }, { "epoch": 0.058401048081619084, "learning_rate": 9.844927180388458e-06, "loss": 5.6068878173828125, "step": 48400 }, { "epoch": 0.05852171140410177, "learning_rate": 9.84452334492072e-06, "loss": 5.632612915039062, "step": 48500 }, { "epoch": 0.05864237472658445, "learning_rate": 9.844119509452982e-06, "loss": 5.59102294921875, "step": 48600 }, { "epoch": 0.058763038049067136, "learning_rate": 9.843715673985244e-06, "loss": 5.6015252685546875, "step": 48700 }, { "epoch": 0.05888370137154982, "learning_rate": 9.843311838517504e-06, "loss": 5.610700073242188, "step": 48800 }, { "epoch": 0.0590043646940325, "learning_rate": 9.842908003049766e-06, "loss": 5.6188427734375, "step": 48900 }, { "epoch": 0.05912502801651519, "learning_rate": 9.842504167582028e-06, "loss": 5.6034698486328125, "step": 49000 }, { "epoch": 0.059245691338997875, "learning_rate": 9.842100332114289e-06, "loss": 5.592289428710938, "step": 49100 }, { "epoch": 0.059366354661480554, "learning_rate": 9.84169649664655e-06, "loss": 5.59678466796875, "step": 49200 }, { "epoch": 0.05948701798396324, "learning_rate": 9.841292661178813e-06, "loss": 5.584678344726562, "step": 49300 }, { "epoch": 0.05960768130644593, "learning_rate": 9.840888825711075e-06, "loss": 5.604636840820312, "step": 49400 }, { "epoch": 0.059728344628928606, "learning_rate": 9.840484990243337e-06, "loss": 5.59030029296875, "step": 49500 }, { "epoch": 0.05984900795141129, "learning_rate": 9.840081154775597e-06, "loss": 5.601084594726562, "step": 49600 }, { "epoch": 0.05996967127389398, "learning_rate": 9.839677319307859e-06, "loss": 5.613219604492188, "step": 49700 }, { "epoch": 0.06009033459637666, "learning_rate": 9.83927348384012e-06, "loss": 5.557407836914063, "step": 49800 }, { "epoch": 0.060210997918859345, "learning_rate": 9.838869648372383e-06, "loss": 5.575147094726563, "step": 49900 }, { "epoch": 0.06033166124134203, "learning_rate": 9.838465812904645e-06, "loss": 5.553262939453125, "step": 50000 }, { "epoch": 0.06045232456382471, "learning_rate": 9.838061977436905e-06, "loss": 5.550405883789063, "step": 50100 }, { "epoch": 0.0605729878863074, "learning_rate": 9.837658141969167e-06, "loss": 5.579466552734375, "step": 50200 }, { "epoch": 0.060693651208790084, "learning_rate": 9.837254306501429e-06, "loss": 5.56111328125, "step": 50300 }, { "epoch": 0.06081431453127276, "learning_rate": 9.83685047103369e-06, "loss": 5.578643798828125, "step": 50400 }, { "epoch": 0.06093497785375545, "learning_rate": 9.836446635565951e-06, "loss": 5.561683349609375, "step": 50500 }, { "epoch": 0.061055641176238136, "learning_rate": 9.836042800098213e-06, "loss": 5.570487060546875, "step": 50600 }, { "epoch": 0.061176304498720815, "learning_rate": 9.835638964630475e-06, "loss": 5.524298095703125, "step": 50700 }, { "epoch": 0.0612969678212035, "learning_rate": 9.835235129162737e-06, "loss": 5.562306518554688, "step": 50800 }, { "epoch": 0.06141763114368619, "learning_rate": 9.834831293695e-06, "loss": 5.566176147460937, "step": 50900 }, { "epoch": 0.06153829446616887, "learning_rate": 9.83442745822726e-06, "loss": 5.533325805664062, "step": 51000 }, { "epoch": 0.061658957788651554, "learning_rate": 9.834023622759521e-06, "loss": 5.5660498046875, "step": 51100 }, { "epoch": 0.06177962111113424, "learning_rate": 9.833619787291783e-06, "loss": 5.52291748046875, "step": 51200 }, { "epoch": 0.06190028443361692, "learning_rate": 9.833215951824044e-06, "loss": 5.526439208984375, "step": 51300 }, { "epoch": 0.062020947756099606, "learning_rate": 9.832812116356306e-06, "loss": 5.51739990234375, "step": 51400 }, { "epoch": 0.06214161107858229, "learning_rate": 9.832408280888568e-06, "loss": 5.55761474609375, "step": 51500 }, { "epoch": 0.06226227440106497, "learning_rate": 9.83200444542083e-06, "loss": 5.556441650390625, "step": 51600 }, { "epoch": 0.06238293772354766, "learning_rate": 9.831600609953092e-06, "loss": 5.51667724609375, "step": 51700 }, { "epoch": 0.06250360104603034, "learning_rate": 9.831196774485354e-06, "loss": 5.497745971679688, "step": 51800 }, { "epoch": 0.06262426436851302, "learning_rate": 9.830792939017616e-06, "loss": 5.506736450195312, "step": 51900 }, { "epoch": 0.06274492769099571, "learning_rate": 9.830389103549876e-06, "loss": 5.5475836181640625, "step": 52000 }, { "epoch": 0.0628655910134784, "learning_rate": 9.829985268082138e-06, "loss": 5.504075317382813, "step": 52100 }, { "epoch": 0.06298625433596108, "learning_rate": 9.829581432614398e-06, "loss": 5.52787109375, "step": 52200 }, { "epoch": 0.06310691765844376, "learning_rate": 9.82917759714666e-06, "loss": 5.494723510742188, "step": 52300 }, { "epoch": 0.06322758098092644, "learning_rate": 9.828773761678922e-06, "loss": 5.514593505859375, "step": 52400 }, { "epoch": 0.06334824430340913, "learning_rate": 9.828369926211184e-06, "loss": 5.506063232421875, "step": 52500 }, { "epoch": 0.06346890762589182, "learning_rate": 9.827966090743446e-06, "loss": 5.525193481445313, "step": 52600 }, { "epoch": 0.0635895709483745, "learning_rate": 9.827562255275708e-06, "loss": 5.536563720703125, "step": 52700 }, { "epoch": 0.06371023427085719, "learning_rate": 9.82715841980797e-06, "loss": 5.473799438476562, "step": 52800 }, { "epoch": 0.06383089759333986, "learning_rate": 9.82675458434023e-06, "loss": 5.494265747070313, "step": 52900 }, { "epoch": 0.06395156091582255, "learning_rate": 9.826350748872492e-06, "loss": 5.47943603515625, "step": 53000 }, { "epoch": 0.06407222423830523, "learning_rate": 9.825946913404754e-06, "loss": 5.489384155273438, "step": 53100 }, { "epoch": 0.06419288756078792, "learning_rate": 9.825543077937015e-06, "loss": 5.486170654296875, "step": 53200 }, { "epoch": 0.0643135508832706, "learning_rate": 9.825139242469277e-06, "loss": 5.4916314697265625, "step": 53300 }, { "epoch": 0.06443421420575329, "learning_rate": 9.824735407001539e-06, "loss": 5.490230102539062, "step": 53400 }, { "epoch": 0.06455487752823597, "learning_rate": 9.8243315715338e-06, "loss": 5.4870233154296875, "step": 53500 }, { "epoch": 0.06467554085071865, "learning_rate": 9.823927736066063e-06, "loss": 5.458673706054688, "step": 53600 }, { "epoch": 0.06479620417320134, "learning_rate": 9.823523900598323e-06, "loss": 5.498256225585937, "step": 53700 }, { "epoch": 0.06491686749568402, "learning_rate": 9.823120065130585e-06, "loss": 5.452241821289062, "step": 53800 }, { "epoch": 0.06503753081816671, "learning_rate": 9.822716229662847e-06, "loss": 5.48254150390625, "step": 53900 }, { "epoch": 0.0651581941406494, "learning_rate": 9.822312394195109e-06, "loss": 5.49094970703125, "step": 54000 }, { "epoch": 0.06527885746313207, "learning_rate": 9.82190855872737e-06, "loss": 5.470156860351563, "step": 54100 }, { "epoch": 0.06539952078561476, "learning_rate": 9.821504723259631e-06, "loss": 5.458375244140625, "step": 54200 }, { "epoch": 0.06552018410809744, "learning_rate": 9.821100887791893e-06, "loss": 5.4711083984375, "step": 54300 }, { "epoch": 0.06564084743058013, "learning_rate": 9.820697052324155e-06, "loss": 5.451007080078125, "step": 54400 }, { "epoch": 0.06576151075306282, "learning_rate": 9.820293216856415e-06, "loss": 5.4637518310546875, "step": 54500 }, { "epoch": 0.0658821740755455, "learning_rate": 9.819889381388677e-06, "loss": 5.446215209960937, "step": 54600 }, { "epoch": 0.06600283739802817, "learning_rate": 9.81948554592094e-06, "loss": 5.457670288085938, "step": 54700 }, { "epoch": 0.06612350072051086, "learning_rate": 9.819081710453201e-06, "loss": 5.455287475585937, "step": 54800 }, { "epoch": 0.06624416404299355, "learning_rate": 9.818677874985463e-06, "loss": 5.436695556640625, "step": 54900 }, { "epoch": 0.06636482736547623, "learning_rate": 9.818274039517725e-06, "loss": 5.45849853515625, "step": 55000 }, { "epoch": 0.06648549068795892, "learning_rate": 9.817870204049985e-06, "loss": 5.436983032226562, "step": 55100 }, { "epoch": 0.0666061540104416, "learning_rate": 9.817466368582247e-06, "loss": 5.450509033203125, "step": 55200 }, { "epoch": 0.06672681733292428, "learning_rate": 9.81706253311451e-06, "loss": 5.440614013671875, "step": 55300 }, { "epoch": 0.06684748065540697, "learning_rate": 9.81665869764677e-06, "loss": 5.450062866210938, "step": 55400 }, { "epoch": 0.06696814397788965, "learning_rate": 9.816254862179032e-06, "loss": 5.440513305664062, "step": 55500 }, { "epoch": 0.06708880730037234, "learning_rate": 9.815851026711294e-06, "loss": 5.45876953125, "step": 55600 }, { "epoch": 0.06720947062285502, "learning_rate": 9.815447191243556e-06, "loss": 5.445390014648438, "step": 55700 }, { "epoch": 0.06733013394533771, "learning_rate": 9.815043355775818e-06, "loss": 5.438015747070312, "step": 55800 }, { "epoch": 0.06745079726782038, "learning_rate": 9.81463952030808e-06, "loss": 5.417323608398437, "step": 55900 }, { "epoch": 0.06757146059030307, "learning_rate": 9.814235684840342e-06, "loss": 5.4468841552734375, "step": 56000 }, { "epoch": 0.06769212391278576, "learning_rate": 9.813831849372602e-06, "loss": 5.424739379882812, "step": 56100 }, { "epoch": 0.06781278723526844, "learning_rate": 9.813428013904864e-06, "loss": 5.445565795898437, "step": 56200 }, { "epoch": 0.06793345055775113, "learning_rate": 9.813024178437124e-06, "loss": 5.397311401367188, "step": 56300 }, { "epoch": 0.06805411388023382, "learning_rate": 9.812620342969386e-06, "loss": 5.42822998046875, "step": 56400 }, { "epoch": 0.06817477720271649, "learning_rate": 9.812216507501648e-06, "loss": 5.4188385009765625, "step": 56500 }, { "epoch": 0.06829544052519917, "learning_rate": 9.81181267203391e-06, "loss": 5.391190795898438, "step": 56600 }, { "epoch": 0.06841610384768186, "learning_rate": 9.811408836566172e-06, "loss": 5.405062255859375, "step": 56700 }, { "epoch": 0.06853676717016455, "learning_rate": 9.811005001098434e-06, "loss": 5.404650268554687, "step": 56800 }, { "epoch": 0.06865743049264723, "learning_rate": 9.810601165630696e-06, "loss": 5.415482788085938, "step": 56900 }, { "epoch": 0.06877809381512992, "learning_rate": 9.810197330162956e-06, "loss": 5.415482177734375, "step": 57000 }, { "epoch": 0.06889875713761259, "learning_rate": 9.809793494695218e-06, "loss": 5.37707763671875, "step": 57100 }, { "epoch": 0.06901942046009528, "learning_rate": 9.80938965922748e-06, "loss": 5.413468017578125, "step": 57200 }, { "epoch": 0.06914008378257797, "learning_rate": 9.80898582375974e-06, "loss": 5.379092407226563, "step": 57300 }, { "epoch": 0.06926074710506065, "learning_rate": 9.808581988292003e-06, "loss": 5.39713623046875, "step": 57400 }, { "epoch": 0.06938141042754334, "learning_rate": 9.808178152824265e-06, "loss": 5.401636352539063, "step": 57500 }, { "epoch": 0.06950207375002602, "learning_rate": 9.807774317356527e-06, "loss": 5.393638916015625, "step": 57600 }, { "epoch": 0.0696227370725087, "learning_rate": 9.807370481888789e-06, "loss": 5.391743774414063, "step": 57700 }, { "epoch": 0.06974340039499138, "learning_rate": 9.806966646421049e-06, "loss": 5.345445556640625, "step": 57800 }, { "epoch": 0.06986406371747407, "learning_rate": 9.80656281095331e-06, "loss": 5.348238525390625, "step": 57900 }, { "epoch": 0.06998472703995676, "learning_rate": 9.806158975485573e-06, "loss": 5.375379028320313, "step": 58000 }, { "epoch": 0.07010539036243944, "learning_rate": 9.805755140017835e-06, "loss": 5.3898388671875, "step": 58100 }, { "epoch": 0.07022605368492212, "learning_rate": 9.805351304550095e-06, "loss": 5.37486328125, "step": 58200 }, { "epoch": 0.0703467170074048, "learning_rate": 9.804947469082357e-06, "loss": 5.377813110351562, "step": 58300 }, { "epoch": 0.07046738032988749, "learning_rate": 9.804543633614619e-06, "loss": 5.381748046875, "step": 58400 }, { "epoch": 0.07058804365237017, "learning_rate": 9.804139798146881e-06, "loss": 5.348593139648438, "step": 58500 }, { "epoch": 0.07070870697485286, "learning_rate": 9.803735962679141e-06, "loss": 5.369475708007813, "step": 58600 }, { "epoch": 0.07082937029733555, "learning_rate": 9.803332127211403e-06, "loss": 5.3422998046875, "step": 58700 }, { "epoch": 0.07095003361981822, "learning_rate": 9.802928291743665e-06, "loss": 5.3921356201171875, "step": 58800 }, { "epoch": 0.0710706969423009, "learning_rate": 9.802524456275927e-06, "loss": 5.365232543945313, "step": 58900 }, { "epoch": 0.07119136026478359, "learning_rate": 9.80212062080819e-06, "loss": 5.341582641601563, "step": 59000 }, { "epoch": 0.07131202358726628, "learning_rate": 9.801716785340451e-06, "loss": 5.3381201171875, "step": 59100 }, { "epoch": 0.07143268690974897, "learning_rate": 9.801312949872712e-06, "loss": 5.333232421875, "step": 59200 }, { "epoch": 0.07155335023223165, "learning_rate": 9.800909114404974e-06, "loss": 5.338631591796875, "step": 59300 }, { "epoch": 0.07167401355471432, "learning_rate": 9.800505278937234e-06, "loss": 5.317579345703125, "step": 59400 }, { "epoch": 0.07179467687719701, "learning_rate": 9.800101443469496e-06, "loss": 5.331469116210937, "step": 59500 }, { "epoch": 0.0719153401996797, "learning_rate": 9.799697608001758e-06, "loss": 5.339337768554688, "step": 59600 }, { "epoch": 0.07203600352216238, "learning_rate": 9.79929377253402e-06, "loss": 5.327628173828125, "step": 59700 }, { "epoch": 0.07215666684464507, "learning_rate": 9.798889937066282e-06, "loss": 5.363141479492188, "step": 59800 }, { "epoch": 0.07227733016712776, "learning_rate": 9.798486101598544e-06, "loss": 5.346229858398438, "step": 59900 }, { "epoch": 0.07239799348961043, "learning_rate": 9.798082266130806e-06, "loss": 5.3337109375, "step": 60000 }, { "epoch": 0.07251865681209312, "learning_rate": 9.797678430663066e-06, "loss": 5.371128540039063, "step": 60100 }, { "epoch": 0.0726393201345758, "learning_rate": 9.797274595195328e-06, "loss": 5.325468139648438, "step": 60200 }, { "epoch": 0.07275998345705849, "learning_rate": 9.79687075972759e-06, "loss": 5.351263427734375, "step": 60300 }, { "epoch": 0.07288064677954117, "learning_rate": 9.79646692425985e-06, "loss": 5.302833251953125, "step": 60400 }, { "epoch": 0.07300131010202386, "learning_rate": 9.796063088792112e-06, "loss": 5.320345458984375, "step": 60500 }, { "epoch": 0.07312197342450653, "learning_rate": 9.795659253324374e-06, "loss": 5.30924560546875, "step": 60600 }, { "epoch": 0.07324263674698922, "learning_rate": 9.795255417856636e-06, "loss": 5.312813110351563, "step": 60700 }, { "epoch": 0.0733633000694719, "learning_rate": 9.794851582388898e-06, "loss": 5.312037963867187, "step": 60800 }, { "epoch": 0.0734839633919546, "learning_rate": 9.79444774692116e-06, "loss": 5.3346142578125, "step": 60900 }, { "epoch": 0.07360462671443728, "learning_rate": 9.79404391145342e-06, "loss": 5.290857543945313, "step": 61000 }, { "epoch": 0.07372529003691997, "learning_rate": 9.793640075985682e-06, "loss": 5.333678588867188, "step": 61100 }, { "epoch": 0.07384595335940264, "learning_rate": 9.793236240517944e-06, "loss": 5.278713989257812, "step": 61200 }, { "epoch": 0.07396661668188532, "learning_rate": 9.792832405050205e-06, "loss": 5.292643432617187, "step": 61300 }, { "epoch": 0.07408728000436801, "learning_rate": 9.792428569582467e-06, "loss": 5.316370849609375, "step": 61400 }, { "epoch": 0.0742079433268507, "learning_rate": 9.792024734114729e-06, "loss": 5.312543334960938, "step": 61500 }, { "epoch": 0.07432860664933338, "learning_rate": 9.79162089864699e-06, "loss": 5.278667602539063, "step": 61600 }, { "epoch": 0.07444926997181607, "learning_rate": 9.791217063179253e-06, "loss": 5.2681646728515625, "step": 61700 }, { "epoch": 0.07456993329429874, "learning_rate": 9.790813227711515e-06, "loss": 5.295643310546875, "step": 61800 }, { "epoch": 0.07469059661678143, "learning_rate": 9.790409392243775e-06, "loss": 5.30662353515625, "step": 61900 }, { "epoch": 0.07481125993926412, "learning_rate": 9.790005556776037e-06, "loss": 5.2986328125, "step": 62000 }, { "epoch": 0.0749319232617468, "learning_rate": 9.789601721308299e-06, "loss": 5.298446044921875, "step": 62100 }, { "epoch": 0.07505258658422949, "learning_rate": 9.78919788584056e-06, "loss": 5.273689575195313, "step": 62200 }, { "epoch": 0.07517324990671218, "learning_rate": 9.788794050372821e-06, "loss": 5.304020385742188, "step": 62300 }, { "epoch": 0.07529391322919485, "learning_rate": 9.788390214905083e-06, "loss": 5.283749389648437, "step": 62400 }, { "epoch": 0.07541457655167753, "learning_rate": 9.787986379437345e-06, "loss": 5.284664916992187, "step": 62500 }, { "epoch": 0.07553523987416022, "learning_rate": 9.787582543969607e-06, "loss": 5.242105712890625, "step": 62600 }, { "epoch": 0.0756559031966429, "learning_rate": 9.787178708501867e-06, "loss": 5.273545532226563, "step": 62700 }, { "epoch": 0.0757765665191256, "learning_rate": 9.78677487303413e-06, "loss": 5.291265869140625, "step": 62800 }, { "epoch": 0.07589722984160828, "learning_rate": 9.786371037566391e-06, "loss": 5.2325592041015625, "step": 62900 }, { "epoch": 0.07601789316409095, "learning_rate": 9.785967202098653e-06, "loss": 5.281777954101562, "step": 63000 }, { "epoch": 0.07613855648657364, "learning_rate": 9.785563366630915e-06, "loss": 5.252301635742188, "step": 63100 }, { "epoch": 0.07625921980905633, "learning_rate": 9.785159531163176e-06, "loss": 5.271336669921875, "step": 63200 }, { "epoch": 0.07637988313153901, "learning_rate": 9.784755695695438e-06, "loss": 5.248751831054688, "step": 63300 }, { "epoch": 0.0765005464540217, "learning_rate": 9.7843518602277e-06, "loss": 5.28734130859375, "step": 63400 }, { "epoch": 0.07662120977650438, "learning_rate": 9.78394802475996e-06, "loss": 5.259991455078125, "step": 63500 }, { "epoch": 0.07674187309898706, "learning_rate": 9.783544189292222e-06, "loss": 5.244822998046875, "step": 63600 }, { "epoch": 0.07686253642146974, "learning_rate": 9.783140353824484e-06, "loss": 5.237239990234375, "step": 63700 }, { "epoch": 0.07698319974395243, "learning_rate": 9.782736518356746e-06, "loss": 5.25580078125, "step": 63800 }, { "epoch": 0.07710386306643512, "learning_rate": 9.782332682889008e-06, "loss": 5.237862548828125, "step": 63900 }, { "epoch": 0.0772245263889178, "learning_rate": 9.78192884742127e-06, "loss": 5.2344818115234375, "step": 64000 }, { "epoch": 0.07734518971140047, "learning_rate": 9.781525011953532e-06, "loss": 5.210677490234375, "step": 64100 }, { "epoch": 0.07746585303388316, "learning_rate": 9.781121176485792e-06, "loss": 5.2437255859375, "step": 64200 }, { "epoch": 0.07758651635636585, "learning_rate": 9.780717341018054e-06, "loss": 5.2295465087890625, "step": 64300 }, { "epoch": 0.07770717967884853, "learning_rate": 9.780313505550314e-06, "loss": 5.21697265625, "step": 64400 }, { "epoch": 0.07782784300133122, "learning_rate": 9.779909670082576e-06, "loss": 5.272308959960937, "step": 64500 }, { "epoch": 0.07794850632381391, "learning_rate": 9.779505834614838e-06, "loss": 5.207241821289062, "step": 64600 }, { "epoch": 0.07806916964629658, "learning_rate": 9.7791019991471e-06, "loss": 5.221626586914063, "step": 64700 }, { "epoch": 0.07818983296877927, "learning_rate": 9.778698163679362e-06, "loss": 5.228670654296875, "step": 64800 }, { "epoch": 0.07831049629126195, "learning_rate": 9.778294328211624e-06, "loss": 5.212542114257812, "step": 64900 }, { "epoch": 0.07843115961374464, "learning_rate": 9.777890492743886e-06, "loss": 5.1939501953125, "step": 65000 }, { "epoch": 0.07855182293622733, "learning_rate": 9.777486657276146e-06, "loss": 5.21961669921875, "step": 65100 }, { "epoch": 0.07867248625871001, "learning_rate": 9.777082821808408e-06, "loss": 5.210693969726562, "step": 65200 }, { "epoch": 0.07879314958119268, "learning_rate": 9.77667898634067e-06, "loss": 5.213010864257813, "step": 65300 }, { "epoch": 0.07891381290367537, "learning_rate": 9.77627515087293e-06, "loss": 5.203443603515625, "step": 65400 }, { "epoch": 0.07903447622615806, "learning_rate": 9.775871315405193e-06, "loss": 5.190748291015625, "step": 65500 }, { "epoch": 0.07915513954864074, "learning_rate": 9.775467479937455e-06, "loss": 5.1969976806640625, "step": 65600 }, { "epoch": 0.07927580287112343, "learning_rate": 9.775063644469717e-06, "loss": 5.207017822265625, "step": 65700 }, { "epoch": 0.07939646619360612, "learning_rate": 9.774659809001979e-06, "loss": 5.158209228515625, "step": 65800 }, { "epoch": 0.07951712951608879, "learning_rate": 9.774255973534239e-06, "loss": 5.209757080078125, "step": 65900 }, { "epoch": 0.07963779283857148, "learning_rate": 9.773852138066501e-06, "loss": 5.1891015625, "step": 66000 }, { "epoch": 0.07975845616105416, "learning_rate": 9.773448302598763e-06, "loss": 5.185696411132812, "step": 66100 }, { "epoch": 0.07987911948353685, "learning_rate": 9.773044467131025e-06, "loss": 5.192301635742187, "step": 66200 }, { "epoch": 0.07999978280601953, "learning_rate": 9.772640631663285e-06, "loss": 5.201160888671875, "step": 66300 }, { "epoch": 0.08012044612850222, "learning_rate": 9.772236796195547e-06, "loss": 5.201710815429688, "step": 66400 }, { "epoch": 0.0802411094509849, "learning_rate": 9.771832960727809e-06, "loss": 5.205989379882812, "step": 66500 }, { "epoch": 0.08036177277346758, "learning_rate": 9.771429125260071e-06, "loss": 5.183333129882812, "step": 66600 }, { "epoch": 0.08048243609595027, "learning_rate": 9.771025289792333e-06, "loss": 5.190036010742188, "step": 66700 }, { "epoch": 0.08060309941843295, "learning_rate": 9.770621454324593e-06, "loss": 5.178285522460937, "step": 66800 }, { "epoch": 0.08072376274091564, "learning_rate": 9.770217618856855e-06, "loss": 5.192055053710938, "step": 66900 }, { "epoch": 0.08084442606339833, "learning_rate": 9.769813783389117e-06, "loss": 5.202462768554687, "step": 67000 }, { "epoch": 0.080965089385881, "learning_rate": 9.76940994792138e-06, "loss": 5.140267333984375, "step": 67100 }, { "epoch": 0.08108575270836368, "learning_rate": 9.769006112453641e-06, "loss": 5.167439575195313, "step": 67200 }, { "epoch": 0.08120641603084637, "learning_rate": 9.768602276985902e-06, "loss": 5.2037286376953125, "step": 67300 }, { "epoch": 0.08132707935332906, "learning_rate": 9.768198441518164e-06, "loss": 5.164884643554688, "step": 67400 }, { "epoch": 0.08144774267581174, "learning_rate": 9.767794606050426e-06, "loss": 5.17246826171875, "step": 67500 }, { "epoch": 0.08156840599829443, "learning_rate": 9.767390770582686e-06, "loss": 5.15818603515625, "step": 67600 }, { "epoch": 0.0816890693207771, "learning_rate": 9.766986935114948e-06, "loss": 5.151226196289063, "step": 67700 }, { "epoch": 0.08180973264325979, "learning_rate": 9.76658309964721e-06, "loss": 5.15694091796875, "step": 67800 }, { "epoch": 0.08193039596574248, "learning_rate": 9.766179264179472e-06, "loss": 5.159863891601563, "step": 67900 }, { "epoch": 0.08205105928822516, "learning_rate": 9.765775428711734e-06, "loss": 5.170521240234375, "step": 68000 }, { "epoch": 0.08217172261070785, "learning_rate": 9.765371593243996e-06, "loss": 5.14292724609375, "step": 68100 }, { "epoch": 0.08229238593319053, "learning_rate": 9.764967757776258e-06, "loss": 5.156976928710938, "step": 68200 }, { "epoch": 0.0824130492556732, "learning_rate": 9.764563922308518e-06, "loss": 5.152540893554687, "step": 68300 }, { "epoch": 0.0825337125781559, "learning_rate": 9.76416008684078e-06, "loss": 5.16983154296875, "step": 68400 }, { "epoch": 0.08265437590063858, "learning_rate": 9.76375625137304e-06, "loss": 5.146065673828125, "step": 68500 }, { "epoch": 0.08277503922312127, "learning_rate": 9.763352415905302e-06, "loss": 5.119190673828125, "step": 68600 }, { "epoch": 0.08289570254560395, "learning_rate": 9.762948580437564e-06, "loss": 5.125591430664063, "step": 68700 }, { "epoch": 0.08301636586808664, "learning_rate": 9.762544744969826e-06, "loss": 5.17458740234375, "step": 68800 }, { "epoch": 0.08313702919056931, "learning_rate": 9.762140909502088e-06, "loss": 5.173352661132813, "step": 68900 }, { "epoch": 0.083257692513052, "learning_rate": 9.76173707403435e-06, "loss": 5.160217895507812, "step": 69000 }, { "epoch": 0.08337835583553468, "learning_rate": 9.761333238566612e-06, "loss": 5.165855102539062, "step": 69100 }, { "epoch": 0.08349901915801737, "learning_rate": 9.760929403098873e-06, "loss": 5.143590087890625, "step": 69200 }, { "epoch": 0.08361968248050006, "learning_rate": 9.760525567631134e-06, "loss": 5.137591552734375, "step": 69300 }, { "epoch": 0.08374034580298274, "learning_rate": 9.760121732163396e-06, "loss": 5.131078491210937, "step": 69400 }, { "epoch": 0.08386100912546542, "learning_rate": 9.759717896695657e-06, "loss": 5.101188659667969, "step": 69500 }, { "epoch": 0.0839816724479481, "learning_rate": 9.759314061227919e-06, "loss": 5.096486206054688, "step": 69600 }, { "epoch": 0.08410233577043079, "learning_rate": 9.75891022576018e-06, "loss": 5.105284118652344, "step": 69700 }, { "epoch": 0.08422299909291348, "learning_rate": 9.758506390292443e-06, "loss": 5.142880859375, "step": 69800 }, { "epoch": 0.08434366241539616, "learning_rate": 9.758102554824705e-06, "loss": 5.14042236328125, "step": 69900 }, { "epoch": 0.08446432573787885, "learning_rate": 9.757698719356965e-06, "loss": 5.126434326171875, "step": 70000 }, { "epoch": 0.08458498906036152, "learning_rate": 9.757294883889227e-06, "loss": 5.136691284179688, "step": 70100 }, { "epoch": 0.08470565238284421, "learning_rate": 9.756891048421489e-06, "loss": 5.160778198242188, "step": 70200 }, { "epoch": 0.0848263157053269, "learning_rate": 9.756487212953751e-06, "loss": 5.119503173828125, "step": 70300 }, { "epoch": 0.08494697902780958, "learning_rate": 9.756083377486011e-06, "loss": 5.148392333984375, "step": 70400 }, { "epoch": 0.08506764235029227, "learning_rate": 9.755679542018273e-06, "loss": 5.1181948852539065, "step": 70500 }, { "epoch": 0.08518830567277494, "learning_rate": 9.755275706550535e-06, "loss": 5.115385131835938, "step": 70600 }, { "epoch": 0.08530896899525763, "learning_rate": 9.754871871082797e-06, "loss": 5.105375366210938, "step": 70700 }, { "epoch": 0.08542963231774031, "learning_rate": 9.754468035615057e-06, "loss": 5.084530944824219, "step": 70800 }, { "epoch": 0.085550295640223, "learning_rate": 9.75406420014732e-06, "loss": 5.155774536132813, "step": 70900 }, { "epoch": 0.08567095896270568, "learning_rate": 9.753660364679581e-06, "loss": 5.116604614257812, "step": 71000 }, { "epoch": 0.08579162228518837, "learning_rate": 9.753256529211843e-06, "loss": 5.0745150756835935, "step": 71100 }, { "epoch": 0.08591228560767104, "learning_rate": 9.752852693744105e-06, "loss": 5.102546081542969, "step": 71200 }, { "epoch": 0.08603294893015373, "learning_rate": 9.752448858276367e-06, "loss": 5.091918334960938, "step": 71300 }, { "epoch": 0.08615361225263642, "learning_rate": 9.752045022808628e-06, "loss": 5.106720886230469, "step": 71400 }, { "epoch": 0.0862742755751191, "learning_rate": 9.75164118734089e-06, "loss": 5.116187438964844, "step": 71500 }, { "epoch": 0.08639493889760179, "learning_rate": 9.75123735187315e-06, "loss": 5.068934326171875, "step": 71600 }, { "epoch": 0.08651560222008448, "learning_rate": 9.750833516405412e-06, "loss": 5.076722717285156, "step": 71700 }, { "epoch": 0.08663626554256715, "learning_rate": 9.750429680937674e-06, "loss": 5.0759515380859375, "step": 71800 }, { "epoch": 0.08675692886504983, "learning_rate": 9.750025845469936e-06, "loss": 5.0674676513671875, "step": 71900 }, { "epoch": 0.08687759218753252, "learning_rate": 9.749622010002198e-06, "loss": 5.062613525390625, "step": 72000 }, { "epoch": 0.08699825551001521, "learning_rate": 9.74921817453446e-06, "loss": 5.085945739746093, "step": 72100 }, { "epoch": 0.0871189188324979, "learning_rate": 9.748814339066722e-06, "loss": 5.070661926269532, "step": 72200 }, { "epoch": 0.08723958215498058, "learning_rate": 9.748410503598982e-06, "loss": 5.0639105224609375, "step": 72300 }, { "epoch": 0.08736024547746325, "learning_rate": 9.748006668131244e-06, "loss": 5.0563897705078125, "step": 72400 }, { "epoch": 0.08748090879994594, "learning_rate": 9.747602832663506e-06, "loss": 5.087702941894531, "step": 72500 }, { "epoch": 0.08760157212242863, "learning_rate": 9.747198997195766e-06, "loss": 5.096186218261718, "step": 72600 }, { "epoch": 0.08772223544491131, "learning_rate": 9.746795161728028e-06, "loss": 5.075828857421875, "step": 72700 }, { "epoch": 0.087842898767394, "learning_rate": 9.74639132626029e-06, "loss": 5.065995788574218, "step": 72800 }, { "epoch": 0.08796356208987668, "learning_rate": 9.745987490792552e-06, "loss": 5.065982971191406, "step": 72900 }, { "epoch": 0.08808422541235936, "learning_rate": 9.745583655324814e-06, "loss": 5.0935498046875, "step": 73000 }, { "epoch": 0.08820488873484204, "learning_rate": 9.745179819857076e-06, "loss": 5.057830200195313, "step": 73100 }, { "epoch": 0.08832555205732473, "learning_rate": 9.744775984389338e-06, "loss": 5.07429443359375, "step": 73200 }, { "epoch": 0.08844621537980742, "learning_rate": 9.744372148921599e-06, "loss": 5.056070251464844, "step": 73300 }, { "epoch": 0.0885668787022901, "learning_rate": 9.74396831345386e-06, "loss": 5.0279473876953125, "step": 73400 }, { "epoch": 0.08868754202477279, "learning_rate": 9.74356447798612e-06, "loss": 5.027820739746094, "step": 73500 }, { "epoch": 0.08880820534725546, "learning_rate": 9.743160642518383e-06, "loss": 5.057041625976563, "step": 73600 }, { "epoch": 0.08892886866973815, "learning_rate": 9.742756807050645e-06, "loss": 5.04556640625, "step": 73700 }, { "epoch": 0.08904953199222083, "learning_rate": 9.742352971582907e-06, "loss": 5.0384423828125, "step": 73800 }, { "epoch": 0.08917019531470352, "learning_rate": 9.741949136115169e-06, "loss": 5.0619985961914065, "step": 73900 }, { "epoch": 0.08929085863718621, "learning_rate": 9.74154530064743e-06, "loss": 5.019390563964844, "step": 74000 }, { "epoch": 0.0894115219596689, "learning_rate": 9.741141465179691e-06, "loss": 5.043472900390625, "step": 74100 }, { "epoch": 0.08953218528215157, "learning_rate": 9.740737629711953e-06, "loss": 5.038667907714844, "step": 74200 }, { "epoch": 0.08965284860463425, "learning_rate": 9.740333794244215e-06, "loss": 5.0395071411132815, "step": 74300 }, { "epoch": 0.08977351192711694, "learning_rate": 9.739929958776477e-06, "loss": 5.0318997192382815, "step": 74400 }, { "epoch": 0.08989417524959963, "learning_rate": 9.739526123308737e-06, "loss": 5.012469177246094, "step": 74500 }, { "epoch": 0.09001483857208231, "learning_rate": 9.739122287841e-06, "loss": 5.035643005371094, "step": 74600 }, { "epoch": 0.090135501894565, "learning_rate": 9.738718452373261e-06, "loss": 5.027536010742187, "step": 74700 }, { "epoch": 0.09025616521704767, "learning_rate": 9.738314616905523e-06, "loss": 5.043776245117187, "step": 74800 }, { "epoch": 0.09037682853953036, "learning_rate": 9.737910781437783e-06, "loss": 5.01318115234375, "step": 74900 }, { "epoch": 0.09049749186201304, "learning_rate": 9.737506945970045e-06, "loss": 5.0130615234375, "step": 75000 }, { "epoch": 0.09061815518449573, "learning_rate": 9.737103110502307e-06, "loss": 5.016927490234375, "step": 75100 }, { "epoch": 0.09073881850697842, "learning_rate": 9.73669927503457e-06, "loss": 5.021900939941406, "step": 75200 }, { "epoch": 0.0908594818294611, "learning_rate": 9.736295439566831e-06, "loss": 5.039082946777344, "step": 75300 }, { "epoch": 0.09098014515194378, "learning_rate": 9.735891604099092e-06, "loss": 5.025408325195312, "step": 75400 }, { "epoch": 0.09110080847442646, "learning_rate": 9.735487768631354e-06, "loss": 4.999896545410156, "step": 75500 }, { "epoch": 0.09122147179690915, "learning_rate": 9.735083933163616e-06, "loss": 5.0109646606445315, "step": 75600 }, { "epoch": 0.09134213511939183, "learning_rate": 9.734680097695876e-06, "loss": 5.01272705078125, "step": 75700 }, { "epoch": 0.09146279844187452, "learning_rate": 9.734276262228138e-06, "loss": 4.993172302246093, "step": 75800 }, { "epoch": 0.09158346176435721, "learning_rate": 9.7338724267604e-06, "loss": 5.027442321777344, "step": 75900 }, { "epoch": 0.09170412508683988, "learning_rate": 9.733468591292662e-06, "loss": 5.016123046875, "step": 76000 }, { "epoch": 0.09182478840932257, "learning_rate": 9.733064755824924e-06, "loss": 5.013028869628906, "step": 76100 }, { "epoch": 0.09194545173180525, "learning_rate": 9.732660920357186e-06, "loss": 4.973556213378906, "step": 76200 }, { "epoch": 0.09206611505428794, "learning_rate": 9.732257084889448e-06, "loss": 5.0146942138671875, "step": 76300 }, { "epoch": 0.09218677837677063, "learning_rate": 9.731853249421708e-06, "loss": 4.992164611816406, "step": 76400 }, { "epoch": 0.09230744169925331, "learning_rate": 9.73144941395397e-06, "loss": 4.999853210449219, "step": 76500 }, { "epoch": 0.09242810502173598, "learning_rate": 9.73104557848623e-06, "loss": 4.986173706054688, "step": 76600 }, { "epoch": 0.09254876834421867, "learning_rate": 9.730641743018492e-06, "loss": 5.011735534667968, "step": 76700 }, { "epoch": 0.09266943166670136, "learning_rate": 9.730237907550754e-06, "loss": 5.000827941894531, "step": 76800 }, { "epoch": 0.09279009498918404, "learning_rate": 9.729834072083016e-06, "loss": 4.992151489257813, "step": 76900 }, { "epoch": 0.09291075831166673, "learning_rate": 9.729430236615278e-06, "loss": 4.989145812988281, "step": 77000 }, { "epoch": 0.0930314216341494, "learning_rate": 9.72902640114754e-06, "loss": 5.0138681030273435, "step": 77100 }, { "epoch": 0.09315208495663209, "learning_rate": 9.728622565679802e-06, "loss": 4.996145324707031, "step": 77200 }, { "epoch": 0.09327274827911478, "learning_rate": 9.728218730212063e-06, "loss": 4.9842221069335935, "step": 77300 }, { "epoch": 0.09339341160159746, "learning_rate": 9.727814894744325e-06, "loss": 4.972623291015625, "step": 77400 }, { "epoch": 0.09351407492408015, "learning_rate": 9.727411059276587e-06, "loss": 4.973984069824219, "step": 77500 }, { "epoch": 0.09363473824656283, "learning_rate": 9.727007223808847e-06, "loss": 4.984323120117187, "step": 77600 }, { "epoch": 0.09375540156904551, "learning_rate": 9.726603388341109e-06, "loss": 4.98031982421875, "step": 77700 }, { "epoch": 0.0938760648915282, "learning_rate": 9.72619955287337e-06, "loss": 4.959669799804687, "step": 77800 }, { "epoch": 0.09399672821401088, "learning_rate": 9.725795717405633e-06, "loss": 4.968257751464844, "step": 77900 }, { "epoch": 0.09411739153649357, "learning_rate": 9.725391881937895e-06, "loss": 4.966848754882813, "step": 78000 }, { "epoch": 0.09423805485897625, "learning_rate": 9.724988046470157e-06, "loss": 4.976156311035156, "step": 78100 }, { "epoch": 0.09435871818145894, "learning_rate": 9.724584211002417e-06, "loss": 4.9650640869140625, "step": 78200 }, { "epoch": 0.09447938150394161, "learning_rate": 9.724180375534679e-06, "loss": 5.000171203613281, "step": 78300 }, { "epoch": 0.0946000448264243, "learning_rate": 9.723776540066941e-06, "loss": 4.980813903808594, "step": 78400 }, { "epoch": 0.09472070814890698, "learning_rate": 9.723372704599201e-06, "loss": 4.964000854492188, "step": 78500 }, { "epoch": 0.09484137147138967, "learning_rate": 9.722968869131463e-06, "loss": 4.972636108398437, "step": 78600 }, { "epoch": 0.09496203479387236, "learning_rate": 9.722565033663725e-06, "loss": 4.949419555664062, "step": 78700 }, { "epoch": 0.09508269811635504, "learning_rate": 9.722161198195987e-06, "loss": 4.97333740234375, "step": 78800 }, { "epoch": 0.09520336143883772, "learning_rate": 9.72175736272825e-06, "loss": 4.967134704589844, "step": 78900 }, { "epoch": 0.0953240247613204, "learning_rate": 9.72135352726051e-06, "loss": 4.9573486328125, "step": 79000 }, { "epoch": 0.09544468808380309, "learning_rate": 9.720949691792772e-06, "loss": 4.946339111328125, "step": 79100 }, { "epoch": 0.09556535140628578, "learning_rate": 9.720545856325033e-06, "loss": 4.958375244140625, "step": 79200 }, { "epoch": 0.09568601472876846, "learning_rate": 9.720142020857295e-06, "loss": 4.967229919433594, "step": 79300 }, { "epoch": 0.09580667805125115, "learning_rate": 9.719738185389557e-06, "loss": 4.963417358398438, "step": 79400 }, { "epoch": 0.09592734137373382, "learning_rate": 9.719334349921818e-06, "loss": 4.937957153320313, "step": 79500 }, { "epoch": 0.09604800469621651, "learning_rate": 9.71893051445408e-06, "loss": 4.933610534667968, "step": 79600 }, { "epoch": 0.0961686680186992, "learning_rate": 9.718526678986342e-06, "loss": 4.95427978515625, "step": 79700 }, { "epoch": 0.09628933134118188, "learning_rate": 9.718122843518602e-06, "loss": 4.928057250976562, "step": 79800 }, { "epoch": 0.09640999466366457, "learning_rate": 9.717719008050864e-06, "loss": 4.925322875976563, "step": 79900 }, { "epoch": 0.09653065798614725, "learning_rate": 9.717315172583126e-06, "loss": 4.908415222167969, "step": 80000 }, { "epoch": 0.09665132130862993, "learning_rate": 9.716911337115388e-06, "loss": 4.9557421875, "step": 80100 }, { "epoch": 0.09677198463111261, "learning_rate": 9.71650750164765e-06, "loss": 4.940488891601563, "step": 80200 }, { "epoch": 0.0968926479535953, "learning_rate": 9.716103666179912e-06, "loss": 4.938771362304688, "step": 80300 }, { "epoch": 0.09701331127607798, "learning_rate": 9.715699830712174e-06, "loss": 4.942922973632813, "step": 80400 }, { "epoch": 0.09713397459856067, "learning_rate": 9.715295995244434e-06, "loss": 4.9132516479492185, "step": 80500 }, { "epoch": 0.09725463792104336, "learning_rate": 9.714892159776696e-06, "loss": 4.945633239746094, "step": 80600 }, { "epoch": 0.09737530124352603, "learning_rate": 9.714488324308956e-06, "loss": 4.918882141113281, "step": 80700 }, { "epoch": 0.09749596456600872, "learning_rate": 9.714084488841218e-06, "loss": 4.931737060546875, "step": 80800 }, { "epoch": 0.0976166278884914, "learning_rate": 9.71368065337348e-06, "loss": 4.926199951171875, "step": 80900 }, { "epoch": 0.09773729121097409, "learning_rate": 9.713276817905742e-06, "loss": 4.918571472167969, "step": 81000 }, { "epoch": 0.09785795453345678, "learning_rate": 9.712872982438004e-06, "loss": 4.9157711791992185, "step": 81100 }, { "epoch": 0.09797861785593946, "learning_rate": 9.712469146970266e-06, "loss": 4.908008422851562, "step": 81200 }, { "epoch": 0.09809928117842213, "learning_rate": 9.712065311502528e-06, "loss": 4.907994995117187, "step": 81300 }, { "epoch": 0.09821994450090482, "learning_rate": 9.711661476034789e-06, "loss": 4.899029846191406, "step": 81400 }, { "epoch": 0.09834060782338751, "learning_rate": 9.71125764056705e-06, "loss": 4.894893798828125, "step": 81500 }, { "epoch": 0.0984612711458702, "learning_rate": 9.710853805099313e-06, "loss": 4.921471252441406, "step": 81600 }, { "epoch": 0.09858193446835288, "learning_rate": 9.710449969631573e-06, "loss": 4.907397766113281, "step": 81700 }, { "epoch": 0.09870259779083557, "learning_rate": 9.710046134163835e-06, "loss": 4.908330383300782, "step": 81800 }, { "epoch": 0.09882326111331824, "learning_rate": 9.709642298696097e-06, "loss": 4.893409729003906, "step": 81900 }, { "epoch": 0.09894392443580093, "learning_rate": 9.709238463228359e-06, "loss": 4.886049194335937, "step": 82000 }, { "epoch": 0.09906458775828361, "learning_rate": 9.70883462776062e-06, "loss": 4.882464294433594, "step": 82100 }, { "epoch": 0.0991852510807663, "learning_rate": 9.708430792292883e-06, "loss": 4.888573303222656, "step": 82200 }, { "epoch": 0.09930591440324898, "learning_rate": 9.708026956825143e-06, "loss": 4.882120361328125, "step": 82300 }, { "epoch": 0.09942657772573167, "learning_rate": 9.707623121357405e-06, "loss": 4.903425903320312, "step": 82400 }, { "epoch": 0.09954724104821434, "learning_rate": 9.707219285889667e-06, "loss": 4.868942565917969, "step": 82500 }, { "epoch": 0.09966790437069703, "learning_rate": 9.706815450421927e-06, "loss": 4.895352783203125, "step": 82600 }, { "epoch": 0.09978856769317972, "learning_rate": 9.70641161495419e-06, "loss": 4.913453063964844, "step": 82700 }, { "epoch": 0.0999092310156624, "learning_rate": 9.706007779486451e-06, "loss": 4.8864443969726565, "step": 82800 }, { "epoch": 0.10002989433814509, "learning_rate": 9.705603944018713e-06, "loss": 4.874024353027344, "step": 82900 }, { "epoch": 0.10015055766062778, "learning_rate": 9.705200108550975e-06, "loss": 4.913255615234375, "step": 83000 }, { "epoch": 0.10027122098311045, "learning_rate": 9.704796273083236e-06, "loss": 4.861760864257812, "step": 83100 }, { "epoch": 0.10039188430559313, "learning_rate": 9.704392437615498e-06, "loss": 4.886510009765625, "step": 83200 }, { "epoch": 0.10051254762807582, "learning_rate": 9.70398860214776e-06, "loss": 4.860154418945313, "step": 83300 }, { "epoch": 0.10063321095055851, "learning_rate": 9.703584766680022e-06, "loss": 4.873463745117188, "step": 83400 }, { "epoch": 0.1007538742730412, "learning_rate": 9.703180931212283e-06, "loss": 4.890827331542969, "step": 83500 }, { "epoch": 0.10087453759552387, "learning_rate": 9.702777095744544e-06, "loss": 4.879186401367187, "step": 83600 }, { "epoch": 0.10099520091800655, "learning_rate": 9.702373260276806e-06, "loss": 4.876583251953125, "step": 83700 }, { "epoch": 0.10111586424048924, "learning_rate": 9.701969424809068e-06, "loss": 4.86263671875, "step": 83800 }, { "epoch": 0.10123652756297193, "learning_rate": 9.701565589341328e-06, "loss": 4.866602783203125, "step": 83900 }, { "epoch": 0.10135719088545461, "learning_rate": 9.70116175387359e-06, "loss": 4.905928344726562, "step": 84000 }, { "epoch": 0.1014778542079373, "learning_rate": 9.700757918405852e-06, "loss": 4.867268371582031, "step": 84100 }, { "epoch": 0.10159851753041997, "learning_rate": 9.700354082938114e-06, "loss": 4.870028381347656, "step": 84200 }, { "epoch": 0.10171918085290266, "learning_rate": 9.699950247470376e-06, "loss": 4.886224670410156, "step": 84300 }, { "epoch": 0.10183984417538534, "learning_rate": 9.699546412002638e-06, "loss": 4.862721862792969, "step": 84400 }, { "epoch": 0.10196050749786803, "learning_rate": 9.699142576534898e-06, "loss": 4.869748840332031, "step": 84500 }, { "epoch": 0.10208117082035072, "learning_rate": 9.69873874106716e-06, "loss": 4.842414245605469, "step": 84600 }, { "epoch": 0.1022018341428334, "learning_rate": 9.698334905599422e-06, "loss": 4.873136291503906, "step": 84700 }, { "epoch": 0.10232249746531608, "learning_rate": 9.697931070131682e-06, "loss": 4.825064697265625, "step": 84800 }, { "epoch": 0.10244316078779876, "learning_rate": 9.697527234663944e-06, "loss": 4.85788818359375, "step": 84900 }, { "epoch": 0.10256382411028145, "learning_rate": 9.697123399196206e-06, "loss": 4.894467468261719, "step": 85000 }, { "epoch": 0.10268448743276413, "learning_rate": 9.696719563728468e-06, "loss": 4.841428527832031, "step": 85100 }, { "epoch": 0.10280515075524682, "learning_rate": 9.69631572826073e-06, "loss": 4.850602722167968, "step": 85200 }, { "epoch": 0.10292581407772951, "learning_rate": 9.695911892792992e-06, "loss": 4.853901062011719, "step": 85300 }, { "epoch": 0.10304647740021218, "learning_rate": 9.695508057325254e-06, "loss": 4.848119201660157, "step": 85400 }, { "epoch": 0.10316714072269487, "learning_rate": 9.695104221857515e-06, "loss": 4.851161499023437, "step": 85500 }, { "epoch": 0.10328780404517755, "learning_rate": 9.694700386389777e-06, "loss": 4.804761962890625, "step": 85600 }, { "epoch": 0.10340846736766024, "learning_rate": 9.694296550922037e-06, "loss": 4.843150024414062, "step": 85700 }, { "epoch": 0.10352913069014293, "learning_rate": 9.693892715454299e-06, "loss": 4.845422973632813, "step": 85800 }, { "epoch": 0.10364979401262561, "learning_rate": 9.693488879986561e-06, "loss": 4.843452758789063, "step": 85900 }, { "epoch": 0.10377045733510828, "learning_rate": 9.693085044518823e-06, "loss": 4.856632385253906, "step": 86000 }, { "epoch": 0.10389112065759097, "learning_rate": 9.692681209051085e-06, "loss": 4.823756713867187, "step": 86100 }, { "epoch": 0.10401178398007366, "learning_rate": 9.692277373583347e-06, "loss": 4.834161987304688, "step": 86200 }, { "epoch": 0.10413244730255634, "learning_rate": 9.691873538115607e-06, "loss": 4.850711059570313, "step": 86300 }, { "epoch": 0.10425311062503903, "learning_rate": 9.691469702647869e-06, "loss": 4.828718566894532, "step": 86400 }, { "epoch": 0.10437377394752172, "learning_rate": 9.691065867180131e-06, "loss": 4.8225927734375, "step": 86500 }, { "epoch": 0.10449443727000439, "learning_rate": 9.690662031712393e-06, "loss": 4.8287655639648435, "step": 86600 }, { "epoch": 0.10461510059248708, "learning_rate": 9.690258196244653e-06, "loss": 4.809221801757812, "step": 86700 }, { "epoch": 0.10473576391496976, "learning_rate": 9.689854360776915e-06, "loss": 4.803803405761719, "step": 86800 }, { "epoch": 0.10485642723745245, "learning_rate": 9.689450525309177e-06, "loss": 4.820423889160156, "step": 86900 }, { "epoch": 0.10497709055993514, "learning_rate": 9.68904668984144e-06, "loss": 4.808703002929687, "step": 87000 }, { "epoch": 0.10509775388241782, "learning_rate": 9.6886428543737e-06, "loss": 4.8158642578125, "step": 87100 }, { "epoch": 0.1052184172049005, "learning_rate": 9.688239018905962e-06, "loss": 4.816473388671875, "step": 87200 }, { "epoch": 0.10533908052738318, "learning_rate": 9.687835183438224e-06, "loss": 4.785604858398438, "step": 87300 }, { "epoch": 0.10545974384986587, "learning_rate": 9.687431347970486e-06, "loss": 4.79506103515625, "step": 87400 }, { "epoch": 0.10558040717234855, "learning_rate": 9.687027512502748e-06, "loss": 4.809523315429687, "step": 87500 }, { "epoch": 0.10570107049483124, "learning_rate": 9.686623677035008e-06, "loss": 4.778346557617187, "step": 87600 }, { "epoch": 0.10582173381731393, "learning_rate": 9.68621984156727e-06, "loss": 4.822114562988281, "step": 87700 }, { "epoch": 0.1059423971397966, "learning_rate": 9.685816006099532e-06, "loss": 4.785655212402344, "step": 87800 }, { "epoch": 0.10606306046227928, "learning_rate": 9.685412170631794e-06, "loss": 4.827339172363281, "step": 87900 }, { "epoch": 0.10618372378476197, "learning_rate": 9.685008335164054e-06, "loss": 4.80163330078125, "step": 88000 }, { "epoch": 0.10630438710724466, "learning_rate": 9.684604499696316e-06, "loss": 4.787745666503906, "step": 88100 }, { "epoch": 0.10642505042972734, "learning_rate": 9.684200664228578e-06, "loss": 4.800241088867187, "step": 88200 }, { "epoch": 0.10654571375221003, "learning_rate": 9.68379682876084e-06, "loss": 4.812076721191406, "step": 88300 }, { "epoch": 0.1066663770746927, "learning_rate": 9.683392993293102e-06, "loss": 4.784380493164062, "step": 88400 }, { "epoch": 0.10678704039717539, "learning_rate": 9.682989157825364e-06, "loss": 4.791062316894531, "step": 88500 }, { "epoch": 0.10690770371965808, "learning_rate": 9.682585322357624e-06, "loss": 4.775936279296875, "step": 88600 }, { "epoch": 0.10702836704214076, "learning_rate": 9.682181486889886e-06, "loss": 4.784500732421875, "step": 88700 }, { "epoch": 0.10714903036462345, "learning_rate": 9.681777651422147e-06, "loss": 4.803079833984375, "step": 88800 }, { "epoch": 0.10726969368710614, "learning_rate": 9.681373815954409e-06, "loss": 4.794912719726563, "step": 88900 }, { "epoch": 0.10739035700958881, "learning_rate": 9.68096998048667e-06, "loss": 4.7925244140625, "step": 89000 }, { "epoch": 0.1075110203320715, "learning_rate": 9.680566145018932e-06, "loss": 4.777199401855468, "step": 89100 }, { "epoch": 0.10763168365455418, "learning_rate": 9.680162309551194e-06, "loss": 4.778366394042969, "step": 89200 }, { "epoch": 0.10775234697703687, "learning_rate": 9.679758474083456e-06, "loss": 4.776029663085938, "step": 89300 }, { "epoch": 0.10787301029951955, "learning_rate": 9.679354638615718e-06, "loss": 4.753299865722656, "step": 89400 }, { "epoch": 0.10799367362200224, "learning_rate": 9.678950803147979e-06, "loss": 4.788411254882813, "step": 89500 }, { "epoch": 0.10811433694448491, "learning_rate": 9.67854696768024e-06, "loss": 4.8108148193359375, "step": 89600 }, { "epoch": 0.1082350002669676, "learning_rate": 9.678143132212503e-06, "loss": 4.770762634277344, "step": 89700 }, { "epoch": 0.10835566358945029, "learning_rate": 9.677739296744763e-06, "loss": 4.769071350097656, "step": 89800 }, { "epoch": 0.10847632691193297, "learning_rate": 9.677335461277025e-06, "loss": 4.78750244140625, "step": 89900 }, { "epoch": 0.10859699023441566, "learning_rate": 9.676931625809287e-06, "loss": 4.77056640625, "step": 90000 }, { "epoch": 0.10871765355689833, "learning_rate": 9.676527790341549e-06, "loss": 4.7862374877929685, "step": 90100 }, { "epoch": 0.10883831687938102, "learning_rate": 9.676123954873811e-06, "loss": 4.737091674804687, "step": 90200 }, { "epoch": 0.1089589802018637, "learning_rate": 9.675720119406073e-06, "loss": 4.722448425292969, "step": 90300 }, { "epoch": 0.10907964352434639, "learning_rate": 9.675316283938333e-06, "loss": 4.7578128051757815, "step": 90400 }, { "epoch": 0.10920030684682908, "learning_rate": 9.674912448470595e-06, "loss": 4.75033447265625, "step": 90500 }, { "epoch": 0.10932097016931176, "learning_rate": 9.674508613002857e-06, "loss": 4.728914794921875, "step": 90600 }, { "epoch": 0.10944163349179444, "learning_rate": 9.674104777535117e-06, "loss": 4.737483520507812, "step": 90700 }, { "epoch": 0.10956229681427712, "learning_rate": 9.67370094206738e-06, "loss": 4.750766906738281, "step": 90800 }, { "epoch": 0.10968296013675981, "learning_rate": 9.673297106599641e-06, "loss": 4.759916687011719, "step": 90900 }, { "epoch": 0.1098036234592425, "learning_rate": 9.672893271131903e-06, "loss": 4.754288635253906, "step": 91000 }, { "epoch": 0.10992428678172518, "learning_rate": 9.672489435664165e-06, "loss": 4.7359814453125, "step": 91100 }, { "epoch": 0.11004495010420787, "learning_rate": 9.672085600196426e-06, "loss": 4.7439111328125, "step": 91200 }, { "epoch": 0.11016561342669054, "learning_rate": 9.671681764728688e-06, "loss": 4.73325927734375, "step": 91300 }, { "epoch": 0.11028627674917323, "learning_rate": 9.67127792926095e-06, "loss": 4.771037902832031, "step": 91400 }, { "epoch": 0.11040694007165591, "learning_rate": 9.670874093793212e-06, "loss": 4.7424014282226565, "step": 91500 }, { "epoch": 0.1105276033941386, "learning_rate": 9.670470258325474e-06, "loss": 4.757178955078125, "step": 91600 }, { "epoch": 0.11064826671662129, "learning_rate": 9.670066422857734e-06, "loss": 4.728418884277343, "step": 91700 }, { "epoch": 0.11076893003910397, "learning_rate": 9.669662587389996e-06, "loss": 4.741020202636719, "step": 91800 }, { "epoch": 0.11088959336158664, "learning_rate": 9.669258751922258e-06, "loss": 4.755391845703125, "step": 91900 }, { "epoch": 0.11101025668406933, "learning_rate": 9.668854916454518e-06, "loss": 4.733238830566406, "step": 92000 }, { "epoch": 0.11113092000655202, "learning_rate": 9.66845108098678e-06, "loss": 4.754249877929688, "step": 92100 }, { "epoch": 0.1112515833290347, "learning_rate": 9.668047245519042e-06, "loss": 4.741124877929687, "step": 92200 }, { "epoch": 0.11137224665151739, "learning_rate": 9.667643410051304e-06, "loss": 4.741844787597656, "step": 92300 }, { "epoch": 0.11149290997400008, "learning_rate": 9.667239574583566e-06, "loss": 4.70602294921875, "step": 92400 }, { "epoch": 0.11161357329648275, "learning_rate": 9.666835739115828e-06, "loss": 4.732904357910156, "step": 92500 }, { "epoch": 0.11173423661896544, "learning_rate": 9.666431903648088e-06, "loss": 4.720787353515625, "step": 92600 }, { "epoch": 0.11185489994144812, "learning_rate": 9.66602806818035e-06, "loss": 4.731036987304687, "step": 92700 }, { "epoch": 0.11197556326393081, "learning_rate": 9.665624232712612e-06, "loss": 4.728709716796875, "step": 92800 }, { "epoch": 0.1120962265864135, "learning_rate": 9.665220397244873e-06, "loss": 4.719226989746094, "step": 92900 }, { "epoch": 0.11221688990889618, "learning_rate": 9.664816561777135e-06, "loss": 4.7157666015625, "step": 93000 }, { "epoch": 0.11233755323137885, "learning_rate": 9.664412726309397e-06, "loss": 4.7111337280273435, "step": 93100 }, { "epoch": 0.11245821655386154, "learning_rate": 9.664008890841659e-06, "loss": 4.713517150878906, "step": 93200 }, { "epoch": 0.11257887987634423, "learning_rate": 9.66360505537392e-06, "loss": 4.706962585449219, "step": 93300 }, { "epoch": 0.11269954319882691, "learning_rate": 9.663201219906182e-06, "loss": 4.721396484375, "step": 93400 }, { "epoch": 0.1128202065213096, "learning_rate": 9.662797384438444e-06, "loss": 4.731193237304687, "step": 93500 }, { "epoch": 0.11294086984379229, "learning_rate": 9.662393548970705e-06, "loss": 4.722343139648437, "step": 93600 }, { "epoch": 0.11306153316627496, "learning_rate": 9.661989713502967e-06, "loss": 4.701794128417969, "step": 93700 }, { "epoch": 0.11318219648875764, "learning_rate": 9.661585878035227e-06, "loss": 4.6912774658203125, "step": 93800 }, { "epoch": 0.11330285981124033, "learning_rate": 9.661182042567489e-06, "loss": 4.714636535644531, "step": 93900 }, { "epoch": 0.11342352313372302, "learning_rate": 9.660778207099751e-06, "loss": 4.71160888671875, "step": 94000 }, { "epoch": 0.1135441864562057, "learning_rate": 9.660374371632013e-06, "loss": 4.710344848632812, "step": 94100 }, { "epoch": 0.11366484977868839, "learning_rate": 9.659970536164275e-06, "loss": 4.702177429199219, "step": 94200 }, { "epoch": 0.11378551310117106, "learning_rate": 9.659566700696537e-06, "loss": 4.699169006347656, "step": 94300 }, { "epoch": 0.11390617642365375, "learning_rate": 9.659162865228799e-06, "loss": 4.69635986328125, "step": 94400 }, { "epoch": 0.11402683974613644, "learning_rate": 9.65875902976106e-06, "loss": 4.693934936523437, "step": 94500 }, { "epoch": 0.11414750306861912, "learning_rate": 9.658355194293321e-06, "loss": 4.700142211914063, "step": 94600 }, { "epoch": 0.11426816639110181, "learning_rate": 9.657951358825583e-06, "loss": 4.660438537597656, "step": 94700 }, { "epoch": 0.1143888297135845, "learning_rate": 9.657547523357843e-06, "loss": 4.706804809570312, "step": 94800 }, { "epoch": 0.11450949303606717, "learning_rate": 9.657143687890105e-06, "loss": 4.686411437988281, "step": 94900 }, { "epoch": 0.11463015635854985, "learning_rate": 9.656739852422367e-06, "loss": 4.704990234375, "step": 95000 }, { "epoch": 0.11475081968103254, "learning_rate": 9.65633601695463e-06, "loss": 4.678945617675781, "step": 95100 }, { "epoch": 0.11487148300351523, "learning_rate": 9.655932181486891e-06, "loss": 4.6987918090820315, "step": 95200 }, { "epoch": 0.11499214632599791, "learning_rate": 9.655528346019152e-06, "loss": 4.716113586425781, "step": 95300 }, { "epoch": 0.1151128096484806, "learning_rate": 9.655124510551414e-06, "loss": 4.678018188476562, "step": 95400 }, { "epoch": 0.11523347297096327, "learning_rate": 9.654720675083676e-06, "loss": 4.681973266601562, "step": 95500 }, { "epoch": 0.11535413629344596, "learning_rate": 9.654316839615938e-06, "loss": 4.708043212890625, "step": 95600 }, { "epoch": 0.11547479961592864, "learning_rate": 9.6539130041482e-06, "loss": 4.685238342285157, "step": 95700 }, { "epoch": 0.11559546293841133, "learning_rate": 9.65350916868046e-06, "loss": 4.6925115966796875, "step": 95800 }, { "epoch": 0.11571612626089402, "learning_rate": 9.653105333212722e-06, "loss": 4.63882568359375, "step": 95900 }, { "epoch": 0.1158367895833767, "learning_rate": 9.652701497744984e-06, "loss": 4.678868103027344, "step": 96000 }, { "epoch": 0.11595745290585938, "learning_rate": 9.652297662277244e-06, "loss": 4.679849243164062, "step": 96100 }, { "epoch": 0.11607811622834206, "learning_rate": 9.651893826809506e-06, "loss": 4.697474060058593, "step": 96200 }, { "epoch": 0.11619877955082475, "learning_rate": 9.651489991341768e-06, "loss": 4.663589782714844, "step": 96300 }, { "epoch": 0.11631944287330744, "learning_rate": 9.65108615587403e-06, "loss": 4.677477416992187, "step": 96400 }, { "epoch": 0.11644010619579012, "learning_rate": 9.650682320406292e-06, "loss": 4.647117309570312, "step": 96500 }, { "epoch": 0.1165607695182728, "learning_rate": 9.650278484938554e-06, "loss": 4.643777465820312, "step": 96600 }, { "epoch": 0.11668143284075548, "learning_rate": 9.649874649470814e-06, "loss": 4.6652224731445315, "step": 96700 }, { "epoch": 0.11680209616323817, "learning_rate": 9.649470814003076e-06, "loss": 4.657362060546875, "step": 96800 }, { "epoch": 0.11692275948572085, "learning_rate": 9.649066978535338e-06, "loss": 4.674615173339844, "step": 96900 }, { "epoch": 0.11704342280820354, "learning_rate": 9.648663143067599e-06, "loss": 4.679769592285156, "step": 97000 }, { "epoch": 0.11716408613068623, "learning_rate": 9.64825930759986e-06, "loss": 4.653609619140625, "step": 97100 }, { "epoch": 0.1172847494531689, "learning_rate": 9.647855472132123e-06, "loss": 4.664938354492188, "step": 97200 }, { "epoch": 0.11740541277565159, "learning_rate": 9.647451636664385e-06, "loss": 4.677825927734375, "step": 97300 }, { "epoch": 0.11752607609813427, "learning_rate": 9.647047801196647e-06, "loss": 4.654386596679688, "step": 97400 }, { "epoch": 0.11764673942061696, "learning_rate": 9.646643965728909e-06, "loss": 4.682733154296875, "step": 97500 }, { "epoch": 0.11776740274309964, "learning_rate": 9.64624013026117e-06, "loss": 4.636017761230469, "step": 97600 }, { "epoch": 0.11788806606558233, "learning_rate": 9.64583629479343e-06, "loss": 4.643951416015625, "step": 97700 }, { "epoch": 0.118008729388065, "learning_rate": 9.645432459325693e-06, "loss": 4.623200378417969, "step": 97800 }, { "epoch": 0.11812939271054769, "learning_rate": 9.645028623857953e-06, "loss": 4.645050964355469, "step": 97900 }, { "epoch": 0.11825005603303038, "learning_rate": 9.644624788390215e-06, "loss": 4.64683349609375, "step": 98000 }, { "epoch": 0.11837071935551306, "learning_rate": 9.644220952922477e-06, "loss": 4.662095031738281, "step": 98100 }, { "epoch": 0.11849138267799575, "learning_rate": 9.643817117454739e-06, "loss": 4.666967468261719, "step": 98200 }, { "epoch": 0.11861204600047844, "learning_rate": 9.643413281987001e-06, "loss": 4.644697875976562, "step": 98300 }, { "epoch": 0.11873270932296111, "learning_rate": 9.643009446519263e-06, "loss": 4.6283261108398435, "step": 98400 }, { "epoch": 0.1188533726454438, "learning_rate": 9.642605611051525e-06, "loss": 4.625231628417969, "step": 98500 }, { "epoch": 0.11897403596792648, "learning_rate": 9.642201775583785e-06, "loss": 4.631438598632813, "step": 98600 }, { "epoch": 0.11909469929040917, "learning_rate": 9.641797940116047e-06, "loss": 4.632507934570312, "step": 98700 }, { "epoch": 0.11921536261289185, "learning_rate": 9.64139410464831e-06, "loss": 4.62410400390625, "step": 98800 }, { "epoch": 0.11933602593537454, "learning_rate": 9.64099026918057e-06, "loss": 4.644050598144531, "step": 98900 }, { "epoch": 0.11945668925785721, "learning_rate": 9.640586433712831e-06, "loss": 4.642160034179687, "step": 99000 }, { "epoch": 0.1195773525803399, "learning_rate": 9.640182598245093e-06, "loss": 4.639566345214844, "step": 99100 }, { "epoch": 0.11969801590282259, "learning_rate": 9.639778762777355e-06, "loss": 4.6316439819335935, "step": 99200 }, { "epoch": 0.11981867922530527, "learning_rate": 9.639374927309617e-06, "loss": 4.651192321777343, "step": 99300 }, { "epoch": 0.11993934254778796, "learning_rate": 9.638971091841878e-06, "loss": 4.610224609375, "step": 99400 }, { "epoch": 0.12006000587027064, "learning_rate": 9.63856725637414e-06, "loss": 4.625392761230469, "step": 99500 }, { "epoch": 0.12018066919275332, "learning_rate": 9.638163420906402e-06, "loss": 4.602829895019531, "step": 99600 }, { "epoch": 0.120301332515236, "learning_rate": 9.637759585438664e-06, "loss": 4.594230041503907, "step": 99700 }, { "epoch": 0.12042199583771869, "learning_rate": 9.637355749970924e-06, "loss": 4.585758361816406, "step": 99800 }, { "epoch": 0.12054265916020138, "learning_rate": 9.636951914503186e-06, "loss": 4.6115719604492185, "step": 99900 }, { "epoch": 0.12066332248268406, "learning_rate": 9.636548079035448e-06, "loss": 4.627333068847657, "step": 100000 }, { "epoch": 0.12078398580516675, "learning_rate": 9.63614424356771e-06, "loss": 4.614095153808594, "step": 100100 }, { "epoch": 0.12090464912764942, "learning_rate": 9.63574040809997e-06, "loss": 4.606982421875, "step": 100200 }, { "epoch": 0.12102531245013211, "learning_rate": 9.635336572632232e-06, "loss": 4.619635009765625, "step": 100300 }, { "epoch": 0.1211459757726148, "learning_rate": 9.634932737164494e-06, "loss": 4.618819580078125, "step": 100400 }, { "epoch": 0.12126663909509748, "learning_rate": 9.634528901696756e-06, "loss": 4.615993041992187, "step": 100500 }, { "epoch": 0.12138730241758017, "learning_rate": 9.634125066229018e-06, "loss": 4.600937194824219, "step": 100600 }, { "epoch": 0.12150796574006285, "learning_rate": 9.63372123076128e-06, "loss": 4.617173156738281, "step": 100700 }, { "epoch": 0.12162862906254553, "learning_rate": 9.63331739529354e-06, "loss": 4.597644348144531, "step": 100800 }, { "epoch": 0.12174929238502821, "learning_rate": 9.632913559825802e-06, "loss": 4.587833862304688, "step": 100900 }, { "epoch": 0.1218699557075109, "learning_rate": 9.632509724358063e-06, "loss": 4.642342529296875, "step": 101000 }, { "epoch": 0.12199061902999359, "learning_rate": 9.632105888890325e-06, "loss": 4.589096984863281, "step": 101100 }, { "epoch": 0.12211128235247627, "learning_rate": 9.631702053422587e-06, "loss": 4.626454467773438, "step": 101200 }, { "epoch": 0.12223194567495896, "learning_rate": 9.631298217954849e-06, "loss": 4.596427917480469, "step": 101300 }, { "epoch": 0.12235260899744163, "learning_rate": 9.63089438248711e-06, "loss": 4.597868347167969, "step": 101400 }, { "epoch": 0.12247327231992432, "learning_rate": 9.630490547019373e-06, "loss": 4.6363897705078125, "step": 101500 }, { "epoch": 0.122593935642407, "learning_rate": 9.630086711551635e-06, "loss": 4.584929809570313, "step": 101600 }, { "epoch": 0.12271459896488969, "learning_rate": 9.629682876083895e-06, "loss": 4.581707153320313, "step": 101700 }, { "epoch": 0.12283526228737238, "learning_rate": 9.629279040616157e-06, "loss": 4.606552734375, "step": 101800 }, { "epoch": 0.12295592560985506, "learning_rate": 9.628875205148419e-06, "loss": 4.596510009765625, "step": 101900 }, { "epoch": 0.12307658893233774, "learning_rate": 9.628471369680679e-06, "loss": 4.600588684082031, "step": 102000 }, { "epoch": 0.12319725225482042, "learning_rate": 9.628067534212941e-06, "loss": 4.584922790527344, "step": 102100 }, { "epoch": 0.12331791557730311, "learning_rate": 9.627663698745203e-06, "loss": 4.573536071777344, "step": 102200 }, { "epoch": 0.1234385788997858, "learning_rate": 9.627259863277465e-06, "loss": 4.591594543457031, "step": 102300 }, { "epoch": 0.12355924222226848, "learning_rate": 9.626856027809727e-06, "loss": 4.5871514892578125, "step": 102400 }, { "epoch": 0.12367990554475117, "learning_rate": 9.626452192341989e-06, "loss": 4.576618957519531, "step": 102500 }, { "epoch": 0.12380056886723384, "learning_rate": 9.62604835687425e-06, "loss": 4.589746704101563, "step": 102600 }, { "epoch": 0.12392123218971653, "learning_rate": 9.625644521406511e-06, "loss": 4.559208374023438, "step": 102700 }, { "epoch": 0.12404189551219921, "learning_rate": 9.625240685938773e-06, "loss": 4.580867919921875, "step": 102800 }, { "epoch": 0.1241625588346819, "learning_rate": 9.624836850471034e-06, "loss": 4.589192199707031, "step": 102900 }, { "epoch": 0.12428322215716459, "learning_rate": 9.624433015003296e-06, "loss": 4.562888793945312, "step": 103000 }, { "epoch": 0.12440388547964726, "learning_rate": 9.624029179535558e-06, "loss": 4.571641540527343, "step": 103100 }, { "epoch": 0.12452454880212994, "learning_rate": 9.62362534406782e-06, "loss": 4.557775573730469, "step": 103200 }, { "epoch": 0.12464521212461263, "learning_rate": 9.623221508600081e-06, "loss": 4.56920654296875, "step": 103300 }, { "epoch": 0.12476587544709532, "learning_rate": 9.622817673132343e-06, "loss": 4.5724484252929685, "step": 103400 }, { "epoch": 0.124886538769578, "learning_rate": 9.622413837664604e-06, "loss": 4.571834716796875, "step": 103500 }, { "epoch": 0.12500720209206068, "learning_rate": 9.622010002196866e-06, "loss": 4.554250793457031, "step": 103600 }, { "epoch": 0.12512786541454338, "learning_rate": 9.621606166729128e-06, "loss": 4.5702078247070315, "step": 103700 }, { "epoch": 0.12524852873702605, "learning_rate": 9.62120233126139e-06, "loss": 4.584476013183593, "step": 103800 }, { "epoch": 0.12536919205950875, "learning_rate": 9.62079849579365e-06, "loss": 4.565232849121093, "step": 103900 }, { "epoch": 0.12548985538199142, "learning_rate": 9.620394660325912e-06, "loss": 4.563414001464844, "step": 104000 }, { "epoch": 0.1256105187044741, "learning_rate": 9.619990824858174e-06, "loss": 4.559494323730469, "step": 104100 }, { "epoch": 0.1257311820269568, "learning_rate": 9.619586989390436e-06, "loss": 4.534017944335938, "step": 104200 }, { "epoch": 0.12585184534943947, "learning_rate": 9.619183153922696e-06, "loss": 4.578702392578125, "step": 104300 }, { "epoch": 0.12597250867192217, "learning_rate": 9.618779318454958e-06, "loss": 4.575626831054688, "step": 104400 }, { "epoch": 0.12609317199440484, "learning_rate": 9.61837548298722e-06, "loss": 4.5360650634765625, "step": 104500 }, { "epoch": 0.1262138353168875, "learning_rate": 9.617971647519482e-06, "loss": 4.535835266113281, "step": 104600 }, { "epoch": 0.1263344986393702, "learning_rate": 9.617567812051744e-06, "loss": 4.560310363769531, "step": 104700 }, { "epoch": 0.12645516196185289, "learning_rate": 9.617163976584004e-06, "loss": 4.557838439941406, "step": 104800 }, { "epoch": 0.12657582528433559, "learning_rate": 9.616760141116266e-06, "loss": 4.553232727050781, "step": 104900 }, { "epoch": 0.12669648860681826, "learning_rate": 9.616356305648528e-06, "loss": 4.531650085449218, "step": 105000 }, { "epoch": 0.12681715192930096, "learning_rate": 9.615952470180789e-06, "loss": 4.5613400268554685, "step": 105100 }, { "epoch": 0.12693781525178363, "learning_rate": 9.61554863471305e-06, "loss": 4.540119018554687, "step": 105200 }, { "epoch": 0.1270584785742663, "learning_rate": 9.615144799245313e-06, "loss": 4.541902465820312, "step": 105300 }, { "epoch": 0.127179141896749, "learning_rate": 9.614740963777575e-06, "loss": 4.54156005859375, "step": 105400 }, { "epoch": 0.12729980521923168, "learning_rate": 9.614337128309837e-06, "loss": 4.518712158203125, "step": 105500 }, { "epoch": 0.12742046854171438, "learning_rate": 9.613933292842099e-06, "loss": 4.5665869140625, "step": 105600 }, { "epoch": 0.12754113186419705, "learning_rate": 9.61352945737436e-06, "loss": 4.523365783691406, "step": 105700 }, { "epoch": 0.12766179518667972, "learning_rate": 9.613125621906621e-06, "loss": 4.531428833007812, "step": 105800 }, { "epoch": 0.12778245850916242, "learning_rate": 9.612721786438883e-06, "loss": 4.523320007324219, "step": 105900 }, { "epoch": 0.1279031218316451, "learning_rate": 9.612317950971143e-06, "loss": 4.526325073242187, "step": 106000 }, { "epoch": 0.1280237851541278, "learning_rate": 9.611914115503405e-06, "loss": 4.555354919433594, "step": 106100 }, { "epoch": 0.12814444847661047, "learning_rate": 9.611510280035667e-06, "loss": 4.529878845214844, "step": 106200 }, { "epoch": 0.12826511179909317, "learning_rate": 9.611106444567929e-06, "loss": 4.527799987792969, "step": 106300 }, { "epoch": 0.12838577512157584, "learning_rate": 9.610702609100191e-06, "loss": 4.535277099609375, "step": 106400 }, { "epoch": 0.1285064384440585, "learning_rate": 9.610298773632453e-06, "loss": 4.510034790039063, "step": 106500 }, { "epoch": 0.1286271017665412, "learning_rate": 9.609894938164715e-06, "loss": 4.517027587890625, "step": 106600 }, { "epoch": 0.12874776508902389, "learning_rate": 9.609491102696975e-06, "loss": 4.513541259765625, "step": 106700 }, { "epoch": 0.12886842841150659, "learning_rate": 9.609087267229237e-06, "loss": 4.532938537597656, "step": 106800 }, { "epoch": 0.12898909173398926, "learning_rate": 9.6086834317615e-06, "loss": 4.523807067871093, "step": 106900 }, { "epoch": 0.12910975505647193, "learning_rate": 9.60827959629376e-06, "loss": 4.536944274902344, "step": 107000 }, { "epoch": 0.12923041837895463, "learning_rate": 9.607875760826022e-06, "loss": 4.547731323242187, "step": 107100 }, { "epoch": 0.1293510817014373, "learning_rate": 9.607471925358284e-06, "loss": 4.500527954101562, "step": 107200 }, { "epoch": 0.12947174502392, "learning_rate": 9.607068089890546e-06, "loss": 4.509184875488281, "step": 107300 }, { "epoch": 0.12959240834640268, "learning_rate": 9.606664254422808e-06, "loss": 4.506120300292968, "step": 107400 }, { "epoch": 0.12971307166888538, "learning_rate": 9.606260418955068e-06, "loss": 4.5154855346679685, "step": 107500 }, { "epoch": 0.12983373499136805, "learning_rate": 9.60585658348733e-06, "loss": 4.532999267578125, "step": 107600 }, { "epoch": 0.12995439831385072, "learning_rate": 9.605452748019592e-06, "loss": 4.532502136230469, "step": 107700 }, { "epoch": 0.13007506163633342, "learning_rate": 9.605048912551854e-06, "loss": 4.498631591796875, "step": 107800 }, { "epoch": 0.1301957249588161, "learning_rate": 9.604645077084114e-06, "loss": 4.540263977050781, "step": 107900 }, { "epoch": 0.1303163882812988, "learning_rate": 9.604241241616376e-06, "loss": 4.516459045410156, "step": 108000 }, { "epoch": 0.13043705160378147, "learning_rate": 9.603837406148638e-06, "loss": 4.507551574707032, "step": 108100 }, { "epoch": 0.13055771492626414, "learning_rate": 9.6034335706809e-06, "loss": 4.481290588378906, "step": 108200 }, { "epoch": 0.13067837824874684, "learning_rate": 9.603029735213162e-06, "loss": 4.516636047363281, "step": 108300 }, { "epoch": 0.1307990415712295, "learning_rate": 9.602625899745422e-06, "loss": 4.498446655273438, "step": 108400 }, { "epoch": 0.1309197048937122, "learning_rate": 9.602222064277684e-06, "loss": 4.496758117675781, "step": 108500 }, { "epoch": 0.13104036821619489, "learning_rate": 9.601818228809946e-06, "loss": 4.514501037597657, "step": 108600 }, { "epoch": 0.13116103153867759, "learning_rate": 9.601414393342208e-06, "loss": 4.525939331054688, "step": 108700 }, { "epoch": 0.13128169486116026, "learning_rate": 9.60101055787447e-06, "loss": 4.491955261230469, "step": 108800 }, { "epoch": 0.13140235818364293, "learning_rate": 9.60060672240673e-06, "loss": 4.504250183105468, "step": 108900 }, { "epoch": 0.13152302150612563, "learning_rate": 9.600202886938992e-06, "loss": 4.5038973999023435, "step": 109000 }, { "epoch": 0.1316436848286083, "learning_rate": 9.599799051471254e-06, "loss": 4.478483581542969, "step": 109100 }, { "epoch": 0.131764348151091, "learning_rate": 9.599395216003515e-06, "loss": 4.497598876953125, "step": 109200 }, { "epoch": 0.13188501147357368, "learning_rate": 9.598991380535777e-06, "loss": 4.518112487792969, "step": 109300 }, { "epoch": 0.13200567479605635, "learning_rate": 9.598587545068039e-06, "loss": 4.495831298828125, "step": 109400 }, { "epoch": 0.13212633811853905, "learning_rate": 9.5981837096003e-06, "loss": 4.465983581542969, "step": 109500 }, { "epoch": 0.13224700144102172, "learning_rate": 9.597779874132563e-06, "loss": 4.517566528320312, "step": 109600 }, { "epoch": 0.13236766476350442, "learning_rate": 9.597376038664825e-06, "loss": 4.489622192382813, "step": 109700 }, { "epoch": 0.1324883280859871, "learning_rate": 9.596972203197087e-06, "loss": 4.4957275390625, "step": 109800 }, { "epoch": 0.13260899140846977, "learning_rate": 9.596568367729347e-06, "loss": 4.512953491210937, "step": 109900 }, { "epoch": 0.13272965473095247, "learning_rate": 9.596164532261609e-06, "loss": 4.487915649414062, "step": 110000 }, { "epoch": 0.13285031805343514, "learning_rate": 9.59576069679387e-06, "loss": 4.477689514160156, "step": 110100 }, { "epoch": 0.13297098137591784, "learning_rate": 9.595356861326131e-06, "loss": 4.457083740234375, "step": 110200 }, { "epoch": 0.1330916446984005, "learning_rate": 9.594953025858393e-06, "loss": 4.4653662109375, "step": 110300 }, { "epoch": 0.1332123080208832, "learning_rate": 9.594549190390655e-06, "loss": 4.469291687011719, "step": 110400 }, { "epoch": 0.13333297134336589, "learning_rate": 9.594145354922917e-06, "loss": 4.486278381347656, "step": 110500 }, { "epoch": 0.13345363466584856, "learning_rate": 9.593741519455179e-06, "loss": 4.490919189453125, "step": 110600 }, { "epoch": 0.13357429798833126, "learning_rate": 9.593337683987441e-06, "loss": 4.4483575439453125, "step": 110700 }, { "epoch": 0.13369496131081393, "learning_rate": 9.592933848519701e-06, "loss": 4.45943359375, "step": 110800 }, { "epoch": 0.13381562463329663, "learning_rate": 9.592530013051963e-06, "loss": 4.465886535644532, "step": 110900 }, { "epoch": 0.1339362879557793, "learning_rate": 9.592126177584225e-06, "loss": 4.440640563964844, "step": 111000 }, { "epoch": 0.13405695127826198, "learning_rate": 9.591722342116486e-06, "loss": 4.476104736328125, "step": 111100 }, { "epoch": 0.13417761460074468, "learning_rate": 9.591318506648748e-06, "loss": 4.466950988769531, "step": 111200 }, { "epoch": 0.13429827792322735, "learning_rate": 9.59091467118101e-06, "loss": 4.44192138671875, "step": 111300 }, { "epoch": 0.13441894124571005, "learning_rate": 9.590510835713272e-06, "loss": 4.460939331054687, "step": 111400 }, { "epoch": 0.13453960456819272, "learning_rate": 9.590107000245534e-06, "loss": 4.462611083984375, "step": 111500 }, { "epoch": 0.13466026789067542, "learning_rate": 9.589703164777794e-06, "loss": 4.46771484375, "step": 111600 }, { "epoch": 0.1347809312131581, "learning_rate": 9.589299329310056e-06, "loss": 4.469099731445312, "step": 111700 }, { "epoch": 0.13490159453564077, "learning_rate": 9.588895493842318e-06, "loss": 4.476997985839843, "step": 111800 }, { "epoch": 0.13502225785812347, "learning_rate": 9.58849165837458e-06, "loss": 4.453414001464844, "step": 111900 }, { "epoch": 0.13514292118060614, "learning_rate": 9.58808782290684e-06, "loss": 4.475471496582031, "step": 112000 }, { "epoch": 0.13526358450308884, "learning_rate": 9.587683987439102e-06, "loss": 4.473577575683594, "step": 112100 }, { "epoch": 0.1353842478255715, "learning_rate": 9.587280151971364e-06, "loss": 4.458526000976563, "step": 112200 }, { "epoch": 0.13550491114805419, "learning_rate": 9.586876316503626e-06, "loss": 4.440609436035157, "step": 112300 }, { "epoch": 0.13562557447053689, "learning_rate": 9.586472481035886e-06, "loss": 4.463949584960938, "step": 112400 }, { "epoch": 0.13574623779301956, "learning_rate": 9.586068645568148e-06, "loss": 4.4455328369140625, "step": 112500 }, { "epoch": 0.13586690111550226, "learning_rate": 9.58566481010041e-06, "loss": 4.45734375, "step": 112600 }, { "epoch": 0.13598756443798493, "learning_rate": 9.585260974632672e-06, "loss": 4.432592468261719, "step": 112700 }, { "epoch": 0.13610822776046763, "learning_rate": 9.584857139164934e-06, "loss": 4.418620910644531, "step": 112800 }, { "epoch": 0.1362288910829503, "learning_rate": 9.584453303697196e-06, "loss": 4.41904052734375, "step": 112900 }, { "epoch": 0.13634955440543298, "learning_rate": 9.584049468229456e-06, "loss": 4.441593017578125, "step": 113000 }, { "epoch": 0.13647021772791568, "learning_rate": 9.583645632761718e-06, "loss": 4.4470431518554685, "step": 113100 }, { "epoch": 0.13659088105039835, "learning_rate": 9.58324179729398e-06, "loss": 4.4390283203125, "step": 113200 }, { "epoch": 0.13671154437288105, "learning_rate": 9.58283796182624e-06, "loss": 4.445567321777344, "step": 113300 }, { "epoch": 0.13683220769536372, "learning_rate": 9.582434126358503e-06, "loss": 4.437692565917969, "step": 113400 }, { "epoch": 0.1369528710178464, "learning_rate": 9.582030290890765e-06, "loss": 4.465968322753906, "step": 113500 }, { "epoch": 0.1370735343403291, "learning_rate": 9.581626455423027e-06, "loss": 4.4066619873046875, "step": 113600 }, { "epoch": 0.13719419766281177, "learning_rate": 9.581222619955289e-06, "loss": 4.454749755859375, "step": 113700 }, { "epoch": 0.13731486098529447, "learning_rate": 9.58081878448755e-06, "loss": 4.4673834228515625, "step": 113800 }, { "epoch": 0.13743552430777714, "learning_rate": 9.580414949019811e-06, "loss": 4.453739318847656, "step": 113900 }, { "epoch": 0.13755618763025984, "learning_rate": 9.580011113552073e-06, "loss": 4.429642639160156, "step": 114000 }, { "epoch": 0.1376768509527425, "learning_rate": 9.579607278084335e-06, "loss": 4.4275906372070315, "step": 114100 }, { "epoch": 0.13779751427522519, "learning_rate": 9.579203442616595e-06, "loss": 4.430051879882813, "step": 114200 }, { "epoch": 0.13791817759770789, "learning_rate": 9.578799607148857e-06, "loss": 4.434742126464844, "step": 114300 }, { "epoch": 0.13803884092019056, "learning_rate": 9.57839577168112e-06, "loss": 4.432896423339844, "step": 114400 }, { "epoch": 0.13815950424267326, "learning_rate": 9.577991936213381e-06, "loss": 4.445202331542969, "step": 114500 }, { "epoch": 0.13828016756515593, "learning_rate": 9.577588100745643e-06, "loss": 4.4600350952148435, "step": 114600 }, { "epoch": 0.1384008308876386, "learning_rate": 9.577184265277905e-06, "loss": 4.4270016479492185, "step": 114700 }, { "epoch": 0.1385214942101213, "learning_rate": 9.576780429810167e-06, "loss": 4.434621887207031, "step": 114800 }, { "epoch": 0.13864215753260398, "learning_rate": 9.576376594342427e-06, "loss": 4.406890869140625, "step": 114900 }, { "epoch": 0.13876282085508668, "learning_rate": 9.57597275887469e-06, "loss": 4.410062866210938, "step": 115000 }, { "epoch": 0.13888348417756935, "learning_rate": 9.57556892340695e-06, "loss": 4.430516357421875, "step": 115100 }, { "epoch": 0.13900414750005205, "learning_rate": 9.575165087939212e-06, "loss": 4.400594787597656, "step": 115200 }, { "epoch": 0.13912481082253472, "learning_rate": 9.574761252471474e-06, "loss": 4.425685424804687, "step": 115300 }, { "epoch": 0.1392454741450174, "learning_rate": 9.574357417003736e-06, "loss": 4.393196105957031, "step": 115400 }, { "epoch": 0.1393661374675001, "learning_rate": 9.573953581535998e-06, "loss": 4.400187683105469, "step": 115500 }, { "epoch": 0.13948680078998277, "learning_rate": 9.57354974606826e-06, "loss": 4.415928649902344, "step": 115600 }, { "epoch": 0.13960746411246547, "learning_rate": 9.57314591060052e-06, "loss": 4.41013671875, "step": 115700 }, { "epoch": 0.13972812743494814, "learning_rate": 9.572742075132782e-06, "loss": 4.4073974609375, "step": 115800 }, { "epoch": 0.1398487907574308, "learning_rate": 9.572338239665044e-06, "loss": 4.400917663574218, "step": 115900 }, { "epoch": 0.1399694540799135, "learning_rate": 9.571934404197306e-06, "loss": 4.448593444824219, "step": 116000 }, { "epoch": 0.14009011740239619, "learning_rate": 9.571530568729566e-06, "loss": 4.393462524414063, "step": 116100 }, { "epoch": 0.1402107807248789, "learning_rate": 9.571126733261828e-06, "loss": 4.4335107421875, "step": 116200 }, { "epoch": 0.14033144404736156, "learning_rate": 9.57072289779409e-06, "loss": 4.392406311035156, "step": 116300 }, { "epoch": 0.14045210736984423, "learning_rate": 9.570319062326352e-06, "loss": 4.394865417480469, "step": 116400 }, { "epoch": 0.14057277069232693, "learning_rate": 9.569915226858612e-06, "loss": 4.381990051269531, "step": 116500 }, { "epoch": 0.1406934340148096, "learning_rate": 9.569511391390874e-06, "loss": 4.418711242675781, "step": 116600 }, { "epoch": 0.1408140973372923, "learning_rate": 9.569107555923136e-06, "loss": 4.386910400390625, "step": 116700 }, { "epoch": 0.14093476065977498, "learning_rate": 9.568703720455398e-06, "loss": 4.409456481933594, "step": 116800 }, { "epoch": 0.14105542398225768, "learning_rate": 9.56829988498766e-06, "loss": 4.389706420898437, "step": 116900 }, { "epoch": 0.14117608730474035, "learning_rate": 9.56789604951992e-06, "loss": 4.406465759277344, "step": 117000 }, { "epoch": 0.14129675062722302, "learning_rate": 9.567492214052183e-06, "loss": 4.351282958984375, "step": 117100 }, { "epoch": 0.14141741394970572, "learning_rate": 9.567088378584445e-06, "loss": 4.409855041503906, "step": 117200 }, { "epoch": 0.1415380772721884, "learning_rate": 9.566684543116705e-06, "loss": 4.378627624511719, "step": 117300 }, { "epoch": 0.1416587405946711, "learning_rate": 9.566280707648967e-06, "loss": 4.415323486328125, "step": 117400 }, { "epoch": 0.14177940391715377, "learning_rate": 9.565876872181229e-06, "loss": 4.38979736328125, "step": 117500 }, { "epoch": 0.14190006723963644, "learning_rate": 9.56547303671349e-06, "loss": 4.387171020507813, "step": 117600 }, { "epoch": 0.14202073056211914, "learning_rate": 9.565069201245753e-06, "loss": 4.388475036621093, "step": 117700 }, { "epoch": 0.1421413938846018, "learning_rate": 9.564665365778015e-06, "loss": 4.3392642211914065, "step": 117800 }, { "epoch": 0.1422620572070845, "learning_rate": 9.564261530310277e-06, "loss": 4.374033813476562, "step": 117900 }, { "epoch": 0.14238272052956719, "learning_rate": 9.563857694842537e-06, "loss": 4.3949432373046875, "step": 118000 }, { "epoch": 0.1425033838520499, "learning_rate": 9.563453859374799e-06, "loss": 4.41203369140625, "step": 118100 }, { "epoch": 0.14262404717453256, "learning_rate": 9.56305002390706e-06, "loss": 4.352719421386719, "step": 118200 }, { "epoch": 0.14274471049701523, "learning_rate": 9.562646188439321e-06, "loss": 4.3942086791992185, "step": 118300 }, { "epoch": 0.14286537381949793, "learning_rate": 9.562242352971583e-06, "loss": 4.374820251464843, "step": 118400 }, { "epoch": 0.1429860371419806, "learning_rate": 9.561838517503845e-06, "loss": 4.379683837890625, "step": 118500 }, { "epoch": 0.1431067004644633, "learning_rate": 9.561434682036107e-06, "loss": 4.376545715332031, "step": 118600 }, { "epoch": 0.14322736378694598, "learning_rate": 9.56103084656837e-06, "loss": 4.389849243164062, "step": 118700 }, { "epoch": 0.14334802710942865, "learning_rate": 9.560627011100631e-06, "loss": 4.3559716796875, "step": 118800 }, { "epoch": 0.14346869043191135, "learning_rate": 9.560223175632891e-06, "loss": 4.365683898925782, "step": 118900 }, { "epoch": 0.14358935375439402, "learning_rate": 9.559819340165153e-06, "loss": 4.386561889648437, "step": 119000 }, { "epoch": 0.14371001707687672, "learning_rate": 9.559415504697415e-06, "loss": 4.356888427734375, "step": 119100 }, { "epoch": 0.1438306803993594, "learning_rate": 9.559011669229676e-06, "loss": 4.371274719238281, "step": 119200 }, { "epoch": 0.1439513437218421, "learning_rate": 9.558607833761938e-06, "loss": 4.351863098144531, "step": 119300 }, { "epoch": 0.14407200704432477, "learning_rate": 9.5582039982942e-06, "loss": 4.347482299804687, "step": 119400 }, { "epoch": 0.14419267036680744, "learning_rate": 9.557800162826462e-06, "loss": 4.378409423828125, "step": 119500 }, { "epoch": 0.14431333368929014, "learning_rate": 9.557396327358724e-06, "loss": 4.374012145996094, "step": 119600 }, { "epoch": 0.1444339970117728, "learning_rate": 9.556992491890986e-06, "loss": 4.375729675292969, "step": 119700 }, { "epoch": 0.1445546603342555, "learning_rate": 9.556588656423246e-06, "loss": 4.373175354003906, "step": 119800 }, { "epoch": 0.1446753236567382, "learning_rate": 9.556184820955508e-06, "loss": 4.3620947265625, "step": 119900 }, { "epoch": 0.14479598697922086, "learning_rate": 9.55578098548777e-06, "loss": 4.358991088867188, "step": 120000 }, { "epoch": 0.14491665030170356, "learning_rate": 9.55537715002003e-06, "loss": 4.350498352050781, "step": 120100 }, { "epoch": 0.14503731362418623, "learning_rate": 9.554973314552292e-06, "loss": 4.350937194824219, "step": 120200 }, { "epoch": 0.14515797694666893, "learning_rate": 9.554569479084554e-06, "loss": 4.331032409667968, "step": 120300 }, { "epoch": 0.1452786402691516, "learning_rate": 9.554165643616816e-06, "loss": 4.3107452392578125, "step": 120400 }, { "epoch": 0.1453993035916343, "learning_rate": 9.553761808149078e-06, "loss": 4.337636413574219, "step": 120500 }, { "epoch": 0.14551996691411698, "learning_rate": 9.553357972681338e-06, "loss": 4.359307861328125, "step": 120600 }, { "epoch": 0.14564063023659965, "learning_rate": 9.5529541372136e-06, "loss": 4.340976257324218, "step": 120700 }, { "epoch": 0.14576129355908235, "learning_rate": 9.552550301745862e-06, "loss": 4.384718933105469, "step": 120800 }, { "epoch": 0.14588195688156502, "learning_rate": 9.552146466278124e-06, "loss": 4.3548126220703125, "step": 120900 }, { "epoch": 0.14600262020404772, "learning_rate": 9.551742630810386e-06, "loss": 4.36437744140625, "step": 121000 }, { "epoch": 0.1461232835265304, "learning_rate": 9.551338795342647e-06, "loss": 4.35047119140625, "step": 121100 }, { "epoch": 0.14624394684901307, "learning_rate": 9.550934959874909e-06, "loss": 4.325852355957031, "step": 121200 }, { "epoch": 0.14636461017149577, "learning_rate": 9.55053112440717e-06, "loss": 4.342714233398437, "step": 121300 }, { "epoch": 0.14648527349397844, "learning_rate": 9.55012728893943e-06, "loss": 4.33703369140625, "step": 121400 }, { "epoch": 0.14660593681646114, "learning_rate": 9.549723453471693e-06, "loss": 4.339054565429688, "step": 121500 }, { "epoch": 0.1467266001389438, "learning_rate": 9.549319618003955e-06, "loss": 4.337333984375, "step": 121600 }, { "epoch": 0.1468472634614265, "learning_rate": 9.548915782536217e-06, "loss": 4.377168273925781, "step": 121700 }, { "epoch": 0.1469679267839092, "learning_rate": 9.548511947068479e-06, "loss": 4.317802124023437, "step": 121800 }, { "epoch": 0.14708859010639186, "learning_rate": 9.54810811160074e-06, "loss": 4.320137939453125, "step": 121900 }, { "epoch": 0.14720925342887456, "learning_rate": 9.547704276133001e-06, "loss": 4.329671936035156, "step": 122000 }, { "epoch": 0.14732991675135723, "learning_rate": 9.547300440665263e-06, "loss": 4.316641845703125, "step": 122100 }, { "epoch": 0.14745058007383993, "learning_rate": 9.546896605197525e-06, "loss": 4.347405700683594, "step": 122200 }, { "epoch": 0.1475712433963226, "learning_rate": 9.546492769729785e-06, "loss": 4.331479797363281, "step": 122300 }, { "epoch": 0.14769190671880528, "learning_rate": 9.546088934262047e-06, "loss": 4.31545166015625, "step": 122400 }, { "epoch": 0.14781257004128798, "learning_rate": 9.54568509879431e-06, "loss": 4.32429443359375, "step": 122500 }, { "epoch": 0.14793323336377065, "learning_rate": 9.545281263326571e-06, "loss": 4.3228302001953125, "step": 122600 }, { "epoch": 0.14805389668625335, "learning_rate": 9.544877427858833e-06, "loss": 4.308872680664063, "step": 122700 }, { "epoch": 0.14817456000873602, "learning_rate": 9.544473592391095e-06, "loss": 4.337101440429688, "step": 122800 }, { "epoch": 0.1482952233312187, "learning_rate": 9.544069756923357e-06, "loss": 4.331028137207031, "step": 122900 }, { "epoch": 0.1484158866537014, "learning_rate": 9.543665921455617e-06, "loss": 4.325223388671875, "step": 123000 }, { "epoch": 0.14853654997618407, "learning_rate": 9.54326208598788e-06, "loss": 4.3249508666992185, "step": 123100 }, { "epoch": 0.14865721329866677, "learning_rate": 9.54285825052014e-06, "loss": 4.341258850097656, "step": 123200 }, { "epoch": 0.14877787662114944, "learning_rate": 9.542454415052402e-06, "loss": 4.3162838745117185, "step": 123300 }, { "epoch": 0.14889853994363214, "learning_rate": 9.542050579584664e-06, "loss": 4.314066162109375, "step": 123400 }, { "epoch": 0.1490192032661148, "learning_rate": 9.541646744116926e-06, "loss": 4.327146911621094, "step": 123500 }, { "epoch": 0.1491398665885975, "learning_rate": 9.541242908649188e-06, "loss": 4.281849670410156, "step": 123600 }, { "epoch": 0.1492605299110802, "learning_rate": 9.54083907318145e-06, "loss": 4.31343505859375, "step": 123700 }, { "epoch": 0.14938119323356286, "learning_rate": 9.540435237713712e-06, "loss": 4.310948486328125, "step": 123800 }, { "epoch": 0.14950185655604556, "learning_rate": 9.540031402245972e-06, "loss": 4.299508056640625, "step": 123900 }, { "epoch": 0.14962251987852823, "learning_rate": 9.539627566778234e-06, "loss": 4.28039794921875, "step": 124000 }, { "epoch": 0.1497431832010109, "learning_rate": 9.539223731310496e-06, "loss": 4.311947326660157, "step": 124100 }, { "epoch": 0.1498638465234936, "learning_rate": 9.538819895842756e-06, "loss": 4.342105712890625, "step": 124200 }, { "epoch": 0.14998450984597628, "learning_rate": 9.538416060375018e-06, "loss": 4.314954833984375, "step": 124300 }, { "epoch": 0.15010517316845898, "learning_rate": 9.53801222490728e-06, "loss": 4.325047912597657, "step": 124400 }, { "epoch": 0.15022583649094165, "learning_rate": 9.537608389439542e-06, "loss": 4.295559692382812, "step": 124500 }, { "epoch": 0.15034649981342435, "learning_rate": 9.537204553971804e-06, "loss": 4.326130981445313, "step": 124600 }, { "epoch": 0.15046716313590702, "learning_rate": 9.536800718504064e-06, "loss": 4.280221557617187, "step": 124700 }, { "epoch": 0.1505878264583897, "learning_rate": 9.536396883036326e-06, "loss": 4.321505737304688, "step": 124800 }, { "epoch": 0.1507084897808724, "learning_rate": 9.535993047568588e-06, "loss": 4.304708557128906, "step": 124900 }, { "epoch": 0.15082915310335507, "learning_rate": 9.53558921210085e-06, "loss": 4.320899658203125, "step": 125000 }, { "epoch": 0.15094981642583777, "learning_rate": 9.535185376633112e-06, "loss": 4.311892700195313, "step": 125100 }, { "epoch": 0.15107047974832044, "learning_rate": 9.534781541165373e-06, "loss": 4.304443359375, "step": 125200 }, { "epoch": 0.1511911430708031, "learning_rate": 9.534377705697635e-06, "loss": 4.29806884765625, "step": 125300 }, { "epoch": 0.1513118063932858, "learning_rate": 9.533973870229897e-06, "loss": 4.282315368652344, "step": 125400 }, { "epoch": 0.1514324697157685, "learning_rate": 9.533570034762157e-06, "loss": 4.294893188476562, "step": 125500 }, { "epoch": 0.1515531330382512, "learning_rate": 9.533166199294419e-06, "loss": 4.278684997558594, "step": 125600 }, { "epoch": 0.15167379636073386, "learning_rate": 9.53276236382668e-06, "loss": 4.298463745117187, "step": 125700 }, { "epoch": 0.15179445968321656, "learning_rate": 9.532358528358943e-06, "loss": 4.276971435546875, "step": 125800 }, { "epoch": 0.15191512300569923, "learning_rate": 9.531954692891205e-06, "loss": 4.266158752441406, "step": 125900 }, { "epoch": 0.1520357863281819, "learning_rate": 9.531550857423467e-06, "loss": 4.272743835449218, "step": 126000 }, { "epoch": 0.1521564496506646, "learning_rate": 9.531147021955727e-06, "loss": 4.277969055175781, "step": 126100 }, { "epoch": 0.15227711297314728, "learning_rate": 9.530743186487989e-06, "loss": 4.287745361328125, "step": 126200 }, { "epoch": 0.15239777629562998, "learning_rate": 9.530339351020251e-06, "loss": 4.300249633789062, "step": 126300 }, { "epoch": 0.15251843961811265, "learning_rate": 9.529935515552511e-06, "loss": 4.285774841308593, "step": 126400 }, { "epoch": 0.15263910294059532, "learning_rate": 9.529531680084773e-06, "loss": 4.305826721191406, "step": 126500 }, { "epoch": 0.15275976626307802, "learning_rate": 9.529127844617035e-06, "loss": 4.295311279296875, "step": 126600 }, { "epoch": 0.1528804295855607, "learning_rate": 9.528724009149297e-06, "loss": 4.2653350830078125, "step": 126700 }, { "epoch": 0.1530010929080434, "learning_rate": 9.52832017368156e-06, "loss": 4.296410827636719, "step": 126800 }, { "epoch": 0.15312175623052607, "learning_rate": 9.527916338213821e-06, "loss": 4.288053283691406, "step": 126900 }, { "epoch": 0.15324241955300877, "learning_rate": 9.527512502746083e-06, "loss": 4.275084228515625, "step": 127000 }, { "epoch": 0.15336308287549144, "learning_rate": 9.527108667278344e-06, "loss": 4.290885009765625, "step": 127100 }, { "epoch": 0.1534837461979741, "learning_rate": 9.526704831810605e-06, "loss": 4.274404907226563, "step": 127200 }, { "epoch": 0.1536044095204568, "learning_rate": 9.526300996342866e-06, "loss": 4.293334350585938, "step": 127300 }, { "epoch": 0.1537250728429395, "learning_rate": 9.525897160875128e-06, "loss": 4.264752197265625, "step": 127400 }, { "epoch": 0.1538457361654222, "learning_rate": 9.52549332540739e-06, "loss": 4.257093505859375, "step": 127500 }, { "epoch": 0.15396639948790486, "learning_rate": 9.525089489939652e-06, "loss": 4.267686157226563, "step": 127600 }, { "epoch": 0.15408706281038753, "learning_rate": 9.524685654471914e-06, "loss": 4.289052734375, "step": 127700 }, { "epoch": 0.15420772613287023, "learning_rate": 9.524281819004176e-06, "loss": 4.2693087768554685, "step": 127800 }, { "epoch": 0.1543283894553529, "learning_rate": 9.523877983536436e-06, "loss": 4.302455139160156, "step": 127900 }, { "epoch": 0.1544490527778356, "learning_rate": 9.523474148068698e-06, "loss": 4.255574645996094, "step": 128000 }, { "epoch": 0.15456971610031828, "learning_rate": 9.52307031260096e-06, "loss": 4.264149169921875, "step": 128100 }, { "epoch": 0.15469037942280095, "learning_rate": 9.522666477133222e-06, "loss": 4.245845031738281, "step": 128200 }, { "epoch": 0.15481104274528365, "learning_rate": 9.522262641665482e-06, "loss": 4.248517150878906, "step": 128300 }, { "epoch": 0.15493170606776632, "learning_rate": 9.521858806197744e-06, "loss": 4.2542047119140625, "step": 128400 }, { "epoch": 0.15505236939024902, "learning_rate": 9.521454970730006e-06, "loss": 4.2518923950195315, "step": 128500 }, { "epoch": 0.1551730327127317, "learning_rate": 9.521051135262268e-06, "loss": 4.2552798461914065, "step": 128600 }, { "epoch": 0.1552936960352144, "learning_rate": 9.52064729979453e-06, "loss": 4.248907470703125, "step": 128700 }, { "epoch": 0.15541435935769707, "learning_rate": 9.52024346432679e-06, "loss": 4.2556304931640625, "step": 128800 }, { "epoch": 0.15553502268017974, "learning_rate": 9.519839628859052e-06, "loss": 4.2737353515625, "step": 128900 }, { "epoch": 0.15565568600266244, "learning_rate": 9.519435793391314e-06, "loss": 4.246327819824219, "step": 129000 }, { "epoch": 0.1557763493251451, "learning_rate": 9.519031957923576e-06, "loss": 4.262615051269531, "step": 129100 }, { "epoch": 0.15589701264762781, "learning_rate": 9.518628122455837e-06, "loss": 4.2385009765625, "step": 129200 }, { "epoch": 0.1560176759701105, "learning_rate": 9.518224286988099e-06, "loss": 4.2525567626953125, "step": 129300 }, { "epoch": 0.15613833929259316, "learning_rate": 9.51782045152036e-06, "loss": 4.260746765136719, "step": 129400 }, { "epoch": 0.15625900261507586, "learning_rate": 9.517416616052623e-06, "loss": 4.245251159667969, "step": 129500 }, { "epoch": 0.15637966593755853, "learning_rate": 9.517012780584883e-06, "loss": 4.228903198242188, "step": 129600 }, { "epoch": 0.15650032926004123, "learning_rate": 9.516608945117145e-06, "loss": 4.230923461914062, "step": 129700 }, { "epoch": 0.1566209925825239, "learning_rate": 9.516205109649407e-06, "loss": 4.2522366333007815, "step": 129800 }, { "epoch": 0.1567416559050066, "learning_rate": 9.515801274181669e-06, "loss": 4.241545104980469, "step": 129900 }, { "epoch": 0.15686231922748928, "learning_rate": 9.51539743871393e-06, "loss": 4.218800048828125, "step": 130000 }, { "epoch": 0.15698298254997195, "learning_rate": 9.514993603246193e-06, "loss": 4.24559326171875, "step": 130100 }, { "epoch": 0.15710364587245465, "learning_rate": 9.514589767778453e-06, "loss": 4.23311767578125, "step": 130200 }, { "epoch": 0.15722430919493732, "learning_rate": 9.514185932310715e-06, "loss": 4.249968566894531, "step": 130300 }, { "epoch": 0.15734497251742002, "learning_rate": 9.513782096842975e-06, "loss": 4.238301086425781, "step": 130400 }, { "epoch": 0.1574656358399027, "learning_rate": 9.513378261375237e-06, "loss": 4.258863525390625, "step": 130500 }, { "epoch": 0.15758629916238537, "learning_rate": 9.5129744259075e-06, "loss": 4.228417053222656, "step": 130600 }, { "epoch": 0.15770696248486807, "learning_rate": 9.512570590439761e-06, "loss": 4.212883605957031, "step": 130700 }, { "epoch": 0.15782762580735074, "learning_rate": 9.512166754972023e-06, "loss": 4.241891784667969, "step": 130800 }, { "epoch": 0.15794828912983344, "learning_rate": 9.511762919504285e-06, "loss": 4.2326287841796875, "step": 130900 }, { "epoch": 0.1580689524523161, "learning_rate": 9.511359084036547e-06, "loss": 4.238702392578125, "step": 131000 }, { "epoch": 0.15818961577479881, "learning_rate": 9.510955248568808e-06, "loss": 4.253780517578125, "step": 131100 }, { "epoch": 0.1583102790972815, "learning_rate": 9.51055141310107e-06, "loss": 4.240475769042969, "step": 131200 }, { "epoch": 0.15843094241976416, "learning_rate": 9.510147577633332e-06, "loss": 4.236222229003906, "step": 131300 }, { "epoch": 0.15855160574224686, "learning_rate": 9.509743742165592e-06, "loss": 4.194006652832031, "step": 131400 }, { "epoch": 0.15867226906472953, "learning_rate": 9.509339906697854e-06, "loss": 4.239622192382813, "step": 131500 }, { "epoch": 0.15879293238721223, "learning_rate": 9.508936071230116e-06, "loss": 4.252107849121094, "step": 131600 }, { "epoch": 0.1589135957096949, "learning_rate": 9.508532235762378e-06, "loss": 4.230406188964844, "step": 131700 }, { "epoch": 0.15903425903217758, "learning_rate": 9.50812840029464e-06, "loss": 4.215827941894531, "step": 131800 }, { "epoch": 0.15915492235466028, "learning_rate": 9.507724564826902e-06, "loss": 4.215340576171875, "step": 131900 }, { "epoch": 0.15927558567714295, "learning_rate": 9.507320729359162e-06, "loss": 4.2347238159179685, "step": 132000 }, { "epoch": 0.15939624899962565, "learning_rate": 9.506916893891424e-06, "loss": 4.237113647460937, "step": 132100 }, { "epoch": 0.15951691232210832, "learning_rate": 9.506513058423686e-06, "loss": 4.220930786132812, "step": 132200 }, { "epoch": 0.15963757564459102, "learning_rate": 9.506109222955946e-06, "loss": 4.192018432617187, "step": 132300 }, { "epoch": 0.1597582389670737, "learning_rate": 9.505705387488208e-06, "loss": 4.224645385742187, "step": 132400 }, { "epoch": 0.15987890228955637, "learning_rate": 9.50530155202047e-06, "loss": 4.231823425292969, "step": 132500 }, { "epoch": 0.15999956561203907, "learning_rate": 9.504897716552732e-06, "loss": 4.199769287109375, "step": 132600 }, { "epoch": 0.16012022893452174, "learning_rate": 9.504493881084994e-06, "loss": 4.216982421875, "step": 132700 }, { "epoch": 0.16024089225700444, "learning_rate": 9.504090045617254e-06, "loss": 4.201979675292969, "step": 132800 }, { "epoch": 0.16036155557948711, "learning_rate": 9.503686210149516e-06, "loss": 4.249957580566406, "step": 132900 }, { "epoch": 0.1604822189019698, "learning_rate": 9.503282374681778e-06, "loss": 4.234060668945313, "step": 133000 }, { "epoch": 0.1606028822244525, "learning_rate": 9.50287853921404e-06, "loss": 4.198249206542969, "step": 133100 }, { "epoch": 0.16072354554693516, "learning_rate": 9.502474703746302e-06, "loss": 4.212026977539063, "step": 133200 }, { "epoch": 0.16084420886941786, "learning_rate": 9.502070868278563e-06, "loss": 4.194464111328125, "step": 133300 }, { "epoch": 0.16096487219190053, "learning_rate": 9.501667032810825e-06, "loss": 4.19867919921875, "step": 133400 }, { "epoch": 0.16108553551438323, "learning_rate": 9.501263197343087e-06, "loss": 4.195557556152344, "step": 133500 }, { "epoch": 0.1612061988368659, "learning_rate": 9.500859361875349e-06, "loss": 4.191703491210937, "step": 133600 }, { "epoch": 0.16132686215934858, "learning_rate": 9.500455526407609e-06, "loss": 4.226734924316406, "step": 133700 }, { "epoch": 0.16144752548183128, "learning_rate": 9.500051690939871e-06, "loss": 4.220860290527344, "step": 133800 }, { "epoch": 0.16156818880431395, "learning_rate": 9.499647855472133e-06, "loss": 4.218114013671875, "step": 133900 }, { "epoch": 0.16168885212679665, "learning_rate": 9.499244020004395e-06, "loss": 4.2, "step": 134000 }, { "epoch": 0.16180951544927932, "learning_rate": 9.498840184536657e-06, "loss": 4.182944641113282, "step": 134100 }, { "epoch": 0.161930178771762, "learning_rate": 9.498436349068917e-06, "loss": 4.156382141113281, "step": 134200 }, { "epoch": 0.1620508420942447, "learning_rate": 9.498032513601179e-06, "loss": 4.207982788085937, "step": 134300 }, { "epoch": 0.16217150541672737, "learning_rate": 9.497628678133441e-06, "loss": 4.20839111328125, "step": 134400 }, { "epoch": 0.16229216873921007, "learning_rate": 9.497224842665701e-06, "loss": 4.201115112304688, "step": 134500 }, { "epoch": 0.16241283206169274, "learning_rate": 9.496821007197963e-06, "loss": 4.1791293334960935, "step": 134600 }, { "epoch": 0.1625334953841754, "learning_rate": 9.496417171730225e-06, "loss": 4.187546997070313, "step": 134700 }, { "epoch": 0.16265415870665811, "learning_rate": 9.496013336262487e-06, "loss": 4.196438293457032, "step": 134800 }, { "epoch": 0.1627748220291408, "learning_rate": 9.49560950079475e-06, "loss": 4.191497802734375, "step": 134900 }, { "epoch": 0.1628954853516235, "learning_rate": 9.495205665327011e-06, "loss": 4.215068054199219, "step": 135000 }, { "epoch": 0.16301614867410616, "learning_rate": 9.494801829859273e-06, "loss": 4.167944641113281, "step": 135100 }, { "epoch": 0.16313681199658886, "learning_rate": 9.494397994391534e-06, "loss": 4.205506591796875, "step": 135200 }, { "epoch": 0.16325747531907153, "learning_rate": 9.493994158923796e-06, "loss": 4.181203308105469, "step": 135300 }, { "epoch": 0.1633781386415542, "learning_rate": 9.493590323456056e-06, "loss": 4.181968383789062, "step": 135400 }, { "epoch": 0.1634988019640369, "learning_rate": 9.493186487988318e-06, "loss": 4.188661193847656, "step": 135500 }, { "epoch": 0.16361946528651958, "learning_rate": 9.49278265252058e-06, "loss": 4.200094604492188, "step": 135600 }, { "epoch": 0.16374012860900228, "learning_rate": 9.492378817052842e-06, "loss": 4.158785705566406, "step": 135700 }, { "epoch": 0.16386079193148495, "learning_rate": 9.491974981585104e-06, "loss": 4.159096374511718, "step": 135800 }, { "epoch": 0.16398145525396762, "learning_rate": 9.491571146117366e-06, "loss": 4.218682556152344, "step": 135900 }, { "epoch": 0.16410211857645032, "learning_rate": 9.491167310649628e-06, "loss": 4.178736572265625, "step": 136000 }, { "epoch": 0.164222781898933, "learning_rate": 9.490763475181888e-06, "loss": 4.1625192260742185, "step": 136100 }, { "epoch": 0.1643434452214157, "learning_rate": 9.49035963971415e-06, "loss": 4.173831787109375, "step": 136200 }, { "epoch": 0.16446410854389837, "learning_rate": 9.489955804246412e-06, "loss": 4.172528381347656, "step": 136300 }, { "epoch": 0.16458477186638107, "learning_rate": 9.489551968778672e-06, "loss": 4.1877224731445315, "step": 136400 }, { "epoch": 0.16470543518886374, "learning_rate": 9.489148133310934e-06, "loss": 4.170550231933594, "step": 136500 }, { "epoch": 0.1648260985113464, "learning_rate": 9.488744297843196e-06, "loss": 4.178667602539062, "step": 136600 }, { "epoch": 0.16494676183382911, "learning_rate": 9.488340462375458e-06, "loss": 4.193502807617188, "step": 136700 }, { "epoch": 0.1650674251563118, "learning_rate": 9.48793662690772e-06, "loss": 4.14175537109375, "step": 136800 }, { "epoch": 0.1651880884787945, "learning_rate": 9.48753279143998e-06, "loss": 4.170281982421875, "step": 136900 }, { "epoch": 0.16530875180127716, "learning_rate": 9.487128955972243e-06, "loss": 4.183246765136719, "step": 137000 }, { "epoch": 0.16542941512375983, "learning_rate": 9.486725120504504e-06, "loss": 4.175970458984375, "step": 137100 }, { "epoch": 0.16555007844624253, "learning_rate": 9.486321285036766e-06, "loss": 4.146685485839844, "step": 137200 }, { "epoch": 0.1656707417687252, "learning_rate": 9.485917449569028e-06, "loss": 4.153794250488281, "step": 137300 }, { "epoch": 0.1657914050912079, "learning_rate": 9.485513614101289e-06, "loss": 4.156079711914063, "step": 137400 }, { "epoch": 0.16591206841369058, "learning_rate": 9.48510977863355e-06, "loss": 4.1634674072265625, "step": 137500 }, { "epoch": 0.16603273173617328, "learning_rate": 9.484705943165813e-06, "loss": 4.172157897949218, "step": 137600 }, { "epoch": 0.16615339505865595, "learning_rate": 9.484302107698073e-06, "loss": 4.152699584960938, "step": 137700 }, { "epoch": 0.16627405838113862, "learning_rate": 9.483898272230335e-06, "loss": 4.132930297851562, "step": 137800 }, { "epoch": 0.16639472170362132, "learning_rate": 9.483494436762597e-06, "loss": 4.167182312011719, "step": 137900 }, { "epoch": 0.166515385026104, "learning_rate": 9.483090601294859e-06, "loss": 4.155087585449219, "step": 138000 }, { "epoch": 0.1666360483485867, "learning_rate": 9.482686765827121e-06, "loss": 4.171703491210938, "step": 138100 }, { "epoch": 0.16675671167106937, "learning_rate": 9.482282930359383e-06, "loss": 4.159670104980469, "step": 138200 }, { "epoch": 0.16687737499355204, "learning_rate": 9.481879094891643e-06, "loss": 4.147190856933594, "step": 138300 }, { "epoch": 0.16699803831603474, "learning_rate": 9.481475259423905e-06, "loss": 4.144685363769531, "step": 138400 }, { "epoch": 0.16711870163851741, "learning_rate": 9.481071423956167e-06, "loss": 4.152030334472657, "step": 138500 }, { "epoch": 0.16723936496100011, "learning_rate": 9.480667588488427e-06, "loss": 4.16162109375, "step": 138600 }, { "epoch": 0.1673600282834828, "learning_rate": 9.48026375302069e-06, "loss": 4.141409912109375, "step": 138700 }, { "epoch": 0.1674806916059655, "learning_rate": 9.479859917552951e-06, "loss": 4.161637573242188, "step": 138800 }, { "epoch": 0.16760135492844816, "learning_rate": 9.479456082085213e-06, "loss": 4.149785461425782, "step": 138900 }, { "epoch": 0.16772201825093083, "learning_rate": 9.479052246617475e-06, "loss": 4.137402648925781, "step": 139000 }, { "epoch": 0.16784268157341353, "learning_rate": 9.478648411149737e-06, "loss": 4.164827270507812, "step": 139100 }, { "epoch": 0.1679633448958962, "learning_rate": 9.478244575682e-06, "loss": 4.136315612792969, "step": 139200 }, { "epoch": 0.1680840082183789, "learning_rate": 9.47784074021426e-06, "loss": 4.13937744140625, "step": 139300 }, { "epoch": 0.16820467154086158, "learning_rate": 9.477436904746522e-06, "loss": 4.138125305175781, "step": 139400 }, { "epoch": 0.16832533486334425, "learning_rate": 9.477033069278782e-06, "loss": 4.1315478515625, "step": 139500 }, { "epoch": 0.16844599818582695, "learning_rate": 9.476629233811044e-06, "loss": 4.156204833984375, "step": 139600 }, { "epoch": 0.16856666150830962, "learning_rate": 9.476225398343306e-06, "loss": 4.163810119628907, "step": 139700 }, { "epoch": 0.16868732483079232, "learning_rate": 9.475821562875568e-06, "loss": 4.1622900390625, "step": 139800 }, { "epoch": 0.168807988153275, "learning_rate": 9.47541772740783e-06, "loss": 4.164542236328125, "step": 139900 }, { "epoch": 0.1689286514757577, "learning_rate": 9.475013891940092e-06, "loss": 4.1283544921875, "step": 140000 }, { "epoch": 0.16904931479824037, "learning_rate": 9.474610056472354e-06, "loss": 4.169474487304687, "step": 140100 }, { "epoch": 0.16916997812072304, "learning_rate": 9.474206221004614e-06, "loss": 4.153294677734375, "step": 140200 }, { "epoch": 0.16929064144320574, "learning_rate": 9.473802385536876e-06, "loss": 4.14068115234375, "step": 140300 }, { "epoch": 0.16941130476568841, "learning_rate": 9.473398550069138e-06, "loss": 4.134254455566406, "step": 140400 }, { "epoch": 0.16953196808817111, "learning_rate": 9.472994714601398e-06, "loss": 4.139063110351563, "step": 140500 }, { "epoch": 0.1696526314106538, "learning_rate": 9.47259087913366e-06, "loss": 4.143599853515625, "step": 140600 }, { "epoch": 0.16977329473313646, "learning_rate": 9.472187043665922e-06, "loss": 4.115407409667969, "step": 140700 }, { "epoch": 0.16989395805561916, "learning_rate": 9.471783208198184e-06, "loss": 4.142363586425781, "step": 140800 }, { "epoch": 0.17001462137810183, "learning_rate": 9.471379372730446e-06, "loss": 4.128663024902344, "step": 140900 }, { "epoch": 0.17013528470058453, "learning_rate": 9.470975537262707e-06, "loss": 4.125610961914062, "step": 141000 }, { "epoch": 0.1702559480230672, "learning_rate": 9.470571701794969e-06, "loss": 4.129360961914062, "step": 141100 }, { "epoch": 0.17037661134554988, "learning_rate": 9.47016786632723e-06, "loss": 4.167195739746094, "step": 141200 }, { "epoch": 0.17049727466803258, "learning_rate": 9.469764030859493e-06, "loss": 4.1093988037109375, "step": 141300 }, { "epoch": 0.17061793799051525, "learning_rate": 9.469360195391753e-06, "loss": 4.131300048828125, "step": 141400 }, { "epoch": 0.17073860131299795, "learning_rate": 9.468956359924015e-06, "loss": 4.122879943847656, "step": 141500 }, { "epoch": 0.17085926463548062, "learning_rate": 9.468552524456277e-06, "loss": 4.110649108886719, "step": 141600 }, { "epoch": 0.17097992795796332, "learning_rate": 9.468148688988539e-06, "loss": 4.117805786132813, "step": 141700 }, { "epoch": 0.171100591280446, "learning_rate": 9.467744853520799e-06, "loss": 4.1547119140625, "step": 141800 }, { "epoch": 0.17122125460292867, "learning_rate": 9.467341018053061e-06, "loss": 4.142525329589843, "step": 141900 }, { "epoch": 0.17134191792541137, "learning_rate": 9.466937182585323e-06, "loss": 4.132686462402344, "step": 142000 }, { "epoch": 0.17146258124789404, "learning_rate": 9.466533347117585e-06, "loss": 4.126594543457031, "step": 142100 }, { "epoch": 0.17158324457037674, "learning_rate": 9.466129511649847e-06, "loss": 4.121519470214844, "step": 142200 }, { "epoch": 0.17170390789285941, "learning_rate": 9.465725676182109e-06, "loss": 4.1388766479492185, "step": 142300 }, { "epoch": 0.1718245712153421, "learning_rate": 9.46532184071437e-06, "loss": 4.122481994628906, "step": 142400 }, { "epoch": 0.1719452345378248, "learning_rate": 9.464918005246631e-06, "loss": 4.111268920898437, "step": 142500 }, { "epoch": 0.17206589786030746, "learning_rate": 9.464514169778891e-06, "loss": 4.127690124511719, "step": 142600 }, { "epoch": 0.17218656118279016, "learning_rate": 9.464110334311153e-06, "loss": 4.116007995605469, "step": 142700 }, { "epoch": 0.17230722450527283, "learning_rate": 9.463706498843415e-06, "loss": 4.094861450195313, "step": 142800 }, { "epoch": 0.17242788782775553, "learning_rate": 9.463302663375677e-06, "loss": 4.121034240722656, "step": 142900 }, { "epoch": 0.1725485511502382, "learning_rate": 9.46289882790794e-06, "loss": 4.107123718261719, "step": 143000 }, { "epoch": 0.17266921447272088, "learning_rate": 9.462494992440201e-06, "loss": 4.114708251953125, "step": 143100 }, { "epoch": 0.17278987779520358, "learning_rate": 9.462091156972463e-06, "loss": 4.089667663574219, "step": 143200 }, { "epoch": 0.17291054111768625, "learning_rate": 9.461687321504724e-06, "loss": 4.112540893554687, "step": 143300 }, { "epoch": 0.17303120444016895, "learning_rate": 9.461283486036986e-06, "loss": 4.1080169677734375, "step": 143400 }, { "epoch": 0.17315186776265162, "learning_rate": 9.460879650569248e-06, "loss": 4.09574462890625, "step": 143500 }, { "epoch": 0.1732725310851343, "learning_rate": 9.460475815101508e-06, "loss": 4.110877990722656, "step": 143600 }, { "epoch": 0.173393194407617, "learning_rate": 9.46007197963377e-06, "loss": 4.111781005859375, "step": 143700 }, { "epoch": 0.17351385773009967, "learning_rate": 9.459668144166032e-06, "loss": 4.116029968261719, "step": 143800 }, { "epoch": 0.17363452105258237, "learning_rate": 9.459264308698294e-06, "loss": 4.083573303222656, "step": 143900 }, { "epoch": 0.17375518437506504, "learning_rate": 9.458860473230556e-06, "loss": 4.128597412109375, "step": 144000 }, { "epoch": 0.17387584769754774, "learning_rate": 9.458456637762818e-06, "loss": 4.100955200195313, "step": 144100 }, { "epoch": 0.17399651102003041, "learning_rate": 9.45805280229508e-06, "loss": 4.0837774658203125, "step": 144200 }, { "epoch": 0.1741171743425131, "learning_rate": 9.45764896682734e-06, "loss": 4.0916552734375, "step": 144300 }, { "epoch": 0.1742378376649958, "learning_rate": 9.457245131359602e-06, "loss": 4.099443969726562, "step": 144400 }, { "epoch": 0.17435850098747846, "learning_rate": 9.456841295891862e-06, "loss": 4.098468933105469, "step": 144500 }, { "epoch": 0.17447916430996116, "learning_rate": 9.456437460424124e-06, "loss": 4.083135070800782, "step": 144600 }, { "epoch": 0.17459982763244383, "learning_rate": 9.456033624956386e-06, "loss": 4.0824978637695315, "step": 144700 }, { "epoch": 0.1747204909549265, "learning_rate": 9.455629789488648e-06, "loss": 4.101973266601562, "step": 144800 }, { "epoch": 0.1748411542774092, "learning_rate": 9.45522595402091e-06, "loss": 4.093297424316407, "step": 144900 }, { "epoch": 0.17496181759989188, "learning_rate": 9.454822118553172e-06, "loss": 4.081582946777344, "step": 145000 }, { "epoch": 0.17508248092237458, "learning_rate": 9.454418283085433e-06, "loss": 4.115688781738282, "step": 145100 }, { "epoch": 0.17520314424485725, "learning_rate": 9.454014447617695e-06, "loss": 4.111075439453125, "step": 145200 }, { "epoch": 0.17532380756733995, "learning_rate": 9.453610612149957e-06, "loss": 4.104603271484375, "step": 145300 }, { "epoch": 0.17544447088982262, "learning_rate": 9.453206776682219e-06, "loss": 4.097171630859375, "step": 145400 }, { "epoch": 0.1755651342123053, "learning_rate": 9.452802941214479e-06, "loss": 4.0814361572265625, "step": 145500 }, { "epoch": 0.175685797534788, "learning_rate": 9.45239910574674e-06, "loss": 4.098536682128906, "step": 145600 }, { "epoch": 0.17580646085727067, "learning_rate": 9.451995270279003e-06, "loss": 4.097376098632813, "step": 145700 }, { "epoch": 0.17592712417975337, "learning_rate": 9.451591434811265e-06, "loss": 4.0992578125, "step": 145800 }, { "epoch": 0.17604778750223604, "learning_rate": 9.451187599343525e-06, "loss": 4.086771240234375, "step": 145900 }, { "epoch": 0.17616845082471871, "learning_rate": 9.450783763875787e-06, "loss": 4.094929504394531, "step": 146000 }, { "epoch": 0.17628911414720141, "learning_rate": 9.450379928408049e-06, "loss": 4.1046044921875, "step": 146100 }, { "epoch": 0.1764097774696841, "learning_rate": 9.449976092940311e-06, "loss": 4.060028686523437, "step": 146200 }, { "epoch": 0.1765304407921668, "learning_rate": 9.449572257472573e-06, "loss": 4.093073425292968, "step": 146300 }, { "epoch": 0.17665110411464946, "learning_rate": 9.449168422004833e-06, "loss": 4.060162963867188, "step": 146400 }, { "epoch": 0.17677176743713216, "learning_rate": 9.448764586537095e-06, "loss": 4.09326904296875, "step": 146500 }, { "epoch": 0.17689243075961483, "learning_rate": 9.448360751069357e-06, "loss": 4.03947265625, "step": 146600 }, { "epoch": 0.1770130940820975, "learning_rate": 9.447956915601618e-06, "loss": 4.081064758300781, "step": 146700 }, { "epoch": 0.1771337574045802, "learning_rate": 9.44755308013388e-06, "loss": 4.06759521484375, "step": 146800 }, { "epoch": 0.17725442072706288, "learning_rate": 9.447149244666141e-06, "loss": 4.101948547363281, "step": 146900 }, { "epoch": 0.17737508404954558, "learning_rate": 9.446745409198403e-06, "loss": 4.0613775634765625, "step": 147000 }, { "epoch": 0.17749574737202825, "learning_rate": 9.446341573730665e-06, "loss": 4.08305908203125, "step": 147100 }, { "epoch": 0.17761641069451092, "learning_rate": 9.445937738262927e-06, "loss": 4.054884338378907, "step": 147200 }, { "epoch": 0.17773707401699362, "learning_rate": 9.44553390279519e-06, "loss": 4.066440734863281, "step": 147300 }, { "epoch": 0.1778577373394763, "learning_rate": 9.44513006732745e-06, "loss": 4.063131713867188, "step": 147400 }, { "epoch": 0.177978400661959, "learning_rate": 9.444726231859712e-06, "loss": 4.0764794921875, "step": 147500 }, { "epoch": 0.17809906398444167, "learning_rate": 9.444322396391972e-06, "loss": 4.0662298583984375, "step": 147600 }, { "epoch": 0.17821972730692434, "learning_rate": 9.443918560924234e-06, "loss": 4.077352294921875, "step": 147700 }, { "epoch": 0.17834039062940704, "learning_rate": 9.443514725456496e-06, "loss": 4.088600158691406, "step": 147800 }, { "epoch": 0.17846105395188971, "learning_rate": 9.443110889988758e-06, "loss": 4.0680224609375, "step": 147900 }, { "epoch": 0.17858171727437241, "learning_rate": 9.44270705452102e-06, "loss": 4.052131958007813, "step": 148000 }, { "epoch": 0.1787023805968551, "learning_rate": 9.442303219053282e-06, "loss": 4.058963928222656, "step": 148100 }, { "epoch": 0.1788230439193378, "learning_rate": 9.441899383585544e-06, "loss": 4.080462341308594, "step": 148200 }, { "epoch": 0.17894370724182046, "learning_rate": 9.441495548117804e-06, "loss": 4.058490905761719, "step": 148300 }, { "epoch": 0.17906437056430313, "learning_rate": 9.441091712650066e-06, "loss": 4.058789672851563, "step": 148400 }, { "epoch": 0.17918503388678583, "learning_rate": 9.440687877182328e-06, "loss": 4.058347473144531, "step": 148500 }, { "epoch": 0.1793056972092685, "learning_rate": 9.440284041714588e-06, "loss": 4.04501708984375, "step": 148600 }, { "epoch": 0.1794263605317512, "learning_rate": 9.43988020624685e-06, "loss": 4.074843444824219, "step": 148700 }, { "epoch": 0.17954702385423388, "learning_rate": 9.439476370779112e-06, "loss": 4.060300598144531, "step": 148800 }, { "epoch": 0.17966768717671655, "learning_rate": 9.439072535311374e-06, "loss": 4.050150756835937, "step": 148900 }, { "epoch": 0.17978835049919925, "learning_rate": 9.438668699843636e-06, "loss": 4.049259338378906, "step": 149000 }, { "epoch": 0.17990901382168192, "learning_rate": 9.438264864375898e-06, "loss": 4.045036010742187, "step": 149100 }, { "epoch": 0.18002967714416462, "learning_rate": 9.437861028908159e-06, "loss": 4.089662170410156, "step": 149200 }, { "epoch": 0.1801503404666473, "learning_rate": 9.43745719344042e-06, "loss": 4.047580871582031, "step": 149300 }, { "epoch": 0.18027100378913, "learning_rate": 9.437053357972683e-06, "loss": 4.08689697265625, "step": 149400 }, { "epoch": 0.18039166711161267, "learning_rate": 9.436649522504943e-06, "loss": 4.0404141235351565, "step": 149500 }, { "epoch": 0.18051233043409534, "learning_rate": 9.436245687037205e-06, "loss": 4.0890960693359375, "step": 149600 }, { "epoch": 0.18063299375657804, "learning_rate": 9.435841851569467e-06, "loss": 4.05540283203125, "step": 149700 }, { "epoch": 0.18075365707906071, "learning_rate": 9.435438016101729e-06, "loss": 4.025476379394531, "step": 149800 }, { "epoch": 0.18087432040154341, "learning_rate": 9.43503418063399e-06, "loss": 4.0574777221679685, "step": 149900 }, { "epoch": 0.1809949837240261, "learning_rate": 9.434630345166251e-06, "loss": 4.03138916015625, "step": 150000 }, { "epoch": 0.18111564704650876, "learning_rate": 9.434226509698513e-06, "loss": 4.055688171386719, "step": 150100 }, { "epoch": 0.18123631036899146, "learning_rate": 9.433822674230775e-06, "loss": 4.031493530273438, "step": 150200 }, { "epoch": 0.18135697369147413, "learning_rate": 9.433418838763037e-06, "loss": 4.042034606933594, "step": 150300 }, { "epoch": 0.18147763701395683, "learning_rate": 9.433015003295299e-06, "loss": 4.044190368652344, "step": 150400 }, { "epoch": 0.1815983003364395, "learning_rate": 9.43261116782756e-06, "loss": 4.054629516601563, "step": 150500 }, { "epoch": 0.1817189636589222, "learning_rate": 9.432207332359821e-06, "loss": 4.025072631835937, "step": 150600 }, { "epoch": 0.18183962698140488, "learning_rate": 9.431803496892083e-06, "loss": 4.047225341796875, "step": 150700 }, { "epoch": 0.18196029030388755, "learning_rate": 9.431399661424344e-06, "loss": 4.048432312011719, "step": 150800 }, { "epoch": 0.18208095362637025, "learning_rate": 9.430995825956606e-06, "loss": 4.036373291015625, "step": 150900 }, { "epoch": 0.18220161694885292, "learning_rate": 9.430591990488868e-06, "loss": 4.003193359375, "step": 151000 }, { "epoch": 0.18232228027133562, "learning_rate": 9.43018815502113e-06, "loss": 4.0211181640625, "step": 151100 }, { "epoch": 0.1824429435938183, "learning_rate": 9.429784319553391e-06, "loss": 4.069910888671875, "step": 151200 }, { "epoch": 0.18256360691630097, "learning_rate": 9.429380484085653e-06, "loss": 4.06355712890625, "step": 151300 }, { "epoch": 0.18268427023878367, "learning_rate": 9.428976648617915e-06, "loss": 4.048116760253906, "step": 151400 }, { "epoch": 0.18280493356126634, "learning_rate": 9.428572813150176e-06, "loss": 4.045962829589843, "step": 151500 }, { "epoch": 0.18292559688374904, "learning_rate": 9.428168977682438e-06, "loss": 4.045631713867188, "step": 151600 }, { "epoch": 0.18304626020623171, "learning_rate": 9.427765142214698e-06, "loss": 4.052801818847656, "step": 151700 }, { "epoch": 0.18316692352871441, "learning_rate": 9.42736130674696e-06, "loss": 4.02794189453125, "step": 151800 }, { "epoch": 0.1832875868511971, "learning_rate": 9.426957471279222e-06, "loss": 4.015117492675781, "step": 151900 }, { "epoch": 0.18340825017367976, "learning_rate": 9.426553635811484e-06, "loss": 4.010919189453125, "step": 152000 }, { "epoch": 0.18352891349616246, "learning_rate": 9.426149800343746e-06, "loss": 4.0254150390625, "step": 152100 }, { "epoch": 0.18364957681864513, "learning_rate": 9.425745964876008e-06, "loss": 3.99409423828125, "step": 152200 }, { "epoch": 0.18377024014112783, "learning_rate": 9.42534212940827e-06, "loss": 4.019951477050781, "step": 152300 }, { "epoch": 0.1838909034636105, "learning_rate": 9.42493829394053e-06, "loss": 4.041195678710937, "step": 152400 }, { "epoch": 0.18401156678609318, "learning_rate": 9.424534458472792e-06, "loss": 4.027416381835938, "step": 152500 }, { "epoch": 0.18413223010857588, "learning_rate": 9.424130623005054e-06, "loss": 4.043953552246093, "step": 152600 }, { "epoch": 0.18425289343105855, "learning_rate": 9.423726787537314e-06, "loss": 4.022510070800781, "step": 152700 }, { "epoch": 0.18437355675354125, "learning_rate": 9.423322952069576e-06, "loss": 4.009160461425782, "step": 152800 }, { "epoch": 0.18449422007602392, "learning_rate": 9.422919116601838e-06, "loss": 4.020636901855469, "step": 152900 }, { "epoch": 0.18461488339850662, "learning_rate": 9.4225152811341e-06, "loss": 4.0316464233398435, "step": 153000 }, { "epoch": 0.1847355467209893, "learning_rate": 9.422111445666362e-06, "loss": 4.0219183349609375, "step": 153100 }, { "epoch": 0.18485621004347197, "learning_rate": 9.421707610198623e-06, "loss": 4.01727294921875, "step": 153200 }, { "epoch": 0.18497687336595467, "learning_rate": 9.421303774730885e-06, "loss": 4.0125732421875, "step": 153300 }, { "epoch": 0.18509753668843734, "learning_rate": 9.420899939263147e-06, "loss": 4.007660827636719, "step": 153400 }, { "epoch": 0.18521820001092004, "learning_rate": 9.420496103795409e-06, "loss": 3.996183166503906, "step": 153500 }, { "epoch": 0.18533886333340271, "learning_rate": 9.420092268327669e-06, "loss": 4.0167715454101565, "step": 153600 }, { "epoch": 0.1854595266558854, "learning_rate": 9.419688432859931e-06, "loss": 4.02603515625, "step": 153700 }, { "epoch": 0.1855801899783681, "learning_rate": 9.419284597392193e-06, "loss": 4.006358947753906, "step": 153800 }, { "epoch": 0.18570085330085076, "learning_rate": 9.418880761924455e-06, "loss": 4.02930908203125, "step": 153900 }, { "epoch": 0.18582151662333346, "learning_rate": 9.418476926456715e-06, "loss": 4.024056396484375, "step": 154000 }, { "epoch": 0.18594217994581613, "learning_rate": 9.418073090988977e-06, "loss": 4.001048889160156, "step": 154100 }, { "epoch": 0.1860628432682988, "learning_rate": 9.417669255521239e-06, "loss": 4.017117919921875, "step": 154200 }, { "epoch": 0.1861835065907815, "learning_rate": 9.417265420053501e-06, "loss": 3.9995022583007813, "step": 154300 }, { "epoch": 0.18630416991326418, "learning_rate": 9.416861584585763e-06, "loss": 3.9941656494140627, "step": 154400 }, { "epoch": 0.18642483323574688, "learning_rate": 9.416457749118025e-06, "loss": 3.992108154296875, "step": 154500 }, { "epoch": 0.18654549655822955, "learning_rate": 9.416053913650285e-06, "loss": 4.011061706542969, "step": 154600 }, { "epoch": 0.18666615988071225, "learning_rate": 9.415650078182547e-06, "loss": 4.010173034667969, "step": 154700 }, { "epoch": 0.18678682320319492, "learning_rate": 9.41524624271481e-06, "loss": 4.005847778320312, "step": 154800 }, { "epoch": 0.1869074865256776, "learning_rate": 9.41484240724707e-06, "loss": 4.026692504882813, "step": 154900 }, { "epoch": 0.1870281498481603, "learning_rate": 9.414438571779332e-06, "loss": 4.003030700683594, "step": 155000 }, { "epoch": 0.18714881317064297, "learning_rate": 9.414034736311594e-06, "loss": 3.986455078125, "step": 155100 }, { "epoch": 0.18726947649312567, "learning_rate": 9.413630900843856e-06, "loss": 3.9916006469726564, "step": 155200 }, { "epoch": 0.18739013981560834, "learning_rate": 9.413227065376118e-06, "loss": 4.001815185546875, "step": 155300 }, { "epoch": 0.18751080313809101, "learning_rate": 9.41282322990838e-06, "loss": 4.031525573730469, "step": 155400 }, { "epoch": 0.18763146646057371, "learning_rate": 9.41241939444064e-06, "loss": 4.016306762695312, "step": 155500 }, { "epoch": 0.1877521297830564, "learning_rate": 9.412015558972902e-06, "loss": 4.017903747558594, "step": 155600 }, { "epoch": 0.1878727931055391, "learning_rate": 9.411611723505164e-06, "loss": 3.995350646972656, "step": 155700 }, { "epoch": 0.18799345642802176, "learning_rate": 9.411207888037424e-06, "loss": 4.006609497070312, "step": 155800 }, { "epoch": 0.18811411975050446, "learning_rate": 9.410804052569686e-06, "loss": 4.022078247070312, "step": 155900 }, { "epoch": 0.18823478307298713, "learning_rate": 9.410400217101948e-06, "loss": 4.009051208496094, "step": 156000 }, { "epoch": 0.1883554463954698, "learning_rate": 9.40999638163421e-06, "loss": 4.0004119873046875, "step": 156100 }, { "epoch": 0.1884761097179525, "learning_rate": 9.409592546166472e-06, "loss": 3.9963970947265626, "step": 156200 }, { "epoch": 0.18859677304043518, "learning_rate": 9.409188710698734e-06, "loss": 3.958802490234375, "step": 156300 }, { "epoch": 0.18871743636291788, "learning_rate": 9.408784875230996e-06, "loss": 3.995546875, "step": 156400 }, { "epoch": 0.18883809968540055, "learning_rate": 9.408381039763256e-06, "loss": 4.009895935058593, "step": 156500 }, { "epoch": 0.18895876300788322, "learning_rate": 9.407977204295518e-06, "loss": 4.016905517578125, "step": 156600 }, { "epoch": 0.18907942633036592, "learning_rate": 9.407573368827779e-06, "loss": 3.996622314453125, "step": 156700 }, { "epoch": 0.1892000896528486, "learning_rate": 9.40716953336004e-06, "loss": 3.9768637084960936, "step": 156800 }, { "epoch": 0.1893207529753313, "learning_rate": 9.406765697892302e-06, "loss": 3.9941397094726563, "step": 156900 }, { "epoch": 0.18944141629781397, "learning_rate": 9.406361862424564e-06, "loss": 4.000443725585938, "step": 157000 }, { "epoch": 0.18956207962029667, "learning_rate": 9.405958026956826e-06, "loss": 3.9986016845703123, "step": 157100 }, { "epoch": 0.18968274294277934, "learning_rate": 9.405554191489088e-06, "loss": 3.9812774658203125, "step": 157200 }, { "epoch": 0.18980340626526201, "learning_rate": 9.405150356021349e-06, "loss": 3.9898141479492186, "step": 157300 }, { "epoch": 0.18992406958774471, "learning_rate": 9.40474652055361e-06, "loss": 3.9905380249023437, "step": 157400 }, { "epoch": 0.1900447329102274, "learning_rate": 9.404342685085873e-06, "loss": 3.9934176635742187, "step": 157500 }, { "epoch": 0.1901653962327101, "learning_rate": 9.403938849618135e-06, "loss": 3.9773764038085937, "step": 157600 }, { "epoch": 0.19028605955519276, "learning_rate": 9.403535014150395e-06, "loss": 3.9768081665039063, "step": 157700 }, { "epoch": 0.19040672287767543, "learning_rate": 9.403131178682657e-06, "loss": 3.9774356079101563, "step": 157800 }, { "epoch": 0.19052738620015813, "learning_rate": 9.402727343214919e-06, "loss": 3.984882507324219, "step": 157900 }, { "epoch": 0.1906480495226408, "learning_rate": 9.402323507747181e-06, "loss": 3.9816928100585938, "step": 158000 }, { "epoch": 0.1907687128451235, "learning_rate": 9.401919672279441e-06, "loss": 3.9713653564453124, "step": 158100 }, { "epoch": 0.19088937616760618, "learning_rate": 9.401515836811703e-06, "loss": 3.97996337890625, "step": 158200 }, { "epoch": 0.19101003949008888, "learning_rate": 9.401112001343965e-06, "loss": 3.9983935546875, "step": 158300 }, { "epoch": 0.19113070281257155, "learning_rate": 9.400708165876227e-06, "loss": 3.979936218261719, "step": 158400 }, { "epoch": 0.19125136613505422, "learning_rate": 9.400304330408489e-06, "loss": 3.9622076416015624, "step": 158500 }, { "epoch": 0.19137202945753692, "learning_rate": 9.39990049494075e-06, "loss": 3.994253845214844, "step": 158600 }, { "epoch": 0.1914926927800196, "learning_rate": 9.399496659473011e-06, "loss": 3.9754034423828126, "step": 158700 }, { "epoch": 0.1916133561025023, "learning_rate": 9.399092824005273e-06, "loss": 3.9619406127929686, "step": 158800 }, { "epoch": 0.19173401942498497, "learning_rate": 9.398688988537534e-06, "loss": 3.9780078125, "step": 158900 }, { "epoch": 0.19185468274746764, "learning_rate": 9.398285153069796e-06, "loss": 3.9652264404296873, "step": 159000 }, { "epoch": 0.19197534606995034, "learning_rate": 9.397881317602058e-06, "loss": 3.9717974853515625, "step": 159100 }, { "epoch": 0.19209600939243301, "learning_rate": 9.39747748213432e-06, "loss": 3.9876675415039062, "step": 159200 }, { "epoch": 0.19221667271491572, "learning_rate": 9.397073646666582e-06, "loss": 3.9908966064453124, "step": 159300 }, { "epoch": 0.1923373360373984, "learning_rate": 9.396669811198844e-06, "loss": 3.9443743896484373, "step": 159400 }, { "epoch": 0.1924579993598811, "learning_rate": 9.396265975731106e-06, "loss": 3.967160339355469, "step": 159500 }, { "epoch": 0.19257866268236376, "learning_rate": 9.395862140263366e-06, "loss": 3.9705538940429688, "step": 159600 }, { "epoch": 0.19269932600484643, "learning_rate": 9.395458304795628e-06, "loss": 4.003659973144531, "step": 159700 }, { "epoch": 0.19281998932732913, "learning_rate": 9.395054469327888e-06, "loss": 3.961138916015625, "step": 159800 }, { "epoch": 0.1929406526498118, "learning_rate": 9.39465063386015e-06, "loss": 3.9472125244140623, "step": 159900 }, { "epoch": 0.1930613159722945, "learning_rate": 9.394246798392412e-06, "loss": 3.961947021484375, "step": 160000 }, { "epoch": 0.19318197929477718, "learning_rate": 9.393842962924674e-06, "loss": 3.9489144897460937, "step": 160100 }, { "epoch": 0.19330264261725985, "learning_rate": 9.393439127456936e-06, "loss": 3.948178405761719, "step": 160200 }, { "epoch": 0.19342330593974255, "learning_rate": 9.393035291989198e-06, "loss": 3.9760037231445313, "step": 160300 }, { "epoch": 0.19354396926222522, "learning_rate": 9.39263145652146e-06, "loss": 3.9468838500976564, "step": 160400 }, { "epoch": 0.19366463258470792, "learning_rate": 9.39222762105372e-06, "loss": 3.9636865234375, "step": 160500 }, { "epoch": 0.1937852959071906, "learning_rate": 9.391823785585982e-06, "loss": 3.98802978515625, "step": 160600 }, { "epoch": 0.19390595922967327, "learning_rate": 9.391419950118244e-06, "loss": 3.943309020996094, "step": 160700 }, { "epoch": 0.19402662255215597, "learning_rate": 9.391016114650505e-06, "loss": 3.945246276855469, "step": 160800 }, { "epoch": 0.19414728587463864, "learning_rate": 9.390612279182767e-06, "loss": 3.943849792480469, "step": 160900 }, { "epoch": 0.19426794919712134, "learning_rate": 9.390208443715029e-06, "loss": 3.965051574707031, "step": 161000 }, { "epoch": 0.19438861251960401, "learning_rate": 9.38980460824729e-06, "loss": 3.9563021850585938, "step": 161100 }, { "epoch": 0.19450927584208672, "learning_rate": 9.389400772779552e-06, "loss": 3.9251171875, "step": 161200 }, { "epoch": 0.1946299391645694, "learning_rate": 9.388996937311814e-06, "loss": 3.9312396240234375, "step": 161300 }, { "epoch": 0.19475060248705206, "learning_rate": 9.388593101844075e-06, "loss": 3.945506591796875, "step": 161400 }, { "epoch": 0.19487126580953476, "learning_rate": 9.388189266376337e-06, "loss": 3.963096923828125, "step": 161500 }, { "epoch": 0.19499192913201743, "learning_rate": 9.387785430908599e-06, "loss": 3.951310729980469, "step": 161600 }, { "epoch": 0.19511259245450013, "learning_rate": 9.387381595440859e-06, "loss": 3.966768798828125, "step": 161700 }, { "epoch": 0.1952332557769828, "learning_rate": 9.386977759973121e-06, "loss": 3.9963201904296874, "step": 161800 }, { "epoch": 0.19535391909946548, "learning_rate": 9.386573924505383e-06, "loss": 3.9126287841796876, "step": 161900 }, { "epoch": 0.19547458242194818, "learning_rate": 9.386170089037645e-06, "loss": 3.967998046875, "step": 162000 }, { "epoch": 0.19559524574443085, "learning_rate": 9.385766253569907e-06, "loss": 3.973890686035156, "step": 162100 }, { "epoch": 0.19571590906691355, "learning_rate": 9.385362418102167e-06, "loss": 3.9504486083984376, "step": 162200 }, { "epoch": 0.19583657238939622, "learning_rate": 9.38495858263443e-06, "loss": 3.937174987792969, "step": 162300 }, { "epoch": 0.19595723571187892, "learning_rate": 9.384554747166691e-06, "loss": 3.95936279296875, "step": 162400 }, { "epoch": 0.1960778990343616, "learning_rate": 9.384150911698953e-06, "loss": 3.938043212890625, "step": 162500 }, { "epoch": 0.19619856235684427, "learning_rate": 9.383747076231215e-06, "loss": 3.968492431640625, "step": 162600 }, { "epoch": 0.19631922567932697, "learning_rate": 9.383343240763475e-06, "loss": 3.9378448486328126, "step": 162700 }, { "epoch": 0.19643988900180964, "learning_rate": 9.382939405295737e-06, "loss": 3.951314697265625, "step": 162800 }, { "epoch": 0.19656055232429234, "learning_rate": 9.382535569828e-06, "loss": 3.9318060302734374, "step": 162900 }, { "epoch": 0.19668121564677502, "learning_rate": 9.38213173436026e-06, "loss": 3.9562448120117186, "step": 163000 }, { "epoch": 0.1968018789692577, "learning_rate": 9.381727898892522e-06, "loss": 3.9357901000976563, "step": 163100 }, { "epoch": 0.1969225422917404, "learning_rate": 9.381324063424784e-06, "loss": 3.9316226196289064, "step": 163200 }, { "epoch": 0.19704320561422306, "learning_rate": 9.380920227957046e-06, "loss": 3.9586306762695314, "step": 163300 }, { "epoch": 0.19716386893670576, "learning_rate": 9.380516392489308e-06, "loss": 3.938726501464844, "step": 163400 }, { "epoch": 0.19728453225918843, "learning_rate": 9.38011255702157e-06, "loss": 3.940384826660156, "step": 163500 }, { "epoch": 0.19740519558167113, "learning_rate": 9.37970872155383e-06, "loss": 3.9382730102539063, "step": 163600 }, { "epoch": 0.1975258589041538, "learning_rate": 9.379304886086092e-06, "loss": 3.929862060546875, "step": 163700 }, { "epoch": 0.19764652222663648, "learning_rate": 9.378901050618354e-06, "loss": 3.934556884765625, "step": 163800 }, { "epoch": 0.19776718554911918, "learning_rate": 9.378497215150614e-06, "loss": 3.936484375, "step": 163900 }, { "epoch": 0.19788784887160185, "learning_rate": 9.378093379682876e-06, "loss": 3.9157168579101564, "step": 164000 }, { "epoch": 0.19800851219408455, "learning_rate": 9.377689544215138e-06, "loss": 3.92895263671875, "step": 164100 }, { "epoch": 0.19812917551656722, "learning_rate": 9.3772857087474e-06, "loss": 3.927414855957031, "step": 164200 }, { "epoch": 0.1982498388390499, "learning_rate": 9.376881873279662e-06, "loss": 3.9280136108398436, "step": 164300 }, { "epoch": 0.1983705021615326, "learning_rate": 9.376478037811924e-06, "loss": 3.951353759765625, "step": 164400 }, { "epoch": 0.19849116548401527, "learning_rate": 9.376074202344186e-06, "loss": 3.9360696411132814, "step": 164500 }, { "epoch": 0.19861182880649797, "learning_rate": 9.375670366876446e-06, "loss": 3.921869201660156, "step": 164600 }, { "epoch": 0.19873249212898064, "learning_rate": 9.375266531408708e-06, "loss": 3.925499267578125, "step": 164700 }, { "epoch": 0.19885315545146334, "learning_rate": 9.374862695940969e-06, "loss": 3.946710510253906, "step": 164800 }, { "epoch": 0.19897381877394602, "learning_rate": 9.37445886047323e-06, "loss": 3.8890890502929687, "step": 164900 }, { "epoch": 0.1990944820964287, "learning_rate": 9.374055025005493e-06, "loss": 3.9316473388671875, "step": 165000 }, { "epoch": 0.1992151454189114, "learning_rate": 9.373651189537755e-06, "loss": 3.92435546875, "step": 165100 }, { "epoch": 0.19933580874139406, "learning_rate": 9.373247354070017e-06, "loss": 3.9189715576171875, "step": 165200 }, { "epoch": 0.19945647206387676, "learning_rate": 9.372843518602279e-06, "loss": 3.904657287597656, "step": 165300 }, { "epoch": 0.19957713538635943, "learning_rate": 9.37243968313454e-06, "loss": 3.9273565673828124, "step": 165400 }, { "epoch": 0.1996977987088421, "learning_rate": 9.3720358476668e-06, "loss": 3.94675537109375, "step": 165500 }, { "epoch": 0.1998184620313248, "learning_rate": 9.371632012199063e-06, "loss": 3.9269332885742188, "step": 165600 }, { "epoch": 0.19993912535380748, "learning_rate": 9.371228176731325e-06, "loss": 3.9447283935546875, "step": 165700 }, { "epoch": 0.20005978867629018, "learning_rate": 9.370824341263585e-06, "loss": 3.9161105346679688, "step": 165800 }, { "epoch": 0.20018045199877285, "learning_rate": 9.370420505795847e-06, "loss": 3.913367919921875, "step": 165900 }, { "epoch": 0.20030111532125555, "learning_rate": 9.370016670328109e-06, "loss": 3.90974365234375, "step": 166000 }, { "epoch": 0.20042177864373822, "learning_rate": 9.369612834860371e-06, "loss": 3.916065979003906, "step": 166100 }, { "epoch": 0.2005424419662209, "learning_rate": 9.369208999392633e-06, "loss": 3.9042202758789064, "step": 166200 }, { "epoch": 0.2006631052887036, "learning_rate": 9.368805163924893e-06, "loss": 3.9106549072265624, "step": 166300 }, { "epoch": 0.20078376861118627, "learning_rate": 9.368401328457155e-06, "loss": 3.9116033935546874, "step": 166400 }, { "epoch": 0.20090443193366897, "learning_rate": 9.367997492989417e-06, "loss": 3.9169955444335938, "step": 166500 }, { "epoch": 0.20102509525615164, "learning_rate": 9.36759365752168e-06, "loss": 3.897344055175781, "step": 166600 }, { "epoch": 0.20114575857863431, "learning_rate": 9.367189822053941e-06, "loss": 3.8958749389648437, "step": 166700 }, { "epoch": 0.20126642190111702, "learning_rate": 9.366785986586201e-06, "loss": 3.917710266113281, "step": 166800 }, { "epoch": 0.2013870852235997, "learning_rate": 9.366382151118463e-06, "loss": 3.93051025390625, "step": 166900 }, { "epoch": 0.2015077485460824, "learning_rate": 9.365978315650725e-06, "loss": 3.91257080078125, "step": 167000 }, { "epoch": 0.20162841186856506, "learning_rate": 9.365574480182986e-06, "loss": 3.8849337768554686, "step": 167100 }, { "epoch": 0.20174907519104773, "learning_rate": 9.365170644715248e-06, "loss": 3.9154803466796877, "step": 167200 }, { "epoch": 0.20186973851353043, "learning_rate": 9.36476680924751e-06, "loss": 3.9124334716796874, "step": 167300 }, { "epoch": 0.2019904018360131, "learning_rate": 9.364362973779772e-06, "loss": 3.9076419067382813, "step": 167400 }, { "epoch": 0.2021110651584958, "learning_rate": 9.363959138312034e-06, "loss": 3.9181591796875, "step": 167500 }, { "epoch": 0.20223172848097848, "learning_rate": 9.363555302844296e-06, "loss": 3.9095223999023436, "step": 167600 }, { "epoch": 0.20235239180346118, "learning_rate": 9.363151467376556e-06, "loss": 3.9223626708984374, "step": 167700 }, { "epoch": 0.20247305512594385, "learning_rate": 9.362747631908818e-06, "loss": 3.908642578125, "step": 167800 }, { "epoch": 0.20259371844842652, "learning_rate": 9.36234379644108e-06, "loss": 3.912618408203125, "step": 167900 }, { "epoch": 0.20271438177090922, "learning_rate": 9.36193996097334e-06, "loss": 3.891865234375, "step": 168000 }, { "epoch": 0.2028350450933919, "learning_rate": 9.361536125505602e-06, "loss": 3.887584533691406, "step": 168100 }, { "epoch": 0.2029557084158746, "learning_rate": 9.361132290037864e-06, "loss": 3.902679443359375, "step": 168200 }, { "epoch": 0.20307637173835727, "learning_rate": 9.360728454570126e-06, "loss": 3.901674499511719, "step": 168300 }, { "epoch": 0.20319703506083994, "learning_rate": 9.360324619102388e-06, "loss": 3.8855657958984375, "step": 168400 }, { "epoch": 0.20331769838332264, "learning_rate": 9.35992078363465e-06, "loss": 3.9087725830078126, "step": 168500 }, { "epoch": 0.20343836170580532, "learning_rate": 9.359516948166912e-06, "loss": 3.8916744995117187, "step": 168600 }, { "epoch": 0.20355902502828802, "learning_rate": 9.359113112699172e-06, "loss": 3.903193054199219, "step": 168700 }, { "epoch": 0.2036796883507707, "learning_rate": 9.358709277231434e-06, "loss": 3.9031878662109376, "step": 168800 }, { "epoch": 0.2038003516732534, "learning_rate": 9.358305441763695e-06, "loss": 3.8811785888671877, "step": 168900 }, { "epoch": 0.20392101499573606, "learning_rate": 9.357901606295957e-06, "loss": 3.9057913208007813, "step": 169000 }, { "epoch": 0.20404167831821873, "learning_rate": 9.357497770828219e-06, "loss": 3.9004705810546874, "step": 169100 }, { "epoch": 0.20416234164070143, "learning_rate": 9.35709393536048e-06, "loss": 3.9152734375, "step": 169200 }, { "epoch": 0.2042830049631841, "learning_rate": 9.356690099892743e-06, "loss": 3.8760000610351564, "step": 169300 }, { "epoch": 0.2044036682856668, "learning_rate": 9.356286264425005e-06, "loss": 3.8949551391601562, "step": 169400 }, { "epoch": 0.20452433160814948, "learning_rate": 9.355882428957265e-06, "loss": 3.9081497192382812, "step": 169500 }, { "epoch": 0.20464499493063215, "learning_rate": 9.355478593489527e-06, "loss": 3.891767578125, "step": 169600 }, { "epoch": 0.20476565825311485, "learning_rate": 9.355074758021789e-06, "loss": 3.9051165771484375, "step": 169700 }, { "epoch": 0.20488632157559752, "learning_rate": 9.35467092255405e-06, "loss": 3.880681457519531, "step": 169800 }, { "epoch": 0.20500698489808022, "learning_rate": 9.354267087086311e-06, "loss": 3.882630615234375, "step": 169900 }, { "epoch": 0.2051276482205629, "learning_rate": 9.353863251618573e-06, "loss": 3.9082928466796876, "step": 170000 }, { "epoch": 0.2052483115430456, "learning_rate": 9.353459416150835e-06, "loss": 3.9023587036132814, "step": 170100 }, { "epoch": 0.20536897486552827, "learning_rate": 9.353055580683097e-06, "loss": 3.9219537353515626, "step": 170200 }, { "epoch": 0.20548963818801094, "learning_rate": 9.352651745215359e-06, "loss": 3.891326599121094, "step": 170300 }, { "epoch": 0.20561030151049364, "learning_rate": 9.35224790974762e-06, "loss": 3.893621826171875, "step": 170400 }, { "epoch": 0.20573096483297632, "learning_rate": 9.351844074279881e-06, "loss": 3.890181579589844, "step": 170500 }, { "epoch": 0.20585162815545902, "learning_rate": 9.351440238812143e-06, "loss": 3.882404479980469, "step": 170600 }, { "epoch": 0.2059722914779417, "learning_rate": 9.351036403344405e-06, "loss": 3.9055499267578124, "step": 170700 }, { "epoch": 0.20609295480042436, "learning_rate": 9.350632567876666e-06, "loss": 3.8784725952148436, "step": 170800 }, { "epoch": 0.20621361812290706, "learning_rate": 9.350228732408927e-06, "loss": 3.8956500244140626, "step": 170900 }, { "epoch": 0.20633428144538973, "learning_rate": 9.34982489694119e-06, "loss": 3.8820159912109373, "step": 171000 }, { "epoch": 0.20645494476787243, "learning_rate": 9.349421061473451e-06, "loss": 3.862356872558594, "step": 171100 }, { "epoch": 0.2065756080903551, "learning_rate": 9.349017226005712e-06, "loss": 3.8845086669921876, "step": 171200 }, { "epoch": 0.2066962714128378, "learning_rate": 9.348613390537974e-06, "loss": 3.8948565673828126, "step": 171300 }, { "epoch": 0.20681693473532048, "learning_rate": 9.348209555070236e-06, "loss": 3.9076422119140624, "step": 171400 }, { "epoch": 0.20693759805780315, "learning_rate": 9.347805719602498e-06, "loss": 3.8729852294921874, "step": 171500 }, { "epoch": 0.20705826138028585, "learning_rate": 9.34740188413476e-06, "loss": 3.870924072265625, "step": 171600 }, { "epoch": 0.20717892470276852, "learning_rate": 9.346998048667022e-06, "loss": 3.8728848266601563, "step": 171700 }, { "epoch": 0.20729958802525122, "learning_rate": 9.346594213199282e-06, "loss": 3.8923126220703126, "step": 171800 }, { "epoch": 0.2074202513477339, "learning_rate": 9.346190377731544e-06, "loss": 3.875132751464844, "step": 171900 }, { "epoch": 0.20754091467021657, "learning_rate": 9.345786542263804e-06, "loss": 3.858740234375, "step": 172000 }, { "epoch": 0.20766157799269927, "learning_rate": 9.345382706796066e-06, "loss": 3.896944885253906, "step": 172100 }, { "epoch": 0.20778224131518194, "learning_rate": 9.344978871328328e-06, "loss": 3.865123596191406, "step": 172200 }, { "epoch": 0.20790290463766464, "learning_rate": 9.34457503586059e-06, "loss": 3.870838317871094, "step": 172300 }, { "epoch": 0.20802356796014732, "learning_rate": 9.344171200392852e-06, "loss": 3.852091979980469, "step": 172400 }, { "epoch": 0.20814423128263002, "learning_rate": 9.343767364925114e-06, "loss": 3.8722979736328127, "step": 172500 }, { "epoch": 0.2082648946051127, "learning_rate": 9.343363529457376e-06, "loss": 3.868000793457031, "step": 172600 }, { "epoch": 0.20838555792759536, "learning_rate": 9.342959693989636e-06, "loss": 3.8725985717773437, "step": 172700 }, { "epoch": 0.20850622125007806, "learning_rate": 9.342555858521898e-06, "loss": 3.8823471069335938, "step": 172800 }, { "epoch": 0.20862688457256073, "learning_rate": 9.34215202305416e-06, "loss": 3.8700616455078123, "step": 172900 }, { "epoch": 0.20874754789504343, "learning_rate": 9.34174818758642e-06, "loss": 3.8738943481445314, "step": 173000 }, { "epoch": 0.2088682112175261, "learning_rate": 9.341344352118683e-06, "loss": 3.851153564453125, "step": 173100 }, { "epoch": 0.20898887454000878, "learning_rate": 9.340940516650945e-06, "loss": 3.8581884765625, "step": 173200 }, { "epoch": 0.20910953786249148, "learning_rate": 9.340536681183207e-06, "loss": 3.873965148925781, "step": 173300 }, { "epoch": 0.20923020118497415, "learning_rate": 9.340132845715469e-06, "loss": 3.8880624389648437, "step": 173400 }, { "epoch": 0.20935086450745685, "learning_rate": 9.33972901024773e-06, "loss": 3.8819808959960938, "step": 173500 }, { "epoch": 0.20947152782993952, "learning_rate": 9.339325174779991e-06, "loss": 3.8697860717773436, "step": 173600 }, { "epoch": 0.2095921911524222, "learning_rate": 9.338921339312253e-06, "loss": 3.8486712646484373, "step": 173700 }, { "epoch": 0.2097128544749049, "learning_rate": 9.338517503844515e-06, "loss": 3.879408264160156, "step": 173800 }, { "epoch": 0.20983351779738757, "learning_rate": 9.338113668376775e-06, "loss": 3.878307189941406, "step": 173900 }, { "epoch": 0.20995418111987027, "learning_rate": 9.337709832909037e-06, "loss": 3.856025390625, "step": 174000 }, { "epoch": 0.21007484444235294, "learning_rate": 9.337305997441299e-06, "loss": 3.864388427734375, "step": 174100 }, { "epoch": 0.21019550776483564, "learning_rate": 9.336902161973561e-06, "loss": 3.840981140136719, "step": 174200 }, { "epoch": 0.21031617108731832, "learning_rate": 9.336498326505823e-06, "loss": 3.8313128662109377, "step": 174300 }, { "epoch": 0.210436834409801, "learning_rate": 9.336094491038083e-06, "loss": 3.880459899902344, "step": 174400 }, { "epoch": 0.2105574977322837, "learning_rate": 9.335690655570345e-06, "loss": 3.8525216674804685, "step": 174500 }, { "epoch": 0.21067816105476636, "learning_rate": 9.335286820102607e-06, "loss": 3.859064636230469, "step": 174600 }, { "epoch": 0.21079882437724906, "learning_rate": 9.33488298463487e-06, "loss": 3.8755914306640626, "step": 174700 }, { "epoch": 0.21091948769973173, "learning_rate": 9.334479149167131e-06, "loss": 3.8529559326171876, "step": 174800 }, { "epoch": 0.2110401510222144, "learning_rate": 9.334075313699392e-06, "loss": 3.8421771240234377, "step": 174900 }, { "epoch": 0.2111608143446971, "learning_rate": 9.333671478231654e-06, "loss": 3.8353622436523436, "step": 175000 }, { "epoch": 0.21128147766717978, "learning_rate": 9.333267642763916e-06, "loss": 3.879399719238281, "step": 175100 }, { "epoch": 0.21140214098966248, "learning_rate": 9.332863807296177e-06, "loss": 3.85759765625, "step": 175200 }, { "epoch": 0.21152280431214515, "learning_rate": 9.332459971828438e-06, "loss": 3.827712097167969, "step": 175300 }, { "epoch": 0.21164346763462785, "learning_rate": 9.3320561363607e-06, "loss": 3.87615966796875, "step": 175400 }, { "epoch": 0.21176413095711052, "learning_rate": 9.331652300892962e-06, "loss": 3.8824026489257815, "step": 175500 }, { "epoch": 0.2118847942795932, "learning_rate": 9.331248465425224e-06, "loss": 3.8432635498046874, "step": 175600 }, { "epoch": 0.2120054576020759, "learning_rate": 9.330844629957486e-06, "loss": 3.834368896484375, "step": 175700 }, { "epoch": 0.21212612092455857, "learning_rate": 9.330440794489746e-06, "loss": 3.8644479370117186, "step": 175800 }, { "epoch": 0.21224678424704127, "learning_rate": 9.330036959022008e-06, "loss": 3.830558166503906, "step": 175900 }, { "epoch": 0.21236744756952394, "learning_rate": 9.32963312355427e-06, "loss": 3.849298095703125, "step": 176000 }, { "epoch": 0.21248811089200662, "learning_rate": 9.32922928808653e-06, "loss": 3.871258544921875, "step": 176100 }, { "epoch": 0.21260877421448932, "learning_rate": 9.328825452618792e-06, "loss": 3.8467529296875, "step": 176200 }, { "epoch": 0.212729437536972, "learning_rate": 9.328421617151054e-06, "loss": 3.833404541015625, "step": 176300 }, { "epoch": 0.2128501008594547, "learning_rate": 9.328017781683316e-06, "loss": 3.8632907104492187, "step": 176400 }, { "epoch": 0.21297076418193736, "learning_rate": 9.327613946215578e-06, "loss": 3.8525067138671876, "step": 176500 }, { "epoch": 0.21309142750442006, "learning_rate": 9.32721011074784e-06, "loss": 3.8538772583007814, "step": 176600 }, { "epoch": 0.21321209082690273, "learning_rate": 9.326806275280102e-06, "loss": 3.8527908325195312, "step": 176700 }, { "epoch": 0.2133327541493854, "learning_rate": 9.326402439812362e-06, "loss": 3.8154119873046874, "step": 176800 }, { "epoch": 0.2134534174718681, "learning_rate": 9.325998604344624e-06, "loss": 3.833676452636719, "step": 176900 }, { "epoch": 0.21357408079435078, "learning_rate": 9.325594768876885e-06, "loss": 3.8553839111328125, "step": 177000 }, { "epoch": 0.21369474411683348, "learning_rate": 9.325190933409147e-06, "loss": 3.8368209838867187, "step": 177100 }, { "epoch": 0.21381540743931615, "learning_rate": 9.324787097941409e-06, "loss": 3.82350830078125, "step": 177200 }, { "epoch": 0.21393607076179882, "learning_rate": 9.32438326247367e-06, "loss": 3.8502886962890623, "step": 177300 }, { "epoch": 0.21405673408428152, "learning_rate": 9.323979427005933e-06, "loss": 3.850924377441406, "step": 177400 }, { "epoch": 0.2141773974067642, "learning_rate": 9.323575591538195e-06, "loss": 3.8369631958007813, "step": 177500 }, { "epoch": 0.2142980607292469, "learning_rate": 9.323171756070457e-06, "loss": 3.81966552734375, "step": 177600 }, { "epoch": 0.21441872405172957, "learning_rate": 9.322767920602717e-06, "loss": 3.8794818115234375, "step": 177700 }, { "epoch": 0.21453938737421227, "learning_rate": 9.322364085134979e-06, "loss": 3.82856689453125, "step": 177800 }, { "epoch": 0.21466005069669494, "learning_rate": 9.321960249667241e-06, "loss": 3.8288058471679687, "step": 177900 }, { "epoch": 0.21478071401917762, "learning_rate": 9.321556414199501e-06, "loss": 3.831231689453125, "step": 178000 }, { "epoch": 0.21490137734166032, "learning_rate": 9.321152578731763e-06, "loss": 3.8515533447265624, "step": 178100 }, { "epoch": 0.215022040664143, "learning_rate": 9.320748743264025e-06, "loss": 3.857205505371094, "step": 178200 }, { "epoch": 0.2151427039866257, "learning_rate": 9.320344907796287e-06, "loss": 3.8408935546875, "step": 178300 }, { "epoch": 0.21526336730910836, "learning_rate": 9.319941072328549e-06, "loss": 3.83988525390625, "step": 178400 }, { "epoch": 0.21538403063159103, "learning_rate": 9.31953723686081e-06, "loss": 3.828887634277344, "step": 178500 }, { "epoch": 0.21550469395407373, "learning_rate": 9.319133401393071e-06, "loss": 3.840606994628906, "step": 178600 }, { "epoch": 0.2156253572765564, "learning_rate": 9.318729565925333e-06, "loss": 3.832397155761719, "step": 178700 }, { "epoch": 0.2157460205990391, "learning_rate": 9.318325730457595e-06, "loss": 3.8263336181640626, "step": 178800 }, { "epoch": 0.21586668392152178, "learning_rate": 9.317921894989856e-06, "loss": 3.80751708984375, "step": 178900 }, { "epoch": 0.21598734724400448, "learning_rate": 9.317518059522118e-06, "loss": 3.8040643310546876, "step": 179000 }, { "epoch": 0.21610801056648715, "learning_rate": 9.31711422405438e-06, "loss": 3.814153137207031, "step": 179100 }, { "epoch": 0.21622867388896982, "learning_rate": 9.316710388586642e-06, "loss": 3.8432388305664062, "step": 179200 }, { "epoch": 0.21634933721145252, "learning_rate": 9.316306553118902e-06, "loss": 3.816586608886719, "step": 179300 }, { "epoch": 0.2164700005339352, "learning_rate": 9.315902717651164e-06, "loss": 3.861735534667969, "step": 179400 }, { "epoch": 0.2165906638564179, "learning_rate": 9.315498882183426e-06, "loss": 3.8271188354492187, "step": 179500 }, { "epoch": 0.21671132717890057, "learning_rate": 9.315095046715688e-06, "loss": 3.8121441650390624, "step": 179600 }, { "epoch": 0.21683199050138324, "learning_rate": 9.31469121124795e-06, "loss": 3.8089938354492188, "step": 179700 }, { "epoch": 0.21695265382386594, "learning_rate": 9.314287375780212e-06, "loss": 3.844149475097656, "step": 179800 }, { "epoch": 0.21707331714634862, "learning_rate": 9.313883540312472e-06, "loss": 3.8364193725585936, "step": 179900 }, { "epoch": 0.21719398046883132, "learning_rate": 9.313479704844734e-06, "loss": 3.8371978759765626, "step": 180000 }, { "epoch": 0.217314643791314, "learning_rate": 9.313075869376996e-06, "loss": 3.8046685791015626, "step": 180100 }, { "epoch": 0.21743530711379666, "learning_rate": 9.312672033909256e-06, "loss": 3.8093197631835936, "step": 180200 }, { "epoch": 0.21755597043627936, "learning_rate": 9.312268198441518e-06, "loss": 3.820914001464844, "step": 180300 }, { "epoch": 0.21767663375876203, "learning_rate": 9.31186436297378e-06, "loss": 3.8356719970703126, "step": 180400 }, { "epoch": 0.21779729708124473, "learning_rate": 9.311460527506042e-06, "loss": 3.805845031738281, "step": 180500 }, { "epoch": 0.2179179604037274, "learning_rate": 9.311056692038304e-06, "loss": 3.83080078125, "step": 180600 }, { "epoch": 0.2180386237262101, "learning_rate": 9.310652856570566e-06, "loss": 3.8284832763671877, "step": 180700 }, { "epoch": 0.21815928704869278, "learning_rate": 9.310249021102828e-06, "loss": 3.7746923828125, "step": 180800 }, { "epoch": 0.21827995037117545, "learning_rate": 9.309845185635088e-06, "loss": 3.8273052978515625, "step": 180900 }, { "epoch": 0.21840061369365815, "learning_rate": 9.30944135016735e-06, "loss": 3.7906207275390624, "step": 181000 }, { "epoch": 0.21852127701614082, "learning_rate": 9.30903751469961e-06, "loss": 3.8062454223632813, "step": 181100 }, { "epoch": 0.21864194033862352, "learning_rate": 9.308633679231873e-06, "loss": 3.8278863525390623, "step": 181200 }, { "epoch": 0.2187626036611062, "learning_rate": 9.308229843764135e-06, "loss": 3.845267639160156, "step": 181300 }, { "epoch": 0.21888326698358887, "learning_rate": 9.307826008296397e-06, "loss": 3.819762878417969, "step": 181400 }, { "epoch": 0.21900393030607157, "learning_rate": 9.307422172828659e-06, "loss": 3.8009677124023438, "step": 181500 }, { "epoch": 0.21912459362855424, "learning_rate": 9.30701833736092e-06, "loss": 3.803919677734375, "step": 181600 }, { "epoch": 0.21924525695103694, "learning_rate": 9.306614501893183e-06, "loss": 3.797157897949219, "step": 181700 }, { "epoch": 0.21936592027351962, "learning_rate": 9.306210666425443e-06, "loss": 3.83072509765625, "step": 181800 }, { "epoch": 0.21948658359600232, "learning_rate": 9.305806830957705e-06, "loss": 3.7823165893554687, "step": 181900 }, { "epoch": 0.219607246918485, "learning_rate": 9.305402995489967e-06, "loss": 3.815687255859375, "step": 182000 }, { "epoch": 0.21972791024096766, "learning_rate": 9.304999160022227e-06, "loss": 3.82070556640625, "step": 182100 }, { "epoch": 0.21984857356345036, "learning_rate": 9.30459532455449e-06, "loss": 3.798536682128906, "step": 182200 }, { "epoch": 0.21996923688593303, "learning_rate": 9.304191489086751e-06, "loss": 3.8398867797851564, "step": 182300 }, { "epoch": 0.22008990020841573, "learning_rate": 9.303787653619013e-06, "loss": 3.8175033569335937, "step": 182400 }, { "epoch": 0.2202105635308984, "learning_rate": 9.303383818151275e-06, "loss": 3.8130667114257815, "step": 182500 }, { "epoch": 0.22033122685338108, "learning_rate": 9.302979982683535e-06, "loss": 3.8300772094726563, "step": 182600 }, { "epoch": 0.22045189017586378, "learning_rate": 9.302576147215797e-06, "loss": 3.801288757324219, "step": 182700 }, { "epoch": 0.22057255349834645, "learning_rate": 9.30217231174806e-06, "loss": 3.803774719238281, "step": 182800 }, { "epoch": 0.22069321682082915, "learning_rate": 9.301768476280321e-06, "loss": 3.7768594360351564, "step": 182900 }, { "epoch": 0.22081388014331182, "learning_rate": 9.301364640812582e-06, "loss": 3.8130340576171875, "step": 183000 }, { "epoch": 0.22093454346579453, "learning_rate": 9.300960805344844e-06, "loss": 3.803114013671875, "step": 183100 }, { "epoch": 0.2210552067882772, "learning_rate": 9.300556969877106e-06, "loss": 3.8122787475585938, "step": 183200 }, { "epoch": 0.22117587011075987, "learning_rate": 9.300153134409368e-06, "loss": 3.7887149047851563, "step": 183300 }, { "epoch": 0.22129653343324257, "learning_rate": 9.299749298941628e-06, "loss": 3.8040652465820313, "step": 183400 }, { "epoch": 0.22141719675572524, "learning_rate": 9.29934546347389e-06, "loss": 3.8092083740234375, "step": 183500 }, { "epoch": 0.22153786007820794, "learning_rate": 9.298941628006152e-06, "loss": 3.800281982421875, "step": 183600 }, { "epoch": 0.22165852340069062, "learning_rate": 9.298537792538414e-06, "loss": 3.8207421875, "step": 183700 }, { "epoch": 0.2217791867231733, "learning_rate": 9.298133957070676e-06, "loss": 3.8118405151367187, "step": 183800 }, { "epoch": 0.221899850045656, "learning_rate": 9.297730121602938e-06, "loss": 3.782644958496094, "step": 183900 }, { "epoch": 0.22202051336813866, "learning_rate": 9.297326286135198e-06, "loss": 3.8218756103515625, "step": 184000 }, { "epoch": 0.22214117669062136, "learning_rate": 9.29692245066746e-06, "loss": 3.771357421875, "step": 184100 }, { "epoch": 0.22226184001310403, "learning_rate": 9.29651861519972e-06, "loss": 3.796797180175781, "step": 184200 }, { "epoch": 0.22238250333558673, "learning_rate": 9.296114779731982e-06, "loss": 3.788507995605469, "step": 184300 }, { "epoch": 0.2225031666580694, "learning_rate": 9.295710944264244e-06, "loss": 3.787674560546875, "step": 184400 }, { "epoch": 0.22262382998055208, "learning_rate": 9.295307108796506e-06, "loss": 3.7998928833007812, "step": 184500 }, { "epoch": 0.22274449330303478, "learning_rate": 9.294903273328768e-06, "loss": 3.7879794311523436, "step": 184600 }, { "epoch": 0.22286515662551745, "learning_rate": 9.29449943786103e-06, "loss": 3.7838589477539064, "step": 184700 }, { "epoch": 0.22298581994800015, "learning_rate": 9.294095602393292e-06, "loss": 3.8012313842773438, "step": 184800 }, { "epoch": 0.22310648327048282, "learning_rate": 9.293691766925553e-06, "loss": 3.784291076660156, "step": 184900 }, { "epoch": 0.2232271465929655, "learning_rate": 9.293287931457815e-06, "loss": 3.8197982788085936, "step": 185000 }, { "epoch": 0.2233478099154482, "learning_rate": 9.292884095990076e-06, "loss": 3.8027383422851564, "step": 185100 }, { "epoch": 0.22346847323793087, "learning_rate": 9.292480260522337e-06, "loss": 3.7904058837890626, "step": 185200 }, { "epoch": 0.22358913656041357, "learning_rate": 9.292076425054599e-06, "loss": 3.794341735839844, "step": 185300 }, { "epoch": 0.22370979988289624, "learning_rate": 9.29167258958686e-06, "loss": 3.791290588378906, "step": 185400 }, { "epoch": 0.22383046320537894, "learning_rate": 9.291268754119123e-06, "loss": 3.8027297973632814, "step": 185500 }, { "epoch": 0.22395112652786162, "learning_rate": 9.290864918651385e-06, "loss": 3.7950787353515625, "step": 185600 }, { "epoch": 0.2240717898503443, "learning_rate": 9.290461083183647e-06, "loss": 3.767216796875, "step": 185700 }, { "epoch": 0.224192453172827, "learning_rate": 9.290057247715909e-06, "loss": 3.77049560546875, "step": 185800 }, { "epoch": 0.22431311649530966, "learning_rate": 9.289653412248169e-06, "loss": 3.7954052734375, "step": 185900 }, { "epoch": 0.22443377981779236, "learning_rate": 9.289249576780431e-06, "loss": 3.794927978515625, "step": 186000 }, { "epoch": 0.22455444314027503, "learning_rate": 9.288845741312691e-06, "loss": 3.8113580322265626, "step": 186100 }, { "epoch": 0.2246751064627577, "learning_rate": 9.288441905844953e-06, "loss": 3.784781188964844, "step": 186200 }, { "epoch": 0.2247957697852404, "learning_rate": 9.288038070377215e-06, "loss": 3.7929623413085936, "step": 186300 }, { "epoch": 0.22491643310772308, "learning_rate": 9.287634234909477e-06, "loss": 3.799100341796875, "step": 186400 }, { "epoch": 0.22503709643020578, "learning_rate": 9.28723039944174e-06, "loss": 3.7763958740234376, "step": 186500 }, { "epoch": 0.22515775975268845, "learning_rate": 9.286826563974001e-06, "loss": 3.769142761230469, "step": 186600 }, { "epoch": 0.22527842307517112, "learning_rate": 9.286422728506261e-06, "loss": 3.782398986816406, "step": 186700 }, { "epoch": 0.22539908639765383, "learning_rate": 9.286018893038523e-06, "loss": 3.7773593139648436, "step": 186800 }, { "epoch": 0.2255197497201365, "learning_rate": 9.285615057570785e-06, "loss": 3.775775146484375, "step": 186900 }, { "epoch": 0.2256404130426192, "learning_rate": 9.285211222103047e-06, "loss": 3.769295349121094, "step": 187000 }, { "epoch": 0.22576107636510187, "learning_rate": 9.284807386635308e-06, "loss": 3.772156982421875, "step": 187100 }, { "epoch": 0.22588173968758457, "learning_rate": 9.28440355116757e-06, "loss": 3.75919677734375, "step": 187200 }, { "epoch": 0.22600240301006724, "learning_rate": 9.283999715699832e-06, "loss": 3.76804443359375, "step": 187300 }, { "epoch": 0.22612306633254992, "learning_rate": 9.283595880232094e-06, "loss": 3.7640045166015623, "step": 187400 }, { "epoch": 0.22624372965503262, "learning_rate": 9.283192044764354e-06, "loss": 3.7552081298828126, "step": 187500 }, { "epoch": 0.2263643929775153, "learning_rate": 9.282788209296616e-06, "loss": 3.7742254638671877, "step": 187600 }, { "epoch": 0.226485056299998, "learning_rate": 9.282384373828878e-06, "loss": 3.7708554077148437, "step": 187700 }, { "epoch": 0.22660571962248066, "learning_rate": 9.28198053836114e-06, "loss": 3.781942138671875, "step": 187800 }, { "epoch": 0.22672638294496333, "learning_rate": 9.281576702893402e-06, "loss": 3.7824172973632812, "step": 187900 }, { "epoch": 0.22684704626744603, "learning_rate": 9.281172867425662e-06, "loss": 3.7651132202148436, "step": 188000 }, { "epoch": 0.2269677095899287, "learning_rate": 9.280769031957924e-06, "loss": 3.771176452636719, "step": 188100 }, { "epoch": 0.2270883729124114, "learning_rate": 9.280365196490186e-06, "loss": 3.8021160888671877, "step": 188200 }, { "epoch": 0.22720903623489408, "learning_rate": 9.279961361022446e-06, "loss": 3.779035949707031, "step": 188300 }, { "epoch": 0.22732969955737678, "learning_rate": 9.279557525554708e-06, "loss": 3.78049072265625, "step": 188400 }, { "epoch": 0.22745036287985945, "learning_rate": 9.27915369008697e-06, "loss": 3.7830355834960936, "step": 188500 }, { "epoch": 0.22757102620234212, "learning_rate": 9.278749854619232e-06, "loss": 3.775142822265625, "step": 188600 }, { "epoch": 0.22769168952482483, "learning_rate": 9.278346019151494e-06, "loss": 3.7713577270507814, "step": 188700 }, { "epoch": 0.2278123528473075, "learning_rate": 9.277942183683756e-06, "loss": 3.764349060058594, "step": 188800 }, { "epoch": 0.2279330161697902, "learning_rate": 9.277538348216018e-06, "loss": 3.7626797485351564, "step": 188900 }, { "epoch": 0.22805367949227287, "learning_rate": 9.277134512748279e-06, "loss": 3.7513308715820313, "step": 189000 }, { "epoch": 0.22817434281475554, "learning_rate": 9.27673067728054e-06, "loss": 3.7844378662109377, "step": 189100 }, { "epoch": 0.22829500613723824, "learning_rate": 9.2763268418128e-06, "loss": 3.776136474609375, "step": 189200 }, { "epoch": 0.22841566945972092, "learning_rate": 9.275923006345063e-06, "loss": 3.766302490234375, "step": 189300 }, { "epoch": 0.22853633278220362, "learning_rate": 9.275519170877325e-06, "loss": 3.7739431762695315, "step": 189400 }, { "epoch": 0.2286569961046863, "learning_rate": 9.275115335409587e-06, "loss": 3.746210632324219, "step": 189500 }, { "epoch": 0.228777659427169, "learning_rate": 9.274711499941849e-06, "loss": 3.7465924072265624, "step": 189600 }, { "epoch": 0.22889832274965166, "learning_rate": 9.27430766447411e-06, "loss": 3.7799801635742187, "step": 189700 }, { "epoch": 0.22901898607213433, "learning_rate": 9.273903829006373e-06, "loss": 3.725357666015625, "step": 189800 }, { "epoch": 0.22913964939461703, "learning_rate": 9.273499993538633e-06, "loss": 3.75540283203125, "step": 189900 }, { "epoch": 0.2292603127170997, "learning_rate": 9.273096158070895e-06, "loss": 3.7522036743164064, "step": 190000 }, { "epoch": 0.2293809760395824, "learning_rate": 9.272692322603157e-06, "loss": 3.7510440063476564, "step": 190100 }, { "epoch": 0.22950163936206508, "learning_rate": 9.272288487135417e-06, "loss": 3.727488708496094, "step": 190200 }, { "epoch": 0.22962230268454775, "learning_rate": 9.27188465166768e-06, "loss": 3.780382080078125, "step": 190300 }, { "epoch": 0.22974296600703045, "learning_rate": 9.271480816199941e-06, "loss": 3.7685797119140627, "step": 190400 }, { "epoch": 0.22986362932951312, "learning_rate": 9.271076980732203e-06, "loss": 3.7479373168945314, "step": 190500 }, { "epoch": 0.22998429265199583, "learning_rate": 9.270673145264465e-06, "loss": 3.75752197265625, "step": 190600 }, { "epoch": 0.2301049559744785, "learning_rate": 9.270269309796727e-06, "loss": 3.7632522583007812, "step": 190700 }, { "epoch": 0.2302256192969612, "learning_rate": 9.269865474328987e-06, "loss": 3.7460955810546874, "step": 190800 }, { "epoch": 0.23034628261944387, "learning_rate": 9.26946163886125e-06, "loss": 3.7422393798828124, "step": 190900 }, { "epoch": 0.23046694594192654, "learning_rate": 9.269057803393511e-06, "loss": 3.7621484375, "step": 191000 }, { "epoch": 0.23058760926440924, "learning_rate": 9.268653967925772e-06, "loss": 3.7656124877929686, "step": 191100 }, { "epoch": 0.23070827258689192, "learning_rate": 9.268250132458034e-06, "loss": 3.7832489013671875, "step": 191200 }, { "epoch": 0.23082893590937462, "learning_rate": 9.267846296990296e-06, "loss": 3.7495806884765623, "step": 191300 }, { "epoch": 0.2309495992318573, "learning_rate": 9.267442461522558e-06, "loss": 3.776719970703125, "step": 191400 }, { "epoch": 0.23107026255433996, "learning_rate": 9.26703862605482e-06, "loss": 3.7207135009765624, "step": 191500 }, { "epoch": 0.23119092587682266, "learning_rate": 9.26663479058708e-06, "loss": 3.7676181030273437, "step": 191600 }, { "epoch": 0.23131158919930533, "learning_rate": 9.266230955119342e-06, "loss": 3.753806457519531, "step": 191700 }, { "epoch": 0.23143225252178803, "learning_rate": 9.265827119651604e-06, "loss": 3.731363525390625, "step": 191800 }, { "epoch": 0.2315529158442707, "learning_rate": 9.265423284183866e-06, "loss": 3.77650146484375, "step": 191900 }, { "epoch": 0.2316735791667534, "learning_rate": 9.265019448716128e-06, "loss": 3.758489074707031, "step": 192000 }, { "epoch": 0.23179424248923608, "learning_rate": 9.264615613248388e-06, "loss": 3.737186279296875, "step": 192100 }, { "epoch": 0.23191490581171875, "learning_rate": 9.26421177778065e-06, "loss": 3.7510443115234375, "step": 192200 }, { "epoch": 0.23203556913420145, "learning_rate": 9.263807942312912e-06, "loss": 3.7581683349609376, "step": 192300 }, { "epoch": 0.23215623245668413, "learning_rate": 9.263404106845172e-06, "loss": 3.7492074584960937, "step": 192400 }, { "epoch": 0.23227689577916683, "learning_rate": 9.263000271377434e-06, "loss": 3.7553305053710937, "step": 192500 }, { "epoch": 0.2323975591016495, "learning_rate": 9.262596435909696e-06, "loss": 3.746603698730469, "step": 192600 }, { "epoch": 0.23251822242413217, "learning_rate": 9.262192600441958e-06, "loss": 3.7663336181640625, "step": 192700 }, { "epoch": 0.23263888574661487, "learning_rate": 9.26178876497422e-06, "loss": 3.7619973754882814, "step": 192800 }, { "epoch": 0.23275954906909754, "learning_rate": 9.261384929506482e-06, "loss": 3.777813720703125, "step": 192900 }, { "epoch": 0.23288021239158024, "learning_rate": 9.260981094038743e-06, "loss": 3.7624166870117186, "step": 193000 }, { "epoch": 0.23300087571406292, "learning_rate": 9.260577258571005e-06, "loss": 3.783835144042969, "step": 193100 }, { "epoch": 0.2331215390365456, "learning_rate": 9.260173423103267e-06, "loss": 3.7421395874023435, "step": 193200 }, { "epoch": 0.2332422023590283, "learning_rate": 9.259769587635527e-06, "loss": 3.709068603515625, "step": 193300 }, { "epoch": 0.23336286568151096, "learning_rate": 9.259365752167789e-06, "loss": 3.7289178466796873, "step": 193400 }, { "epoch": 0.23348352900399366, "learning_rate": 9.25896191670005e-06, "loss": 3.746418762207031, "step": 193500 }, { "epoch": 0.23360419232647633, "learning_rate": 9.258558081232313e-06, "loss": 3.744023742675781, "step": 193600 }, { "epoch": 0.23372485564895903, "learning_rate": 9.258154245764575e-06, "loss": 3.7015484619140624, "step": 193700 }, { "epoch": 0.2338455189714417, "learning_rate": 9.257750410296837e-06, "loss": 3.74681640625, "step": 193800 }, { "epoch": 0.23396618229392438, "learning_rate": 9.257346574829099e-06, "loss": 3.7518820190429687, "step": 193900 }, { "epoch": 0.23408684561640708, "learning_rate": 9.256942739361359e-06, "loss": 3.73414794921875, "step": 194000 }, { "epoch": 0.23420750893888975, "learning_rate": 9.256538903893621e-06, "loss": 3.717051696777344, "step": 194100 }, { "epoch": 0.23432817226137245, "learning_rate": 9.256135068425881e-06, "loss": 3.7203155517578126, "step": 194200 }, { "epoch": 0.23444883558385513, "learning_rate": 9.255731232958143e-06, "loss": 3.705076904296875, "step": 194300 }, { "epoch": 0.2345694989063378, "learning_rate": 9.255327397490405e-06, "loss": 3.7366397094726564, "step": 194400 }, { "epoch": 0.2346901622288205, "learning_rate": 9.254923562022667e-06, "loss": 3.734712829589844, "step": 194500 }, { "epoch": 0.23481082555130317, "learning_rate": 9.25451972655493e-06, "loss": 3.7418222045898437, "step": 194600 }, { "epoch": 0.23493148887378587, "learning_rate": 9.254115891087191e-06, "loss": 3.7293902587890626, "step": 194700 }, { "epoch": 0.23505215219626854, "learning_rate": 9.253712055619452e-06, "loss": 3.7267974853515624, "step": 194800 }, { "epoch": 0.23517281551875124, "learning_rate": 9.253308220151714e-06, "loss": 3.7221417236328125, "step": 194900 }, { "epoch": 0.23529347884123392, "learning_rate": 9.252904384683975e-06, "loss": 3.7525979614257814, "step": 195000 }, { "epoch": 0.2354141421637166, "learning_rate": 9.252500549216237e-06, "loss": 3.731783752441406, "step": 195100 }, { "epoch": 0.2355348054861993, "learning_rate": 9.252096713748498e-06, "loss": 3.7116549682617186, "step": 195200 }, { "epoch": 0.23565546880868196, "learning_rate": 9.25169287828076e-06, "loss": 3.7166778564453127, "step": 195300 }, { "epoch": 0.23577613213116466, "learning_rate": 9.251289042813022e-06, "loss": 3.7092495727539063, "step": 195400 }, { "epoch": 0.23589679545364733, "learning_rate": 9.250885207345284e-06, "loss": 3.7323504638671876, "step": 195500 }, { "epoch": 0.23601745877613, "learning_rate": 9.250481371877546e-06, "loss": 3.7345516967773436, "step": 195600 }, { "epoch": 0.2361381220986127, "learning_rate": 9.250077536409806e-06, "loss": 3.7101144409179687, "step": 195700 }, { "epoch": 0.23625878542109538, "learning_rate": 9.249673700942068e-06, "loss": 3.735495910644531, "step": 195800 }, { "epoch": 0.23637944874357808, "learning_rate": 9.24926986547433e-06, "loss": 3.755951232910156, "step": 195900 }, { "epoch": 0.23650011206606075, "learning_rate": 9.248866030006592e-06, "loss": 3.7482965087890623, "step": 196000 }, { "epoch": 0.23662077538854345, "learning_rate": 9.248462194538854e-06, "loss": 3.7130587768554686, "step": 196100 }, { "epoch": 0.23674143871102613, "learning_rate": 9.248058359071114e-06, "loss": 3.7413601684570312, "step": 196200 }, { "epoch": 0.2368621020335088, "learning_rate": 9.247654523603376e-06, "loss": 3.7243948364257813, "step": 196300 }, { "epoch": 0.2369827653559915, "learning_rate": 9.247250688135638e-06, "loss": 3.7133111572265625, "step": 196400 }, { "epoch": 0.23710342867847417, "learning_rate": 9.246846852667898e-06, "loss": 3.7211761474609375, "step": 196500 }, { "epoch": 0.23722409200095687, "learning_rate": 9.24644301720016e-06, "loss": 3.7363665771484373, "step": 196600 }, { "epoch": 0.23734475532343954, "learning_rate": 9.246039181732422e-06, "loss": 3.726129150390625, "step": 196700 }, { "epoch": 0.23746541864592222, "learning_rate": 9.245635346264684e-06, "loss": 3.7107388305664064, "step": 196800 }, { "epoch": 0.23758608196840492, "learning_rate": 9.245231510796946e-06, "loss": 3.7372119140625, "step": 196900 }, { "epoch": 0.2377067452908876, "learning_rate": 9.244827675329208e-06, "loss": 3.71290771484375, "step": 197000 }, { "epoch": 0.2378274086133703, "learning_rate": 9.244423839861469e-06, "loss": 3.7061029052734376, "step": 197100 }, { "epoch": 0.23794807193585296, "learning_rate": 9.24402000439373e-06, "loss": 3.7164041137695314, "step": 197200 }, { "epoch": 0.23806873525833566, "learning_rate": 9.243616168925993e-06, "loss": 3.712121887207031, "step": 197300 }, { "epoch": 0.23818939858081833, "learning_rate": 9.243212333458253e-06, "loss": 3.736483154296875, "step": 197400 }, { "epoch": 0.238310061903301, "learning_rate": 9.242808497990515e-06, "loss": 3.722565002441406, "step": 197500 }, { "epoch": 0.2384307252257837, "learning_rate": 9.242404662522777e-06, "loss": 3.7054348754882813, "step": 197600 }, { "epoch": 0.23855138854826638, "learning_rate": 9.242000827055039e-06, "loss": 3.7192474365234376, "step": 197700 }, { "epoch": 0.23867205187074908, "learning_rate": 9.2415969915873e-06, "loss": 3.716965637207031, "step": 197800 }, { "epoch": 0.23879271519323175, "learning_rate": 9.241193156119563e-06, "loss": 3.7091140747070312, "step": 197900 }, { "epoch": 0.23891337851571443, "learning_rate": 9.240789320651825e-06, "loss": 3.6944842529296875, "step": 198000 }, { "epoch": 0.23903404183819713, "learning_rate": 9.240385485184085e-06, "loss": 3.728592529296875, "step": 198100 }, { "epoch": 0.2391547051606798, "learning_rate": 9.239981649716347e-06, "loss": 3.74075439453125, "step": 198200 }, { "epoch": 0.2392753684831625, "learning_rate": 9.239577814248607e-06, "loss": 3.7070867919921877, "step": 198300 }, { "epoch": 0.23939603180564517, "learning_rate": 9.23917397878087e-06, "loss": 3.7243670654296874, "step": 198400 }, { "epoch": 0.23951669512812787, "learning_rate": 9.238770143313131e-06, "loss": 3.74302490234375, "step": 198500 }, { "epoch": 0.23963735845061054, "learning_rate": 9.238366307845393e-06, "loss": 3.7204736328125, "step": 198600 }, { "epoch": 0.23975802177309322, "learning_rate": 9.237962472377655e-06, "loss": 3.72676513671875, "step": 198700 }, { "epoch": 0.23987868509557592, "learning_rate": 9.237558636909917e-06, "loss": 3.714619445800781, "step": 198800 }, { "epoch": 0.2399993484180586, "learning_rate": 9.237154801442178e-06, "loss": 3.722392883300781, "step": 198900 }, { "epoch": 0.2401200117405413, "learning_rate": 9.23675096597444e-06, "loss": 3.7029483032226564, "step": 199000 }, { "epoch": 0.24024067506302396, "learning_rate": 9.236347130506702e-06, "loss": 3.6963409423828124, "step": 199100 }, { "epoch": 0.24036133838550663, "learning_rate": 9.235943295038964e-06, "loss": 3.7217718505859376, "step": 199200 }, { "epoch": 0.24048200170798933, "learning_rate": 9.235539459571224e-06, "loss": 3.7127450561523436, "step": 199300 }, { "epoch": 0.240602665030472, "learning_rate": 9.235135624103486e-06, "loss": 3.7036624145507813, "step": 199400 }, { "epoch": 0.2407233283529547, "learning_rate": 9.234731788635748e-06, "loss": 3.705352478027344, "step": 199500 }, { "epoch": 0.24084399167543738, "learning_rate": 9.23432795316801e-06, "loss": 3.6987686157226562, "step": 199600 }, { "epoch": 0.24096465499792005, "learning_rate": 9.23392411770027e-06, "loss": 3.707328186035156, "step": 199700 }, { "epoch": 0.24108531832040275, "learning_rate": 9.233520282232532e-06, "loss": 3.7200494384765626, "step": 199800 }, { "epoch": 0.24120598164288543, "learning_rate": 9.233116446764794e-06, "loss": 3.69326904296875, "step": 199900 }, { "epoch": 0.24132664496536813, "learning_rate": 9.232712611297056e-06, "loss": 3.7053985595703125, "step": 200000 }, { "epoch": 0.2414473082878508, "learning_rate": 9.232308775829318e-06, "loss": 3.7000717163085937, "step": 200100 }, { "epoch": 0.2415679716103335, "learning_rate": 9.231904940361578e-06, "loss": 3.6976361083984375, "step": 200200 }, { "epoch": 0.24168863493281617, "learning_rate": 9.23150110489384e-06, "loss": 3.673581848144531, "step": 200300 }, { "epoch": 0.24180929825529884, "learning_rate": 9.231097269426102e-06, "loss": 3.7136459350585938, "step": 200400 }, { "epoch": 0.24192996157778154, "learning_rate": 9.230693433958364e-06, "loss": 3.695909423828125, "step": 200500 }, { "epoch": 0.24205062490026422, "learning_rate": 9.230289598490624e-06, "loss": 3.674058532714844, "step": 200600 }, { "epoch": 0.24217128822274692, "learning_rate": 9.229885763022886e-06, "loss": 3.7147845458984374, "step": 200700 }, { "epoch": 0.2422919515452296, "learning_rate": 9.229481927555148e-06, "loss": 3.695434265136719, "step": 200800 }, { "epoch": 0.24241261486771226, "learning_rate": 9.22907809208741e-06, "loss": 3.6836480712890625, "step": 200900 }, { "epoch": 0.24253327819019496, "learning_rate": 9.228674256619672e-06, "loss": 3.6956515502929688, "step": 201000 }, { "epoch": 0.24265394151267763, "learning_rate": 9.228270421151934e-06, "loss": 3.6742889404296877, "step": 201100 }, { "epoch": 0.24277460483516033, "learning_rate": 9.227866585684195e-06, "loss": 3.69082763671875, "step": 201200 }, { "epoch": 0.242895268157643, "learning_rate": 9.227462750216457e-06, "loss": 3.7146572875976562, "step": 201300 }, { "epoch": 0.2430159314801257, "learning_rate": 9.227058914748717e-06, "loss": 3.7032601928710935, "step": 201400 }, { "epoch": 0.24313659480260838, "learning_rate": 9.226655079280979e-06, "loss": 3.695606384277344, "step": 201500 }, { "epoch": 0.24325725812509105, "learning_rate": 9.226251243813241e-06, "loss": 3.710067138671875, "step": 201600 }, { "epoch": 0.24337792144757375, "learning_rate": 9.225847408345503e-06, "loss": 3.6949334716796876, "step": 201700 }, { "epoch": 0.24349858477005643, "learning_rate": 9.225443572877765e-06, "loss": 3.694286193847656, "step": 201800 }, { "epoch": 0.24361924809253913, "learning_rate": 9.225039737410027e-06, "loss": 3.702607421875, "step": 201900 }, { "epoch": 0.2437399114150218, "learning_rate": 9.224635901942289e-06, "loss": 3.700819396972656, "step": 202000 }, { "epoch": 0.24386057473750447, "learning_rate": 9.224232066474549e-06, "loss": 3.7006906127929686, "step": 202100 }, { "epoch": 0.24398123805998717, "learning_rate": 9.223828231006811e-06, "loss": 3.707624816894531, "step": 202200 }, { "epoch": 0.24410190138246984, "learning_rate": 9.223424395539073e-06, "loss": 3.6560491943359374, "step": 202300 }, { "epoch": 0.24422256470495254, "learning_rate": 9.223020560071333e-06, "loss": 3.68814453125, "step": 202400 }, { "epoch": 0.24434322802743522, "learning_rate": 9.222616724603595e-06, "loss": 3.6900540161132813, "step": 202500 }, { "epoch": 0.24446389134991792, "learning_rate": 9.222212889135857e-06, "loss": 3.7148141479492187, "step": 202600 }, { "epoch": 0.2445845546724006, "learning_rate": 9.22180905366812e-06, "loss": 3.6685494995117187, "step": 202700 }, { "epoch": 0.24470521799488326, "learning_rate": 9.221405218200381e-06, "loss": 3.7073245239257813, "step": 202800 }, { "epoch": 0.24482588131736596, "learning_rate": 9.221001382732643e-06, "loss": 3.683519287109375, "step": 202900 }, { "epoch": 0.24494654463984863, "learning_rate": 9.220597547264904e-06, "loss": 3.6927325439453127, "step": 203000 }, { "epoch": 0.24506720796233133, "learning_rate": 9.220193711797166e-06, "loss": 3.6921255493164065, "step": 203100 }, { "epoch": 0.245187871284814, "learning_rate": 9.219789876329428e-06, "loss": 3.674447021484375, "step": 203200 }, { "epoch": 0.24530853460729668, "learning_rate": 9.219386040861688e-06, "loss": 3.699053955078125, "step": 203300 }, { "epoch": 0.24542919792977938, "learning_rate": 9.21898220539395e-06, "loss": 3.6666455078125, "step": 203400 }, { "epoch": 0.24554986125226205, "learning_rate": 9.218578369926212e-06, "loss": 3.687672424316406, "step": 203500 }, { "epoch": 0.24567052457474475, "learning_rate": 9.218174534458474e-06, "loss": 3.6936688232421875, "step": 203600 }, { "epoch": 0.24579118789722743, "learning_rate": 9.217770698990736e-06, "loss": 3.718658447265625, "step": 203700 }, { "epoch": 0.24591185121971013, "learning_rate": 9.217366863522996e-06, "loss": 3.6747882080078127, "step": 203800 }, { "epoch": 0.2460325145421928, "learning_rate": 9.216963028055258e-06, "loss": 3.6771527099609376, "step": 203900 }, { "epoch": 0.24615317786467547, "learning_rate": 9.21655919258752e-06, "loss": 3.701468200683594, "step": 204000 }, { "epoch": 0.24627384118715817, "learning_rate": 9.216155357119782e-06, "loss": 3.661234130859375, "step": 204100 }, { "epoch": 0.24639450450964084, "learning_rate": 9.215751521652044e-06, "loss": 3.68523193359375, "step": 204200 }, { "epoch": 0.24651516783212354, "learning_rate": 9.215347686184304e-06, "loss": 3.6767242431640623, "step": 204300 }, { "epoch": 0.24663583115460622, "learning_rate": 9.214943850716566e-06, "loss": 3.685646667480469, "step": 204400 }, { "epoch": 0.2467564944770889, "learning_rate": 9.214540015248828e-06, "loss": 3.6798504638671874, "step": 204500 }, { "epoch": 0.2468771577995716, "learning_rate": 9.214136179781089e-06, "loss": 3.669855041503906, "step": 204600 }, { "epoch": 0.24699782112205426, "learning_rate": 9.21373234431335e-06, "loss": 3.669905700683594, "step": 204700 }, { "epoch": 0.24711848444453696, "learning_rate": 9.213328508845612e-06, "loss": 3.6896548461914063, "step": 204800 }, { "epoch": 0.24723914776701963, "learning_rate": 9.212924673377874e-06, "loss": 3.68878662109375, "step": 204900 }, { "epoch": 0.24735981108950233, "learning_rate": 9.212520837910136e-06, "loss": 3.6997946166992186, "step": 205000 }, { "epoch": 0.247480474411985, "learning_rate": 9.212117002442398e-06, "loss": 3.6602401733398438, "step": 205100 }, { "epoch": 0.24760113773446768, "learning_rate": 9.211713166974659e-06, "loss": 3.6706509399414062, "step": 205200 }, { "epoch": 0.24772180105695038, "learning_rate": 9.21130933150692e-06, "loss": 3.7057321166992185, "step": 205300 }, { "epoch": 0.24784246437943305, "learning_rate": 9.210905496039183e-06, "loss": 3.6448834228515623, "step": 205400 }, { "epoch": 0.24796312770191575, "learning_rate": 9.210501660571443e-06, "loss": 3.686228942871094, "step": 205500 }, { "epoch": 0.24808379102439843, "learning_rate": 9.210097825103705e-06, "loss": 3.662328186035156, "step": 205600 }, { "epoch": 0.2482044543468811, "learning_rate": 9.209693989635967e-06, "loss": 3.638558044433594, "step": 205700 }, { "epoch": 0.2483251176693638, "learning_rate": 9.209290154168229e-06, "loss": 3.6871527099609374, "step": 205800 }, { "epoch": 0.24844578099184647, "learning_rate": 9.208886318700491e-06, "loss": 3.6697811889648437, "step": 205900 }, { "epoch": 0.24856644431432917, "learning_rate": 9.208482483232753e-06, "loss": 3.6819342041015624, "step": 206000 }, { "epoch": 0.24868710763681184, "learning_rate": 9.208078647765015e-06, "loss": 3.679654846191406, "step": 206100 }, { "epoch": 0.24880777095929452, "learning_rate": 9.207674812297275e-06, "loss": 3.680423583984375, "step": 206200 }, { "epoch": 0.24892843428177722, "learning_rate": 9.207270976829537e-06, "loss": 3.64692138671875, "step": 206300 }, { "epoch": 0.2490490976042599, "learning_rate": 9.206867141361797e-06, "loss": 3.659390869140625, "step": 206400 }, { "epoch": 0.2491697609267426, "learning_rate": 9.20646330589406e-06, "loss": 3.6611419677734376, "step": 206500 }, { "epoch": 0.24929042424922526, "learning_rate": 9.206059470426321e-06, "loss": 3.6673675537109376, "step": 206600 }, { "epoch": 0.24941108757170796, "learning_rate": 9.205655634958583e-06, "loss": 3.6616448974609375, "step": 206700 }, { "epoch": 0.24953175089419063, "learning_rate": 9.205251799490845e-06, "loss": 3.6692333984375, "step": 206800 }, { "epoch": 0.2496524142166733, "learning_rate": 9.204847964023107e-06, "loss": 3.6917459106445314, "step": 206900 }, { "epoch": 0.249773077539156, "learning_rate": 9.20444412855537e-06, "loss": 3.6804791259765626, "step": 207000 }, { "epoch": 0.24989374086163868, "learning_rate": 9.20404029308763e-06, "loss": 3.6656124877929686, "step": 207100 }, { "epoch": 0.25001440418412135, "learning_rate": 9.203636457619892e-06, "loss": 3.690818176269531, "step": 207200 }, { "epoch": 0.2501350675066041, "learning_rate": 9.203232622152154e-06, "loss": 3.6568429565429685, "step": 207300 }, { "epoch": 0.25025573082908675, "learning_rate": 9.202828786684414e-06, "loss": 3.6728955078125, "step": 207400 }, { "epoch": 0.2503763941515694, "learning_rate": 9.202424951216676e-06, "loss": 3.6812142944335937, "step": 207500 }, { "epoch": 0.2504970574740521, "learning_rate": 9.202021115748938e-06, "loss": 3.6532241821289064, "step": 207600 }, { "epoch": 0.25061772079653477, "learning_rate": 9.2016172802812e-06, "loss": 3.6612088012695314, "step": 207700 }, { "epoch": 0.2507383841190175, "learning_rate": 9.201213444813462e-06, "loss": 3.669891662597656, "step": 207800 }, { "epoch": 0.25085904744150017, "learning_rate": 9.200809609345722e-06, "loss": 3.652283935546875, "step": 207900 }, { "epoch": 0.25097971076398284, "learning_rate": 9.200405773877984e-06, "loss": 3.6692623901367187, "step": 208000 }, { "epoch": 0.2511003740864655, "learning_rate": 9.200001938410246e-06, "loss": 3.6599322509765626, "step": 208100 }, { "epoch": 0.2512210374089482, "learning_rate": 9.199598102942508e-06, "loss": 3.6554437255859376, "step": 208200 }, { "epoch": 0.2513417007314309, "learning_rate": 9.19919426747477e-06, "loss": 3.6617669677734375, "step": 208300 }, { "epoch": 0.2514623640539136, "learning_rate": 9.19879043200703e-06, "loss": 3.6685800170898437, "step": 208400 }, { "epoch": 0.25158302737639626, "learning_rate": 9.198386596539292e-06, "loss": 3.6759603881835936, "step": 208500 }, { "epoch": 0.25170369069887893, "learning_rate": 9.197982761071554e-06, "loss": 3.6685281372070313, "step": 208600 }, { "epoch": 0.2518243540213616, "learning_rate": 9.197578925603815e-06, "loss": 3.65275146484375, "step": 208700 }, { "epoch": 0.25194501734384434, "learning_rate": 9.197175090136077e-06, "loss": 3.665533447265625, "step": 208800 }, { "epoch": 0.252065680666327, "learning_rate": 9.196771254668339e-06, "loss": 3.656330871582031, "step": 208900 }, { "epoch": 0.2521863439888097, "learning_rate": 9.1963674192006e-06, "loss": 3.6645635986328124, "step": 209000 }, { "epoch": 0.25230700731129235, "learning_rate": 9.195963583732862e-06, "loss": 3.6672955322265626, "step": 209100 }, { "epoch": 0.252427670633775, "learning_rate": 9.195559748265124e-06, "loss": 3.643277893066406, "step": 209200 }, { "epoch": 0.25254833395625775, "learning_rate": 9.195155912797385e-06, "loss": 3.662528381347656, "step": 209300 }, { "epoch": 0.2526689972787404, "learning_rate": 9.194752077329647e-06, "loss": 3.638275146484375, "step": 209400 }, { "epoch": 0.2527896606012231, "learning_rate": 9.194348241861909e-06, "loss": 3.694941101074219, "step": 209500 }, { "epoch": 0.25291032392370577, "learning_rate": 9.193944406394169e-06, "loss": 3.640216064453125, "step": 209600 }, { "epoch": 0.2530309872461885, "learning_rate": 9.193540570926431e-06, "loss": 3.6376080322265625, "step": 209700 }, { "epoch": 0.25315165056867117, "learning_rate": 9.193136735458693e-06, "loss": 3.655018310546875, "step": 209800 }, { "epoch": 0.25327231389115384, "learning_rate": 9.192732899990955e-06, "loss": 3.6468634033203124, "step": 209900 }, { "epoch": 0.2533929772136365, "learning_rate": 9.192329064523217e-06, "loss": 3.677126159667969, "step": 210000 }, { "epoch": 0.2535136405361192, "learning_rate": 9.191925229055479e-06, "loss": 3.63465087890625, "step": 210100 }, { "epoch": 0.2536343038586019, "learning_rate": 9.191521393587741e-06, "loss": 3.6564712524414062, "step": 210200 }, { "epoch": 0.2537549671810846, "learning_rate": 9.191117558120001e-06, "loss": 3.666081848144531, "step": 210300 }, { "epoch": 0.25387563050356726, "learning_rate": 9.190713722652263e-06, "loss": 3.654061279296875, "step": 210400 }, { "epoch": 0.25399629382604993, "learning_rate": 9.190309887184523e-06, "loss": 3.659622802734375, "step": 210500 }, { "epoch": 0.2541169571485326, "learning_rate": 9.189906051716785e-06, "loss": 3.645521545410156, "step": 210600 }, { "epoch": 0.25423762047101534, "learning_rate": 9.189502216249047e-06, "loss": 3.634986572265625, "step": 210700 }, { "epoch": 0.254358283793498, "learning_rate": 9.18909838078131e-06, "loss": 3.6290347290039064, "step": 210800 }, { "epoch": 0.2544789471159807, "learning_rate": 9.188694545313571e-06, "loss": 3.6444961547851564, "step": 210900 }, { "epoch": 0.25459961043846335, "learning_rate": 9.188290709845833e-06, "loss": 3.62194580078125, "step": 211000 }, { "epoch": 0.254720273760946, "learning_rate": 9.187886874378095e-06, "loss": 3.651019287109375, "step": 211100 }, { "epoch": 0.25484093708342875, "learning_rate": 9.187483038910356e-06, "loss": 3.6369573974609377, "step": 211200 }, { "epoch": 0.2549616004059114, "learning_rate": 9.187079203442618e-06, "loss": 3.64165283203125, "step": 211300 }, { "epoch": 0.2550822637283941, "learning_rate": 9.18667536797488e-06, "loss": 3.655348205566406, "step": 211400 }, { "epoch": 0.25520292705087677, "learning_rate": 9.18627153250714e-06, "loss": 3.6637094116210935, "step": 211500 }, { "epoch": 0.25532359037335944, "learning_rate": 9.185867697039402e-06, "loss": 3.632470703125, "step": 211600 }, { "epoch": 0.25544425369584217, "learning_rate": 9.185463861571664e-06, "loss": 3.6434896850585936, "step": 211700 }, { "epoch": 0.25556491701832484, "learning_rate": 9.185060026103926e-06, "loss": 3.6458233642578124, "step": 211800 }, { "epoch": 0.2556855803408075, "learning_rate": 9.184656190636188e-06, "loss": 3.6436273193359376, "step": 211900 }, { "epoch": 0.2558062436632902, "learning_rate": 9.184252355168448e-06, "loss": 3.647513732910156, "step": 212000 }, { "epoch": 0.25592690698577286, "learning_rate": 9.18384851970071e-06, "loss": 3.6456484985351563, "step": 212100 }, { "epoch": 0.2560475703082556, "learning_rate": 9.183444684232972e-06, "loss": 3.6340908813476562, "step": 212200 }, { "epoch": 0.25616823363073826, "learning_rate": 9.183040848765234e-06, "loss": 3.64902587890625, "step": 212300 }, { "epoch": 0.25628889695322093, "learning_rate": 9.182637013297494e-06, "loss": 3.6336788940429687, "step": 212400 }, { "epoch": 0.2564095602757036, "learning_rate": 9.182233177829756e-06, "loss": 3.6513107299804686, "step": 212500 }, { "epoch": 0.25653022359818634, "learning_rate": 9.181829342362018e-06, "loss": 3.6526837158203125, "step": 212600 }, { "epoch": 0.256650886920669, "learning_rate": 9.18142550689428e-06, "loss": 3.6647525024414063, "step": 212700 }, { "epoch": 0.2567715502431517, "learning_rate": 9.18102167142654e-06, "loss": 3.6526068115234374, "step": 212800 }, { "epoch": 0.25689221356563435, "learning_rate": 9.180617835958803e-06, "loss": 3.6386724853515626, "step": 212900 }, { "epoch": 0.257012876888117, "learning_rate": 9.180214000491065e-06, "loss": 3.6438592529296874, "step": 213000 }, { "epoch": 0.25713354021059975, "learning_rate": 9.179810165023327e-06, "loss": 3.634393615722656, "step": 213100 }, { "epoch": 0.2572542035330824, "learning_rate": 9.179406329555589e-06, "loss": 3.6205813598632814, "step": 213200 }, { "epoch": 0.2573748668555651, "learning_rate": 9.17900249408785e-06, "loss": 3.6506982421875, "step": 213300 }, { "epoch": 0.25749553017804777, "learning_rate": 9.17859865862011e-06, "loss": 3.641763000488281, "step": 213400 }, { "epoch": 0.25761619350053044, "learning_rate": 9.178194823152373e-06, "loss": 3.643809814453125, "step": 213500 }, { "epoch": 0.25773685682301317, "learning_rate": 9.177790987684633e-06, "loss": 3.614754943847656, "step": 213600 }, { "epoch": 0.25785752014549584, "learning_rate": 9.177387152216895e-06, "loss": 3.6188323974609373, "step": 213700 }, { "epoch": 0.2579781834679785, "learning_rate": 9.176983316749157e-06, "loss": 3.6238937377929688, "step": 213800 }, { "epoch": 0.2580988467904612, "learning_rate": 9.176579481281419e-06, "loss": 3.64358642578125, "step": 213900 }, { "epoch": 0.25821951011294386, "learning_rate": 9.176175645813681e-06, "loss": 3.6493756103515627, "step": 214000 }, { "epoch": 0.2583401734354266, "learning_rate": 9.175771810345943e-06, "loss": 3.6419134521484375, "step": 214100 }, { "epoch": 0.25846083675790926, "learning_rate": 9.175367974878205e-06, "loss": 3.6235174560546874, "step": 214200 }, { "epoch": 0.25858150008039194, "learning_rate": 9.174964139410465e-06, "loss": 3.6091348266601564, "step": 214300 }, { "epoch": 0.2587021634028746, "learning_rate": 9.174560303942727e-06, "loss": 3.5955380249023436, "step": 214400 }, { "epoch": 0.2588228267253573, "learning_rate": 9.17415646847499e-06, "loss": 3.6241519165039064, "step": 214500 }, { "epoch": 0.25894349004784, "learning_rate": 9.17375263300725e-06, "loss": 3.62678466796875, "step": 214600 }, { "epoch": 0.2590641533703227, "learning_rate": 9.173348797539511e-06, "loss": 3.608099060058594, "step": 214700 }, { "epoch": 0.25918481669280535, "learning_rate": 9.172944962071773e-06, "loss": 3.628077087402344, "step": 214800 }, { "epoch": 0.259305480015288, "learning_rate": 9.172541126604035e-06, "loss": 3.631988525390625, "step": 214900 }, { "epoch": 0.25942614333777075, "learning_rate": 9.172137291136297e-06, "loss": 3.6361068725585937, "step": 215000 }, { "epoch": 0.2595468066602534, "learning_rate": 9.17173345566856e-06, "loss": 3.6112255859375, "step": 215100 }, { "epoch": 0.2596674699827361, "learning_rate": 9.17132962020082e-06, "loss": 3.6156387329101562, "step": 215200 }, { "epoch": 0.25978813330521877, "learning_rate": 9.170925784733082e-06, "loss": 3.6196099853515626, "step": 215300 }, { "epoch": 0.25990879662770144, "learning_rate": 9.170521949265344e-06, "loss": 3.632629699707031, "step": 215400 }, { "epoch": 0.26002945995018417, "learning_rate": 9.170118113797604e-06, "loss": 3.6325814819335935, "step": 215500 }, { "epoch": 0.26015012327266684, "learning_rate": 9.169714278329866e-06, "loss": 3.651593017578125, "step": 215600 }, { "epoch": 0.2602707865951495, "learning_rate": 9.169310442862128e-06, "loss": 3.63134033203125, "step": 215700 }, { "epoch": 0.2603914499176322, "learning_rate": 9.16890660739439e-06, "loss": 3.6174700927734373, "step": 215800 }, { "epoch": 0.26051211324011486, "learning_rate": 9.168502771926652e-06, "loss": 3.6308102416992187, "step": 215900 }, { "epoch": 0.2606327765625976, "learning_rate": 9.168098936458914e-06, "loss": 3.63929443359375, "step": 216000 }, { "epoch": 0.26075343988508026, "learning_rate": 9.167695100991174e-06, "loss": 3.635963134765625, "step": 216100 }, { "epoch": 0.26087410320756294, "learning_rate": 9.167291265523436e-06, "loss": 3.5966302490234376, "step": 216200 }, { "epoch": 0.2609947665300456, "learning_rate": 9.166887430055698e-06, "loss": 3.617817687988281, "step": 216300 }, { "epoch": 0.2611154298525283, "learning_rate": 9.16648359458796e-06, "loss": 3.591999816894531, "step": 216400 }, { "epoch": 0.261236093175011, "learning_rate": 9.16607975912022e-06, "loss": 3.6028131103515624, "step": 216500 }, { "epoch": 0.2613567564974937, "learning_rate": 9.165675923652482e-06, "loss": 3.6028277587890627, "step": 216600 }, { "epoch": 0.26147741981997635, "learning_rate": 9.165272088184744e-06, "loss": 3.631822204589844, "step": 216700 }, { "epoch": 0.261598083142459, "learning_rate": 9.164868252717006e-06, "loss": 3.6150082397460936, "step": 216800 }, { "epoch": 0.2617187464649417, "learning_rate": 9.164464417249267e-06, "loss": 3.644293212890625, "step": 216900 }, { "epoch": 0.2618394097874244, "learning_rate": 9.164060581781529e-06, "loss": 3.6161553955078123, "step": 217000 }, { "epoch": 0.2619600731099071, "learning_rate": 9.16365674631379e-06, "loss": 3.6294183349609375, "step": 217100 }, { "epoch": 0.26208073643238977, "learning_rate": 9.163252910846053e-06, "loss": 3.5988278198242187, "step": 217200 }, { "epoch": 0.26220139975487244, "learning_rate": 9.162849075378315e-06, "loss": 3.6180953979492188, "step": 217300 }, { "epoch": 0.26232206307735517, "learning_rate": 9.162445239910575e-06, "loss": 3.6175637817382813, "step": 217400 }, { "epoch": 0.26244272639983784, "learning_rate": 9.162041404442837e-06, "loss": 3.625796203613281, "step": 217500 }, { "epoch": 0.2625633897223205, "learning_rate": 9.161637568975099e-06, "loss": 3.6257003784179687, "step": 217600 }, { "epoch": 0.2626840530448032, "learning_rate": 9.161233733507359e-06, "loss": 3.6023458862304687, "step": 217700 }, { "epoch": 0.26280471636728586, "learning_rate": 9.160829898039621e-06, "loss": 3.6290814208984377, "step": 217800 }, { "epoch": 0.2629253796897686, "learning_rate": 9.160426062571883e-06, "loss": 3.65021484375, "step": 217900 }, { "epoch": 0.26304604301225126, "learning_rate": 9.160022227104145e-06, "loss": 3.615780029296875, "step": 218000 }, { "epoch": 0.26316670633473394, "learning_rate": 9.159618391636407e-06, "loss": 3.5862045288085938, "step": 218100 }, { "epoch": 0.2632873696572166, "learning_rate": 9.159214556168669e-06, "loss": 3.6121966552734377, "step": 218200 }, { "epoch": 0.2634080329796993, "learning_rate": 9.158810720700931e-06, "loss": 3.6020855712890625, "step": 218300 }, { "epoch": 0.263528696302182, "learning_rate": 9.158406885233191e-06, "loss": 3.609804992675781, "step": 218400 }, { "epoch": 0.2636493596246647, "learning_rate": 9.158003049765453e-06, "loss": 3.603859558105469, "step": 218500 }, { "epoch": 0.26377002294714735, "learning_rate": 9.157599214297714e-06, "loss": 3.6394342041015624, "step": 218600 }, { "epoch": 0.26389068626963, "learning_rate": 9.157195378829976e-06, "loss": 3.5866665649414062, "step": 218700 }, { "epoch": 0.2640113495921127, "learning_rate": 9.156791543362238e-06, "loss": 3.6207781982421876, "step": 218800 }, { "epoch": 0.2641320129145954, "learning_rate": 9.1563877078945e-06, "loss": 3.6049310302734376, "step": 218900 }, { "epoch": 0.2642526762370781, "learning_rate": 9.155983872426761e-06, "loss": 3.5931475830078123, "step": 219000 }, { "epoch": 0.26437333955956077, "learning_rate": 9.155580036959023e-06, "loss": 3.6016531372070313, "step": 219100 }, { "epoch": 0.26449400288204344, "learning_rate": 9.155176201491285e-06, "loss": 3.5916448974609376, "step": 219200 }, { "epoch": 0.2646146662045261, "learning_rate": 9.154772366023546e-06, "loss": 3.626486511230469, "step": 219300 }, { "epoch": 0.26473532952700884, "learning_rate": 9.154368530555808e-06, "loss": 3.5957351684570313, "step": 219400 }, { "epoch": 0.2648559928494915, "learning_rate": 9.15396469508807e-06, "loss": 3.6146258544921874, "step": 219500 }, { "epoch": 0.2649766561719742, "learning_rate": 9.15356085962033e-06, "loss": 3.587324523925781, "step": 219600 }, { "epoch": 0.26509731949445686, "learning_rate": 9.153157024152592e-06, "loss": 3.622711486816406, "step": 219700 }, { "epoch": 0.26521798281693953, "learning_rate": 9.152753188684854e-06, "loss": 3.609224548339844, "step": 219800 }, { "epoch": 0.26533864613942226, "learning_rate": 9.152349353217116e-06, "loss": 3.61752197265625, "step": 219900 }, { "epoch": 0.26545930946190494, "learning_rate": 9.151945517749378e-06, "loss": 3.6301898193359374, "step": 220000 }, { "epoch": 0.2655799727843876, "learning_rate": 9.151541682281638e-06, "loss": 3.624359436035156, "step": 220100 }, { "epoch": 0.2657006361068703, "learning_rate": 9.1511378468139e-06, "loss": 3.6032644653320314, "step": 220200 }, { "epoch": 0.265821299429353, "learning_rate": 9.150734011346162e-06, "loss": 3.602689208984375, "step": 220300 }, { "epoch": 0.2659419627518357, "learning_rate": 9.150330175878424e-06, "loss": 3.6062646484375, "step": 220400 }, { "epoch": 0.26606262607431835, "learning_rate": 9.149926340410684e-06, "loss": 3.589921569824219, "step": 220500 }, { "epoch": 0.266183289396801, "learning_rate": 9.149522504942946e-06, "loss": 3.6008013916015624, "step": 220600 }, { "epoch": 0.2663039527192837, "learning_rate": 9.149118669475208e-06, "loss": 3.5856967163085938, "step": 220700 }, { "epoch": 0.2664246160417664, "learning_rate": 9.14871483400747e-06, "loss": 3.616685791015625, "step": 220800 }, { "epoch": 0.2665452793642491, "learning_rate": 9.14831099853973e-06, "loss": 3.5684024047851564, "step": 220900 }, { "epoch": 0.26666594268673177, "learning_rate": 9.147907163071993e-06, "loss": 3.6155990600585937, "step": 221000 }, { "epoch": 0.26678660600921444, "learning_rate": 9.147503327604255e-06, "loss": 3.5665682983398437, "step": 221100 }, { "epoch": 0.2669072693316971, "learning_rate": 9.147099492136517e-06, "loss": 3.6033291625976562, "step": 221200 }, { "epoch": 0.26702793265417984, "learning_rate": 9.146695656668779e-06, "loss": 3.583944091796875, "step": 221300 }, { "epoch": 0.2671485959766625, "learning_rate": 9.14629182120104e-06, "loss": 3.6123919677734375, "step": 221400 }, { "epoch": 0.2672692592991452, "learning_rate": 9.145887985733301e-06, "loss": 3.590823059082031, "step": 221500 }, { "epoch": 0.26738992262162786, "learning_rate": 9.145484150265563e-06, "loss": 3.5947357177734376, "step": 221600 }, { "epoch": 0.26751058594411053, "learning_rate": 9.145080314797825e-06, "loss": 3.6045773315429686, "step": 221700 }, { "epoch": 0.26763124926659326, "learning_rate": 9.144676479330085e-06, "loss": 3.6083160400390626, "step": 221800 }, { "epoch": 0.26775191258907594, "learning_rate": 9.144272643862347e-06, "loss": 3.6236557006835937, "step": 221900 }, { "epoch": 0.2678725759115586, "learning_rate": 9.143868808394609e-06, "loss": 3.625653076171875, "step": 222000 }, { "epoch": 0.2679932392340413, "learning_rate": 9.143464972926871e-06, "loss": 3.6005319213867186, "step": 222100 }, { "epoch": 0.26811390255652395, "learning_rate": 9.143061137459133e-06, "loss": 3.6062551879882814, "step": 222200 }, { "epoch": 0.2682345658790067, "learning_rate": 9.142657301991395e-06, "loss": 3.593189697265625, "step": 222300 }, { "epoch": 0.26835522920148935, "learning_rate": 9.142253466523657e-06, "loss": 3.6193814086914062, "step": 222400 }, { "epoch": 0.268475892523972, "learning_rate": 9.141849631055917e-06, "loss": 3.6072567749023436, "step": 222500 }, { "epoch": 0.2685965558464547, "learning_rate": 9.14144579558818e-06, "loss": 3.6080941772460937, "step": 222600 }, { "epoch": 0.2687172191689374, "learning_rate": 9.14104196012044e-06, "loss": 3.5828091430664064, "step": 222700 }, { "epoch": 0.2688378824914201, "learning_rate": 9.140638124652702e-06, "loss": 3.569569396972656, "step": 222800 }, { "epoch": 0.26895854581390277, "learning_rate": 9.140234289184964e-06, "loss": 3.5858114624023436, "step": 222900 }, { "epoch": 0.26907920913638544, "learning_rate": 9.139830453717226e-06, "loss": 3.586725158691406, "step": 223000 }, { "epoch": 0.2691998724588681, "learning_rate": 9.139426618249488e-06, "loss": 3.5938870239257814, "step": 223100 }, { "epoch": 0.26932053578135084, "learning_rate": 9.13902278278175e-06, "loss": 3.5902413940429687, "step": 223200 }, { "epoch": 0.2694411991038335, "learning_rate": 9.138618947314011e-06, "loss": 3.583902587890625, "step": 223300 }, { "epoch": 0.2695618624263162, "learning_rate": 9.138215111846272e-06, "loss": 3.5930902099609376, "step": 223400 }, { "epoch": 0.26968252574879886, "learning_rate": 9.137811276378534e-06, "loss": 3.579262390136719, "step": 223500 }, { "epoch": 0.26980318907128154, "learning_rate": 9.137407440910796e-06, "loss": 3.557735595703125, "step": 223600 }, { "epoch": 0.26992385239376426, "learning_rate": 9.137003605443056e-06, "loss": 3.571603088378906, "step": 223700 }, { "epoch": 0.27004451571624694, "learning_rate": 9.136599769975318e-06, "loss": 3.5692864990234376, "step": 223800 }, { "epoch": 0.2701651790387296, "learning_rate": 9.13619593450758e-06, "loss": 3.5735678100585937, "step": 223900 }, { "epoch": 0.2702858423612123, "learning_rate": 9.135792099039842e-06, "loss": 3.5645697021484377, "step": 224000 }, { "epoch": 0.27040650568369495, "learning_rate": 9.135388263572104e-06, "loss": 3.5668536376953126, "step": 224100 }, { "epoch": 0.2705271690061777, "learning_rate": 9.134984428104364e-06, "loss": 3.590341796875, "step": 224200 }, { "epoch": 0.27064783232866035, "learning_rate": 9.134580592636626e-06, "loss": 3.5697021484375, "step": 224300 }, { "epoch": 0.270768495651143, "learning_rate": 9.134176757168888e-06, "loss": 3.5751992797851564, "step": 224400 }, { "epoch": 0.2708891589736257, "learning_rate": 9.13377292170115e-06, "loss": 3.585551452636719, "step": 224500 }, { "epoch": 0.27100982229610837, "learning_rate": 9.13336908623341e-06, "loss": 3.5663882446289064, "step": 224600 }, { "epoch": 0.2711304856185911, "learning_rate": 9.132965250765672e-06, "loss": 3.5887960815429687, "step": 224700 }, { "epoch": 0.27125114894107377, "learning_rate": 9.132561415297934e-06, "loss": 3.5697503662109376, "step": 224800 }, { "epoch": 0.27137181226355644, "learning_rate": 9.132157579830196e-06, "loss": 3.5834054565429687, "step": 224900 }, { "epoch": 0.2714924755860391, "learning_rate": 9.131753744362457e-06, "loss": 3.592548828125, "step": 225000 }, { "epoch": 0.2716131389085218, "learning_rate": 9.131349908894719e-06, "loss": 3.5807876586914062, "step": 225100 }, { "epoch": 0.2717338022310045, "learning_rate": 9.13094607342698e-06, "loss": 3.57626708984375, "step": 225200 }, { "epoch": 0.2718544655534872, "learning_rate": 9.130542237959243e-06, "loss": 3.6006484985351563, "step": 225300 }, { "epoch": 0.27197512887596986, "learning_rate": 9.130138402491505e-06, "loss": 3.560160827636719, "step": 225400 }, { "epoch": 0.27209579219845254, "learning_rate": 9.129734567023767e-06, "loss": 3.574559326171875, "step": 225500 }, { "epoch": 0.27221645552093526, "learning_rate": 9.129330731556027e-06, "loss": 3.5735488891601563, "step": 225600 }, { "epoch": 0.27233711884341794, "learning_rate": 9.128926896088289e-06, "loss": 3.5712103271484374, "step": 225700 }, { "epoch": 0.2724577821659006, "learning_rate": 9.12852306062055e-06, "loss": 3.5774057006835935, "step": 225800 }, { "epoch": 0.2725784454883833, "learning_rate": 9.128119225152811e-06, "loss": 3.581417236328125, "step": 225900 }, { "epoch": 0.27269910881086595, "learning_rate": 9.127715389685073e-06, "loss": 3.5692376708984375, "step": 226000 }, { "epoch": 0.2728197721333487, "learning_rate": 9.127311554217335e-06, "loss": 3.5908126831054688, "step": 226100 }, { "epoch": 0.27294043545583135, "learning_rate": 9.126907718749597e-06, "loss": 3.5904833984375, "step": 226200 }, { "epoch": 0.273061098778314, "learning_rate": 9.126503883281859e-06, "loss": 3.5807513427734374, "step": 226300 }, { "epoch": 0.2731817621007967, "learning_rate": 9.126100047814121e-06, "loss": 3.540194396972656, "step": 226400 }, { "epoch": 0.27330242542327937, "learning_rate": 9.125696212346381e-06, "loss": 3.5534262084960937, "step": 226500 }, { "epoch": 0.2734230887457621, "learning_rate": 9.125292376878643e-06, "loss": 3.570113220214844, "step": 226600 }, { "epoch": 0.27354375206824477, "learning_rate": 9.124888541410905e-06, "loss": 3.57446533203125, "step": 226700 }, { "epoch": 0.27366441539072744, "learning_rate": 9.124484705943166e-06, "loss": 3.5702655029296877, "step": 226800 }, { "epoch": 0.2737850787132101, "learning_rate": 9.124080870475428e-06, "loss": 3.5850836181640626, "step": 226900 }, { "epoch": 0.2739057420356928, "learning_rate": 9.12367703500769e-06, "loss": 3.5583111572265627, "step": 227000 }, { "epoch": 0.2740264053581755, "learning_rate": 9.123273199539952e-06, "loss": 3.5519818115234374, "step": 227100 }, { "epoch": 0.2741470686806582, "learning_rate": 9.122869364072214e-06, "loss": 3.594349365234375, "step": 227200 }, { "epoch": 0.27426773200314086, "learning_rate": 9.122465528604476e-06, "loss": 3.573846740722656, "step": 227300 }, { "epoch": 0.27438839532562354, "learning_rate": 9.122061693136738e-06, "loss": 3.58361572265625, "step": 227400 }, { "epoch": 0.2745090586481062, "learning_rate": 9.121657857668998e-06, "loss": 3.5692919921875, "step": 227500 }, { "epoch": 0.27462972197058894, "learning_rate": 9.12125402220126e-06, "loss": 3.5698699951171875, "step": 227600 }, { "epoch": 0.2747503852930716, "learning_rate": 9.12085018673352e-06, "loss": 3.5634820556640623, "step": 227700 }, { "epoch": 0.2748710486155543, "learning_rate": 9.120446351265782e-06, "loss": 3.5794137573242186, "step": 227800 }, { "epoch": 0.27499171193803695, "learning_rate": 9.120042515798044e-06, "loss": 3.5800238037109375, "step": 227900 }, { "epoch": 0.2751123752605197, "learning_rate": 9.119638680330306e-06, "loss": 3.561803283691406, "step": 228000 }, { "epoch": 0.27523303858300235, "learning_rate": 9.119234844862568e-06, "loss": 3.55359375, "step": 228100 }, { "epoch": 0.275353701905485, "learning_rate": 9.11883100939483e-06, "loss": 3.5770248413085937, "step": 228200 }, { "epoch": 0.2754743652279677, "learning_rate": 9.11842717392709e-06, "loss": 3.54753662109375, "step": 228300 }, { "epoch": 0.27559502855045037, "learning_rate": 9.118023338459352e-06, "loss": 3.5572323608398437, "step": 228400 }, { "epoch": 0.2757156918729331, "learning_rate": 9.117619502991614e-06, "loss": 3.55868896484375, "step": 228500 }, { "epoch": 0.27583635519541577, "learning_rate": 9.117215667523876e-06, "loss": 3.5834515380859373, "step": 228600 }, { "epoch": 0.27595701851789844, "learning_rate": 9.116811832056137e-06, "loss": 3.5615060424804685, "step": 228700 }, { "epoch": 0.2760776818403811, "learning_rate": 9.116407996588398e-06, "loss": 3.562529296875, "step": 228800 }, { "epoch": 0.2761983451628638, "learning_rate": 9.11600416112066e-06, "loss": 3.5629953002929686, "step": 228900 }, { "epoch": 0.2763190084853465, "learning_rate": 9.115600325652922e-06, "loss": 3.5576663208007813, "step": 229000 }, { "epoch": 0.2764396718078292, "learning_rate": 9.115196490185183e-06, "loss": 3.5684384155273436, "step": 229100 }, { "epoch": 0.27656033513031186, "learning_rate": 9.114792654717445e-06, "loss": 3.542799987792969, "step": 229200 }, { "epoch": 0.27668099845279454, "learning_rate": 9.114388819249707e-06, "loss": 3.544237060546875, "step": 229300 }, { "epoch": 0.2768016617752772, "learning_rate": 9.113984983781969e-06, "loss": 3.5936245727539062, "step": 229400 }, { "epoch": 0.27692232509775994, "learning_rate": 9.11358114831423e-06, "loss": 3.5565670776367186, "step": 229500 }, { "epoch": 0.2770429884202426, "learning_rate": 9.113177312846491e-06, "loss": 3.585528564453125, "step": 229600 }, { "epoch": 0.2771636517427253, "learning_rate": 9.112773477378753e-06, "loss": 3.54026611328125, "step": 229700 }, { "epoch": 0.27728431506520795, "learning_rate": 9.112369641911015e-06, "loss": 3.5612591552734374, "step": 229800 }, { "epoch": 0.2774049783876906, "learning_rate": 9.111965806443275e-06, "loss": 3.54359619140625, "step": 229900 }, { "epoch": 0.27752564171017335, "learning_rate": 9.111561970975537e-06, "loss": 3.5542388916015626, "step": 230000 }, { "epoch": 0.277646305032656, "learning_rate": 9.1111581355078e-06, "loss": 3.5533367919921877, "step": 230100 }, { "epoch": 0.2777669683551387, "learning_rate": 9.110754300040061e-06, "loss": 3.5700363159179687, "step": 230200 }, { "epoch": 0.27788763167762137, "learning_rate": 9.110350464572323e-06, "loss": 3.6037078857421876, "step": 230300 }, { "epoch": 0.2780082950001041, "learning_rate": 9.109946629104585e-06, "loss": 3.5694659423828123, "step": 230400 }, { "epoch": 0.2781289583225868, "learning_rate": 9.109542793636847e-06, "loss": 3.5792169189453125, "step": 230500 }, { "epoch": 0.27824962164506944, "learning_rate": 9.109138958169107e-06, "loss": 3.570884094238281, "step": 230600 }, { "epoch": 0.2783702849675521, "learning_rate": 9.10873512270137e-06, "loss": 3.5491015625, "step": 230700 }, { "epoch": 0.2784909482900348, "learning_rate": 9.10833128723363e-06, "loss": 3.541947937011719, "step": 230800 }, { "epoch": 0.2786116116125175, "learning_rate": 9.107927451765892e-06, "loss": 3.558038635253906, "step": 230900 }, { "epoch": 0.2787322749350002, "learning_rate": 9.107523616298154e-06, "loss": 3.5654672241210936, "step": 231000 }, { "epoch": 0.27885293825748286, "learning_rate": 9.107119780830416e-06, "loss": 3.572138366699219, "step": 231100 }, { "epoch": 0.27897360157996554, "learning_rate": 9.106715945362678e-06, "loss": 3.5210507202148436, "step": 231200 }, { "epoch": 0.2790942649024482, "learning_rate": 9.10631210989494e-06, "loss": 3.54669677734375, "step": 231300 }, { "epoch": 0.27921492822493094, "learning_rate": 9.105908274427202e-06, "loss": 3.5767861938476564, "step": 231400 }, { "epoch": 0.2793355915474136, "learning_rate": 9.105504438959462e-06, "loss": 3.534457092285156, "step": 231500 }, { "epoch": 0.2794562548698963, "learning_rate": 9.105100603491724e-06, "loss": 3.5653506469726564, "step": 231600 }, { "epoch": 0.27957691819237895, "learning_rate": 9.104696768023986e-06, "loss": 3.568785400390625, "step": 231700 }, { "epoch": 0.2796975815148616, "learning_rate": 9.104292932556246e-06, "loss": 3.569420166015625, "step": 231800 }, { "epoch": 0.27981824483734435, "learning_rate": 9.103889097088508e-06, "loss": 3.5457232666015623, "step": 231900 }, { "epoch": 0.279938908159827, "learning_rate": 9.10348526162077e-06, "loss": 3.5601092529296876, "step": 232000 }, { "epoch": 0.2800595714823097, "learning_rate": 9.103081426153032e-06, "loss": 3.5472662353515627, "step": 232100 }, { "epoch": 0.28018023480479237, "learning_rate": 9.102677590685294e-06, "loss": 3.559073486328125, "step": 232200 }, { "epoch": 0.28030089812727504, "learning_rate": 9.102273755217556e-06, "loss": 3.5434954833984373, "step": 232300 }, { "epoch": 0.2804215614497578, "learning_rate": 9.101869919749816e-06, "loss": 3.5494454956054686, "step": 232400 }, { "epoch": 0.28054222477224044, "learning_rate": 9.101466084282078e-06, "loss": 3.5655535888671874, "step": 232500 }, { "epoch": 0.2806628880947231, "learning_rate": 9.10106224881434e-06, "loss": 3.55737060546875, "step": 232600 }, { "epoch": 0.2807835514172058, "learning_rate": 9.1006584133466e-06, "loss": 3.5257229614257812, "step": 232700 }, { "epoch": 0.28090421473968846, "learning_rate": 9.100254577878863e-06, "loss": 3.560521545410156, "step": 232800 }, { "epoch": 0.2810248780621712, "learning_rate": 9.099850742411125e-06, "loss": 3.540338134765625, "step": 232900 }, { "epoch": 0.28114554138465386, "learning_rate": 9.099446906943387e-06, "loss": 3.5388763427734373, "step": 233000 }, { "epoch": 0.28126620470713654, "learning_rate": 9.099043071475648e-06, "loss": 3.5608856201171877, "step": 233100 }, { "epoch": 0.2813868680296192, "learning_rate": 9.098639236007909e-06, "loss": 3.511635437011719, "step": 233200 }, { "epoch": 0.28150753135210194, "learning_rate": 9.09823540054017e-06, "loss": 3.5601321411132814, "step": 233300 }, { "epoch": 0.2816281946745846, "learning_rate": 9.097831565072433e-06, "loss": 3.574920654296875, "step": 233400 }, { "epoch": 0.2817488579970673, "learning_rate": 9.097427729604695e-06, "loss": 3.5440493774414064, "step": 233500 }, { "epoch": 0.28186952131954995, "learning_rate": 9.097023894136957e-06, "loss": 3.51092529296875, "step": 233600 }, { "epoch": 0.2819901846420326, "learning_rate": 9.096620058669217e-06, "loss": 3.562699890136719, "step": 233700 }, { "epoch": 0.28211084796451535, "learning_rate": 9.096216223201479e-06, "loss": 3.5338290405273436, "step": 233800 }, { "epoch": 0.282231511286998, "learning_rate": 9.095812387733741e-06, "loss": 3.523289794921875, "step": 233900 }, { "epoch": 0.2823521746094807, "learning_rate": 9.095408552266001e-06, "loss": 3.556551818847656, "step": 234000 }, { "epoch": 0.28247283793196337, "learning_rate": 9.095004716798263e-06, "loss": 3.524173583984375, "step": 234100 }, { "epoch": 0.28259350125444604, "learning_rate": 9.094600881330525e-06, "loss": 3.546764221191406, "step": 234200 }, { "epoch": 0.2827141645769288, "learning_rate": 9.094197045862787e-06, "loss": 3.547751159667969, "step": 234300 }, { "epoch": 0.28283482789941145, "learning_rate": 9.09379321039505e-06, "loss": 3.5356320190429686, "step": 234400 }, { "epoch": 0.2829554912218941, "learning_rate": 9.093389374927311e-06, "loss": 3.5340701293945314, "step": 234500 }, { "epoch": 0.2830761545443768, "learning_rate": 9.092985539459571e-06, "loss": 3.54810302734375, "step": 234600 }, { "epoch": 0.28319681786685946, "learning_rate": 9.092581703991833e-06, "loss": 3.55381103515625, "step": 234700 }, { "epoch": 0.2833174811893422, "learning_rate": 9.092177868524095e-06, "loss": 3.533924865722656, "step": 234800 }, { "epoch": 0.28343814451182486, "learning_rate": 9.091774033056356e-06, "loss": 3.5165390014648437, "step": 234900 }, { "epoch": 0.28355880783430754, "learning_rate": 9.091370197588618e-06, "loss": 3.5360092163085937, "step": 235000 }, { "epoch": 0.2836794711567902, "learning_rate": 9.09096636212088e-06, "loss": 3.530864562988281, "step": 235100 }, { "epoch": 0.2838001344792729, "learning_rate": 9.090562526653142e-06, "loss": 3.551382751464844, "step": 235200 }, { "epoch": 0.2839207978017556, "learning_rate": 9.090158691185404e-06, "loss": 3.5360488891601562, "step": 235300 }, { "epoch": 0.2840414611242383, "learning_rate": 9.089754855717666e-06, "loss": 3.555943908691406, "step": 235400 }, { "epoch": 0.28416212444672095, "learning_rate": 9.089351020249928e-06, "loss": 3.5365390014648437, "step": 235500 }, { "epoch": 0.2842827877692036, "learning_rate": 9.088947184782188e-06, "loss": 3.5623223876953123, "step": 235600 }, { "epoch": 0.28440345109168635, "learning_rate": 9.08854334931445e-06, "loss": 3.5370941162109375, "step": 235700 }, { "epoch": 0.284524114414169, "learning_rate": 9.08813951384671e-06, "loss": 3.561373291015625, "step": 235800 }, { "epoch": 0.2846447777366517, "learning_rate": 9.087735678378972e-06, "loss": 3.523375244140625, "step": 235900 }, { "epoch": 0.28476544105913437, "learning_rate": 9.087331842911234e-06, "loss": 3.549563293457031, "step": 236000 }, { "epoch": 0.28488610438161704, "learning_rate": 9.086928007443496e-06, "loss": 3.5181460571289063, "step": 236100 }, { "epoch": 0.2850067677040998, "learning_rate": 9.086524171975758e-06, "loss": 3.5442230224609377, "step": 236200 }, { "epoch": 0.28512743102658245, "learning_rate": 9.08612033650802e-06, "loss": 3.5504837036132812, "step": 236300 }, { "epoch": 0.2852480943490651, "learning_rate": 9.08571650104028e-06, "loss": 3.5411907958984377, "step": 236400 }, { "epoch": 0.2853687576715478, "learning_rate": 9.085312665572542e-06, "loss": 3.547847900390625, "step": 236500 }, { "epoch": 0.28548942099403046, "learning_rate": 9.084908830104804e-06, "loss": 3.4919146728515624, "step": 236600 }, { "epoch": 0.2856100843165132, "learning_rate": 9.084504994637066e-06, "loss": 3.54189453125, "step": 236700 }, { "epoch": 0.28573074763899586, "learning_rate": 9.084101159169327e-06, "loss": 3.547510070800781, "step": 236800 }, { "epoch": 0.28585141096147854, "learning_rate": 9.083697323701589e-06, "loss": 3.552120361328125, "step": 236900 }, { "epoch": 0.2859720742839612, "learning_rate": 9.08329348823385e-06, "loss": 3.5490631103515624, "step": 237000 }, { "epoch": 0.2860927376064439, "learning_rate": 9.082889652766113e-06, "loss": 3.5557119750976565, "step": 237100 }, { "epoch": 0.2862134009289266, "learning_rate": 9.082485817298375e-06, "loss": 3.5196078491210936, "step": 237200 }, { "epoch": 0.2863340642514093, "learning_rate": 9.082081981830635e-06, "loss": 3.520566101074219, "step": 237300 }, { "epoch": 0.28645472757389195, "learning_rate": 9.081678146362897e-06, "loss": 3.5224969482421873, "step": 237400 }, { "epoch": 0.2865753908963746, "learning_rate": 9.081274310895159e-06, "loss": 3.5348040771484377, "step": 237500 }, { "epoch": 0.2866960542188573, "learning_rate": 9.08087047542742e-06, "loss": 3.523841552734375, "step": 237600 }, { "epoch": 0.28681671754134, "learning_rate": 9.080466639959683e-06, "loss": 3.539947204589844, "step": 237700 }, { "epoch": 0.2869373808638227, "learning_rate": 9.080062804491943e-06, "loss": 3.528543701171875, "step": 237800 }, { "epoch": 0.28705804418630537, "learning_rate": 9.079658969024205e-06, "loss": 3.5332635498046874, "step": 237900 }, { "epoch": 0.28717870750878804, "learning_rate": 9.079255133556467e-06, "loss": 3.5342922973632813, "step": 238000 }, { "epoch": 0.2872993708312707, "learning_rate": 9.078851298088727e-06, "loss": 3.511679992675781, "step": 238100 }, { "epoch": 0.28742003415375345, "learning_rate": 9.07844746262099e-06, "loss": 3.529948425292969, "step": 238200 }, { "epoch": 0.2875406974762361, "learning_rate": 9.078043627153251e-06, "loss": 3.533457946777344, "step": 238300 }, { "epoch": 0.2876613607987188, "learning_rate": 9.077639791685513e-06, "loss": 3.502527160644531, "step": 238400 }, { "epoch": 0.28778202412120146, "learning_rate": 9.077235956217775e-06, "loss": 3.5142483520507812, "step": 238500 }, { "epoch": 0.2879026874436842, "learning_rate": 9.076832120750037e-06, "loss": 3.549124755859375, "step": 238600 }, { "epoch": 0.28802335076616686, "learning_rate": 9.076428285282297e-06, "loss": 3.5248681640625, "step": 238700 }, { "epoch": 0.28814401408864954, "learning_rate": 9.07602444981456e-06, "loss": 3.5463262939453126, "step": 238800 }, { "epoch": 0.2882646774111322, "learning_rate": 9.075620614346821e-06, "loss": 3.5553033447265623, "step": 238900 }, { "epoch": 0.2883853407336149, "learning_rate": 9.075216778879082e-06, "loss": 3.5349688720703125, "step": 239000 }, { "epoch": 0.2885060040560976, "learning_rate": 9.074812943411344e-06, "loss": 3.5142343139648435, "step": 239100 }, { "epoch": 0.2886266673785803, "learning_rate": 9.074409107943606e-06, "loss": 3.503292236328125, "step": 239200 }, { "epoch": 0.28874733070106295, "learning_rate": 9.074005272475868e-06, "loss": 3.555716247558594, "step": 239300 }, { "epoch": 0.2888679940235456, "learning_rate": 9.07360143700813e-06, "loss": 3.532054748535156, "step": 239400 }, { "epoch": 0.2889886573460283, "learning_rate": 9.073197601540392e-06, "loss": 3.523057556152344, "step": 239500 }, { "epoch": 0.289109320668511, "learning_rate": 9.072793766072654e-06, "loss": 3.517941589355469, "step": 239600 }, { "epoch": 0.2892299839909937, "learning_rate": 9.072389930604914e-06, "loss": 3.51544189453125, "step": 239700 }, { "epoch": 0.2893506473134764, "learning_rate": 9.071986095137176e-06, "loss": 3.5075982666015624, "step": 239800 }, { "epoch": 0.28947131063595904, "learning_rate": 9.071582259669436e-06, "loss": 3.543909912109375, "step": 239900 }, { "epoch": 0.2895919739584417, "learning_rate": 9.071178424201698e-06, "loss": 3.523030090332031, "step": 240000 }, { "epoch": 0.28971263728092445, "learning_rate": 9.07077458873396e-06, "loss": 3.519525451660156, "step": 240100 }, { "epoch": 0.2898333006034071, "learning_rate": 9.070370753266222e-06, "loss": 3.4934246826171873, "step": 240200 }, { "epoch": 0.2899539639258898, "learning_rate": 9.069966917798484e-06, "loss": 3.5160708618164063, "step": 240300 }, { "epoch": 0.29007462724837246, "learning_rate": 9.069563082330746e-06, "loss": 3.4987454223632812, "step": 240400 }, { "epoch": 0.29019529057085514, "learning_rate": 9.069159246863006e-06, "loss": 3.52860595703125, "step": 240500 }, { "epoch": 0.29031595389333786, "learning_rate": 9.068755411395268e-06, "loss": 3.5318927001953124, "step": 240600 }, { "epoch": 0.29043661721582054, "learning_rate": 9.06835157592753e-06, "loss": 3.5177487182617186, "step": 240700 }, { "epoch": 0.2905572805383032, "learning_rate": 9.067947740459792e-06, "loss": 3.516593322753906, "step": 240800 }, { "epoch": 0.2906779438607859, "learning_rate": 9.067543904992053e-06, "loss": 3.533345947265625, "step": 240900 }, { "epoch": 0.2907986071832686, "learning_rate": 9.067140069524315e-06, "loss": 3.52850830078125, "step": 241000 }, { "epoch": 0.2909192705057513, "learning_rate": 9.066736234056577e-06, "loss": 3.49110107421875, "step": 241100 }, { "epoch": 0.29103993382823395, "learning_rate": 9.066332398588839e-06, "loss": 3.52057861328125, "step": 241200 }, { "epoch": 0.2911605971507166, "learning_rate": 9.065928563121099e-06, "loss": 3.5335784912109376, "step": 241300 }, { "epoch": 0.2912812604731993, "learning_rate": 9.065524727653361e-06, "loss": 3.51269287109375, "step": 241400 }, { "epoch": 0.291401923795682, "learning_rate": 9.065120892185623e-06, "loss": 3.5162054443359376, "step": 241500 }, { "epoch": 0.2915225871181647, "learning_rate": 9.064717056717885e-06, "loss": 3.530340270996094, "step": 241600 }, { "epoch": 0.2916432504406474, "learning_rate": 9.064313221250147e-06, "loss": 3.5295834350585937, "step": 241700 }, { "epoch": 0.29176391376313004, "learning_rate": 9.063909385782407e-06, "loss": 3.5167926025390623, "step": 241800 }, { "epoch": 0.2918845770856127, "learning_rate": 9.063505550314669e-06, "loss": 3.51607177734375, "step": 241900 }, { "epoch": 0.29200524040809545, "learning_rate": 9.063101714846931e-06, "loss": 3.4878125, "step": 242000 }, { "epoch": 0.2921259037305781, "learning_rate": 9.062697879379193e-06, "loss": 3.5096075439453127, "step": 242100 }, { "epoch": 0.2922465670530608, "learning_rate": 9.062294043911453e-06, "loss": 3.486436767578125, "step": 242200 }, { "epoch": 0.29236723037554346, "learning_rate": 9.061890208443715e-06, "loss": 3.5291424560546876, "step": 242300 }, { "epoch": 0.29248789369802614, "learning_rate": 9.061486372975977e-06, "loss": 3.5026568603515624, "step": 242400 }, { "epoch": 0.29260855702050886, "learning_rate": 9.06108253750824e-06, "loss": 3.522607727050781, "step": 242500 }, { "epoch": 0.29272922034299154, "learning_rate": 9.060678702040501e-06, "loss": 3.50931640625, "step": 242600 }, { "epoch": 0.2928498836654742, "learning_rate": 9.060274866572763e-06, "loss": 3.530660400390625, "step": 242700 }, { "epoch": 0.2929705469879569, "learning_rate": 9.059871031105024e-06, "loss": 3.5016534423828123, "step": 242800 }, { "epoch": 0.29309121031043955, "learning_rate": 9.059467195637286e-06, "loss": 3.5031503295898436, "step": 242900 }, { "epoch": 0.2932118736329223, "learning_rate": 9.059063360169546e-06, "loss": 3.4879962158203126, "step": 243000 }, { "epoch": 0.29333253695540495, "learning_rate": 9.058659524701808e-06, "loss": 3.487945861816406, "step": 243100 }, { "epoch": 0.2934532002778876, "learning_rate": 9.05825568923407e-06, "loss": 3.4756591796875, "step": 243200 }, { "epoch": 0.2935738636003703, "learning_rate": 9.057851853766332e-06, "loss": 3.479200439453125, "step": 243300 }, { "epoch": 0.293694526922853, "learning_rate": 9.057448018298594e-06, "loss": 3.5223843383789064, "step": 243400 }, { "epoch": 0.2938151902453357, "learning_rate": 9.057044182830856e-06, "loss": 3.508787841796875, "step": 243500 }, { "epoch": 0.2939358535678184, "learning_rate": 9.056640347363118e-06, "loss": 3.522214660644531, "step": 243600 }, { "epoch": 0.29405651689030105, "learning_rate": 9.056236511895378e-06, "loss": 3.505821533203125, "step": 243700 }, { "epoch": 0.2941771802127837, "learning_rate": 9.05583267642764e-06, "loss": 3.524658508300781, "step": 243800 }, { "epoch": 0.29429784353526645, "learning_rate": 9.055428840959902e-06, "loss": 3.4910598754882813, "step": 243900 }, { "epoch": 0.2944185068577491, "learning_rate": 9.055025005492162e-06, "loss": 3.5071173095703125, "step": 244000 }, { "epoch": 0.2945391701802318, "learning_rate": 9.054621170024424e-06, "loss": 3.5092437744140623, "step": 244100 }, { "epoch": 0.29465983350271446, "learning_rate": 9.054217334556686e-06, "loss": 3.504959716796875, "step": 244200 }, { "epoch": 0.29478049682519714, "learning_rate": 9.053813499088948e-06, "loss": 3.512716979980469, "step": 244300 }, { "epoch": 0.29490116014767986, "learning_rate": 9.05340966362121e-06, "loss": 3.5111618041992188, "step": 244400 }, { "epoch": 0.29502182347016254, "learning_rate": 9.053005828153472e-06, "loss": 3.4888232421875, "step": 244500 }, { "epoch": 0.2951424867926452, "learning_rate": 9.052601992685732e-06, "loss": 3.49567138671875, "step": 244600 }, { "epoch": 0.2952631501151279, "learning_rate": 9.052198157217994e-06, "loss": 3.5268939208984373, "step": 244700 }, { "epoch": 0.29538381343761055, "learning_rate": 9.051794321750256e-06, "loss": 3.4814801025390625, "step": 244800 }, { "epoch": 0.2955044767600933, "learning_rate": 9.051390486282517e-06, "loss": 3.5128665161132813, "step": 244900 }, { "epoch": 0.29562514008257595, "learning_rate": 9.050986650814779e-06, "loss": 3.5191455078125, "step": 245000 }, { "epoch": 0.2957458034050586, "learning_rate": 9.05058281534704e-06, "loss": 3.4879742431640626, "step": 245100 }, { "epoch": 0.2958664667275413, "learning_rate": 9.050178979879303e-06, "loss": 3.487076416015625, "step": 245200 }, { "epoch": 0.29598713005002397, "learning_rate": 9.049775144411565e-06, "loss": 3.495189208984375, "step": 245300 }, { "epoch": 0.2961077933725067, "learning_rate": 9.049371308943825e-06, "loss": 3.523011474609375, "step": 245400 }, { "epoch": 0.2962284566949894, "learning_rate": 9.048967473476087e-06, "loss": 3.5369317626953123, "step": 245500 }, { "epoch": 0.29634912001747205, "learning_rate": 9.048563638008349e-06, "loss": 3.493325500488281, "step": 245600 }, { "epoch": 0.2964697833399547, "learning_rate": 9.048159802540611e-06, "loss": 3.4990829467773437, "step": 245700 }, { "epoch": 0.2965904466624374, "learning_rate": 9.047755967072873e-06, "loss": 3.4918212890625, "step": 245800 }, { "epoch": 0.2967111099849201, "learning_rate": 9.047352131605133e-06, "loss": 3.5048931884765624, "step": 245900 }, { "epoch": 0.2968317733074028, "learning_rate": 9.046948296137395e-06, "loss": 3.501866760253906, "step": 246000 }, { "epoch": 0.29695243662988546, "learning_rate": 9.046544460669657e-06, "loss": 3.4870660400390623, "step": 246100 }, { "epoch": 0.29707309995236814, "learning_rate": 9.046140625201917e-06, "loss": 3.496470947265625, "step": 246200 }, { "epoch": 0.29719376327485086, "learning_rate": 9.04573678973418e-06, "loss": 3.4828750610351564, "step": 246300 }, { "epoch": 0.29731442659733354, "learning_rate": 9.045332954266441e-06, "loss": 3.51740966796875, "step": 246400 }, { "epoch": 0.2974350899198162, "learning_rate": 9.044929118798703e-06, "loss": 3.495346984863281, "step": 246500 }, { "epoch": 0.2975557532422989, "learning_rate": 9.044525283330965e-06, "loss": 3.4912945556640627, "step": 246600 }, { "epoch": 0.29767641656478155, "learning_rate": 9.044121447863227e-06, "loss": 3.474295654296875, "step": 246700 }, { "epoch": 0.2977970798872643, "learning_rate": 9.043717612395488e-06, "loss": 3.5308804321289062, "step": 246800 }, { "epoch": 0.29791774320974695, "learning_rate": 9.04331377692775e-06, "loss": 3.511390380859375, "step": 246900 }, { "epoch": 0.2980384065322296, "learning_rate": 9.042909941460012e-06, "loss": 3.5071051025390627, "step": 247000 }, { "epoch": 0.2981590698547123, "learning_rate": 9.042506105992272e-06, "loss": 3.499173583984375, "step": 247100 }, { "epoch": 0.298279733177195, "learning_rate": 9.042102270524534e-06, "loss": 3.4815493774414064, "step": 247200 }, { "epoch": 0.2984003964996777, "learning_rate": 9.041698435056796e-06, "loss": 3.486444091796875, "step": 247300 }, { "epoch": 0.2985210598221604, "learning_rate": 9.041294599589058e-06, "loss": 3.53158447265625, "step": 247400 }, { "epoch": 0.29864172314464305, "learning_rate": 9.04089076412132e-06, "loss": 3.4900189208984376, "step": 247500 }, { "epoch": 0.2987623864671257, "learning_rate": 9.040486928653582e-06, "loss": 3.4843649291992187, "step": 247600 }, { "epoch": 0.2988830497896084, "learning_rate": 9.040083093185844e-06, "loss": 3.5197415161132812, "step": 247700 }, { "epoch": 0.2990037131120911, "learning_rate": 9.039679257718104e-06, "loss": 3.4803619384765625, "step": 247800 }, { "epoch": 0.2991243764345738, "learning_rate": 9.039275422250366e-06, "loss": 3.492481994628906, "step": 247900 }, { "epoch": 0.29924503975705646, "learning_rate": 9.038871586782626e-06, "loss": 3.4937982177734375, "step": 248000 }, { "epoch": 0.29936570307953914, "learning_rate": 9.038467751314888e-06, "loss": 3.4978997802734373, "step": 248100 }, { "epoch": 0.2994863664020218, "learning_rate": 9.03806391584715e-06, "loss": 3.4873727416992186, "step": 248200 }, { "epoch": 0.29960702972450454, "learning_rate": 9.037660080379412e-06, "loss": 3.463453369140625, "step": 248300 }, { "epoch": 0.2997276930469872, "learning_rate": 9.037256244911674e-06, "loss": 3.4962835693359375, "step": 248400 }, { "epoch": 0.2998483563694699, "learning_rate": 9.036852409443936e-06, "loss": 3.4929794311523437, "step": 248500 }, { "epoch": 0.29996901969195255, "learning_rate": 9.036448573976198e-06, "loss": 3.4812042236328127, "step": 248600 }, { "epoch": 0.3000896830144353, "learning_rate": 9.036044738508458e-06, "loss": 3.54179443359375, "step": 248700 }, { "epoch": 0.30021034633691795, "learning_rate": 9.03564090304072e-06, "loss": 3.4588742065429687, "step": 248800 }, { "epoch": 0.3003310096594006, "learning_rate": 9.035237067572982e-06, "loss": 3.4777667236328127, "step": 248900 }, { "epoch": 0.3004516729818833, "learning_rate": 9.034833232105243e-06, "loss": 3.4772689819335936, "step": 249000 }, { "epoch": 0.300572336304366, "learning_rate": 9.034429396637505e-06, "loss": 3.4955755615234376, "step": 249100 }, { "epoch": 0.3006929996268487, "learning_rate": 9.034025561169767e-06, "loss": 3.4750491333007814, "step": 249200 }, { "epoch": 0.3008136629493314, "learning_rate": 9.033621725702029e-06, "loss": 3.4789614868164063, "step": 249300 }, { "epoch": 0.30093432627181405, "learning_rate": 9.03321789023429e-06, "loss": 3.484339294433594, "step": 249400 }, { "epoch": 0.3010549895942967, "learning_rate": 9.032814054766551e-06, "loss": 3.492952880859375, "step": 249500 }, { "epoch": 0.3011756529167794, "learning_rate": 9.032410219298813e-06, "loss": 3.4924002075195313, "step": 249600 }, { "epoch": 0.3012963162392621, "learning_rate": 9.032006383831075e-06, "loss": 3.479683532714844, "step": 249700 }, { "epoch": 0.3014169795617448, "learning_rate": 9.031602548363337e-06, "loss": 3.49135986328125, "step": 249800 }, { "epoch": 0.30153764288422746, "learning_rate": 9.031198712895597e-06, "loss": 3.4717813110351563, "step": 249900 }, { "epoch": 0.30165830620671014, "learning_rate": 9.03079487742786e-06, "loss": 3.507582092285156, "step": 250000 }, { "epoch": 0.3017789695291928, "learning_rate": 9.030391041960121e-06, "loss": 3.4800839233398437, "step": 250100 }, { "epoch": 0.30189963285167554, "learning_rate": 9.029987206492383e-06, "loss": 3.4723468017578125, "step": 250200 }, { "epoch": 0.3020202961741582, "learning_rate": 9.029583371024643e-06, "loss": 3.460505065917969, "step": 250300 }, { "epoch": 0.3021409594966409, "learning_rate": 9.029179535556905e-06, "loss": 3.4752301025390624, "step": 250400 }, { "epoch": 0.30226162281912355, "learning_rate": 9.028775700089167e-06, "loss": 3.4550735473632814, "step": 250500 }, { "epoch": 0.3023822861416062, "learning_rate": 9.02837186462143e-06, "loss": 3.459894714355469, "step": 250600 }, { "epoch": 0.30250294946408895, "learning_rate": 9.027968029153691e-06, "loss": 3.491341552734375, "step": 250700 }, { "epoch": 0.3026236127865716, "learning_rate": 9.027564193685953e-06, "loss": 3.4609600830078127, "step": 250800 }, { "epoch": 0.3027442761090543, "learning_rate": 9.027160358218214e-06, "loss": 3.4603173828125, "step": 250900 }, { "epoch": 0.302864939431537, "learning_rate": 9.026756522750476e-06, "loss": 3.4639407348632814, "step": 251000 }, { "epoch": 0.30298560275401965, "learning_rate": 9.026352687282736e-06, "loss": 3.47100830078125, "step": 251100 }, { "epoch": 0.3031062660765024, "learning_rate": 9.025948851814998e-06, "loss": 3.4888729858398437, "step": 251200 }, { "epoch": 0.30322692939898505, "learning_rate": 9.02554501634726e-06, "loss": 3.490747375488281, "step": 251300 }, { "epoch": 0.3033475927214677, "learning_rate": 9.025141180879522e-06, "loss": 3.4747659301757814, "step": 251400 }, { "epoch": 0.3034682560439504, "learning_rate": 9.024737345411784e-06, "loss": 3.468287353515625, "step": 251500 }, { "epoch": 0.3035889193664331, "learning_rate": 9.024333509944046e-06, "loss": 3.4877108764648437, "step": 251600 }, { "epoch": 0.3037095826889158, "learning_rate": 9.023929674476308e-06, "loss": 3.481889343261719, "step": 251700 }, { "epoch": 0.30383024601139846, "learning_rate": 9.02352583900857e-06, "loss": 3.4864935302734374, "step": 251800 }, { "epoch": 0.30395090933388114, "learning_rate": 9.02312200354083e-06, "loss": 3.4692153930664062, "step": 251900 }, { "epoch": 0.3040715726563638, "learning_rate": 9.022718168073092e-06, "loss": 3.477308349609375, "step": 252000 }, { "epoch": 0.30419223597884654, "learning_rate": 9.022314332605352e-06, "loss": 3.4716461181640623, "step": 252100 }, { "epoch": 0.3043128993013292, "learning_rate": 9.021910497137614e-06, "loss": 3.4954263305664064, "step": 252200 }, { "epoch": 0.3044335626238119, "learning_rate": 9.021506661669876e-06, "loss": 3.446484375, "step": 252300 }, { "epoch": 0.30455422594629455, "learning_rate": 9.021102826202138e-06, "loss": 3.4822540283203125, "step": 252400 }, { "epoch": 0.3046748892687772, "learning_rate": 9.0206989907344e-06, "loss": 3.4629345703125, "step": 252500 }, { "epoch": 0.30479555259125996, "learning_rate": 9.020295155266662e-06, "loss": 3.49714599609375, "step": 252600 }, { "epoch": 0.3049162159137426, "learning_rate": 9.019891319798924e-06, "loss": 3.4701107788085936, "step": 252700 }, { "epoch": 0.3050368792362253, "learning_rate": 9.019487484331185e-06, "loss": 3.4754180908203125, "step": 252800 }, { "epoch": 0.305157542558708, "learning_rate": 9.019083648863446e-06, "loss": 3.4624261474609375, "step": 252900 }, { "epoch": 0.30527820588119065, "learning_rate": 9.018679813395708e-06, "loss": 3.47029296875, "step": 253000 }, { "epoch": 0.3053988692036734, "learning_rate": 9.018275977927969e-06, "loss": 3.449705810546875, "step": 253100 }, { "epoch": 0.30551953252615605, "learning_rate": 9.01787214246023e-06, "loss": 3.4592404174804687, "step": 253200 }, { "epoch": 0.3056401958486387, "learning_rate": 9.017468306992493e-06, "loss": 3.4513589477539064, "step": 253300 }, { "epoch": 0.3057608591711214, "learning_rate": 9.017064471524755e-06, "loss": 3.45432373046875, "step": 253400 }, { "epoch": 0.30588152249360406, "learning_rate": 9.016660636057017e-06, "loss": 3.4828924560546874, "step": 253500 }, { "epoch": 0.3060021858160868, "learning_rate": 9.016256800589277e-06, "loss": 3.487909851074219, "step": 253600 }, { "epoch": 0.30612284913856946, "learning_rate": 9.015852965121539e-06, "loss": 3.48064697265625, "step": 253700 }, { "epoch": 0.30624351246105214, "learning_rate": 9.015449129653801e-06, "loss": 3.459417724609375, "step": 253800 }, { "epoch": 0.3063641757835348, "learning_rate": 9.015045294186063e-06, "loss": 3.430541687011719, "step": 253900 }, { "epoch": 0.30648483910601754, "learning_rate": 9.014641458718323e-06, "loss": 3.4528570556640625, "step": 254000 }, { "epoch": 0.3066055024285002, "learning_rate": 9.014237623250585e-06, "loss": 3.4385220336914064, "step": 254100 }, { "epoch": 0.3067261657509829, "learning_rate": 9.013833787782847e-06, "loss": 3.4766796875, "step": 254200 }, { "epoch": 0.30684682907346555, "learning_rate": 9.01342995231511e-06, "loss": 3.4515109252929688, "step": 254300 }, { "epoch": 0.3069674923959482, "learning_rate": 9.01302611684737e-06, "loss": 3.466062316894531, "step": 254400 }, { "epoch": 0.30708815571843096, "learning_rate": 9.012622281379631e-06, "loss": 3.459525451660156, "step": 254500 }, { "epoch": 0.3072088190409136, "learning_rate": 9.012218445911893e-06, "loss": 3.4751983642578126, "step": 254600 }, { "epoch": 0.3073294823633963, "learning_rate": 9.011814610444155e-06, "loss": 3.4866497802734373, "step": 254700 }, { "epoch": 0.307450145685879, "learning_rate": 9.011410774976417e-06, "loss": 3.47266845703125, "step": 254800 }, { "epoch": 0.30757080900836165, "learning_rate": 9.01100693950868e-06, "loss": 3.452107238769531, "step": 254900 }, { "epoch": 0.3076914723308444, "learning_rate": 9.01060310404094e-06, "loss": 3.4435076904296875, "step": 255000 }, { "epoch": 0.30781213565332705, "learning_rate": 9.010199268573202e-06, "loss": 3.458359375, "step": 255100 }, { "epoch": 0.3079327989758097, "learning_rate": 9.009795433105462e-06, "loss": 3.4515771484375, "step": 255200 }, { "epoch": 0.3080534622982924, "learning_rate": 9.009391597637724e-06, "loss": 3.4601556396484376, "step": 255300 }, { "epoch": 0.30817412562077506, "learning_rate": 9.008987762169986e-06, "loss": 3.4779644775390626, "step": 255400 }, { "epoch": 0.3082947889432578, "learning_rate": 9.008583926702248e-06, "loss": 3.443705749511719, "step": 255500 }, { "epoch": 0.30841545226574046, "learning_rate": 9.00818009123451e-06, "loss": 3.4390463256835937, "step": 255600 }, { "epoch": 0.30853611558822314, "learning_rate": 9.007776255766772e-06, "loss": 3.4790573120117188, "step": 255700 }, { "epoch": 0.3086567789107058, "learning_rate": 9.007372420299034e-06, "loss": 3.4838552856445313, "step": 255800 }, { "epoch": 0.3087774422331885, "learning_rate": 9.006968584831294e-06, "loss": 3.491734619140625, "step": 255900 }, { "epoch": 0.3088981055556712, "learning_rate": 9.006564749363556e-06, "loss": 3.4590802001953125, "step": 256000 }, { "epoch": 0.3090187688781539, "learning_rate": 9.006160913895818e-06, "loss": 3.4694879150390623, "step": 256100 }, { "epoch": 0.30913943220063655, "learning_rate": 9.005757078428078e-06, "loss": 3.476360168457031, "step": 256200 }, { "epoch": 0.3092600955231192, "learning_rate": 9.00535324296034e-06, "loss": 3.4748306274414062, "step": 256300 }, { "epoch": 0.3093807588456019, "learning_rate": 9.004949407492602e-06, "loss": 3.4740774536132815, "step": 256400 }, { "epoch": 0.30950142216808463, "learning_rate": 9.004545572024864e-06, "loss": 3.4562893676757813, "step": 256500 }, { "epoch": 0.3096220854905673, "learning_rate": 9.004141736557126e-06, "loss": 3.4700558471679686, "step": 256600 }, { "epoch": 0.30974274881305, "learning_rate": 9.003737901089388e-06, "loss": 3.483645324707031, "step": 256700 }, { "epoch": 0.30986341213553265, "learning_rate": 9.003334065621649e-06, "loss": 3.4599957275390625, "step": 256800 }, { "epoch": 0.3099840754580154, "learning_rate": 9.00293023015391e-06, "loss": 3.4322518920898437, "step": 256900 }, { "epoch": 0.31010473878049805, "learning_rate": 9.002526394686173e-06, "loss": 3.4546319580078126, "step": 257000 }, { "epoch": 0.3102254021029807, "learning_rate": 9.002122559218433e-06, "loss": 3.4382232666015624, "step": 257100 }, { "epoch": 0.3103460654254634, "learning_rate": 9.001718723750695e-06, "loss": 3.4302105712890625, "step": 257200 }, { "epoch": 0.31046672874794606, "learning_rate": 9.001314888282957e-06, "loss": 3.4439813232421876, "step": 257300 }, { "epoch": 0.3105873920704288, "learning_rate": 9.000911052815219e-06, "loss": 3.4578170776367188, "step": 257400 }, { "epoch": 0.31070805539291146, "learning_rate": 9.00050721734748e-06, "loss": 3.4609609985351564, "step": 257500 }, { "epoch": 0.31082871871539414, "learning_rate": 9.000103381879743e-06, "loss": 3.446241455078125, "step": 257600 }, { "epoch": 0.3109493820378768, "learning_rate": 8.999699546412003e-06, "loss": 3.454146728515625, "step": 257700 }, { "epoch": 0.3110700453603595, "learning_rate": 8.999295710944265e-06, "loss": 3.4278073120117187, "step": 257800 }, { "epoch": 0.3111907086828422, "learning_rate": 8.998891875476527e-06, "loss": 3.448636779785156, "step": 257900 }, { "epoch": 0.3113113720053249, "learning_rate": 8.998488040008789e-06, "loss": 3.4290347290039063, "step": 258000 }, { "epoch": 0.31143203532780755, "learning_rate": 8.99808420454105e-06, "loss": 3.467711181640625, "step": 258100 }, { "epoch": 0.3115526986502902, "learning_rate": 8.997680369073311e-06, "loss": 3.486952209472656, "step": 258200 }, { "epoch": 0.3116733619727729, "learning_rate": 8.997276533605573e-06, "loss": 3.483233642578125, "step": 258300 }, { "epoch": 0.31179402529525563, "learning_rate": 8.996872698137835e-06, "loss": 3.4470220947265626, "step": 258400 }, { "epoch": 0.3119146886177383, "learning_rate": 8.996468862670095e-06, "loss": 3.45255615234375, "step": 258500 }, { "epoch": 0.312035351940221, "learning_rate": 8.996065027202357e-06, "loss": 3.4778948974609376, "step": 258600 }, { "epoch": 0.31215601526270365, "learning_rate": 8.99566119173462e-06, "loss": 3.448267517089844, "step": 258700 }, { "epoch": 0.3122766785851863, "learning_rate": 8.995257356266881e-06, "loss": 3.4616732788085938, "step": 258800 }, { "epoch": 0.31239734190766905, "learning_rate": 8.994853520799143e-06, "loss": 3.4321258544921873, "step": 258900 }, { "epoch": 0.3125180052301517, "learning_rate": 8.994449685331404e-06, "loss": 3.4414938354492186, "step": 259000 }, { "epoch": 0.3126386685526344, "learning_rate": 8.994045849863666e-06, "loss": 3.442357482910156, "step": 259100 }, { "epoch": 0.31275933187511706, "learning_rate": 8.993642014395928e-06, "loss": 3.451965026855469, "step": 259200 }, { "epoch": 0.3128799951975998, "learning_rate": 8.993238178928188e-06, "loss": 3.4376675415039064, "step": 259300 }, { "epoch": 0.31300065852008246, "learning_rate": 8.99283434346045e-06, "loss": 3.4315447998046875, "step": 259400 }, { "epoch": 0.31312132184256514, "learning_rate": 8.992430507992712e-06, "loss": 3.4639126586914064, "step": 259500 }, { "epoch": 0.3132419851650478, "learning_rate": 8.992026672524974e-06, "loss": 3.438892517089844, "step": 259600 }, { "epoch": 0.3133626484875305, "learning_rate": 8.991622837057236e-06, "loss": 3.4461026000976562, "step": 259700 }, { "epoch": 0.3134833118100132, "learning_rate": 8.991219001589498e-06, "loss": 3.430269775390625, "step": 259800 }, { "epoch": 0.3136039751324959, "learning_rate": 8.99081516612176e-06, "loss": 3.4286233520507814, "step": 259900 }, { "epoch": 0.31372463845497855, "learning_rate": 8.99041133065402e-06, "loss": 3.4094638061523437, "step": 260000 }, { "epoch": 0.3138453017774612, "learning_rate": 8.990007495186282e-06, "loss": 3.471685485839844, "step": 260100 }, { "epoch": 0.3139659650999439, "learning_rate": 8.989603659718542e-06, "loss": 3.441114807128906, "step": 260200 }, { "epoch": 0.31408662842242663, "learning_rate": 8.989199824250804e-06, "loss": 3.4295526123046876, "step": 260300 }, { "epoch": 0.3142072917449093, "learning_rate": 8.988795988783066e-06, "loss": 3.449185485839844, "step": 260400 }, { "epoch": 0.314327955067392, "learning_rate": 8.988392153315328e-06, "loss": 3.433816223144531, "step": 260500 }, { "epoch": 0.31444861838987465, "learning_rate": 8.98798831784759e-06, "loss": 3.4271749877929687, "step": 260600 }, { "epoch": 0.3145692817123573, "learning_rate": 8.987584482379852e-06, "loss": 3.426239318847656, "step": 260700 }, { "epoch": 0.31468994503484005, "learning_rate": 8.987180646912114e-06, "loss": 3.441658630371094, "step": 260800 }, { "epoch": 0.3148106083573227, "learning_rate": 8.986776811444375e-06, "loss": 3.446959228515625, "step": 260900 }, { "epoch": 0.3149312716798054, "learning_rate": 8.986372975976637e-06, "loss": 3.4415554809570312, "step": 261000 }, { "epoch": 0.31505193500228806, "learning_rate": 8.985969140508899e-06, "loss": 3.459325866699219, "step": 261100 }, { "epoch": 0.31517259832477074, "learning_rate": 8.985565305041159e-06, "loss": 3.4426275634765626, "step": 261200 }, { "epoch": 0.31529326164725346, "learning_rate": 8.98516146957342e-06, "loss": 3.4380389404296876, "step": 261300 }, { "epoch": 0.31541392496973614, "learning_rate": 8.984757634105683e-06, "loss": 3.4577291870117186, "step": 261400 }, { "epoch": 0.3155345882922188, "learning_rate": 8.984353798637945e-06, "loss": 3.4526336669921873, "step": 261500 }, { "epoch": 0.3156552516147015, "learning_rate": 8.983949963170207e-06, "loss": 3.4343365478515624, "step": 261600 }, { "epoch": 0.3157759149371842, "learning_rate": 8.983546127702467e-06, "loss": 3.4428106689453126, "step": 261700 }, { "epoch": 0.3158965782596669, "learning_rate": 8.983142292234729e-06, "loss": 3.4348904418945314, "step": 261800 }, { "epoch": 0.31601724158214956, "learning_rate": 8.982738456766991e-06, "loss": 3.439107666015625, "step": 261900 }, { "epoch": 0.3161379049046322, "learning_rate": 8.982334621299253e-06, "loss": 3.4811529541015624, "step": 262000 }, { "epoch": 0.3162585682271149, "learning_rate": 8.981930785831513e-06, "loss": 3.425936279296875, "step": 262100 }, { "epoch": 0.31637923154959763, "learning_rate": 8.981526950363775e-06, "loss": 3.4206106567382815, "step": 262200 }, { "epoch": 0.3164998948720803, "learning_rate": 8.981123114896037e-06, "loss": 3.430743408203125, "step": 262300 }, { "epoch": 0.316620558194563, "learning_rate": 8.9807192794283e-06, "loss": 3.445758972167969, "step": 262400 }, { "epoch": 0.31674122151704565, "learning_rate": 8.980315443960561e-06, "loss": 3.429609375, "step": 262500 }, { "epoch": 0.3168618848395283, "learning_rate": 8.979911608492822e-06, "loss": 3.4421597290039063, "step": 262600 }, { "epoch": 0.31698254816201105, "learning_rate": 8.979507773025083e-06, "loss": 3.43178466796875, "step": 262700 }, { "epoch": 0.3171032114844937, "learning_rate": 8.979103937557345e-06, "loss": 3.4656103515625, "step": 262800 }, { "epoch": 0.3172238748069764, "learning_rate": 8.978700102089607e-06, "loss": 3.4023223876953126, "step": 262900 }, { "epoch": 0.31734453812945906, "learning_rate": 8.97829626662187e-06, "loss": 3.416497802734375, "step": 263000 }, { "epoch": 0.31746520145194174, "learning_rate": 8.97789243115413e-06, "loss": 3.4252813720703124, "step": 263100 }, { "epoch": 0.31758586477442446, "learning_rate": 8.977488595686392e-06, "loss": 3.4430691528320314, "step": 263200 }, { "epoch": 0.31770652809690714, "learning_rate": 8.977084760218654e-06, "loss": 3.426926574707031, "step": 263300 }, { "epoch": 0.3178271914193898, "learning_rate": 8.976680924750914e-06, "loss": 3.4162826538085938, "step": 263400 }, { "epoch": 0.3179478547418725, "learning_rate": 8.976277089283176e-06, "loss": 3.4495684814453127, "step": 263500 }, { "epoch": 0.31806851806435515, "learning_rate": 8.975873253815438e-06, "loss": 3.443098449707031, "step": 263600 }, { "epoch": 0.3181891813868379, "learning_rate": 8.9754694183477e-06, "loss": 3.4121856689453125, "step": 263700 }, { "epoch": 0.31830984470932056, "learning_rate": 8.975065582879962e-06, "loss": 3.4222564697265625, "step": 263800 }, { "epoch": 0.3184305080318032, "learning_rate": 8.974661747412224e-06, "loss": 3.457413635253906, "step": 263900 }, { "epoch": 0.3185511713542859, "learning_rate": 8.974257911944486e-06, "loss": 3.4241983032226564, "step": 264000 }, { "epoch": 0.3186718346767686, "learning_rate": 8.973854076476746e-06, "loss": 3.471674499511719, "step": 264100 }, { "epoch": 0.3187924979992513, "learning_rate": 8.973450241009008e-06, "loss": 3.458307800292969, "step": 264200 }, { "epoch": 0.318913161321734, "learning_rate": 8.973046405541268e-06, "loss": 3.4418869018554688, "step": 264300 }, { "epoch": 0.31903382464421665, "learning_rate": 8.97264257007353e-06, "loss": 3.424395751953125, "step": 264400 }, { "epoch": 0.3191544879666993, "learning_rate": 8.972238734605792e-06, "loss": 3.43928955078125, "step": 264500 }, { "epoch": 0.31927515128918205, "learning_rate": 8.971834899138054e-06, "loss": 3.4374850463867186, "step": 264600 }, { "epoch": 0.3193958146116647, "learning_rate": 8.971431063670316e-06, "loss": 3.413984375, "step": 264700 }, { "epoch": 0.3195164779341474, "learning_rate": 8.971027228202578e-06, "loss": 3.422423095703125, "step": 264800 }, { "epoch": 0.31963714125663006, "learning_rate": 8.97062339273484e-06, "loss": 3.4129583740234377, "step": 264900 }, { "epoch": 0.31975780457911274, "learning_rate": 8.9702195572671e-06, "loss": 3.4327459716796875, "step": 265000 }, { "epoch": 0.31987846790159546, "learning_rate": 8.969815721799363e-06, "loss": 3.452320251464844, "step": 265100 }, { "epoch": 0.31999913122407814, "learning_rate": 8.969411886331625e-06, "loss": 3.4316326904296877, "step": 265200 }, { "epoch": 0.3201197945465608, "learning_rate": 8.969008050863885e-06, "loss": 3.422105407714844, "step": 265300 }, { "epoch": 0.3202404578690435, "learning_rate": 8.968604215396147e-06, "loss": 3.448186340332031, "step": 265400 }, { "epoch": 0.32036112119152615, "learning_rate": 8.968200379928409e-06, "loss": 3.4348150634765626, "step": 265500 }, { "epoch": 0.3204817845140089, "learning_rate": 8.96779654446067e-06, "loss": 3.4232470703125, "step": 265600 }, { "epoch": 0.32060244783649156, "learning_rate": 8.967392708992933e-06, "loss": 3.420945739746094, "step": 265700 }, { "epoch": 0.32072311115897423, "learning_rate": 8.966988873525193e-06, "loss": 3.418802490234375, "step": 265800 }, { "epoch": 0.3208437744814569, "learning_rate": 8.966585038057455e-06, "loss": 3.4635491943359376, "step": 265900 }, { "epoch": 0.3209644378039396, "learning_rate": 8.966181202589717e-06, "loss": 3.439429931640625, "step": 266000 }, { "epoch": 0.3210851011264223, "learning_rate": 8.965777367121979e-06, "loss": 3.417015380859375, "step": 266100 }, { "epoch": 0.321205764448905, "learning_rate": 8.96537353165424e-06, "loss": 3.4199600219726562, "step": 266200 }, { "epoch": 0.32132642777138765, "learning_rate": 8.964969696186501e-06, "loss": 3.389524230957031, "step": 266300 }, { "epoch": 0.3214470910938703, "learning_rate": 8.964565860718763e-06, "loss": 3.4148764038085937, "step": 266400 }, { "epoch": 0.321567754416353, "learning_rate": 8.964162025251025e-06, "loss": 3.430206298828125, "step": 266500 }, { "epoch": 0.3216884177388357, "learning_rate": 8.963758189783286e-06, "loss": 3.4072830200195314, "step": 266600 }, { "epoch": 0.3218090810613184, "learning_rate": 8.963354354315548e-06, "loss": 3.4197808837890626, "step": 266700 }, { "epoch": 0.32192974438380106, "learning_rate": 8.96295051884781e-06, "loss": 3.4132696533203126, "step": 266800 }, { "epoch": 0.32205040770628374, "learning_rate": 8.962546683380072e-06, "loss": 3.3937384033203126, "step": 266900 }, { "epoch": 0.32217107102876646, "learning_rate": 8.962142847912333e-06, "loss": 3.4091748046875, "step": 267000 }, { "epoch": 0.32229173435124914, "learning_rate": 8.961739012444595e-06, "loss": 3.4112197875976564, "step": 267100 }, { "epoch": 0.3224123976737318, "learning_rate": 8.961335176976856e-06, "loss": 3.434464111328125, "step": 267200 }, { "epoch": 0.3225330609962145, "learning_rate": 8.960931341509118e-06, "loss": 3.4558660888671877, "step": 267300 }, { "epoch": 0.32265372431869715, "learning_rate": 8.960527506041378e-06, "loss": 3.422171936035156, "step": 267400 }, { "epoch": 0.3227743876411799, "learning_rate": 8.96012367057364e-06, "loss": 3.4338082885742187, "step": 267500 }, { "epoch": 0.32289505096366256, "learning_rate": 8.959719835105902e-06, "loss": 3.4131838989257814, "step": 267600 }, { "epoch": 0.32301571428614523, "learning_rate": 8.959315999638164e-06, "loss": 3.405376281738281, "step": 267700 }, { "epoch": 0.3231363776086279, "learning_rate": 8.958912164170426e-06, "loss": 3.41404541015625, "step": 267800 }, { "epoch": 0.3232570409311106, "learning_rate": 8.958508328702688e-06, "loss": 3.4180859375, "step": 267900 }, { "epoch": 0.3233777042535933, "learning_rate": 8.95810449323495e-06, "loss": 3.4190237426757815, "step": 268000 }, { "epoch": 0.323498367576076, "learning_rate": 8.95770065776721e-06, "loss": 3.431121826171875, "step": 268100 }, { "epoch": 0.32361903089855865, "learning_rate": 8.957296822299472e-06, "loss": 3.3913348388671873, "step": 268200 }, { "epoch": 0.3237396942210413, "learning_rate": 8.956892986831734e-06, "loss": 3.414170837402344, "step": 268300 }, { "epoch": 0.323860357543524, "learning_rate": 8.956489151363994e-06, "loss": 3.4269586181640626, "step": 268400 }, { "epoch": 0.3239810208660067, "learning_rate": 8.956085315896256e-06, "loss": 3.4055206298828127, "step": 268500 }, { "epoch": 0.3241016841884894, "learning_rate": 8.955681480428518e-06, "loss": 3.427828674316406, "step": 268600 }, { "epoch": 0.32422234751097206, "learning_rate": 8.95527764496078e-06, "loss": 3.4393997192382812, "step": 268700 }, { "epoch": 0.32434301083345474, "learning_rate": 8.954873809493042e-06, "loss": 3.4129901123046875, "step": 268800 }, { "epoch": 0.3244636741559374, "learning_rate": 8.954469974025304e-06, "loss": 3.407271423339844, "step": 268900 }, { "epoch": 0.32458433747842014, "learning_rate": 8.954066138557566e-06, "loss": 3.4225839233398436, "step": 269000 }, { "epoch": 0.3247050008009028, "learning_rate": 8.953662303089827e-06, "loss": 3.4220285034179687, "step": 269100 }, { "epoch": 0.3248256641233855, "learning_rate": 8.953258467622089e-06, "loss": 3.430135498046875, "step": 269200 }, { "epoch": 0.32494632744586815, "learning_rate": 8.952854632154349e-06, "loss": 3.402149963378906, "step": 269300 }, { "epoch": 0.3250669907683508, "learning_rate": 8.952450796686611e-06, "loss": 3.4288433837890624, "step": 269400 }, { "epoch": 0.32518765409083356, "learning_rate": 8.952046961218873e-06, "loss": 3.3944317626953127, "step": 269500 }, { "epoch": 0.32530831741331623, "learning_rate": 8.951643125751135e-06, "loss": 3.42071044921875, "step": 269600 }, { "epoch": 0.3254289807357989, "learning_rate": 8.951239290283397e-06, "loss": 3.4072747802734376, "step": 269700 }, { "epoch": 0.3255496440582816, "learning_rate": 8.950835454815659e-06, "loss": 3.4286843872070314, "step": 269800 }, { "epoch": 0.3256703073807643, "learning_rate": 8.950431619347919e-06, "loss": 3.4127377319335936, "step": 269900 }, { "epoch": 0.325790970703247, "learning_rate": 8.950027783880181e-06, "loss": 3.410301513671875, "step": 270000 }, { "epoch": 0.32591163402572965, "learning_rate": 8.949623948412443e-06, "loss": 3.4120755004882812, "step": 270100 }, { "epoch": 0.3260322973482123, "learning_rate": 8.949220112944705e-06, "loss": 3.4109710693359374, "step": 270200 }, { "epoch": 0.326152960670695, "learning_rate": 8.948816277476965e-06, "loss": 3.431054992675781, "step": 270300 }, { "epoch": 0.3262736239931777, "learning_rate": 8.948412442009227e-06, "loss": 3.435937805175781, "step": 270400 }, { "epoch": 0.3263942873156604, "learning_rate": 8.94800860654149e-06, "loss": 3.4051300048828126, "step": 270500 }, { "epoch": 0.32651495063814306, "learning_rate": 8.947604771073751e-06, "loss": 3.402293395996094, "step": 270600 }, { "epoch": 0.32663561396062574, "learning_rate": 8.947200935606012e-06, "loss": 3.4104534912109377, "step": 270700 }, { "epoch": 0.3267562772831084, "learning_rate": 8.946797100138274e-06, "loss": 3.450542297363281, "step": 270800 }, { "epoch": 0.32687694060559114, "learning_rate": 8.946393264670536e-06, "loss": 3.404408264160156, "step": 270900 }, { "epoch": 0.3269976039280738, "learning_rate": 8.945989429202798e-06, "loss": 3.3864266967773435, "step": 271000 }, { "epoch": 0.3271182672505565, "learning_rate": 8.94558559373506e-06, "loss": 3.438731384277344, "step": 271100 }, { "epoch": 0.32723893057303916, "learning_rate": 8.94518175826732e-06, "loss": 3.3691412353515626, "step": 271200 }, { "epoch": 0.3273595938955218, "learning_rate": 8.944777922799582e-06, "loss": 3.418052978515625, "step": 271300 }, { "epoch": 0.32748025721800456, "learning_rate": 8.944374087331844e-06, "loss": 3.402443542480469, "step": 271400 }, { "epoch": 0.32760092054048723, "learning_rate": 8.943970251864104e-06, "loss": 3.4133282470703126, "step": 271500 }, { "epoch": 0.3277215838629699, "learning_rate": 8.943566416396366e-06, "loss": 3.4210699462890624, "step": 271600 }, { "epoch": 0.3278422471854526, "learning_rate": 8.943162580928628e-06, "loss": 3.394195556640625, "step": 271700 }, { "epoch": 0.32796291050793525, "learning_rate": 8.94275874546089e-06, "loss": 3.3984625244140627, "step": 271800 }, { "epoch": 0.328083573830418, "learning_rate": 8.942354909993152e-06, "loss": 3.4185125732421877, "step": 271900 }, { "epoch": 0.32820423715290065, "learning_rate": 8.941951074525414e-06, "loss": 3.3967440795898436, "step": 272000 }, { "epoch": 0.3283249004753833, "learning_rate": 8.941547239057676e-06, "loss": 3.404901123046875, "step": 272100 }, { "epoch": 0.328445563797866, "learning_rate": 8.941143403589936e-06, "loss": 3.434716796875, "step": 272200 }, { "epoch": 0.3285662271203487, "learning_rate": 8.940739568122198e-06, "loss": 3.386178283691406, "step": 272300 }, { "epoch": 0.3286868904428314, "learning_rate": 8.940335732654459e-06, "loss": 3.3972821044921875, "step": 272400 }, { "epoch": 0.32880755376531406, "learning_rate": 8.93993189718672e-06, "loss": 3.3879278564453124, "step": 272500 }, { "epoch": 0.32892821708779674, "learning_rate": 8.939528061718982e-06, "loss": 3.4064971923828127, "step": 272600 }, { "epoch": 0.3290488804102794, "learning_rate": 8.939124226251244e-06, "loss": 3.384049987792969, "step": 272700 }, { "epoch": 0.32916954373276214, "learning_rate": 8.938720390783506e-06, "loss": 3.4083456420898437, "step": 272800 }, { "epoch": 0.3292902070552448, "learning_rate": 8.938316555315768e-06, "loss": 3.392106018066406, "step": 272900 }, { "epoch": 0.3294108703777275, "learning_rate": 8.93791271984803e-06, "loss": 3.3937637329101564, "step": 273000 }, { "epoch": 0.32953153370021016, "learning_rate": 8.93750888438029e-06, "loss": 3.4171212768554686, "step": 273100 }, { "epoch": 0.3296521970226928, "learning_rate": 8.937105048912553e-06, "loss": 3.382413635253906, "step": 273200 }, { "epoch": 0.32977286034517556, "learning_rate": 8.936701213444815e-06, "loss": 3.412478332519531, "step": 273300 }, { "epoch": 0.32989352366765823, "learning_rate": 8.936297377977075e-06, "loss": 3.3814852905273436, "step": 273400 }, { "epoch": 0.3300141869901409, "learning_rate": 8.935893542509337e-06, "loss": 3.3921054077148436, "step": 273500 }, { "epoch": 0.3301348503126236, "learning_rate": 8.935489707041599e-06, "loss": 3.406640625, "step": 273600 }, { "epoch": 0.33025551363510625, "learning_rate": 8.935085871573861e-06, "loss": 3.408719177246094, "step": 273700 }, { "epoch": 0.330376176957589, "learning_rate": 8.934682036106123e-06, "loss": 3.3929583740234377, "step": 273800 }, { "epoch": 0.33049684028007165, "learning_rate": 8.934278200638385e-06, "loss": 3.3913949584960936, "step": 273900 }, { "epoch": 0.3306175036025543, "learning_rate": 8.933874365170645e-06, "loss": 3.404845886230469, "step": 274000 }, { "epoch": 0.330738166925037, "learning_rate": 8.933470529702907e-06, "loss": 3.4157815551757813, "step": 274100 }, { "epoch": 0.33085883024751966, "learning_rate": 8.933066694235169e-06, "loss": 3.4067898559570313, "step": 274200 }, { "epoch": 0.3309794935700024, "learning_rate": 8.93266285876743e-06, "loss": 3.3764547729492187, "step": 274300 }, { "epoch": 0.33110015689248506, "learning_rate": 8.932259023299691e-06, "loss": 3.409166259765625, "step": 274400 }, { "epoch": 0.33122082021496774, "learning_rate": 8.931855187831953e-06, "loss": 3.3862844848632814, "step": 274500 }, { "epoch": 0.3313414835374504, "learning_rate": 8.931451352364215e-06, "loss": 3.386566467285156, "step": 274600 }, { "epoch": 0.33146214685993314, "learning_rate": 8.931047516896477e-06, "loss": 3.3982144165039063, "step": 274700 }, { "epoch": 0.3315828101824158, "learning_rate": 8.930643681428738e-06, "loss": 3.400815124511719, "step": 274800 }, { "epoch": 0.3317034735048985, "learning_rate": 8.930239845961e-06, "loss": 3.4145538330078127, "step": 274900 }, { "epoch": 0.33182413682738116, "learning_rate": 8.929836010493262e-06, "loss": 3.4297802734375, "step": 275000 }, { "epoch": 0.33194480014986383, "learning_rate": 8.929432175025524e-06, "loss": 3.41453857421875, "step": 275100 }, { "epoch": 0.33206546347234656, "learning_rate": 8.929028339557786e-06, "loss": 3.4054510498046877, "step": 275200 }, { "epoch": 0.33218612679482923, "learning_rate": 8.928624504090046e-06, "loss": 3.40883056640625, "step": 275300 }, { "epoch": 0.3323067901173119, "learning_rate": 8.928220668622308e-06, "loss": 3.395893859863281, "step": 275400 }, { "epoch": 0.3324274534397946, "learning_rate": 8.92781683315457e-06, "loss": 3.373174133300781, "step": 275500 }, { "epoch": 0.33254811676227725, "learning_rate": 8.92741299768683e-06, "loss": 3.391562194824219, "step": 275600 }, { "epoch": 0.33266878008476, "learning_rate": 8.927009162219092e-06, "loss": 3.4045245361328127, "step": 275700 }, { "epoch": 0.33278944340724265, "learning_rate": 8.926605326751354e-06, "loss": 3.406170654296875, "step": 275800 }, { "epoch": 0.3329101067297253, "learning_rate": 8.926201491283616e-06, "loss": 3.4026727294921875, "step": 275900 }, { "epoch": 0.333030770052208, "learning_rate": 8.925797655815878e-06, "loss": 3.394820556640625, "step": 276000 }, { "epoch": 0.33315143337469066, "learning_rate": 8.92539382034814e-06, "loss": 3.3794119262695315, "step": 276100 }, { "epoch": 0.3332720966971734, "learning_rate": 8.9249899848804e-06, "loss": 3.368946228027344, "step": 276200 }, { "epoch": 0.33339276001965606, "learning_rate": 8.924586149412662e-06, "loss": 3.4138827514648438, "step": 276300 }, { "epoch": 0.33351342334213874, "learning_rate": 8.924182313944924e-06, "loss": 3.3815133666992185, "step": 276400 }, { "epoch": 0.3336340866646214, "learning_rate": 8.923778478477185e-06, "loss": 3.359302673339844, "step": 276500 }, { "epoch": 0.3337547499871041, "learning_rate": 8.923374643009447e-06, "loss": 3.376070251464844, "step": 276600 }, { "epoch": 0.3338754133095868, "learning_rate": 8.922970807541709e-06, "loss": 3.35724853515625, "step": 276700 }, { "epoch": 0.3339960766320695, "learning_rate": 8.92256697207397e-06, "loss": 3.362991943359375, "step": 276800 }, { "epoch": 0.33411673995455216, "learning_rate": 8.922163136606232e-06, "loss": 3.383186950683594, "step": 276900 }, { "epoch": 0.33423740327703483, "learning_rate": 8.921759301138494e-06, "loss": 3.3990017700195314, "step": 277000 }, { "epoch": 0.3343580665995175, "learning_rate": 8.921355465670756e-06, "loss": 3.3729241943359374, "step": 277100 }, { "epoch": 0.33447872992200023, "learning_rate": 8.920951630203017e-06, "loss": 3.3886309814453126, "step": 277200 }, { "epoch": 0.3345993932444829, "learning_rate": 8.920547794735279e-06, "loss": 3.3883697509765627, "step": 277300 }, { "epoch": 0.3347200565669656, "learning_rate": 8.920143959267539e-06, "loss": 3.39986083984375, "step": 277400 }, { "epoch": 0.33484071988944825, "learning_rate": 8.919740123799801e-06, "loss": 3.388621826171875, "step": 277500 }, { "epoch": 0.334961383211931, "learning_rate": 8.919336288332063e-06, "loss": 3.39012451171875, "step": 277600 }, { "epoch": 0.33508204653441365, "learning_rate": 8.918932452864325e-06, "loss": 3.415402526855469, "step": 277700 }, { "epoch": 0.3352027098568963, "learning_rate": 8.918528617396587e-06, "loss": 3.3778555297851565, "step": 277800 }, { "epoch": 0.335323373179379, "learning_rate": 8.918124781928849e-06, "loss": 3.38413818359375, "step": 277900 }, { "epoch": 0.33544403650186166, "learning_rate": 8.917720946461111e-06, "loss": 3.4044259643554686, "step": 278000 }, { "epoch": 0.3355646998243444, "learning_rate": 8.917317110993371e-06, "loss": 3.384930419921875, "step": 278100 }, { "epoch": 0.33568536314682706, "learning_rate": 8.916913275525633e-06, "loss": 3.389382629394531, "step": 278200 }, { "epoch": 0.33580602646930974, "learning_rate": 8.916509440057895e-06, "loss": 3.363320617675781, "step": 278300 }, { "epoch": 0.3359266897917924, "learning_rate": 8.916105604590155e-06, "loss": 3.376626281738281, "step": 278400 }, { "epoch": 0.3360473531142751, "learning_rate": 8.915701769122417e-06, "loss": 3.387845153808594, "step": 278500 }, { "epoch": 0.3361680164367578, "learning_rate": 8.91529793365468e-06, "loss": 3.382444152832031, "step": 278600 }, { "epoch": 0.3362886797592405, "learning_rate": 8.914894098186941e-06, "loss": 3.3610235595703126, "step": 278700 }, { "epoch": 0.33640934308172316, "learning_rate": 8.914490262719203e-06, "loss": 3.3461782836914065, "step": 278800 }, { "epoch": 0.33653000640420583, "learning_rate": 8.914086427251464e-06, "loss": 3.344154968261719, "step": 278900 }, { "epoch": 0.3366506697266885, "learning_rate": 8.913682591783726e-06, "loss": 3.3894277954101564, "step": 279000 }, { "epoch": 0.33677133304917123, "learning_rate": 8.913278756315988e-06, "loss": 3.3843310546875, "step": 279100 }, { "epoch": 0.3368919963716539, "learning_rate": 8.91287492084825e-06, "loss": 3.392698059082031, "step": 279200 }, { "epoch": 0.3370126596941366, "learning_rate": 8.912471085380512e-06, "loss": 3.420693054199219, "step": 279300 }, { "epoch": 0.33713332301661925, "learning_rate": 8.912067249912772e-06, "loss": 3.367318115234375, "step": 279400 }, { "epoch": 0.3372539863391019, "learning_rate": 8.911663414445034e-06, "loss": 3.385009765625, "step": 279500 }, { "epoch": 0.33737464966158465, "learning_rate": 8.911259578977296e-06, "loss": 3.3924191284179686, "step": 279600 }, { "epoch": 0.3374953129840673, "learning_rate": 8.910855743509556e-06, "loss": 3.3769635009765624, "step": 279700 }, { "epoch": 0.33761597630655, "learning_rate": 8.910451908041818e-06, "loss": 3.3821453857421875, "step": 279800 }, { "epoch": 0.33773663962903266, "learning_rate": 8.91004807257408e-06, "loss": 3.37096435546875, "step": 279900 }, { "epoch": 0.3378573029515154, "learning_rate": 8.909644237106342e-06, "loss": 3.3777685546875, "step": 280000 }, { "epoch": 0.33797796627399807, "learning_rate": 8.909240401638604e-06, "loss": 3.3721749877929685, "step": 280100 }, { "epoch": 0.33809862959648074, "learning_rate": 8.908836566170866e-06, "loss": 3.395386962890625, "step": 280200 }, { "epoch": 0.3382192929189634, "learning_rate": 8.908432730703126e-06, "loss": 3.3792495727539062, "step": 280300 }, { "epoch": 0.3383399562414461, "learning_rate": 8.908028895235388e-06, "loss": 3.3678704833984376, "step": 280400 }, { "epoch": 0.3384606195639288, "learning_rate": 8.90762505976765e-06, "loss": 3.3860684204101563, "step": 280500 }, { "epoch": 0.3385812828864115, "learning_rate": 8.90722122429991e-06, "loss": 3.38067626953125, "step": 280600 }, { "epoch": 0.33870194620889416, "learning_rate": 8.906817388832173e-06, "loss": 3.4077716064453125, "step": 280700 }, { "epoch": 0.33882260953137683, "learning_rate": 8.906413553364435e-06, "loss": 3.38542236328125, "step": 280800 }, { "epoch": 0.3389432728538595, "learning_rate": 8.906009717896697e-06, "loss": 3.342257385253906, "step": 280900 }, { "epoch": 0.33906393617634223, "learning_rate": 8.905605882428959e-06, "loss": 3.411065979003906, "step": 281000 }, { "epoch": 0.3391845994988249, "learning_rate": 8.90520204696122e-06, "loss": 3.3679949951171877, "step": 281100 }, { "epoch": 0.3393052628213076, "learning_rate": 8.904798211493482e-06, "loss": 3.3774600219726563, "step": 281200 }, { "epoch": 0.33942592614379025, "learning_rate": 8.904394376025743e-06, "loss": 3.389027099609375, "step": 281300 }, { "epoch": 0.3395465894662729, "learning_rate": 8.903990540558005e-06, "loss": 3.4046002197265626, "step": 281400 }, { "epoch": 0.33966725278875565, "learning_rate": 8.903586705090265e-06, "loss": 3.37701416015625, "step": 281500 }, { "epoch": 0.3397879161112383, "learning_rate": 8.903182869622527e-06, "loss": 3.3534051513671876, "step": 281600 }, { "epoch": 0.339908579433721, "learning_rate": 8.902779034154789e-06, "loss": 3.368833312988281, "step": 281700 }, { "epoch": 0.34002924275620366, "learning_rate": 8.902375198687051e-06, "loss": 3.3513803100585937, "step": 281800 }, { "epoch": 0.34014990607868634, "learning_rate": 8.901971363219313e-06, "loss": 3.3462094116210936, "step": 281900 }, { "epoch": 0.34027056940116907, "learning_rate": 8.901567527751575e-06, "loss": 3.391901550292969, "step": 282000 }, { "epoch": 0.34039123272365174, "learning_rate": 8.901163692283835e-06, "loss": 3.37974609375, "step": 282100 }, { "epoch": 0.3405118960461344, "learning_rate": 8.900759856816097e-06, "loss": 3.3770928955078126, "step": 282200 }, { "epoch": 0.3406325593686171, "learning_rate": 8.90035602134836e-06, "loss": 3.3966827392578125, "step": 282300 }, { "epoch": 0.34075322269109976, "learning_rate": 8.899952185880621e-06, "loss": 3.3758489990234377, "step": 282400 }, { "epoch": 0.3408738860135825, "learning_rate": 8.899548350412881e-06, "loss": 3.412453308105469, "step": 282500 }, { "epoch": 0.34099454933606516, "learning_rate": 8.899144514945143e-06, "loss": 3.3762371826171873, "step": 282600 }, { "epoch": 0.34111521265854783, "learning_rate": 8.898740679477405e-06, "loss": 3.3829190063476564, "step": 282700 }, { "epoch": 0.3412358759810305, "learning_rate": 8.898336844009667e-06, "loss": 3.3675518798828126, "step": 282800 }, { "epoch": 0.34135653930351323, "learning_rate": 8.89793300854193e-06, "loss": 3.3886773681640623, "step": 282900 }, { "epoch": 0.3414772026259959, "learning_rate": 8.89752917307419e-06, "loss": 3.3868609619140626, "step": 283000 }, { "epoch": 0.3415978659484786, "learning_rate": 8.897125337606452e-06, "loss": 3.3706756591796876, "step": 283100 }, { "epoch": 0.34171852927096125, "learning_rate": 8.896721502138714e-06, "loss": 3.3764334106445313, "step": 283200 }, { "epoch": 0.3418391925934439, "learning_rate": 8.896317666670976e-06, "loss": 3.352802734375, "step": 283300 }, { "epoch": 0.34195985591592665, "learning_rate": 8.895913831203236e-06, "loss": 3.391837158203125, "step": 283400 }, { "epoch": 0.3420805192384093, "learning_rate": 8.895509995735498e-06, "loss": 3.388258972167969, "step": 283500 }, { "epoch": 0.342201182560892, "learning_rate": 8.89510616026776e-06, "loss": 3.361815185546875, "step": 283600 }, { "epoch": 0.34232184588337466, "learning_rate": 8.894702324800022e-06, "loss": 3.342745666503906, "step": 283700 }, { "epoch": 0.34244250920585734, "learning_rate": 8.894298489332282e-06, "loss": 3.3899136352539063, "step": 283800 }, { "epoch": 0.34256317252834007, "learning_rate": 8.893894653864544e-06, "loss": 3.3812921142578123, "step": 283900 }, { "epoch": 0.34268383585082274, "learning_rate": 8.893490818396806e-06, "loss": 3.3620645141601564, "step": 284000 }, { "epoch": 0.3428044991733054, "learning_rate": 8.893086982929068e-06, "loss": 3.3420245361328127, "step": 284100 }, { "epoch": 0.3429251624957881, "learning_rate": 8.89268314746133e-06, "loss": 3.374725036621094, "step": 284200 }, { "epoch": 0.34304582581827076, "learning_rate": 8.892279311993592e-06, "loss": 3.3634933471679687, "step": 284300 }, { "epoch": 0.3431664891407535, "learning_rate": 8.891875476525852e-06, "loss": 3.358265686035156, "step": 284400 }, { "epoch": 0.34328715246323616, "learning_rate": 8.891471641058114e-06, "loss": 3.3755764770507812, "step": 284500 }, { "epoch": 0.34340781578571883, "learning_rate": 8.891067805590375e-06, "loss": 3.360271301269531, "step": 284600 }, { "epoch": 0.3435284791082015, "learning_rate": 8.890663970122637e-06, "loss": 3.3660818481445314, "step": 284700 }, { "epoch": 0.3436491424306842, "learning_rate": 8.890260134654899e-06, "loss": 3.367215881347656, "step": 284800 }, { "epoch": 0.3437698057531669, "learning_rate": 8.88985629918716e-06, "loss": 3.3591278076171873, "step": 284900 }, { "epoch": 0.3438904690756496, "learning_rate": 8.889452463719423e-06, "loss": 3.3559494018554688, "step": 285000 }, { "epoch": 0.34401113239813225, "learning_rate": 8.889048628251685e-06, "loss": 3.3690521240234377, "step": 285100 }, { "epoch": 0.3441317957206149, "learning_rate": 8.888644792783947e-06, "loss": 3.3683761596679687, "step": 285200 }, { "epoch": 0.34425245904309765, "learning_rate": 8.888240957316207e-06, "loss": 3.3877032470703123, "step": 285300 }, { "epoch": 0.3443731223655803, "learning_rate": 8.887837121848469e-06, "loss": 3.348993225097656, "step": 285400 }, { "epoch": 0.344493785688063, "learning_rate": 8.88743328638073e-06, "loss": 3.358624267578125, "step": 285500 }, { "epoch": 0.34461444901054566, "learning_rate": 8.887029450912991e-06, "loss": 3.3711981201171874, "step": 285600 }, { "epoch": 0.34473511233302834, "learning_rate": 8.886625615445253e-06, "loss": 3.3545632934570313, "step": 285700 }, { "epoch": 0.34485577565551107, "learning_rate": 8.886221779977515e-06, "loss": 3.377494201660156, "step": 285800 }, { "epoch": 0.34497643897799374, "learning_rate": 8.885817944509777e-06, "loss": 3.332389221191406, "step": 285900 }, { "epoch": 0.3450971023004764, "learning_rate": 8.885414109042039e-06, "loss": 3.38436279296875, "step": 286000 }, { "epoch": 0.3452177656229591, "learning_rate": 8.885010273574301e-06, "loss": 3.3601043701171873, "step": 286100 }, { "epoch": 0.34533842894544176, "learning_rate": 8.884606438106561e-06, "loss": 3.349520568847656, "step": 286200 }, { "epoch": 0.3454590922679245, "learning_rate": 8.884202602638823e-06, "loss": 3.3518450927734373, "step": 286300 }, { "epoch": 0.34557975559040716, "learning_rate": 8.883798767171085e-06, "loss": 3.3643002319335937, "step": 286400 }, { "epoch": 0.34570041891288983, "learning_rate": 8.883394931703346e-06, "loss": 3.386228332519531, "step": 286500 }, { "epoch": 0.3458210822353725, "learning_rate": 8.882991096235608e-06, "loss": 3.3288198852539064, "step": 286600 }, { "epoch": 0.3459417455578552, "learning_rate": 8.88258726076787e-06, "loss": 3.368284912109375, "step": 286700 }, { "epoch": 0.3460624088803379, "learning_rate": 8.882183425300131e-06, "loss": 3.3436083984375, "step": 286800 }, { "epoch": 0.3461830722028206, "learning_rate": 8.881779589832393e-06, "loss": 3.3695303344726564, "step": 286900 }, { "epoch": 0.34630373552530325, "learning_rate": 8.881375754364654e-06, "loss": 3.3454019165039064, "step": 287000 }, { "epoch": 0.3464243988477859, "learning_rate": 8.880971918896916e-06, "loss": 3.3680816650390626, "step": 287100 }, { "epoch": 0.3465450621702686, "learning_rate": 8.880568083429178e-06, "loss": 3.356971435546875, "step": 287200 }, { "epoch": 0.3466657254927513, "learning_rate": 8.88016424796144e-06, "loss": 3.343841857910156, "step": 287300 }, { "epoch": 0.346786388815234, "learning_rate": 8.879760412493702e-06, "loss": 3.34329345703125, "step": 287400 }, { "epoch": 0.34690705213771666, "learning_rate": 8.879356577025962e-06, "loss": 3.3465447998046876, "step": 287500 }, { "epoch": 0.34702771546019934, "learning_rate": 8.878952741558224e-06, "loss": 3.362466125488281, "step": 287600 }, { "epoch": 0.34714837878268207, "learning_rate": 8.878548906090486e-06, "loss": 3.350896301269531, "step": 287700 }, { "epoch": 0.34726904210516474, "learning_rate": 8.878145070622746e-06, "loss": 3.349106750488281, "step": 287800 }, { "epoch": 0.3473897054276474, "learning_rate": 8.877741235155008e-06, "loss": 3.3594305419921877, "step": 287900 }, { "epoch": 0.3475103687501301, "learning_rate": 8.87733739968727e-06, "loss": 3.356083984375, "step": 288000 }, { "epoch": 0.34763103207261276, "learning_rate": 8.876933564219532e-06, "loss": 3.3537591552734374, "step": 288100 }, { "epoch": 0.3477516953950955, "learning_rate": 8.876529728751794e-06, "loss": 3.356206970214844, "step": 288200 }, { "epoch": 0.34787235871757816, "learning_rate": 8.876125893284056e-06, "loss": 3.345203552246094, "step": 288300 }, { "epoch": 0.34799302204006083, "learning_rate": 8.875722057816316e-06, "loss": 3.3486846923828124, "step": 288400 }, { "epoch": 0.3481136853625435, "learning_rate": 8.875318222348578e-06, "loss": 3.3630889892578124, "step": 288500 }, { "epoch": 0.3482343486850262, "learning_rate": 8.87491438688084e-06, "loss": 3.3618679809570313, "step": 288600 }, { "epoch": 0.3483550120075089, "learning_rate": 8.8745105514131e-06, "loss": 3.3436550903320312, "step": 288700 }, { "epoch": 0.3484756753299916, "learning_rate": 8.874106715945363e-06, "loss": 3.339142150878906, "step": 288800 }, { "epoch": 0.34859633865247425, "learning_rate": 8.873702880477625e-06, "loss": 3.3261767578125, "step": 288900 }, { "epoch": 0.3487170019749569, "learning_rate": 8.873299045009887e-06, "loss": 3.356783752441406, "step": 289000 }, { "epoch": 0.3488376652974396, "learning_rate": 8.872895209542149e-06, "loss": 3.3261572265625, "step": 289100 }, { "epoch": 0.3489583286199223, "learning_rate": 8.87249137407441e-06, "loss": 3.35098388671875, "step": 289200 }, { "epoch": 0.349078991942405, "learning_rate": 8.872087538606673e-06, "loss": 3.3693197631835936, "step": 289300 }, { "epoch": 0.34919965526488767, "learning_rate": 8.871683703138933e-06, "loss": 3.3170135498046873, "step": 289400 }, { "epoch": 0.34932031858737034, "learning_rate": 8.871279867671195e-06, "loss": 3.3583859252929686, "step": 289500 }, { "epoch": 0.349440981909853, "learning_rate": 8.870876032203455e-06, "loss": 3.3346939086914062, "step": 289600 }, { "epoch": 0.34956164523233574, "learning_rate": 8.870472196735717e-06, "loss": 3.3283795166015624, "step": 289700 }, { "epoch": 0.3496823085548184, "learning_rate": 8.870068361267979e-06, "loss": 3.3797503662109376, "step": 289800 }, { "epoch": 0.3498029718773011, "learning_rate": 8.869664525800241e-06, "loss": 3.3343365478515623, "step": 289900 }, { "epoch": 0.34992363519978376, "learning_rate": 8.869260690332503e-06, "loss": 3.3282159423828124, "step": 290000 }, { "epoch": 0.35004429852226643, "learning_rate": 8.868856854864765e-06, "loss": 3.363509521484375, "step": 290100 }, { "epoch": 0.35016496184474916, "learning_rate": 8.868453019397027e-06, "loss": 3.357915344238281, "step": 290200 }, { "epoch": 0.35028562516723183, "learning_rate": 8.868049183929287e-06, "loss": 3.3282785034179687, "step": 290300 }, { "epoch": 0.3504062884897145, "learning_rate": 8.86764534846155e-06, "loss": 3.35484130859375, "step": 290400 }, { "epoch": 0.3505269518121972, "learning_rate": 8.867241512993811e-06, "loss": 3.3576254272460937, "step": 290500 }, { "epoch": 0.3506476151346799, "learning_rate": 8.866837677526072e-06, "loss": 3.3507846069335936, "step": 290600 }, { "epoch": 0.3507682784571626, "learning_rate": 8.866433842058334e-06, "loss": 3.3488534545898436, "step": 290700 }, { "epoch": 0.35088894177964525, "learning_rate": 8.866030006590596e-06, "loss": 3.3541641235351562, "step": 290800 }, { "epoch": 0.3510096051021279, "learning_rate": 8.865626171122858e-06, "loss": 3.3707708740234374, "step": 290900 }, { "epoch": 0.3511302684246106, "learning_rate": 8.86522233565512e-06, "loss": 3.3741864013671874, "step": 291000 }, { "epoch": 0.3512509317470933, "learning_rate": 8.86481850018738e-06, "loss": 3.3598983764648436, "step": 291100 }, { "epoch": 0.351371595069576, "learning_rate": 8.864414664719642e-06, "loss": 3.33818359375, "step": 291200 }, { "epoch": 0.35149225839205867, "learning_rate": 8.864010829251904e-06, "loss": 3.328935241699219, "step": 291300 }, { "epoch": 0.35161292171454134, "learning_rate": 8.863606993784166e-06, "loss": 3.3236929321289064, "step": 291400 }, { "epoch": 0.351733585037024, "learning_rate": 8.863203158316426e-06, "loss": 3.3363943481445313, "step": 291500 }, { "epoch": 0.35185424835950674, "learning_rate": 8.862799322848688e-06, "loss": 3.3711962890625, "step": 291600 }, { "epoch": 0.3519749116819894, "learning_rate": 8.86239548738095e-06, "loss": 3.3208868408203127, "step": 291700 }, { "epoch": 0.3520955750044721, "learning_rate": 8.861991651913212e-06, "loss": 3.3388897705078127, "step": 291800 }, { "epoch": 0.35221623832695476, "learning_rate": 8.861587816445472e-06, "loss": 3.3541644287109373, "step": 291900 }, { "epoch": 0.35233690164943743, "learning_rate": 8.861183980977734e-06, "loss": 3.3478387451171874, "step": 292000 }, { "epoch": 0.35245756497192016, "learning_rate": 8.860780145509996e-06, "loss": 3.3465670776367187, "step": 292100 }, { "epoch": 0.35257822829440283, "learning_rate": 8.860376310042258e-06, "loss": 3.3381646728515624, "step": 292200 }, { "epoch": 0.3526988916168855, "learning_rate": 8.85997247457452e-06, "loss": 3.342335510253906, "step": 292300 }, { "epoch": 0.3528195549393682, "learning_rate": 8.859568639106782e-06, "loss": 3.331907043457031, "step": 292400 }, { "epoch": 0.35294021826185085, "learning_rate": 8.859164803639042e-06, "loss": 3.3521966552734375, "step": 292500 }, { "epoch": 0.3530608815843336, "learning_rate": 8.858760968171304e-06, "loss": 3.33973876953125, "step": 292600 }, { "epoch": 0.35318154490681625, "learning_rate": 8.858357132703565e-06, "loss": 3.349891357421875, "step": 292700 }, { "epoch": 0.3533022082292989, "learning_rate": 8.857953297235827e-06, "loss": 3.3384039306640627, "step": 292800 }, { "epoch": 0.3534228715517816, "learning_rate": 8.857549461768089e-06, "loss": 3.3312451171875, "step": 292900 }, { "epoch": 0.3535435348742643, "learning_rate": 8.85714562630035e-06, "loss": 3.351846008300781, "step": 293000 }, { "epoch": 0.353664198196747, "learning_rate": 8.856741790832613e-06, "loss": 3.3284475708007815, "step": 293100 }, { "epoch": 0.35378486151922967, "learning_rate": 8.856337955364875e-06, "loss": 3.3351480102539064, "step": 293200 }, { "epoch": 0.35390552484171234, "learning_rate": 8.855934119897137e-06, "loss": 3.3484158325195312, "step": 293300 }, { "epoch": 0.354026188164195, "learning_rate": 8.855530284429399e-06, "loss": 3.349937744140625, "step": 293400 }, { "epoch": 0.35414685148667774, "learning_rate": 8.855126448961659e-06, "loss": 3.3387371826171877, "step": 293500 }, { "epoch": 0.3542675148091604, "learning_rate": 8.854722613493921e-06, "loss": 3.34574951171875, "step": 293600 }, { "epoch": 0.3543881781316431, "learning_rate": 8.854318778026181e-06, "loss": 3.3603726196289063, "step": 293700 }, { "epoch": 0.35450884145412576, "learning_rate": 8.853914942558443e-06, "loss": 3.340113525390625, "step": 293800 }, { "epoch": 0.35462950477660843, "learning_rate": 8.853511107090705e-06, "loss": 3.3261257934570314, "step": 293900 }, { "epoch": 0.35475016809909116, "learning_rate": 8.853107271622967e-06, "loss": 3.3126797485351562, "step": 294000 }, { "epoch": 0.35487083142157383, "learning_rate": 8.852703436155229e-06, "loss": 3.329942321777344, "step": 294100 }, { "epoch": 0.3549914947440565, "learning_rate": 8.852299600687491e-06, "loss": 3.34689208984375, "step": 294200 }, { "epoch": 0.3551121580665392, "learning_rate": 8.851895765219753e-06, "loss": 3.3400753784179686, "step": 294300 }, { "epoch": 0.35523282138902185, "learning_rate": 8.851491929752013e-06, "loss": 3.3322042846679687, "step": 294400 }, { "epoch": 0.3553534847115046, "learning_rate": 8.851088094284275e-06, "loss": 3.3032736206054687, "step": 294500 }, { "epoch": 0.35547414803398725, "learning_rate": 8.850684258816537e-06, "loss": 3.3311907958984377, "step": 294600 }, { "epoch": 0.3555948113564699, "learning_rate": 8.850280423348798e-06, "loss": 3.3651763916015627, "step": 294700 }, { "epoch": 0.3557154746789526, "learning_rate": 8.84987658788106e-06, "loss": 3.313255615234375, "step": 294800 }, { "epoch": 0.35583613800143526, "learning_rate": 8.849472752413322e-06, "loss": 3.3502621459960937, "step": 294900 }, { "epoch": 0.355956801323918, "learning_rate": 8.849068916945584e-06, "loss": 3.32615966796875, "step": 295000 }, { "epoch": 0.35607746464640067, "learning_rate": 8.848665081477846e-06, "loss": 3.3292901611328123, "step": 295100 }, { "epoch": 0.35619812796888334, "learning_rate": 8.848261246010106e-06, "loss": 3.35273681640625, "step": 295200 }, { "epoch": 0.356318791291366, "learning_rate": 8.847857410542368e-06, "loss": 3.3344461059570314, "step": 295300 }, { "epoch": 0.3564394546138487, "learning_rate": 8.84745357507463e-06, "loss": 3.3574578857421873, "step": 295400 }, { "epoch": 0.3565601179363314, "learning_rate": 8.847049739606892e-06, "loss": 3.3437017822265624, "step": 295500 }, { "epoch": 0.3566807812588141, "learning_rate": 8.846645904139152e-06, "loss": 3.3250396728515623, "step": 295600 }, { "epoch": 0.35680144458129676, "learning_rate": 8.846242068671414e-06, "loss": 3.352808837890625, "step": 295700 }, { "epoch": 0.35692210790377943, "learning_rate": 8.845838233203676e-06, "loss": 3.3430130004882814, "step": 295800 }, { "epoch": 0.35704277122626216, "learning_rate": 8.845434397735938e-06, "loss": 3.2995059204101564, "step": 295900 }, { "epoch": 0.35716343454874483, "learning_rate": 8.845030562268198e-06, "loss": 3.323347473144531, "step": 296000 }, { "epoch": 0.3572840978712275, "learning_rate": 8.84462672680046e-06, "loss": 3.3315829467773437, "step": 296100 }, { "epoch": 0.3574047611937102, "learning_rate": 8.844222891332722e-06, "loss": 3.3295867919921873, "step": 296200 }, { "epoch": 0.35752542451619285, "learning_rate": 8.843819055864984e-06, "loss": 3.330219421386719, "step": 296300 }, { "epoch": 0.3576460878386756, "learning_rate": 8.843415220397246e-06, "loss": 3.31962646484375, "step": 296400 }, { "epoch": 0.35776675116115825, "learning_rate": 8.843011384929508e-06, "loss": 3.3472137451171875, "step": 296500 }, { "epoch": 0.3578874144836409, "learning_rate": 8.842607549461768e-06, "loss": 3.3337026977539064, "step": 296600 }, { "epoch": 0.3580080778061236, "learning_rate": 8.84220371399403e-06, "loss": 3.3129229736328125, "step": 296700 }, { "epoch": 0.35812874112860626, "learning_rate": 8.84179987852629e-06, "loss": 3.307882995605469, "step": 296800 }, { "epoch": 0.358249404451089, "learning_rate": 8.841396043058553e-06, "loss": 3.3341461181640626, "step": 296900 }, { "epoch": 0.35837006777357167, "learning_rate": 8.840992207590815e-06, "loss": 3.301899108886719, "step": 297000 }, { "epoch": 0.35849073109605434, "learning_rate": 8.840588372123077e-06, "loss": 3.3152227783203125, "step": 297100 }, { "epoch": 0.358611394418537, "learning_rate": 8.840184536655339e-06, "loss": 3.345552673339844, "step": 297200 }, { "epoch": 0.3587320577410197, "learning_rate": 8.8397807011876e-06, "loss": 3.3410565185546877, "step": 297300 }, { "epoch": 0.3588527210635024, "learning_rate": 8.839376865719863e-06, "loss": 3.3193359375, "step": 297400 }, { "epoch": 0.3589733843859851, "learning_rate": 8.838973030252123e-06, "loss": 3.33230712890625, "step": 297500 }, { "epoch": 0.35909404770846776, "learning_rate": 8.838569194784385e-06, "loss": 3.32958251953125, "step": 297600 }, { "epoch": 0.35921471103095043, "learning_rate": 8.838165359316647e-06, "loss": 3.328432922363281, "step": 297700 }, { "epoch": 0.3593353743534331, "learning_rate": 8.837761523848907e-06, "loss": 3.3343017578125, "step": 297800 }, { "epoch": 0.35945603767591583, "learning_rate": 8.83735768838117e-06, "loss": 3.33526123046875, "step": 297900 }, { "epoch": 0.3595767009983985, "learning_rate": 8.836953852913431e-06, "loss": 3.3219537353515625, "step": 298000 }, { "epoch": 0.3596973643208812, "learning_rate": 8.836550017445693e-06, "loss": 3.316231994628906, "step": 298100 }, { "epoch": 0.35981802764336385, "learning_rate": 8.836146181977955e-06, "loss": 3.3348828125, "step": 298200 }, { "epoch": 0.3599386909658466, "learning_rate": 8.835742346510217e-06, "loss": 3.3322988891601564, "step": 298300 }, { "epoch": 0.36005935428832925, "learning_rate": 8.835338511042479e-06, "loss": 3.3408843994140627, "step": 298400 }, { "epoch": 0.3601800176108119, "learning_rate": 8.83493467557474e-06, "loss": 3.3089837646484375, "step": 298500 }, { "epoch": 0.3603006809332946, "learning_rate": 8.834530840107001e-06, "loss": 3.305108947753906, "step": 298600 }, { "epoch": 0.36042134425577727, "learning_rate": 8.834127004639262e-06, "loss": 3.3198333740234376, "step": 298700 }, { "epoch": 0.36054200757826, "learning_rate": 8.833723169171524e-06, "loss": 3.325597839355469, "step": 298800 }, { "epoch": 0.36066267090074267, "learning_rate": 8.833319333703786e-06, "loss": 3.316040344238281, "step": 298900 }, { "epoch": 0.36078333422322534, "learning_rate": 8.832915498236048e-06, "loss": 3.3172955322265625, "step": 299000 }, { "epoch": 0.360903997545708, "learning_rate": 8.83251166276831e-06, "loss": 3.325193176269531, "step": 299100 }, { "epoch": 0.3610246608681907, "learning_rate": 8.832107827300572e-06, "loss": 3.31294189453125, "step": 299200 }, { "epoch": 0.3611453241906734, "learning_rate": 8.831703991832832e-06, "loss": 3.324296875, "step": 299300 }, { "epoch": 0.3612659875131561, "learning_rate": 8.831300156365094e-06, "loss": 3.333157958984375, "step": 299400 }, { "epoch": 0.36138665083563876, "learning_rate": 8.830896320897356e-06, "loss": 3.3377294921875, "step": 299500 }, { "epoch": 0.36150731415812143, "learning_rate": 8.830492485429618e-06, "loss": 3.3260113525390627, "step": 299600 }, { "epoch": 0.3616279774806041, "learning_rate": 8.830088649961878e-06, "loss": 3.3337860107421875, "step": 299700 }, { "epoch": 0.36174864080308683, "learning_rate": 8.82968481449414e-06, "loss": 3.31935546875, "step": 299800 }, { "epoch": 0.3618693041255695, "learning_rate": 8.829280979026402e-06, "loss": 3.2990069580078125, "step": 299900 }, { "epoch": 0.3619899674480522, "learning_rate": 8.828877143558664e-06, "loss": 3.31140380859375, "step": 300000 }, { "epoch": 0.36211063077053485, "learning_rate": 8.828473308090924e-06, "loss": 3.30639892578125, "step": 300100 }, { "epoch": 0.3622312940930175, "learning_rate": 8.828069472623186e-06, "loss": 3.322403869628906, "step": 300200 }, { "epoch": 0.36235195741550025, "learning_rate": 8.827665637155448e-06, "loss": 3.304969482421875, "step": 300300 }, { "epoch": 0.3624726207379829, "learning_rate": 8.82726180168771e-06, "loss": 3.3136441040039064, "step": 300400 }, { "epoch": 0.3625932840604656, "learning_rate": 8.826857966219972e-06, "loss": 3.31540283203125, "step": 300500 }, { "epoch": 0.36271394738294827, "learning_rate": 8.826454130752233e-06, "loss": 3.3179580688476564, "step": 300600 }, { "epoch": 0.362834610705431, "learning_rate": 8.826050295284495e-06, "loss": 3.3205157470703126, "step": 300700 }, { "epoch": 0.36295527402791367, "learning_rate": 8.825646459816757e-06, "loss": 3.3216207885742186, "step": 300800 }, { "epoch": 0.36307593735039634, "learning_rate": 8.825242624349017e-06, "loss": 3.3189358520507812, "step": 300900 }, { "epoch": 0.363196600672879, "learning_rate": 8.824838788881279e-06, "loss": 3.3213543701171875, "step": 301000 }, { "epoch": 0.3633172639953617, "learning_rate": 8.82443495341354e-06, "loss": 3.331612548828125, "step": 301100 }, { "epoch": 0.3634379273178444, "learning_rate": 8.824031117945803e-06, "loss": 3.3322308349609373, "step": 301200 }, { "epoch": 0.3635585906403271, "learning_rate": 8.823627282478065e-06, "loss": 3.319403076171875, "step": 301300 }, { "epoch": 0.36367925396280976, "learning_rate": 8.823223447010327e-06, "loss": 3.3143212890625, "step": 301400 }, { "epoch": 0.36379991728529243, "learning_rate": 8.822819611542589e-06, "loss": 3.316423034667969, "step": 301500 }, { "epoch": 0.3639205806077751, "learning_rate": 8.822415776074849e-06, "loss": 3.313104553222656, "step": 301600 }, { "epoch": 0.36404124393025783, "learning_rate": 8.822011940607111e-06, "loss": 3.32320068359375, "step": 301700 }, { "epoch": 0.3641619072527405, "learning_rate": 8.821608105139371e-06, "loss": 3.287771911621094, "step": 301800 }, { "epoch": 0.3642825705752232, "learning_rate": 8.821204269671633e-06, "loss": 3.29591552734375, "step": 301900 }, { "epoch": 0.36440323389770585, "learning_rate": 8.820800434203895e-06, "loss": 3.317733154296875, "step": 302000 }, { "epoch": 0.3645238972201885, "learning_rate": 8.820396598736157e-06, "loss": 3.2830380249023436, "step": 302100 }, { "epoch": 0.36464456054267125, "learning_rate": 8.81999276326842e-06, "loss": 3.3182296752929688, "step": 302200 }, { "epoch": 0.3647652238651539, "learning_rate": 8.819588927800681e-06, "loss": 3.3193603515625, "step": 302300 }, { "epoch": 0.3648858871876366, "learning_rate": 8.819185092332943e-06, "loss": 3.3257107543945312, "step": 302400 }, { "epoch": 0.36500655051011927, "learning_rate": 8.818781256865203e-06, "loss": 3.315701599121094, "step": 302500 }, { "epoch": 0.36512721383260194, "learning_rate": 8.818377421397465e-06, "loss": 3.3238140869140627, "step": 302600 }, { "epoch": 0.36524787715508467, "learning_rate": 8.817973585929727e-06, "loss": 3.3311126708984373, "step": 302700 }, { "epoch": 0.36536854047756734, "learning_rate": 8.817569750461988e-06, "loss": 3.3201943969726564, "step": 302800 }, { "epoch": 0.36548920380005, "learning_rate": 8.81716591499425e-06, "loss": 3.323199462890625, "step": 302900 }, { "epoch": 0.3656098671225327, "learning_rate": 8.816762079526512e-06, "loss": 3.333154296875, "step": 303000 }, { "epoch": 0.36573053044501536, "learning_rate": 8.816358244058774e-06, "loss": 3.2910009765625, "step": 303100 }, { "epoch": 0.3658511937674981, "learning_rate": 8.815954408591036e-06, "loss": 3.312349548339844, "step": 303200 }, { "epoch": 0.36597185708998076, "learning_rate": 8.815550573123296e-06, "loss": 3.2939016723632815, "step": 303300 }, { "epoch": 0.36609252041246343, "learning_rate": 8.815146737655558e-06, "loss": 3.3060198974609376, "step": 303400 }, { "epoch": 0.3662131837349461, "learning_rate": 8.81474290218782e-06, "loss": 3.3187295532226564, "step": 303500 }, { "epoch": 0.36633384705742883, "learning_rate": 8.814339066720082e-06, "loss": 3.319930114746094, "step": 303600 }, { "epoch": 0.3664545103799115, "learning_rate": 8.813935231252342e-06, "loss": 3.338509216308594, "step": 303700 }, { "epoch": 0.3665751737023942, "learning_rate": 8.813531395784604e-06, "loss": 3.3211935424804686, "step": 303800 }, { "epoch": 0.36669583702487685, "learning_rate": 8.813127560316866e-06, "loss": 3.304140930175781, "step": 303900 }, { "epoch": 0.3668165003473595, "learning_rate": 8.812723724849128e-06, "loss": 3.3051583862304685, "step": 304000 }, { "epoch": 0.36693716366984225, "learning_rate": 8.81231988938139e-06, "loss": 3.298758239746094, "step": 304100 }, { "epoch": 0.3670578269923249, "learning_rate": 8.81191605391365e-06, "loss": 3.31005126953125, "step": 304200 }, { "epoch": 0.3671784903148076, "learning_rate": 8.811512218445912e-06, "loss": 3.285517578125, "step": 304300 }, { "epoch": 0.36729915363729027, "learning_rate": 8.811108382978174e-06, "loss": 3.31759765625, "step": 304400 }, { "epoch": 0.36741981695977294, "learning_rate": 8.810704547510436e-06, "loss": 3.324541015625, "step": 304500 }, { "epoch": 0.36754048028225567, "learning_rate": 8.810300712042698e-06, "loss": 3.2998089599609375, "step": 304600 }, { "epoch": 0.36766114360473834, "learning_rate": 8.809896876574959e-06, "loss": 3.315268859863281, "step": 304700 }, { "epoch": 0.367781806927221, "learning_rate": 8.80949304110722e-06, "loss": 3.324373779296875, "step": 304800 }, { "epoch": 0.3679024702497037, "learning_rate": 8.809089205639483e-06, "loss": 3.3101516723632813, "step": 304900 }, { "epoch": 0.36802313357218636, "learning_rate": 8.808685370171743e-06, "loss": 3.3062335205078126, "step": 305000 }, { "epoch": 0.3681437968946691, "learning_rate": 8.808281534704005e-06, "loss": 3.283702392578125, "step": 305100 }, { "epoch": 0.36826446021715176, "learning_rate": 8.807877699236267e-06, "loss": 3.3325180053710937, "step": 305200 }, { "epoch": 0.36838512353963443, "learning_rate": 8.807473863768529e-06, "loss": 3.3021621704101562, "step": 305300 }, { "epoch": 0.3685057868621171, "learning_rate": 8.80707002830079e-06, "loss": 3.340378723144531, "step": 305400 }, { "epoch": 0.3686264501845998, "learning_rate": 8.806666192833053e-06, "loss": 3.3138494873046875, "step": 305500 }, { "epoch": 0.3687471135070825, "learning_rate": 8.806262357365313e-06, "loss": 3.295240478515625, "step": 305600 }, { "epoch": 0.3688677768295652, "learning_rate": 8.805858521897575e-06, "loss": 3.3037368774414064, "step": 305700 }, { "epoch": 0.36898844015204785, "learning_rate": 8.805454686429837e-06, "loss": 3.2917221069335936, "step": 305800 }, { "epoch": 0.3691091034745305, "learning_rate": 8.805050850962097e-06, "loss": 3.296153259277344, "step": 305900 }, { "epoch": 0.36922976679701325, "learning_rate": 8.80464701549436e-06, "loss": 3.2916195678710936, "step": 306000 }, { "epoch": 0.3693504301194959, "learning_rate": 8.804243180026621e-06, "loss": 3.3197772216796877, "step": 306100 }, { "epoch": 0.3694710934419786, "learning_rate": 8.803839344558883e-06, "loss": 3.3021240234375, "step": 306200 }, { "epoch": 0.36959175676446127, "learning_rate": 8.803435509091145e-06, "loss": 3.2962762451171876, "step": 306300 }, { "epoch": 0.36971242008694394, "learning_rate": 8.803031673623407e-06, "loss": 3.324712219238281, "step": 306400 }, { "epoch": 0.36983308340942667, "learning_rate": 8.80262783815567e-06, "loss": 3.3221090698242186, "step": 306500 }, { "epoch": 0.36995374673190934, "learning_rate": 8.80222400268793e-06, "loss": 3.3229052734375, "step": 306600 }, { "epoch": 0.370074410054392, "learning_rate": 8.801820167220191e-06, "loss": 3.3020254516601564, "step": 306700 }, { "epoch": 0.3701950733768747, "learning_rate": 8.801416331752452e-06, "loss": 3.301183166503906, "step": 306800 }, { "epoch": 0.37031573669935736, "learning_rate": 8.801012496284714e-06, "loss": 3.3134396362304686, "step": 306900 }, { "epoch": 0.3704364000218401, "learning_rate": 8.800608660816976e-06, "loss": 3.3111557006835937, "step": 307000 }, { "epoch": 0.37055706334432276, "learning_rate": 8.800204825349238e-06, "loss": 3.3167425537109376, "step": 307100 }, { "epoch": 0.37067772666680543, "learning_rate": 8.7998009898815e-06, "loss": 3.3008447265625, "step": 307200 }, { "epoch": 0.3707983899892881, "learning_rate": 8.799397154413762e-06, "loss": 3.285044860839844, "step": 307300 }, { "epoch": 0.3709190533117708, "learning_rate": 8.798993318946022e-06, "loss": 3.2854852294921875, "step": 307400 }, { "epoch": 0.3710397166342535, "learning_rate": 8.798589483478284e-06, "loss": 3.2860568237304686, "step": 307500 }, { "epoch": 0.3711603799567362, "learning_rate": 8.798185648010546e-06, "loss": 3.3158724975585936, "step": 307600 }, { "epoch": 0.37128104327921885, "learning_rate": 8.797781812542808e-06, "loss": 3.2934579467773437, "step": 307700 }, { "epoch": 0.3714017066017015, "learning_rate": 8.797377977075068e-06, "loss": 3.3062152099609374, "step": 307800 }, { "epoch": 0.3715223699241842, "learning_rate": 8.79697414160733e-06, "loss": 3.3139215087890626, "step": 307900 }, { "epoch": 0.3716430332466669, "learning_rate": 8.796570306139592e-06, "loss": 3.3147311401367188, "step": 308000 }, { "epoch": 0.3717636965691496, "learning_rate": 8.796166470671854e-06, "loss": 3.3254104614257813, "step": 308100 }, { "epoch": 0.37188435989163227, "learning_rate": 8.795762635204114e-06, "loss": 3.285187072753906, "step": 308200 }, { "epoch": 0.37200502321411494, "learning_rate": 8.795358799736376e-06, "loss": 3.296063232421875, "step": 308300 }, { "epoch": 0.3721256865365976, "learning_rate": 8.794954964268638e-06, "loss": 3.310453186035156, "step": 308400 }, { "epoch": 0.37224634985908034, "learning_rate": 8.7945511288009e-06, "loss": 3.3133758544921874, "step": 308500 }, { "epoch": 0.372367013181563, "learning_rate": 8.794147293333162e-06, "loss": 3.298341979980469, "step": 308600 }, { "epoch": 0.3724876765040457, "learning_rate": 8.793743457865424e-06, "loss": 3.3225396728515624, "step": 308700 }, { "epoch": 0.37260833982652836, "learning_rate": 8.793339622397685e-06, "loss": 3.2861734008789063, "step": 308800 }, { "epoch": 0.3727290031490111, "learning_rate": 8.792935786929947e-06, "loss": 3.273369140625, "step": 308900 }, { "epoch": 0.37284966647149376, "learning_rate": 8.792531951462209e-06, "loss": 3.312192687988281, "step": 309000 }, { "epoch": 0.37297032979397643, "learning_rate": 8.792128115994469e-06, "loss": 3.2700869750976564, "step": 309100 }, { "epoch": 0.3730909931164591, "learning_rate": 8.791724280526731e-06, "loss": 3.3293157958984376, "step": 309200 }, { "epoch": 0.3732116564389418, "learning_rate": 8.791320445058993e-06, "loss": 3.2952374267578124, "step": 309300 }, { "epoch": 0.3733323197614245, "learning_rate": 8.790916609591255e-06, "loss": 3.282659912109375, "step": 309400 }, { "epoch": 0.3734529830839072, "learning_rate": 8.790512774123517e-06, "loss": 3.280079345703125, "step": 309500 }, { "epoch": 0.37357364640638985, "learning_rate": 8.790108938655779e-06, "loss": 3.324193420410156, "step": 309600 }, { "epoch": 0.3736943097288725, "learning_rate": 8.789705103188039e-06, "loss": 3.320880126953125, "step": 309700 }, { "epoch": 0.3738149730513552, "learning_rate": 8.789301267720301e-06, "loss": 3.278819885253906, "step": 309800 }, { "epoch": 0.3739356363738379, "learning_rate": 8.788897432252563e-06, "loss": 3.288790283203125, "step": 309900 }, { "epoch": 0.3740562996963206, "learning_rate": 8.788493596784823e-06, "loss": 3.293543395996094, "step": 310000 }, { "epoch": 0.37417696301880327, "learning_rate": 8.788089761317085e-06, "loss": 3.289220886230469, "step": 310100 }, { "epoch": 0.37429762634128594, "learning_rate": 8.787685925849347e-06, "loss": 3.284038391113281, "step": 310200 }, { "epoch": 0.3744182896637686, "learning_rate": 8.78728209038161e-06, "loss": 3.311800231933594, "step": 310300 }, { "epoch": 0.37453895298625134, "learning_rate": 8.786878254913871e-06, "loss": 3.317510681152344, "step": 310400 }, { "epoch": 0.374659616308734, "learning_rate": 8.786474419446133e-06, "loss": 3.2828073120117187, "step": 310500 }, { "epoch": 0.3747802796312167, "learning_rate": 8.786070583978395e-06, "loss": 3.2694500732421874, "step": 310600 }, { "epoch": 0.37490094295369936, "learning_rate": 8.785666748510656e-06, "loss": 3.3128778076171876, "step": 310700 }, { "epoch": 0.37502160627618203, "learning_rate": 8.785262913042917e-06, "loss": 3.27744873046875, "step": 310800 }, { "epoch": 0.37514226959866476, "learning_rate": 8.784859077575178e-06, "loss": 3.2939593505859377, "step": 310900 }, { "epoch": 0.37526293292114743, "learning_rate": 8.78445524210744e-06, "loss": 3.3001422119140624, "step": 311000 }, { "epoch": 0.3753835962436301, "learning_rate": 8.784051406639702e-06, "loss": 3.2914654541015627, "step": 311100 }, { "epoch": 0.3755042595661128, "learning_rate": 8.783647571171964e-06, "loss": 3.287436828613281, "step": 311200 }, { "epoch": 0.3756249228885955, "learning_rate": 8.783243735704226e-06, "loss": 3.29072509765625, "step": 311300 }, { "epoch": 0.3757455862110782, "learning_rate": 8.782839900236488e-06, "loss": 3.2698114013671873, "step": 311400 }, { "epoch": 0.37586624953356085, "learning_rate": 8.782436064768748e-06, "loss": 3.304375, "step": 311500 }, { "epoch": 0.3759869128560435, "learning_rate": 8.78203222930101e-06, "loss": 3.2887890625, "step": 311600 }, { "epoch": 0.3761075761785262, "learning_rate": 8.781628393833272e-06, "loss": 3.292602844238281, "step": 311700 }, { "epoch": 0.3762282395010089, "learning_rate": 8.781224558365534e-06, "loss": 3.285872497558594, "step": 311800 }, { "epoch": 0.3763489028234916, "learning_rate": 8.780820722897794e-06, "loss": 3.301965637207031, "step": 311900 }, { "epoch": 0.37646956614597427, "learning_rate": 8.780416887430056e-06, "loss": 3.281133117675781, "step": 312000 }, { "epoch": 0.37659022946845694, "learning_rate": 8.780013051962318e-06, "loss": 3.2999783325195313, "step": 312100 }, { "epoch": 0.3767108927909396, "learning_rate": 8.77960921649458e-06, "loss": 3.3032260131835938, "step": 312200 }, { "epoch": 0.37683155611342234, "learning_rate": 8.77920538102684e-06, "loss": 3.28312255859375, "step": 312300 }, { "epoch": 0.376952219435905, "learning_rate": 8.778801545559102e-06, "loss": 3.308909912109375, "step": 312400 }, { "epoch": 0.3770728827583877, "learning_rate": 8.778397710091364e-06, "loss": 3.25122314453125, "step": 312500 }, { "epoch": 0.37719354608087036, "learning_rate": 8.777993874623626e-06, "loss": 3.2880038452148437, "step": 312600 }, { "epoch": 0.37731420940335303, "learning_rate": 8.777590039155888e-06, "loss": 3.3010659790039063, "step": 312700 }, { "epoch": 0.37743487272583576, "learning_rate": 8.777186203688149e-06, "loss": 3.279433288574219, "step": 312800 }, { "epoch": 0.37755553604831843, "learning_rate": 8.77678236822041e-06, "loss": 3.300711669921875, "step": 312900 }, { "epoch": 0.3776761993708011, "learning_rate": 8.776378532752673e-06, "loss": 3.277568359375, "step": 313000 }, { "epoch": 0.3777968626932838, "learning_rate": 8.775974697284933e-06, "loss": 3.2576052856445314, "step": 313100 }, { "epoch": 0.37791752601576645, "learning_rate": 8.775570861817195e-06, "loss": 3.2829791259765626, "step": 313200 }, { "epoch": 0.3780381893382492, "learning_rate": 8.775167026349457e-06, "loss": 3.281400451660156, "step": 313300 }, { "epoch": 0.37815885266073185, "learning_rate": 8.774763190881719e-06, "loss": 3.284503173828125, "step": 313400 }, { "epoch": 0.3782795159832145, "learning_rate": 8.77435935541398e-06, "loss": 3.308751525878906, "step": 313500 }, { "epoch": 0.3784001793056972, "learning_rate": 8.773955519946243e-06, "loss": 3.2616864013671876, "step": 313600 }, { "epoch": 0.3785208426281799, "learning_rate": 8.773551684478505e-06, "loss": 3.2837033081054687, "step": 313700 }, { "epoch": 0.3786415059506626, "learning_rate": 8.773147849010765e-06, "loss": 3.279918518066406, "step": 313800 }, { "epoch": 0.37876216927314527, "learning_rate": 8.772744013543027e-06, "loss": 3.2851162719726563, "step": 313900 }, { "epoch": 0.37888283259562794, "learning_rate": 8.772340178075287e-06, "loss": 3.2467465209960937, "step": 314000 }, { "epoch": 0.3790034959181106, "learning_rate": 8.77193634260755e-06, "loss": 3.2915631103515626, "step": 314100 }, { "epoch": 0.37912415924059334, "learning_rate": 8.771532507139811e-06, "loss": 3.273829040527344, "step": 314200 }, { "epoch": 0.379244822563076, "learning_rate": 8.771128671672073e-06, "loss": 3.238301086425781, "step": 314300 }, { "epoch": 0.3793654858855587, "learning_rate": 8.770724836204335e-06, "loss": 3.2906304931640626, "step": 314400 }, { "epoch": 0.37948614920804136, "learning_rate": 8.770321000736597e-06, "loss": 3.2664248657226564, "step": 314500 }, { "epoch": 0.37960681253052403, "learning_rate": 8.76991716526886e-06, "loss": 3.274669494628906, "step": 314600 }, { "epoch": 0.37972747585300676, "learning_rate": 8.76951332980112e-06, "loss": 3.2747454833984375, "step": 314700 }, { "epoch": 0.37984813917548943, "learning_rate": 8.769109494333382e-06, "loss": 3.295265808105469, "step": 314800 }, { "epoch": 0.3799688024979721, "learning_rate": 8.768705658865644e-06, "loss": 3.2701620483398437, "step": 314900 }, { "epoch": 0.3800894658204548, "learning_rate": 8.768301823397904e-06, "loss": 3.2717471313476563, "step": 315000 }, { "epoch": 0.38021012914293745, "learning_rate": 8.767897987930166e-06, "loss": 3.2744296264648436, "step": 315100 }, { "epoch": 0.3803307924654202, "learning_rate": 8.767494152462428e-06, "loss": 3.27110107421875, "step": 315200 }, { "epoch": 0.38045145578790285, "learning_rate": 8.76709031699469e-06, "loss": 3.2762799072265625, "step": 315300 }, { "epoch": 0.3805721191103855, "learning_rate": 8.766686481526952e-06, "loss": 3.2894537353515627, "step": 315400 }, { "epoch": 0.3806927824328682, "learning_rate": 8.766282646059214e-06, "loss": 3.2854052734375, "step": 315500 }, { "epoch": 0.38081344575535087, "learning_rate": 8.765878810591474e-06, "loss": 3.2787136840820312, "step": 315600 }, { "epoch": 0.3809341090778336, "learning_rate": 8.765474975123736e-06, "loss": 3.2867681884765627, "step": 315700 }, { "epoch": 0.38105477240031627, "learning_rate": 8.765071139655998e-06, "loss": 3.2680532836914065, "step": 315800 }, { "epoch": 0.38117543572279894, "learning_rate": 8.764667304188258e-06, "loss": 3.2739834594726562, "step": 315900 }, { "epoch": 0.3812960990452816, "learning_rate": 8.76426346872052e-06, "loss": 3.285141906738281, "step": 316000 }, { "epoch": 0.3814167623677643, "learning_rate": 8.763859633252782e-06, "loss": 3.2821109008789064, "step": 316100 }, { "epoch": 0.381537425690247, "learning_rate": 8.763455797785044e-06, "loss": 3.26627197265625, "step": 316200 }, { "epoch": 0.3816580890127297, "learning_rate": 8.763051962317306e-06, "loss": 3.240209655761719, "step": 316300 }, { "epoch": 0.38177875233521236, "learning_rate": 8.762648126849566e-06, "loss": 3.2754672241210936, "step": 316400 }, { "epoch": 0.38189941565769503, "learning_rate": 8.762244291381828e-06, "loss": 3.2747296142578124, "step": 316500 }, { "epoch": 0.38202007898017776, "learning_rate": 8.76184045591409e-06, "loss": 3.2793539428710936, "step": 316600 }, { "epoch": 0.38214074230266043, "learning_rate": 8.761436620446352e-06, "loss": 3.2627667236328124, "step": 316700 }, { "epoch": 0.3822614056251431, "learning_rate": 8.761032784978614e-06, "loss": 3.2436148071289064, "step": 316800 }, { "epoch": 0.3823820689476258, "learning_rate": 8.760628949510875e-06, "loss": 3.2827850341796876, "step": 316900 }, { "epoch": 0.38250273227010845, "learning_rate": 8.760225114043137e-06, "loss": 3.2916610717773436, "step": 317000 }, { "epoch": 0.3826233955925912, "learning_rate": 8.759821278575399e-06, "loss": 3.2335391235351563, "step": 317100 }, { "epoch": 0.38274405891507385, "learning_rate": 8.759417443107659e-06, "loss": 3.2764181518554687, "step": 317200 }, { "epoch": 0.3828647222375565, "learning_rate": 8.759013607639921e-06, "loss": 3.256866760253906, "step": 317300 }, { "epoch": 0.3829853855600392, "learning_rate": 8.758609772172183e-06, "loss": 3.2746463012695313, "step": 317400 }, { "epoch": 0.38310604888252187, "learning_rate": 8.758205936704445e-06, "loss": 3.246959228515625, "step": 317500 }, { "epoch": 0.3832267122050046, "learning_rate": 8.757802101236707e-06, "loss": 3.2848907470703126, "step": 317600 }, { "epoch": 0.38334737552748727, "learning_rate": 8.757398265768969e-06, "loss": 3.2458203125, "step": 317700 }, { "epoch": 0.38346803884996994, "learning_rate": 8.756994430301229e-06, "loss": 3.279761962890625, "step": 317800 }, { "epoch": 0.3835887021724526, "learning_rate": 8.756590594833491e-06, "loss": 3.292417297363281, "step": 317900 }, { "epoch": 0.3837093654949353, "learning_rate": 8.756186759365753e-06, "loss": 3.251089782714844, "step": 318000 }, { "epoch": 0.383830028817418, "learning_rate": 8.755782923898013e-06, "loss": 3.2748980712890625, "step": 318100 }, { "epoch": 0.3839506921399007, "learning_rate": 8.755379088430275e-06, "loss": 3.306053466796875, "step": 318200 }, { "epoch": 0.38407135546238336, "learning_rate": 8.754975252962537e-06, "loss": 3.2929010009765625, "step": 318300 }, { "epoch": 0.38419201878486603, "learning_rate": 8.7545714174948e-06, "loss": 3.269003601074219, "step": 318400 }, { "epoch": 0.3843126821073487, "learning_rate": 8.754167582027061e-06, "loss": 3.2758865356445312, "step": 318500 }, { "epoch": 0.38443334542983143, "learning_rate": 8.753763746559323e-06, "loss": 3.2650885009765624, "step": 318600 }, { "epoch": 0.3845540087523141, "learning_rate": 8.753359911091585e-06, "loss": 3.2991177368164064, "step": 318700 }, { "epoch": 0.3846746720747968, "learning_rate": 8.752956075623846e-06, "loss": 3.2663214111328127, "step": 318800 }, { "epoch": 0.38479533539727945, "learning_rate": 8.752552240156108e-06, "loss": 3.241009521484375, "step": 318900 }, { "epoch": 0.3849159987197622, "learning_rate": 8.752148404688368e-06, "loss": 3.2705615234375, "step": 319000 }, { "epoch": 0.38503666204224485, "learning_rate": 8.75174456922063e-06, "loss": 3.2790011596679687, "step": 319100 }, { "epoch": 0.3851573253647275, "learning_rate": 8.751340733752892e-06, "loss": 3.2712957763671877, "step": 319200 }, { "epoch": 0.3852779886872102, "learning_rate": 8.750936898285154e-06, "loss": 3.2643399047851562, "step": 319300 }, { "epoch": 0.38539865200969287, "learning_rate": 8.750533062817416e-06, "loss": 3.2708502197265625, "step": 319400 }, { "epoch": 0.3855193153321756, "learning_rate": 8.750129227349678e-06, "loss": 3.2638134765625, "step": 319500 }, { "epoch": 0.38563997865465827, "learning_rate": 8.74972539188194e-06, "loss": 3.2642227172851563, "step": 319600 }, { "epoch": 0.38576064197714094, "learning_rate": 8.7493215564142e-06, "loss": 3.246645812988281, "step": 319700 }, { "epoch": 0.3858813052996236, "learning_rate": 8.748917720946462e-06, "loss": 3.251583251953125, "step": 319800 }, { "epoch": 0.3860019686221063, "learning_rate": 8.748513885478724e-06, "loss": 3.2594647216796875, "step": 319900 }, { "epoch": 0.386122631944589, "learning_rate": 8.748110050010984e-06, "loss": 3.285966796875, "step": 320000 }, { "epoch": 0.3862432952670717, "learning_rate": 8.747706214543246e-06, "loss": 3.2659402465820313, "step": 320100 }, { "epoch": 0.38636395858955436, "learning_rate": 8.747302379075508e-06, "loss": 3.2546759033203125, "step": 320200 }, { "epoch": 0.38648462191203703, "learning_rate": 8.74689854360777e-06, "loss": 3.242425842285156, "step": 320300 }, { "epoch": 0.3866052852345197, "learning_rate": 8.746494708140032e-06, "loss": 3.2424041748046877, "step": 320400 }, { "epoch": 0.38672594855700243, "learning_rate": 8.746090872672293e-06, "loss": 3.2470562744140623, "step": 320500 }, { "epoch": 0.3868466118794851, "learning_rate": 8.745687037204554e-06, "loss": 3.30968017578125, "step": 320600 }, { "epoch": 0.3869672752019678, "learning_rate": 8.745283201736816e-06, "loss": 3.225361328125, "step": 320700 }, { "epoch": 0.38708793852445045, "learning_rate": 8.744879366269078e-06, "loss": 3.250545654296875, "step": 320800 }, { "epoch": 0.3872086018469331, "learning_rate": 8.74447553080134e-06, "loss": 3.2445709228515627, "step": 320900 }, { "epoch": 0.38732926516941585, "learning_rate": 8.7440716953336e-06, "loss": 3.270658264160156, "step": 321000 }, { "epoch": 0.3874499284918985, "learning_rate": 8.743667859865863e-06, "loss": 3.2479019165039062, "step": 321100 }, { "epoch": 0.3875705918143812, "learning_rate": 8.743264024398125e-06, "loss": 3.2724932861328124, "step": 321200 }, { "epoch": 0.38769125513686387, "learning_rate": 8.742860188930385e-06, "loss": 3.264521484375, "step": 321300 }, { "epoch": 0.38781191845934654, "learning_rate": 8.742456353462647e-06, "loss": 3.254627380371094, "step": 321400 }, { "epoch": 0.38793258178182927, "learning_rate": 8.742052517994909e-06, "loss": 3.267957763671875, "step": 321500 }, { "epoch": 0.38805324510431194, "learning_rate": 8.741648682527171e-06, "loss": 3.25322021484375, "step": 321600 }, { "epoch": 0.3881739084267946, "learning_rate": 8.741244847059433e-06, "loss": 3.270889892578125, "step": 321700 }, { "epoch": 0.3882945717492773, "learning_rate": 8.740841011591695e-06, "loss": 3.24781982421875, "step": 321800 }, { "epoch": 0.38841523507176, "learning_rate": 8.740437176123955e-06, "loss": 3.23787353515625, "step": 321900 }, { "epoch": 0.3885358983942427, "learning_rate": 8.740033340656217e-06, "loss": 3.2627996826171874, "step": 322000 }, { "epoch": 0.38865656171672536, "learning_rate": 8.739629505188477e-06, "loss": 3.2830990600585936, "step": 322100 }, { "epoch": 0.38877722503920803, "learning_rate": 8.73922566972074e-06, "loss": 3.249563903808594, "step": 322200 }, { "epoch": 0.3888978883616907, "learning_rate": 8.738821834253001e-06, "loss": 3.262378845214844, "step": 322300 }, { "epoch": 0.38901855168417343, "learning_rate": 8.738417998785263e-06, "loss": 3.242977294921875, "step": 322400 }, { "epoch": 0.3891392150066561, "learning_rate": 8.738014163317525e-06, "loss": 3.2355126953125, "step": 322500 }, { "epoch": 0.3892598783291388, "learning_rate": 8.737610327849787e-06, "loss": 3.258695373535156, "step": 322600 }, { "epoch": 0.38938054165162145, "learning_rate": 8.73720649238205e-06, "loss": 3.2482220458984377, "step": 322700 }, { "epoch": 0.3895012049741041, "learning_rate": 8.736802656914311e-06, "loss": 3.2713168334960936, "step": 322800 }, { "epoch": 0.38962186829658685, "learning_rate": 8.736398821446572e-06, "loss": 3.280970153808594, "step": 322900 }, { "epoch": 0.3897425316190695, "learning_rate": 8.735994985978834e-06, "loss": 3.267020263671875, "step": 323000 }, { "epoch": 0.3898631949415522, "learning_rate": 8.735591150511094e-06, "loss": 3.2653927612304687, "step": 323100 }, { "epoch": 0.38998385826403487, "learning_rate": 8.735187315043356e-06, "loss": 3.2459262084960936, "step": 323200 }, { "epoch": 0.39010452158651754, "learning_rate": 8.734783479575618e-06, "loss": 3.2473968505859374, "step": 323300 }, { "epoch": 0.39022518490900027, "learning_rate": 8.73437964410788e-06, "loss": 3.240254211425781, "step": 323400 }, { "epoch": 0.39034584823148294, "learning_rate": 8.733975808640142e-06, "loss": 3.2710537719726562, "step": 323500 }, { "epoch": 0.3904665115539656, "learning_rate": 8.733571973172404e-06, "loss": 3.2615786743164064, "step": 323600 }, { "epoch": 0.3905871748764483, "learning_rate": 8.733168137704664e-06, "loss": 3.2791656494140624, "step": 323700 }, { "epoch": 0.39070783819893096, "learning_rate": 8.732764302236926e-06, "loss": 3.2612799072265624, "step": 323800 }, { "epoch": 0.3908285015214137, "learning_rate": 8.732360466769188e-06, "loss": 3.252030029296875, "step": 323900 }, { "epoch": 0.39094916484389636, "learning_rate": 8.73195663130145e-06, "loss": 3.2781024169921875, "step": 324000 }, { "epoch": 0.39106982816637903, "learning_rate": 8.73155279583371e-06, "loss": 3.237001647949219, "step": 324100 }, { "epoch": 0.3911904914888617, "learning_rate": 8.731148960365972e-06, "loss": 3.275115966796875, "step": 324200 }, { "epoch": 0.39131115481134443, "learning_rate": 8.730745124898234e-06, "loss": 3.255198974609375, "step": 324300 }, { "epoch": 0.3914318181338271, "learning_rate": 8.730341289430496e-06, "loss": 3.256047668457031, "step": 324400 }, { "epoch": 0.3915524814563098, "learning_rate": 8.729937453962758e-06, "loss": 3.2424325561523437, "step": 324500 }, { "epoch": 0.39167314477879245, "learning_rate": 8.729533618495019e-06, "loss": 3.2617816162109374, "step": 324600 }, { "epoch": 0.3917938081012751, "learning_rate": 8.72912978302728e-06, "loss": 3.2746548461914062, "step": 324700 }, { "epoch": 0.39191447142375785, "learning_rate": 8.728725947559543e-06, "loss": 3.250362548828125, "step": 324800 }, { "epoch": 0.3920351347462405, "learning_rate": 8.728322112091804e-06, "loss": 3.2543563842773438, "step": 324900 }, { "epoch": 0.3921557980687232, "learning_rate": 8.727918276624065e-06, "loss": 3.2623782348632813, "step": 325000 }, { "epoch": 0.39227646139120587, "learning_rate": 8.727514441156327e-06, "loss": 3.2224575805664064, "step": 325100 }, { "epoch": 0.39239712471368854, "learning_rate": 8.727110605688589e-06, "loss": 3.261824035644531, "step": 325200 }, { "epoch": 0.39251778803617127, "learning_rate": 8.72670677022085e-06, "loss": 3.2519992065429686, "step": 325300 }, { "epoch": 0.39263845135865394, "learning_rate": 8.726302934753111e-06, "loss": 3.256750183105469, "step": 325400 }, { "epoch": 0.3927591146811366, "learning_rate": 8.725899099285373e-06, "loss": 3.2094772338867186, "step": 325500 }, { "epoch": 0.3928797780036193, "learning_rate": 8.725495263817635e-06, "loss": 3.266548767089844, "step": 325600 }, { "epoch": 0.39300044132610196, "learning_rate": 8.725091428349897e-06, "loss": 3.2751498413085938, "step": 325700 }, { "epoch": 0.3931211046485847, "learning_rate": 8.724687592882159e-06, "loss": 3.220372314453125, "step": 325800 }, { "epoch": 0.39324176797106736, "learning_rate": 8.724283757414421e-06, "loss": 3.2622271728515626, "step": 325900 }, { "epoch": 0.39336243129355003, "learning_rate": 8.723879921946681e-06, "loss": 3.2347183227539062, "step": 326000 }, { "epoch": 0.3934830946160327, "learning_rate": 8.723476086478943e-06, "loss": 3.2430880737304686, "step": 326100 }, { "epoch": 0.3936037579385154, "learning_rate": 8.723072251011203e-06, "loss": 3.2468997192382814, "step": 326200 }, { "epoch": 0.3937244212609981, "learning_rate": 8.722668415543465e-06, "loss": 3.2621139526367187, "step": 326300 }, { "epoch": 0.3938450845834808, "learning_rate": 8.722264580075727e-06, "loss": 3.274239501953125, "step": 326400 }, { "epoch": 0.39396574790596345, "learning_rate": 8.72186074460799e-06, "loss": 3.256181640625, "step": 326500 }, { "epoch": 0.3940864112284461, "learning_rate": 8.721456909140251e-06, "loss": 3.2360659790039064, "step": 326600 }, { "epoch": 0.39420707455092885, "learning_rate": 8.721053073672513e-06, "loss": 3.2457891845703126, "step": 326700 }, { "epoch": 0.3943277378734115, "learning_rate": 8.720649238204775e-06, "loss": 3.2437158203125, "step": 326800 }, { "epoch": 0.3944484011958942, "learning_rate": 8.720245402737036e-06, "loss": 3.2530947875976564, "step": 326900 }, { "epoch": 0.39456906451837687, "learning_rate": 8.719841567269298e-06, "loss": 3.2392318725585936, "step": 327000 }, { "epoch": 0.39468972784085954, "learning_rate": 8.71943773180156e-06, "loss": 3.2624307250976563, "step": 327100 }, { "epoch": 0.39481039116334227, "learning_rate": 8.71903389633382e-06, "loss": 3.2410653686523436, "step": 327200 }, { "epoch": 0.39493105448582494, "learning_rate": 8.718630060866082e-06, "loss": 3.2493820190429688, "step": 327300 }, { "epoch": 0.3950517178083076, "learning_rate": 8.718226225398344e-06, "loss": 3.224849853515625, "step": 327400 }, { "epoch": 0.3951723811307903, "learning_rate": 8.717822389930606e-06, "loss": 3.2115936279296875, "step": 327500 }, { "epoch": 0.39529304445327296, "learning_rate": 8.717418554462868e-06, "loss": 3.220730895996094, "step": 327600 }, { "epoch": 0.3954137077757557, "learning_rate": 8.71701471899513e-06, "loss": 3.2486026000976564, "step": 327700 }, { "epoch": 0.39553437109823836, "learning_rate": 8.71661088352739e-06, "loss": 3.2581307983398435, "step": 327800 }, { "epoch": 0.39565503442072103, "learning_rate": 8.716207048059652e-06, "loss": 3.2488836669921874, "step": 327900 }, { "epoch": 0.3957756977432037, "learning_rate": 8.715803212591914e-06, "loss": 3.2595529174804687, "step": 328000 }, { "epoch": 0.3958963610656864, "learning_rate": 8.715399377124174e-06, "loss": 3.2381057739257812, "step": 328100 }, { "epoch": 0.3960170243881691, "learning_rate": 8.714995541656436e-06, "loss": 3.240838623046875, "step": 328200 }, { "epoch": 0.3961376877106518, "learning_rate": 8.714591706188698e-06, "loss": 3.22958251953125, "step": 328300 }, { "epoch": 0.39625835103313445, "learning_rate": 8.71418787072096e-06, "loss": 3.2588885498046873, "step": 328400 }, { "epoch": 0.3963790143556171, "learning_rate": 8.713784035253222e-06, "loss": 3.2506768798828123, "step": 328500 }, { "epoch": 0.3964996776780998, "learning_rate": 8.713380199785483e-06, "loss": 3.239845886230469, "step": 328600 }, { "epoch": 0.3966203410005825, "learning_rate": 8.712976364317745e-06, "loss": 3.229544982910156, "step": 328700 }, { "epoch": 0.3967410043230652, "learning_rate": 8.712572528850007e-06, "loss": 3.237188415527344, "step": 328800 }, { "epoch": 0.39686166764554787, "learning_rate": 8.712168693382269e-06, "loss": 3.222325439453125, "step": 328900 }, { "epoch": 0.39698233096803054, "learning_rate": 8.71176485791453e-06, "loss": 3.2317233276367188, "step": 329000 }, { "epoch": 0.3971029942905132, "learning_rate": 8.71136102244679e-06, "loss": 3.2449880981445314, "step": 329100 }, { "epoch": 0.39722365761299594, "learning_rate": 8.710957186979053e-06, "loss": 3.247603454589844, "step": 329200 }, { "epoch": 0.3973443209354786, "learning_rate": 8.710553351511315e-06, "loss": 3.245472106933594, "step": 329300 }, { "epoch": 0.3974649842579613, "learning_rate": 8.710149516043577e-06, "loss": 3.2534674072265624, "step": 329400 }, { "epoch": 0.39758564758044396, "learning_rate": 8.709745680575837e-06, "loss": 3.260495300292969, "step": 329500 }, { "epoch": 0.3977063109029267, "learning_rate": 8.709341845108099e-06, "loss": 3.2542568969726564, "step": 329600 }, { "epoch": 0.39782697422540936, "learning_rate": 8.708938009640361e-06, "loss": 3.215430908203125, "step": 329700 }, { "epoch": 0.39794763754789203, "learning_rate": 8.708534174172623e-06, "loss": 3.2525616455078126, "step": 329800 }, { "epoch": 0.3980683008703747, "learning_rate": 8.708130338704885e-06, "loss": 3.2172467041015627, "step": 329900 }, { "epoch": 0.3981889641928574, "learning_rate": 8.707726503237145e-06, "loss": 3.227056579589844, "step": 330000 }, { "epoch": 0.3983096275153401, "learning_rate": 8.707322667769407e-06, "loss": 3.2540380859375, "step": 330100 }, { "epoch": 0.3984302908378228, "learning_rate": 8.70691883230167e-06, "loss": 3.2183956909179687, "step": 330200 }, { "epoch": 0.39855095416030545, "learning_rate": 8.70651499683393e-06, "loss": 3.222982177734375, "step": 330300 }, { "epoch": 0.3986716174827881, "learning_rate": 8.706111161366192e-06, "loss": 3.2263897705078124, "step": 330400 }, { "epoch": 0.3987922808052708, "learning_rate": 8.705707325898453e-06, "loss": 3.2129312133789063, "step": 330500 }, { "epoch": 0.3989129441277535, "learning_rate": 8.705303490430715e-06, "loss": 3.240805358886719, "step": 330600 }, { "epoch": 0.3990336074502362, "learning_rate": 8.704899654962977e-06, "loss": 3.2541278076171873, "step": 330700 }, { "epoch": 0.39915427077271887, "learning_rate": 8.70449581949524e-06, "loss": 3.23765625, "step": 330800 }, { "epoch": 0.39927493409520154, "learning_rate": 8.704091984027501e-06, "loss": 3.23277587890625, "step": 330900 }, { "epoch": 0.3993955974176842, "learning_rate": 8.703688148559762e-06, "loss": 3.2397525024414064, "step": 331000 }, { "epoch": 0.39951626074016694, "learning_rate": 8.703284313092024e-06, "loss": 3.2474267578125, "step": 331100 }, { "epoch": 0.3996369240626496, "learning_rate": 8.702880477624284e-06, "loss": 3.213720397949219, "step": 331200 }, { "epoch": 0.3997575873851323, "learning_rate": 8.702476642156546e-06, "loss": 3.209533386230469, "step": 331300 }, { "epoch": 0.39987825070761496, "learning_rate": 8.702072806688808e-06, "loss": 3.2245709228515627, "step": 331400 }, { "epoch": 0.39999891403009763, "learning_rate": 8.70166897122107e-06, "loss": 3.258290100097656, "step": 331500 }, { "epoch": 0.40011957735258036, "learning_rate": 8.701265135753332e-06, "loss": 3.2603057861328124, "step": 331600 }, { "epoch": 0.40024024067506303, "learning_rate": 8.700861300285594e-06, "loss": 3.2535665893554686, "step": 331700 }, { "epoch": 0.4003609039975457, "learning_rate": 8.700457464817856e-06, "loss": 3.2403680419921876, "step": 331800 }, { "epoch": 0.4004815673200284, "learning_rate": 8.700053629350116e-06, "loss": 3.223586120605469, "step": 331900 }, { "epoch": 0.4006022306425111, "learning_rate": 8.699649793882378e-06, "loss": 3.216365966796875, "step": 332000 }, { "epoch": 0.4007228939649938, "learning_rate": 8.69924595841464e-06, "loss": 3.230245361328125, "step": 332100 }, { "epoch": 0.40084355728747645, "learning_rate": 8.6988421229469e-06, "loss": 3.2543609619140623, "step": 332200 }, { "epoch": 0.4009642206099591, "learning_rate": 8.698438287479162e-06, "loss": 3.2624642944335935, "step": 332300 }, { "epoch": 0.4010848839324418, "learning_rate": 8.698034452011424e-06, "loss": 3.2456478881835937, "step": 332400 }, { "epoch": 0.4012055472549245, "learning_rate": 8.697630616543686e-06, "loss": 3.2356918334960936, "step": 332500 }, { "epoch": 0.4013262105774072, "learning_rate": 8.697226781075948e-06, "loss": 3.2194866943359375, "step": 332600 }, { "epoch": 0.40144687389988987, "learning_rate": 8.696822945608209e-06, "loss": 3.2380975341796874, "step": 332700 }, { "epoch": 0.40156753722237254, "learning_rate": 8.69641911014047e-06, "loss": 3.2371475219726564, "step": 332800 }, { "epoch": 0.4016882005448552, "learning_rate": 8.696015274672733e-06, "loss": 3.220198669433594, "step": 332900 }, { "epoch": 0.40180886386733794, "learning_rate": 8.695611439204995e-06, "loss": 3.241708068847656, "step": 333000 }, { "epoch": 0.4019295271898206, "learning_rate": 8.695207603737255e-06, "loss": 3.1977859497070313, "step": 333100 }, { "epoch": 0.4020501905123033, "learning_rate": 8.694803768269517e-06, "loss": 3.2426321411132815, "step": 333200 }, { "epoch": 0.40217085383478596, "learning_rate": 8.694399932801779e-06, "loss": 3.1952053833007814, "step": 333300 }, { "epoch": 0.40229151715726863, "learning_rate": 8.69399609733404e-06, "loss": 3.238172912597656, "step": 333400 }, { "epoch": 0.40241218047975136, "learning_rate": 8.693592261866301e-06, "loss": 3.2227496337890624, "step": 333500 }, { "epoch": 0.40253284380223403, "learning_rate": 8.693188426398563e-06, "loss": 3.240567321777344, "step": 333600 }, { "epoch": 0.4026535071247167, "learning_rate": 8.692784590930825e-06, "loss": 3.2373675537109374, "step": 333700 }, { "epoch": 0.4027741704471994, "learning_rate": 8.692380755463087e-06, "loss": 3.22337158203125, "step": 333800 }, { "epoch": 0.40289483376968205, "learning_rate": 8.691976919995349e-06, "loss": 3.219118347167969, "step": 333900 }, { "epoch": 0.4030154970921648, "learning_rate": 8.691573084527611e-06, "loss": 3.2311080932617187, "step": 334000 }, { "epoch": 0.40313616041464745, "learning_rate": 8.691169249059871e-06, "loss": 3.2483099365234374, "step": 334100 }, { "epoch": 0.4032568237371301, "learning_rate": 8.690765413592133e-06, "loss": 3.266927490234375, "step": 334200 }, { "epoch": 0.4033774870596128, "learning_rate": 8.690361578124394e-06, "loss": 3.2319259643554688, "step": 334300 }, { "epoch": 0.40349815038209547, "learning_rate": 8.689957742656656e-06, "loss": 3.2280313110351564, "step": 334400 }, { "epoch": 0.4036188137045782, "learning_rate": 8.689553907188918e-06, "loss": 3.253345642089844, "step": 334500 }, { "epoch": 0.40373947702706087, "learning_rate": 8.68915007172118e-06, "loss": 3.239232482910156, "step": 334600 }, { "epoch": 0.40386014034954354, "learning_rate": 8.688746236253442e-06, "loss": 3.25429443359375, "step": 334700 }, { "epoch": 0.4039808036720262, "learning_rate": 8.688342400785703e-06, "loss": 3.234934997558594, "step": 334800 }, { "epoch": 0.40410146699450894, "learning_rate": 8.687938565317965e-06, "loss": 3.2206710815429687, "step": 334900 }, { "epoch": 0.4042221303169916, "learning_rate": 8.687534729850227e-06, "loss": 3.2517941284179686, "step": 335000 }, { "epoch": 0.4043427936394743, "learning_rate": 8.687130894382488e-06, "loss": 3.2393963623046873, "step": 335100 }, { "epoch": 0.40446345696195696, "learning_rate": 8.68672705891475e-06, "loss": 3.226715393066406, "step": 335200 }, { "epoch": 0.40458412028443963, "learning_rate": 8.68632322344701e-06, "loss": 3.2386956787109376, "step": 335300 }, { "epoch": 0.40470478360692236, "learning_rate": 8.685919387979272e-06, "loss": 3.2447048950195314, "step": 335400 }, { "epoch": 0.40482544692940503, "learning_rate": 8.685515552511534e-06, "loss": 3.218361511230469, "step": 335500 }, { "epoch": 0.4049461102518877, "learning_rate": 8.685111717043796e-06, "loss": 3.209727783203125, "step": 335600 }, { "epoch": 0.4050667735743704, "learning_rate": 8.684707881576058e-06, "loss": 3.227924499511719, "step": 335700 }, { "epoch": 0.40518743689685305, "learning_rate": 8.68430404610832e-06, "loss": 3.2397885131835937, "step": 335800 }, { "epoch": 0.4053081002193358, "learning_rate": 8.683900210640582e-06, "loss": 3.23482666015625, "step": 335900 }, { "epoch": 0.40542876354181845, "learning_rate": 8.683496375172842e-06, "loss": 3.214422302246094, "step": 336000 }, { "epoch": 0.4055494268643011, "learning_rate": 8.683092539705104e-06, "loss": 3.2211929321289063, "step": 336100 }, { "epoch": 0.4056700901867838, "learning_rate": 8.682688704237366e-06, "loss": 3.197298583984375, "step": 336200 }, { "epoch": 0.40579075350926647, "learning_rate": 8.682284868769626e-06, "loss": 3.244281921386719, "step": 336300 }, { "epoch": 0.4059114168317492, "learning_rate": 8.681881033301888e-06, "loss": 3.2218942260742187, "step": 336400 }, { "epoch": 0.40603208015423187, "learning_rate": 8.68147719783415e-06, "loss": 3.2383651733398438, "step": 336500 }, { "epoch": 0.40615274347671454, "learning_rate": 8.681073362366412e-06, "loss": 3.211350402832031, "step": 336600 }, { "epoch": 0.4062734067991972, "learning_rate": 8.680669526898674e-06, "loss": 3.2161904907226564, "step": 336700 }, { "epoch": 0.4063940701216799, "learning_rate": 8.680265691430935e-06, "loss": 3.2426333618164063, "step": 336800 }, { "epoch": 0.4065147334441626, "learning_rate": 8.679861855963197e-06, "loss": 3.204479064941406, "step": 336900 }, { "epoch": 0.4066353967666453, "learning_rate": 8.679458020495459e-06, "loss": 3.25840576171875, "step": 337000 }, { "epoch": 0.40675606008912796, "learning_rate": 8.67905418502772e-06, "loss": 3.205541687011719, "step": 337100 }, { "epoch": 0.40687672341161063, "learning_rate": 8.678650349559981e-06, "loss": 3.2392449951171876, "step": 337200 }, { "epoch": 0.40699738673409336, "learning_rate": 8.678246514092243e-06, "loss": 3.2341339111328127, "step": 337300 }, { "epoch": 0.40711805005657603, "learning_rate": 8.677842678624505e-06, "loss": 3.178050842285156, "step": 337400 }, { "epoch": 0.4072387133790587, "learning_rate": 8.677438843156767e-06, "loss": 3.2221990966796876, "step": 337500 }, { "epoch": 0.4073593767015414, "learning_rate": 8.677035007689027e-06, "loss": 3.2231076049804686, "step": 337600 }, { "epoch": 0.40748004002402405, "learning_rate": 8.676631172221289e-06, "loss": 3.219910888671875, "step": 337700 }, { "epoch": 0.4076007033465068, "learning_rate": 8.676227336753551e-06, "loss": 3.2170254516601564, "step": 337800 }, { "epoch": 0.40772136666898945, "learning_rate": 8.675823501285813e-06, "loss": 3.21661376953125, "step": 337900 }, { "epoch": 0.4078420299914721, "learning_rate": 8.675419665818075e-06, "loss": 3.2232647705078126, "step": 338000 }, { "epoch": 0.4079626933139548, "learning_rate": 8.675015830350337e-06, "loss": 3.235281982421875, "step": 338100 }, { "epoch": 0.40808335663643747, "learning_rate": 8.674611994882597e-06, "loss": 3.229799499511719, "step": 338200 }, { "epoch": 0.4082040199589202, "learning_rate": 8.67420815941486e-06, "loss": 3.2149139404296876, "step": 338300 }, { "epoch": 0.40832468328140287, "learning_rate": 8.67380432394712e-06, "loss": 3.2462454223632813, "step": 338400 }, { "epoch": 0.40844534660388554, "learning_rate": 8.673400488479382e-06, "loss": 3.2204629516601564, "step": 338500 }, { "epoch": 0.4085660099263682, "learning_rate": 8.672996653011644e-06, "loss": 3.2181387329101563, "step": 338600 }, { "epoch": 0.4086866732488509, "learning_rate": 8.672592817543906e-06, "loss": 3.219879455566406, "step": 338700 }, { "epoch": 0.4088073365713336, "learning_rate": 8.672188982076168e-06, "loss": 3.231728210449219, "step": 338800 }, { "epoch": 0.4089279998938163, "learning_rate": 8.67178514660843e-06, "loss": 3.204775085449219, "step": 338900 }, { "epoch": 0.40904866321629896, "learning_rate": 8.671381311140692e-06, "loss": 3.2208401489257814, "step": 339000 }, { "epoch": 0.40916932653878163, "learning_rate": 8.670977475672952e-06, "loss": 3.2086062622070313, "step": 339100 }, { "epoch": 0.4092899898612643, "learning_rate": 8.670573640205214e-06, "loss": 3.197918701171875, "step": 339200 }, { "epoch": 0.40941065318374703, "learning_rate": 8.670169804737476e-06, "loss": 3.2291751098632813, "step": 339300 }, { "epoch": 0.4095313165062297, "learning_rate": 8.669765969269736e-06, "loss": 3.208134765625, "step": 339400 }, { "epoch": 0.4096519798287124, "learning_rate": 8.669362133801998e-06, "loss": 3.2309054565429687, "step": 339500 }, { "epoch": 0.40977264315119505, "learning_rate": 8.66895829833426e-06, "loss": 3.2387905883789063, "step": 339600 }, { "epoch": 0.4098933064736777, "learning_rate": 8.668554462866522e-06, "loss": 3.212843933105469, "step": 339700 }, { "epoch": 0.41001396979616045, "learning_rate": 8.668150627398784e-06, "loss": 3.22937255859375, "step": 339800 }, { "epoch": 0.4101346331186431, "learning_rate": 8.667746791931046e-06, "loss": 3.1962744140625, "step": 339900 }, { "epoch": 0.4102552964411258, "learning_rate": 8.667342956463308e-06, "loss": 3.2106356811523438, "step": 340000 }, { "epoch": 0.41037595976360847, "learning_rate": 8.666939120995568e-06, "loss": 3.209013671875, "step": 340100 }, { "epoch": 0.4104966230860912, "learning_rate": 8.66653528552783e-06, "loss": 3.1933554077148436, "step": 340200 }, { "epoch": 0.41061728640857387, "learning_rate": 8.66613145006009e-06, "loss": 3.2256842041015625, "step": 340300 }, { "epoch": 0.41073794973105654, "learning_rate": 8.665727614592352e-06, "loss": 3.229443359375, "step": 340400 }, { "epoch": 0.4108586130535392, "learning_rate": 8.665323779124614e-06, "loss": 3.230039367675781, "step": 340500 }, { "epoch": 0.4109792763760219, "learning_rate": 8.664919943656876e-06, "loss": 3.2083975219726564, "step": 340600 }, { "epoch": 0.4110999396985046, "learning_rate": 8.664516108189138e-06, "loss": 3.2223355102539064, "step": 340700 }, { "epoch": 0.4112206030209873, "learning_rate": 8.6641122727214e-06, "loss": 3.223494567871094, "step": 340800 }, { "epoch": 0.41134126634346996, "learning_rate": 8.66370843725366e-06, "loss": 3.2406671142578123, "step": 340900 }, { "epoch": 0.41146192966595263, "learning_rate": 8.663304601785923e-06, "loss": 3.242525939941406, "step": 341000 }, { "epoch": 0.4115825929884353, "learning_rate": 8.662900766318185e-06, "loss": 3.222906494140625, "step": 341100 }, { "epoch": 0.41170325631091803, "learning_rate": 8.662496930850447e-06, "loss": 3.231730651855469, "step": 341200 }, { "epoch": 0.4118239196334007, "learning_rate": 8.662093095382707e-06, "loss": 3.198711242675781, "step": 341300 }, { "epoch": 0.4119445829558834, "learning_rate": 8.661689259914969e-06, "loss": 3.226524658203125, "step": 341400 }, { "epoch": 0.41206524627836605, "learning_rate": 8.661285424447231e-06, "loss": 3.202694091796875, "step": 341500 }, { "epoch": 0.4121859096008487, "learning_rate": 8.660881588979493e-06, "loss": 3.239063720703125, "step": 341600 }, { "epoch": 0.41230657292333145, "learning_rate": 8.660477753511753e-06, "loss": 3.2045864868164062, "step": 341700 }, { "epoch": 0.4124272362458141, "learning_rate": 8.660073918044015e-06, "loss": 3.181391296386719, "step": 341800 }, { "epoch": 0.4125478995682968, "learning_rate": 8.659670082576277e-06, "loss": 3.2037448120117187, "step": 341900 }, { "epoch": 0.41266856289077947, "learning_rate": 8.659266247108539e-06, "loss": 3.224603271484375, "step": 342000 }, { "epoch": 0.41278922621326214, "learning_rate": 8.658862411640801e-06, "loss": 3.2082894897460936, "step": 342100 }, { "epoch": 0.41290988953574487, "learning_rate": 8.658458576173061e-06, "loss": 3.183901062011719, "step": 342200 }, { "epoch": 0.41303055285822754, "learning_rate": 8.658054740705323e-06, "loss": 3.2185455322265626, "step": 342300 }, { "epoch": 0.4131512161807102, "learning_rate": 8.657650905237585e-06, "loss": 3.1830328369140624, "step": 342400 }, { "epoch": 0.4132718795031929, "learning_rate": 8.657247069769846e-06, "loss": 3.2155596923828127, "step": 342500 }, { "epoch": 0.4133925428256756, "learning_rate": 8.656843234302108e-06, "loss": 3.1984686279296874, "step": 342600 }, { "epoch": 0.4135132061481583, "learning_rate": 8.65643939883437e-06, "loss": 3.192720947265625, "step": 342700 }, { "epoch": 0.41363386947064096, "learning_rate": 8.656035563366632e-06, "loss": 3.2008929443359375, "step": 342800 }, { "epoch": 0.41375453279312363, "learning_rate": 8.655631727898894e-06, "loss": 3.2165261840820314, "step": 342900 }, { "epoch": 0.4138751961156063, "learning_rate": 8.655227892431156e-06, "loss": 3.2417007446289063, "step": 343000 }, { "epoch": 0.41399585943808903, "learning_rate": 8.654824056963418e-06, "loss": 3.205733337402344, "step": 343100 }, { "epoch": 0.4141165227605717, "learning_rate": 8.654420221495678e-06, "loss": 3.221959228515625, "step": 343200 }, { "epoch": 0.4142371860830544, "learning_rate": 8.65401638602794e-06, "loss": 3.19021728515625, "step": 343300 }, { "epoch": 0.41435784940553705, "learning_rate": 8.6536125505602e-06, "loss": 3.2108798217773438, "step": 343400 }, { "epoch": 0.4144785127280197, "learning_rate": 8.653208715092462e-06, "loss": 3.2116644287109377, "step": 343500 }, { "epoch": 0.41459917605050245, "learning_rate": 8.652804879624724e-06, "loss": 3.2212738037109374, "step": 343600 }, { "epoch": 0.4147198393729851, "learning_rate": 8.652401044156986e-06, "loss": 3.2033590698242187, "step": 343700 }, { "epoch": 0.4148405026954678, "learning_rate": 8.651997208689248e-06, "loss": 3.195982666015625, "step": 343800 }, { "epoch": 0.41496116601795047, "learning_rate": 8.65159337322151e-06, "loss": 3.2180380249023437, "step": 343900 }, { "epoch": 0.41508182934043314, "learning_rate": 8.651189537753772e-06, "loss": 3.1774774169921876, "step": 344000 }, { "epoch": 0.41520249266291587, "learning_rate": 8.650785702286032e-06, "loss": 3.210050048828125, "step": 344100 }, { "epoch": 0.41532315598539854, "learning_rate": 8.650381866818294e-06, "loss": 3.211160888671875, "step": 344200 }, { "epoch": 0.4154438193078812, "learning_rate": 8.649978031350556e-06, "loss": 3.1976614379882813, "step": 344300 }, { "epoch": 0.4155644826303639, "learning_rate": 8.649574195882817e-06, "loss": 3.190289306640625, "step": 344400 }, { "epoch": 0.41568514595284656, "learning_rate": 8.649170360415079e-06, "loss": 3.225347595214844, "step": 344500 }, { "epoch": 0.4158058092753293, "learning_rate": 8.64876652494734e-06, "loss": 3.202977294921875, "step": 344600 }, { "epoch": 0.41592647259781196, "learning_rate": 8.648362689479602e-06, "loss": 3.2093356323242186, "step": 344700 }, { "epoch": 0.41604713592029463, "learning_rate": 8.647958854011864e-06, "loss": 3.1954550170898437, "step": 344800 }, { "epoch": 0.4161677992427773, "learning_rate": 8.647555018544126e-06, "loss": 3.1998214721679688, "step": 344900 }, { "epoch": 0.41628846256526003, "learning_rate": 8.647151183076387e-06, "loss": 3.2063043212890623, "step": 345000 }, { "epoch": 0.4164091258877427, "learning_rate": 8.646747347608649e-06, "loss": 3.22114013671875, "step": 345100 }, { "epoch": 0.4165297892102254, "learning_rate": 8.64634351214091e-06, "loss": 3.223668518066406, "step": 345200 }, { "epoch": 0.41665045253270805, "learning_rate": 8.645939676673171e-06, "loss": 3.206558837890625, "step": 345300 }, { "epoch": 0.4167711158551907, "learning_rate": 8.645535841205433e-06, "loss": 3.205198059082031, "step": 345400 }, { "epoch": 0.41689177917767345, "learning_rate": 8.645132005737695e-06, "loss": 3.192651672363281, "step": 345500 }, { "epoch": 0.4170124425001561, "learning_rate": 8.644728170269957e-06, "loss": 3.2244189453125, "step": 345600 }, { "epoch": 0.4171331058226388, "learning_rate": 8.644324334802219e-06, "loss": 3.2088446044921874, "step": 345700 }, { "epoch": 0.41725376914512147, "learning_rate": 8.64392049933448e-06, "loss": 3.205760192871094, "step": 345800 }, { "epoch": 0.41737443246760414, "learning_rate": 8.643516663866741e-06, "loss": 3.2174618530273436, "step": 345900 }, { "epoch": 0.41749509579008687, "learning_rate": 8.643112828399003e-06, "loss": 3.2103399658203124, "step": 346000 }, { "epoch": 0.41761575911256954, "learning_rate": 8.642708992931265e-06, "loss": 3.2393667602539065, "step": 346100 }, { "epoch": 0.4177364224350522, "learning_rate": 8.642305157463527e-06, "loss": 3.209239196777344, "step": 346200 }, { "epoch": 0.4178570857575349, "learning_rate": 8.641901321995787e-06, "loss": 3.2006735229492187, "step": 346300 }, { "epoch": 0.41797774908001756, "learning_rate": 8.64149748652805e-06, "loss": 3.2213815307617186, "step": 346400 }, { "epoch": 0.4180984124025003, "learning_rate": 8.641093651060311e-06, "loss": 3.1774542236328127, "step": 346500 }, { "epoch": 0.41821907572498296, "learning_rate": 8.640689815592572e-06, "loss": 3.2271368408203127, "step": 346600 }, { "epoch": 0.41833973904746563, "learning_rate": 8.640285980124834e-06, "loss": 3.196385498046875, "step": 346700 }, { "epoch": 0.4184604023699483, "learning_rate": 8.639882144657096e-06, "loss": 3.2082119750976563, "step": 346800 }, { "epoch": 0.418581065692431, "learning_rate": 8.639478309189358e-06, "loss": 3.181191101074219, "step": 346900 }, { "epoch": 0.4187017290149137, "learning_rate": 8.63907447372162e-06, "loss": 3.21628173828125, "step": 347000 }, { "epoch": 0.4188223923373964, "learning_rate": 8.638670638253882e-06, "loss": 3.1893939208984374, "step": 347100 }, { "epoch": 0.41894305565987905, "learning_rate": 8.638266802786142e-06, "loss": 3.2127761840820312, "step": 347200 }, { "epoch": 0.4190637189823617, "learning_rate": 8.637862967318404e-06, "loss": 3.2235122680664063, "step": 347300 }, { "epoch": 0.4191843823048444, "learning_rate": 8.637459131850666e-06, "loss": 3.1816720581054687, "step": 347400 }, { "epoch": 0.4193050456273271, "learning_rate": 8.637055296382926e-06, "loss": 3.2108224487304686, "step": 347500 }, { "epoch": 0.4194257089498098, "learning_rate": 8.636651460915188e-06, "loss": 3.1819384765625, "step": 347600 }, { "epoch": 0.41954637227229247, "learning_rate": 8.63624762544745e-06, "loss": 3.185660705566406, "step": 347700 }, { "epoch": 0.41966703559477514, "learning_rate": 8.635843789979712e-06, "loss": 3.178056640625, "step": 347800 }, { "epoch": 0.41978769891725787, "learning_rate": 8.635439954511974e-06, "loss": 3.2183203125, "step": 347900 }, { "epoch": 0.41990836223974054, "learning_rate": 8.635036119044236e-06, "loss": 3.205784912109375, "step": 348000 }, { "epoch": 0.4200290255622232, "learning_rate": 8.634632283576498e-06, "loss": 3.205758361816406, "step": 348100 }, { "epoch": 0.4201496888847059, "learning_rate": 8.634228448108758e-06, "loss": 3.186525573730469, "step": 348200 }, { "epoch": 0.42027035220718856, "learning_rate": 8.63382461264102e-06, "loss": 3.185724182128906, "step": 348300 }, { "epoch": 0.4203910155296713, "learning_rate": 8.63342077717328e-06, "loss": 3.1968618774414064, "step": 348400 }, { "epoch": 0.42051167885215396, "learning_rate": 8.633016941705543e-06, "loss": 3.1868109130859374, "step": 348500 }, { "epoch": 0.42063234217463663, "learning_rate": 8.632613106237805e-06, "loss": 3.2233200073242188, "step": 348600 }, { "epoch": 0.4207530054971193, "learning_rate": 8.632209270770067e-06, "loss": 3.2074380493164063, "step": 348700 }, { "epoch": 0.420873668819602, "learning_rate": 8.631805435302329e-06, "loss": 3.1990170288085937, "step": 348800 }, { "epoch": 0.4209943321420847, "learning_rate": 8.63140159983459e-06, "loss": 3.205107421875, "step": 348900 }, { "epoch": 0.4211149954645674, "learning_rate": 8.63099776436685e-06, "loss": 3.180198059082031, "step": 349000 }, { "epoch": 0.42123565878705005, "learning_rate": 8.630593928899113e-06, "loss": 3.2174258422851563, "step": 349100 }, { "epoch": 0.4213563221095327, "learning_rate": 8.630190093431375e-06, "loss": 3.212493591308594, "step": 349200 }, { "epoch": 0.4214769854320154, "learning_rate": 8.629786257963637e-06, "loss": 3.188234558105469, "step": 349300 }, { "epoch": 0.4215976487544981, "learning_rate": 8.629382422495897e-06, "loss": 3.2077059936523438, "step": 349400 }, { "epoch": 0.4217183120769808, "learning_rate": 8.628978587028159e-06, "loss": 3.219124450683594, "step": 349500 }, { "epoch": 0.42183897539946347, "learning_rate": 8.628574751560421e-06, "loss": 3.2035372924804686, "step": 349600 }, { "epoch": 0.42195963872194614, "learning_rate": 8.628170916092683e-06, "loss": 3.1906072998046877, "step": 349700 }, { "epoch": 0.4220803020444288, "learning_rate": 8.627767080624943e-06, "loss": 3.204189453125, "step": 349800 }, { "epoch": 0.42220096536691154, "learning_rate": 8.627363245157205e-06, "loss": 3.211806640625, "step": 349900 }, { "epoch": 0.4223216286893942, "learning_rate": 8.626959409689467e-06, "loss": 3.218048095703125, "step": 350000 }, { "epoch": 0.4224422920118769, "learning_rate": 8.62655557422173e-06, "loss": 3.2010458374023436, "step": 350100 }, { "epoch": 0.42256295533435956, "learning_rate": 8.626151738753991e-06, "loss": 3.2027316284179688, "step": 350200 }, { "epoch": 0.4226836186568423, "learning_rate": 8.625747903286253e-06, "loss": 3.193138427734375, "step": 350300 }, { "epoch": 0.42280428197932496, "learning_rate": 8.625344067818513e-06, "loss": 3.2288323974609376, "step": 350400 }, { "epoch": 0.42292494530180763, "learning_rate": 8.624940232350775e-06, "loss": 3.1780859375, "step": 350500 }, { "epoch": 0.4230456086242903, "learning_rate": 8.624536396883037e-06, "loss": 3.2224600219726565, "step": 350600 }, { "epoch": 0.423166271946773, "learning_rate": 8.624132561415298e-06, "loss": 3.1776654052734377, "step": 350700 }, { "epoch": 0.4232869352692557, "learning_rate": 8.62372872594756e-06, "loss": 3.2015042114257812, "step": 350800 }, { "epoch": 0.4234075985917384, "learning_rate": 8.623324890479822e-06, "loss": 3.1626651000976564, "step": 350900 }, { "epoch": 0.42352826191422105, "learning_rate": 8.622921055012084e-06, "loss": 3.226488037109375, "step": 351000 }, { "epoch": 0.4236489252367037, "learning_rate": 8.622517219544346e-06, "loss": 3.1890530395507812, "step": 351100 }, { "epoch": 0.4237695885591864, "learning_rate": 8.622113384076608e-06, "loss": 3.1845584106445313, "step": 351200 }, { "epoch": 0.4238902518816691, "learning_rate": 8.621709548608868e-06, "loss": 3.2036788940429686, "step": 351300 }, { "epoch": 0.4240109152041518, "learning_rate": 8.62130571314113e-06, "loss": 3.202007141113281, "step": 351400 }, { "epoch": 0.42413157852663447, "learning_rate": 8.620901877673392e-06, "loss": 3.1648004150390623, "step": 351500 }, { "epoch": 0.42425224184911714, "learning_rate": 8.620498042205652e-06, "loss": 3.213977966308594, "step": 351600 }, { "epoch": 0.4243729051715998, "learning_rate": 8.620094206737914e-06, "loss": 3.1970068359375, "step": 351700 }, { "epoch": 0.42449356849408254, "learning_rate": 8.619690371270176e-06, "loss": 3.2080477905273437, "step": 351800 }, { "epoch": 0.4246142318165652, "learning_rate": 8.619286535802438e-06, "loss": 3.1725588989257814, "step": 351900 }, { "epoch": 0.4247348951390479, "learning_rate": 8.6188827003347e-06, "loss": 3.1949203491210936, "step": 352000 }, { "epoch": 0.42485555846153056, "learning_rate": 8.618478864866962e-06, "loss": 3.1900143432617187, "step": 352100 }, { "epoch": 0.42497622178401323, "learning_rate": 8.618075029399224e-06, "loss": 3.1891775512695313, "step": 352200 }, { "epoch": 0.42509688510649596, "learning_rate": 8.617671193931484e-06, "loss": 3.1977944946289063, "step": 352300 }, { "epoch": 0.42521754842897863, "learning_rate": 8.617267358463746e-06, "loss": 3.2065228271484374, "step": 352400 }, { "epoch": 0.4253382117514613, "learning_rate": 8.616863522996007e-06, "loss": 3.1953411865234376, "step": 352500 }, { "epoch": 0.425458875073944, "learning_rate": 8.616459687528269e-06, "loss": 3.1885186767578126, "step": 352600 }, { "epoch": 0.42557953839642665, "learning_rate": 8.61605585206053e-06, "loss": 3.1860955810546874, "step": 352700 }, { "epoch": 0.4257002017189094, "learning_rate": 8.615652016592793e-06, "loss": 3.1615304565429687, "step": 352800 }, { "epoch": 0.42582086504139205, "learning_rate": 8.615248181125055e-06, "loss": 3.2005215454101563, "step": 352900 }, { "epoch": 0.4259415283638747, "learning_rate": 8.614844345657317e-06, "loss": 3.1655239868164062, "step": 353000 }, { "epoch": 0.4260621916863574, "learning_rate": 8.614440510189577e-06, "loss": 3.1802490234375, "step": 353100 }, { "epoch": 0.4261828550088401, "learning_rate": 8.614036674721839e-06, "loss": 3.1738934326171875, "step": 353200 }, { "epoch": 0.4263035183313228, "learning_rate": 8.6136328392541e-06, "loss": 3.1935418701171874, "step": 353300 }, { "epoch": 0.42642418165380547, "learning_rate": 8.613229003786363e-06, "loss": 3.168765869140625, "step": 353400 }, { "epoch": 0.42654484497628814, "learning_rate": 8.612825168318623e-06, "loss": 3.1861041259765623, "step": 353500 }, { "epoch": 0.4266655082987708, "learning_rate": 8.612421332850885e-06, "loss": 3.189508972167969, "step": 353600 }, { "epoch": 0.42678617162125354, "learning_rate": 8.612017497383147e-06, "loss": 3.197337341308594, "step": 353700 }, { "epoch": 0.4269068349437362, "learning_rate": 8.611613661915409e-06, "loss": 3.181391296386719, "step": 353800 }, { "epoch": 0.4270274982662189, "learning_rate": 8.61120982644767e-06, "loss": 3.1841604614257815, "step": 353900 }, { "epoch": 0.42714816158870156, "learning_rate": 8.610805990979931e-06, "loss": 3.198205871582031, "step": 354000 }, { "epoch": 0.42726882491118423, "learning_rate": 8.610402155512193e-06, "loss": 3.211336975097656, "step": 354100 }, { "epoch": 0.42738948823366696, "learning_rate": 8.609998320044455e-06, "loss": 3.149882507324219, "step": 354200 }, { "epoch": 0.42751015155614963, "learning_rate": 8.609594484576717e-06, "loss": 3.202339782714844, "step": 354300 }, { "epoch": 0.4276308148786323, "learning_rate": 8.609190649108978e-06, "loss": 3.196155700683594, "step": 354400 }, { "epoch": 0.427751478201115, "learning_rate": 8.60878681364124e-06, "loss": 3.178345947265625, "step": 354500 }, { "epoch": 0.42787214152359765, "learning_rate": 8.608382978173501e-06, "loss": 3.175726318359375, "step": 354600 }, { "epoch": 0.4279928048460804, "learning_rate": 8.607979142705762e-06, "loss": 3.1696160888671874, "step": 354700 }, { "epoch": 0.42811346816856305, "learning_rate": 8.607575307238024e-06, "loss": 3.1580960083007814, "step": 354800 }, { "epoch": 0.4282341314910457, "learning_rate": 8.607171471770286e-06, "loss": 3.1801498413085936, "step": 354900 }, { "epoch": 0.4283547948135284, "learning_rate": 8.606767636302548e-06, "loss": 3.204053955078125, "step": 355000 }, { "epoch": 0.42847545813601107, "learning_rate": 8.60636380083481e-06, "loss": 3.1976077270507814, "step": 355100 }, { "epoch": 0.4285961214584938, "learning_rate": 8.605959965367072e-06, "loss": 3.179556579589844, "step": 355200 }, { "epoch": 0.42871678478097647, "learning_rate": 8.605556129899334e-06, "loss": 3.15634033203125, "step": 355300 }, { "epoch": 0.42883744810345914, "learning_rate": 8.605152294431594e-06, "loss": 3.1712017822265626, "step": 355400 }, { "epoch": 0.4289581114259418, "learning_rate": 8.604748458963856e-06, "loss": 3.194010925292969, "step": 355500 }, { "epoch": 0.42907877474842454, "learning_rate": 8.604344623496116e-06, "loss": 3.1828439331054685, "step": 355600 }, { "epoch": 0.4291994380709072, "learning_rate": 8.603940788028378e-06, "loss": 3.1830108642578123, "step": 355700 }, { "epoch": 0.4293201013933899, "learning_rate": 8.60353695256064e-06, "loss": 3.218525390625, "step": 355800 }, { "epoch": 0.42944076471587256, "learning_rate": 8.603133117092902e-06, "loss": 3.1855133056640623, "step": 355900 }, { "epoch": 0.42956142803835523, "learning_rate": 8.602729281625164e-06, "loss": 3.20457763671875, "step": 356000 }, { "epoch": 0.42968209136083796, "learning_rate": 8.602325446157426e-06, "loss": 3.16480224609375, "step": 356100 }, { "epoch": 0.42980275468332063, "learning_rate": 8.601921610689688e-06, "loss": 3.1808721923828127, "step": 356200 }, { "epoch": 0.4299234180058033, "learning_rate": 8.601517775221948e-06, "loss": 3.193555908203125, "step": 356300 }, { "epoch": 0.430044081328286, "learning_rate": 8.60111393975421e-06, "loss": 3.164589538574219, "step": 356400 }, { "epoch": 0.43016474465076865, "learning_rate": 8.600710104286472e-06, "loss": 3.199861755371094, "step": 356500 }, { "epoch": 0.4302854079732514, "learning_rate": 8.600306268818733e-06, "loss": 3.16435302734375, "step": 356600 }, { "epoch": 0.43040607129573405, "learning_rate": 8.599902433350995e-06, "loss": 3.188094177246094, "step": 356700 }, { "epoch": 0.4305267346182167, "learning_rate": 8.599498597883257e-06, "loss": 3.175874938964844, "step": 356800 }, { "epoch": 0.4306473979406994, "learning_rate": 8.599094762415519e-06, "loss": 3.1786093139648437, "step": 356900 }, { "epoch": 0.43076806126318207, "learning_rate": 8.59869092694778e-06, "loss": 3.161024475097656, "step": 357000 }, { "epoch": 0.4308887245856648, "learning_rate": 8.598287091480043e-06, "loss": 3.1848822021484375, "step": 357100 }, { "epoch": 0.43100938790814747, "learning_rate": 8.597883256012303e-06, "loss": 3.173997802734375, "step": 357200 }, { "epoch": 0.43113005123063014, "learning_rate": 8.597479420544565e-06, "loss": 3.179041442871094, "step": 357300 }, { "epoch": 0.4312507145531128, "learning_rate": 8.597075585076827e-06, "loss": 3.166010437011719, "step": 357400 }, { "epoch": 0.4313713778755955, "learning_rate": 8.596671749609087e-06, "loss": 3.1589715576171873, "step": 357500 }, { "epoch": 0.4314920411980782, "learning_rate": 8.596267914141349e-06, "loss": 3.189253234863281, "step": 357600 }, { "epoch": 0.4316127045205609, "learning_rate": 8.595864078673611e-06, "loss": 3.1857418823242187, "step": 357700 }, { "epoch": 0.43173336784304356, "learning_rate": 8.595460243205873e-06, "loss": 3.1790679931640624, "step": 357800 }, { "epoch": 0.43185403116552623, "learning_rate": 8.595056407738135e-06, "loss": 3.1831463623046874, "step": 357900 }, { "epoch": 0.43197469448800896, "learning_rate": 8.594652572270395e-06, "loss": 3.1714358520507813, "step": 358000 }, { "epoch": 0.43209535781049163, "learning_rate": 8.594248736802657e-06, "loss": 3.189139099121094, "step": 358100 }, { "epoch": 0.4322160211329743, "learning_rate": 8.59384490133492e-06, "loss": 3.1406118774414065, "step": 358200 }, { "epoch": 0.432336684455457, "learning_rate": 8.593441065867181e-06, "loss": 3.1500439453125, "step": 358300 }, { "epoch": 0.43245734777793965, "learning_rate": 8.593037230399443e-06, "loss": 3.208973693847656, "step": 358400 }, { "epoch": 0.4325780111004224, "learning_rate": 8.592633394931704e-06, "loss": 3.1829348754882814, "step": 358500 }, { "epoch": 0.43269867442290505, "learning_rate": 8.592229559463966e-06, "loss": 3.1675155639648436, "step": 358600 }, { "epoch": 0.4328193377453877, "learning_rate": 8.591825723996228e-06, "loss": 3.153431701660156, "step": 358700 }, { "epoch": 0.4329400010678704, "learning_rate": 8.591421888528488e-06, "loss": 3.1683740234375, "step": 358800 }, { "epoch": 0.43306066439035307, "learning_rate": 8.59101805306075e-06, "loss": 3.2201156616210938, "step": 358900 }, { "epoch": 0.4331813277128358, "learning_rate": 8.590614217593012e-06, "loss": 3.1861221313476564, "step": 359000 }, { "epoch": 0.43330199103531847, "learning_rate": 8.590210382125274e-06, "loss": 3.2081201171875, "step": 359100 }, { "epoch": 0.43342265435780114, "learning_rate": 8.589806546657536e-06, "loss": 3.2040924072265624, "step": 359200 }, { "epoch": 0.4335433176802838, "learning_rate": 8.589402711189798e-06, "loss": 3.16206298828125, "step": 359300 }, { "epoch": 0.4336639810027665, "learning_rate": 8.588998875722058e-06, "loss": 3.1880618286132814, "step": 359400 }, { "epoch": 0.4337846443252492, "learning_rate": 8.58859504025432e-06, "loss": 3.1820343017578123, "step": 359500 }, { "epoch": 0.4339053076477319, "learning_rate": 8.588191204786582e-06, "loss": 3.1609405517578124, "step": 359600 }, { "epoch": 0.43402597097021456, "learning_rate": 8.587787369318842e-06, "loss": 3.1588265991210935, "step": 359700 }, { "epoch": 0.43414663429269723, "learning_rate": 8.587383533851104e-06, "loss": 3.148121032714844, "step": 359800 }, { "epoch": 0.4342672976151799, "learning_rate": 8.586979698383366e-06, "loss": 3.1572726440429686, "step": 359900 }, { "epoch": 0.43438796093766263, "learning_rate": 8.586575862915628e-06, "loss": 3.2002822875976564, "step": 360000 }, { "epoch": 0.4345086242601453, "learning_rate": 8.58617202744789e-06, "loss": 3.180852966308594, "step": 360100 }, { "epoch": 0.434629287582628, "learning_rate": 8.585768191980152e-06, "loss": 3.173353576660156, "step": 360200 }, { "epoch": 0.43474995090511065, "learning_rate": 8.585364356512414e-06, "loss": 3.1801852416992187, "step": 360300 }, { "epoch": 0.4348706142275933, "learning_rate": 8.584960521044674e-06, "loss": 3.172731628417969, "step": 360400 }, { "epoch": 0.43499127755007605, "learning_rate": 8.584556685576936e-06, "loss": 3.1771340942382813, "step": 360500 }, { "epoch": 0.4351119408725587, "learning_rate": 8.584152850109197e-06, "loss": 3.1508392333984374, "step": 360600 }, { "epoch": 0.4352326041950414, "learning_rate": 8.583749014641459e-06, "loss": 3.1647915649414062, "step": 360700 }, { "epoch": 0.43535326751752407, "learning_rate": 8.58334517917372e-06, "loss": 3.1881646728515625, "step": 360800 }, { "epoch": 0.4354739308400068, "learning_rate": 8.582941343705983e-06, "loss": 3.12959716796875, "step": 360900 }, { "epoch": 0.43559459416248947, "learning_rate": 8.582537508238245e-06, "loss": 3.2009005737304688, "step": 361000 }, { "epoch": 0.43571525748497214, "learning_rate": 8.582133672770507e-06, "loss": 3.1655712890625, "step": 361100 }, { "epoch": 0.4358359208074548, "learning_rate": 8.581729837302769e-06, "loss": 3.142994384765625, "step": 361200 }, { "epoch": 0.4359565841299375, "learning_rate": 8.581326001835029e-06, "loss": 3.1704888916015626, "step": 361300 }, { "epoch": 0.4360772474524202, "learning_rate": 8.580922166367291e-06, "loss": 3.151007080078125, "step": 361400 }, { "epoch": 0.4361979107749029, "learning_rate": 8.580518330899553e-06, "loss": 3.16232666015625, "step": 361500 }, { "epoch": 0.43631857409738556, "learning_rate": 8.580114495431813e-06, "loss": 3.1726116943359375, "step": 361600 }, { "epoch": 0.43643923741986823, "learning_rate": 8.579710659964075e-06, "loss": 3.1850286865234376, "step": 361700 }, { "epoch": 0.4365599007423509, "learning_rate": 8.579306824496337e-06, "loss": 3.180714416503906, "step": 361800 }, { "epoch": 0.43668056406483363, "learning_rate": 8.578902989028599e-06, "loss": 3.177583923339844, "step": 361900 }, { "epoch": 0.4368012273873163, "learning_rate": 8.578499153560861e-06, "loss": 3.175817565917969, "step": 362000 }, { "epoch": 0.436921890709799, "learning_rate": 8.578095318093121e-06, "loss": 3.182248840332031, "step": 362100 }, { "epoch": 0.43704255403228165, "learning_rate": 8.577691482625383e-06, "loss": 3.1497857666015623, "step": 362200 }, { "epoch": 0.4371632173547643, "learning_rate": 8.577287647157645e-06, "loss": 3.1653057861328127, "step": 362300 }, { "epoch": 0.43728388067724705, "learning_rate": 8.576883811689907e-06, "loss": 3.191617431640625, "step": 362400 }, { "epoch": 0.4374045439997297, "learning_rate": 8.576479976222168e-06, "loss": 3.169830017089844, "step": 362500 }, { "epoch": 0.4375252073222124, "learning_rate": 8.57607614075443e-06, "loss": 3.199478759765625, "step": 362600 }, { "epoch": 0.43764587064469507, "learning_rate": 8.575672305286692e-06, "loss": 3.1641168212890625, "step": 362700 }, { "epoch": 0.43776653396717774, "learning_rate": 8.575268469818954e-06, "loss": 3.182425842285156, "step": 362800 }, { "epoch": 0.43788719728966047, "learning_rate": 8.574864634351214e-06, "loss": 3.176493835449219, "step": 362900 }, { "epoch": 0.43800786061214314, "learning_rate": 8.574460798883476e-06, "loss": 3.163438415527344, "step": 363000 }, { "epoch": 0.4381285239346258, "learning_rate": 8.574056963415738e-06, "loss": 3.163382568359375, "step": 363100 }, { "epoch": 0.4382491872571085, "learning_rate": 8.573653127948e-06, "loss": 3.1730023193359376, "step": 363200 }, { "epoch": 0.4383698505795912, "learning_rate": 8.573249292480262e-06, "loss": 3.1458984375, "step": 363300 }, { "epoch": 0.4384905139020739, "learning_rate": 8.572845457012524e-06, "loss": 3.185274963378906, "step": 363400 }, { "epoch": 0.43861117722455656, "learning_rate": 8.572441621544784e-06, "loss": 3.1657293701171874, "step": 363500 }, { "epoch": 0.43873184054703923, "learning_rate": 8.572037786077046e-06, "loss": 3.1654953002929687, "step": 363600 }, { "epoch": 0.4388525038695219, "learning_rate": 8.571633950609306e-06, "loss": 3.162891540527344, "step": 363700 }, { "epoch": 0.43897316719200463, "learning_rate": 8.571230115141568e-06, "loss": 3.1667965698242186, "step": 363800 }, { "epoch": 0.4390938305144873, "learning_rate": 8.57082627967383e-06, "loss": 3.185269775390625, "step": 363900 }, { "epoch": 0.43921449383697, "learning_rate": 8.570422444206092e-06, "loss": 3.1614620971679686, "step": 364000 }, { "epoch": 0.43933515715945265, "learning_rate": 8.570018608738354e-06, "loss": 3.1583599853515625, "step": 364100 }, { "epoch": 0.4394558204819353, "learning_rate": 8.569614773270616e-06, "loss": 3.1524197387695314, "step": 364200 }, { "epoch": 0.43957648380441805, "learning_rate": 8.569210937802878e-06, "loss": 3.1714382934570313, "step": 364300 }, { "epoch": 0.4396971471269007, "learning_rate": 8.56880710233514e-06, "loss": 3.1352389526367186, "step": 364400 }, { "epoch": 0.4398178104493834, "learning_rate": 8.5684032668674e-06, "loss": 3.155145568847656, "step": 364500 }, { "epoch": 0.43993847377186607, "learning_rate": 8.567999431399662e-06, "loss": 3.165085754394531, "step": 364600 }, { "epoch": 0.44005913709434874, "learning_rate": 8.567595595931923e-06, "loss": 3.1434954833984374, "step": 364700 }, { "epoch": 0.44017980041683147, "learning_rate": 8.567191760464185e-06, "loss": 3.1698394775390626, "step": 364800 }, { "epoch": 0.44030046373931414, "learning_rate": 8.566787924996447e-06, "loss": 3.172398681640625, "step": 364900 }, { "epoch": 0.4404211270617968, "learning_rate": 8.566384089528709e-06, "loss": 3.1468621826171876, "step": 365000 }, { "epoch": 0.4405417903842795, "learning_rate": 8.56598025406097e-06, "loss": 3.1481427001953124, "step": 365100 }, { "epoch": 0.44066245370676216, "learning_rate": 8.565576418593233e-06, "loss": 3.1734017944335937, "step": 365200 }, { "epoch": 0.4407831170292449, "learning_rate": 8.565172583125495e-06, "loss": 3.161773681640625, "step": 365300 }, { "epoch": 0.44090378035172756, "learning_rate": 8.564768747657755e-06, "loss": 3.16112060546875, "step": 365400 }, { "epoch": 0.44102444367421023, "learning_rate": 8.564364912190017e-06, "loss": 3.160003356933594, "step": 365500 }, { "epoch": 0.4411451069966929, "learning_rate": 8.563961076722279e-06, "loss": 3.1549221801757814, "step": 365600 }, { "epoch": 0.4412657703191756, "learning_rate": 8.56355724125454e-06, "loss": 3.1470736694335937, "step": 365700 }, { "epoch": 0.4413864336416583, "learning_rate": 8.563153405786801e-06, "loss": 3.1689163208007813, "step": 365800 }, { "epoch": 0.441507096964141, "learning_rate": 8.562749570319063e-06, "loss": 3.151278076171875, "step": 365900 }, { "epoch": 0.44162776028662365, "learning_rate": 8.562345734851325e-06, "loss": 3.18524658203125, "step": 366000 }, { "epoch": 0.4417484236091063, "learning_rate": 8.561941899383587e-06, "loss": 3.165556640625, "step": 366100 }, { "epoch": 0.44186908693158905, "learning_rate": 8.561538063915847e-06, "loss": 3.1412313842773436, "step": 366200 }, { "epoch": 0.4419897502540717, "learning_rate": 8.56113422844811e-06, "loss": 3.1581845092773437, "step": 366300 }, { "epoch": 0.4421104135765544, "learning_rate": 8.560730392980371e-06, "loss": 3.1530862426757813, "step": 366400 }, { "epoch": 0.44223107689903707, "learning_rate": 8.560326557512633e-06, "loss": 3.1590106201171877, "step": 366500 }, { "epoch": 0.44235174022151974, "learning_rate": 8.559922722044894e-06, "loss": 3.1573910522460937, "step": 366600 }, { "epoch": 0.44247240354400247, "learning_rate": 8.559518886577156e-06, "loss": 3.164007263183594, "step": 366700 }, { "epoch": 0.44259306686648514, "learning_rate": 8.559115051109418e-06, "loss": 3.171766662597656, "step": 366800 }, { "epoch": 0.4427137301889678, "learning_rate": 8.55871121564168e-06, "loss": 3.141598815917969, "step": 366900 }, { "epoch": 0.4428343935114505, "learning_rate": 8.55830738017394e-06, "loss": 3.174053039550781, "step": 367000 }, { "epoch": 0.44295505683393316, "learning_rate": 8.557903544706202e-06, "loss": 3.1652215576171874, "step": 367100 }, { "epoch": 0.4430757201564159, "learning_rate": 8.557499709238464e-06, "loss": 3.15250244140625, "step": 367200 }, { "epoch": 0.44319638347889856, "learning_rate": 8.557095873770726e-06, "loss": 3.1612918090820314, "step": 367300 }, { "epoch": 0.44331704680138123, "learning_rate": 8.556692038302988e-06, "loss": 3.167114562988281, "step": 367400 }, { "epoch": 0.4434377101238639, "learning_rate": 8.55628820283525e-06, "loss": 3.20229248046875, "step": 367500 }, { "epoch": 0.4435583734463466, "learning_rate": 8.55588436736751e-06, "loss": 3.1544873046875, "step": 367600 }, { "epoch": 0.4436790367688293, "learning_rate": 8.555480531899772e-06, "loss": 3.155821533203125, "step": 367700 }, { "epoch": 0.443799700091312, "learning_rate": 8.555076696432032e-06, "loss": 3.1639593505859374, "step": 367800 }, { "epoch": 0.44392036341379465, "learning_rate": 8.554672860964294e-06, "loss": 3.1481503295898436, "step": 367900 }, { "epoch": 0.4440410267362773, "learning_rate": 8.554269025496556e-06, "loss": 3.1459994506835938, "step": 368000 }, { "epoch": 0.44416169005876, "learning_rate": 8.553865190028818e-06, "loss": 3.171048889160156, "step": 368100 }, { "epoch": 0.4442823533812427, "learning_rate": 8.55346135456108e-06, "loss": 3.1597695922851563, "step": 368200 }, { "epoch": 0.4444030167037254, "learning_rate": 8.553057519093342e-06, "loss": 3.1739923095703126, "step": 368300 }, { "epoch": 0.44452368002620807, "learning_rate": 8.552653683625604e-06, "loss": 3.160904541015625, "step": 368400 }, { "epoch": 0.44464434334869074, "learning_rate": 8.552249848157865e-06, "loss": 3.1608096313476564, "step": 368500 }, { "epoch": 0.44476500667117347, "learning_rate": 8.551846012690127e-06, "loss": 3.1560687255859374, "step": 368600 }, { "epoch": 0.44488566999365614, "learning_rate": 8.551442177222388e-06, "loss": 3.1521368408203125, "step": 368700 }, { "epoch": 0.4450063333161388, "learning_rate": 8.551038341754649e-06, "loss": 3.1734774780273436, "step": 368800 }, { "epoch": 0.4451269966386215, "learning_rate": 8.55063450628691e-06, "loss": 3.1270574951171874, "step": 368900 }, { "epoch": 0.44524765996110416, "learning_rate": 8.550230670819173e-06, "loss": 3.16264404296875, "step": 369000 }, { "epoch": 0.4453683232835869, "learning_rate": 8.549826835351435e-06, "loss": 3.163631591796875, "step": 369100 }, { "epoch": 0.44548898660606956, "learning_rate": 8.549422999883697e-06, "loss": 3.1469546508789064, "step": 369200 }, { "epoch": 0.44560964992855223, "learning_rate": 8.549019164415959e-06, "loss": 3.161377258300781, "step": 369300 }, { "epoch": 0.4457303132510349, "learning_rate": 8.548615328948219e-06, "loss": 3.173736877441406, "step": 369400 }, { "epoch": 0.4458509765735176, "learning_rate": 8.548211493480481e-06, "loss": 3.159951477050781, "step": 369500 }, { "epoch": 0.4459716398960003, "learning_rate": 8.547807658012743e-06, "loss": 3.1467889404296874, "step": 369600 }, { "epoch": 0.446092303218483, "learning_rate": 8.547403822545003e-06, "loss": 3.132040710449219, "step": 369700 }, { "epoch": 0.44621296654096565, "learning_rate": 8.546999987077265e-06, "loss": 3.169666748046875, "step": 369800 }, { "epoch": 0.4463336298634483, "learning_rate": 8.546596151609527e-06, "loss": 3.1499310302734376, "step": 369900 }, { "epoch": 0.446454293185931, "learning_rate": 8.54619231614179e-06, "loss": 3.154795837402344, "step": 370000 }, { "epoch": 0.4465749565084137, "learning_rate": 8.545788480674051e-06, "loss": 3.162998046875, "step": 370100 }, { "epoch": 0.4466956198308964, "learning_rate": 8.545384645206311e-06, "loss": 3.1742813110351564, "step": 370200 }, { "epoch": 0.44681628315337907, "learning_rate": 8.544980809738573e-06, "loss": 3.151202392578125, "step": 370300 }, { "epoch": 0.44693694647586174, "learning_rate": 8.544576974270835e-06, "loss": 3.169294738769531, "step": 370400 }, { "epoch": 0.4470576097983444, "learning_rate": 8.544173138803097e-06, "loss": 3.1597335815429686, "step": 370500 }, { "epoch": 0.44717827312082714, "learning_rate": 8.54376930333536e-06, "loss": 3.1634405517578124, "step": 370600 }, { "epoch": 0.4472989364433098, "learning_rate": 8.54336546786762e-06, "loss": 3.171553955078125, "step": 370700 }, { "epoch": 0.4474195997657925, "learning_rate": 8.542961632399882e-06, "loss": 3.1269326782226563, "step": 370800 }, { "epoch": 0.44754026308827516, "learning_rate": 8.542557796932144e-06, "loss": 3.1421353149414064, "step": 370900 }, { "epoch": 0.4476609264107579, "learning_rate": 8.542153961464406e-06, "loss": 3.181333312988281, "step": 371000 }, { "epoch": 0.44778158973324056, "learning_rate": 8.541750125996666e-06, "loss": 3.144024658203125, "step": 371100 }, { "epoch": 0.44790225305572323, "learning_rate": 8.541346290528928e-06, "loss": 3.155126037597656, "step": 371200 }, { "epoch": 0.4480229163782059, "learning_rate": 8.54094245506119e-06, "loss": 3.1495547485351563, "step": 371300 }, { "epoch": 0.4481435797006886, "learning_rate": 8.540538619593452e-06, "loss": 3.1388092041015625, "step": 371400 }, { "epoch": 0.4482642430231713, "learning_rate": 8.540134784125714e-06, "loss": 3.139412841796875, "step": 371500 }, { "epoch": 0.448384906345654, "learning_rate": 8.539730948657974e-06, "loss": 3.142877197265625, "step": 371600 }, { "epoch": 0.44850556966813665, "learning_rate": 8.539327113190236e-06, "loss": 3.1486831665039063, "step": 371700 }, { "epoch": 0.4486262329906193, "learning_rate": 8.538923277722498e-06, "loss": 3.1674664306640623, "step": 371800 }, { "epoch": 0.448746896313102, "learning_rate": 8.538519442254758e-06, "loss": 3.1398745727539064, "step": 371900 }, { "epoch": 0.4488675596355847, "learning_rate": 8.53811560678702e-06, "loss": 3.159801025390625, "step": 372000 }, { "epoch": 0.4489882229580674, "learning_rate": 8.537711771319282e-06, "loss": 3.141025390625, "step": 372100 }, { "epoch": 0.44910888628055007, "learning_rate": 8.537307935851544e-06, "loss": 3.1711880493164064, "step": 372200 }, { "epoch": 0.44922954960303274, "learning_rate": 8.536904100383806e-06, "loss": 3.163363037109375, "step": 372300 }, { "epoch": 0.4493502129255154, "learning_rate": 8.536500264916068e-06, "loss": 3.156895751953125, "step": 372400 }, { "epoch": 0.44947087624799814, "learning_rate": 8.53609642944833e-06, "loss": 3.151407470703125, "step": 372500 }, { "epoch": 0.4495915395704808, "learning_rate": 8.53569259398059e-06, "loss": 3.171239013671875, "step": 372600 }, { "epoch": 0.4497122028929635, "learning_rate": 8.535288758512853e-06, "loss": 3.171841735839844, "step": 372700 }, { "epoch": 0.44983286621544616, "learning_rate": 8.534884923045113e-06, "loss": 3.154608154296875, "step": 372800 }, { "epoch": 0.44995352953792883, "learning_rate": 8.534481087577375e-06, "loss": 3.1462692260742187, "step": 372900 }, { "epoch": 0.45007419286041156, "learning_rate": 8.534077252109637e-06, "loss": 3.1602447509765623, "step": 373000 }, { "epoch": 0.45019485618289423, "learning_rate": 8.533673416641899e-06, "loss": 3.143274230957031, "step": 373100 }, { "epoch": 0.4503155195053769, "learning_rate": 8.53326958117416e-06, "loss": 3.123106689453125, "step": 373200 }, { "epoch": 0.4504361828278596, "learning_rate": 8.532865745706423e-06, "loss": 3.1546035766601563, "step": 373300 }, { "epoch": 0.45055684615034225, "learning_rate": 8.532461910238685e-06, "loss": 3.1678475952148437, "step": 373400 }, { "epoch": 0.450677509472825, "learning_rate": 8.532058074770945e-06, "loss": 3.1607479858398437, "step": 373500 }, { "epoch": 0.45079817279530765, "learning_rate": 8.531654239303207e-06, "loss": 3.16156005859375, "step": 373600 }, { "epoch": 0.4509188361177903, "learning_rate": 8.531250403835469e-06, "loss": 3.14201416015625, "step": 373700 }, { "epoch": 0.451039499440273, "learning_rate": 8.53084656836773e-06, "loss": 3.137664489746094, "step": 373800 }, { "epoch": 0.4511601627627557, "learning_rate": 8.530442732899991e-06, "loss": 3.1570562744140624, "step": 373900 }, { "epoch": 0.4512808260852384, "learning_rate": 8.530038897432253e-06, "loss": 3.12742919921875, "step": 374000 }, { "epoch": 0.45140148940772107, "learning_rate": 8.529635061964515e-06, "loss": 3.1410791015625, "step": 374100 }, { "epoch": 0.45152215273020374, "learning_rate": 8.529231226496777e-06, "loss": 3.154504699707031, "step": 374200 }, { "epoch": 0.4516428160526864, "learning_rate": 8.528827391029037e-06, "loss": 3.14399169921875, "step": 374300 }, { "epoch": 0.45176347937516914, "learning_rate": 8.5284235555613e-06, "loss": 3.1732467651367187, "step": 374400 }, { "epoch": 0.4518841426976518, "learning_rate": 8.528019720093561e-06, "loss": 3.139784240722656, "step": 374500 }, { "epoch": 0.4520048060201345, "learning_rate": 8.527615884625823e-06, "loss": 3.146400146484375, "step": 374600 }, { "epoch": 0.45212546934261716, "learning_rate": 8.527212049158084e-06, "loss": 3.155608825683594, "step": 374700 }, { "epoch": 0.45224613266509983, "learning_rate": 8.526808213690346e-06, "loss": 3.1358660888671874, "step": 374800 }, { "epoch": 0.45236679598758256, "learning_rate": 8.526404378222608e-06, "loss": 3.165531005859375, "step": 374900 }, { "epoch": 0.45248745931006523, "learning_rate": 8.52600054275487e-06, "loss": 3.11739013671875, "step": 375000 }, { "epoch": 0.4526081226325479, "learning_rate": 8.52559670728713e-06, "loss": 3.1539596557617187, "step": 375100 }, { "epoch": 0.4527287859550306, "learning_rate": 8.525192871819392e-06, "loss": 3.1415203857421874, "step": 375200 }, { "epoch": 0.45284944927751325, "learning_rate": 8.524789036351654e-06, "loss": 3.14402587890625, "step": 375300 }, { "epoch": 0.452970112599996, "learning_rate": 8.524385200883916e-06, "loss": 3.143804931640625, "step": 375400 }, { "epoch": 0.45309077592247865, "learning_rate": 8.523981365416178e-06, "loss": 3.127929382324219, "step": 375500 }, { "epoch": 0.4532114392449613, "learning_rate": 8.52357752994844e-06, "loss": 3.1357431030273437, "step": 375600 }, { "epoch": 0.453332102567444, "learning_rate": 8.5231736944807e-06, "loss": 3.1591168212890626, "step": 375700 }, { "epoch": 0.45345276588992667, "learning_rate": 8.522769859012962e-06, "loss": 3.1183770751953124, "step": 375800 }, { "epoch": 0.4535734292124094, "learning_rate": 8.522366023545224e-06, "loss": 3.164037780761719, "step": 375900 }, { "epoch": 0.45369409253489207, "learning_rate": 8.521962188077484e-06, "loss": 3.135923156738281, "step": 376000 }, { "epoch": 0.45381475585737474, "learning_rate": 8.521558352609746e-06, "loss": 3.126140441894531, "step": 376100 }, { "epoch": 0.4539354191798574, "learning_rate": 8.521154517142008e-06, "loss": 3.12957275390625, "step": 376200 }, { "epoch": 0.45405608250234014, "learning_rate": 8.52075068167427e-06, "loss": 3.1425747680664062, "step": 376300 }, { "epoch": 0.4541767458248228, "learning_rate": 8.520346846206532e-06, "loss": 3.1216506958007812, "step": 376400 }, { "epoch": 0.4542974091473055, "learning_rate": 8.519943010738794e-06, "loss": 3.1401470947265624, "step": 376500 }, { "epoch": 0.45441807246978816, "learning_rate": 8.519539175271055e-06, "loss": 3.150085144042969, "step": 376600 }, { "epoch": 0.45453873579227083, "learning_rate": 8.519135339803317e-06, "loss": 3.127613525390625, "step": 376700 }, { "epoch": 0.45465939911475356, "learning_rate": 8.518731504335579e-06, "loss": 3.1407650756835936, "step": 376800 }, { "epoch": 0.45478006243723623, "learning_rate": 8.518327668867839e-06, "loss": 3.147749938964844, "step": 376900 }, { "epoch": 0.4549007257597189, "learning_rate": 8.5179238334001e-06, "loss": 3.1725, "step": 377000 }, { "epoch": 0.4550213890822016, "learning_rate": 8.517519997932363e-06, "loss": 3.126537170410156, "step": 377100 }, { "epoch": 0.45514205240468425, "learning_rate": 8.517116162464625e-06, "loss": 3.153029479980469, "step": 377200 }, { "epoch": 0.455262715727167, "learning_rate": 8.516712326996887e-06, "loss": 3.0733352661132813, "step": 377300 }, { "epoch": 0.45538337904964965, "learning_rate": 8.516308491529149e-06, "loss": 3.164046630859375, "step": 377400 }, { "epoch": 0.4555040423721323, "learning_rate": 8.51590465606141e-06, "loss": 3.1463336181640624, "step": 377500 }, { "epoch": 0.455624705694615, "learning_rate": 8.515500820593671e-06, "loss": 3.1542959594726563, "step": 377600 }, { "epoch": 0.45574536901709767, "learning_rate": 8.515096985125933e-06, "loss": 3.1383633422851562, "step": 377700 }, { "epoch": 0.4558660323395804, "learning_rate": 8.514693149658193e-06, "loss": 3.134474182128906, "step": 377800 }, { "epoch": 0.45598669566206307, "learning_rate": 8.514289314190455e-06, "loss": 3.1476385498046877, "step": 377900 }, { "epoch": 0.45610735898454574, "learning_rate": 8.513885478722717e-06, "loss": 3.119512939453125, "step": 378000 }, { "epoch": 0.4562280223070284, "learning_rate": 8.51348164325498e-06, "loss": 3.1564996337890623, "step": 378100 }, { "epoch": 0.4563486856295111, "learning_rate": 8.513077807787241e-06, "loss": 3.1333682250976564, "step": 378200 }, { "epoch": 0.4564693489519938, "learning_rate": 8.512673972319503e-06, "loss": 3.143529052734375, "step": 378300 }, { "epoch": 0.4565900122744765, "learning_rate": 8.512270136851764e-06, "loss": 3.1058917236328125, "step": 378400 }, { "epoch": 0.45671067559695916, "learning_rate": 8.511866301384025e-06, "loss": 3.1404119873046876, "step": 378500 }, { "epoch": 0.45683133891944183, "learning_rate": 8.511462465916287e-06, "loss": 3.129571533203125, "step": 378600 }, { "epoch": 0.4569520022419245, "learning_rate": 8.51105863044855e-06, "loss": 3.1644186401367187, "step": 378700 }, { "epoch": 0.45707266556440723, "learning_rate": 8.51065479498081e-06, "loss": 3.132996826171875, "step": 378800 }, { "epoch": 0.4571933288868899, "learning_rate": 8.510250959513072e-06, "loss": 3.121293640136719, "step": 378900 }, { "epoch": 0.4573139922093726, "learning_rate": 8.509847124045334e-06, "loss": 3.137345886230469, "step": 379000 }, { "epoch": 0.45743465553185525, "learning_rate": 8.509443288577596e-06, "loss": 3.122278747558594, "step": 379100 }, { "epoch": 0.457555318854338, "learning_rate": 8.509039453109856e-06, "loss": 3.1400909423828125, "step": 379200 }, { "epoch": 0.45767598217682065, "learning_rate": 8.508635617642118e-06, "loss": 3.145557861328125, "step": 379300 }, { "epoch": 0.4577966454993033, "learning_rate": 8.50823178217438e-06, "loss": 3.1471456909179687, "step": 379400 }, { "epoch": 0.457917308821786, "learning_rate": 8.507827946706642e-06, "loss": 3.1113134765625, "step": 379500 }, { "epoch": 0.45803797214426867, "learning_rate": 8.507424111238904e-06, "loss": 3.124092712402344, "step": 379600 }, { "epoch": 0.4581586354667514, "learning_rate": 8.507020275771166e-06, "loss": 3.16373046875, "step": 379700 }, { "epoch": 0.45827929878923407, "learning_rate": 8.506616440303426e-06, "loss": 3.09302490234375, "step": 379800 }, { "epoch": 0.45839996211171674, "learning_rate": 8.506212604835688e-06, "loss": 3.1182241821289063, "step": 379900 }, { "epoch": 0.4585206254341994, "learning_rate": 8.505808769367948e-06, "loss": 3.1402423095703127, "step": 380000 }, { "epoch": 0.4586412887566821, "learning_rate": 8.50540493390021e-06, "loss": 3.1161929321289064, "step": 380100 }, { "epoch": 0.4587619520791648, "learning_rate": 8.505001098432472e-06, "loss": 3.1541259765625, "step": 380200 }, { "epoch": 0.4588826154016475, "learning_rate": 8.504597262964734e-06, "loss": 3.129002990722656, "step": 380300 }, { "epoch": 0.45900327872413016, "learning_rate": 8.504193427496996e-06, "loss": 3.118363037109375, "step": 380400 }, { "epoch": 0.45912394204661283, "learning_rate": 8.503789592029258e-06, "loss": 3.14366943359375, "step": 380500 }, { "epoch": 0.4592446053690955, "learning_rate": 8.50338575656152e-06, "loss": 3.1468746948242186, "step": 380600 }, { "epoch": 0.45936526869157823, "learning_rate": 8.50298192109378e-06, "loss": 3.1465908813476564, "step": 380700 }, { "epoch": 0.4594859320140609, "learning_rate": 8.502578085626043e-06, "loss": 3.1310720825195313, "step": 380800 }, { "epoch": 0.4596065953365436, "learning_rate": 8.502174250158305e-06, "loss": 3.1352825927734376, "step": 380900 }, { "epoch": 0.45972725865902625, "learning_rate": 8.501770414690565e-06, "loss": 3.1203341674804688, "step": 381000 }, { "epoch": 0.4598479219815089, "learning_rate": 8.501366579222827e-06, "loss": 3.087215576171875, "step": 381100 }, { "epoch": 0.45996858530399165, "learning_rate": 8.500962743755089e-06, "loss": 3.139811706542969, "step": 381200 }, { "epoch": 0.4600892486264743, "learning_rate": 8.50055890828735e-06, "loss": 3.137640380859375, "step": 381300 }, { "epoch": 0.460209911948957, "learning_rate": 8.500155072819613e-06, "loss": 3.123800964355469, "step": 381400 }, { "epoch": 0.46033057527143967, "learning_rate": 8.499751237351875e-06, "loss": 3.1358523559570313, "step": 381500 }, { "epoch": 0.4604512385939224, "learning_rate": 8.499347401884137e-06, "loss": 3.121767578125, "step": 381600 }, { "epoch": 0.46057190191640507, "learning_rate": 8.498943566416397e-06, "loss": 3.14825927734375, "step": 381700 }, { "epoch": 0.46069256523888774, "learning_rate": 8.498539730948659e-06, "loss": 3.1300338745117187, "step": 381800 }, { "epoch": 0.4608132285613704, "learning_rate": 8.49813589548092e-06, "loss": 3.13264892578125, "step": 381900 }, { "epoch": 0.4609338918838531, "learning_rate": 8.497732060013181e-06, "loss": 3.1357421875, "step": 382000 }, { "epoch": 0.4610545552063358, "learning_rate": 8.497328224545443e-06, "loss": 3.149007568359375, "step": 382100 }, { "epoch": 0.4611752185288185, "learning_rate": 8.496924389077705e-06, "loss": 3.1301812744140625, "step": 382200 }, { "epoch": 0.46129588185130116, "learning_rate": 8.496520553609967e-06, "loss": 3.1490679931640626, "step": 382300 }, { "epoch": 0.46141654517378383, "learning_rate": 8.49611671814223e-06, "loss": 3.1284271240234376, "step": 382400 }, { "epoch": 0.4615372084962665, "learning_rate": 8.49571288267449e-06, "loss": 3.1376217651367186, "step": 382500 }, { "epoch": 0.46165787181874923, "learning_rate": 8.495309047206752e-06, "loss": 3.1286474609375, "step": 382600 }, { "epoch": 0.4617785351412319, "learning_rate": 8.494905211739014e-06, "loss": 3.1434860229492188, "step": 382700 }, { "epoch": 0.4618991984637146, "learning_rate": 8.494501376271275e-06, "loss": 3.1338992309570313, "step": 382800 }, { "epoch": 0.46201986178619725, "learning_rate": 8.494097540803536e-06, "loss": 3.1025015258789064, "step": 382900 }, { "epoch": 0.4621405251086799, "learning_rate": 8.493693705335798e-06, "loss": 3.1459490966796877, "step": 383000 }, { "epoch": 0.46226118843116265, "learning_rate": 8.49328986986806e-06, "loss": 3.106195983886719, "step": 383100 }, { "epoch": 0.4623818517536453, "learning_rate": 8.492886034400322e-06, "loss": 3.121510314941406, "step": 383200 }, { "epoch": 0.462502515076128, "learning_rate": 8.492482198932582e-06, "loss": 3.1088232421875, "step": 383300 }, { "epoch": 0.46262317839861067, "learning_rate": 8.492078363464844e-06, "loss": 3.127908020019531, "step": 383400 }, { "epoch": 0.46274384172109334, "learning_rate": 8.491674527997106e-06, "loss": 3.147369689941406, "step": 383500 }, { "epoch": 0.46286450504357607, "learning_rate": 8.491270692529368e-06, "loss": 3.1268460083007814, "step": 383600 }, { "epoch": 0.46298516836605874, "learning_rate": 8.49086685706163e-06, "loss": 3.145751647949219, "step": 383700 }, { "epoch": 0.4631058316885414, "learning_rate": 8.49046302159389e-06, "loss": 3.1424606323242186, "step": 383800 }, { "epoch": 0.4632264950110241, "learning_rate": 8.490059186126152e-06, "loss": 3.1460671997070313, "step": 383900 }, { "epoch": 0.4633471583335068, "learning_rate": 8.489655350658414e-06, "loss": 3.1438632202148438, "step": 384000 }, { "epoch": 0.4634678216559895, "learning_rate": 8.489251515190674e-06, "loss": 3.144010009765625, "step": 384100 }, { "epoch": 0.46358848497847216, "learning_rate": 8.488847679722936e-06, "loss": 3.1228207397460936, "step": 384200 }, { "epoch": 0.46370914830095483, "learning_rate": 8.488443844255198e-06, "loss": 3.125281982421875, "step": 384300 }, { "epoch": 0.4638298116234375, "learning_rate": 8.48804000878746e-06, "loss": 3.1420132446289064, "step": 384400 }, { "epoch": 0.46395047494592023, "learning_rate": 8.487636173319722e-06, "loss": 3.121570739746094, "step": 384500 }, { "epoch": 0.4640711382684029, "learning_rate": 8.487232337851984e-06, "loss": 3.120580749511719, "step": 384600 }, { "epoch": 0.4641918015908856, "learning_rate": 8.486828502384246e-06, "loss": 3.1439031982421874, "step": 384700 }, { "epoch": 0.46431246491336825, "learning_rate": 8.486424666916507e-06, "loss": 3.1362924194335937, "step": 384800 }, { "epoch": 0.4644331282358509, "learning_rate": 8.486020831448769e-06, "loss": 3.139161376953125, "step": 384900 }, { "epoch": 0.46455379155833365, "learning_rate": 8.485616995981029e-06, "loss": 3.1094711303710936, "step": 385000 }, { "epoch": 0.4646744548808163, "learning_rate": 8.485213160513291e-06, "loss": 3.129660339355469, "step": 385100 }, { "epoch": 0.464795118203299, "learning_rate": 8.484809325045553e-06, "loss": 3.106048278808594, "step": 385200 }, { "epoch": 0.46491578152578167, "learning_rate": 8.484405489577815e-06, "loss": 3.1188922119140625, "step": 385300 }, { "epoch": 0.46503644484826434, "learning_rate": 8.484001654110077e-06, "loss": 3.1234521484375, "step": 385400 }, { "epoch": 0.46515710817074707, "learning_rate": 8.483597818642339e-06, "loss": 3.1120724487304687, "step": 385500 }, { "epoch": 0.46527777149322974, "learning_rate": 8.4831939831746e-06, "loss": 3.1346871948242185, "step": 385600 }, { "epoch": 0.4653984348157124, "learning_rate": 8.482790147706861e-06, "loss": 3.1387060546875, "step": 385700 }, { "epoch": 0.4655190981381951, "learning_rate": 8.482386312239123e-06, "loss": 3.098907165527344, "step": 385800 }, { "epoch": 0.46563976146067776, "learning_rate": 8.481982476771385e-06, "loss": 3.1122482299804686, "step": 385900 }, { "epoch": 0.4657604247831605, "learning_rate": 8.481578641303645e-06, "loss": 3.138643493652344, "step": 386000 }, { "epoch": 0.46588108810564316, "learning_rate": 8.481174805835907e-06, "loss": 3.121631774902344, "step": 386100 }, { "epoch": 0.46600175142812583, "learning_rate": 8.48077097036817e-06, "loss": 3.136925048828125, "step": 386200 }, { "epoch": 0.4661224147506085, "learning_rate": 8.480367134900431e-06, "loss": 3.1138604736328124, "step": 386300 }, { "epoch": 0.4662430780730912, "learning_rate": 8.479963299432693e-06, "loss": 3.134913330078125, "step": 386400 }, { "epoch": 0.4663637413955739, "learning_rate": 8.479559463964955e-06, "loss": 3.1338992309570313, "step": 386500 }, { "epoch": 0.4664844047180566, "learning_rate": 8.479155628497216e-06, "loss": 3.1130938720703125, "step": 386600 }, { "epoch": 0.46660506804053925, "learning_rate": 8.478751793029478e-06, "loss": 3.1238580322265626, "step": 386700 }, { "epoch": 0.4667257313630219, "learning_rate": 8.47834795756174e-06, "loss": 3.153401184082031, "step": 386800 }, { "epoch": 0.46684639468550465, "learning_rate": 8.477944122094e-06, "loss": 3.1112994384765624, "step": 386900 }, { "epoch": 0.4669670580079873, "learning_rate": 8.477540286626262e-06, "loss": 3.1244522094726563, "step": 387000 }, { "epoch": 0.46708772133047, "learning_rate": 8.477136451158524e-06, "loss": 3.143729553222656, "step": 387100 }, { "epoch": 0.46720838465295267, "learning_rate": 8.476732615690786e-06, "loss": 3.0977691650390624, "step": 387200 }, { "epoch": 0.46732904797543534, "learning_rate": 8.476328780223048e-06, "loss": 3.1258074951171877, "step": 387300 }, { "epoch": 0.46744971129791807, "learning_rate": 8.475924944755308e-06, "loss": 3.1042694091796874, "step": 387400 }, { "epoch": 0.46757037462040074, "learning_rate": 8.47552110928757e-06, "loss": 3.14513427734375, "step": 387500 }, { "epoch": 0.4676910379428834, "learning_rate": 8.475117273819832e-06, "loss": 3.1334906005859375, "step": 387600 }, { "epoch": 0.4678117012653661, "learning_rate": 8.474713438352094e-06, "loss": 3.1305191040039064, "step": 387700 }, { "epoch": 0.46793236458784876, "learning_rate": 8.474309602884356e-06, "loss": 3.1091302490234374, "step": 387800 }, { "epoch": 0.4680530279103315, "learning_rate": 8.473905767416616e-06, "loss": 3.148889465332031, "step": 387900 }, { "epoch": 0.46817369123281416, "learning_rate": 8.473501931948878e-06, "loss": 3.1178985595703126, "step": 388000 }, { "epoch": 0.46829435455529683, "learning_rate": 8.47309809648114e-06, "loss": 3.120003967285156, "step": 388100 }, { "epoch": 0.4684150178777795, "learning_rate": 8.4726942610134e-06, "loss": 3.1320068359375, "step": 388200 }, { "epoch": 0.4685356812002622, "learning_rate": 8.472290425545663e-06, "loss": 3.124786376953125, "step": 388300 }, { "epoch": 0.4686563445227449, "learning_rate": 8.471886590077924e-06, "loss": 3.1269940185546874, "step": 388400 }, { "epoch": 0.4687770078452276, "learning_rate": 8.471482754610186e-06, "loss": 3.0979833984375, "step": 388500 }, { "epoch": 0.46889767116771025, "learning_rate": 8.471078919142448e-06, "loss": 3.1111489868164064, "step": 388600 }, { "epoch": 0.4690183344901929, "learning_rate": 8.47067508367471e-06, "loss": 3.138814697265625, "step": 388700 }, { "epoch": 0.4691389978126756, "learning_rate": 8.47027124820697e-06, "loss": 3.097029113769531, "step": 388800 }, { "epoch": 0.4692596611351583, "learning_rate": 8.469867412739233e-06, "loss": 3.122314147949219, "step": 388900 }, { "epoch": 0.469380324457641, "learning_rate": 8.469463577271495e-06, "loss": 3.1029534912109376, "step": 389000 }, { "epoch": 0.46950098778012367, "learning_rate": 8.469059741803755e-06, "loss": 3.1359765625, "step": 389100 }, { "epoch": 0.46962165110260634, "learning_rate": 8.468655906336017e-06, "loss": 3.1164794921875, "step": 389200 }, { "epoch": 0.46974231442508907, "learning_rate": 8.468252070868279e-06, "loss": 3.1202740478515625, "step": 389300 }, { "epoch": 0.46986297774757174, "learning_rate": 8.467848235400541e-06, "loss": 3.095294189453125, "step": 389400 }, { "epoch": 0.4699836410700544, "learning_rate": 8.467444399932803e-06, "loss": 3.11364013671875, "step": 389500 }, { "epoch": 0.4701043043925371, "learning_rate": 8.467040564465065e-06, "loss": 3.1192578125, "step": 389600 }, { "epoch": 0.47022496771501976, "learning_rate": 8.466636728997327e-06, "loss": 3.1293038940429687, "step": 389700 }, { "epoch": 0.4703456310375025, "learning_rate": 8.466232893529587e-06, "loss": 3.1205938720703124, "step": 389800 }, { "epoch": 0.47046629435998516, "learning_rate": 8.465829058061849e-06, "loss": 3.1202767944335936, "step": 389900 }, { "epoch": 0.47058695768246783, "learning_rate": 8.46542522259411e-06, "loss": 3.1283197021484375, "step": 390000 }, { "epoch": 0.4707076210049505, "learning_rate": 8.465021387126371e-06, "loss": 3.10061279296875, "step": 390100 }, { "epoch": 0.4708282843274332, "learning_rate": 8.464617551658633e-06, "loss": 3.137294921875, "step": 390200 }, { "epoch": 0.4709489476499159, "learning_rate": 8.464213716190895e-06, "loss": 3.0898785400390625, "step": 390300 }, { "epoch": 0.4710696109723986, "learning_rate": 8.463809880723157e-06, "loss": 3.1150802612304687, "step": 390400 }, { "epoch": 0.47119027429488125, "learning_rate": 8.46340604525542e-06, "loss": 3.1151358032226564, "step": 390500 }, { "epoch": 0.4713109376173639, "learning_rate": 8.46300220978768e-06, "loss": 3.107939453125, "step": 390600 }, { "epoch": 0.4714316009398466, "learning_rate": 8.462598374319942e-06, "loss": 3.1264968872070313, "step": 390700 }, { "epoch": 0.4715522642623293, "learning_rate": 8.462194538852204e-06, "loss": 3.122178649902344, "step": 390800 }, { "epoch": 0.471672927584812, "learning_rate": 8.461790703384466e-06, "loss": 3.089374694824219, "step": 390900 }, { "epoch": 0.47179359090729467, "learning_rate": 8.461386867916726e-06, "loss": 3.128847961425781, "step": 391000 }, { "epoch": 0.47191425422977734, "learning_rate": 8.460983032448988e-06, "loss": 3.1029425048828125, "step": 391100 }, { "epoch": 0.47203491755226, "learning_rate": 8.46057919698125e-06, "loss": 3.1005255126953126, "step": 391200 }, { "epoch": 0.47215558087474274, "learning_rate": 8.460175361513512e-06, "loss": 3.1312411499023436, "step": 391300 }, { "epoch": 0.4722762441972254, "learning_rate": 8.459771526045774e-06, "loss": 3.1139947509765626, "step": 391400 }, { "epoch": 0.4723969075197081, "learning_rate": 8.459367690578034e-06, "loss": 3.1184735107421875, "step": 391500 }, { "epoch": 0.47251757084219076, "learning_rate": 8.458963855110296e-06, "loss": 3.1278179931640624, "step": 391600 }, { "epoch": 0.47263823416467343, "learning_rate": 8.458560019642558e-06, "loss": 3.0912960815429686, "step": 391700 }, { "epoch": 0.47275889748715616, "learning_rate": 8.45815618417482e-06, "loss": 3.0673068237304686, "step": 391800 }, { "epoch": 0.47287956080963883, "learning_rate": 8.457752348707082e-06, "loss": 3.118819274902344, "step": 391900 }, { "epoch": 0.4730002241321215, "learning_rate": 8.457348513239342e-06, "loss": 3.1085861206054686, "step": 392000 }, { "epoch": 0.4731208874546042, "learning_rate": 8.456944677771604e-06, "loss": 3.1061740112304688, "step": 392100 }, { "epoch": 0.4732415507770869, "learning_rate": 8.456540842303866e-06, "loss": 3.105338134765625, "step": 392200 }, { "epoch": 0.4733622140995696, "learning_rate": 8.456137006836127e-06, "loss": 3.093358154296875, "step": 392300 }, { "epoch": 0.47348287742205225, "learning_rate": 8.455733171368389e-06, "loss": 3.1238018798828127, "step": 392400 }, { "epoch": 0.4736035407445349, "learning_rate": 8.45532933590065e-06, "loss": 3.1033029174804687, "step": 392500 }, { "epoch": 0.4737242040670176, "learning_rate": 8.454925500432913e-06, "loss": 3.1281802368164064, "step": 392600 }, { "epoch": 0.4738448673895003, "learning_rate": 8.454521664965174e-06, "loss": 3.1319540405273436, "step": 392700 }, { "epoch": 0.473965530711983, "learning_rate": 8.454117829497436e-06, "loss": 3.1147210693359373, "step": 392800 }, { "epoch": 0.47408619403446567, "learning_rate": 8.453713994029697e-06, "loss": 3.1519085693359377, "step": 392900 }, { "epoch": 0.47420685735694834, "learning_rate": 8.453310158561959e-06, "loss": 3.100499267578125, "step": 393000 }, { "epoch": 0.474327520679431, "learning_rate": 8.45290632309422e-06, "loss": 3.1120028686523438, "step": 393100 }, { "epoch": 0.47444818400191374, "learning_rate": 8.452502487626481e-06, "loss": 3.1080838012695313, "step": 393200 }, { "epoch": 0.4745688473243964, "learning_rate": 8.452098652158743e-06, "loss": 3.1241705322265627, "step": 393300 }, { "epoch": 0.4746895106468791, "learning_rate": 8.451694816691005e-06, "loss": 3.1080181884765623, "step": 393400 }, { "epoch": 0.47481017396936176, "learning_rate": 8.451290981223267e-06, "loss": 3.0980453491210938, "step": 393500 }, { "epoch": 0.47493083729184443, "learning_rate": 8.450887145755529e-06, "loss": 3.0788613891601564, "step": 393600 }, { "epoch": 0.47505150061432716, "learning_rate": 8.450483310287791e-06, "loss": 3.136014099121094, "step": 393700 }, { "epoch": 0.47517216393680983, "learning_rate": 8.450079474820053e-06, "loss": 3.120100402832031, "step": 393800 }, { "epoch": 0.4752928272592925, "learning_rate": 8.449675639352313e-06, "loss": 3.1098016357421874, "step": 393900 }, { "epoch": 0.4754134905817752, "learning_rate": 8.449271803884575e-06, "loss": 3.109454345703125, "step": 394000 }, { "epoch": 0.47553415390425785, "learning_rate": 8.448867968416835e-06, "loss": 3.1173699951171874, "step": 394100 }, { "epoch": 0.4756548172267406, "learning_rate": 8.448464132949097e-06, "loss": 3.0544357299804688, "step": 394200 }, { "epoch": 0.47577548054922325, "learning_rate": 8.44806029748136e-06, "loss": 3.098197021484375, "step": 394300 }, { "epoch": 0.4758961438717059, "learning_rate": 8.447656462013621e-06, "loss": 3.088961486816406, "step": 394400 }, { "epoch": 0.4760168071941886, "learning_rate": 8.447252626545883e-06, "loss": 3.0855181884765623, "step": 394500 }, { "epoch": 0.4761374705166713, "learning_rate": 8.446848791078145e-06, "loss": 3.1152850341796876, "step": 394600 }, { "epoch": 0.476258133839154, "learning_rate": 8.446444955610406e-06, "loss": 3.1350958251953127, "step": 394700 }, { "epoch": 0.47637879716163667, "learning_rate": 8.446041120142668e-06, "loss": 3.1023828125, "step": 394800 }, { "epoch": 0.47649946048411934, "learning_rate": 8.44563728467493e-06, "loss": 3.102723388671875, "step": 394900 }, { "epoch": 0.476620123806602, "learning_rate": 8.445233449207192e-06, "loss": 3.107860412597656, "step": 395000 }, { "epoch": 0.47674078712908474, "learning_rate": 8.444829613739452e-06, "loss": 3.10630859375, "step": 395100 }, { "epoch": 0.4768614504515674, "learning_rate": 8.444425778271714e-06, "loss": 3.128507080078125, "step": 395200 }, { "epoch": 0.4769821137740501, "learning_rate": 8.444021942803976e-06, "loss": 3.0866189575195313, "step": 395300 }, { "epoch": 0.47710277709653276, "learning_rate": 8.443618107336238e-06, "loss": 3.0778262329101564, "step": 395400 }, { "epoch": 0.47722344041901543, "learning_rate": 8.443214271868498e-06, "loss": 3.113604736328125, "step": 395500 }, { "epoch": 0.47734410374149816, "learning_rate": 8.44281043640076e-06, "loss": 3.0987164306640627, "step": 395600 }, { "epoch": 0.47746476706398083, "learning_rate": 8.442406600933022e-06, "loss": 3.1265911865234375, "step": 395700 }, { "epoch": 0.4775854303864635, "learning_rate": 8.442002765465284e-06, "loss": 3.0987625122070312, "step": 395800 }, { "epoch": 0.4777060937089462, "learning_rate": 8.441598929997546e-06, "loss": 3.086417236328125, "step": 395900 }, { "epoch": 0.47782675703142885, "learning_rate": 8.441195094529806e-06, "loss": 3.111502380371094, "step": 396000 }, { "epoch": 0.4779474203539116, "learning_rate": 8.440791259062068e-06, "loss": 3.0859475708007813, "step": 396100 }, { "epoch": 0.47806808367639425, "learning_rate": 8.44038742359433e-06, "loss": 3.0990335083007814, "step": 396200 }, { "epoch": 0.4781887469988769, "learning_rate": 8.439983588126592e-06, "loss": 3.116259765625, "step": 396300 }, { "epoch": 0.4783094103213596, "learning_rate": 8.439579752658853e-06, "loss": 3.110775146484375, "step": 396400 }, { "epoch": 0.47843007364384227, "learning_rate": 8.439175917191115e-06, "loss": 3.0855258178710936, "step": 396500 }, { "epoch": 0.478550736966325, "learning_rate": 8.438772081723377e-06, "loss": 3.121785888671875, "step": 396600 }, { "epoch": 0.47867140028880767, "learning_rate": 8.438368246255639e-06, "loss": 3.10590087890625, "step": 396700 }, { "epoch": 0.47879206361129034, "learning_rate": 8.4379644107879e-06, "loss": 3.128548278808594, "step": 396800 }, { "epoch": 0.478912726933773, "learning_rate": 8.437560575320163e-06, "loss": 3.0855377197265623, "step": 396900 }, { "epoch": 0.47903339025625574, "learning_rate": 8.437156739852423e-06, "loss": 3.0881637573242187, "step": 397000 }, { "epoch": 0.4791540535787384, "learning_rate": 8.436752904384685e-06, "loss": 3.0910745239257813, "step": 397100 }, { "epoch": 0.4792747169012211, "learning_rate": 8.436349068916945e-06, "loss": 3.1228036499023437, "step": 397200 }, { "epoch": 0.47939538022370376, "learning_rate": 8.435945233449207e-06, "loss": 3.081323547363281, "step": 397300 }, { "epoch": 0.47951604354618643, "learning_rate": 8.435541397981469e-06, "loss": 3.1056808471679687, "step": 397400 }, { "epoch": 0.47963670686866916, "learning_rate": 8.435137562513731e-06, "loss": 3.089926452636719, "step": 397500 }, { "epoch": 0.47975737019115183, "learning_rate": 8.434733727045993e-06, "loss": 3.0946749877929687, "step": 397600 }, { "epoch": 0.4798780335136345, "learning_rate": 8.434329891578255e-06, "loss": 3.087687683105469, "step": 397700 }, { "epoch": 0.4799986968361172, "learning_rate": 8.433926056110517e-06, "loss": 3.120843505859375, "step": 397800 }, { "epoch": 0.48011936015859985, "learning_rate": 8.433522220642777e-06, "loss": 3.1099539184570313, "step": 397900 }, { "epoch": 0.4802400234810826, "learning_rate": 8.43311838517504e-06, "loss": 3.11024658203125, "step": 398000 }, { "epoch": 0.48036068680356525, "learning_rate": 8.432714549707301e-06, "loss": 3.09318115234375, "step": 398100 }, { "epoch": 0.4804813501260479, "learning_rate": 8.432310714239562e-06, "loss": 3.1173333740234375, "step": 398200 }, { "epoch": 0.4806020134485306, "learning_rate": 8.431906878771823e-06, "loss": 3.097176513671875, "step": 398300 }, { "epoch": 0.48072267677101327, "learning_rate": 8.431503043304085e-06, "loss": 3.1012893676757813, "step": 398400 }, { "epoch": 0.480843340093496, "learning_rate": 8.431099207836347e-06, "loss": 3.1367181396484374, "step": 398500 }, { "epoch": 0.48096400341597867, "learning_rate": 8.43069537236861e-06, "loss": 3.0885751342773435, "step": 398600 }, { "epoch": 0.48108466673846134, "learning_rate": 8.430291536900871e-06, "loss": 3.10408447265625, "step": 398700 }, { "epoch": 0.481205330060944, "learning_rate": 8.429887701433132e-06, "loss": 3.1087435913085937, "step": 398800 }, { "epoch": 0.4813259933834267, "learning_rate": 8.429483865965394e-06, "loss": 3.0896182250976563, "step": 398900 }, { "epoch": 0.4814466567059094, "learning_rate": 8.429080030497656e-06, "loss": 3.0709848022460937, "step": 399000 }, { "epoch": 0.4815673200283921, "learning_rate": 8.428676195029916e-06, "loss": 3.0725668334960936, "step": 399100 }, { "epoch": 0.48168798335087476, "learning_rate": 8.428272359562178e-06, "loss": 3.0570263671875, "step": 399200 }, { "epoch": 0.48180864667335743, "learning_rate": 8.42786852409444e-06, "loss": 3.1007846069335936, "step": 399300 }, { "epoch": 0.4819293099958401, "learning_rate": 8.427464688626702e-06, "loss": 3.06720703125, "step": 399400 }, { "epoch": 0.48204997331832283, "learning_rate": 8.427060853158964e-06, "loss": 3.104925231933594, "step": 399500 }, { "epoch": 0.4821706366408055, "learning_rate": 8.426657017691224e-06, "loss": 3.0758880615234374, "step": 399600 }, { "epoch": 0.4822912999632882, "learning_rate": 8.426253182223486e-06, "loss": 3.1065664672851563, "step": 399700 }, { "epoch": 0.48241196328577085, "learning_rate": 8.425849346755748e-06, "loss": 3.1080535888671874, "step": 399800 }, { "epoch": 0.4825326266082536, "learning_rate": 8.42544551128801e-06, "loss": 3.129813232421875, "step": 399900 }, { "epoch": 0.48265328993073625, "learning_rate": 8.425041675820272e-06, "loss": 3.1167398071289063, "step": 400000 }, { "epoch": 0.4827739532532189, "learning_rate": 8.424637840352532e-06, "loss": 3.1018927001953127, "step": 400100 }, { "epoch": 0.4828946165757016, "learning_rate": 8.424234004884794e-06, "loss": 3.0845901489257814, "step": 400200 }, { "epoch": 0.48301527989818427, "learning_rate": 8.423830169417056e-06, "loss": 3.107624206542969, "step": 400300 }, { "epoch": 0.483135943220667, "learning_rate": 8.423426333949317e-06, "loss": 3.0834930419921873, "step": 400400 }, { "epoch": 0.48325660654314967, "learning_rate": 8.423022498481579e-06, "loss": 3.073968505859375, "step": 400500 }, { "epoch": 0.48337726986563234, "learning_rate": 8.42261866301384e-06, "loss": 3.07536376953125, "step": 400600 }, { "epoch": 0.483497933188115, "learning_rate": 8.422214827546103e-06, "loss": 3.0725445556640625, "step": 400700 }, { "epoch": 0.4836185965105977, "learning_rate": 8.421810992078365e-06, "loss": 3.094947509765625, "step": 400800 }, { "epoch": 0.4837392598330804, "learning_rate": 8.421407156610627e-06, "loss": 3.109068603515625, "step": 400900 }, { "epoch": 0.4838599231555631, "learning_rate": 8.421003321142887e-06, "loss": 3.091180419921875, "step": 401000 }, { "epoch": 0.48398058647804576, "learning_rate": 8.420599485675149e-06, "loss": 3.1118594360351564, "step": 401100 }, { "epoch": 0.48410124980052843, "learning_rate": 8.42019565020741e-06, "loss": 3.098489990234375, "step": 401200 }, { "epoch": 0.4842219131230111, "learning_rate": 8.419791814739671e-06, "loss": 3.0923114013671875, "step": 401300 }, { "epoch": 0.48434257644549383, "learning_rate": 8.419387979271933e-06, "loss": 3.101041564941406, "step": 401400 }, { "epoch": 0.4844632397679765, "learning_rate": 8.418984143804195e-06, "loss": 3.082236633300781, "step": 401500 }, { "epoch": 0.4845839030904592, "learning_rate": 8.418580308336457e-06, "loss": 3.083673400878906, "step": 401600 }, { "epoch": 0.48470456641294185, "learning_rate": 8.418176472868719e-06, "loss": 3.130315246582031, "step": 401700 }, { "epoch": 0.4848252297354245, "learning_rate": 8.417772637400981e-06, "loss": 3.1092239379882813, "step": 401800 }, { "epoch": 0.48494589305790725, "learning_rate": 8.417368801933243e-06, "loss": 3.09388671875, "step": 401900 }, { "epoch": 0.4850665563803899, "learning_rate": 8.416964966465503e-06, "loss": 3.1032403564453124, "step": 402000 }, { "epoch": 0.4851872197028726, "learning_rate": 8.416561130997765e-06, "loss": 3.1174456787109377, "step": 402100 }, { "epoch": 0.48530788302535527, "learning_rate": 8.416157295530026e-06, "loss": 3.0884149169921873, "step": 402200 }, { "epoch": 0.485428546347838, "learning_rate": 8.415753460062288e-06, "loss": 3.1053207397460936, "step": 402300 }, { "epoch": 0.48554920967032067, "learning_rate": 8.41534962459455e-06, "loss": 3.118140869140625, "step": 402400 }, { "epoch": 0.48566987299280334, "learning_rate": 8.414945789126811e-06, "loss": 3.0746533203125, "step": 402500 }, { "epoch": 0.485790536315286, "learning_rate": 8.414541953659073e-06, "loss": 3.0938232421875, "step": 402600 }, { "epoch": 0.4859111996377687, "learning_rate": 8.414138118191335e-06, "loss": 3.070401611328125, "step": 402700 }, { "epoch": 0.4860318629602514, "learning_rate": 8.413734282723597e-06, "loss": 3.123790588378906, "step": 402800 }, { "epoch": 0.4861525262827341, "learning_rate": 8.413330447255858e-06, "loss": 3.1210443115234376, "step": 402900 }, { "epoch": 0.48627318960521676, "learning_rate": 8.41292661178812e-06, "loss": 3.092182922363281, "step": 403000 }, { "epoch": 0.48639385292769943, "learning_rate": 8.412522776320382e-06, "loss": 3.0950628662109376, "step": 403100 }, { "epoch": 0.4865145162501821, "learning_rate": 8.412118940852642e-06, "loss": 3.0670315551757814, "step": 403200 }, { "epoch": 0.48663517957266483, "learning_rate": 8.411715105384904e-06, "loss": 3.098896789550781, "step": 403300 }, { "epoch": 0.4867558428951475, "learning_rate": 8.411311269917166e-06, "loss": 3.085815734863281, "step": 403400 }, { "epoch": 0.4868765062176302, "learning_rate": 8.410907434449428e-06, "loss": 3.1057781982421875, "step": 403500 }, { "epoch": 0.48699716954011285, "learning_rate": 8.41050359898169e-06, "loss": 3.0981674194335938, "step": 403600 }, { "epoch": 0.4871178328625955, "learning_rate": 8.41009976351395e-06, "loss": 3.105654296875, "step": 403700 }, { "epoch": 0.48723849618507825, "learning_rate": 8.409695928046212e-06, "loss": 3.088855895996094, "step": 403800 }, { "epoch": 0.4873591595075609, "learning_rate": 8.409292092578474e-06, "loss": 3.0955364990234373, "step": 403900 }, { "epoch": 0.4874798228300436, "learning_rate": 8.408888257110736e-06, "loss": 3.08198974609375, "step": 404000 }, { "epoch": 0.48760048615252627, "learning_rate": 8.408484421642996e-06, "loss": 3.10002685546875, "step": 404100 }, { "epoch": 0.48772114947500894, "learning_rate": 8.408080586175258e-06, "loss": 3.08379638671875, "step": 404200 }, { "epoch": 0.48784181279749167, "learning_rate": 8.40767675070752e-06, "loss": 3.065028076171875, "step": 404300 }, { "epoch": 0.48796247611997434, "learning_rate": 8.407272915239782e-06, "loss": 3.075791015625, "step": 404400 }, { "epoch": 0.488083139442457, "learning_rate": 8.406869079772043e-06, "loss": 3.1015188598632815, "step": 404500 }, { "epoch": 0.4882038027649397, "learning_rate": 8.406465244304305e-06, "loss": 3.0968704223632812, "step": 404600 }, { "epoch": 0.48832446608742236, "learning_rate": 8.406061408836567e-06, "loss": 3.0848504638671876, "step": 404700 }, { "epoch": 0.4884451294099051, "learning_rate": 8.405657573368829e-06, "loss": 3.0905316162109373, "step": 404800 }, { "epoch": 0.48856579273238776, "learning_rate": 8.40525373790109e-06, "loss": 3.1199295043945314, "step": 404900 }, { "epoch": 0.48868645605487043, "learning_rate": 8.404849902433353e-06, "loss": 3.109422302246094, "step": 405000 }, { "epoch": 0.4888071193773531, "learning_rate": 8.404446066965613e-06, "loss": 3.0794296264648438, "step": 405100 }, { "epoch": 0.48892778269983583, "learning_rate": 8.404042231497875e-06, "loss": 3.09427490234375, "step": 405200 }, { "epoch": 0.4890484460223185, "learning_rate": 8.403638396030135e-06, "loss": 3.0705914306640625, "step": 405300 }, { "epoch": 0.4891691093448012, "learning_rate": 8.403234560562397e-06, "loss": 3.1210516357421874, "step": 405400 }, { "epoch": 0.48928977266728385, "learning_rate": 8.402830725094659e-06, "loss": 3.0909454345703127, "step": 405500 }, { "epoch": 0.4894104359897665, "learning_rate": 8.402426889626921e-06, "loss": 3.084837646484375, "step": 405600 }, { "epoch": 0.48953109931224925, "learning_rate": 8.402023054159183e-06, "loss": 3.0785919189453126, "step": 405700 }, { "epoch": 0.4896517626347319, "learning_rate": 8.401619218691445e-06, "loss": 3.081869812011719, "step": 405800 }, { "epoch": 0.4897724259572146, "learning_rate": 8.401215383223707e-06, "loss": 3.103351745605469, "step": 405900 }, { "epoch": 0.48989308927969727, "learning_rate": 8.400811547755969e-06, "loss": 3.079375, "step": 406000 }, { "epoch": 0.49001375260217994, "learning_rate": 8.40040771228823e-06, "loss": 3.08417724609375, "step": 406100 }, { "epoch": 0.49013441592466267, "learning_rate": 8.400003876820491e-06, "loss": 3.088600769042969, "step": 406200 }, { "epoch": 0.49025507924714534, "learning_rate": 8.399600041352752e-06, "loss": 3.0954666137695312, "step": 406300 }, { "epoch": 0.490375742569628, "learning_rate": 8.399196205885014e-06, "loss": 3.1070513916015625, "step": 406400 }, { "epoch": 0.4904964058921107, "learning_rate": 8.398792370417276e-06, "loss": 3.06857666015625, "step": 406500 }, { "epoch": 0.49061706921459336, "learning_rate": 8.398388534949538e-06, "loss": 3.0771078491210937, "step": 406600 }, { "epoch": 0.4907377325370761, "learning_rate": 8.3979846994818e-06, "loss": 3.0796969604492186, "step": 406700 }, { "epoch": 0.49085839585955876, "learning_rate": 8.397580864014061e-06, "loss": 3.0720809936523437, "step": 406800 }, { "epoch": 0.49097905918204143, "learning_rate": 8.397177028546323e-06, "loss": 3.0769488525390627, "step": 406900 }, { "epoch": 0.4910997225045241, "learning_rate": 8.396773193078584e-06, "loss": 3.0817401123046877, "step": 407000 }, { "epoch": 0.4912203858270068, "learning_rate": 8.396369357610846e-06, "loss": 3.0994720458984375, "step": 407100 }, { "epoch": 0.4913410491494895, "learning_rate": 8.395965522143108e-06, "loss": 3.0987261962890624, "step": 407200 }, { "epoch": 0.4914617124719722, "learning_rate": 8.395561686675368e-06, "loss": 3.086059265136719, "step": 407300 }, { "epoch": 0.49158237579445485, "learning_rate": 8.39515785120763e-06, "loss": 3.09379638671875, "step": 407400 }, { "epoch": 0.4917030391169375, "learning_rate": 8.394754015739892e-06, "loss": 3.0986920166015626, "step": 407500 }, { "epoch": 0.49182370243942025, "learning_rate": 8.394350180272154e-06, "loss": 3.066160888671875, "step": 407600 }, { "epoch": 0.4919443657619029, "learning_rate": 8.393946344804416e-06, "loss": 3.07545654296875, "step": 407700 }, { "epoch": 0.4920650290843856, "learning_rate": 8.393542509336676e-06, "loss": 3.1040966796875, "step": 407800 }, { "epoch": 0.49218569240686827, "learning_rate": 8.393138673868938e-06, "loss": 3.0473764038085935, "step": 407900 }, { "epoch": 0.49230635572935094, "learning_rate": 8.3927348384012e-06, "loss": 3.1065716552734375, "step": 408000 }, { "epoch": 0.49242701905183367, "learning_rate": 8.392331002933462e-06, "loss": 3.0778955078125, "step": 408100 }, { "epoch": 0.49254768237431634, "learning_rate": 8.391927167465722e-06, "loss": 3.090491943359375, "step": 408200 }, { "epoch": 0.492668345696799, "learning_rate": 8.391523331997984e-06, "loss": 3.093789367675781, "step": 408300 }, { "epoch": 0.4927890090192817, "learning_rate": 8.391119496530246e-06, "loss": 3.0637112426757813, "step": 408400 }, { "epoch": 0.49290967234176436, "learning_rate": 8.390715661062508e-06, "loss": 3.0946466064453126, "step": 408500 }, { "epoch": 0.4930303356642471, "learning_rate": 8.390311825594769e-06, "loss": 3.0925286865234374, "step": 408600 }, { "epoch": 0.49315099898672976, "learning_rate": 8.38990799012703e-06, "loss": 3.098787841796875, "step": 408700 }, { "epoch": 0.49327166230921243, "learning_rate": 8.389504154659293e-06, "loss": 3.0761318969726563, "step": 408800 }, { "epoch": 0.4933923256316951, "learning_rate": 8.389100319191555e-06, "loss": 3.078929748535156, "step": 408900 }, { "epoch": 0.4935129889541778, "learning_rate": 8.388696483723817e-06, "loss": 3.0839797973632814, "step": 409000 }, { "epoch": 0.4936336522766605, "learning_rate": 8.388292648256079e-06, "loss": 3.096500244140625, "step": 409100 }, { "epoch": 0.4937543155991432, "learning_rate": 8.387888812788339e-06, "loss": 3.0792950439453124, "step": 409200 }, { "epoch": 0.49387497892162585, "learning_rate": 8.387484977320601e-06, "loss": 3.0995574951171876, "step": 409300 }, { "epoch": 0.4939956422441085, "learning_rate": 8.387081141852861e-06, "loss": 3.1124093627929685, "step": 409400 }, { "epoch": 0.4941163055665912, "learning_rate": 8.386677306385123e-06, "loss": 3.08474853515625, "step": 409500 }, { "epoch": 0.4942369688890739, "learning_rate": 8.386273470917385e-06, "loss": 3.073335876464844, "step": 409600 }, { "epoch": 0.4943576322115566, "learning_rate": 8.385869635449647e-06, "loss": 3.0866018676757814, "step": 409700 }, { "epoch": 0.49447829553403927, "learning_rate": 8.385465799981909e-06, "loss": 3.085537109375, "step": 409800 }, { "epoch": 0.49459895885652194, "learning_rate": 8.385061964514171e-06, "loss": 3.088872375488281, "step": 409900 }, { "epoch": 0.49471962217900467, "learning_rate": 8.384658129046433e-06, "loss": 3.09466064453125, "step": 410000 }, { "epoch": 0.49484028550148734, "learning_rate": 8.384254293578693e-06, "loss": 3.094207763671875, "step": 410100 }, { "epoch": 0.49496094882397, "learning_rate": 8.383850458110955e-06, "loss": 3.102781066894531, "step": 410200 }, { "epoch": 0.4950816121464527, "learning_rate": 8.383446622643217e-06, "loss": 3.0413330078125, "step": 410300 }, { "epoch": 0.49520227546893536, "learning_rate": 8.383042787175478e-06, "loss": 3.0440472412109374, "step": 410400 }, { "epoch": 0.4953229387914181, "learning_rate": 8.38263895170774e-06, "loss": 3.06772705078125, "step": 410500 }, { "epoch": 0.49544360211390076, "learning_rate": 8.382235116240002e-06, "loss": 3.064564208984375, "step": 410600 }, { "epoch": 0.49556426543638343, "learning_rate": 8.381831280772264e-06, "loss": 3.0978408813476563, "step": 410700 }, { "epoch": 0.4956849287588661, "learning_rate": 8.381427445304526e-06, "loss": 3.099930419921875, "step": 410800 }, { "epoch": 0.4958055920813488, "learning_rate": 8.381023609836788e-06, "loss": 3.078155212402344, "step": 410900 }, { "epoch": 0.4959262554038315, "learning_rate": 8.380619774369048e-06, "loss": 3.081851806640625, "step": 411000 }, { "epoch": 0.4960469187263142, "learning_rate": 8.38021593890131e-06, "loss": 3.0806903076171874, "step": 411100 }, { "epoch": 0.49616758204879685, "learning_rate": 8.379812103433572e-06, "loss": 3.0570693969726563, "step": 411200 }, { "epoch": 0.4962882453712795, "learning_rate": 8.379408267965832e-06, "loss": 3.095123596191406, "step": 411300 }, { "epoch": 0.4964089086937622, "learning_rate": 8.379004432498094e-06, "loss": 3.0806570434570313, "step": 411400 }, { "epoch": 0.4965295720162449, "learning_rate": 8.378600597030356e-06, "loss": 3.0630374145507813, "step": 411500 }, { "epoch": 0.4966502353387276, "learning_rate": 8.378196761562618e-06, "loss": 3.0827978515625, "step": 411600 }, { "epoch": 0.49677089866121027, "learning_rate": 8.37779292609488e-06, "loss": 3.0606640625, "step": 411700 }, { "epoch": 0.49689156198369294, "learning_rate": 8.377389090627142e-06, "loss": 3.060072021484375, "step": 411800 }, { "epoch": 0.4970122253061756, "learning_rate": 8.376985255159402e-06, "loss": 3.080679931640625, "step": 411900 }, { "epoch": 0.49713288862865834, "learning_rate": 8.376581419691664e-06, "loss": 3.0780239868164063, "step": 412000 }, { "epoch": 0.497253551951141, "learning_rate": 8.376177584223926e-06, "loss": 3.085160827636719, "step": 412100 }, { "epoch": 0.4973742152736237, "learning_rate": 8.375773748756188e-06, "loss": 3.051485595703125, "step": 412200 }, { "epoch": 0.49749487859610636, "learning_rate": 8.375369913288449e-06, "loss": 3.07180908203125, "step": 412300 }, { "epoch": 0.49761554191858903, "learning_rate": 8.37496607782071e-06, "loss": 3.087249450683594, "step": 412400 }, { "epoch": 0.49773620524107176, "learning_rate": 8.374562242352972e-06, "loss": 3.12490234375, "step": 412500 }, { "epoch": 0.49785686856355443, "learning_rate": 8.374158406885234e-06, "loss": 3.0543276977539064, "step": 412600 }, { "epoch": 0.4979775318860371, "learning_rate": 8.373754571417495e-06, "loss": 3.075504150390625, "step": 412700 }, { "epoch": 0.4980981952085198, "learning_rate": 8.373350735949757e-06, "loss": 3.07824462890625, "step": 412800 }, { "epoch": 0.4982188585310025, "learning_rate": 8.372946900482019e-06, "loss": 3.074071960449219, "step": 412900 }, { "epoch": 0.4983395218534852, "learning_rate": 8.37254306501428e-06, "loss": 3.067923889160156, "step": 413000 }, { "epoch": 0.49846018517596785, "learning_rate": 8.372139229546543e-06, "loss": 3.08997314453125, "step": 413100 }, { "epoch": 0.4985808484984505, "learning_rate": 8.371735394078803e-06, "loss": 3.0839306640625, "step": 413200 }, { "epoch": 0.4987015118209332, "learning_rate": 8.371331558611065e-06, "loss": 3.098357849121094, "step": 413300 }, { "epoch": 0.4988221751434159, "learning_rate": 8.370927723143327e-06, "loss": 3.1040664672851563, "step": 413400 }, { "epoch": 0.4989428384658986, "learning_rate": 8.370523887675587e-06, "loss": 3.033949890136719, "step": 413500 }, { "epoch": 0.49906350178838127, "learning_rate": 8.37012005220785e-06, "loss": 3.0517706298828124, "step": 413600 }, { "epoch": 0.49918416511086394, "learning_rate": 8.369716216740111e-06, "loss": 3.0464508056640627, "step": 413700 }, { "epoch": 0.4993048284333466, "learning_rate": 8.369312381272373e-06, "loss": 3.0998956298828126, "step": 413800 }, { "epoch": 0.49942549175582934, "learning_rate": 8.368908545804635e-06, "loss": 3.0913955688476564, "step": 413900 }, { "epoch": 0.499546155078312, "learning_rate": 8.368504710336897e-06, "loss": 3.069590759277344, "step": 414000 }, { "epoch": 0.4996668184007947, "learning_rate": 8.368100874869159e-06, "loss": 3.06601806640625, "step": 414100 }, { "epoch": 0.49978748172327736, "learning_rate": 8.36769703940142e-06, "loss": 3.0971914672851564, "step": 414200 }, { "epoch": 0.49990814504576003, "learning_rate": 8.367293203933681e-06, "loss": 3.067413635253906, "step": 414300 }, { "epoch": 0.5000288083682427, "learning_rate": 8.366889368465942e-06, "loss": 3.041134948730469, "step": 414400 }, { "epoch": 0.5001494716907254, "learning_rate": 8.366485532998204e-06, "loss": 3.0805117797851564, "step": 414500 }, { "epoch": 0.5002701350132082, "learning_rate": 8.366081697530466e-06, "loss": 3.063617858886719, "step": 414600 }, { "epoch": 0.5003907983356908, "learning_rate": 8.365677862062728e-06, "loss": 3.0628564453125, "step": 414700 }, { "epoch": 0.5005114616581735, "learning_rate": 8.36527402659499e-06, "loss": 3.105867614746094, "step": 414800 }, { "epoch": 0.5006321249806561, "learning_rate": 8.364870191127252e-06, "loss": 3.0685870361328127, "step": 414900 }, { "epoch": 0.5007527883031389, "learning_rate": 8.364466355659514e-06, "loss": 3.044700012207031, "step": 415000 }, { "epoch": 0.5008734516256216, "learning_rate": 8.364062520191774e-06, "loss": 3.0534841918945315, "step": 415100 }, { "epoch": 0.5009941149481042, "learning_rate": 8.363658684724036e-06, "loss": 3.0662347412109376, "step": 415200 }, { "epoch": 0.5011147782705869, "learning_rate": 8.363254849256298e-06, "loss": 3.0634332275390626, "step": 415300 }, { "epoch": 0.5012354415930695, "learning_rate": 8.362851013788558e-06, "loss": 3.0582424926757814, "step": 415400 }, { "epoch": 0.5013561049155523, "learning_rate": 8.36244717832082e-06, "loss": 3.0725778198242186, "step": 415500 }, { "epoch": 0.501476768238035, "learning_rate": 8.362043342853082e-06, "loss": 3.06215087890625, "step": 415600 }, { "epoch": 0.5015974315605176, "learning_rate": 8.361639507385344e-06, "loss": 3.06943603515625, "step": 415700 }, { "epoch": 0.5017180948830003, "learning_rate": 8.361235671917606e-06, "loss": 3.093991394042969, "step": 415800 }, { "epoch": 0.501838758205483, "learning_rate": 8.360831836449866e-06, "loss": 3.05564208984375, "step": 415900 }, { "epoch": 0.5019594215279657, "learning_rate": 8.360428000982128e-06, "loss": 3.0717501831054688, "step": 416000 }, { "epoch": 0.5020800848504484, "learning_rate": 8.36002416551439e-06, "loss": 3.0618905639648437, "step": 416100 }, { "epoch": 0.502200748172931, "learning_rate": 8.359620330046652e-06, "loss": 3.0480221557617186, "step": 416200 }, { "epoch": 0.5023214114954138, "learning_rate": 8.359216494578913e-06, "loss": 3.064105224609375, "step": 416300 }, { "epoch": 0.5024420748178964, "learning_rate": 8.358812659111175e-06, "loss": 3.068736267089844, "step": 416400 }, { "epoch": 0.5025627381403791, "learning_rate": 8.358408823643437e-06, "loss": 3.067481689453125, "step": 416500 }, { "epoch": 0.5026834014628618, "learning_rate": 8.358004988175699e-06, "loss": 3.083235778808594, "step": 416600 }, { "epoch": 0.5028040647853445, "learning_rate": 8.357601152707959e-06, "loss": 3.0538290405273436, "step": 416700 }, { "epoch": 0.5029247281078272, "learning_rate": 8.35719731724022e-06, "loss": 3.0361834716796876, "step": 416800 }, { "epoch": 0.5030453914303098, "learning_rate": 8.356793481772483e-06, "loss": 3.0473150634765624, "step": 416900 }, { "epoch": 0.5031660547527925, "learning_rate": 8.356389646304745e-06, "loss": 3.063091125488281, "step": 417000 }, { "epoch": 0.5032867180752753, "learning_rate": 8.355985810837007e-06, "loss": 3.0621282958984377, "step": 417100 }, { "epoch": 0.5034073813977579, "learning_rate": 8.355581975369269e-06, "loss": 3.0812948608398436, "step": 417200 }, { "epoch": 0.5035280447202406, "learning_rate": 8.355178139901529e-06, "loss": 3.0475759887695313, "step": 417300 }, { "epoch": 0.5036487080427232, "learning_rate": 8.354774304433791e-06, "loss": 3.07255859375, "step": 417400 }, { "epoch": 0.5037693713652059, "learning_rate": 8.354370468966053e-06, "loss": 3.0646743774414062, "step": 417500 }, { "epoch": 0.5038900346876887, "learning_rate": 8.353966633498313e-06, "loss": 3.08345703125, "step": 417600 }, { "epoch": 0.5040106980101713, "learning_rate": 8.353562798030575e-06, "loss": 3.0557269287109374, "step": 417700 }, { "epoch": 0.504131361332654, "learning_rate": 8.353158962562837e-06, "loss": 3.0752493286132814, "step": 417800 }, { "epoch": 0.5042520246551366, "learning_rate": 8.3527551270951e-06, "loss": 3.0719833374023438, "step": 417900 }, { "epoch": 0.5043726879776194, "learning_rate": 8.352351291627361e-06, "loss": 3.0604779052734377, "step": 418000 }, { "epoch": 0.5044933513001021, "learning_rate": 8.351947456159623e-06, "loss": 3.07777587890625, "step": 418100 }, { "epoch": 0.5046140146225847, "learning_rate": 8.351543620691883e-06, "loss": 3.079162902832031, "step": 418200 }, { "epoch": 0.5047346779450674, "learning_rate": 8.351139785224145e-06, "loss": 3.0609991455078127, "step": 418300 }, { "epoch": 0.50485534126755, "learning_rate": 8.350735949756407e-06, "loss": 3.061528625488281, "step": 418400 }, { "epoch": 0.5049760045900328, "learning_rate": 8.350332114288668e-06, "loss": 3.083462829589844, "step": 418500 }, { "epoch": 0.5050966679125155, "learning_rate": 8.34992827882093e-06, "loss": 3.066733093261719, "step": 418600 }, { "epoch": 0.5052173312349981, "learning_rate": 8.349524443353192e-06, "loss": 3.058432312011719, "step": 418700 }, { "epoch": 0.5053379945574809, "learning_rate": 8.349120607885454e-06, "loss": 3.0906692504882813, "step": 418800 }, { "epoch": 0.5054586578799635, "learning_rate": 8.348716772417716e-06, "loss": 3.048239440917969, "step": 418900 }, { "epoch": 0.5055793212024462, "learning_rate": 8.348312936949978e-06, "loss": 3.0807391357421876, "step": 419000 }, { "epoch": 0.5056999845249289, "learning_rate": 8.34790910148224e-06, "loss": 3.098170166015625, "step": 419100 }, { "epoch": 0.5058206478474115, "learning_rate": 8.3475052660145e-06, "loss": 3.056720886230469, "step": 419200 }, { "epoch": 0.5059413111698943, "learning_rate": 8.347101430546762e-06, "loss": 3.087235107421875, "step": 419300 }, { "epoch": 0.506061974492377, "learning_rate": 8.346697595079022e-06, "loss": 3.0625408935546874, "step": 419400 }, { "epoch": 0.5061826378148596, "learning_rate": 8.346293759611284e-06, "loss": 3.047413024902344, "step": 419500 }, { "epoch": 0.5063033011373423, "learning_rate": 8.345889924143546e-06, "loss": 3.032467956542969, "step": 419600 }, { "epoch": 0.506423964459825, "learning_rate": 8.345486088675808e-06, "loss": 3.070262145996094, "step": 419700 }, { "epoch": 0.5065446277823077, "learning_rate": 8.34508225320807e-06, "loss": 3.06198486328125, "step": 419800 }, { "epoch": 0.5066652911047904, "learning_rate": 8.344678417740332e-06, "loss": 3.0581536865234376, "step": 419900 }, { "epoch": 0.506785954427273, "learning_rate": 8.344274582272592e-06, "loss": 3.054132080078125, "step": 420000 }, { "epoch": 0.5069066177497558, "learning_rate": 8.343870746804854e-06, "loss": 3.0500445556640625, "step": 420100 }, { "epoch": 0.5070272810722384, "learning_rate": 8.343466911337116e-06, "loss": 3.069715576171875, "step": 420200 }, { "epoch": 0.5071479443947211, "learning_rate": 8.343063075869378e-06, "loss": 3.061250915527344, "step": 420300 }, { "epoch": 0.5072686077172038, "learning_rate": 8.342659240401639e-06, "loss": 3.065164794921875, "step": 420400 }, { "epoch": 0.5073892710396865, "learning_rate": 8.3422554049339e-06, "loss": 3.071152648925781, "step": 420500 }, { "epoch": 0.5075099343621692, "learning_rate": 8.341851569466163e-06, "loss": 3.0517401123046874, "step": 420600 }, { "epoch": 0.5076305976846518, "learning_rate": 8.341447733998425e-06, "loss": 3.04858642578125, "step": 420700 }, { "epoch": 0.5077512610071345, "learning_rate": 8.341043898530685e-06, "loss": 3.0574853515625, "step": 420800 }, { "epoch": 0.5078719243296173, "learning_rate": 8.340640063062947e-06, "loss": 3.0682489013671876, "step": 420900 }, { "epoch": 0.5079925876520999, "learning_rate": 8.340236227595209e-06, "loss": 3.070512390136719, "step": 421000 }, { "epoch": 0.5081132509745826, "learning_rate": 8.33983239212747e-06, "loss": 3.0714627075195313, "step": 421100 }, { "epoch": 0.5082339142970652, "learning_rate": 8.339428556659733e-06, "loss": 3.052193908691406, "step": 421200 }, { "epoch": 0.5083545776195479, "learning_rate": 8.339024721191995e-06, "loss": 3.048439636230469, "step": 421300 }, { "epoch": 0.5084752409420307, "learning_rate": 8.338620885724255e-06, "loss": 3.068442687988281, "step": 421400 }, { "epoch": 0.5085959042645133, "learning_rate": 8.338217050256517e-06, "loss": 3.0612451171875, "step": 421500 }, { "epoch": 0.508716567586996, "learning_rate": 8.337813214788777e-06, "loss": 3.0792041015625, "step": 421600 }, { "epoch": 0.5088372309094786, "learning_rate": 8.33740937932104e-06, "loss": 3.0510464477539063, "step": 421700 }, { "epoch": 0.5089578942319614, "learning_rate": 8.337005543853301e-06, "loss": 3.0392532348632812, "step": 421800 }, { "epoch": 0.5090785575544441, "learning_rate": 8.336601708385563e-06, "loss": 3.044076232910156, "step": 421900 }, { "epoch": 0.5091992208769267, "learning_rate": 8.336197872917825e-06, "loss": 3.04828369140625, "step": 422000 }, { "epoch": 0.5093198841994094, "learning_rate": 8.335794037450087e-06, "loss": 3.038778076171875, "step": 422100 }, { "epoch": 0.509440547521892, "learning_rate": 8.33539020198235e-06, "loss": 3.0599810791015627, "step": 422200 }, { "epoch": 0.5095612108443748, "learning_rate": 8.33498636651461e-06, "loss": 3.0603094482421875, "step": 422300 }, { "epoch": 0.5096818741668575, "learning_rate": 8.334582531046871e-06, "loss": 3.059103698730469, "step": 422400 }, { "epoch": 0.5098025374893401, "learning_rate": 8.334178695579133e-06, "loss": 3.037176208496094, "step": 422500 }, { "epoch": 0.5099232008118229, "learning_rate": 8.333774860111394e-06, "loss": 3.0613641357421875, "step": 422600 }, { "epoch": 0.5100438641343055, "learning_rate": 8.333371024643656e-06, "loss": 3.067445983886719, "step": 422700 }, { "epoch": 0.5101645274567882, "learning_rate": 8.332967189175918e-06, "loss": 3.075067443847656, "step": 422800 }, { "epoch": 0.5102851907792709, "learning_rate": 8.33256335370818e-06, "loss": 3.0423004150390627, "step": 422900 }, { "epoch": 0.5104058541017535, "learning_rate": 8.332159518240442e-06, "loss": 3.03037841796875, "step": 423000 }, { "epoch": 0.5105265174242363, "learning_rate": 8.331755682772704e-06, "loss": 3.0377597045898437, "step": 423100 }, { "epoch": 0.5106471807467189, "learning_rate": 8.331351847304966e-06, "loss": 3.0459384155273437, "step": 423200 }, { "epoch": 0.5107678440692016, "learning_rate": 8.330948011837226e-06, "loss": 3.0799755859375, "step": 423300 }, { "epoch": 0.5108885073916843, "learning_rate": 8.330544176369488e-06, "loss": 3.0394296264648437, "step": 423400 }, { "epoch": 0.511009170714167, "learning_rate": 8.330140340901748e-06, "loss": 3.0380587768554688, "step": 423500 }, { "epoch": 0.5111298340366497, "learning_rate": 8.32973650543401e-06, "loss": 3.0400350952148436, "step": 423600 }, { "epoch": 0.5112504973591323, "learning_rate": 8.329332669966272e-06, "loss": 3.0556790161132814, "step": 423700 }, { "epoch": 0.511371160681615, "learning_rate": 8.328928834498534e-06, "loss": 3.05145263671875, "step": 423800 }, { "epoch": 0.5114918240040978, "learning_rate": 8.328524999030796e-06, "loss": 3.056429443359375, "step": 423900 }, { "epoch": 0.5116124873265804, "learning_rate": 8.328121163563058e-06, "loss": 3.0487911987304686, "step": 424000 }, { "epoch": 0.5117331506490631, "learning_rate": 8.327717328095318e-06, "loss": 3.0483303833007813, "step": 424100 }, { "epoch": 0.5118538139715457, "learning_rate": 8.32731349262758e-06, "loss": 3.08312255859375, "step": 424200 }, { "epoch": 0.5119744772940285, "learning_rate": 8.326909657159842e-06, "loss": 3.0497344970703124, "step": 424300 }, { "epoch": 0.5120951406165112, "learning_rate": 8.326505821692104e-06, "loss": 3.067230529785156, "step": 424400 }, { "epoch": 0.5122158039389938, "learning_rate": 8.326101986224365e-06, "loss": 3.0073797607421877, "step": 424500 }, { "epoch": 0.5123364672614765, "learning_rate": 8.325698150756627e-06, "loss": 3.0361453247070314, "step": 424600 }, { "epoch": 0.5124571305839593, "learning_rate": 8.325294315288889e-06, "loss": 3.0673797607421873, "step": 424700 }, { "epoch": 0.5125777939064419, "learning_rate": 8.32489047982115e-06, "loss": 3.0618853759765625, "step": 424800 }, { "epoch": 0.5126984572289246, "learning_rate": 8.324486644353411e-06, "loss": 3.039766540527344, "step": 424900 }, { "epoch": 0.5128191205514072, "learning_rate": 8.324082808885673e-06, "loss": 3.0676339721679686, "step": 425000 }, { "epoch": 0.5129397838738899, "learning_rate": 8.323678973417935e-06, "loss": 3.052113037109375, "step": 425100 }, { "epoch": 0.5130604471963727, "learning_rate": 8.323275137950197e-06, "loss": 3.04845947265625, "step": 425200 }, { "epoch": 0.5131811105188553, "learning_rate": 8.322871302482459e-06, "loss": 3.0752008056640623, "step": 425300 }, { "epoch": 0.513301773841338, "learning_rate": 8.322467467014719e-06, "loss": 3.078260803222656, "step": 425400 }, { "epoch": 0.5134224371638206, "learning_rate": 8.322063631546981e-06, "loss": 3.0693145751953126, "step": 425500 }, { "epoch": 0.5135431004863034, "learning_rate": 8.321659796079243e-06, "loss": 3.062494812011719, "step": 425600 }, { "epoch": 0.5136637638087861, "learning_rate": 8.321255960611503e-06, "loss": 3.0423348999023436, "step": 425700 }, { "epoch": 0.5137844271312687, "learning_rate": 8.320852125143765e-06, "loss": 3.0554080200195313, "step": 425800 }, { "epoch": 0.5139050904537514, "learning_rate": 8.320448289676027e-06, "loss": 3.032933349609375, "step": 425900 }, { "epoch": 0.514025753776234, "learning_rate": 8.32004445420829e-06, "loss": 3.0390618896484374, "step": 426000 }, { "epoch": 0.5141464170987168, "learning_rate": 8.319640618740551e-06, "loss": 3.06499755859375, "step": 426100 }, { "epoch": 0.5142670804211995, "learning_rate": 8.319236783272813e-06, "loss": 3.0649758911132814, "step": 426200 }, { "epoch": 0.5143877437436821, "learning_rate": 8.318832947805075e-06, "loss": 3.02170654296875, "step": 426300 }, { "epoch": 0.5145084070661649, "learning_rate": 8.318429112337336e-06, "loss": 3.04176025390625, "step": 426400 }, { "epoch": 0.5146290703886475, "learning_rate": 8.318025276869598e-06, "loss": 3.058222351074219, "step": 426500 }, { "epoch": 0.5147497337111302, "learning_rate": 8.317621441401858e-06, "loss": 3.045534973144531, "step": 426600 }, { "epoch": 0.5148703970336129, "learning_rate": 8.31721760593412e-06, "loss": 3.05906982421875, "step": 426700 }, { "epoch": 0.5149910603560955, "learning_rate": 8.316813770466382e-06, "loss": 3.0301718139648437, "step": 426800 }, { "epoch": 0.5151117236785783, "learning_rate": 8.316409934998644e-06, "loss": 3.071788330078125, "step": 426900 }, { "epoch": 0.5152323870010609, "learning_rate": 8.316006099530906e-06, "loss": 3.033121337890625, "step": 427000 }, { "epoch": 0.5153530503235436, "learning_rate": 8.315602264063168e-06, "loss": 3.0305520629882814, "step": 427100 }, { "epoch": 0.5154737136460263, "learning_rate": 8.31519842859543e-06, "loss": 3.0346124267578123, "step": 427200 }, { "epoch": 0.515594376968509, "learning_rate": 8.31479459312769e-06, "loss": 3.075622253417969, "step": 427300 }, { "epoch": 0.5157150402909917, "learning_rate": 8.314390757659952e-06, "loss": 3.0046380615234374, "step": 427400 }, { "epoch": 0.5158357036134743, "learning_rate": 8.313986922192214e-06, "loss": 3.0335498046875, "step": 427500 }, { "epoch": 0.515956366935957, "learning_rate": 8.313583086724474e-06, "loss": 3.0385031127929687, "step": 427600 }, { "epoch": 0.5160770302584398, "learning_rate": 8.313179251256736e-06, "loss": 3.0766921997070313, "step": 427700 }, { "epoch": 0.5161976935809224, "learning_rate": 8.312775415788998e-06, "loss": 3.0377151489257814, "step": 427800 }, { "epoch": 0.5163183569034051, "learning_rate": 8.31237158032126e-06, "loss": 3.0509808349609373, "step": 427900 }, { "epoch": 0.5164390202258877, "learning_rate": 8.311967744853522e-06, "loss": 3.0555560302734377, "step": 428000 }, { "epoch": 0.5165596835483705, "learning_rate": 8.311563909385784e-06, "loss": 3.039304504394531, "step": 428100 }, { "epoch": 0.5166803468708532, "learning_rate": 8.311160073918044e-06, "loss": 3.058705139160156, "step": 428200 }, { "epoch": 0.5168010101933358, "learning_rate": 8.310756238450306e-06, "loss": 3.056860046386719, "step": 428300 }, { "epoch": 0.5169216735158185, "learning_rate": 8.310352402982568e-06, "loss": 3.046229248046875, "step": 428400 }, { "epoch": 0.5170423368383011, "learning_rate": 8.309948567514829e-06, "loss": 3.0511959838867186, "step": 428500 }, { "epoch": 0.5171630001607839, "learning_rate": 8.30954473204709e-06, "loss": 3.0641293334960937, "step": 428600 }, { "epoch": 0.5172836634832666, "learning_rate": 8.309140896579353e-06, "loss": 3.054437255859375, "step": 428700 }, { "epoch": 0.5174043268057492, "learning_rate": 8.308737061111615e-06, "loss": 3.0301165771484375, "step": 428800 }, { "epoch": 0.5175249901282319, "learning_rate": 8.308333225643877e-06, "loss": 3.0498062133789063, "step": 428900 }, { "epoch": 0.5176456534507146, "learning_rate": 8.307929390176137e-06, "loss": 3.0663275146484374, "step": 429000 }, { "epoch": 0.5177663167731973, "learning_rate": 8.307525554708399e-06, "loss": 3.061188049316406, "step": 429100 }, { "epoch": 0.51788698009568, "learning_rate": 8.307121719240661e-06, "loss": 3.045030212402344, "step": 429200 }, { "epoch": 0.5180076434181626, "learning_rate": 8.306717883772923e-06, "loss": 3.0660830688476564, "step": 429300 }, { "epoch": 0.5181283067406454, "learning_rate": 8.306314048305185e-06, "loss": 3.072074279785156, "step": 429400 }, { "epoch": 0.518248970063128, "learning_rate": 8.305910212837445e-06, "loss": 3.0510189819335936, "step": 429500 }, { "epoch": 0.5183696333856107, "learning_rate": 8.305506377369707e-06, "loss": 3.0200775146484373, "step": 429600 }, { "epoch": 0.5184902967080934, "learning_rate": 8.305102541901969e-06, "loss": 3.0297467041015627, "step": 429700 }, { "epoch": 0.518610960030576, "learning_rate": 8.30469870643423e-06, "loss": 3.053097839355469, "step": 429800 }, { "epoch": 0.5187316233530588, "learning_rate": 8.304294870966491e-06, "loss": 3.050734558105469, "step": 429900 }, { "epoch": 0.5188522866755415, "learning_rate": 8.303891035498753e-06, "loss": 3.05365234375, "step": 430000 }, { "epoch": 0.5189729499980241, "learning_rate": 8.303487200031015e-06, "loss": 3.0288882446289063, "step": 430100 }, { "epoch": 0.5190936133205069, "learning_rate": 8.303083364563277e-06, "loss": 3.063024597167969, "step": 430200 }, { "epoch": 0.5192142766429895, "learning_rate": 8.30267952909554e-06, "loss": 3.037414855957031, "step": 430300 }, { "epoch": 0.5193349399654722, "learning_rate": 8.3022756936278e-06, "loss": 3.055743408203125, "step": 430400 }, { "epoch": 0.5194556032879549, "learning_rate": 8.301871858160062e-06, "loss": 3.052115173339844, "step": 430500 }, { "epoch": 0.5195762666104375, "learning_rate": 8.301468022692324e-06, "loss": 3.0498760986328124, "step": 430600 }, { "epoch": 0.5196969299329203, "learning_rate": 8.301064187224584e-06, "loss": 3.0660003662109374, "step": 430700 }, { "epoch": 0.5198175932554029, "learning_rate": 8.300660351756846e-06, "loss": 3.0593902587890627, "step": 430800 }, { "epoch": 0.5199382565778856, "learning_rate": 8.300256516289108e-06, "loss": 3.0359820556640624, "step": 430900 }, { "epoch": 0.5200589199003683, "learning_rate": 8.29985268082137e-06, "loss": 3.044608154296875, "step": 431000 }, { "epoch": 0.520179583222851, "learning_rate": 8.299448845353632e-06, "loss": 3.043662109375, "step": 431100 }, { "epoch": 0.5203002465453337, "learning_rate": 8.299045009885894e-06, "loss": 3.0331790161132814, "step": 431200 }, { "epoch": 0.5204209098678163, "learning_rate": 8.298641174418156e-06, "loss": 3.06168212890625, "step": 431300 }, { "epoch": 0.520541573190299, "learning_rate": 8.298237338950416e-06, "loss": 3.0216925048828127, "step": 431400 }, { "epoch": 0.5206622365127818, "learning_rate": 8.297833503482678e-06, "loss": 3.04521728515625, "step": 431500 }, { "epoch": 0.5207828998352644, "learning_rate": 8.297429668014938e-06, "loss": 3.06349365234375, "step": 431600 }, { "epoch": 0.5209035631577471, "learning_rate": 8.2970258325472e-06, "loss": 3.015486145019531, "step": 431700 }, { "epoch": 0.5210242264802297, "learning_rate": 8.296621997079462e-06, "loss": 3.049866027832031, "step": 431800 }, { "epoch": 0.5211448898027125, "learning_rate": 8.296218161611724e-06, "loss": 3.0094125366210935, "step": 431900 }, { "epoch": 0.5212655531251952, "learning_rate": 8.295814326143986e-06, "loss": 3.06577880859375, "step": 432000 }, { "epoch": 0.5213862164476778, "learning_rate": 8.295410490676248e-06, "loss": 3.033587646484375, "step": 432100 }, { "epoch": 0.5215068797701605, "learning_rate": 8.29500665520851e-06, "loss": 3.037728576660156, "step": 432200 }, { "epoch": 0.5216275430926431, "learning_rate": 8.29460281974077e-06, "loss": 3.038385314941406, "step": 432300 }, { "epoch": 0.5217482064151259, "learning_rate": 8.294198984273032e-06, "loss": 3.0494979858398437, "step": 432400 }, { "epoch": 0.5218688697376086, "learning_rate": 8.293795148805294e-06, "loss": 3.053844299316406, "step": 432500 }, { "epoch": 0.5219895330600912, "learning_rate": 8.293391313337555e-06, "loss": 3.019091796875, "step": 432600 }, { "epoch": 0.5221101963825739, "learning_rate": 8.292987477869817e-06, "loss": 3.035799560546875, "step": 432700 }, { "epoch": 0.5222308597050566, "learning_rate": 8.292583642402079e-06, "loss": 3.0246429443359375, "step": 432800 }, { "epoch": 0.5223515230275393, "learning_rate": 8.29217980693434e-06, "loss": 3.0304010009765623, "step": 432900 }, { "epoch": 0.522472186350022, "learning_rate": 8.291775971466603e-06, "loss": 3.0269244384765623, "step": 433000 }, { "epoch": 0.5225928496725046, "learning_rate": 8.291372135998863e-06, "loss": 3.0511712646484375, "step": 433100 }, { "epoch": 0.5227135129949874, "learning_rate": 8.290968300531125e-06, "loss": 3.0312127685546875, "step": 433200 }, { "epoch": 0.52283417631747, "learning_rate": 8.290564465063387e-06, "loss": 3.023028564453125, "step": 433300 }, { "epoch": 0.5229548396399527, "learning_rate": 8.290160629595649e-06, "loss": 3.01251220703125, "step": 433400 }, { "epoch": 0.5230755029624354, "learning_rate": 8.28975679412791e-06, "loss": 3.0403378295898436, "step": 433500 }, { "epoch": 0.523196166284918, "learning_rate": 8.289352958660171e-06, "loss": 3.037583923339844, "step": 433600 }, { "epoch": 0.5233168296074008, "learning_rate": 8.288949123192433e-06, "loss": 3.052095947265625, "step": 433700 }, { "epoch": 0.5234374929298834, "learning_rate": 8.288545287724695e-06, "loss": 3.0461572265625, "step": 433800 }, { "epoch": 0.5235581562523661, "learning_rate": 8.288141452256955e-06, "loss": 3.0304461669921876, "step": 433900 }, { "epoch": 0.5236788195748489, "learning_rate": 8.287737616789217e-06, "loss": 3.0209609985351564, "step": 434000 }, { "epoch": 0.5237994828973315, "learning_rate": 8.28733378132148e-06, "loss": 3.01710205078125, "step": 434100 }, { "epoch": 0.5239201462198142, "learning_rate": 8.286929945853741e-06, "loss": 3.0505917358398436, "step": 434200 }, { "epoch": 0.5240408095422968, "learning_rate": 8.286526110386003e-06, "loss": 3.0195462036132814, "step": 434300 }, { "epoch": 0.5241614728647795, "learning_rate": 8.286122274918265e-06, "loss": 3.0492449951171876, "step": 434400 }, { "epoch": 0.5242821361872623, "learning_rate": 8.285718439450526e-06, "loss": 3.0434799194335938, "step": 434500 }, { "epoch": 0.5244027995097449, "learning_rate": 8.285314603982788e-06, "loss": 3.0262298583984375, "step": 434600 }, { "epoch": 0.5245234628322276, "learning_rate": 8.284910768515048e-06, "loss": 3.0278640747070313, "step": 434700 }, { "epoch": 0.5246441261547103, "learning_rate": 8.28450693304731e-06, "loss": 3.027030334472656, "step": 434800 }, { "epoch": 0.524764789477193, "learning_rate": 8.284103097579572e-06, "loss": 3.0209881591796877, "step": 434900 }, { "epoch": 0.5248854527996757, "learning_rate": 8.283699262111834e-06, "loss": 3.0090411376953123, "step": 435000 }, { "epoch": 0.5250061161221583, "learning_rate": 8.283295426644096e-06, "loss": 3.0484347534179688, "step": 435100 }, { "epoch": 0.525126779444641, "learning_rate": 8.282891591176358e-06, "loss": 3.029527282714844, "step": 435200 }, { "epoch": 0.5252474427671238, "learning_rate": 8.28248775570862e-06, "loss": 3.046122741699219, "step": 435300 }, { "epoch": 0.5253681060896064, "learning_rate": 8.282083920240882e-06, "loss": 3.0437503051757813, "step": 435400 }, { "epoch": 0.5254887694120891, "learning_rate": 8.281680084773142e-06, "loss": 3.017331237792969, "step": 435500 }, { "epoch": 0.5256094327345717, "learning_rate": 8.281276249305404e-06, "loss": 3.019862060546875, "step": 435600 }, { "epoch": 0.5257300960570545, "learning_rate": 8.280872413837664e-06, "loss": 3.0174725341796873, "step": 435700 }, { "epoch": 0.5258507593795372, "learning_rate": 8.280468578369926e-06, "loss": 3.0225360107421877, "step": 435800 }, { "epoch": 0.5259714227020198, "learning_rate": 8.280064742902188e-06, "loss": 3.048797607421875, "step": 435900 }, { "epoch": 0.5260920860245025, "learning_rate": 8.27966090743445e-06, "loss": 3.0422622680664064, "step": 436000 }, { "epoch": 0.5262127493469851, "learning_rate": 8.279257071966712e-06, "loss": 3.029744873046875, "step": 436100 }, { "epoch": 0.5263334126694679, "learning_rate": 8.278853236498974e-06, "loss": 3.026267395019531, "step": 436200 }, { "epoch": 0.5264540759919506, "learning_rate": 8.278449401031235e-06, "loss": 3.0416055297851563, "step": 436300 }, { "epoch": 0.5265747393144332, "learning_rate": 8.278045565563496e-06, "loss": 3.0519058227539064, "step": 436400 }, { "epoch": 0.5266954026369159, "learning_rate": 8.277641730095758e-06, "loss": 3.054364013671875, "step": 436500 }, { "epoch": 0.5268160659593986, "learning_rate": 8.27723789462802e-06, "loss": 3.0086798095703124, "step": 436600 }, { "epoch": 0.5269367292818813, "learning_rate": 8.27683405916028e-06, "loss": 3.0447116088867188, "step": 436700 }, { "epoch": 0.527057392604364, "learning_rate": 8.276430223692543e-06, "loss": 3.039418029785156, "step": 436800 }, { "epoch": 0.5271780559268466, "learning_rate": 8.276026388224805e-06, "loss": 3.0420828247070313, "step": 436900 }, { "epoch": 0.5272987192493294, "learning_rate": 8.275622552757067e-06, "loss": 3.056221618652344, "step": 437000 }, { "epoch": 0.527419382571812, "learning_rate": 8.275218717289327e-06, "loss": 3.032608947753906, "step": 437100 }, { "epoch": 0.5275400458942947, "learning_rate": 8.274814881821589e-06, "loss": 3.0226190185546873, "step": 437200 }, { "epoch": 0.5276607092167774, "learning_rate": 8.274411046353851e-06, "loss": 2.998238830566406, "step": 437300 }, { "epoch": 0.52778137253926, "learning_rate": 8.274007210886113e-06, "loss": 3.0441619873046877, "step": 437400 }, { "epoch": 0.5279020358617428, "learning_rate": 8.273603375418375e-06, "loss": 3.0439849853515626, "step": 437500 }, { "epoch": 0.5280226991842254, "learning_rate": 8.273199539950635e-06, "loss": 3.0543450927734375, "step": 437600 }, { "epoch": 0.5281433625067081, "learning_rate": 8.272795704482897e-06, "loss": 3.020230407714844, "step": 437700 }, { "epoch": 0.5282640258291909, "learning_rate": 8.27239186901516e-06, "loss": 3.038050231933594, "step": 437800 }, { "epoch": 0.5283846891516735, "learning_rate": 8.271988033547421e-06, "loss": 3.021733703613281, "step": 437900 }, { "epoch": 0.5285053524741562, "learning_rate": 8.271584198079681e-06, "loss": 3.029966125488281, "step": 438000 }, { "epoch": 0.5286260157966388, "learning_rate": 8.271180362611943e-06, "loss": 3.053952331542969, "step": 438100 }, { "epoch": 0.5287466791191215, "learning_rate": 8.270776527144205e-06, "loss": 3.02169677734375, "step": 438200 }, { "epoch": 0.5288673424416043, "learning_rate": 8.270372691676467e-06, "loss": 3.0531158447265625, "step": 438300 }, { "epoch": 0.5289880057640869, "learning_rate": 8.26996885620873e-06, "loss": 3.0478030395507814, "step": 438400 }, { "epoch": 0.5291086690865696, "learning_rate": 8.269565020740991e-06, "loss": 3.021881103515625, "step": 438500 }, { "epoch": 0.5292293324090522, "learning_rate": 8.269161185273252e-06, "loss": 3.0300494384765626, "step": 438600 }, { "epoch": 0.529349995731535, "learning_rate": 8.268757349805514e-06, "loss": 3.0104168701171874, "step": 438700 }, { "epoch": 0.5294706590540177, "learning_rate": 8.268353514337774e-06, "loss": 3.020096740722656, "step": 438800 }, { "epoch": 0.5295913223765003, "learning_rate": 8.267949678870036e-06, "loss": 3.0495291137695313, "step": 438900 }, { "epoch": 0.529711985698983, "learning_rate": 8.267545843402298e-06, "loss": 3.0659521484375, "step": 439000 }, { "epoch": 0.5298326490214657, "learning_rate": 8.26714200793456e-06, "loss": 3.0177215576171874, "step": 439100 }, { "epoch": 0.5299533123439484, "learning_rate": 8.266738172466822e-06, "loss": 3.036053466796875, "step": 439200 }, { "epoch": 0.5300739756664311, "learning_rate": 8.266334336999084e-06, "loss": 3.007360534667969, "step": 439300 }, { "epoch": 0.5301946389889137, "learning_rate": 8.265930501531346e-06, "loss": 3.0053591918945313, "step": 439400 }, { "epoch": 0.5303153023113965, "learning_rate": 8.265526666063606e-06, "loss": 3.043965148925781, "step": 439500 }, { "epoch": 0.5304359656338791, "learning_rate": 8.265122830595868e-06, "loss": 3.0373468017578125, "step": 439600 }, { "epoch": 0.5305566289563618, "learning_rate": 8.26471899512813e-06, "loss": 3.0461749267578124, "step": 439700 }, { "epoch": 0.5306772922788445, "learning_rate": 8.26431515966039e-06, "loss": 3.0115863037109376, "step": 439800 }, { "epoch": 0.5307979556013271, "learning_rate": 8.263911324192652e-06, "loss": 3.0024359130859377, "step": 439900 }, { "epoch": 0.5309186189238099, "learning_rate": 8.263507488724914e-06, "loss": 3.021661682128906, "step": 440000 }, { "epoch": 0.5310392822462926, "learning_rate": 8.263103653257176e-06, "loss": 3.026658630371094, "step": 440100 }, { "epoch": 0.5311599455687752, "learning_rate": 8.262699817789438e-06, "loss": 3.0172085571289062, "step": 440200 }, { "epoch": 0.5312806088912579, "learning_rate": 8.2622959823217e-06, "loss": 3.02299560546875, "step": 440300 }, { "epoch": 0.5314012722137406, "learning_rate": 8.26189214685396e-06, "loss": 3.0163613891601564, "step": 440400 }, { "epoch": 0.5315219355362233, "learning_rate": 8.261488311386223e-06, "loss": 3.043457336425781, "step": 440500 }, { "epoch": 0.531642598858706, "learning_rate": 8.261084475918485e-06, "loss": 3.0227670288085937, "step": 440600 }, { "epoch": 0.5317632621811886, "learning_rate": 8.260680640450745e-06, "loss": 3.02986328125, "step": 440700 }, { "epoch": 0.5318839255036714, "learning_rate": 8.260276804983007e-06, "loss": 3.028037414550781, "step": 440800 }, { "epoch": 0.532004588826154, "learning_rate": 8.259872969515269e-06, "loss": 3.01552490234375, "step": 440900 }, { "epoch": 0.5321252521486367, "learning_rate": 8.25946913404753e-06, "loss": 3.027689208984375, "step": 441000 }, { "epoch": 0.5322459154711194, "learning_rate": 8.259065298579793e-06, "loss": 3.02337158203125, "step": 441100 }, { "epoch": 0.532366578793602, "learning_rate": 8.258661463112053e-06, "loss": 3.002225036621094, "step": 441200 }, { "epoch": 0.5324872421160848, "learning_rate": 8.258257627644315e-06, "loss": 3.015375671386719, "step": 441300 }, { "epoch": 0.5326079054385674, "learning_rate": 8.257853792176577e-06, "loss": 3.0085568237304687, "step": 441400 }, { "epoch": 0.5327285687610501, "learning_rate": 8.257449956708839e-06, "loss": 3.029344482421875, "step": 441500 }, { "epoch": 0.5328492320835329, "learning_rate": 8.257046121241101e-06, "loss": 3.0445382690429685, "step": 441600 }, { "epoch": 0.5329698954060155, "learning_rate": 8.256642285773361e-06, "loss": 3.036221923828125, "step": 441700 }, { "epoch": 0.5330905587284982, "learning_rate": 8.256238450305623e-06, "loss": 3.022719421386719, "step": 441800 }, { "epoch": 0.5332112220509808, "learning_rate": 8.255834614837885e-06, "loss": 3.015985107421875, "step": 441900 }, { "epoch": 0.5333318853734635, "learning_rate": 8.255430779370145e-06, "loss": 3.007535095214844, "step": 442000 }, { "epoch": 0.5334525486959463, "learning_rate": 8.255026943902407e-06, "loss": 2.9976519775390624, "step": 442100 }, { "epoch": 0.5335732120184289, "learning_rate": 8.25462310843467e-06, "loss": 3.026825256347656, "step": 442200 }, { "epoch": 0.5336938753409116, "learning_rate": 8.254219272966931e-06, "loss": 3.0377377319335936, "step": 442300 }, { "epoch": 0.5338145386633942, "learning_rate": 8.253815437499193e-06, "loss": 3.037503356933594, "step": 442400 }, { "epoch": 0.533935201985877, "learning_rate": 8.253411602031455e-06, "loss": 3.0330621337890626, "step": 442500 }, { "epoch": 0.5340558653083597, "learning_rate": 8.253007766563716e-06, "loss": 3.0423260498046876, "step": 442600 }, { "epoch": 0.5341765286308423, "learning_rate": 8.252603931095978e-06, "loss": 3.013909912109375, "step": 442700 }, { "epoch": 0.534297191953325, "learning_rate": 8.25220009562824e-06, "loss": 3.040461120605469, "step": 442800 }, { "epoch": 0.5344178552758077, "learning_rate": 8.2517962601605e-06, "loss": 3.0267962646484374, "step": 442900 }, { "epoch": 0.5345385185982904, "learning_rate": 8.251392424692762e-06, "loss": 3.031927490234375, "step": 443000 }, { "epoch": 0.5346591819207731, "learning_rate": 8.250988589225024e-06, "loss": 3.0334930419921875, "step": 443100 }, { "epoch": 0.5347798452432557, "learning_rate": 8.250584753757286e-06, "loss": 3.0304254150390624, "step": 443200 }, { "epoch": 0.5349005085657385, "learning_rate": 8.250180918289548e-06, "loss": 3.0278860473632814, "step": 443300 }, { "epoch": 0.5350211718882211, "learning_rate": 8.24977708282181e-06, "loss": 3.04392333984375, "step": 443400 }, { "epoch": 0.5351418352107038, "learning_rate": 8.249373247354072e-06, "loss": 3.0515933227539063, "step": 443500 }, { "epoch": 0.5352624985331865, "learning_rate": 8.248969411886332e-06, "loss": 2.9995220947265624, "step": 443600 }, { "epoch": 0.5353831618556691, "learning_rate": 8.248565576418594e-06, "loss": 3.05199951171875, "step": 443700 }, { "epoch": 0.5355038251781519, "learning_rate": 8.248161740950854e-06, "loss": 3.029063415527344, "step": 443800 }, { "epoch": 0.5356244885006345, "learning_rate": 8.247757905483116e-06, "loss": 3.0162322998046873, "step": 443900 }, { "epoch": 0.5357451518231172, "learning_rate": 8.247354070015378e-06, "loss": 3.0014007568359373, "step": 444000 }, { "epoch": 0.5358658151455999, "learning_rate": 8.24695023454764e-06, "loss": 3.019384765625, "step": 444100 }, { "epoch": 0.5359864784680826, "learning_rate": 8.246546399079902e-06, "loss": 3.014043273925781, "step": 444200 }, { "epoch": 0.5361071417905653, "learning_rate": 8.246142563612164e-06, "loss": 3.0233529663085936, "step": 444300 }, { "epoch": 0.5362278051130479, "learning_rate": 8.245738728144426e-06, "loss": 3.0105099487304687, "step": 444400 }, { "epoch": 0.5363484684355306, "learning_rate": 8.245334892676687e-06, "loss": 3.01185791015625, "step": 444500 }, { "epoch": 0.5364691317580134, "learning_rate": 8.244931057208949e-06, "loss": 3.0508038330078127, "step": 444600 }, { "epoch": 0.536589795080496, "learning_rate": 8.24452722174121e-06, "loss": 3.016676330566406, "step": 444700 }, { "epoch": 0.5367104584029787, "learning_rate": 8.24412338627347e-06, "loss": 3.029635314941406, "step": 444800 }, { "epoch": 0.5368311217254613, "learning_rate": 8.243719550805733e-06, "loss": 3.021878356933594, "step": 444900 }, { "epoch": 0.536951785047944, "learning_rate": 8.243315715337995e-06, "loss": 3.0114556884765626, "step": 445000 }, { "epoch": 0.5370724483704268, "learning_rate": 8.242911879870257e-06, "loss": 3.020982666015625, "step": 445100 }, { "epoch": 0.5371931116929094, "learning_rate": 8.242508044402519e-06, "loss": 3.0232113647460936, "step": 445200 }, { "epoch": 0.5373137750153921, "learning_rate": 8.242104208934779e-06, "loss": 3.005293884277344, "step": 445300 }, { "epoch": 0.5374344383378749, "learning_rate": 8.241700373467041e-06, "loss": 3.03168701171875, "step": 445400 }, { "epoch": 0.5375551016603575, "learning_rate": 8.241296537999303e-06, "loss": 3.009619140625, "step": 445500 }, { "epoch": 0.5376757649828402, "learning_rate": 8.240892702531565e-06, "loss": 3.030387268066406, "step": 445600 }, { "epoch": 0.5377964283053228, "learning_rate": 8.240488867063825e-06, "loss": 3.004181213378906, "step": 445700 }, { "epoch": 0.5379170916278055, "learning_rate": 8.240085031596087e-06, "loss": 3.009443359375, "step": 445800 }, { "epoch": 0.5380377549502883, "learning_rate": 8.23968119612835e-06, "loss": 3.0328079223632813, "step": 445900 }, { "epoch": 0.5381584182727709, "learning_rate": 8.239277360660611e-06, "loss": 3.008001403808594, "step": 446000 }, { "epoch": 0.5382790815952536, "learning_rate": 8.238873525192872e-06, "loss": 3.0023226928710938, "step": 446100 }, { "epoch": 0.5383997449177362, "learning_rate": 8.238469689725134e-06, "loss": 3.0127142333984374, "step": 446200 }, { "epoch": 0.538520408240219, "learning_rate": 8.238065854257395e-06, "loss": 3.0399655151367186, "step": 446300 }, { "epoch": 0.5386410715627017, "learning_rate": 8.237662018789657e-06, "loss": 3.000540771484375, "step": 446400 }, { "epoch": 0.5387617348851843, "learning_rate": 8.23725818332192e-06, "loss": 3.0260101318359376, "step": 446500 }, { "epoch": 0.538882398207667, "learning_rate": 8.236854347854181e-06, "loss": 3.013153381347656, "step": 446600 }, { "epoch": 0.5390030615301497, "learning_rate": 8.236450512386442e-06, "loss": 3.0308767700195314, "step": 446700 }, { "epoch": 0.5391237248526324, "learning_rate": 8.236046676918704e-06, "loss": 3.015799865722656, "step": 446800 }, { "epoch": 0.5392443881751151, "learning_rate": 8.235642841450964e-06, "loss": 3.0192779541015624, "step": 446900 }, { "epoch": 0.5393650514975977, "learning_rate": 8.235239005983226e-06, "loss": 3.0200576782226562, "step": 447000 }, { "epoch": 0.5394857148200805, "learning_rate": 8.234835170515488e-06, "loss": 3.0116571044921874, "step": 447100 }, { "epoch": 0.5396063781425631, "learning_rate": 8.23443133504775e-06, "loss": 3.0280792236328127, "step": 447200 }, { "epoch": 0.5397270414650458, "learning_rate": 8.234027499580012e-06, "loss": 3.02627685546875, "step": 447300 }, { "epoch": 0.5398477047875285, "learning_rate": 8.233623664112274e-06, "loss": 3.011654052734375, "step": 447400 }, { "epoch": 0.5399683681100111, "learning_rate": 8.233219828644536e-06, "loss": 3.0159393310546876, "step": 447500 }, { "epoch": 0.5400890314324939, "learning_rate": 8.232815993176798e-06, "loss": 3.0320013427734374, "step": 447600 }, { "epoch": 0.5402096947549765, "learning_rate": 8.232412157709058e-06, "loss": 2.9989382934570314, "step": 447700 }, { "epoch": 0.5403303580774592, "learning_rate": 8.23200832224132e-06, "loss": 3.0335263061523436, "step": 447800 }, { "epoch": 0.5404510213999419, "learning_rate": 8.23160448677358e-06, "loss": 3.009174499511719, "step": 447900 }, { "epoch": 0.5405716847224246, "learning_rate": 8.231200651305842e-06, "loss": 3.0320751953125, "step": 448000 }, { "epoch": 0.5406923480449073, "learning_rate": 8.230796815838104e-06, "loss": 3.00021728515625, "step": 448100 }, { "epoch": 0.5408130113673899, "learning_rate": 8.230392980370366e-06, "loss": 3.0343118286132813, "step": 448200 }, { "epoch": 0.5409336746898726, "learning_rate": 8.229989144902628e-06, "loss": 3.0097808837890625, "step": 448300 }, { "epoch": 0.5410543380123554, "learning_rate": 8.22958530943489e-06, "loss": 3.0248489379882812, "step": 448400 }, { "epoch": 0.541175001334838, "learning_rate": 8.229181473967152e-06, "loss": 2.9971588134765623, "step": 448500 }, { "epoch": 0.5412956646573207, "learning_rate": 8.228777638499413e-06, "loss": 3.0415640258789063, "step": 448600 }, { "epoch": 0.5414163279798033, "learning_rate": 8.228373803031675e-06, "loss": 3.0337384033203123, "step": 448700 }, { "epoch": 0.541536991302286, "learning_rate": 8.227969967563937e-06, "loss": 3.025321044921875, "step": 448800 }, { "epoch": 0.5416576546247688, "learning_rate": 8.227566132096197e-06, "loss": 3.026483459472656, "step": 448900 }, { "epoch": 0.5417783179472514, "learning_rate": 8.227162296628459e-06, "loss": 3.0326153564453127, "step": 449000 }, { "epoch": 0.5418989812697341, "learning_rate": 8.22675846116072e-06, "loss": 2.998897705078125, "step": 449100 }, { "epoch": 0.5420196445922167, "learning_rate": 8.226354625692983e-06, "loss": 2.9886660766601563, "step": 449200 }, { "epoch": 0.5421403079146995, "learning_rate": 8.225950790225245e-06, "loss": 3.0406594848632813, "step": 449300 }, { "epoch": 0.5422609712371822, "learning_rate": 8.225546954757505e-06, "loss": 3.048433532714844, "step": 449400 }, { "epoch": 0.5423816345596648, "learning_rate": 8.225143119289767e-06, "loss": 3.022899169921875, "step": 449500 }, { "epoch": 0.5425022978821475, "learning_rate": 8.224739283822029e-06, "loss": 3.015343017578125, "step": 449600 }, { "epoch": 0.5426229612046302, "learning_rate": 8.224335448354291e-06, "loss": 3.015889892578125, "step": 449700 }, { "epoch": 0.5427436245271129, "learning_rate": 8.223931612886551e-06, "loss": 3.0024258422851564, "step": 449800 }, { "epoch": 0.5428642878495956, "learning_rate": 8.223527777418813e-06, "loss": 3.009610900878906, "step": 449900 }, { "epoch": 0.5429849511720782, "learning_rate": 8.223123941951075e-06, "loss": 2.999173583984375, "step": 450000 }, { "epoch": 0.543105614494561, "learning_rate": 8.222720106483337e-06, "loss": 3.0015234375, "step": 450100 }, { "epoch": 0.5432262778170436, "learning_rate": 8.222316271015598e-06, "loss": 3.0120281982421875, "step": 450200 }, { "epoch": 0.5433469411395263, "learning_rate": 8.22191243554786e-06, "loss": 2.999786376953125, "step": 450300 }, { "epoch": 0.543467604462009, "learning_rate": 8.221508600080122e-06, "loss": 3.0111660766601562, "step": 450400 }, { "epoch": 0.5435882677844917, "learning_rate": 8.221104764612384e-06, "loss": 3.0109133911132813, "step": 450500 }, { "epoch": 0.5437089311069744, "learning_rate": 8.220700929144645e-06, "loss": 2.984908447265625, "step": 450600 }, { "epoch": 0.5438295944294571, "learning_rate": 8.220297093676907e-06, "loss": 2.9949130249023437, "step": 450700 }, { "epoch": 0.5439502577519397, "learning_rate": 8.219893258209168e-06, "loss": 3.021127014160156, "step": 450800 }, { "epoch": 0.5440709210744225, "learning_rate": 8.21948942274143e-06, "loss": 3.0266192626953123, "step": 450900 }, { "epoch": 0.5441915843969051, "learning_rate": 8.21908558727369e-06, "loss": 3.0105615234375, "step": 451000 }, { "epoch": 0.5443122477193878, "learning_rate": 8.218681751805952e-06, "loss": 3.0360455322265625, "step": 451100 }, { "epoch": 0.5444329110418705, "learning_rate": 8.218277916338214e-06, "loss": 2.9971127319335937, "step": 451200 }, { "epoch": 0.5445535743643531, "learning_rate": 8.217874080870476e-06, "loss": 2.995586242675781, "step": 451300 }, { "epoch": 0.5446742376868359, "learning_rate": 8.217470245402738e-06, "loss": 3.0117559814453125, "step": 451400 }, { "epoch": 0.5447949010093185, "learning_rate": 8.217066409935e-06, "loss": 3.036898498535156, "step": 451500 }, { "epoch": 0.5449155643318012, "learning_rate": 8.216662574467262e-06, "loss": 3.04584228515625, "step": 451600 }, { "epoch": 0.545036227654284, "learning_rate": 8.216258738999522e-06, "loss": 3.030256652832031, "step": 451700 }, { "epoch": 0.5451568909767666, "learning_rate": 8.215854903531784e-06, "loss": 3.0310906982421875, "step": 451800 }, { "epoch": 0.5452775542992493, "learning_rate": 8.215451068064046e-06, "loss": 2.9987249755859375, "step": 451900 }, { "epoch": 0.5453982176217319, "learning_rate": 8.215047232596306e-06, "loss": 2.998523864746094, "step": 452000 }, { "epoch": 0.5455188809442146, "learning_rate": 8.214643397128568e-06, "loss": 3.024566345214844, "step": 452100 }, { "epoch": 0.5456395442666974, "learning_rate": 8.21423956166083e-06, "loss": 3.0222308349609377, "step": 452200 }, { "epoch": 0.54576020758918, "learning_rate": 8.213835726193092e-06, "loss": 3.010903625488281, "step": 452300 }, { "epoch": 0.5458808709116627, "learning_rate": 8.213431890725354e-06, "loss": 3.0244232177734376, "step": 452400 }, { "epoch": 0.5460015342341453, "learning_rate": 8.213028055257616e-06, "loss": 3.0216119384765623, "step": 452500 }, { "epoch": 0.546122197556628, "learning_rate": 8.212624219789877e-06, "loss": 2.999864501953125, "step": 452600 }, { "epoch": 0.5462428608791108, "learning_rate": 8.212220384322139e-06, "loss": 3.0284210205078126, "step": 452700 }, { "epoch": 0.5463635242015934, "learning_rate": 8.2118165488544e-06, "loss": 2.999059143066406, "step": 452800 }, { "epoch": 0.5464841875240761, "learning_rate": 8.211412713386661e-06, "loss": 3.042408142089844, "step": 452900 }, { "epoch": 0.5466048508465587, "learning_rate": 8.211008877918923e-06, "loss": 3.024136962890625, "step": 453000 }, { "epoch": 0.5467255141690415, "learning_rate": 8.210605042451185e-06, "loss": 2.9897027587890626, "step": 453100 }, { "epoch": 0.5468461774915242, "learning_rate": 8.210201206983447e-06, "loss": 3.007030334472656, "step": 453200 }, { "epoch": 0.5469668408140068, "learning_rate": 8.209797371515709e-06, "loss": 3.0133856201171874, "step": 453300 }, { "epoch": 0.5470875041364895, "learning_rate": 8.20939353604797e-06, "loss": 3.0122451782226562, "step": 453400 }, { "epoch": 0.5472081674589722, "learning_rate": 8.208989700580231e-06, "loss": 3.022361145019531, "step": 453500 }, { "epoch": 0.5473288307814549, "learning_rate": 8.208585865112493e-06, "loss": 3.0185812377929686, "step": 453600 }, { "epoch": 0.5474494941039376, "learning_rate": 8.208182029644755e-06, "loss": 2.9914254760742187, "step": 453700 }, { "epoch": 0.5475701574264202, "learning_rate": 8.207778194177017e-06, "loss": 3.001167907714844, "step": 453800 }, { "epoch": 0.547690820748903, "learning_rate": 8.207374358709277e-06, "loss": 3.0201190185546873, "step": 453900 }, { "epoch": 0.5478114840713856, "learning_rate": 8.20697052324154e-06, "loss": 3.0026666259765626, "step": 454000 }, { "epoch": 0.5479321473938683, "learning_rate": 8.206566687773801e-06, "loss": 2.999969787597656, "step": 454100 }, { "epoch": 0.548052810716351, "learning_rate": 8.206162852306063e-06, "loss": 3.0005563354492186, "step": 454200 }, { "epoch": 0.5481734740388337, "learning_rate": 8.205759016838324e-06, "loss": 3.002593994140625, "step": 454300 }, { "epoch": 0.5482941373613164, "learning_rate": 8.205355181370586e-06, "loss": 3.0044915771484373, "step": 454400 }, { "epoch": 0.548414800683799, "learning_rate": 8.204951345902848e-06, "loss": 2.9987005615234374, "step": 454500 }, { "epoch": 0.5485354640062817, "learning_rate": 8.20454751043511e-06, "loss": 3.0016461181640626, "step": 454600 }, { "epoch": 0.5486561273287645, "learning_rate": 8.204143674967372e-06, "loss": 3.0159988403320312, "step": 454700 }, { "epoch": 0.5487767906512471, "learning_rate": 8.203739839499632e-06, "loss": 3.0185556030273437, "step": 454800 }, { "epoch": 0.5488974539737298, "learning_rate": 8.203336004031894e-06, "loss": 2.9955682373046875, "step": 454900 }, { "epoch": 0.5490181172962124, "learning_rate": 8.202932168564156e-06, "loss": 3.0180563354492187, "step": 455000 }, { "epoch": 0.5491387806186951, "learning_rate": 8.202528333096416e-06, "loss": 3.00729248046875, "step": 455100 }, { "epoch": 0.5492594439411779, "learning_rate": 8.202124497628678e-06, "loss": 2.981845703125, "step": 455200 }, { "epoch": 0.5493801072636605, "learning_rate": 8.20172066216094e-06, "loss": 3.0141424560546874, "step": 455300 }, { "epoch": 0.5495007705861432, "learning_rate": 8.201316826693202e-06, "loss": 2.9988238525390627, "step": 455400 }, { "epoch": 0.5496214339086258, "learning_rate": 8.200912991225464e-06, "loss": 3.0104196166992185, "step": 455500 }, { "epoch": 0.5497420972311086, "learning_rate": 8.200509155757726e-06, "loss": 3.0210446166992186, "step": 455600 }, { "epoch": 0.5498627605535913, "learning_rate": 8.200105320289988e-06, "loss": 2.9909295654296875, "step": 455700 }, { "epoch": 0.5499834238760739, "learning_rate": 8.199701484822248e-06, "loss": 3.017538757324219, "step": 455800 }, { "epoch": 0.5501040871985566, "learning_rate": 8.19929764935451e-06, "loss": 3.0219967651367186, "step": 455900 }, { "epoch": 0.5502247505210394, "learning_rate": 8.19889381388677e-06, "loss": 2.9999539184570314, "step": 456000 }, { "epoch": 0.550345413843522, "learning_rate": 8.198489978419033e-06, "loss": 2.9966256713867185, "step": 456100 }, { "epoch": 0.5504660771660047, "learning_rate": 8.198086142951294e-06, "loss": 3.0037548828125, "step": 456200 }, { "epoch": 0.5505867404884873, "learning_rate": 8.197682307483556e-06, "loss": 3.0014892578125, "step": 456300 }, { "epoch": 0.55070740381097, "learning_rate": 8.197278472015818e-06, "loss": 3.0157656860351563, "step": 456400 }, { "epoch": 0.5508280671334528, "learning_rate": 8.19687463654808e-06, "loss": 3.0050479125976564, "step": 456500 }, { "epoch": 0.5509487304559354, "learning_rate": 8.196470801080342e-06, "loss": 2.996612548828125, "step": 456600 }, { "epoch": 0.5510693937784181, "learning_rate": 8.196066965612603e-06, "loss": 3.0021636962890623, "step": 456700 }, { "epoch": 0.5511900571009007, "learning_rate": 8.195663130144865e-06, "loss": 3.01055419921875, "step": 456800 }, { "epoch": 0.5513107204233835, "learning_rate": 8.195259294677127e-06, "loss": 2.991148681640625, "step": 456900 }, { "epoch": 0.5514313837458662, "learning_rate": 8.194855459209387e-06, "loss": 2.985732116699219, "step": 457000 }, { "epoch": 0.5515520470683488, "learning_rate": 8.194451623741649e-06, "loss": 3.0277813720703124, "step": 457100 }, { "epoch": 0.5516727103908315, "learning_rate": 8.194047788273911e-06, "loss": 3.0079150390625, "step": 457200 }, { "epoch": 0.5517933737133142, "learning_rate": 8.193643952806173e-06, "loss": 3.035090026855469, "step": 457300 }, { "epoch": 0.5519140370357969, "learning_rate": 8.193240117338435e-06, "loss": 3.0119354248046877, "step": 457400 }, { "epoch": 0.5520347003582796, "learning_rate": 8.192836281870695e-06, "loss": 3.022391357421875, "step": 457500 }, { "epoch": 0.5521553636807622, "learning_rate": 8.192432446402957e-06, "loss": 2.9878070068359377, "step": 457600 }, { "epoch": 0.552276027003245, "learning_rate": 8.192028610935219e-06, "loss": 2.9676254272460936, "step": 457700 }, { "epoch": 0.5523966903257276, "learning_rate": 8.191624775467481e-06, "loss": 3.000948181152344, "step": 457800 }, { "epoch": 0.5525173536482103, "learning_rate": 8.191220939999741e-06, "loss": 3.0209481811523435, "step": 457900 }, { "epoch": 0.552638016970693, "learning_rate": 8.190817104532003e-06, "loss": 3.016698303222656, "step": 458000 }, { "epoch": 0.5527586802931757, "learning_rate": 8.190413269064265e-06, "loss": 2.993017272949219, "step": 458100 }, { "epoch": 0.5528793436156584, "learning_rate": 8.190009433596527e-06, "loss": 2.995467529296875, "step": 458200 }, { "epoch": 0.553000006938141, "learning_rate": 8.18960559812879e-06, "loss": 2.994551696777344, "step": 458300 }, { "epoch": 0.5531206702606237, "learning_rate": 8.18920176266105e-06, "loss": 2.9993743896484375, "step": 458400 }, { "epoch": 0.5532413335831065, "learning_rate": 8.188797927193312e-06, "loss": 2.995627136230469, "step": 458500 }, { "epoch": 0.5533619969055891, "learning_rate": 8.188394091725574e-06, "loss": 3.0100048828125, "step": 458600 }, { "epoch": 0.5534826602280718, "learning_rate": 8.187990256257836e-06, "loss": 3.0135394287109376, "step": 458700 }, { "epoch": 0.5536033235505544, "learning_rate": 8.187586420790098e-06, "loss": 3.0050653076171874, "step": 458800 }, { "epoch": 0.5537239868730371, "learning_rate": 8.187182585322358e-06, "loss": 2.998879699707031, "step": 458900 }, { "epoch": 0.5538446501955199, "learning_rate": 8.18677874985462e-06, "loss": 3.0019467163085936, "step": 459000 }, { "epoch": 0.5539653135180025, "learning_rate": 8.186374914386882e-06, "loss": 2.9818710327148437, "step": 459100 }, { "epoch": 0.5540859768404852, "learning_rate": 8.185971078919142e-06, "loss": 3.015633544921875, "step": 459200 }, { "epoch": 0.5542066401629678, "learning_rate": 8.185567243451404e-06, "loss": 2.962353515625, "step": 459300 }, { "epoch": 0.5543273034854506, "learning_rate": 8.185163407983666e-06, "loss": 3.020951232910156, "step": 459400 }, { "epoch": 0.5544479668079333, "learning_rate": 8.184759572515928e-06, "loss": 2.986156005859375, "step": 459500 }, { "epoch": 0.5545686301304159, "learning_rate": 8.18435573704819e-06, "loss": 2.994339599609375, "step": 459600 }, { "epoch": 0.5546892934528986, "learning_rate": 8.183951901580452e-06, "loss": 3.0034249877929686, "step": 459700 }, { "epoch": 0.5548099567753813, "learning_rate": 8.183548066112712e-06, "loss": 3.004940185546875, "step": 459800 }, { "epoch": 0.554930620097864, "learning_rate": 8.183144230644974e-06, "loss": 2.9959375, "step": 459900 }, { "epoch": 0.5550512834203467, "learning_rate": 8.182740395177236e-06, "loss": 3.0019882202148436, "step": 460000 }, { "epoch": 0.5551719467428293, "learning_rate": 8.182336559709497e-06, "loss": 2.9806918334960937, "step": 460100 }, { "epoch": 0.555292610065312, "learning_rate": 8.181932724241759e-06, "loss": 3.010456237792969, "step": 460200 }, { "epoch": 0.5554132733877947, "learning_rate": 8.18152888877402e-06, "loss": 3.018319396972656, "step": 460300 }, { "epoch": 0.5555339367102774, "learning_rate": 8.181125053306282e-06, "loss": 3.0150662231445313, "step": 460400 }, { "epoch": 0.5556546000327601, "learning_rate": 8.180721217838544e-06, "loss": 3.0147088623046874, "step": 460500 }, { "epoch": 0.5557752633552427, "learning_rate": 8.180317382370806e-06, "loss": 2.984632568359375, "step": 460600 }, { "epoch": 0.5558959266777255, "learning_rate": 8.179913546903068e-06, "loss": 3.0083657836914064, "step": 460700 }, { "epoch": 0.5560165900002082, "learning_rate": 8.179509711435329e-06, "loss": 2.98829833984375, "step": 460800 }, { "epoch": 0.5561372533226908, "learning_rate": 8.17910587596759e-06, "loss": 3.0026199340820314, "step": 460900 }, { "epoch": 0.5562579166451735, "learning_rate": 8.178702040499851e-06, "loss": 2.98964599609375, "step": 461000 }, { "epoch": 0.5563785799676562, "learning_rate": 8.178298205032113e-06, "loss": 2.9768099975585938, "step": 461100 }, { "epoch": 0.5564992432901389, "learning_rate": 8.177894369564375e-06, "loss": 3.0057339477539062, "step": 461200 }, { "epoch": 0.5566199066126216, "learning_rate": 8.177490534096637e-06, "loss": 3.015718688964844, "step": 461300 }, { "epoch": 0.5567405699351042, "learning_rate": 8.177086698628899e-06, "loss": 3.009690246582031, "step": 461400 }, { "epoch": 0.556861233257587, "learning_rate": 8.176682863161161e-06, "loss": 2.9791058349609374, "step": 461500 }, { "epoch": 0.5569818965800696, "learning_rate": 8.176279027693421e-06, "loss": 2.999722595214844, "step": 461600 }, { "epoch": 0.5571025599025523, "learning_rate": 8.175875192225683e-06, "loss": 3.000059814453125, "step": 461700 }, { "epoch": 0.557223223225035, "learning_rate": 8.175471356757945e-06, "loss": 3.0044793701171875, "step": 461800 }, { "epoch": 0.5573438865475177, "learning_rate": 8.175067521290207e-06, "loss": 3.0161895751953125, "step": 461900 }, { "epoch": 0.5574645498700004, "learning_rate": 8.174663685822467e-06, "loss": 2.9899432373046877, "step": 462000 }, { "epoch": 0.557585213192483, "learning_rate": 8.17425985035473e-06, "loss": 2.975271911621094, "step": 462100 }, { "epoch": 0.5577058765149657, "learning_rate": 8.173856014886991e-06, "loss": 3.000601501464844, "step": 462200 }, { "epoch": 0.5578265398374485, "learning_rate": 8.173452179419253e-06, "loss": 2.9855050659179687, "step": 462300 }, { "epoch": 0.5579472031599311, "learning_rate": 8.173048343951514e-06, "loss": 3.002107849121094, "step": 462400 }, { "epoch": 0.5580678664824138, "learning_rate": 8.172644508483776e-06, "loss": 3.0097360229492187, "step": 462500 }, { "epoch": 0.5581885298048964, "learning_rate": 8.172240673016038e-06, "loss": 3.001328430175781, "step": 462600 }, { "epoch": 0.5583091931273791, "learning_rate": 8.1718368375483e-06, "loss": 3.019193420410156, "step": 462700 }, { "epoch": 0.5584298564498619, "learning_rate": 8.171433002080562e-06, "loss": 2.9669720458984377, "step": 462800 }, { "epoch": 0.5585505197723445, "learning_rate": 8.171029166612824e-06, "loss": 3.005193786621094, "step": 462900 }, { "epoch": 0.5586711830948272, "learning_rate": 8.170625331145084e-06, "loss": 3.0114401245117186, "step": 463000 }, { "epoch": 0.5587918464173098, "learning_rate": 8.170221495677346e-06, "loss": 2.997593994140625, "step": 463100 }, { "epoch": 0.5589125097397926, "learning_rate": 8.169817660209608e-06, "loss": 3.00738037109375, "step": 463200 }, { "epoch": 0.5590331730622753, "learning_rate": 8.169413824741868e-06, "loss": 2.9959030151367188, "step": 463300 }, { "epoch": 0.5591538363847579, "learning_rate": 8.16900998927413e-06, "loss": 3.008182373046875, "step": 463400 }, { "epoch": 0.5592744997072406, "learning_rate": 8.168606153806392e-06, "loss": 2.9801837158203126, "step": 463500 }, { "epoch": 0.5593951630297233, "learning_rate": 8.168202318338654e-06, "loss": 3.0317446899414064, "step": 463600 }, { "epoch": 0.559515826352206, "learning_rate": 8.167798482870916e-06, "loss": 3.0086660766601563, "step": 463700 }, { "epoch": 0.5596364896746887, "learning_rate": 8.167394647403178e-06, "loss": 2.987573547363281, "step": 463800 }, { "epoch": 0.5597571529971713, "learning_rate": 8.166990811935438e-06, "loss": 3.0176132202148436, "step": 463900 }, { "epoch": 0.559877816319654, "learning_rate": 8.1665869764677e-06, "loss": 2.9872970581054688, "step": 464000 }, { "epoch": 0.5599984796421367, "learning_rate": 8.166183140999962e-06, "loss": 3.016565856933594, "step": 464100 }, { "epoch": 0.5601191429646194, "learning_rate": 8.165779305532223e-06, "loss": 3.0058441162109375, "step": 464200 }, { "epoch": 0.5602398062871021, "learning_rate": 8.165375470064485e-06, "loss": 3.0088265991210936, "step": 464300 }, { "epoch": 0.5603604696095847, "learning_rate": 8.164971634596747e-06, "loss": 2.96726806640625, "step": 464400 }, { "epoch": 0.5604811329320675, "learning_rate": 8.164567799129009e-06, "loss": 2.9828610229492187, "step": 464500 }, { "epoch": 0.5606017962545501, "learning_rate": 8.16416396366127e-06, "loss": 2.9877239990234377, "step": 464600 }, { "epoch": 0.5607224595770328, "learning_rate": 8.163760128193532e-06, "loss": 2.983226013183594, "step": 464700 }, { "epoch": 0.5608431228995155, "learning_rate": 8.163356292725794e-06, "loss": 2.9693008422851563, "step": 464800 }, { "epoch": 0.5609637862219982, "learning_rate": 8.162952457258055e-06, "loss": 3.003946533203125, "step": 464900 }, { "epoch": 0.5610844495444809, "learning_rate": 8.162548621790317e-06, "loss": 3.010050048828125, "step": 465000 }, { "epoch": 0.5612051128669635, "learning_rate": 8.162144786322577e-06, "loss": 2.9866204833984376, "step": 465100 }, { "epoch": 0.5613257761894462, "learning_rate": 8.161740950854839e-06, "loss": 3.003884582519531, "step": 465200 }, { "epoch": 0.561446439511929, "learning_rate": 8.161337115387101e-06, "loss": 2.975133361816406, "step": 465300 }, { "epoch": 0.5615671028344116, "learning_rate": 8.160933279919363e-06, "loss": 3.00321044921875, "step": 465400 }, { "epoch": 0.5616877661568943, "learning_rate": 8.160529444451625e-06, "loss": 2.9761087036132814, "step": 465500 }, { "epoch": 0.5618084294793769, "learning_rate": 8.160125608983887e-06, "loss": 2.9978091430664064, "step": 465600 }, { "epoch": 0.5619290928018597, "learning_rate": 8.159721773516147e-06, "loss": 2.985066223144531, "step": 465700 }, { "epoch": 0.5620497561243424, "learning_rate": 8.15931793804841e-06, "loss": 2.9695587158203125, "step": 465800 }, { "epoch": 0.562170419446825, "learning_rate": 8.158914102580671e-06, "loss": 2.9904751586914062, "step": 465900 }, { "epoch": 0.5622910827693077, "learning_rate": 8.158510267112933e-06, "loss": 2.987451171875, "step": 466000 }, { "epoch": 0.5624117460917905, "learning_rate": 8.158106431645193e-06, "loss": 2.9501666259765624, "step": 466100 }, { "epoch": 0.5625324094142731, "learning_rate": 8.157702596177455e-06, "loss": 2.9546029663085935, "step": 466200 }, { "epoch": 0.5626530727367558, "learning_rate": 8.157298760709717e-06, "loss": 2.993612976074219, "step": 466300 }, { "epoch": 0.5627737360592384, "learning_rate": 8.15689492524198e-06, "loss": 3.017295227050781, "step": 466400 }, { "epoch": 0.5628943993817211, "learning_rate": 8.15649108977424e-06, "loss": 3.006566162109375, "step": 466500 }, { "epoch": 0.5630150627042039, "learning_rate": 8.156087254306502e-06, "loss": 2.995247497558594, "step": 466600 }, { "epoch": 0.5631357260266865, "learning_rate": 8.155683418838764e-06, "loss": 2.965714111328125, "step": 466700 }, { "epoch": 0.5632563893491692, "learning_rate": 8.155279583371026e-06, "loss": 2.9988967895507814, "step": 466800 }, { "epoch": 0.5633770526716518, "learning_rate": 8.154875747903288e-06, "loss": 2.9797158813476563, "step": 466900 }, { "epoch": 0.5634977159941346, "learning_rate": 8.154471912435548e-06, "loss": 3.0074114990234375, "step": 467000 }, { "epoch": 0.5636183793166173, "learning_rate": 8.15406807696781e-06, "loss": 2.9966064453125, "step": 467100 }, { "epoch": 0.5637390426390999, "learning_rate": 8.153664241500072e-06, "loss": 3.0003421020507814, "step": 467200 }, { "epoch": 0.5638597059615826, "learning_rate": 8.153260406032332e-06, "loss": 2.9827456665039063, "step": 467300 }, { "epoch": 0.5639803692840653, "learning_rate": 8.152856570564594e-06, "loss": 3.0229400634765624, "step": 467400 }, { "epoch": 0.564101032606548, "learning_rate": 8.152452735096856e-06, "loss": 2.9976632690429685, "step": 467500 }, { "epoch": 0.5642216959290307, "learning_rate": 8.152048899629118e-06, "loss": 2.972752685546875, "step": 467600 }, { "epoch": 0.5643423592515133, "learning_rate": 8.15164506416138e-06, "loss": 3.000854797363281, "step": 467700 }, { "epoch": 0.564463022573996, "learning_rate": 8.151241228693642e-06, "loss": 2.971127624511719, "step": 467800 }, { "epoch": 0.5645836858964787, "learning_rate": 8.150837393225904e-06, "loss": 3.0021893310546877, "step": 467900 }, { "epoch": 0.5647043492189614, "learning_rate": 8.150433557758164e-06, "loss": 2.97356689453125, "step": 468000 }, { "epoch": 0.5648250125414441, "learning_rate": 8.150029722290426e-06, "loss": 3.009740905761719, "step": 468100 }, { "epoch": 0.5649456758639267, "learning_rate": 8.149625886822687e-06, "loss": 2.9869815063476564, "step": 468200 }, { "epoch": 0.5650663391864095, "learning_rate": 8.149222051354949e-06, "loss": 2.9912185668945312, "step": 468300 }, { "epoch": 0.5651870025088921, "learning_rate": 8.14881821588721e-06, "loss": 2.983764343261719, "step": 468400 }, { "epoch": 0.5653076658313748, "learning_rate": 8.148414380419473e-06, "loss": 2.9786697387695313, "step": 468500 }, { "epoch": 0.5654283291538575, "learning_rate": 8.148010544951735e-06, "loss": 2.9820037841796876, "step": 468600 }, { "epoch": 0.5655489924763402, "learning_rate": 8.147606709483997e-06, "loss": 2.9766241455078126, "step": 468700 }, { "epoch": 0.5656696557988229, "learning_rate": 8.147202874016259e-06, "loss": 2.991668395996094, "step": 468800 }, { "epoch": 0.5657903191213055, "learning_rate": 8.146799038548519e-06, "loss": 2.982549743652344, "step": 468900 }, { "epoch": 0.5659109824437882, "learning_rate": 8.14639520308078e-06, "loss": 2.9765692138671875, "step": 469000 }, { "epoch": 0.566031645766271, "learning_rate": 8.145991367613043e-06, "loss": 3.021697998046875, "step": 469100 }, { "epoch": 0.5661523090887536, "learning_rate": 8.145587532145303e-06, "loss": 2.99116455078125, "step": 469200 }, { "epoch": 0.5662729724112363, "learning_rate": 8.145183696677565e-06, "loss": 2.9649371337890624, "step": 469300 }, { "epoch": 0.5663936357337189, "learning_rate": 8.144779861209827e-06, "loss": 2.9671444702148437, "step": 469400 }, { "epoch": 0.5665142990562017, "learning_rate": 8.144376025742089e-06, "loss": 2.999248352050781, "step": 469500 }, { "epoch": 0.5666349623786844, "learning_rate": 8.143972190274351e-06, "loss": 2.952983093261719, "step": 469600 }, { "epoch": 0.566755625701167, "learning_rate": 8.143568354806613e-06, "loss": 2.973188781738281, "step": 469700 }, { "epoch": 0.5668762890236497, "learning_rate": 8.143164519338873e-06, "loss": 2.991272277832031, "step": 469800 }, { "epoch": 0.5669969523461323, "learning_rate": 8.142760683871135e-06, "loss": 2.96271240234375, "step": 469900 }, { "epoch": 0.5671176156686151, "learning_rate": 8.142356848403397e-06, "loss": 2.9962982177734374, "step": 470000 }, { "epoch": 0.5672382789910978, "learning_rate": 8.141953012935658e-06, "loss": 2.9819561767578127, "step": 470100 }, { "epoch": 0.5673589423135804, "learning_rate": 8.14154917746792e-06, "loss": 3.0018905639648437, "step": 470200 }, { "epoch": 0.5674796056360631, "learning_rate": 8.141145342000181e-06, "loss": 2.9827496337890627, "step": 470300 }, { "epoch": 0.5676002689585458, "learning_rate": 8.140741506532443e-06, "loss": 2.9602642822265626, "step": 470400 }, { "epoch": 0.5677209322810285, "learning_rate": 8.140337671064705e-06, "loss": 2.9945339965820312, "step": 470500 }, { "epoch": 0.5678415956035112, "learning_rate": 8.139933835596966e-06, "loss": 2.9567803955078125, "step": 470600 }, { "epoch": 0.5679622589259938, "learning_rate": 8.139530000129228e-06, "loss": 2.9850918579101564, "step": 470700 }, { "epoch": 0.5680829222484766, "learning_rate": 8.13912616466149e-06, "loss": 2.9919552612304687, "step": 470800 }, { "epoch": 0.5682035855709592, "learning_rate": 8.138722329193752e-06, "loss": 3.0009429931640623, "step": 470900 }, { "epoch": 0.5683242488934419, "learning_rate": 8.138318493726014e-06, "loss": 2.999633483886719, "step": 471000 }, { "epoch": 0.5684449122159246, "learning_rate": 8.137914658258274e-06, "loss": 2.994955749511719, "step": 471100 }, { "epoch": 0.5685655755384073, "learning_rate": 8.137510822790536e-06, "loss": 2.9888763427734375, "step": 471200 }, { "epoch": 0.56868623886089, "learning_rate": 8.137106987322798e-06, "loss": 2.994425964355469, "step": 471300 }, { "epoch": 0.5688069021833727, "learning_rate": 8.136703151855058e-06, "loss": 2.98322509765625, "step": 471400 }, { "epoch": 0.5689275655058553, "learning_rate": 8.13629931638732e-06, "loss": 2.9915762329101563, "step": 471500 }, { "epoch": 0.569048228828338, "learning_rate": 8.135895480919582e-06, "loss": 2.9823672485351564, "step": 471600 }, { "epoch": 0.5691688921508207, "learning_rate": 8.135491645451844e-06, "loss": 2.996954345703125, "step": 471700 }, { "epoch": 0.5692895554733034, "learning_rate": 8.135087809984106e-06, "loss": 2.9538153076171874, "step": 471800 }, { "epoch": 0.5694102187957861, "learning_rate": 8.134683974516368e-06, "loss": 2.9856658935546876, "step": 471900 }, { "epoch": 0.5695308821182687, "learning_rate": 8.134280139048628e-06, "loss": 2.98936279296875, "step": 472000 }, { "epoch": 0.5696515454407515, "learning_rate": 8.13387630358089e-06, "loss": 2.9860760498046877, "step": 472100 }, { "epoch": 0.5697722087632341, "learning_rate": 8.133472468113152e-06, "loss": 2.953877258300781, "step": 472200 }, { "epoch": 0.5698928720857168, "learning_rate": 8.133068632645413e-06, "loss": 2.9647430419921874, "step": 472300 }, { "epoch": 0.5700135354081995, "learning_rate": 8.132664797177675e-06, "loss": 2.9823434448242185, "step": 472400 }, { "epoch": 0.5701341987306822, "learning_rate": 8.132260961709937e-06, "loss": 2.963651428222656, "step": 472500 }, { "epoch": 0.5702548620531649, "learning_rate": 8.131857126242199e-06, "loss": 2.985428771972656, "step": 472600 }, { "epoch": 0.5703755253756475, "learning_rate": 8.13145329077446e-06, "loss": 2.963888854980469, "step": 472700 }, { "epoch": 0.5704961886981302, "learning_rate": 8.131049455306723e-06, "loss": 2.9848248291015627, "step": 472800 }, { "epoch": 0.570616852020613, "learning_rate": 8.130645619838985e-06, "loss": 2.960509948730469, "step": 472900 }, { "epoch": 0.5707375153430956, "learning_rate": 8.130241784371245e-06, "loss": 2.9915228271484375, "step": 473000 }, { "epoch": 0.5708581786655783, "learning_rate": 8.129837948903507e-06, "loss": 2.974735107421875, "step": 473100 }, { "epoch": 0.5709788419880609, "learning_rate": 8.129434113435767e-06, "loss": 2.97484375, "step": 473200 }, { "epoch": 0.5710995053105437, "learning_rate": 8.129030277968029e-06, "loss": 2.9823483276367186, "step": 473300 }, { "epoch": 0.5712201686330264, "learning_rate": 8.128626442500291e-06, "loss": 2.9506890869140623, "step": 473400 }, { "epoch": 0.571340831955509, "learning_rate": 8.128222607032553e-06, "loss": 2.9802865600585937, "step": 473500 }, { "epoch": 0.5714614952779917, "learning_rate": 8.127818771564815e-06, "loss": 2.993403015136719, "step": 473600 }, { "epoch": 0.5715821586004743, "learning_rate": 8.127414936097077e-06, "loss": 2.9807058715820314, "step": 473700 }, { "epoch": 0.5717028219229571, "learning_rate": 8.127011100629339e-06, "loss": 2.987046203613281, "step": 473800 }, { "epoch": 0.5718234852454398, "learning_rate": 8.1266072651616e-06, "loss": 2.991500244140625, "step": 473900 }, { "epoch": 0.5719441485679224, "learning_rate": 8.126203429693861e-06, "loss": 2.977865905761719, "step": 474000 }, { "epoch": 0.5720648118904051, "learning_rate": 8.125799594226123e-06, "loss": 2.9773330688476562, "step": 474100 }, { "epoch": 0.5721854752128878, "learning_rate": 8.125395758758384e-06, "loss": 2.970625915527344, "step": 474200 }, { "epoch": 0.5723061385353705, "learning_rate": 8.124991923290646e-06, "loss": 2.999735107421875, "step": 474300 }, { "epoch": 0.5724268018578532, "learning_rate": 8.124588087822908e-06, "loss": 3.0177960205078125, "step": 474400 }, { "epoch": 0.5725474651803358, "learning_rate": 8.12418425235517e-06, "loss": 2.975946044921875, "step": 474500 }, { "epoch": 0.5726681285028186, "learning_rate": 8.123780416887431e-06, "loss": 2.9703582763671874, "step": 474600 }, { "epoch": 0.5727887918253012, "learning_rate": 8.123376581419692e-06, "loss": 2.9667718505859373, "step": 474700 }, { "epoch": 0.5729094551477839, "learning_rate": 8.122972745951954e-06, "loss": 2.9742330932617187, "step": 474800 }, { "epoch": 0.5730301184702666, "learning_rate": 8.122568910484216e-06, "loss": 2.947726135253906, "step": 474900 }, { "epoch": 0.5731507817927493, "learning_rate": 8.122165075016478e-06, "loss": 2.9807330322265626, "step": 475000 }, { "epoch": 0.573271445115232, "learning_rate": 8.121761239548738e-06, "loss": 2.9854776000976564, "step": 475100 }, { "epoch": 0.5733921084377146, "learning_rate": 8.121357404081e-06, "loss": 2.954489440917969, "step": 475200 }, { "epoch": 0.5735127717601973, "learning_rate": 8.120953568613262e-06, "loss": 2.9779437255859373, "step": 475300 }, { "epoch": 0.57363343508268, "learning_rate": 8.120549733145524e-06, "loss": 2.9832638549804686, "step": 475400 }, { "epoch": 0.5737540984051627, "learning_rate": 8.120145897677784e-06, "loss": 2.9620635986328123, "step": 475500 }, { "epoch": 0.5738747617276454, "learning_rate": 8.119742062210046e-06, "loss": 2.987445983886719, "step": 475600 }, { "epoch": 0.573995425050128, "learning_rate": 8.119338226742308e-06, "loss": 2.9681301879882813, "step": 475700 }, { "epoch": 0.5741160883726107, "learning_rate": 8.11893439127457e-06, "loss": 2.9592779541015624, "step": 475800 }, { "epoch": 0.5742367516950935, "learning_rate": 8.118530555806832e-06, "loss": 2.9818679809570314, "step": 475900 }, { "epoch": 0.5743574150175761, "learning_rate": 8.118126720339094e-06, "loss": 3.0136920166015626, "step": 476000 }, { "epoch": 0.5744780783400588, "learning_rate": 8.117722884871354e-06, "loss": 2.9860235595703126, "step": 476100 }, { "epoch": 0.5745987416625414, "learning_rate": 8.117319049403616e-06, "loss": 2.96761962890625, "step": 476200 }, { "epoch": 0.5747194049850242, "learning_rate": 8.116915213935877e-06, "loss": 2.9663983154296876, "step": 476300 }, { "epoch": 0.5748400683075069, "learning_rate": 8.116511378468139e-06, "loss": 2.9492767333984373, "step": 476400 }, { "epoch": 0.5749607316299895, "learning_rate": 8.1161075430004e-06, "loss": 2.986912841796875, "step": 476500 }, { "epoch": 0.5750813949524722, "learning_rate": 8.115703707532663e-06, "loss": 2.9770361328125, "step": 476600 }, { "epoch": 0.575202058274955, "learning_rate": 8.115299872064925e-06, "loss": 2.9979034423828126, "step": 476700 }, { "epoch": 0.5753227215974376, "learning_rate": 8.114896036597187e-06, "loss": 2.969718017578125, "step": 476800 }, { "epoch": 0.5754433849199203, "learning_rate": 8.114492201129449e-06, "loss": 2.981287841796875, "step": 476900 }, { "epoch": 0.5755640482424029, "learning_rate": 8.11408836566171e-06, "loss": 2.987734680175781, "step": 477000 }, { "epoch": 0.5756847115648857, "learning_rate": 8.113684530193971e-06, "loss": 2.979698486328125, "step": 477100 }, { "epoch": 0.5758053748873684, "learning_rate": 8.113280694726233e-06, "loss": 2.964830017089844, "step": 477200 }, { "epoch": 0.575926038209851, "learning_rate": 8.112876859258493e-06, "loss": 2.9503338623046873, "step": 477300 }, { "epoch": 0.5760467015323337, "learning_rate": 8.112473023790755e-06, "loss": 2.9733847045898436, "step": 477400 }, { "epoch": 0.5761673648548163, "learning_rate": 8.112069188323017e-06, "loss": 2.9585009765625, "step": 477500 }, { "epoch": 0.5762880281772991, "learning_rate": 8.111665352855279e-06, "loss": 2.9824008178710937, "step": 477600 }, { "epoch": 0.5764086914997818, "learning_rate": 8.111261517387541e-06, "loss": 2.9772378540039064, "step": 477700 }, { "epoch": 0.5765293548222644, "learning_rate": 8.110857681919803e-06, "loss": 2.9740951538085936, "step": 477800 }, { "epoch": 0.5766500181447471, "learning_rate": 8.110453846452063e-06, "loss": 2.993214111328125, "step": 477900 }, { "epoch": 0.5767706814672298, "learning_rate": 8.110050010984325e-06, "loss": 2.977830810546875, "step": 478000 }, { "epoch": 0.5768913447897125, "learning_rate": 8.109646175516587e-06, "loss": 2.972706604003906, "step": 478100 }, { "epoch": 0.5770120081121952, "learning_rate": 8.10924234004885e-06, "loss": 2.981258544921875, "step": 478200 }, { "epoch": 0.5771326714346778, "learning_rate": 8.10883850458111e-06, "loss": 2.9657022094726564, "step": 478300 }, { "epoch": 0.5772533347571606, "learning_rate": 8.108434669113372e-06, "loss": 2.989014892578125, "step": 478400 }, { "epoch": 0.5773739980796432, "learning_rate": 8.108030833645634e-06, "loss": 2.974716796875, "step": 478500 }, { "epoch": 0.5774946614021259, "learning_rate": 8.107626998177896e-06, "loss": 2.9836196899414062, "step": 478600 }, { "epoch": 0.5776153247246086, "learning_rate": 8.107223162710158e-06, "loss": 2.9681552124023436, "step": 478700 }, { "epoch": 0.5777359880470913, "learning_rate": 8.106819327242418e-06, "loss": 3.008946838378906, "step": 478800 }, { "epoch": 0.577856651369574, "learning_rate": 8.10641549177468e-06, "loss": 2.9639816284179688, "step": 478900 }, { "epoch": 0.5779773146920566, "learning_rate": 8.106011656306942e-06, "loss": 2.9923004150390624, "step": 479000 }, { "epoch": 0.5780979780145393, "learning_rate": 8.105607820839204e-06, "loss": 2.9615414428710936, "step": 479100 }, { "epoch": 0.578218641337022, "learning_rate": 8.105203985371464e-06, "loss": 2.9481521606445313, "step": 479200 }, { "epoch": 0.5783393046595047, "learning_rate": 8.104800149903726e-06, "loss": 2.965667724609375, "step": 479300 }, { "epoch": 0.5784599679819874, "learning_rate": 8.104396314435988e-06, "loss": 2.981436462402344, "step": 479400 }, { "epoch": 0.57858063130447, "learning_rate": 8.10399247896825e-06, "loss": 2.9828228759765625, "step": 479500 }, { "epoch": 0.5787012946269527, "learning_rate": 8.10358864350051e-06, "loss": 2.96062744140625, "step": 479600 }, { "epoch": 0.5788219579494355, "learning_rate": 8.103184808032772e-06, "loss": 2.956165771484375, "step": 479700 }, { "epoch": 0.5789426212719181, "learning_rate": 8.102780972565034e-06, "loss": 2.9961224365234376, "step": 479800 }, { "epoch": 0.5790632845944008, "learning_rate": 8.102377137097296e-06, "loss": 2.9412493896484375, "step": 479900 }, { "epoch": 0.5791839479168834, "learning_rate": 8.101973301629558e-06, "loss": 2.9621832275390627, "step": 480000 }, { "epoch": 0.5793046112393662, "learning_rate": 8.10156946616182e-06, "loss": 2.9854931640625, "step": 480100 }, { "epoch": 0.5794252745618489, "learning_rate": 8.10116563069408e-06, "loss": 2.9970028686523436, "step": 480200 }, { "epoch": 0.5795459378843315, "learning_rate": 8.100761795226342e-06, "loss": 2.9552850341796875, "step": 480300 }, { "epoch": 0.5796666012068142, "learning_rate": 8.100357959758603e-06, "loss": 2.9902328491210937, "step": 480400 }, { "epoch": 0.5797872645292969, "learning_rate": 8.099954124290865e-06, "loss": 2.961526184082031, "step": 480500 }, { "epoch": 0.5799079278517796, "learning_rate": 8.099550288823127e-06, "loss": 2.9639349365234375, "step": 480600 }, { "epoch": 0.5800285911742623, "learning_rate": 8.099146453355389e-06, "loss": 2.966573486328125, "step": 480700 }, { "epoch": 0.5801492544967449, "learning_rate": 8.09874261788765e-06, "loss": 2.9636276245117186, "step": 480800 }, { "epoch": 0.5802699178192277, "learning_rate": 8.098338782419913e-06, "loss": 2.952803649902344, "step": 480900 }, { "epoch": 0.5803905811417103, "learning_rate": 8.097934946952175e-06, "loss": 2.9921038818359373, "step": 481000 }, { "epoch": 0.580511244464193, "learning_rate": 8.097531111484435e-06, "loss": 2.9870700073242187, "step": 481100 }, { "epoch": 0.5806319077866757, "learning_rate": 8.097127276016697e-06, "loss": 2.9667413330078123, "step": 481200 }, { "epoch": 0.5807525711091583, "learning_rate": 8.096723440548959e-06, "loss": 2.9679583740234374, "step": 481300 }, { "epoch": 0.5808732344316411, "learning_rate": 8.09631960508122e-06, "loss": 2.97364990234375, "step": 481400 }, { "epoch": 0.5809938977541237, "learning_rate": 8.095915769613481e-06, "loss": 2.98238037109375, "step": 481500 }, { "epoch": 0.5811145610766064, "learning_rate": 8.095511934145743e-06, "loss": 2.977811279296875, "step": 481600 }, { "epoch": 0.5812352243990891, "learning_rate": 8.095108098678005e-06, "loss": 2.983026428222656, "step": 481700 }, { "epoch": 0.5813558877215718, "learning_rate": 8.094704263210267e-06, "loss": 2.982837829589844, "step": 481800 }, { "epoch": 0.5814765510440545, "learning_rate": 8.094300427742529e-06, "loss": 2.9884658813476563, "step": 481900 }, { "epoch": 0.5815972143665372, "learning_rate": 8.09389659227479e-06, "loss": 2.9661550903320313, "step": 482000 }, { "epoch": 0.5817178776890198, "learning_rate": 8.093492756807051e-06, "loss": 2.973033752441406, "step": 482100 }, { "epoch": 0.5818385410115026, "learning_rate": 8.093088921339313e-06, "loss": 2.973619384765625, "step": 482200 }, { "epoch": 0.5819592043339852, "learning_rate": 8.092685085871574e-06, "loss": 2.9707208251953126, "step": 482300 }, { "epoch": 0.5820798676564679, "learning_rate": 8.092281250403836e-06, "loss": 2.9651748657226564, "step": 482400 }, { "epoch": 0.5822005309789506, "learning_rate": 8.091877414936098e-06, "loss": 2.949432678222656, "step": 482500 }, { "epoch": 0.5823211943014333, "learning_rate": 8.09147357946836e-06, "loss": 2.9793191528320313, "step": 482600 }, { "epoch": 0.582441857623916, "learning_rate": 8.091069744000622e-06, "loss": 2.9813580322265625, "step": 482700 }, { "epoch": 0.5825625209463986, "learning_rate": 8.090665908532882e-06, "loss": 2.961824951171875, "step": 482800 }, { "epoch": 0.5826831842688813, "learning_rate": 8.090262073065144e-06, "loss": 2.9605416870117187, "step": 482900 }, { "epoch": 0.582803847591364, "learning_rate": 8.089858237597406e-06, "loss": 2.952781066894531, "step": 483000 }, { "epoch": 0.5829245109138467, "learning_rate": 8.089454402129668e-06, "loss": 2.9838186645507814, "step": 483100 }, { "epoch": 0.5830451742363294, "learning_rate": 8.08905056666193e-06, "loss": 2.982503662109375, "step": 483200 }, { "epoch": 0.583165837558812, "learning_rate": 8.08864673119419e-06, "loss": 2.9656787109375, "step": 483300 }, { "epoch": 0.5832865008812947, "learning_rate": 8.088242895726452e-06, "loss": 2.9740997314453126, "step": 483400 }, { "epoch": 0.5834071642037775, "learning_rate": 8.087839060258714e-06, "loss": 2.984513854980469, "step": 483500 }, { "epoch": 0.5835278275262601, "learning_rate": 8.087435224790974e-06, "loss": 2.9776446533203127, "step": 483600 }, { "epoch": 0.5836484908487428, "learning_rate": 8.087031389323236e-06, "loss": 2.9530511474609376, "step": 483700 }, { "epoch": 0.5837691541712254, "learning_rate": 8.086627553855498e-06, "loss": 2.9732745361328123, "step": 483800 }, { "epoch": 0.5838898174937082, "learning_rate": 8.08622371838776e-06, "loss": 2.9666485595703125, "step": 483900 }, { "epoch": 0.5840104808161909, "learning_rate": 8.085819882920022e-06, "loss": 2.9661984252929687, "step": 484000 }, { "epoch": 0.5841311441386735, "learning_rate": 8.085416047452284e-06, "loss": 2.9630029296875, "step": 484100 }, { "epoch": 0.5842518074611562, "learning_rate": 8.085012211984545e-06, "loss": 2.9773654174804687, "step": 484200 }, { "epoch": 0.5843724707836389, "learning_rate": 8.084608376516807e-06, "loss": 2.96956298828125, "step": 484300 }, { "epoch": 0.5844931341061216, "learning_rate": 8.084204541049069e-06, "loss": 2.9580194091796876, "step": 484400 }, { "epoch": 0.5846137974286043, "learning_rate": 8.083800705581329e-06, "loss": 2.9955279541015627, "step": 484500 }, { "epoch": 0.5847344607510869, "learning_rate": 8.08339687011359e-06, "loss": 2.9667892456054688, "step": 484600 }, { "epoch": 0.5848551240735697, "learning_rate": 8.082993034645853e-06, "loss": 2.9837551879882813, "step": 484700 }, { "epoch": 0.5849757873960523, "learning_rate": 8.082589199178115e-06, "loss": 2.9466522216796873, "step": 484800 }, { "epoch": 0.585096450718535, "learning_rate": 8.082185363710377e-06, "loss": 2.9726937866210936, "step": 484900 }, { "epoch": 0.5852171140410177, "learning_rate": 8.081781528242639e-06, "loss": 2.9689227294921876, "step": 485000 }, { "epoch": 0.5853377773635003, "learning_rate": 8.0813776927749e-06, "loss": 2.944732971191406, "step": 485100 }, { "epoch": 0.5854584406859831, "learning_rate": 8.080973857307161e-06, "loss": 2.9782815551757813, "step": 485200 }, { "epoch": 0.5855791040084657, "learning_rate": 8.080570021839423e-06, "loss": 2.9612307739257813, "step": 485300 }, { "epoch": 0.5856997673309484, "learning_rate": 8.080166186371683e-06, "loss": 2.940147705078125, "step": 485400 }, { "epoch": 0.5858204306534311, "learning_rate": 8.079762350903945e-06, "loss": 2.9731491088867186, "step": 485500 }, { "epoch": 0.5859410939759138, "learning_rate": 8.079358515436207e-06, "loss": 2.9864181518554687, "step": 485600 }, { "epoch": 0.5860617572983965, "learning_rate": 8.07895467996847e-06, "loss": 2.982764892578125, "step": 485700 }, { "epoch": 0.5861824206208791, "learning_rate": 8.078550844500731e-06, "loss": 2.941102294921875, "step": 485800 }, { "epoch": 0.5863030839433618, "learning_rate": 8.078147009032993e-06, "loss": 2.9511947631835938, "step": 485900 }, { "epoch": 0.5864237472658446, "learning_rate": 8.077743173565255e-06, "loss": 2.9434832763671874, "step": 486000 }, { "epoch": 0.5865444105883272, "learning_rate": 8.077339338097515e-06, "loss": 2.9721939086914064, "step": 486100 }, { "epoch": 0.5866650739108099, "learning_rate": 8.076935502629777e-06, "loss": 2.963254699707031, "step": 486200 }, { "epoch": 0.5867857372332925, "learning_rate": 8.07653166716204e-06, "loss": 2.9630078125, "step": 486300 }, { "epoch": 0.5869064005557753, "learning_rate": 8.0761278316943e-06, "loss": 2.9865576171875, "step": 486400 }, { "epoch": 0.587027063878258, "learning_rate": 8.075723996226562e-06, "loss": 2.9787857055664064, "step": 486500 }, { "epoch": 0.5871477272007406, "learning_rate": 8.075320160758824e-06, "loss": 2.9784112548828126, "step": 486600 }, { "epoch": 0.5872683905232233, "learning_rate": 8.074916325291086e-06, "loss": 2.9550482177734376, "step": 486700 }, { "epoch": 0.587389053845706, "learning_rate": 8.074512489823348e-06, "loss": 2.967176818847656, "step": 486800 }, { "epoch": 0.5875097171681887, "learning_rate": 8.074108654355608e-06, "loss": 2.9666311645507815, "step": 486900 }, { "epoch": 0.5876303804906714, "learning_rate": 8.07370481888787e-06, "loss": 2.939674072265625, "step": 487000 }, { "epoch": 0.587751043813154, "learning_rate": 8.073300983420132e-06, "loss": 2.9351376342773436, "step": 487100 }, { "epoch": 0.5878717071356367, "learning_rate": 8.072897147952394e-06, "loss": 2.9677545166015626, "step": 487200 }, { "epoch": 0.5879923704581195, "learning_rate": 8.072493312484654e-06, "loss": 2.9541204833984374, "step": 487300 }, { "epoch": 0.5881130337806021, "learning_rate": 8.072089477016916e-06, "loss": 2.957548828125, "step": 487400 }, { "epoch": 0.5882336971030848, "learning_rate": 8.071685641549178e-06, "loss": 2.9496249389648437, "step": 487500 }, { "epoch": 0.5883543604255674, "learning_rate": 8.07128180608144e-06, "loss": 2.9719998168945314, "step": 487600 }, { "epoch": 0.5884750237480502, "learning_rate": 8.0708779706137e-06, "loss": 2.9489666748046877, "step": 487700 }, { "epoch": 0.5885956870705329, "learning_rate": 8.070474135145962e-06, "loss": 2.9749627685546876, "step": 487800 }, { "epoch": 0.5887163503930155, "learning_rate": 8.070070299678224e-06, "loss": 2.96795166015625, "step": 487900 }, { "epoch": 0.5888370137154982, "learning_rate": 8.069666464210486e-06, "loss": 2.968385009765625, "step": 488000 }, { "epoch": 0.5889576770379809, "learning_rate": 8.069262628742748e-06, "loss": 2.9446173095703125, "step": 488100 }, { "epoch": 0.5890783403604636, "learning_rate": 8.06885879327501e-06, "loss": 2.942460632324219, "step": 488200 }, { "epoch": 0.5891990036829463, "learning_rate": 8.06845495780727e-06, "loss": 2.9851751708984375, "step": 488300 }, { "epoch": 0.5893196670054289, "learning_rate": 8.068051122339533e-06, "loss": 2.988564453125, "step": 488400 }, { "epoch": 0.5894403303279117, "learning_rate": 8.067647286871793e-06, "loss": 2.958942565917969, "step": 488500 }, { "epoch": 0.5895609936503943, "learning_rate": 8.067243451404055e-06, "loss": 2.9633984375, "step": 488600 }, { "epoch": 0.589681656972877, "learning_rate": 8.066839615936317e-06, "loss": 2.9610614013671874, "step": 488700 }, { "epoch": 0.5898023202953597, "learning_rate": 8.066435780468579e-06, "loss": 2.9576141357421877, "step": 488800 }, { "epoch": 0.5899229836178423, "learning_rate": 8.06603194500084e-06, "loss": 2.9549810791015627, "step": 488900 }, { "epoch": 0.5900436469403251, "learning_rate": 8.065628109533103e-06, "loss": 2.9668426513671875, "step": 489000 }, { "epoch": 0.5901643102628077, "learning_rate": 8.065224274065365e-06, "loss": 2.9712603759765623, "step": 489100 }, { "epoch": 0.5902849735852904, "learning_rate": 8.064820438597625e-06, "loss": 2.960770263671875, "step": 489200 }, { "epoch": 0.5904056369077731, "learning_rate": 8.064416603129887e-06, "loss": 2.9565350341796877, "step": 489300 }, { "epoch": 0.5905263002302558, "learning_rate": 8.064012767662149e-06, "loss": 2.9616189575195313, "step": 489400 }, { "epoch": 0.5906469635527385, "learning_rate": 8.06360893219441e-06, "loss": 2.97448974609375, "step": 489500 }, { "epoch": 0.5907676268752211, "learning_rate": 8.063205096726671e-06, "loss": 2.9743618774414062, "step": 489600 }, { "epoch": 0.5908882901977038, "learning_rate": 8.062801261258933e-06, "loss": 2.9766690063476564, "step": 489700 }, { "epoch": 0.5910089535201866, "learning_rate": 8.062397425791195e-06, "loss": 2.9721905517578127, "step": 489800 }, { "epoch": 0.5911296168426692, "learning_rate": 8.061993590323457e-06, "loss": 2.9808489990234377, "step": 489900 }, { "epoch": 0.5912502801651519, "learning_rate": 8.06158975485572e-06, "loss": 2.945633544921875, "step": 490000 }, { "epoch": 0.5913709434876345, "learning_rate": 8.061185919387981e-06, "loss": 2.958897705078125, "step": 490100 }, { "epoch": 0.5914916068101173, "learning_rate": 8.060782083920241e-06, "loss": 2.9526596069335938, "step": 490200 }, { "epoch": 0.5916122701326, "learning_rate": 8.060378248452503e-06, "loss": 2.95847900390625, "step": 490300 }, { "epoch": 0.5917329334550826, "learning_rate": 8.059974412984764e-06, "loss": 2.9596591186523438, "step": 490400 }, { "epoch": 0.5918535967775653, "learning_rate": 8.059570577517026e-06, "loss": 2.944175109863281, "step": 490500 }, { "epoch": 0.5919742601000479, "learning_rate": 8.059166742049288e-06, "loss": 2.9776235961914064, "step": 490600 }, { "epoch": 0.5920949234225307, "learning_rate": 8.05876290658155e-06, "loss": 2.960718688964844, "step": 490700 }, { "epoch": 0.5922155867450134, "learning_rate": 8.058359071113812e-06, "loss": 2.976762390136719, "step": 490800 }, { "epoch": 0.592336250067496, "learning_rate": 8.057955235646074e-06, "loss": 2.96544677734375, "step": 490900 }, { "epoch": 0.5924569133899787, "learning_rate": 8.057551400178334e-06, "loss": 2.9486407470703124, "step": 491000 }, { "epoch": 0.5925775767124614, "learning_rate": 8.057147564710596e-06, "loss": 2.938033447265625, "step": 491100 }, { "epoch": 0.5926982400349441, "learning_rate": 8.056743729242858e-06, "loss": 2.949468688964844, "step": 491200 }, { "epoch": 0.5928189033574268, "learning_rate": 8.05633989377512e-06, "loss": 2.925229797363281, "step": 491300 }, { "epoch": 0.5929395666799094, "learning_rate": 8.05593605830738e-06, "loss": 2.943150939941406, "step": 491400 }, { "epoch": 0.5930602300023922, "learning_rate": 8.055532222839642e-06, "loss": 2.9539303588867187, "step": 491500 }, { "epoch": 0.5931808933248748, "learning_rate": 8.055128387371904e-06, "loss": 2.9391903686523437, "step": 491600 }, { "epoch": 0.5933015566473575, "learning_rate": 8.054724551904166e-06, "loss": 2.9569131469726564, "step": 491700 }, { "epoch": 0.5934222199698402, "learning_rate": 8.054320716436426e-06, "loss": 2.966691589355469, "step": 491800 }, { "epoch": 0.5935428832923229, "learning_rate": 8.053916880968688e-06, "loss": 2.988161926269531, "step": 491900 }, { "epoch": 0.5936635466148056, "learning_rate": 8.05351304550095e-06, "loss": 2.943126525878906, "step": 492000 }, { "epoch": 0.5937842099372883, "learning_rate": 8.053109210033212e-06, "loss": 2.9560235595703124, "step": 492100 }, { "epoch": 0.5939048732597709, "learning_rate": 8.052705374565474e-06, "loss": 2.952505798339844, "step": 492200 }, { "epoch": 0.5940255365822537, "learning_rate": 8.052301539097736e-06, "loss": 2.96342529296875, "step": 492300 }, { "epoch": 0.5941461999047363, "learning_rate": 8.051897703629997e-06, "loss": 2.9526077270507813, "step": 492400 }, { "epoch": 0.594266863227219, "learning_rate": 8.051493868162259e-06, "loss": 2.992037048339844, "step": 492500 }, { "epoch": 0.5943875265497017, "learning_rate": 8.051090032694519e-06, "loss": 2.9615869140625, "step": 492600 }, { "epoch": 0.5945081898721843, "learning_rate": 8.050686197226781e-06, "loss": 2.97475830078125, "step": 492700 }, { "epoch": 0.5946288531946671, "learning_rate": 8.050282361759043e-06, "loss": 2.9530374145507814, "step": 492800 }, { "epoch": 0.5947495165171497, "learning_rate": 8.049878526291305e-06, "loss": 2.95875732421875, "step": 492900 }, { "epoch": 0.5948701798396324, "learning_rate": 8.049474690823567e-06, "loss": 2.9713275146484377, "step": 493000 }, { "epoch": 0.5949908431621151, "learning_rate": 8.049070855355829e-06, "loss": 2.9611590576171873, "step": 493100 }, { "epoch": 0.5951115064845978, "learning_rate": 8.04866701988809e-06, "loss": 2.96239013671875, "step": 493200 }, { "epoch": 0.5952321698070805, "learning_rate": 8.048263184420351e-06, "loss": 2.9204086303710937, "step": 493300 }, { "epoch": 0.5953528331295631, "learning_rate": 8.047859348952613e-06, "loss": 2.963445129394531, "step": 493400 }, { "epoch": 0.5954734964520458, "learning_rate": 8.047455513484875e-06, "loss": 2.952359924316406, "step": 493500 }, { "epoch": 0.5955941597745286, "learning_rate": 8.047051678017135e-06, "loss": 2.947237243652344, "step": 493600 }, { "epoch": 0.5957148230970112, "learning_rate": 8.046647842549397e-06, "loss": 2.94197021484375, "step": 493700 }, { "epoch": 0.5958354864194939, "learning_rate": 8.04624400708166e-06, "loss": 2.962818603515625, "step": 493800 }, { "epoch": 0.5959561497419765, "learning_rate": 8.045840171613921e-06, "loss": 2.9547216796875, "step": 493900 }, { "epoch": 0.5960768130644593, "learning_rate": 8.045436336146183e-06, "loss": 2.9487380981445312, "step": 494000 }, { "epoch": 0.596197476386942, "learning_rate": 8.045032500678445e-06, "loss": 2.9525277709960935, "step": 494100 }, { "epoch": 0.5963181397094246, "learning_rate": 8.044628665210707e-06, "loss": 2.9557479858398437, "step": 494200 }, { "epoch": 0.5964388030319073, "learning_rate": 8.044224829742967e-06, "loss": 2.96691650390625, "step": 494300 }, { "epoch": 0.59655946635439, "learning_rate": 8.04382099427523e-06, "loss": 2.9398138427734377, "step": 494400 }, { "epoch": 0.5966801296768727, "learning_rate": 8.04341715880749e-06, "loss": 2.93875732421875, "step": 494500 }, { "epoch": 0.5968007929993554, "learning_rate": 8.043013323339752e-06, "loss": 2.964020080566406, "step": 494600 }, { "epoch": 0.596921456321838, "learning_rate": 8.042609487872014e-06, "loss": 2.9571539306640626, "step": 494700 }, { "epoch": 0.5970421196443207, "learning_rate": 8.042205652404276e-06, "loss": 2.975044860839844, "step": 494800 }, { "epoch": 0.5971627829668034, "learning_rate": 8.041801816936538e-06, "loss": 2.965111083984375, "step": 494900 }, { "epoch": 0.5972834462892861, "learning_rate": 8.0413979814688e-06, "loss": 2.9459494018554686, "step": 495000 }, { "epoch": 0.5974041096117688, "learning_rate": 8.04099414600106e-06, "loss": 2.9387896728515623, "step": 495100 }, { "epoch": 0.5975247729342514, "learning_rate": 8.040590310533322e-06, "loss": 2.9479049682617187, "step": 495200 }, { "epoch": 0.5976454362567342, "learning_rate": 8.040186475065584e-06, "loss": 2.9441293334960936, "step": 495300 }, { "epoch": 0.5977660995792168, "learning_rate": 8.039782639597846e-06, "loss": 2.9364984130859373, "step": 495400 }, { "epoch": 0.5978867629016995, "learning_rate": 8.039378804130106e-06, "loss": 2.920135803222656, "step": 495500 }, { "epoch": 0.5980074262241822, "learning_rate": 8.038974968662368e-06, "loss": 2.9691693115234377, "step": 495600 }, { "epoch": 0.5981280895466649, "learning_rate": 8.03857113319463e-06, "loss": 2.9268438720703127, "step": 495700 }, { "epoch": 0.5982487528691476, "learning_rate": 8.038167297726892e-06, "loss": 2.954842834472656, "step": 495800 }, { "epoch": 0.5983694161916302, "learning_rate": 8.037763462259152e-06, "loss": 2.9568231201171873, "step": 495900 }, { "epoch": 0.5984900795141129, "learning_rate": 8.037359626791414e-06, "loss": 2.9504180908203126, "step": 496000 }, { "epoch": 0.5986107428365957, "learning_rate": 8.036955791323676e-06, "loss": 2.93613525390625, "step": 496100 }, { "epoch": 0.5987314061590783, "learning_rate": 8.036551955855938e-06, "loss": 2.949007568359375, "step": 496200 }, { "epoch": 0.598852069481561, "learning_rate": 8.0361481203882e-06, "loss": 2.962759704589844, "step": 496300 }, { "epoch": 0.5989727328040436, "learning_rate": 8.03574428492046e-06, "loss": 2.958729553222656, "step": 496400 }, { "epoch": 0.5990933961265263, "learning_rate": 8.035340449452723e-06, "loss": 2.9451922607421874, "step": 496500 }, { "epoch": 0.5992140594490091, "learning_rate": 8.034936613984985e-06, "loss": 2.956802978515625, "step": 496600 }, { "epoch": 0.5993347227714917, "learning_rate": 8.034532778517245e-06, "loss": 2.9515606689453127, "step": 496700 }, { "epoch": 0.5994553860939744, "learning_rate": 8.034128943049507e-06, "loss": 2.962585144042969, "step": 496800 }, { "epoch": 0.599576049416457, "learning_rate": 8.033725107581769e-06, "loss": 2.9377703857421875, "step": 496900 }, { "epoch": 0.5996967127389398, "learning_rate": 8.033321272114031e-06, "loss": 2.9345822143554687, "step": 497000 }, { "epoch": 0.5998173760614225, "learning_rate": 8.032917436646293e-06, "loss": 2.9454769897460937, "step": 497100 }, { "epoch": 0.5999380393839051, "learning_rate": 8.032513601178555e-06, "loss": 2.972662353515625, "step": 497200 }, { "epoch": 0.6000587027063878, "learning_rate": 8.032109765710817e-06, "loss": 2.954279479980469, "step": 497300 }, { "epoch": 0.6001793660288706, "learning_rate": 8.031705930243077e-06, "loss": 2.928613586425781, "step": 497400 }, { "epoch": 0.6003000293513532, "learning_rate": 8.031302094775339e-06, "loss": 2.937383728027344, "step": 497500 }, { "epoch": 0.6004206926738359, "learning_rate": 8.0308982593076e-06, "loss": 2.954742736816406, "step": 497600 }, { "epoch": 0.6005413559963185, "learning_rate": 8.030494423839861e-06, "loss": 2.9312362670898438, "step": 497700 }, { "epoch": 0.6006620193188013, "learning_rate": 8.030090588372123e-06, "loss": 2.9541384887695314, "step": 497800 }, { "epoch": 0.600782682641284, "learning_rate": 8.029686752904385e-06, "loss": 2.959463806152344, "step": 497900 }, { "epoch": 0.6009033459637666, "learning_rate": 8.029282917436647e-06, "loss": 2.927001953125, "step": 498000 }, { "epoch": 0.6010240092862493, "learning_rate": 8.02887908196891e-06, "loss": 2.9707293701171875, "step": 498100 }, { "epoch": 0.601144672608732, "learning_rate": 8.028475246501171e-06, "loss": 2.944581298828125, "step": 498200 }, { "epoch": 0.6012653359312147, "learning_rate": 8.028071411033432e-06, "loss": 2.954312438964844, "step": 498300 }, { "epoch": 0.6013859992536974, "learning_rate": 8.027667575565694e-06, "loss": 2.9526156616210937, "step": 498400 }, { "epoch": 0.60150666257618, "learning_rate": 8.027263740097956e-06, "loss": 2.949285583496094, "step": 498500 }, { "epoch": 0.6016273258986627, "learning_rate": 8.026859904630216e-06, "loss": 2.980736083984375, "step": 498600 }, { "epoch": 0.6017479892211454, "learning_rate": 8.026456069162478e-06, "loss": 2.949732360839844, "step": 498700 }, { "epoch": 0.6018686525436281, "learning_rate": 8.02605223369474e-06, "loss": 2.9579483032226563, "step": 498800 }, { "epoch": 0.6019893158661108, "learning_rate": 8.025648398227002e-06, "loss": 2.972672424316406, "step": 498900 }, { "epoch": 0.6021099791885934, "learning_rate": 8.025244562759264e-06, "loss": 2.952484436035156, "step": 499000 }, { "epoch": 0.6022306425110762, "learning_rate": 8.024840727291524e-06, "loss": 2.9228143310546875, "step": 499100 }, { "epoch": 0.6023513058335588, "learning_rate": 8.024436891823786e-06, "loss": 2.9677297973632815, "step": 499200 }, { "epoch": 0.6024719691560415, "learning_rate": 8.024033056356048e-06, "loss": 2.968966064453125, "step": 499300 }, { "epoch": 0.6025926324785242, "learning_rate": 8.02362922088831e-06, "loss": 2.9369766235351564, "step": 499400 }, { "epoch": 0.6027132958010069, "learning_rate": 8.02322538542057e-06, "loss": 2.92471435546875, "step": 499500 }, { "epoch": 0.6028339591234896, "learning_rate": 8.022821549952832e-06, "loss": 2.9405337524414064, "step": 499600 }, { "epoch": 0.6029546224459722, "learning_rate": 8.022417714485094e-06, "loss": 2.9437945556640623, "step": 499700 }, { "epoch": 0.6030752857684549, "learning_rate": 8.022013879017356e-06, "loss": 2.9274481201171874, "step": 499800 }, { "epoch": 0.6031959490909377, "learning_rate": 8.021610043549618e-06, "loss": 2.9407730102539062, "step": 499900 }, { "epoch": 0.6033166124134203, "learning_rate": 8.021206208081878e-06, "loss": 2.942716369628906, "step": 500000 }, { "epoch": 0.603437275735903, "learning_rate": 8.02080237261414e-06, "loss": 2.9249346923828123, "step": 500100 }, { "epoch": 0.6035579390583856, "learning_rate": 8.020398537146402e-06, "loss": 2.9676077270507815, "step": 500200 }, { "epoch": 0.6036786023808683, "learning_rate": 8.019994701678664e-06, "loss": 2.953896179199219, "step": 500300 }, { "epoch": 0.6037992657033511, "learning_rate": 8.019590866210926e-06, "loss": 2.9350482177734376, "step": 500400 }, { "epoch": 0.6039199290258337, "learning_rate": 8.019187030743187e-06, "loss": 2.953463134765625, "step": 500500 }, { "epoch": 0.6040405923483164, "learning_rate": 8.018783195275449e-06, "loss": 2.969024658203125, "step": 500600 }, { "epoch": 0.604161255670799, "learning_rate": 8.01837935980771e-06, "loss": 2.936881103515625, "step": 500700 }, { "epoch": 0.6042819189932818, "learning_rate": 8.017975524339971e-06, "loss": 2.9495361328125, "step": 500800 }, { "epoch": 0.6044025823157645, "learning_rate": 8.017571688872233e-06, "loss": 2.9232330322265625, "step": 500900 }, { "epoch": 0.6045232456382471, "learning_rate": 8.017167853404495e-06, "loss": 2.94489501953125, "step": 501000 }, { "epoch": 0.6046439089607298, "learning_rate": 8.016764017936757e-06, "loss": 2.94240234375, "step": 501100 }, { "epoch": 0.6047645722832125, "learning_rate": 8.016360182469019e-06, "loss": 2.937272033691406, "step": 501200 }, { "epoch": 0.6048852356056952, "learning_rate": 8.015956347001281e-06, "loss": 2.96359375, "step": 501300 }, { "epoch": 0.6050058989281779, "learning_rate": 8.015552511533541e-06, "loss": 2.9370523071289063, "step": 501400 }, { "epoch": 0.6051265622506605, "learning_rate": 8.015148676065803e-06, "loss": 2.943509521484375, "step": 501500 }, { "epoch": 0.6052472255731433, "learning_rate": 8.014744840598065e-06, "loss": 2.9520709228515627, "step": 501600 }, { "epoch": 0.6053678888956259, "learning_rate": 8.014341005130325e-06, "loss": 2.924737548828125, "step": 501700 }, { "epoch": 0.6054885522181086, "learning_rate": 8.013937169662587e-06, "loss": 2.9384710693359377, "step": 501800 }, { "epoch": 0.6056092155405913, "learning_rate": 8.01353333419485e-06, "loss": 2.9202166748046876, "step": 501900 }, { "epoch": 0.605729878863074, "learning_rate": 8.013129498727111e-06, "loss": 2.9348904418945314, "step": 502000 }, { "epoch": 0.6058505421855567, "learning_rate": 8.012725663259373e-06, "loss": 2.9645947265625, "step": 502100 }, { "epoch": 0.6059712055080393, "learning_rate": 8.012321827791635e-06, "loss": 2.955181884765625, "step": 502200 }, { "epoch": 0.606091868830522, "learning_rate": 8.011917992323897e-06, "loss": 2.9298760986328123, "step": 502300 }, { "epoch": 0.6062125321530047, "learning_rate": 8.011514156856158e-06, "loss": 2.941722412109375, "step": 502400 }, { "epoch": 0.6063331954754874, "learning_rate": 8.01111032138842e-06, "loss": 2.9457748413085936, "step": 502500 }, { "epoch": 0.6064538587979701, "learning_rate": 8.01070648592068e-06, "loss": 2.9628973388671875, "step": 502600 }, { "epoch": 0.6065745221204528, "learning_rate": 8.010302650452942e-06, "loss": 2.9518466186523438, "step": 502700 }, { "epoch": 0.6066951854429354, "learning_rate": 8.009898814985204e-06, "loss": 2.9688055419921877, "step": 502800 }, { "epoch": 0.6068158487654182, "learning_rate": 8.009494979517466e-06, "loss": 2.9575765991210936, "step": 502900 }, { "epoch": 0.6069365120879008, "learning_rate": 8.009091144049728e-06, "loss": 2.9197097778320313, "step": 503000 }, { "epoch": 0.6070571754103835, "learning_rate": 8.00868730858199e-06, "loss": 2.9297930908203127, "step": 503100 }, { "epoch": 0.6071778387328662, "learning_rate": 8.00828347311425e-06, "loss": 2.9497998046875, "step": 503200 }, { "epoch": 0.6072985020553489, "learning_rate": 8.007879637646512e-06, "loss": 2.9174771118164062, "step": 503300 }, { "epoch": 0.6074191653778316, "learning_rate": 8.007475802178774e-06, "loss": 2.9464212036132813, "step": 503400 }, { "epoch": 0.6075398287003142, "learning_rate": 8.007071966711036e-06, "loss": 2.9540090942382813, "step": 503500 }, { "epoch": 0.6076604920227969, "learning_rate": 8.006668131243296e-06, "loss": 2.935716552734375, "step": 503600 }, { "epoch": 0.6077811553452797, "learning_rate": 8.006264295775558e-06, "loss": 2.9447976684570314, "step": 503700 }, { "epoch": 0.6079018186677623, "learning_rate": 8.00586046030782e-06, "loss": 2.928397216796875, "step": 503800 }, { "epoch": 0.608022481990245, "learning_rate": 8.005456624840082e-06, "loss": 2.9565304565429686, "step": 503900 }, { "epoch": 0.6081431453127276, "learning_rate": 8.005052789372343e-06, "loss": 2.902865295410156, "step": 504000 }, { "epoch": 0.6082638086352103, "learning_rate": 8.004648953904605e-06, "loss": 2.936872863769531, "step": 504100 }, { "epoch": 0.6083844719576931, "learning_rate": 8.004245118436866e-06, "loss": 2.931551208496094, "step": 504200 }, { "epoch": 0.6085051352801757, "learning_rate": 8.003841282969128e-06, "loss": 2.947609558105469, "step": 504300 }, { "epoch": 0.6086257986026584, "learning_rate": 8.00343744750139e-06, "loss": 2.9287814331054687, "step": 504400 }, { "epoch": 0.608746461925141, "learning_rate": 8.00303361203365e-06, "loss": 2.938049621582031, "step": 504500 }, { "epoch": 0.6088671252476238, "learning_rate": 8.002629776565913e-06, "loss": 2.949931945800781, "step": 504600 }, { "epoch": 0.6089877885701065, "learning_rate": 8.002225941098175e-06, "loss": 2.9366058349609374, "step": 504700 }, { "epoch": 0.6091084518925891, "learning_rate": 8.001822105630437e-06, "loss": 2.9943002319335936, "step": 504800 }, { "epoch": 0.6092291152150718, "learning_rate": 8.001418270162697e-06, "loss": 2.940538330078125, "step": 504900 }, { "epoch": 0.6093497785375545, "learning_rate": 8.001014434694959e-06, "loss": 2.934717712402344, "step": 505000 }, { "epoch": 0.6094704418600372, "learning_rate": 8.000610599227221e-06, "loss": 2.958609924316406, "step": 505100 }, { "epoch": 0.6095911051825199, "learning_rate": 8.000206763759483e-06, "loss": 2.96318603515625, "step": 505200 }, { "epoch": 0.6097117685050025, "learning_rate": 7.999802928291745e-06, "loss": 2.9749432373046876, "step": 505300 }, { "epoch": 0.6098324318274853, "learning_rate": 7.999399092824007e-06, "loss": 2.9267352294921873, "step": 505400 }, { "epoch": 0.6099530951499679, "learning_rate": 7.998995257356267e-06, "loss": 2.942299499511719, "step": 505500 }, { "epoch": 0.6100737584724506, "learning_rate": 7.99859142188853e-06, "loss": 2.9731671142578127, "step": 505600 }, { "epoch": 0.6101944217949333, "learning_rate": 7.99818758642079e-06, "loss": 2.950361328125, "step": 505700 }, { "epoch": 0.610315085117416, "learning_rate": 7.997783750953051e-06, "loss": 2.941955871582031, "step": 505800 }, { "epoch": 0.6104357484398987, "learning_rate": 7.997379915485313e-06, "loss": 2.939858703613281, "step": 505900 }, { "epoch": 0.6105564117623813, "learning_rate": 7.996976080017575e-06, "loss": 2.948837890625, "step": 506000 }, { "epoch": 0.610677075084864, "learning_rate": 7.996572244549837e-06, "loss": 2.9474603271484376, "step": 506100 }, { "epoch": 0.6107977384073467, "learning_rate": 7.9961684090821e-06, "loss": 2.9288702392578125, "step": 506200 }, { "epoch": 0.6109184017298294, "learning_rate": 7.995764573614361e-06, "loss": 2.9382174682617186, "step": 506300 }, { "epoch": 0.6110390650523121, "learning_rate": 7.995360738146623e-06, "loss": 2.942349548339844, "step": 506400 }, { "epoch": 0.6111597283747947, "learning_rate": 7.994956902678884e-06, "loss": 2.9141015625, "step": 506500 }, { "epoch": 0.6112803916972774, "learning_rate": 7.994553067211146e-06, "loss": 2.9523745727539064, "step": 506600 }, { "epoch": 0.6114010550197602, "learning_rate": 7.994149231743406e-06, "loss": 2.953815612792969, "step": 506700 }, { "epoch": 0.6115217183422428, "learning_rate": 7.993745396275668e-06, "loss": 2.9407293701171877, "step": 506800 }, { "epoch": 0.6116423816647255, "learning_rate": 7.99334156080793e-06, "loss": 2.9476864624023436, "step": 506900 }, { "epoch": 0.6117630449872081, "learning_rate": 7.992937725340192e-06, "loss": 2.9306097412109375, "step": 507000 }, { "epoch": 0.6118837083096909, "learning_rate": 7.992533889872454e-06, "loss": 2.9344500732421874, "step": 507100 }, { "epoch": 0.6120043716321736, "learning_rate": 7.992130054404716e-06, "loss": 2.9500466918945314, "step": 507200 }, { "epoch": 0.6121250349546562, "learning_rate": 7.991726218936976e-06, "loss": 2.94267578125, "step": 507300 }, { "epoch": 0.6122456982771389, "learning_rate": 7.991322383469238e-06, "loss": 2.9566375732421877, "step": 507400 }, { "epoch": 0.6123663615996215, "learning_rate": 7.9909185480015e-06, "loss": 2.9195281982421877, "step": 507500 }, { "epoch": 0.6124870249221043, "learning_rate": 7.990514712533762e-06, "loss": 2.939086608886719, "step": 507600 }, { "epoch": 0.612607688244587, "learning_rate": 7.990110877066022e-06, "loss": 2.9370703125, "step": 507700 }, { "epoch": 0.6127283515670696, "learning_rate": 7.989707041598284e-06, "loss": 2.941788330078125, "step": 507800 }, { "epoch": 0.6128490148895523, "learning_rate": 7.989303206130546e-06, "loss": 2.9362823486328127, "step": 507900 }, { "epoch": 0.6129696782120351, "learning_rate": 7.988899370662808e-06, "loss": 2.949305114746094, "step": 508000 }, { "epoch": 0.6130903415345177, "learning_rate": 7.988495535195069e-06, "loss": 2.922286376953125, "step": 508100 }, { "epoch": 0.6132110048570004, "learning_rate": 7.98809169972733e-06, "loss": 2.946279296875, "step": 508200 }, { "epoch": 0.613331668179483, "learning_rate": 7.987687864259593e-06, "loss": 2.9381887817382815, "step": 508300 }, { "epoch": 0.6134523315019658, "learning_rate": 7.987284028791855e-06, "loss": 2.9511874389648436, "step": 508400 }, { "epoch": 0.6135729948244485, "learning_rate": 7.986880193324116e-06, "loss": 2.9328399658203126, "step": 508500 }, { "epoch": 0.6136936581469311, "learning_rate": 7.986476357856377e-06, "loss": 2.940248718261719, "step": 508600 }, { "epoch": 0.6138143214694138, "learning_rate": 7.986072522388639e-06, "loss": 2.9078173828125, "step": 508700 }, { "epoch": 0.6139349847918965, "learning_rate": 7.9856686869209e-06, "loss": 2.9195855712890624, "step": 508800 }, { "epoch": 0.6140556481143792, "learning_rate": 7.985264851453161e-06, "loss": 2.923081359863281, "step": 508900 }, { "epoch": 0.6141763114368619, "learning_rate": 7.984861015985423e-06, "loss": 2.9314361572265626, "step": 509000 }, { "epoch": 0.6142969747593445, "learning_rate": 7.984457180517685e-06, "loss": 2.907495422363281, "step": 509100 }, { "epoch": 0.6144176380818273, "learning_rate": 7.984053345049947e-06, "loss": 2.9291592407226563, "step": 509200 }, { "epoch": 0.6145383014043099, "learning_rate": 7.983649509582209e-06, "loss": 2.9413824462890625, "step": 509300 }, { "epoch": 0.6146589647267926, "learning_rate": 7.983245674114471e-06, "loss": 2.926028137207031, "step": 509400 }, { "epoch": 0.6147796280492753, "learning_rate": 7.982841838646733e-06, "loss": 2.928121337890625, "step": 509500 }, { "epoch": 0.614900291371758, "learning_rate": 7.982438003178993e-06, "loss": 2.9601974487304688, "step": 509600 }, { "epoch": 0.6150209546942407, "learning_rate": 7.982034167711255e-06, "loss": 2.9320724487304686, "step": 509700 }, { "epoch": 0.6151416180167233, "learning_rate": 7.981630332243515e-06, "loss": 2.9248001098632814, "step": 509800 }, { "epoch": 0.615262281339206, "learning_rate": 7.981226496775777e-06, "loss": 2.94704833984375, "step": 509900 }, { "epoch": 0.6153829446616887, "learning_rate": 7.98082266130804e-06, "loss": 2.938487854003906, "step": 510000 }, { "epoch": 0.6155036079841714, "learning_rate": 7.980418825840301e-06, "loss": 2.9286630249023435, "step": 510100 }, { "epoch": 0.6156242713066541, "learning_rate": 7.980014990372563e-06, "loss": 2.9487484741210936, "step": 510200 }, { "epoch": 0.6157449346291367, "learning_rate": 7.979611154904825e-06, "loss": 2.9647967529296877, "step": 510300 }, { "epoch": 0.6158655979516194, "learning_rate": 7.979207319437087e-06, "loss": 2.9429425048828124, "step": 510400 }, { "epoch": 0.6159862612741022, "learning_rate": 7.978803483969348e-06, "loss": 2.959300842285156, "step": 510500 }, { "epoch": 0.6161069245965848, "learning_rate": 7.97839964850161e-06, "loss": 2.9324209594726565, "step": 510600 }, { "epoch": 0.6162275879190675, "learning_rate": 7.977995813033872e-06, "loss": 2.931982116699219, "step": 510700 }, { "epoch": 0.6163482512415501, "learning_rate": 7.977591977566132e-06, "loss": 2.9510748291015627, "step": 510800 }, { "epoch": 0.6164689145640329, "learning_rate": 7.977188142098394e-06, "loss": 2.900860595703125, "step": 510900 }, { "epoch": 0.6165895778865156, "learning_rate": 7.976784306630656e-06, "loss": 2.936392517089844, "step": 511000 }, { "epoch": 0.6167102412089982, "learning_rate": 7.976380471162918e-06, "loss": 2.9366650390625, "step": 511100 }, { "epoch": 0.6168309045314809, "learning_rate": 7.97597663569518e-06, "loss": 2.943543701171875, "step": 511200 }, { "epoch": 0.6169515678539635, "learning_rate": 7.975572800227442e-06, "loss": 2.929909362792969, "step": 511300 }, { "epoch": 0.6170722311764463, "learning_rate": 7.975168964759702e-06, "loss": 2.925518798828125, "step": 511400 }, { "epoch": 0.617192894498929, "learning_rate": 7.974765129291964e-06, "loss": 2.9333935546875, "step": 511500 }, { "epoch": 0.6173135578214116, "learning_rate": 7.974361293824226e-06, "loss": 2.924302062988281, "step": 511600 }, { "epoch": 0.6174342211438943, "learning_rate": 7.973957458356486e-06, "loss": 2.9478570556640626, "step": 511700 }, { "epoch": 0.617554884466377, "learning_rate": 7.973553622888748e-06, "loss": 2.9365350341796876, "step": 511800 }, { "epoch": 0.6176755477888597, "learning_rate": 7.97314978742101e-06, "loss": 2.9318582153320314, "step": 511900 }, { "epoch": 0.6177962111113424, "learning_rate": 7.972745951953272e-06, "loss": 2.9342440795898437, "step": 512000 }, { "epoch": 0.617916874433825, "learning_rate": 7.972342116485534e-06, "loss": 2.9170303344726562, "step": 512100 }, { "epoch": 0.6180375377563078, "learning_rate": 7.971938281017795e-06, "loss": 2.8970108032226562, "step": 512200 }, { "epoch": 0.6181582010787904, "learning_rate": 7.971534445550057e-06, "loss": 2.923292541503906, "step": 512300 }, { "epoch": 0.6182788644012731, "learning_rate": 7.971130610082319e-06, "loss": 2.928847351074219, "step": 512400 }, { "epoch": 0.6183995277237558, "learning_rate": 7.97072677461458e-06, "loss": 2.9172064208984376, "step": 512500 }, { "epoch": 0.6185201910462385, "learning_rate": 7.970322939146843e-06, "loss": 2.9376541137695313, "step": 512600 }, { "epoch": 0.6186408543687212, "learning_rate": 7.969919103679103e-06, "loss": 2.9123886108398436, "step": 512700 }, { "epoch": 0.6187615176912038, "learning_rate": 7.969515268211365e-06, "loss": 2.9545639038085936, "step": 512800 }, { "epoch": 0.6188821810136865, "learning_rate": 7.969111432743627e-06, "loss": 2.9437515258789064, "step": 512900 }, { "epoch": 0.6190028443361693, "learning_rate": 7.968707597275887e-06, "loss": 2.9291162109375, "step": 513000 }, { "epoch": 0.6191235076586519, "learning_rate": 7.968303761808149e-06, "loss": 2.9460580444335935, "step": 513100 }, { "epoch": 0.6192441709811346, "learning_rate": 7.967899926340411e-06, "loss": 2.9116244506835938, "step": 513200 }, { "epoch": 0.6193648343036173, "learning_rate": 7.967496090872673e-06, "loss": 2.9105389404296873, "step": 513300 }, { "epoch": 0.6194854976261, "learning_rate": 7.967092255404935e-06, "loss": 2.9243295288085935, "step": 513400 }, { "epoch": 0.6196061609485827, "learning_rate": 7.966688419937197e-06, "loss": 2.9280929565429688, "step": 513500 }, { "epoch": 0.6197268242710653, "learning_rate": 7.966284584469457e-06, "loss": 2.9477328491210937, "step": 513600 }, { "epoch": 0.619847487593548, "learning_rate": 7.96588074900172e-06, "loss": 2.9262680053710937, "step": 513700 }, { "epoch": 0.6199681509160307, "learning_rate": 7.965476913533981e-06, "loss": 2.919295349121094, "step": 513800 }, { "epoch": 0.6200888142385134, "learning_rate": 7.965073078066242e-06, "loss": 2.9143356323242187, "step": 513900 }, { "epoch": 0.6202094775609961, "learning_rate": 7.964669242598504e-06, "loss": 2.9276748657226563, "step": 514000 }, { "epoch": 0.6203301408834787, "learning_rate": 7.964265407130765e-06, "loss": 2.937161865234375, "step": 514100 }, { "epoch": 0.6204508042059614, "learning_rate": 7.963861571663027e-06, "loss": 2.9196502685546877, "step": 514200 }, { "epoch": 0.6205714675284442, "learning_rate": 7.96345773619529e-06, "loss": 2.931656494140625, "step": 514300 }, { "epoch": 0.6206921308509268, "learning_rate": 7.963053900727551e-06, "loss": 2.9033148193359377, "step": 514400 }, { "epoch": 0.6208127941734095, "learning_rate": 7.962650065259813e-06, "loss": 2.92002197265625, "step": 514500 }, { "epoch": 0.6209334574958921, "learning_rate": 7.962246229792074e-06, "loss": 2.919794921875, "step": 514600 }, { "epoch": 0.6210541208183749, "learning_rate": 7.961842394324336e-06, "loss": 2.916904296875, "step": 514700 }, { "epoch": 0.6211747841408576, "learning_rate": 7.961438558856596e-06, "loss": 2.9389263916015627, "step": 514800 }, { "epoch": 0.6212954474633402, "learning_rate": 7.961034723388858e-06, "loss": 2.937230224609375, "step": 514900 }, { "epoch": 0.6214161107858229, "learning_rate": 7.96063088792112e-06, "loss": 2.913074951171875, "step": 515000 }, { "epoch": 0.6215367741083055, "learning_rate": 7.960227052453382e-06, "loss": 2.9199456787109375, "step": 515100 }, { "epoch": 0.6216574374307883, "learning_rate": 7.959823216985644e-06, "loss": 2.933965148925781, "step": 515200 }, { "epoch": 0.621778100753271, "learning_rate": 7.959419381517906e-06, "loss": 2.9413833618164062, "step": 515300 }, { "epoch": 0.6218987640757536, "learning_rate": 7.959015546050168e-06, "loss": 2.9478463745117187, "step": 515400 }, { "epoch": 0.6220194273982363, "learning_rate": 7.958611710582428e-06, "loss": 2.9017559814453127, "step": 515500 }, { "epoch": 0.622140090720719, "learning_rate": 7.95820787511469e-06, "loss": 2.927471008300781, "step": 515600 }, { "epoch": 0.6222607540432017, "learning_rate": 7.957804039646952e-06, "loss": 2.9231170654296874, "step": 515700 }, { "epoch": 0.6223814173656844, "learning_rate": 7.957400204179212e-06, "loss": 2.9155319213867186, "step": 515800 }, { "epoch": 0.622502080688167, "learning_rate": 7.956996368711474e-06, "loss": 2.9355905151367185, "step": 515900 }, { "epoch": 0.6226227440106498, "learning_rate": 7.956592533243736e-06, "loss": 2.915854797363281, "step": 516000 }, { "epoch": 0.6227434073331324, "learning_rate": 7.956188697775998e-06, "loss": 2.937925109863281, "step": 516100 }, { "epoch": 0.6228640706556151, "learning_rate": 7.95578486230826e-06, "loss": 2.958274230957031, "step": 516200 }, { "epoch": 0.6229847339780978, "learning_rate": 7.95538102684052e-06, "loss": 2.900185241699219, "step": 516300 }, { "epoch": 0.6231053973005805, "learning_rate": 7.954977191372783e-06, "loss": 2.9382064819335936, "step": 516400 }, { "epoch": 0.6232260606230632, "learning_rate": 7.954573355905045e-06, "loss": 2.931901550292969, "step": 516500 }, { "epoch": 0.6233467239455458, "learning_rate": 7.954169520437307e-06, "loss": 2.8812347412109376, "step": 516600 }, { "epoch": 0.6234673872680285, "learning_rate": 7.953765684969567e-06, "loss": 2.898975524902344, "step": 516700 }, { "epoch": 0.6235880505905113, "learning_rate": 7.953361849501829e-06, "loss": 2.933077697753906, "step": 516800 }, { "epoch": 0.6237087139129939, "learning_rate": 7.95295801403409e-06, "loss": 2.9323956298828127, "step": 516900 }, { "epoch": 0.6238293772354766, "learning_rate": 7.952554178566353e-06, "loss": 2.9189215087890625, "step": 517000 }, { "epoch": 0.6239500405579592, "learning_rate": 7.952150343098613e-06, "loss": 2.9305963134765625, "step": 517100 }, { "epoch": 0.624070703880442, "learning_rate": 7.951746507630875e-06, "loss": 2.9188876342773438, "step": 517200 }, { "epoch": 0.6241913672029247, "learning_rate": 7.951342672163137e-06, "loss": 2.9377862548828126, "step": 517300 }, { "epoch": 0.6243120305254073, "learning_rate": 7.950938836695399e-06, "loss": 2.9388796997070314, "step": 517400 }, { "epoch": 0.62443269384789, "learning_rate": 7.950535001227661e-06, "loss": 2.920887451171875, "step": 517500 }, { "epoch": 0.6245533571703726, "learning_rate": 7.950131165759923e-06, "loss": 2.8912997436523438, "step": 517600 }, { "epoch": 0.6246740204928554, "learning_rate": 7.949727330292183e-06, "loss": 2.9513134765625, "step": 517700 }, { "epoch": 0.6247946838153381, "learning_rate": 7.949323494824445e-06, "loss": 2.895133056640625, "step": 517800 }, { "epoch": 0.6249153471378207, "learning_rate": 7.948919659356706e-06, "loss": 2.9340667724609375, "step": 517900 }, { "epoch": 0.6250360104603034, "learning_rate": 7.948515823888968e-06, "loss": 2.93799072265625, "step": 518000 }, { "epoch": 0.6251566737827862, "learning_rate": 7.94811198842123e-06, "loss": 2.9283697509765627, "step": 518100 }, { "epoch": 0.6252773371052688, "learning_rate": 7.947708152953492e-06, "loss": 2.9418405151367186, "step": 518200 }, { "epoch": 0.6253980004277515, "learning_rate": 7.947304317485753e-06, "loss": 2.915838317871094, "step": 518300 }, { "epoch": 0.6255186637502341, "learning_rate": 7.946900482018015e-06, "loss": 2.894775085449219, "step": 518400 }, { "epoch": 0.6256393270727169, "learning_rate": 7.946496646550277e-06, "loss": 2.9170150756835938, "step": 518500 }, { "epoch": 0.6257599903951996, "learning_rate": 7.94609281108254e-06, "loss": 2.9279708862304688, "step": 518600 }, { "epoch": 0.6258806537176822, "learning_rate": 7.9456889756148e-06, "loss": 2.9136148071289063, "step": 518700 }, { "epoch": 0.6260013170401649, "learning_rate": 7.945285140147062e-06, "loss": 2.917821960449219, "step": 518800 }, { "epoch": 0.6261219803626475, "learning_rate": 7.944881304679322e-06, "loss": 2.900311279296875, "step": 518900 }, { "epoch": 0.6262426436851303, "learning_rate": 7.944477469211584e-06, "loss": 2.924251708984375, "step": 519000 }, { "epoch": 0.626363307007613, "learning_rate": 7.944073633743846e-06, "loss": 2.939072265625, "step": 519100 }, { "epoch": 0.6264839703300956, "learning_rate": 7.943669798276108e-06, "loss": 2.9273110961914064, "step": 519200 }, { "epoch": 0.6266046336525783, "learning_rate": 7.94326596280837e-06, "loss": 2.8934375, "step": 519300 }, { "epoch": 0.626725296975061, "learning_rate": 7.942862127340632e-06, "loss": 2.9186386108398437, "step": 519400 }, { "epoch": 0.6268459602975437, "learning_rate": 7.942458291872892e-06, "loss": 2.927326354980469, "step": 519500 }, { "epoch": 0.6269666236200264, "learning_rate": 7.942054456405154e-06, "loss": 2.9182174682617186, "step": 519600 }, { "epoch": 0.627087286942509, "learning_rate": 7.941650620937416e-06, "loss": 2.9111480712890625, "step": 519700 }, { "epoch": 0.6272079502649918, "learning_rate": 7.941246785469678e-06, "loss": 2.9423431396484374, "step": 519800 }, { "epoch": 0.6273286135874744, "learning_rate": 7.940842950001938e-06, "loss": 2.922041015625, "step": 519900 }, { "epoch": 0.6274492769099571, "learning_rate": 7.9404391145342e-06, "loss": 2.958108215332031, "step": 520000 }, { "epoch": 0.6275699402324398, "learning_rate": 7.940035279066462e-06, "loss": 2.910821838378906, "step": 520100 }, { "epoch": 0.6276906035549225, "learning_rate": 7.939631443598724e-06, "loss": 2.92248291015625, "step": 520200 }, { "epoch": 0.6278112668774052, "learning_rate": 7.939227608130986e-06, "loss": 2.920801086425781, "step": 520300 }, { "epoch": 0.6279319301998878, "learning_rate": 7.938823772663247e-06, "loss": 2.920839538574219, "step": 520400 }, { "epoch": 0.6280525935223705, "learning_rate": 7.938419937195509e-06, "loss": 2.92770263671875, "step": 520500 }, { "epoch": 0.6281732568448533, "learning_rate": 7.93801610172777e-06, "loss": 2.9224734497070313, "step": 520600 }, { "epoch": 0.6282939201673359, "learning_rate": 7.937612266260033e-06, "loss": 2.9305413818359374, "step": 520700 }, { "epoch": 0.6284145834898186, "learning_rate": 7.937208430792293e-06, "loss": 2.8962722778320313, "step": 520800 }, { "epoch": 0.6285352468123012, "learning_rate": 7.936804595324555e-06, "loss": 2.9308657836914063, "step": 520900 }, { "epoch": 0.628655910134784, "learning_rate": 7.936400759856817e-06, "loss": 2.904207458496094, "step": 521000 }, { "epoch": 0.6287765734572667, "learning_rate": 7.935996924389079e-06, "loss": 2.9203060913085936, "step": 521100 }, { "epoch": 0.6288972367797493, "learning_rate": 7.935593088921339e-06, "loss": 2.916864929199219, "step": 521200 }, { "epoch": 0.629017900102232, "learning_rate": 7.935189253453601e-06, "loss": 2.907156982421875, "step": 521300 }, { "epoch": 0.6291385634247146, "learning_rate": 7.934785417985863e-06, "loss": 2.914400634765625, "step": 521400 }, { "epoch": 0.6292592267471974, "learning_rate": 7.934381582518125e-06, "loss": 2.9265597534179686, "step": 521500 }, { "epoch": 0.6293798900696801, "learning_rate": 7.933977747050387e-06, "loss": 2.9270748901367187, "step": 521600 }, { "epoch": 0.6295005533921627, "learning_rate": 7.933573911582649e-06, "loss": 2.9318606567382814, "step": 521700 }, { "epoch": 0.6296212167146454, "learning_rate": 7.93317007611491e-06, "loss": 2.922077941894531, "step": 521800 }, { "epoch": 0.629741880037128, "learning_rate": 7.932766240647171e-06, "loss": 2.9371435546875, "step": 521900 }, { "epoch": 0.6298625433596108, "learning_rate": 7.932362405179432e-06, "loss": 2.8946109008789063, "step": 522000 }, { "epoch": 0.6299832066820935, "learning_rate": 7.931958569711694e-06, "loss": 2.91708984375, "step": 522100 }, { "epoch": 0.6301038700045761, "learning_rate": 7.931554734243956e-06, "loss": 2.935476989746094, "step": 522200 }, { "epoch": 0.6302245333270589, "learning_rate": 7.931150898776218e-06, "loss": 2.931512756347656, "step": 522300 }, { "epoch": 0.6303451966495415, "learning_rate": 7.93074706330848e-06, "loss": 2.930699462890625, "step": 522400 }, { "epoch": 0.6304658599720242, "learning_rate": 7.930343227840742e-06, "loss": 2.916722717285156, "step": 522500 }, { "epoch": 0.6305865232945069, "learning_rate": 7.929939392373003e-06, "loss": 2.930321044921875, "step": 522600 }, { "epoch": 0.6307071866169895, "learning_rate": 7.929535556905264e-06, "loss": 2.9280126953125, "step": 522700 }, { "epoch": 0.6308278499394723, "learning_rate": 7.929131721437526e-06, "loss": 2.9292257690429686, "step": 522800 }, { "epoch": 0.6309485132619549, "learning_rate": 7.928727885969788e-06, "loss": 2.9129730224609376, "step": 522900 }, { "epoch": 0.6310691765844376, "learning_rate": 7.928324050502048e-06, "loss": 2.9149789428710937, "step": 523000 }, { "epoch": 0.6311898399069203, "learning_rate": 7.92792021503431e-06, "loss": 2.9060940551757812, "step": 523100 }, { "epoch": 0.631310503229403, "learning_rate": 7.927516379566572e-06, "loss": 2.9181484985351562, "step": 523200 }, { "epoch": 0.6314311665518857, "learning_rate": 7.927112544098834e-06, "loss": 2.9121249389648436, "step": 523300 }, { "epoch": 0.6315518298743684, "learning_rate": 7.926708708631096e-06, "loss": 2.9159979248046874, "step": 523400 }, { "epoch": 0.631672493196851, "learning_rate": 7.926304873163358e-06, "loss": 2.948087463378906, "step": 523500 }, { "epoch": 0.6317931565193338, "learning_rate": 7.925901037695618e-06, "loss": 2.930238952636719, "step": 523600 }, { "epoch": 0.6319138198418164, "learning_rate": 7.92549720222788e-06, "loss": 2.912752685546875, "step": 523700 }, { "epoch": 0.6320344831642991, "learning_rate": 7.925093366760142e-06, "loss": 2.9361221313476564, "step": 523800 }, { "epoch": 0.6321551464867818, "learning_rate": 7.924689531292402e-06, "loss": 2.9162432861328127, "step": 523900 }, { "epoch": 0.6322758098092645, "learning_rate": 7.924285695824664e-06, "loss": 2.9198068237304686, "step": 524000 }, { "epoch": 0.6323964731317472, "learning_rate": 7.923881860356926e-06, "loss": 2.9152001953125, "step": 524100 }, { "epoch": 0.6325171364542298, "learning_rate": 7.923478024889188e-06, "loss": 2.9171633911132813, "step": 524200 }, { "epoch": 0.6326377997767125, "learning_rate": 7.92307418942145e-06, "loss": 2.9247210693359373, "step": 524300 }, { "epoch": 0.6327584630991953, "learning_rate": 7.92267035395371e-06, "loss": 2.920307312011719, "step": 524400 }, { "epoch": 0.6328791264216779, "learning_rate": 7.922266518485973e-06, "loss": 2.911843566894531, "step": 524500 }, { "epoch": 0.6329997897441606, "learning_rate": 7.921862683018235e-06, "loss": 2.9048123168945312, "step": 524600 }, { "epoch": 0.6331204530666432, "learning_rate": 7.921458847550497e-06, "loss": 2.8982302856445314, "step": 524700 }, { "epoch": 0.633241116389126, "learning_rate": 7.921055012082759e-06, "loss": 2.9159341430664063, "step": 524800 }, { "epoch": 0.6333617797116087, "learning_rate": 7.920651176615019e-06, "loss": 2.953211364746094, "step": 524900 }, { "epoch": 0.6334824430340913, "learning_rate": 7.920247341147281e-06, "loss": 2.8935418701171876, "step": 525000 }, { "epoch": 0.633603106356574, "learning_rate": 7.919843505679543e-06, "loss": 2.8928067016601564, "step": 525100 }, { "epoch": 0.6337237696790566, "learning_rate": 7.919439670211805e-06, "loss": 2.9214743041992186, "step": 525200 }, { "epoch": 0.6338444330015394, "learning_rate": 7.919035834744065e-06, "loss": 2.9290887451171876, "step": 525300 }, { "epoch": 0.6339650963240221, "learning_rate": 7.918631999276327e-06, "loss": 2.9300689697265625, "step": 525400 }, { "epoch": 0.6340857596465047, "learning_rate": 7.918228163808589e-06, "loss": 2.8972433471679686, "step": 525500 }, { "epoch": 0.6342064229689874, "learning_rate": 7.917824328340851e-06, "loss": 2.8949765014648436, "step": 525600 }, { "epoch": 0.63432708629147, "learning_rate": 7.917420492873113e-06, "loss": 2.91369873046875, "step": 525700 }, { "epoch": 0.6344477496139528, "learning_rate": 7.917016657405373e-06, "loss": 2.900715026855469, "step": 525800 }, { "epoch": 0.6345684129364355, "learning_rate": 7.916612821937635e-06, "loss": 2.9279440307617186, "step": 525900 }, { "epoch": 0.6346890762589181, "learning_rate": 7.916208986469897e-06, "loss": 2.9390029907226562, "step": 526000 }, { "epoch": 0.6348097395814009, "learning_rate": 7.915805151002158e-06, "loss": 2.9287124633789063, "step": 526100 }, { "epoch": 0.6349304029038835, "learning_rate": 7.91540131553442e-06, "loss": 2.89931396484375, "step": 526200 }, { "epoch": 0.6350510662263662, "learning_rate": 7.914997480066682e-06, "loss": 2.9417630004882813, "step": 526300 }, { "epoch": 0.6351717295488489, "learning_rate": 7.914593644598944e-06, "loss": 2.9337152099609374, "step": 526400 }, { "epoch": 0.6352923928713315, "learning_rate": 7.914189809131206e-06, "loss": 2.9253668212890624, "step": 526500 }, { "epoch": 0.6354130561938143, "learning_rate": 7.913785973663468e-06, "loss": 2.9214242553710936, "step": 526600 }, { "epoch": 0.6355337195162969, "learning_rate": 7.91338213819573e-06, "loss": 2.911136474609375, "step": 526700 }, { "epoch": 0.6356543828387796, "learning_rate": 7.91297830272799e-06, "loss": 2.919922180175781, "step": 526800 }, { "epoch": 0.6357750461612623, "learning_rate": 7.912574467260252e-06, "loss": 2.926233825683594, "step": 526900 }, { "epoch": 0.635895709483745, "learning_rate": 7.912170631792512e-06, "loss": 2.8864752197265626, "step": 527000 }, { "epoch": 0.6360163728062277, "learning_rate": 7.911766796324774e-06, "loss": 2.9276934814453126, "step": 527100 }, { "epoch": 0.6361370361287103, "learning_rate": 7.911362960857036e-06, "loss": 2.8995010375976564, "step": 527200 }, { "epoch": 0.636257699451193, "learning_rate": 7.910959125389298e-06, "loss": 2.920686950683594, "step": 527300 }, { "epoch": 0.6363783627736758, "learning_rate": 7.91055528992156e-06, "loss": 2.926412353515625, "step": 527400 }, { "epoch": 0.6364990260961584, "learning_rate": 7.910151454453822e-06, "loss": 2.9265869140625, "step": 527500 }, { "epoch": 0.6366196894186411, "learning_rate": 7.909747618986084e-06, "loss": 2.9085421752929688, "step": 527600 }, { "epoch": 0.6367403527411237, "learning_rate": 7.909343783518344e-06, "loss": 2.9507366943359377, "step": 527700 }, { "epoch": 0.6368610160636065, "learning_rate": 7.908939948050606e-06, "loss": 2.9089315795898436, "step": 527800 }, { "epoch": 0.6369816793860892, "learning_rate": 7.908536112582868e-06, "loss": 2.9272750854492187, "step": 527900 }, { "epoch": 0.6371023427085718, "learning_rate": 7.908132277115129e-06, "loss": 2.8651077270507814, "step": 528000 }, { "epoch": 0.6372230060310545, "learning_rate": 7.90772844164739e-06, "loss": 2.8903424072265627, "step": 528100 }, { "epoch": 0.6373436693535371, "learning_rate": 7.907324606179652e-06, "loss": 2.917109375, "step": 528200 }, { "epoch": 0.6374643326760199, "learning_rate": 7.906920770711914e-06, "loss": 2.90942138671875, "step": 528300 }, { "epoch": 0.6375849959985026, "learning_rate": 7.906516935244176e-06, "loss": 2.9393081665039062, "step": 528400 }, { "epoch": 0.6377056593209852, "learning_rate": 7.906113099776437e-06, "loss": 2.9263076782226562, "step": 528500 }, { "epoch": 0.637826322643468, "learning_rate": 7.905709264308699e-06, "loss": 2.914020690917969, "step": 528600 }, { "epoch": 0.6379469859659507, "learning_rate": 7.90530542884096e-06, "loss": 2.9094778442382814, "step": 528700 }, { "epoch": 0.6380676492884333, "learning_rate": 7.904901593373223e-06, "loss": 2.919495849609375, "step": 528800 }, { "epoch": 0.638188312610916, "learning_rate": 7.904497757905483e-06, "loss": 2.9046136474609376, "step": 528900 }, { "epoch": 0.6383089759333986, "learning_rate": 7.904093922437745e-06, "loss": 2.909035949707031, "step": 529000 }, { "epoch": 0.6384296392558814, "learning_rate": 7.903690086970007e-06, "loss": 2.908266906738281, "step": 529100 }, { "epoch": 0.6385503025783641, "learning_rate": 7.903286251502269e-06, "loss": 2.885537109375, "step": 529200 }, { "epoch": 0.6386709659008467, "learning_rate": 7.90288241603453e-06, "loss": 2.9287509155273437, "step": 529300 }, { "epoch": 0.6387916292233294, "learning_rate": 7.902478580566791e-06, "loss": 2.912772216796875, "step": 529400 }, { "epoch": 0.638912292545812, "learning_rate": 7.902074745099053e-06, "loss": 2.924574279785156, "step": 529500 }, { "epoch": 0.6390329558682948, "learning_rate": 7.901670909631315e-06, "loss": 2.9036474609375, "step": 529600 }, { "epoch": 0.6391536191907775, "learning_rate": 7.901267074163577e-06, "loss": 2.902551574707031, "step": 529700 }, { "epoch": 0.6392742825132601, "learning_rate": 7.900863238695839e-06, "loss": 2.9299160766601564, "step": 529800 }, { "epoch": 0.6393949458357429, "learning_rate": 7.9004594032281e-06, "loss": 2.9189422607421873, "step": 529900 }, { "epoch": 0.6395156091582255, "learning_rate": 7.900055567760361e-06, "loss": 2.919125671386719, "step": 530000 }, { "epoch": 0.6396362724807082, "learning_rate": 7.899651732292623e-06, "loss": 2.889647216796875, "step": 530100 }, { "epoch": 0.6397569358031909, "learning_rate": 7.899247896824884e-06, "loss": 2.9255801391601564, "step": 530200 }, { "epoch": 0.6398775991256735, "learning_rate": 7.898844061357146e-06, "loss": 2.8967352294921875, "step": 530300 }, { "epoch": 0.6399982624481563, "learning_rate": 7.898440225889408e-06, "loss": 2.9440728759765626, "step": 530400 }, { "epoch": 0.6401189257706389, "learning_rate": 7.89803639042167e-06, "loss": 2.9279129028320314, "step": 530500 }, { "epoch": 0.6402395890931216, "learning_rate": 7.897632554953932e-06, "loss": 2.9225119018554686, "step": 530600 }, { "epoch": 0.6403602524156043, "learning_rate": 7.897228719486194e-06, "loss": 2.899134216308594, "step": 530700 }, { "epoch": 0.640480915738087, "learning_rate": 7.896824884018454e-06, "loss": 2.920964660644531, "step": 530800 }, { "epoch": 0.6406015790605697, "learning_rate": 7.896421048550716e-06, "loss": 2.9086627197265624, "step": 530900 }, { "epoch": 0.6407222423830523, "learning_rate": 7.896017213082978e-06, "loss": 2.8920623779296877, "step": 531000 }, { "epoch": 0.640842905705535, "learning_rate": 7.895613377615238e-06, "loss": 2.8837518310546875, "step": 531100 }, { "epoch": 0.6409635690280178, "learning_rate": 7.8952095421475e-06, "loss": 2.91379150390625, "step": 531200 }, { "epoch": 0.6410842323505004, "learning_rate": 7.894805706679762e-06, "loss": 2.931374206542969, "step": 531300 }, { "epoch": 0.6412048956729831, "learning_rate": 7.894401871212024e-06, "loss": 2.9140640258789063, "step": 531400 }, { "epoch": 0.6413255589954657, "learning_rate": 7.893998035744286e-06, "loss": 2.906854553222656, "step": 531500 }, { "epoch": 0.6414462223179485, "learning_rate": 7.893594200276548e-06, "loss": 2.92174560546875, "step": 531600 }, { "epoch": 0.6415668856404312, "learning_rate": 7.89319036480881e-06, "loss": 2.9333343505859375, "step": 531700 }, { "epoch": 0.6416875489629138, "learning_rate": 7.89278652934107e-06, "loss": 2.915685119628906, "step": 531800 }, { "epoch": 0.6418082122853965, "learning_rate": 7.892382693873332e-06, "loss": 2.9405352783203127, "step": 531900 }, { "epoch": 0.6419288756078791, "learning_rate": 7.891978858405593e-06, "loss": 2.8800735473632812, "step": 532000 }, { "epoch": 0.6420495389303619, "learning_rate": 7.891575022937855e-06, "loss": 2.8825479125976563, "step": 532100 }, { "epoch": 0.6421702022528446, "learning_rate": 7.891171187470117e-06, "loss": 2.8957418823242187, "step": 532200 }, { "epoch": 0.6422908655753272, "learning_rate": 7.890767352002379e-06, "loss": 2.9057769775390625, "step": 532300 }, { "epoch": 0.64241152889781, "learning_rate": 7.89036351653464e-06, "loss": 2.9050631713867188, "step": 532400 }, { "epoch": 0.6425321922202926, "learning_rate": 7.889959681066902e-06, "loss": 2.8788491821289064, "step": 532500 }, { "epoch": 0.6426528555427753, "learning_rate": 7.889555845599163e-06, "loss": 2.9095004272460936, "step": 532600 }, { "epoch": 0.642773518865258, "learning_rate": 7.889152010131425e-06, "loss": 2.9180343627929686, "step": 532700 }, { "epoch": 0.6428941821877406, "learning_rate": 7.888748174663687e-06, "loss": 2.930128173828125, "step": 532800 }, { "epoch": 0.6430148455102234, "learning_rate": 7.888344339195949e-06, "loss": 2.9327386474609374, "step": 532900 }, { "epoch": 0.643135508832706, "learning_rate": 7.887940503728209e-06, "loss": 2.9133541870117186, "step": 533000 }, { "epoch": 0.6432561721551887, "learning_rate": 7.887536668260471e-06, "loss": 2.90226806640625, "step": 533100 }, { "epoch": 0.6433768354776714, "learning_rate": 7.887132832792733e-06, "loss": 2.9028521728515626, "step": 533200 }, { "epoch": 0.643497498800154, "learning_rate": 7.886728997324995e-06, "loss": 2.922269592285156, "step": 533300 }, { "epoch": 0.6436181621226368, "learning_rate": 7.886325161857255e-06, "loss": 2.9260598754882814, "step": 533400 }, { "epoch": 0.6437388254451194, "learning_rate": 7.885921326389517e-06, "loss": 2.9319769287109376, "step": 533500 }, { "epoch": 0.6438594887676021, "learning_rate": 7.88551749092178e-06, "loss": 2.901370849609375, "step": 533600 }, { "epoch": 0.6439801520900849, "learning_rate": 7.885113655454041e-06, "loss": 2.9178424072265625, "step": 533700 }, { "epoch": 0.6441008154125675, "learning_rate": 7.884709819986303e-06, "loss": 2.9081576538085936, "step": 533800 }, { "epoch": 0.6442214787350502, "learning_rate": 7.884305984518565e-06, "loss": 2.907099609375, "step": 533900 }, { "epoch": 0.6443421420575329, "learning_rate": 7.883902149050825e-06, "loss": 2.918369140625, "step": 534000 }, { "epoch": 0.6444628053800155, "learning_rate": 7.883498313583087e-06, "loss": 2.9075936889648437, "step": 534100 }, { "epoch": 0.6445834687024983, "learning_rate": 7.883094478115348e-06, "loss": 2.9389569091796877, "step": 534200 }, { "epoch": 0.6447041320249809, "learning_rate": 7.88269064264761e-06, "loss": 2.887899169921875, "step": 534300 }, { "epoch": 0.6448247953474636, "learning_rate": 7.882286807179872e-06, "loss": 2.900060119628906, "step": 534400 }, { "epoch": 0.6449454586699463, "learning_rate": 7.881882971712134e-06, "loss": 2.902264404296875, "step": 534500 }, { "epoch": 0.645066121992429, "learning_rate": 7.881479136244396e-06, "loss": 2.8935296630859373, "step": 534600 }, { "epoch": 0.6451867853149117, "learning_rate": 7.881075300776658e-06, "loss": 2.93751953125, "step": 534700 }, { "epoch": 0.6453074486373943, "learning_rate": 7.88067146530892e-06, "loss": 2.90350830078125, "step": 534800 }, { "epoch": 0.645428111959877, "learning_rate": 7.88026762984118e-06, "loss": 2.890809326171875, "step": 534900 }, { "epoch": 0.6455487752823598, "learning_rate": 7.879863794373442e-06, "loss": 2.91779296875, "step": 535000 }, { "epoch": 0.6456694386048424, "learning_rate": 7.879459958905704e-06, "loss": 2.9179510498046874, "step": 535100 }, { "epoch": 0.6457901019273251, "learning_rate": 7.879056123437964e-06, "loss": 2.9075067138671873, "step": 535200 }, { "epoch": 0.6459107652498077, "learning_rate": 7.878652287970226e-06, "loss": 2.908475646972656, "step": 535300 }, { "epoch": 0.6460314285722905, "learning_rate": 7.878248452502488e-06, "loss": 2.9076922607421873, "step": 535400 }, { "epoch": 0.6461520918947732, "learning_rate": 7.87784461703475e-06, "loss": 2.890078430175781, "step": 535500 }, { "epoch": 0.6462727552172558, "learning_rate": 7.877440781567012e-06, "loss": 2.8760922241210936, "step": 535600 }, { "epoch": 0.6463934185397385, "learning_rate": 7.877036946099274e-06, "loss": 2.93329833984375, "step": 535700 }, { "epoch": 0.6465140818622211, "learning_rate": 7.876633110631536e-06, "loss": 2.9066500854492188, "step": 535800 }, { "epoch": 0.6466347451847039, "learning_rate": 7.876229275163796e-06, "loss": 2.933055419921875, "step": 535900 }, { "epoch": 0.6467554085071866, "learning_rate": 7.875825439696058e-06, "loss": 2.9006198120117186, "step": 536000 }, { "epoch": 0.6468760718296692, "learning_rate": 7.875421604228319e-06, "loss": 2.9125405883789064, "step": 536100 }, { "epoch": 0.646996735152152, "learning_rate": 7.87501776876058e-06, "loss": 2.9205218505859376, "step": 536200 }, { "epoch": 0.6471173984746346, "learning_rate": 7.874613933292843e-06, "loss": 2.9006918334960936, "step": 536300 }, { "epoch": 0.6472380617971173, "learning_rate": 7.874210097825105e-06, "loss": 2.891918029785156, "step": 536400 }, { "epoch": 0.6473587251196, "learning_rate": 7.873806262357367e-06, "loss": 2.9168359375, "step": 536500 }, { "epoch": 0.6474793884420826, "learning_rate": 7.873402426889629e-06, "loss": 2.916479187011719, "step": 536600 }, { "epoch": 0.6476000517645654, "learning_rate": 7.872998591421889e-06, "loss": 2.923353576660156, "step": 536700 }, { "epoch": 0.647720715087048, "learning_rate": 7.87259475595415e-06, "loss": 2.9228530883789063, "step": 536800 }, { "epoch": 0.6478413784095307, "learning_rate": 7.872190920486413e-06, "loss": 2.896103515625, "step": 536900 }, { "epoch": 0.6479620417320134, "learning_rate": 7.871787085018675e-06, "loss": 2.88780029296875, "step": 537000 }, { "epoch": 0.648082705054496, "learning_rate": 7.871383249550935e-06, "loss": 2.892388916015625, "step": 537100 }, { "epoch": 0.6482033683769788, "learning_rate": 7.870979414083197e-06, "loss": 2.903394775390625, "step": 537200 }, { "epoch": 0.6483240316994614, "learning_rate": 7.870575578615459e-06, "loss": 2.889374084472656, "step": 537300 }, { "epoch": 0.6484446950219441, "learning_rate": 7.870171743147721e-06, "loss": 2.9206292724609373, "step": 537400 }, { "epoch": 0.6485653583444269, "learning_rate": 7.869767907679981e-06, "loss": 2.902332458496094, "step": 537500 }, { "epoch": 0.6486860216669095, "learning_rate": 7.869364072212243e-06, "loss": 2.9179312133789064, "step": 537600 }, { "epoch": 0.6488066849893922, "learning_rate": 7.868960236744505e-06, "loss": 2.8813995361328124, "step": 537700 }, { "epoch": 0.6489273483118748, "learning_rate": 7.868556401276767e-06, "loss": 2.92198974609375, "step": 537800 }, { "epoch": 0.6490480116343575, "learning_rate": 7.86815256580903e-06, "loss": 2.8931451416015626, "step": 537900 }, { "epoch": 0.6491686749568403, "learning_rate": 7.86774873034129e-06, "loss": 2.90304443359375, "step": 538000 }, { "epoch": 0.6492893382793229, "learning_rate": 7.867344894873551e-06, "loss": 2.8974130249023435, "step": 538100 }, { "epoch": 0.6494100016018056, "learning_rate": 7.866941059405813e-06, "loss": 2.9123568725585938, "step": 538200 }, { "epoch": 0.6495306649242882, "learning_rate": 7.866537223938074e-06, "loss": 2.8980618286132813, "step": 538300 }, { "epoch": 0.649651328246771, "learning_rate": 7.866133388470336e-06, "loss": 2.9039300537109374, "step": 538400 }, { "epoch": 0.6497719915692537, "learning_rate": 7.865729553002598e-06, "loss": 2.903240051269531, "step": 538500 }, { "epoch": 0.6498926548917363, "learning_rate": 7.86532571753486e-06, "loss": 2.888386535644531, "step": 538600 }, { "epoch": 0.650013318214219, "learning_rate": 7.864921882067122e-06, "loss": 2.865736389160156, "step": 538700 }, { "epoch": 0.6501339815367017, "learning_rate": 7.864518046599384e-06, "loss": 2.8814651489257814, "step": 538800 }, { "epoch": 0.6502546448591844, "learning_rate": 7.864114211131646e-06, "loss": 2.9174713134765624, "step": 538900 }, { "epoch": 0.6503753081816671, "learning_rate": 7.863710375663906e-06, "loss": 2.8867333984375, "step": 539000 }, { "epoch": 0.6504959715041497, "learning_rate": 7.863306540196168e-06, "loss": 2.8783908081054688, "step": 539100 }, { "epoch": 0.6506166348266325, "learning_rate": 7.862902704728428e-06, "loss": 2.9131756591796876, "step": 539200 }, { "epoch": 0.6507372981491152, "learning_rate": 7.86249886926069e-06, "loss": 2.917720947265625, "step": 539300 }, { "epoch": 0.6508579614715978, "learning_rate": 7.862095033792952e-06, "loss": 2.915721130371094, "step": 539400 }, { "epoch": 0.6509786247940805, "learning_rate": 7.861691198325214e-06, "loss": 2.9115286254882813, "step": 539500 }, { "epoch": 0.6510992881165631, "learning_rate": 7.861287362857476e-06, "loss": 2.913331298828125, "step": 539600 }, { "epoch": 0.6512199514390459, "learning_rate": 7.860883527389738e-06, "loss": 2.9298211669921876, "step": 539700 }, { "epoch": 0.6513406147615286, "learning_rate": 7.860479691922e-06, "loss": 2.917668762207031, "step": 539800 }, { "epoch": 0.6514612780840112, "learning_rate": 7.86007585645426e-06, "loss": 2.8871951293945313, "step": 539900 }, { "epoch": 0.651581941406494, "learning_rate": 7.859672020986522e-06, "loss": 2.9174041748046875, "step": 540000 }, { "epoch": 0.6517026047289766, "learning_rate": 7.859268185518784e-06, "loss": 2.891155090332031, "step": 540100 }, { "epoch": 0.6518232680514593, "learning_rate": 7.858864350051045e-06, "loss": 2.8895083618164064, "step": 540200 }, { "epoch": 0.651943931373942, "learning_rate": 7.858460514583307e-06, "loss": 2.8884426879882814, "step": 540300 }, { "epoch": 0.6520645946964246, "learning_rate": 7.858056679115569e-06, "loss": 2.8725735473632814, "step": 540400 }, { "epoch": 0.6521852580189074, "learning_rate": 7.85765284364783e-06, "loss": 2.8968325805664064, "step": 540500 }, { "epoch": 0.65230592134139, "learning_rate": 7.857249008180093e-06, "loss": 2.8704620361328126, "step": 540600 }, { "epoch": 0.6524265846638727, "learning_rate": 7.856845172712355e-06, "loss": 2.915482177734375, "step": 540700 }, { "epoch": 0.6525472479863554, "learning_rate": 7.856441337244615e-06, "loss": 2.9027215576171876, "step": 540800 }, { "epoch": 0.6526679113088381, "learning_rate": 7.856037501776877e-06, "loss": 2.912454833984375, "step": 540900 }, { "epoch": 0.6527885746313208, "learning_rate": 7.855633666309139e-06, "loss": 2.90088134765625, "step": 541000 }, { "epoch": 0.6529092379538034, "learning_rate": 7.855229830841399e-06, "loss": 2.918892822265625, "step": 541100 }, { "epoch": 0.6530299012762861, "learning_rate": 7.854825995373661e-06, "loss": 2.8833172607421873, "step": 541200 }, { "epoch": 0.6531505645987689, "learning_rate": 7.854422159905923e-06, "loss": 2.8815362548828123, "step": 541300 }, { "epoch": 0.6532712279212515, "learning_rate": 7.854018324438185e-06, "loss": 2.908486633300781, "step": 541400 }, { "epoch": 0.6533918912437342, "learning_rate": 7.853614488970447e-06, "loss": 2.8756982421875, "step": 541500 }, { "epoch": 0.6535125545662168, "learning_rate": 7.853210653502707e-06, "loss": 2.8931463623046874, "step": 541600 }, { "epoch": 0.6536332178886995, "learning_rate": 7.85280681803497e-06, "loss": 2.898650817871094, "step": 541700 }, { "epoch": 0.6537538812111823, "learning_rate": 7.852402982567231e-06, "loss": 2.897416687011719, "step": 541800 }, { "epoch": 0.6538745445336649, "learning_rate": 7.851999147099493e-06, "loss": 2.9071905517578127, "step": 541900 }, { "epoch": 0.6539952078561476, "learning_rate": 7.851595311631755e-06, "loss": 2.8878460693359376, "step": 542000 }, { "epoch": 0.6541158711786302, "learning_rate": 7.851191476164016e-06, "loss": 2.900864562988281, "step": 542100 }, { "epoch": 0.654236534501113, "learning_rate": 7.850787640696278e-06, "loss": 2.8920828247070314, "step": 542200 }, { "epoch": 0.6543571978235957, "learning_rate": 7.85038380522854e-06, "loss": 2.870994873046875, "step": 542300 }, { "epoch": 0.6544778611460783, "learning_rate": 7.8499799697608e-06, "loss": 2.911165466308594, "step": 542400 }, { "epoch": 0.654598524468561, "learning_rate": 7.849576134293062e-06, "loss": 2.9239794921875, "step": 542500 }, { "epoch": 0.6547191877910437, "learning_rate": 7.849172298825324e-06, "loss": 2.8798031616210937, "step": 542600 }, { "epoch": 0.6548398511135264, "learning_rate": 7.848768463357586e-06, "loss": 2.885004577636719, "step": 542700 }, { "epoch": 0.6549605144360091, "learning_rate": 7.848364627889848e-06, "loss": 2.8778231811523436, "step": 542800 }, { "epoch": 0.6550811777584917, "learning_rate": 7.84796079242211e-06, "loss": 2.9184939575195314, "step": 542900 }, { "epoch": 0.6552018410809745, "learning_rate": 7.84755695695437e-06, "loss": 2.8894195556640625, "step": 543000 }, { "epoch": 0.6553225044034571, "learning_rate": 7.847153121486632e-06, "loss": 2.8782662963867187, "step": 543100 }, { "epoch": 0.6554431677259398, "learning_rate": 7.846749286018894e-06, "loss": 2.894966735839844, "step": 543200 }, { "epoch": 0.6555638310484225, "learning_rate": 7.846345450551154e-06, "loss": 2.8925051879882813, "step": 543300 }, { "epoch": 0.6556844943709051, "learning_rate": 7.845941615083416e-06, "loss": 2.905179748535156, "step": 543400 }, { "epoch": 0.6558051576933879, "learning_rate": 7.845537779615678e-06, "loss": 2.90675048828125, "step": 543500 }, { "epoch": 0.6559258210158705, "learning_rate": 7.84513394414794e-06, "loss": 2.889992370605469, "step": 543600 }, { "epoch": 0.6560464843383532, "learning_rate": 7.844730108680202e-06, "loss": 2.8882940673828124, "step": 543700 }, { "epoch": 0.656167147660836, "learning_rate": 7.844326273212464e-06, "loss": 2.8928472900390627, "step": 543800 }, { "epoch": 0.6562878109833186, "learning_rate": 7.843922437744726e-06, "loss": 2.8955841064453125, "step": 543900 }, { "epoch": 0.6564084743058013, "learning_rate": 7.843518602276986e-06, "loss": 2.890169677734375, "step": 544000 }, { "epoch": 0.656529137628284, "learning_rate": 7.843114766809248e-06, "loss": 2.8813189697265624, "step": 544100 }, { "epoch": 0.6566498009507666, "learning_rate": 7.842710931341509e-06, "loss": 2.9042623901367186, "step": 544200 }, { "epoch": 0.6567704642732494, "learning_rate": 7.84230709587377e-06, "loss": 2.8564773559570313, "step": 544300 }, { "epoch": 0.656891127595732, "learning_rate": 7.841903260406033e-06, "loss": 2.887789306640625, "step": 544400 }, { "epoch": 0.6570117909182147, "learning_rate": 7.841499424938295e-06, "loss": 2.8893804931640625, "step": 544500 }, { "epoch": 0.6571324542406974, "learning_rate": 7.841095589470557e-06, "loss": 2.893466796875, "step": 544600 }, { "epoch": 0.6572531175631801, "learning_rate": 7.840691754002819e-06, "loss": 2.8943426513671877, "step": 544700 }, { "epoch": 0.6573737808856628, "learning_rate": 7.840287918535079e-06, "loss": 2.911033020019531, "step": 544800 }, { "epoch": 0.6574944442081454, "learning_rate": 7.839884083067341e-06, "loss": 2.89703857421875, "step": 544900 }, { "epoch": 0.6576151075306281, "learning_rate": 7.839480247599603e-06, "loss": 2.886546936035156, "step": 545000 }, { "epoch": 0.6577357708531109, "learning_rate": 7.839076412131865e-06, "loss": 2.8962164306640625, "step": 545100 }, { "epoch": 0.6578564341755935, "learning_rate": 7.838672576664125e-06, "loss": 2.9256500244140624, "step": 545200 }, { "epoch": 0.6579770974980762, "learning_rate": 7.838268741196387e-06, "loss": 2.8784664916992186, "step": 545300 }, { "epoch": 0.6580977608205588, "learning_rate": 7.837864905728649e-06, "loss": 2.907110595703125, "step": 545400 }, { "epoch": 0.6582184241430415, "learning_rate": 7.837461070260911e-06, "loss": 2.900867614746094, "step": 545500 }, { "epoch": 0.6583390874655243, "learning_rate": 7.837057234793173e-06, "loss": 2.909971923828125, "step": 545600 }, { "epoch": 0.6584597507880069, "learning_rate": 7.836653399325433e-06, "loss": 2.9139413452148437, "step": 545700 }, { "epoch": 0.6585804141104896, "learning_rate": 7.836249563857695e-06, "loss": 2.920662841796875, "step": 545800 }, { "epoch": 0.6587010774329722, "learning_rate": 7.835845728389957e-06, "loss": 2.9010275268554686, "step": 545900 }, { "epoch": 0.658821740755455, "learning_rate": 7.83544189292222e-06, "loss": 2.8878598022460937, "step": 546000 }, { "epoch": 0.6589424040779377, "learning_rate": 7.83503805745448e-06, "loss": 2.9176119995117187, "step": 546100 }, { "epoch": 0.6590630674004203, "learning_rate": 7.834634221986742e-06, "loss": 2.9249783325195313, "step": 546200 }, { "epoch": 0.659183730722903, "learning_rate": 7.834230386519004e-06, "loss": 2.901019287109375, "step": 546300 }, { "epoch": 0.6593043940453857, "learning_rate": 7.833826551051266e-06, "loss": 2.8969735717773437, "step": 546400 }, { "epoch": 0.6594250573678684, "learning_rate": 7.833422715583526e-06, "loss": 2.8929318237304686, "step": 546500 }, { "epoch": 0.6595457206903511, "learning_rate": 7.833018880115788e-06, "loss": 2.9113809204101564, "step": 546600 }, { "epoch": 0.6596663840128337, "learning_rate": 7.83261504464805e-06, "loss": 2.8651937866210937, "step": 546700 }, { "epoch": 0.6597870473353165, "learning_rate": 7.832211209180312e-06, "loss": 2.898782958984375, "step": 546800 }, { "epoch": 0.6599077106577991, "learning_rate": 7.831807373712574e-06, "loss": 2.9068112182617187, "step": 546900 }, { "epoch": 0.6600283739802818, "learning_rate": 7.831403538244836e-06, "loss": 2.8640316772460936, "step": 547000 }, { "epoch": 0.6601490373027645, "learning_rate": 7.830999702777096e-06, "loss": 2.8768670654296873, "step": 547100 }, { "epoch": 0.6602697006252471, "learning_rate": 7.830595867309358e-06, "loss": 2.9254611206054686, "step": 547200 }, { "epoch": 0.6603903639477299, "learning_rate": 7.830192031841618e-06, "loss": 2.8940365600585936, "step": 547300 }, { "epoch": 0.6605110272702125, "learning_rate": 7.82978819637388e-06, "loss": 2.888963317871094, "step": 547400 }, { "epoch": 0.6606316905926952, "learning_rate": 7.829384360906142e-06, "loss": 2.8824942016601565, "step": 547500 }, { "epoch": 0.660752353915178, "learning_rate": 7.828980525438404e-06, "loss": 2.8810000610351563, "step": 547600 }, { "epoch": 0.6608730172376606, "learning_rate": 7.828576689970666e-06, "loss": 2.872586975097656, "step": 547700 }, { "epoch": 0.6609936805601433, "learning_rate": 7.828172854502928e-06, "loss": 2.8890869140625, "step": 547800 }, { "epoch": 0.6611143438826259, "learning_rate": 7.82776901903519e-06, "loss": 2.902843017578125, "step": 547900 }, { "epoch": 0.6612350072051086, "learning_rate": 7.827365183567452e-06, "loss": 2.8827139282226564, "step": 548000 }, { "epoch": 0.6613556705275914, "learning_rate": 7.826961348099712e-06, "loss": 2.8952496337890623, "step": 548100 }, { "epoch": 0.661476333850074, "learning_rate": 7.826557512631974e-06, "loss": 2.892314758300781, "step": 548200 }, { "epoch": 0.6615969971725567, "learning_rate": 7.826153677164235e-06, "loss": 2.9087774658203127, "step": 548300 }, { "epoch": 0.6617176604950393, "learning_rate": 7.825749841696497e-06, "loss": 2.8974014282226563, "step": 548400 }, { "epoch": 0.6618383238175221, "learning_rate": 7.825346006228759e-06, "loss": 2.88627685546875, "step": 548500 }, { "epoch": 0.6619589871400048, "learning_rate": 7.82494217076102e-06, "loss": 2.8855911254882813, "step": 548600 }, { "epoch": 0.6620796504624874, "learning_rate": 7.824538335293283e-06, "loss": 2.867442932128906, "step": 548700 }, { "epoch": 0.6622003137849701, "learning_rate": 7.824134499825545e-06, "loss": 2.892622985839844, "step": 548800 }, { "epoch": 0.6623209771074527, "learning_rate": 7.823730664357805e-06, "loss": 2.8662149047851564, "step": 548900 }, { "epoch": 0.6624416404299355, "learning_rate": 7.823326828890067e-06, "loss": 2.9218402099609375, "step": 549000 }, { "epoch": 0.6625623037524182, "learning_rate": 7.822922993422329e-06, "loss": 2.87510009765625, "step": 549100 }, { "epoch": 0.6626829670749008, "learning_rate": 7.822519157954591e-06, "loss": 2.8868499755859376, "step": 549200 }, { "epoch": 0.6628036303973835, "learning_rate": 7.822115322486851e-06, "loss": 2.8812124633789065, "step": 549300 }, { "epoch": 0.6629242937198663, "learning_rate": 7.821711487019113e-06, "loss": 2.9025885009765626, "step": 549400 }, { "epoch": 0.6630449570423489, "learning_rate": 7.821307651551375e-06, "loss": 2.873065185546875, "step": 549500 }, { "epoch": 0.6631656203648316, "learning_rate": 7.820903816083637e-06, "loss": 2.8949411010742185, "step": 549600 }, { "epoch": 0.6632862836873142, "learning_rate": 7.820499980615897e-06, "loss": 2.8904754638671877, "step": 549700 }, { "epoch": 0.663406947009797, "learning_rate": 7.82009614514816e-06, "loss": 2.906838684082031, "step": 549800 }, { "epoch": 0.6635276103322797, "learning_rate": 7.819692309680421e-06, "loss": 2.8911181640625, "step": 549900 }, { "epoch": 0.6636482736547623, "learning_rate": 7.819288474212683e-06, "loss": 2.869093933105469, "step": 550000 }, { "epoch": 0.663768936977245, "learning_rate": 7.818884638744945e-06, "loss": 2.8962200927734374, "step": 550100 }, { "epoch": 0.6638896002997277, "learning_rate": 7.818480803277206e-06, "loss": 2.8813595581054687, "step": 550200 }, { "epoch": 0.6640102636222104, "learning_rate": 7.818076967809468e-06, "loss": 2.9032928466796877, "step": 550300 }, { "epoch": 0.6641309269446931, "learning_rate": 7.81767313234173e-06, "loss": 2.9056414794921874, "step": 550400 }, { "epoch": 0.6642515902671757, "learning_rate": 7.81726929687399e-06, "loss": 2.890927429199219, "step": 550500 }, { "epoch": 0.6643722535896585, "learning_rate": 7.816865461406252e-06, "loss": 2.86630615234375, "step": 550600 }, { "epoch": 0.6644929169121411, "learning_rate": 7.816461625938514e-06, "loss": 2.8881985473632814, "step": 550700 }, { "epoch": 0.6646135802346238, "learning_rate": 7.816057790470776e-06, "loss": 2.9093582153320314, "step": 550800 }, { "epoch": 0.6647342435571065, "learning_rate": 7.815653955003038e-06, "loss": 2.8779608154296876, "step": 550900 }, { "epoch": 0.6648549068795891, "learning_rate": 7.8152501195353e-06, "loss": 2.8884927368164064, "step": 551000 }, { "epoch": 0.6649755702020719, "learning_rate": 7.814846284067562e-06, "loss": 2.8700637817382812, "step": 551100 }, { "epoch": 0.6650962335245545, "learning_rate": 7.814442448599822e-06, "loss": 2.9007708740234377, "step": 551200 }, { "epoch": 0.6652168968470372, "learning_rate": 7.814038613132084e-06, "loss": 2.8968634033203124, "step": 551300 }, { "epoch": 0.66533756016952, "learning_rate": 7.813634777664344e-06, "loss": 2.8800799560546877, "step": 551400 }, { "epoch": 0.6654582234920026, "learning_rate": 7.813230942196606e-06, "loss": 2.9100927734375, "step": 551500 }, { "epoch": 0.6655788868144853, "learning_rate": 7.812827106728868e-06, "loss": 2.918765869140625, "step": 551600 }, { "epoch": 0.6656995501369679, "learning_rate": 7.81242327126113e-06, "loss": 2.8859066772460937, "step": 551700 }, { "epoch": 0.6658202134594506, "learning_rate": 7.812019435793392e-06, "loss": 2.8692236328125, "step": 551800 }, { "epoch": 0.6659408767819334, "learning_rate": 7.811615600325654e-06, "loss": 2.88407958984375, "step": 551900 }, { "epoch": 0.666061540104416, "learning_rate": 7.811211764857916e-06, "loss": 2.8988983154296877, "step": 552000 }, { "epoch": 0.6661822034268987, "learning_rate": 7.810807929390177e-06, "loss": 2.884002990722656, "step": 552100 }, { "epoch": 0.6663028667493813, "learning_rate": 7.810404093922438e-06, "loss": 2.8778765869140623, "step": 552200 }, { "epoch": 0.6664235300718641, "learning_rate": 7.8100002584547e-06, "loss": 2.8798202514648437, "step": 552300 }, { "epoch": 0.6665441933943468, "learning_rate": 7.80959642298696e-06, "loss": 2.880676574707031, "step": 552400 }, { "epoch": 0.6666648567168294, "learning_rate": 7.809192587519223e-06, "loss": 2.888607177734375, "step": 552500 }, { "epoch": 0.6667855200393121, "learning_rate": 7.808788752051485e-06, "loss": 2.883059387207031, "step": 552600 }, { "epoch": 0.6669061833617947, "learning_rate": 7.808384916583747e-06, "loss": 2.8970391845703123, "step": 552700 }, { "epoch": 0.6670268466842775, "learning_rate": 7.807981081116009e-06, "loss": 2.9010162353515625, "step": 552800 }, { "epoch": 0.6671475100067602, "learning_rate": 7.80757724564827e-06, "loss": 2.875140380859375, "step": 552900 }, { "epoch": 0.6672681733292428, "learning_rate": 7.807173410180531e-06, "loss": 2.8983416748046875, "step": 553000 }, { "epoch": 0.6673888366517255, "learning_rate": 7.806769574712793e-06, "loss": 2.8651605224609376, "step": 553100 }, { "epoch": 0.6675094999742082, "learning_rate": 7.806365739245055e-06, "loss": 2.8826727294921874, "step": 553200 }, { "epoch": 0.6676301632966909, "learning_rate": 7.805961903777315e-06, "loss": 2.87650146484375, "step": 553300 }, { "epoch": 0.6677508266191736, "learning_rate": 7.805558068309577e-06, "loss": 2.870502624511719, "step": 553400 }, { "epoch": 0.6678714899416562, "learning_rate": 7.80515423284184e-06, "loss": 2.8962478637695312, "step": 553500 }, { "epoch": 0.667992153264139, "learning_rate": 7.804750397374101e-06, "loss": 2.9070758056640624, "step": 553600 }, { "epoch": 0.6681128165866216, "learning_rate": 7.804346561906363e-06, "loss": 2.87674560546875, "step": 553700 }, { "epoch": 0.6682334799091043, "learning_rate": 7.803942726438623e-06, "loss": 2.872855224609375, "step": 553800 }, { "epoch": 0.668354143231587, "learning_rate": 7.803538890970885e-06, "loss": 2.8738970947265625, "step": 553900 }, { "epoch": 0.6684748065540697, "learning_rate": 7.803135055503147e-06, "loss": 2.862540588378906, "step": 554000 }, { "epoch": 0.6685954698765524, "learning_rate": 7.80273122003541e-06, "loss": 2.900754089355469, "step": 554100 }, { "epoch": 0.668716133199035, "learning_rate": 7.802327384567671e-06, "loss": 2.8874362182617186, "step": 554200 }, { "epoch": 0.6688367965215177, "learning_rate": 7.801923549099932e-06, "loss": 2.8697039794921877, "step": 554300 }, { "epoch": 0.6689574598440005, "learning_rate": 7.801519713632194e-06, "loss": 2.8760580444335937, "step": 554400 }, { "epoch": 0.6690781231664831, "learning_rate": 7.801115878164456e-06, "loss": 2.8804000854492187, "step": 554500 }, { "epoch": 0.6691987864889658, "learning_rate": 7.800712042696716e-06, "loss": 2.889403991699219, "step": 554600 }, { "epoch": 0.6693194498114485, "learning_rate": 7.800308207228978e-06, "loss": 2.8754501342773438, "step": 554700 }, { "epoch": 0.6694401131339311, "learning_rate": 7.79990437176124e-06, "loss": 2.895796203613281, "step": 554800 }, { "epoch": 0.6695607764564139, "learning_rate": 7.799500536293502e-06, "loss": 2.9030282592773435, "step": 554900 }, { "epoch": 0.6696814397788965, "learning_rate": 7.799096700825764e-06, "loss": 2.8908013916015625, "step": 555000 }, { "epoch": 0.6698021031013792, "learning_rate": 7.798692865358026e-06, "loss": 2.875460205078125, "step": 555100 }, { "epoch": 0.669922766423862, "learning_rate": 7.798289029890286e-06, "loss": 2.8758810424804686, "step": 555200 }, { "epoch": 0.6700434297463446, "learning_rate": 7.797885194422548e-06, "loss": 2.8593960571289063, "step": 555300 }, { "epoch": 0.6701640930688273, "learning_rate": 7.79748135895481e-06, "loss": 2.8479013061523437, "step": 555400 }, { "epoch": 0.6702847563913099, "learning_rate": 7.79707752348707e-06, "loss": 2.8833963012695314, "step": 555500 }, { "epoch": 0.6704054197137926, "learning_rate": 7.796673688019332e-06, "loss": 2.8628692626953125, "step": 555600 }, { "epoch": 0.6705260830362754, "learning_rate": 7.796269852551594e-06, "loss": 2.881380310058594, "step": 555700 }, { "epoch": 0.670646746358758, "learning_rate": 7.795866017083856e-06, "loss": 2.838923034667969, "step": 555800 }, { "epoch": 0.6707674096812407, "learning_rate": 7.795462181616118e-06, "loss": 2.894267883300781, "step": 555900 }, { "epoch": 0.6708880730037233, "learning_rate": 7.79505834614838e-06, "loss": 2.883511962890625, "step": 556000 }, { "epoch": 0.6710087363262061, "learning_rate": 7.794654510680642e-06, "loss": 2.87624755859375, "step": 556100 }, { "epoch": 0.6711293996486888, "learning_rate": 7.794250675212903e-06, "loss": 2.878243713378906, "step": 556200 }, { "epoch": 0.6712500629711714, "learning_rate": 7.793846839745165e-06, "loss": 2.8911016845703124, "step": 556300 }, { "epoch": 0.6713707262936541, "learning_rate": 7.793443004277425e-06, "loss": 2.903614196777344, "step": 556400 }, { "epoch": 0.6714913896161367, "learning_rate": 7.793039168809687e-06, "loss": 2.8828045654296877, "step": 556500 }, { "epoch": 0.6716120529386195, "learning_rate": 7.792635333341949e-06, "loss": 2.909044189453125, "step": 556600 }, { "epoch": 0.6717327162611022, "learning_rate": 7.79223149787421e-06, "loss": 2.8577044677734373, "step": 556700 }, { "epoch": 0.6718533795835848, "learning_rate": 7.791827662406473e-06, "loss": 2.886777038574219, "step": 556800 }, { "epoch": 0.6719740429060675, "learning_rate": 7.791423826938735e-06, "loss": 2.8680679321289064, "step": 556900 }, { "epoch": 0.6720947062285502, "learning_rate": 7.791019991470997e-06, "loss": 2.887698059082031, "step": 557000 }, { "epoch": 0.6722153695510329, "learning_rate": 7.790616156003257e-06, "loss": 2.8616558837890627, "step": 557100 }, { "epoch": 0.6723360328735156, "learning_rate": 7.790212320535519e-06, "loss": 2.892606201171875, "step": 557200 }, { "epoch": 0.6724566961959982, "learning_rate": 7.789808485067781e-06, "loss": 2.870316467285156, "step": 557300 }, { "epoch": 0.672577359518481, "learning_rate": 7.789404649600041e-06, "loss": 2.85173095703125, "step": 557400 }, { "epoch": 0.6726980228409636, "learning_rate": 7.789000814132303e-06, "loss": 2.8881787109375, "step": 557500 }, { "epoch": 0.6728186861634463, "learning_rate": 7.788596978664565e-06, "loss": 2.86265625, "step": 557600 }, { "epoch": 0.672939349485929, "learning_rate": 7.788193143196827e-06, "loss": 2.87184814453125, "step": 557700 }, { "epoch": 0.6730600128084117, "learning_rate": 7.78778930772909e-06, "loss": 2.89560302734375, "step": 557800 }, { "epoch": 0.6731806761308944, "learning_rate": 7.78738547226135e-06, "loss": 2.8589797973632813, "step": 557900 }, { "epoch": 0.673301339453377, "learning_rate": 7.786981636793611e-06, "loss": 2.8650192260742187, "step": 558000 }, { "epoch": 0.6734220027758597, "learning_rate": 7.786577801325873e-06, "loss": 2.9020370483398437, "step": 558100 }, { "epoch": 0.6735426660983425, "learning_rate": 7.786173965858135e-06, "loss": 2.876556091308594, "step": 558200 }, { "epoch": 0.6736633294208251, "learning_rate": 7.785770130390396e-06, "loss": 2.868436279296875, "step": 558300 }, { "epoch": 0.6737839927433078, "learning_rate": 7.785366294922658e-06, "loss": 2.885539855957031, "step": 558400 }, { "epoch": 0.6739046560657904, "learning_rate": 7.78496245945492e-06, "loss": 2.886922607421875, "step": 558500 }, { "epoch": 0.6740253193882731, "learning_rate": 7.784558623987182e-06, "loss": 2.8880572509765625, "step": 558600 }, { "epoch": 0.6741459827107559, "learning_rate": 7.784154788519442e-06, "loss": 2.873570556640625, "step": 558700 }, { "epoch": 0.6742666460332385, "learning_rate": 7.783750953051704e-06, "loss": 2.9087109375, "step": 558800 }, { "epoch": 0.6743873093557212, "learning_rate": 7.783347117583966e-06, "loss": 2.8594561767578126, "step": 558900 }, { "epoch": 0.6745079726782038, "learning_rate": 7.782943282116228e-06, "loss": 2.8572076416015624, "step": 559000 }, { "epoch": 0.6746286360006866, "learning_rate": 7.78253944664849e-06, "loss": 2.8629010009765623, "step": 559100 }, { "epoch": 0.6747492993231693, "learning_rate": 7.782135611180752e-06, "loss": 2.88161865234375, "step": 559200 }, { "epoch": 0.6748699626456519, "learning_rate": 7.781731775713012e-06, "loss": 2.8737612915039064, "step": 559300 }, { "epoch": 0.6749906259681346, "learning_rate": 7.781327940245274e-06, "loss": 2.8823065185546874, "step": 559400 }, { "epoch": 0.6751112892906173, "learning_rate": 7.780924104777534e-06, "loss": 2.863649597167969, "step": 559500 }, { "epoch": 0.6752319526131, "learning_rate": 7.780520269309796e-06, "loss": 2.854613952636719, "step": 559600 }, { "epoch": 0.6753526159355827, "learning_rate": 7.780116433842058e-06, "loss": 2.85444091796875, "step": 559700 }, { "epoch": 0.6754732792580653, "learning_rate": 7.77971259837432e-06, "loss": 2.898060607910156, "step": 559800 }, { "epoch": 0.6755939425805481, "learning_rate": 7.779308762906582e-06, "loss": 2.9172439575195312, "step": 559900 }, { "epoch": 0.6757146059030308, "learning_rate": 7.778904927438844e-06, "loss": 2.8942379760742187, "step": 560000 }, { "epoch": 0.6758352692255134, "learning_rate": 7.778501091971106e-06, "loss": 2.8584835815429686, "step": 560100 }, { "epoch": 0.6759559325479961, "learning_rate": 7.778097256503367e-06, "loss": 2.872791748046875, "step": 560200 }, { "epoch": 0.6760765958704787, "learning_rate": 7.777693421035629e-06, "loss": 2.903233947753906, "step": 560300 }, { "epoch": 0.6761972591929615, "learning_rate": 7.77728958556789e-06, "loss": 2.845096435546875, "step": 560400 }, { "epoch": 0.6763179225154442, "learning_rate": 7.776885750100151e-06, "loss": 2.8757818603515624, "step": 560500 }, { "epoch": 0.6764385858379268, "learning_rate": 7.776481914632413e-06, "loss": 2.8799420166015626, "step": 560600 }, { "epoch": 0.6765592491604095, "learning_rate": 7.776078079164675e-06, "loss": 2.8757839965820313, "step": 560700 }, { "epoch": 0.6766799124828922, "learning_rate": 7.775674243696937e-06, "loss": 2.8814715576171874, "step": 560800 }, { "epoch": 0.6768005758053749, "learning_rate": 7.775270408229199e-06, "loss": 2.871025390625, "step": 560900 }, { "epoch": 0.6769212391278576, "learning_rate": 7.77486657276146e-06, "loss": 2.8730758666992187, "step": 561000 }, { "epoch": 0.6770419024503402, "learning_rate": 7.774462737293723e-06, "loss": 2.8659014892578125, "step": 561100 }, { "epoch": 0.677162565772823, "learning_rate": 7.774058901825983e-06, "loss": 2.870810546875, "step": 561200 }, { "epoch": 0.6772832290953056, "learning_rate": 7.773655066358245e-06, "loss": 2.8903762817382814, "step": 561300 }, { "epoch": 0.6774038924177883, "learning_rate": 7.773251230890505e-06, "loss": 2.8667633056640627, "step": 561400 }, { "epoch": 0.677524555740271, "learning_rate": 7.772847395422767e-06, "loss": 2.8895559692382813, "step": 561500 }, { "epoch": 0.6776452190627537, "learning_rate": 7.77244355995503e-06, "loss": 2.868918762207031, "step": 561600 }, { "epoch": 0.6777658823852364, "learning_rate": 7.772039724487291e-06, "loss": 2.854873046875, "step": 561700 }, { "epoch": 0.677886545707719, "learning_rate": 7.771635889019553e-06, "loss": 2.884571533203125, "step": 561800 }, { "epoch": 0.6780072090302017, "learning_rate": 7.771232053551815e-06, "loss": 2.8823175048828125, "step": 561900 }, { "epoch": 0.6781278723526845, "learning_rate": 7.770828218084076e-06, "loss": 2.876451110839844, "step": 562000 }, { "epoch": 0.6782485356751671, "learning_rate": 7.770424382616337e-06, "loss": 2.8530618286132814, "step": 562100 }, { "epoch": 0.6783691989976498, "learning_rate": 7.7700205471486e-06, "loss": 2.8595480346679687, "step": 562200 }, { "epoch": 0.6784898623201324, "learning_rate": 7.769616711680861e-06, "loss": 2.8763507080078123, "step": 562300 }, { "epoch": 0.6786105256426151, "learning_rate": 7.769212876213122e-06, "loss": 2.8865179443359374, "step": 562400 }, { "epoch": 0.6787311889650979, "learning_rate": 7.768809040745384e-06, "loss": 2.8828839111328124, "step": 562500 }, { "epoch": 0.6788518522875805, "learning_rate": 7.768405205277646e-06, "loss": 2.8752972412109377, "step": 562600 }, { "epoch": 0.6789725156100632, "learning_rate": 7.768001369809908e-06, "loss": 2.8934088134765625, "step": 562700 }, { "epoch": 0.6790931789325458, "learning_rate": 7.767597534342168e-06, "loss": 2.8764599609375, "step": 562800 }, { "epoch": 0.6792138422550286, "learning_rate": 7.76719369887443e-06, "loss": 2.8791510009765626, "step": 562900 }, { "epoch": 0.6793345055775113, "learning_rate": 7.766789863406692e-06, "loss": 2.8823703002929686, "step": 563000 }, { "epoch": 0.6794551688999939, "learning_rate": 7.766386027938954e-06, "loss": 2.8865802001953127, "step": 563100 }, { "epoch": 0.6795758322224766, "learning_rate": 7.765982192471216e-06, "loss": 2.876112060546875, "step": 563200 }, { "epoch": 0.6796964955449593, "learning_rate": 7.765578357003478e-06, "loss": 2.8465057373046876, "step": 563300 }, { "epoch": 0.679817158867442, "learning_rate": 7.765174521535738e-06, "loss": 2.87403076171875, "step": 563400 }, { "epoch": 0.6799378221899247, "learning_rate": 7.764770686068e-06, "loss": 2.8897393798828124, "step": 563500 }, { "epoch": 0.6800584855124073, "learning_rate": 7.76436685060026e-06, "loss": 2.874971618652344, "step": 563600 }, { "epoch": 0.6801791488348901, "learning_rate": 7.763963015132522e-06, "loss": 2.8601336669921875, "step": 563700 }, { "epoch": 0.6802998121573727, "learning_rate": 7.763559179664784e-06, "loss": 2.8728759765625, "step": 563800 }, { "epoch": 0.6804204754798554, "learning_rate": 7.763155344197046e-06, "loss": 2.869473876953125, "step": 563900 }, { "epoch": 0.6805411388023381, "learning_rate": 7.762751508729308e-06, "loss": 2.876650390625, "step": 564000 }, { "epoch": 0.6806618021248207, "learning_rate": 7.76234767326157e-06, "loss": 2.8839767456054686, "step": 564100 }, { "epoch": 0.6807824654473035, "learning_rate": 7.761943837793832e-06, "loss": 2.8563507080078123, "step": 564200 }, { "epoch": 0.6809031287697861, "learning_rate": 7.761540002326093e-06, "loss": 2.9017193603515623, "step": 564300 }, { "epoch": 0.6810237920922688, "learning_rate": 7.761136166858355e-06, "loss": 2.8523788452148438, "step": 564400 }, { "epoch": 0.6811444554147515, "learning_rate": 7.760732331390617e-06, "loss": 2.8543975830078123, "step": 564500 }, { "epoch": 0.6812651187372342, "learning_rate": 7.760328495922877e-06, "loss": 2.901194763183594, "step": 564600 }, { "epoch": 0.6813857820597169, "learning_rate": 7.759924660455139e-06, "loss": 2.888547058105469, "step": 564700 }, { "epoch": 0.6815064453821995, "learning_rate": 7.759520824987401e-06, "loss": 2.8899765014648438, "step": 564800 }, { "epoch": 0.6816271087046822, "learning_rate": 7.759116989519663e-06, "loss": 2.892289733886719, "step": 564900 }, { "epoch": 0.681747772027165, "learning_rate": 7.758713154051925e-06, "loss": 2.869903869628906, "step": 565000 }, { "epoch": 0.6818684353496476, "learning_rate": 7.758309318584187e-06, "loss": 2.8770574951171874, "step": 565100 }, { "epoch": 0.6819890986721303, "learning_rate": 7.757905483116447e-06, "loss": 2.9096868896484374, "step": 565200 }, { "epoch": 0.682109761994613, "learning_rate": 7.757501647648709e-06, "loss": 2.8768850708007814, "step": 565300 }, { "epoch": 0.6822304253170957, "learning_rate": 7.757097812180971e-06, "loss": 2.8804562377929686, "step": 565400 }, { "epoch": 0.6823510886395784, "learning_rate": 7.756693976713231e-06, "loss": 2.8872064208984374, "step": 565500 }, { "epoch": 0.682471751962061, "learning_rate": 7.756290141245493e-06, "loss": 2.8703192138671874, "step": 565600 }, { "epoch": 0.6825924152845437, "learning_rate": 7.755886305777755e-06, "loss": 2.847398376464844, "step": 565700 }, { "epoch": 0.6827130786070265, "learning_rate": 7.755482470310017e-06, "loss": 2.879388427734375, "step": 565800 }, { "epoch": 0.6828337419295091, "learning_rate": 7.75507863484228e-06, "loss": 2.9059454345703126, "step": 565900 }, { "epoch": 0.6829544052519918, "learning_rate": 7.75467479937454e-06, "loss": 2.8791693115234374, "step": 566000 }, { "epoch": 0.6830750685744744, "learning_rate": 7.754270963906802e-06, "loss": 2.8903179931640626, "step": 566100 }, { "epoch": 0.6831957318969571, "learning_rate": 7.753867128439064e-06, "loss": 2.8886767578125, "step": 566200 }, { "epoch": 0.6833163952194399, "learning_rate": 7.753463292971326e-06, "loss": 2.874239501953125, "step": 566300 }, { "epoch": 0.6834370585419225, "learning_rate": 7.753059457503587e-06, "loss": 2.88536376953125, "step": 566400 }, { "epoch": 0.6835577218644052, "learning_rate": 7.752655622035848e-06, "loss": 2.879300537109375, "step": 566500 }, { "epoch": 0.6836783851868878, "learning_rate": 7.75225178656811e-06, "loss": 2.8782589721679686, "step": 566600 }, { "epoch": 0.6837990485093706, "learning_rate": 7.751847951100372e-06, "loss": 2.867265625, "step": 566700 }, { "epoch": 0.6839197118318533, "learning_rate": 7.751444115632634e-06, "loss": 2.8794720458984373, "step": 566800 }, { "epoch": 0.6840403751543359, "learning_rate": 7.751040280164894e-06, "loss": 2.8571954345703126, "step": 566900 }, { "epoch": 0.6841610384768186, "learning_rate": 7.750636444697156e-06, "loss": 2.857785949707031, "step": 567000 }, { "epoch": 0.6842817017993013, "learning_rate": 7.750232609229418e-06, "loss": 2.8535577392578126, "step": 567100 }, { "epoch": 0.684402365121784, "learning_rate": 7.74982877376168e-06, "loss": 2.8628280639648436, "step": 567200 }, { "epoch": 0.6845230284442667, "learning_rate": 7.749424938293942e-06, "loss": 2.8665975952148437, "step": 567300 }, { "epoch": 0.6846436917667493, "learning_rate": 7.749021102826202e-06, "loss": 2.8678985595703126, "step": 567400 }, { "epoch": 0.6847643550892321, "learning_rate": 7.748617267358464e-06, "loss": 2.882415771484375, "step": 567500 }, { "epoch": 0.6848850184117147, "learning_rate": 7.748213431890726e-06, "loss": 2.8546875, "step": 567600 }, { "epoch": 0.6850056817341974, "learning_rate": 7.747809596422986e-06, "loss": 2.8489559936523436, "step": 567700 }, { "epoch": 0.6851263450566801, "learning_rate": 7.747405760955248e-06, "loss": 2.883067321777344, "step": 567800 }, { "epoch": 0.6852470083791627, "learning_rate": 7.74700192548751e-06, "loss": 2.880250244140625, "step": 567900 }, { "epoch": 0.6853676717016455, "learning_rate": 7.746598090019772e-06, "loss": 2.9046136474609376, "step": 568000 }, { "epoch": 0.6854883350241281, "learning_rate": 7.746194254552034e-06, "loss": 2.8551254272460938, "step": 568100 }, { "epoch": 0.6856089983466108, "learning_rate": 7.745790419084296e-06, "loss": 2.8562921142578124, "step": 568200 }, { "epoch": 0.6857296616690935, "learning_rate": 7.745386583616558e-06, "loss": 2.8735302734375, "step": 568300 }, { "epoch": 0.6858503249915762, "learning_rate": 7.744982748148819e-06, "loss": 2.8759234619140623, "step": 568400 }, { "epoch": 0.6859709883140589, "learning_rate": 7.74457891268108e-06, "loss": 2.876201477050781, "step": 568500 }, { "epoch": 0.6860916516365415, "learning_rate": 7.744175077213341e-06, "loss": 2.869367980957031, "step": 568600 }, { "epoch": 0.6862123149590242, "learning_rate": 7.743771241745603e-06, "loss": 2.8561962890625, "step": 568700 }, { "epoch": 0.686332978281507, "learning_rate": 7.743367406277865e-06, "loss": 2.859227294921875, "step": 568800 }, { "epoch": 0.6864536416039896, "learning_rate": 7.742963570810127e-06, "loss": 2.875888671875, "step": 568900 }, { "epoch": 0.6865743049264723, "learning_rate": 7.742559735342389e-06, "loss": 2.8876577758789064, "step": 569000 }, { "epoch": 0.6866949682489549, "learning_rate": 7.742155899874651e-06, "loss": 2.861221923828125, "step": 569100 }, { "epoch": 0.6868156315714377, "learning_rate": 7.741752064406913e-06, "loss": 2.8677130126953125, "step": 569200 }, { "epoch": 0.6869362948939204, "learning_rate": 7.741348228939173e-06, "loss": 2.8819265747070313, "step": 569300 }, { "epoch": 0.687056958216403, "learning_rate": 7.740944393471435e-06, "loss": 2.8750811767578126, "step": 569400 }, { "epoch": 0.6871776215388857, "learning_rate": 7.740540558003697e-06, "loss": 2.8770632934570313, "step": 569500 }, { "epoch": 0.6872982848613683, "learning_rate": 7.740136722535957e-06, "loss": 2.865481262207031, "step": 569600 }, { "epoch": 0.6874189481838511, "learning_rate": 7.73973288706822e-06, "loss": 2.8378131103515627, "step": 569700 }, { "epoch": 0.6875396115063338, "learning_rate": 7.739329051600481e-06, "loss": 2.852716979980469, "step": 569800 }, { "epoch": 0.6876602748288164, "learning_rate": 7.738925216132743e-06, "loss": 2.863541259765625, "step": 569900 }, { "epoch": 0.6877809381512991, "learning_rate": 7.738521380665005e-06, "loss": 2.8488308715820314, "step": 570000 }, { "epoch": 0.6879016014737819, "learning_rate": 7.738117545197266e-06, "loss": 2.882537841796875, "step": 570100 }, { "epoch": 0.6880222647962645, "learning_rate": 7.737713709729528e-06, "loss": 2.847112731933594, "step": 570200 }, { "epoch": 0.6881429281187472, "learning_rate": 7.73730987426179e-06, "loss": 2.876348571777344, "step": 570300 }, { "epoch": 0.6882635914412298, "learning_rate": 7.736906038794052e-06, "loss": 2.889609069824219, "step": 570400 }, { "epoch": 0.6883842547637126, "learning_rate": 7.736502203326312e-06, "loss": 2.8449444580078125, "step": 570500 }, { "epoch": 0.6885049180861953, "learning_rate": 7.736098367858574e-06, "loss": 2.8665936279296873, "step": 570600 }, { "epoch": 0.6886255814086779, "learning_rate": 7.735694532390836e-06, "loss": 2.890267333984375, "step": 570700 }, { "epoch": 0.6887462447311606, "learning_rate": 7.735290696923098e-06, "loss": 2.8554742431640623, "step": 570800 }, { "epoch": 0.6888669080536433, "learning_rate": 7.734886861455358e-06, "loss": 2.8798077392578123, "step": 570900 }, { "epoch": 0.688987571376126, "learning_rate": 7.73448302598762e-06, "loss": 2.8675967407226564, "step": 571000 }, { "epoch": 0.6891082346986087, "learning_rate": 7.734079190519882e-06, "loss": 2.8301461791992186, "step": 571100 }, { "epoch": 0.6892288980210913, "learning_rate": 7.733675355052144e-06, "loss": 2.84908935546875, "step": 571200 }, { "epoch": 0.6893495613435741, "learning_rate": 7.733271519584406e-06, "loss": 2.8650912475585937, "step": 571300 }, { "epoch": 0.6894702246660567, "learning_rate": 7.732867684116668e-06, "loss": 2.8545663452148435, "step": 571400 }, { "epoch": 0.6895908879885394, "learning_rate": 7.732463848648928e-06, "loss": 2.8690859985351564, "step": 571500 }, { "epoch": 0.6897115513110221, "learning_rate": 7.73206001318119e-06, "loss": 2.8635479736328127, "step": 571600 }, { "epoch": 0.6898322146335047, "learning_rate": 7.731656177713452e-06, "loss": 2.852455749511719, "step": 571700 }, { "epoch": 0.6899528779559875, "learning_rate": 7.731252342245713e-06, "loss": 2.8488589477539064, "step": 571800 }, { "epoch": 0.6900735412784701, "learning_rate": 7.730848506777975e-06, "loss": 2.8865380859375, "step": 571900 }, { "epoch": 0.6901942046009528, "learning_rate": 7.730444671310236e-06, "loss": 2.874664611816406, "step": 572000 }, { "epoch": 0.6903148679234355, "learning_rate": 7.730040835842498e-06, "loss": 2.8504257202148438, "step": 572100 }, { "epoch": 0.6904355312459182, "learning_rate": 7.72963700037476e-06, "loss": 2.8802975463867186, "step": 572200 }, { "epoch": 0.6905561945684009, "learning_rate": 7.729233164907022e-06, "loss": 2.8815579223632812, "step": 572300 }, { "epoch": 0.6906768578908835, "learning_rate": 7.728829329439283e-06, "loss": 2.8994290161132814, "step": 572400 }, { "epoch": 0.6907975212133662, "learning_rate": 7.728425493971545e-06, "loss": 2.857418212890625, "step": 572500 }, { "epoch": 0.690918184535849, "learning_rate": 7.728021658503807e-06, "loss": 2.8725555419921873, "step": 572600 }, { "epoch": 0.6910388478583316, "learning_rate": 7.727617823036067e-06, "loss": 2.867392578125, "step": 572700 }, { "epoch": 0.6911595111808143, "learning_rate": 7.727213987568329e-06, "loss": 2.870016784667969, "step": 572800 }, { "epoch": 0.6912801745032969, "learning_rate": 7.726810152100591e-06, "loss": 2.853316345214844, "step": 572900 }, { "epoch": 0.6914008378257797, "learning_rate": 7.726406316632853e-06, "loss": 2.8782925415039062, "step": 573000 }, { "epoch": 0.6915215011482624, "learning_rate": 7.726002481165115e-06, "loss": 2.8332757568359375, "step": 573100 }, { "epoch": 0.691642164470745, "learning_rate": 7.725598645697377e-06, "loss": 2.8534942626953126, "step": 573200 }, { "epoch": 0.6917628277932277, "learning_rate": 7.725194810229639e-06, "loss": 2.8601724243164064, "step": 573300 }, { "epoch": 0.6918834911157103, "learning_rate": 7.7247909747619e-06, "loss": 2.872872009277344, "step": 573400 }, { "epoch": 0.6920041544381931, "learning_rate": 7.724387139294161e-06, "loss": 2.8716860961914064, "step": 573500 }, { "epoch": 0.6921248177606758, "learning_rate": 7.723983303826421e-06, "loss": 2.870142517089844, "step": 573600 }, { "epoch": 0.6922454810831584, "learning_rate": 7.723579468358683e-06, "loss": 2.861686096191406, "step": 573700 }, { "epoch": 0.6923661444056411, "learning_rate": 7.723175632890945e-06, "loss": 2.89477294921875, "step": 573800 }, { "epoch": 0.6924868077281238, "learning_rate": 7.722771797423207e-06, "loss": 2.858819580078125, "step": 573900 }, { "epoch": 0.6926074710506065, "learning_rate": 7.72236796195547e-06, "loss": 2.8641656494140624, "step": 574000 }, { "epoch": 0.6927281343730892, "learning_rate": 7.721964126487731e-06, "loss": 2.8659429931640625, "step": 574100 }, { "epoch": 0.6928487976955718, "learning_rate": 7.721560291019992e-06, "loss": 2.86802734375, "step": 574200 }, { "epoch": 0.6929694610180546, "learning_rate": 7.721156455552254e-06, "loss": 2.8383413696289064, "step": 574300 }, { "epoch": 0.6930901243405372, "learning_rate": 7.720752620084516e-06, "loss": 2.8667523193359377, "step": 574400 }, { "epoch": 0.6932107876630199, "learning_rate": 7.720348784616778e-06, "loss": 2.8475680541992188, "step": 574500 }, { "epoch": 0.6933314509855026, "learning_rate": 7.719944949149038e-06, "loss": 2.851126708984375, "step": 574600 }, { "epoch": 0.6934521143079853, "learning_rate": 7.7195411136813e-06, "loss": 2.851023864746094, "step": 574700 }, { "epoch": 0.693572777630468, "learning_rate": 7.719137278213562e-06, "loss": 2.8499740600585937, "step": 574800 }, { "epoch": 0.6936934409529506, "learning_rate": 7.718733442745824e-06, "loss": 2.8620339965820314, "step": 574900 }, { "epoch": 0.6938141042754333, "learning_rate": 7.718329607278084e-06, "loss": 2.8746914672851562, "step": 575000 }, { "epoch": 0.6939347675979161, "learning_rate": 7.717925771810346e-06, "loss": 2.8576153564453124, "step": 575100 }, { "epoch": 0.6940554309203987, "learning_rate": 7.717521936342608e-06, "loss": 2.84666748046875, "step": 575200 }, { "epoch": 0.6941760942428814, "learning_rate": 7.71711810087487e-06, "loss": 2.8798028564453126, "step": 575300 }, { "epoch": 0.6942967575653641, "learning_rate": 7.716714265407132e-06, "loss": 2.8682757568359376, "step": 575400 }, { "epoch": 0.6944174208878467, "learning_rate": 7.716310429939394e-06, "loss": 2.8715280151367186, "step": 575500 }, { "epoch": 0.6945380842103295, "learning_rate": 7.715906594471654e-06, "loss": 2.877300109863281, "step": 575600 }, { "epoch": 0.6946587475328121, "learning_rate": 7.715502759003916e-06, "loss": 2.8766259765625, "step": 575700 }, { "epoch": 0.6947794108552948, "learning_rate": 7.715098923536177e-06, "loss": 2.8907876586914063, "step": 575800 }, { "epoch": 0.6949000741777775, "learning_rate": 7.714695088068439e-06, "loss": 2.8691976928710936, "step": 575900 }, { "epoch": 0.6950207375002602, "learning_rate": 7.7142912526007e-06, "loss": 2.859876708984375, "step": 576000 }, { "epoch": 0.6951414008227429, "learning_rate": 7.713887417132963e-06, "loss": 2.8728204345703126, "step": 576100 }, { "epoch": 0.6952620641452255, "learning_rate": 7.713483581665224e-06, "loss": 2.8735012817382812, "step": 576200 }, { "epoch": 0.6953827274677082, "learning_rate": 7.713079746197486e-06, "loss": 2.8696408081054687, "step": 576300 }, { "epoch": 0.695503390790191, "learning_rate": 7.712675910729748e-06, "loss": 2.8614126586914064, "step": 576400 }, { "epoch": 0.6956240541126736, "learning_rate": 7.712272075262009e-06, "loss": 2.863514709472656, "step": 576500 }, { "epoch": 0.6957447174351563, "learning_rate": 7.71186823979427e-06, "loss": 2.875749206542969, "step": 576600 }, { "epoch": 0.6958653807576389, "learning_rate": 7.711464404326533e-06, "loss": 2.869881286621094, "step": 576700 }, { "epoch": 0.6959860440801217, "learning_rate": 7.711060568858793e-06, "loss": 2.877679443359375, "step": 576800 }, { "epoch": 0.6961067074026044, "learning_rate": 7.710656733391055e-06, "loss": 2.8645761108398435, "step": 576900 }, { "epoch": 0.696227370725087, "learning_rate": 7.710252897923317e-06, "loss": 2.8620050048828123, "step": 577000 }, { "epoch": 0.6963480340475697, "learning_rate": 7.709849062455579e-06, "loss": 2.8769570922851564, "step": 577100 }, { "epoch": 0.6964686973700523, "learning_rate": 7.709445226987841e-06, "loss": 2.856103515625, "step": 577200 }, { "epoch": 0.6965893606925351, "learning_rate": 7.709041391520103e-06, "loss": 2.851171875, "step": 577300 }, { "epoch": 0.6967100240150178, "learning_rate": 7.708637556052365e-06, "loss": 2.864934387207031, "step": 577400 }, { "epoch": 0.6968306873375004, "learning_rate": 7.708233720584625e-06, "loss": 2.8648745727539064, "step": 577500 }, { "epoch": 0.6969513506599831, "learning_rate": 7.707829885116887e-06, "loss": 2.8809881591796875, "step": 577600 }, { "epoch": 0.6970720139824658, "learning_rate": 7.707426049649147e-06, "loss": 2.8629269409179687, "step": 577700 }, { "epoch": 0.6971926773049485, "learning_rate": 7.70702221418141e-06, "loss": 2.8471365356445313, "step": 577800 }, { "epoch": 0.6973133406274312, "learning_rate": 7.706618378713671e-06, "loss": 2.8456512451171876, "step": 577900 }, { "epoch": 0.6974340039499138, "learning_rate": 7.706214543245933e-06, "loss": 2.8593902587890625, "step": 578000 }, { "epoch": 0.6975546672723966, "learning_rate": 7.705810707778195e-06, "loss": 2.888683166503906, "step": 578100 }, { "epoch": 0.6976753305948792, "learning_rate": 7.705406872310457e-06, "loss": 2.86565185546875, "step": 578200 }, { "epoch": 0.6977959939173619, "learning_rate": 7.705003036842718e-06, "loss": 2.8601412963867188, "step": 578300 }, { "epoch": 0.6979166572398446, "learning_rate": 7.70459920137498e-06, "loss": 2.865805969238281, "step": 578400 }, { "epoch": 0.6980373205623273, "learning_rate": 7.704195365907242e-06, "loss": 2.867271728515625, "step": 578500 }, { "epoch": 0.69815798388481, "learning_rate": 7.703791530439504e-06, "loss": 2.8775863647460938, "step": 578600 }, { "epoch": 0.6982786472072926, "learning_rate": 7.703387694971764e-06, "loss": 2.8373922729492187, "step": 578700 }, { "epoch": 0.6983993105297753, "learning_rate": 7.702983859504026e-06, "loss": 2.8459716796875, "step": 578800 }, { "epoch": 0.6985199738522581, "learning_rate": 7.702580024036288e-06, "loss": 2.8858401489257814, "step": 578900 }, { "epoch": 0.6986406371747407, "learning_rate": 7.70217618856855e-06, "loss": 2.8735421752929686, "step": 579000 }, { "epoch": 0.6987613004972234, "learning_rate": 7.70177235310081e-06, "loss": 2.8599142456054687, "step": 579100 }, { "epoch": 0.698881963819706, "learning_rate": 7.701368517633072e-06, "loss": 2.8436068725585937, "step": 579200 }, { "epoch": 0.6990026271421887, "learning_rate": 7.700964682165334e-06, "loss": 2.8749465942382812, "step": 579300 }, { "epoch": 0.6991232904646715, "learning_rate": 7.700560846697596e-06, "loss": 2.8473880004882814, "step": 579400 }, { "epoch": 0.6992439537871541, "learning_rate": 7.700157011229858e-06, "loss": 2.8750433349609374, "step": 579500 }, { "epoch": 0.6993646171096368, "learning_rate": 7.699753175762118e-06, "loss": 2.8686251831054688, "step": 579600 }, { "epoch": 0.6994852804321194, "learning_rate": 7.69934934029438e-06, "loss": 2.8483035278320314, "step": 579700 }, { "epoch": 0.6996059437546022, "learning_rate": 7.698945504826642e-06, "loss": 2.865941162109375, "step": 579800 }, { "epoch": 0.6997266070770849, "learning_rate": 7.698541669358903e-06, "loss": 2.8775344848632813, "step": 579900 }, { "epoch": 0.6998472703995675, "learning_rate": 7.698137833891165e-06, "loss": 2.8662261962890625, "step": 580000 }, { "epoch": 0.6999679337220502, "learning_rate": 7.697733998423427e-06, "loss": 2.8305096435546875, "step": 580100 }, { "epoch": 0.7000885970445329, "learning_rate": 7.697330162955689e-06, "loss": 2.846646423339844, "step": 580200 }, { "epoch": 0.7002092603670156, "learning_rate": 7.69692632748795e-06, "loss": 2.8427920532226563, "step": 580300 }, { "epoch": 0.7003299236894983, "learning_rate": 7.696522492020213e-06, "loss": 2.8501577758789063, "step": 580400 }, { "epoch": 0.7004505870119809, "learning_rate": 7.696118656552474e-06, "loss": 2.856065368652344, "step": 580500 }, { "epoch": 0.7005712503344637, "learning_rate": 7.695714821084735e-06, "loss": 2.86554443359375, "step": 580600 }, { "epoch": 0.7006919136569464, "learning_rate": 7.695310985616997e-06, "loss": 2.861060791015625, "step": 580700 }, { "epoch": 0.700812576979429, "learning_rate": 7.694907150149257e-06, "loss": 2.8796966552734373, "step": 580800 }, { "epoch": 0.7009332403019117, "learning_rate": 7.694503314681519e-06, "loss": 2.846746826171875, "step": 580900 }, { "epoch": 0.7010539036243943, "learning_rate": 7.694099479213781e-06, "loss": 2.8797747802734377, "step": 581000 }, { "epoch": 0.7011745669468771, "learning_rate": 7.693695643746043e-06, "loss": 2.8457540893554687, "step": 581100 }, { "epoch": 0.7012952302693598, "learning_rate": 7.693291808278305e-06, "loss": 2.8617990112304685, "step": 581200 }, { "epoch": 0.7014158935918424, "learning_rate": 7.692887972810567e-06, "loss": 2.8425949096679686, "step": 581300 }, { "epoch": 0.7015365569143251, "learning_rate": 7.692484137342829e-06, "loss": 2.871072082519531, "step": 581400 }, { "epoch": 0.7016572202368078, "learning_rate": 7.69208030187509e-06, "loss": 2.8760720825195314, "step": 581500 }, { "epoch": 0.7017778835592905, "learning_rate": 7.691676466407351e-06, "loss": 2.8598867797851564, "step": 581600 }, { "epoch": 0.7018985468817732, "learning_rate": 7.691272630939613e-06, "loss": 2.848721923828125, "step": 581700 }, { "epoch": 0.7020192102042558, "learning_rate": 7.690868795471873e-06, "loss": 2.879400329589844, "step": 581800 }, { "epoch": 0.7021398735267386, "learning_rate": 7.690464960004135e-06, "loss": 2.8481890869140627, "step": 581900 }, { "epoch": 0.7022605368492212, "learning_rate": 7.690061124536397e-06, "loss": 2.8708651733398436, "step": 582000 }, { "epoch": 0.7023812001717039, "learning_rate": 7.68965728906866e-06, "loss": 2.8634072875976564, "step": 582100 }, { "epoch": 0.7025018634941866, "learning_rate": 7.689253453600921e-06, "loss": 2.8674072265625, "step": 582200 }, { "epoch": 0.7026225268166693, "learning_rate": 7.688849618133183e-06, "loss": 2.850791015625, "step": 582300 }, { "epoch": 0.702743190139152, "learning_rate": 7.688445782665444e-06, "loss": 2.8389996337890624, "step": 582400 }, { "epoch": 0.7028638534616346, "learning_rate": 7.688041947197706e-06, "loss": 2.835662536621094, "step": 582500 }, { "epoch": 0.7029845167841173, "learning_rate": 7.687638111729968e-06, "loss": 2.861239013671875, "step": 582600 }, { "epoch": 0.7031051801066001, "learning_rate": 7.687234276262228e-06, "loss": 2.8550344848632814, "step": 582700 }, { "epoch": 0.7032258434290827, "learning_rate": 7.68683044079449e-06, "loss": 2.8749453735351564, "step": 582800 }, { "epoch": 0.7033465067515654, "learning_rate": 7.686426605326752e-06, "loss": 2.840761413574219, "step": 582900 }, { "epoch": 0.703467170074048, "learning_rate": 7.686022769859014e-06, "loss": 2.824681396484375, "step": 583000 }, { "epoch": 0.7035878333965307, "learning_rate": 7.685618934391276e-06, "loss": 2.8570266723632813, "step": 583100 }, { "epoch": 0.7037084967190135, "learning_rate": 7.685215098923536e-06, "loss": 2.8533200073242186, "step": 583200 }, { "epoch": 0.7038291600414961, "learning_rate": 7.684811263455798e-06, "loss": 2.8620306396484376, "step": 583300 }, { "epoch": 0.7039498233639788, "learning_rate": 7.68440742798806e-06, "loss": 2.8539398193359373, "step": 583400 }, { "epoch": 0.7040704866864614, "learning_rate": 7.684003592520322e-06, "loss": 2.8594931030273436, "step": 583500 }, { "epoch": 0.7041911500089442, "learning_rate": 7.683599757052584e-06, "loss": 2.8342193603515624, "step": 583600 }, { "epoch": 0.7043118133314269, "learning_rate": 7.683195921584844e-06, "loss": 2.847510986328125, "step": 583700 }, { "epoch": 0.7044324766539095, "learning_rate": 7.682792086117106e-06, "loss": 2.8276678466796876, "step": 583800 }, { "epoch": 0.7045531399763922, "learning_rate": 7.682388250649368e-06, "loss": 2.819851989746094, "step": 583900 }, { "epoch": 0.7046738032988749, "learning_rate": 7.681984415181629e-06, "loss": 2.8557998657226564, "step": 584000 }, { "epoch": 0.7047944666213576, "learning_rate": 7.68158057971389e-06, "loss": 2.8221475219726564, "step": 584100 }, { "epoch": 0.7049151299438403, "learning_rate": 7.681176744246153e-06, "loss": 2.8478509521484376, "step": 584200 }, { "epoch": 0.7050357932663229, "learning_rate": 7.680772908778415e-06, "loss": 2.8505010986328125, "step": 584300 }, { "epoch": 0.7051564565888057, "learning_rate": 7.680369073310677e-06, "loss": 2.867825927734375, "step": 584400 }, { "epoch": 0.7052771199112883, "learning_rate": 7.679965237842939e-06, "loss": 2.852281188964844, "step": 584500 }, { "epoch": 0.705397783233771, "learning_rate": 7.679561402375199e-06, "loss": 2.8433111572265624, "step": 584600 }, { "epoch": 0.7055184465562537, "learning_rate": 7.67915756690746e-06, "loss": 2.8510702514648436, "step": 584700 }, { "epoch": 0.7056391098787363, "learning_rate": 7.678753731439723e-06, "loss": 2.847156677246094, "step": 584800 }, { "epoch": 0.7057597732012191, "learning_rate": 7.678349895971983e-06, "loss": 2.862283020019531, "step": 584900 }, { "epoch": 0.7058804365237017, "learning_rate": 7.677946060504245e-06, "loss": 2.870137023925781, "step": 585000 }, { "epoch": 0.7060010998461844, "learning_rate": 7.677542225036507e-06, "loss": 2.858834228515625, "step": 585100 }, { "epoch": 0.7061217631686671, "learning_rate": 7.677138389568769e-06, "loss": 2.8479238891601564, "step": 585200 }, { "epoch": 0.7062424264911498, "learning_rate": 7.676734554101031e-06, "loss": 2.8547308349609377, "step": 585300 }, { "epoch": 0.7063630898136325, "learning_rate": 7.676330718633293e-06, "loss": 2.833609924316406, "step": 585400 }, { "epoch": 0.7064837531361151, "learning_rate": 7.675926883165555e-06, "loss": 2.8622250366210937, "step": 585500 }, { "epoch": 0.7066044164585978, "learning_rate": 7.675523047697815e-06, "loss": 2.842254638671875, "step": 585600 }, { "epoch": 0.7067250797810806, "learning_rate": 7.675119212230077e-06, "loss": 2.854966125488281, "step": 585700 }, { "epoch": 0.7068457431035632, "learning_rate": 7.674715376762338e-06, "loss": 2.8604837036132813, "step": 585800 }, { "epoch": 0.7069664064260459, "learning_rate": 7.6743115412946e-06, "loss": 2.8233154296875, "step": 585900 }, { "epoch": 0.7070870697485286, "learning_rate": 7.673907705826862e-06, "loss": 2.8461572265625, "step": 586000 }, { "epoch": 0.7072077330710113, "learning_rate": 7.673503870359123e-06, "loss": 2.851761779785156, "step": 586100 }, { "epoch": 0.707328396393494, "learning_rate": 7.673100034891385e-06, "loss": 2.8616061401367188, "step": 586200 }, { "epoch": 0.7074490597159766, "learning_rate": 7.672696199423647e-06, "loss": 2.852017517089844, "step": 586300 }, { "epoch": 0.7075697230384593, "learning_rate": 7.672292363955908e-06, "loss": 2.8566278076171874, "step": 586400 }, { "epoch": 0.7076903863609421, "learning_rate": 7.67188852848817e-06, "loss": 2.8473611450195313, "step": 586500 }, { "epoch": 0.7078110496834247, "learning_rate": 7.671484693020432e-06, "loss": 2.87174072265625, "step": 586600 }, { "epoch": 0.7079317130059074, "learning_rate": 7.671080857552694e-06, "loss": 2.8517861938476563, "step": 586700 }, { "epoch": 0.70805237632839, "learning_rate": 7.670677022084954e-06, "loss": 2.862684631347656, "step": 586800 }, { "epoch": 0.7081730396508727, "learning_rate": 7.670273186617216e-06, "loss": 2.8592300415039062, "step": 586900 }, { "epoch": 0.7082937029733555, "learning_rate": 7.669869351149478e-06, "loss": 2.8380801391601564, "step": 587000 }, { "epoch": 0.7084143662958381, "learning_rate": 7.66946551568174e-06, "loss": 2.856009826660156, "step": 587100 }, { "epoch": 0.7085350296183208, "learning_rate": 7.669061680214002e-06, "loss": 2.854145202636719, "step": 587200 }, { "epoch": 0.7086556929408034, "learning_rate": 7.668657844746262e-06, "loss": 2.8359329223632814, "step": 587300 }, { "epoch": 0.7087763562632862, "learning_rate": 7.668254009278524e-06, "loss": 2.8700601196289064, "step": 587400 }, { "epoch": 0.7088970195857689, "learning_rate": 7.667850173810786e-06, "loss": 2.8557757568359374, "step": 587500 }, { "epoch": 0.7090176829082515, "learning_rate": 7.667446338343048e-06, "loss": 2.8446340942382813, "step": 587600 }, { "epoch": 0.7091383462307342, "learning_rate": 7.667042502875308e-06, "loss": 2.8498724365234374, "step": 587700 }, { "epoch": 0.7092590095532169, "learning_rate": 7.66663866740757e-06, "loss": 2.839444274902344, "step": 587800 }, { "epoch": 0.7093796728756996, "learning_rate": 7.666234831939832e-06, "loss": 2.8605221557617186, "step": 587900 }, { "epoch": 0.7095003361981823, "learning_rate": 7.665830996472094e-06, "loss": 2.8712619018554686, "step": 588000 }, { "epoch": 0.7096209995206649, "learning_rate": 7.665427161004355e-06, "loss": 2.851839294433594, "step": 588100 }, { "epoch": 0.7097416628431477, "learning_rate": 7.665023325536617e-06, "loss": 2.8605792236328127, "step": 588200 }, { "epoch": 0.7098623261656303, "learning_rate": 7.664619490068879e-06, "loss": 2.8506231689453125, "step": 588300 }, { "epoch": 0.709982989488113, "learning_rate": 7.66421565460114e-06, "loss": 2.8274185180664064, "step": 588400 }, { "epoch": 0.7101036528105957, "learning_rate": 7.663811819133403e-06, "loss": 2.880670166015625, "step": 588500 }, { "epoch": 0.7102243161330783, "learning_rate": 7.663407983665665e-06, "loss": 2.8383724975585936, "step": 588600 }, { "epoch": 0.7103449794555611, "learning_rate": 7.663004148197925e-06, "loss": 2.846884765625, "step": 588700 }, { "epoch": 0.7104656427780437, "learning_rate": 7.662600312730187e-06, "loss": 2.841048278808594, "step": 588800 }, { "epoch": 0.7105863061005264, "learning_rate": 7.662196477262447e-06, "loss": 2.832183532714844, "step": 588900 }, { "epoch": 0.7107069694230091, "learning_rate": 7.661792641794709e-06, "loss": 2.849126892089844, "step": 589000 }, { "epoch": 0.7108276327454918, "learning_rate": 7.661388806326971e-06, "loss": 2.865208740234375, "step": 589100 }, { "epoch": 0.7109482960679745, "learning_rate": 7.660984970859233e-06, "loss": 2.8427505493164062, "step": 589200 }, { "epoch": 0.7110689593904571, "learning_rate": 7.660581135391495e-06, "loss": 2.8471249389648436, "step": 589300 }, { "epoch": 0.7111896227129398, "learning_rate": 7.660177299923757e-06, "loss": 2.8581051635742187, "step": 589400 }, { "epoch": 0.7113102860354226, "learning_rate": 7.659773464456019e-06, "loss": 2.850183410644531, "step": 589500 }, { "epoch": 0.7114309493579052, "learning_rate": 7.659369628988281e-06, "loss": 2.8320297241210937, "step": 589600 }, { "epoch": 0.7115516126803879, "learning_rate": 7.658965793520541e-06, "loss": 2.8095318603515627, "step": 589700 }, { "epoch": 0.7116722760028705, "learning_rate": 7.658561958052803e-06, "loss": 2.8488092041015625, "step": 589800 }, { "epoch": 0.7117929393253533, "learning_rate": 7.658158122585064e-06, "loss": 2.860452880859375, "step": 589900 }, { "epoch": 0.711913602647836, "learning_rate": 7.657754287117326e-06, "loss": 2.88807373046875, "step": 590000 }, { "epoch": 0.7120342659703186, "learning_rate": 7.657350451649588e-06, "loss": 2.8698056030273436, "step": 590100 }, { "epoch": 0.7121549292928013, "learning_rate": 7.65694661618185e-06, "loss": 2.84966796875, "step": 590200 }, { "epoch": 0.712275592615284, "learning_rate": 7.656542780714112e-06, "loss": 2.8345077514648436, "step": 590300 }, { "epoch": 0.7123962559377667, "learning_rate": 7.656138945246373e-06, "loss": 2.8443502807617187, "step": 590400 }, { "epoch": 0.7125169192602494, "learning_rate": 7.655735109778634e-06, "loss": 2.835208740234375, "step": 590500 }, { "epoch": 0.712637582582732, "learning_rate": 7.655331274310896e-06, "loss": 2.8191632080078124, "step": 590600 }, { "epoch": 0.7127582459052147, "learning_rate": 7.654927438843158e-06, "loss": 2.8341183471679687, "step": 590700 }, { "epoch": 0.7128789092276974, "learning_rate": 7.65452360337542e-06, "loss": 2.831346130371094, "step": 590800 }, { "epoch": 0.7129995725501801, "learning_rate": 7.65411976790768e-06, "loss": 2.8378945922851564, "step": 590900 }, { "epoch": 0.7131202358726628, "learning_rate": 7.653715932439942e-06, "loss": 2.8293966674804687, "step": 591000 }, { "epoch": 0.7132408991951454, "learning_rate": 7.653312096972204e-06, "loss": 2.8608172607421873, "step": 591100 }, { "epoch": 0.7133615625176282, "learning_rate": 7.652908261504466e-06, "loss": 2.87868896484375, "step": 591200 }, { "epoch": 0.7134822258401109, "learning_rate": 7.652504426036726e-06, "loss": 2.8494287109375, "step": 591300 }, { "epoch": 0.7136028891625935, "learning_rate": 7.652100590568988e-06, "loss": 2.852053527832031, "step": 591400 }, { "epoch": 0.7137235524850762, "learning_rate": 7.65169675510125e-06, "loss": 2.867012939453125, "step": 591500 }, { "epoch": 0.7138442158075589, "learning_rate": 7.651292919633512e-06, "loss": 2.8467132568359377, "step": 591600 }, { "epoch": 0.7139648791300416, "learning_rate": 7.650889084165774e-06, "loss": 2.8750851440429686, "step": 591700 }, { "epoch": 0.7140855424525243, "learning_rate": 7.650485248698034e-06, "loss": 2.8647781372070313, "step": 591800 }, { "epoch": 0.7142062057750069, "learning_rate": 7.650081413230296e-06, "loss": 2.858387145996094, "step": 591900 }, { "epoch": 0.7143268690974897, "learning_rate": 7.649677577762558e-06, "loss": 2.8398922729492186, "step": 592000 }, { "epoch": 0.7144475324199723, "learning_rate": 7.64927374229482e-06, "loss": 2.8484786987304687, "step": 592100 }, { "epoch": 0.714568195742455, "learning_rate": 7.64886990682708e-06, "loss": 2.822452392578125, "step": 592200 }, { "epoch": 0.7146888590649377, "learning_rate": 7.648466071359343e-06, "loss": 2.851641845703125, "step": 592300 }, { "epoch": 0.7148095223874203, "learning_rate": 7.648062235891605e-06, "loss": 2.8470709228515627, "step": 592400 }, { "epoch": 0.7149301857099031, "learning_rate": 7.647658400423867e-06, "loss": 2.851204833984375, "step": 592500 }, { "epoch": 0.7150508490323857, "learning_rate": 7.647254564956129e-06, "loss": 2.840595397949219, "step": 592600 }, { "epoch": 0.7151715123548684, "learning_rate": 7.64685072948839e-06, "loss": 2.8561087036132813, "step": 592700 }, { "epoch": 0.7152921756773511, "learning_rate": 7.646446894020651e-06, "loss": 2.830580139160156, "step": 592800 }, { "epoch": 0.7154128389998338, "learning_rate": 7.646043058552913e-06, "loss": 2.8352166748046876, "step": 592900 }, { "epoch": 0.7155335023223165, "learning_rate": 7.645639223085173e-06, "loss": 2.8629534912109373, "step": 593000 }, { "epoch": 0.7156541656447991, "learning_rate": 7.645235387617435e-06, "loss": 2.853104553222656, "step": 593100 }, { "epoch": 0.7157748289672818, "learning_rate": 7.644831552149697e-06, "loss": 2.8582220458984375, "step": 593200 }, { "epoch": 0.7158954922897646, "learning_rate": 7.644427716681959e-06, "loss": 2.8493191528320314, "step": 593300 }, { "epoch": 0.7160161556122472, "learning_rate": 7.644023881214221e-06, "loss": 2.866957702636719, "step": 593400 }, { "epoch": 0.7161368189347299, "learning_rate": 7.643620045746483e-06, "loss": 2.832419738769531, "step": 593500 }, { "epoch": 0.7162574822572125, "learning_rate": 7.643216210278745e-06, "loss": 2.880351257324219, "step": 593600 }, { "epoch": 0.7163781455796953, "learning_rate": 7.642812374811005e-06, "loss": 2.8743853759765625, "step": 593700 }, { "epoch": 0.716498808902178, "learning_rate": 7.642408539343267e-06, "loss": 2.8396533203125, "step": 593800 }, { "epoch": 0.7166194722246606, "learning_rate": 7.64200470387553e-06, "loss": 2.845855712890625, "step": 593900 }, { "epoch": 0.7167401355471433, "learning_rate": 7.64160086840779e-06, "loss": 2.8430340576171873, "step": 594000 }, { "epoch": 0.716860798869626, "learning_rate": 7.641197032940052e-06, "loss": 2.835252380371094, "step": 594100 }, { "epoch": 0.7169814621921087, "learning_rate": 7.640793197472314e-06, "loss": 2.8477993774414063, "step": 594200 }, { "epoch": 0.7171021255145914, "learning_rate": 7.640389362004576e-06, "loss": 2.83353515625, "step": 594300 }, { "epoch": 0.717222788837074, "learning_rate": 7.639985526536838e-06, "loss": 2.838026123046875, "step": 594400 }, { "epoch": 0.7173434521595567, "learning_rate": 7.6395816910691e-06, "loss": 2.8310287475585936, "step": 594500 }, { "epoch": 0.7174641154820394, "learning_rate": 7.63917785560136e-06, "loss": 2.843500061035156, "step": 594600 }, { "epoch": 0.7175847788045221, "learning_rate": 7.638774020133622e-06, "loss": 2.860919189453125, "step": 594700 }, { "epoch": 0.7177054421270048, "learning_rate": 7.638370184665884e-06, "loss": 2.8437673950195315, "step": 594800 }, { "epoch": 0.7178261054494874, "learning_rate": 7.637966349198144e-06, "loss": 2.845377197265625, "step": 594900 }, { "epoch": 0.7179467687719702, "learning_rate": 7.637562513730406e-06, "loss": 2.8584356689453125, "step": 595000 }, { "epoch": 0.7180674320944528, "learning_rate": 7.637158678262668e-06, "loss": 2.8483447265625, "step": 595100 }, { "epoch": 0.7181880954169355, "learning_rate": 7.63675484279493e-06, "loss": 2.830110778808594, "step": 595200 }, { "epoch": 0.7183087587394182, "learning_rate": 7.636351007327192e-06, "loss": 2.831490173339844, "step": 595300 }, { "epoch": 0.7184294220619009, "learning_rate": 7.635947171859452e-06, "loss": 2.880101623535156, "step": 595400 }, { "epoch": 0.7185500853843836, "learning_rate": 7.635543336391714e-06, "loss": 2.814600830078125, "step": 595500 }, { "epoch": 0.7186707487068662, "learning_rate": 7.635139500923976e-06, "loss": 2.8266641235351564, "step": 595600 }, { "epoch": 0.7187914120293489, "learning_rate": 7.634735665456238e-06, "loss": 2.8104318237304686, "step": 595700 }, { "epoch": 0.7189120753518317, "learning_rate": 7.6343318299885e-06, "loss": 2.843552551269531, "step": 595800 }, { "epoch": 0.7190327386743143, "learning_rate": 7.63392799452076e-06, "loss": 2.828013610839844, "step": 595900 }, { "epoch": 0.719153401996797, "learning_rate": 7.633524159053022e-06, "loss": 2.8720211791992187, "step": 596000 }, { "epoch": 0.7192740653192796, "learning_rate": 7.633120323585284e-06, "loss": 2.835665283203125, "step": 596100 }, { "epoch": 0.7193947286417623, "learning_rate": 7.632716488117545e-06, "loss": 2.840772705078125, "step": 596200 }, { "epoch": 0.7195153919642451, "learning_rate": 7.632312652649807e-06, "loss": 2.8577618408203125, "step": 596300 }, { "epoch": 0.7196360552867277, "learning_rate": 7.631908817182069e-06, "loss": 2.844828796386719, "step": 596400 }, { "epoch": 0.7197567186092104, "learning_rate": 7.63150498171433e-06, "loss": 2.8559085083007814, "step": 596500 }, { "epoch": 0.7198773819316931, "learning_rate": 7.631101146246593e-06, "loss": 2.8550439453125, "step": 596600 }, { "epoch": 0.7199980452541758, "learning_rate": 7.630697310778855e-06, "loss": 2.82895263671875, "step": 596700 }, { "epoch": 0.7201187085766585, "learning_rate": 7.630293475311115e-06, "loss": 2.8775347900390624, "step": 596800 }, { "epoch": 0.7202393718991411, "learning_rate": 7.629889639843377e-06, "loss": 2.8132208251953124, "step": 596900 }, { "epoch": 0.7203600352216238, "learning_rate": 7.629485804375639e-06, "loss": 2.855584716796875, "step": 597000 }, { "epoch": 0.7204806985441066, "learning_rate": 7.6290819689079e-06, "loss": 2.835617980957031, "step": 597100 }, { "epoch": 0.7206013618665892, "learning_rate": 7.628678133440161e-06, "loss": 2.833038024902344, "step": 597200 }, { "epoch": 0.7207220251890719, "learning_rate": 7.628274297972423e-06, "loss": 2.8349478149414065, "step": 597300 }, { "epoch": 0.7208426885115545, "learning_rate": 7.627870462504685e-06, "loss": 2.8466970825195315, "step": 597400 }, { "epoch": 0.7209633518340373, "learning_rate": 7.627466627036947e-06, "loss": 2.8552850341796874, "step": 597500 }, { "epoch": 0.72108401515652, "learning_rate": 7.627062791569208e-06, "loss": 2.8689910888671877, "step": 597600 }, { "epoch": 0.7212046784790026, "learning_rate": 7.62665895610147e-06, "loss": 2.848668212890625, "step": 597700 }, { "epoch": 0.7213253418014853, "learning_rate": 7.626255120633732e-06, "loss": 2.8390097045898437, "step": 597800 }, { "epoch": 0.721446005123968, "learning_rate": 7.6258512851659925e-06, "loss": 2.8535665893554687, "step": 597900 }, { "epoch": 0.7215666684464507, "learning_rate": 7.6254474496982545e-06, "loss": 2.8399832153320315, "step": 598000 }, { "epoch": 0.7216873317689334, "learning_rate": 7.6250436142305165e-06, "loss": 2.8328372192382814, "step": 598100 }, { "epoch": 0.721807995091416, "learning_rate": 7.624639778762778e-06, "loss": 2.8236346435546875, "step": 598200 }, { "epoch": 0.7219286584138987, "learning_rate": 7.62423594329504e-06, "loss": 2.839200439453125, "step": 598300 }, { "epoch": 0.7220493217363814, "learning_rate": 7.623832107827302e-06, "loss": 2.858956298828125, "step": 598400 }, { "epoch": 0.7221699850588641, "learning_rate": 7.623428272359564e-06, "loss": 2.83538818359375, "step": 598500 }, { "epoch": 0.7222906483813468, "learning_rate": 7.623024436891825e-06, "loss": 2.8272552490234375, "step": 598600 }, { "epoch": 0.7224113117038294, "learning_rate": 7.622620601424086e-06, "loss": 2.8433087158203123, "step": 598700 }, { "epoch": 0.7225319750263122, "learning_rate": 7.622216765956347e-06, "loss": 2.852114562988281, "step": 598800 }, { "epoch": 0.7226526383487948, "learning_rate": 7.621812930488609e-06, "loss": 2.8037570190429686, "step": 598900 }, { "epoch": 0.7227733016712775, "learning_rate": 7.621409095020871e-06, "loss": 2.860138244628906, "step": 599000 }, { "epoch": 0.7228939649937602, "learning_rate": 7.621005259553133e-06, "loss": 2.849071044921875, "step": 599100 }, { "epoch": 0.7230146283162429, "learning_rate": 7.620601424085394e-06, "loss": 2.834295349121094, "step": 599200 }, { "epoch": 0.7231352916387256, "learning_rate": 7.620197588617656e-06, "loss": 2.86677490234375, "step": 599300 }, { "epoch": 0.7232559549612082, "learning_rate": 7.619793753149918e-06, "loss": 2.8441143798828126, "step": 599400 }, { "epoch": 0.7233766182836909, "learning_rate": 7.619389917682178e-06, "loss": 2.8090560913085936, "step": 599500 }, { "epoch": 0.7234972816061737, "learning_rate": 7.61898608221444e-06, "loss": 2.8088385009765626, "step": 599600 }, { "epoch": 0.7236179449286563, "learning_rate": 7.618582246746702e-06, "loss": 2.8294964599609376, "step": 599700 }, { "epoch": 0.723738608251139, "learning_rate": 7.618178411278963e-06, "loss": 2.8351806640625, "step": 599800 }, { "epoch": 0.7238592715736216, "learning_rate": 7.617774575811225e-06, "loss": 2.8585284423828123, "step": 599900 }, { "epoch": 0.7239799348961043, "learning_rate": 7.617370740343487e-06, "loss": 2.835009765625, "step": 600000 }, { "epoch": 0.7241005982185871, "learning_rate": 7.6169669048757485e-06, "loss": 2.8402664184570314, "step": 600100 }, { "epoch": 0.7242212615410697, "learning_rate": 7.6165630694080105e-06, "loss": 2.8244183349609373, "step": 600200 }, { "epoch": 0.7243419248635524, "learning_rate": 7.616159233940272e-06, "loss": 2.8449526977539064, "step": 600300 }, { "epoch": 0.724462588186035, "learning_rate": 7.615755398472533e-06, "loss": 2.8412411499023436, "step": 600400 }, { "epoch": 0.7245832515085178, "learning_rate": 7.615351563004795e-06, "loss": 2.8219430541992185, "step": 600500 }, { "epoch": 0.7247039148310005, "learning_rate": 7.614947727537057e-06, "loss": 2.832084045410156, "step": 600600 }, { "epoch": 0.7248245781534831, "learning_rate": 7.614543892069318e-06, "loss": 2.8650436401367188, "step": 600700 }, { "epoch": 0.7249452414759658, "learning_rate": 7.61414005660158e-06, "loss": 2.83247314453125, "step": 600800 }, { "epoch": 0.7250659047984485, "learning_rate": 7.613736221133842e-06, "loss": 2.8388943481445312, "step": 600900 }, { "epoch": 0.7251865681209312, "learning_rate": 7.613332385666104e-06, "loss": 2.829284973144531, "step": 601000 }, { "epoch": 0.7253072314434139, "learning_rate": 7.612928550198364e-06, "loss": 2.824978942871094, "step": 601100 }, { "epoch": 0.7254278947658965, "learning_rate": 7.612524714730626e-06, "loss": 2.8546621704101565, "step": 601200 }, { "epoch": 0.7255485580883793, "learning_rate": 7.612120879262887e-06, "loss": 2.8446481323242185, "step": 601300 }, { "epoch": 0.725669221410862, "learning_rate": 7.611717043795149e-06, "loss": 2.8569454956054687, "step": 601400 }, { "epoch": 0.7257898847333446, "learning_rate": 7.611313208327411e-06, "loss": 2.84204345703125, "step": 601500 }, { "epoch": 0.7259105480558273, "learning_rate": 7.610909372859673e-06, "loss": 2.8396881103515623, "step": 601600 }, { "epoch": 0.72603121137831, "learning_rate": 7.610505537391934e-06, "loss": 2.858248596191406, "step": 601700 }, { "epoch": 0.7261518747007927, "learning_rate": 7.610101701924196e-06, "loss": 2.8359979248046874, "step": 601800 }, { "epoch": 0.7262725380232754, "learning_rate": 7.609697866456457e-06, "loss": 2.8368960571289064, "step": 601900 }, { "epoch": 0.726393201345758, "learning_rate": 7.6092940309887186e-06, "loss": 2.844346008300781, "step": 602000 }, { "epoch": 0.7265138646682407, "learning_rate": 7.6088901955209805e-06, "loss": 2.8497967529296875, "step": 602100 }, { "epoch": 0.7266345279907234, "learning_rate": 7.6084863600532425e-06, "loss": 2.818468017578125, "step": 602200 }, { "epoch": 0.7267551913132061, "learning_rate": 7.608082524585504e-06, "loss": 2.84897705078125, "step": 602300 }, { "epoch": 0.7268758546356888, "learning_rate": 7.607678689117766e-06, "loss": 2.8364697265625, "step": 602400 }, { "epoch": 0.7269965179581714, "learning_rate": 7.607274853650028e-06, "loss": 2.8343548583984375, "step": 602500 }, { "epoch": 0.7271171812806542, "learning_rate": 7.606871018182289e-06, "loss": 2.81431640625, "step": 602600 }, { "epoch": 0.7272378446031368, "learning_rate": 7.606467182714551e-06, "loss": 2.8723526000976562, "step": 602700 }, { "epoch": 0.7273585079256195, "learning_rate": 7.606063347246812e-06, "loss": 2.81925537109375, "step": 602800 }, { "epoch": 0.7274791712481022, "learning_rate": 7.605659511779073e-06, "loss": 2.7938177490234377, "step": 602900 }, { "epoch": 0.7275998345705849, "learning_rate": 7.605255676311335e-06, "loss": 2.8298220825195313, "step": 603000 }, { "epoch": 0.7277204978930676, "learning_rate": 7.604851840843597e-06, "loss": 2.842681884765625, "step": 603100 }, { "epoch": 0.7278411612155502, "learning_rate": 7.604448005375858e-06, "loss": 2.8330377197265624, "step": 603200 }, { "epoch": 0.7279618245380329, "learning_rate": 7.60404416990812e-06, "loss": 2.8187625122070314, "step": 603300 }, { "epoch": 0.7280824878605157, "learning_rate": 7.603640334440382e-06, "loss": 2.839820556640625, "step": 603400 }, { "epoch": 0.7282031511829983, "learning_rate": 7.603236498972644e-06, "loss": 2.818056640625, "step": 603500 }, { "epoch": 0.728323814505481, "learning_rate": 7.602832663504904e-06, "loss": 2.8298419189453123, "step": 603600 }, { "epoch": 0.7284444778279636, "learning_rate": 7.602428828037166e-06, "loss": 2.824041442871094, "step": 603700 }, { "epoch": 0.7285651411504463, "learning_rate": 7.6020249925694275e-06, "loss": 2.84650390625, "step": 603800 }, { "epoch": 0.7286858044729291, "learning_rate": 7.6016211571016895e-06, "loss": 2.8340460205078126, "step": 603900 }, { "epoch": 0.7288064677954117, "learning_rate": 7.6012173216339514e-06, "loss": 2.8298089599609373, "step": 604000 }, { "epoch": 0.7289271311178944, "learning_rate": 7.600813486166213e-06, "loss": 2.8144265747070314, "step": 604100 }, { "epoch": 0.729047794440377, "learning_rate": 7.6004096506984746e-06, "loss": 2.8420260620117186, "step": 604200 }, { "epoch": 0.7291684577628598, "learning_rate": 7.6000058152307365e-06, "loss": 2.8317364501953124, "step": 604300 }, { "epoch": 0.7292891210853425, "learning_rate": 7.599601979762997e-06, "loss": 2.854012145996094, "step": 604400 }, { "epoch": 0.7294097844078251, "learning_rate": 7.599198144295259e-06, "loss": 2.852894287109375, "step": 604500 }, { "epoch": 0.7295304477303078, "learning_rate": 7.598794308827521e-06, "loss": 2.8500555419921874, "step": 604600 }, { "epoch": 0.7296511110527905, "learning_rate": 7.598390473359783e-06, "loss": 2.825152587890625, "step": 604700 }, { "epoch": 0.7297717743752732, "learning_rate": 7.597986637892044e-06, "loss": 2.8397869873046875, "step": 604800 }, { "epoch": 0.7298924376977559, "learning_rate": 7.597582802424306e-06, "loss": 2.8551385498046873, "step": 604900 }, { "epoch": 0.7300131010202385, "learning_rate": 7.597178966956568e-06, "loss": 2.8412796020507813, "step": 605000 }, { "epoch": 0.7301337643427213, "learning_rate": 7.596775131488829e-06, "loss": 2.8156011962890624, "step": 605100 }, { "epoch": 0.7302544276652039, "learning_rate": 7.59637129602109e-06, "loss": 2.8235458374023437, "step": 605200 }, { "epoch": 0.7303750909876866, "learning_rate": 7.595967460553352e-06, "loss": 2.8220587158203125, "step": 605300 }, { "epoch": 0.7304957543101693, "learning_rate": 7.595563625085613e-06, "loss": 2.8451638793945313, "step": 605400 }, { "epoch": 0.730616417632652, "learning_rate": 7.595159789617875e-06, "loss": 2.8342608642578124, "step": 605500 }, { "epoch": 0.7307370809551347, "learning_rate": 7.594755954150137e-06, "loss": 2.833648681640625, "step": 605600 }, { "epoch": 0.7308577442776173, "learning_rate": 7.594352118682398e-06, "loss": 2.832721862792969, "step": 605700 }, { "epoch": 0.7309784076001, "learning_rate": 7.59394828321466e-06, "loss": 2.82572265625, "step": 605800 }, { "epoch": 0.7310990709225827, "learning_rate": 7.593544447746922e-06, "loss": 2.8513800048828126, "step": 605900 }, { "epoch": 0.7312197342450654, "learning_rate": 7.593140612279183e-06, "loss": 2.8289996337890626, "step": 606000 }, { "epoch": 0.7313403975675481, "learning_rate": 7.592736776811445e-06, "loss": 2.8240087890625, "step": 606100 }, { "epoch": 0.7314610608900307, "learning_rate": 7.592332941343707e-06, "loss": 2.8449395751953124, "step": 606200 }, { "epoch": 0.7315817242125134, "learning_rate": 7.591929105875968e-06, "loss": 2.8405169677734374, "step": 606300 }, { "epoch": 0.7317023875349962, "learning_rate": 7.59152527040823e-06, "loss": 2.8252545166015626, "step": 606400 }, { "epoch": 0.7318230508574788, "learning_rate": 7.591121434940492e-06, "loss": 2.8312115478515625, "step": 606500 }, { "epoch": 0.7319437141799615, "learning_rate": 7.590717599472754e-06, "loss": 2.820077209472656, "step": 606600 }, { "epoch": 0.7320643775024442, "learning_rate": 7.590313764005015e-06, "loss": 2.823672180175781, "step": 606700 }, { "epoch": 0.7321850408249269, "learning_rate": 7.589909928537276e-06, "loss": 2.8201654052734373, "step": 606800 }, { "epoch": 0.7323057041474096, "learning_rate": 7.589506093069537e-06, "loss": 2.8248065185546873, "step": 606900 }, { "epoch": 0.7324263674698922, "learning_rate": 7.589102257601799e-06, "loss": 2.8089474487304686, "step": 607000 }, { "epoch": 0.7325470307923749, "learning_rate": 7.588698422134061e-06, "loss": 2.8481414794921873, "step": 607100 }, { "epoch": 0.7326676941148577, "learning_rate": 7.588294586666323e-06, "loss": 2.826563720703125, "step": 607200 }, { "epoch": 0.7327883574373403, "learning_rate": 7.587890751198584e-06, "loss": 2.8146597290039064, "step": 607300 }, { "epoch": 0.732909020759823, "learning_rate": 7.587486915730846e-06, "loss": 2.8355548095703127, "step": 607400 }, { "epoch": 0.7330296840823056, "learning_rate": 7.587083080263108e-06, "loss": 2.8327291870117186, "step": 607500 }, { "epoch": 0.7331503474047883, "learning_rate": 7.586679244795369e-06, "loss": 2.835107421875, "step": 607600 }, { "epoch": 0.7332710107272711, "learning_rate": 7.58627540932763e-06, "loss": 2.857324523925781, "step": 607700 }, { "epoch": 0.7333916740497537, "learning_rate": 7.585871573859892e-06, "loss": 2.8485736083984374, "step": 607800 }, { "epoch": 0.7335123373722364, "learning_rate": 7.5854677383921535e-06, "loss": 2.8316030883789063, "step": 607900 }, { "epoch": 0.733633000694719, "learning_rate": 7.5850639029244155e-06, "loss": 2.843360595703125, "step": 608000 }, { "epoch": 0.7337536640172018, "learning_rate": 7.5846600674566775e-06, "loss": 2.8294363403320313, "step": 608100 }, { "epoch": 0.7338743273396845, "learning_rate": 7.584256231988939e-06, "loss": 2.8250167846679686, "step": 608200 }, { "epoch": 0.7339949906621671, "learning_rate": 7.583852396521201e-06, "loss": 2.8388677978515626, "step": 608300 }, { "epoch": 0.7341156539846498, "learning_rate": 7.5834485610534626e-06, "loss": 2.845799865722656, "step": 608400 }, { "epoch": 0.7342363173071325, "learning_rate": 7.583044725585723e-06, "loss": 2.81463623046875, "step": 608500 }, { "epoch": 0.7343569806296152, "learning_rate": 7.582640890117985e-06, "loss": 2.853978576660156, "step": 608600 }, { "epoch": 0.7344776439520979, "learning_rate": 7.582237054650247e-06, "loss": 2.83222412109375, "step": 608700 }, { "epoch": 0.7345983072745805, "learning_rate": 7.581833219182508e-06, "loss": 2.804739990234375, "step": 608800 }, { "epoch": 0.7347189705970633, "learning_rate": 7.58142938371477e-06, "loss": 2.82529052734375, "step": 608900 }, { "epoch": 0.7348396339195459, "learning_rate": 7.581025548247032e-06, "loss": 2.8481216430664062, "step": 609000 }, { "epoch": 0.7349602972420286, "learning_rate": 7.580621712779294e-06, "loss": 2.8316244506835937, "step": 609100 }, { "epoch": 0.7350809605645113, "learning_rate": 7.580217877311555e-06, "loss": 2.8433767700195314, "step": 609200 }, { "epoch": 0.735201623886994, "learning_rate": 7.579814041843816e-06, "loss": 2.8337847900390627, "step": 609300 }, { "epoch": 0.7353222872094767, "learning_rate": 7.579410206376077e-06, "loss": 2.8405975341796874, "step": 609400 }, { "epoch": 0.7354429505319593, "learning_rate": 7.579006370908339e-06, "loss": 2.843521728515625, "step": 609500 }, { "epoch": 0.735563613854442, "learning_rate": 7.578602535440601e-06, "loss": 2.8249505615234374, "step": 609600 }, { "epoch": 0.7356842771769248, "learning_rate": 7.578198699972863e-06, "loss": 2.865635986328125, "step": 609700 }, { "epoch": 0.7358049404994074, "learning_rate": 7.577794864505124e-06, "loss": 2.8307565307617186, "step": 609800 }, { "epoch": 0.7359256038218901, "learning_rate": 7.577391029037386e-06, "loss": 2.7958209228515627, "step": 609900 }, { "epoch": 0.7360462671443727, "learning_rate": 7.576987193569648e-06, "loss": 2.8226547241210938, "step": 610000 }, { "epoch": 0.7361669304668554, "learning_rate": 7.576583358101909e-06, "loss": 2.813846435546875, "step": 610100 }, { "epoch": 0.7362875937893382, "learning_rate": 7.576179522634171e-06, "loss": 2.819149169921875, "step": 610200 }, { "epoch": 0.7364082571118208, "learning_rate": 7.575775687166433e-06, "loss": 2.8468051147460938, "step": 610300 }, { "epoch": 0.7365289204343035, "learning_rate": 7.575371851698694e-06, "loss": 2.8197586059570314, "step": 610400 }, { "epoch": 0.7366495837567861, "learning_rate": 7.574968016230956e-06, "loss": 2.814403381347656, "step": 610500 }, { "epoch": 0.7367702470792689, "learning_rate": 7.574564180763218e-06, "loss": 2.8308221435546876, "step": 610600 }, { "epoch": 0.7368909104017516, "learning_rate": 7.57416034529548e-06, "loss": 2.831101379394531, "step": 610700 }, { "epoch": 0.7370115737242342, "learning_rate": 7.573756509827741e-06, "loss": 2.8293746948242187, "step": 610800 }, { "epoch": 0.7371322370467169, "learning_rate": 7.573352674360002e-06, "loss": 2.850122985839844, "step": 610900 }, { "epoch": 0.7372529003691995, "learning_rate": 7.572948838892263e-06, "loss": 2.8342330932617186, "step": 611000 }, { "epoch": 0.7373735636916823, "learning_rate": 7.572545003424525e-06, "loss": 2.827171630859375, "step": 611100 }, { "epoch": 0.737494227014165, "learning_rate": 7.572141167956787e-06, "loss": 2.822620849609375, "step": 611200 }, { "epoch": 0.7376148903366476, "learning_rate": 7.571737332489049e-06, "loss": 2.8397671508789064, "step": 611300 }, { "epoch": 0.7377355536591303, "learning_rate": 7.57133349702131e-06, "loss": 2.8224777221679687, "step": 611400 }, { "epoch": 0.737856216981613, "learning_rate": 7.570929661553572e-06, "loss": 2.8421759033203124, "step": 611500 }, { "epoch": 0.7379768803040957, "learning_rate": 7.570525826085834e-06, "loss": 2.827149658203125, "step": 611600 }, { "epoch": 0.7380975436265784, "learning_rate": 7.5701219906180944e-06, "loss": 2.8314828491210937, "step": 611700 }, { "epoch": 0.738218206949061, "learning_rate": 7.569718155150356e-06, "loss": 2.797510681152344, "step": 611800 }, { "epoch": 0.7383388702715438, "learning_rate": 7.569314319682618e-06, "loss": 2.8336410522460938, "step": 611900 }, { "epoch": 0.7384595335940265, "learning_rate": 7.5689104842148795e-06, "loss": 2.843047790527344, "step": 612000 }, { "epoch": 0.7385801969165091, "learning_rate": 7.5685066487471415e-06, "loss": 2.8051467895507813, "step": 612100 }, { "epoch": 0.7387008602389918, "learning_rate": 7.5681028132794035e-06, "loss": 2.8253042602539065, "step": 612200 }, { "epoch": 0.7388215235614745, "learning_rate": 7.567698977811665e-06, "loss": 2.781560363769531, "step": 612300 }, { "epoch": 0.7389421868839572, "learning_rate": 7.567295142343927e-06, "loss": 2.8181698608398436, "step": 612400 }, { "epoch": 0.7390628502064399, "learning_rate": 7.566891306876189e-06, "loss": 2.8395892333984376, "step": 612500 }, { "epoch": 0.7391835135289225, "learning_rate": 7.566487471408449e-06, "loss": 2.838157958984375, "step": 612600 }, { "epoch": 0.7393041768514053, "learning_rate": 7.566083635940711e-06, "loss": 2.8269708251953123, "step": 612700 }, { "epoch": 0.7394248401738879, "learning_rate": 7.565679800472973e-06, "loss": 2.8259820556640625, "step": 612800 }, { "epoch": 0.7395455034963706, "learning_rate": 7.565275965005234e-06, "loss": 2.8072039794921877, "step": 612900 }, { "epoch": 0.7396661668188533, "learning_rate": 7.564872129537496e-06, "loss": 2.8385406494140626, "step": 613000 }, { "epoch": 0.739786830141336, "learning_rate": 7.564468294069758e-06, "loss": 2.798528747558594, "step": 613100 }, { "epoch": 0.7399074934638187, "learning_rate": 7.56406445860202e-06, "loss": 2.8339385986328125, "step": 613200 }, { "epoch": 0.7400281567863013, "learning_rate": 7.563660623134281e-06, "loss": 2.8272882080078126, "step": 613300 }, { "epoch": 0.740148820108784, "learning_rate": 7.563256787666542e-06, "loss": 2.8170840454101564, "step": 613400 }, { "epoch": 0.7402694834312668, "learning_rate": 7.562852952198803e-06, "loss": 2.8212686157226563, "step": 613500 }, { "epoch": 0.7403901467537494, "learning_rate": 7.562449116731065e-06, "loss": 2.8304904174804686, "step": 613600 }, { "epoch": 0.7405108100762321, "learning_rate": 7.562045281263327e-06, "loss": 2.83412109375, "step": 613700 }, { "epoch": 0.7406314733987147, "learning_rate": 7.561641445795589e-06, "loss": 2.826516418457031, "step": 613800 }, { "epoch": 0.7407521367211974, "learning_rate": 7.5612376103278504e-06, "loss": 2.813454284667969, "step": 613900 }, { "epoch": 0.7408728000436802, "learning_rate": 7.560833774860112e-06, "loss": 2.8243328857421877, "step": 614000 }, { "epoch": 0.7409934633661628, "learning_rate": 7.560429939392374e-06, "loss": 2.833742980957031, "step": 614100 }, { "epoch": 0.7411141266886455, "learning_rate": 7.560026103924635e-06, "loss": 2.8076470947265624, "step": 614200 }, { "epoch": 0.7412347900111281, "learning_rate": 7.559622268456897e-06, "loss": 2.8299530029296873, "step": 614300 }, { "epoch": 0.7413554533336109, "learning_rate": 7.559218432989159e-06, "loss": 2.819527282714844, "step": 614400 }, { "epoch": 0.7414761166560936, "learning_rate": 7.55881459752142e-06, "loss": 2.8074356079101563, "step": 614500 }, { "epoch": 0.7415967799785762, "learning_rate": 7.558410762053682e-06, "loss": 2.818992004394531, "step": 614600 }, { "epoch": 0.7417174433010589, "learning_rate": 7.558006926585944e-06, "loss": 2.84697021484375, "step": 614700 }, { "epoch": 0.7418381066235415, "learning_rate": 7.557603091118205e-06, "loss": 2.8341073608398437, "step": 614800 }, { "epoch": 0.7419587699460243, "learning_rate": 7.557199255650467e-06, "loss": 2.8070330810546875, "step": 614900 }, { "epoch": 0.742079433268507, "learning_rate": 7.556795420182728e-06, "loss": 2.815440673828125, "step": 615000 }, { "epoch": 0.7422000965909896, "learning_rate": 7.556391584714989e-06, "loss": 2.8568255615234377, "step": 615100 }, { "epoch": 0.7423207599134724, "learning_rate": 7.555987749247251e-06, "loss": 2.8088778686523437, "step": 615200 }, { "epoch": 0.742441423235955, "learning_rate": 7.555583913779513e-06, "loss": 2.8101040649414064, "step": 615300 }, { "epoch": 0.7425620865584377, "learning_rate": 7.555180078311774e-06, "loss": 2.8466583251953126, "step": 615400 }, { "epoch": 0.7426827498809204, "learning_rate": 7.554776242844036e-06, "loss": 2.8294287109375, "step": 615500 }, { "epoch": 0.742803413203403, "learning_rate": 7.554372407376298e-06, "loss": 2.82283935546875, "step": 615600 }, { "epoch": 0.7429240765258858, "learning_rate": 7.55396857190856e-06, "loss": 2.8386404418945315, "step": 615700 }, { "epoch": 0.7430447398483684, "learning_rate": 7.5535647364408205e-06, "loss": 2.8301040649414064, "step": 615800 }, { "epoch": 0.7431654031708511, "learning_rate": 7.5531609009730825e-06, "loss": 2.8170407104492186, "step": 615900 }, { "epoch": 0.7432860664933338, "learning_rate": 7.552757065505344e-06, "loss": 2.8237225341796877, "step": 616000 }, { "epoch": 0.7434067298158165, "learning_rate": 7.5523532300376056e-06, "loss": 2.7910894775390624, "step": 616100 }, { "epoch": 0.7435273931382992, "learning_rate": 7.5519493945698676e-06, "loss": 2.8088031005859375, "step": 616200 }, { "epoch": 0.7436480564607818, "learning_rate": 7.5515455591021295e-06, "loss": 2.810670166015625, "step": 616300 }, { "epoch": 0.7437687197832645, "learning_rate": 7.551141723634391e-06, "loss": 2.8361151123046877, "step": 616400 }, { "epoch": 0.7438893831057473, "learning_rate": 7.550737888166653e-06, "loss": 2.833929138183594, "step": 616500 }, { "epoch": 0.7440100464282299, "learning_rate": 7.550334052698913e-06, "loss": 2.808399658203125, "step": 616600 }, { "epoch": 0.7441307097507126, "learning_rate": 7.549930217231175e-06, "loss": 2.8284747314453127, "step": 616700 }, { "epoch": 0.7442513730731952, "learning_rate": 7.549526381763437e-06, "loss": 2.819230651855469, "step": 616800 }, { "epoch": 0.744372036395678, "learning_rate": 7.549122546295699e-06, "loss": 2.8165911865234374, "step": 616900 }, { "epoch": 0.7444926997181607, "learning_rate": 7.54871871082796e-06, "loss": 2.8294052124023437, "step": 617000 }, { "epoch": 0.7446133630406433, "learning_rate": 7.548314875360222e-06, "loss": 2.812433776855469, "step": 617100 }, { "epoch": 0.744734026363126, "learning_rate": 7.547911039892484e-06, "loss": 2.827803649902344, "step": 617200 }, { "epoch": 0.7448546896856088, "learning_rate": 7.547507204424745e-06, "loss": 2.8532666015625, "step": 617300 }, { "epoch": 0.7449753530080914, "learning_rate": 7.547103368957006e-06, "loss": 2.825555419921875, "step": 617400 }, { "epoch": 0.7450960163305741, "learning_rate": 7.546699533489268e-06, "loss": 2.820987548828125, "step": 617500 }, { "epoch": 0.7452166796530567, "learning_rate": 7.546295698021529e-06, "loss": 2.830040283203125, "step": 617600 }, { "epoch": 0.7453373429755394, "learning_rate": 7.545891862553791e-06, "loss": 2.8361956787109377, "step": 617700 }, { "epoch": 0.7454580062980222, "learning_rate": 7.545488027086053e-06, "loss": 2.8424581909179687, "step": 617800 }, { "epoch": 0.7455786696205048, "learning_rate": 7.5450841916183145e-06, "loss": 2.813293151855469, "step": 617900 }, { "epoch": 0.7456993329429875, "learning_rate": 7.5446803561505765e-06, "loss": 2.8331146240234375, "step": 618000 }, { "epoch": 0.7458199962654701, "learning_rate": 7.5442765206828384e-06, "loss": 2.8351800537109373, "step": 618100 }, { "epoch": 0.7459406595879529, "learning_rate": 7.5438726852151004e-06, "loss": 2.8177914428710937, "step": 618200 }, { "epoch": 0.7460613229104356, "learning_rate": 7.543468849747361e-06, "loss": 2.8362612915039063, "step": 618300 }, { "epoch": 0.7461819862329182, "learning_rate": 7.543065014279623e-06, "loss": 2.8077484130859376, "step": 618400 }, { "epoch": 0.7463026495554009, "learning_rate": 7.542661178811884e-06, "loss": 2.8257672119140627, "step": 618500 }, { "epoch": 0.7464233128778835, "learning_rate": 7.542257343344146e-06, "loss": 2.8363217163085936, "step": 618600 }, { "epoch": 0.7465439762003663, "learning_rate": 7.541853507876408e-06, "loss": 2.8073886108398436, "step": 618700 }, { "epoch": 0.746664639522849, "learning_rate": 7.54144967240867e-06, "loss": 2.8025497436523437, "step": 618800 }, { "epoch": 0.7467853028453316, "learning_rate": 7.541045836940931e-06, "loss": 2.8164547729492186, "step": 618900 }, { "epoch": 0.7469059661678144, "learning_rate": 7.540642001473193e-06, "loss": 2.797499084472656, "step": 619000 }, { "epoch": 0.747026629490297, "learning_rate": 7.540238166005453e-06, "loss": 2.8240225219726565, "step": 619100 }, { "epoch": 0.7471472928127797, "learning_rate": 7.539834330537715e-06, "loss": 2.8514141845703125, "step": 619200 }, { "epoch": 0.7472679561352624, "learning_rate": 7.539430495069977e-06, "loss": 2.8393463134765624, "step": 619300 }, { "epoch": 0.747388619457745, "learning_rate": 7.539026659602239e-06, "loss": 2.8152816772460936, "step": 619400 }, { "epoch": 0.7475092827802278, "learning_rate": 7.5386228241345e-06, "loss": 2.849360046386719, "step": 619500 }, { "epoch": 0.7476299461027104, "learning_rate": 7.538218988666762e-06, "loss": 2.8304534912109376, "step": 619600 }, { "epoch": 0.7477506094251931, "learning_rate": 7.537815153199024e-06, "loss": 2.7997320556640624, "step": 619700 }, { "epoch": 0.7478712727476758, "learning_rate": 7.537411317731285e-06, "loss": 2.8333538818359374, "step": 619800 }, { "epoch": 0.7479919360701585, "learning_rate": 7.5370074822635465e-06, "loss": 2.8378982543945312, "step": 619900 }, { "epoch": 0.7481125993926412, "learning_rate": 7.5366036467958085e-06, "loss": 2.853677062988281, "step": 620000 }, { "epoch": 0.7482332627151238, "learning_rate": 7.53619981132807e-06, "loss": 2.8385684204101564, "step": 620100 }, { "epoch": 0.7483539260376065, "learning_rate": 7.535795975860332e-06, "loss": 2.829327392578125, "step": 620200 }, { "epoch": 0.7484745893600893, "learning_rate": 7.535392140392594e-06, "loss": 2.8047689819335937, "step": 620300 }, { "epoch": 0.7485952526825719, "learning_rate": 7.534988304924855e-06, "loss": 2.817430114746094, "step": 620400 }, { "epoch": 0.7487159160050546, "learning_rate": 7.534584469457117e-06, "loss": 2.8175750732421876, "step": 620500 }, { "epoch": 0.7488365793275372, "learning_rate": 7.534180633989379e-06, "loss": 2.80708251953125, "step": 620600 }, { "epoch": 0.74895724265002, "learning_rate": 7.533776798521639e-06, "loss": 2.8062698364257814, "step": 620700 }, { "epoch": 0.7490779059725027, "learning_rate": 7.533372963053901e-06, "loss": 2.814303283691406, "step": 620800 }, { "epoch": 0.7491985692949853, "learning_rate": 7.532969127586163e-06, "loss": 2.821028747558594, "step": 620900 }, { "epoch": 0.749319232617468, "learning_rate": 7.532565292118424e-06, "loss": 2.8208688354492186, "step": 621000 }, { "epoch": 0.7494398959399506, "learning_rate": 7.532161456650686e-06, "loss": 2.833165588378906, "step": 621100 }, { "epoch": 0.7495605592624334, "learning_rate": 7.531757621182948e-06, "loss": 2.8111578369140626, "step": 621200 }, { "epoch": 0.7496812225849161, "learning_rate": 7.53135378571521e-06, "loss": 2.819300231933594, "step": 621300 }, { "epoch": 0.7498018859073987, "learning_rate": 7.530949950247471e-06, "loss": 2.8168365478515627, "step": 621400 }, { "epoch": 0.7499225492298814, "learning_rate": 7.530546114779732e-06, "loss": 2.84283935546875, "step": 621500 }, { "epoch": 0.7500432125523641, "learning_rate": 7.5301422793119934e-06, "loss": 2.8554141235351564, "step": 621600 }, { "epoch": 0.7501638758748468, "learning_rate": 7.529738443844255e-06, "loss": 2.831490478515625, "step": 621700 }, { "epoch": 0.7502845391973295, "learning_rate": 7.529334608376517e-06, "loss": 2.8194000244140627, "step": 621800 }, { "epoch": 0.7504052025198121, "learning_rate": 7.528930772908779e-06, "loss": 2.8222787475585935, "step": 621900 }, { "epoch": 0.7505258658422949, "learning_rate": 7.5285269374410405e-06, "loss": 2.821630859375, "step": 622000 }, { "epoch": 0.7506465291647775, "learning_rate": 7.5281231019733025e-06, "loss": 2.8231985473632815, "step": 622100 }, { "epoch": 0.7507671924872602, "learning_rate": 7.5277192665055645e-06, "loss": 2.811253967285156, "step": 622200 }, { "epoch": 0.7508878558097429, "learning_rate": 7.527315431037825e-06, "loss": 2.7806607055664063, "step": 622300 }, { "epoch": 0.7510085191322255, "learning_rate": 7.526911595570087e-06, "loss": 2.848405456542969, "step": 622400 }, { "epoch": 0.7511291824547083, "learning_rate": 7.526507760102349e-06, "loss": 2.79271484375, "step": 622500 }, { "epoch": 0.751249845777191, "learning_rate": 7.52610392463461e-06, "loss": 2.8372039794921875, "step": 622600 }, { "epoch": 0.7513705090996736, "learning_rate": 7.525700089166872e-06, "loss": 2.8286602783203123, "step": 622700 }, { "epoch": 0.7514911724221564, "learning_rate": 7.525296253699134e-06, "loss": 2.8279736328125, "step": 622800 }, { "epoch": 0.751611835744639, "learning_rate": 7.524892418231395e-06, "loss": 2.8249545288085938, "step": 622900 }, { "epoch": 0.7517324990671217, "learning_rate": 7.524488582763657e-06, "loss": 2.8132870483398436, "step": 623000 }, { "epoch": 0.7518531623896044, "learning_rate": 7.524084747295919e-06, "loss": 2.8364694213867185, "step": 623100 }, { "epoch": 0.751973825712087, "learning_rate": 7.523680911828179e-06, "loss": 2.8017919921875, "step": 623200 }, { "epoch": 0.7520944890345698, "learning_rate": 7.523277076360441e-06, "loss": 2.8268621826171874, "step": 623300 }, { "epoch": 0.7522151523570524, "learning_rate": 7.522873240892703e-06, "loss": 2.8178338623046875, "step": 623400 }, { "epoch": 0.7523358156795351, "learning_rate": 7.522469405424964e-06, "loss": 2.7910528564453125, "step": 623500 }, { "epoch": 0.7524564790020178, "learning_rate": 7.522065569957226e-06, "loss": 2.8216256713867187, "step": 623600 }, { "epoch": 0.7525771423245005, "learning_rate": 7.521661734489488e-06, "loss": 2.835389404296875, "step": 623700 }, { "epoch": 0.7526978056469832, "learning_rate": 7.52125789902175e-06, "loss": 2.847786865234375, "step": 623800 }, { "epoch": 0.7528184689694658, "learning_rate": 7.520854063554011e-06, "loss": 2.7977569580078123, "step": 623900 }, { "epoch": 0.7529391322919485, "learning_rate": 7.5204502280862725e-06, "loss": 2.8150515747070313, "step": 624000 }, { "epoch": 0.7530597956144313, "learning_rate": 7.520046392618534e-06, "loss": 2.8003094482421873, "step": 624100 }, { "epoch": 0.7531804589369139, "learning_rate": 7.519642557150796e-06, "loss": 2.8240151977539063, "step": 624200 }, { "epoch": 0.7533011222593966, "learning_rate": 7.519238721683058e-06, "loss": 2.8090219116210937, "step": 624300 }, { "epoch": 0.7534217855818792, "learning_rate": 7.51883488621532e-06, "loss": 2.7934942626953125, "step": 624400 }, { "epoch": 0.753542448904362, "learning_rate": 7.518431050747581e-06, "loss": 2.814222717285156, "step": 624500 }, { "epoch": 0.7536631122268447, "learning_rate": 7.518027215279843e-06, "loss": 2.8359490966796876, "step": 624600 }, { "epoch": 0.7537837755493273, "learning_rate": 7.517623379812105e-06, "loss": 2.8103677368164064, "step": 624700 }, { "epoch": 0.75390443887181, "learning_rate": 7.517219544344365e-06, "loss": 2.8218817138671874, "step": 624800 }, { "epoch": 0.7540251021942926, "learning_rate": 7.516815708876627e-06, "loss": 2.8379351806640627, "step": 624900 }, { "epoch": 0.7541457655167754, "learning_rate": 7.516411873408889e-06, "loss": 2.8164877319335937, "step": 625000 }, { "epoch": 0.7542664288392581, "learning_rate": 7.51600803794115e-06, "loss": 2.836911926269531, "step": 625100 }, { "epoch": 0.7543870921617407, "learning_rate": 7.515604202473412e-06, "loss": 2.8158297729492188, "step": 625200 }, { "epoch": 0.7545077554842234, "learning_rate": 7.515200367005674e-06, "loss": 2.832657775878906, "step": 625300 }, { "epoch": 0.7546284188067061, "learning_rate": 7.514796531537936e-06, "loss": 2.838329162597656, "step": 625400 }, { "epoch": 0.7547490821291888, "learning_rate": 7.514392696070197e-06, "loss": 2.80716552734375, "step": 625500 }, { "epoch": 0.7548697454516715, "learning_rate": 7.513988860602458e-06, "loss": 2.838720703125, "step": 625600 }, { "epoch": 0.7549904087741541, "learning_rate": 7.5135850251347195e-06, "loss": 2.814241943359375, "step": 625700 }, { "epoch": 0.7551110720966369, "learning_rate": 7.5131811896669814e-06, "loss": 2.8169039916992187, "step": 625800 }, { "epoch": 0.7552317354191195, "learning_rate": 7.5127773541992434e-06, "loss": 2.82134765625, "step": 625900 }, { "epoch": 0.7553523987416022, "learning_rate": 7.512373518731505e-06, "loss": 2.8186550903320313, "step": 626000 }, { "epoch": 0.7554730620640849, "learning_rate": 7.5119696832637665e-06, "loss": 2.832461242675781, "step": 626100 }, { "epoch": 0.7555937253865675, "learning_rate": 7.5115658477960285e-06, "loss": 2.8221148681640624, "step": 626200 }, { "epoch": 0.7557143887090503, "learning_rate": 7.5111620123282905e-06, "loss": 2.848611145019531, "step": 626300 }, { "epoch": 0.7558350520315329, "learning_rate": 7.510758176860551e-06, "loss": 2.816414794921875, "step": 626400 }, { "epoch": 0.7559557153540156, "learning_rate": 7.510354341392813e-06, "loss": 2.8215090942382814, "step": 626500 }, { "epoch": 0.7560763786764984, "learning_rate": 7.509950505925075e-06, "loss": 2.8143475341796873, "step": 626600 }, { "epoch": 0.756197041998981, "learning_rate": 7.509546670457336e-06, "loss": 2.8294100952148438, "step": 626700 }, { "epoch": 0.7563177053214637, "learning_rate": 7.509142834989598e-06, "loss": 2.81141845703125, "step": 626800 }, { "epoch": 0.7564383686439463, "learning_rate": 7.50873899952186e-06, "loss": 2.807459411621094, "step": 626900 }, { "epoch": 0.756559031966429, "learning_rate": 7.508335164054121e-06, "loss": 2.815330810546875, "step": 627000 }, { "epoch": 0.7566796952889118, "learning_rate": 7.507931328586383e-06, "loss": 2.8179620361328124, "step": 627100 }, { "epoch": 0.7568003586113944, "learning_rate": 7.507527493118644e-06, "loss": 2.8043142700195314, "step": 627200 }, { "epoch": 0.7569210219338771, "learning_rate": 7.507123657650905e-06, "loss": 2.8381643676757813, "step": 627300 }, { "epoch": 0.7570416852563598, "learning_rate": 7.506719822183167e-06, "loss": 2.823447570800781, "step": 627400 }, { "epoch": 0.7571623485788425, "learning_rate": 7.506315986715429e-06, "loss": 2.803863525390625, "step": 627500 }, { "epoch": 0.7572830119013252, "learning_rate": 7.50591215124769e-06, "loss": 2.8209368896484377, "step": 627600 }, { "epoch": 0.7574036752238078, "learning_rate": 7.505508315779952e-06, "loss": 2.810624694824219, "step": 627700 }, { "epoch": 0.7575243385462905, "learning_rate": 7.505104480312214e-06, "loss": 2.8308978271484375, "step": 627800 }, { "epoch": 0.7576450018687733, "learning_rate": 7.504700644844476e-06, "loss": 2.820066223144531, "step": 627900 }, { "epoch": 0.7577656651912559, "learning_rate": 7.5042968093767374e-06, "loss": 2.825129089355469, "step": 628000 }, { "epoch": 0.7578863285137386, "learning_rate": 7.5038929739089986e-06, "loss": 2.7999700927734374, "step": 628100 }, { "epoch": 0.7580069918362212, "learning_rate": 7.50348913844126e-06, "loss": 2.8441912841796877, "step": 628200 }, { "epoch": 0.758127655158704, "learning_rate": 7.503085302973522e-06, "loss": 2.8127236938476563, "step": 628300 }, { "epoch": 0.7582483184811867, "learning_rate": 7.502681467505784e-06, "loss": 2.8064776611328126, "step": 628400 }, { "epoch": 0.7583689818036693, "learning_rate": 7.502277632038046e-06, "loss": 2.81010986328125, "step": 628500 }, { "epoch": 0.758489645126152, "learning_rate": 7.501873796570307e-06, "loss": 2.813505859375, "step": 628600 }, { "epoch": 0.7586103084486346, "learning_rate": 7.501469961102569e-06, "loss": 2.839752502441406, "step": 628700 }, { "epoch": 0.7587309717711174, "learning_rate": 7.501066125634831e-06, "loss": 2.8094476318359374, "step": 628800 }, { "epoch": 0.7588516350936001, "learning_rate": 7.500662290167091e-06, "loss": 2.8255184936523436, "step": 628900 }, { "epoch": 0.7589722984160827, "learning_rate": 7.500258454699353e-06, "loss": 2.7825860595703125, "step": 629000 }, { "epoch": 0.7590929617385654, "learning_rate": 7.499854619231615e-06, "loss": 2.7998233032226563, "step": 629100 }, { "epoch": 0.7592136250610481, "learning_rate": 7.499450783763876e-06, "loss": 2.833280029296875, "step": 629200 }, { "epoch": 0.7593342883835308, "learning_rate": 7.499046948296138e-06, "loss": 2.82797119140625, "step": 629300 }, { "epoch": 0.7594549517060135, "learning_rate": 7.4986431128284e-06, "loss": 2.8048834228515624, "step": 629400 }, { "epoch": 0.7595756150284961, "learning_rate": 7.498239277360661e-06, "loss": 2.840520324707031, "step": 629500 }, { "epoch": 0.7596962783509789, "learning_rate": 7.497835441892923e-06, "loss": 2.8284671020507814, "step": 629600 }, { "epoch": 0.7598169416734615, "learning_rate": 7.497431606425184e-06, "loss": 2.8107119750976564, "step": 629700 }, { "epoch": 0.7599376049959442, "learning_rate": 7.4970277709574455e-06, "loss": 2.817759704589844, "step": 629800 }, { "epoch": 0.7600582683184269, "learning_rate": 7.4966239354897075e-06, "loss": 2.7947119140625, "step": 629900 }, { "epoch": 0.7601789316409095, "learning_rate": 7.4962201000219695e-06, "loss": 2.827834167480469, "step": 630000 }, { "epoch": 0.7602995949633923, "learning_rate": 7.495816264554231e-06, "loss": 2.806748046875, "step": 630100 }, { "epoch": 0.7604202582858749, "learning_rate": 7.495412429086493e-06, "loss": 2.8078036499023438, "step": 630200 }, { "epoch": 0.7605409216083576, "learning_rate": 7.4950085936187546e-06, "loss": 2.7935491943359376, "step": 630300 }, { "epoch": 0.7606615849308404, "learning_rate": 7.4946047581510165e-06, "loss": 2.824662780761719, "step": 630400 }, { "epoch": 0.760782248253323, "learning_rate": 7.494200922683277e-06, "loss": 2.8324224853515627, "step": 630500 }, { "epoch": 0.7609029115758057, "learning_rate": 7.493797087215539e-06, "loss": 2.824881896972656, "step": 630600 }, { "epoch": 0.7610235748982883, "learning_rate": 7.4933932517478e-06, "loss": 2.809110107421875, "step": 630700 }, { "epoch": 0.761144238220771, "learning_rate": 7.492989416280062e-06, "loss": 2.8109576416015627, "step": 630800 }, { "epoch": 0.7612649015432538, "learning_rate": 7.492585580812324e-06, "loss": 2.839380798339844, "step": 630900 }, { "epoch": 0.7613855648657364, "learning_rate": 7.492181745344586e-06, "loss": 2.8052963256835937, "step": 631000 }, { "epoch": 0.7615062281882191, "learning_rate": 7.491777909876847e-06, "loss": 2.8299984741210937, "step": 631100 }, { "epoch": 0.7616268915107017, "learning_rate": 7.491374074409109e-06, "loss": 2.8344342041015627, "step": 631200 }, { "epoch": 0.7617475548331845, "learning_rate": 7.490970238941369e-06, "loss": 2.7963909912109375, "step": 631300 }, { "epoch": 0.7618682181556672, "learning_rate": 7.490566403473631e-06, "loss": 2.819774169921875, "step": 631400 }, { "epoch": 0.7619888814781498, "learning_rate": 7.490162568005893e-06, "loss": 2.829229431152344, "step": 631500 }, { "epoch": 0.7621095448006325, "learning_rate": 7.489758732538155e-06, "loss": 2.7972030639648438, "step": 631600 }, { "epoch": 0.7622302081231151, "learning_rate": 7.489354897070416e-06, "loss": 2.8223831176757814, "step": 631700 }, { "epoch": 0.7623508714455979, "learning_rate": 7.488951061602678e-06, "loss": 2.827274169921875, "step": 631800 }, { "epoch": 0.7624715347680806, "learning_rate": 7.48854722613494e-06, "loss": 2.8172030639648438, "step": 631900 }, { "epoch": 0.7625921980905632, "learning_rate": 7.4881433906672015e-06, "loss": 2.799857177734375, "step": 632000 }, { "epoch": 0.762712861413046, "learning_rate": 7.487739555199463e-06, "loss": 2.80046630859375, "step": 632100 }, { "epoch": 0.7628335247355286, "learning_rate": 7.487335719731725e-06, "loss": 2.8192620849609376, "step": 632200 }, { "epoch": 0.7629541880580113, "learning_rate": 7.486931884263986e-06, "loss": 2.8029095458984377, "step": 632300 }, { "epoch": 0.763074851380494, "learning_rate": 7.486528048796248e-06, "loss": 2.8075775146484374, "step": 632400 }, { "epoch": 0.7631955147029766, "learning_rate": 7.48612421332851e-06, "loss": 2.8197528076171876, "step": 632500 }, { "epoch": 0.7633161780254594, "learning_rate": 7.485720377860771e-06, "loss": 2.798919372558594, "step": 632600 }, { "epoch": 0.7634368413479421, "learning_rate": 7.485316542393033e-06, "loss": 2.815196228027344, "step": 632700 }, { "epoch": 0.7635575046704247, "learning_rate": 7.484912706925295e-06, "loss": 2.795498046875, "step": 632800 }, { "epoch": 0.7636781679929074, "learning_rate": 7.484508871457555e-06, "loss": 2.836619567871094, "step": 632900 }, { "epoch": 0.7637988313153901, "learning_rate": 7.484105035989817e-06, "loss": 2.8059762573242186, "step": 633000 }, { "epoch": 0.7639194946378728, "learning_rate": 7.483701200522079e-06, "loss": 2.806063537597656, "step": 633100 }, { "epoch": 0.7640401579603555, "learning_rate": 7.48329736505434e-06, "loss": 2.806720886230469, "step": 633200 }, { "epoch": 0.7641608212828381, "learning_rate": 7.482893529586602e-06, "loss": 2.82459228515625, "step": 633300 }, { "epoch": 0.7642814846053209, "learning_rate": 7.482489694118864e-06, "loss": 2.8183721923828124, "step": 633400 }, { "epoch": 0.7644021479278035, "learning_rate": 7.482085858651126e-06, "loss": 2.7859466552734373, "step": 633500 }, { "epoch": 0.7645228112502862, "learning_rate": 7.481682023183387e-06, "loss": 2.7920452880859377, "step": 633600 }, { "epoch": 0.7646434745727689, "learning_rate": 7.481278187715649e-06, "loss": 2.826982116699219, "step": 633700 }, { "epoch": 0.7647641378952516, "learning_rate": 7.4808743522479096e-06, "loss": 2.8122933959960936, "step": 633800 }, { "epoch": 0.7648848012177343, "learning_rate": 7.4804705167801715e-06, "loss": 2.8242767333984373, "step": 633900 }, { "epoch": 0.7650054645402169, "learning_rate": 7.4800666813124335e-06, "loss": 2.80056640625, "step": 634000 }, { "epoch": 0.7651261278626996, "learning_rate": 7.4796628458446955e-06, "loss": 2.8149404907226563, "step": 634100 }, { "epoch": 0.7652467911851824, "learning_rate": 7.479259010376957e-06, "loss": 2.8430496215820313, "step": 634200 }, { "epoch": 0.765367454507665, "learning_rate": 7.478855174909219e-06, "loss": 2.825057067871094, "step": 634300 }, { "epoch": 0.7654881178301477, "learning_rate": 7.478451339441481e-06, "loss": 2.7937969970703125, "step": 634400 }, { "epoch": 0.7656087811526303, "learning_rate": 7.478047503973742e-06, "loss": 2.8096853637695314, "step": 634500 }, { "epoch": 0.765729444475113, "learning_rate": 7.477643668506003e-06, "loss": 2.814560546875, "step": 634600 }, { "epoch": 0.7658501077975958, "learning_rate": 7.477239833038265e-06, "loss": 2.814894104003906, "step": 634700 }, { "epoch": 0.7659707711200784, "learning_rate": 7.476835997570526e-06, "loss": 2.8021551513671876, "step": 634800 }, { "epoch": 0.7660914344425611, "learning_rate": 7.476432162102788e-06, "loss": 2.8287619018554686, "step": 634900 }, { "epoch": 0.7662120977650437, "learning_rate": 7.47602832663505e-06, "loss": 2.8066400146484374, "step": 635000 }, { "epoch": 0.7663327610875265, "learning_rate": 7.475624491167311e-06, "loss": 2.8202584838867186, "step": 635100 }, { "epoch": 0.7664534244100092, "learning_rate": 7.475220655699573e-06, "loss": 2.808660583496094, "step": 635200 }, { "epoch": 0.7665740877324918, "learning_rate": 7.474816820231835e-06, "loss": 2.8035342407226564, "step": 635300 }, { "epoch": 0.7666947510549745, "learning_rate": 7.474412984764095e-06, "loss": 2.8066366577148436, "step": 635400 }, { "epoch": 0.7668154143774571, "learning_rate": 7.474009149296357e-06, "loss": 2.8064675903320313, "step": 635500 }, { "epoch": 0.7669360776999399, "learning_rate": 7.473605313828619e-06, "loss": 2.8260287475585937, "step": 635600 }, { "epoch": 0.7670567410224226, "learning_rate": 7.4732014783608804e-06, "loss": 2.81394775390625, "step": 635700 }, { "epoch": 0.7671774043449052, "learning_rate": 7.4727976428931424e-06, "loss": 2.805430908203125, "step": 635800 }, { "epoch": 0.767298067667388, "learning_rate": 7.472393807425404e-06, "loss": 2.825620422363281, "step": 635900 }, { "epoch": 0.7674187309898706, "learning_rate": 7.471989971957666e-06, "loss": 2.8045498657226564, "step": 636000 }, { "epoch": 0.7675393943123533, "learning_rate": 7.4715861364899275e-06, "loss": 2.76764404296875, "step": 636100 }, { "epoch": 0.767660057634836, "learning_rate": 7.471182301022189e-06, "loss": 2.80500244140625, "step": 636200 }, { "epoch": 0.7677807209573186, "learning_rate": 7.47077846555445e-06, "loss": 2.7840670776367187, "step": 636300 }, { "epoch": 0.7679013842798014, "learning_rate": 7.470374630086712e-06, "loss": 2.82157470703125, "step": 636400 }, { "epoch": 0.768022047602284, "learning_rate": 7.469970794618974e-06, "loss": 2.8102056884765627, "step": 636500 }, { "epoch": 0.7681427109247667, "learning_rate": 7.469566959151236e-06, "loss": 2.7919244384765625, "step": 636600 }, { "epoch": 0.7682633742472494, "learning_rate": 7.469163123683497e-06, "loss": 2.8040496826171877, "step": 636700 }, { "epoch": 0.7683840375697321, "learning_rate": 7.468759288215759e-06, "loss": 2.8322763061523437, "step": 636800 }, { "epoch": 0.7685047008922148, "learning_rate": 7.468355452748021e-06, "loss": 2.8125839233398438, "step": 636900 }, { "epoch": 0.7686253642146974, "learning_rate": 7.467951617280281e-06, "loss": 2.81189208984375, "step": 637000 }, { "epoch": 0.7687460275371801, "learning_rate": 7.467547781812543e-06, "loss": 2.7913079833984376, "step": 637100 }, { "epoch": 0.7688666908596629, "learning_rate": 7.467143946344805e-06, "loss": 2.7972946166992188, "step": 637200 }, { "epoch": 0.7689873541821455, "learning_rate": 7.466740110877066e-06, "loss": 2.7843026733398437, "step": 637300 }, { "epoch": 0.7691080175046282, "learning_rate": 7.466336275409328e-06, "loss": 2.8177694702148437, "step": 637400 }, { "epoch": 0.7692286808271108, "learning_rate": 7.46593243994159e-06, "loss": 2.794295654296875, "step": 637500 }, { "epoch": 0.7693493441495936, "learning_rate": 7.465528604473851e-06, "loss": 2.799768981933594, "step": 637600 }, { "epoch": 0.7694700074720763, "learning_rate": 7.465124769006113e-06, "loss": 2.788987731933594, "step": 637700 }, { "epoch": 0.7695906707945589, "learning_rate": 7.4647209335383745e-06, "loss": 2.7929547119140623, "step": 637800 }, { "epoch": 0.7697113341170416, "learning_rate": 7.464317098070636e-06, "loss": 2.7963330078125, "step": 637900 }, { "epoch": 0.7698319974395244, "learning_rate": 7.4639132626028976e-06, "loss": 2.7865264892578123, "step": 638000 }, { "epoch": 0.769952660762007, "learning_rate": 7.4635094271351596e-06, "loss": 2.802998352050781, "step": 638100 }, { "epoch": 0.7700733240844897, "learning_rate": 7.463105591667421e-06, "loss": 2.798790283203125, "step": 638200 }, { "epoch": 0.7701939874069723, "learning_rate": 7.462701756199683e-06, "loss": 2.814588928222656, "step": 638300 }, { "epoch": 0.770314650729455, "learning_rate": 7.462297920731945e-06, "loss": 2.8448245239257814, "step": 638400 }, { "epoch": 0.7704353140519378, "learning_rate": 7.461894085264207e-06, "loss": 2.7995623779296874, "step": 638500 }, { "epoch": 0.7705559773744204, "learning_rate": 7.461490249796468e-06, "loss": 2.7841168212890626, "step": 638600 }, { "epoch": 0.7706766406969031, "learning_rate": 7.461086414328729e-06, "loss": 2.809776611328125, "step": 638700 }, { "epoch": 0.7707973040193857, "learning_rate": 7.46068257886099e-06, "loss": 2.806551513671875, "step": 638800 }, { "epoch": 0.7709179673418685, "learning_rate": 7.460278743393252e-06, "loss": 2.799233093261719, "step": 638900 }, { "epoch": 0.7710386306643512, "learning_rate": 7.459874907925514e-06, "loss": 2.8224993896484376, "step": 639000 }, { "epoch": 0.7711592939868338, "learning_rate": 7.459471072457776e-06, "loss": 2.798675537109375, "step": 639100 }, { "epoch": 0.7712799573093165, "learning_rate": 7.459067236990037e-06, "loss": 2.8178729248046874, "step": 639200 }, { "epoch": 0.7714006206317991, "learning_rate": 7.458663401522299e-06, "loss": 2.787048645019531, "step": 639300 }, { "epoch": 0.7715212839542819, "learning_rate": 7.458259566054561e-06, "loss": 2.8220550537109377, "step": 639400 }, { "epoch": 0.7716419472767646, "learning_rate": 7.457855730586821e-06, "loss": 2.809775390625, "step": 639500 }, { "epoch": 0.7717626105992472, "learning_rate": 7.457451895119083e-06, "loss": 2.8032269287109375, "step": 639600 }, { "epoch": 0.77188327392173, "learning_rate": 7.457048059651345e-06, "loss": 2.802798156738281, "step": 639700 }, { "epoch": 0.7720039372442126, "learning_rate": 7.4566442241836065e-06, "loss": 2.7987185668945314, "step": 639800 }, { "epoch": 0.7721246005666953, "learning_rate": 7.4562403887158685e-06, "loss": 2.8019683837890623, "step": 639900 }, { "epoch": 0.772245263889178, "learning_rate": 7.4558365532481304e-06, "loss": 2.8094406127929688, "step": 640000 }, { "epoch": 0.7723659272116606, "learning_rate": 7.4554327177803924e-06, "loss": 2.781033935546875, "step": 640100 }, { "epoch": 0.7724865905341434, "learning_rate": 7.4550288823126536e-06, "loss": 2.830671691894531, "step": 640200 }, { "epoch": 0.772607253856626, "learning_rate": 7.454625046844915e-06, "loss": 2.8130642700195314, "step": 640300 }, { "epoch": 0.7727279171791087, "learning_rate": 7.454221211377176e-06, "loss": 2.795113830566406, "step": 640400 }, { "epoch": 0.7728485805015914, "learning_rate": 7.453817375909438e-06, "loss": 2.7911883544921876, "step": 640500 }, { "epoch": 0.7729692438240741, "learning_rate": 7.4534135404417e-06, "loss": 2.824063720703125, "step": 640600 }, { "epoch": 0.7730899071465568, "learning_rate": 7.453009704973962e-06, "loss": 2.7955221557617187, "step": 640700 }, { "epoch": 0.7732105704690394, "learning_rate": 7.452605869506223e-06, "loss": 2.810726318359375, "step": 640800 }, { "epoch": 0.7733312337915221, "learning_rate": 7.452202034038485e-06, "loss": 2.8075360107421874, "step": 640900 }, { "epoch": 0.7734518971140049, "learning_rate": 7.451798198570747e-06, "loss": 2.8090118408203124, "step": 641000 }, { "epoch": 0.7735725604364875, "learning_rate": 7.451394363103007e-06, "loss": 2.794954833984375, "step": 641100 }, { "epoch": 0.7736932237589702, "learning_rate": 7.450990527635269e-06, "loss": 2.7930673217773436, "step": 641200 }, { "epoch": 0.7738138870814528, "learning_rate": 7.450586692167531e-06, "loss": 2.783580627441406, "step": 641300 }, { "epoch": 0.7739345504039356, "learning_rate": 7.450182856699792e-06, "loss": 2.7946356201171874, "step": 641400 }, { "epoch": 0.7740552137264183, "learning_rate": 7.449779021232054e-06, "loss": 2.7804501342773436, "step": 641500 }, { "epoch": 0.7741758770489009, "learning_rate": 7.449375185764316e-06, "loss": 2.8231967163085936, "step": 641600 }, { "epoch": 0.7742965403713836, "learning_rate": 7.448971350296577e-06, "loss": 2.797424621582031, "step": 641700 }, { "epoch": 0.7744172036938662, "learning_rate": 7.448567514828839e-06, "loss": 2.8254598999023437, "step": 641800 }, { "epoch": 0.774537867016349, "learning_rate": 7.4481636793611005e-06, "loss": 2.800212097167969, "step": 641900 }, { "epoch": 0.7746585303388317, "learning_rate": 7.447759843893362e-06, "loss": 2.799847412109375, "step": 642000 }, { "epoch": 0.7747791936613143, "learning_rate": 7.447356008425624e-06, "loss": 2.7982672119140624, "step": 642100 }, { "epoch": 0.774899856983797, "learning_rate": 7.446952172957886e-06, "loss": 2.7974948120117187, "step": 642200 }, { "epoch": 0.7750205203062797, "learning_rate": 7.446548337490147e-06, "loss": 2.7808526611328124, "step": 642300 }, { "epoch": 0.7751411836287624, "learning_rate": 7.446144502022409e-06, "loss": 2.7849496459960936, "step": 642400 }, { "epoch": 0.7752618469512451, "learning_rate": 7.445740666554671e-06, "loss": 2.8252993774414064, "step": 642500 }, { "epoch": 0.7753825102737277, "learning_rate": 7.445336831086933e-06, "loss": 2.7983026123046875, "step": 642600 }, { "epoch": 0.7755031735962105, "learning_rate": 7.444932995619193e-06, "loss": 2.8225552368164064, "step": 642700 }, { "epoch": 0.7756238369186931, "learning_rate": 7.444529160151455e-06, "loss": 2.796225280761719, "step": 642800 }, { "epoch": 0.7757445002411758, "learning_rate": 7.444125324683716e-06, "loss": 2.797408142089844, "step": 642900 }, { "epoch": 0.7758651635636585, "learning_rate": 7.443721489215978e-06, "loss": 2.8313677978515623, "step": 643000 }, { "epoch": 0.7759858268861412, "learning_rate": 7.44331765374824e-06, "loss": 2.79855224609375, "step": 643100 }, { "epoch": 0.7761064902086239, "learning_rate": 7.442913818280502e-06, "loss": 2.8013034057617188, "step": 643200 }, { "epoch": 0.7762271535311066, "learning_rate": 7.442509982812763e-06, "loss": 2.791241455078125, "step": 643300 }, { "epoch": 0.7763478168535892, "learning_rate": 7.442106147345025e-06, "loss": 2.803466491699219, "step": 643400 }, { "epoch": 0.776468480176072, "learning_rate": 7.441702311877287e-06, "loss": 2.8065109252929688, "step": 643500 }, { "epoch": 0.7765891434985546, "learning_rate": 7.441298476409547e-06, "loss": 2.8209933471679687, "step": 643600 }, { "epoch": 0.7767098068210373, "learning_rate": 7.440894640941809e-06, "loss": 2.784701232910156, "step": 643700 }, { "epoch": 0.77683047014352, "learning_rate": 7.440490805474071e-06, "loss": 2.811717529296875, "step": 643800 }, { "epoch": 0.7769511334660026, "learning_rate": 7.4400869700063325e-06, "loss": 2.7684066772460936, "step": 643900 }, { "epoch": 0.7770717967884854, "learning_rate": 7.4396831345385945e-06, "loss": 2.8030841064453127, "step": 644000 }, { "epoch": 0.777192460110968, "learning_rate": 7.4392792990708565e-06, "loss": 2.801991271972656, "step": 644100 }, { "epoch": 0.7773131234334507, "learning_rate": 7.438875463603118e-06, "loss": 2.8076577758789063, "step": 644200 }, { "epoch": 0.7774337867559334, "learning_rate": 7.43847162813538e-06, "loss": 2.785273132324219, "step": 644300 }, { "epoch": 0.7775544500784161, "learning_rate": 7.438067792667641e-06, "loss": 2.7681045532226562, "step": 644400 }, { "epoch": 0.7776751134008988, "learning_rate": 7.437663957199902e-06, "loss": 2.8096875, "step": 644500 }, { "epoch": 0.7777957767233814, "learning_rate": 7.437260121732164e-06, "loss": 2.8151321411132812, "step": 644600 }, { "epoch": 0.7779164400458641, "learning_rate": 7.436856286264426e-06, "loss": 2.8049139404296874, "step": 644700 }, { "epoch": 0.7780371033683469, "learning_rate": 7.436452450796687e-06, "loss": 2.7531466674804688, "step": 644800 }, { "epoch": 0.7781577666908295, "learning_rate": 7.436048615328949e-06, "loss": 2.7882122802734375, "step": 644900 }, { "epoch": 0.7782784300133122, "learning_rate": 7.435644779861211e-06, "loss": 2.8069497680664064, "step": 645000 }, { "epoch": 0.7783990933357948, "learning_rate": 7.435240944393473e-06, "loss": 2.8038626098632813, "step": 645100 }, { "epoch": 0.7785197566582776, "learning_rate": 7.434837108925733e-06, "loss": 2.79199462890625, "step": 645200 }, { "epoch": 0.7786404199807603, "learning_rate": 7.434433273457995e-06, "loss": 2.8295538330078127, "step": 645300 }, { "epoch": 0.7787610833032429, "learning_rate": 7.434029437990256e-06, "loss": 2.8368130493164063, "step": 645400 }, { "epoch": 0.7788817466257256, "learning_rate": 7.433625602522518e-06, "loss": 2.80603759765625, "step": 645500 }, { "epoch": 0.7790024099482082, "learning_rate": 7.43322176705478e-06, "loss": 2.794247741699219, "step": 645600 }, { "epoch": 0.779123073270691, "learning_rate": 7.432817931587042e-06, "loss": 2.79450927734375, "step": 645700 }, { "epoch": 0.7792437365931737, "learning_rate": 7.432414096119303e-06, "loss": 2.794268798828125, "step": 645800 }, { "epoch": 0.7793643999156563, "learning_rate": 7.432010260651565e-06, "loss": 2.781707763671875, "step": 645900 }, { "epoch": 0.779485063238139, "learning_rate": 7.431606425183826e-06, "loss": 2.7842803955078126, "step": 646000 }, { "epoch": 0.7796057265606217, "learning_rate": 7.431202589716088e-06, "loss": 2.8273434448242187, "step": 646100 }, { "epoch": 0.7797263898831044, "learning_rate": 7.43079875424835e-06, "loss": 2.7945376586914064, "step": 646200 }, { "epoch": 0.7798470532055871, "learning_rate": 7.430394918780612e-06, "loss": 2.792893981933594, "step": 646300 }, { "epoch": 0.7799677165280697, "learning_rate": 7.429991083312873e-06, "loss": 2.814039611816406, "step": 646400 }, { "epoch": 0.7800883798505525, "learning_rate": 7.429587247845135e-06, "loss": 2.784273681640625, "step": 646500 }, { "epoch": 0.7802090431730351, "learning_rate": 7.429183412377397e-06, "loss": 2.811090087890625, "step": 646600 }, { "epoch": 0.7803297064955178, "learning_rate": 7.428779576909658e-06, "loss": 2.7727545166015624, "step": 646700 }, { "epoch": 0.7804503698180005, "learning_rate": 7.428375741441919e-06, "loss": 2.79545654296875, "step": 646800 }, { "epoch": 0.7805710331404832, "learning_rate": 7.427971905974181e-06, "loss": 2.8199188232421877, "step": 646900 }, { "epoch": 0.7806916964629659, "learning_rate": 7.427568070506442e-06, "loss": 2.8087591552734374, "step": 647000 }, { "epoch": 0.7808123597854485, "learning_rate": 7.427164235038704e-06, "loss": 2.8018902587890624, "step": 647100 }, { "epoch": 0.7809330231079312, "learning_rate": 7.426760399570966e-06, "loss": 2.8068023681640626, "step": 647200 }, { "epoch": 0.781053686430414, "learning_rate": 7.426356564103227e-06, "loss": 2.780206298828125, "step": 647300 }, { "epoch": 0.7811743497528966, "learning_rate": 7.425952728635489e-06, "loss": 2.8132147216796874, "step": 647400 }, { "epoch": 0.7812950130753793, "learning_rate": 7.425548893167751e-06, "loss": 2.7968673706054688, "step": 647500 }, { "epoch": 0.7814156763978619, "learning_rate": 7.4251450577000115e-06, "loss": 2.7901736450195314, "step": 647600 }, { "epoch": 0.7815363397203446, "learning_rate": 7.4247412222322734e-06, "loss": 2.797579650878906, "step": 647700 }, { "epoch": 0.7816570030428274, "learning_rate": 7.4243373867645354e-06, "loss": 2.7747537231445314, "step": 647800 }, { "epoch": 0.78177766636531, "learning_rate": 7.4239335512967966e-06, "loss": 2.792848815917969, "step": 647900 }, { "epoch": 0.7818983296877927, "learning_rate": 7.4235297158290585e-06, "loss": 2.8133364868164064, "step": 648000 }, { "epoch": 0.7820189930102753, "learning_rate": 7.4231258803613205e-06, "loss": 2.8114834594726563, "step": 648100 }, { "epoch": 0.7821396563327581, "learning_rate": 7.4227220448935825e-06, "loss": 2.80548095703125, "step": 648200 }, { "epoch": 0.7822603196552408, "learning_rate": 7.422318209425844e-06, "loss": 2.790826721191406, "step": 648300 }, { "epoch": 0.7823809829777234, "learning_rate": 7.421914373958105e-06, "loss": 2.774923095703125, "step": 648400 }, { "epoch": 0.7825016463002061, "learning_rate": 7.421510538490366e-06, "loss": 2.7789620971679687, "step": 648500 }, { "epoch": 0.7826223096226889, "learning_rate": 7.421106703022628e-06, "loss": 2.8081011962890625, "step": 648600 }, { "epoch": 0.7827429729451715, "learning_rate": 7.42070286755489e-06, "loss": 2.7909561157226563, "step": 648700 }, { "epoch": 0.7828636362676542, "learning_rate": 7.420299032087152e-06, "loss": 2.7952871704101563, "step": 648800 }, { "epoch": 0.7829842995901368, "learning_rate": 7.419895196619413e-06, "loss": 2.8052932739257814, "step": 648900 }, { "epoch": 0.7831049629126196, "learning_rate": 7.419491361151675e-06, "loss": 2.819377136230469, "step": 649000 }, { "epoch": 0.7832256262351023, "learning_rate": 7.419087525683937e-06, "loss": 2.82023681640625, "step": 649100 }, { "epoch": 0.7833462895575849, "learning_rate": 7.418683690216198e-06, "loss": 2.8108856201171877, "step": 649200 }, { "epoch": 0.7834669528800676, "learning_rate": 7.418279854748459e-06, "loss": 2.781102294921875, "step": 649300 }, { "epoch": 0.7835876162025502, "learning_rate": 7.417876019280721e-06, "loss": 2.7746896362304687, "step": 649400 }, { "epoch": 0.783708279525033, "learning_rate": 7.417472183812982e-06, "loss": 2.791792907714844, "step": 649500 }, { "epoch": 0.7838289428475157, "learning_rate": 7.417068348345244e-06, "loss": 2.77331298828125, "step": 649600 }, { "epoch": 0.7839496061699983, "learning_rate": 7.416664512877506e-06, "loss": 2.812242431640625, "step": 649700 }, { "epoch": 0.784070269492481, "learning_rate": 7.4162606774097675e-06, "loss": 2.780318298339844, "step": 649800 }, { "epoch": 0.7841909328149637, "learning_rate": 7.4158568419420294e-06, "loss": 2.813304138183594, "step": 649900 }, { "epoch": 0.7843115961374464, "learning_rate": 7.415453006474291e-06, "loss": 2.8148846435546875, "step": 650000 }, { "epoch": 0.7844322594599291, "learning_rate": 7.415049171006552e-06, "loss": 2.807090148925781, "step": 650100 }, { "epoch": 0.7845529227824117, "learning_rate": 7.414645335538814e-06, "loss": 2.820609436035156, "step": 650200 }, { "epoch": 0.7846735861048945, "learning_rate": 7.414241500071076e-06, "loss": 2.8246429443359373, "step": 650300 }, { "epoch": 0.7847942494273771, "learning_rate": 7.413837664603337e-06, "loss": 2.8008038330078127, "step": 650400 }, { "epoch": 0.7849149127498598, "learning_rate": 7.413433829135599e-06, "loss": 2.79761962890625, "step": 650500 }, { "epoch": 0.7850355760723425, "learning_rate": 7.413029993667861e-06, "loss": 2.8181552124023437, "step": 650600 }, { "epoch": 0.7851562393948252, "learning_rate": 7.412626158200123e-06, "loss": 2.813277282714844, "step": 650700 }, { "epoch": 0.7852769027173079, "learning_rate": 7.412222322732384e-06, "loss": 2.7930374145507812, "step": 650800 }, { "epoch": 0.7853975660397905, "learning_rate": 7.411818487264645e-06, "loss": 2.785684814453125, "step": 650900 }, { "epoch": 0.7855182293622732, "learning_rate": 7.411414651796906e-06, "loss": 2.800728454589844, "step": 651000 }, { "epoch": 0.785638892684756, "learning_rate": 7.411010816329168e-06, "loss": 2.812364196777344, "step": 651100 }, { "epoch": 0.7857595560072386, "learning_rate": 7.41060698086143e-06, "loss": 2.7963671875, "step": 651200 }, { "epoch": 0.7858802193297213, "learning_rate": 7.410203145393692e-06, "loss": 2.78601806640625, "step": 651300 }, { "epoch": 0.7860008826522039, "learning_rate": 7.409799309925953e-06, "loss": 2.7887860107421876, "step": 651400 }, { "epoch": 0.7861215459746866, "learning_rate": 7.409395474458215e-06, "loss": 2.8027056884765624, "step": 651500 }, { "epoch": 0.7862422092971694, "learning_rate": 7.408991638990477e-06, "loss": 2.8188494873046874, "step": 651600 }, { "epoch": 0.786362872619652, "learning_rate": 7.4085878035227375e-06, "loss": 2.806413269042969, "step": 651700 }, { "epoch": 0.7864835359421347, "learning_rate": 7.4081839680549995e-06, "loss": 2.790466613769531, "step": 651800 }, { "epoch": 0.7866041992646173, "learning_rate": 7.4077801325872615e-06, "loss": 2.8119375610351565, "step": 651900 }, { "epoch": 0.7867248625871001, "learning_rate": 7.407376297119523e-06, "loss": 2.8192398071289064, "step": 652000 }, { "epoch": 0.7868455259095828, "learning_rate": 7.406972461651785e-06, "loss": 2.777142333984375, "step": 652100 }, { "epoch": 0.7869661892320654, "learning_rate": 7.4065686261840466e-06, "loss": 2.7916253662109374, "step": 652200 }, { "epoch": 0.7870868525545481, "learning_rate": 7.406164790716308e-06, "loss": 2.8010763549804687, "step": 652300 }, { "epoch": 0.7872075158770308, "learning_rate": 7.40576095524857e-06, "loss": 2.799225158691406, "step": 652400 }, { "epoch": 0.7873281791995135, "learning_rate": 7.405357119780831e-06, "loss": 2.8012130737304686, "step": 652500 }, { "epoch": 0.7874488425219962, "learning_rate": 7.404953284313092e-06, "loss": 2.792757873535156, "step": 652600 }, { "epoch": 0.7875695058444788, "learning_rate": 7.404549448845354e-06, "loss": 2.7983407592773437, "step": 652700 }, { "epoch": 0.7876901691669616, "learning_rate": 7.404145613377616e-06, "loss": 2.7867816162109373, "step": 652800 }, { "epoch": 0.7878108324894442, "learning_rate": 7.403741777909877e-06, "loss": 2.7692584228515624, "step": 652900 }, { "epoch": 0.7879314958119269, "learning_rate": 7.403337942442139e-06, "loss": 2.82015625, "step": 653000 }, { "epoch": 0.7880521591344096, "learning_rate": 7.402934106974401e-06, "loss": 2.781053466796875, "step": 653100 }, { "epoch": 0.7881728224568922, "learning_rate": 7.402530271506663e-06, "loss": 2.7840753173828126, "step": 653200 }, { "epoch": 0.788293485779375, "learning_rate": 7.402126436038923e-06, "loss": 2.784112854003906, "step": 653300 }, { "epoch": 0.7884141491018577, "learning_rate": 7.401722600571185e-06, "loss": 2.772276611328125, "step": 653400 }, { "epoch": 0.7885348124243403, "learning_rate": 7.401318765103446e-06, "loss": 2.7786004638671873, "step": 653500 }, { "epoch": 0.788655475746823, "learning_rate": 7.400914929635708e-06, "loss": 2.8094366455078124, "step": 653600 }, { "epoch": 0.7887761390693057, "learning_rate": 7.40051109416797e-06, "loss": 2.808651123046875, "step": 653700 }, { "epoch": 0.7888968023917884, "learning_rate": 7.400107258700232e-06, "loss": 2.8094168090820313, "step": 653800 }, { "epoch": 0.7890174657142711, "learning_rate": 7.3997034232324935e-06, "loss": 2.786241149902344, "step": 653900 }, { "epoch": 0.7891381290367537, "learning_rate": 7.3992995877647555e-06, "loss": 2.797081298828125, "step": 654000 }, { "epoch": 0.7892587923592365, "learning_rate": 7.3988957522970175e-06, "loss": 2.7973736572265624, "step": 654100 }, { "epoch": 0.7893794556817191, "learning_rate": 7.398491916829278e-06, "loss": 2.7939804077148436, "step": 654200 }, { "epoch": 0.7895001190042018, "learning_rate": 7.39808808136154e-06, "loss": 2.792857360839844, "step": 654300 }, { "epoch": 0.7896207823266845, "learning_rate": 7.397684245893802e-06, "loss": 2.78983642578125, "step": 654400 }, { "epoch": 0.7897414456491672, "learning_rate": 7.397280410426063e-06, "loss": 2.784940490722656, "step": 654500 }, { "epoch": 0.7898621089716499, "learning_rate": 7.396876574958325e-06, "loss": 2.7826373291015627, "step": 654600 }, { "epoch": 0.7899827722941325, "learning_rate": 7.396472739490587e-06, "loss": 2.796996765136719, "step": 654700 }, { "epoch": 0.7901034356166152, "learning_rate": 7.396068904022849e-06, "loss": 2.7768310546875, "step": 654800 }, { "epoch": 0.790224098939098, "learning_rate": 7.39566506855511e-06, "loss": 2.819232177734375, "step": 654900 }, { "epoch": 0.7903447622615806, "learning_rate": 7.395261233087371e-06, "loss": 2.8174673461914064, "step": 655000 }, { "epoch": 0.7904654255840633, "learning_rate": 7.394857397619632e-06, "loss": 2.7847885131835937, "step": 655100 }, { "epoch": 0.7905860889065459, "learning_rate": 7.394453562151894e-06, "loss": 2.784398498535156, "step": 655200 }, { "epoch": 0.7907067522290286, "learning_rate": 7.394049726684156e-06, "loss": 2.8010406494140625, "step": 655300 }, { "epoch": 0.7908274155515114, "learning_rate": 7.393645891216418e-06, "loss": 2.7829110717773435, "step": 655400 }, { "epoch": 0.790948078873994, "learning_rate": 7.393242055748679e-06, "loss": 2.798858642578125, "step": 655500 }, { "epoch": 0.7910687421964767, "learning_rate": 7.392838220280941e-06, "loss": 2.7971316528320314, "step": 655600 }, { "epoch": 0.7911894055189593, "learning_rate": 7.392434384813203e-06, "loss": 2.7993093872070314, "step": 655700 }, { "epoch": 0.7913100688414421, "learning_rate": 7.3920305493454635e-06, "loss": 2.7924017333984374, "step": 655800 }, { "epoch": 0.7914307321639248, "learning_rate": 7.3916267138777255e-06, "loss": 2.802512512207031, "step": 655900 }, { "epoch": 0.7915513954864074, "learning_rate": 7.3912228784099875e-06, "loss": 2.8014016723632813, "step": 656000 }, { "epoch": 0.7916720588088901, "learning_rate": 7.390819042942249e-06, "loss": 2.8237478637695315, "step": 656100 }, { "epoch": 0.7917927221313728, "learning_rate": 7.390415207474511e-06, "loss": 2.8255386352539062, "step": 656200 }, { "epoch": 0.7919133854538555, "learning_rate": 7.390011372006773e-06, "loss": 2.79927734375, "step": 656300 }, { "epoch": 0.7920340487763382, "learning_rate": 7.389607536539034e-06, "loss": 2.7872320556640626, "step": 656400 }, { "epoch": 0.7921547120988208, "learning_rate": 7.389203701071296e-06, "loss": 2.7966079711914062, "step": 656500 }, { "epoch": 0.7922753754213036, "learning_rate": 7.388799865603557e-06, "loss": 2.8005999755859374, "step": 656600 }, { "epoch": 0.7923960387437862, "learning_rate": 7.388396030135818e-06, "loss": 2.7729583740234376, "step": 656700 }, { "epoch": 0.7925167020662689, "learning_rate": 7.38799219466808e-06, "loss": 2.788101806640625, "step": 656800 }, { "epoch": 0.7926373653887516, "learning_rate": 7.387588359200342e-06, "loss": 2.818209533691406, "step": 656900 }, { "epoch": 0.7927580287112342, "learning_rate": 7.387184523732603e-06, "loss": 2.7764602661132813, "step": 657000 }, { "epoch": 0.792878692033717, "learning_rate": 7.386780688264865e-06, "loss": 2.783212890625, "step": 657100 }, { "epoch": 0.7929993553561996, "learning_rate": 7.386376852797127e-06, "loss": 2.802919921875, "step": 657200 }, { "epoch": 0.7931200186786823, "learning_rate": 7.385973017329389e-06, "loss": 2.82133544921875, "step": 657300 }, { "epoch": 0.793240682001165, "learning_rate": 7.385569181861649e-06, "loss": 2.771608581542969, "step": 657400 }, { "epoch": 0.7933613453236477, "learning_rate": 7.385165346393911e-06, "loss": 2.792261962890625, "step": 657500 }, { "epoch": 0.7934820086461304, "learning_rate": 7.3847615109261724e-06, "loss": 2.7808551025390624, "step": 657600 }, { "epoch": 0.793602671968613, "learning_rate": 7.384357675458434e-06, "loss": 2.7785824584960936, "step": 657700 }, { "epoch": 0.7937233352910957, "learning_rate": 7.383953839990696e-06, "loss": 2.7540673828125, "step": 657800 }, { "epoch": 0.7938439986135785, "learning_rate": 7.383550004522958e-06, "loss": 2.778395080566406, "step": 657900 }, { "epoch": 0.7939646619360611, "learning_rate": 7.3831461690552195e-06, "loss": 2.7874209594726564, "step": 658000 }, { "epoch": 0.7940853252585438, "learning_rate": 7.3827423335874815e-06, "loss": 2.82052490234375, "step": 658100 }, { "epoch": 0.7942059885810264, "learning_rate": 7.382338498119742e-06, "loss": 2.7886251831054687, "step": 658200 }, { "epoch": 0.7943266519035092, "learning_rate": 7.381934662652004e-06, "loss": 2.8138217163085937, "step": 658300 }, { "epoch": 0.7944473152259919, "learning_rate": 7.381530827184266e-06, "loss": 2.7949624633789063, "step": 658400 }, { "epoch": 0.7945679785484745, "learning_rate": 7.381126991716528e-06, "loss": 2.7925430297851563, "step": 658500 }, { "epoch": 0.7946886418709572, "learning_rate": 7.380723156248789e-06, "loss": 2.7645278930664063, "step": 658600 }, { "epoch": 0.79480930519344, "learning_rate": 7.380319320781051e-06, "loss": 2.806607971191406, "step": 658700 }, { "epoch": 0.7949299685159226, "learning_rate": 7.379915485313313e-06, "loss": 2.790441589355469, "step": 658800 }, { "epoch": 0.7950506318384053, "learning_rate": 7.379511649845574e-06, "loss": 2.795, "step": 658900 }, { "epoch": 0.7951712951608879, "learning_rate": 7.379107814377836e-06, "loss": 2.809898681640625, "step": 659000 }, { "epoch": 0.7952919584833706, "learning_rate": 7.378703978910097e-06, "loss": 2.7773202514648436, "step": 659100 }, { "epoch": 0.7954126218058534, "learning_rate": 7.378300143442358e-06, "loss": 2.7560894775390623, "step": 659200 }, { "epoch": 0.795533285128336, "learning_rate": 7.37789630797462e-06, "loss": 2.773792724609375, "step": 659300 }, { "epoch": 0.7956539484508187, "learning_rate": 7.377492472506882e-06, "loss": 2.7895248413085936, "step": 659400 }, { "epoch": 0.7957746117733013, "learning_rate": 7.377088637039143e-06, "loss": 2.7947698974609376, "step": 659500 }, { "epoch": 0.7958952750957841, "learning_rate": 7.376684801571405e-06, "loss": 2.7723992919921874, "step": 659600 }, { "epoch": 0.7960159384182668, "learning_rate": 7.376280966103667e-06, "loss": 2.7925439453125, "step": 659700 }, { "epoch": 0.7961366017407494, "learning_rate": 7.375877130635929e-06, "loss": 2.807578125, "step": 659800 }, { "epoch": 0.7962572650632321, "learning_rate": 7.3754732951681896e-06, "loss": 2.782637023925781, "step": 659900 }, { "epoch": 0.7963779283857148, "learning_rate": 7.3750694597004515e-06, "loss": 2.7776123046875, "step": 660000 }, { "epoch": 0.7964985917081975, "learning_rate": 7.374665624232713e-06, "loss": 2.789456787109375, "step": 660100 }, { "epoch": 0.7966192550306802, "learning_rate": 7.374261788764975e-06, "loss": 2.791808776855469, "step": 660200 }, { "epoch": 0.7967399183531628, "learning_rate": 7.373857953297237e-06, "loss": 2.7873214721679687, "step": 660300 }, { "epoch": 0.7968605816756456, "learning_rate": 7.373454117829499e-06, "loss": 2.751332092285156, "step": 660400 }, { "epoch": 0.7969812449981282, "learning_rate": 7.37305028236176e-06, "loss": 2.786790771484375, "step": 660500 }, { "epoch": 0.7971019083206109, "learning_rate": 7.372646446894022e-06, "loss": 2.7691900634765627, "step": 660600 }, { "epoch": 0.7972225716430936, "learning_rate": 7.372242611426282e-06, "loss": 2.773759765625, "step": 660700 }, { "epoch": 0.7973432349655762, "learning_rate": 7.371838775958544e-06, "loss": 2.795589599609375, "step": 660800 }, { "epoch": 0.797463898288059, "learning_rate": 7.371434940490806e-06, "loss": 2.792037353515625, "step": 660900 }, { "epoch": 0.7975845616105416, "learning_rate": 7.371031105023068e-06, "loss": 2.7888421630859375, "step": 661000 }, { "epoch": 0.7977052249330243, "learning_rate": 7.370627269555329e-06, "loss": 2.8155197143554687, "step": 661100 }, { "epoch": 0.797825888255507, "learning_rate": 7.370223434087591e-06, "loss": 2.8025848388671877, "step": 661200 }, { "epoch": 0.7979465515779897, "learning_rate": 7.369819598619853e-06, "loss": 2.7878948974609377, "step": 661300 }, { "epoch": 0.7980672149004724, "learning_rate": 7.369415763152114e-06, "loss": 2.7930889892578126, "step": 661400 }, { "epoch": 0.798187878222955, "learning_rate": 7.369011927684375e-06, "loss": 2.79222900390625, "step": 661500 }, { "epoch": 0.7983085415454377, "learning_rate": 7.368608092216637e-06, "loss": 2.787877197265625, "step": 661600 }, { "epoch": 0.7984292048679205, "learning_rate": 7.3682042567488985e-06, "loss": 2.7590106201171873, "step": 661700 }, { "epoch": 0.7985498681904031, "learning_rate": 7.3678004212811605e-06, "loss": 2.769784240722656, "step": 661800 }, { "epoch": 0.7986705315128858, "learning_rate": 7.3673965858134224e-06, "loss": 2.7575341796875, "step": 661900 }, { "epoch": 0.7987911948353684, "learning_rate": 7.3669927503456836e-06, "loss": 2.8153366088867187, "step": 662000 }, { "epoch": 0.7989118581578512, "learning_rate": 7.3665889148779456e-06, "loss": 2.7815582275390627, "step": 662100 }, { "epoch": 0.7990325214803339, "learning_rate": 7.3661850794102075e-06, "loss": 2.8085784912109375, "step": 662200 }, { "epoch": 0.7991531848028165, "learning_rate": 7.365781243942468e-06, "loss": 2.7746963500976562, "step": 662300 }, { "epoch": 0.7992738481252992, "learning_rate": 7.36537740847473e-06, "loss": 2.803014221191406, "step": 662400 }, { "epoch": 0.7993945114477818, "learning_rate": 7.364973573006992e-06, "loss": 2.785816955566406, "step": 662500 }, { "epoch": 0.7995151747702646, "learning_rate": 7.364569737539253e-06, "loss": 2.8019845581054685, "step": 662600 }, { "epoch": 0.7996358380927473, "learning_rate": 7.364165902071515e-06, "loss": 2.7981805419921875, "step": 662700 }, { "epoch": 0.7997565014152299, "learning_rate": 7.363762066603777e-06, "loss": 2.801832275390625, "step": 662800 }, { "epoch": 0.7998771647377126, "learning_rate": 7.363358231136039e-06, "loss": 2.7599334716796875, "step": 662900 }, { "epoch": 0.7999978280601953, "learning_rate": 7.3629543956683e-06, "loss": 2.7765902709960937, "step": 663000 }, { "epoch": 0.800118491382678, "learning_rate": 7.362550560200561e-06, "loss": 2.7803604125976564, "step": 663100 }, { "epoch": 0.8002391547051607, "learning_rate": 7.362146724732822e-06, "loss": 2.805971984863281, "step": 663200 }, { "epoch": 0.8003598180276433, "learning_rate": 7.361742889265084e-06, "loss": 2.7982293701171876, "step": 663300 }, { "epoch": 0.8004804813501261, "learning_rate": 7.361339053797346e-06, "loss": 2.752122497558594, "step": 663400 }, { "epoch": 0.8006011446726087, "learning_rate": 7.360935218329608e-06, "loss": 2.759324951171875, "step": 663500 }, { "epoch": 0.8007218079950914, "learning_rate": 7.360531382861869e-06, "loss": 2.7706671142578125, "step": 663600 }, { "epoch": 0.8008424713175741, "learning_rate": 7.360127547394131e-06, "loss": 2.779388732910156, "step": 663700 }, { "epoch": 0.8009631346400568, "learning_rate": 7.359723711926393e-06, "loss": 2.7845867919921874, "step": 663800 }, { "epoch": 0.8010837979625395, "learning_rate": 7.3593198764586545e-06, "loss": 2.797130126953125, "step": 663900 }, { "epoch": 0.8012044612850222, "learning_rate": 7.358916040990916e-06, "loss": 2.783852233886719, "step": 664000 }, { "epoch": 0.8013251246075048, "learning_rate": 7.358512205523178e-06, "loss": 2.786119079589844, "step": 664100 }, { "epoch": 0.8014457879299876, "learning_rate": 7.358108370055439e-06, "loss": 2.767880859375, "step": 664200 }, { "epoch": 0.8015664512524702, "learning_rate": 7.357704534587701e-06, "loss": 2.794988098144531, "step": 664300 }, { "epoch": 0.8016871145749529, "learning_rate": 7.357300699119963e-06, "loss": 2.758273010253906, "step": 664400 }, { "epoch": 0.8018077778974356, "learning_rate": 7.356896863652224e-06, "loss": 2.791065673828125, "step": 664500 }, { "epoch": 0.8019284412199182, "learning_rate": 7.356493028184486e-06, "loss": 2.78525634765625, "step": 664600 }, { "epoch": 0.802049104542401, "learning_rate": 7.356089192716748e-06, "loss": 2.7733160400390626, "step": 664700 }, { "epoch": 0.8021697678648836, "learning_rate": 7.355685357249008e-06, "loss": 2.7771453857421875, "step": 664800 }, { "epoch": 0.8022904311873663, "learning_rate": 7.35528152178127e-06, "loss": 2.766620788574219, "step": 664900 }, { "epoch": 0.802411094509849, "learning_rate": 7.354877686313532e-06, "loss": 2.791540222167969, "step": 665000 }, { "epoch": 0.8025317578323317, "learning_rate": 7.354473850845793e-06, "loss": 2.7797222900390626, "step": 665100 }, { "epoch": 0.8026524211548144, "learning_rate": 7.354070015378055e-06, "loss": 2.7765823364257813, "step": 665200 }, { "epoch": 0.802773084477297, "learning_rate": 7.353666179910317e-06, "loss": 2.7628494262695313, "step": 665300 }, { "epoch": 0.8028937477997797, "learning_rate": 7.353262344442579e-06, "loss": 2.789728088378906, "step": 665400 }, { "epoch": 0.8030144111222625, "learning_rate": 7.35285850897484e-06, "loss": 2.764951171875, "step": 665500 }, { "epoch": 0.8031350744447451, "learning_rate": 7.352454673507101e-06, "loss": 2.7846725463867186, "step": 665600 }, { "epoch": 0.8032557377672278, "learning_rate": 7.3520508380393625e-06, "loss": 2.8048196411132813, "step": 665700 }, { "epoch": 0.8033764010897104, "learning_rate": 7.3516470025716245e-06, "loss": 2.7994088745117187, "step": 665800 }, { "epoch": 0.8034970644121932, "learning_rate": 7.3512431671038865e-06, "loss": 2.772532958984375, "step": 665900 }, { "epoch": 0.8036177277346759, "learning_rate": 7.3508393316361485e-06, "loss": 2.7886767578125, "step": 666000 }, { "epoch": 0.8037383910571585, "learning_rate": 7.35043549616841e-06, "loss": 2.805261535644531, "step": 666100 }, { "epoch": 0.8038590543796412, "learning_rate": 7.350031660700672e-06, "loss": 2.777310485839844, "step": 666200 }, { "epoch": 0.8039797177021238, "learning_rate": 7.3496278252329336e-06, "loss": 2.80323974609375, "step": 666300 }, { "epoch": 0.8041003810246066, "learning_rate": 7.349223989765194e-06, "loss": 2.7863595581054685, "step": 666400 }, { "epoch": 0.8042210443470893, "learning_rate": 7.348820154297456e-06, "loss": 2.7771896362304687, "step": 666500 }, { "epoch": 0.8043417076695719, "learning_rate": 7.348416318829718e-06, "loss": 2.7987991333007813, "step": 666600 }, { "epoch": 0.8044623709920546, "learning_rate": 7.348012483361979e-06, "loss": 2.7728643798828125, "step": 666700 }, { "epoch": 0.8045830343145373, "learning_rate": 7.347608647894241e-06, "loss": 2.8204156494140626, "step": 666800 }, { "epoch": 0.80470369763702, "learning_rate": 7.347204812426503e-06, "loss": 2.7827682495117188, "step": 666900 }, { "epoch": 0.8048243609595027, "learning_rate": 7.346800976958765e-06, "loss": 2.770790710449219, "step": 667000 }, { "epoch": 0.8049450242819853, "learning_rate": 7.346397141491026e-06, "loss": 2.807127685546875, "step": 667100 }, { "epoch": 0.8050656876044681, "learning_rate": 7.345993306023287e-06, "loss": 2.774967041015625, "step": 667200 }, { "epoch": 0.8051863509269507, "learning_rate": 7.345589470555548e-06, "loss": 2.772124938964844, "step": 667300 }, { "epoch": 0.8053070142494334, "learning_rate": 7.34518563508781e-06, "loss": 2.804805908203125, "step": 667400 }, { "epoch": 0.8054276775719161, "learning_rate": 7.344781799620072e-06, "loss": 2.7840206909179686, "step": 667500 }, { "epoch": 0.8055483408943988, "learning_rate": 7.344377964152334e-06, "loss": 2.7858447265625, "step": 667600 }, { "epoch": 0.8056690042168815, "learning_rate": 7.343974128684595e-06, "loss": 2.792890930175781, "step": 667700 }, { "epoch": 0.8057896675393641, "learning_rate": 7.343570293216857e-06, "loss": 2.7870553588867186, "step": 667800 }, { "epoch": 0.8059103308618468, "learning_rate": 7.343166457749119e-06, "loss": 2.798052978515625, "step": 667900 }, { "epoch": 0.8060309941843296, "learning_rate": 7.34276262228138e-06, "loss": 2.7840646362304686, "step": 668000 }, { "epoch": 0.8061516575068122, "learning_rate": 7.342358786813642e-06, "loss": 2.7588845825195314, "step": 668100 }, { "epoch": 0.8062723208292949, "learning_rate": 7.341954951345904e-06, "loss": 2.7744430541992187, "step": 668200 }, { "epoch": 0.8063929841517775, "learning_rate": 7.341551115878165e-06, "loss": 2.7746337890625, "step": 668300 }, { "epoch": 0.8065136474742602, "learning_rate": 7.341147280410427e-06, "loss": 2.7823443603515625, "step": 668400 }, { "epoch": 0.806634310796743, "learning_rate": 7.340743444942689e-06, "loss": 2.7789727783203126, "step": 668500 }, { "epoch": 0.8067549741192256, "learning_rate": 7.34033960947495e-06, "loss": 2.798805847167969, "step": 668600 }, { "epoch": 0.8068756374417083, "learning_rate": 7.339935774007212e-06, "loss": 2.782273864746094, "step": 668700 }, { "epoch": 0.8069963007641909, "learning_rate": 7.339531938539473e-06, "loss": 2.767358703613281, "step": 668800 }, { "epoch": 0.8071169640866737, "learning_rate": 7.339128103071734e-06, "loss": 2.775126953125, "step": 668900 }, { "epoch": 0.8072376274091564, "learning_rate": 7.338724267603996e-06, "loss": 2.785374755859375, "step": 669000 }, { "epoch": 0.807358290731639, "learning_rate": 7.338320432136258e-06, "loss": 2.773117980957031, "step": 669100 }, { "epoch": 0.8074789540541217, "learning_rate": 7.337916596668519e-06, "loss": 2.79136474609375, "step": 669200 }, { "epoch": 0.8075996173766045, "learning_rate": 7.337512761200781e-06, "loss": 2.75295654296875, "step": 669300 }, { "epoch": 0.8077202806990871, "learning_rate": 7.337108925733043e-06, "loss": 2.7753939819335938, "step": 669400 }, { "epoch": 0.8078409440215698, "learning_rate": 7.336705090265305e-06, "loss": 2.7691995239257814, "step": 669500 }, { "epoch": 0.8079616073440524, "learning_rate": 7.336301254797566e-06, "loss": 2.77121337890625, "step": 669600 }, { "epoch": 0.8080822706665352, "learning_rate": 7.335897419329827e-06, "loss": 2.805318603515625, "step": 669700 }, { "epoch": 0.8082029339890179, "learning_rate": 7.3354935838620886e-06, "loss": 2.758067932128906, "step": 669800 }, { "epoch": 0.8083235973115005, "learning_rate": 7.3350897483943505e-06, "loss": 2.7659542846679686, "step": 669900 }, { "epoch": 0.8084442606339832, "learning_rate": 7.3346859129266125e-06, "loss": 2.7943734741210937, "step": 670000 }, { "epoch": 0.8085649239564658, "learning_rate": 7.3342820774588745e-06, "loss": 2.7637985229492186, "step": 670100 }, { "epoch": 0.8086855872789486, "learning_rate": 7.333878241991136e-06, "loss": 2.7870721435546875, "step": 670200 }, { "epoch": 0.8088062506014313, "learning_rate": 7.333474406523398e-06, "loss": 2.791502685546875, "step": 670300 }, { "epoch": 0.8089269139239139, "learning_rate": 7.33307057105566e-06, "loss": 2.770005187988281, "step": 670400 }, { "epoch": 0.8090475772463966, "learning_rate": 7.33266673558792e-06, "loss": 2.7822671508789063, "step": 670500 }, { "epoch": 0.8091682405688793, "learning_rate": 7.332262900120182e-06, "loss": 2.7513616943359374, "step": 670600 }, { "epoch": 0.809288903891362, "learning_rate": 7.331859064652444e-06, "loss": 2.7921597290039064, "step": 670700 }, { "epoch": 0.8094095672138447, "learning_rate": 7.331455229184705e-06, "loss": 2.775643615722656, "step": 670800 }, { "epoch": 0.8095302305363273, "learning_rate": 7.331051393716967e-06, "loss": 2.7852047729492186, "step": 670900 }, { "epoch": 0.8096508938588101, "learning_rate": 7.330647558249229e-06, "loss": 2.772471618652344, "step": 671000 }, { "epoch": 0.8097715571812927, "learning_rate": 7.33024372278149e-06, "loss": 2.7878985595703125, "step": 671100 }, { "epoch": 0.8098922205037754, "learning_rate": 7.329839887313752e-06, "loss": 2.7733609008789064, "step": 671200 }, { "epoch": 0.8100128838262581, "learning_rate": 7.329436051846013e-06, "loss": 2.7803582763671875, "step": 671300 }, { "epoch": 0.8101335471487408, "learning_rate": 7.329032216378274e-06, "loss": 2.7941995239257813, "step": 671400 }, { "epoch": 0.8102542104712235, "learning_rate": 7.328628380910536e-06, "loss": 2.7581256103515623, "step": 671500 }, { "epoch": 0.8103748737937061, "learning_rate": 7.328224545442798e-06, "loss": 2.7770376586914063, "step": 671600 }, { "epoch": 0.8104955371161888, "learning_rate": 7.3278207099750594e-06, "loss": 2.764063720703125, "step": 671700 }, { "epoch": 0.8106162004386716, "learning_rate": 7.3274168745073214e-06, "loss": 2.7906890869140626, "step": 671800 }, { "epoch": 0.8107368637611542, "learning_rate": 7.327013039039583e-06, "loss": 2.7944598388671875, "step": 671900 }, { "epoch": 0.8108575270836369, "learning_rate": 7.326609203571845e-06, "loss": 2.762570495605469, "step": 672000 }, { "epoch": 0.8109781904061195, "learning_rate": 7.326205368104106e-06, "loss": 2.779108581542969, "step": 672100 }, { "epoch": 0.8110988537286022, "learning_rate": 7.325801532636368e-06, "loss": 2.782147216796875, "step": 672200 }, { "epoch": 0.811219517051085, "learning_rate": 7.325397697168629e-06, "loss": 2.779765319824219, "step": 672300 }, { "epoch": 0.8113401803735676, "learning_rate": 7.324993861700891e-06, "loss": 2.7478057861328127, "step": 672400 }, { "epoch": 0.8114608436960503, "learning_rate": 7.324590026233153e-06, "loss": 2.7575408935546877, "step": 672500 }, { "epoch": 0.8115815070185329, "learning_rate": 7.324186190765415e-06, "loss": 2.774888610839844, "step": 672600 }, { "epoch": 0.8117021703410157, "learning_rate": 7.323782355297676e-06, "loss": 2.770577392578125, "step": 672700 }, { "epoch": 0.8118228336634984, "learning_rate": 7.323378519829938e-06, "loss": 2.7907574462890623, "step": 672800 }, { "epoch": 0.811943496985981, "learning_rate": 7.322974684362198e-06, "loss": 2.792117004394531, "step": 672900 }, { "epoch": 0.8120641603084637, "learning_rate": 7.32257084889446e-06, "loss": 2.7660174560546875, "step": 673000 }, { "epoch": 0.8121848236309464, "learning_rate": 7.322167013426722e-06, "loss": 2.77701416015625, "step": 673100 }, { "epoch": 0.8123054869534291, "learning_rate": 7.321763177958984e-06, "loss": 2.7650604248046875, "step": 673200 }, { "epoch": 0.8124261502759118, "learning_rate": 7.321359342491245e-06, "loss": 2.7854238891601564, "step": 673300 }, { "epoch": 0.8125468135983944, "learning_rate": 7.320955507023507e-06, "loss": 2.776844482421875, "step": 673400 }, { "epoch": 0.8126674769208772, "learning_rate": 7.320551671555769e-06, "loss": 2.782826232910156, "step": 673500 }, { "epoch": 0.8127881402433598, "learning_rate": 7.32014783608803e-06, "loss": 2.7471697998046873, "step": 673600 }, { "epoch": 0.8129088035658425, "learning_rate": 7.3197440006202915e-06, "loss": 2.7987896728515627, "step": 673700 }, { "epoch": 0.8130294668883252, "learning_rate": 7.3193401651525535e-06, "loss": 2.7811871337890626, "step": 673800 }, { "epoch": 0.8131501302108078, "learning_rate": 7.318936329684815e-06, "loss": 2.7738702392578123, "step": 673900 }, { "epoch": 0.8132707935332906, "learning_rate": 7.3185324942170766e-06, "loss": 2.7958404541015627, "step": 674000 }, { "epoch": 0.8133914568557732, "learning_rate": 7.3181286587493386e-06, "loss": 2.8123013305664064, "step": 674100 }, { "epoch": 0.8135121201782559, "learning_rate": 7.3177248232816e-06, "loss": 2.7953521728515627, "step": 674200 }, { "epoch": 0.8136327835007386, "learning_rate": 7.317320987813862e-06, "loss": 2.7777886962890626, "step": 674300 }, { "epoch": 0.8137534468232213, "learning_rate": 7.316917152346124e-06, "loss": 2.7687893676757813, "step": 674400 }, { "epoch": 0.813874110145704, "learning_rate": 7.316513316878386e-06, "loss": 2.7885232543945313, "step": 674500 }, { "epoch": 0.8139947734681867, "learning_rate": 7.316109481410646e-06, "loss": 2.785223083496094, "step": 674600 }, { "epoch": 0.8141154367906693, "learning_rate": 7.315705645942908e-06, "loss": 2.78183349609375, "step": 674700 }, { "epoch": 0.8142361001131521, "learning_rate": 7.315301810475169e-06, "loss": 2.75867919921875, "step": 674800 }, { "epoch": 0.8143567634356347, "learning_rate": 7.314897975007431e-06, "loss": 2.7710635375976564, "step": 674900 }, { "epoch": 0.8144774267581174, "learning_rate": 7.314494139539693e-06, "loss": 2.7757638549804686, "step": 675000 }, { "epoch": 0.8145980900806001, "learning_rate": 7.314090304071955e-06, "loss": 2.797603759765625, "step": 675100 }, { "epoch": 0.8147187534030828, "learning_rate": 7.313686468604216e-06, "loss": 2.765887451171875, "step": 675200 }, { "epoch": 0.8148394167255655, "learning_rate": 7.313282633136478e-06, "loss": 2.7624163818359375, "step": 675300 }, { "epoch": 0.8149600800480481, "learning_rate": 7.312878797668738e-06, "loss": 2.788194580078125, "step": 675400 }, { "epoch": 0.8150807433705308, "learning_rate": 7.312474962201e-06, "loss": 2.798177490234375, "step": 675500 }, { "epoch": 0.8152014066930136, "learning_rate": 7.312071126733262e-06, "loss": 2.7722097778320314, "step": 675600 }, { "epoch": 0.8153220700154962, "learning_rate": 7.311667291265524e-06, "loss": 2.779398193359375, "step": 675700 }, { "epoch": 0.8154427333379789, "learning_rate": 7.3112634557977855e-06, "loss": 2.781210632324219, "step": 675800 }, { "epoch": 0.8155633966604615, "learning_rate": 7.3108596203300475e-06, "loss": 2.77276123046875, "step": 675900 }, { "epoch": 0.8156840599829442, "learning_rate": 7.3104557848623094e-06, "loss": 2.7947283935546876, "step": 676000 }, { "epoch": 0.815804723305427, "learning_rate": 7.310051949394571e-06, "loss": 2.80211669921875, "step": 676100 }, { "epoch": 0.8159253866279096, "learning_rate": 7.309648113926832e-06, "loss": 2.784278564453125, "step": 676200 }, { "epoch": 0.8160460499503923, "learning_rate": 7.309244278459094e-06, "loss": 2.790855712890625, "step": 676300 }, { "epoch": 0.8161667132728749, "learning_rate": 7.308840442991355e-06, "loss": 2.7782666015625, "step": 676400 }, { "epoch": 0.8162873765953577, "learning_rate": 7.308436607523617e-06, "loss": 2.77833984375, "step": 676500 }, { "epoch": 0.8164080399178404, "learning_rate": 7.308032772055879e-06, "loss": 2.7788742065429686, "step": 676600 }, { "epoch": 0.816528703240323, "learning_rate": 7.30762893658814e-06, "loss": 2.7719540405273437, "step": 676700 }, { "epoch": 0.8166493665628057, "learning_rate": 7.307225101120402e-06, "loss": 2.787636413574219, "step": 676800 }, { "epoch": 0.8167700298852884, "learning_rate": 7.306821265652664e-06, "loss": 2.789268798828125, "step": 676900 }, { "epoch": 0.8168906932077711, "learning_rate": 7.306417430184924e-06, "loss": 2.782451171875, "step": 677000 }, { "epoch": 0.8170113565302538, "learning_rate": 7.306013594717186e-06, "loss": 2.7727215576171873, "step": 677100 }, { "epoch": 0.8171320198527364, "learning_rate": 7.305609759249448e-06, "loss": 2.7946551513671873, "step": 677200 }, { "epoch": 0.8172526831752192, "learning_rate": 7.305205923781709e-06, "loss": 2.7975909423828127, "step": 677300 }, { "epoch": 0.8173733464977018, "learning_rate": 7.304802088313971e-06, "loss": 2.765296630859375, "step": 677400 }, { "epoch": 0.8174940098201845, "learning_rate": 7.304398252846233e-06, "loss": 2.796300964355469, "step": 677500 }, { "epoch": 0.8176146731426672, "learning_rate": 7.303994417378495e-06, "loss": 2.76763671875, "step": 677600 }, { "epoch": 0.8177353364651498, "learning_rate": 7.303590581910756e-06, "loss": 2.774588623046875, "step": 677700 }, { "epoch": 0.8178559997876326, "learning_rate": 7.3031867464430175e-06, "loss": 2.7680130004882812, "step": 677800 }, { "epoch": 0.8179766631101152, "learning_rate": 7.302782910975279e-06, "loss": 2.780946960449219, "step": 677900 }, { "epoch": 0.8180973264325979, "learning_rate": 7.302379075507541e-06, "loss": 2.7843597412109373, "step": 678000 }, { "epoch": 0.8182179897550806, "learning_rate": 7.301975240039803e-06, "loss": 2.762198791503906, "step": 678100 }, { "epoch": 0.8183386530775633, "learning_rate": 7.301571404572065e-06, "loss": 2.7904241943359374, "step": 678200 }, { "epoch": 0.818459316400046, "learning_rate": 7.301167569104326e-06, "loss": 2.7629043579101564, "step": 678300 }, { "epoch": 0.8185799797225286, "learning_rate": 7.300763733636588e-06, "loss": 2.7684771728515627, "step": 678400 }, { "epoch": 0.8187006430450113, "learning_rate": 7.30035989816885e-06, "loss": 2.7525875854492186, "step": 678500 }, { "epoch": 0.8188213063674941, "learning_rate": 7.29995606270111e-06, "loss": 2.78022216796875, "step": 678600 }, { "epoch": 0.8189419696899767, "learning_rate": 7.299552227233372e-06, "loss": 2.770039367675781, "step": 678700 }, { "epoch": 0.8190626330124594, "learning_rate": 7.299148391765634e-06, "loss": 2.7813906860351563, "step": 678800 }, { "epoch": 0.819183296334942, "learning_rate": 7.298744556297895e-06, "loss": 2.768718566894531, "step": 678900 }, { "epoch": 0.8193039596574248, "learning_rate": 7.298340720830157e-06, "loss": 2.750425109863281, "step": 679000 }, { "epoch": 0.8194246229799075, "learning_rate": 7.297936885362419e-06, "loss": 2.7760751342773435, "step": 679100 }, { "epoch": 0.8195452863023901, "learning_rate": 7.29753304989468e-06, "loss": 2.747894592285156, "step": 679200 }, { "epoch": 0.8196659496248728, "learning_rate": 7.297129214426942e-06, "loss": 2.771839904785156, "step": 679300 }, { "epoch": 0.8197866129473554, "learning_rate": 7.296725378959204e-06, "loss": 2.7960140991210936, "step": 679400 }, { "epoch": 0.8199072762698382, "learning_rate": 7.2963215434914644e-06, "loss": 2.776028747558594, "step": 679500 }, { "epoch": 0.8200279395923209, "learning_rate": 7.295917708023726e-06, "loss": 2.7511846923828127, "step": 679600 }, { "epoch": 0.8201486029148035, "learning_rate": 7.295513872555988e-06, "loss": 2.7819943237304687, "step": 679700 }, { "epoch": 0.8202692662372862, "learning_rate": 7.2951100370882495e-06, "loss": 2.747019958496094, "step": 679800 }, { "epoch": 0.820389929559769, "learning_rate": 7.2947062016205115e-06, "loss": 2.774222717285156, "step": 679900 }, { "epoch": 0.8205105928822516, "learning_rate": 7.2943023661527735e-06, "loss": 2.7718215942382813, "step": 680000 }, { "epoch": 0.8206312562047343, "learning_rate": 7.2938985306850355e-06, "loss": 2.780849609375, "step": 680100 }, { "epoch": 0.8207519195272169, "learning_rate": 7.293494695217297e-06, "loss": 2.783356018066406, "step": 680200 }, { "epoch": 0.8208725828496997, "learning_rate": 7.293090859749558e-06, "loss": 2.7759130859375, "step": 680300 }, { "epoch": 0.8209932461721824, "learning_rate": 7.292687024281819e-06, "loss": 2.776283874511719, "step": 680400 }, { "epoch": 0.821113909494665, "learning_rate": 7.292283188814081e-06, "loss": 2.7642578125, "step": 680500 }, { "epoch": 0.8212345728171477, "learning_rate": 7.291879353346343e-06, "loss": 2.7832626342773437, "step": 680600 }, { "epoch": 0.8213552361396304, "learning_rate": 7.291475517878605e-06, "loss": 2.7746176147460937, "step": 680700 }, { "epoch": 0.8214758994621131, "learning_rate": 7.291071682410866e-06, "loss": 2.7747976684570315, "step": 680800 }, { "epoch": 0.8215965627845958, "learning_rate": 7.290667846943128e-06, "loss": 2.7911410522460938, "step": 680900 }, { "epoch": 0.8217172261070784, "learning_rate": 7.29026401147539e-06, "loss": 2.772505798339844, "step": 681000 }, { "epoch": 0.8218378894295612, "learning_rate": 7.28986017600765e-06, "loss": 2.781540832519531, "step": 681100 }, { "epoch": 0.8219585527520438, "learning_rate": 7.289456340539912e-06, "loss": 2.750919189453125, "step": 681200 }, { "epoch": 0.8220792160745265, "learning_rate": 7.289052505072174e-06, "loss": 2.764035949707031, "step": 681300 }, { "epoch": 0.8221998793970092, "learning_rate": 7.288648669604435e-06, "loss": 2.798994445800781, "step": 681400 }, { "epoch": 0.8223205427194918, "learning_rate": 7.288244834136697e-06, "loss": 2.778087463378906, "step": 681500 }, { "epoch": 0.8224412060419746, "learning_rate": 7.287840998668959e-06, "loss": 2.770902404785156, "step": 681600 }, { "epoch": 0.8225618693644572, "learning_rate": 7.287437163201221e-06, "loss": 2.7659957885742186, "step": 681700 }, { "epoch": 0.8226825326869399, "learning_rate": 7.287033327733482e-06, "loss": 2.754152526855469, "step": 681800 }, { "epoch": 0.8228031960094226, "learning_rate": 7.2866294922657435e-06, "loss": 2.794879150390625, "step": 681900 }, { "epoch": 0.8229238593319053, "learning_rate": 7.286225656798005e-06, "loss": 2.791917419433594, "step": 682000 }, { "epoch": 0.823044522654388, "learning_rate": 7.285821821330267e-06, "loss": 2.798742370605469, "step": 682100 }, { "epoch": 0.8231651859768706, "learning_rate": 7.285417985862529e-06, "loss": 2.7911911010742188, "step": 682200 }, { "epoch": 0.8232858492993533, "learning_rate": 7.285014150394791e-06, "loss": 2.726761474609375, "step": 682300 }, { "epoch": 0.8234065126218361, "learning_rate": 7.284610314927052e-06, "loss": 2.76898681640625, "step": 682400 }, { "epoch": 0.8235271759443187, "learning_rate": 7.284206479459314e-06, "loss": 2.7621563720703124, "step": 682500 }, { "epoch": 0.8236478392668014, "learning_rate": 7.283802643991576e-06, "loss": 2.7733587646484374, "step": 682600 }, { "epoch": 0.823768502589284, "learning_rate": 7.283398808523836e-06, "loss": 2.793271484375, "step": 682700 }, { "epoch": 0.8238891659117668, "learning_rate": 7.282994973056098e-06, "loss": 2.76546630859375, "step": 682800 }, { "epoch": 0.8240098292342495, "learning_rate": 7.28259113758836e-06, "loss": 2.7817333984375, "step": 682900 }, { "epoch": 0.8241304925567321, "learning_rate": 7.282187302120621e-06, "loss": 2.7622714233398438, "step": 683000 }, { "epoch": 0.8242511558792148, "learning_rate": 7.281783466652883e-06, "loss": 2.765032958984375, "step": 683100 }, { "epoch": 0.8243718192016974, "learning_rate": 7.281379631185145e-06, "loss": 2.75868408203125, "step": 683200 }, { "epoch": 0.8244924825241802, "learning_rate": 7.280975795717406e-06, "loss": 2.7622296142578127, "step": 683300 }, { "epoch": 0.8246131458466629, "learning_rate": 7.280571960249668e-06, "loss": 2.76447021484375, "step": 683400 }, { "epoch": 0.8247338091691455, "learning_rate": 7.280168124781929e-06, "loss": 2.7963937377929686, "step": 683500 }, { "epoch": 0.8248544724916282, "learning_rate": 7.2797642893141905e-06, "loss": 2.785882873535156, "step": 683600 }, { "epoch": 0.8249751358141109, "learning_rate": 7.2793604538464524e-06, "loss": 2.7596749877929687, "step": 683700 }, { "epoch": 0.8250957991365936, "learning_rate": 7.2789566183787144e-06, "loss": 2.7607269287109375, "step": 683800 }, { "epoch": 0.8252164624590763, "learning_rate": 7.2785527829109756e-06, "loss": 2.767558898925781, "step": 683900 }, { "epoch": 0.8253371257815589, "learning_rate": 7.2781489474432375e-06, "loss": 2.746151123046875, "step": 684000 }, { "epoch": 0.8254577891040417, "learning_rate": 7.2777451119754995e-06, "loss": 2.785746765136719, "step": 684100 }, { "epoch": 0.8255784524265243, "learning_rate": 7.2773412765077615e-06, "loss": 2.772562255859375, "step": 684200 }, { "epoch": 0.825699115749007, "learning_rate": 7.276937441040022e-06, "loss": 2.7555859375, "step": 684300 }, { "epoch": 0.8258197790714897, "learning_rate": 7.276533605572284e-06, "loss": 2.7792007446289064, "step": 684400 }, { "epoch": 0.8259404423939724, "learning_rate": 7.276129770104545e-06, "loss": 2.759610900878906, "step": 684500 }, { "epoch": 0.8260611057164551, "learning_rate": 7.275725934636807e-06, "loss": 2.7839810180664064, "step": 684600 }, { "epoch": 0.8261817690389378, "learning_rate": 7.275322099169069e-06, "loss": 2.765096435546875, "step": 684700 }, { "epoch": 0.8263024323614204, "learning_rate": 7.274918263701331e-06, "loss": 2.7779061889648435, "step": 684800 }, { "epoch": 0.8264230956839032, "learning_rate": 7.274514428233592e-06, "loss": 2.796318359375, "step": 684900 }, { "epoch": 0.8265437590063858, "learning_rate": 7.274110592765854e-06, "loss": 2.8043829345703126, "step": 685000 }, { "epoch": 0.8266644223288685, "learning_rate": 7.273706757298116e-06, "loss": 2.764012756347656, "step": 685100 }, { "epoch": 0.8267850856513512, "learning_rate": 7.273302921830376e-06, "loss": 2.7973806762695315, "step": 685200 }, { "epoch": 0.8269057489738338, "learning_rate": 7.272899086362638e-06, "loss": 2.747877502441406, "step": 685300 }, { "epoch": 0.8270264122963166, "learning_rate": 7.2724952508949e-06, "loss": 2.727659912109375, "step": 685400 }, { "epoch": 0.8271470756187992, "learning_rate": 7.272091415427161e-06, "loss": 2.770906677246094, "step": 685500 }, { "epoch": 0.8272677389412819, "learning_rate": 7.271687579959423e-06, "loss": 2.765697326660156, "step": 685600 }, { "epoch": 0.8273884022637646, "learning_rate": 7.271283744491685e-06, "loss": 2.761227722167969, "step": 685700 }, { "epoch": 0.8275090655862473, "learning_rate": 7.2708799090239465e-06, "loss": 2.779718322753906, "step": 685800 }, { "epoch": 0.82762972890873, "learning_rate": 7.2704760735562084e-06, "loss": 2.74761962890625, "step": 685900 }, { "epoch": 0.8277503922312126, "learning_rate": 7.2700722380884696e-06, "loss": 2.758592529296875, "step": 686000 }, { "epoch": 0.8278710555536953, "learning_rate": 7.269668402620731e-06, "loss": 2.766251220703125, "step": 686100 }, { "epoch": 0.8279917188761781, "learning_rate": 7.269264567152993e-06, "loss": 2.7486810302734375, "step": 686200 }, { "epoch": 0.8281123821986607, "learning_rate": 7.268860731685255e-06, "loss": 2.7468301391601564, "step": 686300 }, { "epoch": 0.8282330455211434, "learning_rate": 7.268456896217516e-06, "loss": 2.783356018066406, "step": 686400 }, { "epoch": 0.828353708843626, "learning_rate": 7.268053060749778e-06, "loss": 2.796214904785156, "step": 686500 }, { "epoch": 0.8284743721661088, "learning_rate": 7.26764922528204e-06, "loss": 2.7551763916015624, "step": 686600 }, { "epoch": 0.8285950354885915, "learning_rate": 7.267245389814302e-06, "loss": 2.7310626220703127, "step": 686700 }, { "epoch": 0.8287156988110741, "learning_rate": 7.266841554346562e-06, "loss": 2.788240966796875, "step": 686800 }, { "epoch": 0.8288363621335568, "learning_rate": 7.266437718878824e-06, "loss": 2.7726473999023438, "step": 686900 }, { "epoch": 0.8289570254560394, "learning_rate": 7.266033883411085e-06, "loss": 2.7804150390625, "step": 687000 }, { "epoch": 0.8290776887785222, "learning_rate": 7.265630047943347e-06, "loss": 2.73583984375, "step": 687100 }, { "epoch": 0.8291983521010049, "learning_rate": 7.265226212475609e-06, "loss": 2.7614453125, "step": 687200 }, { "epoch": 0.8293190154234875, "learning_rate": 7.264822377007871e-06, "loss": 2.776871643066406, "step": 687300 }, { "epoch": 0.8294396787459702, "learning_rate": 7.264418541540132e-06, "loss": 2.7650790405273438, "step": 687400 }, { "epoch": 0.8295603420684529, "learning_rate": 7.264014706072394e-06, "loss": 2.7622006225585936, "step": 687500 }, { "epoch": 0.8296810053909356, "learning_rate": 7.2636108706046545e-06, "loss": 2.74801025390625, "step": 687600 }, { "epoch": 0.8298016687134183, "learning_rate": 7.2632070351369165e-06, "loss": 2.7588674926757815, "step": 687700 }, { "epoch": 0.8299223320359009, "learning_rate": 7.2628031996691785e-06, "loss": 2.7784210205078126, "step": 687800 }, { "epoch": 0.8300429953583837, "learning_rate": 7.2623993642014405e-06, "loss": 2.760014953613281, "step": 687900 }, { "epoch": 0.8301636586808663, "learning_rate": 7.261995528733702e-06, "loss": 2.766098937988281, "step": 688000 }, { "epoch": 0.830284322003349, "learning_rate": 7.261591693265964e-06, "loss": 2.7400997924804686, "step": 688100 }, { "epoch": 0.8304049853258317, "learning_rate": 7.2611878577982256e-06, "loss": 2.7693490600585937, "step": 688200 }, { "epoch": 0.8305256486483144, "learning_rate": 7.260784022330487e-06, "loss": 2.7861932373046874, "step": 688300 }, { "epoch": 0.8306463119707971, "learning_rate": 7.260380186862748e-06, "loss": 2.780870361328125, "step": 688400 }, { "epoch": 0.8307669752932797, "learning_rate": 7.25997635139501e-06, "loss": 2.762931213378906, "step": 688500 }, { "epoch": 0.8308876386157624, "learning_rate": 7.259572515927271e-06, "loss": 2.76712890625, "step": 688600 }, { "epoch": 0.8310083019382452, "learning_rate": 7.259168680459533e-06, "loss": 2.739679260253906, "step": 688700 }, { "epoch": 0.8311289652607278, "learning_rate": 7.258764844991795e-06, "loss": 2.770452575683594, "step": 688800 }, { "epoch": 0.8312496285832105, "learning_rate": 7.258361009524056e-06, "loss": 2.7772784423828125, "step": 688900 }, { "epoch": 0.8313702919056931, "learning_rate": 7.257957174056318e-06, "loss": 2.7580340576171873, "step": 689000 }, { "epoch": 0.8314909552281758, "learning_rate": 7.25755333858858e-06, "loss": 2.7548779296875, "step": 689100 }, { "epoch": 0.8316116185506586, "learning_rate": 7.25714950312084e-06, "loss": 2.7769586181640626, "step": 689200 }, { "epoch": 0.8317322818731412, "learning_rate": 7.256745667653102e-06, "loss": 2.7747686767578124, "step": 689300 }, { "epoch": 0.8318529451956239, "learning_rate": 7.256341832185364e-06, "loss": 2.7806280517578124, "step": 689400 }, { "epoch": 0.8319736085181065, "learning_rate": 7.255937996717625e-06, "loss": 2.7483615112304687, "step": 689500 }, { "epoch": 0.8320942718405893, "learning_rate": 7.255534161249887e-06, "loss": 2.766712951660156, "step": 689600 }, { "epoch": 0.832214935163072, "learning_rate": 7.255130325782149e-06, "loss": 2.7647628784179688, "step": 689700 }, { "epoch": 0.8323355984855546, "learning_rate": 7.254726490314411e-06, "loss": 2.779339599609375, "step": 689800 }, { "epoch": 0.8324562618080373, "learning_rate": 7.2543226548466725e-06, "loss": 2.734499816894531, "step": 689900 }, { "epoch": 0.8325769251305201, "learning_rate": 7.2539188193789345e-06, "loss": 2.7614596557617186, "step": 690000 }, { "epoch": 0.8326975884530027, "learning_rate": 7.253514983911195e-06, "loss": 2.7762570190429687, "step": 690100 }, { "epoch": 0.8328182517754854, "learning_rate": 7.253111148443457e-06, "loss": 2.7788519287109374, "step": 690200 }, { "epoch": 0.832938915097968, "learning_rate": 7.252707312975719e-06, "loss": 2.7794393920898437, "step": 690300 }, { "epoch": 0.8330595784204508, "learning_rate": 7.252303477507981e-06, "loss": 2.744797668457031, "step": 690400 }, { "epoch": 0.8331802417429335, "learning_rate": 7.251899642040242e-06, "loss": 2.7352310180664063, "step": 690500 }, { "epoch": 0.8333009050654161, "learning_rate": 7.251495806572504e-06, "loss": 2.760634765625, "step": 690600 }, { "epoch": 0.8334215683878988, "learning_rate": 7.251091971104766e-06, "loss": 2.747817077636719, "step": 690700 }, { "epoch": 0.8335422317103814, "learning_rate": 7.250688135637027e-06, "loss": 2.737945556640625, "step": 690800 }, { "epoch": 0.8336628950328642, "learning_rate": 7.250284300169288e-06, "loss": 2.768433837890625, "step": 690900 }, { "epoch": 0.8337835583553469, "learning_rate": 7.24988046470155e-06, "loss": 2.74574951171875, "step": 691000 }, { "epoch": 0.8339042216778295, "learning_rate": 7.249476629233811e-06, "loss": 2.7629129028320314, "step": 691100 }, { "epoch": 0.8340248850003122, "learning_rate": 7.249072793766073e-06, "loss": 2.746793518066406, "step": 691200 }, { "epoch": 0.8341455483227949, "learning_rate": 7.248668958298335e-06, "loss": 2.739273681640625, "step": 691300 }, { "epoch": 0.8342662116452776, "learning_rate": 7.248265122830596e-06, "loss": 2.781951904296875, "step": 691400 }, { "epoch": 0.8343868749677603, "learning_rate": 7.247861287362858e-06, "loss": 2.759024963378906, "step": 691500 }, { "epoch": 0.8345075382902429, "learning_rate": 7.24745745189512e-06, "loss": 2.77873291015625, "step": 691600 }, { "epoch": 0.8346282016127257, "learning_rate": 7.2470536164273806e-06, "loss": 2.7770071411132813, "step": 691700 }, { "epoch": 0.8347488649352083, "learning_rate": 7.2466497809596425e-06, "loss": 2.7521490478515624, "step": 691800 }, { "epoch": 0.834869528257691, "learning_rate": 7.2462459454919045e-06, "loss": 2.770146484375, "step": 691900 }, { "epoch": 0.8349901915801737, "learning_rate": 7.245842110024166e-06, "loss": 2.755367431640625, "step": 692000 }, { "epoch": 0.8351108549026564, "learning_rate": 7.245438274556428e-06, "loss": 2.7622604370117188, "step": 692100 }, { "epoch": 0.8352315182251391, "learning_rate": 7.24503443908869e-06, "loss": 2.76739990234375, "step": 692200 }, { "epoch": 0.8353521815476217, "learning_rate": 7.244630603620952e-06, "loss": 2.769892578125, "step": 692300 }, { "epoch": 0.8354728448701044, "learning_rate": 7.244226768153213e-06, "loss": 2.7444207763671873, "step": 692400 }, { "epoch": 0.8355935081925872, "learning_rate": 7.243822932685474e-06, "loss": 2.767644958496094, "step": 692500 }, { "epoch": 0.8357141715150698, "learning_rate": 7.243419097217735e-06, "loss": 2.753415222167969, "step": 692600 }, { "epoch": 0.8358348348375525, "learning_rate": 7.243015261749997e-06, "loss": 2.757127380371094, "step": 692700 }, { "epoch": 0.8359554981600351, "learning_rate": 7.242611426282259e-06, "loss": 2.7736105346679687, "step": 692800 }, { "epoch": 0.8360761614825178, "learning_rate": 7.242207590814521e-06, "loss": 2.7389935302734374, "step": 692900 }, { "epoch": 0.8361968248050006, "learning_rate": 7.241803755346782e-06, "loss": 2.7779116821289063, "step": 693000 }, { "epoch": 0.8363174881274832, "learning_rate": 7.241399919879044e-06, "loss": 2.75095703125, "step": 693100 }, { "epoch": 0.8364381514499659, "learning_rate": 7.240996084411306e-06, "loss": 2.772707214355469, "step": 693200 }, { "epoch": 0.8365588147724485, "learning_rate": 7.240592248943566e-06, "loss": 2.7717205810546877, "step": 693300 }, { "epoch": 0.8366794780949313, "learning_rate": 7.240188413475828e-06, "loss": 2.783363037109375, "step": 693400 }, { "epoch": 0.836800141417414, "learning_rate": 7.23978457800809e-06, "loss": 2.769794921875, "step": 693500 }, { "epoch": 0.8369208047398966, "learning_rate": 7.2393807425403514e-06, "loss": 2.737657470703125, "step": 693600 }, { "epoch": 0.8370414680623793, "learning_rate": 7.2389769070726134e-06, "loss": 2.770452880859375, "step": 693700 }, { "epoch": 0.837162131384862, "learning_rate": 7.238573071604875e-06, "loss": 2.74417236328125, "step": 693800 }, { "epoch": 0.8372827947073447, "learning_rate": 7.2381692361371365e-06, "loss": 2.7591851806640624, "step": 693900 }, { "epoch": 0.8374034580298274, "learning_rate": 7.2377654006693985e-06, "loss": 2.7601513671875, "step": 694000 }, { "epoch": 0.83752412135231, "learning_rate": 7.23736156520166e-06, "loss": 2.7459622192382813, "step": 694100 }, { "epoch": 0.8376447846747928, "learning_rate": 7.236957729733921e-06, "loss": 2.7640350341796873, "step": 694200 }, { "epoch": 0.8377654479972754, "learning_rate": 7.236553894266183e-06, "loss": 2.762540283203125, "step": 694300 }, { "epoch": 0.8378861113197581, "learning_rate": 7.236150058798445e-06, "loss": 2.7619268798828127, "step": 694400 }, { "epoch": 0.8380067746422408, "learning_rate": 7.235746223330706e-06, "loss": 2.7208523559570312, "step": 694500 }, { "epoch": 0.8381274379647234, "learning_rate": 7.235342387862968e-06, "loss": 2.736491394042969, "step": 694600 }, { "epoch": 0.8382481012872062, "learning_rate": 7.23493855239523e-06, "loss": 2.7519732666015626, "step": 694700 }, { "epoch": 0.8383687646096888, "learning_rate": 7.234534716927492e-06, "loss": 2.7600112915039063, "step": 694800 }, { "epoch": 0.8384894279321715, "learning_rate": 7.234130881459753e-06, "loss": 2.77838134765625, "step": 694900 }, { "epoch": 0.8386100912546542, "learning_rate": 7.233727045992014e-06, "loss": 2.778692626953125, "step": 695000 }, { "epoch": 0.8387307545771369, "learning_rate": 7.233323210524275e-06, "loss": 2.767226257324219, "step": 695100 }, { "epoch": 0.8388514178996196, "learning_rate": 7.232919375056537e-06, "loss": 2.7683566284179686, "step": 695200 }, { "epoch": 0.8389720812221023, "learning_rate": 7.232515539588799e-06, "loss": 2.7708123779296874, "step": 695300 }, { "epoch": 0.8390927445445849, "learning_rate": 7.232111704121061e-06, "loss": 2.755225830078125, "step": 695400 }, { "epoch": 0.8392134078670677, "learning_rate": 7.231707868653322e-06, "loss": 2.7623663330078125, "step": 695500 }, { "epoch": 0.8393340711895503, "learning_rate": 7.231304033185584e-06, "loss": 2.7495608520507813, "step": 695600 }, { "epoch": 0.839454734512033, "learning_rate": 7.230900197717846e-06, "loss": 2.754932556152344, "step": 695700 }, { "epoch": 0.8395753978345157, "learning_rate": 7.230496362250107e-06, "loss": 2.7537255859375, "step": 695800 }, { "epoch": 0.8396960611569984, "learning_rate": 7.2300925267823686e-06, "loss": 2.754486389160156, "step": 695900 }, { "epoch": 0.8398167244794811, "learning_rate": 7.2296886913146306e-06, "loss": 2.7523419189453127, "step": 696000 }, { "epoch": 0.8399373878019637, "learning_rate": 7.229284855846892e-06, "loss": 2.745189208984375, "step": 696100 }, { "epoch": 0.8400580511244464, "learning_rate": 7.228881020379154e-06, "loss": 2.7585690307617186, "step": 696200 }, { "epoch": 0.8401787144469292, "learning_rate": 7.228477184911416e-06, "loss": 2.757199401855469, "step": 696300 }, { "epoch": 0.8402993777694118, "learning_rate": 7.228073349443678e-06, "loss": 2.7604180908203126, "step": 696400 }, { "epoch": 0.8404200410918945, "learning_rate": 7.227669513975939e-06, "loss": 2.7483511352539063, "step": 696500 }, { "epoch": 0.8405407044143771, "learning_rate": 7.2272656785082e-06, "loss": 2.7624032592773435, "step": 696600 }, { "epoch": 0.8406613677368598, "learning_rate": 7.226861843040461e-06, "loss": 2.764954833984375, "step": 696700 }, { "epoch": 0.8407820310593426, "learning_rate": 7.226458007572723e-06, "loss": 2.7384982299804688, "step": 696800 }, { "epoch": 0.8409026943818252, "learning_rate": 7.226054172104985e-06, "loss": 2.7461196899414064, "step": 696900 }, { "epoch": 0.8410233577043079, "learning_rate": 7.225650336637247e-06, "loss": 2.73990966796875, "step": 697000 }, { "epoch": 0.8411440210267905, "learning_rate": 7.225246501169508e-06, "loss": 2.7417037963867186, "step": 697100 }, { "epoch": 0.8412646843492733, "learning_rate": 7.22484266570177e-06, "loss": 2.754837951660156, "step": 697200 }, { "epoch": 0.841385347671756, "learning_rate": 7.224438830234032e-06, "loss": 2.7644775390625, "step": 697300 }, { "epoch": 0.8415060109942386, "learning_rate": 7.224034994766292e-06, "loss": 2.7673019409179687, "step": 697400 }, { "epoch": 0.8416266743167213, "learning_rate": 7.223631159298554e-06, "loss": 2.7481979370117187, "step": 697500 }, { "epoch": 0.841747337639204, "learning_rate": 7.223227323830816e-06, "loss": 2.7859262084960936, "step": 697600 }, { "epoch": 0.8418680009616867, "learning_rate": 7.2228234883630775e-06, "loss": 2.7625445556640624, "step": 697700 }, { "epoch": 0.8419886642841694, "learning_rate": 7.2224196528953395e-06, "loss": 2.764498291015625, "step": 697800 }, { "epoch": 0.842109327606652, "learning_rate": 7.2220158174276014e-06, "loss": 2.747264404296875, "step": 697900 }, { "epoch": 0.8422299909291348, "learning_rate": 7.221611981959863e-06, "loss": 2.776311340332031, "step": 698000 }, { "epoch": 0.8423506542516174, "learning_rate": 7.2212081464921246e-06, "loss": 2.7646533203125, "step": 698100 }, { "epoch": 0.8424713175741001, "learning_rate": 7.220804311024386e-06, "loss": 2.7593475341796876, "step": 698200 }, { "epoch": 0.8425919808965828, "learning_rate": 7.220400475556647e-06, "loss": 2.742789611816406, "step": 698300 }, { "epoch": 0.8427126442190654, "learning_rate": 7.219996640088909e-06, "loss": 2.7323455810546875, "step": 698400 }, { "epoch": 0.8428333075415482, "learning_rate": 7.219592804621171e-06, "loss": 2.7811355590820312, "step": 698500 }, { "epoch": 0.8429539708640308, "learning_rate": 7.219188969153432e-06, "loss": 2.7867587280273436, "step": 698600 }, { "epoch": 0.8430746341865135, "learning_rate": 7.218785133685694e-06, "loss": 2.7540383911132813, "step": 698700 }, { "epoch": 0.8431952975089962, "learning_rate": 7.218381298217956e-06, "loss": 2.73100830078125, "step": 698800 }, { "epoch": 0.8433159608314789, "learning_rate": 7.217977462750218e-06, "loss": 2.7559234619140627, "step": 698900 }, { "epoch": 0.8434366241539616, "learning_rate": 7.217573627282478e-06, "loss": 2.7618115234375, "step": 699000 }, { "epoch": 0.8435572874764442, "learning_rate": 7.21716979181474e-06, "loss": 2.746187744140625, "step": 699100 }, { "epoch": 0.8436779507989269, "learning_rate": 7.216765956347001e-06, "loss": 2.7446331787109375, "step": 699200 }, { "epoch": 0.8437986141214097, "learning_rate": 7.216362120879263e-06, "loss": 2.7656594848632814, "step": 699300 }, { "epoch": 0.8439192774438923, "learning_rate": 7.215958285411525e-06, "loss": 2.7403350830078126, "step": 699400 }, { "epoch": 0.844039940766375, "learning_rate": 7.215554449943787e-06, "loss": 2.753825988769531, "step": 699500 }, { "epoch": 0.8441606040888576, "learning_rate": 7.215150614476048e-06, "loss": 2.739991455078125, "step": 699600 }, { "epoch": 0.8442812674113404, "learning_rate": 7.21474677900831e-06, "loss": 2.7475155639648436, "step": 699700 }, { "epoch": 0.8444019307338231, "learning_rate": 7.214342943540571e-06, "loss": 2.75184326171875, "step": 699800 }, { "epoch": 0.8445225940563057, "learning_rate": 7.213939108072833e-06, "loss": 2.735565490722656, "step": 699900 }, { "epoch": 0.8446432573787884, "learning_rate": 7.213535272605095e-06, "loss": 2.769859619140625, "step": 700000 }, { "epoch": 0.844763920701271, "learning_rate": 7.213131437137357e-06, "loss": 2.774072570800781, "step": 700100 }, { "epoch": 0.8448845840237538, "learning_rate": 7.212727601669618e-06, "loss": 2.7508477783203125, "step": 700200 }, { "epoch": 0.8450052473462365, "learning_rate": 7.21232376620188e-06, "loss": 2.7312185668945315, "step": 700300 }, { "epoch": 0.8451259106687191, "learning_rate": 7.211919930734142e-06, "loss": 2.72595947265625, "step": 700400 }, { "epoch": 0.8452465739912018, "learning_rate": 7.211516095266403e-06, "loss": 2.761361083984375, "step": 700500 }, { "epoch": 0.8453672373136846, "learning_rate": 7.211112259798665e-06, "loss": 2.7568505859375, "step": 700600 }, { "epoch": 0.8454879006361672, "learning_rate": 7.210708424330926e-06, "loss": 2.7646929931640627, "step": 700700 }, { "epoch": 0.8456085639586499, "learning_rate": 7.210304588863187e-06, "loss": 2.741496887207031, "step": 700800 }, { "epoch": 0.8457292272811325, "learning_rate": 7.209900753395449e-06, "loss": 2.72297119140625, "step": 700900 }, { "epoch": 0.8458498906036153, "learning_rate": 7.209496917927711e-06, "loss": 2.752399597167969, "step": 701000 }, { "epoch": 0.845970553926098, "learning_rate": 7.209093082459972e-06, "loss": 2.7268942260742186, "step": 701100 }, { "epoch": 0.8460912172485806, "learning_rate": 7.208689246992234e-06, "loss": 2.761585693359375, "step": 701200 }, { "epoch": 0.8462118805710633, "learning_rate": 7.208285411524496e-06, "loss": 2.763692626953125, "step": 701300 }, { "epoch": 0.846332543893546, "learning_rate": 7.207881576056758e-06, "loss": 2.759352111816406, "step": 701400 }, { "epoch": 0.8464532072160287, "learning_rate": 7.207477740589018e-06, "loss": 2.7340435791015625, "step": 701500 }, { "epoch": 0.8465738705385114, "learning_rate": 7.20707390512128e-06, "loss": 2.771798400878906, "step": 701600 }, { "epoch": 0.846694533860994, "learning_rate": 7.2066700696535415e-06, "loss": 2.7612728881835937, "step": 701700 }, { "epoch": 0.8468151971834768, "learning_rate": 7.2062662341858035e-06, "loss": 2.742584228515625, "step": 701800 }, { "epoch": 0.8469358605059594, "learning_rate": 7.2058623987180655e-06, "loss": 2.735779113769531, "step": 701900 }, { "epoch": 0.8470565238284421, "learning_rate": 7.2054585632503275e-06, "loss": 2.717684020996094, "step": 702000 }, { "epoch": 0.8471771871509248, "learning_rate": 7.205054727782589e-06, "loss": 2.7524249267578127, "step": 702100 }, { "epoch": 0.8472978504734074, "learning_rate": 7.204650892314851e-06, "loss": 2.7912030029296875, "step": 702200 }, { "epoch": 0.8474185137958902, "learning_rate": 7.204247056847111e-06, "loss": 2.7568463134765624, "step": 702300 }, { "epoch": 0.8475391771183728, "learning_rate": 7.203843221379373e-06, "loss": 2.742562255859375, "step": 702400 }, { "epoch": 0.8476598404408555, "learning_rate": 7.203439385911635e-06, "loss": 2.7338986206054687, "step": 702500 }, { "epoch": 0.8477805037633382, "learning_rate": 7.203035550443897e-06, "loss": 2.7584689331054686, "step": 702600 }, { "epoch": 0.8479011670858209, "learning_rate": 7.202631714976158e-06, "loss": 2.761337890625, "step": 702700 }, { "epoch": 0.8480218304083036, "learning_rate": 7.20222787950842e-06, "loss": 2.7570785522460937, "step": 702800 }, { "epoch": 0.8481424937307862, "learning_rate": 7.201824044040682e-06, "loss": 2.759461669921875, "step": 702900 }, { "epoch": 0.8482631570532689, "learning_rate": 7.201420208572943e-06, "loss": 2.740189208984375, "step": 703000 }, { "epoch": 0.8483838203757517, "learning_rate": 7.201016373105204e-06, "loss": 2.7350228881835936, "step": 703100 }, { "epoch": 0.8485044836982343, "learning_rate": 7.200612537637466e-06, "loss": 2.747209167480469, "step": 703200 }, { "epoch": 0.848625147020717, "learning_rate": 7.200208702169727e-06, "loss": 2.770213928222656, "step": 703300 }, { "epoch": 0.8487458103431996, "learning_rate": 7.199804866701989e-06, "loss": 2.7480010986328125, "step": 703400 }, { "epoch": 0.8488664736656824, "learning_rate": 7.199401031234251e-06, "loss": 2.729515380859375, "step": 703500 }, { "epoch": 0.8489871369881651, "learning_rate": 7.198997195766512e-06, "loss": 2.7514968872070313, "step": 703600 }, { "epoch": 0.8491078003106477, "learning_rate": 7.198593360298774e-06, "loss": 2.787181396484375, "step": 703700 }, { "epoch": 0.8492284636331304, "learning_rate": 7.198189524831036e-06, "loss": 2.7567489624023436, "step": 703800 }, { "epoch": 0.849349126955613, "learning_rate": 7.197785689363297e-06, "loss": 2.7393313598632814, "step": 703900 }, { "epoch": 0.8494697902780958, "learning_rate": 7.197381853895559e-06, "loss": 2.7720135498046874, "step": 704000 }, { "epoch": 0.8495904536005785, "learning_rate": 7.196978018427821e-06, "loss": 2.76645751953125, "step": 704100 }, { "epoch": 0.8497111169230611, "learning_rate": 7.196574182960082e-06, "loss": 2.7568350219726563, "step": 704200 }, { "epoch": 0.8498317802455438, "learning_rate": 7.196170347492344e-06, "loss": 2.754114685058594, "step": 704300 }, { "epoch": 0.8499524435680265, "learning_rate": 7.195766512024606e-06, "loss": 2.7828915405273436, "step": 704400 }, { "epoch": 0.8500731068905092, "learning_rate": 7.195362676556868e-06, "loss": 2.76895751953125, "step": 704500 }, { "epoch": 0.8501937702129919, "learning_rate": 7.194958841089129e-06, "loss": 2.7466351318359377, "step": 704600 }, { "epoch": 0.8503144335354745, "learning_rate": 7.19455500562139e-06, "loss": 2.754508361816406, "step": 704700 }, { "epoch": 0.8504350968579573, "learning_rate": 7.194151170153651e-06, "loss": 2.7450051879882813, "step": 704800 }, { "epoch": 0.8505557601804399, "learning_rate": 7.193747334685913e-06, "loss": 2.7456875610351563, "step": 704900 }, { "epoch": 0.8506764235029226, "learning_rate": 7.193343499218175e-06, "loss": 2.779808349609375, "step": 705000 }, { "epoch": 0.8507970868254053, "learning_rate": 7.192939663750437e-06, "loss": 2.7399258422851562, "step": 705100 }, { "epoch": 0.850917750147888, "learning_rate": 7.192535828282698e-06, "loss": 2.7727099609375, "step": 705200 }, { "epoch": 0.8510384134703707, "learning_rate": 7.19213199281496e-06, "loss": 2.7663116455078125, "step": 705300 }, { "epoch": 0.8511590767928533, "learning_rate": 7.191728157347222e-06, "loss": 2.7588116455078127, "step": 705400 }, { "epoch": 0.851279740115336, "learning_rate": 7.191324321879483e-06, "loss": 2.7287109375, "step": 705500 }, { "epoch": 0.8514004034378188, "learning_rate": 7.1909204864117444e-06, "loss": 2.728892822265625, "step": 705600 }, { "epoch": 0.8515210667603014, "learning_rate": 7.1905166509440064e-06, "loss": 2.7715408325195314, "step": 705700 }, { "epoch": 0.8516417300827841, "learning_rate": 7.1901128154762676e-06, "loss": 2.739892883300781, "step": 705800 }, { "epoch": 0.8517623934052668, "learning_rate": 7.1897089800085295e-06, "loss": 2.750996398925781, "step": 705900 }, { "epoch": 0.8518830567277494, "learning_rate": 7.1893051445407915e-06, "loss": 2.738392333984375, "step": 706000 }, { "epoch": 0.8520037200502322, "learning_rate": 7.188901309073053e-06, "loss": 2.75764892578125, "step": 706100 }, { "epoch": 0.8521243833727148, "learning_rate": 7.188497473605315e-06, "loss": 2.7510452270507812, "step": 706200 }, { "epoch": 0.8522450466951975, "learning_rate": 7.188093638137577e-06, "loss": 2.7574835205078125, "step": 706300 }, { "epoch": 0.8523657100176802, "learning_rate": 7.187689802669837e-06, "loss": 2.7572174072265625, "step": 706400 }, { "epoch": 0.8524863733401629, "learning_rate": 7.187285967202099e-06, "loss": 2.7706378173828123, "step": 706500 }, { "epoch": 0.8526070366626456, "learning_rate": 7.186882131734361e-06, "loss": 2.7622296142578127, "step": 706600 }, { "epoch": 0.8527276999851282, "learning_rate": 7.186478296266622e-06, "loss": 2.74099365234375, "step": 706700 }, { "epoch": 0.8528483633076109, "learning_rate": 7.186074460798884e-06, "loss": 2.720220031738281, "step": 706800 }, { "epoch": 0.8529690266300937, "learning_rate": 7.185670625331146e-06, "loss": 2.75215576171875, "step": 706900 }, { "epoch": 0.8530896899525763, "learning_rate": 7.185266789863408e-06, "loss": 2.7263839721679686, "step": 707000 }, { "epoch": 0.853210353275059, "learning_rate": 7.184862954395669e-06, "loss": 2.7559783935546873, "step": 707100 }, { "epoch": 0.8533310165975416, "learning_rate": 7.18445911892793e-06, "loss": 2.7144232177734375, "step": 707200 }, { "epoch": 0.8534516799200244, "learning_rate": 7.184055283460191e-06, "loss": 2.773271179199219, "step": 707300 }, { "epoch": 0.8535723432425071, "learning_rate": 7.183651447992453e-06, "loss": 2.7693255615234373, "step": 707400 }, { "epoch": 0.8536930065649897, "learning_rate": 7.183247612524715e-06, "loss": 2.7593157958984373, "step": 707500 }, { "epoch": 0.8538136698874724, "learning_rate": 7.182843777056977e-06, "loss": 2.7662057495117187, "step": 707600 }, { "epoch": 0.853934333209955, "learning_rate": 7.1824399415892385e-06, "loss": 2.7554592895507812, "step": 707700 }, { "epoch": 0.8540549965324378, "learning_rate": 7.1820361061215004e-06, "loss": 2.7663064575195313, "step": 707800 }, { "epoch": 0.8541756598549205, "learning_rate": 7.181632270653762e-06, "loss": 2.722821044921875, "step": 707900 }, { "epoch": 0.8542963231774031, "learning_rate": 7.181228435186023e-0