{ "best_metric": null, "best_model_checkpoint": null, "epoch": 0.6229377354266636, "eval_steps": 500, "global_step": 48000, "is_hyper_param_search": false, "is_local_process_zero": true, "is_world_process_zero": true, "log_history": [ { "epoch": 0.0, "learning_rate": 5e-06, "loss": 10.9368, "step": 5 }, { "epoch": 0.0, "learning_rate": 1e-05, "loss": 10.4988, "step": 10 }, { "epoch": 0.0, "learning_rate": 1.5e-05, "loss": 9.8761, "step": 15 }, { "epoch": 0.0, "learning_rate": 2e-05, "loss": 9.2834, "step": 20 }, { "epoch": 0.0, "learning_rate": 2.5e-05, "loss": 8.5046, "step": 25 }, { "epoch": 0.0, "learning_rate": 3e-05, "loss": 7.8405, "step": 30 }, { "epoch": 0.0, "learning_rate": 3.5e-05, "loss": 7.5177, "step": 35 }, { "epoch": 0.0, "learning_rate": 4e-05, "loss": 7.1661, "step": 40 }, { "epoch": 0.0, "learning_rate": 4.5e-05, "loss": 7.1509, "step": 45 }, { "epoch": 0.0, "learning_rate": 5e-05, "loss": 6.9049, "step": 50 }, { "epoch": 0.0, "learning_rate": 5.500000000000001e-05, "loss": 8.6301, "step": 55 }, { "epoch": 0.0, "learning_rate": 6e-05, "loss": 15.7814, "step": 60 }, { "epoch": 0.0, "learning_rate": 6.500000000000001e-05, "loss": 7.3722, "step": 65 }, { "epoch": 0.0, "learning_rate": 7e-05, "loss": 6.9069, "step": 70 }, { "epoch": 0.0, "learning_rate": 7.500000000000001e-05, "loss": 6.6268, "step": 75 }, { "epoch": 0.0, "learning_rate": 8e-05, "loss": 7.6898, "step": 80 }, { "epoch": 0.0, "learning_rate": 8.5e-05, "loss": 6.515, "step": 85 }, { "epoch": 0.0, "learning_rate": 9e-05, "loss": 6.3189, "step": 90 }, { "epoch": 0.0, "learning_rate": 9.5e-05, "loss": 6.2103, "step": 95 }, { "epoch": 0.0, "learning_rate": 0.0001, "loss": 6.0017, "step": 100 }, { "epoch": 0.0, "learning_rate": 9.99999989583607e-05, "loss": 5.6553, "step": 105 }, { "epoch": 0.0, "learning_rate": 9.99999958334428e-05, "loss": 5.6362, "step": 110 }, { "epoch": 0.0, "learning_rate": 9.999999062524643e-05, "loss": 5.3318, "step": 115 }, { "epoch": 0.0, "learning_rate": 9.999998333377183e-05, "loss": 5.2929, "step": 120 }, { "epoch": 0.0, "learning_rate": 9.99999739590193e-05, "loss": 5.0623, "step": 125 }, { "epoch": 0.0, "learning_rate": 9.999996250098922e-05, "loss": 5.2014, "step": 130 }, { "epoch": 0.0, "learning_rate": 9.999994895968208e-05, "loss": 4.9815, "step": 135 }, { "epoch": 0.0, "learning_rate": 9.999993333509843e-05, "loss": 4.8417, "step": 140 }, { "epoch": 0.0, "learning_rate": 9.999991562723893e-05, "loss": 5.0133, "step": 145 }, { "epoch": 0.0, "learning_rate": 9.999989583610432e-05, "loss": 4.7976, "step": 150 }, { "epoch": 0.0, "learning_rate": 9.999987396169542e-05, "loss": 4.9161, "step": 155 }, { "epoch": 0.0, "learning_rate": 9.999985000401313e-05, "loss": 4.6076, "step": 160 }, { "epoch": 0.0, "learning_rate": 9.999982396305847e-05, "loss": 4.727, "step": 165 }, { "epoch": 0.0, "learning_rate": 9.999979583883253e-05, "loss": 4.8423, "step": 170 }, { "epoch": 0.0, "learning_rate": 9.999976563133644e-05, "loss": 4.6381, "step": 175 }, { "epoch": 0.0, "learning_rate": 9.999973334057148e-05, "loss": 4.4477, "step": 180 }, { "epoch": 0.0, "learning_rate": 9.999969896653903e-05, "loss": 4.6216, "step": 185 }, { "epoch": 0.0, "learning_rate": 9.999966250924046e-05, "loss": 4.5572, "step": 190 }, { "epoch": 0.0, "learning_rate": 9.999962396867735e-05, "loss": 4.5212, "step": 195 }, { "epoch": 0.0, "learning_rate": 9.999958334485127e-05, "loss": 4.4537, "step": 200 }, { "epoch": 0.0, "learning_rate": 9.999954063776392e-05, "loss": 4.4322, "step": 205 }, { "epoch": 0.0, "learning_rate": 9.999949584741708e-05, "loss": 4.5091, "step": 210 }, { "epoch": 0.0, "learning_rate": 9.999944897381261e-05, "loss": 4.4052, "step": 215 }, { "epoch": 0.0, "learning_rate": 9.999940001695247e-05, "loss": 4.5194, "step": 220 }, { "epoch": 0.0, "learning_rate": 9.999934897683871e-05, "loss": 4.5206, "step": 225 }, { "epoch": 0.0, "learning_rate": 9.999929585347342e-05, "loss": 4.3682, "step": 230 }, { "epoch": 0.0, "learning_rate": 9.999924064685887e-05, "loss": 4.3991, "step": 235 }, { "epoch": 0.0, "learning_rate": 9.999918335699731e-05, "loss": 4.2373, "step": 240 }, { "epoch": 0.0, "learning_rate": 9.999912398389115e-05, "loss": 4.1082, "step": 245 }, { "epoch": 0.0, "learning_rate": 9.999906252754288e-05, "loss": 4.2561, "step": 250 }, { "epoch": 0.0, "learning_rate": 9.999899898795501e-05, "loss": 4.0919, "step": 255 }, { "epoch": 0.0, "learning_rate": 9.999893336513022e-05, "loss": 4.235, "step": 260 }, { "epoch": 0.0, "learning_rate": 9.999886565907127e-05, "loss": 4.1673, "step": 265 }, { "epoch": 0.0, "learning_rate": 9.999879586978093e-05, "loss": 4.1842, "step": 270 }, { "epoch": 0.0, "learning_rate": 9.999872399726214e-05, "loss": 4.1511, "step": 275 }, { "epoch": 0.0, "learning_rate": 9.999865004151787e-05, "loss": 4.2516, "step": 280 }, { "epoch": 0.0, "learning_rate": 9.999857400255123e-05, "loss": 4.155, "step": 285 }, { "epoch": 0.0, "learning_rate": 9.999849588036539e-05, "loss": 4.1505, "step": 290 }, { "epoch": 0.0, "learning_rate": 9.999841567496355e-05, "loss": 4.2345, "step": 295 }, { "epoch": 0.0, "learning_rate": 9.999833338634911e-05, "loss": 4.0767, "step": 300 }, { "epoch": 0.0, "learning_rate": 9.99982490145255e-05, "loss": 4.0297, "step": 305 }, { "epoch": 0.0, "learning_rate": 9.99981625594962e-05, "loss": 4.0188, "step": 310 }, { "epoch": 0.0, "learning_rate": 9.999807402126484e-05, "loss": 4.0487, "step": 315 }, { "epoch": 0.0, "learning_rate": 9.999798339983509e-05, "loss": 3.9901, "step": 320 }, { "epoch": 0.0, "learning_rate": 9.999789069521073e-05, "loss": 4.0458, "step": 325 }, { "epoch": 0.0, "learning_rate": 9.999779590739562e-05, "loss": 3.9995, "step": 330 }, { "epoch": 0.0, "learning_rate": 9.999769903639372e-05, "loss": 4.0316, "step": 335 }, { "epoch": 0.0, "learning_rate": 9.999760008220906e-05, "loss": 4.0154, "step": 340 }, { "epoch": 0.0, "learning_rate": 9.999749904484577e-05, "loss": 4.0007, "step": 345 }, { "epoch": 0.0, "learning_rate": 9.999739592430805e-05, "loss": 4.0581, "step": 350 }, { "epoch": 0.0, "learning_rate": 9.99972907206002e-05, "loss": 3.8524, "step": 355 }, { "epoch": 0.0, "learning_rate": 9.999718343372662e-05, "loss": 4.0246, "step": 360 }, { "epoch": 0.0, "learning_rate": 9.999707406369174e-05, "loss": 3.9922, "step": 365 }, { "epoch": 0.0, "learning_rate": 9.999696261050015e-05, "loss": 3.9336, "step": 370 }, { "epoch": 0.0, "learning_rate": 9.999684907415648e-05, "loss": 3.9427, "step": 375 }, { "epoch": 0.0, "learning_rate": 9.999673345466547e-05, "loss": 3.8942, "step": 380 }, { "epoch": 0.0, "learning_rate": 9.999661575203195e-05, "loss": 3.9364, "step": 385 }, { "epoch": 0.01, "learning_rate": 9.999649596626077e-05, "loss": 4.0866, "step": 390 }, { "epoch": 0.01, "learning_rate": 9.999637409735698e-05, "loss": 3.8119, "step": 395 }, { "epoch": 0.01, "learning_rate": 9.999625014532563e-05, "loss": 3.8828, "step": 400 }, { "epoch": 0.01, "learning_rate": 9.99961241101719e-05, "loss": 3.8178, "step": 405 }, { "epoch": 0.01, "learning_rate": 9.999599599190102e-05, "loss": 4.0455, "step": 410 }, { "epoch": 0.01, "learning_rate": 9.999586579051835e-05, "loss": 3.9334, "step": 415 }, { "epoch": 0.01, "learning_rate": 9.999573350602929e-05, "loss": 3.8661, "step": 420 }, { "epoch": 0.01, "learning_rate": 9.999559913843939e-05, "loss": 3.8174, "step": 425 }, { "epoch": 0.01, "learning_rate": 9.999546268775419e-05, "loss": 3.7552, "step": 430 }, { "epoch": 0.01, "learning_rate": 9.999532415397944e-05, "loss": 3.8883, "step": 435 }, { "epoch": 0.01, "learning_rate": 9.999518353712088e-05, "loss": 3.8809, "step": 440 }, { "epoch": 0.01, "learning_rate": 9.999504083718435e-05, "loss": 3.7891, "step": 445 }, { "epoch": 0.01, "learning_rate": 9.999489605417582e-05, "loss": 3.7666, "step": 450 }, { "epoch": 0.01, "learning_rate": 9.999474918810135e-05, "loss": 3.9513, "step": 455 }, { "epoch": 0.01, "learning_rate": 9.9994600238967e-05, "loss": 3.7917, "step": 460 }, { "epoch": 0.01, "learning_rate": 9.999444920677901e-05, "loss": 3.7823, "step": 465 }, { "epoch": 0.01, "learning_rate": 9.999429609154366e-05, "loss": 3.7847, "step": 470 }, { "epoch": 0.01, "learning_rate": 9.999414089326735e-05, "loss": 3.8958, "step": 475 }, { "epoch": 0.01, "learning_rate": 9.999398361195652e-05, "loss": 3.9026, "step": 480 }, { "epoch": 0.01, "learning_rate": 9.999382424761774e-05, "loss": 3.7843, "step": 485 }, { "epoch": 0.01, "learning_rate": 9.999366280025766e-05, "loss": 3.9169, "step": 490 }, { "epoch": 0.01, "learning_rate": 9.999349926988297e-05, "loss": 3.8977, "step": 495 }, { "epoch": 0.01, "learning_rate": 9.999333365650053e-05, "loss": 3.7049, "step": 500 }, { "epoch": 0.01, "learning_rate": 9.99931659601172e-05, "loss": 3.7352, "step": 505 }, { "epoch": 0.01, "learning_rate": 9.999299618074e-05, "loss": 3.7508, "step": 510 }, { "epoch": 0.01, "learning_rate": 9.999282431837598e-05, "loss": 3.7661, "step": 515 }, { "epoch": 0.01, "learning_rate": 9.999265037303231e-05, "loss": 3.7935, "step": 520 }, { "epoch": 0.01, "learning_rate": 9.999247434471623e-05, "loss": 3.7101, "step": 525 }, { "epoch": 0.01, "learning_rate": 9.99922962334351e-05, "loss": 3.6567, "step": 530 }, { "epoch": 0.01, "learning_rate": 9.999211603919629e-05, "loss": 3.6004, "step": 535 }, { "epoch": 0.01, "learning_rate": 9.999193376200737e-05, "loss": 3.6687, "step": 540 }, { "epoch": 0.01, "learning_rate": 9.99917494018759e-05, "loss": 3.671, "step": 545 }, { "epoch": 0.01, "learning_rate": 9.999156295880956e-05, "loss": 3.6843, "step": 550 }, { "epoch": 0.01, "learning_rate": 9.999137443281612e-05, "loss": 3.718, "step": 555 }, { "epoch": 0.01, "learning_rate": 9.999118382390344e-05, "loss": 3.5867, "step": 560 }, { "epoch": 0.01, "learning_rate": 9.999099113207945e-05, "loss": 3.7062, "step": 565 }, { "epoch": 0.01, "learning_rate": 9.999079635735222e-05, "loss": 3.665, "step": 570 }, { "epoch": 0.01, "learning_rate": 9.999059949972982e-05, "loss": 3.6363, "step": 575 }, { "epoch": 0.01, "learning_rate": 9.999040055922046e-05, "loss": 3.7631, "step": 580 }, { "epoch": 0.01, "learning_rate": 9.999019953583245e-05, "loss": 3.5466, "step": 585 }, { "epoch": 0.01, "learning_rate": 9.998999642957414e-05, "loss": 3.6898, "step": 590 }, { "epoch": 0.01, "learning_rate": 9.998979124045401e-05, "loss": 3.7447, "step": 595 }, { "epoch": 0.01, "learning_rate": 9.998958396848061e-05, "loss": 3.6934, "step": 600 }, { "epoch": 0.01, "learning_rate": 9.998937461366255e-05, "loss": 3.707, "step": 605 }, { "epoch": 0.01, "learning_rate": 9.998916317600859e-05, "loss": 3.5377, "step": 610 }, { "epoch": 0.01, "learning_rate": 9.998894965552752e-05, "loss": 3.66, "step": 615 }, { "epoch": 0.01, "learning_rate": 9.998873405222824e-05, "loss": 3.73, "step": 620 }, { "epoch": 0.01, "learning_rate": 9.998851636611975e-05, "loss": 3.6418, "step": 625 }, { "epoch": 0.01, "learning_rate": 9.998829659721107e-05, "loss": 3.4452, "step": 630 }, { "epoch": 0.01, "learning_rate": 9.998807474551141e-05, "loss": 3.6628, "step": 635 }, { "epoch": 0.01, "learning_rate": 9.998785081102998e-05, "loss": 3.6021, "step": 640 }, { "epoch": 0.01, "learning_rate": 9.998762479377613e-05, "loss": 3.6032, "step": 645 }, { "epoch": 0.01, "learning_rate": 9.998739669375927e-05, "loss": 3.6711, "step": 650 }, { "epoch": 0.01, "learning_rate": 9.998716651098889e-05, "loss": 3.5182, "step": 655 }, { "epoch": 0.01, "learning_rate": 9.998693424547462e-05, "loss": 3.6115, "step": 660 }, { "epoch": 0.01, "learning_rate": 9.99866998972261e-05, "loss": 3.5708, "step": 665 }, { "epoch": 0.01, "learning_rate": 9.998646346625312e-05, "loss": 3.5341, "step": 670 }, { "epoch": 0.01, "learning_rate": 9.998622495256549e-05, "loss": 3.5982, "step": 675 }, { "epoch": 0.01, "learning_rate": 9.998598435617319e-05, "loss": 3.5236, "step": 680 }, { "epoch": 0.01, "learning_rate": 9.998574167708623e-05, "loss": 3.5381, "step": 685 }, { "epoch": 0.01, "learning_rate": 9.998549691531472e-05, "loss": 3.5572, "step": 690 }, { "epoch": 0.01, "learning_rate": 9.998525007086886e-05, "loss": 3.5742, "step": 695 }, { "epoch": 0.01, "learning_rate": 9.998500114375894e-05, "loss": 3.3987, "step": 700 }, { "epoch": 0.01, "learning_rate": 9.998475013399532e-05, "loss": 3.5043, "step": 705 }, { "epoch": 0.01, "learning_rate": 9.998449704158847e-05, "loss": 3.5755, "step": 710 }, { "epoch": 0.01, "learning_rate": 9.998424186654892e-05, "loss": 3.5819, "step": 715 }, { "epoch": 0.01, "learning_rate": 9.998398460888731e-05, "loss": 3.58, "step": 720 }, { "epoch": 0.01, "learning_rate": 9.998372526861438e-05, "loss": 3.5973, "step": 725 }, { "epoch": 0.01, "learning_rate": 9.99834638457409e-05, "loss": 3.6318, "step": 730 }, { "epoch": 0.01, "learning_rate": 9.99832003402778e-05, "loss": 3.501, "step": 735 }, { "epoch": 0.01, "learning_rate": 9.998293475223602e-05, "loss": 3.6012, "step": 740 }, { "epoch": 0.01, "learning_rate": 9.998266708162662e-05, "loss": 3.5784, "step": 745 }, { "epoch": 0.01, "learning_rate": 9.998239732846082e-05, "loss": 3.479, "step": 750 }, { "epoch": 0.01, "learning_rate": 9.998212549274978e-05, "loss": 3.6467, "step": 755 }, { "epoch": 0.01, "learning_rate": 9.998185157450489e-05, "loss": 3.462, "step": 760 }, { "epoch": 0.01, "learning_rate": 9.998157557373752e-05, "loss": 3.6106, "step": 765 }, { "epoch": 0.01, "learning_rate": 9.998129749045919e-05, "loss": 3.5404, "step": 770 }, { "epoch": 0.01, "learning_rate": 9.998101732468147e-05, "loss": 3.4392, "step": 775 }, { "epoch": 0.01, "learning_rate": 9.998073507641605e-05, "loss": 3.4403, "step": 780 }, { "epoch": 0.01, "learning_rate": 9.998045074567469e-05, "loss": 3.4939, "step": 785 }, { "epoch": 0.01, "learning_rate": 9.998016433246922e-05, "loss": 3.414, "step": 790 }, { "epoch": 0.01, "learning_rate": 9.99798758368116e-05, "loss": 3.4242, "step": 795 }, { "epoch": 0.01, "learning_rate": 9.997958525871382e-05, "loss": 3.6027, "step": 800 }, { "epoch": 0.01, "learning_rate": 9.997929259818801e-05, "loss": 3.6217, "step": 805 }, { "epoch": 0.01, "learning_rate": 9.997899785524636e-05, "loss": 3.4088, "step": 810 }, { "epoch": 0.01, "learning_rate": 9.997870102990115e-05, "loss": 3.5646, "step": 815 }, { "epoch": 0.01, "learning_rate": 9.997840212216473e-05, "loss": 3.342, "step": 820 }, { "epoch": 0.01, "learning_rate": 9.997810113204958e-05, "loss": 3.5548, "step": 825 }, { "epoch": 0.01, "learning_rate": 9.997779805956821e-05, "loss": 3.5246, "step": 830 }, { "epoch": 0.01, "learning_rate": 9.997749290473329e-05, "loss": 3.4852, "step": 835 }, { "epoch": 0.01, "learning_rate": 9.99771856675575e-05, "loss": 3.39, "step": 840 }, { "epoch": 0.01, "learning_rate": 9.997687634805365e-05, "loss": 3.4571, "step": 845 }, { "epoch": 0.01, "learning_rate": 9.997656494623464e-05, "loss": 3.6108, "step": 850 }, { "epoch": 0.01, "learning_rate": 9.997625146211343e-05, "loss": 3.347, "step": 855 }, { "epoch": 0.01, "learning_rate": 9.997593589570308e-05, "loss": 3.4911, "step": 860 }, { "epoch": 0.01, "learning_rate": 9.997561824701675e-05, "loss": 3.3332, "step": 865 }, { "epoch": 0.01, "learning_rate": 9.997529851606768e-05, "loss": 3.4274, "step": 870 }, { "epoch": 0.01, "learning_rate": 9.997497670286916e-05, "loss": 3.5553, "step": 875 }, { "epoch": 0.01, "learning_rate": 9.997465280743463e-05, "loss": 3.4505, "step": 880 }, { "epoch": 0.01, "learning_rate": 9.997432682977759e-05, "loss": 3.4775, "step": 885 }, { "epoch": 0.01, "learning_rate": 9.997399876991158e-05, "loss": 3.4935, "step": 890 }, { "epoch": 0.01, "learning_rate": 9.997366862785031e-05, "loss": 3.4959, "step": 895 }, { "epoch": 0.01, "learning_rate": 9.997333640360753e-05, "loss": 3.4647, "step": 900 }, { "epoch": 0.01, "learning_rate": 9.997300209719706e-05, "loss": 3.4607, "step": 905 }, { "epoch": 0.01, "learning_rate": 9.997266570863286e-05, "loss": 3.4021, "step": 910 }, { "epoch": 0.01, "learning_rate": 9.997232723792892e-05, "loss": 3.492, "step": 915 }, { "epoch": 0.01, "learning_rate": 9.997198668509936e-05, "loss": 3.52, "step": 920 }, { "epoch": 0.01, "learning_rate": 9.997164405015835e-05, "loss": 3.368, "step": 925 }, { "epoch": 0.01, "learning_rate": 9.997129933312018e-05, "loss": 3.2794, "step": 930 }, { "epoch": 0.01, "learning_rate": 9.99709525339992e-05, "loss": 3.3637, "step": 935 }, { "epoch": 0.01, "learning_rate": 9.997060365280987e-05, "loss": 3.4723, "step": 940 }, { "epoch": 0.01, "learning_rate": 9.997025268956675e-05, "loss": 3.4641, "step": 945 }, { "epoch": 0.01, "learning_rate": 9.996989964428442e-05, "loss": 3.5246, "step": 950 }, { "epoch": 0.01, "learning_rate": 9.996954451697761e-05, "loss": 3.5278, "step": 955 }, { "epoch": 0.01, "learning_rate": 9.996918730766111e-05, "loss": 3.2581, "step": 960 }, { "epoch": 0.01, "learning_rate": 9.996882801634984e-05, "loss": 3.4231, "step": 965 }, { "epoch": 0.01, "learning_rate": 9.99684666430587e-05, "loss": 3.29, "step": 970 }, { "epoch": 0.01, "learning_rate": 9.996810318780281e-05, "loss": 3.4332, "step": 975 }, { "epoch": 0.01, "learning_rate": 9.996773765059728e-05, "loss": 3.3422, "step": 980 }, { "epoch": 0.01, "learning_rate": 9.996737003145734e-05, "loss": 3.33, "step": 985 }, { "epoch": 0.01, "learning_rate": 9.996700033039833e-05, "loss": 3.4228, "step": 990 }, { "epoch": 0.01, "learning_rate": 9.996662854743564e-05, "loss": 3.3158, "step": 995 }, { "epoch": 0.01, "learning_rate": 9.996625468258475e-05, "loss": 3.3928, "step": 1000 }, { "epoch": 0.01, "learning_rate": 9.996587873586125e-05, "loss": 3.397, "step": 1005 }, { "epoch": 0.01, "learning_rate": 9.996550070728081e-05, "loss": 3.5407, "step": 1010 }, { "epoch": 0.01, "learning_rate": 9.996512059685917e-05, "loss": 3.4652, "step": 1015 }, { "epoch": 0.01, "learning_rate": 9.996473840461217e-05, "loss": 3.322, "step": 1020 }, { "epoch": 0.01, "learning_rate": 9.996435413055574e-05, "loss": 3.3883, "step": 1025 }, { "epoch": 0.01, "learning_rate": 9.996396777470589e-05, "loss": 3.435, "step": 1030 }, { "epoch": 0.01, "learning_rate": 9.99635793370787e-05, "loss": 3.4368, "step": 1035 }, { "epoch": 0.01, "learning_rate": 9.996318881769038e-05, "loss": 3.3951, "step": 1040 }, { "epoch": 0.01, "learning_rate": 9.996279621655718e-05, "loss": 3.3531, "step": 1045 }, { "epoch": 0.01, "learning_rate": 9.996240153369547e-05, "loss": 3.5274, "step": 1050 }, { "epoch": 0.01, "learning_rate": 9.996200476912169e-05, "loss": 3.3308, "step": 1055 }, { "epoch": 0.01, "learning_rate": 9.996160592285238e-05, "loss": 3.4562, "step": 1060 }, { "epoch": 0.01, "learning_rate": 9.996120499490414e-05, "loss": 3.3264, "step": 1065 }, { "epoch": 0.01, "learning_rate": 9.99608019852937e-05, "loss": 3.5089, "step": 1070 }, { "epoch": 0.01, "learning_rate": 9.996039689403782e-05, "loss": 3.3761, "step": 1075 }, { "epoch": 0.01, "learning_rate": 9.99599897211534e-05, "loss": 3.3398, "step": 1080 }, { "epoch": 0.01, "learning_rate": 9.995958046665742e-05, "loss": 3.1856, "step": 1085 }, { "epoch": 0.01, "learning_rate": 9.995916913056689e-05, "loss": 3.3973, "step": 1090 }, { "epoch": 0.01, "learning_rate": 9.995875571289899e-05, "loss": 3.2886, "step": 1095 }, { "epoch": 0.01, "learning_rate": 9.995834021367092e-05, "loss": 3.4099, "step": 1100 }, { "epoch": 0.01, "learning_rate": 9.995792263289999e-05, "loss": 3.3685, "step": 1105 }, { "epoch": 0.01, "learning_rate": 9.995750297060362e-05, "loss": 3.3819, "step": 1110 }, { "epoch": 0.01, "learning_rate": 9.995708122679927e-05, "loss": 3.3071, "step": 1115 }, { "epoch": 0.01, "learning_rate": 9.995665740150455e-05, "loss": 3.4318, "step": 1120 }, { "epoch": 0.01, "learning_rate": 9.995623149473708e-05, "loss": 3.3058, "step": 1125 }, { "epoch": 0.01, "learning_rate": 9.995580350651461e-05, "loss": 3.3905, "step": 1130 }, { "epoch": 0.01, "learning_rate": 9.9955373436855e-05, "loss": 3.338, "step": 1135 }, { "epoch": 0.01, "learning_rate": 9.995494128577614e-05, "loss": 3.3196, "step": 1140 }, { "epoch": 0.01, "learning_rate": 9.995450705329605e-05, "loss": 3.3399, "step": 1145 }, { "epoch": 0.01, "learning_rate": 9.995407073943281e-05, "loss": 3.267, "step": 1150 }, { "epoch": 0.01, "learning_rate": 9.995363234420462e-05, "loss": 3.3423, "step": 1155 }, { "epoch": 0.02, "learning_rate": 9.995319186762975e-05, "loss": 3.3172, "step": 1160 }, { "epoch": 0.02, "learning_rate": 9.995274930972651e-05, "loss": 3.5101, "step": 1165 }, { "epoch": 0.02, "learning_rate": 9.995230467051338e-05, "loss": 3.3057, "step": 1170 }, { "epoch": 0.02, "learning_rate": 9.995185795000888e-05, "loss": 3.3146, "step": 1175 }, { "epoch": 0.02, "learning_rate": 9.995140914823162e-05, "loss": 3.3275, "step": 1180 }, { "epoch": 0.02, "learning_rate": 9.995095826520028e-05, "loss": 3.391, "step": 1185 }, { "epoch": 0.02, "learning_rate": 9.995050530093367e-05, "loss": 3.226, "step": 1190 }, { "epoch": 0.02, "learning_rate": 9.995005025545064e-05, "loss": 3.3456, "step": 1195 }, { "epoch": 0.02, "learning_rate": 9.99495931287702e-05, "loss": 3.2692, "step": 1200 }, { "epoch": 0.02, "learning_rate": 9.994913392091132e-05, "loss": 3.3243, "step": 1205 }, { "epoch": 0.02, "learning_rate": 9.99486726318932e-05, "loss": 3.1985, "step": 1210 }, { "epoch": 0.02, "learning_rate": 9.994820926173503e-05, "loss": 3.2962, "step": 1215 }, { "epoch": 0.02, "learning_rate": 9.994774381045611e-05, "loss": 3.3187, "step": 1220 }, { "epoch": 0.02, "learning_rate": 9.994727627807585e-05, "loss": 3.3905, "step": 1225 }, { "epoch": 0.02, "learning_rate": 9.994680666461374e-05, "loss": 3.2708, "step": 1230 }, { "epoch": 0.02, "learning_rate": 9.994633497008931e-05, "loss": 3.38, "step": 1235 }, { "epoch": 0.02, "learning_rate": 9.994586119452225e-05, "loss": 3.1598, "step": 1240 }, { "epoch": 0.02, "learning_rate": 9.994538533793228e-05, "loss": 3.3656, "step": 1245 }, { "epoch": 0.02, "learning_rate": 9.994490740033921e-05, "loss": 3.3246, "step": 1250 }, { "epoch": 0.02, "learning_rate": 9.9944427381763e-05, "loss": 3.2161, "step": 1255 }, { "epoch": 0.02, "learning_rate": 9.994394528222363e-05, "loss": 3.4294, "step": 1260 }, { "epoch": 0.02, "learning_rate": 9.994346110174117e-05, "loss": 3.2217, "step": 1265 }, { "epoch": 0.02, "learning_rate": 9.99429748403358e-05, "loss": 3.2953, "step": 1270 }, { "epoch": 0.02, "learning_rate": 9.99424864980278e-05, "loss": 3.2655, "step": 1275 }, { "epoch": 0.02, "learning_rate": 9.994199607483749e-05, "loss": 3.1983, "step": 1280 }, { "epoch": 0.02, "learning_rate": 9.994150357078533e-05, "loss": 3.254, "step": 1285 }, { "epoch": 0.02, "learning_rate": 9.994100898589182e-05, "loss": 3.422, "step": 1290 }, { "epoch": 0.02, "learning_rate": 9.994051232017757e-05, "loss": 3.1597, "step": 1295 }, { "epoch": 0.02, "learning_rate": 9.994001357366328e-05, "loss": 3.2594, "step": 1300 }, { "epoch": 0.02, "learning_rate": 9.993951274636973e-05, "loss": 3.2144, "step": 1305 }, { "epoch": 0.02, "learning_rate": 9.993900983831779e-05, "loss": 3.3225, "step": 1310 }, { "epoch": 0.02, "learning_rate": 9.993850484952841e-05, "loss": 3.3122, "step": 1315 }, { "epoch": 0.02, "learning_rate": 9.993799778002263e-05, "loss": 3.3864, "step": 1320 }, { "epoch": 0.02, "learning_rate": 9.993748862982157e-05, "loss": 3.3074, "step": 1325 }, { "epoch": 0.02, "learning_rate": 9.993697739894647e-05, "loss": 3.3291, "step": 1330 }, { "epoch": 0.02, "learning_rate": 9.99364640874186e-05, "loss": 3.4528, "step": 1335 }, { "epoch": 0.02, "learning_rate": 9.993594869525938e-05, "loss": 3.2887, "step": 1340 }, { "epoch": 0.02, "learning_rate": 9.993543122249022e-05, "loss": 3.2304, "step": 1345 }, { "epoch": 0.02, "learning_rate": 9.993491166913277e-05, "loss": 3.2373, "step": 1350 }, { "epoch": 0.02, "learning_rate": 9.993439003520861e-05, "loss": 3.2572, "step": 1355 }, { "epoch": 0.02, "learning_rate": 9.993386632073952e-05, "loss": 3.1992, "step": 1360 }, { "epoch": 0.02, "learning_rate": 9.993334052574727e-05, "loss": 3.2235, "step": 1365 }, { "epoch": 0.02, "learning_rate": 9.99328126502538e-05, "loss": 3.2993, "step": 1370 }, { "epoch": 0.02, "learning_rate": 9.993228269428112e-05, "loss": 3.2617, "step": 1375 }, { "epoch": 0.02, "learning_rate": 9.993175065785127e-05, "loss": 3.2636, "step": 1380 }, { "epoch": 0.02, "learning_rate": 9.993121654098644e-05, "loss": 3.1867, "step": 1385 }, { "epoch": 0.02, "learning_rate": 9.993068034370889e-05, "loss": 3.2302, "step": 1390 }, { "epoch": 0.02, "learning_rate": 9.993014206604094e-05, "loss": 3.3281, "step": 1395 }, { "epoch": 0.02, "learning_rate": 9.992960170800505e-05, "loss": 3.2929, "step": 1400 }, { "epoch": 0.02, "learning_rate": 9.99290592696237e-05, "loss": 3.2304, "step": 1405 }, { "epoch": 0.02, "learning_rate": 9.992851475091951e-05, "loss": 3.2959, "step": 1410 }, { "epoch": 0.02, "learning_rate": 9.992796815191516e-05, "loss": 3.2495, "step": 1415 }, { "epoch": 0.02, "learning_rate": 9.992741947263345e-05, "loss": 3.4049, "step": 1420 }, { "epoch": 0.02, "learning_rate": 9.99268687130972e-05, "loss": 3.1027, "step": 1425 }, { "epoch": 0.02, "learning_rate": 9.99263158733294e-05, "loss": 3.3813, "step": 1430 }, { "epoch": 0.02, "learning_rate": 9.992576095335303e-05, "loss": 3.2601, "step": 1435 }, { "epoch": 0.02, "learning_rate": 9.992520395319125e-05, "loss": 3.2943, "step": 1440 }, { "epoch": 0.02, "learning_rate": 9.992464487286726e-05, "loss": 3.1346, "step": 1445 }, { "epoch": 0.02, "learning_rate": 9.992408371240437e-05, "loss": 3.2355, "step": 1450 }, { "epoch": 0.02, "learning_rate": 9.992352047182594e-05, "loss": 3.3049, "step": 1455 }, { "epoch": 0.02, "learning_rate": 9.992295515115544e-05, "loss": 3.2642, "step": 1460 }, { "epoch": 0.02, "learning_rate": 9.992238775041642e-05, "loss": 3.3075, "step": 1465 }, { "epoch": 0.02, "learning_rate": 9.992181826963253e-05, "loss": 3.3076, "step": 1470 }, { "epoch": 0.02, "learning_rate": 9.992124670882751e-05, "loss": 3.2999, "step": 1475 }, { "epoch": 0.02, "learning_rate": 9.992067306802516e-05, "loss": 3.376, "step": 1480 }, { "epoch": 0.02, "learning_rate": 9.992009734724938e-05, "loss": 3.0919, "step": 1485 }, { "epoch": 0.02, "learning_rate": 9.991951954652416e-05, "loss": 3.2184, "step": 1490 }, { "epoch": 0.02, "learning_rate": 9.991893966587357e-05, "loss": 3.2079, "step": 1495 }, { "epoch": 0.02, "learning_rate": 9.991835770532177e-05, "loss": 3.3015, "step": 1500 }, { "epoch": 0.02, "learning_rate": 9.991777366489303e-05, "loss": 3.173, "step": 1505 }, { "epoch": 0.02, "learning_rate": 9.991718754461166e-05, "loss": 3.2064, "step": 1510 }, { "epoch": 0.02, "learning_rate": 9.991659934450208e-05, "loss": 3.171, "step": 1515 }, { "epoch": 0.02, "learning_rate": 9.99160090645888e-05, "loss": 3.1507, "step": 1520 }, { "epoch": 0.02, "learning_rate": 9.991541670489644e-05, "loss": 3.2371, "step": 1525 }, { "epoch": 0.02, "learning_rate": 9.991482226544966e-05, "loss": 3.2305, "step": 1530 }, { "epoch": 0.02, "learning_rate": 9.991422574627323e-05, "loss": 3.1973, "step": 1535 }, { "epoch": 0.02, "learning_rate": 9.991362714739199e-05, "loss": 3.3901, "step": 1540 }, { "epoch": 0.02, "learning_rate": 9.99130264688309e-05, "loss": 3.1564, "step": 1545 }, { "epoch": 0.02, "learning_rate": 9.991242371061498e-05, "loss": 3.3158, "step": 1550 }, { "epoch": 0.02, "learning_rate": 9.991181887276934e-05, "loss": 3.3068, "step": 1555 }, { "epoch": 0.02, "learning_rate": 9.991121195531921e-05, "loss": 3.2162, "step": 1560 }, { "epoch": 0.02, "learning_rate": 9.991060295828985e-05, "loss": 3.1839, "step": 1565 }, { "epoch": 0.02, "learning_rate": 9.990999188170662e-05, "loss": 3.3281, "step": 1570 }, { "epoch": 0.02, "learning_rate": 9.990937872559503e-05, "loss": 3.1989, "step": 1575 }, { "epoch": 0.02, "learning_rate": 9.990876348998057e-05, "loss": 3.2138, "step": 1580 }, { "epoch": 0.02, "learning_rate": 9.99081461748889e-05, "loss": 3.1625, "step": 1585 }, { "epoch": 0.02, "learning_rate": 9.990752678034576e-05, "loss": 3.2497, "step": 1590 }, { "epoch": 0.02, "learning_rate": 9.990690530637694e-05, "loss": 3.206, "step": 1595 }, { "epoch": 0.02, "learning_rate": 9.990628175300832e-05, "loss": 3.2498, "step": 1600 }, { "epoch": 0.02, "learning_rate": 9.99056561202659e-05, "loss": 3.1212, "step": 1605 }, { "epoch": 0.02, "learning_rate": 9.990502840817575e-05, "loss": 3.2365, "step": 1610 }, { "epoch": 0.02, "learning_rate": 9.990439861676401e-05, "loss": 3.1507, "step": 1615 }, { "epoch": 0.02, "learning_rate": 9.990376674605693e-05, "loss": 3.1972, "step": 1620 }, { "epoch": 0.02, "learning_rate": 9.990313279608084e-05, "loss": 3.3543, "step": 1625 }, { "epoch": 0.02, "learning_rate": 9.990249676686212e-05, "loss": 3.2678, "step": 1630 }, { "epoch": 0.02, "learning_rate": 9.990185865842731e-05, "loss": 3.174, "step": 1635 }, { "epoch": 0.02, "learning_rate": 9.9901218470803e-05, "loss": 3.2791, "step": 1640 }, { "epoch": 0.02, "learning_rate": 9.990057620401585e-05, "loss": 3.2766, "step": 1645 }, { "epoch": 0.02, "learning_rate": 9.989993185809262e-05, "loss": 3.148, "step": 1650 }, { "epoch": 0.02, "learning_rate": 9.989928543306014e-05, "loss": 3.264, "step": 1655 }, { "epoch": 0.02, "learning_rate": 9.989863692894536e-05, "loss": 3.2222, "step": 1660 }, { "epoch": 0.02, "learning_rate": 9.98979863457753e-05, "loss": 3.2541, "step": 1665 }, { "epoch": 0.02, "learning_rate": 9.989733368357708e-05, "loss": 3.2739, "step": 1670 }, { "epoch": 0.02, "learning_rate": 9.989667894237788e-05, "loss": 3.28, "step": 1675 }, { "epoch": 0.02, "learning_rate": 9.989602212220497e-05, "loss": 3.2832, "step": 1680 }, { "epoch": 0.02, "learning_rate": 9.989536322308574e-05, "loss": 3.2375, "step": 1685 }, { "epoch": 0.02, "learning_rate": 9.989470224504762e-05, "loss": 3.2302, "step": 1690 }, { "epoch": 0.02, "learning_rate": 9.989403918811817e-05, "loss": 3.1835, "step": 1695 }, { "epoch": 0.02, "learning_rate": 9.989337405232502e-05, "loss": 3.1344, "step": 1700 }, { "epoch": 0.02, "learning_rate": 9.989270683769585e-05, "loss": 3.1153, "step": 1705 }, { "epoch": 0.02, "learning_rate": 9.989203754425849e-05, "loss": 3.3124, "step": 1710 }, { "epoch": 0.02, "learning_rate": 9.989136617204082e-05, "loss": 3.2678, "step": 1715 }, { "epoch": 0.02, "learning_rate": 9.989069272107081e-05, "loss": 3.1469, "step": 1720 }, { "epoch": 0.02, "learning_rate": 9.989001719137652e-05, "loss": 3.1664, "step": 1725 }, { "epoch": 0.02, "learning_rate": 9.98893395829861e-05, "loss": 3.1695, "step": 1730 }, { "epoch": 0.02, "learning_rate": 9.988865989592777e-05, "loss": 3.1716, "step": 1735 }, { "epoch": 0.02, "learning_rate": 9.988797813022985e-05, "loss": 3.0381, "step": 1740 }, { "epoch": 0.02, "learning_rate": 9.988729428592079e-05, "loss": 3.1582, "step": 1745 }, { "epoch": 0.02, "learning_rate": 9.9886608363029e-05, "loss": 3.2137, "step": 1750 }, { "epoch": 0.02, "learning_rate": 9.988592036158315e-05, "loss": 3.077, "step": 1755 }, { "epoch": 0.02, "learning_rate": 9.988523028161185e-05, "loss": 3.1861, "step": 1760 }, { "epoch": 0.02, "learning_rate": 9.988453812314387e-05, "loss": 3.0399, "step": 1765 }, { "epoch": 0.02, "learning_rate": 9.988384388620804e-05, "loss": 3.1207, "step": 1770 }, { "epoch": 0.02, "learning_rate": 9.988314757083329e-05, "loss": 3.1086, "step": 1775 }, { "epoch": 0.02, "learning_rate": 9.988244917704863e-05, "loss": 3.1457, "step": 1780 }, { "epoch": 0.02, "learning_rate": 9.988174870488318e-05, "loss": 3.2802, "step": 1785 }, { "epoch": 0.02, "learning_rate": 9.988104615436608e-05, "loss": 3.1833, "step": 1790 }, { "epoch": 0.02, "learning_rate": 9.988034152552665e-05, "loss": 3.367, "step": 1795 }, { "epoch": 0.02, "learning_rate": 9.987963481839425e-05, "loss": 3.0373, "step": 1800 }, { "epoch": 0.02, "learning_rate": 9.987892603299827e-05, "loss": 3.2095, "step": 1805 }, { "epoch": 0.02, "learning_rate": 9.987821516936828e-05, "loss": 3.2036, "step": 1810 }, { "epoch": 0.02, "learning_rate": 9.987750222753391e-05, "loss": 3.3009, "step": 1815 }, { "epoch": 0.02, "learning_rate": 9.987678720752484e-05, "loss": 3.0445, "step": 1820 }, { "epoch": 0.02, "learning_rate": 9.987607010937088e-05, "loss": 3.2568, "step": 1825 }, { "epoch": 0.02, "learning_rate": 9.987535093310189e-05, "loss": 3.1246, "step": 1830 }, { "epoch": 0.02, "learning_rate": 9.987462967874785e-05, "loss": 3.1944, "step": 1835 }, { "epoch": 0.02, "learning_rate": 9.98739063463388e-05, "loss": 3.1733, "step": 1840 }, { "epoch": 0.02, "learning_rate": 9.987318093590489e-05, "loss": 3.1447, "step": 1845 }, { "epoch": 0.02, "learning_rate": 9.987245344747633e-05, "loss": 3.1463, "step": 1850 }, { "epoch": 0.02, "learning_rate": 9.987172388108346e-05, "loss": 3.2635, "step": 1855 }, { "epoch": 0.02, "learning_rate": 9.987099223675664e-05, "loss": 3.0759, "step": 1860 }, { "epoch": 0.02, "learning_rate": 9.987025851452639e-05, "loss": 3.0964, "step": 1865 }, { "epoch": 0.02, "learning_rate": 9.986952271442325e-05, "loss": 3.271, "step": 1870 }, { "epoch": 0.02, "learning_rate": 9.986878483647788e-05, "loss": 3.2862, "step": 1875 }, { "epoch": 0.02, "learning_rate": 9.986804488072106e-05, "loss": 3.0553, "step": 1880 }, { "epoch": 0.02, "learning_rate": 9.986730284718358e-05, "loss": 3.135, "step": 1885 }, { "epoch": 0.02, "learning_rate": 9.986655873589639e-05, "loss": 3.0756, "step": 1890 }, { "epoch": 0.02, "learning_rate": 9.986581254689044e-05, "loss": 3.2352, "step": 1895 }, { "epoch": 0.02, "learning_rate": 9.98650642801969e-05, "loss": 3.1215, "step": 1900 }, { "epoch": 0.02, "learning_rate": 9.986431393584687e-05, "loss": 3.0595, "step": 1905 }, { "epoch": 0.02, "learning_rate": 9.986356151387168e-05, "loss": 3.2324, "step": 1910 }, { "epoch": 0.02, "learning_rate": 9.986280701430263e-05, "loss": 2.9786, "step": 1915 }, { "epoch": 0.02, "learning_rate": 9.986205043717118e-05, "loss": 3.2154, "step": 1920 }, { "epoch": 0.02, "learning_rate": 9.986129178250884e-05, "loss": 3.1967, "step": 1925 }, { "epoch": 0.03, "learning_rate": 9.986053105034723e-05, "loss": 3.1087, "step": 1930 }, { "epoch": 0.03, "learning_rate": 9.985976824071804e-05, "loss": 3.2547, "step": 1935 }, { "epoch": 0.03, "learning_rate": 9.985900335365307e-05, "loss": 3.2338, "step": 1940 }, { "epoch": 0.03, "learning_rate": 9.985823638918417e-05, "loss": 3.1748, "step": 1945 }, { "epoch": 0.03, "learning_rate": 9.98574673473433e-05, "loss": 3.087, "step": 1950 }, { "epoch": 0.03, "learning_rate": 9.98566962281625e-05, "loss": 3.1046, "step": 1955 }, { "epoch": 0.03, "learning_rate": 9.98559230316739e-05, "loss": 3.2177, "step": 1960 }, { "epoch": 0.03, "learning_rate": 9.985514775790973e-05, "loss": 3.2079, "step": 1965 }, { "epoch": 0.03, "learning_rate": 9.985437040690229e-05, "loss": 3.1594, "step": 1970 }, { "epoch": 0.03, "learning_rate": 9.985359097868395e-05, "loss": 3.2322, "step": 1975 }, { "epoch": 0.03, "learning_rate": 9.98528094732872e-05, "loss": 3.0075, "step": 1980 }, { "epoch": 0.03, "learning_rate": 9.985202589074459e-05, "loss": 3.0865, "step": 1985 }, { "epoch": 0.03, "learning_rate": 9.985124023108878e-05, "loss": 3.2626, "step": 1990 }, { "epoch": 0.03, "learning_rate": 9.985045249435251e-05, "loss": 3.2558, "step": 1995 }, { "epoch": 0.03, "learning_rate": 9.984966268056858e-05, "loss": 3.1046, "step": 2000 }, { "epoch": 0.03, "learning_rate": 9.984887078976992e-05, "loss": 3.151, "step": 2005 }, { "epoch": 0.03, "learning_rate": 9.984807682198951e-05, "loss": 2.9837, "step": 2010 }, { "epoch": 0.03, "learning_rate": 9.984728077726043e-05, "loss": 3.1025, "step": 2015 }, { "epoch": 0.03, "learning_rate": 9.984648265561587e-05, "loss": 3.1191, "step": 2020 }, { "epoch": 0.03, "learning_rate": 9.984568245708905e-05, "loss": 3.1812, "step": 2025 }, { "epoch": 0.03, "learning_rate": 9.984488018171334e-05, "loss": 3.0876, "step": 2030 }, { "epoch": 0.03, "learning_rate": 9.984407582952216e-05, "loss": 3.0888, "step": 2035 }, { "epoch": 0.03, "learning_rate": 9.984326940054901e-05, "loss": 3.0962, "step": 2040 }, { "epoch": 0.03, "learning_rate": 9.984246089482752e-05, "loss": 3.1936, "step": 2045 }, { "epoch": 0.03, "learning_rate": 9.984165031239133e-05, "loss": 3.2139, "step": 2050 }, { "epoch": 0.03, "learning_rate": 9.984083765327425e-05, "loss": 3.1071, "step": 2055 }, { "epoch": 0.03, "learning_rate": 9.984002291751014e-05, "loss": 3.1678, "step": 2060 }, { "epoch": 0.03, "learning_rate": 9.983920610513294e-05, "loss": 3.0255, "step": 2065 }, { "epoch": 0.03, "learning_rate": 9.983838721617666e-05, "loss": 3.1038, "step": 2070 }, { "epoch": 0.03, "learning_rate": 9.983756625067544e-05, "loss": 3.0385, "step": 2075 }, { "epoch": 0.03, "learning_rate": 9.98367432086635e-05, "loss": 3.1361, "step": 2080 }, { "epoch": 0.03, "learning_rate": 9.983591809017511e-05, "loss": 3.0351, "step": 2085 }, { "epoch": 0.03, "learning_rate": 9.983509089524467e-05, "loss": 2.9995, "step": 2090 }, { "epoch": 0.03, "learning_rate": 9.983426162390661e-05, "loss": 3.1601, "step": 2095 }, { "epoch": 0.03, "learning_rate": 9.983343027619551e-05, "loss": 3.2241, "step": 2100 }, { "epoch": 0.03, "learning_rate": 9.983259685214602e-05, "loss": 3.0754, "step": 2105 }, { "epoch": 0.03, "learning_rate": 9.983176135179284e-05, "loss": 3.1167, "step": 2110 }, { "epoch": 0.03, "learning_rate": 9.983092377517078e-05, "loss": 3.1102, "step": 2115 }, { "epoch": 0.03, "learning_rate": 9.983008412231476e-05, "loss": 3.1045, "step": 2120 }, { "epoch": 0.03, "learning_rate": 9.982924239325974e-05, "loss": 3.2415, "step": 2125 }, { "epoch": 0.03, "learning_rate": 9.982839858804082e-05, "loss": 3.2423, "step": 2130 }, { "epoch": 0.03, "learning_rate": 9.982755270669314e-05, "loss": 3.1575, "step": 2135 }, { "epoch": 0.03, "learning_rate": 9.982670474925193e-05, "loss": 3.1589, "step": 2140 }, { "epoch": 0.03, "learning_rate": 9.982585471575255e-05, "loss": 3.0738, "step": 2145 }, { "epoch": 0.03, "learning_rate": 9.98250026062304e-05, "loss": 3.232, "step": 2150 }, { "epoch": 0.03, "learning_rate": 9.982414842072098e-05, "loss": 2.9823, "step": 2155 }, { "epoch": 0.03, "learning_rate": 9.98232921592599e-05, "loss": 3.1703, "step": 2160 }, { "epoch": 0.03, "learning_rate": 9.982243382188282e-05, "loss": 3.0764, "step": 2165 }, { "epoch": 0.03, "learning_rate": 9.98215734086255e-05, "loss": 3.1259, "step": 2170 }, { "epoch": 0.03, "learning_rate": 9.982071091952379e-05, "loss": 3.0977, "step": 2175 }, { "epoch": 0.03, "learning_rate": 9.981984635461365e-05, "loss": 3.1434, "step": 2180 }, { "epoch": 0.03, "learning_rate": 9.981897971393106e-05, "loss": 3.1922, "step": 2185 }, { "epoch": 0.03, "learning_rate": 9.981811099751217e-05, "loss": 3.1504, "step": 2190 }, { "epoch": 0.03, "learning_rate": 9.981724020539316e-05, "loss": 3.0324, "step": 2195 }, { "epoch": 0.03, "learning_rate": 9.981636733761032e-05, "loss": 3.2236, "step": 2200 }, { "epoch": 0.03, "learning_rate": 9.98154923942e-05, "loss": 3.1269, "step": 2205 }, { "epoch": 0.03, "learning_rate": 9.981461537519868e-05, "loss": 2.9605, "step": 2210 }, { "epoch": 0.03, "learning_rate": 9.981373628064286e-05, "loss": 3.1818, "step": 2215 }, { "epoch": 0.03, "learning_rate": 9.981285511056921e-05, "loss": 3.199, "step": 2220 }, { "epoch": 0.03, "learning_rate": 9.981197186501443e-05, "loss": 3.089, "step": 2225 }, { "epoch": 0.03, "learning_rate": 9.98110865440153e-05, "loss": 3.1865, "step": 2230 }, { "epoch": 0.03, "learning_rate": 9.981019914760876e-05, "loss": 3.1291, "step": 2235 }, { "epoch": 0.03, "learning_rate": 9.980930967583174e-05, "loss": 3.2548, "step": 2240 }, { "epoch": 0.03, "learning_rate": 9.980841812872131e-05, "loss": 3.0319, "step": 2245 }, { "epoch": 0.03, "learning_rate": 9.98075245063146e-05, "loss": 3.1813, "step": 2250 }, { "epoch": 0.03, "learning_rate": 9.980662880864888e-05, "loss": 3.1022, "step": 2255 }, { "epoch": 0.03, "learning_rate": 9.980573103576145e-05, "loss": 3.1494, "step": 2260 }, { "epoch": 0.03, "learning_rate": 9.980483118768973e-05, "loss": 2.984, "step": 2265 }, { "epoch": 0.03, "learning_rate": 9.980392926447118e-05, "loss": 3.145, "step": 2270 }, { "epoch": 0.03, "learning_rate": 9.98030252661434e-05, "loss": 3.0024, "step": 2275 }, { "epoch": 0.03, "learning_rate": 9.980211919274407e-05, "loss": 3.1017, "step": 2280 }, { "epoch": 0.03, "learning_rate": 9.980121104431092e-05, "loss": 2.999, "step": 2285 }, { "epoch": 0.03, "learning_rate": 9.98003008208818e-05, "loss": 3.0675, "step": 2290 }, { "epoch": 0.03, "learning_rate": 9.979938852249462e-05, "loss": 3.1599, "step": 2295 }, { "epoch": 0.03, "learning_rate": 9.979847414918741e-05, "loss": 3.1161, "step": 2300 }, { "epoch": 0.03, "learning_rate": 9.979755770099825e-05, "loss": 3.0223, "step": 2305 }, { "epoch": 0.03, "learning_rate": 9.979663917796536e-05, "loss": 3.1252, "step": 2310 }, { "epoch": 0.03, "learning_rate": 9.979571858012698e-05, "loss": 3.0129, "step": 2315 }, { "epoch": 0.03, "learning_rate": 9.979479590752145e-05, "loss": 3.1559, "step": 2320 }, { "epoch": 0.03, "learning_rate": 9.979387116018725e-05, "loss": 3.0921, "step": 2325 }, { "epoch": 0.03, "learning_rate": 9.979294433816288e-05, "loss": 3.0266, "step": 2330 }, { "epoch": 0.03, "learning_rate": 9.979201544148699e-05, "loss": 3.1274, "step": 2335 }, { "epoch": 0.03, "learning_rate": 9.979108447019827e-05, "loss": 3.0526, "step": 2340 }, { "epoch": 0.03, "learning_rate": 9.97901514243355e-05, "loss": 3.087, "step": 2345 }, { "epoch": 0.03, "learning_rate": 9.978921630393756e-05, "loss": 3.0116, "step": 2350 }, { "epoch": 0.03, "learning_rate": 9.978827910904341e-05, "loss": 3.1184, "step": 2355 }, { "epoch": 0.03, "learning_rate": 9.978733983969211e-05, "loss": 3.1038, "step": 2360 }, { "epoch": 0.03, "learning_rate": 9.978639849592277e-05, "loss": 3.0825, "step": 2365 }, { "epoch": 0.03, "learning_rate": 9.978545507777465e-05, "loss": 3.1479, "step": 2370 }, { "epoch": 0.03, "learning_rate": 9.978450958528703e-05, "loss": 3.0441, "step": 2375 }, { "epoch": 0.03, "learning_rate": 9.978356201849932e-05, "loss": 3.1066, "step": 2380 }, { "epoch": 0.03, "learning_rate": 9.978261237745098e-05, "loss": 3.1446, "step": 2385 }, { "epoch": 0.03, "learning_rate": 9.97816606621816e-05, "loss": 3.0552, "step": 2390 }, { "epoch": 0.03, "learning_rate": 9.978070687273081e-05, "loss": 3.0213, "step": 2395 }, { "epoch": 0.03, "learning_rate": 9.977975100913836e-05, "loss": 3.0685, "step": 2400 }, { "epoch": 0.03, "learning_rate": 9.977879307144411e-05, "loss": 2.9938, "step": 2405 }, { "epoch": 0.03, "learning_rate": 9.977783305968791e-05, "loss": 3.0065, "step": 2410 }, { "epoch": 0.03, "learning_rate": 9.977687097390982e-05, "loss": 3.0377, "step": 2415 }, { "epoch": 0.03, "learning_rate": 9.977590681414988e-05, "loss": 2.9936, "step": 2420 }, { "epoch": 0.03, "learning_rate": 9.97749405804483e-05, "loss": 3.0972, "step": 2425 }, { "epoch": 0.03, "learning_rate": 9.97739722728453e-05, "loss": 3.3301, "step": 2430 }, { "epoch": 0.03, "learning_rate": 9.977300189138125e-05, "loss": 3.0813, "step": 2435 }, { "epoch": 0.03, "learning_rate": 9.977202943609658e-05, "loss": 3.0738, "step": 2440 }, { "epoch": 0.03, "learning_rate": 9.97710549070318e-05, "loss": 3.1485, "step": 2445 }, { "epoch": 0.03, "learning_rate": 9.977007830422754e-05, "loss": 3.0598, "step": 2450 }, { "epoch": 0.03, "learning_rate": 9.976909962772445e-05, "loss": 3.038, "step": 2455 }, { "epoch": 0.03, "learning_rate": 9.976811887756332e-05, "loss": 3.0775, "step": 2460 }, { "epoch": 0.03, "learning_rate": 9.976713605378503e-05, "loss": 3.007, "step": 2465 }, { "epoch": 0.03, "learning_rate": 9.97661511564305e-05, "loss": 2.9813, "step": 2470 }, { "epoch": 0.03, "learning_rate": 9.976516418554083e-05, "loss": 3.1444, "step": 2475 }, { "epoch": 0.03, "learning_rate": 9.976417514115706e-05, "loss": 3.2032, "step": 2480 }, { "epoch": 0.03, "learning_rate": 9.976318402332045e-05, "loss": 3.0156, "step": 2485 }, { "epoch": 0.03, "learning_rate": 9.976219083207228e-05, "loss": 3.0786, "step": 2490 }, { "epoch": 0.03, "learning_rate": 9.976119556745395e-05, "loss": 3.1876, "step": 2495 }, { "epoch": 0.03, "learning_rate": 9.976019822950691e-05, "loss": 3.0013, "step": 2500 }, { "epoch": 0.03, "learning_rate": 9.975919881827271e-05, "loss": 3.0149, "step": 2505 }, { "epoch": 0.03, "learning_rate": 9.975819733379299e-05, "loss": 3.0907, "step": 2510 }, { "epoch": 0.03, "learning_rate": 9.97571937761095e-05, "loss": 2.9867, "step": 2515 }, { "epoch": 0.03, "learning_rate": 9.975618814526404e-05, "loss": 3.0256, "step": 2520 }, { "epoch": 0.03, "learning_rate": 9.97551804412985e-05, "loss": 3.0884, "step": 2525 }, { "epoch": 0.03, "learning_rate": 9.97541706642549e-05, "loss": 3.1552, "step": 2530 }, { "epoch": 0.03, "learning_rate": 9.975315881417528e-05, "loss": 3.0722, "step": 2535 }, { "epoch": 0.03, "learning_rate": 9.97521448911018e-05, "loss": 3.1172, "step": 2540 }, { "epoch": 0.03, "learning_rate": 9.975112889507671e-05, "loss": 3.0827, "step": 2545 }, { "epoch": 0.03, "learning_rate": 9.975011082614236e-05, "loss": 3.0765, "step": 2550 }, { "epoch": 0.03, "learning_rate": 9.974909068434116e-05, "loss": 2.9946, "step": 2555 }, { "epoch": 0.03, "learning_rate": 9.974806846971561e-05, "loss": 3.1362, "step": 2560 }, { "epoch": 0.03, "learning_rate": 9.974704418230829e-05, "loss": 3.0507, "step": 2565 }, { "epoch": 0.03, "learning_rate": 9.97460178221619e-05, "loss": 3.0737, "step": 2570 }, { "epoch": 0.03, "learning_rate": 9.974498938931918e-05, "loss": 3.1159, "step": 2575 }, { "epoch": 0.03, "learning_rate": 9.974395888382301e-05, "loss": 3.0222, "step": 2580 }, { "epoch": 0.03, "learning_rate": 9.97429263057163e-05, "loss": 3.0846, "step": 2585 }, { "epoch": 0.03, "learning_rate": 9.974189165504208e-05, "loss": 3.1544, "step": 2590 }, { "epoch": 0.03, "learning_rate": 9.974085493184348e-05, "loss": 3.2247, "step": 2595 }, { "epoch": 0.03, "learning_rate": 9.973981613616366e-05, "loss": 2.9073, "step": 2600 }, { "epoch": 0.03, "learning_rate": 9.973877526804591e-05, "loss": 3.2409, "step": 2605 }, { "epoch": 0.03, "learning_rate": 9.973773232753363e-05, "loss": 3.1316, "step": 2610 }, { "epoch": 0.03, "learning_rate": 9.973668731467025e-05, "loss": 3.0049, "step": 2615 }, { "epoch": 0.03, "learning_rate": 9.97356402294993e-05, "loss": 3.1582, "step": 2620 }, { "epoch": 0.03, "learning_rate": 9.973459107206444e-05, "loss": 3.1152, "step": 2625 }, { "epoch": 0.03, "learning_rate": 9.973353984240936e-05, "loss": 2.9916, "step": 2630 }, { "epoch": 0.03, "learning_rate": 9.973248654057785e-05, "loss": 3.1701, "step": 2635 }, { "epoch": 0.03, "learning_rate": 9.973143116661383e-05, "loss": 3.0948, "step": 2640 }, { "epoch": 0.03, "learning_rate": 9.973037372056125e-05, "loss": 3.0006, "step": 2645 }, { "epoch": 0.03, "learning_rate": 9.972931420246417e-05, "loss": 3.0775, "step": 2650 }, { "epoch": 0.03, "learning_rate": 9.972825261236674e-05, "loss": 2.9505, "step": 2655 }, { "epoch": 0.03, "learning_rate": 9.972718895031319e-05, "loss": 2.9127, "step": 2660 }, { "epoch": 0.03, "learning_rate": 9.972612321634784e-05, "loss": 3.1055, "step": 2665 }, { "epoch": 0.03, "learning_rate": 9.97250554105151e-05, "loss": 3.0655, "step": 2670 }, { "epoch": 0.03, "learning_rate": 9.972398553285944e-05, "loss": 3.0904, "step": 2675 }, { "epoch": 0.03, "learning_rate": 9.972291358342545e-05, "loss": 2.9807, "step": 2680 }, { "epoch": 0.03, "learning_rate": 9.972183956225781e-05, "loss": 3.1014, "step": 2685 }, { "epoch": 0.03, "learning_rate": 9.972076346940125e-05, "loss": 3.019, "step": 2690 }, { "epoch": 0.03, "learning_rate": 9.97196853049006e-05, "loss": 3.0379, "step": 2695 }, { "epoch": 0.04, "learning_rate": 9.971860506880079e-05, "loss": 3.2943, "step": 2700 }, { "epoch": 0.04, "learning_rate": 9.971752276114685e-05, "loss": 3.1135, "step": 2705 }, { "epoch": 0.04, "learning_rate": 9.971643838198385e-05, "loss": 2.9961, "step": 2710 }, { "epoch": 0.04, "learning_rate": 9.971535193135697e-05, "loss": 3.0759, "step": 2715 }, { "epoch": 0.04, "learning_rate": 9.97142634093115e-05, "loss": 3.1541, "step": 2720 }, { "epoch": 0.04, "learning_rate": 9.971317281589277e-05, "loss": 2.9192, "step": 2725 }, { "epoch": 0.04, "learning_rate": 9.971208015114621e-05, "loss": 3.1524, "step": 2730 }, { "epoch": 0.04, "learning_rate": 9.971098541511739e-05, "loss": 3.1077, "step": 2735 }, { "epoch": 0.04, "learning_rate": 9.970988860785188e-05, "loss": 3.1107, "step": 2740 }, { "epoch": 0.04, "learning_rate": 9.970878972939542e-05, "loss": 3.216, "step": 2745 }, { "epoch": 0.04, "learning_rate": 9.970768877979375e-05, "loss": 3.0602, "step": 2750 }, { "epoch": 0.04, "learning_rate": 9.970658575909277e-05, "loss": 3.0763, "step": 2755 }, { "epoch": 0.04, "learning_rate": 9.970548066733845e-05, "loss": 3.1145, "step": 2760 }, { "epoch": 0.04, "learning_rate": 9.97043735045768e-05, "loss": 3.0715, "step": 2765 }, { "epoch": 0.04, "learning_rate": 9.970326427085397e-05, "loss": 3.1386, "step": 2770 }, { "epoch": 0.04, "learning_rate": 9.970215296621618e-05, "loss": 2.9223, "step": 2775 }, { "epoch": 0.04, "learning_rate": 9.970103959070973e-05, "loss": 3.0437, "step": 2780 }, { "epoch": 0.04, "learning_rate": 9.969992414438098e-05, "loss": 3.1019, "step": 2785 }, { "epoch": 0.04, "learning_rate": 9.969880662727647e-05, "loss": 3.0075, "step": 2790 }, { "epoch": 0.04, "learning_rate": 9.96976870394427e-05, "loss": 3.0864, "step": 2795 }, { "epoch": 0.04, "learning_rate": 9.969656538092635e-05, "loss": 2.996, "step": 2800 }, { "epoch": 0.04, "learning_rate": 9.969544165177415e-05, "loss": 3.1502, "step": 2805 }, { "epoch": 0.04, "learning_rate": 9.969431585203292e-05, "loss": 3.1609, "step": 2810 }, { "epoch": 0.04, "learning_rate": 9.969318798174956e-05, "loss": 3.108, "step": 2815 }, { "epoch": 0.04, "learning_rate": 9.969205804097106e-05, "loss": 3.1273, "step": 2820 }, { "epoch": 0.04, "learning_rate": 9.969092602974452e-05, "loss": 3.094, "step": 2825 }, { "epoch": 0.04, "learning_rate": 9.96897919481171e-05, "loss": 3.042, "step": 2830 }, { "epoch": 0.04, "learning_rate": 9.968865579613604e-05, "loss": 3.0226, "step": 2835 }, { "epoch": 0.04, "learning_rate": 9.968751757384867e-05, "loss": 3.0645, "step": 2840 }, { "epoch": 0.04, "learning_rate": 9.968637728130245e-05, "loss": 3.0348, "step": 2845 }, { "epoch": 0.04, "learning_rate": 9.968523491854487e-05, "loss": 2.9963, "step": 2850 }, { "epoch": 0.04, "learning_rate": 9.96840904856235e-05, "loss": 2.989, "step": 2855 }, { "epoch": 0.04, "learning_rate": 9.968294398258608e-05, "loss": 3.1222, "step": 2860 }, { "epoch": 0.04, "learning_rate": 9.968179540948036e-05, "loss": 3.0447, "step": 2865 }, { "epoch": 0.04, "learning_rate": 9.968064476635415e-05, "loss": 2.9716, "step": 2870 }, { "epoch": 0.04, "learning_rate": 9.967949205325545e-05, "loss": 2.9762, "step": 2875 }, { "epoch": 0.04, "learning_rate": 9.967833727023227e-05, "loss": 3.0808, "step": 2880 }, { "epoch": 0.04, "learning_rate": 9.967718041733271e-05, "loss": 2.9732, "step": 2885 }, { "epoch": 0.04, "learning_rate": 9.9676021494605e-05, "loss": 2.9453, "step": 2890 }, { "epoch": 0.04, "learning_rate": 9.96748605020974e-05, "loss": 3.0595, "step": 2895 }, { "epoch": 0.04, "learning_rate": 9.967369743985829e-05, "loss": 2.9063, "step": 2900 }, { "epoch": 0.04, "learning_rate": 9.967253230793614e-05, "loss": 3.1256, "step": 2905 }, { "epoch": 0.04, "learning_rate": 9.967136510637947e-05, "loss": 2.975, "step": 2910 }, { "epoch": 0.04, "learning_rate": 9.967019583523696e-05, "loss": 3.1142, "step": 2915 }, { "epoch": 0.04, "learning_rate": 9.966902449455729e-05, "loss": 3.0562, "step": 2920 }, { "epoch": 0.04, "learning_rate": 9.966785108438926e-05, "loss": 3.0743, "step": 2925 }, { "epoch": 0.04, "learning_rate": 9.966667560478179e-05, "loss": 3.0794, "step": 2930 }, { "epoch": 0.04, "learning_rate": 9.966549805578383e-05, "loss": 3.014, "step": 2935 }, { "epoch": 0.04, "learning_rate": 9.966431843744448e-05, "loss": 2.9659, "step": 2940 }, { "epoch": 0.04, "learning_rate": 9.966313674981283e-05, "loss": 3.1278, "step": 2945 }, { "epoch": 0.04, "learning_rate": 9.966195299293816e-05, "loss": 2.9718, "step": 2950 }, { "epoch": 0.04, "learning_rate": 9.96607671668698e-05, "loss": 3.0157, "step": 2955 }, { "epoch": 0.04, "learning_rate": 9.965957927165715e-05, "loss": 3.0097, "step": 2960 }, { "epoch": 0.04, "learning_rate": 9.965838930734966e-05, "loss": 3.1337, "step": 2965 }, { "epoch": 0.04, "learning_rate": 9.965719727399695e-05, "loss": 2.99, "step": 2970 }, { "epoch": 0.04, "learning_rate": 9.96560031716487e-05, "loss": 3.032, "step": 2975 }, { "epoch": 0.04, "learning_rate": 9.965480700035465e-05, "loss": 3.0429, "step": 2980 }, { "epoch": 0.04, "learning_rate": 9.965360876016461e-05, "loss": 3.1262, "step": 2985 }, { "epoch": 0.04, "learning_rate": 9.965240845112855e-05, "loss": 3.0263, "step": 2990 }, { "epoch": 0.04, "learning_rate": 9.965120607329646e-05, "loss": 2.9854, "step": 2995 }, { "epoch": 0.04, "learning_rate": 9.965000162671842e-05, "loss": 3.0278, "step": 3000 }, { "epoch": 0.04, "learning_rate": 9.964879511144465e-05, "loss": 3.0278, "step": 3005 }, { "epoch": 0.04, "learning_rate": 9.964758652752539e-05, "loss": 3.0889, "step": 3010 }, { "epoch": 0.04, "learning_rate": 9.964637587501102e-05, "loss": 3.0821, "step": 3015 }, { "epoch": 0.04, "learning_rate": 9.964516315395198e-05, "loss": 3.0267, "step": 3020 }, { "epoch": 0.04, "learning_rate": 9.964394836439877e-05, "loss": 3.1469, "step": 3025 }, { "epoch": 0.04, "learning_rate": 9.964273150640203e-05, "loss": 3.0737, "step": 3030 }, { "epoch": 0.04, "learning_rate": 9.964151258001247e-05, "loss": 3.0788, "step": 3035 }, { "epoch": 0.04, "learning_rate": 9.964029158528085e-05, "loss": 3.0117, "step": 3040 }, { "epoch": 0.04, "learning_rate": 9.963906852225806e-05, "loss": 3.0129, "step": 3045 }, { "epoch": 0.04, "learning_rate": 9.963784339099506e-05, "loss": 3.1274, "step": 3050 }, { "epoch": 0.04, "learning_rate": 9.963661619154289e-05, "loss": 2.9024, "step": 3055 }, { "epoch": 0.04, "learning_rate": 9.96353869239527e-05, "loss": 2.9537, "step": 3060 }, { "epoch": 0.04, "learning_rate": 9.963415558827566e-05, "loss": 3.0185, "step": 3065 }, { "epoch": 0.04, "learning_rate": 9.963292218456313e-05, "loss": 3.0433, "step": 3070 }, { "epoch": 0.04, "learning_rate": 9.963168671286647e-05, "loss": 3.1428, "step": 3075 }, { "epoch": 0.04, "learning_rate": 9.963044917323717e-05, "loss": 2.9763, "step": 3080 }, { "epoch": 0.04, "learning_rate": 9.962920956572678e-05, "loss": 3.1532, "step": 3085 }, { "epoch": 0.04, "learning_rate": 9.962796789038698e-05, "loss": 3.1069, "step": 3090 }, { "epoch": 0.04, "learning_rate": 9.962672414726946e-05, "loss": 3.0738, "step": 3095 }, { "epoch": 0.04, "learning_rate": 9.962547833642606e-05, "loss": 2.9582, "step": 3100 }, { "epoch": 0.04, "learning_rate": 9.962423045790869e-05, "loss": 3.0009, "step": 3105 }, { "epoch": 0.04, "learning_rate": 9.962298051176935e-05, "loss": 3.0097, "step": 3110 }, { "epoch": 0.04, "learning_rate": 9.962172849806011e-05, "loss": 3.0652, "step": 3115 }, { "epoch": 0.04, "learning_rate": 9.962047441683313e-05, "loss": 2.9371, "step": 3120 }, { "epoch": 0.04, "learning_rate": 9.961921826814069e-05, "loss": 2.9304, "step": 3125 }, { "epoch": 0.04, "learning_rate": 9.96179600520351e-05, "loss": 2.9778, "step": 3130 }, { "epoch": 0.04, "learning_rate": 9.961669976856879e-05, "loss": 2.9825, "step": 3135 }, { "epoch": 0.04, "learning_rate": 9.961543741779427e-05, "loss": 3.1389, "step": 3140 }, { "epoch": 0.04, "learning_rate": 9.961417299976416e-05, "loss": 3.0422, "step": 3145 }, { "epoch": 0.04, "learning_rate": 9.96129065145311e-05, "loss": 2.9288, "step": 3150 }, { "epoch": 0.04, "learning_rate": 9.961163796214789e-05, "loss": 2.896, "step": 3155 }, { "epoch": 0.04, "learning_rate": 9.961036734266738e-05, "loss": 2.9807, "step": 3160 }, { "epoch": 0.04, "learning_rate": 9.96090946561425e-05, "loss": 2.9945, "step": 3165 }, { "epoch": 0.04, "learning_rate": 9.960781990262631e-05, "loss": 2.9773, "step": 3170 }, { "epoch": 0.04, "learning_rate": 9.960654308217188e-05, "loss": 2.9703, "step": 3175 }, { "epoch": 0.04, "learning_rate": 9.960526419483243e-05, "loss": 2.8595, "step": 3180 }, { "epoch": 0.04, "learning_rate": 9.960398324066124e-05, "loss": 3.0417, "step": 3185 }, { "epoch": 0.04, "learning_rate": 9.960270021971168e-05, "loss": 2.9208, "step": 3190 }, { "epoch": 0.04, "learning_rate": 9.960141513203722e-05, "loss": 2.9939, "step": 3195 }, { "epoch": 0.04, "learning_rate": 9.96001279776914e-05, "loss": 2.8803, "step": 3200 }, { "epoch": 0.04, "learning_rate": 9.959883875672784e-05, "loss": 3.0251, "step": 3205 }, { "epoch": 0.04, "learning_rate": 9.959754746920027e-05, "loss": 2.906, "step": 3210 }, { "epoch": 0.04, "learning_rate": 9.959625411516249e-05, "loss": 3.1077, "step": 3215 }, { "epoch": 0.04, "learning_rate": 9.959495869466837e-05, "loss": 2.9544, "step": 3220 }, { "epoch": 0.04, "learning_rate": 9.95936612077719e-05, "loss": 2.9592, "step": 3225 }, { "epoch": 0.04, "learning_rate": 9.959236165452714e-05, "loss": 2.9108, "step": 3230 }, { "epoch": 0.04, "learning_rate": 9.959106003498824e-05, "loss": 2.9147, "step": 3235 }, { "epoch": 0.04, "learning_rate": 9.958975634920943e-05, "loss": 3.0167, "step": 3240 }, { "epoch": 0.04, "learning_rate": 9.958845059724502e-05, "loss": 3.0868, "step": 3245 }, { "epoch": 0.04, "learning_rate": 9.958714277914942e-05, "loss": 3.0127, "step": 3250 }, { "epoch": 0.04, "learning_rate": 9.958583289497714e-05, "loss": 2.9322, "step": 3255 }, { "epoch": 0.04, "learning_rate": 9.958452094478273e-05, "loss": 2.97, "step": 3260 }, { "epoch": 0.04, "learning_rate": 9.958320692862086e-05, "loss": 2.9601, "step": 3265 }, { "epoch": 0.04, "learning_rate": 9.958189084654628e-05, "loss": 3.0703, "step": 3270 }, { "epoch": 0.04, "learning_rate": 9.958057269861383e-05, "loss": 3.0436, "step": 3275 }, { "epoch": 0.04, "learning_rate": 9.957925248487843e-05, "loss": 3.0255, "step": 3280 }, { "epoch": 0.04, "learning_rate": 9.957793020539508e-05, "loss": 3.0689, "step": 3285 }, { "epoch": 0.04, "learning_rate": 9.957660586021888e-05, "loss": 3.022, "step": 3290 }, { "epoch": 0.04, "learning_rate": 9.957527944940502e-05, "loss": 3.0056, "step": 3295 }, { "epoch": 0.04, "learning_rate": 9.957395097300874e-05, "loss": 2.9736, "step": 3300 }, { "epoch": 0.04, "learning_rate": 9.957262043108542e-05, "loss": 2.9765, "step": 3305 }, { "epoch": 0.04, "learning_rate": 9.957128782369049e-05, "loss": 3.1127, "step": 3310 }, { "epoch": 0.04, "learning_rate": 9.956995315087945e-05, "loss": 3.0416, "step": 3315 }, { "epoch": 0.04, "learning_rate": 9.956861641270794e-05, "loss": 3.0098, "step": 3320 }, { "epoch": 0.04, "learning_rate": 9.956727760923164e-05, "loss": 3.0136, "step": 3325 }, { "epoch": 0.04, "learning_rate": 9.956593674050634e-05, "loss": 3.0541, "step": 3330 }, { "epoch": 0.04, "learning_rate": 9.956459380658791e-05, "loss": 3.1758, "step": 3335 }, { "epoch": 0.04, "learning_rate": 9.95632488075323e-05, "loss": 2.9674, "step": 3340 }, { "epoch": 0.04, "learning_rate": 9.956190174339552e-05, "loss": 3.1105, "step": 3345 }, { "epoch": 0.04, "learning_rate": 9.956055261423375e-05, "loss": 2.9755, "step": 3350 }, { "epoch": 0.04, "learning_rate": 9.955920142010317e-05, "loss": 2.852, "step": 3355 }, { "epoch": 0.04, "learning_rate": 9.95578481610601e-05, "loss": 3.0009, "step": 3360 }, { "epoch": 0.04, "learning_rate": 9.955649283716089e-05, "loss": 3.0686, "step": 3365 }, { "epoch": 0.04, "learning_rate": 9.955513544846205e-05, "loss": 3.0446, "step": 3370 }, { "epoch": 0.04, "learning_rate": 9.955377599502009e-05, "loss": 3.0223, "step": 3375 }, { "epoch": 0.04, "learning_rate": 9.95524144768917e-05, "loss": 2.9742, "step": 3380 }, { "epoch": 0.04, "learning_rate": 9.955105089413358e-05, "loss": 3.049, "step": 3385 }, { "epoch": 0.04, "learning_rate": 9.954968524680254e-05, "loss": 2.9808, "step": 3390 }, { "epoch": 0.04, "learning_rate": 9.954831753495551e-05, "loss": 2.959, "step": 3395 }, { "epoch": 0.04, "learning_rate": 9.954694775864946e-05, "loss": 2.9679, "step": 3400 }, { "epoch": 0.04, "learning_rate": 9.954557591794145e-05, "loss": 3.0502, "step": 3405 }, { "epoch": 0.04, "learning_rate": 9.954420201288866e-05, "loss": 3.03, "step": 3410 }, { "epoch": 0.04, "learning_rate": 9.954282604354832e-05, "loss": 3.1245, "step": 3415 }, { "epoch": 0.04, "learning_rate": 9.954144800997775e-05, "loss": 3.068, "step": 3420 }, { "epoch": 0.04, "learning_rate": 9.95400679122344e-05, "loss": 3.0936, "step": 3425 }, { "epoch": 0.04, "learning_rate": 9.953868575037575e-05, "loss": 3.0323, "step": 3430 }, { "epoch": 0.04, "learning_rate": 9.953730152445939e-05, "loss": 2.9972, "step": 3435 }, { "epoch": 0.04, "learning_rate": 9.9535915234543e-05, "loss": 3.0967, "step": 3440 }, { "epoch": 0.04, "learning_rate": 9.953452688068434e-05, "loss": 3.0512, "step": 3445 }, { "epoch": 0.04, "learning_rate": 9.953313646294125e-05, "loss": 3.0011, "step": 3450 }, { "epoch": 0.04, "learning_rate": 9.953174398137166e-05, "loss": 3.0654, "step": 3455 }, { "epoch": 0.04, "learning_rate": 9.953034943603361e-05, "loss": 3.0531, "step": 3460 }, { "epoch": 0.04, "learning_rate": 9.952895282698517e-05, "loss": 3.0334, "step": 3465 }, { "epoch": 0.05, "learning_rate": 9.952755415428456e-05, "loss": 3.0665, "step": 3470 }, { "epoch": 0.05, "learning_rate": 9.952615341799006e-05, "loss": 2.8184, "step": 3475 }, { "epoch": 0.05, "learning_rate": 9.952475061816e-05, "loss": 3.0243, "step": 3480 }, { "epoch": 0.05, "learning_rate": 9.952334575485287e-05, "loss": 3.0932, "step": 3485 }, { "epoch": 0.05, "learning_rate": 9.952193882812718e-05, "loss": 2.992, "step": 3490 }, { "epoch": 0.05, "learning_rate": 9.952052983804152e-05, "loss": 2.9772, "step": 3495 }, { "epoch": 0.05, "learning_rate": 9.951911878465465e-05, "loss": 2.9722, "step": 3500 }, { "epoch": 0.05, "learning_rate": 9.951770566802535e-05, "loss": 2.9536, "step": 3505 }, { "epoch": 0.05, "learning_rate": 9.951629048821248e-05, "loss": 3.0765, "step": 3510 }, { "epoch": 0.05, "learning_rate": 9.951487324527502e-05, "loss": 3.0754, "step": 3515 }, { "epoch": 0.05, "learning_rate": 9.9513453939272e-05, "loss": 3.0972, "step": 3520 }, { "epoch": 0.05, "learning_rate": 9.951203257026259e-05, "loss": 3.0927, "step": 3525 }, { "epoch": 0.05, "learning_rate": 9.951060913830597e-05, "loss": 3.0237, "step": 3530 }, { "epoch": 0.05, "learning_rate": 9.95091836434615e-05, "loss": 2.9457, "step": 3535 }, { "epoch": 0.05, "learning_rate": 9.950775608578852e-05, "loss": 3.0165, "step": 3540 }, { "epoch": 0.05, "learning_rate": 9.950632646534654e-05, "loss": 2.9489, "step": 3545 }, { "epoch": 0.05, "learning_rate": 9.950489478219513e-05, "loss": 2.9696, "step": 3550 }, { "epoch": 0.05, "learning_rate": 9.950346103639392e-05, "loss": 2.905, "step": 3555 }, { "epoch": 0.05, "learning_rate": 9.950202522800267e-05, "loss": 2.9346, "step": 3560 }, { "epoch": 0.05, "learning_rate": 9.950058735708119e-05, "loss": 3.0025, "step": 3565 }, { "epoch": 0.05, "learning_rate": 9.94991474236894e-05, "loss": 2.979, "step": 3570 }, { "epoch": 0.05, "learning_rate": 9.949770542788727e-05, "loss": 2.9718, "step": 3575 }, { "epoch": 0.05, "learning_rate": 9.949626136973492e-05, "loss": 3.0456, "step": 3580 }, { "epoch": 0.05, "learning_rate": 9.949481524929249e-05, "loss": 3.0618, "step": 3585 }, { "epoch": 0.05, "learning_rate": 9.949336706662024e-05, "loss": 2.9569, "step": 3590 }, { "epoch": 0.05, "learning_rate": 9.949191682177853e-05, "loss": 3.0891, "step": 3595 }, { "epoch": 0.05, "learning_rate": 9.949046451482775e-05, "loss": 3.068, "step": 3600 }, { "epoch": 0.05, "learning_rate": 9.948901014582843e-05, "loss": 3.0835, "step": 3605 }, { "epoch": 0.05, "learning_rate": 9.948755371484118e-05, "loss": 3.1168, "step": 3610 }, { "epoch": 0.05, "learning_rate": 9.948609522192665e-05, "loss": 2.9859, "step": 3615 }, { "epoch": 0.05, "learning_rate": 9.948463466714563e-05, "loss": 2.9355, "step": 3620 }, { "epoch": 0.05, "learning_rate": 9.948317205055898e-05, "loss": 3.1662, "step": 3625 }, { "epoch": 0.05, "learning_rate": 9.948170737222762e-05, "loss": 3.065, "step": 3630 }, { "epoch": 0.05, "learning_rate": 9.948024063221259e-05, "loss": 3.0994, "step": 3635 }, { "epoch": 0.05, "learning_rate": 9.947877183057501e-05, "loss": 2.8956, "step": 3640 }, { "epoch": 0.05, "learning_rate": 9.947730096737609e-05, "loss": 2.8912, "step": 3645 }, { "epoch": 0.05, "learning_rate": 9.947582804267706e-05, "loss": 3.0538, "step": 3650 }, { "epoch": 0.05, "learning_rate": 9.947435305653934e-05, "loss": 3.015, "step": 3655 }, { "epoch": 0.05, "learning_rate": 9.947287600902438e-05, "loss": 2.9891, "step": 3660 }, { "epoch": 0.05, "learning_rate": 9.94713969001937e-05, "loss": 2.9873, "step": 3665 }, { "epoch": 0.05, "learning_rate": 9.946991573010893e-05, "loss": 2.9827, "step": 3670 }, { "epoch": 0.05, "learning_rate": 9.946843249883182e-05, "loss": 2.9125, "step": 3675 }, { "epoch": 0.05, "learning_rate": 9.946694720642413e-05, "loss": 3.0632, "step": 3680 }, { "epoch": 0.05, "learning_rate": 9.946545985294775e-05, "loss": 2.8291, "step": 3685 }, { "epoch": 0.05, "learning_rate": 9.946397043846469e-05, "loss": 2.9844, "step": 3690 }, { "epoch": 0.05, "learning_rate": 9.946247896303695e-05, "loss": 2.9212, "step": 3695 }, { "epoch": 0.05, "learning_rate": 9.946098542672672e-05, "loss": 3.0866, "step": 3700 }, { "epoch": 0.05, "learning_rate": 9.945948982959621e-05, "loss": 3.1144, "step": 3705 }, { "epoch": 0.05, "learning_rate": 9.945799217170773e-05, "loss": 2.9908, "step": 3710 }, { "epoch": 0.05, "learning_rate": 9.94564924531237e-05, "loss": 2.9293, "step": 3715 }, { "epoch": 0.05, "learning_rate": 9.945499067390658e-05, "loss": 2.9391, "step": 3720 }, { "epoch": 0.05, "learning_rate": 9.945348683411894e-05, "loss": 3.0791, "step": 3725 }, { "epoch": 0.05, "learning_rate": 9.945198093382349e-05, "loss": 2.9216, "step": 3730 }, { "epoch": 0.05, "learning_rate": 9.94504729730829e-05, "loss": 2.9672, "step": 3735 }, { "epoch": 0.05, "learning_rate": 9.944896295196007e-05, "loss": 3.0453, "step": 3740 }, { "epoch": 0.05, "learning_rate": 9.944745087051788e-05, "loss": 2.9516, "step": 3745 }, { "epoch": 0.05, "learning_rate": 9.944593672881932e-05, "loss": 2.8246, "step": 3750 }, { "epoch": 0.05, "learning_rate": 9.944442052692751e-05, "loss": 2.9447, "step": 3755 }, { "epoch": 0.05, "learning_rate": 9.94429022649056e-05, "loss": 2.964, "step": 3760 }, { "epoch": 0.05, "learning_rate": 9.944138194281685e-05, "loss": 2.9512, "step": 3765 }, { "epoch": 0.05, "learning_rate": 9.943985956072461e-05, "loss": 2.9784, "step": 3770 }, { "epoch": 0.05, "learning_rate": 9.943833511869232e-05, "loss": 3.0268, "step": 3775 }, { "epoch": 0.05, "learning_rate": 9.94368086167835e-05, "loss": 2.9564, "step": 3780 }, { "epoch": 0.05, "learning_rate": 9.943528005506173e-05, "loss": 2.9699, "step": 3785 }, { "epoch": 0.05, "learning_rate": 9.943374943359071e-05, "loss": 2.9817, "step": 3790 }, { "epoch": 0.05, "learning_rate": 9.943221675243422e-05, "loss": 2.8321, "step": 3795 }, { "epoch": 0.05, "learning_rate": 9.943068201165611e-05, "loss": 2.8718, "step": 3800 }, { "epoch": 0.05, "learning_rate": 9.942914521132032e-05, "loss": 3.1003, "step": 3805 }, { "epoch": 0.05, "learning_rate": 9.94276063514909e-05, "loss": 3.1042, "step": 3810 }, { "epoch": 0.05, "learning_rate": 9.942606543223196e-05, "loss": 3.0337, "step": 3815 }, { "epoch": 0.05, "learning_rate": 9.942452245360772e-05, "loss": 2.9428, "step": 3820 }, { "epoch": 0.05, "learning_rate": 9.942297741568243e-05, "loss": 2.7384, "step": 3825 }, { "epoch": 0.05, "learning_rate": 9.942143031852049e-05, "loss": 3.0969, "step": 3830 }, { "epoch": 0.05, "learning_rate": 9.941988116218635e-05, "loss": 2.8646, "step": 3835 }, { "epoch": 0.05, "learning_rate": 9.941832994674458e-05, "loss": 3.0429, "step": 3840 }, { "epoch": 0.05, "learning_rate": 9.941677667225979e-05, "loss": 2.9304, "step": 3845 }, { "epoch": 0.05, "learning_rate": 9.94152213387967e-05, "loss": 2.953, "step": 3850 }, { "epoch": 0.05, "learning_rate": 9.941366394642012e-05, "loss": 2.9688, "step": 3855 }, { "epoch": 0.05, "learning_rate": 9.941210449519493e-05, "loss": 2.8466, "step": 3860 }, { "epoch": 0.05, "learning_rate": 9.941054298518612e-05, "loss": 3.0085, "step": 3865 }, { "epoch": 0.05, "learning_rate": 9.940897941645875e-05, "loss": 3.0243, "step": 3870 }, { "epoch": 0.05, "learning_rate": 9.940741378907796e-05, "loss": 3.0681, "step": 3875 }, { "epoch": 0.05, "learning_rate": 9.940584610310899e-05, "loss": 2.9454, "step": 3880 }, { "epoch": 0.05, "learning_rate": 9.940427635861713e-05, "loss": 2.9484, "step": 3885 }, { "epoch": 0.05, "learning_rate": 9.940270455566783e-05, "loss": 2.9525, "step": 3890 }, { "epoch": 0.05, "learning_rate": 9.940113069432656e-05, "loss": 2.9672, "step": 3895 }, { "epoch": 0.05, "learning_rate": 9.939955477465887e-05, "loss": 3.077, "step": 3900 }, { "epoch": 0.05, "learning_rate": 9.939797679673044e-05, "loss": 3.0428, "step": 3905 }, { "epoch": 0.05, "learning_rate": 9.939639676060703e-05, "loss": 3.0578, "step": 3910 }, { "epoch": 0.05, "learning_rate": 9.939481466635448e-05, "loss": 3.0489, "step": 3915 }, { "epoch": 0.05, "learning_rate": 9.939323051403869e-05, "loss": 3.0481, "step": 3920 }, { "epoch": 0.05, "learning_rate": 9.939164430372566e-05, "loss": 2.8768, "step": 3925 }, { "epoch": 0.05, "learning_rate": 9.939005603548148e-05, "loss": 2.9702, "step": 3930 }, { "epoch": 0.05, "learning_rate": 9.938846570937236e-05, "loss": 2.795, "step": 3935 }, { "epoch": 0.05, "learning_rate": 9.938687332546453e-05, "loss": 2.879, "step": 3940 }, { "epoch": 0.05, "learning_rate": 9.938527888382432e-05, "loss": 3.0027, "step": 3945 }, { "epoch": 0.05, "learning_rate": 9.93836823845182e-05, "loss": 3.055, "step": 3950 }, { "epoch": 0.05, "learning_rate": 9.938208382761269e-05, "loss": 2.8872, "step": 3955 }, { "epoch": 0.05, "learning_rate": 9.938048321317436e-05, "loss": 2.9879, "step": 3960 }, { "epoch": 0.05, "learning_rate": 9.937888054126995e-05, "loss": 3.0017, "step": 3965 }, { "epoch": 0.05, "learning_rate": 9.937727581196618e-05, "loss": 2.844, "step": 3970 }, { "epoch": 0.05, "learning_rate": 9.937566902532996e-05, "loss": 2.9849, "step": 3975 }, { "epoch": 0.05, "learning_rate": 9.93740601814282e-05, "loss": 2.8629, "step": 3980 }, { "epoch": 0.05, "learning_rate": 9.937244928032796e-05, "loss": 2.9815, "step": 3985 }, { "epoch": 0.05, "learning_rate": 9.937083632209637e-05, "loss": 2.9867, "step": 3990 }, { "epoch": 0.05, "learning_rate": 9.936922130680058e-05, "loss": 3.0226, "step": 3995 }, { "epoch": 0.05, "learning_rate": 9.936760423450794e-05, "loss": 2.9043, "step": 4000 }, { "epoch": 0.05, "learning_rate": 9.936598510528579e-05, "loss": 2.8883, "step": 4005 }, { "epoch": 0.05, "learning_rate": 9.936436391920161e-05, "loss": 2.9002, "step": 4010 }, { "epoch": 0.05, "learning_rate": 9.936274067632294e-05, "loss": 2.908, "step": 4015 }, { "epoch": 0.05, "learning_rate": 9.936111537671742e-05, "loss": 2.9874, "step": 4020 }, { "epoch": 0.05, "learning_rate": 9.935948802045275e-05, "loss": 2.7665, "step": 4025 }, { "epoch": 0.05, "learning_rate": 9.935785860759675e-05, "loss": 2.8691, "step": 4030 }, { "epoch": 0.05, "learning_rate": 9.935622713821732e-05, "loss": 2.9203, "step": 4035 }, { "epoch": 0.05, "learning_rate": 9.935459361238242e-05, "loss": 2.9192, "step": 4040 }, { "epoch": 0.05, "learning_rate": 9.935295803016012e-05, "loss": 3.0162, "step": 4045 }, { "epoch": 0.05, "learning_rate": 9.935132039161857e-05, "loss": 2.9672, "step": 4050 }, { "epoch": 0.05, "learning_rate": 9.934968069682597e-05, "loss": 2.9416, "step": 4055 }, { "epoch": 0.05, "learning_rate": 9.934803894585069e-05, "loss": 3.0276, "step": 4060 }, { "epoch": 0.05, "learning_rate": 9.934639513876111e-05, "loss": 2.8751, "step": 4065 }, { "epoch": 0.05, "learning_rate": 9.934474927562572e-05, "loss": 2.9831, "step": 4070 }, { "epoch": 0.05, "learning_rate": 9.93431013565131e-05, "loss": 3.0012, "step": 4075 }, { "epoch": 0.05, "learning_rate": 9.934145138149189e-05, "loss": 2.8598, "step": 4080 }, { "epoch": 0.05, "learning_rate": 9.933979935063087e-05, "loss": 2.8738, "step": 4085 }, { "epoch": 0.05, "learning_rate": 9.933814526399884e-05, "loss": 2.9897, "step": 4090 }, { "epoch": 0.05, "learning_rate": 9.933648912166476e-05, "loss": 3.0321, "step": 4095 }, { "epoch": 0.05, "learning_rate": 9.933483092369761e-05, "loss": 2.9749, "step": 4100 }, { "epoch": 0.05, "learning_rate": 9.933317067016648e-05, "loss": 2.9229, "step": 4105 }, { "epoch": 0.05, "learning_rate": 9.933150836114054e-05, "loss": 3.0025, "step": 4110 }, { "epoch": 0.05, "learning_rate": 9.932984399668905e-05, "loss": 2.8406, "step": 4115 }, { "epoch": 0.05, "learning_rate": 9.932817757688138e-05, "loss": 2.8229, "step": 4120 }, { "epoch": 0.05, "learning_rate": 9.932650910178694e-05, "loss": 2.9127, "step": 4125 }, { "epoch": 0.05, "learning_rate": 9.932483857147524e-05, "loss": 2.9603, "step": 4130 }, { "epoch": 0.05, "learning_rate": 9.932316598601592e-05, "loss": 2.9961, "step": 4135 }, { "epoch": 0.05, "learning_rate": 9.932149134547863e-05, "loss": 2.9197, "step": 4140 }, { "epoch": 0.05, "learning_rate": 9.931981464993317e-05, "loss": 2.9754, "step": 4145 }, { "epoch": 0.05, "learning_rate": 9.931813589944938e-05, "loss": 3.0895, "step": 4150 }, { "epoch": 0.05, "learning_rate": 9.931645509409724e-05, "loss": 2.9594, "step": 4155 }, { "epoch": 0.05, "learning_rate": 9.931477223394674e-05, "loss": 2.9627, "step": 4160 }, { "epoch": 0.05, "learning_rate": 9.931308731906804e-05, "loss": 3.012, "step": 4165 }, { "epoch": 0.05, "learning_rate": 9.93114003495313e-05, "loss": 2.9217, "step": 4170 }, { "epoch": 0.05, "learning_rate": 9.930971132540683e-05, "loss": 3.084, "step": 4175 }, { "epoch": 0.05, "learning_rate": 9.9308020246765e-05, "loss": 3.0098, "step": 4180 }, { "epoch": 0.05, "learning_rate": 9.930632711367629e-05, "loss": 3.0325, "step": 4185 }, { "epoch": 0.05, "learning_rate": 9.930463192621122e-05, "loss": 2.9338, "step": 4190 }, { "epoch": 0.05, "learning_rate": 9.930293468444043e-05, "loss": 2.937, "step": 4195 }, { "epoch": 0.05, "learning_rate": 9.930123538843463e-05, "loss": 3.0385, "step": 4200 }, { "epoch": 0.05, "learning_rate": 9.929953403826465e-05, "loss": 2.944, "step": 4205 }, { "epoch": 0.05, "learning_rate": 9.929783063400133e-05, "loss": 2.9226, "step": 4210 }, { "epoch": 0.05, "learning_rate": 9.929612517571566e-05, "loss": 3.0018, "step": 4215 }, { "epoch": 0.05, "learning_rate": 9.929441766347873e-05, "loss": 2.8845, "step": 4220 }, { "epoch": 0.05, "learning_rate": 9.929270809736167e-05, "loss": 2.9009, "step": 4225 }, { "epoch": 0.05, "learning_rate": 9.929099647743567e-05, "loss": 2.9567, "step": 4230 }, { "epoch": 0.05, "learning_rate": 9.92892828037721e-05, "loss": 2.9221, "step": 4235 }, { "epoch": 0.06, "learning_rate": 9.928756707644234e-05, "loss": 2.8637, "step": 4240 }, { "epoch": 0.06, "learning_rate": 9.928584929551787e-05, "loss": 2.9708, "step": 4245 }, { "epoch": 0.06, "learning_rate": 9.928412946107028e-05, "loss": 2.8218, "step": 4250 }, { "epoch": 0.06, "learning_rate": 9.928240757317119e-05, "loss": 2.9268, "step": 4255 }, { "epoch": 0.06, "learning_rate": 9.92806836318924e-05, "loss": 2.8877, "step": 4260 }, { "epoch": 0.06, "learning_rate": 9.92789576373057e-05, "loss": 3.0326, "step": 4265 }, { "epoch": 0.06, "learning_rate": 9.9277229589483e-05, "loss": 2.9523, "step": 4270 }, { "epoch": 0.06, "learning_rate": 9.927549948849631e-05, "loss": 3.0924, "step": 4275 }, { "epoch": 0.06, "learning_rate": 9.927376733441774e-05, "loss": 2.9991, "step": 4280 }, { "epoch": 0.06, "learning_rate": 9.927203312731943e-05, "loss": 2.8879, "step": 4285 }, { "epoch": 0.06, "learning_rate": 9.927029686727365e-05, "loss": 2.9525, "step": 4290 }, { "epoch": 0.06, "learning_rate": 9.926855855435273e-05, "loss": 2.915, "step": 4295 }, { "epoch": 0.06, "learning_rate": 9.92668181886291e-05, "loss": 2.9933, "step": 4300 }, { "epoch": 0.06, "learning_rate": 9.92650757701753e-05, "loss": 2.907, "step": 4305 }, { "epoch": 0.06, "learning_rate": 9.926333129906391e-05, "loss": 2.9037, "step": 4310 }, { "epoch": 0.06, "learning_rate": 9.92615847753676e-05, "loss": 2.9471, "step": 4315 }, { "epoch": 0.06, "learning_rate": 9.925983619915916e-05, "loss": 2.9729, "step": 4320 }, { "epoch": 0.06, "learning_rate": 9.925808557051144e-05, "loss": 2.902, "step": 4325 }, { "epoch": 0.06, "learning_rate": 9.925633288949737e-05, "loss": 2.8634, "step": 4330 }, { "epoch": 0.06, "learning_rate": 9.925457815618999e-05, "loss": 2.892, "step": 4335 }, { "epoch": 0.06, "learning_rate": 9.925282137066241e-05, "loss": 2.9493, "step": 4340 }, { "epoch": 0.06, "learning_rate": 9.925106253298784e-05, "loss": 2.9278, "step": 4345 }, { "epoch": 0.06, "learning_rate": 9.924930164323953e-05, "loss": 2.9798, "step": 4350 }, { "epoch": 0.06, "learning_rate": 9.924753870149087e-05, "loss": 2.916, "step": 4355 }, { "epoch": 0.06, "learning_rate": 9.924577370781532e-05, "loss": 2.7866, "step": 4360 }, { "epoch": 0.06, "learning_rate": 9.924400666228639e-05, "loss": 2.9715, "step": 4365 }, { "epoch": 0.06, "learning_rate": 9.924223756497775e-05, "loss": 3.0228, "step": 4370 }, { "epoch": 0.06, "learning_rate": 9.924046641596307e-05, "loss": 2.9402, "step": 4375 }, { "epoch": 0.06, "learning_rate": 9.923869321531616e-05, "loss": 3.0485, "step": 4380 }, { "epoch": 0.06, "learning_rate": 9.923691796311092e-05, "loss": 2.9247, "step": 4385 }, { "epoch": 0.06, "learning_rate": 9.923514065942129e-05, "loss": 3.0022, "step": 4390 }, { "epoch": 0.06, "learning_rate": 9.923336130432133e-05, "loss": 3.0638, "step": 4395 }, { "epoch": 0.06, "learning_rate": 9.923157989788519e-05, "loss": 3.0124, "step": 4400 }, { "epoch": 0.06, "learning_rate": 9.922979644018707e-05, "loss": 2.9465, "step": 4405 }, { "epoch": 0.06, "learning_rate": 9.92280109313013e-05, "loss": 2.9966, "step": 4410 }, { "epoch": 0.06, "learning_rate": 9.922622337130228e-05, "loss": 2.9732, "step": 4415 }, { "epoch": 0.06, "learning_rate": 9.922443376026445e-05, "loss": 2.898, "step": 4420 }, { "epoch": 0.06, "learning_rate": 9.922264209826242e-05, "loss": 2.8411, "step": 4425 }, { "epoch": 0.06, "learning_rate": 9.922084838537081e-05, "loss": 2.9249, "step": 4430 }, { "epoch": 0.06, "learning_rate": 9.921905262166438e-05, "loss": 3.0275, "step": 4435 }, { "epoch": 0.06, "learning_rate": 9.921725480721792e-05, "loss": 2.945, "step": 4440 }, { "epoch": 0.06, "learning_rate": 9.921545494210638e-05, "loss": 2.9585, "step": 4445 }, { "epoch": 0.06, "learning_rate": 9.921365302640473e-05, "loss": 3.0049, "step": 4450 }, { "epoch": 0.06, "learning_rate": 9.921184906018804e-05, "loss": 2.9222, "step": 4455 }, { "epoch": 0.06, "learning_rate": 9.921004304353147e-05, "loss": 2.9882, "step": 4460 }, { "epoch": 0.06, "learning_rate": 9.92082349765103e-05, "loss": 2.9549, "step": 4465 }, { "epoch": 0.06, "learning_rate": 9.920642485919982e-05, "loss": 2.9455, "step": 4470 }, { "epoch": 0.06, "learning_rate": 9.920461269167549e-05, "loss": 3.064, "step": 4475 }, { "epoch": 0.06, "learning_rate": 9.92027984740128e-05, "loss": 3.0116, "step": 4480 }, { "epoch": 0.06, "learning_rate": 9.920098220628733e-05, "loss": 2.9927, "step": 4485 }, { "epoch": 0.06, "learning_rate": 9.919916388857476e-05, "loss": 2.9955, "step": 4490 }, { "epoch": 0.06, "learning_rate": 9.919734352095085e-05, "loss": 2.9969, "step": 4495 }, { "epoch": 0.06, "learning_rate": 9.919552110349147e-05, "loss": 3.0063, "step": 4500 }, { "epoch": 0.06, "learning_rate": 9.919369663627251e-05, "loss": 2.9267, "step": 4505 }, { "epoch": 0.06, "learning_rate": 9.919187011937004e-05, "loss": 2.9336, "step": 4510 }, { "epoch": 0.06, "learning_rate": 9.919004155286012e-05, "loss": 2.9342, "step": 4515 }, { "epoch": 0.06, "learning_rate": 9.918821093681896e-05, "loss": 2.979, "step": 4520 }, { "epoch": 0.06, "learning_rate": 9.918637827132282e-05, "loss": 2.935, "step": 4525 }, { "epoch": 0.06, "learning_rate": 9.918454355644807e-05, "loss": 2.9114, "step": 4530 }, { "epoch": 0.06, "learning_rate": 9.918270679227114e-05, "loss": 2.9629, "step": 4535 }, { "epoch": 0.06, "learning_rate": 9.918086797886857e-05, "loss": 2.9905, "step": 4540 }, { "epoch": 0.06, "learning_rate": 9.9179027116317e-05, "loss": 2.9886, "step": 4545 }, { "epoch": 0.06, "learning_rate": 9.917718420469306e-05, "loss": 2.9472, "step": 4550 }, { "epoch": 0.06, "learning_rate": 9.917533924407361e-05, "loss": 2.911, "step": 4555 }, { "epoch": 0.06, "learning_rate": 9.917349223453549e-05, "loss": 2.951, "step": 4560 }, { "epoch": 0.06, "learning_rate": 9.917164317615566e-05, "loss": 2.9634, "step": 4565 }, { "epoch": 0.06, "learning_rate": 9.916979206901117e-05, "loss": 2.8583, "step": 4570 }, { "epoch": 0.06, "learning_rate": 9.916793891317912e-05, "loss": 2.9257, "step": 4575 }, { "epoch": 0.06, "learning_rate": 9.916608370873677e-05, "loss": 2.9319, "step": 4580 }, { "epoch": 0.06, "learning_rate": 9.916422645576136e-05, "loss": 2.8214, "step": 4585 }, { "epoch": 0.06, "learning_rate": 9.916236715433032e-05, "loss": 2.9531, "step": 4590 }, { "epoch": 0.06, "learning_rate": 9.91605058045211e-05, "loss": 2.9911, "step": 4595 }, { "epoch": 0.06, "learning_rate": 9.915864240641124e-05, "loss": 2.9353, "step": 4600 }, { "epoch": 0.06, "learning_rate": 9.915677696007841e-05, "loss": 2.7067, "step": 4605 }, { "epoch": 0.06, "learning_rate": 9.915490946560033e-05, "loss": 2.9706, "step": 4610 }, { "epoch": 0.06, "learning_rate": 9.91530399230548e-05, "loss": 2.942, "step": 4615 }, { "epoch": 0.06, "learning_rate": 9.91511683325197e-05, "loss": 2.9317, "step": 4620 }, { "epoch": 0.06, "learning_rate": 9.914929469407304e-05, "loss": 2.9059, "step": 4625 }, { "epoch": 0.06, "learning_rate": 9.914741900779288e-05, "loss": 2.8647, "step": 4630 }, { "epoch": 0.06, "learning_rate": 9.914554127375734e-05, "loss": 2.9217, "step": 4635 }, { "epoch": 0.06, "learning_rate": 9.91436614920447e-05, "loss": 2.967, "step": 4640 }, { "epoch": 0.06, "learning_rate": 9.914177966273326e-05, "loss": 2.9694, "step": 4645 }, { "epoch": 0.06, "learning_rate": 9.913989578590144e-05, "loss": 2.984, "step": 4650 }, { "epoch": 0.06, "learning_rate": 9.913800986162772e-05, "loss": 2.8215, "step": 4655 }, { "epoch": 0.06, "learning_rate": 9.913612188999069e-05, "loss": 2.9914, "step": 4660 }, { "epoch": 0.06, "learning_rate": 9.913423187106899e-05, "loss": 2.9364, "step": 4665 }, { "epoch": 0.06, "learning_rate": 9.91323398049414e-05, "loss": 2.9426, "step": 4670 }, { "epoch": 0.06, "learning_rate": 9.913044569168673e-05, "loss": 2.8042, "step": 4675 }, { "epoch": 0.06, "learning_rate": 9.91285495313839e-05, "loss": 2.9083, "step": 4680 }, { "epoch": 0.06, "learning_rate": 9.912665132411194e-05, "loss": 3.0359, "step": 4685 }, { "epoch": 0.06, "learning_rate": 9.912475106994992e-05, "loss": 2.9672, "step": 4690 }, { "epoch": 0.06, "learning_rate": 9.912284876897702e-05, "loss": 2.9005, "step": 4695 }, { "epoch": 0.06, "learning_rate": 9.912094442127248e-05, "loss": 2.8533, "step": 4700 }, { "epoch": 0.06, "learning_rate": 9.911903802691569e-05, "loss": 2.9938, "step": 4705 }, { "epoch": 0.06, "learning_rate": 9.911712958598605e-05, "loss": 2.834, "step": 4710 }, { "epoch": 0.06, "learning_rate": 9.911521909856307e-05, "loss": 2.8906, "step": 4715 }, { "epoch": 0.06, "learning_rate": 9.911330656472637e-05, "loss": 2.8858, "step": 4720 }, { "epoch": 0.06, "learning_rate": 9.911139198455562e-05, "loss": 2.9367, "step": 4725 }, { "epoch": 0.06, "learning_rate": 9.910947535813063e-05, "loss": 2.8831, "step": 4730 }, { "epoch": 0.06, "learning_rate": 9.91075566855312e-05, "loss": 2.9466, "step": 4735 }, { "epoch": 0.06, "learning_rate": 9.91056359668373e-05, "loss": 2.8604, "step": 4740 }, { "epoch": 0.06, "learning_rate": 9.910371320212898e-05, "loss": 2.8832, "step": 4745 }, { "epoch": 0.06, "learning_rate": 9.910178839148632e-05, "loss": 2.9476, "step": 4750 }, { "epoch": 0.06, "learning_rate": 9.909986153498953e-05, "loss": 2.7848, "step": 4755 }, { "epoch": 0.06, "learning_rate": 9.90979326327189e-05, "loss": 2.9377, "step": 4760 }, { "epoch": 0.06, "learning_rate": 9.90960016847548e-05, "loss": 2.9085, "step": 4765 }, { "epoch": 0.06, "learning_rate": 9.909406869117766e-05, "loss": 2.9025, "step": 4770 }, { "epoch": 0.06, "learning_rate": 9.909213365206806e-05, "loss": 2.8972, "step": 4775 }, { "epoch": 0.06, "learning_rate": 9.909019656750658e-05, "loss": 2.7739, "step": 4780 }, { "epoch": 0.06, "learning_rate": 9.908825743757395e-05, "loss": 2.8594, "step": 4785 }, { "epoch": 0.06, "learning_rate": 9.908631626235099e-05, "loss": 2.8937, "step": 4790 }, { "epoch": 0.06, "learning_rate": 9.908437304191854e-05, "loss": 3.0193, "step": 4795 }, { "epoch": 0.06, "learning_rate": 9.908242777635759e-05, "loss": 3.0285, "step": 4800 }, { "epoch": 0.06, "learning_rate": 9.908048046574917e-05, "loss": 2.946, "step": 4805 }, { "epoch": 0.06, "learning_rate": 9.907853111017444e-05, "loss": 2.887, "step": 4810 }, { "epoch": 0.06, "learning_rate": 9.90765797097146e-05, "loss": 2.9824, "step": 4815 }, { "epoch": 0.06, "learning_rate": 9.907462626445096e-05, "loss": 2.8985, "step": 4820 }, { "epoch": 0.06, "learning_rate": 9.907267077446493e-05, "loss": 2.9804, "step": 4825 }, { "epoch": 0.06, "learning_rate": 9.907071323983797e-05, "loss": 2.943, "step": 4830 }, { "epoch": 0.06, "learning_rate": 9.906875366065165e-05, "loss": 2.9137, "step": 4835 }, { "epoch": 0.06, "learning_rate": 9.906679203698761e-05, "loss": 3.0239, "step": 4840 }, { "epoch": 0.06, "learning_rate": 9.906482836892758e-05, "loss": 2.974, "step": 4845 }, { "epoch": 0.06, "learning_rate": 9.906286265655338e-05, "loss": 2.8487, "step": 4850 }, { "epoch": 0.06, "learning_rate": 9.906089489994691e-05, "loss": 2.855, "step": 4855 }, { "epoch": 0.06, "learning_rate": 9.905892509919016e-05, "loss": 2.8534, "step": 4860 }, { "epoch": 0.06, "learning_rate": 9.905695325436522e-05, "loss": 2.869, "step": 4865 }, { "epoch": 0.06, "learning_rate": 9.905497936555423e-05, "loss": 2.9243, "step": 4870 }, { "epoch": 0.06, "learning_rate": 9.905300343283944e-05, "loss": 2.9892, "step": 4875 }, { "epoch": 0.06, "learning_rate": 9.905102545630316e-05, "loss": 2.94, "step": 4880 }, { "epoch": 0.06, "learning_rate": 9.904904543602782e-05, "loss": 3.1187, "step": 4885 }, { "epoch": 0.06, "learning_rate": 9.904706337209593e-05, "loss": 2.9961, "step": 4890 }, { "epoch": 0.06, "learning_rate": 9.904507926459006e-05, "loss": 2.9365, "step": 4895 }, { "epoch": 0.06, "learning_rate": 9.904309311359285e-05, "loss": 2.8629, "step": 4900 }, { "epoch": 0.06, "learning_rate": 9.904110491918712e-05, "loss": 2.8628, "step": 4905 }, { "epoch": 0.06, "learning_rate": 9.903911468145565e-05, "loss": 2.894, "step": 4910 }, { "epoch": 0.06, "learning_rate": 9.90371224004814e-05, "loss": 2.8785, "step": 4915 }, { "epoch": 0.06, "learning_rate": 9.903512807634736e-05, "loss": 2.8508, "step": 4920 }, { "epoch": 0.06, "learning_rate": 9.903313170913662e-05, "loss": 2.9349, "step": 4925 }, { "epoch": 0.06, "learning_rate": 9.903113329893239e-05, "loss": 2.9301, "step": 4930 }, { "epoch": 0.06, "learning_rate": 9.902913284581791e-05, "loss": 2.9025, "step": 4935 }, { "epoch": 0.06, "learning_rate": 9.902713034987654e-05, "loss": 2.8937, "step": 4940 }, { "epoch": 0.06, "learning_rate": 9.90251258111917e-05, "loss": 3.0754, "step": 4945 }, { "epoch": 0.06, "learning_rate": 9.902311922984693e-05, "loss": 2.9705, "step": 4950 }, { "epoch": 0.06, "learning_rate": 9.902111060592583e-05, "loss": 2.9277, "step": 4955 }, { "epoch": 0.06, "learning_rate": 9.901909993951208e-05, "loss": 2.9771, "step": 4960 }, { "epoch": 0.06, "learning_rate": 9.901708723068947e-05, "loss": 2.8593, "step": 4965 }, { "epoch": 0.06, "learning_rate": 9.901507247954185e-05, "loss": 3.0041, "step": 4970 }, { "epoch": 0.06, "learning_rate": 9.901305568615317e-05, "loss": 2.898, "step": 4975 }, { "epoch": 0.06, "learning_rate": 9.901103685060746e-05, "loss": 3.0988, "step": 4980 }, { "epoch": 0.06, "learning_rate": 9.900901597298884e-05, "loss": 2.8751, "step": 4985 }, { "epoch": 0.06, "learning_rate": 9.900699305338149e-05, "loss": 2.9137, "step": 4990 }, { "epoch": 0.06, "learning_rate": 9.900496809186972e-05, "loss": 2.9237, "step": 4995 }, { "epoch": 0.06, "learning_rate": 9.900294108853792e-05, "loss": 2.9498, "step": 5000 }, { "epoch": 0.06, "learning_rate": 9.900091204347049e-05, "loss": 3.0165, "step": 5005 }, { "epoch": 0.07, "learning_rate": 9.899888095675201e-05, "loss": 2.9165, "step": 5010 }, { "epoch": 0.07, "learning_rate": 9.89968478284671e-05, "loss": 2.8344, "step": 5015 }, { "epoch": 0.07, "learning_rate": 9.899481265870047e-05, "loss": 3.0716, "step": 5020 }, { "epoch": 0.07, "learning_rate": 9.899277544753692e-05, "loss": 2.882, "step": 5025 }, { "epoch": 0.07, "learning_rate": 9.899073619506132e-05, "loss": 2.9399, "step": 5030 }, { "epoch": 0.07, "learning_rate": 9.898869490135865e-05, "loss": 2.8863, "step": 5035 }, { "epoch": 0.07, "learning_rate": 9.898665156651395e-05, "loss": 2.9704, "step": 5040 }, { "epoch": 0.07, "learning_rate": 9.898460619061237e-05, "loss": 2.8972, "step": 5045 }, { "epoch": 0.07, "learning_rate": 9.898255877373912e-05, "loss": 2.9458, "step": 5050 }, { "epoch": 0.07, "learning_rate": 9.898050931597952e-05, "loss": 3.0931, "step": 5055 }, { "epoch": 0.07, "learning_rate": 9.897845781741894e-05, "loss": 2.961, "step": 5060 }, { "epoch": 0.07, "learning_rate": 9.897640427814289e-05, "loss": 2.8709, "step": 5065 }, { "epoch": 0.07, "learning_rate": 9.89743486982369e-05, "loss": 2.8921, "step": 5070 }, { "epoch": 0.07, "learning_rate": 9.897229107778663e-05, "loss": 2.8887, "step": 5075 }, { "epoch": 0.07, "learning_rate": 9.89702314168778e-05, "loss": 2.9556, "step": 5080 }, { "epoch": 0.07, "learning_rate": 9.896816971559626e-05, "loss": 2.8209, "step": 5085 }, { "epoch": 0.07, "learning_rate": 9.896610597402787e-05, "loss": 2.9786, "step": 5090 }, { "epoch": 0.07, "learning_rate": 9.896404019225864e-05, "loss": 2.8725, "step": 5095 }, { "epoch": 0.07, "learning_rate": 9.896197237037464e-05, "loss": 2.7786, "step": 5100 }, { "epoch": 0.07, "learning_rate": 9.895990250846203e-05, "loss": 2.9716, "step": 5105 }, { "epoch": 0.07, "learning_rate": 9.895783060660705e-05, "loss": 2.8962, "step": 5110 }, { "epoch": 0.07, "learning_rate": 9.895575666489603e-05, "loss": 2.9493, "step": 5115 }, { "epoch": 0.07, "learning_rate": 9.895368068341537e-05, "loss": 2.8934, "step": 5120 }, { "epoch": 0.07, "learning_rate": 9.895160266225156e-05, "loss": 2.9312, "step": 5125 }, { "epoch": 0.07, "learning_rate": 9.89495226014912e-05, "loss": 2.9448, "step": 5130 }, { "epoch": 0.07, "learning_rate": 9.894744050122096e-05, "loss": 3.0175, "step": 5135 }, { "epoch": 0.07, "learning_rate": 9.89453563615276e-05, "loss": 2.7861, "step": 5140 }, { "epoch": 0.07, "learning_rate": 9.894327018249792e-05, "loss": 3.0269, "step": 5145 }, { "epoch": 0.07, "learning_rate": 9.894118196421887e-05, "loss": 2.9067, "step": 5150 }, { "epoch": 0.07, "learning_rate": 9.893909170677745e-05, "loss": 2.7236, "step": 5155 }, { "epoch": 0.07, "learning_rate": 9.893699941026074e-05, "loss": 2.8902, "step": 5160 }, { "epoch": 0.07, "learning_rate": 9.893490507475593e-05, "loss": 3.0312, "step": 5165 }, { "epoch": 0.07, "learning_rate": 9.89328087003503e-05, "loss": 2.9041, "step": 5170 }, { "epoch": 0.07, "learning_rate": 9.893071028713117e-05, "loss": 2.9729, "step": 5175 }, { "epoch": 0.07, "learning_rate": 9.892860983518597e-05, "loss": 2.9835, "step": 5180 }, { "epoch": 0.07, "learning_rate": 9.892650734460222e-05, "loss": 3.0433, "step": 5185 }, { "epoch": 0.07, "learning_rate": 9.892440281546755e-05, "loss": 2.9108, "step": 5190 }, { "epoch": 0.07, "learning_rate": 9.892229624786959e-05, "loss": 2.8647, "step": 5195 }, { "epoch": 0.07, "learning_rate": 9.892018764189617e-05, "loss": 2.9883, "step": 5200 }, { "epoch": 0.07, "learning_rate": 9.89180769976351e-05, "loss": 2.849, "step": 5205 }, { "epoch": 0.07, "learning_rate": 9.891596431517437e-05, "loss": 2.8058, "step": 5210 }, { "epoch": 0.07, "learning_rate": 9.891384959460197e-05, "loss": 2.8735, "step": 5215 }, { "epoch": 0.07, "learning_rate": 9.8911732836006e-05, "loss": 2.794, "step": 5220 }, { "epoch": 0.07, "learning_rate": 9.890961403947469e-05, "loss": 2.8324, "step": 5225 }, { "epoch": 0.07, "learning_rate": 9.890749320509629e-05, "loss": 2.7313, "step": 5230 }, { "epoch": 0.07, "learning_rate": 9.89053703329592e-05, "loss": 2.879, "step": 5235 }, { "epoch": 0.07, "learning_rate": 9.890324542315184e-05, "loss": 2.963, "step": 5240 }, { "epoch": 0.07, "learning_rate": 9.890111847576275e-05, "loss": 2.8905, "step": 5245 }, { "epoch": 0.07, "learning_rate": 9.889898949088059e-05, "loss": 2.8294, "step": 5250 }, { "epoch": 0.07, "learning_rate": 9.8896858468594e-05, "loss": 2.6963, "step": 5255 }, { "epoch": 0.07, "learning_rate": 9.889472540899183e-05, "loss": 2.8163, "step": 5260 }, { "epoch": 0.07, "learning_rate": 9.889259031216291e-05, "loss": 2.8331, "step": 5265 }, { "epoch": 0.07, "learning_rate": 9.889045317819623e-05, "loss": 2.8462, "step": 5270 }, { "epoch": 0.07, "learning_rate": 9.888831400718082e-05, "loss": 3.0076, "step": 5275 }, { "epoch": 0.07, "learning_rate": 9.88861727992058e-05, "loss": 2.962, "step": 5280 }, { "epoch": 0.07, "learning_rate": 9.888402955436041e-05, "loss": 2.8301, "step": 5285 }, { "epoch": 0.07, "learning_rate": 9.888188427273395e-05, "loss": 2.8763, "step": 5290 }, { "epoch": 0.07, "learning_rate": 9.887973695441577e-05, "loss": 2.9267, "step": 5295 }, { "epoch": 0.07, "learning_rate": 9.887758759949537e-05, "loss": 2.8241, "step": 5300 }, { "epoch": 0.07, "learning_rate": 9.88754362080623e-05, "loss": 2.9033, "step": 5305 }, { "epoch": 0.07, "learning_rate": 9.88732827802062e-05, "loss": 2.9066, "step": 5310 }, { "epoch": 0.07, "learning_rate": 9.887112731601677e-05, "loss": 2.9797, "step": 5315 }, { "epoch": 0.07, "learning_rate": 9.886896981558384e-05, "loss": 2.9534, "step": 5320 }, { "epoch": 0.07, "learning_rate": 9.886681027899731e-05, "loss": 2.8911, "step": 5325 }, { "epoch": 0.07, "learning_rate": 9.886464870634715e-05, "loss": 2.9466, "step": 5330 }, { "epoch": 0.07, "learning_rate": 9.886248509772343e-05, "loss": 3.1127, "step": 5335 }, { "epoch": 0.07, "learning_rate": 9.886031945321628e-05, "loss": 2.9267, "step": 5340 }, { "epoch": 0.07, "learning_rate": 9.885815177291593e-05, "loss": 2.8579, "step": 5345 }, { "epoch": 0.07, "learning_rate": 9.885598205691273e-05, "loss": 3.0462, "step": 5350 }, { "epoch": 0.07, "learning_rate": 9.885381030529706e-05, "loss": 2.8812, "step": 5355 }, { "epoch": 0.07, "learning_rate": 9.88516365181594e-05, "loss": 2.8539, "step": 5360 }, { "epoch": 0.07, "learning_rate": 9.884946069559033e-05, "loss": 2.8866, "step": 5365 }, { "epoch": 0.07, "learning_rate": 9.884728283768052e-05, "loss": 2.8245, "step": 5370 }, { "epoch": 0.07, "learning_rate": 9.88451029445207e-05, "loss": 2.8851, "step": 5375 }, { "epoch": 0.07, "learning_rate": 9.88429210162017e-05, "loss": 2.9094, "step": 5380 }, { "epoch": 0.07, "learning_rate": 9.884073705281442e-05, "loss": 2.8819, "step": 5385 }, { "epoch": 0.07, "learning_rate": 9.883855105444985e-05, "loss": 2.8277, "step": 5390 }, { "epoch": 0.07, "learning_rate": 9.883636302119912e-05, "loss": 2.9202, "step": 5395 }, { "epoch": 0.07, "learning_rate": 9.883417295315334e-05, "loss": 3.037, "step": 5400 }, { "epoch": 0.07, "learning_rate": 9.883198085040378e-05, "loss": 2.9737, "step": 5405 }, { "epoch": 0.07, "learning_rate": 9.882978671304178e-05, "loss": 2.8467, "step": 5410 }, { "epoch": 0.07, "learning_rate": 9.882759054115876e-05, "loss": 2.8865, "step": 5415 }, { "epoch": 0.07, "learning_rate": 9.882539233484623e-05, "loss": 2.9544, "step": 5420 }, { "epoch": 0.07, "learning_rate": 9.882319209419575e-05, "loss": 2.6533, "step": 5425 }, { "epoch": 0.07, "learning_rate": 9.882098981929904e-05, "loss": 2.938, "step": 5430 }, { "epoch": 0.07, "learning_rate": 9.881878551024782e-05, "loss": 2.9573, "step": 5435 }, { "epoch": 0.07, "learning_rate": 9.881657916713394e-05, "loss": 2.8785, "step": 5440 }, { "epoch": 0.07, "learning_rate": 9.881437079004936e-05, "loss": 2.7801, "step": 5445 }, { "epoch": 0.07, "learning_rate": 9.881216037908604e-05, "loss": 2.9745, "step": 5450 }, { "epoch": 0.07, "learning_rate": 9.880994793433614e-05, "loss": 2.8505, "step": 5455 }, { "epoch": 0.07, "learning_rate": 9.88077334558918e-05, "loss": 2.8896, "step": 5460 }, { "epoch": 0.07, "learning_rate": 9.880551694384529e-05, "loss": 2.9155, "step": 5465 }, { "epoch": 0.07, "learning_rate": 9.880329839828897e-05, "loss": 2.9641, "step": 5470 }, { "epoch": 0.07, "learning_rate": 9.880107781931529e-05, "loss": 2.8136, "step": 5475 }, { "epoch": 0.07, "learning_rate": 9.879885520701675e-05, "loss": 2.7998, "step": 5480 }, { "epoch": 0.07, "learning_rate": 9.879663056148595e-05, "loss": 2.9879, "step": 5485 }, { "epoch": 0.07, "learning_rate": 9.879440388281564e-05, "loss": 2.9237, "step": 5490 }, { "epoch": 0.07, "learning_rate": 9.87921751710985e-05, "loss": 2.8661, "step": 5495 }, { "epoch": 0.07, "learning_rate": 9.878994442642748e-05, "loss": 2.8904, "step": 5500 }, { "epoch": 0.07, "learning_rate": 9.878771164889548e-05, "loss": 2.9735, "step": 5505 }, { "epoch": 0.07, "learning_rate": 9.878547683859554e-05, "loss": 2.9575, "step": 5510 }, { "epoch": 0.07, "learning_rate": 9.878323999562078e-05, "loss": 2.8647, "step": 5515 }, { "epoch": 0.07, "learning_rate": 9.878100112006438e-05, "loss": 2.9041, "step": 5520 }, { "epoch": 0.07, "learning_rate": 9.877876021201963e-05, "loss": 2.8787, "step": 5525 }, { "epoch": 0.07, "learning_rate": 9.877651727157993e-05, "loss": 2.9064, "step": 5530 }, { "epoch": 0.07, "learning_rate": 9.877427229883868e-05, "loss": 2.7472, "step": 5535 }, { "epoch": 0.07, "learning_rate": 9.877202529388947e-05, "loss": 2.9124, "step": 5540 }, { "epoch": 0.07, "learning_rate": 9.87697762568259e-05, "loss": 2.6722, "step": 5545 }, { "epoch": 0.07, "learning_rate": 9.876752518774166e-05, "loss": 2.8397, "step": 5550 }, { "epoch": 0.07, "learning_rate": 9.876527208673057e-05, "loss": 2.9191, "step": 5555 }, { "epoch": 0.07, "learning_rate": 9.876301695388649e-05, "loss": 2.9474, "step": 5560 }, { "epoch": 0.07, "learning_rate": 9.87607597893034e-05, "loss": 2.8374, "step": 5565 }, { "epoch": 0.07, "learning_rate": 9.875850059307531e-05, "loss": 2.8883, "step": 5570 }, { "epoch": 0.07, "learning_rate": 9.875623936529638e-05, "loss": 2.8187, "step": 5575 }, { "epoch": 0.07, "learning_rate": 9.875397610606083e-05, "loss": 2.8686, "step": 5580 }, { "epoch": 0.07, "learning_rate": 9.875171081546294e-05, "loss": 2.8551, "step": 5585 }, { "epoch": 0.07, "learning_rate": 9.874944349359711e-05, "loss": 2.7895, "step": 5590 }, { "epoch": 0.07, "learning_rate": 9.87471741405578e-05, "loss": 2.8343, "step": 5595 }, { "epoch": 0.07, "learning_rate": 9.874490275643958e-05, "loss": 2.9152, "step": 5600 }, { "epoch": 0.07, "learning_rate": 9.874262934133706e-05, "loss": 2.8734, "step": 5605 }, { "epoch": 0.07, "learning_rate": 9.874035389534497e-05, "loss": 2.8318, "step": 5610 }, { "epoch": 0.07, "learning_rate": 9.873807641855814e-05, "loss": 2.8536, "step": 5615 }, { "epoch": 0.07, "learning_rate": 9.873579691107146e-05, "loss": 2.9334, "step": 5620 }, { "epoch": 0.07, "learning_rate": 9.873351537297988e-05, "loss": 2.9422, "step": 5625 }, { "epoch": 0.07, "learning_rate": 9.873123180437848e-05, "loss": 2.8634, "step": 5630 }, { "epoch": 0.07, "learning_rate": 9.87289462053624e-05, "loss": 2.9943, "step": 5635 }, { "epoch": 0.07, "learning_rate": 9.872665857602687e-05, "loss": 3.0018, "step": 5640 }, { "epoch": 0.07, "learning_rate": 9.872436891646724e-05, "loss": 2.9175, "step": 5645 }, { "epoch": 0.07, "learning_rate": 9.872207722677885e-05, "loss": 2.8888, "step": 5650 }, { "epoch": 0.07, "learning_rate": 9.871978350705722e-05, "loss": 2.8655, "step": 5655 }, { "epoch": 0.07, "learning_rate": 9.871748775739792e-05, "loss": 2.8202, "step": 5660 }, { "epoch": 0.07, "learning_rate": 9.871518997789659e-05, "loss": 2.8357, "step": 5665 }, { "epoch": 0.07, "learning_rate": 9.871289016864897e-05, "loss": 2.9378, "step": 5670 }, { "epoch": 0.07, "learning_rate": 9.87105883297509e-05, "loss": 2.7266, "step": 5675 }, { "epoch": 0.07, "learning_rate": 9.870828446129827e-05, "loss": 2.9533, "step": 5680 }, { "epoch": 0.07, "learning_rate": 9.870597856338708e-05, "loss": 2.9079, "step": 5685 }, { "epoch": 0.07, "learning_rate": 9.870367063611341e-05, "loss": 2.8203, "step": 5690 }, { "epoch": 0.07, "learning_rate": 9.870136067957341e-05, "loss": 2.7533, "step": 5695 }, { "epoch": 0.07, "learning_rate": 9.869904869386332e-05, "loss": 2.7914, "step": 5700 }, { "epoch": 0.07, "learning_rate": 9.86967346790795e-05, "loss": 2.8144, "step": 5705 }, { "epoch": 0.07, "learning_rate": 9.869441863531835e-05, "loss": 2.9353, "step": 5710 }, { "epoch": 0.07, "learning_rate": 9.869210056267635e-05, "loss": 2.8382, "step": 5715 }, { "epoch": 0.07, "learning_rate": 9.86897804612501e-05, "loss": 3.0396, "step": 5720 }, { "epoch": 0.07, "learning_rate": 9.868745833113627e-05, "loss": 2.857, "step": 5725 }, { "epoch": 0.07, "learning_rate": 9.868513417243161e-05, "loss": 2.8213, "step": 5730 }, { "epoch": 0.07, "learning_rate": 9.868280798523296e-05, "loss": 2.7693, "step": 5735 }, { "epoch": 0.07, "learning_rate": 9.868047976963724e-05, "loss": 2.8511, "step": 5740 }, { "epoch": 0.07, "learning_rate": 9.867814952574146e-05, "loss": 2.9623, "step": 5745 }, { "epoch": 0.07, "learning_rate": 9.86758172536427e-05, "loss": 2.9841, "step": 5750 }, { "epoch": 0.07, "learning_rate": 9.867348295343814e-05, "loss": 2.9203, "step": 5755 }, { "epoch": 0.07, "learning_rate": 9.867114662522505e-05, "loss": 2.8737, "step": 5760 }, { "epoch": 0.07, "learning_rate": 9.866880826910076e-05, "loss": 2.8806, "step": 5765 }, { "epoch": 0.07, "learning_rate": 9.866646788516272e-05, "loss": 3.0282, "step": 5770 }, { "epoch": 0.07, "learning_rate": 9.86641254735084e-05, "loss": 2.9593, "step": 5775 }, { "epoch": 0.08, "learning_rate": 9.866178103423545e-05, "loss": 2.9296, "step": 5780 }, { "epoch": 0.08, "learning_rate": 9.865943456744154e-05, "loss": 2.9261, "step": 5785 }, { "epoch": 0.08, "learning_rate": 9.865708607322441e-05, "loss": 2.9743, "step": 5790 }, { "epoch": 0.08, "learning_rate": 9.865473555168192e-05, "loss": 2.8698, "step": 5795 }, { "epoch": 0.08, "learning_rate": 9.865238300291202e-05, "loss": 2.88, "step": 5800 }, { "epoch": 0.08, "learning_rate": 9.865002842701274e-05, "loss": 2.81, "step": 5805 }, { "epoch": 0.08, "learning_rate": 9.864767182408214e-05, "loss": 3.0062, "step": 5810 }, { "epoch": 0.08, "learning_rate": 9.864531319421846e-05, "loss": 2.7563, "step": 5815 }, { "epoch": 0.08, "learning_rate": 9.864295253751995e-05, "loss": 2.9651, "step": 5820 }, { "epoch": 0.08, "learning_rate": 9.864058985408496e-05, "loss": 2.8464, "step": 5825 }, { "epoch": 0.08, "learning_rate": 9.863822514401195e-05, "loss": 2.7724, "step": 5830 }, { "epoch": 0.08, "learning_rate": 9.863585840739944e-05, "loss": 2.8847, "step": 5835 }, { "epoch": 0.08, "learning_rate": 9.863348964434604e-05, "loss": 2.9172, "step": 5840 }, { "epoch": 0.08, "learning_rate": 9.863111885495044e-05, "loss": 2.95, "step": 5845 }, { "epoch": 0.08, "learning_rate": 9.862874603931144e-05, "loss": 2.7781, "step": 5850 }, { "epoch": 0.08, "learning_rate": 9.862637119752788e-05, "loss": 2.9345, "step": 5855 }, { "epoch": 0.08, "learning_rate": 9.862399432969873e-05, "loss": 3.0297, "step": 5860 }, { "epoch": 0.08, "learning_rate": 9.862161543592301e-05, "loss": 2.8661, "step": 5865 }, { "epoch": 0.08, "learning_rate": 9.861923451629984e-05, "loss": 2.8496, "step": 5870 }, { "epoch": 0.08, "learning_rate": 9.861685157092842e-05, "loss": 2.9451, "step": 5875 }, { "epoch": 0.08, "learning_rate": 9.861446659990805e-05, "loss": 2.9353, "step": 5880 }, { "epoch": 0.08, "learning_rate": 9.861207960333809e-05, "loss": 2.8862, "step": 5885 }, { "epoch": 0.08, "learning_rate": 9.860969058131799e-05, "loss": 2.9295, "step": 5890 }, { "epoch": 0.08, "learning_rate": 9.860729953394731e-05, "loss": 2.7591, "step": 5895 }, { "epoch": 0.08, "learning_rate": 9.860490646132566e-05, "loss": 2.9356, "step": 5900 }, { "epoch": 0.08, "learning_rate": 9.860251136355275e-05, "loss": 2.8735, "step": 5905 }, { "epoch": 0.08, "learning_rate": 9.860011424072837e-05, "loss": 2.8607, "step": 5910 }, { "epoch": 0.08, "learning_rate": 9.859771509295241e-05, "loss": 2.9387, "step": 5915 }, { "epoch": 0.08, "learning_rate": 9.859531392032482e-05, "loss": 3.0107, "step": 5920 }, { "epoch": 0.08, "learning_rate": 9.859291072294565e-05, "loss": 2.855, "step": 5925 }, { "epoch": 0.08, "learning_rate": 9.859050550091503e-05, "loss": 2.9509, "step": 5930 }, { "epoch": 0.08, "learning_rate": 9.858809825433318e-05, "loss": 2.9419, "step": 5935 }, { "epoch": 0.08, "learning_rate": 9.858568898330039e-05, "loss": 2.978, "step": 5940 }, { "epoch": 0.08, "learning_rate": 9.858327768791704e-05, "loss": 2.6415, "step": 5945 }, { "epoch": 0.08, "learning_rate": 9.858086436828362e-05, "loss": 2.9157, "step": 5950 }, { "epoch": 0.08, "learning_rate": 9.857844902450066e-05, "loss": 2.9607, "step": 5955 }, { "epoch": 0.08, "learning_rate": 9.857603165666882e-05, "loss": 2.789, "step": 5960 }, { "epoch": 0.08, "learning_rate": 9.857361226488879e-05, "loss": 2.948, "step": 5965 }, { "epoch": 0.08, "learning_rate": 9.85711908492614e-05, "loss": 2.8312, "step": 5970 }, { "epoch": 0.08, "learning_rate": 9.856876740988754e-05, "loss": 2.8675, "step": 5975 }, { "epoch": 0.08, "learning_rate": 9.856634194686815e-05, "loss": 2.8952, "step": 5980 }, { "epoch": 0.08, "learning_rate": 9.856391446030435e-05, "loss": 2.8872, "step": 5985 }, { "epoch": 0.08, "learning_rate": 9.856148495029723e-05, "loss": 2.8614, "step": 5990 }, { "epoch": 0.08, "learning_rate": 9.855905341694802e-05, "loss": 2.9191, "step": 5995 }, { "epoch": 0.08, "learning_rate": 9.855661986035805e-05, "loss": 3.0328, "step": 6000 }, { "epoch": 0.08, "learning_rate": 9.855418428062873e-05, "loss": 2.9915, "step": 6005 }, { "epoch": 0.08, "learning_rate": 9.855174667786151e-05, "loss": 2.8513, "step": 6010 }, { "epoch": 0.08, "learning_rate": 9.854930705215795e-05, "loss": 2.8199, "step": 6015 }, { "epoch": 0.08, "learning_rate": 9.854686540361972e-05, "loss": 2.8855, "step": 6020 }, { "epoch": 0.08, "learning_rate": 9.854442173234854e-05, "loss": 2.8882, "step": 6025 }, { "epoch": 0.08, "learning_rate": 9.854197603844624e-05, "loss": 2.8992, "step": 6030 }, { "epoch": 0.08, "learning_rate": 9.853952832201472e-05, "loss": 2.7864, "step": 6035 }, { "epoch": 0.08, "learning_rate": 9.853707858315596e-05, "loss": 3.0243, "step": 6040 }, { "epoch": 0.08, "learning_rate": 9.853462682197202e-05, "loss": 2.8665, "step": 6045 }, { "epoch": 0.08, "learning_rate": 9.853217303856506e-05, "loss": 2.9141, "step": 6050 }, { "epoch": 0.08, "learning_rate": 9.852971723303732e-05, "loss": 2.7684, "step": 6055 }, { "epoch": 0.08, "learning_rate": 9.852725940549112e-05, "loss": 2.862, "step": 6060 }, { "epoch": 0.08, "learning_rate": 9.852479955602888e-05, "loss": 2.8497, "step": 6065 }, { "epoch": 0.08, "learning_rate": 9.852233768475307e-05, "loss": 2.7734, "step": 6070 }, { "epoch": 0.08, "learning_rate": 9.85198737917663e-05, "loss": 2.6246, "step": 6075 }, { "epoch": 0.08, "learning_rate": 9.851740787717118e-05, "loss": 2.754, "step": 6080 }, { "epoch": 0.08, "learning_rate": 9.85149399410705e-05, "loss": 2.991, "step": 6085 }, { "epoch": 0.08, "learning_rate": 9.851246998356707e-05, "loss": 2.8066, "step": 6090 }, { "epoch": 0.08, "learning_rate": 9.850999800476378e-05, "loss": 2.8572, "step": 6095 }, { "epoch": 0.08, "learning_rate": 9.850752400476366e-05, "loss": 2.8579, "step": 6100 }, { "epoch": 0.08, "learning_rate": 9.850504798366978e-05, "loss": 2.7666, "step": 6105 }, { "epoch": 0.08, "learning_rate": 9.850256994158529e-05, "loss": 2.8369, "step": 6110 }, { "epoch": 0.08, "learning_rate": 9.850008987861346e-05, "loss": 2.9252, "step": 6115 }, { "epoch": 0.08, "learning_rate": 9.84976077948576e-05, "loss": 2.8854, "step": 6120 }, { "epoch": 0.08, "learning_rate": 9.849512369042116e-05, "loss": 2.774, "step": 6125 }, { "epoch": 0.08, "learning_rate": 9.84926375654076e-05, "loss": 2.8716, "step": 6130 }, { "epoch": 0.08, "learning_rate": 9.849014941992057e-05, "loss": 2.9595, "step": 6135 }, { "epoch": 0.08, "learning_rate": 9.848765925406366e-05, "loss": 2.8379, "step": 6140 }, { "epoch": 0.08, "learning_rate": 9.848516706794068e-05, "loss": 2.757, "step": 6145 }, { "epoch": 0.08, "learning_rate": 9.848267286165544e-05, "loss": 2.8705, "step": 6150 }, { "epoch": 0.08, "learning_rate": 9.848017663531188e-05, "loss": 2.8593, "step": 6155 }, { "epoch": 0.08, "learning_rate": 9.847767838901402e-05, "loss": 3.0704, "step": 6160 }, { "epoch": 0.08, "learning_rate": 9.847517812286591e-05, "loss": 2.82, "step": 6165 }, { "epoch": 0.08, "learning_rate": 9.847267583697176e-05, "loss": 2.8237, "step": 6170 }, { "epoch": 0.08, "learning_rate": 9.847017153143581e-05, "loss": 2.8092, "step": 6175 }, { "epoch": 0.08, "learning_rate": 9.84676652063624e-05, "loss": 2.8508, "step": 6180 }, { "epoch": 0.08, "learning_rate": 9.846515686185598e-05, "loss": 2.8595, "step": 6185 }, { "epoch": 0.08, "learning_rate": 9.846264649802105e-05, "loss": 2.8754, "step": 6190 }, { "epoch": 0.08, "learning_rate": 9.84601341149622e-05, "loss": 2.9301, "step": 6195 }, { "epoch": 0.08, "learning_rate": 9.84576197127841e-05, "loss": 2.7434, "step": 6200 }, { "epoch": 0.08, "learning_rate": 9.845510329159154e-05, "loss": 2.9491, "step": 6205 }, { "epoch": 0.08, "learning_rate": 9.845258485148937e-05, "loss": 2.8169, "step": 6210 }, { "epoch": 0.08, "learning_rate": 9.845006439258247e-05, "loss": 2.86, "step": 6215 }, { "epoch": 0.08, "learning_rate": 9.844754191497592e-05, "loss": 2.8588, "step": 6220 }, { "epoch": 0.08, "learning_rate": 9.84450174187748e-05, "loss": 2.9617, "step": 6225 }, { "epoch": 0.08, "learning_rate": 9.844249090408429e-05, "loss": 2.8893, "step": 6230 }, { "epoch": 0.08, "learning_rate": 9.843996237100965e-05, "loss": 2.7789, "step": 6235 }, { "epoch": 0.08, "learning_rate": 9.843743181965624e-05, "loss": 2.9909, "step": 6240 }, { "epoch": 0.08, "learning_rate": 9.843489925012949e-05, "loss": 2.9819, "step": 6245 }, { "epoch": 0.08, "learning_rate": 9.843236466253496e-05, "loss": 2.977, "step": 6250 }, { "epoch": 0.08, "learning_rate": 9.84298280569782e-05, "loss": 2.9615, "step": 6255 }, { "epoch": 0.08, "learning_rate": 9.842728943356492e-05, "loss": 3.072, "step": 6260 }, { "epoch": 0.08, "learning_rate": 9.84247487924009e-05, "loss": 2.8256, "step": 6265 }, { "epoch": 0.08, "learning_rate": 9.842220613359201e-05, "loss": 2.8356, "step": 6270 }, { "epoch": 0.08, "learning_rate": 9.841966145724416e-05, "loss": 2.9059, "step": 6275 }, { "epoch": 0.08, "learning_rate": 9.84171147634634e-05, "loss": 2.8973, "step": 6280 }, { "epoch": 0.08, "learning_rate": 9.841456605235582e-05, "loss": 2.9939, "step": 6285 }, { "epoch": 0.08, "learning_rate": 9.841201532402763e-05, "loss": 2.6984, "step": 6290 }, { "epoch": 0.08, "learning_rate": 9.84094625785851e-05, "loss": 2.8756, "step": 6295 }, { "epoch": 0.08, "learning_rate": 9.840690781613458e-05, "loss": 2.8495, "step": 6300 }, { "epoch": 0.08, "learning_rate": 9.840435103678254e-05, "loss": 2.9061, "step": 6305 }, { "epoch": 0.08, "learning_rate": 9.84017922406355e-05, "loss": 2.8831, "step": 6310 }, { "epoch": 0.08, "learning_rate": 9.839923142780008e-05, "loss": 3.0073, "step": 6315 }, { "epoch": 0.08, "learning_rate": 9.839666859838294e-05, "loss": 2.9052, "step": 6320 }, { "epoch": 0.08, "learning_rate": 9.839410375249091e-05, "loss": 2.7591, "step": 6325 }, { "epoch": 0.08, "learning_rate": 9.839153689023084e-05, "loss": 2.7375, "step": 6330 }, { "epoch": 0.08, "learning_rate": 9.838896801170967e-05, "loss": 2.8315, "step": 6335 }, { "epoch": 0.08, "learning_rate": 9.838639711703446e-05, "loss": 2.8905, "step": 6340 }, { "epoch": 0.08, "learning_rate": 9.838382420631229e-05, "loss": 2.8123, "step": 6345 }, { "epoch": 0.08, "learning_rate": 9.838124927965038e-05, "loss": 2.8626, "step": 6350 }, { "epoch": 0.08, "learning_rate": 9.837867233715601e-05, "loss": 2.91, "step": 6355 }, { "epoch": 0.08, "learning_rate": 9.837609337893656e-05, "loss": 2.7681, "step": 6360 }, { "epoch": 0.08, "learning_rate": 9.837351240509949e-05, "loss": 2.8682, "step": 6365 }, { "epoch": 0.08, "learning_rate": 9.837092941575232e-05, "loss": 2.9322, "step": 6370 }, { "epoch": 0.08, "learning_rate": 9.836834441100268e-05, "loss": 2.7512, "step": 6375 }, { "epoch": 0.08, "learning_rate": 9.836575739095827e-05, "loss": 2.9146, "step": 6380 }, { "epoch": 0.08, "learning_rate": 9.836316835572688e-05, "loss": 2.6334, "step": 6385 }, { "epoch": 0.08, "learning_rate": 9.83605773054164e-05, "loss": 2.9663, "step": 6390 }, { "epoch": 0.08, "learning_rate": 9.835798424013477e-05, "loss": 2.8056, "step": 6395 }, { "epoch": 0.08, "learning_rate": 9.835538915999003e-05, "loss": 2.977, "step": 6400 }, { "epoch": 0.08, "learning_rate": 9.835279206509032e-05, "loss": 2.7967, "step": 6405 }, { "epoch": 0.08, "learning_rate": 9.835019295554386e-05, "loss": 2.8182, "step": 6410 }, { "epoch": 0.08, "learning_rate": 9.83475918314589e-05, "loss": 2.7491, "step": 6415 }, { "epoch": 0.08, "learning_rate": 9.834498869294385e-05, "loss": 2.893, "step": 6420 }, { "epoch": 0.08, "learning_rate": 9.834238354010716e-05, "loss": 2.9166, "step": 6425 }, { "epoch": 0.08, "learning_rate": 9.833977637305738e-05, "loss": 2.8839, "step": 6430 }, { "epoch": 0.08, "learning_rate": 9.833716719190316e-05, "loss": 2.8859, "step": 6435 }, { "epoch": 0.08, "learning_rate": 9.833455599675317e-05, "loss": 2.8653, "step": 6440 }, { "epoch": 0.08, "learning_rate": 9.833194278771623e-05, "loss": 2.7282, "step": 6445 }, { "epoch": 0.08, "learning_rate": 9.83293275649012e-05, "loss": 2.9646, "step": 6450 }, { "epoch": 0.08, "learning_rate": 9.832671032841709e-05, "loss": 2.9523, "step": 6455 }, { "epoch": 0.08, "learning_rate": 9.832409107837293e-05, "loss": 2.8622, "step": 6460 }, { "epoch": 0.08, "learning_rate": 9.832146981487782e-05, "loss": 2.9179, "step": 6465 }, { "epoch": 0.08, "learning_rate": 9.831884653804102e-05, "loss": 2.8236, "step": 6470 }, { "epoch": 0.08, "learning_rate": 9.831622124797179e-05, "loss": 2.7657, "step": 6475 }, { "epoch": 0.08, "learning_rate": 9.831359394477957e-05, "loss": 2.8763, "step": 6480 }, { "epoch": 0.08, "learning_rate": 9.831096462857377e-05, "loss": 2.8349, "step": 6485 }, { "epoch": 0.08, "learning_rate": 9.830833329946398e-05, "loss": 2.8153, "step": 6490 }, { "epoch": 0.08, "learning_rate": 9.830569995755981e-05, "loss": 2.8729, "step": 6495 }, { "epoch": 0.08, "learning_rate": 9.830306460297099e-05, "loss": 2.8835, "step": 6500 }, { "epoch": 0.08, "learning_rate": 9.830042723580732e-05, "loss": 2.8331, "step": 6505 }, { "epoch": 0.08, "learning_rate": 9.829778785617872e-05, "loss": 2.8494, "step": 6510 }, { "epoch": 0.08, "learning_rate": 9.829514646419511e-05, "loss": 2.8553, "step": 6515 }, { "epoch": 0.08, "learning_rate": 9.829250305996658e-05, "loss": 2.7521, "step": 6520 }, { "epoch": 0.08, "learning_rate": 9.828985764360325e-05, "loss": 2.962, "step": 6525 }, { "epoch": 0.08, "learning_rate": 9.828721021521534e-05, "loss": 2.8022, "step": 6530 }, { "epoch": 0.08, "learning_rate": 9.82845607749132e-05, "loss": 2.855, "step": 6535 }, { "epoch": 0.08, "learning_rate": 9.828190932280716e-05, "loss": 2.8984, "step": 6540 }, { "epoch": 0.08, "learning_rate": 9.827925585900773e-05, "loss": 2.8641, "step": 6545 }, { "epoch": 0.09, "learning_rate": 9.827660038362546e-05, "loss": 2.9364, "step": 6550 }, { "epoch": 0.09, "learning_rate": 9.827394289677098e-05, "loss": 2.8792, "step": 6555 }, { "epoch": 0.09, "learning_rate": 9.827128339855505e-05, "loss": 2.919, "step": 6560 }, { "epoch": 0.09, "learning_rate": 9.826862188908846e-05, "loss": 2.8861, "step": 6565 }, { "epoch": 0.09, "learning_rate": 9.826595836848208e-05, "loss": 2.848, "step": 6570 }, { "epoch": 0.09, "learning_rate": 9.826329283684693e-05, "loss": 2.9422, "step": 6575 }, { "epoch": 0.09, "learning_rate": 9.826062529429402e-05, "loss": 2.7578, "step": 6580 }, { "epoch": 0.09, "learning_rate": 9.825795574093453e-05, "loss": 2.9558, "step": 6585 }, { "epoch": 0.09, "learning_rate": 9.82552841768797e-05, "loss": 2.9087, "step": 6590 }, { "epoch": 0.09, "learning_rate": 9.825261060224081e-05, "loss": 2.8252, "step": 6595 }, { "epoch": 0.09, "learning_rate": 9.824993501712927e-05, "loss": 2.8375, "step": 6600 }, { "epoch": 0.09, "learning_rate": 9.824725742165656e-05, "loss": 2.7593, "step": 6605 }, { "epoch": 0.09, "learning_rate": 9.824457781593426e-05, "loss": 3.0172, "step": 6610 }, { "epoch": 0.09, "learning_rate": 9.824189620007397e-05, "loss": 2.9138, "step": 6615 }, { "epoch": 0.09, "learning_rate": 9.823921257418749e-05, "loss": 2.8133, "step": 6620 }, { "epoch": 0.09, "learning_rate": 9.823652693838656e-05, "loss": 2.7714, "step": 6625 }, { "epoch": 0.09, "learning_rate": 9.823383929278313e-05, "loss": 2.8356, "step": 6630 }, { "epoch": 0.09, "learning_rate": 9.823114963748918e-05, "loss": 2.9722, "step": 6635 }, { "epoch": 0.09, "learning_rate": 9.822845797261675e-05, "loss": 2.6921, "step": 6640 }, { "epoch": 0.09, "learning_rate": 9.822576429827802e-05, "loss": 2.8859, "step": 6645 }, { "epoch": 0.09, "learning_rate": 9.822306861458516e-05, "loss": 2.7756, "step": 6650 }, { "epoch": 0.09, "learning_rate": 9.822037092165058e-05, "loss": 2.875, "step": 6655 }, { "epoch": 0.09, "learning_rate": 9.821767121958662e-05, "loss": 2.8634, "step": 6660 }, { "epoch": 0.09, "learning_rate": 9.821496950850578e-05, "loss": 2.8916, "step": 6665 }, { "epoch": 0.09, "learning_rate": 9.821226578852063e-05, "loss": 2.7789, "step": 6670 }, { "epoch": 0.09, "learning_rate": 9.820956005974382e-05, "loss": 2.8356, "step": 6675 }, { "epoch": 0.09, "learning_rate": 9.820685232228808e-05, "loss": 2.8547, "step": 6680 }, { "epoch": 0.09, "learning_rate": 9.820414257626623e-05, "loss": 2.9, "step": 6685 }, { "epoch": 0.09, "learning_rate": 9.820143082179118e-05, "loss": 2.8243, "step": 6690 }, { "epoch": 0.09, "learning_rate": 9.819871705897591e-05, "loss": 2.8755, "step": 6695 }, { "epoch": 0.09, "learning_rate": 9.819600128793351e-05, "loss": 2.7784, "step": 6700 }, { "epoch": 0.09, "learning_rate": 9.819328350877712e-05, "loss": 2.7706, "step": 6705 }, { "epoch": 0.09, "learning_rate": 9.819056372161998e-05, "loss": 2.9043, "step": 6710 }, { "epoch": 0.09, "learning_rate": 9.81878419265754e-05, "loss": 2.8671, "step": 6715 }, { "epoch": 0.09, "learning_rate": 9.81851181237568e-05, "loss": 2.8587, "step": 6720 }, { "epoch": 0.09, "learning_rate": 9.818239231327766e-05, "loss": 2.713, "step": 6725 }, { "epoch": 0.09, "learning_rate": 9.817966449525154e-05, "loss": 2.8241, "step": 6730 }, { "epoch": 0.09, "learning_rate": 9.817693466979213e-05, "loss": 2.7202, "step": 6735 }, { "epoch": 0.09, "learning_rate": 9.817420283701315e-05, "loss": 2.6986, "step": 6740 }, { "epoch": 0.09, "learning_rate": 9.817146899702842e-05, "loss": 2.7794, "step": 6745 }, { "epoch": 0.09, "learning_rate": 9.816873314995185e-05, "loss": 2.9248, "step": 6750 }, { "epoch": 0.09, "learning_rate": 9.816599529589742e-05, "loss": 2.7395, "step": 6755 }, { "epoch": 0.09, "learning_rate": 9.816325543497924e-05, "loss": 2.91, "step": 6760 }, { "epoch": 0.09, "learning_rate": 9.816051356731143e-05, "loss": 2.7655, "step": 6765 }, { "epoch": 0.09, "learning_rate": 9.815776969300825e-05, "loss": 2.8167, "step": 6770 }, { "epoch": 0.09, "learning_rate": 9.815502381218402e-05, "loss": 2.862, "step": 6775 }, { "epoch": 0.09, "learning_rate": 9.815227592495315e-05, "loss": 2.756, "step": 6780 }, { "epoch": 0.09, "learning_rate": 9.814952603143014e-05, "loss": 2.8802, "step": 6785 }, { "epoch": 0.09, "learning_rate": 9.814677413172955e-05, "loss": 2.8194, "step": 6790 }, { "epoch": 0.09, "learning_rate": 9.814402022596604e-05, "loss": 2.7237, "step": 6795 }, { "epoch": 0.09, "learning_rate": 9.814126431425437e-05, "loss": 2.8589, "step": 6800 }, { "epoch": 0.09, "learning_rate": 9.813850639670936e-05, "loss": 2.8987, "step": 6805 }, { "epoch": 0.09, "learning_rate": 9.81357464734459e-05, "loss": 2.7774, "step": 6810 }, { "epoch": 0.09, "learning_rate": 9.813298454457902e-05, "loss": 2.7853, "step": 6815 }, { "epoch": 0.09, "learning_rate": 9.813022061022377e-05, "loss": 2.7948, "step": 6820 }, { "epoch": 0.09, "learning_rate": 9.812745467049531e-05, "loss": 2.8463, "step": 6825 }, { "epoch": 0.09, "learning_rate": 9.81246867255089e-05, "loss": 2.8774, "step": 6830 }, { "epoch": 0.09, "learning_rate": 9.812191677537987e-05, "loss": 2.8457, "step": 6835 }, { "epoch": 0.09, "learning_rate": 9.811914482022362e-05, "loss": 2.7516, "step": 6840 }, { "epoch": 0.09, "learning_rate": 9.811637086015563e-05, "loss": 2.835, "step": 6845 }, { "epoch": 0.09, "learning_rate": 9.811359489529153e-05, "loss": 2.7701, "step": 6850 }, { "epoch": 0.09, "learning_rate": 9.811081692574693e-05, "loss": 2.7285, "step": 6855 }, { "epoch": 0.09, "learning_rate": 9.81080369516376e-05, "loss": 2.806, "step": 6860 }, { "epoch": 0.09, "learning_rate": 9.810525497307934e-05, "loss": 2.7545, "step": 6865 }, { "epoch": 0.09, "learning_rate": 9.810247099018812e-05, "loss": 2.9074, "step": 6870 }, { "epoch": 0.09, "learning_rate": 9.809968500307989e-05, "loss": 2.8285, "step": 6875 }, { "epoch": 0.09, "learning_rate": 9.809689701187074e-05, "loss": 2.8964, "step": 6880 }, { "epoch": 0.09, "learning_rate": 9.809410701667682e-05, "loss": 2.9263, "step": 6885 }, { "epoch": 0.09, "learning_rate": 9.809131501761443e-05, "loss": 2.7608, "step": 6890 }, { "epoch": 0.09, "learning_rate": 9.808852101479984e-05, "loss": 2.7865, "step": 6895 }, { "epoch": 0.09, "learning_rate": 9.808572500834949e-05, "loss": 2.9991, "step": 6900 }, { "epoch": 0.09, "learning_rate": 9.808292699837986e-05, "loss": 2.9373, "step": 6905 }, { "epoch": 0.09, "learning_rate": 9.808012698500757e-05, "loss": 2.8222, "step": 6910 }, { "epoch": 0.09, "learning_rate": 9.807732496834924e-05, "loss": 2.9273, "step": 6915 }, { "epoch": 0.09, "learning_rate": 9.807452094852165e-05, "loss": 2.7833, "step": 6920 }, { "epoch": 0.09, "learning_rate": 9.807171492564161e-05, "loss": 2.8565, "step": 6925 }, { "epoch": 0.09, "learning_rate": 9.806890689982604e-05, "loss": 2.7904, "step": 6930 }, { "epoch": 0.09, "learning_rate": 9.806609687119194e-05, "loss": 2.9192, "step": 6935 }, { "epoch": 0.09, "learning_rate": 9.806328483985641e-05, "loss": 2.8251, "step": 6940 }, { "epoch": 0.09, "learning_rate": 9.806047080593656e-05, "loss": 2.8422, "step": 6945 }, { "epoch": 0.09, "learning_rate": 9.805765476954971e-05, "loss": 2.926, "step": 6950 }, { "epoch": 0.09, "learning_rate": 9.805483673081314e-05, "loss": 2.8935, "step": 6955 }, { "epoch": 0.09, "learning_rate": 9.805201668984428e-05, "loss": 2.8243, "step": 6960 }, { "epoch": 0.09, "learning_rate": 9.804919464676063e-05, "loss": 2.9091, "step": 6965 }, { "epoch": 0.09, "learning_rate": 9.804637060167979e-05, "loss": 2.9639, "step": 6970 }, { "epoch": 0.09, "learning_rate": 9.804354455471937e-05, "loss": 2.9057, "step": 6975 }, { "epoch": 0.09, "learning_rate": 9.80407165059972e-05, "loss": 2.8447, "step": 6980 }, { "epoch": 0.09, "learning_rate": 9.803788645563104e-05, "loss": 2.7672, "step": 6985 }, { "epoch": 0.09, "learning_rate": 9.803505440373883e-05, "loss": 2.8276, "step": 6990 }, { "epoch": 0.09, "learning_rate": 9.803222035043859e-05, "loss": 2.7208, "step": 6995 }, { "epoch": 0.09, "learning_rate": 9.802938429584839e-05, "loss": 2.8599, "step": 7000 }, { "epoch": 0.09, "learning_rate": 9.802654624008638e-05, "loss": 2.7095, "step": 7005 }, { "epoch": 0.09, "learning_rate": 9.802370618327083e-05, "loss": 2.8134, "step": 7010 }, { "epoch": 0.09, "learning_rate": 9.802086412552007e-05, "loss": 2.8836, "step": 7015 }, { "epoch": 0.09, "learning_rate": 9.801802006695249e-05, "loss": 2.8154, "step": 7020 }, { "epoch": 0.09, "learning_rate": 9.801517400768663e-05, "loss": 2.86, "step": 7025 }, { "epoch": 0.09, "learning_rate": 9.801232594784102e-05, "loss": 2.9218, "step": 7030 }, { "epoch": 0.09, "learning_rate": 9.800947588753438e-05, "loss": 2.7685, "step": 7035 }, { "epoch": 0.09, "learning_rate": 9.800662382688544e-05, "loss": 2.8736, "step": 7040 }, { "epoch": 0.09, "learning_rate": 9.800376976601302e-05, "loss": 2.8022, "step": 7045 }, { "epoch": 0.09, "learning_rate": 9.800091370503605e-05, "loss": 2.9099, "step": 7050 }, { "epoch": 0.09, "learning_rate": 9.799805564407354e-05, "loss": 2.8771, "step": 7055 }, { "epoch": 0.09, "learning_rate": 9.799519558324453e-05, "loss": 2.8995, "step": 7060 }, { "epoch": 0.09, "learning_rate": 9.799233352266823e-05, "loss": 2.824, "step": 7065 }, { "epoch": 0.09, "learning_rate": 9.798946946246388e-05, "loss": 2.8831, "step": 7070 }, { "epoch": 0.09, "learning_rate": 9.798660340275079e-05, "loss": 2.844, "step": 7075 }, { "epoch": 0.09, "learning_rate": 9.79837353436484e-05, "loss": 2.8507, "step": 7080 }, { "epoch": 0.09, "learning_rate": 9.79808652852762e-05, "loss": 2.9306, "step": 7085 }, { "epoch": 0.09, "learning_rate": 9.797799322775379e-05, "loss": 2.7608, "step": 7090 }, { "epoch": 0.09, "learning_rate": 9.797511917120079e-05, "loss": 2.7321, "step": 7095 }, { "epoch": 0.09, "learning_rate": 9.7972243115737e-05, "loss": 2.7679, "step": 7100 }, { "epoch": 0.09, "learning_rate": 9.796936506148222e-05, "loss": 2.9, "step": 7105 }, { "epoch": 0.09, "learning_rate": 9.796648500855639e-05, "loss": 2.8654, "step": 7110 }, { "epoch": 0.09, "learning_rate": 9.79636029570795e-05, "loss": 2.8548, "step": 7115 }, { "epoch": 0.09, "learning_rate": 9.796071890717162e-05, "loss": 2.8215, "step": 7120 }, { "epoch": 0.09, "learning_rate": 9.795783285895293e-05, "loss": 2.8185, "step": 7125 }, { "epoch": 0.09, "learning_rate": 9.795494481254366e-05, "loss": 2.839, "step": 7130 }, { "epoch": 0.09, "learning_rate": 9.795205476806416e-05, "loss": 2.8744, "step": 7135 }, { "epoch": 0.09, "learning_rate": 9.794916272563484e-05, "loss": 2.8738, "step": 7140 }, { "epoch": 0.09, "learning_rate": 9.794626868537622e-05, "loss": 2.8715, "step": 7145 }, { "epoch": 0.09, "learning_rate": 9.794337264740884e-05, "loss": 2.7135, "step": 7150 }, { "epoch": 0.09, "learning_rate": 9.794047461185339e-05, "loss": 2.7635, "step": 7155 }, { "epoch": 0.09, "learning_rate": 9.793757457883062e-05, "loss": 2.8809, "step": 7160 }, { "epoch": 0.09, "learning_rate": 9.793467254846135e-05, "loss": 2.7928, "step": 7165 }, { "epoch": 0.09, "learning_rate": 9.79317685208665e-05, "loss": 2.7684, "step": 7170 }, { "epoch": 0.09, "learning_rate": 9.792886249616709e-05, "loss": 2.8582, "step": 7175 }, { "epoch": 0.09, "learning_rate": 9.792595447448416e-05, "loss": 2.7041, "step": 7180 }, { "epoch": 0.09, "learning_rate": 9.79230444559389e-05, "loss": 2.8933, "step": 7185 }, { "epoch": 0.09, "learning_rate": 9.792013244065255e-05, "loss": 2.9919, "step": 7190 }, { "epoch": 0.09, "learning_rate": 9.791721842874644e-05, "loss": 2.8113, "step": 7195 }, { "epoch": 0.09, "learning_rate": 9.791430242034198e-05, "loss": 2.787, "step": 7200 }, { "epoch": 0.09, "learning_rate": 9.79113844155607e-05, "loss": 2.9021, "step": 7205 }, { "epoch": 0.09, "learning_rate": 9.790846441452413e-05, "loss": 2.7611, "step": 7210 }, { "epoch": 0.09, "learning_rate": 9.790554241735397e-05, "loss": 2.7716, "step": 7215 }, { "epoch": 0.09, "learning_rate": 9.790261842417194e-05, "loss": 2.7807, "step": 7220 }, { "epoch": 0.09, "learning_rate": 9.78996924350999e-05, "loss": 2.9203, "step": 7225 }, { "epoch": 0.09, "learning_rate": 9.789676445025975e-05, "loss": 2.8463, "step": 7230 }, { "epoch": 0.09, "learning_rate": 9.789383446977347e-05, "loss": 2.8744, "step": 7235 }, { "epoch": 0.09, "learning_rate": 9.789090249376315e-05, "loss": 2.9172, "step": 7240 }, { "epoch": 0.09, "learning_rate": 9.788796852235098e-05, "loss": 2.9233, "step": 7245 }, { "epoch": 0.09, "learning_rate": 9.788503255565917e-05, "loss": 2.7821, "step": 7250 }, { "epoch": 0.09, "learning_rate": 9.788209459381006e-05, "loss": 2.8985, "step": 7255 }, { "epoch": 0.09, "learning_rate": 9.787915463692606e-05, "loss": 2.9162, "step": 7260 }, { "epoch": 0.09, "learning_rate": 9.787621268512965e-05, "loss": 2.9049, "step": 7265 }, { "epoch": 0.09, "learning_rate": 9.787326873854345e-05, "loss": 2.8864, "step": 7270 }, { "epoch": 0.09, "learning_rate": 9.787032279729009e-05, "loss": 2.832, "step": 7275 }, { "epoch": 0.09, "learning_rate": 9.786737486149231e-05, "loss": 2.8855, "step": 7280 }, { "epoch": 0.09, "learning_rate": 9.786442493127295e-05, "loss": 2.8606, "step": 7285 }, { "epoch": 0.09, "learning_rate": 9.786147300675492e-05, "loss": 3.0125, "step": 7290 }, { "epoch": 0.09, "learning_rate": 9.785851908806121e-05, "loss": 2.7943, "step": 7295 }, { "epoch": 0.09, "learning_rate": 9.785556317531491e-05, "loss": 2.8916, "step": 7300 }, { "epoch": 0.09, "learning_rate": 9.785260526863916e-05, "loss": 2.9612, "step": 7305 }, { "epoch": 0.09, "learning_rate": 9.784964536815722e-05, "loss": 2.9662, "step": 7310 }, { "epoch": 0.09, "learning_rate": 9.784668347399239e-05, "loss": 2.7763, "step": 7315 }, { "epoch": 0.09, "learning_rate": 9.784371958626811e-05, "loss": 2.7375, "step": 7320 }, { "epoch": 0.1, "learning_rate": 9.784075370510786e-05, "loss": 2.7762, "step": 7325 }, { "epoch": 0.1, "learning_rate": 9.78377858306352e-05, "loss": 2.7887, "step": 7330 }, { "epoch": 0.1, "learning_rate": 9.783481596297381e-05, "loss": 2.8804, "step": 7335 }, { "epoch": 0.1, "learning_rate": 9.783184410224741e-05, "loss": 2.8454, "step": 7340 }, { "epoch": 0.1, "learning_rate": 9.782887024857986e-05, "loss": 2.8163, "step": 7345 }, { "epoch": 0.1, "learning_rate": 9.782589440209504e-05, "loss": 2.7927, "step": 7350 }, { "epoch": 0.1, "learning_rate": 9.782291656291694e-05, "loss": 2.848, "step": 7355 }, { "epoch": 0.1, "learning_rate": 9.781993673116962e-05, "loss": 2.917, "step": 7360 }, { "epoch": 0.1, "learning_rate": 9.781695490697729e-05, "loss": 2.713, "step": 7365 }, { "epoch": 0.1, "learning_rate": 9.781397109046412e-05, "loss": 2.934, "step": 7370 }, { "epoch": 0.1, "learning_rate": 9.781098528175449e-05, "loss": 2.7823, "step": 7375 }, { "epoch": 0.1, "learning_rate": 9.780799748097277e-05, "loss": 2.8295, "step": 7380 }, { "epoch": 0.1, "learning_rate": 9.780500768824345e-05, "loss": 2.7889, "step": 7385 }, { "epoch": 0.1, "learning_rate": 9.780201590369113e-05, "loss": 2.9334, "step": 7390 }, { "epoch": 0.1, "learning_rate": 9.779902212744045e-05, "loss": 2.9727, "step": 7395 }, { "epoch": 0.1, "learning_rate": 9.779602635961613e-05, "loss": 2.7547, "step": 7400 }, { "epoch": 0.1, "learning_rate": 9.7793028600343e-05, "loss": 2.8839, "step": 7405 }, { "epoch": 0.1, "learning_rate": 9.7790028849746e-05, "loss": 2.8216, "step": 7410 }, { "epoch": 0.1, "learning_rate": 9.778702710795004e-05, "loss": 2.7814, "step": 7415 }, { "epoch": 0.1, "learning_rate": 9.778402337508026e-05, "loss": 2.9778, "step": 7420 }, { "epoch": 0.1, "learning_rate": 9.778101765126178e-05, "loss": 2.7591, "step": 7425 }, { "epoch": 0.1, "learning_rate": 9.777800993661983e-05, "loss": 2.7921, "step": 7430 }, { "epoch": 0.1, "learning_rate": 9.777500023127975e-05, "loss": 2.9163, "step": 7435 }, { "epoch": 0.1, "learning_rate": 9.777198853536694e-05, "loss": 2.7094, "step": 7440 }, { "epoch": 0.1, "learning_rate": 9.776897484900685e-05, "loss": 2.8239, "step": 7445 }, { "epoch": 0.1, "learning_rate": 9.776595917232507e-05, "loss": 2.7792, "step": 7450 }, { "epoch": 0.1, "learning_rate": 9.776294150544727e-05, "loss": 2.9131, "step": 7455 }, { "epoch": 0.1, "learning_rate": 9.775992184849916e-05, "loss": 2.8821, "step": 7460 }, { "epoch": 0.1, "learning_rate": 9.775690020160655e-05, "loss": 2.808, "step": 7465 }, { "epoch": 0.1, "learning_rate": 9.775387656489535e-05, "loss": 2.9189, "step": 7470 }, { "epoch": 0.1, "learning_rate": 9.775085093849155e-05, "loss": 2.8073, "step": 7475 }, { "epoch": 0.1, "learning_rate": 9.774782332252119e-05, "loss": 2.767, "step": 7480 }, { "epoch": 0.1, "learning_rate": 9.774479371711043e-05, "loss": 3.0012, "step": 7485 }, { "epoch": 0.1, "learning_rate": 9.77417621223855e-05, "loss": 2.8725, "step": 7490 }, { "epoch": 0.1, "learning_rate": 9.773872853847272e-05, "loss": 2.6973, "step": 7495 }, { "epoch": 0.1, "learning_rate": 9.773569296549849e-05, "loss": 2.7807, "step": 7500 }, { "epoch": 0.1, "learning_rate": 9.773265540358926e-05, "loss": 2.7432, "step": 7505 }, { "epoch": 0.1, "learning_rate": 9.772961585287163e-05, "loss": 2.7808, "step": 7510 }, { "epoch": 0.1, "learning_rate": 9.77265743134722e-05, "loss": 2.8598, "step": 7515 }, { "epoch": 0.1, "learning_rate": 9.772353078551775e-05, "loss": 2.7845, "step": 7520 }, { "epoch": 0.1, "learning_rate": 9.772048526913505e-05, "loss": 2.8126, "step": 7525 }, { "epoch": 0.1, "learning_rate": 9.771743776445102e-05, "loss": 2.8243, "step": 7530 }, { "epoch": 0.1, "learning_rate": 9.77143882715926e-05, "loss": 2.7988, "step": 7535 }, { "epoch": 0.1, "learning_rate": 9.771133679068689e-05, "loss": 2.7008, "step": 7540 }, { "epoch": 0.1, "learning_rate": 9.770828332186101e-05, "loss": 2.7924, "step": 7545 }, { "epoch": 0.1, "learning_rate": 9.770522786524219e-05, "loss": 2.6484, "step": 7550 }, { "epoch": 0.1, "learning_rate": 9.770217042095772e-05, "loss": 2.7566, "step": 7555 }, { "epoch": 0.1, "learning_rate": 9.769911098913502e-05, "loss": 2.8614, "step": 7560 }, { "epoch": 0.1, "learning_rate": 9.769604956990155e-05, "loss": 2.8326, "step": 7565 }, { "epoch": 0.1, "learning_rate": 9.769298616338485e-05, "loss": 2.8138, "step": 7570 }, { "epoch": 0.1, "learning_rate": 9.76899207697126e-05, "loss": 2.9205, "step": 7575 }, { "epoch": 0.1, "learning_rate": 9.768685338901246e-05, "loss": 2.8697, "step": 7580 }, { "epoch": 0.1, "learning_rate": 9.768378402141229e-05, "loss": 2.8555, "step": 7585 }, { "epoch": 0.1, "learning_rate": 9.768071266703995e-05, "loss": 2.7454, "step": 7590 }, { "epoch": 0.1, "learning_rate": 9.76776393260234e-05, "loss": 2.962, "step": 7595 }, { "epoch": 0.1, "learning_rate": 9.767456399849073e-05, "loss": 2.7632, "step": 7600 }, { "epoch": 0.1, "learning_rate": 9.767148668457005e-05, "loss": 2.954, "step": 7605 }, { "epoch": 0.1, "learning_rate": 9.766840738438957e-05, "loss": 2.7899, "step": 7610 }, { "epoch": 0.1, "learning_rate": 9.766532609807761e-05, "loss": 2.832, "step": 7615 }, { "epoch": 0.1, "learning_rate": 9.766224282576254e-05, "loss": 2.7462, "step": 7620 }, { "epoch": 0.1, "learning_rate": 9.765915756757283e-05, "loss": 2.7871, "step": 7625 }, { "epoch": 0.1, "learning_rate": 9.765607032363704e-05, "loss": 2.7871, "step": 7630 }, { "epoch": 0.1, "learning_rate": 9.765298109408379e-05, "loss": 2.8054, "step": 7635 }, { "epoch": 0.1, "learning_rate": 9.764988987904178e-05, "loss": 2.8622, "step": 7640 }, { "epoch": 0.1, "learning_rate": 9.764679667863984e-05, "loss": 2.8768, "step": 7645 }, { "epoch": 0.1, "learning_rate": 9.764370149300683e-05, "loss": 2.8568, "step": 7650 }, { "epoch": 0.1, "learning_rate": 9.764060432227173e-05, "loss": 2.814, "step": 7655 }, { "epoch": 0.1, "learning_rate": 9.763750516656354e-05, "loss": 2.8233, "step": 7660 }, { "epoch": 0.1, "learning_rate": 9.763440402601145e-05, "loss": 2.7248, "step": 7665 }, { "epoch": 0.1, "learning_rate": 9.763130090074463e-05, "loss": 2.7862, "step": 7670 }, { "epoch": 0.1, "learning_rate": 9.762819579089239e-05, "loss": 2.5692, "step": 7675 }, { "epoch": 0.1, "learning_rate": 9.762508869658408e-05, "loss": 2.7532, "step": 7680 }, { "epoch": 0.1, "learning_rate": 9.762197961794921e-05, "loss": 2.818, "step": 7685 }, { "epoch": 0.1, "learning_rate": 9.761886855511727e-05, "loss": 2.9368, "step": 7690 }, { "epoch": 0.1, "learning_rate": 9.761575550821791e-05, "loss": 2.8692, "step": 7695 }, { "epoch": 0.1, "learning_rate": 9.761264047738083e-05, "loss": 2.8099, "step": 7700 }, { "epoch": 0.1, "learning_rate": 9.760952346273582e-05, "loss": 2.9409, "step": 7705 }, { "epoch": 0.1, "learning_rate": 9.760640446441277e-05, "loss": 2.7997, "step": 7710 }, { "epoch": 0.1, "learning_rate": 9.76032834825416e-05, "loss": 2.9128, "step": 7715 }, { "epoch": 0.1, "learning_rate": 9.760016051725238e-05, "loss": 2.8435, "step": 7720 }, { "epoch": 0.1, "learning_rate": 9.759703556867521e-05, "loss": 2.9033, "step": 7725 }, { "epoch": 0.1, "learning_rate": 9.75939086369403e-05, "loss": 2.7767, "step": 7730 }, { "epoch": 0.1, "learning_rate": 9.759077972217794e-05, "loss": 2.8788, "step": 7735 }, { "epoch": 0.1, "learning_rate": 9.758764882451848e-05, "loss": 2.7418, "step": 7740 }, { "epoch": 0.1, "learning_rate": 9.758451594409239e-05, "loss": 2.7821, "step": 7745 }, { "epoch": 0.1, "learning_rate": 9.758138108103022e-05, "loss": 2.8689, "step": 7750 }, { "epoch": 0.1, "learning_rate": 9.757824423546252e-05, "loss": 2.8707, "step": 7755 }, { "epoch": 0.1, "learning_rate": 9.757510540752005e-05, "loss": 2.8909, "step": 7760 }, { "epoch": 0.1, "learning_rate": 9.757196459733357e-05, "loss": 2.7851, "step": 7765 }, { "epoch": 0.1, "learning_rate": 9.756882180503395e-05, "loss": 2.8921, "step": 7770 }, { "epoch": 0.1, "learning_rate": 9.756567703075212e-05, "loss": 2.7757, "step": 7775 }, { "epoch": 0.1, "learning_rate": 9.756253027461915e-05, "loss": 2.796, "step": 7780 }, { "epoch": 0.1, "learning_rate": 9.75593815367661e-05, "loss": 2.7087, "step": 7785 }, { "epoch": 0.1, "learning_rate": 9.755623081732418e-05, "loss": 2.7982, "step": 7790 }, { "epoch": 0.1, "learning_rate": 9.755307811642468e-05, "loss": 2.9007, "step": 7795 }, { "epoch": 0.1, "learning_rate": 9.754992343419895e-05, "loss": 2.7306, "step": 7800 }, { "epoch": 0.1, "learning_rate": 9.754676677077843e-05, "loss": 2.9075, "step": 7805 }, { "epoch": 0.1, "learning_rate": 9.754360812629467e-05, "loss": 2.6866, "step": 7810 }, { "epoch": 0.1, "learning_rate": 9.754044750087923e-05, "loss": 2.7496, "step": 7815 }, { "epoch": 0.1, "learning_rate": 9.753728489466382e-05, "loss": 2.8685, "step": 7820 }, { "epoch": 0.1, "learning_rate": 9.753412030778022e-05, "loss": 2.8566, "step": 7825 }, { "epoch": 0.1, "learning_rate": 9.75309537403603e-05, "loss": 2.7541, "step": 7830 }, { "epoch": 0.1, "learning_rate": 9.752778519253595e-05, "loss": 2.7644, "step": 7835 }, { "epoch": 0.1, "learning_rate": 9.752461466443923e-05, "loss": 2.7036, "step": 7840 }, { "epoch": 0.1, "learning_rate": 9.752144215620223e-05, "loss": 2.9051, "step": 7845 }, { "epoch": 0.1, "learning_rate": 9.751826766795712e-05, "loss": 2.821, "step": 7850 }, { "epoch": 0.1, "learning_rate": 9.751509119983618e-05, "loss": 2.7034, "step": 7855 }, { "epoch": 0.1, "learning_rate": 9.751191275197176e-05, "loss": 2.8867, "step": 7860 }, { "epoch": 0.1, "learning_rate": 9.75087323244963e-05, "loss": 2.818, "step": 7865 }, { "epoch": 0.1, "learning_rate": 9.75055499175423e-05, "loss": 2.7817, "step": 7870 }, { "epoch": 0.1, "learning_rate": 9.750236553124236e-05, "loss": 2.8425, "step": 7875 }, { "epoch": 0.1, "learning_rate": 9.749917916572915e-05, "loss": 2.8572, "step": 7880 }, { "epoch": 0.1, "learning_rate": 9.749599082113545e-05, "loss": 2.7842, "step": 7885 }, { "epoch": 0.1, "learning_rate": 9.749280049759411e-05, "loss": 2.8906, "step": 7890 }, { "epoch": 0.1, "learning_rate": 9.748960819523803e-05, "loss": 2.7725, "step": 7895 }, { "epoch": 0.1, "learning_rate": 9.748641391420023e-05, "loss": 2.6944, "step": 7900 }, { "epoch": 0.1, "learning_rate": 9.748321765461382e-05, "loss": 2.841, "step": 7905 }, { "epoch": 0.1, "learning_rate": 9.748001941661194e-05, "loss": 2.6879, "step": 7910 }, { "epoch": 0.1, "learning_rate": 9.747681920032785e-05, "loss": 2.7713, "step": 7915 }, { "epoch": 0.1, "learning_rate": 9.747361700589492e-05, "loss": 2.7621, "step": 7920 }, { "epoch": 0.1, "learning_rate": 9.747041283344657e-05, "loss": 2.8866, "step": 7925 }, { "epoch": 0.1, "learning_rate": 9.746720668311627e-05, "loss": 2.7318, "step": 7930 }, { "epoch": 0.1, "learning_rate": 9.746399855503763e-05, "loss": 2.77, "step": 7935 }, { "epoch": 0.1, "learning_rate": 9.746078844934431e-05, "loss": 2.8486, "step": 7940 }, { "epoch": 0.1, "learning_rate": 9.745757636617005e-05, "loss": 2.8126, "step": 7945 }, { "epoch": 0.1, "learning_rate": 9.745436230564873e-05, "loss": 3.0206, "step": 7950 }, { "epoch": 0.1, "learning_rate": 9.74511462679142e-05, "loss": 2.8846, "step": 7955 }, { "epoch": 0.1, "learning_rate": 9.74479282531005e-05, "loss": 2.8297, "step": 7960 }, { "epoch": 0.1, "learning_rate": 9.744470826134172e-05, "loss": 2.7655, "step": 7965 }, { "epoch": 0.1, "learning_rate": 9.744148629277198e-05, "loss": 2.8323, "step": 7970 }, { "epoch": 0.1, "learning_rate": 9.743826234752555e-05, "loss": 2.8522, "step": 7975 }, { "epoch": 0.1, "learning_rate": 9.743503642573677e-05, "loss": 2.8764, "step": 7980 }, { "epoch": 0.1, "learning_rate": 9.743180852754004e-05, "loss": 2.8337, "step": 7985 }, { "epoch": 0.1, "learning_rate": 9.742857865306983e-05, "loss": 2.7987, "step": 7990 }, { "epoch": 0.1, "learning_rate": 9.742534680246074e-05, "loss": 2.8744, "step": 7995 }, { "epoch": 0.1, "learning_rate": 9.742211297584742e-05, "loss": 2.8406, "step": 8000 }, { "epoch": 0.1, "learning_rate": 9.741887717336459e-05, "loss": 2.7467, "step": 8005 }, { "epoch": 0.1, "learning_rate": 9.741563939514713e-05, "loss": 2.8176, "step": 8010 }, { "epoch": 0.1, "learning_rate": 9.741239964132988e-05, "loss": 2.7999, "step": 8015 }, { "epoch": 0.1, "learning_rate": 9.740915791204786e-05, "loss": 2.8739, "step": 8020 }, { "epoch": 0.1, "learning_rate": 9.740591420743612e-05, "loss": 2.754, "step": 8025 }, { "epoch": 0.1, "learning_rate": 9.740266852762982e-05, "loss": 2.9101, "step": 8030 }, { "epoch": 0.1, "learning_rate": 9.73994208727642e-05, "loss": 2.8078, "step": 8035 }, { "epoch": 0.1, "learning_rate": 9.739617124297458e-05, "loss": 2.7847, "step": 8040 }, { "epoch": 0.1, "learning_rate": 9.739291963839632e-05, "loss": 2.8384, "step": 8045 }, { "epoch": 0.1, "learning_rate": 9.738966605916495e-05, "loss": 2.8119, "step": 8050 }, { "epoch": 0.1, "learning_rate": 9.738641050541599e-05, "loss": 2.8842, "step": 8055 }, { "epoch": 0.1, "learning_rate": 9.738315297728511e-05, "loss": 2.8724, "step": 8060 }, { "epoch": 0.1, "learning_rate": 9.737989347490804e-05, "loss": 2.8184, "step": 8065 }, { "epoch": 0.1, "learning_rate": 9.737663199842055e-05, "loss": 2.8356, "step": 8070 }, { "epoch": 0.1, "learning_rate": 9.73733685479586e-05, "loss": 2.7318, "step": 8075 }, { "epoch": 0.1, "learning_rate": 9.73701031236581e-05, "loss": 2.7312, "step": 8080 }, { "epoch": 0.1, "learning_rate": 9.736683572565513e-05, "loss": 2.8127, "step": 8085 }, { "epoch": 0.1, "learning_rate": 9.736356635408583e-05, "loss": 2.7408, "step": 8090 }, { "epoch": 0.11, "learning_rate": 9.736029500908642e-05, "loss": 2.7346, "step": 8095 }, { "epoch": 0.11, "learning_rate": 9.735702169079319e-05, "loss": 2.8479, "step": 8100 }, { "epoch": 0.11, "learning_rate": 9.735374639934253e-05, "loss": 2.9039, "step": 8105 }, { "epoch": 0.11, "learning_rate": 9.735046913487093e-05, "loss": 2.875, "step": 8110 }, { "epoch": 0.11, "learning_rate": 9.734718989751492e-05, "loss": 2.8616, "step": 8115 }, { "epoch": 0.11, "learning_rate": 9.734390868741113e-05, "loss": 2.628, "step": 8120 }, { "epoch": 0.11, "learning_rate": 9.734062550469627e-05, "loss": 2.767, "step": 8125 }, { "epoch": 0.11, "learning_rate": 9.733734034950714e-05, "loss": 2.8078, "step": 8130 }, { "epoch": 0.11, "learning_rate": 9.733405322198064e-05, "loss": 2.8049, "step": 8135 }, { "epoch": 0.11, "learning_rate": 9.733076412225368e-05, "loss": 2.858, "step": 8140 }, { "epoch": 0.11, "learning_rate": 9.732747305046334e-05, "loss": 2.8875, "step": 8145 }, { "epoch": 0.11, "learning_rate": 9.732418000674675e-05, "loss": 2.7486, "step": 8150 }, { "epoch": 0.11, "learning_rate": 9.73208849912411e-05, "loss": 2.8804, "step": 8155 }, { "epoch": 0.11, "learning_rate": 9.731758800408366e-05, "loss": 2.8384, "step": 8160 }, { "epoch": 0.11, "learning_rate": 9.731428904541184e-05, "loss": 2.8871, "step": 8165 }, { "epoch": 0.11, "learning_rate": 9.731098811536307e-05, "loss": 2.7952, "step": 8170 }, { "epoch": 0.11, "learning_rate": 9.73076852140749e-05, "loss": 2.8594, "step": 8175 }, { "epoch": 0.11, "learning_rate": 9.730438034168492e-05, "loss": 2.8747, "step": 8180 }, { "epoch": 0.11, "learning_rate": 9.730107349833086e-05, "loss": 2.7661, "step": 8185 }, { "epoch": 0.11, "learning_rate": 9.729776468415047e-05, "loss": 2.8261, "step": 8190 }, { "epoch": 0.11, "learning_rate": 9.729445389928164e-05, "loss": 2.768, "step": 8195 }, { "epoch": 0.11, "learning_rate": 9.729114114386232e-05, "loss": 2.7581, "step": 8200 }, { "epoch": 0.11, "learning_rate": 9.728782641803052e-05, "loss": 2.6805, "step": 8205 }, { "epoch": 0.11, "learning_rate": 9.728450972192435e-05, "loss": 2.8062, "step": 8210 }, { "epoch": 0.11, "learning_rate": 9.728119105568201e-05, "loss": 2.8835, "step": 8215 }, { "epoch": 0.11, "learning_rate": 9.727787041944177e-05, "loss": 2.7238, "step": 8220 }, { "epoch": 0.11, "learning_rate": 9.7274547813342e-05, "loss": 2.8965, "step": 8225 }, { "epoch": 0.11, "learning_rate": 9.727122323752112e-05, "loss": 2.8021, "step": 8230 }, { "epoch": 0.11, "learning_rate": 9.726789669211764e-05, "loss": 2.6209, "step": 8235 }, { "epoch": 0.11, "learning_rate": 9.726456817727019e-05, "loss": 2.743, "step": 8240 }, { "epoch": 0.11, "learning_rate": 9.726123769311746e-05, "loss": 2.8866, "step": 8245 }, { "epoch": 0.11, "learning_rate": 9.725790523979818e-05, "loss": 2.8, "step": 8250 }, { "epoch": 0.11, "learning_rate": 9.725457081745122e-05, "loss": 2.779, "step": 8255 }, { "epoch": 0.11, "learning_rate": 9.725123442621551e-05, "loss": 2.8874, "step": 8260 }, { "epoch": 0.11, "learning_rate": 9.724789606623006e-05, "loss": 2.7602, "step": 8265 }, { "epoch": 0.11, "learning_rate": 9.724455573763398e-05, "loss": 2.8901, "step": 8270 }, { "epoch": 0.11, "learning_rate": 9.724121344056642e-05, "loss": 2.7461, "step": 8275 }, { "epoch": 0.11, "learning_rate": 9.723786917516666e-05, "loss": 2.779, "step": 8280 }, { "epoch": 0.11, "learning_rate": 9.723452294157402e-05, "loss": 2.8642, "step": 8285 }, { "epoch": 0.11, "learning_rate": 9.723117473992795e-05, "loss": 2.7512, "step": 8290 }, { "epoch": 0.11, "learning_rate": 9.722782457036793e-05, "loss": 2.8628, "step": 8295 }, { "epoch": 0.11, "learning_rate": 9.722447243303356e-05, "loss": 2.8286, "step": 8300 }, { "epoch": 0.11, "learning_rate": 9.72211183280645e-05, "loss": 2.7937, "step": 8305 }, { "epoch": 0.11, "learning_rate": 9.721776225560052e-05, "loss": 2.8551, "step": 8310 }, { "epoch": 0.11, "learning_rate": 9.721440421578143e-05, "loss": 2.7985, "step": 8315 }, { "epoch": 0.11, "learning_rate": 9.721104420874717e-05, "loss": 2.7735, "step": 8320 }, { "epoch": 0.11, "learning_rate": 9.72076822346377e-05, "loss": 2.8483, "step": 8325 }, { "epoch": 0.11, "learning_rate": 9.720431829359312e-05, "loss": 2.7318, "step": 8330 }, { "epoch": 0.11, "learning_rate": 9.720095238575359e-05, "loss": 2.828, "step": 8335 }, { "epoch": 0.11, "learning_rate": 9.719758451125935e-05, "loss": 2.7849, "step": 8340 }, { "epoch": 0.11, "learning_rate": 9.719421467025074e-05, "loss": 2.9075, "step": 8345 }, { "epoch": 0.11, "learning_rate": 9.719084286286813e-05, "loss": 2.8331, "step": 8350 }, { "epoch": 0.11, "learning_rate": 9.718746908925205e-05, "loss": 2.7454, "step": 8355 }, { "epoch": 0.11, "learning_rate": 9.718409334954304e-05, "loss": 2.8277, "step": 8360 }, { "epoch": 0.11, "learning_rate": 9.718071564388178e-05, "loss": 2.8978, "step": 8365 }, { "epoch": 0.11, "learning_rate": 9.717733597240897e-05, "loss": 2.7974, "step": 8370 }, { "epoch": 0.11, "learning_rate": 9.717395433526545e-05, "loss": 2.8721, "step": 8375 }, { "epoch": 0.11, "learning_rate": 9.717057073259211e-05, "loss": 2.9812, "step": 8380 }, { "epoch": 0.11, "learning_rate": 9.716718516452994e-05, "loss": 2.8665, "step": 8385 }, { "epoch": 0.11, "learning_rate": 9.716379763121996e-05, "loss": 2.7986, "step": 8390 }, { "epoch": 0.11, "learning_rate": 9.716040813280338e-05, "loss": 2.8982, "step": 8395 }, { "epoch": 0.11, "learning_rate": 9.715701666942138e-05, "loss": 2.6865, "step": 8400 }, { "epoch": 0.11, "learning_rate": 9.715362324121529e-05, "loss": 2.795, "step": 8405 }, { "epoch": 0.11, "learning_rate": 9.715022784832647e-05, "loss": 2.7531, "step": 8410 }, { "epoch": 0.11, "learning_rate": 9.714683049089641e-05, "loss": 2.7506, "step": 8415 }, { "epoch": 0.11, "learning_rate": 9.714343116906667e-05, "loss": 2.8116, "step": 8420 }, { "epoch": 0.11, "learning_rate": 9.714002988297887e-05, "loss": 2.9012, "step": 8425 }, { "epoch": 0.11, "learning_rate": 9.713662663277474e-05, "loss": 2.7491, "step": 8430 }, { "epoch": 0.11, "learning_rate": 9.713322141859607e-05, "loss": 3.005, "step": 8435 }, { "epoch": 0.11, "learning_rate": 9.712981424058473e-05, "loss": 2.8104, "step": 8440 }, { "epoch": 0.11, "learning_rate": 9.712640509888271e-05, "loss": 2.7816, "step": 8445 }, { "epoch": 0.11, "learning_rate": 9.712299399363203e-05, "loss": 2.8207, "step": 8450 }, { "epoch": 0.11, "learning_rate": 9.711958092497482e-05, "loss": 2.7887, "step": 8455 }, { "epoch": 0.11, "learning_rate": 9.711616589305328e-05, "loss": 2.8672, "step": 8460 }, { "epoch": 0.11, "learning_rate": 9.711274889800972e-05, "loss": 2.8199, "step": 8465 }, { "epoch": 0.11, "learning_rate": 9.710932993998651e-05, "loss": 2.7886, "step": 8470 }, { "epoch": 0.11, "learning_rate": 9.710590901912608e-05, "loss": 2.7537, "step": 8475 }, { "epoch": 0.11, "learning_rate": 9.710248613557099e-05, "loss": 2.8124, "step": 8480 }, { "epoch": 0.11, "learning_rate": 9.709906128946383e-05, "loss": 2.8082, "step": 8485 }, { "epoch": 0.11, "learning_rate": 9.709563448094732e-05, "loss": 2.7105, "step": 8490 }, { "epoch": 0.11, "learning_rate": 9.709220571016425e-05, "loss": 2.66, "step": 8495 }, { "epoch": 0.11, "learning_rate": 9.708877497725743e-05, "loss": 2.7014, "step": 8500 }, { "epoch": 0.11, "learning_rate": 9.708534228236986e-05, "loss": 2.7432, "step": 8505 }, { "epoch": 0.11, "learning_rate": 9.708190762564452e-05, "loss": 2.7939, "step": 8510 }, { "epoch": 0.11, "learning_rate": 9.707847100722456e-05, "loss": 2.8668, "step": 8515 }, { "epoch": 0.11, "learning_rate": 9.707503242725316e-05, "loss": 2.8336, "step": 8520 }, { "epoch": 0.11, "learning_rate": 9.707159188587356e-05, "loss": 2.9053, "step": 8525 }, { "epoch": 0.11, "learning_rate": 9.706814938322915e-05, "loss": 2.8925, "step": 8530 }, { "epoch": 0.11, "learning_rate": 9.706470491946331e-05, "loss": 2.7311, "step": 8535 }, { "epoch": 0.11, "learning_rate": 9.706125849471962e-05, "loss": 2.8578, "step": 8540 }, { "epoch": 0.11, "learning_rate": 9.705781010914164e-05, "loss": 2.8451, "step": 8545 }, { "epoch": 0.11, "learning_rate": 9.705435976287305e-05, "loss": 2.8185, "step": 8550 }, { "epoch": 0.11, "learning_rate": 9.705090745605763e-05, "loss": 2.9334, "step": 8555 }, { "epoch": 0.11, "learning_rate": 9.704745318883919e-05, "loss": 2.8554, "step": 8560 }, { "epoch": 0.11, "learning_rate": 9.70439969613617e-05, "loss": 2.8678, "step": 8565 }, { "epoch": 0.11, "learning_rate": 9.704053877376913e-05, "loss": 2.8532, "step": 8570 }, { "epoch": 0.11, "learning_rate": 9.703707862620556e-05, "loss": 2.7768, "step": 8575 }, { "epoch": 0.11, "learning_rate": 9.70336165188152e-05, "loss": 2.7043, "step": 8580 }, { "epoch": 0.11, "learning_rate": 9.703015245174227e-05, "loss": 2.8213, "step": 8585 }, { "epoch": 0.11, "learning_rate": 9.702668642513108e-05, "loss": 2.642, "step": 8590 }, { "epoch": 0.11, "learning_rate": 9.702321843912612e-05, "loss": 2.898, "step": 8595 }, { "epoch": 0.11, "learning_rate": 9.701974849387181e-05, "loss": 2.8975, "step": 8600 }, { "epoch": 0.11, "learning_rate": 9.701627658951276e-05, "loss": 2.7124, "step": 8605 }, { "epoch": 0.11, "learning_rate": 9.701280272619362e-05, "loss": 2.6615, "step": 8610 }, { "epoch": 0.11, "learning_rate": 9.700932690405915e-05, "loss": 2.7862, "step": 8615 }, { "epoch": 0.11, "learning_rate": 9.700584912325414e-05, "loss": 2.8508, "step": 8620 }, { "epoch": 0.11, "learning_rate": 9.700236938392352e-05, "loss": 2.8186, "step": 8625 }, { "epoch": 0.11, "learning_rate": 9.699888768621226e-05, "loss": 2.8928, "step": 8630 }, { "epoch": 0.11, "learning_rate": 9.699540403026544e-05, "loss": 2.7738, "step": 8635 }, { "epoch": 0.11, "learning_rate": 9.69919184162282e-05, "loss": 2.6783, "step": 8640 }, { "epoch": 0.11, "learning_rate": 9.698843084424577e-05, "loss": 2.7072, "step": 8645 }, { "epoch": 0.11, "learning_rate": 9.698494131446346e-05, "loss": 2.9122, "step": 8650 }, { "epoch": 0.11, "learning_rate": 9.698144982702669e-05, "loss": 2.7841, "step": 8655 }, { "epoch": 0.11, "learning_rate": 9.697795638208089e-05, "loss": 2.7988, "step": 8660 }, { "epoch": 0.11, "learning_rate": 9.697446097977163e-05, "loss": 2.7371, "step": 8665 }, { "epoch": 0.11, "learning_rate": 9.697096362024457e-05, "loss": 2.6896, "step": 8670 }, { "epoch": 0.11, "learning_rate": 9.696746430364541e-05, "loss": 2.8074, "step": 8675 }, { "epoch": 0.11, "learning_rate": 9.696396303011996e-05, "loss": 2.9301, "step": 8680 }, { "epoch": 0.11, "learning_rate": 9.69604597998141e-05, "loss": 2.7879, "step": 8685 }, { "epoch": 0.11, "learning_rate": 9.695695461287379e-05, "loss": 2.907, "step": 8690 }, { "epoch": 0.11, "learning_rate": 9.695344746944507e-05, "loss": 2.7047, "step": 8695 }, { "epoch": 0.11, "learning_rate": 9.69499383696741e-05, "loss": 2.8517, "step": 8700 }, { "epoch": 0.11, "learning_rate": 9.694642731370705e-05, "loss": 2.7405, "step": 8705 }, { "epoch": 0.11, "learning_rate": 9.69429143016902e-05, "loss": 2.8586, "step": 8710 }, { "epoch": 0.11, "learning_rate": 9.693939933376999e-05, "loss": 2.8556, "step": 8715 }, { "epoch": 0.11, "learning_rate": 9.693588241009281e-05, "loss": 2.7926, "step": 8720 }, { "epoch": 0.11, "learning_rate": 9.693236353080522e-05, "loss": 2.8054, "step": 8725 }, { "epoch": 0.11, "learning_rate": 9.692884269605381e-05, "loss": 2.8819, "step": 8730 }, { "epoch": 0.11, "learning_rate": 9.692531990598533e-05, "loss": 2.7116, "step": 8735 }, { "epoch": 0.11, "learning_rate": 9.69217951607465e-05, "loss": 2.7994, "step": 8740 }, { "epoch": 0.11, "learning_rate": 9.691826846048421e-05, "loss": 2.707, "step": 8745 }, { "epoch": 0.11, "learning_rate": 9.69147398053454e-05, "loss": 2.8087, "step": 8750 }, { "epoch": 0.11, "learning_rate": 9.69112091954771e-05, "loss": 2.8314, "step": 8755 }, { "epoch": 0.11, "learning_rate": 9.690767663102641e-05, "loss": 2.7959, "step": 8760 }, { "epoch": 0.11, "learning_rate": 9.690414211214052e-05, "loss": 2.7902, "step": 8765 }, { "epoch": 0.11, "learning_rate": 9.690060563896668e-05, "loss": 2.9117, "step": 8770 }, { "epoch": 0.11, "learning_rate": 9.689706721165225e-05, "loss": 2.8347, "step": 8775 }, { "epoch": 0.11, "learning_rate": 9.689352683034466e-05, "loss": 2.7987, "step": 8780 }, { "epoch": 0.11, "learning_rate": 9.688998449519142e-05, "loss": 2.924, "step": 8785 }, { "epoch": 0.11, "learning_rate": 9.688644020634015e-05, "loss": 2.7867, "step": 8790 }, { "epoch": 0.11, "learning_rate": 9.688289396393848e-05, "loss": 2.778, "step": 8795 }, { "epoch": 0.11, "learning_rate": 9.68793457681342e-05, "loss": 2.7757, "step": 8800 }, { "epoch": 0.11, "learning_rate": 9.687579561907512e-05, "loss": 2.8175, "step": 8805 }, { "epoch": 0.11, "learning_rate": 9.687224351690918e-05, "loss": 2.7759, "step": 8810 }, { "epoch": 0.11, "learning_rate": 9.686868946178439e-05, "loss": 2.755, "step": 8815 }, { "epoch": 0.11, "learning_rate": 9.686513345384882e-05, "loss": 2.8086, "step": 8820 }, { "epoch": 0.11, "learning_rate": 9.686157549325061e-05, "loss": 2.7146, "step": 8825 }, { "epoch": 0.11, "learning_rate": 9.685801558013802e-05, "loss": 2.8993, "step": 8830 }, { "epoch": 0.11, "learning_rate": 9.68544537146594e-05, "loss": 2.8359, "step": 8835 }, { "epoch": 0.11, "learning_rate": 9.685088989696312e-05, "loss": 2.8239, "step": 8840 }, { "epoch": 0.11, "learning_rate": 9.68473241271977e-05, "loss": 2.7803, "step": 8845 }, { "epoch": 0.11, "learning_rate": 9.684375640551169e-05, "loss": 2.7284, "step": 8850 }, { "epoch": 0.11, "learning_rate": 9.684018673205374e-05, "loss": 2.8668, "step": 8855 }, { "epoch": 0.11, "learning_rate": 9.68366151069726e-05, "loss": 2.8261, "step": 8860 }, { "epoch": 0.12, "learning_rate": 9.683304153041708e-05, "loss": 2.7946, "step": 8865 }, { "epoch": 0.12, "learning_rate": 9.682946600253606e-05, "loss": 2.7531, "step": 8870 }, { "epoch": 0.12, "learning_rate": 9.682588852347852e-05, "loss": 2.8535, "step": 8875 }, { "epoch": 0.12, "learning_rate": 9.682230909339351e-05, "loss": 2.9638, "step": 8880 }, { "epoch": 0.12, "learning_rate": 9.68187277124302e-05, "loss": 2.8001, "step": 8885 }, { "epoch": 0.12, "learning_rate": 9.68151443807378e-05, "loss": 2.9206, "step": 8890 }, { "epoch": 0.12, "learning_rate": 9.681155909846558e-05, "loss": 2.7616, "step": 8895 }, { "epoch": 0.12, "learning_rate": 9.680797186576295e-05, "loss": 2.9033, "step": 8900 }, { "epoch": 0.12, "learning_rate": 9.680438268277938e-05, "loss": 2.8196, "step": 8905 }, { "epoch": 0.12, "learning_rate": 9.68007915496644e-05, "loss": 2.7202, "step": 8910 }, { "epoch": 0.12, "learning_rate": 9.679719846656764e-05, "loss": 2.786, "step": 8915 }, { "epoch": 0.12, "learning_rate": 9.679360343363882e-05, "loss": 2.7851, "step": 8920 }, { "epoch": 0.12, "learning_rate": 9.679000645102771e-05, "loss": 2.7978, "step": 8925 }, { "epoch": 0.12, "learning_rate": 9.67864075188842e-05, "loss": 2.8338, "step": 8930 }, { "epoch": 0.12, "learning_rate": 9.678280663735822e-05, "loss": 2.803, "step": 8935 }, { "epoch": 0.12, "learning_rate": 9.677920380659981e-05, "loss": 2.7566, "step": 8940 }, { "epoch": 0.12, "learning_rate": 9.67755990267591e-05, "loss": 2.7968, "step": 8945 }, { "epoch": 0.12, "learning_rate": 9.677199229798628e-05, "loss": 2.7317, "step": 8950 }, { "epoch": 0.12, "learning_rate": 9.676838362043161e-05, "loss": 2.8144, "step": 8955 }, { "epoch": 0.12, "learning_rate": 9.676477299424545e-05, "loss": 2.8055, "step": 8960 }, { "epoch": 0.12, "learning_rate": 9.676116041957826e-05, "loss": 2.7706, "step": 8965 }, { "epoch": 0.12, "learning_rate": 9.675754589658053e-05, "loss": 2.8879, "step": 8970 }, { "epoch": 0.12, "learning_rate": 9.675392942540288e-05, "loss": 2.8192, "step": 8975 }, { "epoch": 0.12, "learning_rate": 9.6750311006196e-05, "loss": 2.6596, "step": 8980 }, { "epoch": 0.12, "learning_rate": 9.674669063911064e-05, "loss": 2.7555, "step": 8985 }, { "epoch": 0.12, "learning_rate": 9.674306832429763e-05, "loss": 2.8045, "step": 8990 }, { "epoch": 0.12, "learning_rate": 9.673944406190794e-05, "loss": 2.8214, "step": 8995 }, { "epoch": 0.12, "learning_rate": 9.673581785209254e-05, "loss": 2.7698, "step": 9000 }, { "epoch": 0.12, "learning_rate": 9.673218969500251e-05, "loss": 2.7192, "step": 9005 }, { "epoch": 0.12, "learning_rate": 9.672855959078906e-05, "loss": 2.8318, "step": 9010 }, { "epoch": 0.12, "learning_rate": 9.672492753960341e-05, "loss": 2.8086, "step": 9015 }, { "epoch": 0.12, "learning_rate": 9.67212935415969e-05, "loss": 2.8057, "step": 9020 }, { "epoch": 0.12, "learning_rate": 9.671765759692094e-05, "loss": 2.8491, "step": 9025 }, { "epoch": 0.12, "learning_rate": 9.671401970572704e-05, "loss": 2.7888, "step": 9030 }, { "epoch": 0.12, "learning_rate": 9.671037986816675e-05, "loss": 2.7788, "step": 9035 }, { "epoch": 0.12, "learning_rate": 9.670673808439172e-05, "loss": 2.7279, "step": 9040 }, { "epoch": 0.12, "learning_rate": 9.670309435455374e-05, "loss": 2.7604, "step": 9045 }, { "epoch": 0.12, "learning_rate": 9.669944867880456e-05, "loss": 2.6864, "step": 9050 }, { "epoch": 0.12, "learning_rate": 9.669580105729612e-05, "loss": 2.8447, "step": 9055 }, { "epoch": 0.12, "learning_rate": 9.669215149018039e-05, "loss": 2.7763, "step": 9060 }, { "epoch": 0.12, "learning_rate": 9.668849997760945e-05, "loss": 2.9221, "step": 9065 }, { "epoch": 0.12, "learning_rate": 9.668484651973541e-05, "loss": 2.7485, "step": 9070 }, { "epoch": 0.12, "learning_rate": 9.66811911167105e-05, "loss": 2.8487, "step": 9075 }, { "epoch": 0.12, "learning_rate": 9.667753376868704e-05, "loss": 2.7619, "step": 9080 }, { "epoch": 0.12, "learning_rate": 9.667387447581742e-05, "loss": 2.687, "step": 9085 }, { "epoch": 0.12, "learning_rate": 9.667021323825407e-05, "loss": 2.8124, "step": 9090 }, { "epoch": 0.12, "learning_rate": 9.666655005614958e-05, "loss": 2.7956, "step": 9095 }, { "epoch": 0.12, "learning_rate": 9.666288492965656e-05, "loss": 2.8036, "step": 9100 }, { "epoch": 0.12, "learning_rate": 9.665921785892771e-05, "loss": 2.7638, "step": 9105 }, { "epoch": 0.12, "learning_rate": 9.665554884411585e-05, "loss": 2.7691, "step": 9110 }, { "epoch": 0.12, "learning_rate": 9.665187788537382e-05, "loss": 2.8718, "step": 9115 }, { "epoch": 0.12, "learning_rate": 9.664820498285458e-05, "loss": 2.7798, "step": 9120 }, { "epoch": 0.12, "learning_rate": 9.664453013671119e-05, "loss": 2.8426, "step": 9125 }, { "epoch": 0.12, "learning_rate": 9.664085334709673e-05, "loss": 2.904, "step": 9130 }, { "epoch": 0.12, "learning_rate": 9.66371746141644e-05, "loss": 2.6871, "step": 9135 }, { "epoch": 0.12, "learning_rate": 9.663349393806748e-05, "loss": 2.7272, "step": 9140 }, { "epoch": 0.12, "learning_rate": 9.662981131895936e-05, "loss": 2.8628, "step": 9145 }, { "epoch": 0.12, "learning_rate": 9.662612675699344e-05, "loss": 2.7101, "step": 9150 }, { "epoch": 0.12, "learning_rate": 9.662244025232326e-05, "loss": 2.8292, "step": 9155 }, { "epoch": 0.12, "learning_rate": 9.661875180510239e-05, "loss": 2.781, "step": 9160 }, { "epoch": 0.12, "learning_rate": 9.661506141548454e-05, "loss": 2.7024, "step": 9165 }, { "epoch": 0.12, "learning_rate": 9.661136908362347e-05, "loss": 2.7271, "step": 9170 }, { "epoch": 0.12, "learning_rate": 9.660767480967302e-05, "loss": 2.8244, "step": 9175 }, { "epoch": 0.12, "learning_rate": 9.66039785937871e-05, "loss": 2.8262, "step": 9180 }, { "epoch": 0.12, "learning_rate": 9.660028043611972e-05, "loss": 2.9048, "step": 9185 }, { "epoch": 0.12, "learning_rate": 9.659658033682499e-05, "loss": 2.819, "step": 9190 }, { "epoch": 0.12, "learning_rate": 9.659287829605706e-05, "loss": 2.7672, "step": 9195 }, { "epoch": 0.12, "learning_rate": 9.658917431397017e-05, "loss": 2.696, "step": 9200 }, { "epoch": 0.12, "learning_rate": 9.658546839071865e-05, "loss": 2.8242, "step": 9205 }, { "epoch": 0.12, "learning_rate": 9.658176052645693e-05, "loss": 2.7373, "step": 9210 }, { "epoch": 0.12, "learning_rate": 9.657805072133948e-05, "loss": 2.8669, "step": 9215 }, { "epoch": 0.12, "learning_rate": 9.657433897552086e-05, "loss": 2.8709, "step": 9220 }, { "epoch": 0.12, "learning_rate": 9.657062528915576e-05, "loss": 2.678, "step": 9225 }, { "epoch": 0.12, "learning_rate": 9.656690966239887e-05, "loss": 2.8131, "step": 9230 }, { "epoch": 0.12, "learning_rate": 9.656319209540504e-05, "loss": 2.7482, "step": 9235 }, { "epoch": 0.12, "learning_rate": 9.655947258832916e-05, "loss": 2.813, "step": 9240 }, { "epoch": 0.12, "learning_rate": 9.655575114132618e-05, "loss": 2.7978, "step": 9245 }, { "epoch": 0.12, "learning_rate": 9.655202775455117e-05, "loss": 2.917, "step": 9250 }, { "epoch": 0.12, "learning_rate": 9.654830242815927e-05, "loss": 2.9117, "step": 9255 }, { "epoch": 0.12, "learning_rate": 9.654457516230568e-05, "loss": 2.6777, "step": 9260 }, { "epoch": 0.12, "learning_rate": 9.654084595714575e-05, "loss": 2.7575, "step": 9265 }, { "epoch": 0.12, "learning_rate": 9.65371148128348e-05, "loss": 2.7362, "step": 9270 }, { "epoch": 0.12, "learning_rate": 9.653338172952831e-05, "loss": 2.8234, "step": 9275 }, { "epoch": 0.12, "learning_rate": 9.652964670738184e-05, "loss": 2.7292, "step": 9280 }, { "epoch": 0.12, "learning_rate": 9.6525909746551e-05, "loss": 2.8972, "step": 9285 }, { "epoch": 0.12, "learning_rate": 9.652217084719148e-05, "loss": 2.7878, "step": 9290 }, { "epoch": 0.12, "learning_rate": 9.651843000945907e-05, "loss": 2.7315, "step": 9295 }, { "epoch": 0.12, "learning_rate": 9.651468723350965e-05, "loss": 2.809, "step": 9300 }, { "epoch": 0.12, "learning_rate": 9.651094251949914e-05, "loss": 2.8567, "step": 9305 }, { "epoch": 0.12, "learning_rate": 9.650719586758359e-05, "loss": 2.8296, "step": 9310 }, { "epoch": 0.12, "learning_rate": 9.650344727791908e-05, "loss": 2.8864, "step": 9315 }, { "epoch": 0.12, "learning_rate": 9.649969675066182e-05, "loss": 2.8024, "step": 9320 }, { "epoch": 0.12, "learning_rate": 9.649594428596807e-05, "loss": 2.6926, "step": 9325 }, { "epoch": 0.12, "learning_rate": 9.649218988399417e-05, "loss": 2.8492, "step": 9330 }, { "epoch": 0.12, "learning_rate": 9.648843354489656e-05, "loss": 2.8214, "step": 9335 }, { "epoch": 0.12, "learning_rate": 9.648467526883176e-05, "loss": 2.7602, "step": 9340 }, { "epoch": 0.12, "learning_rate": 9.648091505595634e-05, "loss": 2.8623, "step": 9345 }, { "epoch": 0.12, "learning_rate": 9.647715290642697e-05, "loss": 2.8153, "step": 9350 }, { "epoch": 0.12, "learning_rate": 9.647338882040042e-05, "loss": 2.76, "step": 9355 }, { "epoch": 0.12, "learning_rate": 9.646962279803351e-05, "loss": 2.7311, "step": 9360 }, { "epoch": 0.12, "learning_rate": 9.646585483948315e-05, "loss": 2.8615, "step": 9365 }, { "epoch": 0.12, "learning_rate": 9.646208494490636e-05, "loss": 2.6646, "step": 9370 }, { "epoch": 0.12, "learning_rate": 9.64583131144602e-05, "loss": 2.7414, "step": 9375 }, { "epoch": 0.12, "learning_rate": 9.645453934830181e-05, "loss": 2.8415, "step": 9380 }, { "epoch": 0.12, "learning_rate": 9.645076364658846e-05, "loss": 2.8378, "step": 9385 }, { "epoch": 0.12, "learning_rate": 9.644698600947741e-05, "loss": 2.758, "step": 9390 }, { "epoch": 0.12, "learning_rate": 9.64432064371261e-05, "loss": 2.7447, "step": 9395 }, { "epoch": 0.12, "learning_rate": 9.643942492969201e-05, "loss": 2.7895, "step": 9400 }, { "epoch": 0.12, "learning_rate": 9.643564148733269e-05, "loss": 2.8306, "step": 9405 }, { "epoch": 0.12, "learning_rate": 9.643185611020577e-05, "loss": 2.8069, "step": 9410 }, { "epoch": 0.12, "learning_rate": 9.642806879846899e-05, "loss": 2.7933, "step": 9415 }, { "epoch": 0.12, "learning_rate": 9.642427955228014e-05, "loss": 2.8122, "step": 9420 }, { "epoch": 0.12, "learning_rate": 9.642048837179709e-05, "loss": 2.8296, "step": 9425 }, { "epoch": 0.12, "learning_rate": 9.641669525717782e-05, "loss": 2.7003, "step": 9430 }, { "epoch": 0.12, "learning_rate": 9.641290020858037e-05, "loss": 2.8083, "step": 9435 }, { "epoch": 0.12, "learning_rate": 9.640910322616284e-05, "loss": 2.7948, "step": 9440 }, { "epoch": 0.12, "learning_rate": 9.640530431008345e-05, "loss": 2.7987, "step": 9445 }, { "epoch": 0.12, "learning_rate": 9.64015034605005e-05, "loss": 2.9709, "step": 9450 }, { "epoch": 0.12, "learning_rate": 9.639770067757232e-05, "loss": 2.7428, "step": 9455 }, { "epoch": 0.12, "learning_rate": 9.63938959614574e-05, "loss": 2.7678, "step": 9460 }, { "epoch": 0.12, "learning_rate": 9.639008931231421e-05, "loss": 2.8533, "step": 9465 }, { "epoch": 0.12, "learning_rate": 9.63862807303014e-05, "loss": 2.7631, "step": 9470 }, { "epoch": 0.12, "learning_rate": 9.638247021557764e-05, "loss": 2.8477, "step": 9475 }, { "epoch": 0.12, "learning_rate": 9.637865776830172e-05, "loss": 2.7195, "step": 9480 }, { "epoch": 0.12, "learning_rate": 9.637484338863245e-05, "loss": 2.7386, "step": 9485 }, { "epoch": 0.12, "learning_rate": 9.637102707672879e-05, "loss": 2.7517, "step": 9490 }, { "epoch": 0.12, "learning_rate": 9.63672088327497e-05, "loss": 2.7786, "step": 9495 }, { "epoch": 0.12, "learning_rate": 9.636338865685434e-05, "loss": 2.6976, "step": 9500 }, { "epoch": 0.12, "learning_rate": 9.635956654920182e-05, "loss": 2.8762, "step": 9505 }, { "epoch": 0.12, "learning_rate": 9.635574250995143e-05, "loss": 2.7455, "step": 9510 }, { "epoch": 0.12, "learning_rate": 9.635191653926248e-05, "loss": 2.8711, "step": 9515 }, { "epoch": 0.12, "learning_rate": 9.634808863729438e-05, "loss": 2.7465, "step": 9520 }, { "epoch": 0.12, "learning_rate": 9.634425880420665e-05, "loss": 2.7828, "step": 9525 }, { "epoch": 0.12, "learning_rate": 9.634042704015883e-05, "loss": 2.6708, "step": 9530 }, { "epoch": 0.12, "learning_rate": 9.633659334531057e-05, "loss": 2.7747, "step": 9535 }, { "epoch": 0.12, "learning_rate": 9.633275771982162e-05, "loss": 2.819, "step": 9540 }, { "epoch": 0.12, "learning_rate": 9.63289201638518e-05, "loss": 2.7744, "step": 9545 }, { "epoch": 0.12, "learning_rate": 9.632508067756098e-05, "loss": 2.7775, "step": 9550 }, { "epoch": 0.12, "learning_rate": 9.632123926110916e-05, "loss": 2.8409, "step": 9555 }, { "epoch": 0.12, "learning_rate": 9.631739591465639e-05, "loss": 2.8627, "step": 9560 }, { "epoch": 0.12, "learning_rate": 9.631355063836278e-05, "loss": 2.6915, "step": 9565 }, { "epoch": 0.12, "learning_rate": 9.630970343238857e-05, "loss": 2.6695, "step": 9570 }, { "epoch": 0.12, "learning_rate": 9.630585429689404e-05, "loss": 2.8972, "step": 9575 }, { "epoch": 0.12, "learning_rate": 9.63020032320396e-05, "loss": 2.7579, "step": 9580 }, { "epoch": 0.12, "learning_rate": 9.629815023798567e-05, "loss": 2.8373, "step": 9585 }, { "epoch": 0.12, "learning_rate": 9.62942953148928e-05, "loss": 2.7948, "step": 9590 }, { "epoch": 0.12, "learning_rate": 9.629043846292161e-05, "loss": 2.7461, "step": 9595 }, { "epoch": 0.12, "learning_rate": 9.628657968223278e-05, "loss": 2.8119, "step": 9600 }, { "epoch": 0.12, "learning_rate": 9.628271897298713e-05, "loss": 2.7935, "step": 9605 }, { "epoch": 0.12, "learning_rate": 9.627885633534548e-05, "loss": 2.8831, "step": 9610 }, { "epoch": 0.12, "learning_rate": 9.627499176946878e-05, "loss": 2.7665, "step": 9615 }, { "epoch": 0.12, "learning_rate": 9.627112527551805e-05, "loss": 2.7439, "step": 9620 }, { "epoch": 0.12, "learning_rate": 9.626725685365439e-05, "loss": 2.6995, "step": 9625 }, { "epoch": 0.12, "learning_rate": 9.626338650403899e-05, "loss": 2.7433, "step": 9630 }, { "epoch": 0.13, "learning_rate": 9.625951422683309e-05, "loss": 2.8235, "step": 9635 }, { "epoch": 0.13, "learning_rate": 9.625564002219805e-05, "loss": 2.7929, "step": 9640 }, { "epoch": 0.13, "learning_rate": 9.625176389029528e-05, "loss": 2.6226, "step": 9645 }, { "epoch": 0.13, "learning_rate": 9.624788583128628e-05, "loss": 2.8274, "step": 9650 }, { "epoch": 0.13, "learning_rate": 9.624400584533264e-05, "loss": 2.7769, "step": 9655 }, { "epoch": 0.13, "learning_rate": 9.624012393259601e-05, "loss": 2.7385, "step": 9660 }, { "epoch": 0.13, "learning_rate": 9.623624009323816e-05, "loss": 2.8067, "step": 9665 }, { "epoch": 0.13, "learning_rate": 9.623235432742088e-05, "loss": 2.7924, "step": 9670 }, { "epoch": 0.13, "learning_rate": 9.622846663530607e-05, "loss": 2.8353, "step": 9675 }, { "epoch": 0.13, "learning_rate": 9.622457701705574e-05, "loss": 2.8914, "step": 9680 }, { "epoch": 0.13, "learning_rate": 9.622068547283194e-05, "loss": 2.8251, "step": 9685 }, { "epoch": 0.13, "learning_rate": 9.621679200279682e-05, "loss": 2.7481, "step": 9690 }, { "epoch": 0.13, "learning_rate": 9.621289660711259e-05, "loss": 2.8867, "step": 9695 }, { "epoch": 0.13, "learning_rate": 9.620899928594156e-05, "loss": 2.8487, "step": 9700 }, { "epoch": 0.13, "learning_rate": 9.620510003944612e-05, "loss": 2.814, "step": 9705 }, { "epoch": 0.13, "learning_rate": 9.620119886778873e-05, "loss": 2.7014, "step": 9710 }, { "epoch": 0.13, "learning_rate": 9.619729577113194e-05, "loss": 2.8152, "step": 9715 }, { "epoch": 0.13, "learning_rate": 9.619339074963835e-05, "loss": 2.7025, "step": 9720 }, { "epoch": 0.13, "learning_rate": 9.61894838034707e-05, "loss": 2.7309, "step": 9725 }, { "epoch": 0.13, "learning_rate": 9.618557493279177e-05, "loss": 2.6311, "step": 9730 }, { "epoch": 0.13, "learning_rate": 9.618166413776439e-05, "loss": 2.6902, "step": 9735 }, { "epoch": 0.13, "learning_rate": 9.617775141855154e-05, "loss": 2.8224, "step": 9740 }, { "epoch": 0.13, "learning_rate": 9.617383677531624e-05, "loss": 2.7124, "step": 9745 }, { "epoch": 0.13, "learning_rate": 9.61699202082216e-05, "loss": 2.8251, "step": 9750 }, { "epoch": 0.13, "learning_rate": 9.616600171743078e-05, "loss": 2.8899, "step": 9755 }, { "epoch": 0.13, "learning_rate": 9.616208130310706e-05, "loss": 2.747, "step": 9760 }, { "epoch": 0.13, "learning_rate": 9.61581589654138e-05, "loss": 2.6525, "step": 9765 }, { "epoch": 0.13, "learning_rate": 9.615423470451444e-05, "loss": 2.857, "step": 9770 }, { "epoch": 0.13, "learning_rate": 9.615030852057243e-05, "loss": 2.879, "step": 9775 }, { "epoch": 0.13, "learning_rate": 9.61463804137514e-05, "loss": 2.7698, "step": 9780 }, { "epoch": 0.13, "learning_rate": 9.6142450384215e-05, "loss": 2.7276, "step": 9785 }, { "epoch": 0.13, "learning_rate": 9.6138518432127e-05, "loss": 2.7254, "step": 9790 }, { "epoch": 0.13, "learning_rate": 9.613458455765121e-05, "loss": 2.8431, "step": 9795 }, { "epoch": 0.13, "learning_rate": 9.613064876095153e-05, "loss": 2.7559, "step": 9800 }, { "epoch": 0.13, "learning_rate": 9.612671104219196e-05, "loss": 2.713, "step": 9805 }, { "epoch": 0.13, "learning_rate": 9.612277140153655e-05, "loss": 2.738, "step": 9810 }, { "epoch": 0.13, "learning_rate": 9.611882983914945e-05, "loss": 2.7325, "step": 9815 }, { "epoch": 0.13, "learning_rate": 9.611488635519492e-05, "loss": 2.9767, "step": 9820 }, { "epoch": 0.13, "learning_rate": 9.611094094983725e-05, "loss": 2.7905, "step": 9825 }, { "epoch": 0.13, "learning_rate": 9.61069936232408e-05, "loss": 2.8014, "step": 9830 }, { "epoch": 0.13, "learning_rate": 9.610304437557008e-05, "loss": 2.5857, "step": 9835 }, { "epoch": 0.13, "learning_rate": 9.609909320698961e-05, "loss": 2.8709, "step": 9840 }, { "epoch": 0.13, "learning_rate": 9.609514011766403e-05, "loss": 2.8198, "step": 9845 }, { "epoch": 0.13, "learning_rate": 9.609118510775805e-05, "loss": 2.7241, "step": 9850 }, { "epoch": 0.13, "learning_rate": 9.608722817743642e-05, "loss": 2.8117, "step": 9855 }, { "epoch": 0.13, "learning_rate": 9.608326932686407e-05, "loss": 2.6856, "step": 9860 }, { "epoch": 0.13, "learning_rate": 9.607930855620591e-05, "loss": 2.8474, "step": 9865 }, { "epoch": 0.13, "learning_rate": 9.607534586562697e-05, "loss": 2.737, "step": 9870 }, { "epoch": 0.13, "learning_rate": 9.607138125529236e-05, "loss": 2.7879, "step": 9875 }, { "epoch": 0.13, "learning_rate": 9.606741472536726e-05, "loss": 2.7958, "step": 9880 }, { "epoch": 0.13, "learning_rate": 9.606344627601696e-05, "loss": 2.8036, "step": 9885 }, { "epoch": 0.13, "learning_rate": 9.60594759074068e-05, "loss": 2.7218, "step": 9890 }, { "epoch": 0.13, "learning_rate": 9.605550361970219e-05, "loss": 2.808, "step": 9895 }, { "epoch": 0.13, "learning_rate": 9.605152941306865e-05, "loss": 2.7999, "step": 9900 }, { "epoch": 0.13, "learning_rate": 9.604755328767178e-05, "loss": 2.7354, "step": 9905 }, { "epoch": 0.13, "learning_rate": 9.604357524367722e-05, "loss": 2.7407, "step": 9910 }, { "epoch": 0.13, "learning_rate": 9.603959528125075e-05, "loss": 2.7694, "step": 9915 }, { "epoch": 0.13, "learning_rate": 9.603561340055818e-05, "loss": 2.7871, "step": 9920 }, { "epoch": 0.13, "learning_rate": 9.60316296017654e-05, "loss": 2.7513, "step": 9925 }, { "epoch": 0.13, "learning_rate": 9.602764388503843e-05, "loss": 2.7954, "step": 9930 }, { "epoch": 0.13, "learning_rate": 9.602365625054333e-05, "loss": 2.7006, "step": 9935 }, { "epoch": 0.13, "learning_rate": 9.601966669844622e-05, "loss": 2.6895, "step": 9940 }, { "epoch": 0.13, "learning_rate": 9.601567522891335e-05, "loss": 2.7212, "step": 9945 }, { "epoch": 0.13, "learning_rate": 9.601168184211102e-05, "loss": 2.7031, "step": 9950 }, { "epoch": 0.13, "learning_rate": 9.600768653820564e-05, "loss": 2.8565, "step": 9955 }, { "epoch": 0.13, "learning_rate": 9.600368931736364e-05, "loss": 2.8969, "step": 9960 }, { "epoch": 0.13, "learning_rate": 9.59996901797516e-05, "loss": 2.7693, "step": 9965 }, { "epoch": 0.13, "learning_rate": 9.599568912553611e-05, "loss": 2.7789, "step": 9970 }, { "epoch": 0.13, "learning_rate": 9.59916861548839e-05, "loss": 2.7598, "step": 9975 }, { "epoch": 0.13, "learning_rate": 9.598768126796176e-05, "loss": 2.8548, "step": 9980 }, { "epoch": 0.13, "learning_rate": 9.598367446493653e-05, "loss": 2.761, "step": 9985 }, { "epoch": 0.13, "learning_rate": 9.597966574597519e-05, "loss": 2.7147, "step": 9990 }, { "epoch": 0.13, "learning_rate": 9.597565511124474e-05, "loss": 2.8037, "step": 9995 }, { "epoch": 0.13, "learning_rate": 9.59716425609123e-05, "loss": 2.7751, "step": 10000 }, { "epoch": 0.13, "learning_rate": 9.596762809514505e-05, "loss": 2.7256, "step": 10005 }, { "epoch": 0.13, "learning_rate": 9.596361171411026e-05, "loss": 2.834, "step": 10010 }, { "epoch": 0.13, "learning_rate": 9.595959341797525e-05, "loss": 2.785, "step": 10015 }, { "epoch": 0.13, "learning_rate": 9.595557320690748e-05, "loss": 2.7246, "step": 10020 }, { "epoch": 0.13, "learning_rate": 9.595155108107443e-05, "loss": 2.8481, "step": 10025 }, { "epoch": 0.13, "learning_rate": 9.594752704064369e-05, "loss": 2.8044, "step": 10030 }, { "epoch": 0.13, "learning_rate": 9.594350108578293e-05, "loss": 2.7887, "step": 10035 }, { "epoch": 0.13, "learning_rate": 9.59394732166599e-05, "loss": 2.8206, "step": 10040 }, { "epoch": 0.13, "learning_rate": 9.593544343344241e-05, "loss": 2.6489, "step": 10045 }, { "epoch": 0.13, "learning_rate": 9.593141173629836e-05, "loss": 2.7968, "step": 10050 }, { "epoch": 0.13, "learning_rate": 9.592737812539575e-05, "loss": 2.7783, "step": 10055 }, { "epoch": 0.13, "learning_rate": 9.592334260090263e-05, "loss": 2.7301, "step": 10060 }, { "epoch": 0.13, "learning_rate": 9.591930516298714e-05, "loss": 2.9252, "step": 10065 }, { "epoch": 0.13, "learning_rate": 9.591526581181751e-05, "loss": 2.7918, "step": 10070 }, { "epoch": 0.13, "learning_rate": 9.591122454756203e-05, "loss": 2.786, "step": 10075 }, { "epoch": 0.13, "learning_rate": 9.59071813703891e-05, "loss": 2.6729, "step": 10080 }, { "epoch": 0.13, "learning_rate": 9.590313628046717e-05, "loss": 2.7755, "step": 10085 }, { "epoch": 0.13, "learning_rate": 9.589908927796478e-05, "loss": 2.8611, "step": 10090 }, { "epoch": 0.13, "learning_rate": 9.589504036305056e-05, "loss": 2.7485, "step": 10095 }, { "epoch": 0.13, "learning_rate": 9.58909895358932e-05, "loss": 2.8069, "step": 10100 }, { "epoch": 0.13, "learning_rate": 9.588693679666148e-05, "loss": 2.8484, "step": 10105 }, { "epoch": 0.13, "learning_rate": 9.588288214552427e-05, "loss": 2.7904, "step": 10110 }, { "epoch": 0.13, "learning_rate": 9.58788255826505e-05, "loss": 2.7794, "step": 10115 }, { "epoch": 0.13, "learning_rate": 9.58747671082092e-05, "loss": 2.7503, "step": 10120 }, { "epoch": 0.13, "learning_rate": 9.587070672236944e-05, "loss": 2.8427, "step": 10125 }, { "epoch": 0.13, "learning_rate": 9.586664442530044e-05, "loss": 2.7714, "step": 10130 }, { "epoch": 0.13, "learning_rate": 9.586258021717143e-05, "loss": 2.7668, "step": 10135 }, { "epoch": 0.13, "learning_rate": 9.585851409815175e-05, "loss": 2.7497, "step": 10140 }, { "epoch": 0.13, "learning_rate": 9.585444606841083e-05, "loss": 2.6477, "step": 10145 }, { "epoch": 0.13, "learning_rate": 9.585037612811815e-05, "loss": 2.7119, "step": 10150 }, { "epoch": 0.13, "learning_rate": 9.58463042774433e-05, "loss": 2.7953, "step": 10155 }, { "epoch": 0.13, "learning_rate": 9.584223051655594e-05, "loss": 2.838, "step": 10160 }, { "epoch": 0.13, "learning_rate": 9.583815484562578e-05, "loss": 2.6567, "step": 10165 }, { "epoch": 0.13, "learning_rate": 9.583407726482265e-05, "loss": 2.8916, "step": 10170 }, { "epoch": 0.13, "learning_rate": 9.582999777431648e-05, "loss": 2.8174, "step": 10175 }, { "epoch": 0.13, "learning_rate": 9.582591637427717e-05, "loss": 2.7499, "step": 10180 }, { "epoch": 0.13, "learning_rate": 9.582183306487482e-05, "loss": 2.7721, "step": 10185 }, { "epoch": 0.13, "learning_rate": 9.581774784627957e-05, "loss": 2.8627, "step": 10190 }, { "epoch": 0.13, "learning_rate": 9.581366071866163e-05, "loss": 2.776, "step": 10195 }, { "epoch": 0.13, "learning_rate": 9.580957168219127e-05, "loss": 2.7608, "step": 10200 }, { "epoch": 0.13, "learning_rate": 9.580548073703888e-05, "loss": 2.7564, "step": 10205 }, { "epoch": 0.13, "learning_rate": 9.580138788337489e-05, "loss": 2.7136, "step": 10210 }, { "epoch": 0.13, "learning_rate": 9.579729312136987e-05, "loss": 2.7905, "step": 10215 }, { "epoch": 0.13, "learning_rate": 9.57931964511944e-05, "loss": 2.8705, "step": 10220 }, { "epoch": 0.13, "learning_rate": 9.578909787301918e-05, "loss": 2.7689, "step": 10225 }, { "epoch": 0.13, "learning_rate": 9.578499738701498e-05, "loss": 2.7714, "step": 10230 }, { "epoch": 0.13, "learning_rate": 9.578089499335266e-05, "loss": 2.8872, "step": 10235 }, { "epoch": 0.13, "learning_rate": 9.577679069220312e-05, "loss": 2.7487, "step": 10240 }, { "epoch": 0.13, "learning_rate": 9.577268448373738e-05, "loss": 2.6762, "step": 10245 }, { "epoch": 0.13, "learning_rate": 9.576857636812653e-05, "loss": 2.8771, "step": 10250 }, { "epoch": 0.13, "learning_rate": 9.576446634554175e-05, "loss": 2.7915, "step": 10255 }, { "epoch": 0.13, "learning_rate": 9.576035441615428e-05, "loss": 2.8307, "step": 10260 }, { "epoch": 0.13, "learning_rate": 9.575624058013544e-05, "loss": 2.6711, "step": 10265 }, { "epoch": 0.13, "learning_rate": 9.575212483765662e-05, "loss": 2.7541, "step": 10270 }, { "epoch": 0.13, "learning_rate": 9.574800718888933e-05, "loss": 2.8088, "step": 10275 }, { "epoch": 0.13, "learning_rate": 9.574388763400512e-05, "loss": 2.878, "step": 10280 }, { "epoch": 0.13, "learning_rate": 9.573976617317564e-05, "loss": 2.6824, "step": 10285 }, { "epoch": 0.13, "learning_rate": 9.573564280657264e-05, "loss": 2.7962, "step": 10290 }, { "epoch": 0.13, "learning_rate": 9.573151753436787e-05, "loss": 2.6984, "step": 10295 }, { "epoch": 0.13, "learning_rate": 9.572739035673323e-05, "loss": 2.7218, "step": 10300 }, { "epoch": 0.13, "learning_rate": 9.572326127384069e-05, "loss": 2.7882, "step": 10305 }, { "epoch": 0.13, "learning_rate": 9.571913028586231e-05, "loss": 2.8325, "step": 10310 }, { "epoch": 0.13, "learning_rate": 9.571499739297016e-05, "loss": 2.7604, "step": 10315 }, { "epoch": 0.13, "learning_rate": 9.571086259533649e-05, "loss": 2.865, "step": 10320 }, { "epoch": 0.13, "learning_rate": 9.570672589313353e-05, "loss": 2.7481, "step": 10325 }, { "epoch": 0.13, "learning_rate": 9.570258728653367e-05, "loss": 2.6528, "step": 10330 }, { "epoch": 0.13, "learning_rate": 9.569844677570936e-05, "loss": 2.676, "step": 10335 }, { "epoch": 0.13, "learning_rate": 9.569430436083308e-05, "loss": 2.8062, "step": 10340 }, { "epoch": 0.13, "learning_rate": 9.569016004207746e-05, "loss": 2.8786, "step": 10345 }, { "epoch": 0.13, "learning_rate": 9.568601381961515e-05, "loss": 2.7794, "step": 10350 }, { "epoch": 0.13, "learning_rate": 9.568186569361892e-05, "loss": 2.8343, "step": 10355 }, { "epoch": 0.13, "learning_rate": 9.56777156642616e-05, "loss": 2.9059, "step": 10360 }, { "epoch": 0.13, "learning_rate": 9.56735637317161e-05, "loss": 2.7605, "step": 10365 }, { "epoch": 0.13, "learning_rate": 9.566940989615541e-05, "loss": 2.8505, "step": 10370 }, { "epoch": 0.13, "learning_rate": 9.566525415775261e-05, "loss": 2.8062, "step": 10375 }, { "epoch": 0.13, "learning_rate": 9.566109651668084e-05, "loss": 2.785, "step": 10380 }, { "epoch": 0.13, "learning_rate": 9.565693697311335e-05, "loss": 2.8408, "step": 10385 }, { "epoch": 0.13, "learning_rate": 9.565277552722344e-05, "loss": 2.7545, "step": 10390 }, { "epoch": 0.13, "learning_rate": 9.564861217918448e-05, "loss": 2.7675, "step": 10395 }, { "epoch": 0.13, "learning_rate": 9.564444692916998e-05, "loss": 2.8519, "step": 10400 }, { "epoch": 0.14, "learning_rate": 9.564027977735344e-05, "loss": 2.7963, "step": 10405 }, { "epoch": 0.14, "learning_rate": 9.563611072390852e-05, "loss": 2.8305, "step": 10410 }, { "epoch": 0.14, "learning_rate": 9.563193976900892e-05, "loss": 2.7897, "step": 10415 }, { "epoch": 0.14, "learning_rate": 9.56277669128284e-05, "loss": 2.7788, "step": 10420 }, { "epoch": 0.14, "learning_rate": 9.562359215554086e-05, "loss": 2.6573, "step": 10425 }, { "epoch": 0.14, "learning_rate": 9.561941549732023e-05, "loss": 2.8044, "step": 10430 }, { "epoch": 0.14, "learning_rate": 9.561523693834054e-05, "loss": 2.7019, "step": 10435 }, { "epoch": 0.14, "learning_rate": 9.561105647877587e-05, "loss": 2.8408, "step": 10440 }, { "epoch": 0.14, "learning_rate": 9.560687411880043e-05, "loss": 2.8059, "step": 10445 }, { "epoch": 0.14, "learning_rate": 9.560268985858845e-05, "loss": 2.7701, "step": 10450 }, { "epoch": 0.14, "learning_rate": 9.559850369831429e-05, "loss": 2.6734, "step": 10455 }, { "epoch": 0.14, "learning_rate": 9.559431563815237e-05, "loss": 2.8834, "step": 10460 }, { "epoch": 0.14, "learning_rate": 9.559012567827716e-05, "loss": 2.6867, "step": 10465 }, { "epoch": 0.14, "learning_rate": 9.558593381886329e-05, "loss": 2.8627, "step": 10470 }, { "epoch": 0.14, "learning_rate": 9.558174006008536e-05, "loss": 2.7919, "step": 10475 }, { "epoch": 0.14, "learning_rate": 9.557754440211815e-05, "loss": 2.8056, "step": 10480 }, { "epoch": 0.14, "learning_rate": 9.557334684513643e-05, "loss": 2.8606, "step": 10485 }, { "epoch": 0.14, "learning_rate": 9.556914738931515e-05, "loss": 2.7846, "step": 10490 }, { "epoch": 0.14, "learning_rate": 9.556494603482925e-05, "loss": 2.7242, "step": 10495 }, { "epoch": 0.14, "learning_rate": 9.556074278185375e-05, "loss": 2.6852, "step": 10500 }, { "epoch": 0.14, "learning_rate": 9.555653763056383e-05, "loss": 2.6894, "step": 10505 }, { "epoch": 0.14, "learning_rate": 9.555233058113469e-05, "loss": 2.6775, "step": 10510 }, { "epoch": 0.14, "learning_rate": 9.55481216337416e-05, "loss": 2.6884, "step": 10515 }, { "epoch": 0.14, "learning_rate": 9.554391078855996e-05, "loss": 2.7505, "step": 10520 }, { "epoch": 0.14, "learning_rate": 9.553969804576519e-05, "loss": 2.7073, "step": 10525 }, { "epoch": 0.14, "learning_rate": 9.553548340553282e-05, "loss": 2.6591, "step": 10530 }, { "epoch": 0.14, "learning_rate": 9.553126686803847e-05, "loss": 2.8301, "step": 10535 }, { "epoch": 0.14, "learning_rate": 9.552704843345781e-05, "loss": 2.782, "step": 10540 }, { "epoch": 0.14, "learning_rate": 9.552282810196662e-05, "loss": 2.9332, "step": 10545 }, { "epoch": 0.14, "learning_rate": 9.55186058737407e-05, "loss": 2.7325, "step": 10550 }, { "epoch": 0.14, "learning_rate": 9.551438174895604e-05, "loss": 2.8211, "step": 10555 }, { "epoch": 0.14, "learning_rate": 9.551015572778859e-05, "loss": 2.7542, "step": 10560 }, { "epoch": 0.14, "learning_rate": 9.550592781041444e-05, "loss": 2.8503, "step": 10565 }, { "epoch": 0.14, "learning_rate": 9.550169799700974e-05, "loss": 2.8461, "step": 10570 }, { "epoch": 0.14, "learning_rate": 9.549746628775075e-05, "loss": 2.748, "step": 10575 }, { "epoch": 0.14, "learning_rate": 9.549323268281377e-05, "loss": 2.9099, "step": 10580 }, { "epoch": 0.14, "learning_rate": 9.548899718237521e-05, "loss": 2.6716, "step": 10585 }, { "epoch": 0.14, "learning_rate": 9.548475978661154e-05, "loss": 2.7966, "step": 10590 }, { "epoch": 0.14, "learning_rate": 9.548052049569929e-05, "loss": 2.7825, "step": 10595 }, { "epoch": 0.14, "learning_rate": 9.547627930981512e-05, "loss": 2.6966, "step": 10600 }, { "epoch": 0.14, "learning_rate": 9.547203622913574e-05, "loss": 2.9024, "step": 10605 }, { "epoch": 0.14, "learning_rate": 9.546779125383791e-05, "loss": 2.7471, "step": 10610 }, { "epoch": 0.14, "learning_rate": 9.546354438409854e-05, "loss": 2.784, "step": 10615 }, { "epoch": 0.14, "learning_rate": 9.545929562009457e-05, "loss": 2.725, "step": 10620 }, { "epoch": 0.14, "learning_rate": 9.545504496200302e-05, "loss": 2.8493, "step": 10625 }, { "epoch": 0.14, "learning_rate": 9.545079241000098e-05, "loss": 2.7787, "step": 10630 }, { "epoch": 0.14, "learning_rate": 9.544653796426564e-05, "loss": 2.7827, "step": 10635 }, { "epoch": 0.14, "learning_rate": 9.544228162497429e-05, "loss": 2.8616, "step": 10640 }, { "epoch": 0.14, "learning_rate": 9.543802339230425e-05, "loss": 2.7872, "step": 10645 }, { "epoch": 0.14, "learning_rate": 9.543376326643296e-05, "loss": 2.5983, "step": 10650 }, { "epoch": 0.14, "learning_rate": 9.542950124753789e-05, "loss": 2.8458, "step": 10655 }, { "epoch": 0.14, "learning_rate": 9.542523733579665e-05, "loss": 2.7202, "step": 10660 }, { "epoch": 0.14, "learning_rate": 9.542097153138688e-05, "loss": 2.8648, "step": 10665 }, { "epoch": 0.14, "learning_rate": 9.541670383448634e-05, "loss": 2.7984, "step": 10670 }, { "epoch": 0.14, "learning_rate": 9.54124342452728e-05, "loss": 2.7939, "step": 10675 }, { "epoch": 0.14, "learning_rate": 9.54081627639242e-05, "loss": 2.6552, "step": 10680 }, { "epoch": 0.14, "learning_rate": 9.54038893906185e-05, "loss": 2.6784, "step": 10685 }, { "epoch": 0.14, "learning_rate": 9.539961412553375e-05, "loss": 2.7191, "step": 10690 }, { "epoch": 0.14, "learning_rate": 9.539533696884808e-05, "loss": 2.774, "step": 10695 }, { "epoch": 0.14, "learning_rate": 9.53910579207397e-05, "loss": 2.6664, "step": 10700 }, { "epoch": 0.14, "learning_rate": 9.538677698138689e-05, "loss": 2.6984, "step": 10705 }, { "epoch": 0.14, "learning_rate": 9.538249415096804e-05, "loss": 2.897, "step": 10710 }, { "epoch": 0.14, "learning_rate": 9.537820942966161e-05, "loss": 2.8079, "step": 10715 }, { "epoch": 0.14, "learning_rate": 9.537392281764605e-05, "loss": 2.6687, "step": 10720 }, { "epoch": 0.14, "learning_rate": 9.536963431510005e-05, "loss": 2.7903, "step": 10725 }, { "epoch": 0.14, "learning_rate": 9.536534392220226e-05, "loss": 2.8614, "step": 10730 }, { "epoch": 0.14, "learning_rate": 9.536105163913143e-05, "loss": 2.8877, "step": 10735 }, { "epoch": 0.14, "learning_rate": 9.53567574660664e-05, "loss": 2.7983, "step": 10740 }, { "epoch": 0.14, "learning_rate": 9.535246140318612e-05, "loss": 2.8044, "step": 10745 }, { "epoch": 0.14, "learning_rate": 9.534816345066955e-05, "loss": 2.7986, "step": 10750 }, { "epoch": 0.14, "learning_rate": 9.534386360869578e-05, "loss": 2.7792, "step": 10755 }, { "epoch": 0.14, "learning_rate": 9.533956187744399e-05, "loss": 2.758, "step": 10760 }, { "epoch": 0.14, "learning_rate": 9.533525825709337e-05, "loss": 2.6672, "step": 10765 }, { "epoch": 0.14, "learning_rate": 9.533095274782326e-05, "loss": 2.8395, "step": 10770 }, { "epoch": 0.14, "learning_rate": 9.532664534981306e-05, "loss": 2.8643, "step": 10775 }, { "epoch": 0.14, "learning_rate": 9.532233606324222e-05, "loss": 2.715, "step": 10780 }, { "epoch": 0.14, "learning_rate": 9.53180248882903e-05, "loss": 2.7265, "step": 10785 }, { "epoch": 0.14, "learning_rate": 9.531371182513693e-05, "loss": 2.8836, "step": 10790 }, { "epoch": 0.14, "learning_rate": 9.53093968739618e-05, "loss": 2.6349, "step": 10795 }, { "epoch": 0.14, "learning_rate": 9.530508003494472e-05, "loss": 2.8109, "step": 10800 }, { "epoch": 0.14, "learning_rate": 9.53007613082655e-05, "loss": 2.5857, "step": 10805 }, { "epoch": 0.14, "learning_rate": 9.529644069410416e-05, "loss": 2.7816, "step": 10810 }, { "epoch": 0.14, "learning_rate": 9.529211819264067e-05, "loss": 2.8118, "step": 10815 }, { "epoch": 0.14, "learning_rate": 9.528779380405515e-05, "loss": 2.8097, "step": 10820 }, { "epoch": 0.14, "learning_rate": 9.528346752852775e-05, "loss": 2.859, "step": 10825 }, { "epoch": 0.14, "learning_rate": 9.527913936623876e-05, "loss": 2.6806, "step": 10830 }, { "epoch": 0.14, "learning_rate": 9.52748093173685e-05, "loss": 2.7117, "step": 10835 }, { "epoch": 0.14, "learning_rate": 9.527047738209738e-05, "loss": 2.652, "step": 10840 }, { "epoch": 0.14, "learning_rate": 9.52661435606059e-05, "loss": 2.8177, "step": 10845 }, { "epoch": 0.14, "learning_rate": 9.526180785307463e-05, "loss": 2.7282, "step": 10850 }, { "epoch": 0.14, "learning_rate": 9.525747025968423e-05, "loss": 2.7097, "step": 10855 }, { "epoch": 0.14, "learning_rate": 9.525313078061541e-05, "loss": 2.7555, "step": 10860 }, { "epoch": 0.14, "learning_rate": 9.524878941604898e-05, "loss": 2.8331, "step": 10865 }, { "epoch": 0.14, "learning_rate": 9.524444616616583e-05, "loss": 2.7665, "step": 10870 }, { "epoch": 0.14, "learning_rate": 9.524010103114694e-05, "loss": 2.6999, "step": 10875 }, { "epoch": 0.14, "learning_rate": 9.52357540111733e-05, "loss": 2.6532, "step": 10880 }, { "epoch": 0.14, "learning_rate": 9.52314051064261e-05, "loss": 2.8392, "step": 10885 }, { "epoch": 0.14, "learning_rate": 9.522705431708649e-05, "loss": 2.7978, "step": 10890 }, { "epoch": 0.14, "learning_rate": 9.522270164333578e-05, "loss": 2.7185, "step": 10895 }, { "epoch": 0.14, "learning_rate": 9.521834708535531e-05, "loss": 2.58, "step": 10900 }, { "epoch": 0.14, "learning_rate": 9.52139906433265e-05, "loss": 2.7181, "step": 10905 }, { "epoch": 0.14, "learning_rate": 9.52096323174309e-05, "loss": 2.6442, "step": 10910 }, { "epoch": 0.14, "learning_rate": 9.520527210785007e-05, "loss": 2.7567, "step": 10915 }, { "epoch": 0.14, "learning_rate": 9.52009100147657e-05, "loss": 2.7491, "step": 10920 }, { "epoch": 0.14, "learning_rate": 9.519654603835952e-05, "loss": 2.8375, "step": 10925 }, { "epoch": 0.14, "learning_rate": 9.519218017881338e-05, "loss": 2.6875, "step": 10930 }, { "epoch": 0.14, "learning_rate": 9.518781243630917e-05, "loss": 2.7033, "step": 10935 }, { "epoch": 0.14, "learning_rate": 9.518344281102889e-05, "loss": 2.7909, "step": 10940 }, { "epoch": 0.14, "learning_rate": 9.517907130315459e-05, "loss": 2.8016, "step": 10945 }, { "epoch": 0.14, "learning_rate": 9.517469791286841e-05, "loss": 2.7784, "step": 10950 }, { "epoch": 0.14, "learning_rate": 9.517032264035257e-05, "loss": 2.8614, "step": 10955 }, { "epoch": 0.14, "learning_rate": 9.51659454857894e-05, "loss": 2.8171, "step": 10960 }, { "epoch": 0.14, "learning_rate": 9.516156644936122e-05, "loss": 2.9095, "step": 10965 }, { "epoch": 0.14, "learning_rate": 9.515718553125053e-05, "loss": 2.6836, "step": 10970 }, { "epoch": 0.14, "learning_rate": 9.515280273163984e-05, "loss": 2.8023, "step": 10975 }, { "epoch": 0.14, "learning_rate": 9.514841805071177e-05, "loss": 2.7026, "step": 10980 }, { "epoch": 0.14, "learning_rate": 9.5144031488649e-05, "loss": 2.7405, "step": 10985 }, { "epoch": 0.14, "learning_rate": 9.513964304563434e-05, "loss": 2.6887, "step": 10990 }, { "epoch": 0.14, "learning_rate": 9.513525272185057e-05, "loss": 2.9249, "step": 10995 }, { "epoch": 0.14, "learning_rate": 9.513086051748068e-05, "loss": 2.7932, "step": 11000 }, { "epoch": 0.14, "learning_rate": 9.512646643270764e-05, "loss": 2.6896, "step": 11005 }, { "epoch": 0.14, "learning_rate": 9.512207046771452e-05, "loss": 2.7592, "step": 11010 }, { "epoch": 0.14, "learning_rate": 9.511767262268452e-05, "loss": 2.6699, "step": 11015 }, { "epoch": 0.14, "learning_rate": 9.511327289780083e-05, "loss": 2.8708, "step": 11020 }, { "epoch": 0.14, "learning_rate": 9.510887129324682e-05, "loss": 2.6459, "step": 11025 }, { "epoch": 0.14, "learning_rate": 9.510446780920583e-05, "loss": 2.7387, "step": 11030 }, { "epoch": 0.14, "learning_rate": 9.510006244586138e-05, "loss": 2.845, "step": 11035 }, { "epoch": 0.14, "learning_rate": 9.5095655203397e-05, "loss": 2.7763, "step": 11040 }, { "epoch": 0.14, "learning_rate": 9.509124608199633e-05, "loss": 2.7396, "step": 11045 }, { "epoch": 0.14, "learning_rate": 9.508683508184306e-05, "loss": 2.6725, "step": 11050 }, { "epoch": 0.14, "learning_rate": 9.5082422203121e-05, "loss": 2.8192, "step": 11055 }, { "epoch": 0.14, "learning_rate": 9.5078007446014e-05, "loss": 2.7978, "step": 11060 }, { "epoch": 0.14, "learning_rate": 9.507359081070601e-05, "loss": 2.7482, "step": 11065 }, { "epoch": 0.14, "learning_rate": 9.506917229738105e-05, "loss": 2.8139, "step": 11070 }, { "epoch": 0.14, "learning_rate": 9.506475190622322e-05, "loss": 2.8099, "step": 11075 }, { "epoch": 0.14, "learning_rate": 9.506032963741672e-05, "loss": 2.784, "step": 11080 }, { "epoch": 0.14, "learning_rate": 9.505590549114576e-05, "loss": 2.7735, "step": 11085 }, { "epoch": 0.14, "learning_rate": 9.505147946759469e-05, "loss": 2.7769, "step": 11090 }, { "epoch": 0.14, "learning_rate": 9.504705156694794e-05, "loss": 2.6939, "step": 11095 }, { "epoch": 0.14, "learning_rate": 9.504262178939001e-05, "loss": 2.7613, "step": 11100 }, { "epoch": 0.14, "learning_rate": 9.503819013510542e-05, "loss": 2.8411, "step": 11105 }, { "epoch": 0.14, "learning_rate": 9.503375660427887e-05, "loss": 2.678, "step": 11110 }, { "epoch": 0.14, "learning_rate": 9.502932119709507e-05, "loss": 2.7945, "step": 11115 }, { "epoch": 0.14, "learning_rate": 9.502488391373881e-05, "loss": 2.72, "step": 11120 }, { "epoch": 0.14, "learning_rate": 9.502044475439498e-05, "loss": 2.7504, "step": 11125 }, { "epoch": 0.14, "learning_rate": 9.501600371924854e-05, "loss": 2.7315, "step": 11130 }, { "epoch": 0.14, "learning_rate": 9.501156080848453e-05, "loss": 2.8384, "step": 11135 }, { "epoch": 0.14, "learning_rate": 9.500711602228807e-05, "loss": 2.7734, "step": 11140 }, { "epoch": 0.14, "learning_rate": 9.500266936084435e-05, "loss": 2.6334, "step": 11145 }, { "epoch": 0.14, "learning_rate": 9.499822082433863e-05, "loss": 2.6739, "step": 11150 }, { "epoch": 0.14, "learning_rate": 9.49937704129563e-05, "loss": 2.7324, "step": 11155 }, { "epoch": 0.14, "learning_rate": 9.498931812688274e-05, "loss": 2.9248, "step": 11160 }, { "epoch": 0.14, "learning_rate": 9.498486396630349e-05, "loss": 2.7413, "step": 11165 }, { "epoch": 0.14, "learning_rate": 9.498040793140411e-05, "loss": 2.7845, "step": 11170 }, { "epoch": 0.15, "learning_rate": 9.497595002237029e-05, "loss": 2.819, "step": 11175 }, { "epoch": 0.15, "learning_rate": 9.497149023938776e-05, "loss": 2.7259, "step": 11180 }, { "epoch": 0.15, "learning_rate": 9.496702858264233e-05, "loss": 2.6915, "step": 11185 }, { "epoch": 0.15, "learning_rate": 9.49625650523199e-05, "loss": 2.6912, "step": 11190 }, { "epoch": 0.15, "learning_rate": 9.495809964860649e-05, "loss": 2.7087, "step": 11195 }, { "epoch": 0.15, "learning_rate": 9.495363237168808e-05, "loss": 2.8147, "step": 11200 }, { "epoch": 0.15, "learning_rate": 9.494916322175084e-05, "loss": 2.8605, "step": 11205 }, { "epoch": 0.15, "learning_rate": 9.494469219898099e-05, "loss": 2.9013, "step": 11210 }, { "epoch": 0.15, "learning_rate": 9.494021930356479e-05, "loss": 2.8006, "step": 11215 }, { "epoch": 0.15, "learning_rate": 9.493574453568863e-05, "loss": 2.6936, "step": 11220 }, { "epoch": 0.15, "learning_rate": 9.493126789553894e-05, "loss": 2.8016, "step": 11225 }, { "epoch": 0.15, "learning_rate": 9.492678938330225e-05, "loss": 2.7934, "step": 11230 }, { "epoch": 0.15, "learning_rate": 9.492230899916515e-05, "loss": 2.8583, "step": 11235 }, { "epoch": 0.15, "learning_rate": 9.491782674331432e-05, "loss": 2.8144, "step": 11240 }, { "epoch": 0.15, "learning_rate": 9.491334261593653e-05, "loss": 2.7239, "step": 11245 }, { "epoch": 0.15, "learning_rate": 9.49088566172186e-05, "loss": 2.7508, "step": 11250 }, { "epoch": 0.15, "learning_rate": 9.490436874734743e-05, "loss": 2.7791, "step": 11255 }, { "epoch": 0.15, "learning_rate": 9.489987900651005e-05, "loss": 2.793, "step": 11260 }, { "epoch": 0.15, "learning_rate": 9.489538739489347e-05, "loss": 2.8902, "step": 11265 }, { "epoch": 0.15, "learning_rate": 9.489089391268489e-05, "loss": 2.74, "step": 11270 }, { "epoch": 0.15, "learning_rate": 9.488639856007151e-05, "loss": 2.8004, "step": 11275 }, { "epoch": 0.15, "learning_rate": 9.488190133724062e-05, "loss": 2.6732, "step": 11280 }, { "epoch": 0.15, "learning_rate": 9.487740224437962e-05, "loss": 2.656, "step": 11285 }, { "epoch": 0.15, "learning_rate": 9.487290128167597e-05, "loss": 2.7215, "step": 11290 }, { "epoch": 0.15, "learning_rate": 9.486839844931717e-05, "loss": 2.8815, "step": 11295 }, { "epoch": 0.15, "learning_rate": 9.486389374749087e-05, "loss": 2.7461, "step": 11300 }, { "epoch": 0.15, "learning_rate": 9.485938717638475e-05, "loss": 2.9176, "step": 11305 }, { "epoch": 0.15, "learning_rate": 9.485487873618657e-05, "loss": 2.7982, "step": 11310 }, { "epoch": 0.15, "learning_rate": 9.485036842708418e-05, "loss": 2.7579, "step": 11315 }, { "epoch": 0.15, "learning_rate": 9.484585624926553e-05, "loss": 2.7771, "step": 11320 }, { "epoch": 0.15, "learning_rate": 9.484134220291859e-05, "loss": 2.6871, "step": 11325 }, { "epoch": 0.15, "learning_rate": 9.483682628823145e-05, "loss": 2.8038, "step": 11330 }, { "epoch": 0.15, "learning_rate": 9.483230850539227e-05, "loss": 2.7528, "step": 11335 }, { "epoch": 0.15, "learning_rate": 9.482778885458927e-05, "loss": 2.7177, "step": 11340 }, { "epoch": 0.15, "learning_rate": 9.482326733601079e-05, "loss": 2.8122, "step": 11345 }, { "epoch": 0.15, "learning_rate": 9.481874394984522e-05, "loss": 2.8434, "step": 11350 }, { "epoch": 0.15, "learning_rate": 9.481421869628102e-05, "loss": 2.6392, "step": 11355 }, { "epoch": 0.15, "learning_rate": 9.480969157550672e-05, "loss": 2.7254, "step": 11360 }, { "epoch": 0.15, "learning_rate": 9.480516258771097e-05, "loss": 2.7688, "step": 11365 }, { "epoch": 0.15, "learning_rate": 9.480063173308247e-05, "loss": 2.7873, "step": 11370 }, { "epoch": 0.15, "learning_rate": 9.479609901181e-05, "loss": 2.7414, "step": 11375 }, { "epoch": 0.15, "learning_rate": 9.479156442408242e-05, "loss": 2.746, "step": 11380 }, { "epoch": 0.15, "learning_rate": 9.478702797008863e-05, "loss": 2.7374, "step": 11385 }, { "epoch": 0.15, "learning_rate": 9.47824896500177e-05, "loss": 2.7179, "step": 11390 }, { "epoch": 0.15, "learning_rate": 9.477794946405869e-05, "loss": 2.9093, "step": 11395 }, { "epoch": 0.15, "learning_rate": 9.477340741240078e-05, "loss": 2.8169, "step": 11400 }, { "epoch": 0.15, "learning_rate": 9.476886349523321e-05, "loss": 2.7692, "step": 11405 }, { "epoch": 0.15, "learning_rate": 9.476431771274532e-05, "loss": 2.7458, "step": 11410 }, { "epoch": 0.15, "learning_rate": 9.475977006512648e-05, "loss": 2.7773, "step": 11415 }, { "epoch": 0.15, "learning_rate": 9.475522055256621e-05, "loss": 2.7358, "step": 11420 }, { "epoch": 0.15, "learning_rate": 9.475066917525404e-05, "loss": 2.769, "step": 11425 }, { "epoch": 0.15, "learning_rate": 9.474611593337961e-05, "loss": 2.8694, "step": 11430 }, { "epoch": 0.15, "learning_rate": 9.474156082713264e-05, "loss": 2.726, "step": 11435 }, { "epoch": 0.15, "learning_rate": 9.473700385670292e-05, "loss": 2.7846, "step": 11440 }, { "epoch": 0.15, "learning_rate": 9.473244502228031e-05, "loss": 2.7795, "step": 11445 }, { "epoch": 0.15, "learning_rate": 9.472788432405478e-05, "loss": 2.6993, "step": 11450 }, { "epoch": 0.15, "learning_rate": 9.472332176221634e-05, "loss": 2.8369, "step": 11455 }, { "epoch": 0.15, "learning_rate": 9.471875733695508e-05, "loss": 2.8901, "step": 11460 }, { "epoch": 0.15, "learning_rate": 9.471419104846119e-05, "loss": 2.628, "step": 11465 }, { "epoch": 0.15, "learning_rate": 9.470962289692493e-05, "loss": 2.7638, "step": 11470 }, { "epoch": 0.15, "learning_rate": 9.470505288253664e-05, "loss": 2.713, "step": 11475 }, { "epoch": 0.15, "learning_rate": 9.470048100548671e-05, "loss": 2.6958, "step": 11480 }, { "epoch": 0.15, "learning_rate": 9.469590726596564e-05, "loss": 2.7256, "step": 11485 }, { "epoch": 0.15, "learning_rate": 9.469133166416402e-05, "loss": 2.7948, "step": 11490 }, { "epoch": 0.15, "learning_rate": 9.468675420027246e-05, "loss": 2.7396, "step": 11495 }, { "epoch": 0.15, "learning_rate": 9.46821748744817e-05, "loss": 2.8855, "step": 11500 }, { "epoch": 0.15, "learning_rate": 9.467759368698255e-05, "loss": 2.7134, "step": 11505 }, { "epoch": 0.15, "learning_rate": 9.467301063796587e-05, "loss": 2.8038, "step": 11510 }, { "epoch": 0.15, "learning_rate": 9.466842572762262e-05, "loss": 2.7887, "step": 11515 }, { "epoch": 0.15, "learning_rate": 9.466383895614384e-05, "loss": 2.6267, "step": 11520 }, { "epoch": 0.15, "learning_rate": 9.465925032372063e-05, "loss": 2.8265, "step": 11525 }, { "epoch": 0.15, "learning_rate": 9.465465983054419e-05, "loss": 2.8522, "step": 11530 }, { "epoch": 0.15, "learning_rate": 9.465006747680577e-05, "loss": 2.7116, "step": 11535 }, { "epoch": 0.15, "learning_rate": 9.464547326269673e-05, "loss": 2.7169, "step": 11540 }, { "epoch": 0.15, "learning_rate": 9.464087718840849e-05, "loss": 2.694, "step": 11545 }, { "epoch": 0.15, "learning_rate": 9.463627925413252e-05, "loss": 2.6606, "step": 11550 }, { "epoch": 0.15, "learning_rate": 9.463167946006042e-05, "loss": 2.8458, "step": 11555 }, { "epoch": 0.15, "learning_rate": 9.462707780638384e-05, "loss": 2.8822, "step": 11560 }, { "epoch": 0.15, "learning_rate": 9.462247429329453e-05, "loss": 2.7425, "step": 11565 }, { "epoch": 0.15, "learning_rate": 9.461786892098427e-05, "loss": 2.7122, "step": 11570 }, { "epoch": 0.15, "learning_rate": 9.461326168964495e-05, "loss": 2.7845, "step": 11575 }, { "epoch": 0.15, "learning_rate": 9.460865259946852e-05, "loss": 2.6984, "step": 11580 }, { "epoch": 0.15, "learning_rate": 9.460404165064706e-05, "loss": 2.8578, "step": 11585 }, { "epoch": 0.15, "learning_rate": 9.459942884337264e-05, "loss": 2.7787, "step": 11590 }, { "epoch": 0.15, "learning_rate": 9.45948141778375e-05, "loss": 2.7702, "step": 11595 }, { "epoch": 0.15, "learning_rate": 9.45901976542339e-05, "loss": 2.8385, "step": 11600 }, { "epoch": 0.15, "learning_rate": 9.458557927275417e-05, "loss": 2.6656, "step": 11605 }, { "epoch": 0.15, "learning_rate": 9.458095903359075e-05, "loss": 2.7208, "step": 11610 }, { "epoch": 0.15, "learning_rate": 9.457633693693614e-05, "loss": 2.7405, "step": 11615 }, { "epoch": 0.15, "learning_rate": 9.457171298298293e-05, "loss": 2.8087, "step": 11620 }, { "epoch": 0.15, "learning_rate": 9.456708717192379e-05, "loss": 2.6834, "step": 11625 }, { "epoch": 0.15, "learning_rate": 9.456245950395143e-05, "loss": 2.7267, "step": 11630 }, { "epoch": 0.15, "learning_rate": 9.455782997925868e-05, "loss": 2.8282, "step": 11635 }, { "epoch": 0.15, "learning_rate": 9.455319859803843e-05, "loss": 2.8593, "step": 11640 }, { "epoch": 0.15, "learning_rate": 9.454856536048365e-05, "loss": 2.6607, "step": 11645 }, { "epoch": 0.15, "learning_rate": 9.454393026678738e-05, "loss": 2.6939, "step": 11650 }, { "epoch": 0.15, "learning_rate": 9.453929331714277e-05, "loss": 2.7103, "step": 11655 }, { "epoch": 0.15, "learning_rate": 9.4534654511743e-05, "loss": 2.7237, "step": 11660 }, { "epoch": 0.15, "learning_rate": 9.453001385078133e-05, "loss": 2.881, "step": 11665 }, { "epoch": 0.15, "learning_rate": 9.452537133445114e-05, "loss": 2.6389, "step": 11670 }, { "epoch": 0.15, "learning_rate": 9.452072696294586e-05, "loss": 2.7987, "step": 11675 }, { "epoch": 0.15, "learning_rate": 9.4516080736459e-05, "loss": 2.8135, "step": 11680 }, { "epoch": 0.15, "learning_rate": 9.451143265518414e-05, "loss": 2.677, "step": 11685 }, { "epoch": 0.15, "learning_rate": 9.450678271931497e-05, "loss": 2.6561, "step": 11690 }, { "epoch": 0.15, "learning_rate": 9.450213092904519e-05, "loss": 2.8331, "step": 11695 }, { "epoch": 0.15, "learning_rate": 9.449747728456865e-05, "loss": 2.7385, "step": 11700 }, { "epoch": 0.15, "learning_rate": 9.449282178607925e-05, "loss": 2.8087, "step": 11705 }, { "epoch": 0.15, "learning_rate": 9.448816443377096e-05, "loss": 2.7482, "step": 11710 }, { "epoch": 0.15, "learning_rate": 9.448350522783779e-05, "loss": 2.8617, "step": 11715 }, { "epoch": 0.15, "learning_rate": 9.447884416847395e-05, "loss": 2.7464, "step": 11720 }, { "epoch": 0.15, "learning_rate": 9.447418125587357e-05, "loss": 2.7684, "step": 11725 }, { "epoch": 0.15, "learning_rate": 9.446951649023098e-05, "loss": 2.7619, "step": 11730 }, { "epoch": 0.15, "learning_rate": 9.44648498717405e-05, "loss": 2.9471, "step": 11735 }, { "epoch": 0.15, "learning_rate": 9.44601814005966e-05, "loss": 2.6425, "step": 11740 }, { "epoch": 0.15, "learning_rate": 9.445551107699377e-05, "loss": 2.7347, "step": 11745 }, { "epoch": 0.15, "learning_rate": 9.445083890112664e-05, "loss": 2.747, "step": 11750 }, { "epoch": 0.15, "learning_rate": 9.444616487318985e-05, "loss": 2.841, "step": 11755 }, { "epoch": 0.15, "learning_rate": 9.444148899337815e-05, "loss": 2.7105, "step": 11760 }, { "epoch": 0.15, "learning_rate": 9.443681126188635e-05, "loss": 2.7365, "step": 11765 }, { "epoch": 0.15, "learning_rate": 9.443213167890937e-05, "loss": 2.6899, "step": 11770 }, { "epoch": 0.15, "learning_rate": 9.44274502446422e-05, "loss": 2.7486, "step": 11775 }, { "epoch": 0.15, "learning_rate": 9.442276695927986e-05, "loss": 2.6709, "step": 11780 }, { "epoch": 0.15, "learning_rate": 9.441808182301751e-05, "loss": 2.9125, "step": 11785 }, { "epoch": 0.15, "learning_rate": 9.441339483605033e-05, "loss": 2.6194, "step": 11790 }, { "epoch": 0.15, "learning_rate": 9.440870599857363e-05, "loss": 2.7504, "step": 11795 }, { "epoch": 0.15, "learning_rate": 9.440401531078277e-05, "loss": 2.7598, "step": 11800 }, { "epoch": 0.15, "learning_rate": 9.439932277287318e-05, "loss": 2.77, "step": 11805 }, { "epoch": 0.15, "learning_rate": 9.439462838504039e-05, "loss": 2.6386, "step": 11810 }, { "epoch": 0.15, "learning_rate": 9.438993214747999e-05, "loss": 2.7775, "step": 11815 }, { "epoch": 0.15, "learning_rate": 9.438523406038763e-05, "loss": 2.7744, "step": 11820 }, { "epoch": 0.15, "learning_rate": 9.43805341239591e-05, "loss": 2.7009, "step": 11825 }, { "epoch": 0.15, "learning_rate": 9.43758323383902e-05, "loss": 2.7076, "step": 11830 }, { "epoch": 0.15, "learning_rate": 9.437112870387684e-05, "loss": 2.6648, "step": 11835 }, { "epoch": 0.15, "learning_rate": 9.436642322061499e-05, "loss": 2.8421, "step": 11840 }, { "epoch": 0.15, "learning_rate": 9.436171588880071e-05, "loss": 2.7808, "step": 11845 }, { "epoch": 0.15, "learning_rate": 9.435700670863014e-05, "loss": 2.8372, "step": 11850 }, { "epoch": 0.15, "learning_rate": 9.435229568029948e-05, "loss": 2.796, "step": 11855 }, { "epoch": 0.15, "learning_rate": 9.434758280400504e-05, "loss": 2.713, "step": 11860 }, { "epoch": 0.15, "learning_rate": 9.434286807994316e-05, "loss": 2.7536, "step": 11865 }, { "epoch": 0.15, "learning_rate": 9.43381515083103e-05, "loss": 2.8158, "step": 11870 }, { "epoch": 0.15, "learning_rate": 9.433343308930295e-05, "loss": 2.7919, "step": 11875 }, { "epoch": 0.15, "learning_rate": 9.432871282311772e-05, "loss": 2.6698, "step": 11880 }, { "epoch": 0.15, "learning_rate": 9.43239907099513e-05, "loss": 2.8194, "step": 11885 }, { "epoch": 0.15, "learning_rate": 9.431926675000044e-05, "loss": 2.7116, "step": 11890 }, { "epoch": 0.15, "learning_rate": 9.431454094346195e-05, "loss": 2.7698, "step": 11895 }, { "epoch": 0.15, "learning_rate": 9.430981329053272e-05, "loss": 2.7829, "step": 11900 }, { "epoch": 0.15, "learning_rate": 9.430508379140976e-05, "loss": 2.6872, "step": 11905 }, { "epoch": 0.15, "learning_rate": 9.430035244629012e-05, "loss": 2.7569, "step": 11910 }, { "epoch": 0.15, "learning_rate": 9.429561925537092e-05, "loss": 2.7784, "step": 11915 }, { "epoch": 0.15, "learning_rate": 9.429088421884938e-05, "loss": 2.7525, "step": 11920 }, { "epoch": 0.15, "learning_rate": 9.42861473369228e-05, "loss": 2.8178, "step": 11925 }, { "epoch": 0.15, "learning_rate": 9.428140860978853e-05, "loss": 2.8506, "step": 11930 }, { "epoch": 0.15, "learning_rate": 9.4276668037644e-05, "loss": 2.8494, "step": 11935 }, { "epoch": 0.15, "learning_rate": 9.427192562068675e-05, "loss": 2.6227, "step": 11940 }, { "epoch": 0.16, "learning_rate": 9.426718135911438e-05, "loss": 2.8104, "step": 11945 }, { "epoch": 0.16, "learning_rate": 9.426243525312453e-05, "loss": 2.8713, "step": 11950 }, { "epoch": 0.16, "learning_rate": 9.4257687302915e-05, "loss": 2.8332, "step": 11955 }, { "epoch": 0.16, "learning_rate": 9.425293750868356e-05, "loss": 2.6774, "step": 11960 }, { "epoch": 0.16, "learning_rate": 9.424818587062816e-05, "loss": 2.6927, "step": 11965 }, { "epoch": 0.16, "learning_rate": 9.424343238894674e-05, "loss": 2.7405, "step": 11970 }, { "epoch": 0.16, "learning_rate": 9.423867706383738e-05, "loss": 2.6027, "step": 11975 }, { "epoch": 0.16, "learning_rate": 9.423391989549823e-05, "loss": 2.7904, "step": 11980 }, { "epoch": 0.16, "learning_rate": 9.422916088412745e-05, "loss": 2.8708, "step": 11985 }, { "epoch": 0.16, "learning_rate": 9.422440002992338e-05, "loss": 2.8216, "step": 11990 }, { "epoch": 0.16, "learning_rate": 9.421963733308434e-05, "loss": 2.7967, "step": 11995 }, { "epoch": 0.16, "learning_rate": 9.42148727938088e-05, "loss": 2.6725, "step": 12000 }, { "epoch": 0.16, "learning_rate": 9.421010641229528e-05, "loss": 2.8157, "step": 12005 }, { "epoch": 0.16, "learning_rate": 9.420533818874235e-05, "loss": 2.7022, "step": 12010 }, { "epoch": 0.16, "learning_rate": 9.42005681233487e-05, "loss": 2.7815, "step": 12015 }, { "epoch": 0.16, "learning_rate": 9.419579621631304e-05, "loss": 2.7369, "step": 12020 }, { "epoch": 0.16, "learning_rate": 9.419102246783427e-05, "loss": 2.7213, "step": 12025 }, { "epoch": 0.16, "learning_rate": 9.418624687811121e-05, "loss": 2.8912, "step": 12030 }, { "epoch": 0.16, "learning_rate": 9.41814694473429e-05, "loss": 2.705, "step": 12035 }, { "epoch": 0.16, "learning_rate": 9.417669017572835e-05, "loss": 2.6753, "step": 12040 }, { "epoch": 0.16, "learning_rate": 9.417190906346672e-05, "loss": 2.8426, "step": 12045 }, { "epoch": 0.16, "learning_rate": 9.416712611075718e-05, "loss": 2.8543, "step": 12050 }, { "epoch": 0.16, "learning_rate": 9.416234131779907e-05, "loss": 2.835, "step": 12055 }, { "epoch": 0.16, "learning_rate": 9.415755468479171e-05, "loss": 2.7167, "step": 12060 }, { "epoch": 0.16, "learning_rate": 9.415276621193455e-05, "loss": 2.6794, "step": 12065 }, { "epoch": 0.16, "learning_rate": 9.41479758994271e-05, "loss": 2.6603, "step": 12070 }, { "epoch": 0.16, "learning_rate": 9.414318374746895e-05, "loss": 2.8327, "step": 12075 }, { "epoch": 0.16, "learning_rate": 9.413838975625979e-05, "loss": 2.767, "step": 12080 }, { "epoch": 0.16, "learning_rate": 9.413359392599934e-05, "loss": 2.6589, "step": 12085 }, { "epoch": 0.16, "learning_rate": 9.412879625688742e-05, "loss": 2.8829, "step": 12090 }, { "epoch": 0.16, "learning_rate": 9.412399674912396e-05, "loss": 2.7827, "step": 12095 }, { "epoch": 0.16, "learning_rate": 9.411919540290887e-05, "loss": 2.7491, "step": 12100 }, { "epoch": 0.16, "learning_rate": 9.411439221844227e-05, "loss": 2.7512, "step": 12105 }, { "epoch": 0.16, "learning_rate": 9.410958719592427e-05, "loss": 2.667, "step": 12110 }, { "epoch": 0.16, "learning_rate": 9.410478033555504e-05, "loss": 2.7113, "step": 12115 }, { "epoch": 0.16, "learning_rate": 9.409997163753488e-05, "loss": 2.8083, "step": 12120 }, { "epoch": 0.16, "learning_rate": 9.409516110206417e-05, "loss": 2.755, "step": 12125 }, { "epoch": 0.16, "learning_rate": 9.40903487293433e-05, "loss": 2.8055, "step": 12130 }, { "epoch": 0.16, "learning_rate": 9.408553451957283e-05, "loss": 2.8301, "step": 12135 }, { "epoch": 0.16, "learning_rate": 9.40807184729533e-05, "loss": 2.6462, "step": 12140 }, { "epoch": 0.16, "learning_rate": 9.407590058968541e-05, "loss": 2.7597, "step": 12145 }, { "epoch": 0.16, "learning_rate": 9.407108086996987e-05, "loss": 2.8406, "step": 12150 }, { "epoch": 0.16, "learning_rate": 9.406625931400753e-05, "loss": 2.6744, "step": 12155 }, { "epoch": 0.16, "learning_rate": 9.406143592199924e-05, "loss": 2.7032, "step": 12160 }, { "epoch": 0.16, "learning_rate": 9.4056610694146e-05, "loss": 2.7101, "step": 12165 }, { "epoch": 0.16, "learning_rate": 9.405178363064885e-05, "loss": 2.8218, "step": 12170 }, { "epoch": 0.16, "learning_rate": 9.404695473170892e-05, "loss": 2.7012, "step": 12175 }, { "epoch": 0.16, "learning_rate": 9.40421239975274e-05, "loss": 2.6986, "step": 12180 }, { "epoch": 0.16, "learning_rate": 9.403729142830555e-05, "loss": 2.7986, "step": 12185 }, { "epoch": 0.16, "learning_rate": 9.403245702424475e-05, "loss": 2.8115, "step": 12190 }, { "epoch": 0.16, "learning_rate": 9.402762078554641e-05, "loss": 2.848, "step": 12195 }, { "epoch": 0.16, "learning_rate": 9.402278271241204e-05, "loss": 2.8568, "step": 12200 }, { "epoch": 0.16, "learning_rate": 9.401794280504324e-05, "loss": 2.6883, "step": 12205 }, { "epoch": 0.16, "learning_rate": 9.401310106364162e-05, "loss": 2.7805, "step": 12210 }, { "epoch": 0.16, "learning_rate": 9.400825748840896e-05, "loss": 2.7337, "step": 12215 }, { "epoch": 0.16, "learning_rate": 9.400341207954704e-05, "loss": 2.7899, "step": 12220 }, { "epoch": 0.16, "learning_rate": 9.399856483725778e-05, "loss": 2.7811, "step": 12225 }, { "epoch": 0.16, "learning_rate": 9.39937157617431e-05, "loss": 2.7467, "step": 12230 }, { "epoch": 0.16, "learning_rate": 9.398886485320507e-05, "loss": 2.7753, "step": 12235 }, { "epoch": 0.16, "learning_rate": 9.39840121118458e-05, "loss": 2.7105, "step": 12240 }, { "epoch": 0.16, "learning_rate": 9.397915753786748e-05, "loss": 2.6659, "step": 12245 }, { "epoch": 0.16, "learning_rate": 9.397430113147237e-05, "loss": 2.7376, "step": 12250 }, { "epoch": 0.16, "learning_rate": 9.396944289286284e-05, "loss": 2.7464, "step": 12255 }, { "epoch": 0.16, "learning_rate": 9.396458282224127e-05, "loss": 2.789, "step": 12260 }, { "epoch": 0.16, "learning_rate": 9.395972091981022e-05, "loss": 2.7505, "step": 12265 }, { "epoch": 0.16, "learning_rate": 9.39548571857722e-05, "loss": 2.8219, "step": 12270 }, { "epoch": 0.16, "learning_rate": 9.39499916203299e-05, "loss": 2.7633, "step": 12275 }, { "epoch": 0.16, "learning_rate": 9.394512422368602e-05, "loss": 2.8167, "step": 12280 }, { "epoch": 0.16, "learning_rate": 9.394025499604338e-05, "loss": 2.7147, "step": 12285 }, { "epoch": 0.16, "learning_rate": 9.393538393760485e-05, "loss": 2.6657, "step": 12290 }, { "epoch": 0.16, "learning_rate": 9.393051104857342e-05, "loss": 2.7192, "step": 12295 }, { "epoch": 0.16, "learning_rate": 9.392563632915206e-05, "loss": 2.6831, "step": 12300 }, { "epoch": 0.16, "learning_rate": 9.392075977954394e-05, "loss": 2.7903, "step": 12305 }, { "epoch": 0.16, "learning_rate": 9.391588139995218e-05, "loss": 2.6814, "step": 12310 }, { "epoch": 0.16, "learning_rate": 9.39110011905801e-05, "loss": 2.6425, "step": 12315 }, { "epoch": 0.16, "learning_rate": 9.390611915163102e-05, "loss": 2.697, "step": 12320 }, { "epoch": 0.16, "learning_rate": 9.390123528330832e-05, "loss": 2.7689, "step": 12325 }, { "epoch": 0.16, "learning_rate": 9.389634958581552e-05, "loss": 2.6746, "step": 12330 }, { "epoch": 0.16, "learning_rate": 9.389146205935619e-05, "loss": 2.7524, "step": 12335 }, { "epoch": 0.16, "learning_rate": 9.388657270413394e-05, "loss": 2.8673, "step": 12340 }, { "epoch": 0.16, "learning_rate": 9.388168152035253e-05, "loss": 2.6326, "step": 12345 }, { "epoch": 0.16, "learning_rate": 9.387678850821573e-05, "loss": 2.786, "step": 12350 }, { "epoch": 0.16, "learning_rate": 9.387189366792742e-05, "loss": 2.7623, "step": 12355 }, { "epoch": 0.16, "learning_rate": 9.386699699969153e-05, "loss": 2.6865, "step": 12360 }, { "epoch": 0.16, "learning_rate": 9.386209850371208e-05, "loss": 2.7963, "step": 12365 }, { "epoch": 0.16, "learning_rate": 9.385719818019321e-05, "loss": 2.8015, "step": 12370 }, { "epoch": 0.16, "learning_rate": 9.385229602933903e-05, "loss": 2.7208, "step": 12375 }, { "epoch": 0.16, "learning_rate": 9.384739205135385e-05, "loss": 2.7783, "step": 12380 }, { "epoch": 0.16, "learning_rate": 9.384248624644197e-05, "loss": 2.7366, "step": 12385 }, { "epoch": 0.16, "learning_rate": 9.38375786148078e-05, "loss": 2.685, "step": 12390 }, { "epoch": 0.16, "learning_rate": 9.38326691566558e-05, "loss": 2.7609, "step": 12395 }, { "epoch": 0.16, "learning_rate": 9.382775787219056e-05, "loss": 2.881, "step": 12400 }, { "epoch": 0.16, "learning_rate": 9.38228447616167e-05, "loss": 2.7347, "step": 12405 }, { "epoch": 0.16, "learning_rate": 9.381792982513888e-05, "loss": 2.8066, "step": 12410 }, { "epoch": 0.16, "learning_rate": 9.381301306296196e-05, "loss": 2.5949, "step": 12415 }, { "epoch": 0.16, "learning_rate": 9.380809447529076e-05, "loss": 2.642, "step": 12420 }, { "epoch": 0.16, "learning_rate": 9.380317406233019e-05, "loss": 2.8745, "step": 12425 }, { "epoch": 0.16, "learning_rate": 9.379825182428533e-05, "loss": 2.5969, "step": 12430 }, { "epoch": 0.16, "learning_rate": 9.37933277613612e-05, "loss": 2.8417, "step": 12435 }, { "epoch": 0.16, "learning_rate": 9.3788401873763e-05, "loss": 2.6501, "step": 12440 }, { "epoch": 0.16, "learning_rate": 9.378347416169597e-05, "loss": 2.6399, "step": 12445 }, { "epoch": 0.16, "learning_rate": 9.377854462536542e-05, "loss": 2.8643, "step": 12450 }, { "epoch": 0.16, "learning_rate": 9.377361326497674e-05, "loss": 2.8026, "step": 12455 }, { "epoch": 0.16, "learning_rate": 9.376868008073538e-05, "loss": 2.7163, "step": 12460 }, { "epoch": 0.16, "learning_rate": 9.376374507284693e-05, "loss": 2.7024, "step": 12465 }, { "epoch": 0.16, "learning_rate": 9.375880824151697e-05, "loss": 2.691, "step": 12470 }, { "epoch": 0.16, "learning_rate": 9.37538695869512e-05, "loss": 2.6321, "step": 12475 }, { "epoch": 0.16, "learning_rate": 9.374892910935542e-05, "loss": 2.6948, "step": 12480 }, { "epoch": 0.16, "learning_rate": 9.374398680893544e-05, "loss": 2.6612, "step": 12485 }, { "epoch": 0.16, "learning_rate": 9.373904268589722e-05, "loss": 2.7118, "step": 12490 }, { "epoch": 0.16, "learning_rate": 9.373409674044673e-05, "loss": 2.7391, "step": 12495 }, { "epoch": 0.16, "learning_rate": 9.372914897279006e-05, "loss": 2.7582, "step": 12500 }, { "epoch": 0.16, "learning_rate": 9.372419938313335e-05, "loss": 2.707, "step": 12505 }, { "epoch": 0.16, "learning_rate": 9.371924797168286e-05, "loss": 2.7061, "step": 12510 }, { "epoch": 0.16, "learning_rate": 9.371429473864483e-05, "loss": 2.8078, "step": 12515 }, { "epoch": 0.16, "learning_rate": 9.37093396842257e-05, "loss": 2.8034, "step": 12520 }, { "epoch": 0.16, "learning_rate": 9.370438280863192e-05, "loss": 2.7252, "step": 12525 }, { "epoch": 0.16, "learning_rate": 9.369942411207e-05, "loss": 2.8914, "step": 12530 }, { "epoch": 0.16, "learning_rate": 9.369446359474654e-05, "loss": 2.7994, "step": 12535 }, { "epoch": 0.16, "learning_rate": 9.368950125686824e-05, "loss": 2.6516, "step": 12540 }, { "epoch": 0.16, "learning_rate": 9.368453709864184e-05, "loss": 2.7547, "step": 12545 }, { "epoch": 0.16, "learning_rate": 9.367957112027421e-05, "loss": 2.7508, "step": 12550 }, { "epoch": 0.16, "learning_rate": 9.367460332197223e-05, "loss": 2.8684, "step": 12555 }, { "epoch": 0.16, "learning_rate": 9.366963370394289e-05, "loss": 2.6756, "step": 12560 }, { "epoch": 0.16, "learning_rate": 9.366466226639327e-05, "loss": 2.737, "step": 12565 }, { "epoch": 0.16, "learning_rate": 9.365968900953048e-05, "loss": 2.8521, "step": 12570 }, { "epoch": 0.16, "learning_rate": 9.365471393356176e-05, "loss": 2.7311, "step": 12575 }, { "epoch": 0.16, "learning_rate": 9.364973703869437e-05, "loss": 2.6491, "step": 12580 }, { "epoch": 0.16, "learning_rate": 9.36447583251357e-05, "loss": 2.7765, "step": 12585 }, { "epoch": 0.16, "learning_rate": 9.363977779309321e-05, "loss": 2.7943, "step": 12590 }, { "epoch": 0.16, "learning_rate": 9.363479544277436e-05, "loss": 2.7525, "step": 12595 }, { "epoch": 0.16, "learning_rate": 9.362981127438677e-05, "loss": 2.8283, "step": 12600 }, { "epoch": 0.16, "learning_rate": 9.362482528813815e-05, "loss": 2.7572, "step": 12605 }, { "epoch": 0.16, "learning_rate": 9.361983748423615e-05, "loss": 2.6895, "step": 12610 }, { "epoch": 0.16, "learning_rate": 9.361484786288868e-05, "loss": 2.7933, "step": 12615 }, { "epoch": 0.16, "learning_rate": 9.36098564243036e-05, "loss": 2.7763, "step": 12620 }, { "epoch": 0.16, "learning_rate": 9.360486316868886e-05, "loss": 2.7252, "step": 12625 }, { "epoch": 0.16, "learning_rate": 9.359986809625254e-05, "loss": 2.7656, "step": 12630 }, { "epoch": 0.16, "learning_rate": 9.359487120720276e-05, "loss": 2.7381, "step": 12635 }, { "epoch": 0.16, "learning_rate": 9.358987250174769e-05, "loss": 2.7299, "step": 12640 }, { "epoch": 0.16, "learning_rate": 9.358487198009564e-05, "loss": 2.8053, "step": 12645 }, { "epoch": 0.16, "learning_rate": 9.357986964245494e-05, "loss": 2.7214, "step": 12650 }, { "epoch": 0.16, "learning_rate": 9.3574865489034e-05, "loss": 2.6099, "step": 12655 }, { "epoch": 0.16, "learning_rate": 9.356985952004136e-05, "loss": 2.7937, "step": 12660 }, { "epoch": 0.16, "learning_rate": 9.356485173568556e-05, "loss": 2.6875, "step": 12665 }, { "epoch": 0.16, "learning_rate": 9.355984213617528e-05, "loss": 2.6735, "step": 12670 }, { "epoch": 0.16, "learning_rate": 9.355483072171922e-05, "loss": 2.7575, "step": 12675 }, { "epoch": 0.16, "learning_rate": 9.354981749252621e-05, "loss": 2.6443, "step": 12680 }, { "epoch": 0.16, "learning_rate": 9.354480244880513e-05, "loss": 2.784, "step": 12685 }, { "epoch": 0.16, "learning_rate": 9.353978559076491e-05, "loss": 2.6758, "step": 12690 }, { "epoch": 0.16, "learning_rate": 9.353476691861458e-05, "loss": 2.833, "step": 12695 }, { "epoch": 0.16, "learning_rate": 9.352974643256327e-05, "loss": 2.6977, "step": 12700 }, { "epoch": 0.16, "learning_rate": 9.352472413282015e-05, "loss": 2.6549, "step": 12705 }, { "epoch": 0.16, "learning_rate": 9.351970001959447e-05, "loss": 2.6819, "step": 12710 }, { "epoch": 0.17, "learning_rate": 9.351467409309558e-05, "loss": 2.8726, "step": 12715 }, { "epoch": 0.17, "learning_rate": 9.350964635353287e-05, "loss": 2.8121, "step": 12720 }, { "epoch": 0.17, "learning_rate": 9.350461680111584e-05, "loss": 2.6066, "step": 12725 }, { "epoch": 0.17, "learning_rate": 9.349958543605404e-05, "loss": 2.6986, "step": 12730 }, { "epoch": 0.17, "learning_rate": 9.34945522585571e-05, "loss": 2.7211, "step": 12735 }, { "epoch": 0.17, "learning_rate": 9.348951726883473e-05, "loss": 2.7323, "step": 12740 }, { "epoch": 0.17, "learning_rate": 9.348448046709672e-05, "loss": 2.5975, "step": 12745 }, { "epoch": 0.17, "learning_rate": 9.347944185355295e-05, "loss": 2.7767, "step": 12750 }, { "epoch": 0.17, "learning_rate": 9.347440142841333e-05, "loss": 2.6617, "step": 12755 }, { "epoch": 0.17, "learning_rate": 9.346935919188787e-05, "loss": 2.7513, "step": 12760 }, { "epoch": 0.17, "learning_rate": 9.346431514418668e-05, "loss": 2.6735, "step": 12765 }, { "epoch": 0.17, "learning_rate": 9.345926928551991e-05, "loss": 2.7612, "step": 12770 }, { "epoch": 0.17, "learning_rate": 9.34542216160978e-05, "loss": 2.6269, "step": 12775 }, { "epoch": 0.17, "learning_rate": 9.344917213613067e-05, "loss": 2.6775, "step": 12780 }, { "epoch": 0.17, "learning_rate": 9.34441208458289e-05, "loss": 2.7118, "step": 12785 }, { "epoch": 0.17, "learning_rate": 9.343906774540295e-05, "loss": 2.686, "step": 12790 }, { "epoch": 0.17, "learning_rate": 9.343401283506338e-05, "loss": 2.6675, "step": 12795 }, { "epoch": 0.17, "learning_rate": 9.342895611502079e-05, "loss": 2.5172, "step": 12800 }, { "epoch": 0.17, "learning_rate": 9.342389758548588e-05, "loss": 2.6616, "step": 12805 }, { "epoch": 0.17, "learning_rate": 9.34188372466694e-05, "loss": 2.6968, "step": 12810 }, { "epoch": 0.17, "learning_rate": 9.341377509878223e-05, "loss": 2.7025, "step": 12815 }, { "epoch": 0.17, "learning_rate": 9.340871114203524e-05, "loss": 2.7506, "step": 12820 }, { "epoch": 0.17, "learning_rate": 9.340364537663946e-05, "loss": 2.8149, "step": 12825 }, { "epoch": 0.17, "learning_rate": 9.339857780280594e-05, "loss": 2.6275, "step": 12830 }, { "epoch": 0.17, "learning_rate": 9.339350842074582e-05, "loss": 2.7063, "step": 12835 }, { "epoch": 0.17, "learning_rate": 9.338843723067032e-05, "loss": 2.764, "step": 12840 }, { "epoch": 0.17, "learning_rate": 9.338336423279075e-05, "loss": 2.7319, "step": 12845 }, { "epoch": 0.17, "learning_rate": 9.337828942731846e-05, "loss": 2.7688, "step": 12850 }, { "epoch": 0.17, "learning_rate": 9.33732128144649e-05, "loss": 2.7089, "step": 12855 }, { "epoch": 0.17, "learning_rate": 9.336813439444161e-05, "loss": 2.735, "step": 12860 }, { "epoch": 0.17, "learning_rate": 9.336305416746016e-05, "loss": 2.8013, "step": 12865 }, { "epoch": 0.17, "learning_rate": 9.335797213373222e-05, "loss": 2.7125, "step": 12870 }, { "epoch": 0.17, "learning_rate": 9.335288829346955e-05, "loss": 2.7854, "step": 12875 }, { "epoch": 0.17, "learning_rate": 9.334780264688396e-05, "loss": 2.7834, "step": 12880 }, { "epoch": 0.17, "learning_rate": 9.334271519418736e-05, "loss": 2.7238, "step": 12885 }, { "epoch": 0.17, "learning_rate": 9.33376259355917e-05, "loss": 2.7177, "step": 12890 }, { "epoch": 0.17, "learning_rate": 9.333253487130906e-05, "loss": 2.7343, "step": 12895 }, { "epoch": 0.17, "learning_rate": 9.332744200155154e-05, "loss": 2.7821, "step": 12900 }, { "epoch": 0.17, "learning_rate": 9.332234732653133e-05, "loss": 2.6253, "step": 12905 }, { "epoch": 0.17, "learning_rate": 9.331725084646072e-05, "loss": 2.8616, "step": 12910 }, { "epoch": 0.17, "learning_rate": 9.331215256155203e-05, "loss": 2.7192, "step": 12915 }, { "epoch": 0.17, "learning_rate": 9.330705247201773e-05, "loss": 2.7149, "step": 12920 }, { "epoch": 0.17, "learning_rate": 9.330195057807027e-05, "loss": 2.715, "step": 12925 }, { "epoch": 0.17, "learning_rate": 9.329684687992226e-05, "loss": 2.8438, "step": 12930 }, { "epoch": 0.17, "learning_rate": 9.329174137778634e-05, "loss": 2.6245, "step": 12935 }, { "epoch": 0.17, "learning_rate": 9.32866340718752e-05, "loss": 2.7136, "step": 12940 }, { "epoch": 0.17, "learning_rate": 9.328152496240169e-05, "loss": 2.87, "step": 12945 }, { "epoch": 0.17, "learning_rate": 9.327641404957866e-05, "loss": 2.84, "step": 12950 }, { "epoch": 0.17, "learning_rate": 9.327130133361904e-05, "loss": 2.7589, "step": 12955 }, { "epoch": 0.17, "learning_rate": 9.326618681473589e-05, "loss": 2.6717, "step": 12960 }, { "epoch": 0.17, "learning_rate": 9.326107049314228e-05, "loss": 2.8546, "step": 12965 }, { "epoch": 0.17, "learning_rate": 9.32559523690514e-05, "loss": 2.6902, "step": 12970 }, { "epoch": 0.17, "learning_rate": 9.32508324426765e-05, "loss": 2.7351, "step": 12975 }, { "epoch": 0.17, "learning_rate": 9.32457107142309e-05, "loss": 2.718, "step": 12980 }, { "epoch": 0.17, "learning_rate": 9.324058718392798e-05, "loss": 2.6219, "step": 12985 }, { "epoch": 0.17, "learning_rate": 9.323546185198127e-05, "loss": 2.7106, "step": 12990 }, { "epoch": 0.17, "learning_rate": 9.323033471860427e-05, "loss": 2.6748, "step": 12995 }, { "epoch": 0.17, "learning_rate": 9.322520578401062e-05, "loss": 2.5159, "step": 13000 }, { "epoch": 0.17, "learning_rate": 9.322007504841401e-05, "loss": 2.685, "step": 13005 }, { "epoch": 0.17, "learning_rate": 9.321494251202824e-05, "loss": 2.8663, "step": 13010 }, { "epoch": 0.17, "learning_rate": 9.320980817506715e-05, "loss": 2.7204, "step": 13015 }, { "epoch": 0.17, "learning_rate": 9.320467203774465e-05, "loss": 2.6173, "step": 13020 }, { "epoch": 0.17, "learning_rate": 9.319953410027475e-05, "loss": 2.6614, "step": 13025 }, { "epoch": 0.17, "learning_rate": 9.319439436287154e-05, "loss": 2.7639, "step": 13030 }, { "epoch": 0.17, "learning_rate": 9.318925282574914e-05, "loss": 2.739, "step": 13035 }, { "epoch": 0.17, "learning_rate": 9.31841094891218e-05, "loss": 2.7071, "step": 13040 }, { "epoch": 0.17, "learning_rate": 9.31789643532038e-05, "loss": 2.7708, "step": 13045 }, { "epoch": 0.17, "learning_rate": 9.317381741820955e-05, "loss": 2.6895, "step": 13050 }, { "epoch": 0.17, "learning_rate": 9.316866868435345e-05, "loss": 2.748, "step": 13055 }, { "epoch": 0.17, "learning_rate": 9.316351815185006e-05, "loss": 2.7994, "step": 13060 }, { "epoch": 0.17, "learning_rate": 9.315836582091397e-05, "loss": 2.7356, "step": 13065 }, { "epoch": 0.17, "learning_rate": 9.315321169175986e-05, "loss": 2.6891, "step": 13070 }, { "epoch": 0.17, "learning_rate": 9.314805576460246e-05, "loss": 2.743, "step": 13075 }, { "epoch": 0.17, "learning_rate": 9.314289803965663e-05, "loss": 2.7895, "step": 13080 }, { "epoch": 0.17, "learning_rate": 9.313773851713725e-05, "loss": 2.7504, "step": 13085 }, { "epoch": 0.17, "learning_rate": 9.313257719725927e-05, "loss": 2.7821, "step": 13090 }, { "epoch": 0.17, "learning_rate": 9.31274140802378e-05, "loss": 2.7493, "step": 13095 }, { "epoch": 0.17, "learning_rate": 9.31222491662879e-05, "loss": 2.666, "step": 13100 }, { "epoch": 0.17, "learning_rate": 9.31170824556248e-05, "loss": 2.8132, "step": 13105 }, { "epoch": 0.17, "learning_rate": 9.311191394846378e-05, "loss": 2.7089, "step": 13110 }, { "epoch": 0.17, "learning_rate": 9.310674364502018e-05, "loss": 2.6882, "step": 13115 }, { "epoch": 0.17, "learning_rate": 9.310157154550942e-05, "loss": 2.6413, "step": 13120 }, { "epoch": 0.17, "learning_rate": 9.3096397650147e-05, "loss": 2.7499, "step": 13125 }, { "epoch": 0.17, "learning_rate": 9.309122195914848e-05, "loss": 2.6216, "step": 13130 }, { "epoch": 0.17, "learning_rate": 9.308604447272955e-05, "loss": 2.6559, "step": 13135 }, { "epoch": 0.17, "learning_rate": 9.30808651911059e-05, "loss": 2.7359, "step": 13140 }, { "epoch": 0.17, "learning_rate": 9.307568411449333e-05, "loss": 2.7312, "step": 13145 }, { "epoch": 0.17, "learning_rate": 9.30705012431077e-05, "loss": 2.6256, "step": 13150 }, { "epoch": 0.17, "learning_rate": 9.3065316577165e-05, "loss": 2.7338, "step": 13155 }, { "epoch": 0.17, "learning_rate": 9.306013011688121e-05, "loss": 2.7779, "step": 13160 }, { "epoch": 0.17, "learning_rate": 9.305494186247246e-05, "loss": 2.8004, "step": 13165 }, { "epoch": 0.17, "learning_rate": 9.304975181415489e-05, "loss": 2.7297, "step": 13170 }, { "epoch": 0.17, "learning_rate": 9.304455997214476e-05, "loss": 2.7206, "step": 13175 }, { "epoch": 0.17, "learning_rate": 9.30393663366584e-05, "loss": 2.76, "step": 13180 }, { "epoch": 0.17, "learning_rate": 9.303417090791218e-05, "loss": 2.647, "step": 13185 }, { "epoch": 0.17, "learning_rate": 9.30289736861226e-05, "loss": 2.599, "step": 13190 }, { "epoch": 0.17, "learning_rate": 9.302377467150619e-05, "loss": 2.8337, "step": 13195 }, { "epoch": 0.17, "learning_rate": 9.301857386427956e-05, "loss": 2.7336, "step": 13200 }, { "epoch": 0.17, "learning_rate": 9.301337126465945e-05, "loss": 2.8183, "step": 13205 }, { "epoch": 0.17, "learning_rate": 9.300816687286258e-05, "loss": 2.7259, "step": 13210 }, { "epoch": 0.17, "learning_rate": 9.300296068910581e-05, "loss": 2.7947, "step": 13215 }, { "epoch": 0.17, "learning_rate": 9.299775271360606e-05, "loss": 2.7063, "step": 13220 }, { "epoch": 0.17, "learning_rate": 9.299254294658033e-05, "loss": 2.8579, "step": 13225 }, { "epoch": 0.17, "learning_rate": 9.298733138824567e-05, "loss": 2.6937, "step": 13230 }, { "epoch": 0.17, "learning_rate": 9.298211803881924e-05, "loss": 2.6948, "step": 13235 }, { "epoch": 0.17, "learning_rate": 9.297690289851824e-05, "loss": 2.8219, "step": 13240 }, { "epoch": 0.17, "learning_rate": 9.297168596755999e-05, "loss": 2.7196, "step": 13245 }, { "epoch": 0.17, "learning_rate": 9.296646724616182e-05, "loss": 2.7431, "step": 13250 }, { "epoch": 0.17, "learning_rate": 9.29612467345412e-05, "loss": 2.6684, "step": 13255 }, { "epoch": 0.17, "learning_rate": 9.295602443291563e-05, "loss": 2.7123, "step": 13260 }, { "epoch": 0.17, "learning_rate": 9.295080034150272e-05, "loss": 2.7059, "step": 13265 }, { "epoch": 0.17, "learning_rate": 9.29455744605201e-05, "loss": 2.66, "step": 13270 }, { "epoch": 0.17, "learning_rate": 9.294034679018554e-05, "loss": 2.6222, "step": 13275 }, { "epoch": 0.17, "learning_rate": 9.293511733071684e-05, "loss": 2.8068, "step": 13280 }, { "epoch": 0.17, "learning_rate": 9.29298860823319e-05, "loss": 2.7597, "step": 13285 }, { "epoch": 0.17, "learning_rate": 9.292465304524866e-05, "loss": 2.6128, "step": 13290 }, { "epoch": 0.17, "learning_rate": 9.29194182196852e-05, "loss": 2.8494, "step": 13295 }, { "epoch": 0.17, "learning_rate": 9.291418160585958e-05, "loss": 2.7149, "step": 13300 }, { "epoch": 0.17, "learning_rate": 9.290894320399002e-05, "loss": 2.7676, "step": 13305 }, { "epoch": 0.17, "learning_rate": 9.290370301429476e-05, "loss": 2.7444, "step": 13310 }, { "epoch": 0.17, "learning_rate": 9.289846103699216e-05, "loss": 2.6753, "step": 13315 }, { "epoch": 0.17, "learning_rate": 9.289321727230062e-05, "loss": 2.8331, "step": 13320 }, { "epoch": 0.17, "learning_rate": 9.288797172043862e-05, "loss": 2.7444, "step": 13325 }, { "epoch": 0.17, "learning_rate": 9.288272438162471e-05, "loss": 2.777, "step": 13330 }, { "epoch": 0.17, "learning_rate": 9.287747525607753e-05, "loss": 2.7075, "step": 13335 }, { "epoch": 0.17, "learning_rate": 9.287222434401582e-05, "loss": 2.714, "step": 13340 }, { "epoch": 0.17, "learning_rate": 9.28669716456583e-05, "loss": 2.8811, "step": 13345 }, { "epoch": 0.17, "learning_rate": 9.28617171612239e-05, "loss": 2.6922, "step": 13350 }, { "epoch": 0.17, "learning_rate": 9.285646089093148e-05, "loss": 2.6671, "step": 13355 }, { "epoch": 0.17, "learning_rate": 9.285120283500008e-05, "loss": 2.595, "step": 13360 }, { "epoch": 0.17, "learning_rate": 9.28459429936488e-05, "loss": 2.7484, "step": 13365 }, { "epoch": 0.17, "learning_rate": 9.284068136709675e-05, "loss": 2.6725, "step": 13370 }, { "epoch": 0.17, "learning_rate": 9.283541795556319e-05, "loss": 2.705, "step": 13375 }, { "epoch": 0.17, "learning_rate": 9.283015275926741e-05, "loss": 2.8373, "step": 13380 }, { "epoch": 0.17, "learning_rate": 9.282488577842879e-05, "loss": 2.8184, "step": 13385 }, { "epoch": 0.17, "learning_rate": 9.281961701326678e-05, "loss": 2.8147, "step": 13390 }, { "epoch": 0.17, "learning_rate": 9.281434646400092e-05, "loss": 2.6711, "step": 13395 }, { "epoch": 0.17, "learning_rate": 9.280907413085079e-05, "loss": 2.7702, "step": 13400 }, { "epoch": 0.17, "learning_rate": 9.280380001403608e-05, "loss": 2.82, "step": 13405 }, { "epoch": 0.17, "learning_rate": 9.279852411377652e-05, "loss": 2.7265, "step": 13410 }, { "epoch": 0.17, "learning_rate": 9.279324643029198e-05, "loss": 2.7347, "step": 13415 }, { "epoch": 0.17, "learning_rate": 9.278796696380227e-05, "loss": 2.8002, "step": 13420 }, { "epoch": 0.17, "learning_rate": 9.278268571452746e-05, "loss": 2.5987, "step": 13425 }, { "epoch": 0.17, "learning_rate": 9.277740268268752e-05, "loss": 2.9072, "step": 13430 }, { "epoch": 0.17, "learning_rate": 9.277211786850264e-05, "loss": 2.789, "step": 13435 }, { "epoch": 0.17, "learning_rate": 9.276683127219297e-05, "loss": 2.7798, "step": 13440 }, { "epoch": 0.17, "learning_rate": 9.276154289397877e-05, "loss": 2.7488, "step": 13445 }, { "epoch": 0.17, "learning_rate": 9.275625273408041e-05, "loss": 2.7265, "step": 13450 }, { "epoch": 0.17, "learning_rate": 9.275096079271829e-05, "loss": 2.7845, "step": 13455 }, { "epoch": 0.17, "learning_rate": 9.274566707011291e-05, "loss": 2.8053, "step": 13460 }, { "epoch": 0.17, "learning_rate": 9.274037156648485e-05, "loss": 2.6074, "step": 13465 }, { "epoch": 0.17, "learning_rate": 9.273507428205472e-05, "loss": 2.7659, "step": 13470 }, { "epoch": 0.17, "learning_rate": 9.272977521704325e-05, "loss": 2.722, "step": 13475 }, { "epoch": 0.17, "learning_rate": 9.272447437167125e-05, "loss": 2.8016, "step": 13480 }, { "epoch": 0.18, "learning_rate": 9.271917174615953e-05, "loss": 2.605, "step": 13485 }, { "epoch": 0.18, "learning_rate": 9.271386734072908e-05, "loss": 2.8263, "step": 13490 }, { "epoch": 0.18, "learning_rate": 9.270856115560089e-05, "loss": 2.7588, "step": 13495 }, { "epoch": 0.18, "learning_rate": 9.270325319099602e-05, "loss": 2.76, "step": 13500 }, { "epoch": 0.18, "learning_rate": 9.269794344713568e-05, "loss": 2.7082, "step": 13505 }, { "epoch": 0.18, "learning_rate": 9.269263192424107e-05, "loss": 2.5794, "step": 13510 }, { "epoch": 0.18, "learning_rate": 9.26873186225335e-05, "loss": 2.7583, "step": 13515 }, { "epoch": 0.18, "learning_rate": 9.268200354223437e-05, "loss": 2.7677, "step": 13520 }, { "epoch": 0.18, "learning_rate": 9.267668668356512e-05, "loss": 2.6924, "step": 13525 }, { "epoch": 0.18, "learning_rate": 9.267136804674727e-05, "loss": 2.6457, "step": 13530 }, { "epoch": 0.18, "learning_rate": 9.266604763200245e-05, "loss": 2.6098, "step": 13535 }, { "epoch": 0.18, "learning_rate": 9.266072543955233e-05, "loss": 2.7453, "step": 13540 }, { "epoch": 0.18, "learning_rate": 9.265540146961864e-05, "loss": 2.7576, "step": 13545 }, { "epoch": 0.18, "learning_rate": 9.265007572242323e-05, "loss": 2.7628, "step": 13550 }, { "epoch": 0.18, "learning_rate": 9.264474819818799e-05, "loss": 2.7422, "step": 13555 }, { "epoch": 0.18, "learning_rate": 9.26394188971349e-05, "loss": 2.6796, "step": 13560 }, { "epoch": 0.18, "learning_rate": 9.263408781948601e-05, "loss": 2.7869, "step": 13565 }, { "epoch": 0.18, "learning_rate": 9.262875496546344e-05, "loss": 2.689, "step": 13570 }, { "epoch": 0.18, "learning_rate": 9.262342033528939e-05, "loss": 2.6926, "step": 13575 }, { "epoch": 0.18, "learning_rate": 9.261808392918611e-05, "loss": 2.6755, "step": 13580 }, { "epoch": 0.18, "learning_rate": 9.261274574737598e-05, "loss": 2.626, "step": 13585 }, { "epoch": 0.18, "learning_rate": 9.260740579008138e-05, "loss": 2.5976, "step": 13590 }, { "epoch": 0.18, "learning_rate": 9.260206405752483e-05, "loss": 2.6497, "step": 13595 }, { "epoch": 0.18, "learning_rate": 9.259672054992888e-05, "loss": 2.7319, "step": 13600 }, { "epoch": 0.18, "learning_rate": 9.25913752675162e-05, "loss": 2.7073, "step": 13605 }, { "epoch": 0.18, "learning_rate": 9.258602821050946e-05, "loss": 2.7298, "step": 13610 }, { "epoch": 0.18, "learning_rate": 9.258067937913147e-05, "loss": 2.7897, "step": 13615 }, { "epoch": 0.18, "learning_rate": 9.25753287736051e-05, "loss": 2.76, "step": 13620 }, { "epoch": 0.18, "learning_rate": 9.256997639415327e-05, "loss": 2.7697, "step": 13625 }, { "epoch": 0.18, "learning_rate": 9.2564622240999e-05, "loss": 2.724, "step": 13630 }, { "epoch": 0.18, "learning_rate": 9.255926631436538e-05, "loss": 2.7104, "step": 13635 }, { "epoch": 0.18, "learning_rate": 9.255390861447555e-05, "loss": 2.5601, "step": 13640 }, { "epoch": 0.18, "learning_rate": 9.254854914155276e-05, "loss": 2.6599, "step": 13645 }, { "epoch": 0.18, "learning_rate": 9.25431878958203e-05, "loss": 2.6623, "step": 13650 }, { "epoch": 0.18, "learning_rate": 9.253782487750156e-05, "loss": 2.8866, "step": 13655 }, { "epoch": 0.18, "learning_rate": 9.253246008681999e-05, "loss": 2.7415, "step": 13660 }, { "epoch": 0.18, "learning_rate": 9.252709352399912e-05, "loss": 2.6904, "step": 13665 }, { "epoch": 0.18, "learning_rate": 9.252172518926254e-05, "loss": 2.6842, "step": 13670 }, { "epoch": 0.18, "learning_rate": 9.251635508283394e-05, "loss": 2.8054, "step": 13675 }, { "epoch": 0.18, "learning_rate": 9.251098320493706e-05, "loss": 2.6797, "step": 13680 }, { "epoch": 0.18, "learning_rate": 9.250560955579571e-05, "loss": 2.772, "step": 13685 }, { "epoch": 0.18, "learning_rate": 9.250023413563383e-05, "loss": 2.7239, "step": 13690 }, { "epoch": 0.18, "learning_rate": 9.249485694467532e-05, "loss": 2.7338, "step": 13695 }, { "epoch": 0.18, "learning_rate": 9.248947798314429e-05, "loss": 2.6864, "step": 13700 }, { "epoch": 0.18, "learning_rate": 9.248409725126481e-05, "loss": 2.6543, "step": 13705 }, { "epoch": 0.18, "learning_rate": 9.247871474926111e-05, "loss": 2.5833, "step": 13710 }, { "epoch": 0.18, "learning_rate": 9.247333047735743e-05, "loss": 2.7017, "step": 13715 }, { "epoch": 0.18, "learning_rate": 9.246794443577811e-05, "loss": 2.761, "step": 13720 }, { "epoch": 0.18, "learning_rate": 9.246255662474758e-05, "loss": 2.7562, "step": 13725 }, { "epoch": 0.18, "learning_rate": 9.24571670444903e-05, "loss": 2.7371, "step": 13730 }, { "epoch": 0.18, "learning_rate": 9.245177569523085e-05, "loss": 2.7043, "step": 13735 }, { "epoch": 0.18, "learning_rate": 9.244638257719387e-05, "loss": 2.7293, "step": 13740 }, { "epoch": 0.18, "learning_rate": 9.244098769060404e-05, "loss": 2.6327, "step": 13745 }, { "epoch": 0.18, "learning_rate": 9.243559103568618e-05, "loss": 2.6814, "step": 13750 }, { "epoch": 0.18, "learning_rate": 9.243019261266508e-05, "loss": 2.7527, "step": 13755 }, { "epoch": 0.18, "learning_rate": 9.242479242176573e-05, "loss": 2.686, "step": 13760 }, { "epoch": 0.18, "learning_rate": 9.241939046321312e-05, "loss": 2.728, "step": 13765 }, { "epoch": 0.18, "learning_rate": 9.241398673723231e-05, "loss": 2.7451, "step": 13770 }, { "epoch": 0.18, "learning_rate": 9.240858124404847e-05, "loss": 2.7558, "step": 13775 }, { "epoch": 0.18, "learning_rate": 9.240317398388679e-05, "loss": 2.7149, "step": 13780 }, { "epoch": 0.18, "learning_rate": 9.239776495697259e-05, "loss": 2.8014, "step": 13785 }, { "epoch": 0.18, "learning_rate": 9.239235416353124e-05, "loss": 2.7712, "step": 13790 }, { "epoch": 0.18, "learning_rate": 9.238694160378818e-05, "loss": 2.786, "step": 13795 }, { "epoch": 0.18, "learning_rate": 9.238152727796894e-05, "loss": 2.771, "step": 13800 }, { "epoch": 0.18, "learning_rate": 9.237611118629907e-05, "loss": 2.8241, "step": 13805 }, { "epoch": 0.18, "learning_rate": 9.237069332900429e-05, "loss": 2.9044, "step": 13810 }, { "epoch": 0.18, "learning_rate": 9.236527370631029e-05, "loss": 2.6805, "step": 13815 }, { "epoch": 0.18, "learning_rate": 9.23598523184429e-05, "loss": 2.8124, "step": 13820 }, { "epoch": 0.18, "learning_rate": 9.235442916562805e-05, "loss": 2.7961, "step": 13825 }, { "epoch": 0.18, "learning_rate": 9.234900424809162e-05, "loss": 2.7988, "step": 13830 }, { "epoch": 0.18, "learning_rate": 9.234357756605968e-05, "loss": 2.5787, "step": 13835 }, { "epoch": 0.18, "learning_rate": 9.233814911975834e-05, "loss": 2.7235, "step": 13840 }, { "epoch": 0.18, "learning_rate": 9.233271890941378e-05, "loss": 2.7984, "step": 13845 }, { "epoch": 0.18, "learning_rate": 9.232728693525225e-05, "loss": 2.6869, "step": 13850 }, { "epoch": 0.18, "learning_rate": 9.232185319750006e-05, "loss": 2.785, "step": 13855 }, { "epoch": 0.18, "learning_rate": 9.231641769638363e-05, "loss": 2.7144, "step": 13860 }, { "epoch": 0.18, "learning_rate": 9.231098043212942e-05, "loss": 2.7178, "step": 13865 }, { "epoch": 0.18, "learning_rate": 9.2305541404964e-05, "loss": 2.8169, "step": 13870 }, { "epoch": 0.18, "learning_rate": 9.230010061511396e-05, "loss": 2.7128, "step": 13875 }, { "epoch": 0.18, "learning_rate": 9.229465806280601e-05, "loss": 2.7934, "step": 13880 }, { "epoch": 0.18, "learning_rate": 9.228921374826691e-05, "loss": 2.4815, "step": 13885 }, { "epoch": 0.18, "learning_rate": 9.228376767172351e-05, "loss": 2.7198, "step": 13890 }, { "epoch": 0.18, "learning_rate": 9.227831983340271e-05, "loss": 2.6764, "step": 13895 }, { "epoch": 0.18, "learning_rate": 9.227287023353152e-05, "loss": 2.7156, "step": 13900 }, { "epoch": 0.18, "learning_rate": 9.226741887233698e-05, "loss": 2.6184, "step": 13905 }, { "epoch": 0.18, "learning_rate": 9.226196575004622e-05, "loss": 2.6737, "step": 13910 }, { "epoch": 0.18, "learning_rate": 9.225651086688647e-05, "loss": 2.6704, "step": 13915 }, { "epoch": 0.18, "learning_rate": 9.2251054223085e-05, "loss": 2.7127, "step": 13920 }, { "epoch": 0.18, "learning_rate": 9.224559581886916e-05, "loss": 2.6805, "step": 13925 }, { "epoch": 0.18, "learning_rate": 9.224013565446638e-05, "loss": 2.7267, "step": 13930 }, { "epoch": 0.18, "learning_rate": 9.223467373010415e-05, "loss": 2.782, "step": 13935 }, { "epoch": 0.18, "learning_rate": 9.222921004601007e-05, "loss": 2.6403, "step": 13940 }, { "epoch": 0.18, "learning_rate": 9.222374460241177e-05, "loss": 2.7812, "step": 13945 }, { "epoch": 0.18, "learning_rate": 9.221827739953697e-05, "loss": 2.6152, "step": 13950 }, { "epoch": 0.18, "learning_rate": 9.221280843761349e-05, "loss": 2.8394, "step": 13955 }, { "epoch": 0.18, "learning_rate": 9.220733771686915e-05, "loss": 2.7042, "step": 13960 }, { "epoch": 0.18, "learning_rate": 9.220186523753191e-05, "loss": 2.7393, "step": 13965 }, { "epoch": 0.18, "learning_rate": 9.219639099982981e-05, "loss": 2.6534, "step": 13970 }, { "epoch": 0.18, "learning_rate": 9.219091500399091e-05, "loss": 2.7472, "step": 13975 }, { "epoch": 0.18, "learning_rate": 9.218543725024338e-05, "loss": 2.6295, "step": 13980 }, { "epoch": 0.18, "learning_rate": 9.217995773881545e-05, "loss": 2.7584, "step": 13985 }, { "epoch": 0.18, "learning_rate": 9.217447646993544e-05, "loss": 2.7407, "step": 13990 }, { "epoch": 0.18, "learning_rate": 9.21689934438317e-05, "loss": 2.7068, "step": 13995 }, { "epoch": 0.18, "learning_rate": 9.216350866073271e-05, "loss": 2.8057, "step": 14000 }, { "epoch": 0.18, "learning_rate": 9.2158022120867e-05, "loss": 2.6157, "step": 14005 }, { "epoch": 0.18, "learning_rate": 9.215253382446314e-05, "loss": 2.6949, "step": 14010 }, { "epoch": 0.18, "learning_rate": 9.214704377174983e-05, "loss": 2.8407, "step": 14015 }, { "epoch": 0.18, "learning_rate": 9.214155196295582e-05, "loss": 2.5716, "step": 14020 }, { "epoch": 0.18, "learning_rate": 9.21360583983099e-05, "loss": 2.5686, "step": 14025 }, { "epoch": 0.18, "learning_rate": 9.213056307804098e-05, "loss": 2.8061, "step": 14030 }, { "epoch": 0.18, "learning_rate": 9.212506600237803e-05, "loss": 2.7045, "step": 14035 }, { "epoch": 0.18, "learning_rate": 9.21195671715501e-05, "loss": 2.6875, "step": 14040 }, { "epoch": 0.18, "learning_rate": 9.211406658578628e-05, "loss": 2.6568, "step": 14045 }, { "epoch": 0.18, "learning_rate": 9.210856424531573e-05, "loss": 2.6045, "step": 14050 }, { "epoch": 0.18, "learning_rate": 9.210306015036778e-05, "loss": 2.8033, "step": 14055 }, { "epoch": 0.18, "learning_rate": 9.209755430117169e-05, "loss": 2.7069, "step": 14060 }, { "epoch": 0.18, "learning_rate": 9.209204669795691e-05, "loss": 2.5436, "step": 14065 }, { "epoch": 0.18, "learning_rate": 9.208653734095291e-05, "loss": 2.696, "step": 14070 }, { "epoch": 0.18, "learning_rate": 9.208102623038923e-05, "loss": 2.7251, "step": 14075 }, { "epoch": 0.18, "learning_rate": 9.207551336649549e-05, "loss": 2.6946, "step": 14080 }, { "epoch": 0.18, "learning_rate": 9.20699987495014e-05, "loss": 2.7699, "step": 14085 }, { "epoch": 0.18, "learning_rate": 9.20644823796367e-05, "loss": 2.7484, "step": 14090 }, { "epoch": 0.18, "learning_rate": 9.205896425713127e-05, "loss": 2.7075, "step": 14095 }, { "epoch": 0.18, "learning_rate": 9.205344438221502e-05, "loss": 2.7257, "step": 14100 }, { "epoch": 0.18, "learning_rate": 9.204792275511793e-05, "loss": 2.7234, "step": 14105 }, { "epoch": 0.18, "learning_rate": 9.204239937607007e-05, "loss": 2.6891, "step": 14110 }, { "epoch": 0.18, "learning_rate": 9.203687424530154e-05, "loss": 2.6736, "step": 14115 }, { "epoch": 0.18, "learning_rate": 9.20313473630426e-05, "loss": 2.7957, "step": 14120 }, { "epoch": 0.18, "learning_rate": 9.202581872952348e-05, "loss": 2.6202, "step": 14125 }, { "epoch": 0.18, "learning_rate": 9.202028834497458e-05, "loss": 2.7575, "step": 14130 }, { "epoch": 0.18, "learning_rate": 9.20147562096263e-05, "loss": 2.6876, "step": 14135 }, { "epoch": 0.18, "learning_rate": 9.200922232370914e-05, "loss": 2.5851, "step": 14140 }, { "epoch": 0.18, "learning_rate": 9.200368668745368e-05, "loss": 2.8205, "step": 14145 }, { "epoch": 0.18, "learning_rate": 9.199814930109057e-05, "loss": 2.8148, "step": 14150 }, { "epoch": 0.18, "learning_rate": 9.19926101648505e-05, "loss": 2.7844, "step": 14155 }, { "epoch": 0.18, "learning_rate": 9.19870692789643e-05, "loss": 2.6112, "step": 14160 }, { "epoch": 0.18, "learning_rate": 9.198152664366281e-05, "loss": 2.6561, "step": 14165 }, { "epoch": 0.18, "learning_rate": 9.197598225917699e-05, "loss": 2.8494, "step": 14170 }, { "epoch": 0.18, "learning_rate": 9.197043612573781e-05, "loss": 2.6654, "step": 14175 }, { "epoch": 0.18, "learning_rate": 9.196488824357639e-05, "loss": 2.7202, "step": 14180 }, { "epoch": 0.18, "learning_rate": 9.195933861292388e-05, "loss": 2.6733, "step": 14185 }, { "epoch": 0.18, "learning_rate": 9.195378723401149e-05, "loss": 2.7516, "step": 14190 }, { "epoch": 0.18, "learning_rate": 9.194823410707053e-05, "loss": 2.5864, "step": 14195 }, { "epoch": 0.18, "learning_rate": 9.194267923233237e-05, "loss": 2.7206, "step": 14200 }, { "epoch": 0.18, "learning_rate": 9.193712261002849e-05, "loss": 2.7717, "step": 14205 }, { "epoch": 0.18, "learning_rate": 9.193156424039036e-05, "loss": 2.8368, "step": 14210 }, { "epoch": 0.18, "learning_rate": 9.19260041236496e-05, "loss": 2.7209, "step": 14215 }, { "epoch": 0.18, "learning_rate": 9.192044226003789e-05, "loss": 2.7214, "step": 14220 }, { "epoch": 0.18, "learning_rate": 9.191487864978692e-05, "loss": 2.7852, "step": 14225 }, { "epoch": 0.18, "learning_rate": 9.190931329312854e-05, "loss": 2.68, "step": 14230 }, { "epoch": 0.18, "learning_rate": 9.190374619029464e-05, "loss": 2.6704, "step": 14235 }, { "epoch": 0.18, "learning_rate": 9.189817734151716e-05, "loss": 2.7571, "step": 14240 }, { "epoch": 0.18, "learning_rate": 9.189260674702812e-05, "loss": 2.6768, "step": 14245 }, { "epoch": 0.18, "learning_rate": 9.188703440705964e-05, "loss": 2.7114, "step": 14250 }, { "epoch": 0.18, "learning_rate": 9.188146032184387e-05, "loss": 2.6643, "step": 14255 }, { "epoch": 0.19, "learning_rate": 9.187588449161309e-05, "loss": 2.7429, "step": 14260 }, { "epoch": 0.19, "learning_rate": 9.18703069165996e-05, "loss": 2.8129, "step": 14265 }, { "epoch": 0.19, "learning_rate": 9.186472759703579e-05, "loss": 2.5447, "step": 14270 }, { "epoch": 0.19, "learning_rate": 9.185914653315414e-05, "loss": 2.7068, "step": 14275 }, { "epoch": 0.19, "learning_rate": 9.185356372518718e-05, "loss": 2.6749, "step": 14280 }, { "epoch": 0.19, "learning_rate": 9.184797917336754e-05, "loss": 2.819, "step": 14285 }, { "epoch": 0.19, "learning_rate": 9.184239287792787e-05, "loss": 2.8406, "step": 14290 }, { "epoch": 0.19, "learning_rate": 9.183680483910093e-05, "loss": 2.725, "step": 14295 }, { "epoch": 0.19, "learning_rate": 9.183121505711958e-05, "loss": 2.8123, "step": 14300 }, { "epoch": 0.19, "learning_rate": 9.18256235322167e-05, "loss": 2.6607, "step": 14305 }, { "epoch": 0.19, "learning_rate": 9.182003026462525e-05, "loss": 2.6789, "step": 14310 }, { "epoch": 0.19, "learning_rate": 9.181443525457831e-05, "loss": 2.7576, "step": 14315 }, { "epoch": 0.19, "learning_rate": 9.180883850230898e-05, "loss": 2.5983, "step": 14320 }, { "epoch": 0.19, "learning_rate": 9.180324000805045e-05, "loss": 2.683, "step": 14325 }, { "epoch": 0.19, "learning_rate": 9.1797639772036e-05, "loss": 2.667, "step": 14330 }, { "epoch": 0.19, "learning_rate": 9.179203779449894e-05, "loss": 2.6507, "step": 14335 }, { "epoch": 0.19, "learning_rate": 9.17864340756727e-05, "loss": 2.6833, "step": 14340 }, { "epoch": 0.19, "learning_rate": 9.178082861579076e-05, "loss": 2.7125, "step": 14345 }, { "epoch": 0.19, "learning_rate": 9.177522141508666e-05, "loss": 2.7449, "step": 14350 }, { "epoch": 0.19, "learning_rate": 9.176961247379405e-05, "loss": 2.7703, "step": 14355 }, { "epoch": 0.19, "learning_rate": 9.176400179214663e-05, "loss": 2.7304, "step": 14360 }, { "epoch": 0.19, "learning_rate": 9.175838937037816e-05, "loss": 2.6458, "step": 14365 }, { "epoch": 0.19, "learning_rate": 9.175277520872246e-05, "loss": 2.7482, "step": 14370 }, { "epoch": 0.19, "learning_rate": 9.17471593074135e-05, "loss": 2.6284, "step": 14375 }, { "epoch": 0.19, "learning_rate": 9.174154166668522e-05, "loss": 2.661, "step": 14380 }, { "epoch": 0.19, "learning_rate": 9.173592228677172e-05, "loss": 2.6926, "step": 14385 }, { "epoch": 0.19, "learning_rate": 9.173030116790713e-05, "loss": 2.7472, "step": 14390 }, { "epoch": 0.19, "learning_rate": 9.172467831032562e-05, "loss": 2.6849, "step": 14395 }, { "epoch": 0.19, "learning_rate": 9.171905371426152e-05, "loss": 2.7302, "step": 14400 }, { "epoch": 0.19, "learning_rate": 9.171342737994916e-05, "loss": 2.7141, "step": 14405 }, { "epoch": 0.19, "learning_rate": 9.170779930762295e-05, "loss": 2.6691, "step": 14410 }, { "epoch": 0.19, "learning_rate": 9.17021694975174e-05, "loss": 2.7469, "step": 14415 }, { "epoch": 0.19, "learning_rate": 9.169653794986709e-05, "loss": 2.7723, "step": 14420 }, { "epoch": 0.19, "learning_rate": 9.169090466490664e-05, "loss": 2.658, "step": 14425 }, { "epoch": 0.19, "learning_rate": 9.168526964287079e-05, "loss": 2.8037, "step": 14430 }, { "epoch": 0.19, "learning_rate": 9.16796328839943e-05, "loss": 2.6652, "step": 14435 }, { "epoch": 0.19, "learning_rate": 9.167399438851204e-05, "loss": 2.6566, "step": 14440 }, { "epoch": 0.19, "learning_rate": 9.166835415665896e-05, "loss": 2.5953, "step": 14445 }, { "epoch": 0.19, "learning_rate": 9.166271218867002e-05, "loss": 2.647, "step": 14450 }, { "epoch": 0.19, "learning_rate": 9.165706848478033e-05, "loss": 2.7385, "step": 14455 }, { "epoch": 0.19, "learning_rate": 9.165142304522502e-05, "loss": 2.6625, "step": 14460 }, { "epoch": 0.19, "learning_rate": 9.164577587023932e-05, "loss": 2.5876, "step": 14465 }, { "epoch": 0.19, "learning_rate": 9.164012696005855e-05, "loss": 2.6368, "step": 14470 }, { "epoch": 0.19, "learning_rate": 9.163447631491802e-05, "loss": 2.8695, "step": 14475 }, { "epoch": 0.19, "learning_rate": 9.16288239350532e-05, "loss": 2.6255, "step": 14480 }, { "epoch": 0.19, "learning_rate": 9.162316982069959e-05, "loss": 2.6732, "step": 14485 }, { "epoch": 0.19, "learning_rate": 9.161751397209279e-05, "loss": 2.7345, "step": 14490 }, { "epoch": 0.19, "learning_rate": 9.161185638946843e-05, "loss": 2.6461, "step": 14495 }, { "epoch": 0.19, "learning_rate": 9.160619707306225e-05, "loss": 2.6213, "step": 14500 }, { "epoch": 0.19, "learning_rate": 9.160053602311006e-05, "loss": 2.7629, "step": 14505 }, { "epoch": 0.19, "learning_rate": 9.159487323984769e-05, "loss": 2.894, "step": 14510 }, { "epoch": 0.19, "learning_rate": 9.158920872351112e-05, "loss": 2.759, "step": 14515 }, { "epoch": 0.19, "learning_rate": 9.158354247433636e-05, "loss": 2.6528, "step": 14520 }, { "epoch": 0.19, "learning_rate": 9.157787449255948e-05, "loss": 2.5994, "step": 14525 }, { "epoch": 0.19, "learning_rate": 9.157220477841666e-05, "loss": 2.7392, "step": 14530 }, { "epoch": 0.19, "learning_rate": 9.156653333214412e-05, "loss": 2.7232, "step": 14535 }, { "epoch": 0.19, "learning_rate": 9.156086015397818e-05, "loss": 2.6651, "step": 14540 }, { "epoch": 0.19, "learning_rate": 9.155518524415518e-05, "loss": 2.6292, "step": 14545 }, { "epoch": 0.19, "learning_rate": 9.154950860291162e-05, "loss": 2.6329, "step": 14550 }, { "epoch": 0.19, "learning_rate": 9.154383023048399e-05, "loss": 2.6563, "step": 14555 }, { "epoch": 0.19, "learning_rate": 9.153815012710887e-05, "loss": 2.8005, "step": 14560 }, { "epoch": 0.19, "learning_rate": 9.153246829302295e-05, "loss": 2.7881, "step": 14565 }, { "epoch": 0.19, "learning_rate": 9.152678472846295e-05, "loss": 2.6781, "step": 14570 }, { "epoch": 0.19, "learning_rate": 9.15210994336657e-05, "loss": 2.6897, "step": 14575 }, { "epoch": 0.19, "learning_rate": 9.151541240886804e-05, "loss": 2.637, "step": 14580 }, { "epoch": 0.19, "learning_rate": 9.150972365430696e-05, "loss": 2.8008, "step": 14585 }, { "epoch": 0.19, "learning_rate": 9.15040331702195e-05, "loss": 2.8552, "step": 14590 }, { "epoch": 0.19, "learning_rate": 9.149834095684271e-05, "loss": 2.7339, "step": 14595 }, { "epoch": 0.19, "learning_rate": 9.149264701441379e-05, "loss": 2.7892, "step": 14600 }, { "epoch": 0.19, "learning_rate": 9.148695134316997e-05, "loss": 2.7048, "step": 14605 }, { "epoch": 0.19, "learning_rate": 9.148125394334857e-05, "loss": 2.8013, "step": 14610 }, { "epoch": 0.19, "learning_rate": 9.147555481518697e-05, "loss": 2.6644, "step": 14615 }, { "epoch": 0.19, "learning_rate": 9.146985395892263e-05, "loss": 2.8297, "step": 14620 }, { "epoch": 0.19, "learning_rate": 9.146415137479309e-05, "loss": 2.7052, "step": 14625 }, { "epoch": 0.19, "learning_rate": 9.145844706303593e-05, "loss": 2.6186, "step": 14630 }, { "epoch": 0.19, "learning_rate": 9.145274102388883e-05, "loss": 2.7015, "step": 14635 }, { "epoch": 0.19, "learning_rate": 9.144703325758955e-05, "loss": 2.7411, "step": 14640 }, { "epoch": 0.19, "learning_rate": 9.144132376437589e-05, "loss": 2.727, "step": 14645 }, { "epoch": 0.19, "learning_rate": 9.143561254448575e-05, "loss": 2.7289, "step": 14650 }, { "epoch": 0.19, "learning_rate": 9.142989959815708e-05, "loss": 2.8054, "step": 14655 }, { "epoch": 0.19, "learning_rate": 9.142418492562794e-05, "loss": 2.6339, "step": 14660 }, { "epoch": 0.19, "learning_rate": 9.14184685271364e-05, "loss": 2.7688, "step": 14665 }, { "epoch": 0.19, "learning_rate": 9.141275040292065e-05, "loss": 2.7318, "step": 14670 }, { "epoch": 0.19, "learning_rate": 9.140703055321896e-05, "loss": 2.7344, "step": 14675 }, { "epoch": 0.19, "learning_rate": 9.140130897826959e-05, "loss": 2.8025, "step": 14680 }, { "epoch": 0.19, "learning_rate": 9.139558567831101e-05, "loss": 2.5501, "step": 14685 }, { "epoch": 0.19, "learning_rate": 9.138986065358166e-05, "loss": 2.8048, "step": 14690 }, { "epoch": 0.19, "learning_rate": 9.138413390432004e-05, "loss": 2.7159, "step": 14695 }, { "epoch": 0.19, "learning_rate": 9.13784054307648e-05, "loss": 2.6443, "step": 14700 }, { "epoch": 0.19, "learning_rate": 9.13726752331546e-05, "loss": 2.719, "step": 14705 }, { "epoch": 0.19, "learning_rate": 9.136694331172819e-05, "loss": 2.6468, "step": 14710 }, { "epoch": 0.19, "learning_rate": 9.136120966672441e-05, "loss": 2.6588, "step": 14715 }, { "epoch": 0.19, "learning_rate": 9.135547429838214e-05, "loss": 2.8156, "step": 14720 }, { "epoch": 0.19, "learning_rate": 9.134973720694036e-05, "loss": 2.7455, "step": 14725 }, { "epoch": 0.19, "learning_rate": 9.13439983926381e-05, "loss": 2.5919, "step": 14730 }, { "epoch": 0.19, "learning_rate": 9.133825785571447e-05, "loss": 2.6127, "step": 14735 }, { "epoch": 0.19, "learning_rate": 9.133251559640865e-05, "loss": 2.7159, "step": 14740 }, { "epoch": 0.19, "learning_rate": 9.132677161495991e-05, "loss": 2.7692, "step": 14745 }, { "epoch": 0.19, "learning_rate": 9.132102591160758e-05, "loss": 2.7894, "step": 14750 }, { "epoch": 0.19, "learning_rate": 9.131527848659102e-05, "loss": 2.6371, "step": 14755 }, { "epoch": 0.19, "learning_rate": 9.130952934014973e-05, "loss": 2.7713, "step": 14760 }, { "epoch": 0.19, "learning_rate": 9.130377847252328e-05, "loss": 2.6981, "step": 14765 }, { "epoch": 0.19, "learning_rate": 9.12980258839512e-05, "loss": 2.7661, "step": 14770 }, { "epoch": 0.19, "learning_rate": 9.129227157467325e-05, "loss": 2.5705, "step": 14775 }, { "epoch": 0.19, "learning_rate": 9.128651554492917e-05, "loss": 2.6754, "step": 14780 }, { "epoch": 0.19, "learning_rate": 9.128075779495875e-05, "loss": 2.6586, "step": 14785 }, { "epoch": 0.19, "learning_rate": 9.127499832500195e-05, "loss": 2.7182, "step": 14790 }, { "epoch": 0.19, "learning_rate": 9.126923713529868e-05, "loss": 2.8167, "step": 14795 }, { "epoch": 0.19, "learning_rate": 9.126347422608905e-05, "loss": 2.7133, "step": 14800 }, { "epoch": 0.19, "learning_rate": 9.12577095976131e-05, "loss": 2.6883, "step": 14805 }, { "epoch": 0.19, "learning_rate": 9.125194325011109e-05, "loss": 2.5478, "step": 14810 }, { "epoch": 0.19, "learning_rate": 9.124617518382323e-05, "loss": 2.8026, "step": 14815 }, { "epoch": 0.19, "learning_rate": 9.124040539898986e-05, "loss": 2.7232, "step": 14820 }, { "epoch": 0.19, "learning_rate": 9.123463389585138e-05, "loss": 2.5695, "step": 14825 }, { "epoch": 0.19, "learning_rate": 9.122886067464829e-05, "loss": 2.7285, "step": 14830 }, { "epoch": 0.19, "learning_rate": 9.12230857356211e-05, "loss": 2.6553, "step": 14835 }, { "epoch": 0.19, "learning_rate": 9.121730907901042e-05, "loss": 2.6718, "step": 14840 }, { "epoch": 0.19, "learning_rate": 9.121153070505699e-05, "loss": 2.4145, "step": 14845 }, { "epoch": 0.19, "learning_rate": 9.120575061400152e-05, "loss": 2.7357, "step": 14850 }, { "epoch": 0.19, "learning_rate": 9.119996880608485e-05, "loss": 2.7168, "step": 14855 }, { "epoch": 0.19, "learning_rate": 9.11941852815479e-05, "loss": 2.7543, "step": 14860 }, { "epoch": 0.19, "learning_rate": 9.118840004063162e-05, "loss": 2.8285, "step": 14865 }, { "epoch": 0.19, "learning_rate": 9.118261308357708e-05, "loss": 2.5401, "step": 14870 }, { "epoch": 0.19, "learning_rate": 9.117682441062539e-05, "loss": 2.6965, "step": 14875 }, { "epoch": 0.19, "learning_rate": 9.11710340220177e-05, "loss": 2.7817, "step": 14880 }, { "epoch": 0.19, "learning_rate": 9.116524191799533e-05, "loss": 2.7872, "step": 14885 }, { "epoch": 0.19, "learning_rate": 9.115944809879959e-05, "loss": 2.6949, "step": 14890 }, { "epoch": 0.19, "learning_rate": 9.115365256467187e-05, "loss": 2.7702, "step": 14895 }, { "epoch": 0.19, "learning_rate": 9.114785531585364e-05, "loss": 2.7615, "step": 14900 }, { "epoch": 0.19, "learning_rate": 9.114205635258647e-05, "loss": 2.7894, "step": 14905 }, { "epoch": 0.19, "learning_rate": 9.113625567511196e-05, "loss": 2.7066, "step": 14910 }, { "epoch": 0.19, "learning_rate": 9.11304532836718e-05, "loss": 2.7734, "step": 14915 }, { "epoch": 0.19, "learning_rate": 9.112464917850776e-05, "loss": 2.7469, "step": 14920 }, { "epoch": 0.19, "learning_rate": 9.111884335986166e-05, "loss": 2.6947, "step": 14925 }, { "epoch": 0.19, "learning_rate": 9.111303582797541e-05, "loss": 2.7416, "step": 14930 }, { "epoch": 0.19, "learning_rate": 9.110722658309097e-05, "loss": 2.721, "step": 14935 }, { "epoch": 0.19, "learning_rate": 9.110141562545042e-05, "loss": 2.6809, "step": 14940 }, { "epoch": 0.19, "learning_rate": 9.109560295529583e-05, "loss": 2.694, "step": 14945 }, { "epoch": 0.19, "learning_rate": 9.108978857286943e-05, "loss": 2.7004, "step": 14950 }, { "epoch": 0.19, "learning_rate": 9.108397247841345e-05, "loss": 2.6248, "step": 14955 }, { "epoch": 0.19, "learning_rate": 9.107815467217022e-05, "loss": 2.7154, "step": 14960 }, { "epoch": 0.19, "learning_rate": 9.107233515438218e-05, "loss": 2.6448, "step": 14965 }, { "epoch": 0.19, "learning_rate": 9.106651392529177e-05, "loss": 2.8292, "step": 14970 }, { "epoch": 0.19, "learning_rate": 9.106069098514154e-05, "loss": 2.7175, "step": 14975 }, { "epoch": 0.19, "learning_rate": 9.10548663341741e-05, "loss": 2.5652, "step": 14980 }, { "epoch": 0.19, "learning_rate": 9.104903997263215e-05, "loss": 2.7745, "step": 14985 }, { "epoch": 0.19, "learning_rate": 9.104321190075846e-05, "loss": 2.7075, "step": 14990 }, { "epoch": 0.19, "learning_rate": 9.103738211879582e-05, "loss": 2.8122, "step": 14995 }, { "epoch": 0.19, "learning_rate": 9.103155062698718e-05, "loss": 2.6654, "step": 15000 }, { "epoch": 0.19, "learning_rate": 9.102571742557548e-05, "loss": 2.7972, "step": 15005 }, { "epoch": 0.19, "learning_rate": 9.101988251480377e-05, "loss": 2.5581, "step": 15010 }, { "epoch": 0.19, "learning_rate": 9.101404589491517e-05, "loss": 2.6968, "step": 15015 }, { "epoch": 0.19, "learning_rate": 9.100820756615286e-05, "loss": 2.7335, "step": 15020 }, { "epoch": 0.19, "learning_rate": 9.10023675287601e-05, "loss": 2.6933, "step": 15025 }, { "epoch": 0.2, "learning_rate": 9.099652578298022e-05, "loss": 2.8033, "step": 15030 }, { "epoch": 0.2, "learning_rate": 9.099068232905663e-05, "loss": 2.5468, "step": 15035 }, { "epoch": 0.2, "learning_rate": 9.098483716723276e-05, "loss": 2.7578, "step": 15040 }, { "epoch": 0.2, "learning_rate": 9.09789902977522e-05, "loss": 2.7529, "step": 15045 }, { "epoch": 0.2, "learning_rate": 9.097314172085856e-05, "loss": 2.5979, "step": 15050 }, { "epoch": 0.2, "learning_rate": 9.09672914367955e-05, "loss": 2.7177, "step": 15055 }, { "epoch": 0.2, "learning_rate": 9.096143944580677e-05, "loss": 2.7758, "step": 15060 }, { "epoch": 0.2, "learning_rate": 9.095558574813623e-05, "loss": 2.8426, "step": 15065 }, { "epoch": 0.2, "learning_rate": 9.094973034402774e-05, "loss": 2.7649, "step": 15070 }, { "epoch": 0.2, "learning_rate": 9.09438732337253e-05, "loss": 2.6961, "step": 15075 }, { "epoch": 0.2, "learning_rate": 9.093801441747294e-05, "loss": 2.705, "step": 15080 }, { "epoch": 0.2, "learning_rate": 9.093215389551477e-05, "loss": 2.799, "step": 15085 }, { "epoch": 0.2, "learning_rate": 9.092629166809495e-05, "loss": 2.701, "step": 15090 }, { "epoch": 0.2, "learning_rate": 9.092042773545777e-05, "loss": 2.7773, "step": 15095 }, { "epoch": 0.2, "learning_rate": 9.091456209784755e-05, "loss": 2.5971, "step": 15100 }, { "epoch": 0.2, "learning_rate": 9.090869475550865e-05, "loss": 2.7955, "step": 15105 }, { "epoch": 0.2, "learning_rate": 9.090282570868555e-05, "loss": 2.81, "step": 15110 }, { "epoch": 0.2, "learning_rate": 9.089695495762283e-05, "loss": 2.6744, "step": 15115 }, { "epoch": 0.2, "learning_rate": 9.089108250256504e-05, "loss": 2.5966, "step": 15120 }, { "epoch": 0.2, "learning_rate": 9.088520834375689e-05, "loss": 2.8334, "step": 15125 }, { "epoch": 0.2, "learning_rate": 9.087933248144313e-05, "loss": 2.7791, "step": 15130 }, { "epoch": 0.2, "learning_rate": 9.087345491586856e-05, "loss": 2.6382, "step": 15135 }, { "epoch": 0.2, "learning_rate": 9.08675756472781e-05, "loss": 2.6868, "step": 15140 }, { "epoch": 0.2, "learning_rate": 9.08616946759167e-05, "loss": 2.7705, "step": 15145 }, { "epoch": 0.2, "learning_rate": 9.085581200202937e-05, "loss": 2.6749, "step": 15150 }, { "epoch": 0.2, "learning_rate": 9.084992762586127e-05, "loss": 2.7044, "step": 15155 }, { "epoch": 0.2, "learning_rate": 9.084404154765753e-05, "loss": 2.6519, "step": 15160 }, { "epoch": 0.2, "learning_rate": 9.083815376766342e-05, "loss": 2.7833, "step": 15165 }, { "epoch": 0.2, "learning_rate": 9.083226428612424e-05, "loss": 2.7335, "step": 15170 }, { "epoch": 0.2, "learning_rate": 9.082637310328538e-05, "loss": 2.7817, "step": 15175 }, { "epoch": 0.2, "learning_rate": 9.082048021939233e-05, "loss": 2.7475, "step": 15180 }, { "epoch": 0.2, "learning_rate": 9.081458563469059e-05, "loss": 2.6222, "step": 15185 }, { "epoch": 0.2, "learning_rate": 9.080868934942577e-05, "loss": 2.7218, "step": 15190 }, { "epoch": 0.2, "learning_rate": 9.080279136384354e-05, "loss": 2.7263, "step": 15195 }, { "epoch": 0.2, "learning_rate": 9.079689167818965e-05, "loss": 2.7576, "step": 15200 }, { "epoch": 0.2, "learning_rate": 9.07909902927099e-05, "loss": 2.7598, "step": 15205 }, { "epoch": 0.2, "learning_rate": 9.078508720765018e-05, "loss": 2.6852, "step": 15210 }, { "epoch": 0.2, "learning_rate": 9.077918242325645e-05, "loss": 2.7263, "step": 15215 }, { "epoch": 0.2, "learning_rate": 9.077327593977474e-05, "loss": 2.7834, "step": 15220 }, { "epoch": 0.2, "learning_rate": 9.076736775745114e-05, "loss": 2.5963, "step": 15225 }, { "epoch": 0.2, "learning_rate": 9.076145787653181e-05, "loss": 2.7644, "step": 15230 }, { "epoch": 0.2, "learning_rate": 9.075554629726302e-05, "loss": 2.6077, "step": 15235 }, { "epoch": 0.2, "learning_rate": 9.074963301989103e-05, "loss": 2.8244, "step": 15240 }, { "epoch": 0.2, "learning_rate": 9.074371804466226e-05, "loss": 2.6752, "step": 15245 }, { "epoch": 0.2, "learning_rate": 9.073780137182314e-05, "loss": 2.697, "step": 15250 }, { "epoch": 0.2, "learning_rate": 9.073188300162021e-05, "loss": 2.732, "step": 15255 }, { "epoch": 0.2, "learning_rate": 9.072596293430004e-05, "loss": 2.668, "step": 15260 }, { "epoch": 0.2, "learning_rate": 9.072004117010933e-05, "loss": 2.6491, "step": 15265 }, { "epoch": 0.2, "learning_rate": 9.071411770929477e-05, "loss": 2.7915, "step": 15270 }, { "epoch": 0.2, "learning_rate": 9.07081925521032e-05, "loss": 2.7229, "step": 15275 }, { "epoch": 0.2, "learning_rate": 9.070226569878144e-05, "loss": 2.6798, "step": 15280 }, { "epoch": 0.2, "learning_rate": 9.06963371495765e-05, "loss": 2.7638, "step": 15285 }, { "epoch": 0.2, "learning_rate": 9.069040690473537e-05, "loss": 2.755, "step": 15290 }, { "epoch": 0.2, "learning_rate": 9.068447496450513e-05, "loss": 2.6094, "step": 15295 }, { "epoch": 0.2, "learning_rate": 9.067854132913294e-05, "loss": 2.7231, "step": 15300 }, { "epoch": 0.2, "learning_rate": 9.067260599886604e-05, "loss": 2.7025, "step": 15305 }, { "epoch": 0.2, "learning_rate": 9.066666897395173e-05, "loss": 2.6306, "step": 15310 }, { "epoch": 0.2, "learning_rate": 9.066073025463738e-05, "loss": 2.7106, "step": 15315 }, { "epoch": 0.2, "learning_rate": 9.065478984117039e-05, "loss": 2.711, "step": 15320 }, { "epoch": 0.2, "learning_rate": 9.064884773379832e-05, "loss": 2.7721, "step": 15325 }, { "epoch": 0.2, "learning_rate": 9.064290393276873e-05, "loss": 2.797, "step": 15330 }, { "epoch": 0.2, "learning_rate": 9.063695843832929e-05, "loss": 2.8293, "step": 15335 }, { "epoch": 0.2, "learning_rate": 9.063101125072769e-05, "loss": 2.6718, "step": 15340 }, { "epoch": 0.2, "learning_rate": 9.062506237021176e-05, "loss": 2.6749, "step": 15345 }, { "epoch": 0.2, "learning_rate": 9.061911179702934e-05, "loss": 2.7275, "step": 15350 }, { "epoch": 0.2, "learning_rate": 9.061315953142835e-05, "loss": 2.6575, "step": 15355 }, { "epoch": 0.2, "learning_rate": 9.060720557365683e-05, "loss": 2.8516, "step": 15360 }, { "epoch": 0.2, "learning_rate": 9.060124992396283e-05, "loss": 2.5894, "step": 15365 }, { "epoch": 0.2, "learning_rate": 9.059529258259449e-05, "loss": 2.7666, "step": 15370 }, { "epoch": 0.2, "learning_rate": 9.058933354980005e-05, "loss": 2.6972, "step": 15375 }, { "epoch": 0.2, "learning_rate": 9.058337282582781e-05, "loss": 2.6999, "step": 15380 }, { "epoch": 0.2, "learning_rate": 9.057741041092609e-05, "loss": 2.5961, "step": 15385 }, { "epoch": 0.2, "learning_rate": 9.057144630534332e-05, "loss": 2.7469, "step": 15390 }, { "epoch": 0.2, "learning_rate": 9.056548050932803e-05, "loss": 2.6098, "step": 15395 }, { "epoch": 0.2, "learning_rate": 9.055951302312875e-05, "loss": 2.6222, "step": 15400 }, { "epoch": 0.2, "learning_rate": 9.055354384699413e-05, "loss": 2.6963, "step": 15405 }, { "epoch": 0.2, "learning_rate": 9.05475729811729e-05, "loss": 2.6147, "step": 15410 }, { "epoch": 0.2, "learning_rate": 9.054160042591381e-05, "loss": 2.7663, "step": 15415 }, { "epoch": 0.2, "learning_rate": 9.053562618146573e-05, "loss": 2.8319, "step": 15420 }, { "epoch": 0.2, "learning_rate": 9.052965024807758e-05, "loss": 2.6805, "step": 15425 }, { "epoch": 0.2, "learning_rate": 9.052367262599834e-05, "loss": 2.7109, "step": 15430 }, { "epoch": 0.2, "learning_rate": 9.051769331547708e-05, "loss": 2.7426, "step": 15435 }, { "epoch": 0.2, "learning_rate": 9.051171231676292e-05, "loss": 2.7934, "step": 15440 }, { "epoch": 0.2, "learning_rate": 9.050572963010509e-05, "loss": 2.5353, "step": 15445 }, { "epoch": 0.2, "learning_rate": 9.049974525575282e-05, "loss": 2.635, "step": 15450 }, { "epoch": 0.2, "learning_rate": 9.049375919395548e-05, "loss": 2.7051, "step": 15455 }, { "epoch": 0.2, "learning_rate": 9.048777144496248e-05, "loss": 2.7661, "step": 15460 }, { "epoch": 0.2, "learning_rate": 9.048178200902328e-05, "loss": 2.8346, "step": 15465 }, { "epoch": 0.2, "learning_rate": 9.047579088638747e-05, "loss": 2.7837, "step": 15470 }, { "epoch": 0.2, "learning_rate": 9.046979807730467e-05, "loss": 2.775, "step": 15475 }, { "epoch": 0.2, "learning_rate": 9.046380358202454e-05, "loss": 2.6459, "step": 15480 }, { "epoch": 0.2, "learning_rate": 9.045780740079687e-05, "loss": 2.7765, "step": 15485 }, { "epoch": 0.2, "learning_rate": 9.045180953387149e-05, "loss": 2.635, "step": 15490 }, { "epoch": 0.2, "learning_rate": 9.04458099814983e-05, "loss": 2.8516, "step": 15495 }, { "epoch": 0.2, "learning_rate": 9.043980874392728e-05, "loss": 2.6861, "step": 15500 }, { "epoch": 0.2, "learning_rate": 9.043380582140848e-05, "loss": 2.6964, "step": 15505 }, { "epoch": 0.2, "learning_rate": 9.0427801214192e-05, "loss": 2.6658, "step": 15510 }, { "epoch": 0.2, "learning_rate": 9.042179492252802e-05, "loss": 2.8989, "step": 15515 }, { "epoch": 0.2, "learning_rate": 9.041578694666684e-05, "loss": 2.7853, "step": 15520 }, { "epoch": 0.2, "learning_rate": 9.040977728685873e-05, "loss": 2.7314, "step": 15525 }, { "epoch": 0.2, "learning_rate": 9.040376594335412e-05, "loss": 2.7376, "step": 15530 }, { "epoch": 0.2, "learning_rate": 9.039775291640347e-05, "loss": 2.7795, "step": 15535 }, { "epoch": 0.2, "learning_rate": 9.039173820625732e-05, "loss": 2.7555, "step": 15540 }, { "epoch": 0.2, "learning_rate": 9.038572181316624e-05, "loss": 2.5556, "step": 15545 }, { "epoch": 0.2, "learning_rate": 9.037970373738096e-05, "loss": 2.691, "step": 15550 }, { "epoch": 0.2, "learning_rate": 9.03736839791522e-05, "loss": 2.8144, "step": 15555 }, { "epoch": 0.2, "learning_rate": 9.036766253873078e-05, "loss": 2.7474, "step": 15560 }, { "epoch": 0.2, "learning_rate": 9.036163941636759e-05, "loss": 2.7957, "step": 15565 }, { "epoch": 0.2, "learning_rate": 9.035561461231357e-05, "loss": 2.6339, "step": 15570 }, { "epoch": 0.2, "learning_rate": 9.034958812681977e-05, "loss": 2.7337, "step": 15575 }, { "epoch": 0.2, "learning_rate": 9.034355996013729e-05, "loss": 2.7107, "step": 15580 }, { "epoch": 0.2, "learning_rate": 9.033753011251725e-05, "loss": 2.7441, "step": 15585 }, { "epoch": 0.2, "learning_rate": 9.033149858421094e-05, "loss": 2.6099, "step": 15590 }, { "epoch": 0.2, "learning_rate": 9.032546537546965e-05, "loss": 2.7583, "step": 15595 }, { "epoch": 0.2, "learning_rate": 9.031943048654474e-05, "loss": 2.6908, "step": 15600 }, { "epoch": 0.2, "learning_rate": 9.031339391768768e-05, "loss": 2.5959, "step": 15605 }, { "epoch": 0.2, "learning_rate": 9.030735566914999e-05, "loss": 2.6459, "step": 15610 }, { "epoch": 0.2, "learning_rate": 9.030131574118324e-05, "loss": 2.7019, "step": 15615 }, { "epoch": 0.2, "learning_rate": 9.029527413403909e-05, "loss": 2.7621, "step": 15620 }, { "epoch": 0.2, "learning_rate": 9.028923084796927e-05, "loss": 2.5412, "step": 15625 }, { "epoch": 0.2, "learning_rate": 9.028318588322558e-05, "loss": 2.75, "step": 15630 }, { "epoch": 0.2, "learning_rate": 9.027713924005987e-05, "loss": 2.7757, "step": 15635 }, { "epoch": 0.2, "learning_rate": 9.02710909187241e-05, "loss": 2.7317, "step": 15640 }, { "epoch": 0.2, "learning_rate": 9.026504091947028e-05, "loss": 2.6534, "step": 15645 }, { "epoch": 0.2, "learning_rate": 9.025898924255047e-05, "loss": 2.6378, "step": 15650 }, { "epoch": 0.2, "learning_rate": 9.025293588821682e-05, "loss": 2.7057, "step": 15655 }, { "epoch": 0.2, "learning_rate": 9.024688085672152e-05, "loss": 2.7836, "step": 15660 }, { "epoch": 0.2, "learning_rate": 9.024082414831691e-05, "loss": 2.6472, "step": 15665 }, { "epoch": 0.2, "learning_rate": 9.023476576325534e-05, "loss": 2.9166, "step": 15670 }, { "epoch": 0.2, "learning_rate": 9.022870570178918e-05, "loss": 2.7737, "step": 15675 }, { "epoch": 0.2, "learning_rate": 9.022264396417097e-05, "loss": 2.8888, "step": 15680 }, { "epoch": 0.2, "learning_rate": 9.021658055065328e-05, "loss": 2.7667, "step": 15685 }, { "epoch": 0.2, "learning_rate": 9.021051546148874e-05, "loss": 2.7399, "step": 15690 }, { "epoch": 0.2, "learning_rate": 9.020444869693003e-05, "loss": 2.8913, "step": 15695 }, { "epoch": 0.2, "learning_rate": 9.019838025722995e-05, "loss": 2.7181, "step": 15700 }, { "epoch": 0.2, "learning_rate": 9.019231014264134e-05, "loss": 2.7597, "step": 15705 }, { "epoch": 0.2, "learning_rate": 9.01862383534171e-05, "loss": 2.5929, "step": 15710 }, { "epoch": 0.2, "learning_rate": 9.018016488981025e-05, "loss": 2.6105, "step": 15715 }, { "epoch": 0.2, "learning_rate": 9.017408975207382e-05, "loss": 2.8217, "step": 15720 }, { "epoch": 0.2, "learning_rate": 9.016801294046094e-05, "loss": 2.7002, "step": 15725 }, { "epoch": 0.2, "learning_rate": 9.016193445522478e-05, "loss": 2.7354, "step": 15730 }, { "epoch": 0.2, "learning_rate": 9.015585429661864e-05, "loss": 2.7956, "step": 15735 }, { "epoch": 0.2, "learning_rate": 9.014977246489585e-05, "loss": 2.7627, "step": 15740 }, { "epoch": 0.2, "learning_rate": 9.014368896030978e-05, "loss": 2.7016, "step": 15745 }, { "epoch": 0.2, "learning_rate": 9.013760378311393e-05, "loss": 2.8588, "step": 15750 }, { "epoch": 0.2, "learning_rate": 9.013151693356183e-05, "loss": 2.6392, "step": 15755 }, { "epoch": 0.2, "learning_rate": 9.01254284119071e-05, "loss": 2.7186, "step": 15760 }, { "epoch": 0.2, "learning_rate": 9.011933821840342e-05, "loss": 2.622, "step": 15765 }, { "epoch": 0.2, "learning_rate": 9.011324635330455e-05, "loss": 2.7297, "step": 15770 }, { "epoch": 0.2, "learning_rate": 9.010715281686429e-05, "loss": 2.7386, "step": 15775 }, { "epoch": 0.2, "learning_rate": 9.010105760933656e-05, "loss": 2.8366, "step": 15780 }, { "epoch": 0.2, "learning_rate": 9.009496073097528e-05, "loss": 2.7695, "step": 15785 }, { "epoch": 0.2, "learning_rate": 9.008886218203452e-05, "loss": 2.5633, "step": 15790 }, { "epoch": 0.2, "learning_rate": 9.008276196276835e-05, "loss": 2.8323, "step": 15795 }, { "epoch": 0.21, "learning_rate": 9.007666007343097e-05, "loss": 2.83, "step": 15800 }, { "epoch": 0.21, "learning_rate": 9.007055651427658e-05, "loss": 2.7816, "step": 15805 }, { "epoch": 0.21, "learning_rate": 9.006445128555951e-05, "loss": 2.6746, "step": 15810 }, { "epoch": 0.21, "learning_rate": 9.005834438753415e-05, "loss": 2.6036, "step": 15815 }, { "epoch": 0.21, "learning_rate": 9.005223582045492e-05, "loss": 2.6132, "step": 15820 }, { "epoch": 0.21, "learning_rate": 9.004612558457637e-05, "loss": 2.5009, "step": 15825 }, { "epoch": 0.21, "learning_rate": 9.004001368015305e-05, "loss": 2.7372, "step": 15830 }, { "epoch": 0.21, "learning_rate": 9.003390010743964e-05, "loss": 2.715, "step": 15835 }, { "epoch": 0.21, "learning_rate": 9.002778486669086e-05, "loss": 2.7333, "step": 15840 }, { "epoch": 0.21, "learning_rate": 9.002166795816149e-05, "loss": 2.677, "step": 15845 }, { "epoch": 0.21, "learning_rate": 9.001554938210643e-05, "loss": 2.7003, "step": 15850 }, { "epoch": 0.21, "learning_rate": 9.000942913878058e-05, "loss": 2.7394, "step": 15855 }, { "epoch": 0.21, "learning_rate": 9.000330722843895e-05, "loss": 2.6575, "step": 15860 }, { "epoch": 0.21, "learning_rate": 8.999718365133662e-05, "loss": 2.6318, "step": 15865 }, { "epoch": 0.21, "learning_rate": 8.999105840772874e-05, "loss": 2.8191, "step": 15870 }, { "epoch": 0.21, "learning_rate": 8.998493149787052e-05, "loss": 2.7496, "step": 15875 }, { "epoch": 0.21, "learning_rate": 8.997880292201722e-05, "loss": 2.6236, "step": 15880 }, { "epoch": 0.21, "learning_rate": 8.997267268042419e-05, "loss": 2.7135, "step": 15885 }, { "epoch": 0.21, "learning_rate": 8.996654077334689e-05, "loss": 2.7174, "step": 15890 }, { "epoch": 0.21, "learning_rate": 8.996040720104079e-05, "loss": 2.7394, "step": 15895 }, { "epoch": 0.21, "learning_rate": 8.995427196376143e-05, "loss": 2.719, "step": 15900 }, { "epoch": 0.21, "learning_rate": 8.994813506176445e-05, "loss": 2.6558, "step": 15905 }, { "epoch": 0.21, "learning_rate": 8.994199649530554e-05, "loss": 2.6365, "step": 15910 }, { "epoch": 0.21, "learning_rate": 8.993585626464049e-05, "loss": 2.7206, "step": 15915 }, { "epoch": 0.21, "learning_rate": 8.992971437002512e-05, "loss": 2.7204, "step": 15920 }, { "epoch": 0.21, "learning_rate": 8.992357081171532e-05, "loss": 2.6112, "step": 15925 }, { "epoch": 0.21, "learning_rate": 8.99174255899671e-05, "loss": 2.6305, "step": 15930 }, { "epoch": 0.21, "learning_rate": 8.991127870503648e-05, "loss": 2.6432, "step": 15935 }, { "epoch": 0.21, "learning_rate": 8.990513015717959e-05, "loss": 2.6734, "step": 15940 }, { "epoch": 0.21, "learning_rate": 8.989897994665259e-05, "loss": 2.7464, "step": 15945 }, { "epoch": 0.21, "learning_rate": 8.989282807371175e-05, "loss": 2.7582, "step": 15950 }, { "epoch": 0.21, "learning_rate": 8.988667453861337e-05, "loss": 2.7579, "step": 15955 }, { "epoch": 0.21, "learning_rate": 8.988051934161388e-05, "loss": 2.6265, "step": 15960 }, { "epoch": 0.21, "learning_rate": 8.987436248296969e-05, "loss": 2.6553, "step": 15965 }, { "epoch": 0.21, "learning_rate": 8.986820396293737e-05, "loss": 2.7039, "step": 15970 }, { "epoch": 0.21, "learning_rate": 8.986204378177352e-05, "loss": 2.6802, "step": 15975 }, { "epoch": 0.21, "learning_rate": 8.985588193973477e-05, "loss": 2.6283, "step": 15980 }, { "epoch": 0.21, "learning_rate": 8.984971843707788e-05, "loss": 2.7731, "step": 15985 }, { "epoch": 0.21, "learning_rate": 8.984355327405966e-05, "loss": 2.5819, "step": 15990 }, { "epoch": 0.21, "learning_rate": 8.983738645093698e-05, "loss": 2.7357, "step": 15995 }, { "epoch": 0.21, "learning_rate": 8.983121796796677e-05, "loss": 2.6734, "step": 16000 }, { "epoch": 0.21, "learning_rate": 8.982504782540607e-05, "loss": 2.6908, "step": 16005 }, { "epoch": 0.21, "learning_rate": 8.981887602351195e-05, "loss": 2.7079, "step": 16010 }, { "epoch": 0.21, "learning_rate": 8.981270256254155e-05, "loss": 2.727, "step": 16015 }, { "epoch": 0.21, "learning_rate": 8.980652744275211e-05, "loss": 2.7565, "step": 16020 }, { "epoch": 0.21, "learning_rate": 8.98003506644009e-05, "loss": 2.7844, "step": 16025 }, { "epoch": 0.21, "learning_rate": 8.979417222774529e-05, "loss": 2.7124, "step": 16030 }, { "epoch": 0.21, "learning_rate": 8.978799213304273e-05, "loss": 2.7964, "step": 16035 }, { "epoch": 0.21, "learning_rate": 8.978181038055067e-05, "loss": 2.6776, "step": 16040 }, { "epoch": 0.21, "learning_rate": 8.977562697052671e-05, "loss": 2.624, "step": 16045 }, { "epoch": 0.21, "learning_rate": 8.976944190322847e-05, "loss": 2.5765, "step": 16050 }, { "epoch": 0.21, "learning_rate": 8.976325517891367e-05, "loss": 2.7353, "step": 16055 }, { "epoch": 0.21, "learning_rate": 8.975706679784009e-05, "loss": 2.6354, "step": 16060 }, { "epoch": 0.21, "learning_rate": 8.975087676026552e-05, "loss": 2.7842, "step": 16065 }, { "epoch": 0.21, "learning_rate": 8.974468506644795e-05, "loss": 2.5294, "step": 16070 }, { "epoch": 0.21, "learning_rate": 8.973849171664529e-05, "loss": 2.6326, "step": 16075 }, { "epoch": 0.21, "learning_rate": 8.973229671111563e-05, "loss": 2.7602, "step": 16080 }, { "epoch": 0.21, "learning_rate": 8.972610005011706e-05, "loss": 2.6665, "step": 16085 }, { "epoch": 0.21, "learning_rate": 8.971990173390781e-05, "loss": 2.7528, "step": 16090 }, { "epoch": 0.21, "learning_rate": 8.97137017627461e-05, "loss": 2.8217, "step": 16095 }, { "epoch": 0.21, "learning_rate": 8.970750013689026e-05, "loss": 2.5647, "step": 16100 }, { "epoch": 0.21, "learning_rate": 8.97012968565987e-05, "loss": 2.6705, "step": 16105 }, { "epoch": 0.21, "learning_rate": 8.969509192212988e-05, "loss": 2.75, "step": 16110 }, { "epoch": 0.21, "learning_rate": 8.968888533374231e-05, "loss": 2.8303, "step": 16115 }, { "epoch": 0.21, "learning_rate": 8.96826770916946e-05, "loss": 2.7529, "step": 16120 }, { "epoch": 0.21, "learning_rate": 8.967646719624545e-05, "loss": 2.8506, "step": 16125 }, { "epoch": 0.21, "learning_rate": 8.967025564765357e-05, "loss": 2.6613, "step": 16130 }, { "epoch": 0.21, "learning_rate": 8.966404244617777e-05, "loss": 2.8327, "step": 16135 }, { "epoch": 0.21, "learning_rate": 8.965782759207691e-05, "loss": 2.7271, "step": 16140 }, { "epoch": 0.21, "learning_rate": 8.965161108560998e-05, "loss": 2.7408, "step": 16145 }, { "epoch": 0.21, "learning_rate": 8.964539292703596e-05, "loss": 2.6947, "step": 16150 }, { "epoch": 0.21, "learning_rate": 8.963917311661394e-05, "loss": 2.7608, "step": 16155 }, { "epoch": 0.21, "learning_rate": 8.963295165460309e-05, "loss": 2.4975, "step": 16160 }, { "epoch": 0.21, "learning_rate": 8.962672854126261e-05, "loss": 2.7192, "step": 16165 }, { "epoch": 0.21, "learning_rate": 8.962050377685178e-05, "loss": 2.7, "step": 16170 }, { "epoch": 0.21, "learning_rate": 8.961427736163e-05, "loss": 2.6646, "step": 16175 }, { "epoch": 0.21, "learning_rate": 8.960804929585665e-05, "loss": 2.6285, "step": 16180 }, { "epoch": 0.21, "learning_rate": 8.960181957979125e-05, "loss": 2.7751, "step": 16185 }, { "epoch": 0.21, "learning_rate": 8.959558821369336e-05, "loss": 2.6146, "step": 16190 }, { "epoch": 0.21, "learning_rate": 8.958935519782264e-05, "loss": 2.6145, "step": 16195 }, { "epoch": 0.21, "learning_rate": 8.958312053243874e-05, "loss": 2.629, "step": 16200 }, { "epoch": 0.21, "learning_rate": 8.957688421780146e-05, "loss": 2.7806, "step": 16205 }, { "epoch": 0.21, "learning_rate": 8.957064625417065e-05, "loss": 2.7335, "step": 16210 }, { "epoch": 0.21, "learning_rate": 8.956440664180619e-05, "loss": 2.794, "step": 16215 }, { "epoch": 0.21, "learning_rate": 8.955816538096807e-05, "loss": 2.8051, "step": 16220 }, { "epoch": 0.21, "learning_rate": 8.955192247191636e-05, "loss": 2.7554, "step": 16225 }, { "epoch": 0.21, "learning_rate": 8.954567791491113e-05, "loss": 2.6539, "step": 16230 }, { "epoch": 0.21, "learning_rate": 8.953943171021259e-05, "loss": 2.7146, "step": 16235 }, { "epoch": 0.21, "learning_rate": 8.9533183858081e-05, "loss": 2.5877, "step": 16240 }, { "epoch": 0.21, "learning_rate": 8.952693435877667e-05, "loss": 2.7014, "step": 16245 }, { "epoch": 0.21, "learning_rate": 8.952068321255997e-05, "loss": 2.7453, "step": 16250 }, { "epoch": 0.21, "learning_rate": 8.95144304196914e-05, "loss": 2.7299, "step": 16255 }, { "epoch": 0.21, "learning_rate": 8.950817598043144e-05, "loss": 2.566, "step": 16260 }, { "epoch": 0.21, "learning_rate": 8.950191989504071e-05, "loss": 2.6341, "step": 16265 }, { "epoch": 0.21, "learning_rate": 8.949566216377987e-05, "loss": 2.7382, "step": 16270 }, { "epoch": 0.21, "learning_rate": 8.948940278690964e-05, "loss": 2.6772, "step": 16275 }, { "epoch": 0.21, "learning_rate": 8.948314176469086e-05, "loss": 2.6526, "step": 16280 }, { "epoch": 0.21, "learning_rate": 8.947687909738435e-05, "loss": 2.6765, "step": 16285 }, { "epoch": 0.21, "learning_rate": 8.947061478525108e-05, "loss": 2.6581, "step": 16290 }, { "epoch": 0.21, "learning_rate": 8.946434882855203e-05, "loss": 2.6457, "step": 16295 }, { "epoch": 0.21, "learning_rate": 8.945808122754828e-05, "loss": 2.6748, "step": 16300 }, { "epoch": 0.21, "learning_rate": 8.9451811982501e-05, "loss": 2.8205, "step": 16305 }, { "epoch": 0.21, "learning_rate": 8.944554109367138e-05, "loss": 2.6311, "step": 16310 }, { "epoch": 0.21, "learning_rate": 8.94392685613207e-05, "loss": 2.8236, "step": 16315 }, { "epoch": 0.21, "learning_rate": 8.943299438571034e-05, "loss": 2.6694, "step": 16320 }, { "epoch": 0.21, "learning_rate": 8.942671856710165e-05, "loss": 2.6216, "step": 16325 }, { "epoch": 0.21, "learning_rate": 8.942044110575616e-05, "loss": 2.6809, "step": 16330 }, { "epoch": 0.21, "learning_rate": 8.941416200193545e-05, "loss": 2.7702, "step": 16335 }, { "epoch": 0.21, "learning_rate": 8.940788125590108e-05, "loss": 2.7539, "step": 16340 }, { "epoch": 0.21, "learning_rate": 8.940159886791479e-05, "loss": 2.7199, "step": 16345 }, { "epoch": 0.21, "learning_rate": 8.939531483823832e-05, "loss": 2.6426, "step": 16350 }, { "epoch": 0.21, "learning_rate": 8.938902916713349e-05, "loss": 2.737, "step": 16355 }, { "epoch": 0.21, "learning_rate": 8.938274185486221e-05, "loss": 2.7227, "step": 16360 }, { "epoch": 0.21, "learning_rate": 8.937645290168646e-05, "loss": 2.7139, "step": 16365 }, { "epoch": 0.21, "learning_rate": 8.937016230786823e-05, "loss": 2.8411, "step": 16370 }, { "epoch": 0.21, "learning_rate": 8.936387007366964e-05, "loss": 2.7382, "step": 16375 }, { "epoch": 0.21, "learning_rate": 8.935757619935287e-05, "loss": 2.6594, "step": 16380 }, { "epoch": 0.21, "learning_rate": 8.935128068518017e-05, "loss": 2.7078, "step": 16385 }, { "epoch": 0.21, "learning_rate": 8.93449835314138e-05, "loss": 2.8589, "step": 16390 }, { "epoch": 0.21, "learning_rate": 8.93386847383162e-05, "loss": 2.667, "step": 16395 }, { "epoch": 0.21, "learning_rate": 8.933238430614975e-05, "loss": 2.5743, "step": 16400 }, { "epoch": 0.21, "learning_rate": 8.932608223517698e-05, "loss": 2.6575, "step": 16405 }, { "epoch": 0.21, "learning_rate": 8.931977852566049e-05, "loss": 2.6925, "step": 16410 }, { "epoch": 0.21, "learning_rate": 8.931347317786289e-05, "loss": 2.5494, "step": 16415 }, { "epoch": 0.21, "learning_rate": 8.930716619204693e-05, "loss": 2.6952, "step": 16420 }, { "epoch": 0.21, "learning_rate": 8.93008575684754e-05, "loss": 2.6839, "step": 16425 }, { "epoch": 0.21, "learning_rate": 8.929454730741112e-05, "loss": 2.5809, "step": 16430 }, { "epoch": 0.21, "learning_rate": 8.928823540911703e-05, "loss": 2.7702, "step": 16435 }, { "epoch": 0.21, "learning_rate": 8.928192187385612e-05, "loss": 2.749, "step": 16440 }, { "epoch": 0.21, "learning_rate": 8.927560670189143e-05, "loss": 2.6555, "step": 16445 }, { "epoch": 0.21, "learning_rate": 8.926928989348612e-05, "loss": 2.5963, "step": 16450 }, { "epoch": 0.21, "learning_rate": 8.926297144890335e-05, "loss": 2.6837, "step": 16455 }, { "epoch": 0.21, "learning_rate": 8.925665136840638e-05, "loss": 2.7427, "step": 16460 }, { "epoch": 0.21, "learning_rate": 8.925032965225856e-05, "loss": 2.6404, "step": 16465 }, { "epoch": 0.21, "learning_rate": 8.924400630072329e-05, "loss": 2.6704, "step": 16470 }, { "epoch": 0.21, "learning_rate": 8.923768131406403e-05, "loss": 2.781, "step": 16475 }, { "epoch": 0.21, "learning_rate": 8.92313546925443e-05, "loss": 2.6424, "step": 16480 }, { "epoch": 0.21, "learning_rate": 8.922502643642771e-05, "loss": 2.7888, "step": 16485 }, { "epoch": 0.21, "learning_rate": 8.921869654597795e-05, "loss": 2.6365, "step": 16490 }, { "epoch": 0.21, "learning_rate": 8.921236502145872e-05, "loss": 2.5798, "step": 16495 }, { "epoch": 0.21, "learning_rate": 8.920603186313385e-05, "loss": 2.7028, "step": 16500 }, { "epoch": 0.21, "learning_rate": 8.919969707126723e-05, "loss": 2.7944, "step": 16505 }, { "epoch": 0.21, "learning_rate": 8.919336064612279e-05, "loss": 2.7899, "step": 16510 }, { "epoch": 0.21, "learning_rate": 8.918702258796451e-05, "loss": 2.6657, "step": 16515 }, { "epoch": 0.21, "learning_rate": 8.918068289705651e-05, "loss": 2.7702, "step": 16520 }, { "epoch": 0.21, "learning_rate": 8.917434157366292e-05, "loss": 2.6626, "step": 16525 }, { "epoch": 0.21, "learning_rate": 8.916799861804796e-05, "loss": 2.7533, "step": 16530 }, { "epoch": 0.21, "learning_rate": 8.916165403047592e-05, "loss": 2.7303, "step": 16535 }, { "epoch": 0.21, "learning_rate": 8.915530781121111e-05, "loss": 2.7135, "step": 16540 }, { "epoch": 0.21, "learning_rate": 8.914895996051801e-05, "loss": 2.7935, "step": 16545 }, { "epoch": 0.21, "learning_rate": 8.914261047866107e-05, "loss": 2.6442, "step": 16550 }, { "epoch": 0.21, "learning_rate": 8.913625936590483e-05, "loss": 2.6959, "step": 16555 }, { "epoch": 0.21, "learning_rate": 8.912990662251397e-05, "loss": 2.7346, "step": 16560 }, { "epoch": 0.21, "learning_rate": 8.912355224875312e-05, "loss": 2.6241, "step": 16565 }, { "epoch": 0.22, "learning_rate": 8.911719624488707e-05, "loss": 2.6742, "step": 16570 }, { "epoch": 0.22, "learning_rate": 8.911083861118065e-05, "loss": 2.7294, "step": 16575 }, { "epoch": 0.22, "learning_rate": 8.910447934789874e-05, "loss": 2.6991, "step": 16580 }, { "epoch": 0.22, "learning_rate": 8.909811845530631e-05, "loss": 2.7715, "step": 16585 }, { "epoch": 0.22, "learning_rate": 8.909175593366837e-05, "loss": 2.6999, "step": 16590 }, { "epoch": 0.22, "learning_rate": 8.908539178325004e-05, "loss": 2.6645, "step": 16595 }, { "epoch": 0.22, "learning_rate": 8.907902600431649e-05, "loss": 2.6975, "step": 16600 }, { "epoch": 0.22, "learning_rate": 8.907265859713294e-05, "loss": 2.7544, "step": 16605 }, { "epoch": 0.22, "learning_rate": 8.90662895619647e-05, "loss": 2.7174, "step": 16610 }, { "epoch": 0.22, "learning_rate": 8.905991889907714e-05, "loss": 2.7011, "step": 16615 }, { "epoch": 0.22, "learning_rate": 8.905354660873568e-05, "loss": 2.5493, "step": 16620 }, { "epoch": 0.22, "learning_rate": 8.904717269120585e-05, "loss": 2.6172, "step": 16625 }, { "epoch": 0.22, "learning_rate": 8.90407971467532e-05, "loss": 2.7773, "step": 16630 }, { "epoch": 0.22, "learning_rate": 8.903441997564339e-05, "loss": 2.7507, "step": 16635 }, { "epoch": 0.22, "learning_rate": 8.902804117814212e-05, "loss": 2.7269, "step": 16640 }, { "epoch": 0.22, "learning_rate": 8.902166075451516e-05, "loss": 2.741, "step": 16645 }, { "epoch": 0.22, "learning_rate": 8.901527870502838e-05, "loss": 2.8188, "step": 16650 }, { "epoch": 0.22, "learning_rate": 8.900889502994767e-05, "loss": 2.7122, "step": 16655 }, { "epoch": 0.22, "learning_rate": 8.9002509729539e-05, "loss": 2.7315, "step": 16660 }, { "epoch": 0.22, "learning_rate": 8.899612280406844e-05, "loss": 2.7087, "step": 16665 }, { "epoch": 0.22, "learning_rate": 8.898973425380209e-05, "loss": 2.6706, "step": 16670 }, { "epoch": 0.22, "learning_rate": 8.898334407900613e-05, "loss": 2.6637, "step": 16675 }, { "epoch": 0.22, "learning_rate": 8.897695227994683e-05, "loss": 2.6799, "step": 16680 }, { "epoch": 0.22, "learning_rate": 8.897055885689048e-05, "loss": 2.719, "step": 16685 }, { "epoch": 0.22, "learning_rate": 8.896416381010349e-05, "loss": 2.6429, "step": 16690 }, { "epoch": 0.22, "learning_rate": 8.895776713985229e-05, "loss": 2.7663, "step": 16695 }, { "epoch": 0.22, "learning_rate": 8.895136884640342e-05, "loss": 2.6368, "step": 16700 }, { "epoch": 0.22, "learning_rate": 8.894496893002349e-05, "loss": 2.6544, "step": 16705 }, { "epoch": 0.22, "learning_rate": 8.89385673909791e-05, "loss": 2.6882, "step": 16710 }, { "epoch": 0.22, "learning_rate": 8.893216422953701e-05, "loss": 2.6267, "step": 16715 }, { "epoch": 0.22, "learning_rate": 8.892575944596402e-05, "loss": 2.8154, "step": 16720 }, { "epoch": 0.22, "learning_rate": 8.891935304052697e-05, "loss": 2.7198, "step": 16725 }, { "epoch": 0.22, "learning_rate": 8.891294501349277e-05, "loss": 2.6943, "step": 16730 }, { "epoch": 0.22, "learning_rate": 8.890653536512846e-05, "loss": 2.5733, "step": 16735 }, { "epoch": 0.22, "learning_rate": 8.890012409570106e-05, "loss": 2.7394, "step": 16740 }, { "epoch": 0.22, "learning_rate": 8.889371120547772e-05, "loss": 2.6988, "step": 16745 }, { "epoch": 0.22, "learning_rate": 8.888729669472564e-05, "loss": 2.7468, "step": 16750 }, { "epoch": 0.22, "learning_rate": 8.888088056371205e-05, "loss": 2.7604, "step": 16755 }, { "epoch": 0.22, "learning_rate": 8.887446281270433e-05, "loss": 2.8381, "step": 16760 }, { "epoch": 0.22, "learning_rate": 8.886804344196986e-05, "loss": 2.7262, "step": 16765 }, { "epoch": 0.22, "learning_rate": 8.886162245177609e-05, "loss": 2.6908, "step": 16770 }, { "epoch": 0.22, "learning_rate": 8.885519984239059e-05, "loss": 2.8045, "step": 16775 }, { "epoch": 0.22, "learning_rate": 8.884877561408092e-05, "loss": 2.7724, "step": 16780 }, { "epoch": 0.22, "learning_rate": 8.884234976711478e-05, "loss": 2.7352, "step": 16785 }, { "epoch": 0.22, "learning_rate": 8.883592230175989e-05, "loss": 2.8341, "step": 16790 }, { "epoch": 0.22, "learning_rate": 8.882949321828407e-05, "loss": 2.6934, "step": 16795 }, { "epoch": 0.22, "learning_rate": 8.882306251695517e-05, "loss": 2.6697, "step": 16800 }, { "epoch": 0.22, "learning_rate": 8.881663019804114e-05, "loss": 2.6522, "step": 16805 }, { "epoch": 0.22, "learning_rate": 8.881019626181e-05, "loss": 2.8399, "step": 16810 }, { "epoch": 0.22, "learning_rate": 8.880376070852979e-05, "loss": 2.6663, "step": 16815 }, { "epoch": 0.22, "learning_rate": 8.879732353846869e-05, "loss": 2.6712, "step": 16820 }, { "epoch": 0.22, "learning_rate": 8.879088475189487e-05, "loss": 2.6489, "step": 16825 }, { "epoch": 0.22, "learning_rate": 8.878444434907664e-05, "loss": 2.7482, "step": 16830 }, { "epoch": 0.22, "learning_rate": 8.877800233028233e-05, "loss": 2.8319, "step": 16835 }, { "epoch": 0.22, "learning_rate": 8.877155869578035e-05, "loss": 2.7385, "step": 16840 }, { "epoch": 0.22, "learning_rate": 8.876511344583917e-05, "loss": 2.7062, "step": 16845 }, { "epoch": 0.22, "learning_rate": 8.875866658072734e-05, "loss": 2.7046, "step": 16850 }, { "epoch": 0.22, "learning_rate": 8.875221810071348e-05, "loss": 2.6796, "step": 16855 }, { "epoch": 0.22, "learning_rate": 8.874576800606626e-05, "loss": 2.6508, "step": 16860 }, { "epoch": 0.22, "learning_rate": 8.873931629705443e-05, "loss": 2.7528, "step": 16865 }, { "epoch": 0.22, "learning_rate": 8.873286297394681e-05, "loss": 2.8247, "step": 16870 }, { "epoch": 0.22, "learning_rate": 8.872640803701226e-05, "loss": 2.7119, "step": 16875 }, { "epoch": 0.22, "learning_rate": 8.871995148651976e-05, "loss": 2.6136, "step": 16880 }, { "epoch": 0.22, "learning_rate": 8.871349332273831e-05, "loss": 2.6508, "step": 16885 }, { "epoch": 0.22, "learning_rate": 8.870703354593699e-05, "loss": 2.7322, "step": 16890 }, { "epoch": 0.22, "learning_rate": 8.870057215638495e-05, "loss": 2.8064, "step": 16895 }, { "epoch": 0.22, "learning_rate": 8.869410915435141e-05, "loss": 2.8089, "step": 16900 }, { "epoch": 0.22, "learning_rate": 8.868764454010567e-05, "loss": 2.6794, "step": 16905 }, { "epoch": 0.22, "learning_rate": 8.868117831391704e-05, "loss": 2.6912, "step": 16910 }, { "epoch": 0.22, "learning_rate": 8.867471047605501e-05, "loss": 2.6868, "step": 16915 }, { "epoch": 0.22, "learning_rate": 8.8668241026789e-05, "loss": 2.7347, "step": 16920 }, { "epoch": 0.22, "learning_rate": 8.866176996638858e-05, "loss": 2.7604, "step": 16925 }, { "epoch": 0.22, "learning_rate": 8.865529729512336e-05, "loss": 2.7746, "step": 16930 }, { "epoch": 0.22, "learning_rate": 8.864882301326307e-05, "loss": 2.7499, "step": 16935 }, { "epoch": 0.22, "learning_rate": 8.864234712107744e-05, "loss": 2.671, "step": 16940 }, { "epoch": 0.22, "learning_rate": 8.863586961883629e-05, "loss": 2.6163, "step": 16945 }, { "epoch": 0.22, "learning_rate": 8.86293905068095e-05, "loss": 2.7394, "step": 16950 }, { "epoch": 0.22, "learning_rate": 8.862290978526704e-05, "loss": 2.7599, "step": 16955 }, { "epoch": 0.22, "learning_rate": 8.861642745447894e-05, "loss": 2.488, "step": 16960 }, { "epoch": 0.22, "learning_rate": 8.860994351471526e-05, "loss": 2.7818, "step": 16965 }, { "epoch": 0.22, "learning_rate": 8.860345796624619e-05, "loss": 2.6408, "step": 16970 }, { "epoch": 0.22, "learning_rate": 8.859697080934192e-05, "loss": 2.7853, "step": 16975 }, { "epoch": 0.22, "learning_rate": 8.859048204427279e-05, "loss": 2.7498, "step": 16980 }, { "epoch": 0.22, "learning_rate": 8.858399167130909e-05, "loss": 2.6442, "step": 16985 }, { "epoch": 0.22, "learning_rate": 8.857749969072131e-05, "loss": 2.679, "step": 16990 }, { "epoch": 0.22, "learning_rate": 8.85710061027799e-05, "loss": 2.6941, "step": 16995 }, { "epoch": 0.22, "learning_rate": 8.856451090775546e-05, "loss": 2.6522, "step": 17000 }, { "epoch": 0.22, "learning_rate": 8.855801410591857e-05, "loss": 2.7544, "step": 17005 }, { "epoch": 0.22, "learning_rate": 8.855151569753997e-05, "loss": 2.727, "step": 17010 }, { "epoch": 0.22, "learning_rate": 8.854501568289037e-05, "loss": 2.6233, "step": 17015 }, { "epoch": 0.22, "learning_rate": 8.853851406224064e-05, "loss": 2.5894, "step": 17020 }, { "epoch": 0.22, "learning_rate": 8.853201083586163e-05, "loss": 2.5971, "step": 17025 }, { "epoch": 0.22, "learning_rate": 8.852550600402434e-05, "loss": 2.5437, "step": 17030 }, { "epoch": 0.22, "learning_rate": 8.851899956699978e-05, "loss": 2.7342, "step": 17035 }, { "epoch": 0.22, "learning_rate": 8.851249152505905e-05, "loss": 2.8265, "step": 17040 }, { "epoch": 0.22, "learning_rate": 8.85059818784733e-05, "loss": 2.6128, "step": 17045 }, { "epoch": 0.22, "learning_rate": 8.849947062751377e-05, "loss": 2.7882, "step": 17050 }, { "epoch": 0.22, "learning_rate": 8.849295777245174e-05, "loss": 2.8304, "step": 17055 }, { "epoch": 0.22, "learning_rate": 8.848644331355861e-05, "loss": 2.5571, "step": 17060 }, { "epoch": 0.22, "learning_rate": 8.847992725110576e-05, "loss": 2.748, "step": 17065 }, { "epoch": 0.22, "learning_rate": 8.847340958536472e-05, "loss": 2.5675, "step": 17070 }, { "epoch": 0.22, "learning_rate": 8.846689031660705e-05, "loss": 2.6837, "step": 17075 }, { "epoch": 0.22, "learning_rate": 8.846036944510435e-05, "loss": 2.7065, "step": 17080 }, { "epoch": 0.22, "learning_rate": 8.845384697112834e-05, "loss": 2.7265, "step": 17085 }, { "epoch": 0.22, "learning_rate": 8.844732289495078e-05, "loss": 2.5883, "step": 17090 }, { "epoch": 0.22, "learning_rate": 8.84407972168435e-05, "loss": 2.6471, "step": 17095 }, { "epoch": 0.22, "learning_rate": 8.843426993707839e-05, "loss": 2.6165, "step": 17100 }, { "epoch": 0.22, "learning_rate": 8.842774105592741e-05, "loss": 2.6568, "step": 17105 }, { "epoch": 0.22, "learning_rate": 8.842121057366259e-05, "loss": 2.6517, "step": 17110 }, { "epoch": 0.22, "learning_rate": 8.841467849055604e-05, "loss": 2.6592, "step": 17115 }, { "epoch": 0.22, "learning_rate": 8.840814480687992e-05, "loss": 2.6509, "step": 17120 }, { "epoch": 0.22, "learning_rate": 8.840160952290645e-05, "loss": 2.7666, "step": 17125 }, { "epoch": 0.22, "learning_rate": 8.839507263890793e-05, "loss": 2.6342, "step": 17130 }, { "epoch": 0.22, "learning_rate": 8.838853415515673e-05, "loss": 2.6457, "step": 17135 }, { "epoch": 0.22, "learning_rate": 8.838199407192527e-05, "loss": 2.5348, "step": 17140 }, { "epoch": 0.22, "learning_rate": 8.837545238948604e-05, "loss": 2.6626, "step": 17145 }, { "epoch": 0.22, "learning_rate": 8.836890910811162e-05, "loss": 2.6359, "step": 17150 }, { "epoch": 0.22, "learning_rate": 8.836236422807463e-05, "loss": 2.6463, "step": 17155 }, { "epoch": 0.22, "learning_rate": 8.835581774964777e-05, "loss": 2.765, "step": 17160 }, { "epoch": 0.22, "learning_rate": 8.83492696731038e-05, "loss": 2.7663, "step": 17165 }, { "epoch": 0.22, "learning_rate": 8.834271999871554e-05, "loss": 2.7182, "step": 17170 }, { "epoch": 0.22, "learning_rate": 8.833616872675592e-05, "loss": 2.7987, "step": 17175 }, { "epoch": 0.22, "learning_rate": 8.832961585749787e-05, "loss": 2.6634, "step": 17180 }, { "epoch": 0.22, "learning_rate": 8.832306139121442e-05, "loss": 2.8216, "step": 17185 }, { "epoch": 0.22, "learning_rate": 8.831650532817867e-05, "loss": 2.8423, "step": 17190 }, { "epoch": 0.22, "learning_rate": 8.830994766866381e-05, "loss": 2.5339, "step": 17195 }, { "epoch": 0.22, "learning_rate": 8.830338841294301e-05, "loss": 2.8473, "step": 17200 }, { "epoch": 0.22, "learning_rate": 8.829682756128963e-05, "loss": 2.6392, "step": 17205 }, { "epoch": 0.22, "learning_rate": 8.829026511397698e-05, "loss": 2.7166, "step": 17210 }, { "epoch": 0.22, "learning_rate": 8.828370107127853e-05, "loss": 2.7311, "step": 17215 }, { "epoch": 0.22, "learning_rate": 8.827713543346774e-05, "loss": 2.74, "step": 17220 }, { "epoch": 0.22, "learning_rate": 8.827056820081818e-05, "loss": 2.8055, "step": 17225 }, { "epoch": 0.22, "learning_rate": 8.826399937360348e-05, "loss": 2.7751, "step": 17230 }, { "epoch": 0.22, "learning_rate": 8.825742895209736e-05, "loss": 2.7284, "step": 17235 }, { "epoch": 0.22, "learning_rate": 8.825085693657353e-05, "loss": 2.6825, "step": 17240 }, { "epoch": 0.22, "learning_rate": 8.824428332730585e-05, "loss": 2.7398, "step": 17245 }, { "epoch": 0.22, "learning_rate": 8.823770812456822e-05, "loss": 2.6563, "step": 17250 }, { "epoch": 0.22, "learning_rate": 8.823113132863457e-05, "loss": 2.5882, "step": 17255 }, { "epoch": 0.22, "learning_rate": 8.822455293977895e-05, "loss": 2.7331, "step": 17260 }, { "epoch": 0.22, "learning_rate": 8.821797295827546e-05, "loss": 2.6452, "step": 17265 }, { "epoch": 0.22, "learning_rate": 8.821139138439822e-05, "loss": 2.663, "step": 17270 }, { "epoch": 0.22, "learning_rate": 8.820480821842148e-05, "loss": 2.7348, "step": 17275 }, { "epoch": 0.22, "learning_rate": 8.819822346061954e-05, "loss": 2.6459, "step": 17280 }, { "epoch": 0.22, "learning_rate": 8.819163711126675e-05, "loss": 2.6993, "step": 17285 }, { "epoch": 0.22, "learning_rate": 8.818504917063752e-05, "loss": 2.6667, "step": 17290 }, { "epoch": 0.22, "learning_rate": 8.817845963900635e-05, "loss": 2.573, "step": 17295 }, { "epoch": 0.22, "learning_rate": 8.817186851664781e-05, "loss": 2.7839, "step": 17300 }, { "epoch": 0.22, "learning_rate": 8.81652758038365e-05, "loss": 2.721, "step": 17305 }, { "epoch": 0.22, "learning_rate": 8.815868150084712e-05, "loss": 2.7065, "step": 17310 }, { "epoch": 0.22, "learning_rate": 8.815208560795443e-05, "loss": 2.7193, "step": 17315 }, { "epoch": 0.22, "learning_rate": 8.814548812543327e-05, "loss": 2.6827, "step": 17320 }, { "epoch": 0.22, "learning_rate": 8.813888905355848e-05, "loss": 2.8104, "step": 17325 }, { "epoch": 0.22, "learning_rate": 8.813228839260503e-05, "loss": 2.6981, "step": 17330 }, { "epoch": 0.22, "learning_rate": 8.812568614284797e-05, "loss": 2.6549, "step": 17335 }, { "epoch": 0.23, "learning_rate": 8.811908230456236e-05, "loss": 2.6678, "step": 17340 }, { "epoch": 0.23, "learning_rate": 8.811247687802336e-05, "loss": 2.6922, "step": 17345 }, { "epoch": 0.23, "learning_rate": 8.810586986350619e-05, "loss": 2.6759, "step": 17350 }, { "epoch": 0.23, "learning_rate": 8.809926126128611e-05, "loss": 2.6518, "step": 17355 }, { "epoch": 0.23, "learning_rate": 8.809265107163852e-05, "loss": 2.5507, "step": 17360 }, { "epoch": 0.23, "learning_rate": 8.808603929483881e-05, "loss": 2.6368, "step": 17365 }, { "epoch": 0.23, "learning_rate": 8.807942593116245e-05, "loss": 2.5929, "step": 17370 }, { "epoch": 0.23, "learning_rate": 8.807281098088502e-05, "loss": 2.7976, "step": 17375 }, { "epoch": 0.23, "learning_rate": 8.806619444428212e-05, "loss": 2.6255, "step": 17380 }, { "epoch": 0.23, "learning_rate": 8.805957632162942e-05, "loss": 2.6568, "step": 17385 }, { "epoch": 0.23, "learning_rate": 8.805295661320269e-05, "loss": 2.5749, "step": 17390 }, { "epoch": 0.23, "learning_rate": 8.804633531927773e-05, "loss": 2.6167, "step": 17395 }, { "epoch": 0.23, "learning_rate": 8.803971244013041e-05, "loss": 2.6219, "step": 17400 }, { "epoch": 0.23, "learning_rate": 8.803308797603671e-05, "loss": 2.5632, "step": 17405 }, { "epoch": 0.23, "learning_rate": 8.802646192727262e-05, "loss": 2.7647, "step": 17410 }, { "epoch": 0.23, "learning_rate": 8.801983429411421e-05, "loss": 2.6272, "step": 17415 }, { "epoch": 0.23, "learning_rate": 8.801320507683763e-05, "loss": 2.6105, "step": 17420 }, { "epoch": 0.23, "learning_rate": 8.800657427571913e-05, "loss": 2.6388, "step": 17425 }, { "epoch": 0.23, "learning_rate": 8.799994189103492e-05, "loss": 2.7968, "step": 17430 }, { "epoch": 0.23, "learning_rate": 8.799330792306137e-05, "loss": 2.6837, "step": 17435 }, { "epoch": 0.23, "learning_rate": 8.79866723720749e-05, "loss": 2.7973, "step": 17440 }, { "epoch": 0.23, "learning_rate": 8.798003523835197e-05, "loss": 2.6964, "step": 17445 }, { "epoch": 0.23, "learning_rate": 8.797339652216911e-05, "loss": 2.7166, "step": 17450 }, { "epoch": 0.23, "learning_rate": 8.796675622380297e-05, "loss": 2.5966, "step": 17455 }, { "epoch": 0.23, "learning_rate": 8.796011434353017e-05, "loss": 2.6391, "step": 17460 }, { "epoch": 0.23, "learning_rate": 8.795347088162749e-05, "loss": 2.8251, "step": 17465 }, { "epoch": 0.23, "learning_rate": 8.794682583837169e-05, "loss": 2.6481, "step": 17470 }, { "epoch": 0.23, "learning_rate": 8.794017921403967e-05, "loss": 2.7793, "step": 17475 }, { "epoch": 0.23, "learning_rate": 8.793353100890838e-05, "loss": 2.645, "step": 17480 }, { "epoch": 0.23, "learning_rate": 8.792688122325478e-05, "loss": 2.7763, "step": 17485 }, { "epoch": 0.23, "learning_rate": 8.792022985735595e-05, "loss": 2.6309, "step": 17490 }, { "epoch": 0.23, "learning_rate": 8.791357691148905e-05, "loss": 2.653, "step": 17495 }, { "epoch": 0.23, "learning_rate": 8.790692238593126e-05, "loss": 2.772, "step": 17500 }, { "epoch": 0.23, "learning_rate": 8.790026628095982e-05, "loss": 2.6787, "step": 17505 }, { "epoch": 0.23, "learning_rate": 8.78936085968521e-05, "loss": 2.661, "step": 17510 }, { "epoch": 0.23, "learning_rate": 8.788694933388549e-05, "loss": 2.6087, "step": 17515 }, { "epoch": 0.23, "learning_rate": 8.788028849233742e-05, "loss": 2.5972, "step": 17520 }, { "epoch": 0.23, "learning_rate": 8.787362607248544e-05, "loss": 2.7034, "step": 17525 }, { "epoch": 0.23, "learning_rate": 8.786696207460716e-05, "loss": 2.793, "step": 17530 }, { "epoch": 0.23, "learning_rate": 8.786029649898022e-05, "loss": 2.5895, "step": 17535 }, { "epoch": 0.23, "learning_rate": 8.785362934588233e-05, "loss": 2.6671, "step": 17540 }, { "epoch": 0.23, "learning_rate": 8.784696061559132e-05, "loss": 2.6623, "step": 17545 }, { "epoch": 0.23, "learning_rate": 8.784029030838501e-05, "loss": 2.6178, "step": 17550 }, { "epoch": 0.23, "learning_rate": 8.783361842454135e-05, "loss": 2.8036, "step": 17555 }, { "epoch": 0.23, "learning_rate": 8.782694496433831e-05, "loss": 2.501, "step": 17560 }, { "epoch": 0.23, "learning_rate": 8.782026992805394e-05, "loss": 2.6451, "step": 17565 }, { "epoch": 0.23, "learning_rate": 8.781359331596638e-05, "loss": 2.8157, "step": 17570 }, { "epoch": 0.23, "learning_rate": 8.78069151283538e-05, "loss": 2.7191, "step": 17575 }, { "epoch": 0.23, "learning_rate": 8.780023536549445e-05, "loss": 2.6784, "step": 17580 }, { "epoch": 0.23, "learning_rate": 8.779355402766664e-05, "loss": 2.6658, "step": 17585 }, { "epoch": 0.23, "learning_rate": 8.778687111514878e-05, "loss": 2.7143, "step": 17590 }, { "epoch": 0.23, "learning_rate": 8.77801866282193e-05, "loss": 2.6103, "step": 17595 }, { "epoch": 0.23, "learning_rate": 8.777350056715668e-05, "loss": 2.6274, "step": 17600 }, { "epoch": 0.23, "learning_rate": 8.776681293223956e-05, "loss": 2.6555, "step": 17605 }, { "epoch": 0.23, "learning_rate": 8.776012372374654e-05, "loss": 2.705, "step": 17610 }, { "epoch": 0.23, "learning_rate": 8.775343294195634e-05, "loss": 2.6996, "step": 17615 }, { "epoch": 0.23, "learning_rate": 8.774674058714776e-05, "loss": 2.6281, "step": 17620 }, { "epoch": 0.23, "learning_rate": 8.77400466595996e-05, "loss": 2.6833, "step": 17625 }, { "epoch": 0.23, "learning_rate": 8.773335115959081e-05, "loss": 2.7034, "step": 17630 }, { "epoch": 0.23, "learning_rate": 8.772665408740031e-05, "loss": 2.6776, "step": 17635 }, { "epoch": 0.23, "learning_rate": 8.771995544330717e-05, "loss": 2.7529, "step": 17640 }, { "epoch": 0.23, "learning_rate": 8.77132552275905e-05, "loss": 2.6667, "step": 17645 }, { "epoch": 0.23, "learning_rate": 8.770655344052945e-05, "loss": 2.6136, "step": 17650 }, { "epoch": 0.23, "learning_rate": 8.769985008240326e-05, "loss": 2.6933, "step": 17655 }, { "epoch": 0.23, "learning_rate": 8.769314515349123e-05, "loss": 2.6172, "step": 17660 }, { "epoch": 0.23, "learning_rate": 8.768643865407273e-05, "loss": 2.5798, "step": 17665 }, { "epoch": 0.23, "learning_rate": 8.767973058442718e-05, "loss": 2.7258, "step": 17670 }, { "epoch": 0.23, "learning_rate": 8.767302094483407e-05, "loss": 2.7917, "step": 17675 }, { "epoch": 0.23, "learning_rate": 8.766630973557299e-05, "loss": 2.7789, "step": 17680 }, { "epoch": 0.23, "learning_rate": 8.765959695692355e-05, "loss": 2.7559, "step": 17685 }, { "epoch": 0.23, "learning_rate": 8.765288260916541e-05, "loss": 2.69, "step": 17690 }, { "epoch": 0.23, "learning_rate": 8.764616669257837e-05, "loss": 2.5685, "step": 17695 }, { "epoch": 0.23, "learning_rate": 8.763944920744225e-05, "loss": 2.6856, "step": 17700 }, { "epoch": 0.23, "learning_rate": 8.763273015403691e-05, "loss": 2.6321, "step": 17705 }, { "epoch": 0.23, "learning_rate": 8.762600953264233e-05, "loss": 2.7422, "step": 17710 }, { "epoch": 0.23, "learning_rate": 8.761928734353852e-05, "loss": 2.7553, "step": 17715 }, { "epoch": 0.23, "learning_rate": 8.761256358700556e-05, "loss": 2.8458, "step": 17720 }, { "epoch": 0.23, "learning_rate": 8.760583826332361e-05, "loss": 2.7119, "step": 17725 }, { "epoch": 0.23, "learning_rate": 8.759911137277286e-05, "loss": 2.6853, "step": 17730 }, { "epoch": 0.23, "learning_rate": 8.759238291563359e-05, "loss": 2.6137, "step": 17735 }, { "epoch": 0.23, "learning_rate": 8.758565289218619e-05, "loss": 2.7404, "step": 17740 }, { "epoch": 0.23, "learning_rate": 8.757892130271104e-05, "loss": 2.7254, "step": 17745 }, { "epoch": 0.23, "learning_rate": 8.75721881474886e-05, "loss": 2.671, "step": 17750 }, { "epoch": 0.23, "learning_rate": 8.756545342679944e-05, "loss": 2.5921, "step": 17755 }, { "epoch": 0.23, "learning_rate": 8.755871714092415e-05, "loss": 2.8029, "step": 17760 }, { "epoch": 0.23, "learning_rate": 8.75519792901434e-05, "loss": 2.6829, "step": 17765 }, { "epoch": 0.23, "learning_rate": 8.754523987473793e-05, "loss": 2.649, "step": 17770 }, { "epoch": 0.23, "learning_rate": 8.753849889498855e-05, "loss": 2.6986, "step": 17775 }, { "epoch": 0.23, "learning_rate": 8.753175635117612e-05, "loss": 2.6523, "step": 17780 }, { "epoch": 0.23, "learning_rate": 8.752501224358156e-05, "loss": 2.6336, "step": 17785 }, { "epoch": 0.23, "learning_rate": 8.75182665724859e-05, "loss": 2.6948, "step": 17790 }, { "epoch": 0.23, "learning_rate": 8.751151933817016e-05, "loss": 2.7011, "step": 17795 }, { "epoch": 0.23, "learning_rate": 8.750477054091548e-05, "loss": 2.7173, "step": 17800 }, { "epoch": 0.23, "learning_rate": 8.749802018100308e-05, "loss": 2.5782, "step": 17805 }, { "epoch": 0.23, "learning_rate": 8.74912682587142e-05, "loss": 2.6994, "step": 17810 }, { "epoch": 0.23, "learning_rate": 8.748451477433016e-05, "loss": 2.4897, "step": 17815 }, { "epoch": 0.23, "learning_rate": 8.747775972813232e-05, "loss": 2.6921, "step": 17820 }, { "epoch": 0.23, "learning_rate": 8.74710031204022e-05, "loss": 2.6534, "step": 17825 }, { "epoch": 0.23, "learning_rate": 8.746424495142125e-05, "loss": 2.6236, "step": 17830 }, { "epoch": 0.23, "learning_rate": 8.745748522147109e-05, "loss": 2.6941, "step": 17835 }, { "epoch": 0.23, "learning_rate": 8.745072393083337e-05, "loss": 2.6319, "step": 17840 }, { "epoch": 0.23, "learning_rate": 8.744396107978978e-05, "loss": 2.7973, "step": 17845 }, { "epoch": 0.23, "learning_rate": 8.743719666862213e-05, "loss": 2.5516, "step": 17850 }, { "epoch": 0.23, "learning_rate": 8.743043069761223e-05, "loss": 2.6754, "step": 17855 }, { "epoch": 0.23, "learning_rate": 8.7423663167042e-05, "loss": 2.7615, "step": 17860 }, { "epoch": 0.23, "learning_rate": 8.741689407719343e-05, "loss": 2.765, "step": 17865 }, { "epoch": 0.23, "learning_rate": 8.741012342834853e-05, "loss": 2.7338, "step": 17870 }, { "epoch": 0.23, "learning_rate": 8.740335122078942e-05, "loss": 2.7275, "step": 17875 }, { "epoch": 0.23, "learning_rate": 8.739657745479825e-05, "loss": 2.7464, "step": 17880 }, { "epoch": 0.23, "learning_rate": 8.738980213065729e-05, "loss": 2.7315, "step": 17885 }, { "epoch": 0.23, "learning_rate": 8.738302524864881e-05, "loss": 2.8024, "step": 17890 }, { "epoch": 0.23, "learning_rate": 8.737624680905518e-05, "loss": 2.7526, "step": 17895 }, { "epoch": 0.23, "learning_rate": 8.73694668121588e-05, "loss": 2.7254, "step": 17900 }, { "epoch": 0.23, "learning_rate": 8.736268525824222e-05, "loss": 2.6679, "step": 17905 }, { "epoch": 0.23, "learning_rate": 8.735590214758795e-05, "loss": 2.5833, "step": 17910 }, { "epoch": 0.23, "learning_rate": 8.734911748047864e-05, "loss": 2.7262, "step": 17915 }, { "epoch": 0.23, "learning_rate": 8.734233125719696e-05, "loss": 2.7753, "step": 17920 }, { "epoch": 0.23, "learning_rate": 8.733554347802563e-05, "loss": 2.5935, "step": 17925 }, { "epoch": 0.23, "learning_rate": 8.732875414324755e-05, "loss": 2.6104, "step": 17930 }, { "epoch": 0.23, "learning_rate": 8.732196325314554e-05, "loss": 2.6773, "step": 17935 }, { "epoch": 0.23, "learning_rate": 8.731517080800256e-05, "loss": 2.7216, "step": 17940 }, { "epoch": 0.23, "learning_rate": 8.730837680810162e-05, "loss": 2.7137, "step": 17945 }, { "epoch": 0.23, "learning_rate": 8.730158125372578e-05, "loss": 2.7691, "step": 17950 }, { "epoch": 0.23, "learning_rate": 8.729478414515824e-05, "loss": 2.7579, "step": 17955 }, { "epoch": 0.23, "learning_rate": 8.728798548268213e-05, "loss": 2.6464, "step": 17960 }, { "epoch": 0.23, "learning_rate": 8.728118526658076e-05, "loss": 2.712, "step": 17965 }, { "epoch": 0.23, "learning_rate": 8.727438349713745e-05, "loss": 2.6189, "step": 17970 }, { "epoch": 0.23, "learning_rate": 8.726758017463563e-05, "loss": 2.7137, "step": 17975 }, { "epoch": 0.23, "learning_rate": 8.726077529935873e-05, "loss": 2.735, "step": 17980 }, { "epoch": 0.23, "learning_rate": 8.72539688715903e-05, "loss": 2.6729, "step": 17985 }, { "epoch": 0.23, "learning_rate": 8.724716089161392e-05, "loss": 2.6996, "step": 17990 }, { "epoch": 0.23, "learning_rate": 8.724035135971325e-05, "loss": 2.6852, "step": 17995 }, { "epoch": 0.23, "learning_rate": 8.723354027617204e-05, "loss": 2.6928, "step": 18000 }, { "epoch": 0.23, "learning_rate": 8.722672764127402e-05, "loss": 2.6667, "step": 18005 }, { "epoch": 0.23, "learning_rate": 8.721991345530309e-05, "loss": 2.7784, "step": 18010 }, { "epoch": 0.23, "learning_rate": 8.721309771854316e-05, "loss": 2.8278, "step": 18015 }, { "epoch": 0.23, "learning_rate": 8.72062804312782e-05, "loss": 2.7858, "step": 18020 }, { "epoch": 0.23, "learning_rate": 8.719946159379226e-05, "loss": 2.6352, "step": 18025 }, { "epoch": 0.23, "learning_rate": 8.719264120636947e-05, "loss": 2.6825, "step": 18030 }, { "epoch": 0.23, "learning_rate": 8.718581926929397e-05, "loss": 2.8378, "step": 18035 }, { "epoch": 0.23, "learning_rate": 8.717899578285003e-05, "loss": 2.7344, "step": 18040 }, { "epoch": 0.23, "learning_rate": 8.717217074732192e-05, "loss": 2.7028, "step": 18045 }, { "epoch": 0.23, "learning_rate": 8.716534416299404e-05, "loss": 2.5964, "step": 18050 }, { "epoch": 0.23, "learning_rate": 8.715851603015083e-05, "loss": 2.8671, "step": 18055 }, { "epoch": 0.23, "learning_rate": 8.715168634907675e-05, "loss": 2.6655, "step": 18060 }, { "epoch": 0.23, "learning_rate": 8.714485512005641e-05, "loss": 2.7993, "step": 18065 }, { "epoch": 0.23, "learning_rate": 8.71380223433744e-05, "loss": 2.672, "step": 18070 }, { "epoch": 0.23, "learning_rate": 8.713118801931542e-05, "loss": 2.8136, "step": 18075 }, { "epoch": 0.23, "learning_rate": 8.712435214816424e-05, "loss": 2.7419, "step": 18080 }, { "epoch": 0.23, "learning_rate": 8.711751473020567e-05, "loss": 2.6539, "step": 18085 }, { "epoch": 0.23, "learning_rate": 8.711067576572459e-05, "loss": 2.6523, "step": 18090 }, { "epoch": 0.23, "learning_rate": 8.710383525500594e-05, "loss": 2.5742, "step": 18095 }, { "epoch": 0.23, "learning_rate": 8.709699319833478e-05, "loss": 2.6459, "step": 18100 }, { "epoch": 0.23, "learning_rate": 8.709014959599613e-05, "loss": 2.8131, "step": 18105 }, { "epoch": 0.24, "learning_rate": 8.708330444827518e-05, "loss": 2.7694, "step": 18110 }, { "epoch": 0.24, "learning_rate": 8.707645775545709e-05, "loss": 2.745, "step": 18115 }, { "epoch": 0.24, "learning_rate": 8.706960951782719e-05, "loss": 2.6011, "step": 18120 }, { "epoch": 0.24, "learning_rate": 8.706275973567076e-05, "loss": 2.7174, "step": 18125 }, { "epoch": 0.24, "learning_rate": 8.705590840927322e-05, "loss": 2.788, "step": 18130 }, { "epoch": 0.24, "learning_rate": 8.704905553892006e-05, "loss": 2.714, "step": 18135 }, { "epoch": 0.24, "learning_rate": 8.704220112489678e-05, "loss": 2.5272, "step": 18140 }, { "epoch": 0.24, "learning_rate": 8.703534516748897e-05, "loss": 2.7056, "step": 18145 }, { "epoch": 0.24, "learning_rate": 8.702848766698231e-05, "loss": 2.6977, "step": 18150 }, { "epoch": 0.24, "learning_rate": 8.70216286236625e-05, "loss": 2.6816, "step": 18155 }, { "epoch": 0.24, "learning_rate": 8.701476803781534e-05, "loss": 2.741, "step": 18160 }, { "epoch": 0.24, "learning_rate": 8.700790590972667e-05, "loss": 2.6122, "step": 18165 }, { "epoch": 0.24, "learning_rate": 8.700104223968242e-05, "loss": 2.6665, "step": 18170 }, { "epoch": 0.24, "learning_rate": 8.699417702796855e-05, "loss": 2.7563, "step": 18175 }, { "epoch": 0.24, "learning_rate": 8.69873102748711e-05, "loss": 2.7836, "step": 18180 }, { "epoch": 0.24, "learning_rate": 8.69804419806762e-05, "loss": 2.5991, "step": 18185 }, { "epoch": 0.24, "learning_rate": 8.697357214567002e-05, "loss": 2.6744, "step": 18190 }, { "epoch": 0.24, "learning_rate": 8.696670077013877e-05, "loss": 2.7482, "step": 18195 }, { "epoch": 0.24, "learning_rate": 8.695982785436878e-05, "loss": 2.5935, "step": 18200 }, { "epoch": 0.24, "learning_rate": 8.695295339864638e-05, "loss": 2.5897, "step": 18205 }, { "epoch": 0.24, "learning_rate": 8.694607740325803e-05, "loss": 2.6857, "step": 18210 }, { "epoch": 0.24, "learning_rate": 8.693919986849021e-05, "loss": 2.7334, "step": 18215 }, { "epoch": 0.24, "learning_rate": 8.693232079462947e-05, "loss": 2.756, "step": 18220 }, { "epoch": 0.24, "learning_rate": 8.692544018196245e-05, "loss": 2.8242, "step": 18225 }, { "epoch": 0.24, "learning_rate": 8.69185580307758e-05, "loss": 2.7321, "step": 18230 }, { "epoch": 0.24, "learning_rate": 8.691167434135632e-05, "loss": 2.6746, "step": 18235 }, { "epoch": 0.24, "learning_rate": 8.690478911399077e-05, "loss": 2.7474, "step": 18240 }, { "epoch": 0.24, "learning_rate": 8.689790234896606e-05, "loss": 2.5924, "step": 18245 }, { "epoch": 0.24, "learning_rate": 8.689101404656912e-05, "loss": 2.6879, "step": 18250 }, { "epoch": 0.24, "learning_rate": 8.688412420708693e-05, "loss": 2.5976, "step": 18255 }, { "epoch": 0.24, "learning_rate": 8.687723283080662e-05, "loss": 2.7429, "step": 18260 }, { "epoch": 0.24, "learning_rate": 8.687033991801527e-05, "loss": 2.7227, "step": 18265 }, { "epoch": 0.24, "learning_rate": 8.686344546900012e-05, "loss": 2.6157, "step": 18270 }, { "epoch": 0.24, "learning_rate": 8.685654948404837e-05, "loss": 2.6256, "step": 18275 }, { "epoch": 0.24, "learning_rate": 8.68496519634474e-05, "loss": 2.6901, "step": 18280 }, { "epoch": 0.24, "learning_rate": 8.684275290748459e-05, "loss": 2.6499, "step": 18285 }, { "epoch": 0.24, "learning_rate": 8.683585231644738e-05, "loss": 2.8044, "step": 18290 }, { "epoch": 0.24, "learning_rate": 8.682895019062329e-05, "loss": 2.6549, "step": 18295 }, { "epoch": 0.24, "learning_rate": 8.682204653029991e-05, "loss": 2.6186, "step": 18300 }, { "epoch": 0.24, "learning_rate": 8.681514133576484e-05, "loss": 2.6733, "step": 18305 }, { "epoch": 0.24, "learning_rate": 8.680823460730586e-05, "loss": 2.6836, "step": 18310 }, { "epoch": 0.24, "learning_rate": 8.680132634521071e-05, "loss": 2.7657, "step": 18315 }, { "epoch": 0.24, "learning_rate": 8.679441654976721e-05, "loss": 2.7332, "step": 18320 }, { "epoch": 0.24, "learning_rate": 8.678750522126328e-05, "loss": 2.5053, "step": 18325 }, { "epoch": 0.24, "learning_rate": 8.678059235998689e-05, "loss": 2.6805, "step": 18330 }, { "epoch": 0.24, "learning_rate": 8.677367796622605e-05, "loss": 2.683, "step": 18335 }, { "epoch": 0.24, "learning_rate": 8.676676204026886e-05, "loss": 2.6623, "step": 18340 }, { "epoch": 0.24, "learning_rate": 8.67598445824035e-05, "loss": 2.7013, "step": 18345 }, { "epoch": 0.24, "learning_rate": 8.675292559291813e-05, "loss": 2.6245, "step": 18350 }, { "epoch": 0.24, "learning_rate": 8.674600507210109e-05, "loss": 2.6515, "step": 18355 }, { "epoch": 0.24, "learning_rate": 8.67390830202407e-05, "loss": 2.6644, "step": 18360 }, { "epoch": 0.24, "learning_rate": 8.67321594376254e-05, "loss": 2.6622, "step": 18365 }, { "epoch": 0.24, "learning_rate": 8.672523432454362e-05, "loss": 2.6691, "step": 18370 }, { "epoch": 0.24, "learning_rate": 8.671830768128393e-05, "loss": 2.7045, "step": 18375 }, { "epoch": 0.24, "learning_rate": 8.671137950813492e-05, "loss": 2.5233, "step": 18380 }, { "epoch": 0.24, "learning_rate": 8.670444980538528e-05, "loss": 2.6355, "step": 18385 }, { "epoch": 0.24, "learning_rate": 8.669751857332371e-05, "loss": 2.6115, "step": 18390 }, { "epoch": 0.24, "learning_rate": 8.669058581223902e-05, "loss": 2.6329, "step": 18395 }, { "epoch": 0.24, "learning_rate": 8.668365152242006e-05, "loss": 2.5959, "step": 18400 }, { "epoch": 0.24, "learning_rate": 8.667671570415577e-05, "loss": 2.6282, "step": 18405 }, { "epoch": 0.24, "learning_rate": 8.66697783577351e-05, "loss": 2.6742, "step": 18410 }, { "epoch": 0.24, "learning_rate": 8.666283948344712e-05, "loss": 2.5899, "step": 18415 }, { "epoch": 0.24, "learning_rate": 8.665589908158094e-05, "loss": 2.5541, "step": 18420 }, { "epoch": 0.24, "learning_rate": 8.664895715242573e-05, "loss": 2.6557, "step": 18425 }, { "epoch": 0.24, "learning_rate": 8.664201369627076e-05, "loss": 2.617, "step": 18430 }, { "epoch": 0.24, "learning_rate": 8.663506871340529e-05, "loss": 2.8228, "step": 18435 }, { "epoch": 0.24, "learning_rate": 8.662812220411872e-05, "loss": 2.7063, "step": 18440 }, { "epoch": 0.24, "learning_rate": 8.662117416870044e-05, "loss": 2.5913, "step": 18445 }, { "epoch": 0.24, "learning_rate": 8.661422460743998e-05, "loss": 2.6578, "step": 18450 }, { "epoch": 0.24, "learning_rate": 8.66072735206269e-05, "loss": 2.5801, "step": 18455 }, { "epoch": 0.24, "learning_rate": 8.660032090855078e-05, "loss": 2.6078, "step": 18460 }, { "epoch": 0.24, "learning_rate": 8.659336677150136e-05, "loss": 2.6864, "step": 18465 }, { "epoch": 0.24, "learning_rate": 8.658641110976834e-05, "loss": 2.6255, "step": 18470 }, { "epoch": 0.24, "learning_rate": 8.657945392364155e-05, "loss": 2.7173, "step": 18475 }, { "epoch": 0.24, "learning_rate": 8.657249521341088e-05, "loss": 2.6361, "step": 18480 }, { "epoch": 0.24, "learning_rate": 8.656553497936626e-05, "loss": 2.6079, "step": 18485 }, { "epoch": 0.24, "learning_rate": 8.655857322179767e-05, "loss": 2.8118, "step": 18490 }, { "epoch": 0.24, "learning_rate": 8.65516099409952e-05, "loss": 2.7044, "step": 18495 }, { "epoch": 0.24, "learning_rate": 8.654464513724899e-05, "loss": 2.7118, "step": 18500 }, { "epoch": 0.24, "learning_rate": 8.65376788108492e-05, "loss": 2.6179, "step": 18505 }, { "epoch": 0.24, "learning_rate": 8.653071096208609e-05, "loss": 2.707, "step": 18510 }, { "epoch": 0.24, "learning_rate": 8.652374159125002e-05, "loss": 2.5836, "step": 18515 }, { "epoch": 0.24, "learning_rate": 8.651677069863132e-05, "loss": 2.7018, "step": 18520 }, { "epoch": 0.24, "learning_rate": 8.650979828452046e-05, "loss": 2.6026, "step": 18525 }, { "epoch": 0.24, "learning_rate": 8.650282434920796e-05, "loss": 2.6856, "step": 18530 }, { "epoch": 0.24, "learning_rate": 8.649584889298438e-05, "loss": 2.7181, "step": 18535 }, { "epoch": 0.24, "learning_rate": 8.648887191614035e-05, "loss": 2.7308, "step": 18540 }, { "epoch": 0.24, "learning_rate": 8.648189341896659e-05, "loss": 2.7935, "step": 18545 }, { "epoch": 0.24, "learning_rate": 8.647491340175385e-05, "loss": 2.7475, "step": 18550 }, { "epoch": 0.24, "learning_rate": 8.646793186479294e-05, "loss": 2.7661, "step": 18555 }, { "epoch": 0.24, "learning_rate": 8.646094880837479e-05, "loss": 2.6065, "step": 18560 }, { "epoch": 0.24, "learning_rate": 8.645396423279031e-05, "loss": 2.6493, "step": 18565 }, { "epoch": 0.24, "learning_rate": 8.644697813833056e-05, "loss": 2.6061, "step": 18570 }, { "epoch": 0.24, "learning_rate": 8.643999052528658e-05, "loss": 2.6839, "step": 18575 }, { "epoch": 0.24, "learning_rate": 8.643300139394952e-05, "loss": 2.6284, "step": 18580 }, { "epoch": 0.24, "learning_rate": 8.642601074461062e-05, "loss": 2.7853, "step": 18585 }, { "epoch": 0.24, "learning_rate": 8.641901857756112e-05, "loss": 2.6639, "step": 18590 }, { "epoch": 0.24, "learning_rate": 8.641202489309235e-05, "loss": 2.7235, "step": 18595 }, { "epoch": 0.24, "learning_rate": 8.64050296914957e-05, "loss": 2.4989, "step": 18600 }, { "epoch": 0.24, "learning_rate": 8.639803297306266e-05, "loss": 2.7814, "step": 18605 }, { "epoch": 0.24, "learning_rate": 8.639103473808473e-05, "loss": 2.6208, "step": 18610 }, { "epoch": 0.24, "learning_rate": 8.638403498685351e-05, "loss": 2.6942, "step": 18615 }, { "epoch": 0.24, "learning_rate": 8.637703371966063e-05, "loss": 2.7448, "step": 18620 }, { "epoch": 0.24, "learning_rate": 8.63700309367978e-05, "loss": 2.6722, "step": 18625 }, { "epoch": 0.24, "learning_rate": 8.636302663855683e-05, "loss": 2.7184, "step": 18630 }, { "epoch": 0.24, "learning_rate": 8.635602082522952e-05, "loss": 2.6549, "step": 18635 }, { "epoch": 0.24, "learning_rate": 8.634901349710778e-05, "loss": 2.8364, "step": 18640 }, { "epoch": 0.24, "learning_rate": 8.63420046544836e-05, "loss": 2.7236, "step": 18645 }, { "epoch": 0.24, "learning_rate": 8.633499429764897e-05, "loss": 2.728, "step": 18650 }, { "epoch": 0.24, "learning_rate": 8.6327982426896e-05, "loss": 2.6779, "step": 18655 }, { "epoch": 0.24, "learning_rate": 8.632096904251683e-05, "loss": 2.6707, "step": 18660 }, { "epoch": 0.24, "learning_rate": 8.63139541448037e-05, "loss": 2.7796, "step": 18665 }, { "epoch": 0.24, "learning_rate": 8.630693773404888e-05, "loss": 2.7314, "step": 18670 }, { "epoch": 0.24, "learning_rate": 8.62999198105447e-05, "loss": 2.7973, "step": 18675 }, { "epoch": 0.24, "learning_rate": 8.629290037458359e-05, "loss": 2.778, "step": 18680 }, { "epoch": 0.24, "learning_rate": 8.628587942645798e-05, "loss": 2.7463, "step": 18685 }, { "epoch": 0.24, "learning_rate": 8.627885696646046e-05, "loss": 2.792, "step": 18690 }, { "epoch": 0.24, "learning_rate": 8.627183299488358e-05, "loss": 2.7252, "step": 18695 }, { "epoch": 0.24, "learning_rate": 8.626480751201999e-05, "loss": 2.6728, "step": 18700 }, { "epoch": 0.24, "learning_rate": 8.625778051816244e-05, "loss": 2.7314, "step": 18705 }, { "epoch": 0.24, "learning_rate": 8.625075201360371e-05, "loss": 2.7473, "step": 18710 }, { "epoch": 0.24, "learning_rate": 8.624372199863664e-05, "loss": 2.7744, "step": 18715 }, { "epoch": 0.24, "learning_rate": 8.623669047355414e-05, "loss": 2.7458, "step": 18720 }, { "epoch": 0.24, "learning_rate": 8.622965743864917e-05, "loss": 2.6453, "step": 18725 }, { "epoch": 0.24, "learning_rate": 8.62226228942148e-05, "loss": 2.7324, "step": 18730 }, { "epoch": 0.24, "learning_rate": 8.621558684054408e-05, "loss": 2.7437, "step": 18735 }, { "epoch": 0.24, "learning_rate": 8.620854927793021e-05, "loss": 2.7926, "step": 18740 }, { "epoch": 0.24, "learning_rate": 8.620151020666641e-05, "loss": 2.6661, "step": 18745 }, { "epoch": 0.24, "learning_rate": 8.619446962704595e-05, "loss": 2.7348, "step": 18750 }, { "epoch": 0.24, "learning_rate": 8.618742753936218e-05, "loss": 2.665, "step": 18755 }, { "epoch": 0.24, "learning_rate": 8.618038394390855e-05, "loss": 2.6281, "step": 18760 }, { "epoch": 0.24, "learning_rate": 8.617333884097847e-05, "loss": 2.5756, "step": 18765 }, { "epoch": 0.24, "learning_rate": 8.616629223086554e-05, "loss": 2.6621, "step": 18770 }, { "epoch": 0.24, "learning_rate": 8.615924411386332e-05, "loss": 2.7436, "step": 18775 }, { "epoch": 0.24, "learning_rate": 8.61521944902655e-05, "loss": 2.643, "step": 18780 }, { "epoch": 0.24, "learning_rate": 8.614514336036578e-05, "loss": 2.6802, "step": 18785 }, { "epoch": 0.24, "learning_rate": 8.613809072445798e-05, "loss": 2.6094, "step": 18790 }, { "epoch": 0.24, "learning_rate": 8.613103658283594e-05, "loss": 2.6852, "step": 18795 }, { "epoch": 0.24, "learning_rate": 8.612398093579357e-05, "loss": 2.6879, "step": 18800 }, { "epoch": 0.24, "learning_rate": 8.611692378362483e-05, "loss": 2.6475, "step": 18805 }, { "epoch": 0.24, "learning_rate": 8.610986512662381e-05, "loss": 2.7111, "step": 18810 }, { "epoch": 0.24, "learning_rate": 8.610280496508456e-05, "loss": 2.6778, "step": 18815 }, { "epoch": 0.24, "learning_rate": 8.609574329930128e-05, "loss": 2.6403, "step": 18820 }, { "epoch": 0.24, "learning_rate": 8.608868012956819e-05, "loss": 2.6471, "step": 18825 }, { "epoch": 0.24, "learning_rate": 8.608161545617957e-05, "loss": 2.7092, "step": 18830 }, { "epoch": 0.24, "learning_rate": 8.607454927942979e-05, "loss": 2.7036, "step": 18835 }, { "epoch": 0.24, "learning_rate": 8.606748159961326e-05, "loss": 2.7322, "step": 18840 }, { "epoch": 0.24, "learning_rate": 8.606041241702445e-05, "loss": 2.7232, "step": 18845 }, { "epoch": 0.24, "learning_rate": 8.60533417319579e-05, "loss": 2.7181, "step": 18850 }, { "epoch": 0.24, "learning_rate": 8.604626954470823e-05, "loss": 2.6511, "step": 18855 }, { "epoch": 0.24, "learning_rate": 8.60391958555701e-05, "loss": 2.6863, "step": 18860 }, { "epoch": 0.24, "learning_rate": 8.603212066483825e-05, "loss": 2.7037, "step": 18865 }, { "epoch": 0.24, "learning_rate": 8.602504397280745e-05, "loss": 2.7964, "step": 18870 }, { "epoch": 0.24, "learning_rate": 8.601796577977257e-05, "loss": 2.737, "step": 18875 }, { "epoch": 0.25, "learning_rate": 8.601088608602852e-05, "loss": 2.6314, "step": 18880 }, { "epoch": 0.25, "learning_rate": 8.600380489187027e-05, "loss": 2.7202, "step": 18885 }, { "epoch": 0.25, "learning_rate": 8.599672219759289e-05, "loss": 2.741, "step": 18890 }, { "epoch": 0.25, "learning_rate": 8.598963800349146e-05, "loss": 2.7622, "step": 18895 }, { "epoch": 0.25, "learning_rate": 8.598255230986115e-05, "loss": 2.6947, "step": 18900 }, { "epoch": 0.25, "learning_rate": 8.59754651169972e-05, "loss": 2.7606, "step": 18905 }, { "epoch": 0.25, "learning_rate": 8.59683764251949e-05, "loss": 2.6151, "step": 18910 }, { "epoch": 0.25, "learning_rate": 8.596128623474959e-05, "loss": 2.7867, "step": 18915 }, { "epoch": 0.25, "learning_rate": 8.595419454595671e-05, "loss": 2.5703, "step": 18920 }, { "epoch": 0.25, "learning_rate": 8.594710135911173e-05, "loss": 2.7584, "step": 18925 }, { "epoch": 0.25, "learning_rate": 8.594000667451018e-05, "loss": 2.659, "step": 18930 }, { "epoch": 0.25, "learning_rate": 8.593291049244768e-05, "loss": 2.7224, "step": 18935 }, { "epoch": 0.25, "learning_rate": 8.592581281321988e-05, "loss": 2.5633, "step": 18940 }, { "epoch": 0.25, "learning_rate": 8.591871363712251e-05, "loss": 2.6477, "step": 18945 }, { "epoch": 0.25, "learning_rate": 8.591161296445138e-05, "loss": 2.8519, "step": 18950 }, { "epoch": 0.25, "learning_rate": 8.590451079550234e-05, "loss": 2.6431, "step": 18955 }, { "epoch": 0.25, "learning_rate": 8.589740713057129e-05, "loss": 2.6715, "step": 18960 }, { "epoch": 0.25, "learning_rate": 8.589030196995423e-05, "loss": 2.7268, "step": 18965 }, { "epoch": 0.25, "learning_rate": 8.588319531394718e-05, "loss": 2.6006, "step": 18970 }, { "epoch": 0.25, "learning_rate": 8.587608716284624e-05, "loss": 2.6463, "step": 18975 }, { "epoch": 0.25, "learning_rate": 8.586897751694761e-05, "loss": 2.567, "step": 18980 }, { "epoch": 0.25, "learning_rate": 8.586186637654747e-05, "loss": 2.7146, "step": 18985 }, { "epoch": 0.25, "learning_rate": 8.585475374194213e-05, "loss": 2.7622, "step": 18990 }, { "epoch": 0.25, "learning_rate": 8.584763961342797e-05, "loss": 2.7171, "step": 18995 }, { "epoch": 0.25, "learning_rate": 8.584052399130136e-05, "loss": 2.6488, "step": 19000 }, { "epoch": 0.25, "learning_rate": 8.583340687585879e-05, "loss": 2.7522, "step": 19005 }, { "epoch": 0.25, "learning_rate": 8.582628826739682e-05, "loss": 2.7074, "step": 19010 }, { "epoch": 0.25, "learning_rate": 8.581916816621202e-05, "loss": 2.6179, "step": 19015 }, { "epoch": 0.25, "learning_rate": 8.581204657260109e-05, "loss": 2.6075, "step": 19020 }, { "epoch": 0.25, "learning_rate": 8.580492348686072e-05, "loss": 2.6192, "step": 19025 }, { "epoch": 0.25, "learning_rate": 8.579779890928772e-05, "loss": 2.5947, "step": 19030 }, { "epoch": 0.25, "learning_rate": 8.579067284017892e-05, "loss": 2.671, "step": 19035 }, { "epoch": 0.25, "learning_rate": 8.578354527983126e-05, "loss": 2.4895, "step": 19040 }, { "epoch": 0.25, "learning_rate": 8.577641622854168e-05, "loss": 2.7441, "step": 19045 }, { "epoch": 0.25, "learning_rate": 8.576928568660722e-05, "loss": 2.7613, "step": 19050 }, { "epoch": 0.25, "learning_rate": 8.576215365432502e-05, "loss": 2.6903, "step": 19055 }, { "epoch": 0.25, "learning_rate": 8.575502013199219e-05, "loss": 2.5556, "step": 19060 }, { "epoch": 0.25, "learning_rate": 8.574788511990599e-05, "loss": 2.7615, "step": 19065 }, { "epoch": 0.25, "learning_rate": 8.574074861836367e-05, "loss": 2.7923, "step": 19070 }, { "epoch": 0.25, "learning_rate": 8.573361062766261e-05, "loss": 2.7612, "step": 19075 }, { "epoch": 0.25, "learning_rate": 8.57264711481002e-05, "loss": 2.7603, "step": 19080 }, { "epoch": 0.25, "learning_rate": 8.57193301799739e-05, "loss": 2.6832, "step": 19085 }, { "epoch": 0.25, "learning_rate": 8.571218772358126e-05, "loss": 2.685, "step": 19090 }, { "epoch": 0.25, "learning_rate": 8.570504377921987e-05, "loss": 2.7406, "step": 19095 }, { "epoch": 0.25, "learning_rate": 8.569789834718739e-05, "loss": 2.7211, "step": 19100 }, { "epoch": 0.25, "learning_rate": 8.569075142778153e-05, "loss": 2.6676, "step": 19105 }, { "epoch": 0.25, "learning_rate": 8.568360302130008e-05, "loss": 2.7432, "step": 19110 }, { "epoch": 0.25, "learning_rate": 8.567645312804088e-05, "loss": 2.8219, "step": 19115 }, { "epoch": 0.25, "learning_rate": 8.566930174830182e-05, "loss": 2.6323, "step": 19120 }, { "epoch": 0.25, "learning_rate": 8.566214888238089e-05, "loss": 2.7872, "step": 19125 }, { "epoch": 0.25, "learning_rate": 8.56549945305761e-05, "loss": 2.6595, "step": 19130 }, { "epoch": 0.25, "learning_rate": 8.564783869318555e-05, "loss": 2.6667, "step": 19135 }, { "epoch": 0.25, "learning_rate": 8.56406813705074e-05, "loss": 2.7218, "step": 19140 }, { "epoch": 0.25, "learning_rate": 8.563352256283984e-05, "loss": 2.5946, "step": 19145 }, { "epoch": 0.25, "learning_rate": 8.562636227048115e-05, "loss": 2.5816, "step": 19150 }, { "epoch": 0.25, "learning_rate": 8.56192004937297e-05, "loss": 2.6511, "step": 19155 }, { "epoch": 0.25, "learning_rate": 8.561203723288384e-05, "loss": 2.5926, "step": 19160 }, { "epoch": 0.25, "learning_rate": 8.560487248824208e-05, "loss": 2.6645, "step": 19165 }, { "epoch": 0.25, "learning_rate": 8.559770626010292e-05, "loss": 2.5763, "step": 19170 }, { "epoch": 0.25, "learning_rate": 8.559053854876494e-05, "loss": 2.6292, "step": 19175 }, { "epoch": 0.25, "learning_rate": 8.558336935452678e-05, "loss": 2.6639, "step": 19180 }, { "epoch": 0.25, "learning_rate": 8.557619867768719e-05, "loss": 2.7234, "step": 19185 }, { "epoch": 0.25, "learning_rate": 8.556902651854488e-05, "loss": 2.7354, "step": 19190 }, { "epoch": 0.25, "learning_rate": 8.556185287739871e-05, "loss": 2.6335, "step": 19195 }, { "epoch": 0.25, "learning_rate": 8.555467775454761e-05, "loss": 2.6189, "step": 19200 }, { "epoch": 0.25, "learning_rate": 8.554750115029048e-05, "loss": 2.6181, "step": 19205 }, { "epoch": 0.25, "learning_rate": 8.554032306492637e-05, "loss": 2.6731, "step": 19210 }, { "epoch": 0.25, "learning_rate": 8.553314349875434e-05, "loss": 2.597, "step": 19215 }, { "epoch": 0.25, "learning_rate": 8.552596245207354e-05, "loss": 2.733, "step": 19220 }, { "epoch": 0.25, "learning_rate": 8.551877992518318e-05, "loss": 2.6524, "step": 19225 }, { "epoch": 0.25, "learning_rate": 8.551159591838251e-05, "loss": 2.7244, "step": 19230 }, { "epoch": 0.25, "learning_rate": 8.550441043197088e-05, "loss": 2.7884, "step": 19235 }, { "epoch": 0.25, "learning_rate": 8.549722346624765e-05, "loss": 2.6455, "step": 19240 }, { "epoch": 0.25, "learning_rate": 8.549003502151227e-05, "loss": 2.6214, "step": 19245 }, { "epoch": 0.25, "learning_rate": 8.548284509806426e-05, "loss": 2.68, "step": 19250 }, { "epoch": 0.25, "learning_rate": 8.54756536962032e-05, "loss": 2.6687, "step": 19255 }, { "epoch": 0.25, "learning_rate": 8.54684608162287e-05, "loss": 2.6427, "step": 19260 }, { "epoch": 0.25, "learning_rate": 8.546126645844049e-05, "loss": 2.707, "step": 19265 }, { "epoch": 0.25, "learning_rate": 8.54540706231383e-05, "loss": 2.7284, "step": 19270 }, { "epoch": 0.25, "learning_rate": 8.544687331062196e-05, "loss": 2.7584, "step": 19275 }, { "epoch": 0.25, "learning_rate": 8.543967452119135e-05, "loss": 2.7166, "step": 19280 }, { "epoch": 0.25, "learning_rate": 8.54324742551464e-05, "loss": 2.6095, "step": 19285 }, { "epoch": 0.25, "learning_rate": 8.542527251278712e-05, "loss": 2.6751, "step": 19290 }, { "epoch": 0.25, "learning_rate": 8.541806929441358e-05, "loss": 2.5536, "step": 19295 }, { "epoch": 0.25, "learning_rate": 8.54108646003259e-05, "loss": 2.6305, "step": 19300 }, { "epoch": 0.25, "learning_rate": 8.540365843082428e-05, "loss": 2.6629, "step": 19305 }, { "epoch": 0.25, "learning_rate": 8.539645078620895e-05, "loss": 2.6794, "step": 19310 }, { "epoch": 0.25, "learning_rate": 8.538924166678023e-05, "loss": 2.6366, "step": 19315 }, { "epoch": 0.25, "learning_rate": 8.538203107283849e-05, "loss": 2.605, "step": 19320 }, { "epoch": 0.25, "learning_rate": 8.537481900468418e-05, "loss": 2.8761, "step": 19325 }, { "epoch": 0.25, "learning_rate": 8.536760546261777e-05, "loss": 2.6843, "step": 19330 }, { "epoch": 0.25, "learning_rate": 8.536039044693982e-05, "loss": 2.6744, "step": 19335 }, { "epoch": 0.25, "learning_rate": 8.535317395795097e-05, "loss": 2.6117, "step": 19340 }, { "epoch": 0.25, "learning_rate": 8.534595599595188e-05, "loss": 2.7746, "step": 19345 }, { "epoch": 0.25, "learning_rate": 8.533873656124329e-05, "loss": 2.5525, "step": 19350 }, { "epoch": 0.25, "learning_rate": 8.533151565412601e-05, "loss": 2.7109, "step": 19355 }, { "epoch": 0.25, "learning_rate": 8.53242932749009e-05, "loss": 2.6902, "step": 19360 }, { "epoch": 0.25, "learning_rate": 8.531706942386887e-05, "loss": 2.7579, "step": 19365 }, { "epoch": 0.25, "learning_rate": 8.530984410133094e-05, "loss": 2.6836, "step": 19370 }, { "epoch": 0.25, "learning_rate": 8.530261730758813e-05, "loss": 2.7583, "step": 19375 }, { "epoch": 0.25, "learning_rate": 8.529538904294154e-05, "loss": 2.5576, "step": 19380 }, { "epoch": 0.25, "learning_rate": 8.528815930769238e-05, "loss": 2.6641, "step": 19385 }, { "epoch": 0.25, "learning_rate": 8.528092810214185e-05, "loss": 2.6902, "step": 19390 }, { "epoch": 0.25, "learning_rate": 8.527369542659125e-05, "loss": 2.6259, "step": 19395 }, { "epoch": 0.25, "learning_rate": 8.526646128134192e-05, "loss": 2.7325, "step": 19400 }, { "epoch": 0.25, "learning_rate": 8.525922566669528e-05, "loss": 2.6789, "step": 19405 }, { "epoch": 0.25, "learning_rate": 8.525198858295285e-05, "loss": 2.6318, "step": 19410 }, { "epoch": 0.25, "learning_rate": 8.52447500304161e-05, "loss": 2.5468, "step": 19415 }, { "epoch": 0.25, "learning_rate": 8.523751000938666e-05, "loss": 2.6743, "step": 19420 }, { "epoch": 0.25, "learning_rate": 8.523026852016621e-05, "loss": 2.5574, "step": 19425 }, { "epoch": 0.25, "learning_rate": 8.522302556305644e-05, "loss": 2.7985, "step": 19430 }, { "epoch": 0.25, "learning_rate": 8.521578113835913e-05, "loss": 2.7258, "step": 19435 }, { "epoch": 0.25, "learning_rate": 8.520853524637614e-05, "loss": 2.6614, "step": 19440 }, { "epoch": 0.25, "learning_rate": 8.520128788740937e-05, "loss": 2.5988, "step": 19445 }, { "epoch": 0.25, "learning_rate": 8.51940390617608e-05, "loss": 2.551, "step": 19450 }, { "epoch": 0.25, "learning_rate": 8.518678876973241e-05, "loss": 2.6564, "step": 19455 }, { "epoch": 0.25, "learning_rate": 8.517953701162635e-05, "loss": 2.7076, "step": 19460 }, { "epoch": 0.25, "learning_rate": 8.51722837877447e-05, "loss": 2.5862, "step": 19465 }, { "epoch": 0.25, "learning_rate": 8.516502909838974e-05, "loss": 2.682, "step": 19470 }, { "epoch": 0.25, "learning_rate": 8.515777294386368e-05, "loss": 2.5928, "step": 19475 }, { "epoch": 0.25, "learning_rate": 8.51505153244689e-05, "loss": 2.7256, "step": 19480 }, { "epoch": 0.25, "learning_rate": 8.514325624050776e-05, "loss": 2.6898, "step": 19485 }, { "epoch": 0.25, "learning_rate": 8.513599569228274e-05, "loss": 2.6462, "step": 19490 }, { "epoch": 0.25, "learning_rate": 8.512873368009633e-05, "loss": 2.7129, "step": 19495 }, { "epoch": 0.25, "learning_rate": 8.512147020425112e-05, "loss": 2.6294, "step": 19500 }, { "epoch": 0.25, "learning_rate": 8.511420526504973e-05, "loss": 2.6833, "step": 19505 }, { "epoch": 0.25, "learning_rate": 8.510693886279489e-05, "loss": 2.683, "step": 19510 }, { "epoch": 0.25, "learning_rate": 8.509967099778933e-05, "loss": 2.6902, "step": 19515 }, { "epoch": 0.25, "learning_rate": 8.50924016703359e-05, "loss": 2.6178, "step": 19520 }, { "epoch": 0.25, "learning_rate": 8.508513088073744e-05, "loss": 2.6764, "step": 19525 }, { "epoch": 0.25, "learning_rate": 8.507785862929692e-05, "loss": 2.8521, "step": 19530 }, { "epoch": 0.25, "learning_rate": 8.507058491631732e-05, "loss": 2.7077, "step": 19535 }, { "epoch": 0.25, "learning_rate": 8.506330974210173e-05, "loss": 2.6352, "step": 19540 }, { "epoch": 0.25, "learning_rate": 8.505603310695328e-05, "loss": 2.5966, "step": 19545 }, { "epoch": 0.25, "learning_rate": 8.504875501117511e-05, "loss": 2.6495, "step": 19550 }, { "epoch": 0.25, "learning_rate": 8.504147545507048e-05, "loss": 2.6474, "step": 19555 }, { "epoch": 0.25, "learning_rate": 8.503419443894274e-05, "loss": 2.73, "step": 19560 }, { "epoch": 0.25, "learning_rate": 8.502691196309522e-05, "loss": 2.6476, "step": 19565 }, { "epoch": 0.25, "learning_rate": 8.501962802783137e-05, "loss": 2.706, "step": 19570 }, { "epoch": 0.25, "learning_rate": 8.501234263345465e-05, "loss": 2.7218, "step": 19575 }, { "epoch": 0.25, "learning_rate": 8.500505578026863e-05, "loss": 2.6371, "step": 19580 }, { "epoch": 0.25, "learning_rate": 8.499776746857692e-05, "loss": 2.6268, "step": 19585 }, { "epoch": 0.25, "learning_rate": 8.499047769868318e-05, "loss": 2.7848, "step": 19590 }, { "epoch": 0.25, "learning_rate": 8.498318647089116e-05, "loss": 2.7019, "step": 19595 }, { "epoch": 0.25, "learning_rate": 8.497589378550465e-05, "loss": 2.5823, "step": 19600 }, { "epoch": 0.25, "learning_rate": 8.496859964282749e-05, "loss": 2.6996, "step": 19605 }, { "epoch": 0.25, "learning_rate": 8.49613040431636e-05, "loss": 2.6423, "step": 19610 }, { "epoch": 0.25, "learning_rate": 8.495400698681697e-05, "loss": 2.6142, "step": 19615 }, { "epoch": 0.25, "learning_rate": 8.49467084740916e-05, "loss": 2.6386, "step": 19620 }, { "epoch": 0.25, "learning_rate": 8.493940850529163e-05, "loss": 2.627, "step": 19625 }, { "epoch": 0.25, "learning_rate": 8.493210708072121e-05, "loss": 2.6585, "step": 19630 }, { "epoch": 0.25, "learning_rate": 8.492480420068452e-05, "loss": 2.6115, "step": 19635 }, { "epoch": 0.25, "learning_rate": 8.491749986548589e-05, "loss": 2.6199, "step": 19640 }, { "epoch": 0.25, "learning_rate": 8.491019407542962e-05, "loss": 2.593, "step": 19645 }, { "epoch": 0.26, "learning_rate": 8.490288683082013e-05, "loss": 2.6071, "step": 19650 }, { "epoch": 0.26, "learning_rate": 8.489557813196187e-05, "loss": 2.823, "step": 19655 }, { "epoch": 0.26, "learning_rate": 8.488826797915936e-05, "loss": 2.7134, "step": 19660 }, { "epoch": 0.26, "learning_rate": 8.48809563727172e-05, "loss": 2.748, "step": 19665 }, { "epoch": 0.26, "learning_rate": 8.487364331294001e-05, "loss": 2.7084, "step": 19670 }, { "epoch": 0.26, "learning_rate": 8.486632880013252e-05, "loss": 2.728, "step": 19675 }, { "epoch": 0.26, "learning_rate": 8.485901283459945e-05, "loss": 2.6325, "step": 19680 }, { "epoch": 0.26, "learning_rate": 8.485169541664566e-05, "loss": 2.7189, "step": 19685 }, { "epoch": 0.26, "learning_rate": 8.484437654657604e-05, "loss": 2.6043, "step": 19690 }, { "epoch": 0.26, "learning_rate": 8.483705622469551e-05, "loss": 2.7734, "step": 19695 }, { "epoch": 0.26, "learning_rate": 8.482973445130908e-05, "loss": 2.7122, "step": 19700 }, { "epoch": 0.26, "learning_rate": 8.482241122672183e-05, "loss": 2.6408, "step": 19705 }, { "epoch": 0.26, "learning_rate": 8.481508655123887e-05, "loss": 2.5204, "step": 19710 }, { "epoch": 0.26, "learning_rate": 8.48077604251654e-05, "loss": 2.5324, "step": 19715 }, { "epoch": 0.26, "learning_rate": 8.480043284880666e-05, "loss": 2.9125, "step": 19720 }, { "epoch": 0.26, "learning_rate": 8.479310382246794e-05, "loss": 2.8145, "step": 19725 }, { "epoch": 0.26, "learning_rate": 8.478577334645465e-05, "loss": 2.6216, "step": 19730 }, { "epoch": 0.26, "learning_rate": 8.477844142107219e-05, "loss": 2.6064, "step": 19735 }, { "epoch": 0.26, "learning_rate": 8.477110804662604e-05, "loss": 2.488, "step": 19740 }, { "epoch": 0.26, "learning_rate": 8.476377322342177e-05, "loss": 2.6001, "step": 19745 }, { "epoch": 0.26, "learning_rate": 8.4756436951765e-05, "loss": 2.7437, "step": 19750 }, { "epoch": 0.26, "learning_rate": 8.474909923196138e-05, "loss": 2.6113, "step": 19755 }, { "epoch": 0.26, "learning_rate": 8.474176006431663e-05, "loss": 2.6892, "step": 19760 }, { "epoch": 0.26, "learning_rate": 8.473441944913655e-05, "loss": 2.6633, "step": 19765 }, { "epoch": 0.26, "learning_rate": 8.472707738672701e-05, "loss": 2.6624, "step": 19770 }, { "epoch": 0.26, "learning_rate": 8.471973387739389e-05, "loss": 2.6005, "step": 19775 }, { "epoch": 0.26, "learning_rate": 8.471238892144319e-05, "loss": 2.8051, "step": 19780 }, { "epoch": 0.26, "learning_rate": 8.470504251918092e-05, "loss": 2.6863, "step": 19785 }, { "epoch": 0.26, "learning_rate": 8.469769467091319e-05, "loss": 2.5826, "step": 19790 }, { "epoch": 0.26, "learning_rate": 8.469034537694615e-05, "loss": 2.7268, "step": 19795 }, { "epoch": 0.26, "learning_rate": 8.468299463758597e-05, "loss": 2.6177, "step": 19800 }, { "epoch": 0.26, "learning_rate": 8.4675642453139e-05, "loss": 2.7015, "step": 19805 }, { "epoch": 0.26, "learning_rate": 8.466828882391152e-05, "loss": 2.6958, "step": 19810 }, { "epoch": 0.26, "learning_rate": 8.466093375020993e-05, "loss": 2.6159, "step": 19815 }, { "epoch": 0.26, "learning_rate": 8.46535772323407e-05, "loss": 2.735, "step": 19820 }, { "epoch": 0.26, "learning_rate": 8.464621927061032e-05, "loss": 2.6682, "step": 19825 }, { "epoch": 0.26, "learning_rate": 8.463885986532538e-05, "loss": 2.7642, "step": 19830 }, { "epoch": 0.26, "learning_rate": 8.463149901679251e-05, "loss": 2.6028, "step": 19835 }, { "epoch": 0.26, "learning_rate": 8.462413672531841e-05, "loss": 2.6187, "step": 19840 }, { "epoch": 0.26, "learning_rate": 8.461677299120982e-05, "loss": 2.6396, "step": 19845 }, { "epoch": 0.26, "learning_rate": 8.460940781477357e-05, "loss": 2.6555, "step": 19850 }, { "epoch": 0.26, "learning_rate": 8.460204119631651e-05, "loss": 2.7187, "step": 19855 }, { "epoch": 0.26, "learning_rate": 8.45946731361456e-05, "loss": 2.5371, "step": 19860 }, { "epoch": 0.26, "learning_rate": 8.458730363456783e-05, "loss": 2.6373, "step": 19865 }, { "epoch": 0.26, "learning_rate": 8.457993269189024e-05, "loss": 2.7165, "step": 19870 }, { "epoch": 0.26, "learning_rate": 8.457256030841996e-05, "loss": 2.4928, "step": 19875 }, { "epoch": 0.26, "learning_rate": 8.456518648446417e-05, "loss": 2.7018, "step": 19880 }, { "epoch": 0.26, "learning_rate": 8.455781122033007e-05, "loss": 2.8315, "step": 19885 }, { "epoch": 0.26, "learning_rate": 8.455043451632499e-05, "loss": 2.7104, "step": 19890 }, { "epoch": 0.26, "learning_rate": 8.454305637275626e-05, "loss": 2.7003, "step": 19895 }, { "epoch": 0.26, "learning_rate": 8.453567678993132e-05, "loss": 2.5887, "step": 19900 }, { "epoch": 0.26, "learning_rate": 8.452829576815763e-05, "loss": 2.7002, "step": 19905 }, { "epoch": 0.26, "learning_rate": 8.452091330774272e-05, "loss": 2.6906, "step": 19910 }, { "epoch": 0.26, "learning_rate": 8.45135294089942e-05, "loss": 2.7241, "step": 19915 }, { "epoch": 0.26, "learning_rate": 8.450614407221972e-05, "loss": 2.662, "step": 19920 }, { "epoch": 0.26, "learning_rate": 8.449875729772697e-05, "loss": 2.6568, "step": 19925 }, { "epoch": 0.26, "learning_rate": 8.449136908582375e-05, "loss": 2.6578, "step": 19930 }, { "epoch": 0.26, "learning_rate": 8.44839794368179e-05, "loss": 2.787, "step": 19935 }, { "epoch": 0.26, "learning_rate": 8.447658835101729e-05, "loss": 2.6551, "step": 19940 }, { "epoch": 0.26, "learning_rate": 8.44691958287299e-05, "loss": 2.566, "step": 19945 }, { "epoch": 0.26, "learning_rate": 8.44618018702637e-05, "loss": 2.6709, "step": 19950 }, { "epoch": 0.26, "learning_rate": 8.445440647592681e-05, "loss": 2.6109, "step": 19955 }, { "epoch": 0.26, "learning_rate": 8.444700964602734e-05, "loss": 2.6778, "step": 19960 }, { "epoch": 0.26, "learning_rate": 8.443961138087351e-05, "loss": 2.6912, "step": 19965 }, { "epoch": 0.26, "learning_rate": 8.443221168077352e-05, "loss": 2.7235, "step": 19970 }, { "epoch": 0.26, "learning_rate": 8.442481054603573e-05, "loss": 2.5922, "step": 19975 }, { "epoch": 0.26, "learning_rate": 8.441740797696851e-05, "loss": 2.5777, "step": 19980 }, { "epoch": 0.26, "learning_rate": 8.441000397388025e-05, "loss": 2.6434, "step": 19985 }, { "epoch": 0.26, "learning_rate": 8.440259853707949e-05, "loss": 2.5143, "step": 19990 }, { "epoch": 0.26, "learning_rate": 8.439519166687476e-05, "loss": 2.6306, "step": 19995 }, { "epoch": 0.26, "learning_rate": 8.438778336357467e-05, "loss": 2.7298, "step": 20000 }, { "epoch": 0.26, "learning_rate": 8.43803736274879e-05, "loss": 2.6464, "step": 20005 }, { "epoch": 0.26, "learning_rate": 8.437296245892319e-05, "loss": 2.5885, "step": 20010 }, { "epoch": 0.26, "learning_rate": 8.436554985818929e-05, "loss": 2.6062, "step": 20015 }, { "epoch": 0.26, "learning_rate": 8.43581358255951e-05, "loss": 2.623, "step": 20020 }, { "epoch": 0.26, "learning_rate": 8.43507203614495e-05, "loss": 2.5326, "step": 20025 }, { "epoch": 0.26, "learning_rate": 8.434330346606147e-05, "loss": 2.732, "step": 20030 }, { "epoch": 0.26, "learning_rate": 8.433588513974004e-05, "loss": 2.5873, "step": 20035 }, { "epoch": 0.26, "learning_rate": 8.432846538279428e-05, "loss": 2.63, "step": 20040 }, { "epoch": 0.26, "learning_rate": 8.432104419553336e-05, "loss": 2.5052, "step": 20045 }, { "epoch": 0.26, "learning_rate": 8.431362157826648e-05, "loss": 2.5157, "step": 20050 }, { "epoch": 0.26, "learning_rate": 8.430619753130291e-05, "loss": 2.7174, "step": 20055 }, { "epoch": 0.26, "learning_rate": 8.429877205495198e-05, "loss": 2.6393, "step": 20060 }, { "epoch": 0.26, "learning_rate": 8.429134514952308e-05, "loss": 2.7081, "step": 20065 }, { "epoch": 0.26, "learning_rate": 8.428391681532564e-05, "loss": 2.7156, "step": 20070 }, { "epoch": 0.26, "learning_rate": 8.427648705266917e-05, "loss": 2.6068, "step": 20075 }, { "epoch": 0.26, "learning_rate": 8.426905586186325e-05, "loss": 2.6225, "step": 20080 }, { "epoch": 0.26, "learning_rate": 8.426162324321749e-05, "loss": 2.6403, "step": 20085 }, { "epoch": 0.26, "learning_rate": 8.425418919704158e-05, "loss": 2.6667, "step": 20090 }, { "epoch": 0.26, "learning_rate": 8.424675372364527e-05, "loss": 2.6799, "step": 20095 }, { "epoch": 0.26, "learning_rate": 8.423931682333835e-05, "loss": 2.7256, "step": 20100 }, { "epoch": 0.26, "learning_rate": 8.42318784964307e-05, "loss": 2.6083, "step": 20105 }, { "epoch": 0.26, "learning_rate": 8.42244387432322e-05, "loss": 2.6803, "step": 20110 }, { "epoch": 0.26, "learning_rate": 8.42169975640529e-05, "loss": 2.7045, "step": 20115 }, { "epoch": 0.26, "learning_rate": 8.420955495920277e-05, "loss": 2.6646, "step": 20120 }, { "epoch": 0.26, "learning_rate": 8.420211092899198e-05, "loss": 2.757, "step": 20125 }, { "epoch": 0.26, "learning_rate": 8.419466547373063e-05, "loss": 2.7216, "step": 20130 }, { "epoch": 0.26, "learning_rate": 8.418721859372897e-05, "loss": 2.5226, "step": 20135 }, { "epoch": 0.26, "learning_rate": 8.417977028929727e-05, "loss": 2.5538, "step": 20140 }, { "epoch": 0.26, "learning_rate": 8.417232056074587e-05, "loss": 2.7861, "step": 20145 }, { "epoch": 0.26, "learning_rate": 8.416486940838517e-05, "loss": 2.6236, "step": 20150 }, { "epoch": 0.26, "learning_rate": 8.415741683252562e-05, "loss": 2.7364, "step": 20155 }, { "epoch": 0.26, "learning_rate": 8.414996283347775e-05, "loss": 2.6935, "step": 20160 }, { "epoch": 0.26, "learning_rate": 8.414250741155211e-05, "loss": 2.64, "step": 20165 }, { "epoch": 0.26, "learning_rate": 8.413505056705935e-05, "loss": 2.7811, "step": 20170 }, { "epoch": 0.26, "learning_rate": 8.412759230031017e-05, "loss": 2.6405, "step": 20175 }, { "epoch": 0.26, "learning_rate": 8.412013261161531e-05, "loss": 2.6603, "step": 20180 }, { "epoch": 0.26, "learning_rate": 8.41126715012856e-05, "loss": 2.6157, "step": 20185 }, { "epoch": 0.26, "learning_rate": 8.410520896963189e-05, "loss": 2.5441, "step": 20190 }, { "epoch": 0.26, "learning_rate": 8.409774501696512e-05, "loss": 2.7964, "step": 20195 }, { "epoch": 0.26, "learning_rate": 8.409027964359627e-05, "loss": 2.6207, "step": 20200 }, { "epoch": 0.26, "learning_rate": 8.408281284983642e-05, "loss": 2.801, "step": 20205 }, { "epoch": 0.26, "learning_rate": 8.407534463599663e-05, "loss": 2.8365, "step": 20210 }, { "epoch": 0.26, "learning_rate": 8.406787500238812e-05, "loss": 2.7621, "step": 20215 }, { "epoch": 0.26, "learning_rate": 8.406040394932208e-05, "loss": 2.7069, "step": 20220 }, { "epoch": 0.26, "learning_rate": 8.40529314771098e-05, "loss": 2.6189, "step": 20225 }, { "epoch": 0.26, "learning_rate": 8.404545758606264e-05, "loss": 2.6815, "step": 20230 }, { "epoch": 0.26, "learning_rate": 8.403798227649199e-05, "loss": 2.7704, "step": 20235 }, { "epoch": 0.26, "learning_rate": 8.403050554870932e-05, "loss": 2.6329, "step": 20240 }, { "epoch": 0.26, "learning_rate": 8.402302740302616e-05, "loss": 2.6215, "step": 20245 }, { "epoch": 0.26, "learning_rate": 8.401554783975407e-05, "loss": 2.6732, "step": 20250 }, { "epoch": 0.26, "learning_rate": 8.400806685920471e-05, "loss": 2.7242, "step": 20255 }, { "epoch": 0.26, "learning_rate": 8.400058446168976e-05, "loss": 2.6405, "step": 20260 }, { "epoch": 0.26, "learning_rate": 8.399310064752099e-05, "loss": 2.6405, "step": 20265 }, { "epoch": 0.26, "learning_rate": 8.398561541701023e-05, "loss": 2.6076, "step": 20270 }, { "epoch": 0.26, "learning_rate": 8.397812877046933e-05, "loss": 2.5916, "step": 20275 }, { "epoch": 0.26, "learning_rate": 8.397064070821025e-05, "loss": 2.6987, "step": 20280 }, { "epoch": 0.26, "learning_rate": 8.396315123054498e-05, "loss": 2.6893, "step": 20285 }, { "epoch": 0.26, "learning_rate": 8.395566033778556e-05, "loss": 2.6452, "step": 20290 }, { "epoch": 0.26, "learning_rate": 8.39481680302441e-05, "loss": 2.6498, "step": 20295 }, { "epoch": 0.26, "learning_rate": 8.394067430823279e-05, "loss": 2.6317, "step": 20300 }, { "epoch": 0.26, "learning_rate": 8.393317917206385e-05, "loss": 2.7162, "step": 20305 }, { "epoch": 0.26, "learning_rate": 8.392568262204956e-05, "loss": 2.7822, "step": 20310 }, { "epoch": 0.26, "learning_rate": 8.39181846585023e-05, "loss": 2.779, "step": 20315 }, { "epoch": 0.26, "learning_rate": 8.391068528173442e-05, "loss": 2.6661, "step": 20320 }, { "epoch": 0.26, "learning_rate": 8.390318449205846e-05, "loss": 2.7445, "step": 20325 }, { "epoch": 0.26, "learning_rate": 8.389568228978688e-05, "loss": 2.7478, "step": 20330 }, { "epoch": 0.26, "learning_rate": 8.388817867523229e-05, "loss": 2.6754, "step": 20335 }, { "epoch": 0.26, "learning_rate": 8.388067364870734e-05, "loss": 2.7141, "step": 20340 }, { "epoch": 0.26, "learning_rate": 8.387316721052471e-05, "loss": 2.6671, "step": 20345 }, { "epoch": 0.26, "learning_rate": 8.386565936099718e-05, "loss": 2.7084, "step": 20350 }, { "epoch": 0.26, "learning_rate": 8.385815010043755e-05, "loss": 2.4344, "step": 20355 }, { "epoch": 0.26, "learning_rate": 8.385063942915874e-05, "loss": 2.7786, "step": 20360 }, { "epoch": 0.26, "learning_rate": 8.384312734747363e-05, "loss": 2.6767, "step": 20365 }, { "epoch": 0.26, "learning_rate": 8.383561385569525e-05, "loss": 2.644, "step": 20370 }, { "epoch": 0.26, "learning_rate": 8.382809895413664e-05, "loss": 2.6334, "step": 20375 }, { "epoch": 0.26, "learning_rate": 8.382058264311093e-05, "loss": 2.8322, "step": 20380 }, { "epoch": 0.26, "learning_rate": 8.381306492293127e-05, "loss": 2.6543, "step": 20385 }, { "epoch": 0.26, "learning_rate": 8.38055457939109e-05, "loss": 2.7503, "step": 20390 }, { "epoch": 0.26, "learning_rate": 8.37980252563631e-05, "loss": 2.6131, "step": 20395 }, { "epoch": 0.26, "learning_rate": 8.379050331060123e-05, "loss": 2.592, "step": 20400 }, { "epoch": 0.26, "learning_rate": 8.37829799569387e-05, "loss": 2.7242, "step": 20405 }, { "epoch": 0.26, "learning_rate": 8.377545519568894e-05, "loss": 2.7092, "step": 20410 }, { "epoch": 0.26, "learning_rate": 8.37679290271655e-05, "loss": 2.6589, "step": 20415 }, { "epoch": 0.27, "learning_rate": 8.3760401451682e-05, "loss": 2.6824, "step": 20420 }, { "epoch": 0.27, "learning_rate": 8.375287246955202e-05, "loss": 2.7855, "step": 20425 }, { "epoch": 0.27, "learning_rate": 8.374534208108928e-05, "loss": 2.7873, "step": 20430 }, { "epoch": 0.27, "learning_rate": 8.373781028660755e-05, "loss": 2.682, "step": 20435 }, { "epoch": 0.27, "learning_rate": 8.373027708642062e-05, "loss": 2.6379, "step": 20440 }, { "epoch": 0.27, "learning_rate": 8.372274248084237e-05, "loss": 2.6353, "step": 20445 }, { "epoch": 0.27, "learning_rate": 8.371520647018678e-05, "loss": 2.6679, "step": 20450 }, { "epoch": 0.27, "learning_rate": 8.37076690547678e-05, "loss": 2.6503, "step": 20455 }, { "epoch": 0.27, "learning_rate": 8.370013023489946e-05, "loss": 2.5883, "step": 20460 }, { "epoch": 0.27, "learning_rate": 8.369259001089593e-05, "loss": 2.6107, "step": 20465 }, { "epoch": 0.27, "learning_rate": 8.368504838307134e-05, "loss": 2.6265, "step": 20470 }, { "epoch": 0.27, "learning_rate": 8.36775053517399e-05, "loss": 2.5735, "step": 20475 }, { "epoch": 0.27, "learning_rate": 8.366996091721593e-05, "loss": 2.6964, "step": 20480 }, { "epoch": 0.27, "learning_rate": 8.366241507981375e-05, "loss": 2.5507, "step": 20485 }, { "epoch": 0.27, "learning_rate": 8.365486783984779e-05, "loss": 2.8009, "step": 20490 }, { "epoch": 0.27, "learning_rate": 8.364731919763249e-05, "loss": 2.6735, "step": 20495 }, { "epoch": 0.27, "learning_rate": 8.363976915348235e-05, "loss": 2.7637, "step": 20500 }, { "epoch": 0.27, "learning_rate": 8.363221770771197e-05, "loss": 2.6046, "step": 20505 }, { "epoch": 0.27, "learning_rate": 8.362466486063599e-05, "loss": 2.7144, "step": 20510 }, { "epoch": 0.27, "learning_rate": 8.36171106125691e-05, "loss": 2.6746, "step": 20515 }, { "epoch": 0.27, "learning_rate": 8.360955496382602e-05, "loss": 2.5982, "step": 20520 }, { "epoch": 0.27, "learning_rate": 8.36019979147216e-05, "loss": 2.7248, "step": 20525 }, { "epoch": 0.27, "learning_rate": 8.359443946557072e-05, "loss": 2.6766, "step": 20530 }, { "epoch": 0.27, "learning_rate": 8.358687961668828e-05, "loss": 2.6336, "step": 20535 }, { "epoch": 0.27, "learning_rate": 8.357931836838924e-05, "loss": 2.6907, "step": 20540 }, { "epoch": 0.27, "learning_rate": 8.35717557209887e-05, "loss": 2.7314, "step": 20545 }, { "epoch": 0.27, "learning_rate": 8.356419167480172e-05, "loss": 2.8311, "step": 20550 }, { "epoch": 0.27, "learning_rate": 8.355662623014346e-05, "loss": 2.7417, "step": 20555 }, { "epoch": 0.27, "learning_rate": 8.354905938732918e-05, "loss": 2.6067, "step": 20560 }, { "epoch": 0.27, "learning_rate": 8.354149114667413e-05, "loss": 2.6437, "step": 20565 }, { "epoch": 0.27, "learning_rate": 8.353392150849365e-05, "loss": 2.6164, "step": 20570 }, { "epoch": 0.27, "learning_rate": 8.35263504731031e-05, "loss": 2.525, "step": 20575 }, { "epoch": 0.27, "learning_rate": 8.351877804081798e-05, "loss": 2.5606, "step": 20580 }, { "epoch": 0.27, "learning_rate": 8.351120421195378e-05, "loss": 2.714, "step": 20585 }, { "epoch": 0.27, "learning_rate": 8.350362898682606e-05, "loss": 2.5445, "step": 20590 }, { "epoch": 0.27, "learning_rate": 8.349605236575046e-05, "loss": 2.6599, "step": 20595 }, { "epoch": 0.27, "learning_rate": 8.348847434904267e-05, "loss": 2.7089, "step": 20600 }, { "epoch": 0.27, "learning_rate": 8.34808949370184e-05, "loss": 2.5465, "step": 20605 }, { "epoch": 0.27, "learning_rate": 8.347331412999348e-05, "loss": 2.682, "step": 20610 }, { "epoch": 0.27, "learning_rate": 8.346573192828377e-05, "loss": 2.7098, "step": 20615 }, { "epoch": 0.27, "learning_rate": 8.345814833220516e-05, "loss": 2.5334, "step": 20620 }, { "epoch": 0.27, "learning_rate": 8.345056334207367e-05, "loss": 2.6387, "step": 20625 }, { "epoch": 0.27, "learning_rate": 8.344297695820527e-05, "loss": 2.7504, "step": 20630 }, { "epoch": 0.27, "learning_rate": 8.343538918091611e-05, "loss": 2.6281, "step": 20635 }, { "epoch": 0.27, "learning_rate": 8.342780001052229e-05, "loss": 2.6163, "step": 20640 }, { "epoch": 0.27, "learning_rate": 8.342020944734006e-05, "loss": 2.613, "step": 20645 }, { "epoch": 0.27, "learning_rate": 8.341261749168568e-05, "loss": 2.6752, "step": 20650 }, { "epoch": 0.27, "learning_rate": 8.340502414387544e-05, "loss": 2.6539, "step": 20655 }, { "epoch": 0.27, "learning_rate": 8.339742940422573e-05, "loss": 2.7774, "step": 20660 }, { "epoch": 0.27, "learning_rate": 8.338983327305303e-05, "loss": 2.6927, "step": 20665 }, { "epoch": 0.27, "learning_rate": 8.338223575067379e-05, "loss": 2.5999, "step": 20670 }, { "epoch": 0.27, "learning_rate": 8.337463683740458e-05, "loss": 2.7038, "step": 20675 }, { "epoch": 0.27, "learning_rate": 8.336703653356204e-05, "loss": 2.6653, "step": 20680 }, { "epoch": 0.27, "learning_rate": 8.33594348394628e-05, "loss": 2.7611, "step": 20685 }, { "epoch": 0.27, "learning_rate": 8.335183175542359e-05, "loss": 2.7058, "step": 20690 }, { "epoch": 0.27, "learning_rate": 8.334422728176124e-05, "loss": 2.5993, "step": 20695 }, { "epoch": 0.27, "learning_rate": 8.333662141879255e-05, "loss": 2.6578, "step": 20700 }, { "epoch": 0.27, "learning_rate": 8.332901416683445e-05, "loss": 2.7261, "step": 20705 }, { "epoch": 0.27, "learning_rate": 8.332140552620388e-05, "loss": 2.7115, "step": 20710 }, { "epoch": 0.27, "learning_rate": 8.33137954972179e-05, "loss": 2.7223, "step": 20715 }, { "epoch": 0.27, "learning_rate": 8.330618408019353e-05, "loss": 2.6145, "step": 20720 }, { "epoch": 0.27, "learning_rate": 8.329857127544791e-05, "loss": 2.6288, "step": 20725 }, { "epoch": 0.27, "learning_rate": 8.329095708329829e-05, "loss": 2.6341, "step": 20730 }, { "epoch": 0.27, "learning_rate": 8.328334150406185e-05, "loss": 2.6473, "step": 20735 }, { "epoch": 0.27, "learning_rate": 8.327572453805594e-05, "loss": 2.6506, "step": 20740 }, { "epoch": 0.27, "learning_rate": 8.326810618559793e-05, "loss": 2.6789, "step": 20745 }, { "epoch": 0.27, "learning_rate": 8.326048644700521e-05, "loss": 2.6792, "step": 20750 }, { "epoch": 0.27, "learning_rate": 8.325286532259526e-05, "loss": 2.6588, "step": 20755 }, { "epoch": 0.27, "learning_rate": 8.324524281268567e-05, "loss": 2.5004, "step": 20760 }, { "epoch": 0.27, "learning_rate": 8.323761891759399e-05, "loss": 2.7194, "step": 20765 }, { "epoch": 0.27, "learning_rate": 8.322999363763788e-05, "loss": 2.7634, "step": 20770 }, { "epoch": 0.27, "learning_rate": 8.322236697313506e-05, "loss": 2.5961, "step": 20775 }, { "epoch": 0.27, "learning_rate": 8.321473892440331e-05, "loss": 2.5988, "step": 20780 }, { "epoch": 0.27, "learning_rate": 8.320710949176042e-05, "loss": 2.7056, "step": 20785 }, { "epoch": 0.27, "learning_rate": 8.319947867552431e-05, "loss": 2.7001, "step": 20790 }, { "epoch": 0.27, "learning_rate": 8.31918464760129e-05, "loss": 2.7102, "step": 20795 }, { "epoch": 0.27, "learning_rate": 8.318421289354422e-05, "loss": 2.7279, "step": 20800 }, { "epoch": 0.27, "learning_rate": 8.31765779284363e-05, "loss": 2.5426, "step": 20805 }, { "epoch": 0.27, "learning_rate": 8.316894158100727e-05, "loss": 2.6975, "step": 20810 }, { "epoch": 0.27, "learning_rate": 8.316130385157527e-05, "loss": 2.7286, "step": 20815 }, { "epoch": 0.27, "learning_rate": 8.315366474045861e-05, "loss": 2.7039, "step": 20820 }, { "epoch": 0.27, "learning_rate": 8.314602424797549e-05, "loss": 2.6984, "step": 20825 }, { "epoch": 0.27, "learning_rate": 8.313838237444428e-05, "loss": 2.6484, "step": 20830 }, { "epoch": 0.27, "learning_rate": 8.31307391201834e-05, "loss": 2.7984, "step": 20835 }, { "epoch": 0.27, "learning_rate": 8.312309448551132e-05, "loss": 2.5797, "step": 20840 }, { "epoch": 0.27, "learning_rate": 8.311544847074653e-05, "loss": 2.7099, "step": 20845 }, { "epoch": 0.27, "learning_rate": 8.310780107620764e-05, "loss": 2.6002, "step": 20850 }, { "epoch": 0.27, "learning_rate": 8.310015230221324e-05, "loss": 2.66, "step": 20855 }, { "epoch": 0.27, "learning_rate": 8.309250214908204e-05, "loss": 2.6185, "step": 20860 }, { "epoch": 0.27, "learning_rate": 8.30848506171328e-05, "loss": 2.7035, "step": 20865 }, { "epoch": 0.27, "learning_rate": 8.30771977066843e-05, "loss": 2.7111, "step": 20870 }, { "epoch": 0.27, "learning_rate": 8.306954341805541e-05, "loss": 2.6904, "step": 20875 }, { "epoch": 0.27, "learning_rate": 8.306188775156509e-05, "loss": 2.6925, "step": 20880 }, { "epoch": 0.27, "learning_rate": 8.305423070753227e-05, "loss": 2.7175, "step": 20885 }, { "epoch": 0.27, "learning_rate": 8.304657228627599e-05, "loss": 2.623, "step": 20890 }, { "epoch": 0.27, "learning_rate": 8.303891248811537e-05, "loss": 2.5682, "step": 20895 }, { "epoch": 0.27, "learning_rate": 8.303125131336954e-05, "loss": 2.7765, "step": 20900 }, { "epoch": 0.27, "learning_rate": 8.30235887623577e-05, "loss": 2.56, "step": 20905 }, { "epoch": 0.27, "learning_rate": 8.301592483539913e-05, "loss": 2.6204, "step": 20910 }, { "epoch": 0.27, "learning_rate": 8.300825953281314e-05, "loss": 2.7145, "step": 20915 }, { "epoch": 0.27, "learning_rate": 8.300059285491914e-05, "loss": 2.6258, "step": 20920 }, { "epoch": 0.27, "learning_rate": 8.299292480203653e-05, "loss": 2.7156, "step": 20925 }, { "epoch": 0.27, "learning_rate": 8.298525537448482e-05, "loss": 2.7564, "step": 20930 }, { "epoch": 0.27, "learning_rate": 8.297758457258354e-05, "loss": 2.7622, "step": 20935 }, { "epoch": 0.27, "learning_rate": 8.296991239665233e-05, "loss": 2.6145, "step": 20940 }, { "epoch": 0.27, "learning_rate": 8.296223884701084e-05, "loss": 2.7101, "step": 20945 }, { "epoch": 0.27, "learning_rate": 8.29545639239788e-05, "loss": 2.7587, "step": 20950 }, { "epoch": 0.27, "learning_rate": 8.294688762787597e-05, "loss": 2.6862, "step": 20955 }, { "epoch": 0.27, "learning_rate": 8.293920995902221e-05, "loss": 2.684, "step": 20960 }, { "epoch": 0.27, "learning_rate": 8.293153091773741e-05, "loss": 2.636, "step": 20965 }, { "epoch": 0.27, "learning_rate": 8.29238505043415e-05, "loss": 2.5808, "step": 20970 }, { "epoch": 0.27, "learning_rate": 8.291616871915454e-05, "loss": 2.668, "step": 20975 }, { "epoch": 0.27, "learning_rate": 8.290848556249653e-05, "loss": 2.6256, "step": 20980 }, { "epoch": 0.27, "learning_rate": 8.290080103468765e-05, "loss": 2.676, "step": 20985 }, { "epoch": 0.27, "learning_rate": 8.289311513604806e-05, "loss": 2.6939, "step": 20990 }, { "epoch": 0.27, "learning_rate": 8.288542786689796e-05, "loss": 2.6659, "step": 20995 }, { "epoch": 0.27, "learning_rate": 8.287773922755769e-05, "loss": 2.7101, "step": 21000 }, { "epoch": 0.27, "learning_rate": 8.28700492183476e-05, "loss": 2.5722, "step": 21005 }, { "epoch": 0.27, "learning_rate": 8.286235783958809e-05, "loss": 2.6501, "step": 21010 }, { "epoch": 0.27, "learning_rate": 8.285466509159961e-05, "loss": 2.6319, "step": 21015 }, { "epoch": 0.27, "learning_rate": 8.284697097470271e-05, "loss": 2.5497, "step": 21020 }, { "epoch": 0.27, "learning_rate": 8.283927548921794e-05, "loss": 2.6615, "step": 21025 }, { "epoch": 0.27, "learning_rate": 8.283157863546597e-05, "loss": 2.6463, "step": 21030 }, { "epoch": 0.27, "learning_rate": 8.282388041376747e-05, "loss": 2.6292, "step": 21035 }, { "epoch": 0.27, "learning_rate": 8.28161808244432e-05, "loss": 2.7579, "step": 21040 }, { "epoch": 0.27, "learning_rate": 8.280847986781397e-05, "loss": 2.6955, "step": 21045 }, { "epoch": 0.27, "learning_rate": 8.280077754420062e-05, "loss": 2.5284, "step": 21050 }, { "epoch": 0.27, "learning_rate": 8.279307385392412e-05, "loss": 2.6662, "step": 21055 }, { "epoch": 0.27, "learning_rate": 8.27853687973054e-05, "loss": 2.7377, "step": 21060 }, { "epoch": 0.27, "learning_rate": 8.277766237466552e-05, "loss": 2.6745, "step": 21065 }, { "epoch": 0.27, "learning_rate": 8.276995458632557e-05, "loss": 2.4967, "step": 21070 }, { "epoch": 0.27, "learning_rate": 8.276224543260671e-05, "loss": 2.5895, "step": 21075 }, { "epoch": 0.27, "learning_rate": 8.275453491383012e-05, "loss": 2.6966, "step": 21080 }, { "epoch": 0.27, "learning_rate": 8.274682303031709e-05, "loss": 2.5978, "step": 21085 }, { "epoch": 0.27, "learning_rate": 8.27391097823889e-05, "loss": 2.793, "step": 21090 }, { "epoch": 0.27, "learning_rate": 8.273139517036699e-05, "loss": 2.6711, "step": 21095 }, { "epoch": 0.27, "learning_rate": 8.272367919457274e-05, "loss": 2.654, "step": 21100 }, { "epoch": 0.27, "learning_rate": 8.271596185532766e-05, "loss": 2.549, "step": 21105 }, { "epoch": 0.27, "learning_rate": 8.270824315295329e-05, "loss": 2.5855, "step": 21110 }, { "epoch": 0.27, "learning_rate": 8.270052308777125e-05, "loss": 2.5065, "step": 21115 }, { "epoch": 0.27, "learning_rate": 8.26928016601032e-05, "loss": 2.7069, "step": 21120 }, { "epoch": 0.27, "learning_rate": 8.268507887027084e-05, "loss": 2.6995, "step": 21125 }, { "epoch": 0.27, "learning_rate": 8.267735471859595e-05, "loss": 2.7616, "step": 21130 }, { "epoch": 0.27, "learning_rate": 8.266962920540035e-05, "loss": 2.7117, "step": 21135 }, { "epoch": 0.27, "learning_rate": 8.266190233100598e-05, "loss": 2.6087, "step": 21140 }, { "epoch": 0.27, "learning_rate": 8.265417409573472e-05, "loss": 2.5182, "step": 21145 }, { "epoch": 0.27, "learning_rate": 8.264644449990861e-05, "loss": 2.692, "step": 21150 }, { "epoch": 0.27, "learning_rate": 8.263871354384969e-05, "loss": 2.5651, "step": 21155 }, { "epoch": 0.27, "learning_rate": 8.263098122788008e-05, "loss": 2.5352, "step": 21160 }, { "epoch": 0.27, "learning_rate": 8.262324755232196e-05, "loss": 2.8059, "step": 21165 }, { "epoch": 0.27, "learning_rate": 8.261551251749755e-05, "loss": 2.7499, "step": 21170 }, { "epoch": 0.27, "learning_rate": 8.260777612372913e-05, "loss": 2.596, "step": 21175 }, { "epoch": 0.27, "learning_rate": 8.260003837133905e-05, "loss": 2.5691, "step": 21180 }, { "epoch": 0.27, "learning_rate": 8.259229926064969e-05, "loss": 2.7361, "step": 21185 }, { "epoch": 0.28, "learning_rate": 8.258455879198354e-05, "loss": 2.6353, "step": 21190 }, { "epoch": 0.28, "learning_rate": 8.257681696566308e-05, "loss": 2.6131, "step": 21195 }, { "epoch": 0.28, "learning_rate": 8.256907378201091e-05, "loss": 2.5666, "step": 21200 }, { "epoch": 0.28, "learning_rate": 8.256132924134961e-05, "loss": 2.5687, "step": 21205 }, { "epoch": 0.28, "learning_rate": 8.255358334400187e-05, "loss": 2.5278, "step": 21210 }, { "epoch": 0.28, "learning_rate": 8.254583609029046e-05, "loss": 2.6234, "step": 21215 }, { "epoch": 0.28, "learning_rate": 8.253808748053816e-05, "loss": 2.6939, "step": 21220 }, { "epoch": 0.28, "learning_rate": 8.25303375150678e-05, "loss": 2.7574, "step": 21225 }, { "epoch": 0.28, "learning_rate": 8.25225861942023e-05, "loss": 2.5599, "step": 21230 }, { "epoch": 0.28, "learning_rate": 8.251483351826464e-05, "loss": 2.686, "step": 21235 }, { "epoch": 0.28, "learning_rate": 8.25070794875778e-05, "loss": 2.7111, "step": 21240 }, { "epoch": 0.28, "learning_rate": 8.249932410246487e-05, "loss": 2.5956, "step": 21245 }, { "epoch": 0.28, "learning_rate": 8.249156736324904e-05, "loss": 2.687, "step": 21250 }, { "epoch": 0.28, "learning_rate": 8.24838092702534e-05, "loss": 2.71, "step": 21255 }, { "epoch": 0.28, "learning_rate": 8.247604982380128e-05, "loss": 2.647, "step": 21260 }, { "epoch": 0.28, "learning_rate": 8.246828902421595e-05, "loss": 2.7217, "step": 21265 }, { "epoch": 0.28, "learning_rate": 8.246052687182076e-05, "loss": 2.6174, "step": 21270 }, { "epoch": 0.28, "learning_rate": 8.245276336693912e-05, "loss": 2.59, "step": 21275 }, { "epoch": 0.28, "learning_rate": 8.244499850989452e-05, "loss": 2.5446, "step": 21280 }, { "epoch": 0.28, "learning_rate": 8.243723230101048e-05, "loss": 2.4713, "step": 21285 }, { "epoch": 0.28, "learning_rate": 8.242946474061058e-05, "loss": 2.6204, "step": 21290 }, { "epoch": 0.28, "learning_rate": 8.242169582901846e-05, "loss": 2.6755, "step": 21295 }, { "epoch": 0.28, "learning_rate": 8.241392556655783e-05, "loss": 2.7485, "step": 21300 }, { "epoch": 0.28, "learning_rate": 8.240615395355242e-05, "loss": 2.6256, "step": 21305 }, { "epoch": 0.28, "learning_rate": 8.239838099032606e-05, "loss": 2.7511, "step": 21310 }, { "epoch": 0.28, "learning_rate": 8.23906066772026e-05, "loss": 2.6919, "step": 21315 }, { "epoch": 0.28, "learning_rate": 8.238283101450597e-05, "loss": 2.5303, "step": 21320 }, { "epoch": 0.28, "learning_rate": 8.237505400256014e-05, "loss": 2.6149, "step": 21325 }, { "epoch": 0.28, "learning_rate": 8.236727564168914e-05, "loss": 2.7407, "step": 21330 }, { "epoch": 0.28, "learning_rate": 8.235949593221706e-05, "loss": 2.699, "step": 21335 }, { "epoch": 0.28, "learning_rate": 8.235171487446806e-05, "loss": 2.7285, "step": 21340 }, { "epoch": 0.28, "learning_rate": 8.234393246876635e-05, "loss": 2.7105, "step": 21345 }, { "epoch": 0.28, "learning_rate": 8.233614871543617e-05, "loss": 2.7458, "step": 21350 }, { "epoch": 0.28, "learning_rate": 8.232836361480183e-05, "loss": 2.7147, "step": 21355 }, { "epoch": 0.28, "learning_rate": 8.232057716718771e-05, "loss": 2.4798, "step": 21360 }, { "epoch": 0.28, "learning_rate": 8.231278937291825e-05, "loss": 2.7253, "step": 21365 }, { "epoch": 0.28, "learning_rate": 8.230500023231789e-05, "loss": 2.5622, "step": 21370 }, { "epoch": 0.28, "learning_rate": 8.229720974571123e-05, "loss": 2.6152, "step": 21375 }, { "epoch": 0.28, "learning_rate": 8.228941791342279e-05, "loss": 2.4962, "step": 21380 }, { "epoch": 0.28, "learning_rate": 8.22816247357773e-05, "loss": 2.4978, "step": 21385 }, { "epoch": 0.28, "learning_rate": 8.227383021309943e-05, "loss": 2.7241, "step": 21390 }, { "epoch": 0.28, "learning_rate": 8.226603434571394e-05, "loss": 2.6815, "step": 21395 }, { "epoch": 0.28, "learning_rate": 8.225823713394564e-05, "loss": 2.5558, "step": 21400 }, { "epoch": 0.28, "learning_rate": 8.225043857811943e-05, "loss": 2.5236, "step": 21405 }, { "epoch": 0.28, "learning_rate": 8.224263867856024e-05, "loss": 2.6786, "step": 21410 }, { "epoch": 0.28, "learning_rate": 8.223483743559301e-05, "loss": 2.7092, "step": 21415 }, { "epoch": 0.28, "learning_rate": 8.222703484954286e-05, "loss": 2.6888, "step": 21420 }, { "epoch": 0.28, "learning_rate": 8.221923092073484e-05, "loss": 2.7711, "step": 21425 }, { "epoch": 0.28, "learning_rate": 8.22114256494941e-05, "loss": 2.586, "step": 21430 }, { "epoch": 0.28, "learning_rate": 8.220361903614588e-05, "loss": 2.6616, "step": 21435 }, { "epoch": 0.28, "learning_rate": 8.219581108101544e-05, "loss": 2.5928, "step": 21440 }, { "epoch": 0.28, "learning_rate": 8.218800178442807e-05, "loss": 2.69, "step": 21445 }, { "epoch": 0.28, "learning_rate": 8.218019114670921e-05, "loss": 2.7387, "step": 21450 }, { "epoch": 0.28, "learning_rate": 8.217237916818423e-05, "loss": 2.6774, "step": 21455 }, { "epoch": 0.28, "learning_rate": 8.216456584917866e-05, "loss": 2.6079, "step": 21460 }, { "epoch": 0.28, "learning_rate": 8.215675119001804e-05, "loss": 2.7389, "step": 21465 }, { "epoch": 0.28, "learning_rate": 8.214893519102797e-05, "loss": 2.6718, "step": 21470 }, { "epoch": 0.28, "learning_rate": 8.21411178525341e-05, "loss": 2.5979, "step": 21475 }, { "epoch": 0.28, "learning_rate": 8.213329917486215e-05, "loss": 2.6875, "step": 21480 }, { "epoch": 0.28, "learning_rate": 8.21254791583379e-05, "loss": 2.6498, "step": 21485 }, { "epoch": 0.28, "learning_rate": 8.211765780328716e-05, "loss": 2.668, "step": 21490 }, { "epoch": 0.28, "learning_rate": 8.210983511003582e-05, "loss": 2.6581, "step": 21495 }, { "epoch": 0.28, "learning_rate": 8.210201107890981e-05, "loss": 2.688, "step": 21500 }, { "epoch": 0.28, "learning_rate": 8.209418571023513e-05, "loss": 2.7797, "step": 21505 }, { "epoch": 0.28, "learning_rate": 8.208635900433783e-05, "loss": 2.6636, "step": 21510 }, { "epoch": 0.28, "learning_rate": 8.207853096154401e-05, "loss": 2.6392, "step": 21515 }, { "epoch": 0.28, "learning_rate": 8.207070158217981e-05, "loss": 2.6626, "step": 21520 }, { "epoch": 0.28, "learning_rate": 8.206287086657147e-05, "loss": 2.6158, "step": 21525 }, { "epoch": 0.28, "learning_rate": 8.205503881504528e-05, "loss": 2.524, "step": 21530 }, { "epoch": 0.28, "learning_rate": 8.204720542792753e-05, "loss": 2.6366, "step": 21535 }, { "epoch": 0.28, "learning_rate": 8.203937070554461e-05, "loss": 2.6433, "step": 21540 }, { "epoch": 0.28, "learning_rate": 8.203153464822298e-05, "loss": 2.7314, "step": 21545 }, { "epoch": 0.28, "learning_rate": 8.20236972562891e-05, "loss": 2.6095, "step": 21550 }, { "epoch": 0.28, "learning_rate": 8.201585853006953e-05, "loss": 2.7353, "step": 21555 }, { "epoch": 0.28, "learning_rate": 8.20080184698909e-05, "loss": 2.6896, "step": 21560 }, { "epoch": 0.28, "learning_rate": 8.200017707607985e-05, "loss": 2.599, "step": 21565 }, { "epoch": 0.28, "learning_rate": 8.199233434896309e-05, "loss": 2.5877, "step": 21570 }, { "epoch": 0.28, "learning_rate": 8.198449028886741e-05, "loss": 2.6365, "step": 21575 }, { "epoch": 0.28, "learning_rate": 8.197664489611962e-05, "loss": 2.6601, "step": 21580 }, { "epoch": 0.28, "learning_rate": 8.196879817104662e-05, "loss": 2.6251, "step": 21585 }, { "epoch": 0.28, "learning_rate": 8.196095011397534e-05, "loss": 2.6421, "step": 21590 }, { "epoch": 0.28, "learning_rate": 8.195310072523277e-05, "loss": 2.6674, "step": 21595 }, { "epoch": 0.28, "learning_rate": 8.194525000514594e-05, "loss": 2.6363, "step": 21600 }, { "epoch": 0.28, "learning_rate": 8.1937397954042e-05, "loss": 2.6058, "step": 21605 }, { "epoch": 0.28, "learning_rate": 8.192954457224809e-05, "loss": 2.5569, "step": 21610 }, { "epoch": 0.28, "learning_rate": 8.19216898600914e-05, "loss": 2.495, "step": 21615 }, { "epoch": 0.28, "learning_rate": 8.191383381789926e-05, "loss": 2.6498, "step": 21620 }, { "epoch": 0.28, "learning_rate": 8.190597644599894e-05, "loss": 2.6444, "step": 21625 }, { "epoch": 0.28, "learning_rate": 8.189811774471783e-05, "loss": 2.6434, "step": 21630 }, { "epoch": 0.28, "learning_rate": 8.18902577143834e-05, "loss": 2.6228, "step": 21635 }, { "epoch": 0.28, "learning_rate": 8.188239635532311e-05, "loss": 2.677, "step": 21640 }, { "epoch": 0.28, "learning_rate": 8.187453366786453e-05, "loss": 2.7457, "step": 21645 }, { "epoch": 0.28, "learning_rate": 8.186666965233524e-05, "loss": 2.6851, "step": 21650 }, { "epoch": 0.28, "learning_rate": 8.185880430906292e-05, "loss": 2.6877, "step": 21655 }, { "epoch": 0.28, "learning_rate": 8.185093763837528e-05, "loss": 2.6376, "step": 21660 }, { "epoch": 0.28, "learning_rate": 8.184306964060009e-05, "loss": 2.5922, "step": 21665 }, { "epoch": 0.28, "learning_rate": 8.183520031606516e-05, "loss": 2.8112, "step": 21670 }, { "epoch": 0.28, "learning_rate": 8.182732966509838e-05, "loss": 2.7352, "step": 21675 }, { "epoch": 0.28, "learning_rate": 8.181945768802768e-05, "loss": 2.5936, "step": 21680 }, { "epoch": 0.28, "learning_rate": 8.181158438518107e-05, "loss": 2.6268, "step": 21685 }, { "epoch": 0.28, "learning_rate": 8.180370975688657e-05, "loss": 2.5562, "step": 21690 }, { "epoch": 0.28, "learning_rate": 8.179583380347228e-05, "loss": 2.685, "step": 21695 }, { "epoch": 0.28, "learning_rate": 8.17879565252664e-05, "loss": 2.719, "step": 21700 }, { "epoch": 0.28, "learning_rate": 8.178007792259709e-05, "loss": 2.7457, "step": 21705 }, { "epoch": 0.28, "learning_rate": 8.177219799579264e-05, "loss": 2.6995, "step": 21710 }, { "epoch": 0.28, "learning_rate": 8.176431674518137e-05, "loss": 2.6588, "step": 21715 }, { "epoch": 0.28, "learning_rate": 8.175643417109165e-05, "loss": 2.6407, "step": 21720 }, { "epoch": 0.28, "learning_rate": 8.174855027385193e-05, "loss": 2.741, "step": 21725 }, { "epoch": 0.28, "learning_rate": 8.174066505379067e-05, "loss": 2.7228, "step": 21730 }, { "epoch": 0.28, "learning_rate": 8.173277851123643e-05, "loss": 2.6923, "step": 21735 }, { "epoch": 0.28, "learning_rate": 8.17248906465178e-05, "loss": 2.6285, "step": 21740 }, { "epoch": 0.28, "learning_rate": 8.171700145996343e-05, "loss": 2.7233, "step": 21745 }, { "epoch": 0.28, "learning_rate": 8.170911095190206e-05, "loss": 2.7299, "step": 21750 }, { "epoch": 0.28, "learning_rate": 8.17012191226624e-05, "loss": 2.6289, "step": 21755 }, { "epoch": 0.28, "learning_rate": 8.169332597257331e-05, "loss": 2.7496, "step": 21760 }, { "epoch": 0.28, "learning_rate": 8.168543150196361e-05, "loss": 2.7153, "step": 21765 }, { "epoch": 0.28, "learning_rate": 8.16775357111623e-05, "loss": 2.6522, "step": 21770 }, { "epoch": 0.28, "learning_rate": 8.166963860049832e-05, "loss": 2.6262, "step": 21775 }, { "epoch": 0.28, "learning_rate": 8.166174017030072e-05, "loss": 2.5992, "step": 21780 }, { "epoch": 0.28, "learning_rate": 8.165384042089858e-05, "loss": 2.6361, "step": 21785 }, { "epoch": 0.28, "learning_rate": 8.164593935262103e-05, "loss": 2.7164, "step": 21790 }, { "epoch": 0.28, "learning_rate": 8.163803696579733e-05, "loss": 2.5906, "step": 21795 }, { "epoch": 0.28, "learning_rate": 8.163013326075668e-05, "loss": 2.7087, "step": 21800 }, { "epoch": 0.28, "learning_rate": 8.162222823782843e-05, "loss": 2.606, "step": 21805 }, { "epoch": 0.28, "learning_rate": 8.161432189734193e-05, "loss": 2.6788, "step": 21810 }, { "epoch": 0.28, "learning_rate": 8.160641423962661e-05, "loss": 2.6078, "step": 21815 }, { "epoch": 0.28, "learning_rate": 8.159850526501195e-05, "loss": 2.5195, "step": 21820 }, { "epoch": 0.28, "learning_rate": 8.159059497382746e-05, "loss": 2.5051, "step": 21825 }, { "epoch": 0.28, "learning_rate": 8.158268336640275e-05, "loss": 2.6051, "step": 21830 }, { "epoch": 0.28, "learning_rate": 8.157477044306745e-05, "loss": 2.6291, "step": 21835 }, { "epoch": 0.28, "learning_rate": 8.156685620415125e-05, "loss": 2.6693, "step": 21840 }, { "epoch": 0.28, "learning_rate": 8.155894064998392e-05, "loss": 2.5813, "step": 21845 }, { "epoch": 0.28, "learning_rate": 8.155102378089527e-05, "loss": 2.5809, "step": 21850 }, { "epoch": 0.28, "learning_rate": 8.154310559721514e-05, "loss": 2.5984, "step": 21855 }, { "epoch": 0.28, "learning_rate": 8.153518609927344e-05, "loss": 2.6165, "step": 21860 }, { "epoch": 0.28, "learning_rate": 8.152726528740017e-05, "loss": 2.6594, "step": 21865 }, { "epoch": 0.28, "learning_rate": 8.151934316192534e-05, "loss": 2.6684, "step": 21870 }, { "epoch": 0.28, "learning_rate": 8.151141972317902e-05, "loss": 2.6319, "step": 21875 }, { "epoch": 0.28, "learning_rate": 8.150349497149136e-05, "loss": 2.608, "step": 21880 }, { "epoch": 0.28, "learning_rate": 8.149556890719253e-05, "loss": 2.5742, "step": 21885 }, { "epoch": 0.28, "learning_rate": 8.148764153061279e-05, "loss": 2.6658, "step": 21890 }, { "epoch": 0.28, "learning_rate": 8.147971284208245e-05, "loss": 2.7084, "step": 21895 }, { "epoch": 0.28, "learning_rate": 8.147178284193184e-05, "loss": 2.5945, "step": 21900 }, { "epoch": 0.28, "learning_rate": 8.146385153049139e-05, "loss": 2.7777, "step": 21905 }, { "epoch": 0.28, "learning_rate": 8.145591890809154e-05, "loss": 2.6688, "step": 21910 }, { "epoch": 0.28, "learning_rate": 8.144798497506282e-05, "loss": 2.5224, "step": 21915 }, { "epoch": 0.28, "learning_rate": 8.144004973173578e-05, "loss": 2.6579, "step": 21920 }, { "epoch": 0.28, "learning_rate": 8.14321131784411e-05, "loss": 2.6496, "step": 21925 }, { "epoch": 0.28, "learning_rate": 8.142417531550941e-05, "loss": 2.6305, "step": 21930 }, { "epoch": 0.28, "learning_rate": 8.141623614327145e-05, "loss": 2.6144, "step": 21935 }, { "epoch": 0.28, "learning_rate": 8.140829566205803e-05, "loss": 2.6314, "step": 21940 }, { "epoch": 0.28, "learning_rate": 8.14003538722e-05, "loss": 2.6927, "step": 21945 }, { "epoch": 0.28, "learning_rate": 8.139241077402823e-05, "loss": 2.6517, "step": 21950 }, { "epoch": 0.28, "learning_rate": 8.138446636787369e-05, "loss": 2.645, "step": 21955 }, { "epoch": 0.28, "learning_rate": 8.13765206540674e-05, "loss": 2.6815, "step": 21960 }, { "epoch": 0.29, "learning_rate": 8.136857363294041e-05, "loss": 2.7527, "step": 21965 }, { "epoch": 0.29, "learning_rate": 8.136062530482382e-05, "loss": 2.6455, "step": 21970 }, { "epoch": 0.29, "learning_rate": 8.135267567004884e-05, "loss": 2.7885, "step": 21975 }, { "epoch": 0.29, "learning_rate": 8.134472472894668e-05, "loss": 2.564, "step": 21980 }, { "epoch": 0.29, "learning_rate": 8.133677248184858e-05, "loss": 2.6081, "step": 21985 }, { "epoch": 0.29, "learning_rate": 8.132881892908595e-05, "loss": 2.5995, "step": 21990 }, { "epoch": 0.29, "learning_rate": 8.132086407099013e-05, "loss": 2.7027, "step": 21995 }, { "epoch": 0.29, "learning_rate": 8.131290790789257e-05, "loss": 2.5824, "step": 22000 }, { "epoch": 0.29, "learning_rate": 8.130495044012478e-05, "loss": 2.6381, "step": 22005 }, { "epoch": 0.29, "learning_rate": 8.12969916680183e-05, "loss": 2.6623, "step": 22010 }, { "epoch": 0.29, "learning_rate": 8.128903159190472e-05, "loss": 2.6887, "step": 22015 }, { "epoch": 0.29, "learning_rate": 8.128107021211575e-05, "loss": 2.6819, "step": 22020 }, { "epoch": 0.29, "learning_rate": 8.127310752898308e-05, "loss": 2.7064, "step": 22025 }, { "epoch": 0.29, "learning_rate": 8.126514354283845e-05, "loss": 2.6041, "step": 22030 }, { "epoch": 0.29, "learning_rate": 8.125717825401375e-05, "loss": 2.5992, "step": 22035 }, { "epoch": 0.29, "learning_rate": 8.12492116628408e-05, "loss": 2.5859, "step": 22040 }, { "epoch": 0.29, "learning_rate": 8.124124376965155e-05, "loss": 2.7085, "step": 22045 }, { "epoch": 0.29, "learning_rate": 8.123327457477798e-05, "loss": 2.6443, "step": 22050 }, { "epoch": 0.29, "learning_rate": 8.122530407855216e-05, "loss": 2.6591, "step": 22055 }, { "epoch": 0.29, "learning_rate": 8.121733228130617e-05, "loss": 2.6626, "step": 22060 }, { "epoch": 0.29, "learning_rate": 8.120935918337213e-05, "loss": 2.7612, "step": 22065 }, { "epoch": 0.29, "learning_rate": 8.120138478508231e-05, "loss": 2.6394, "step": 22070 }, { "epoch": 0.29, "learning_rate": 8.119340908676889e-05, "loss": 2.7216, "step": 22075 }, { "epoch": 0.29, "learning_rate": 8.118543208876423e-05, "loss": 2.6379, "step": 22080 }, { "epoch": 0.29, "learning_rate": 8.117745379140068e-05, "loss": 2.6647, "step": 22085 }, { "epoch": 0.29, "learning_rate": 8.116947419501069e-05, "loss": 2.6435, "step": 22090 }, { "epoch": 0.29, "learning_rate": 8.116149329992668e-05, "loss": 2.6694, "step": 22095 }, { "epoch": 0.29, "learning_rate": 8.115351110648122e-05, "loss": 2.6859, "step": 22100 }, { "epoch": 0.29, "learning_rate": 8.114552761500688e-05, "loss": 2.6548, "step": 22105 }, { "epoch": 0.29, "learning_rate": 8.11375428258363e-05, "loss": 2.6775, "step": 22110 }, { "epoch": 0.29, "learning_rate": 8.112955673930218e-05, "loss": 2.6447, "step": 22115 }, { "epoch": 0.29, "learning_rate": 8.112156935573724e-05, "loss": 2.689, "step": 22120 }, { "epoch": 0.29, "learning_rate": 8.11135806754743e-05, "loss": 2.6003, "step": 22125 }, { "epoch": 0.29, "learning_rate": 8.11055906988462e-05, "loss": 2.5865, "step": 22130 }, { "epoch": 0.29, "learning_rate": 8.109759942618584e-05, "loss": 2.6172, "step": 22135 }, { "epoch": 0.29, "learning_rate": 8.108960685782622e-05, "loss": 2.597, "step": 22140 }, { "epoch": 0.29, "learning_rate": 8.108161299410031e-05, "loss": 2.6025, "step": 22145 }, { "epoch": 0.29, "learning_rate": 8.107361783534121e-05, "loss": 2.6799, "step": 22150 }, { "epoch": 0.29, "learning_rate": 8.106562138188204e-05, "loss": 2.5934, "step": 22155 }, { "epoch": 0.29, "learning_rate": 8.105762363405593e-05, "loss": 2.8126, "step": 22160 }, { "epoch": 0.29, "learning_rate": 8.104962459219616e-05, "loss": 2.6037, "step": 22165 }, { "epoch": 0.29, "learning_rate": 8.104162425663602e-05, "loss": 2.588, "step": 22170 }, { "epoch": 0.29, "learning_rate": 8.103362262770881e-05, "loss": 2.7011, "step": 22175 }, { "epoch": 0.29, "learning_rate": 8.102561970574798e-05, "loss": 2.6358, "step": 22180 }, { "epoch": 0.29, "learning_rate": 8.10176154910869e-05, "loss": 2.6638, "step": 22185 }, { "epoch": 0.29, "learning_rate": 8.100960998405914e-05, "loss": 2.667, "step": 22190 }, { "epoch": 0.29, "learning_rate": 8.10016031849982e-05, "loss": 2.702, "step": 22195 }, { "epoch": 0.29, "learning_rate": 8.099359509423772e-05, "loss": 2.6154, "step": 22200 }, { "epoch": 0.29, "learning_rate": 8.098558571211135e-05, "loss": 2.5878, "step": 22205 }, { "epoch": 0.29, "learning_rate": 8.097757503895282e-05, "loss": 2.6002, "step": 22210 }, { "epoch": 0.29, "learning_rate": 8.096956307509588e-05, "loss": 2.5681, "step": 22215 }, { "epoch": 0.29, "learning_rate": 8.096154982087438e-05, "loss": 2.5717, "step": 22220 }, { "epoch": 0.29, "learning_rate": 8.095353527662215e-05, "loss": 2.7076, "step": 22225 }, { "epoch": 0.29, "learning_rate": 8.094551944267317e-05, "loss": 2.6471, "step": 22230 }, { "epoch": 0.29, "learning_rate": 8.093750231936139e-05, "loss": 2.7476, "step": 22235 }, { "epoch": 0.29, "learning_rate": 8.092948390702087e-05, "loss": 2.7439, "step": 22240 }, { "epoch": 0.29, "learning_rate": 8.092146420598568e-05, "loss": 2.5855, "step": 22245 }, { "epoch": 0.29, "learning_rate": 8.091344321658999e-05, "loss": 2.6788, "step": 22250 }, { "epoch": 0.29, "learning_rate": 8.090542093916799e-05, "loss": 2.6125, "step": 22255 }, { "epoch": 0.29, "learning_rate": 8.089739737405392e-05, "loss": 2.6467, "step": 22260 }, { "epoch": 0.29, "learning_rate": 8.088937252158211e-05, "loss": 2.5796, "step": 22265 }, { "epoch": 0.29, "learning_rate": 8.088134638208689e-05, "loss": 2.5999, "step": 22270 }, { "epoch": 0.29, "learning_rate": 8.08733189559027e-05, "loss": 2.599, "step": 22275 }, { "epoch": 0.29, "learning_rate": 8.0865290243364e-05, "loss": 2.7195, "step": 22280 }, { "epoch": 0.29, "learning_rate": 8.08572602448053e-05, "loss": 2.5578, "step": 22285 }, { "epoch": 0.29, "learning_rate": 8.084922896056117e-05, "loss": 2.7127, "step": 22290 }, { "epoch": 0.29, "learning_rate": 8.084119639096628e-05, "loss": 2.6408, "step": 22295 }, { "epoch": 0.29, "learning_rate": 8.083316253635527e-05, "loss": 2.5825, "step": 22300 }, { "epoch": 0.29, "learning_rate": 8.08251273970629e-05, "loss": 2.6977, "step": 22305 }, { "epoch": 0.29, "learning_rate": 8.081709097342394e-05, "loss": 2.5751, "step": 22310 }, { "epoch": 0.29, "learning_rate": 8.080905326577324e-05, "loss": 2.6481, "step": 22315 }, { "epoch": 0.29, "learning_rate": 8.080101427444568e-05, "loss": 2.6071, "step": 22320 }, { "epoch": 0.29, "learning_rate": 8.079297399977624e-05, "loss": 2.5982, "step": 22325 }, { "epoch": 0.29, "learning_rate": 8.07849324420999e-05, "loss": 2.7175, "step": 22330 }, { "epoch": 0.29, "learning_rate": 8.077688960175172e-05, "loss": 2.5193, "step": 22335 }, { "epoch": 0.29, "learning_rate": 8.076884547906681e-05, "loss": 2.6606, "step": 22340 }, { "epoch": 0.29, "learning_rate": 8.076080007438034e-05, "loss": 2.5763, "step": 22345 }, { "epoch": 0.29, "learning_rate": 8.075275338802752e-05, "loss": 2.4622, "step": 22350 }, { "epoch": 0.29, "learning_rate": 8.074470542034362e-05, "loss": 2.6799, "step": 22355 }, { "epoch": 0.29, "learning_rate": 8.073665617166397e-05, "loss": 2.6886, "step": 22360 }, { "epoch": 0.29, "learning_rate": 8.072860564232393e-05, "loss": 2.6741, "step": 22365 }, { "epoch": 0.29, "learning_rate": 8.072055383265895e-05, "loss": 2.6671, "step": 22370 }, { "epoch": 0.29, "learning_rate": 8.071250074300451e-05, "loss": 2.6501, "step": 22375 }, { "epoch": 0.29, "learning_rate": 8.070444637369612e-05, "loss": 2.5751, "step": 22380 }, { "epoch": 0.29, "learning_rate": 8.06963907250694e-05, "loss": 2.6206, "step": 22385 }, { "epoch": 0.29, "learning_rate": 8.068833379746e-05, "loss": 2.6075, "step": 22390 }, { "epoch": 0.29, "learning_rate": 8.068027559120359e-05, "loss": 2.7315, "step": 22395 }, { "epoch": 0.29, "learning_rate": 8.067221610663594e-05, "loss": 2.5683, "step": 22400 }, { "epoch": 0.29, "learning_rate": 8.066415534409281e-05, "loss": 2.6269, "step": 22405 }, { "epoch": 0.29, "learning_rate": 8.065609330391013e-05, "loss": 2.5524, "step": 22410 }, { "epoch": 0.29, "learning_rate": 8.064802998642374e-05, "loss": 2.5079, "step": 22415 }, { "epoch": 0.29, "learning_rate": 8.063996539196962e-05, "loss": 2.6901, "step": 22420 }, { "epoch": 0.29, "learning_rate": 8.063189952088384e-05, "loss": 2.6151, "step": 22425 }, { "epoch": 0.29, "learning_rate": 8.062383237350239e-05, "loss": 2.6766, "step": 22430 }, { "epoch": 0.29, "learning_rate": 8.061576395016146e-05, "loss": 2.5226, "step": 22435 }, { "epoch": 0.29, "learning_rate": 8.060769425119718e-05, "loss": 2.747, "step": 22440 }, { "epoch": 0.29, "learning_rate": 8.05996232769458e-05, "loss": 2.6213, "step": 22445 }, { "epoch": 0.29, "learning_rate": 8.059155102774358e-05, "loss": 2.7423, "step": 22450 }, { "epoch": 0.29, "learning_rate": 8.058347750392687e-05, "loss": 2.5396, "step": 22455 }, { "epoch": 0.29, "learning_rate": 8.057540270583205e-05, "loss": 2.7467, "step": 22460 }, { "epoch": 0.29, "learning_rate": 8.05673266337956e-05, "loss": 2.6436, "step": 22465 }, { "epoch": 0.29, "learning_rate": 8.055924928815397e-05, "loss": 2.6393, "step": 22470 }, { "epoch": 0.29, "learning_rate": 8.055117066924372e-05, "loss": 2.5901, "step": 22475 }, { "epoch": 0.29, "learning_rate": 8.054309077740143e-05, "loss": 2.6043, "step": 22480 }, { "epoch": 0.29, "learning_rate": 8.053500961296381e-05, "loss": 2.6541, "step": 22485 }, { "epoch": 0.29, "learning_rate": 8.05269271762675e-05, "loss": 2.6758, "step": 22490 }, { "epoch": 0.29, "learning_rate": 8.051884346764931e-05, "loss": 2.6417, "step": 22495 }, { "epoch": 0.29, "learning_rate": 8.051075848744603e-05, "loss": 2.5378, "step": 22500 }, { "epoch": 0.29, "learning_rate": 8.05026722359945e-05, "loss": 2.4844, "step": 22505 }, { "epoch": 0.29, "learning_rate": 8.04945847136317e-05, "loss": 2.5527, "step": 22510 }, { "epoch": 0.29, "learning_rate": 8.048649592069455e-05, "loss": 2.5341, "step": 22515 }, { "epoch": 0.29, "learning_rate": 8.047840585752009e-05, "loss": 2.6029, "step": 22520 }, { "epoch": 0.29, "learning_rate": 8.04703145244454e-05, "loss": 2.4807, "step": 22525 }, { "epoch": 0.29, "learning_rate": 8.046222192180761e-05, "loss": 2.6686, "step": 22530 }, { "epoch": 0.29, "learning_rate": 8.04541280499439e-05, "loss": 2.6881, "step": 22535 }, { "epoch": 0.29, "learning_rate": 8.044603290919151e-05, "loss": 2.5881, "step": 22540 }, { "epoch": 0.29, "learning_rate": 8.043793649988773e-05, "loss": 2.5875, "step": 22545 }, { "epoch": 0.29, "learning_rate": 8.04298388223699e-05, "loss": 2.5412, "step": 22550 }, { "epoch": 0.29, "learning_rate": 8.042173987697538e-05, "loss": 2.4835, "step": 22555 }, { "epoch": 0.29, "learning_rate": 8.041363966404168e-05, "loss": 2.6698, "step": 22560 }, { "epoch": 0.29, "learning_rate": 8.040553818390625e-05, "loss": 2.7053, "step": 22565 }, { "epoch": 0.29, "learning_rate": 8.039743543690667e-05, "loss": 2.6189, "step": 22570 }, { "epoch": 0.29, "learning_rate": 8.038933142338054e-05, "loss": 2.6749, "step": 22575 }, { "epoch": 0.29, "learning_rate": 8.038122614366552e-05, "loss": 2.6385, "step": 22580 }, { "epoch": 0.29, "learning_rate": 8.037311959809933e-05, "loss": 2.6188, "step": 22585 }, { "epoch": 0.29, "learning_rate": 8.036501178701969e-05, "loss": 2.6714, "step": 22590 }, { "epoch": 0.29, "learning_rate": 8.035690271076444e-05, "loss": 2.6624, "step": 22595 }, { "epoch": 0.29, "learning_rate": 8.034879236967149e-05, "loss": 2.5642, "step": 22600 }, { "epoch": 0.29, "learning_rate": 8.03406807640787e-05, "loss": 2.7296, "step": 22605 }, { "epoch": 0.29, "learning_rate": 8.03325678943241e-05, "loss": 2.5513, "step": 22610 }, { "epoch": 0.29, "learning_rate": 8.032445376074566e-05, "loss": 2.5818, "step": 22615 }, { "epoch": 0.29, "learning_rate": 8.031633836368152e-05, "loss": 2.5369, "step": 22620 }, { "epoch": 0.29, "learning_rate": 8.030822170346977e-05, "loss": 2.6958, "step": 22625 }, { "epoch": 0.29, "learning_rate": 8.03001037804486e-05, "loss": 2.5842, "step": 22630 }, { "epoch": 0.29, "learning_rate": 8.029198459495626e-05, "loss": 2.6953, "step": 22635 }, { "epoch": 0.29, "learning_rate": 8.028386414733105e-05, "loss": 2.5982, "step": 22640 }, { "epoch": 0.29, "learning_rate": 8.027574243791129e-05, "loss": 2.6611, "step": 22645 }, { "epoch": 0.29, "learning_rate": 8.026761946703538e-05, "loss": 2.6385, "step": 22650 }, { "epoch": 0.29, "learning_rate": 8.025949523504177e-05, "loss": 2.5025, "step": 22655 }, { "epoch": 0.29, "learning_rate": 8.025136974226899e-05, "loss": 2.6942, "step": 22660 }, { "epoch": 0.29, "learning_rate": 8.024324298905555e-05, "loss": 2.6112, "step": 22665 }, { "epoch": 0.29, "learning_rate": 8.023511497574008e-05, "loss": 2.6064, "step": 22670 }, { "epoch": 0.29, "learning_rate": 8.022698570266123e-05, "loss": 2.6477, "step": 22675 }, { "epoch": 0.29, "learning_rate": 8.02188551701577e-05, "loss": 2.5931, "step": 22680 }, { "epoch": 0.29, "learning_rate": 8.021072337856827e-05, "loss": 2.6853, "step": 22685 }, { "epoch": 0.29, "learning_rate": 8.020259032823176e-05, "loss": 2.5583, "step": 22690 }, { "epoch": 0.29, "learning_rate": 8.019445601948704e-05, "loss": 2.5673, "step": 22695 }, { "epoch": 0.29, "learning_rate": 8.0186320452673e-05, "loss": 2.5257, "step": 22700 }, { "epoch": 0.29, "learning_rate": 8.017818362812866e-05, "loss": 2.5978, "step": 22705 }, { "epoch": 0.29, "learning_rate": 8.017004554619298e-05, "loss": 2.6299, "step": 22710 }, { "epoch": 0.29, "learning_rate": 8.016190620720512e-05, "loss": 2.6105, "step": 22715 }, { "epoch": 0.29, "learning_rate": 8.015376561150414e-05, "loss": 2.5013, "step": 22720 }, { "epoch": 0.29, "learning_rate": 8.014562375942925e-05, "loss": 2.5932, "step": 22725 }, { "epoch": 0.29, "learning_rate": 8.01374806513197e-05, "loss": 2.6433, "step": 22730 }, { "epoch": 0.3, "learning_rate": 8.012933628751475e-05, "loss": 2.6439, "step": 22735 }, { "epoch": 0.3, "learning_rate": 8.012119066835375e-05, "loss": 2.5822, "step": 22740 }, { "epoch": 0.3, "learning_rate": 8.01130437941761e-05, "loss": 2.6151, "step": 22745 }, { "epoch": 0.3, "learning_rate": 8.010489566532124e-05, "loss": 2.5353, "step": 22750 }, { "epoch": 0.3, "learning_rate": 8.009674628212866e-05, "loss": 2.5456, "step": 22755 }, { "epoch": 0.3, "learning_rate": 8.008859564493791e-05, "loss": 2.5444, "step": 22760 }, { "epoch": 0.3, "learning_rate": 8.00804437540886e-05, "loss": 2.6732, "step": 22765 }, { "epoch": 0.3, "learning_rate": 8.007229060992038e-05, "loss": 2.6486, "step": 22770 }, { "epoch": 0.3, "learning_rate": 8.006413621277294e-05, "loss": 2.4412, "step": 22775 }, { "epoch": 0.3, "learning_rate": 8.005598056298605e-05, "loss": 2.5534, "step": 22780 }, { "epoch": 0.3, "learning_rate": 8.004782366089954e-05, "loss": 2.6916, "step": 22785 }, { "epoch": 0.3, "learning_rate": 8.003966550685324e-05, "loss": 2.6654, "step": 22790 }, { "epoch": 0.3, "learning_rate": 8.003150610118708e-05, "loss": 2.6344, "step": 22795 }, { "epoch": 0.3, "learning_rate": 8.002334544424102e-05, "loss": 2.7656, "step": 22800 }, { "epoch": 0.3, "learning_rate": 8.001518353635507e-05, "loss": 2.6212, "step": 22805 }, { "epoch": 0.3, "learning_rate": 8.000702037786931e-05, "loss": 2.6765, "step": 22810 }, { "epoch": 0.3, "learning_rate": 7.999885596912387e-05, "loss": 2.7703, "step": 22815 }, { "epoch": 0.3, "learning_rate": 7.999069031045894e-05, "loss": 2.63, "step": 22820 }, { "epoch": 0.3, "learning_rate": 7.99825234022147e-05, "loss": 2.6818, "step": 22825 }, { "epoch": 0.3, "learning_rate": 7.997435524473148e-05, "loss": 2.6193, "step": 22830 }, { "epoch": 0.3, "learning_rate": 7.996618583834955e-05, "loss": 2.572, "step": 22835 }, { "epoch": 0.3, "learning_rate": 7.995801518340934e-05, "loss": 2.6434, "step": 22840 }, { "epoch": 0.3, "learning_rate": 7.994984328025128e-05, "loss": 2.6305, "step": 22845 }, { "epoch": 0.3, "learning_rate": 7.994167012921586e-05, "loss": 2.6469, "step": 22850 }, { "epoch": 0.3, "learning_rate": 7.99334957306436e-05, "loss": 2.5702, "step": 22855 }, { "epoch": 0.3, "learning_rate": 7.99253200848751e-05, "loss": 2.6602, "step": 22860 }, { "epoch": 0.3, "learning_rate": 7.991714319225101e-05, "loss": 2.7906, "step": 22865 }, { "epoch": 0.3, "learning_rate": 7.9908965053112e-05, "loss": 2.6247, "step": 22870 }, { "epoch": 0.3, "learning_rate": 7.990078566779885e-05, "loss": 2.6585, "step": 22875 }, { "epoch": 0.3, "learning_rate": 7.989260503665234e-05, "loss": 2.6267, "step": 22880 }, { "epoch": 0.3, "learning_rate": 7.988442316001332e-05, "loss": 2.6495, "step": 22885 }, { "epoch": 0.3, "learning_rate": 7.987624003822272e-05, "loss": 2.6234, "step": 22890 }, { "epoch": 0.3, "learning_rate": 7.986805567162146e-05, "loss": 2.602, "step": 22895 }, { "epoch": 0.3, "learning_rate": 7.985987006055055e-05, "loss": 2.4819, "step": 22900 }, { "epoch": 0.3, "learning_rate": 7.985168320535106e-05, "loss": 2.54, "step": 22905 }, { "epoch": 0.3, "learning_rate": 7.984349510636408e-05, "loss": 2.6399, "step": 22910 }, { "epoch": 0.3, "learning_rate": 7.983530576393081e-05, "loss": 2.7313, "step": 22915 }, { "epoch": 0.3, "learning_rate": 7.982711517839244e-05, "loss": 2.6319, "step": 22920 }, { "epoch": 0.3, "learning_rate": 7.981892335009025e-05, "loss": 2.5765, "step": 22925 }, { "epoch": 0.3, "learning_rate": 7.981073027936551e-05, "loss": 2.6466, "step": 22930 }, { "epoch": 0.3, "learning_rate": 7.980253596655965e-05, "loss": 2.6922, "step": 22935 }, { "epoch": 0.3, "learning_rate": 7.979434041201406e-05, "loss": 2.71, "step": 22940 }, { "epoch": 0.3, "learning_rate": 7.978614361607019e-05, "loss": 2.6252, "step": 22945 }, { "epoch": 0.3, "learning_rate": 7.977794557906963e-05, "loss": 2.678, "step": 22950 }, { "epoch": 0.3, "learning_rate": 7.97697463013539e-05, "loss": 2.5293, "step": 22955 }, { "epoch": 0.3, "learning_rate": 7.976154578326465e-05, "loss": 2.6983, "step": 22960 }, { "epoch": 0.3, "learning_rate": 7.975334402514354e-05, "loss": 2.5834, "step": 22965 }, { "epoch": 0.3, "learning_rate": 7.974514102733233e-05, "loss": 2.5995, "step": 22970 }, { "epoch": 0.3, "learning_rate": 7.973693679017277e-05, "loss": 2.5257, "step": 22975 }, { "epoch": 0.3, "learning_rate": 7.972873131400673e-05, "loss": 2.7208, "step": 22980 }, { "epoch": 0.3, "learning_rate": 7.972052459917606e-05, "loss": 2.7321, "step": 22985 }, { "epoch": 0.3, "learning_rate": 7.971231664602273e-05, "loss": 2.7654, "step": 22990 }, { "epoch": 0.3, "learning_rate": 7.97041074548887e-05, "loss": 2.6163, "step": 22995 }, { "epoch": 0.3, "learning_rate": 7.969589702611603e-05, "loss": 2.6834, "step": 23000 }, { "epoch": 0.3, "learning_rate": 7.96876853600468e-05, "loss": 2.7799, "step": 23005 }, { "epoch": 0.3, "learning_rate": 7.967947245702319e-05, "loss": 2.5759, "step": 23010 }, { "epoch": 0.3, "learning_rate": 7.967125831738733e-05, "loss": 2.5903, "step": 23015 }, { "epoch": 0.3, "learning_rate": 7.966304294148152e-05, "loss": 2.5901, "step": 23020 }, { "epoch": 0.3, "learning_rate": 7.965482632964802e-05, "loss": 2.4943, "step": 23025 }, { "epoch": 0.3, "learning_rate": 7.964660848222922e-05, "loss": 2.6717, "step": 23030 }, { "epoch": 0.3, "learning_rate": 7.963838939956752e-05, "loss": 2.6995, "step": 23035 }, { "epoch": 0.3, "learning_rate": 7.963016908200534e-05, "loss": 2.5597, "step": 23040 }, { "epoch": 0.3, "learning_rate": 7.962194752988519e-05, "loss": 2.6575, "step": 23045 }, { "epoch": 0.3, "learning_rate": 7.961372474354964e-05, "loss": 2.5746, "step": 23050 }, { "epoch": 0.3, "learning_rate": 7.960550072334127e-05, "loss": 2.6837, "step": 23055 }, { "epoch": 0.3, "learning_rate": 7.959727546960278e-05, "loss": 2.4701, "step": 23060 }, { "epoch": 0.3, "learning_rate": 7.958904898267687e-05, "loss": 2.559, "step": 23065 }, { "epoch": 0.3, "learning_rate": 7.95808212629063e-05, "loss": 2.7268, "step": 23070 }, { "epoch": 0.3, "learning_rate": 7.957259231063384e-05, "loss": 2.7019, "step": 23075 }, { "epoch": 0.3, "learning_rate": 7.956436212620241e-05, "loss": 2.5231, "step": 23080 }, { "epoch": 0.3, "learning_rate": 7.955613070995489e-05, "loss": 2.7338, "step": 23085 }, { "epoch": 0.3, "learning_rate": 7.954789806223427e-05, "loss": 2.7272, "step": 23090 }, { "epoch": 0.3, "learning_rate": 7.953966418338357e-05, "loss": 2.6982, "step": 23095 }, { "epoch": 0.3, "learning_rate": 7.953142907374582e-05, "loss": 2.5149, "step": 23100 }, { "epoch": 0.3, "learning_rate": 7.952319273366418e-05, "loss": 2.5949, "step": 23105 }, { "epoch": 0.3, "learning_rate": 7.951495516348182e-05, "loss": 2.653, "step": 23110 }, { "epoch": 0.3, "learning_rate": 7.950671636354194e-05, "loss": 2.6685, "step": 23115 }, { "epoch": 0.3, "learning_rate": 7.949847633418784e-05, "loss": 2.8321, "step": 23120 }, { "epoch": 0.3, "learning_rate": 7.949023507576282e-05, "loss": 2.512, "step": 23125 }, { "epoch": 0.3, "learning_rate": 7.948199258861028e-05, "loss": 2.7089, "step": 23130 }, { "epoch": 0.3, "learning_rate": 7.947374887307364e-05, "loss": 2.5828, "step": 23135 }, { "epoch": 0.3, "learning_rate": 7.946550392949637e-05, "loss": 2.7194, "step": 23140 }, { "epoch": 0.3, "learning_rate": 7.9457257758222e-05, "loss": 2.5385, "step": 23145 }, { "epoch": 0.3, "learning_rate": 7.944901035959413e-05, "loss": 2.5847, "step": 23150 }, { "epoch": 0.3, "learning_rate": 7.944076173395637e-05, "loss": 2.6598, "step": 23155 }, { "epoch": 0.3, "learning_rate": 7.943251188165242e-05, "loss": 2.6301, "step": 23160 }, { "epoch": 0.3, "learning_rate": 7.9424260803026e-05, "loss": 2.7309, "step": 23165 }, { "epoch": 0.3, "learning_rate": 7.941600849842092e-05, "loss": 2.7161, "step": 23170 }, { "epoch": 0.3, "learning_rate": 7.9407754968181e-05, "loss": 2.5917, "step": 23175 }, { "epoch": 0.3, "learning_rate": 7.939950021265013e-05, "loss": 2.5663, "step": 23180 }, { "epoch": 0.3, "learning_rate": 7.939124423217226e-05, "loss": 2.5648, "step": 23185 }, { "epoch": 0.3, "learning_rate": 7.938298702709135e-05, "loss": 2.4677, "step": 23190 }, { "epoch": 0.3, "learning_rate": 7.937472859775147e-05, "loss": 2.6974, "step": 23195 }, { "epoch": 0.3, "learning_rate": 7.936646894449669e-05, "loss": 2.6641, "step": 23200 }, { "epoch": 0.3, "learning_rate": 7.935820806767119e-05, "loss": 2.694, "step": 23205 }, { "epoch": 0.3, "learning_rate": 7.934994596761913e-05, "loss": 2.5514, "step": 23210 }, { "epoch": 0.3, "learning_rate": 7.934168264468476e-05, "loss": 2.7899, "step": 23215 }, { "epoch": 0.3, "learning_rate": 7.933341809921238e-05, "loss": 2.5545, "step": 23220 }, { "epoch": 0.3, "learning_rate": 7.932515233154635e-05, "loss": 2.5189, "step": 23225 }, { "epoch": 0.3, "learning_rate": 7.931688534203105e-05, "loss": 2.717, "step": 23230 }, { "epoch": 0.3, "learning_rate": 7.930861713101095e-05, "loss": 2.5831, "step": 23235 }, { "epoch": 0.3, "learning_rate": 7.93003476988305e-05, "loss": 2.525, "step": 23240 }, { "epoch": 0.3, "learning_rate": 7.929207704583432e-05, "loss": 2.6045, "step": 23245 }, { "epoch": 0.3, "learning_rate": 7.928380517236695e-05, "loss": 2.5076, "step": 23250 }, { "epoch": 0.3, "learning_rate": 7.927553207877309e-05, "loss": 2.6412, "step": 23255 }, { "epoch": 0.3, "learning_rate": 7.926725776539743e-05, "loss": 2.7521, "step": 23260 }, { "epoch": 0.3, "learning_rate": 7.92589822325847e-05, "loss": 2.6228, "step": 23265 }, { "epoch": 0.3, "learning_rate": 7.925070548067972e-05, "loss": 2.7055, "step": 23270 }, { "epoch": 0.3, "learning_rate": 7.924242751002735e-05, "loss": 2.6062, "step": 23275 }, { "epoch": 0.3, "learning_rate": 7.923414832097251e-05, "loss": 2.8621, "step": 23280 }, { "epoch": 0.3, "learning_rate": 7.922586791386013e-05, "loss": 2.6152, "step": 23285 }, { "epoch": 0.3, "learning_rate": 7.921758628903522e-05, "loss": 2.6041, "step": 23290 }, { "epoch": 0.3, "learning_rate": 7.920930344684286e-05, "loss": 2.6157, "step": 23295 }, { "epoch": 0.3, "learning_rate": 7.920101938762814e-05, "loss": 2.7155, "step": 23300 }, { "epoch": 0.3, "learning_rate": 7.919273411173623e-05, "loss": 2.6161, "step": 23305 }, { "epoch": 0.3, "learning_rate": 7.918444761951233e-05, "loss": 2.7118, "step": 23310 }, { "epoch": 0.3, "learning_rate": 7.917615991130172e-05, "loss": 2.6907, "step": 23315 }, { "epoch": 0.3, "learning_rate": 7.91678709874497e-05, "loss": 2.6343, "step": 23320 }, { "epoch": 0.3, "learning_rate": 7.915958084830162e-05, "loss": 2.6933, "step": 23325 }, { "epoch": 0.3, "learning_rate": 7.915128949420292e-05, "loss": 2.5002, "step": 23330 }, { "epoch": 0.3, "learning_rate": 7.914299692549904e-05, "loss": 2.7376, "step": 23335 }, { "epoch": 0.3, "learning_rate": 7.913470314253552e-05, "loss": 2.5689, "step": 23340 }, { "epoch": 0.3, "learning_rate": 7.912640814565791e-05, "loss": 2.6769, "step": 23345 }, { "epoch": 0.3, "learning_rate": 7.911811193521182e-05, "loss": 2.7441, "step": 23350 }, { "epoch": 0.3, "learning_rate": 7.910981451154292e-05, "loss": 2.734, "step": 23355 }, { "epoch": 0.3, "learning_rate": 7.910151587499695e-05, "loss": 2.7139, "step": 23360 }, { "epoch": 0.3, "learning_rate": 7.909321602591963e-05, "loss": 2.5712, "step": 23365 }, { "epoch": 0.3, "learning_rate": 7.908491496465682e-05, "loss": 2.6495, "step": 23370 }, { "epoch": 0.3, "learning_rate": 7.907661269155438e-05, "loss": 2.6398, "step": 23375 }, { "epoch": 0.3, "learning_rate": 7.90683092069582e-05, "loss": 2.6566, "step": 23380 }, { "epoch": 0.3, "learning_rate": 7.90600045112143e-05, "loss": 2.7648, "step": 23385 }, { "epoch": 0.3, "learning_rate": 7.905169860466866e-05, "loss": 2.7436, "step": 23390 }, { "epoch": 0.3, "learning_rate": 7.904339148766735e-05, "loss": 2.6294, "step": 23395 }, { "epoch": 0.3, "learning_rate": 7.903508316055652e-05, "loss": 2.7139, "step": 23400 }, { "epoch": 0.3, "learning_rate": 7.902677362368234e-05, "loss": 2.601, "step": 23405 }, { "epoch": 0.3, "learning_rate": 7.901846287739099e-05, "loss": 2.6962, "step": 23410 }, { "epoch": 0.3, "learning_rate": 7.901015092202877e-05, "loss": 2.657, "step": 23415 }, { "epoch": 0.3, "learning_rate": 7.900183775794201e-05, "loss": 2.6321, "step": 23420 }, { "epoch": 0.3, "learning_rate": 7.899352338547707e-05, "loss": 2.5446, "step": 23425 }, { "epoch": 0.3, "learning_rate": 7.898520780498038e-05, "loss": 2.8814, "step": 23430 }, { "epoch": 0.3, "learning_rate": 7.897689101679841e-05, "loss": 2.6552, "step": 23435 }, { "epoch": 0.3, "learning_rate": 7.896857302127767e-05, "loss": 2.5648, "step": 23440 }, { "epoch": 0.3, "learning_rate": 7.896025381876477e-05, "loss": 2.5276, "step": 23445 }, { "epoch": 0.3, "learning_rate": 7.89519334096063e-05, "loss": 2.6365, "step": 23450 }, { "epoch": 0.3, "learning_rate": 7.894361179414896e-05, "loss": 2.5894, "step": 23455 }, { "epoch": 0.3, "learning_rate": 7.893528897273943e-05, "loss": 2.6812, "step": 23460 }, { "epoch": 0.3, "learning_rate": 7.892696494572453e-05, "loss": 2.6638, "step": 23465 }, { "epoch": 0.3, "learning_rate": 7.89186397134511e-05, "loss": 2.6959, "step": 23470 }, { "epoch": 0.3, "learning_rate": 7.891031327626596e-05, "loss": 2.5804, "step": 23475 }, { "epoch": 0.3, "learning_rate": 7.890198563451607e-05, "loss": 2.6962, "step": 23480 }, { "epoch": 0.3, "learning_rate": 7.889365678854838e-05, "loss": 2.5028, "step": 23485 }, { "epoch": 0.3, "learning_rate": 7.888532673870997e-05, "loss": 2.7593, "step": 23490 }, { "epoch": 0.3, "learning_rate": 7.887699548534786e-05, "loss": 2.7576, "step": 23495 }, { "epoch": 0.3, "learning_rate": 7.886866302880921e-05, "loss": 2.6657, "step": 23500 }, { "epoch": 0.31, "learning_rate": 7.886032936944117e-05, "loss": 2.6332, "step": 23505 }, { "epoch": 0.31, "learning_rate": 7.885199450759099e-05, "loss": 2.8286, "step": 23510 }, { "epoch": 0.31, "learning_rate": 7.884365844360594e-05, "loss": 2.612, "step": 23515 }, { "epoch": 0.31, "learning_rate": 7.883532117783334e-05, "loss": 2.8192, "step": 23520 }, { "epoch": 0.31, "learning_rate": 7.88269827106206e-05, "loss": 2.7072, "step": 23525 }, { "epoch": 0.31, "learning_rate": 7.881864304231508e-05, "loss": 2.5575, "step": 23530 }, { "epoch": 0.31, "learning_rate": 7.88103021732643e-05, "loss": 2.7419, "step": 23535 }, { "epoch": 0.31, "learning_rate": 7.88019601038158e-05, "loss": 2.6435, "step": 23540 }, { "epoch": 0.31, "learning_rate": 7.879361683431715e-05, "loss": 2.5747, "step": 23545 }, { "epoch": 0.31, "learning_rate": 7.878527236511595e-05, "loss": 2.6403, "step": 23550 }, { "epoch": 0.31, "learning_rate": 7.87769266965599e-05, "loss": 2.6662, "step": 23555 }, { "epoch": 0.31, "learning_rate": 7.876857982899671e-05, "loss": 2.6535, "step": 23560 }, { "epoch": 0.31, "learning_rate": 7.876023176277419e-05, "loss": 2.7197, "step": 23565 }, { "epoch": 0.31, "learning_rate": 7.875188249824013e-05, "loss": 2.5003, "step": 23570 }, { "epoch": 0.31, "learning_rate": 7.874353203574242e-05, "loss": 2.6942, "step": 23575 }, { "epoch": 0.31, "learning_rate": 7.8735180375629e-05, "loss": 2.5819, "step": 23580 }, { "epoch": 0.31, "learning_rate": 7.872682751824782e-05, "loss": 2.6403, "step": 23585 }, { "epoch": 0.31, "learning_rate": 7.871847346394694e-05, "loss": 2.4528, "step": 23590 }, { "epoch": 0.31, "learning_rate": 7.871011821307442e-05, "loss": 2.6183, "step": 23595 }, { "epoch": 0.31, "learning_rate": 7.870176176597837e-05, "loss": 2.6704, "step": 23600 }, { "epoch": 0.31, "learning_rate": 7.869340412300699e-05, "loss": 2.6128, "step": 23605 }, { "epoch": 0.31, "learning_rate": 7.868504528450848e-05, "loss": 2.746, "step": 23610 }, { "epoch": 0.31, "learning_rate": 7.867668525083117e-05, "loss": 2.6158, "step": 23615 }, { "epoch": 0.31, "learning_rate": 7.866832402232331e-05, "loss": 2.6301, "step": 23620 }, { "epoch": 0.31, "learning_rate": 7.865996159933334e-05, "loss": 2.5822, "step": 23625 }, { "epoch": 0.31, "learning_rate": 7.865159798220965e-05, "loss": 2.5064, "step": 23630 }, { "epoch": 0.31, "learning_rate": 7.864323317130073e-05, "loss": 2.6877, "step": 23635 }, { "epoch": 0.31, "learning_rate": 7.86348671669551e-05, "loss": 2.5638, "step": 23640 }, { "epoch": 0.31, "learning_rate": 7.862649996952133e-05, "loss": 2.6009, "step": 23645 }, { "epoch": 0.31, "learning_rate": 7.861813157934804e-05, "loss": 2.5779, "step": 23650 }, { "epoch": 0.31, "learning_rate": 7.860976199678391e-05, "loss": 2.7121, "step": 23655 }, { "epoch": 0.31, "learning_rate": 7.860139122217769e-05, "loss": 2.7451, "step": 23660 }, { "epoch": 0.31, "learning_rate": 7.85930192558781e-05, "loss": 2.8216, "step": 23665 }, { "epoch": 0.31, "learning_rate": 7.858464609823399e-05, "loss": 2.7035, "step": 23670 }, { "epoch": 0.31, "learning_rate": 7.857627174959425e-05, "loss": 2.6433, "step": 23675 }, { "epoch": 0.31, "learning_rate": 7.856789621030778e-05, "loss": 2.7849, "step": 23680 }, { "epoch": 0.31, "learning_rate": 7.855951948072355e-05, "loss": 2.6047, "step": 23685 }, { "epoch": 0.31, "learning_rate": 7.85511415611906e-05, "loss": 2.645, "step": 23690 }, { "epoch": 0.31, "learning_rate": 7.854276245205799e-05, "loss": 2.7229, "step": 23695 }, { "epoch": 0.31, "learning_rate": 7.853438215367481e-05, "loss": 2.6901, "step": 23700 }, { "epoch": 0.31, "learning_rate": 7.852600066639028e-05, "loss": 2.7107, "step": 23705 }, { "epoch": 0.31, "learning_rate": 7.85176179905536e-05, "loss": 2.4979, "step": 23710 }, { "epoch": 0.31, "learning_rate": 7.850923412651404e-05, "loss": 2.6653, "step": 23715 }, { "epoch": 0.31, "learning_rate": 7.850084907462093e-05, "loss": 2.7361, "step": 23720 }, { "epoch": 0.31, "learning_rate": 7.849246283522358e-05, "loss": 2.6512, "step": 23725 }, { "epoch": 0.31, "learning_rate": 7.848407540867147e-05, "loss": 2.6498, "step": 23730 }, { "epoch": 0.31, "learning_rate": 7.847568679531406e-05, "loss": 2.6291, "step": 23735 }, { "epoch": 0.31, "learning_rate": 7.846729699550084e-05, "loss": 2.6322, "step": 23740 }, { "epoch": 0.31, "learning_rate": 7.845890600958142e-05, "loss": 2.7536, "step": 23745 }, { "epoch": 0.31, "learning_rate": 7.845051383790535e-05, "loss": 2.7467, "step": 23750 }, { "epoch": 0.31, "learning_rate": 7.844212048082235e-05, "loss": 2.7038, "step": 23755 }, { "epoch": 0.31, "learning_rate": 7.84337259386821e-05, "loss": 2.7423, "step": 23760 }, { "epoch": 0.31, "learning_rate": 7.84253302118344e-05, "loss": 2.7355, "step": 23765 }, { "epoch": 0.31, "learning_rate": 7.841693330062903e-05, "loss": 2.6315, "step": 23770 }, { "epoch": 0.31, "learning_rate": 7.840853520541585e-05, "loss": 2.503, "step": 23775 }, { "epoch": 0.31, "learning_rate": 7.84001359265448e-05, "loss": 2.6169, "step": 23780 }, { "epoch": 0.31, "learning_rate": 7.839173546436583e-05, "loss": 2.5156, "step": 23785 }, { "epoch": 0.31, "learning_rate": 7.83833338192289e-05, "loss": 2.6041, "step": 23790 }, { "epoch": 0.31, "learning_rate": 7.837493099148416e-05, "loss": 2.5458, "step": 23795 }, { "epoch": 0.31, "learning_rate": 7.836652698148166e-05, "loss": 2.6485, "step": 23800 }, { "epoch": 0.31, "learning_rate": 7.835812178957158e-05, "loss": 2.7963, "step": 23805 }, { "epoch": 0.31, "learning_rate": 7.83497154161041e-05, "loss": 2.8682, "step": 23810 }, { "epoch": 0.31, "learning_rate": 7.83413078614295e-05, "loss": 2.5761, "step": 23815 }, { "epoch": 0.31, "learning_rate": 7.833289912589809e-05, "loss": 2.6026, "step": 23820 }, { "epoch": 0.31, "learning_rate": 7.83244892098602e-05, "loss": 2.6059, "step": 23825 }, { "epoch": 0.31, "learning_rate": 7.831607811366625e-05, "loss": 2.6219, "step": 23830 }, { "epoch": 0.31, "learning_rate": 7.830766583766671e-05, "loss": 2.7363, "step": 23835 }, { "epoch": 0.31, "learning_rate": 7.829925238221206e-05, "loss": 2.7511, "step": 23840 }, { "epoch": 0.31, "learning_rate": 7.829083774765285e-05, "loss": 2.6564, "step": 23845 }, { "epoch": 0.31, "learning_rate": 7.828242193433967e-05, "loss": 2.696, "step": 23850 }, { "epoch": 0.31, "learning_rate": 7.82740049426232e-05, "loss": 2.5551, "step": 23855 }, { "epoch": 0.31, "learning_rate": 7.826558677285412e-05, "loss": 2.7048, "step": 23860 }, { "epoch": 0.31, "learning_rate": 7.825716742538319e-05, "loss": 2.6795, "step": 23865 }, { "epoch": 0.31, "learning_rate": 7.82487469005612e-05, "loss": 2.5539, "step": 23870 }, { "epoch": 0.31, "learning_rate": 7.824032519873899e-05, "loss": 2.6564, "step": 23875 }, { "epoch": 0.31, "learning_rate": 7.823190232026746e-05, "loss": 2.7216, "step": 23880 }, { "epoch": 0.31, "learning_rate": 7.822347826549756e-05, "loss": 2.7806, "step": 23885 }, { "epoch": 0.31, "learning_rate": 7.821505303478027e-05, "loss": 2.6636, "step": 23890 }, { "epoch": 0.31, "learning_rate": 7.820662662846663e-05, "loss": 2.5405, "step": 23895 }, { "epoch": 0.31, "learning_rate": 7.819819904690777e-05, "loss": 2.629, "step": 23900 }, { "epoch": 0.31, "learning_rate": 7.818977029045477e-05, "loss": 2.639, "step": 23905 }, { "epoch": 0.31, "learning_rate": 7.818134035945888e-05, "loss": 2.4206, "step": 23910 }, { "epoch": 0.31, "learning_rate": 7.817290925427128e-05, "loss": 2.6519, "step": 23915 }, { "epoch": 0.31, "learning_rate": 7.81644769752433e-05, "loss": 2.6995, "step": 23920 }, { "epoch": 0.31, "learning_rate": 7.815604352272625e-05, "loss": 2.6325, "step": 23925 }, { "epoch": 0.31, "learning_rate": 7.814760889707154e-05, "loss": 2.7999, "step": 23930 }, { "epoch": 0.31, "learning_rate": 7.813917309863057e-05, "loss": 2.5515, "step": 23935 }, { "epoch": 0.31, "learning_rate": 7.813073612775485e-05, "loss": 2.7079, "step": 23940 }, { "epoch": 0.31, "learning_rate": 7.812229798479589e-05, "loss": 2.5813, "step": 23945 }, { "epoch": 0.31, "learning_rate": 7.811385867010529e-05, "loss": 2.5823, "step": 23950 }, { "epoch": 0.31, "learning_rate": 7.810541818403467e-05, "loss": 2.5795, "step": 23955 }, { "epoch": 0.31, "learning_rate": 7.809697652693571e-05, "loss": 2.7341, "step": 23960 }, { "epoch": 0.31, "learning_rate": 7.808853369916014e-05, "loss": 2.6529, "step": 23965 }, { "epoch": 0.31, "learning_rate": 7.808008970105972e-05, "loss": 2.6972, "step": 23970 }, { "epoch": 0.31, "learning_rate": 7.80716445329863e-05, "loss": 2.6079, "step": 23975 }, { "epoch": 0.31, "learning_rate": 7.806319819529171e-05, "loss": 2.6328, "step": 23980 }, { "epoch": 0.31, "learning_rate": 7.805475068832791e-05, "loss": 2.6285, "step": 23985 }, { "epoch": 0.31, "learning_rate": 7.804630201244688e-05, "loss": 2.5875, "step": 23990 }, { "epoch": 0.31, "learning_rate": 7.803785216800059e-05, "loss": 2.6259, "step": 23995 }, { "epoch": 0.31, "learning_rate": 7.802940115534114e-05, "loss": 2.6867, "step": 24000 }, { "epoch": 0.31, "learning_rate": 7.802094897482066e-05, "loss": 2.7134, "step": 24005 }, { "epoch": 0.31, "learning_rate": 7.801249562679127e-05, "loss": 2.6031, "step": 24010 }, { "epoch": 0.31, "learning_rate": 7.800404111160522e-05, "loss": 2.6502, "step": 24015 }, { "epoch": 0.31, "learning_rate": 7.799558542961477e-05, "loss": 2.6402, "step": 24020 }, { "epoch": 0.31, "learning_rate": 7.798712858117221e-05, "loss": 2.7226, "step": 24025 }, { "epoch": 0.31, "learning_rate": 7.797867056662992e-05, "loss": 2.5286, "step": 24030 }, { "epoch": 0.31, "learning_rate": 7.79702113863403e-05, "loss": 2.6589, "step": 24035 }, { "epoch": 0.31, "learning_rate": 7.796175104065582e-05, "loss": 2.501, "step": 24040 }, { "epoch": 0.31, "learning_rate": 7.795328952992895e-05, "loss": 2.5669, "step": 24045 }, { "epoch": 0.31, "learning_rate": 7.794482685451228e-05, "loss": 2.7108, "step": 24050 }, { "epoch": 0.31, "learning_rate": 7.79363630147584e-05, "loss": 2.6156, "step": 24055 }, { "epoch": 0.31, "learning_rate": 7.792789801101994e-05, "loss": 2.5453, "step": 24060 }, { "epoch": 0.31, "learning_rate": 7.791943184364964e-05, "loss": 2.7187, "step": 24065 }, { "epoch": 0.31, "learning_rate": 7.791096451300021e-05, "loss": 2.6196, "step": 24070 }, { "epoch": 0.31, "learning_rate": 7.790249601942445e-05, "loss": 2.6554, "step": 24075 }, { "epoch": 0.31, "learning_rate": 7.789402636327525e-05, "loss": 2.5363, "step": 24080 }, { "epoch": 0.31, "learning_rate": 7.788555554490545e-05, "loss": 2.6788, "step": 24085 }, { "epoch": 0.31, "learning_rate": 7.7877083564668e-05, "loss": 2.7933, "step": 24090 }, { "epoch": 0.31, "learning_rate": 7.786861042291593e-05, "loss": 2.5646, "step": 24095 }, { "epoch": 0.31, "learning_rate": 7.786013612000222e-05, "loss": 2.6323, "step": 24100 }, { "epoch": 0.31, "learning_rate": 7.785166065628002e-05, "loss": 2.5495, "step": 24105 }, { "epoch": 0.31, "learning_rate": 7.78431840321024e-05, "loss": 2.6874, "step": 24110 }, { "epoch": 0.31, "learning_rate": 7.783470624782258e-05, "loss": 2.6627, "step": 24115 }, { "epoch": 0.31, "learning_rate": 7.782622730379381e-05, "loss": 2.6217, "step": 24120 }, { "epoch": 0.31, "learning_rate": 7.781774720036932e-05, "loss": 2.641, "step": 24125 }, { "epoch": 0.31, "learning_rate": 7.780926593790248e-05, "loss": 2.6757, "step": 24130 }, { "epoch": 0.31, "learning_rate": 7.780078351674665e-05, "loss": 2.6662, "step": 24135 }, { "epoch": 0.31, "learning_rate": 7.779229993725523e-05, "loss": 2.6768, "step": 24140 }, { "epoch": 0.31, "learning_rate": 7.778381519978175e-05, "loss": 2.656, "step": 24145 }, { "epoch": 0.31, "learning_rate": 7.77753293046797e-05, "loss": 2.5294, "step": 24150 }, { "epoch": 0.31, "learning_rate": 7.776684225230262e-05, "loss": 2.6471, "step": 24155 }, { "epoch": 0.31, "learning_rate": 7.775835404300418e-05, "loss": 2.6668, "step": 24160 }, { "epoch": 0.31, "learning_rate": 7.774986467713803e-05, "loss": 2.6584, "step": 24165 }, { "epoch": 0.31, "learning_rate": 7.774137415505786e-05, "loss": 2.5872, "step": 24170 }, { "epoch": 0.31, "learning_rate": 7.773288247711747e-05, "loss": 2.7047, "step": 24175 }, { "epoch": 0.31, "learning_rate": 7.772438964367066e-05, "loss": 2.6157, "step": 24180 }, { "epoch": 0.31, "learning_rate": 7.771589565507125e-05, "loss": 2.5812, "step": 24185 }, { "epoch": 0.31, "learning_rate": 7.77074005116732e-05, "loss": 2.7009, "step": 24190 }, { "epoch": 0.31, "learning_rate": 7.769890421383044e-05, "loss": 2.4782, "step": 24195 }, { "epoch": 0.31, "learning_rate": 7.769040676189698e-05, "loss": 2.6812, "step": 24200 }, { "epoch": 0.31, "learning_rate": 7.768190815622685e-05, "loss": 2.7809, "step": 24205 }, { "epoch": 0.31, "learning_rate": 7.767340839717418e-05, "loss": 2.5666, "step": 24210 }, { "epoch": 0.31, "learning_rate": 7.76649074850931e-05, "loss": 2.627, "step": 24215 }, { "epoch": 0.31, "learning_rate": 7.765640542033781e-05, "loss": 2.631, "step": 24220 }, { "epoch": 0.31, "learning_rate": 7.764790220326253e-05, "loss": 2.6359, "step": 24225 }, { "epoch": 0.31, "learning_rate": 7.76393978342216e-05, "loss": 2.5709, "step": 24230 }, { "epoch": 0.31, "learning_rate": 7.763089231356932e-05, "loss": 2.6721, "step": 24235 }, { "epoch": 0.31, "learning_rate": 7.76223856416601e-05, "loss": 2.7568, "step": 24240 }, { "epoch": 0.31, "learning_rate": 7.761387781884836e-05, "loss": 2.681, "step": 24245 }, { "epoch": 0.31, "learning_rate": 7.760536884548859e-05, "loss": 2.6713, "step": 24250 }, { "epoch": 0.31, "learning_rate": 7.759685872193532e-05, "loss": 2.5551, "step": 24255 }, { "epoch": 0.31, "learning_rate": 7.758834744854312e-05, "loss": 2.5735, "step": 24260 }, { "epoch": 0.31, "learning_rate": 7.757983502566666e-05, "loss": 2.605, "step": 24265 }, { "epoch": 0.31, "learning_rate": 7.757132145366054e-05, "loss": 2.712, "step": 24270 }, { "epoch": 0.32, "learning_rate": 7.756280673287957e-05, "loss": 2.6648, "step": 24275 }, { "epoch": 0.32, "learning_rate": 7.755429086367844e-05, "loss": 2.7652, "step": 24280 }, { "epoch": 0.32, "learning_rate": 7.754577384641199e-05, "loss": 2.5432, "step": 24285 }, { "epoch": 0.32, "learning_rate": 7.753725568143514e-05, "loss": 2.5574, "step": 24290 }, { "epoch": 0.32, "learning_rate": 7.752873636910275e-05, "loss": 2.4899, "step": 24295 }, { "epoch": 0.32, "learning_rate": 7.752021590976979e-05, "loss": 2.7382, "step": 24300 }, { "epoch": 0.32, "learning_rate": 7.751169430379128e-05, "loss": 2.7225, "step": 24305 }, { "epoch": 0.32, "learning_rate": 7.750317155152228e-05, "loss": 2.6819, "step": 24310 }, { "epoch": 0.32, "learning_rate": 7.749464765331787e-05, "loss": 2.6401, "step": 24315 }, { "epoch": 0.32, "learning_rate": 7.748612260953323e-05, "loss": 2.6317, "step": 24320 }, { "epoch": 0.32, "learning_rate": 7.747759642052357e-05, "loss": 2.7098, "step": 24325 }, { "epoch": 0.32, "learning_rate": 7.74690690866441e-05, "loss": 2.6828, "step": 24330 }, { "epoch": 0.32, "learning_rate": 7.746054060825015e-05, "loss": 2.6078, "step": 24335 }, { "epoch": 0.32, "learning_rate": 7.745201098569706e-05, "loss": 2.6711, "step": 24340 }, { "epoch": 0.32, "learning_rate": 7.744348021934017e-05, "loss": 2.7078, "step": 24345 }, { "epoch": 0.32, "learning_rate": 7.743494830953501e-05, "loss": 2.7815, "step": 24350 }, { "epoch": 0.32, "learning_rate": 7.7426415256637e-05, "loss": 2.4414, "step": 24355 }, { "epoch": 0.32, "learning_rate": 7.74178810610017e-05, "loss": 2.7836, "step": 24360 }, { "epoch": 0.32, "learning_rate": 7.740934572298468e-05, "loss": 2.5446, "step": 24365 }, { "epoch": 0.32, "learning_rate": 7.74008092429416e-05, "loss": 2.5896, "step": 24370 }, { "epoch": 0.32, "learning_rate": 7.739227162122808e-05, "loss": 2.5698, "step": 24375 }, { "epoch": 0.32, "learning_rate": 7.738373285819988e-05, "loss": 2.7452, "step": 24380 }, { "epoch": 0.32, "learning_rate": 7.73751929542128e-05, "loss": 2.5026, "step": 24385 }, { "epoch": 0.32, "learning_rate": 7.73666519096226e-05, "loss": 2.6266, "step": 24390 }, { "epoch": 0.32, "learning_rate": 7.73581097247852e-05, "loss": 2.5351, "step": 24395 }, { "epoch": 0.32, "learning_rate": 7.734956640005649e-05, "loss": 2.6677, "step": 24400 }, { "epoch": 0.32, "learning_rate": 7.734102193579242e-05, "loss": 2.5454, "step": 24405 }, { "epoch": 0.32, "learning_rate": 7.733247633234902e-05, "loss": 2.6013, "step": 24410 }, { "epoch": 0.32, "learning_rate": 7.732392959008235e-05, "loss": 2.5339, "step": 24415 }, { "epoch": 0.32, "learning_rate": 7.731538170934851e-05, "loss": 2.7198, "step": 24420 }, { "epoch": 0.32, "learning_rate": 7.730683269050365e-05, "loss": 2.6877, "step": 24425 }, { "epoch": 0.32, "learning_rate": 7.729828253390396e-05, "loss": 2.6231, "step": 24430 }, { "epoch": 0.32, "learning_rate": 7.728973123990572e-05, "loss": 2.7042, "step": 24435 }, { "epoch": 0.32, "learning_rate": 7.728117880886517e-05, "loss": 2.5874, "step": 24440 }, { "epoch": 0.32, "learning_rate": 7.72726252411387e-05, "loss": 2.6407, "step": 24445 }, { "epoch": 0.32, "learning_rate": 7.726407053708268e-05, "loss": 2.6531, "step": 24450 }, { "epoch": 0.32, "learning_rate": 7.725551469705356e-05, "loss": 2.6749, "step": 24455 }, { "epoch": 0.32, "learning_rate": 7.724695772140782e-05, "loss": 2.5002, "step": 24460 }, { "epoch": 0.32, "learning_rate": 7.723839961050196e-05, "loss": 2.5915, "step": 24465 }, { "epoch": 0.32, "learning_rate": 7.72298403646926e-05, "loss": 2.4913, "step": 24470 }, { "epoch": 0.32, "learning_rate": 7.722127998433635e-05, "loss": 2.6042, "step": 24475 }, { "epoch": 0.32, "learning_rate": 7.721271846978988e-05, "loss": 2.6049, "step": 24480 }, { "epoch": 0.32, "learning_rate": 7.72041558214099e-05, "loss": 2.4961, "step": 24485 }, { "epoch": 0.32, "learning_rate": 7.71955920395532e-05, "loss": 2.6752, "step": 24490 }, { "epoch": 0.32, "learning_rate": 7.71870271245766e-05, "loss": 2.6378, "step": 24495 }, { "epoch": 0.32, "learning_rate": 7.717846107683693e-05, "loss": 2.6886, "step": 24500 }, { "epoch": 0.32, "learning_rate": 7.716989389669112e-05, "loss": 2.6333, "step": 24505 }, { "epoch": 0.32, "learning_rate": 7.716132558449612e-05, "loss": 2.5956, "step": 24510 }, { "epoch": 0.32, "learning_rate": 7.715275614060896e-05, "loss": 2.6281, "step": 24515 }, { "epoch": 0.32, "learning_rate": 7.714418556538664e-05, "loss": 2.6151, "step": 24520 }, { "epoch": 0.32, "learning_rate": 7.71356138591863e-05, "loss": 2.6628, "step": 24525 }, { "epoch": 0.32, "learning_rate": 7.712704102236505e-05, "loss": 2.7137, "step": 24530 }, { "epoch": 0.32, "learning_rate": 7.711846705528011e-05, "loss": 2.5708, "step": 24535 }, { "epoch": 0.32, "learning_rate": 7.710989195828873e-05, "loss": 2.6022, "step": 24540 }, { "epoch": 0.32, "learning_rate": 7.710131573174818e-05, "loss": 2.522, "step": 24545 }, { "epoch": 0.32, "learning_rate": 7.709273837601578e-05, "loss": 2.5438, "step": 24550 }, { "epoch": 0.32, "learning_rate": 7.708415989144893e-05, "loss": 2.7779, "step": 24555 }, { "epoch": 0.32, "learning_rate": 7.707558027840504e-05, "loss": 2.7135, "step": 24560 }, { "epoch": 0.32, "learning_rate": 7.70669995372416e-05, "loss": 2.7023, "step": 24565 }, { "epoch": 0.32, "learning_rate": 7.705841766831612e-05, "loss": 2.5859, "step": 24570 }, { "epoch": 0.32, "learning_rate": 7.704983467198619e-05, "loss": 2.5696, "step": 24575 }, { "epoch": 0.32, "learning_rate": 7.70412505486094e-05, "loss": 2.5039, "step": 24580 }, { "epoch": 0.32, "learning_rate": 7.703266529854342e-05, "loss": 2.5505, "step": 24585 }, { "epoch": 0.32, "learning_rate": 7.702407892214596e-05, "loss": 2.6583, "step": 24590 }, { "epoch": 0.32, "learning_rate": 7.701549141977478e-05, "loss": 2.542, "step": 24595 }, { "epoch": 0.32, "learning_rate": 7.700690279178768e-05, "loss": 2.5394, "step": 24600 }, { "epoch": 0.32, "learning_rate": 7.699831303854251e-05, "loss": 2.6062, "step": 24605 }, { "epoch": 0.32, "learning_rate": 7.698972216039717e-05, "loss": 2.5096, "step": 24610 }, { "epoch": 0.32, "learning_rate": 7.69811301577096e-05, "loss": 2.7114, "step": 24615 }, { "epoch": 0.32, "learning_rate": 7.69725370308378e-05, "loss": 2.7084, "step": 24620 }, { "epoch": 0.32, "learning_rate": 7.696394278013979e-05, "loss": 2.6411, "step": 24625 }, { "epoch": 0.32, "learning_rate": 7.695534740597368e-05, "loss": 2.7479, "step": 24630 }, { "epoch": 0.32, "learning_rate": 7.694675090869756e-05, "loss": 2.5742, "step": 24635 }, { "epoch": 0.32, "learning_rate": 7.693815328866967e-05, "loss": 2.7364, "step": 24640 }, { "epoch": 0.32, "learning_rate": 7.692955454624818e-05, "loss": 2.6428, "step": 24645 }, { "epoch": 0.32, "learning_rate": 7.692095468179137e-05, "loss": 2.722, "step": 24650 }, { "epoch": 0.32, "learning_rate": 7.691235369565757e-05, "loss": 2.6502, "step": 24655 }, { "epoch": 0.32, "learning_rate": 7.690375158820516e-05, "loss": 2.5699, "step": 24660 }, { "epoch": 0.32, "learning_rate": 7.689514835979252e-05, "loss": 2.7677, "step": 24665 }, { "epoch": 0.32, "learning_rate": 7.688654401077813e-05, "loss": 2.5703, "step": 24670 }, { "epoch": 0.32, "learning_rate": 7.687793854152049e-05, "loss": 2.5338, "step": 24675 }, { "epoch": 0.32, "learning_rate": 7.686933195237815e-05, "loss": 2.5118, "step": 24680 }, { "epoch": 0.32, "learning_rate": 7.686072424370969e-05, "loss": 2.6393, "step": 24685 }, { "epoch": 0.32, "learning_rate": 7.685211541587379e-05, "loss": 2.5129, "step": 24690 }, { "epoch": 0.32, "learning_rate": 7.684350546922913e-05, "loss": 2.6622, "step": 24695 }, { "epoch": 0.32, "learning_rate": 7.683489440413444e-05, "loss": 2.6038, "step": 24700 }, { "epoch": 0.32, "learning_rate": 7.682628222094851e-05, "loss": 2.5622, "step": 24705 }, { "epoch": 0.32, "learning_rate": 7.681766892003019e-05, "loss": 2.6052, "step": 24710 }, { "epoch": 0.32, "learning_rate": 7.68090545017383e-05, "loss": 2.6152, "step": 24715 }, { "epoch": 0.32, "learning_rate": 7.680043896643182e-05, "loss": 2.6041, "step": 24720 }, { "epoch": 0.32, "learning_rate": 7.679182231446971e-05, "loss": 2.5173, "step": 24725 }, { "epoch": 0.32, "learning_rate": 7.678320454621098e-05, "loss": 2.5602, "step": 24730 }, { "epoch": 0.32, "learning_rate": 7.67745856620147e-05, "loss": 2.5803, "step": 24735 }, { "epoch": 0.32, "learning_rate": 7.676596566223998e-05, "loss": 2.6727, "step": 24740 }, { "epoch": 0.32, "learning_rate": 7.675734454724597e-05, "loss": 2.5822, "step": 24745 }, { "epoch": 0.32, "learning_rate": 7.674872231739186e-05, "loss": 2.6727, "step": 24750 }, { "epoch": 0.32, "learning_rate": 7.674009897303693e-05, "loss": 2.6535, "step": 24755 }, { "epoch": 0.32, "learning_rate": 7.673147451454047e-05, "loss": 2.5992, "step": 24760 }, { "epoch": 0.32, "learning_rate": 7.672284894226183e-05, "loss": 2.5799, "step": 24765 }, { "epoch": 0.32, "learning_rate": 7.671422225656038e-05, "loss": 2.6007, "step": 24770 }, { "epoch": 0.32, "learning_rate": 7.670559445779555e-05, "loss": 2.643, "step": 24775 }, { "epoch": 0.32, "learning_rate": 7.669696554632685e-05, "loss": 2.6702, "step": 24780 }, { "epoch": 0.32, "learning_rate": 7.668833552251378e-05, "loss": 2.7765, "step": 24785 }, { "epoch": 0.32, "learning_rate": 7.667970438671595e-05, "loss": 2.6693, "step": 24790 }, { "epoch": 0.32, "learning_rate": 7.667107213929294e-05, "loss": 2.5158, "step": 24795 }, { "epoch": 0.32, "learning_rate": 7.666243878060444e-05, "loss": 2.6138, "step": 24800 }, { "epoch": 0.32, "learning_rate": 7.665380431101017e-05, "loss": 2.5834, "step": 24805 }, { "epoch": 0.32, "learning_rate": 7.664516873086987e-05, "loss": 2.4902, "step": 24810 }, { "epoch": 0.32, "learning_rate": 7.663653204054337e-05, "loss": 2.5172, "step": 24815 }, { "epoch": 0.32, "learning_rate": 7.66278942403905e-05, "loss": 2.6477, "step": 24820 }, { "epoch": 0.32, "learning_rate": 7.66192553307712e-05, "loss": 2.5397, "step": 24825 }, { "epoch": 0.32, "learning_rate": 7.661061531204535e-05, "loss": 2.743, "step": 24830 }, { "epoch": 0.32, "learning_rate": 7.660197418457298e-05, "loss": 2.5887, "step": 24835 }, { "epoch": 0.32, "learning_rate": 7.659333194871413e-05, "loss": 2.5709, "step": 24840 }, { "epoch": 0.32, "learning_rate": 7.658468860482886e-05, "loss": 2.63, "step": 24845 }, { "epoch": 0.32, "learning_rate": 7.657604415327735e-05, "loss": 2.5133, "step": 24850 }, { "epoch": 0.32, "learning_rate": 7.656739859441973e-05, "loss": 2.6309, "step": 24855 }, { "epoch": 0.32, "learning_rate": 7.655875192861622e-05, "loss": 2.6875, "step": 24860 }, { "epoch": 0.32, "learning_rate": 7.655010415622712e-05, "loss": 2.6402, "step": 24865 }, { "epoch": 0.32, "learning_rate": 7.654145527761271e-05, "loss": 2.7246, "step": 24870 }, { "epoch": 0.32, "learning_rate": 7.653280529313338e-05, "loss": 2.6534, "step": 24875 }, { "epoch": 0.32, "learning_rate": 7.652415420314953e-05, "loss": 2.6318, "step": 24880 }, { "epoch": 0.32, "learning_rate": 7.65155020080216e-05, "loss": 2.7012, "step": 24885 }, { "epoch": 0.32, "learning_rate": 7.650684870811011e-05, "loss": 2.6297, "step": 24890 }, { "epoch": 0.32, "learning_rate": 7.649819430377558e-05, "loss": 2.6965, "step": 24895 }, { "epoch": 0.32, "learning_rate": 7.648953879537861e-05, "loss": 2.7447, "step": 24900 }, { "epoch": 0.32, "learning_rate": 7.648088218327985e-05, "loss": 2.644, "step": 24905 }, { "epoch": 0.32, "learning_rate": 7.647222446783995e-05, "loss": 2.6708, "step": 24910 }, { "epoch": 0.32, "learning_rate": 7.646356564941968e-05, "loss": 2.7487, "step": 24915 }, { "epoch": 0.32, "learning_rate": 7.645490572837977e-05, "loss": 2.6066, "step": 24920 }, { "epoch": 0.32, "learning_rate": 7.644624470508109e-05, "loss": 2.6665, "step": 24925 }, { "epoch": 0.32, "learning_rate": 7.643758257988447e-05, "loss": 2.7538, "step": 24930 }, { "epoch": 0.32, "learning_rate": 7.642891935315084e-05, "loss": 2.6765, "step": 24935 }, { "epoch": 0.32, "learning_rate": 7.642025502524112e-05, "loss": 2.6334, "step": 24940 }, { "epoch": 0.32, "learning_rate": 7.64115895965164e-05, "loss": 2.6044, "step": 24945 }, { "epoch": 0.32, "learning_rate": 7.640292306733764e-05, "loss": 2.6917, "step": 24950 }, { "epoch": 0.32, "learning_rate": 7.639425543806599e-05, "loss": 2.6695, "step": 24955 }, { "epoch": 0.32, "learning_rate": 7.638558670906255e-05, "loss": 2.5722, "step": 24960 }, { "epoch": 0.32, "learning_rate": 7.637691688068855e-05, "loss": 2.6448, "step": 24965 }, { "epoch": 0.32, "learning_rate": 7.63682459533052e-05, "loss": 2.6393, "step": 24970 }, { "epoch": 0.32, "learning_rate": 7.63595739272738e-05, "loss": 2.5684, "step": 24975 }, { "epoch": 0.32, "learning_rate": 7.635090080295564e-05, "loss": 2.7992, "step": 24980 }, { "epoch": 0.32, "learning_rate": 7.634222658071211e-05, "loss": 2.7112, "step": 24985 }, { "epoch": 0.32, "learning_rate": 7.633355126090463e-05, "loss": 2.535, "step": 24990 }, { "epoch": 0.32, "learning_rate": 7.632487484389466e-05, "loss": 2.5738, "step": 24995 }, { "epoch": 0.32, "learning_rate": 7.631619733004371e-05, "loss": 2.602, "step": 25000 }, { "epoch": 0.32, "learning_rate": 7.630751871971331e-05, "loss": 2.7457, "step": 25005 }, { "epoch": 0.32, "learning_rate": 7.629883901326511e-05, "loss": 2.7182, "step": 25010 }, { "epoch": 0.32, "learning_rate": 7.62901582110607e-05, "loss": 2.5547, "step": 25015 }, { "epoch": 0.32, "learning_rate": 7.628147631346181e-05, "loss": 2.7311, "step": 25020 }, { "epoch": 0.32, "learning_rate": 7.627279332083015e-05, "loss": 2.5172, "step": 25025 }, { "epoch": 0.32, "learning_rate": 7.626410923352751e-05, "loss": 2.6126, "step": 25030 }, { "epoch": 0.32, "learning_rate": 7.625542405191573e-05, "loss": 2.6572, "step": 25035 }, { "epoch": 0.32, "learning_rate": 7.624673777635666e-05, "loss": 2.6237, "step": 25040 }, { "epoch": 0.33, "learning_rate": 7.623805040721224e-05, "loss": 2.5692, "step": 25045 }, { "epoch": 0.33, "learning_rate": 7.622936194484443e-05, "loss": 2.7176, "step": 25050 }, { "epoch": 0.33, "learning_rate": 7.622067238961523e-05, "loss": 2.7007, "step": 25055 }, { "epoch": 0.33, "learning_rate": 7.621198174188671e-05, "loss": 2.5705, "step": 25060 }, { "epoch": 0.33, "learning_rate": 7.620329000202096e-05, "loss": 2.588, "step": 25065 }, { "epoch": 0.33, "learning_rate": 7.619459717038012e-05, "loss": 2.6358, "step": 25070 }, { "epoch": 0.33, "learning_rate": 7.61859032473264e-05, "loss": 2.4686, "step": 25075 }, { "epoch": 0.33, "learning_rate": 7.6177208233222e-05, "loss": 2.5492, "step": 25080 }, { "epoch": 0.33, "learning_rate": 7.616851212842926e-05, "loss": 2.6897, "step": 25085 }, { "epoch": 0.33, "learning_rate": 7.615981493331046e-05, "loss": 2.5179, "step": 25090 }, { "epoch": 0.33, "learning_rate": 7.6151116648228e-05, "loss": 2.6899, "step": 25095 }, { "epoch": 0.33, "learning_rate": 7.61424172735443e-05, "loss": 2.8169, "step": 25100 }, { "epoch": 0.33, "learning_rate": 7.61337168096218e-05, "loss": 2.4388, "step": 25105 }, { "epoch": 0.33, "learning_rate": 7.612501525682303e-05, "loss": 2.6471, "step": 25110 }, { "epoch": 0.33, "learning_rate": 7.611631261551055e-05, "loss": 2.7085, "step": 25115 }, { "epoch": 0.33, "learning_rate": 7.610760888604694e-05, "loss": 2.7225, "step": 25120 }, { "epoch": 0.33, "learning_rate": 7.609890406879486e-05, "loss": 2.5102, "step": 25125 }, { "epoch": 0.33, "learning_rate": 7.6090198164117e-05, "loss": 2.5773, "step": 25130 }, { "epoch": 0.33, "learning_rate": 7.608149117237608e-05, "loss": 2.6973, "step": 25135 }, { "epoch": 0.33, "learning_rate": 7.607278309393491e-05, "loss": 2.6476, "step": 25140 }, { "epoch": 0.33, "learning_rate": 7.60640739291563e-05, "loss": 2.6553, "step": 25145 }, { "epoch": 0.33, "learning_rate": 7.605536367840314e-05, "loss": 2.6354, "step": 25150 }, { "epoch": 0.33, "learning_rate": 7.604665234203832e-05, "loss": 2.6264, "step": 25155 }, { "epoch": 0.33, "learning_rate": 7.603793992042481e-05, "loss": 2.7534, "step": 25160 }, { "epoch": 0.33, "learning_rate": 7.602922641392563e-05, "loss": 2.7176, "step": 25165 }, { "epoch": 0.33, "learning_rate": 7.602051182290382e-05, "loss": 2.5997, "step": 25170 }, { "epoch": 0.33, "learning_rate": 7.60117961477225e-05, "loss": 2.6192, "step": 25175 }, { "epoch": 0.33, "learning_rate": 7.600307938874478e-05, "loss": 2.7747, "step": 25180 }, { "epoch": 0.33, "learning_rate": 7.599436154633388e-05, "loss": 2.6367, "step": 25185 }, { "epoch": 0.33, "learning_rate": 7.598564262085301e-05, "loss": 2.6384, "step": 25190 }, { "epoch": 0.33, "learning_rate": 7.597692261266548e-05, "loss": 2.5583, "step": 25195 }, { "epoch": 0.33, "learning_rate": 7.59682015221346e-05, "loss": 2.7506, "step": 25200 }, { "epoch": 0.33, "learning_rate": 7.595947934962371e-05, "loss": 2.8034, "step": 25205 }, { "epoch": 0.33, "learning_rate": 7.595075609549626e-05, "loss": 2.6608, "step": 25210 }, { "epoch": 0.33, "learning_rate": 7.59420317601157e-05, "loss": 2.771, "step": 25215 }, { "epoch": 0.33, "learning_rate": 7.593330634384553e-05, "loss": 2.6203, "step": 25220 }, { "epoch": 0.33, "learning_rate": 7.592457984704931e-05, "loss": 2.679, "step": 25225 }, { "epoch": 0.33, "learning_rate": 7.591585227009061e-05, "loss": 2.6765, "step": 25230 }, { "epoch": 0.33, "learning_rate": 7.59071236133331e-05, "loss": 2.5817, "step": 25235 }, { "epoch": 0.33, "learning_rate": 7.589839387714044e-05, "loss": 2.6358, "step": 25240 }, { "epoch": 0.33, "learning_rate": 7.588966306187636e-05, "loss": 2.5794, "step": 25245 }, { "epoch": 0.33, "learning_rate": 7.588093116790468e-05, "loss": 2.74, "step": 25250 }, { "epoch": 0.33, "learning_rate": 7.587219819558915e-05, "loss": 2.7354, "step": 25255 }, { "epoch": 0.33, "learning_rate": 7.586346414529368e-05, "loss": 2.484, "step": 25260 }, { "epoch": 0.33, "learning_rate": 7.585472901738217e-05, "loss": 2.5992, "step": 25265 }, { "epoch": 0.33, "learning_rate": 7.584599281221858e-05, "loss": 2.7015, "step": 25270 }, { "epoch": 0.33, "learning_rate": 7.583725553016689e-05, "loss": 2.5178, "step": 25275 }, { "epoch": 0.33, "learning_rate": 7.582851717159114e-05, "loss": 2.6454, "step": 25280 }, { "epoch": 0.33, "learning_rate": 7.581977773685544e-05, "loss": 2.6758, "step": 25285 }, { "epoch": 0.33, "learning_rate": 7.581103722632393e-05, "loss": 2.5771, "step": 25290 }, { "epoch": 0.33, "learning_rate": 7.580229564036076e-05, "loss": 2.5067, "step": 25295 }, { "epoch": 0.33, "learning_rate": 7.579355297933017e-05, "loss": 2.6545, "step": 25300 }, { "epoch": 0.33, "learning_rate": 7.578480924359644e-05, "loss": 2.7753, "step": 25305 }, { "epoch": 0.33, "learning_rate": 7.577606443352387e-05, "loss": 2.6239, "step": 25310 }, { "epoch": 0.33, "learning_rate": 7.57673185494768e-05, "loss": 2.7828, "step": 25315 }, { "epoch": 0.33, "learning_rate": 7.575857159181965e-05, "loss": 2.6114, "step": 25320 }, { "epoch": 0.33, "learning_rate": 7.574982356091686e-05, "loss": 2.7235, "step": 25325 }, { "epoch": 0.33, "learning_rate": 7.574107445713294e-05, "loss": 2.5473, "step": 25330 }, { "epoch": 0.33, "learning_rate": 7.573232428083241e-05, "loss": 2.5543, "step": 25335 }, { "epoch": 0.33, "learning_rate": 7.572357303237985e-05, "loss": 2.5405, "step": 25340 }, { "epoch": 0.33, "learning_rate": 7.57148207121399e-05, "loss": 2.5513, "step": 25345 }, { "epoch": 0.33, "learning_rate": 7.570606732047722e-05, "loss": 2.532, "step": 25350 }, { "epoch": 0.33, "learning_rate": 7.569731285775652e-05, "loss": 2.7703, "step": 25355 }, { "epoch": 0.33, "learning_rate": 7.568855732434256e-05, "loss": 2.6175, "step": 25360 }, { "epoch": 0.33, "learning_rate": 7.567980072060015e-05, "loss": 2.6013, "step": 25365 }, { "epoch": 0.33, "learning_rate": 7.567104304689415e-05, "loss": 2.5751, "step": 25370 }, { "epoch": 0.33, "learning_rate": 7.566228430358945e-05, "loss": 2.6469, "step": 25375 }, { "epoch": 0.33, "learning_rate": 7.565352449105096e-05, "loss": 2.6261, "step": 25380 }, { "epoch": 0.33, "learning_rate": 7.56447636096437e-05, "loss": 2.5469, "step": 25385 }, { "epoch": 0.33, "learning_rate": 7.563600165973266e-05, "loss": 2.6366, "step": 25390 }, { "epoch": 0.33, "learning_rate": 7.562723864168294e-05, "loss": 2.5536, "step": 25395 }, { "epoch": 0.33, "learning_rate": 7.561847455585965e-05, "loss": 2.6088, "step": 25400 }, { "epoch": 0.33, "learning_rate": 7.560970940262795e-05, "loss": 2.5426, "step": 25405 }, { "epoch": 0.33, "learning_rate": 7.560094318235304e-05, "loss": 2.7084, "step": 25410 }, { "epoch": 0.33, "learning_rate": 7.559217589540018e-05, "loss": 2.7684, "step": 25415 }, { "epoch": 0.33, "learning_rate": 7.558340754213464e-05, "loss": 2.6667, "step": 25420 }, { "epoch": 0.33, "learning_rate": 7.55746381229218e-05, "loss": 2.6845, "step": 25425 }, { "epoch": 0.33, "learning_rate": 7.5565867638127e-05, "loss": 2.6794, "step": 25430 }, { "epoch": 0.33, "learning_rate": 7.55570960881157e-05, "loss": 2.6491, "step": 25435 }, { "epoch": 0.33, "learning_rate": 7.554832347325335e-05, "loss": 2.6826, "step": 25440 }, { "epoch": 0.33, "learning_rate": 7.553954979390548e-05, "loss": 2.6645, "step": 25445 }, { "epoch": 0.33, "learning_rate": 7.553077505043764e-05, "loss": 2.646, "step": 25450 }, { "epoch": 0.33, "learning_rate": 7.552199924321543e-05, "loss": 2.6978, "step": 25455 }, { "epoch": 0.33, "learning_rate": 7.551322237260452e-05, "loss": 2.6749, "step": 25460 }, { "epoch": 0.33, "learning_rate": 7.55044444389706e-05, "loss": 2.5577, "step": 25465 }, { "epoch": 0.33, "learning_rate": 7.549566544267939e-05, "loss": 2.6978, "step": 25470 }, { "epoch": 0.33, "learning_rate": 7.548688538409666e-05, "loss": 2.4774, "step": 25475 }, { "epoch": 0.33, "learning_rate": 7.547810426358828e-05, "loss": 2.5902, "step": 25480 }, { "epoch": 0.33, "learning_rate": 7.546932208152008e-05, "loss": 2.7045, "step": 25485 }, { "epoch": 0.33, "learning_rate": 7.546053883825802e-05, "loss": 2.5523, "step": 25490 }, { "epoch": 0.33, "learning_rate": 7.5451754534168e-05, "loss": 2.7626, "step": 25495 }, { "epoch": 0.33, "learning_rate": 7.544296916961608e-05, "loss": 2.6537, "step": 25500 }, { "epoch": 0.33, "learning_rate": 7.543418274496826e-05, "loss": 2.581, "step": 25505 }, { "epoch": 0.33, "learning_rate": 7.542539526059065e-05, "loss": 2.5358, "step": 25510 }, { "epoch": 0.33, "learning_rate": 7.54166067168494e-05, "loss": 2.6378, "step": 25515 }, { "epoch": 0.33, "learning_rate": 7.540781711411067e-05, "loss": 2.5906, "step": 25520 }, { "epoch": 0.33, "learning_rate": 7.53990264527407e-05, "loss": 2.6373, "step": 25525 }, { "epoch": 0.33, "learning_rate": 7.539023473310576e-05, "loss": 2.7207, "step": 25530 }, { "epoch": 0.33, "learning_rate": 7.538144195557213e-05, "loss": 2.6776, "step": 25535 }, { "epoch": 0.33, "learning_rate": 7.53726481205062e-05, "loss": 2.5819, "step": 25540 }, { "epoch": 0.33, "learning_rate": 7.536385322827435e-05, "loss": 2.6269, "step": 25545 }, { "epoch": 0.33, "learning_rate": 7.535505727924303e-05, "loss": 2.7223, "step": 25550 }, { "epoch": 0.33, "learning_rate": 7.534626027377873e-05, "loss": 2.64, "step": 25555 }, { "epoch": 0.33, "learning_rate": 7.5337462212248e-05, "loss": 2.7258, "step": 25560 }, { "epoch": 0.33, "learning_rate": 7.532866309501738e-05, "loss": 2.6488, "step": 25565 }, { "epoch": 0.33, "learning_rate": 7.531986292245352e-05, "loss": 2.5005, "step": 25570 }, { "epoch": 0.33, "learning_rate": 7.531106169492305e-05, "loss": 2.5794, "step": 25575 }, { "epoch": 0.33, "learning_rate": 7.530225941279274e-05, "loss": 2.6649, "step": 25580 }, { "epoch": 0.33, "learning_rate": 7.529345607642928e-05, "loss": 2.6729, "step": 25585 }, { "epoch": 0.33, "learning_rate": 7.528465168619949e-05, "loss": 2.6429, "step": 25590 }, { "epoch": 0.33, "learning_rate": 7.527584624247022e-05, "loss": 2.6223, "step": 25595 }, { "epoch": 0.33, "learning_rate": 7.526703974560833e-05, "loss": 2.6902, "step": 25600 }, { "epoch": 0.33, "learning_rate": 7.525823219598078e-05, "loss": 2.5905, "step": 25605 }, { "epoch": 0.33, "learning_rate": 7.52494235939545e-05, "loss": 2.7126, "step": 25610 }, { "epoch": 0.33, "learning_rate": 7.524061393989654e-05, "loss": 2.5128, "step": 25615 }, { "epoch": 0.33, "learning_rate": 7.523180323417396e-05, "loss": 2.5972, "step": 25620 }, { "epoch": 0.33, "learning_rate": 7.522299147715384e-05, "loss": 2.6688, "step": 25625 }, { "epoch": 0.33, "learning_rate": 7.521417866920332e-05, "loss": 2.5325, "step": 25630 }, { "epoch": 0.33, "learning_rate": 7.520536481068963e-05, "loss": 2.6492, "step": 25635 }, { "epoch": 0.33, "learning_rate": 7.519654990197998e-05, "loss": 2.7798, "step": 25640 }, { "epoch": 0.33, "learning_rate": 7.518773394344162e-05, "loss": 2.6244, "step": 25645 }, { "epoch": 0.33, "learning_rate": 7.517891693544194e-05, "loss": 2.7467, "step": 25650 }, { "epoch": 0.33, "learning_rate": 7.517009887834827e-05, "loss": 2.7685, "step": 25655 }, { "epoch": 0.33, "learning_rate": 7.5161279772528e-05, "loss": 2.7553, "step": 25660 }, { "epoch": 0.33, "learning_rate": 7.51524596183486e-05, "loss": 2.7899, "step": 25665 }, { "epoch": 0.33, "learning_rate": 7.514363841617757e-05, "loss": 2.7197, "step": 25670 }, { "epoch": 0.33, "learning_rate": 7.513481616638246e-05, "loss": 2.6306, "step": 25675 }, { "epoch": 0.33, "learning_rate": 7.512599286933084e-05, "loss": 2.6863, "step": 25680 }, { "epoch": 0.33, "learning_rate": 7.511716852539033e-05, "loss": 2.7164, "step": 25685 }, { "epoch": 0.33, "learning_rate": 7.510834313492863e-05, "loss": 2.6593, "step": 25690 }, { "epoch": 0.33, "learning_rate": 7.509951669831341e-05, "loss": 2.6788, "step": 25695 }, { "epoch": 0.33, "learning_rate": 7.509068921591246e-05, "loss": 2.6131, "step": 25700 }, { "epoch": 0.33, "learning_rate": 7.50818606880936e-05, "loss": 2.6841, "step": 25705 }, { "epoch": 0.33, "learning_rate": 7.507303111522463e-05, "loss": 2.6242, "step": 25710 }, { "epoch": 0.33, "learning_rate": 7.506420049767347e-05, "loss": 2.5434, "step": 25715 }, { "epoch": 0.33, "learning_rate": 7.505536883580807e-05, "loss": 2.5733, "step": 25720 }, { "epoch": 0.33, "learning_rate": 7.504653612999634e-05, "loss": 2.6262, "step": 25725 }, { "epoch": 0.33, "learning_rate": 7.503770238060635e-05, "loss": 2.7464, "step": 25730 }, { "epoch": 0.33, "learning_rate": 7.502886758800616e-05, "loss": 2.6485, "step": 25735 }, { "epoch": 0.33, "learning_rate": 7.502003175256387e-05, "loss": 2.4272, "step": 25740 }, { "epoch": 0.33, "learning_rate": 7.501119487464763e-05, "loss": 2.6813, "step": 25745 }, { "epoch": 0.33, "learning_rate": 7.500235695462563e-05, "loss": 2.5489, "step": 25750 }, { "epoch": 0.33, "learning_rate": 7.499351799286612e-05, "loss": 2.7061, "step": 25755 }, { "epoch": 0.33, "learning_rate": 7.498467798973736e-05, "loss": 2.7314, "step": 25760 }, { "epoch": 0.33, "learning_rate": 7.497583694560769e-05, "loss": 2.5536, "step": 25765 }, { "epoch": 0.33, "learning_rate": 7.496699486084548e-05, "loss": 2.6943, "step": 25770 }, { "epoch": 0.33, "learning_rate": 7.495815173581914e-05, "loss": 2.6982, "step": 25775 }, { "epoch": 0.33, "learning_rate": 7.494930757089711e-05, "loss": 2.6518, "step": 25780 }, { "epoch": 0.33, "learning_rate": 7.494046236644789e-05, "loss": 2.6751, "step": 25785 }, { "epoch": 0.33, "learning_rate": 7.493161612284001e-05, "loss": 2.5298, "step": 25790 }, { "epoch": 0.33, "learning_rate": 7.492276884044207e-05, "loss": 2.5354, "step": 25795 }, { "epoch": 0.33, "learning_rate": 7.491392051962272e-05, "loss": 2.4923, "step": 25800 }, { "epoch": 0.33, "learning_rate": 7.490507116075059e-05, "loss": 2.584, "step": 25805 }, { "epoch": 0.33, "learning_rate": 7.489622076419442e-05, "loss": 2.5358, "step": 25810 }, { "epoch": 0.34, "learning_rate": 7.488736933032296e-05, "loss": 2.5432, "step": 25815 }, { "epoch": 0.34, "learning_rate": 7.4878516859505e-05, "loss": 2.503, "step": 25820 }, { "epoch": 0.34, "learning_rate": 7.486966335210937e-05, "loss": 2.6527, "step": 25825 }, { "epoch": 0.34, "learning_rate": 7.486080880850499e-05, "loss": 2.7393, "step": 25830 }, { "epoch": 0.34, "learning_rate": 7.48519532290608e-05, "loss": 2.6807, "step": 25835 }, { "epoch": 0.34, "learning_rate": 7.484309661414572e-05, "loss": 2.4613, "step": 25840 }, { "epoch": 0.34, "learning_rate": 7.48342389641288e-05, "loss": 2.6449, "step": 25845 }, { "epoch": 0.34, "learning_rate": 7.482538027937909e-05, "loss": 2.6591, "step": 25850 }, { "epoch": 0.34, "learning_rate": 7.481652056026571e-05, "loss": 2.7542, "step": 25855 }, { "epoch": 0.34, "learning_rate": 7.480765980715777e-05, "loss": 2.5547, "step": 25860 }, { "epoch": 0.34, "learning_rate": 7.479879802042449e-05, "loss": 2.5915, "step": 25865 }, { "epoch": 0.34, "learning_rate": 7.47899352004351e-05, "loss": 2.7042, "step": 25870 }, { "epoch": 0.34, "learning_rate": 7.478107134755886e-05, "loss": 2.6073, "step": 25875 }, { "epoch": 0.34, "learning_rate": 7.477220646216508e-05, "loss": 2.5168, "step": 25880 }, { "epoch": 0.34, "learning_rate": 7.476334054462316e-05, "loss": 2.6293, "step": 25885 }, { "epoch": 0.34, "learning_rate": 7.475447359530244e-05, "loss": 2.588, "step": 25890 }, { "epoch": 0.34, "learning_rate": 7.474560561457244e-05, "loss": 2.642, "step": 25895 }, { "epoch": 0.34, "learning_rate": 7.47367366028026e-05, "loss": 2.6765, "step": 25900 }, { "epoch": 0.34, "learning_rate": 7.472786656036245e-05, "loss": 2.6871, "step": 25905 }, { "epoch": 0.34, "learning_rate": 7.471899548762159e-05, "loss": 2.513, "step": 25910 }, { "epoch": 0.34, "learning_rate": 7.471012338494963e-05, "loss": 2.6933, "step": 25915 }, { "epoch": 0.34, "learning_rate": 7.470125025271624e-05, "loss": 2.6462, "step": 25920 }, { "epoch": 0.34, "learning_rate": 7.46923760912911e-05, "loss": 2.615, "step": 25925 }, { "epoch": 0.34, "learning_rate": 7.468350090104398e-05, "loss": 2.6526, "step": 25930 }, { "epoch": 0.34, "learning_rate": 7.467462468234467e-05, "loss": 2.6535, "step": 25935 }, { "epoch": 0.34, "learning_rate": 7.466574743556298e-05, "loss": 2.612, "step": 25940 }, { "epoch": 0.34, "learning_rate": 7.46568691610688e-05, "loss": 2.5927, "step": 25945 }, { "epoch": 0.34, "learning_rate": 7.464798985923205e-05, "loss": 2.7098, "step": 25950 }, { "epoch": 0.34, "learning_rate": 7.463910953042268e-05, "loss": 2.573, "step": 25955 }, { "epoch": 0.34, "learning_rate": 7.463022817501071e-05, "loss": 2.6272, "step": 25960 }, { "epoch": 0.34, "learning_rate": 7.462134579336619e-05, "loss": 2.6452, "step": 25965 }, { "epoch": 0.34, "learning_rate": 7.46124623858592e-05, "loss": 2.6719, "step": 25970 }, { "epoch": 0.34, "learning_rate": 7.460357795285985e-05, "loss": 2.5185, "step": 25975 }, { "epoch": 0.34, "learning_rate": 7.459469249473836e-05, "loss": 2.5829, "step": 25980 }, { "epoch": 0.34, "learning_rate": 7.45858060118649e-05, "loss": 2.648, "step": 25985 }, { "epoch": 0.34, "learning_rate": 7.457691850460977e-05, "loss": 2.6992, "step": 25990 }, { "epoch": 0.34, "learning_rate": 7.456802997334327e-05, "loss": 2.7052, "step": 25995 }, { "epoch": 0.34, "learning_rate": 7.455914041843572e-05, "loss": 2.376, "step": 26000 }, { "epoch": 0.34, "learning_rate": 7.455024984025751e-05, "loss": 2.6334, "step": 26005 }, { "epoch": 0.34, "learning_rate": 7.45413582391791e-05, "loss": 2.7114, "step": 26010 }, { "epoch": 0.34, "learning_rate": 7.453246561557094e-05, "loss": 2.7568, "step": 26015 }, { "epoch": 0.34, "learning_rate": 7.452357196980357e-05, "loss": 2.5616, "step": 26020 }, { "epoch": 0.34, "learning_rate": 7.451467730224752e-05, "loss": 2.7087, "step": 26025 }, { "epoch": 0.34, "learning_rate": 7.450578161327339e-05, "loss": 2.6009, "step": 26030 }, { "epoch": 0.34, "learning_rate": 7.449688490325184e-05, "loss": 2.6178, "step": 26035 }, { "epoch": 0.34, "learning_rate": 7.448798717255356e-05, "loss": 2.6524, "step": 26040 }, { "epoch": 0.34, "learning_rate": 7.447908842154929e-05, "loss": 2.7022, "step": 26045 }, { "epoch": 0.34, "learning_rate": 7.447018865060977e-05, "loss": 2.6813, "step": 26050 }, { "epoch": 0.34, "learning_rate": 7.446128786010582e-05, "loss": 2.5606, "step": 26055 }, { "epoch": 0.34, "learning_rate": 7.445238605040831e-05, "loss": 2.5729, "step": 26060 }, { "epoch": 0.34, "learning_rate": 7.444348322188813e-05, "loss": 2.6152, "step": 26065 }, { "epoch": 0.34, "learning_rate": 7.443457937491623e-05, "loss": 2.4829, "step": 26070 }, { "epoch": 0.34, "learning_rate": 7.442567450986359e-05, "loss": 2.602, "step": 26075 }, { "epoch": 0.34, "learning_rate": 7.441676862710124e-05, "loss": 2.8043, "step": 26080 }, { "epoch": 0.34, "learning_rate": 7.440786172700024e-05, "loss": 2.5323, "step": 26085 }, { "epoch": 0.34, "learning_rate": 7.439895380993171e-05, "loss": 2.6363, "step": 26090 }, { "epoch": 0.34, "learning_rate": 7.439004487626679e-05, "loss": 2.5818, "step": 26095 }, { "epoch": 0.34, "learning_rate": 7.438113492637669e-05, "loss": 2.5727, "step": 26100 }, { "epoch": 0.34, "learning_rate": 7.437222396063263e-05, "loss": 2.5698, "step": 26105 }, { "epoch": 0.34, "learning_rate": 7.436331197940591e-05, "loss": 2.6146, "step": 26110 }, { "epoch": 0.34, "learning_rate": 7.435439898306786e-05, "loss": 2.6575, "step": 26115 }, { "epoch": 0.34, "learning_rate": 7.434548497198983e-05, "loss": 2.6814, "step": 26120 }, { "epoch": 0.34, "learning_rate": 7.433656994654321e-05, "loss": 2.4715, "step": 26125 }, { "epoch": 0.34, "learning_rate": 7.432765390709948e-05, "loss": 2.4725, "step": 26130 }, { "epoch": 0.34, "learning_rate": 7.431873685403012e-05, "loss": 2.6323, "step": 26135 }, { "epoch": 0.34, "learning_rate": 7.430981878770666e-05, "loss": 2.6205, "step": 26140 }, { "epoch": 0.34, "learning_rate": 7.430089970850068e-05, "loss": 2.5706, "step": 26145 }, { "epoch": 0.34, "learning_rate": 7.429197961678381e-05, "loss": 2.6583, "step": 26150 }, { "epoch": 0.34, "learning_rate": 7.428305851292769e-05, "loss": 2.6089, "step": 26155 }, { "epoch": 0.34, "learning_rate": 7.427413639730403e-05, "loss": 2.6315, "step": 26160 }, { "epoch": 0.34, "learning_rate": 7.426521327028459e-05, "loss": 2.5684, "step": 26165 }, { "epoch": 0.34, "learning_rate": 7.425628913224114e-05, "loss": 2.5891, "step": 26170 }, { "epoch": 0.34, "learning_rate": 7.42473639835455e-05, "loss": 2.6988, "step": 26175 }, { "epoch": 0.34, "learning_rate": 7.423843782456957e-05, "loss": 2.6444, "step": 26180 }, { "epoch": 0.34, "learning_rate": 7.422951065568526e-05, "loss": 2.571, "step": 26185 }, { "epoch": 0.34, "learning_rate": 7.422058247726449e-05, "loss": 2.6783, "step": 26190 }, { "epoch": 0.34, "learning_rate": 7.42116532896793e-05, "loss": 2.6308, "step": 26195 }, { "epoch": 0.34, "learning_rate": 7.42027230933017e-05, "loss": 2.6535, "step": 26200 }, { "epoch": 0.34, "learning_rate": 7.419379188850379e-05, "loss": 2.5975, "step": 26205 }, { "epoch": 0.34, "learning_rate": 7.418485967565768e-05, "loss": 2.6142, "step": 26210 }, { "epoch": 0.34, "learning_rate": 7.417592645513556e-05, "loss": 2.6593, "step": 26215 }, { "epoch": 0.34, "learning_rate": 7.41669922273096e-05, "loss": 2.6609, "step": 26220 }, { "epoch": 0.34, "learning_rate": 7.41580569925521e-05, "loss": 2.5283, "step": 26225 }, { "epoch": 0.34, "learning_rate": 7.41491207512353e-05, "loss": 2.6012, "step": 26230 }, { "epoch": 0.34, "learning_rate": 7.414018350373157e-05, "loss": 2.5496, "step": 26235 }, { "epoch": 0.34, "learning_rate": 7.413124525041325e-05, "loss": 2.5286, "step": 26240 }, { "epoch": 0.34, "learning_rate": 7.41223059916528e-05, "loss": 2.6971, "step": 26245 }, { "epoch": 0.34, "learning_rate": 7.411336572782263e-05, "loss": 2.6252, "step": 26250 }, { "epoch": 0.34, "learning_rate": 7.41044244592953e-05, "loss": 2.5551, "step": 26255 }, { "epoch": 0.34, "learning_rate": 7.409548218644332e-05, "loss": 2.5768, "step": 26260 }, { "epoch": 0.34, "learning_rate": 7.408653890963928e-05, "loss": 2.7331, "step": 26265 }, { "epoch": 0.34, "learning_rate": 7.407759462925579e-05, "loss": 2.5824, "step": 26270 }, { "epoch": 0.34, "learning_rate": 7.406864934566553e-05, "loss": 2.6153, "step": 26275 }, { "epoch": 0.34, "learning_rate": 7.405970305924123e-05, "loss": 2.623, "step": 26280 }, { "epoch": 0.34, "learning_rate": 7.405075577035561e-05, "loss": 2.619, "step": 26285 }, { "epoch": 0.34, "learning_rate": 7.40418074793815e-05, "loss": 2.5518, "step": 26290 }, { "epoch": 0.34, "learning_rate": 7.40328581866917e-05, "loss": 2.4759, "step": 26295 }, { "epoch": 0.34, "learning_rate": 7.402390789265909e-05, "loss": 2.7206, "step": 26300 }, { "epoch": 0.34, "learning_rate": 7.401495659765662e-05, "loss": 2.6898, "step": 26305 }, { "epoch": 0.34, "learning_rate": 7.400600430205723e-05, "loss": 2.5924, "step": 26310 }, { "epoch": 0.34, "learning_rate": 7.399705100623393e-05, "loss": 2.5636, "step": 26315 }, { "epoch": 0.34, "learning_rate": 7.398809671055975e-05, "loss": 2.4935, "step": 26320 }, { "epoch": 0.34, "learning_rate": 7.397914141540779e-05, "loss": 2.6848, "step": 26325 }, { "epoch": 0.34, "learning_rate": 7.397018512115118e-05, "loss": 2.5541, "step": 26330 }, { "epoch": 0.34, "learning_rate": 7.396122782816307e-05, "loss": 2.6171, "step": 26335 }, { "epoch": 0.34, "learning_rate": 7.395226953681667e-05, "loss": 2.6685, "step": 26340 }, { "epoch": 0.34, "learning_rate": 7.394331024748526e-05, "loss": 2.7123, "step": 26345 }, { "epoch": 0.34, "learning_rate": 7.393434996054213e-05, "loss": 2.6154, "step": 26350 }, { "epoch": 0.34, "learning_rate": 7.392538867636058e-05, "loss": 2.6114, "step": 26355 }, { "epoch": 0.34, "learning_rate": 7.391642639531404e-05, "loss": 2.6144, "step": 26360 }, { "epoch": 0.34, "learning_rate": 7.390746311777588e-05, "loss": 2.5613, "step": 26365 }, { "epoch": 0.34, "learning_rate": 7.389849884411958e-05, "loss": 2.6367, "step": 26370 }, { "epoch": 0.34, "learning_rate": 7.388953357471864e-05, "loss": 2.6673, "step": 26375 }, { "epoch": 0.34, "learning_rate": 7.388056730994661e-05, "loss": 2.6149, "step": 26380 }, { "epoch": 0.34, "learning_rate": 7.387160005017708e-05, "loss": 2.5889, "step": 26385 }, { "epoch": 0.34, "learning_rate": 7.386263179578365e-05, "loss": 2.6119, "step": 26390 }, { "epoch": 0.34, "learning_rate": 7.385366254714001e-05, "loss": 2.7193, "step": 26395 }, { "epoch": 0.34, "learning_rate": 7.384469230461986e-05, "loss": 2.7149, "step": 26400 }, { "epoch": 0.34, "learning_rate": 7.383572106859694e-05, "loss": 2.6521, "step": 26405 }, { "epoch": 0.34, "learning_rate": 7.382674883944506e-05, "loss": 2.8003, "step": 26410 }, { "epoch": 0.34, "learning_rate": 7.381777561753805e-05, "loss": 2.5818, "step": 26415 }, { "epoch": 0.34, "learning_rate": 7.38088014032498e-05, "loss": 2.4786, "step": 26420 }, { "epoch": 0.34, "learning_rate": 7.379982619695417e-05, "loss": 2.6589, "step": 26425 }, { "epoch": 0.34, "learning_rate": 7.379084999902517e-05, "loss": 2.5107, "step": 26430 }, { "epoch": 0.34, "learning_rate": 7.378187280983677e-05, "loss": 2.5569, "step": 26435 }, { "epoch": 0.34, "learning_rate": 7.377289462976305e-05, "loss": 2.5665, "step": 26440 }, { "epoch": 0.34, "learning_rate": 7.376391545917805e-05, "loss": 2.6835, "step": 26445 }, { "epoch": 0.34, "learning_rate": 7.375493529845591e-05, "loss": 2.6201, "step": 26450 }, { "epoch": 0.34, "learning_rate": 7.374595414797079e-05, "loss": 2.7637, "step": 26455 }, { "epoch": 0.34, "learning_rate": 7.373697200809687e-05, "loss": 2.6259, "step": 26460 }, { "epoch": 0.34, "learning_rate": 7.372798887920843e-05, "loss": 2.6301, "step": 26465 }, { "epoch": 0.34, "learning_rate": 7.371900476167976e-05, "loss": 2.669, "step": 26470 }, { "epoch": 0.34, "learning_rate": 7.371001965588517e-05, "loss": 2.6483, "step": 26475 }, { "epoch": 0.34, "learning_rate": 7.370103356219903e-05, "loss": 2.5981, "step": 26480 }, { "epoch": 0.34, "learning_rate": 7.369204648099575e-05, "loss": 2.6405, "step": 26485 }, { "epoch": 0.34, "learning_rate": 7.368305841264979e-05, "loss": 2.5455, "step": 26490 }, { "epoch": 0.34, "learning_rate": 7.367406935753565e-05, "loss": 2.6216, "step": 26495 }, { "epoch": 0.34, "learning_rate": 7.366507931602785e-05, "loss": 2.5852, "step": 26500 }, { "epoch": 0.34, "learning_rate": 7.365608828850097e-05, "loss": 2.5483, "step": 26505 }, { "epoch": 0.34, "learning_rate": 7.364709627532964e-05, "loss": 2.5223, "step": 26510 }, { "epoch": 0.34, "learning_rate": 7.363810327688848e-05, "loss": 2.6924, "step": 26515 }, { "epoch": 0.34, "learning_rate": 7.362910929355222e-05, "loss": 2.5585, "step": 26520 }, { "epoch": 0.34, "learning_rate": 7.362011432569559e-05, "loss": 2.489, "step": 26525 }, { "epoch": 0.34, "learning_rate": 7.361111837369337e-05, "loss": 2.7423, "step": 26530 }, { "epoch": 0.34, "learning_rate": 7.360212143792039e-05, "loss": 2.5327, "step": 26535 }, { "epoch": 0.34, "learning_rate": 7.35931235187515e-05, "loss": 2.677, "step": 26540 }, { "epoch": 0.34, "learning_rate": 7.358412461656162e-05, "loss": 2.6269, "step": 26545 }, { "epoch": 0.34, "learning_rate": 7.357512473172568e-05, "loss": 2.6755, "step": 26550 }, { "epoch": 0.34, "learning_rate": 7.356612386461867e-05, "loss": 2.6881, "step": 26555 }, { "epoch": 0.34, "learning_rate": 7.35571220156156e-05, "loss": 2.7606, "step": 26560 }, { "epoch": 0.34, "learning_rate": 7.354811918509157e-05, "loss": 2.664, "step": 26565 }, { "epoch": 0.34, "learning_rate": 7.353911537342166e-05, "loss": 2.647, "step": 26570 }, { "epoch": 0.34, "learning_rate": 7.353011058098104e-05, "loss": 2.5805, "step": 26575 }, { "epoch": 0.34, "learning_rate": 7.352110480814489e-05, "loss": 2.6149, "step": 26580 }, { "epoch": 0.35, "learning_rate": 7.351209805528843e-05, "loss": 2.6965, "step": 26585 }, { "epoch": 0.35, "learning_rate": 7.350309032278693e-05, "loss": 2.7605, "step": 26590 }, { "epoch": 0.35, "learning_rate": 7.349408161101573e-05, "loss": 2.553, "step": 26595 }, { "epoch": 0.35, "learning_rate": 7.348507192035017e-05, "loss": 2.6768, "step": 26600 }, { "epoch": 0.35, "learning_rate": 7.347606125116564e-05, "loss": 2.5778, "step": 26605 }, { "epoch": 0.35, "learning_rate": 7.346704960383756e-05, "loss": 2.5063, "step": 26610 }, { "epoch": 0.35, "learning_rate": 7.345803697874144e-05, "loss": 2.732, "step": 26615 }, { "epoch": 0.35, "learning_rate": 7.344902337625276e-05, "loss": 2.6962, "step": 26620 }, { "epoch": 0.35, "learning_rate": 7.34400087967471e-05, "loss": 2.6537, "step": 26625 }, { "epoch": 0.35, "learning_rate": 7.343099324060007e-05, "loss": 2.6766, "step": 26630 }, { "epoch": 0.35, "learning_rate": 7.342197670818728e-05, "loss": 2.7123, "step": 26635 }, { "epoch": 0.35, "learning_rate": 7.341295919988442e-05, "loss": 2.642, "step": 26640 }, { "epoch": 0.35, "learning_rate": 7.34039407160672e-05, "loss": 2.5612, "step": 26645 }, { "epoch": 0.35, "learning_rate": 7.339492125711139e-05, "loss": 2.6949, "step": 26650 }, { "epoch": 0.35, "learning_rate": 7.338590082339278e-05, "loss": 2.6453, "step": 26655 }, { "epoch": 0.35, "learning_rate": 7.337687941528725e-05, "loss": 2.6745, "step": 26660 }, { "epoch": 0.35, "learning_rate": 7.336785703317065e-05, "loss": 2.6881, "step": 26665 }, { "epoch": 0.35, "learning_rate": 7.335883367741889e-05, "loss": 2.6037, "step": 26670 }, { "epoch": 0.35, "learning_rate": 7.334980934840796e-05, "loss": 2.7316, "step": 26675 }, { "epoch": 0.35, "learning_rate": 7.334078404651383e-05, "loss": 2.6015, "step": 26680 }, { "epoch": 0.35, "learning_rate": 7.333175777211259e-05, "loss": 2.6887, "step": 26685 }, { "epoch": 0.35, "learning_rate": 7.33227305255803e-05, "loss": 2.6771, "step": 26690 }, { "epoch": 0.35, "learning_rate": 7.331370230729309e-05, "loss": 2.7008, "step": 26695 }, { "epoch": 0.35, "learning_rate": 7.330467311762712e-05, "loss": 2.6957, "step": 26700 }, { "epoch": 0.35, "learning_rate": 7.329564295695861e-05, "loss": 2.5533, "step": 26705 }, { "epoch": 0.35, "learning_rate": 7.328661182566378e-05, "loss": 2.5973, "step": 26710 }, { "epoch": 0.35, "learning_rate": 7.327757972411894e-05, "loss": 2.5921, "step": 26715 }, { "epoch": 0.35, "learning_rate": 7.326854665270042e-05, "loss": 2.6887, "step": 26720 }, { "epoch": 0.35, "learning_rate": 7.325951261178457e-05, "loss": 2.6388, "step": 26725 }, { "epoch": 0.35, "learning_rate": 7.325047760174783e-05, "loss": 2.6229, "step": 26730 }, { "epoch": 0.35, "learning_rate": 7.32414416229666e-05, "loss": 2.7714, "step": 26735 }, { "epoch": 0.35, "learning_rate": 7.32324046758174e-05, "loss": 2.6379, "step": 26740 }, { "epoch": 0.35, "learning_rate": 7.322336676067679e-05, "loss": 2.6422, "step": 26745 }, { "epoch": 0.35, "learning_rate": 7.321432787792126e-05, "loss": 2.7277, "step": 26750 }, { "epoch": 0.35, "learning_rate": 7.320528802792749e-05, "loss": 2.5367, "step": 26755 }, { "epoch": 0.35, "learning_rate": 7.319624721107211e-05, "loss": 2.6687, "step": 26760 }, { "epoch": 0.35, "learning_rate": 7.318720542773181e-05, "loss": 2.5321, "step": 26765 }, { "epoch": 0.35, "learning_rate": 7.31781626782833e-05, "loss": 2.5199, "step": 26770 }, { "epoch": 0.35, "learning_rate": 7.316911896310338e-05, "loss": 2.5033, "step": 26775 }, { "epoch": 0.35, "learning_rate": 7.316007428256886e-05, "loss": 2.5152, "step": 26780 }, { "epoch": 0.35, "learning_rate": 7.315102863705657e-05, "loss": 2.5276, "step": 26785 }, { "epoch": 0.35, "learning_rate": 7.314198202694343e-05, "loss": 2.6624, "step": 26790 }, { "epoch": 0.35, "learning_rate": 7.313293445260635e-05, "loss": 2.6912, "step": 26795 }, { "epoch": 0.35, "learning_rate": 7.312388591442232e-05, "loss": 2.7334, "step": 26800 }, { "epoch": 0.35, "learning_rate": 7.311483641276833e-05, "loss": 2.757, "step": 26805 }, { "epoch": 0.35, "learning_rate": 7.310578594802144e-05, "loss": 2.6905, "step": 26810 }, { "epoch": 0.35, "learning_rate": 7.309673452055876e-05, "loss": 2.6974, "step": 26815 }, { "epoch": 0.35, "learning_rate": 7.308768213075741e-05, "loss": 2.6179, "step": 26820 }, { "epoch": 0.35, "learning_rate": 7.307862877899456e-05, "loss": 2.672, "step": 26825 }, { "epoch": 0.35, "learning_rate": 7.306957446564744e-05, "loss": 2.6504, "step": 26830 }, { "epoch": 0.35, "learning_rate": 7.306051919109327e-05, "loss": 2.5895, "step": 26835 }, { "epoch": 0.35, "learning_rate": 7.305146295570939e-05, "loss": 2.5436, "step": 26840 }, { "epoch": 0.35, "learning_rate": 7.304240575987307e-05, "loss": 2.632, "step": 26845 }, { "epoch": 0.35, "learning_rate": 7.303334760396174e-05, "loss": 2.6119, "step": 26850 }, { "epoch": 0.35, "learning_rate": 7.30242884883528e-05, "loss": 2.6395, "step": 26855 }, { "epoch": 0.35, "learning_rate": 7.301522841342369e-05, "loss": 2.7632, "step": 26860 }, { "epoch": 0.35, "learning_rate": 7.300616737955192e-05, "loss": 2.5858, "step": 26865 }, { "epoch": 0.35, "learning_rate": 7.299710538711499e-05, "loss": 2.7152, "step": 26870 }, { "epoch": 0.35, "learning_rate": 7.29880424364905e-05, "loss": 2.5267, "step": 26875 }, { "epoch": 0.35, "learning_rate": 7.297897852805609e-05, "loss": 2.5914, "step": 26880 }, { "epoch": 0.35, "learning_rate": 7.296991366218935e-05, "loss": 2.5962, "step": 26885 }, { "epoch": 0.35, "learning_rate": 7.296084783926802e-05, "loss": 2.5648, "step": 26890 }, { "epoch": 0.35, "learning_rate": 7.295178105966981e-05, "loss": 2.5126, "step": 26895 }, { "epoch": 0.35, "learning_rate": 7.294271332377251e-05, "loss": 2.6228, "step": 26900 }, { "epoch": 0.35, "learning_rate": 7.29336446319539e-05, "loss": 2.6448, "step": 26905 }, { "epoch": 0.35, "learning_rate": 7.292457498459188e-05, "loss": 2.4711, "step": 26910 }, { "epoch": 0.35, "learning_rate": 7.29155043820643e-05, "loss": 2.7099, "step": 26915 }, { "epoch": 0.35, "learning_rate": 7.290643282474911e-05, "loss": 2.5227, "step": 26920 }, { "epoch": 0.35, "learning_rate": 7.28973603130243e-05, "loss": 2.5385, "step": 26925 }, { "epoch": 0.35, "learning_rate": 7.288828684726783e-05, "loss": 2.5242, "step": 26930 }, { "epoch": 0.35, "learning_rate": 7.28792124278578e-05, "loss": 2.5842, "step": 26935 }, { "epoch": 0.35, "learning_rate": 7.287013705517229e-05, "loss": 2.6937, "step": 26940 }, { "epoch": 0.35, "learning_rate": 7.286106072958941e-05, "loss": 2.6849, "step": 26945 }, { "epoch": 0.35, "learning_rate": 7.285198345148736e-05, "loss": 2.688, "step": 26950 }, { "epoch": 0.35, "learning_rate": 7.284290522124432e-05, "loss": 2.5652, "step": 26955 }, { "epoch": 0.35, "learning_rate": 7.283382603923856e-05, "loss": 2.7167, "step": 26960 }, { "epoch": 0.35, "learning_rate": 7.282474590584838e-05, "loss": 2.5795, "step": 26965 }, { "epoch": 0.35, "learning_rate": 7.281566482145205e-05, "loss": 2.7209, "step": 26970 }, { "epoch": 0.35, "learning_rate": 7.280658278642802e-05, "loss": 2.6514, "step": 26975 }, { "epoch": 0.35, "learning_rate": 7.279749980115466e-05, "loss": 2.6435, "step": 26980 }, { "epoch": 0.35, "learning_rate": 7.278841586601039e-05, "loss": 2.6757, "step": 26985 }, { "epoch": 0.35, "learning_rate": 7.277933098137374e-05, "loss": 2.6937, "step": 26990 }, { "epoch": 0.35, "learning_rate": 7.277024514762323e-05, "loss": 2.504, "step": 26995 }, { "epoch": 0.35, "learning_rate": 7.27611583651374e-05, "loss": 2.605, "step": 27000 }, { "epoch": 0.35, "learning_rate": 7.275207063429488e-05, "loss": 2.7204, "step": 27005 }, { "epoch": 0.35, "learning_rate": 7.27429819554743e-05, "loss": 2.6257, "step": 27010 }, { "epoch": 0.35, "learning_rate": 7.27338923290544e-05, "loss": 2.5621, "step": 27015 }, { "epoch": 0.35, "learning_rate": 7.27248017554138e-05, "loss": 2.6698, "step": 27020 }, { "epoch": 0.35, "learning_rate": 7.271571023493134e-05, "loss": 2.4751, "step": 27025 }, { "epoch": 0.35, "learning_rate": 7.270661776798582e-05, "loss": 2.5566, "step": 27030 }, { "epoch": 0.35, "learning_rate": 7.269752435495606e-05, "loss": 2.4919, "step": 27035 }, { "epoch": 0.35, "learning_rate": 7.268842999622095e-05, "loss": 2.5607, "step": 27040 }, { "epoch": 0.35, "learning_rate": 7.267933469215942e-05, "loss": 2.5793, "step": 27045 }, { "epoch": 0.35, "learning_rate": 7.267023844315042e-05, "loss": 2.6417, "step": 27050 }, { "epoch": 0.35, "learning_rate": 7.266114124957295e-05, "loss": 2.5666, "step": 27055 }, { "epoch": 0.35, "learning_rate": 7.265204311180607e-05, "loss": 2.6829, "step": 27060 }, { "epoch": 0.35, "learning_rate": 7.264294403022883e-05, "loss": 2.4716, "step": 27065 }, { "epoch": 0.35, "learning_rate": 7.263384400522035e-05, "loss": 2.5761, "step": 27070 }, { "epoch": 0.35, "learning_rate": 7.262474303715981e-05, "loss": 2.6054, "step": 27075 }, { "epoch": 0.35, "learning_rate": 7.26156411264264e-05, "loss": 2.6074, "step": 27080 }, { "epoch": 0.35, "learning_rate": 7.260653827339937e-05, "loss": 2.6649, "step": 27085 }, { "epoch": 0.35, "learning_rate": 7.259743447845795e-05, "loss": 2.6135, "step": 27090 }, { "epoch": 0.35, "learning_rate": 7.258832974198149e-05, "loss": 2.6795, "step": 27095 }, { "epoch": 0.35, "learning_rate": 7.257922406434933e-05, "loss": 2.6571, "step": 27100 }, { "epoch": 0.35, "learning_rate": 7.257011744594089e-05, "loss": 2.5311, "step": 27105 }, { "epoch": 0.35, "learning_rate": 7.256100988713557e-05, "loss": 2.6749, "step": 27110 }, { "epoch": 0.35, "learning_rate": 7.255190138831286e-05, "loss": 2.5425, "step": 27115 }, { "epoch": 0.35, "learning_rate": 7.254279194985228e-05, "loss": 2.6419, "step": 27120 }, { "epoch": 0.35, "learning_rate": 7.253368157213333e-05, "loss": 2.6495, "step": 27125 }, { "epoch": 0.35, "learning_rate": 7.252457025553566e-05, "loss": 2.6256, "step": 27130 }, { "epoch": 0.35, "learning_rate": 7.251545800043888e-05, "loss": 2.5833, "step": 27135 }, { "epoch": 0.35, "learning_rate": 7.250634480722262e-05, "loss": 2.5496, "step": 27140 }, { "epoch": 0.35, "learning_rate": 7.249723067626664e-05, "loss": 2.6984, "step": 27145 }, { "epoch": 0.35, "learning_rate": 7.248811560795066e-05, "loss": 2.5919, "step": 27150 }, { "epoch": 0.35, "learning_rate": 7.247899960265447e-05, "loss": 2.575, "step": 27155 }, { "epoch": 0.35, "learning_rate": 7.246988266075787e-05, "loss": 2.5494, "step": 27160 }, { "epoch": 0.35, "learning_rate": 7.246076478264076e-05, "loss": 2.5285, "step": 27165 }, { "epoch": 0.35, "learning_rate": 7.245164596868302e-05, "loss": 2.6278, "step": 27170 }, { "epoch": 0.35, "learning_rate": 7.24425262192646e-05, "loss": 2.5992, "step": 27175 }, { "epoch": 0.35, "learning_rate": 7.243340553476547e-05, "loss": 2.6107, "step": 27180 }, { "epoch": 0.35, "learning_rate": 7.242428391556566e-05, "loss": 2.664, "step": 27185 }, { "epoch": 0.35, "learning_rate": 7.24151613620452e-05, "loss": 2.5793, "step": 27190 }, { "epoch": 0.35, "learning_rate": 7.240603787458422e-05, "loss": 2.5656, "step": 27195 }, { "epoch": 0.35, "learning_rate": 7.239691345356283e-05, "loss": 2.6523, "step": 27200 }, { "epoch": 0.35, "learning_rate": 7.238778809936124e-05, "loss": 2.5535, "step": 27205 }, { "epoch": 0.35, "learning_rate": 7.237866181235963e-05, "loss": 2.6359, "step": 27210 }, { "epoch": 0.35, "learning_rate": 7.236953459293827e-05, "loss": 2.7264, "step": 27215 }, { "epoch": 0.35, "learning_rate": 7.236040644147743e-05, "loss": 2.5738, "step": 27220 }, { "epoch": 0.35, "learning_rate": 7.235127735835744e-05, "loss": 2.6357, "step": 27225 }, { "epoch": 0.35, "learning_rate": 7.234214734395871e-05, "loss": 2.6332, "step": 27230 }, { "epoch": 0.35, "learning_rate": 7.233301639866159e-05, "loss": 2.6114, "step": 27235 }, { "epoch": 0.35, "learning_rate": 7.232388452284657e-05, "loss": 2.7383, "step": 27240 }, { "epoch": 0.35, "learning_rate": 7.231475171689412e-05, "loss": 2.5572, "step": 27245 }, { "epoch": 0.35, "learning_rate": 7.230561798118476e-05, "loss": 2.6435, "step": 27250 }, { "epoch": 0.35, "learning_rate": 7.229648331609906e-05, "loss": 2.6814, "step": 27255 }, { "epoch": 0.35, "learning_rate": 7.228734772201761e-05, "loss": 2.4455, "step": 27260 }, { "epoch": 0.35, "learning_rate": 7.227821119932104e-05, "loss": 2.6039, "step": 27265 }, { "epoch": 0.35, "learning_rate": 7.226907374839007e-05, "loss": 2.48, "step": 27270 }, { "epoch": 0.35, "learning_rate": 7.225993536960538e-05, "loss": 2.5493, "step": 27275 }, { "epoch": 0.35, "learning_rate": 7.225079606334774e-05, "loss": 2.6534, "step": 27280 }, { "epoch": 0.35, "learning_rate": 7.224165582999794e-05, "loss": 2.6405, "step": 27285 }, { "epoch": 0.35, "learning_rate": 7.223251466993682e-05, "loss": 2.6355, "step": 27290 }, { "epoch": 0.35, "learning_rate": 7.222337258354521e-05, "loss": 2.5448, "step": 27295 }, { "epoch": 0.35, "learning_rate": 7.22142295712041e-05, "loss": 2.5839, "step": 27300 }, { "epoch": 0.35, "learning_rate": 7.220508563329438e-05, "loss": 2.6965, "step": 27305 }, { "epoch": 0.35, "learning_rate": 7.219594077019705e-05, "loss": 2.5068, "step": 27310 }, { "epoch": 0.35, "learning_rate": 7.218679498229313e-05, "loss": 2.6662, "step": 27315 }, { "epoch": 0.35, "learning_rate": 7.217764826996372e-05, "loss": 2.6978, "step": 27320 }, { "epoch": 0.35, "learning_rate": 7.216850063358986e-05, "loss": 2.555, "step": 27325 }, { "epoch": 0.35, "learning_rate": 7.215935207355275e-05, "loss": 2.72, "step": 27330 }, { "epoch": 0.35, "learning_rate": 7.215020259023356e-05, "loss": 2.7301, "step": 27335 }, { "epoch": 0.35, "learning_rate": 7.214105218401348e-05, "loss": 2.7419, "step": 27340 }, { "epoch": 0.35, "learning_rate": 7.213190085527378e-05, "loss": 2.7356, "step": 27345 }, { "epoch": 0.35, "learning_rate": 7.212274860439576e-05, "loss": 2.5807, "step": 27350 }, { "epoch": 0.36, "learning_rate": 7.211359543176075e-05, "loss": 2.5446, "step": 27355 }, { "epoch": 0.36, "learning_rate": 7.210444133775014e-05, "loss": 2.6204, "step": 27360 }, { "epoch": 0.36, "learning_rate": 7.209528632274532e-05, "loss": 2.6976, "step": 27365 }, { "epoch": 0.36, "learning_rate": 7.208613038712773e-05, "loss": 2.5779, "step": 27370 }, { "epoch": 0.36, "learning_rate": 7.207697353127889e-05, "loss": 2.5936, "step": 27375 }, { "epoch": 0.36, "learning_rate": 7.206781575558029e-05, "loss": 2.6271, "step": 27380 }, { "epoch": 0.36, "learning_rate": 7.205865706041349e-05, "loss": 2.4783, "step": 27385 }, { "epoch": 0.36, "learning_rate": 7.204949744616014e-05, "loss": 2.6247, "step": 27390 }, { "epoch": 0.36, "learning_rate": 7.204033691320185e-05, "loss": 2.5668, "step": 27395 }, { "epoch": 0.36, "learning_rate": 7.203117546192032e-05, "loss": 2.6263, "step": 27400 }, { "epoch": 0.36, "learning_rate": 7.202201309269722e-05, "loss": 2.6503, "step": 27405 }, { "epoch": 0.36, "learning_rate": 7.201284980591435e-05, "loss": 2.6947, "step": 27410 }, { "epoch": 0.36, "learning_rate": 7.200368560195349e-05, "loss": 2.5731, "step": 27415 }, { "epoch": 0.36, "learning_rate": 7.199452048119646e-05, "loss": 2.5694, "step": 27420 }, { "epoch": 0.36, "learning_rate": 7.198535444402514e-05, "loss": 2.635, "step": 27425 }, { "epoch": 0.36, "learning_rate": 7.197618749082146e-05, "loss": 2.7101, "step": 27430 }, { "epoch": 0.36, "learning_rate": 7.196701962196732e-05, "loss": 2.6807, "step": 27435 }, { "epoch": 0.36, "learning_rate": 7.195785083784475e-05, "loss": 2.6531, "step": 27440 }, { "epoch": 0.36, "learning_rate": 7.194868113883573e-05, "loss": 2.5149, "step": 27445 }, { "epoch": 0.36, "learning_rate": 7.193951052532235e-05, "loss": 2.5109, "step": 27450 }, { "epoch": 0.36, "learning_rate": 7.19303389976867e-05, "loss": 2.5589, "step": 27455 }, { "epoch": 0.36, "learning_rate": 7.192116655631094e-05, "loss": 2.5955, "step": 27460 }, { "epoch": 0.36, "learning_rate": 7.19119932015772e-05, "loss": 2.582, "step": 27465 }, { "epoch": 0.36, "learning_rate": 7.190281893386773e-05, "loss": 2.5747, "step": 27470 }, { "epoch": 0.36, "learning_rate": 7.189364375356475e-05, "loss": 2.6717, "step": 27475 }, { "epoch": 0.36, "learning_rate": 7.188446766105057e-05, "loss": 2.5591, "step": 27480 }, { "epoch": 0.36, "learning_rate": 7.187529065670752e-05, "loss": 2.5288, "step": 27485 }, { "epoch": 0.36, "learning_rate": 7.186611274091797e-05, "loss": 2.6139, "step": 27490 }, { "epoch": 0.36, "learning_rate": 7.185693391406431e-05, "loss": 2.5265, "step": 27495 }, { "epoch": 0.36, "learning_rate": 7.184775417652899e-05, "loss": 2.6215, "step": 27500 }, { "epoch": 0.36, "learning_rate": 7.183857352869445e-05, "loss": 2.7132, "step": 27505 }, { "epoch": 0.36, "learning_rate": 7.182939197094324e-05, "loss": 2.527, "step": 27510 }, { "epoch": 0.36, "learning_rate": 7.182020950365794e-05, "loss": 2.5789, "step": 27515 }, { "epoch": 0.36, "learning_rate": 7.181102612722111e-05, "loss": 2.6361, "step": 27520 }, { "epoch": 0.36, "learning_rate": 7.18018418420154e-05, "loss": 2.6018, "step": 27525 }, { "epoch": 0.36, "learning_rate": 7.179265664842345e-05, "loss": 2.5555, "step": 27530 }, { "epoch": 0.36, "learning_rate": 7.178347054682798e-05, "loss": 2.5643, "step": 27535 }, { "epoch": 0.36, "learning_rate": 7.177428353761173e-05, "loss": 2.5084, "step": 27540 }, { "epoch": 0.36, "learning_rate": 7.17650956211575e-05, "loss": 2.7213, "step": 27545 }, { "epoch": 0.36, "learning_rate": 7.175590679784811e-05, "loss": 2.5794, "step": 27550 }, { "epoch": 0.36, "learning_rate": 7.17467170680664e-05, "loss": 2.5311, "step": 27555 }, { "epoch": 0.36, "learning_rate": 7.173752643219526e-05, "loss": 2.8051, "step": 27560 }, { "epoch": 0.36, "learning_rate": 7.172833489061764e-05, "loss": 2.6759, "step": 27565 }, { "epoch": 0.36, "learning_rate": 7.17191424437165e-05, "loss": 2.606, "step": 27570 }, { "epoch": 0.36, "learning_rate": 7.170994909187485e-05, "loss": 2.5573, "step": 27575 }, { "epoch": 0.36, "learning_rate": 7.170075483547576e-05, "loss": 2.5587, "step": 27580 }, { "epoch": 0.36, "learning_rate": 7.169155967490229e-05, "loss": 2.6748, "step": 27585 }, { "epoch": 0.36, "learning_rate": 7.168236361053755e-05, "loss": 2.6715, "step": 27590 }, { "epoch": 0.36, "learning_rate": 7.167316664276474e-05, "loss": 2.5534, "step": 27595 }, { "epoch": 0.36, "learning_rate": 7.166396877196699e-05, "loss": 2.5182, "step": 27600 }, { "epoch": 0.36, "learning_rate": 7.16547699985276e-05, "loss": 2.6305, "step": 27605 }, { "epoch": 0.36, "learning_rate": 7.164557032282982e-05, "loss": 2.6183, "step": 27610 }, { "epoch": 0.36, "learning_rate": 7.163636974525696e-05, "loss": 2.5598, "step": 27615 }, { "epoch": 0.36, "learning_rate": 7.162716826619237e-05, "loss": 2.7084, "step": 27620 }, { "epoch": 0.36, "learning_rate": 7.161796588601943e-05, "loss": 2.6477, "step": 27625 }, { "epoch": 0.36, "learning_rate": 7.160876260512154e-05, "loss": 2.6936, "step": 27630 }, { "epoch": 0.36, "learning_rate": 7.15995584238822e-05, "loss": 2.6662, "step": 27635 }, { "epoch": 0.36, "learning_rate": 7.159035334268489e-05, "loss": 2.5105, "step": 27640 }, { "epoch": 0.36, "learning_rate": 7.158114736191316e-05, "loss": 2.578, "step": 27645 }, { "epoch": 0.36, "learning_rate": 7.157194048195055e-05, "loss": 2.6493, "step": 27650 }, { "epoch": 0.36, "learning_rate": 7.15627327031807e-05, "loss": 2.6884, "step": 27655 }, { "epoch": 0.36, "learning_rate": 7.155352402598723e-05, "loss": 2.6618, "step": 27660 }, { "epoch": 0.36, "learning_rate": 7.154431445075385e-05, "loss": 2.5637, "step": 27665 }, { "epoch": 0.36, "learning_rate": 7.153510397786425e-05, "loss": 2.7352, "step": 27670 }, { "epoch": 0.36, "learning_rate": 7.152589260770223e-05, "loss": 2.5317, "step": 27675 }, { "epoch": 0.36, "learning_rate": 7.151668034065158e-05, "loss": 2.6411, "step": 27680 }, { "epoch": 0.36, "learning_rate": 7.150746717709613e-05, "loss": 2.5732, "step": 27685 }, { "epoch": 0.36, "learning_rate": 7.149825311741972e-05, "loss": 2.4983, "step": 27690 }, { "epoch": 0.36, "learning_rate": 7.148903816200629e-05, "loss": 2.6282, "step": 27695 }, { "epoch": 0.36, "learning_rate": 7.147982231123977e-05, "loss": 2.5951, "step": 27700 }, { "epoch": 0.36, "learning_rate": 7.147060556550417e-05, "loss": 2.5658, "step": 27705 }, { "epoch": 0.36, "learning_rate": 7.14613879251835e-05, "loss": 2.6881, "step": 27710 }, { "epoch": 0.36, "learning_rate": 7.145216939066182e-05, "loss": 2.6044, "step": 27715 }, { "epoch": 0.36, "learning_rate": 7.144294996232319e-05, "loss": 2.5467, "step": 27720 }, { "epoch": 0.36, "learning_rate": 7.143372964055179e-05, "loss": 2.6179, "step": 27725 }, { "epoch": 0.36, "learning_rate": 7.142450842573176e-05, "loss": 2.5385, "step": 27730 }, { "epoch": 0.36, "learning_rate": 7.141528631824732e-05, "loss": 2.7326, "step": 27735 }, { "epoch": 0.36, "learning_rate": 7.140606331848273e-05, "loss": 2.5669, "step": 27740 }, { "epoch": 0.36, "learning_rate": 7.139683942682225e-05, "loss": 2.5255, "step": 27745 }, { "epoch": 0.36, "learning_rate": 7.13876146436502e-05, "loss": 2.5765, "step": 27750 }, { "epoch": 0.36, "learning_rate": 7.137838896935093e-05, "loss": 2.5815, "step": 27755 }, { "epoch": 0.36, "learning_rate": 7.136916240430885e-05, "loss": 2.6097, "step": 27760 }, { "epoch": 0.36, "learning_rate": 7.135993494890838e-05, "loss": 2.5707, "step": 27765 }, { "epoch": 0.36, "learning_rate": 7.135070660353398e-05, "loss": 2.7389, "step": 27770 }, { "epoch": 0.36, "learning_rate": 7.13414773685702e-05, "loss": 2.6863, "step": 27775 }, { "epoch": 0.36, "learning_rate": 7.133224724440152e-05, "loss": 2.6078, "step": 27780 }, { "epoch": 0.36, "learning_rate": 7.132301623141253e-05, "loss": 2.5685, "step": 27785 }, { "epoch": 0.36, "learning_rate": 7.131378432998788e-05, "loss": 2.6324, "step": 27790 }, { "epoch": 0.36, "learning_rate": 7.130455154051219e-05, "loss": 2.544, "step": 27795 }, { "epoch": 0.36, "learning_rate": 7.129531786337017e-05, "loss": 2.7356, "step": 27800 }, { "epoch": 0.36, "learning_rate": 7.128608329894654e-05, "loss": 2.6003, "step": 27805 }, { "epoch": 0.36, "learning_rate": 7.127684784762606e-05, "loss": 2.6185, "step": 27810 }, { "epoch": 0.36, "learning_rate": 7.126761150979352e-05, "loss": 2.6512, "step": 27815 }, { "epoch": 0.36, "learning_rate": 7.125837428583377e-05, "loss": 2.5336, "step": 27820 }, { "epoch": 0.36, "learning_rate": 7.124913617613169e-05, "loss": 2.6967, "step": 27825 }, { "epoch": 0.36, "learning_rate": 7.123989718107219e-05, "loss": 2.719, "step": 27830 }, { "epoch": 0.36, "learning_rate": 7.123065730104021e-05, "loss": 2.5096, "step": 27835 }, { "epoch": 0.36, "learning_rate": 7.122141653642073e-05, "loss": 2.6755, "step": 27840 }, { "epoch": 0.36, "learning_rate": 7.121217488759877e-05, "loss": 2.6019, "step": 27845 }, { "epoch": 0.36, "learning_rate": 7.120293235495942e-05, "loss": 2.5531, "step": 27850 }, { "epoch": 0.36, "learning_rate": 7.119368893888773e-05, "loss": 2.5729, "step": 27855 }, { "epoch": 0.36, "learning_rate": 7.118444463976887e-05, "loss": 2.5772, "step": 27860 }, { "epoch": 0.36, "learning_rate": 7.117519945798799e-05, "loss": 2.5814, "step": 27865 }, { "epoch": 0.36, "learning_rate": 7.11659533939303e-05, "loss": 2.7178, "step": 27870 }, { "epoch": 0.36, "learning_rate": 7.115670644798105e-05, "loss": 2.5404, "step": 27875 }, { "epoch": 0.36, "learning_rate": 7.11474586205255e-05, "loss": 2.6338, "step": 27880 }, { "epoch": 0.36, "learning_rate": 7.113820991194898e-05, "loss": 2.6289, "step": 27885 }, { "epoch": 0.36, "learning_rate": 7.112896032263683e-05, "loss": 2.5339, "step": 27890 }, { "epoch": 0.36, "learning_rate": 7.111970985297446e-05, "loss": 2.6075, "step": 27895 }, { "epoch": 0.36, "learning_rate": 7.11104585033473e-05, "loss": 2.5491, "step": 27900 }, { "epoch": 0.36, "learning_rate": 7.110120627414079e-05, "loss": 2.5282, "step": 27905 }, { "epoch": 0.36, "learning_rate": 7.109195316574042e-05, "loss": 2.7445, "step": 27910 }, { "epoch": 0.36, "learning_rate": 7.108269917853177e-05, "loss": 2.6293, "step": 27915 }, { "epoch": 0.36, "learning_rate": 7.107344431290036e-05, "loss": 2.6764, "step": 27920 }, { "epoch": 0.36, "learning_rate": 7.106418856923185e-05, "loss": 2.5797, "step": 27925 }, { "epoch": 0.36, "learning_rate": 7.105493194791186e-05, "loss": 2.6539, "step": 27930 }, { "epoch": 0.36, "learning_rate": 7.104567444932605e-05, "loss": 2.7307, "step": 27935 }, { "epoch": 0.36, "learning_rate": 7.10364160738602e-05, "loss": 2.4933, "step": 27940 }, { "epoch": 0.36, "learning_rate": 7.10271568219e-05, "loss": 2.6396, "step": 27945 }, { "epoch": 0.36, "learning_rate": 7.101789669383128e-05, "loss": 2.7721, "step": 27950 }, { "epoch": 0.36, "learning_rate": 7.100863569003985e-05, "loss": 2.5363, "step": 27955 }, { "epoch": 0.36, "learning_rate": 7.09993738109116e-05, "loss": 2.6065, "step": 27960 }, { "epoch": 0.36, "learning_rate": 7.099011105683241e-05, "loss": 2.7244, "step": 27965 }, { "epoch": 0.36, "learning_rate": 7.098084742818822e-05, "loss": 2.5009, "step": 27970 }, { "epoch": 0.36, "learning_rate": 7.097158292536502e-05, "loss": 2.5963, "step": 27975 }, { "epoch": 0.36, "learning_rate": 7.09623175487488e-05, "loss": 2.5152, "step": 27980 }, { "epoch": 0.36, "learning_rate": 7.095305129872563e-05, "loss": 2.5694, "step": 27985 }, { "epoch": 0.36, "learning_rate": 7.094378417568156e-05, "loss": 2.5834, "step": 27990 }, { "epoch": 0.36, "learning_rate": 7.093451618000273e-05, "loss": 2.5377, "step": 27995 }, { "epoch": 0.36, "learning_rate": 7.092524731207532e-05, "loss": 2.5181, "step": 28000 }, { "epoch": 0.36, "learning_rate": 7.091597757228547e-05, "loss": 2.6326, "step": 28005 }, { "epoch": 0.36, "learning_rate": 7.090670696101946e-05, "loss": 2.6434, "step": 28010 }, { "epoch": 0.36, "learning_rate": 7.089743547866351e-05, "loss": 2.6602, "step": 28015 }, { "epoch": 0.36, "learning_rate": 7.088816312560398e-05, "loss": 2.6472, "step": 28020 }, { "epoch": 0.36, "learning_rate": 7.087888990222715e-05, "loss": 2.4622, "step": 28025 }, { "epoch": 0.36, "learning_rate": 7.086961580891942e-05, "loss": 2.5421, "step": 28030 }, { "epoch": 0.36, "learning_rate": 7.08603408460672e-05, "loss": 2.4743, "step": 28035 }, { "epoch": 0.36, "learning_rate": 7.085106501405693e-05, "loss": 2.6478, "step": 28040 }, { "epoch": 0.36, "learning_rate": 7.08417883132751e-05, "loss": 2.7064, "step": 28045 }, { "epoch": 0.36, "learning_rate": 7.083251074410821e-05, "loss": 2.6407, "step": 28050 }, { "epoch": 0.36, "learning_rate": 7.082323230694286e-05, "loss": 2.6478, "step": 28055 }, { "epoch": 0.36, "learning_rate": 7.081395300216559e-05, "loss": 2.5926, "step": 28060 }, { "epoch": 0.36, "learning_rate": 7.080467283016307e-05, "loss": 2.6235, "step": 28065 }, { "epoch": 0.36, "learning_rate": 7.079539179132194e-05, "loss": 2.6231, "step": 28070 }, { "epoch": 0.36, "learning_rate": 7.078610988602887e-05, "loss": 2.6535, "step": 28075 }, { "epoch": 0.36, "learning_rate": 7.077682711467066e-05, "loss": 2.5982, "step": 28080 }, { "epoch": 0.36, "learning_rate": 7.076754347763405e-05, "loss": 2.5871, "step": 28085 }, { "epoch": 0.36, "learning_rate": 7.075825897530586e-05, "loss": 2.7386, "step": 28090 }, { "epoch": 0.36, "learning_rate": 7.07489736080729e-05, "loss": 2.5669, "step": 28095 }, { "epoch": 0.36, "learning_rate": 7.073968737632208e-05, "loss": 2.5925, "step": 28100 }, { "epoch": 0.36, "learning_rate": 7.073040028044034e-05, "loss": 2.5854, "step": 28105 }, { "epoch": 0.36, "learning_rate": 7.072111232081456e-05, "loss": 2.4574, "step": 28110 }, { "epoch": 0.36, "learning_rate": 7.071182349783178e-05, "loss": 2.7098, "step": 28115 }, { "epoch": 0.36, "learning_rate": 7.070253381187903e-05, "loss": 2.6342, "step": 28120 }, { "epoch": 0.37, "learning_rate": 7.069324326334334e-05, "loss": 2.6185, "step": 28125 }, { "epoch": 0.37, "learning_rate": 7.068395185261183e-05, "loss": 2.4827, "step": 28130 }, { "epoch": 0.37, "learning_rate": 7.067465958007163e-05, "loss": 2.6374, "step": 28135 }, { "epoch": 0.37, "learning_rate": 7.066536644610988e-05, "loss": 2.6075, "step": 28140 }, { "epoch": 0.37, "learning_rate": 7.06560724511138e-05, "loss": 2.6553, "step": 28145 }, { "epoch": 0.37, "learning_rate": 7.064677759547065e-05, "loss": 2.4832, "step": 28150 }, { "epoch": 0.37, "learning_rate": 7.06374818795677e-05, "loss": 2.577, "step": 28155 }, { "epoch": 0.37, "learning_rate": 7.062818530379222e-05, "loss": 2.4309, "step": 28160 }, { "epoch": 0.37, "learning_rate": 7.061888786853162e-05, "loss": 2.613, "step": 28165 }, { "epoch": 0.37, "learning_rate": 7.060958957417323e-05, "loss": 2.6841, "step": 28170 }, { "epoch": 0.37, "learning_rate": 7.060029042110449e-05, "loss": 2.4837, "step": 28175 }, { "epoch": 0.37, "learning_rate": 7.059099040971286e-05, "loss": 2.5876, "step": 28180 }, { "epoch": 0.37, "learning_rate": 7.058168954038582e-05, "loss": 2.5534, "step": 28185 }, { "epoch": 0.37, "learning_rate": 7.05723878135109e-05, "loss": 2.5498, "step": 28190 }, { "epoch": 0.37, "learning_rate": 7.056308522947568e-05, "loss": 2.6432, "step": 28195 }, { "epoch": 0.37, "learning_rate": 7.055378178866773e-05, "loss": 2.4975, "step": 28200 }, { "epoch": 0.37, "learning_rate": 7.054447749147468e-05, "loss": 2.6418, "step": 28205 }, { "epoch": 0.37, "learning_rate": 7.053517233828422e-05, "loss": 2.668, "step": 28210 }, { "epoch": 0.37, "learning_rate": 7.052586632948404e-05, "loss": 2.6837, "step": 28215 }, { "epoch": 0.37, "learning_rate": 7.05165594654619e-05, "loss": 2.6153, "step": 28220 }, { "epoch": 0.37, "learning_rate": 7.050725174660556e-05, "loss": 2.729, "step": 28225 }, { "epoch": 0.37, "learning_rate": 7.049794317330283e-05, "loss": 2.6863, "step": 28230 }, { "epoch": 0.37, "learning_rate": 7.048863374594154e-05, "loss": 2.6886, "step": 28235 }, { "epoch": 0.37, "learning_rate": 7.047932346490962e-05, "loss": 2.6938, "step": 28240 }, { "epoch": 0.37, "learning_rate": 7.047001233059495e-05, "loss": 2.6863, "step": 28245 }, { "epoch": 0.37, "learning_rate": 7.04607003433855e-05, "loss": 2.7167, "step": 28250 }, { "epoch": 0.37, "learning_rate": 7.045138750366926e-05, "loss": 2.6935, "step": 28255 }, { "epoch": 0.37, "learning_rate": 7.044207381183424e-05, "loss": 2.7145, "step": 28260 }, { "epoch": 0.37, "learning_rate": 7.04327592682685e-05, "loss": 2.446, "step": 28265 }, { "epoch": 0.37, "learning_rate": 7.042344387336016e-05, "loss": 2.584, "step": 28270 }, { "epoch": 0.37, "learning_rate": 7.041412762749732e-05, "loss": 2.6403, "step": 28275 }, { "epoch": 0.37, "learning_rate": 7.040481053106819e-05, "loss": 2.5137, "step": 28280 }, { "epoch": 0.37, "learning_rate": 7.039549258446092e-05, "loss": 2.6137, "step": 28285 }, { "epoch": 0.37, "learning_rate": 7.03861737880638e-05, "loss": 2.6457, "step": 28290 }, { "epoch": 0.37, "learning_rate": 7.037685414226507e-05, "loss": 2.6, "step": 28295 }, { "epoch": 0.37, "learning_rate": 7.036753364745304e-05, "loss": 2.5729, "step": 28300 }, { "epoch": 0.37, "learning_rate": 7.035821230401605e-05, "loss": 2.6965, "step": 28305 }, { "epoch": 0.37, "learning_rate": 7.034889011234247e-05, "loss": 2.5404, "step": 28310 }, { "epoch": 0.37, "learning_rate": 7.033956707282077e-05, "loss": 2.6154, "step": 28315 }, { "epoch": 0.37, "learning_rate": 7.033024318583934e-05, "loss": 2.6949, "step": 28320 }, { "epoch": 0.37, "learning_rate": 7.03209184517867e-05, "loss": 2.6082, "step": 28325 }, { "epoch": 0.37, "learning_rate": 7.031159287105134e-05, "loss": 2.4881, "step": 28330 }, { "epoch": 0.37, "learning_rate": 7.030226644402185e-05, "loss": 2.5824, "step": 28335 }, { "epoch": 0.37, "learning_rate": 7.029293917108678e-05, "loss": 2.5693, "step": 28340 }, { "epoch": 0.37, "learning_rate": 7.02836110526348e-05, "loss": 2.69, "step": 28345 }, { "epoch": 0.37, "learning_rate": 7.027428208905456e-05, "loss": 2.4875, "step": 28350 }, { "epoch": 0.37, "learning_rate": 7.026495228073473e-05, "loss": 2.6226, "step": 28355 }, { "epoch": 0.37, "learning_rate": 7.025562162806404e-05, "loss": 2.6334, "step": 28360 }, { "epoch": 0.37, "learning_rate": 7.024629013143131e-05, "loss": 2.5767, "step": 28365 }, { "epoch": 0.37, "learning_rate": 7.02369577912253e-05, "loss": 2.6705, "step": 28370 }, { "epoch": 0.37, "learning_rate": 7.022762460783486e-05, "loss": 2.4944, "step": 28375 }, { "epoch": 0.37, "learning_rate": 7.021829058164886e-05, "loss": 2.543, "step": 28380 }, { "epoch": 0.37, "learning_rate": 7.02089557130562e-05, "loss": 2.6903, "step": 28385 }, { "epoch": 0.37, "learning_rate": 7.019962000244582e-05, "loss": 2.7392, "step": 28390 }, { "epoch": 0.37, "learning_rate": 7.019028345020671e-05, "loss": 2.5635, "step": 28395 }, { "epoch": 0.37, "learning_rate": 7.018094605672788e-05, "loss": 2.5863, "step": 28400 }, { "epoch": 0.37, "learning_rate": 7.017160782239837e-05, "loss": 2.6032, "step": 28405 }, { "epoch": 0.37, "learning_rate": 7.01622687476073e-05, "loss": 2.5374, "step": 28410 }, { "epoch": 0.37, "learning_rate": 7.015292883274374e-05, "loss": 2.5943, "step": 28415 }, { "epoch": 0.37, "learning_rate": 7.014358807819685e-05, "loss": 2.5528, "step": 28420 }, { "epoch": 0.37, "learning_rate": 7.013424648435584e-05, "loss": 2.4474, "step": 28425 }, { "epoch": 0.37, "learning_rate": 7.012490405160991e-05, "loss": 2.6328, "step": 28430 }, { "epoch": 0.37, "learning_rate": 7.011556078034835e-05, "loss": 2.5882, "step": 28435 }, { "epoch": 0.37, "learning_rate": 7.010621667096041e-05, "loss": 2.5818, "step": 28440 }, { "epoch": 0.37, "learning_rate": 7.009687172383545e-05, "loss": 2.5857, "step": 28445 }, { "epoch": 0.37, "learning_rate": 7.008752593936283e-05, "loss": 2.5988, "step": 28450 }, { "epoch": 0.37, "learning_rate": 7.007817931793192e-05, "loss": 2.5381, "step": 28455 }, { "epoch": 0.37, "learning_rate": 7.006883185993218e-05, "loss": 2.6015, "step": 28460 }, { "epoch": 0.37, "learning_rate": 7.005948356575309e-05, "loss": 2.5781, "step": 28465 }, { "epoch": 0.37, "learning_rate": 7.00501344357841e-05, "loss": 2.5346, "step": 28470 }, { "epoch": 0.37, "learning_rate": 7.00407844704148e-05, "loss": 2.5474, "step": 28475 }, { "epoch": 0.37, "learning_rate": 7.003143367003473e-05, "loss": 2.6135, "step": 28480 }, { "epoch": 0.37, "learning_rate": 7.002208203503351e-05, "loss": 2.6547, "step": 28485 }, { "epoch": 0.37, "learning_rate": 7.001272956580078e-05, "loss": 2.6888, "step": 28490 }, { "epoch": 0.37, "learning_rate": 7.000337626272619e-05, "loss": 2.6722, "step": 28495 }, { "epoch": 0.37, "learning_rate": 6.99940221261995e-05, "loss": 2.7284, "step": 28500 }, { "epoch": 0.37, "learning_rate": 6.998466715661043e-05, "loss": 2.6177, "step": 28505 }, { "epoch": 0.37, "learning_rate": 6.997531135434876e-05, "loss": 2.5985, "step": 28510 }, { "epoch": 0.37, "learning_rate": 6.99659547198043e-05, "loss": 2.6149, "step": 28515 }, { "epoch": 0.37, "learning_rate": 6.995659725336689e-05, "loss": 2.5816, "step": 28520 }, { "epoch": 0.37, "learning_rate": 6.994723895542644e-05, "loss": 2.5604, "step": 28525 }, { "epoch": 0.37, "learning_rate": 6.993787982637285e-05, "loss": 2.6646, "step": 28530 }, { "epoch": 0.37, "learning_rate": 6.99285198665961e-05, "loss": 2.6014, "step": 28535 }, { "epoch": 0.37, "learning_rate": 6.991915907648613e-05, "loss": 2.5966, "step": 28540 }, { "epoch": 0.37, "learning_rate": 6.990979745643303e-05, "loss": 2.5797, "step": 28545 }, { "epoch": 0.37, "learning_rate": 6.990043500682678e-05, "loss": 2.6312, "step": 28550 }, { "epoch": 0.37, "learning_rate": 6.989107172805752e-05, "loss": 2.6864, "step": 28555 }, { "epoch": 0.37, "learning_rate": 6.988170762051538e-05, "loss": 2.5837, "step": 28560 }, { "epoch": 0.37, "learning_rate": 6.987234268459051e-05, "loss": 2.6452, "step": 28565 }, { "epoch": 0.37, "learning_rate": 6.986297692067309e-05, "loss": 2.7074, "step": 28570 }, { "epoch": 0.37, "learning_rate": 6.985361032915337e-05, "loss": 2.4999, "step": 28575 }, { "epoch": 0.37, "learning_rate": 6.98442429104216e-05, "loss": 2.4744, "step": 28580 }, { "epoch": 0.37, "learning_rate": 6.983487466486809e-05, "loss": 2.7639, "step": 28585 }, { "epoch": 0.37, "learning_rate": 6.982550559288317e-05, "loss": 2.5783, "step": 28590 }, { "epoch": 0.37, "learning_rate": 6.98161356948572e-05, "loss": 2.5353, "step": 28595 }, { "epoch": 0.37, "learning_rate": 6.980676497118061e-05, "loss": 2.691, "step": 28600 }, { "epoch": 0.37, "learning_rate": 6.979739342224381e-05, "loss": 2.5613, "step": 28605 }, { "epoch": 0.37, "learning_rate": 6.978802104843727e-05, "loss": 2.5067, "step": 28610 }, { "epoch": 0.37, "learning_rate": 6.97786478501515e-05, "loss": 2.6345, "step": 28615 }, { "epoch": 0.37, "learning_rate": 6.976927382777705e-05, "loss": 2.5255, "step": 28620 }, { "epoch": 0.37, "learning_rate": 6.975989898170449e-05, "loss": 2.6189, "step": 28625 }, { "epoch": 0.37, "learning_rate": 6.975052331232441e-05, "loss": 2.559, "step": 28630 }, { "epoch": 0.37, "learning_rate": 6.974114682002748e-05, "loss": 2.5405, "step": 28635 }, { "epoch": 0.37, "learning_rate": 6.973176950520436e-05, "loss": 2.5677, "step": 28640 }, { "epoch": 0.37, "learning_rate": 6.972239136824575e-05, "loss": 2.5228, "step": 28645 }, { "epoch": 0.37, "learning_rate": 6.971301240954242e-05, "loss": 2.6627, "step": 28650 }, { "epoch": 0.37, "learning_rate": 6.970363262948515e-05, "loss": 2.6547, "step": 28655 }, { "epoch": 0.37, "learning_rate": 6.969425202846475e-05, "loss": 2.487, "step": 28660 }, { "epoch": 0.37, "learning_rate": 6.968487060687205e-05, "loss": 2.4914, "step": 28665 }, { "epoch": 0.37, "learning_rate": 6.967548836509795e-05, "loss": 2.671, "step": 28670 }, { "epoch": 0.37, "learning_rate": 6.966610530353334e-05, "loss": 2.46, "step": 28675 }, { "epoch": 0.37, "learning_rate": 6.965672142256921e-05, "loss": 2.6178, "step": 28680 }, { "epoch": 0.37, "learning_rate": 6.964733672259653e-05, "loss": 2.5356, "step": 28685 }, { "epoch": 0.37, "learning_rate": 6.963795120400632e-05, "loss": 2.5735, "step": 28690 }, { "epoch": 0.37, "learning_rate": 6.962856486718962e-05, "loss": 2.6182, "step": 28695 }, { "epoch": 0.37, "learning_rate": 6.961917771253751e-05, "loss": 2.4716, "step": 28700 }, { "epoch": 0.37, "learning_rate": 6.960978974044115e-05, "loss": 2.6055, "step": 28705 }, { "epoch": 0.37, "learning_rate": 6.960040095129167e-05, "loss": 2.6686, "step": 28710 }, { "epoch": 0.37, "learning_rate": 6.959101134548025e-05, "loss": 2.5882, "step": 28715 }, { "epoch": 0.37, "learning_rate": 6.958162092339813e-05, "loss": 2.7725, "step": 28720 }, { "epoch": 0.37, "learning_rate": 6.957222968543657e-05, "loss": 2.7884, "step": 28725 }, { "epoch": 0.37, "learning_rate": 6.956283763198684e-05, "loss": 2.5786, "step": 28730 }, { "epoch": 0.37, "learning_rate": 6.955344476344029e-05, "loss": 2.6243, "step": 28735 }, { "epoch": 0.37, "learning_rate": 6.954405108018825e-05, "loss": 2.5893, "step": 28740 }, { "epoch": 0.37, "learning_rate": 6.953465658262214e-05, "loss": 2.6276, "step": 28745 }, { "epoch": 0.37, "learning_rate": 6.952526127113339e-05, "loss": 2.6447, "step": 28750 }, { "epoch": 0.37, "learning_rate": 6.951586514611344e-05, "loss": 2.6901, "step": 28755 }, { "epoch": 0.37, "learning_rate": 6.95064682079538e-05, "loss": 2.5712, "step": 28760 }, { "epoch": 0.37, "learning_rate": 6.949707045704598e-05, "loss": 2.5461, "step": 28765 }, { "epoch": 0.37, "learning_rate": 6.948767189378155e-05, "loss": 2.467, "step": 28770 }, { "epoch": 0.37, "learning_rate": 6.947827251855212e-05, "loss": 2.7104, "step": 28775 }, { "epoch": 0.37, "learning_rate": 6.946887233174931e-05, "loss": 2.6417, "step": 28780 }, { "epoch": 0.37, "learning_rate": 6.94594713337648e-05, "loss": 2.4565, "step": 28785 }, { "epoch": 0.37, "learning_rate": 6.945006952499026e-05, "loss": 2.5821, "step": 28790 }, { "epoch": 0.37, "learning_rate": 6.944066690581745e-05, "loss": 2.5842, "step": 28795 }, { "epoch": 0.37, "learning_rate": 6.943126347663811e-05, "loss": 2.4402, "step": 28800 }, { "epoch": 0.37, "learning_rate": 6.942185923784405e-05, "loss": 2.6676, "step": 28805 }, { "epoch": 0.37, "learning_rate": 6.941245418982711e-05, "loss": 2.6693, "step": 28810 }, { "epoch": 0.37, "learning_rate": 6.940304833297917e-05, "loss": 2.595, "step": 28815 }, { "epoch": 0.37, "learning_rate": 6.939364166769208e-05, "loss": 2.3878, "step": 28820 }, { "epoch": 0.37, "learning_rate": 6.938423419435782e-05, "loss": 2.7018, "step": 28825 }, { "epoch": 0.37, "learning_rate": 6.937482591336834e-05, "loss": 2.6083, "step": 28830 }, { "epoch": 0.37, "learning_rate": 6.936541682511564e-05, "loss": 2.3709, "step": 28835 }, { "epoch": 0.37, "learning_rate": 6.935600692999176e-05, "loss": 2.6218, "step": 28840 }, { "epoch": 0.37, "learning_rate": 6.934659622838877e-05, "loss": 2.4954, "step": 28845 }, { "epoch": 0.37, "learning_rate": 6.933718472069877e-05, "loss": 2.5687, "step": 28850 }, { "epoch": 0.37, "learning_rate": 6.932777240731391e-05, "loss": 2.6419, "step": 28855 }, { "epoch": 0.37, "learning_rate": 6.931835928862632e-05, "loss": 2.5577, "step": 28860 }, { "epoch": 0.37, "learning_rate": 6.930894536502824e-05, "loss": 2.6168, "step": 28865 }, { "epoch": 0.37, "learning_rate": 6.92995306369119e-05, "loss": 2.6327, "step": 28870 }, { "epoch": 0.37, "learning_rate": 6.929011510466957e-05, "loss": 2.5263, "step": 28875 }, { "epoch": 0.37, "learning_rate": 6.928069876869354e-05, "loss": 2.5365, "step": 28880 }, { "epoch": 0.37, "learning_rate": 6.927128162937615e-05, "loss": 2.5427, "step": 28885 }, { "epoch": 0.37, "learning_rate": 6.926186368710979e-05, "loss": 2.5966, "step": 28890 }, { "epoch": 0.37, "learning_rate": 6.925244494228684e-05, "loss": 2.7116, "step": 28895 }, { "epoch": 0.38, "learning_rate": 6.924302539529974e-05, "loss": 2.6167, "step": 28900 }, { "epoch": 0.38, "learning_rate": 6.923360504654098e-05, "loss": 2.5011, "step": 28905 }, { "epoch": 0.38, "learning_rate": 6.922418389640306e-05, "loss": 2.6458, "step": 28910 }, { "epoch": 0.38, "learning_rate": 6.921476194527851e-05, "loss": 2.6204, "step": 28915 }, { "epoch": 0.38, "learning_rate": 6.920533919355988e-05, "loss": 2.6003, "step": 28920 }, { "epoch": 0.38, "learning_rate": 6.919591564163981e-05, "loss": 2.5768, "step": 28925 }, { "epoch": 0.38, "learning_rate": 6.918649128991093e-05, "loss": 2.4142, "step": 28930 }, { "epoch": 0.38, "learning_rate": 6.917706613876588e-05, "loss": 2.6571, "step": 28935 }, { "epoch": 0.38, "learning_rate": 6.916764018859742e-05, "loss": 2.7962, "step": 28940 }, { "epoch": 0.38, "learning_rate": 6.915821343979824e-05, "loss": 2.518, "step": 28945 }, { "epoch": 0.38, "learning_rate": 6.914878589276113e-05, "loss": 2.6208, "step": 28950 }, { "epoch": 0.38, "learning_rate": 6.913935754787888e-05, "loss": 2.5573, "step": 28955 }, { "epoch": 0.38, "learning_rate": 6.912992840554436e-05, "loss": 2.6971, "step": 28960 }, { "epoch": 0.38, "learning_rate": 6.91204984661504e-05, "loss": 2.7228, "step": 28965 }, { "epoch": 0.38, "learning_rate": 6.911106773008992e-05, "loss": 2.6648, "step": 28970 }, { "epoch": 0.38, "learning_rate": 6.910163619775588e-05, "loss": 2.5804, "step": 28975 }, { "epoch": 0.38, "learning_rate": 6.909220386954123e-05, "loss": 2.6273, "step": 28980 }, { "epoch": 0.38, "learning_rate": 6.908277074583895e-05, "loss": 2.456, "step": 28985 }, { "epoch": 0.38, "learning_rate": 6.907333682704212e-05, "loss": 2.6478, "step": 28990 }, { "epoch": 0.38, "learning_rate": 6.906390211354378e-05, "loss": 2.5701, "step": 28995 }, { "epoch": 0.38, "learning_rate": 6.905446660573705e-05, "loss": 2.5774, "step": 29000 }, { "epoch": 0.38, "learning_rate": 6.904503030401506e-05, "loss": 2.6409, "step": 29005 }, { "epoch": 0.38, "learning_rate": 6.903559320877098e-05, "loss": 2.7155, "step": 29010 }, { "epoch": 0.38, "learning_rate": 6.9026155320398e-05, "loss": 2.5209, "step": 29015 }, { "epoch": 0.38, "learning_rate": 6.901671663928935e-05, "loss": 2.5424, "step": 29020 }, { "epoch": 0.38, "learning_rate": 6.900727716583835e-05, "loss": 2.5683, "step": 29025 }, { "epoch": 0.38, "learning_rate": 6.899783690043822e-05, "loss": 2.5788, "step": 29030 }, { "epoch": 0.38, "learning_rate": 6.898839584348237e-05, "loss": 2.5484, "step": 29035 }, { "epoch": 0.38, "learning_rate": 6.897895399536413e-05, "loss": 2.5451, "step": 29040 }, { "epoch": 0.38, "learning_rate": 6.89695113564769e-05, "loss": 2.5811, "step": 29045 }, { "epoch": 0.38, "learning_rate": 6.896006792721411e-05, "loss": 2.6662, "step": 29050 }, { "epoch": 0.38, "learning_rate": 6.895062370796925e-05, "loss": 2.5921, "step": 29055 }, { "epoch": 0.38, "learning_rate": 6.894117869913577e-05, "loss": 2.617, "step": 29060 }, { "epoch": 0.38, "learning_rate": 6.893173290110726e-05, "loss": 2.6524, "step": 29065 }, { "epoch": 0.38, "learning_rate": 6.892228631427726e-05, "loss": 2.7114, "step": 29070 }, { "epoch": 0.38, "learning_rate": 6.891283893903935e-05, "loss": 2.6047, "step": 29075 }, { "epoch": 0.38, "learning_rate": 6.890339077578719e-05, "loss": 2.5176, "step": 29080 }, { "epoch": 0.38, "learning_rate": 6.889394182491444e-05, "loss": 2.6601, "step": 29085 }, { "epoch": 0.38, "learning_rate": 6.888449208681475e-05, "loss": 2.5681, "step": 29090 }, { "epoch": 0.38, "learning_rate": 6.887504156188191e-05, "loss": 2.4962, "step": 29095 }, { "epoch": 0.38, "learning_rate": 6.886559025050965e-05, "loss": 2.6891, "step": 29100 }, { "epoch": 0.38, "learning_rate": 6.885613815309177e-05, "loss": 2.5682, "step": 29105 }, { "epoch": 0.38, "learning_rate": 6.88466852700221e-05, "loss": 2.6251, "step": 29110 }, { "epoch": 0.38, "learning_rate": 6.883723160169449e-05, "loss": 2.6821, "step": 29115 }, { "epoch": 0.38, "learning_rate": 6.882777714850284e-05, "loss": 2.5128, "step": 29120 }, { "epoch": 0.38, "learning_rate": 6.881832191084107e-05, "loss": 2.6269, "step": 29125 }, { "epoch": 0.38, "learning_rate": 6.880886588910316e-05, "loss": 2.6551, "step": 29130 }, { "epoch": 0.38, "learning_rate": 6.879940908368307e-05, "loss": 2.5638, "step": 29135 }, { "epoch": 0.38, "learning_rate": 6.878995149497483e-05, "loss": 2.595, "step": 29140 }, { "epoch": 0.38, "learning_rate": 6.878049312337253e-05, "loss": 2.6067, "step": 29145 }, { "epoch": 0.38, "learning_rate": 6.877103396927021e-05, "loss": 2.5808, "step": 29150 }, { "epoch": 0.38, "learning_rate": 6.8761574033062e-05, "loss": 2.5888, "step": 29155 }, { "epoch": 0.38, "learning_rate": 6.875211331514208e-05, "loss": 2.4187, "step": 29160 }, { "epoch": 0.38, "learning_rate": 6.874265181590462e-05, "loss": 2.4569, "step": 29165 }, { "epoch": 0.38, "learning_rate": 6.873318953574384e-05, "loss": 2.659, "step": 29170 }, { "epoch": 0.38, "learning_rate": 6.872372647505398e-05, "loss": 2.6109, "step": 29175 }, { "epoch": 0.38, "learning_rate": 6.871426263422935e-05, "loss": 2.6116, "step": 29180 }, { "epoch": 0.38, "learning_rate": 6.870479801366425e-05, "loss": 2.5925, "step": 29185 }, { "epoch": 0.38, "learning_rate": 6.869533261375303e-05, "loss": 2.7038, "step": 29190 }, { "epoch": 0.38, "learning_rate": 6.868586643489007e-05, "loss": 2.4546, "step": 29195 }, { "epoch": 0.38, "learning_rate": 6.867639947746977e-05, "loss": 2.5696, "step": 29200 }, { "epoch": 0.38, "learning_rate": 6.86669317418866e-05, "loss": 2.4828, "step": 29205 }, { "epoch": 0.38, "learning_rate": 6.865746322853506e-05, "loss": 2.646, "step": 29210 }, { "epoch": 0.38, "learning_rate": 6.86479939378096e-05, "loss": 2.6415, "step": 29215 }, { "epoch": 0.38, "learning_rate": 6.86385238701048e-05, "loss": 2.4984, "step": 29220 }, { "epoch": 0.38, "learning_rate": 6.862905302581523e-05, "loss": 2.6088, "step": 29225 }, { "epoch": 0.38, "learning_rate": 6.861958140533551e-05, "loss": 2.6345, "step": 29230 }, { "epoch": 0.38, "learning_rate": 6.861010900906026e-05, "loss": 2.6761, "step": 29235 }, { "epoch": 0.38, "learning_rate": 6.860063583738417e-05, "loss": 2.4535, "step": 29240 }, { "epoch": 0.38, "learning_rate": 6.859116189070193e-05, "loss": 2.7058, "step": 29245 }, { "epoch": 0.38, "learning_rate": 6.858168716940828e-05, "loss": 2.576, "step": 29250 }, { "epoch": 0.38, "learning_rate": 6.857221167389801e-05, "loss": 2.6923, "step": 29255 }, { "epoch": 0.38, "learning_rate": 6.856273540456588e-05, "loss": 2.6267, "step": 29260 }, { "epoch": 0.38, "learning_rate": 6.855325836180677e-05, "loss": 2.5768, "step": 29265 }, { "epoch": 0.38, "learning_rate": 6.854378054601553e-05, "loss": 2.6032, "step": 29270 }, { "epoch": 0.38, "learning_rate": 6.853430195758705e-05, "loss": 2.5795, "step": 29275 }, { "epoch": 0.38, "learning_rate": 6.852482259691627e-05, "loss": 2.6485, "step": 29280 }, { "epoch": 0.38, "learning_rate": 6.851534246439814e-05, "loss": 2.5067, "step": 29285 }, { "epoch": 0.38, "learning_rate": 6.850586156042765e-05, "loss": 2.6082, "step": 29290 }, { "epoch": 0.38, "learning_rate": 6.849637988539986e-05, "loss": 2.5888, "step": 29295 }, { "epoch": 0.38, "learning_rate": 6.848689743970982e-05, "loss": 2.5192, "step": 29300 }, { "epoch": 0.38, "learning_rate": 6.847741422375262e-05, "loss": 2.68, "step": 29305 }, { "epoch": 0.38, "learning_rate": 6.846793023792333e-05, "loss": 2.66, "step": 29310 }, { "epoch": 0.38, "learning_rate": 6.84584454826172e-05, "loss": 2.5809, "step": 29315 }, { "epoch": 0.38, "learning_rate": 6.844895995822934e-05, "loss": 2.6633, "step": 29320 }, { "epoch": 0.38, "learning_rate": 6.843947366515502e-05, "loss": 2.5789, "step": 29325 }, { "epoch": 0.38, "learning_rate": 6.842998660378946e-05, "loss": 2.7133, "step": 29330 }, { "epoch": 0.38, "learning_rate": 6.842049877452796e-05, "loss": 2.6254, "step": 29335 }, { "epoch": 0.38, "learning_rate": 6.841101017776584e-05, "loss": 2.6604, "step": 29340 }, { "epoch": 0.38, "learning_rate": 6.840152081389841e-05, "loss": 2.62, "step": 29345 }, { "epoch": 0.38, "learning_rate": 6.83920306833211e-05, "loss": 2.4949, "step": 29350 }, { "epoch": 0.38, "learning_rate": 6.83825397864293e-05, "loss": 2.5966, "step": 29355 }, { "epoch": 0.38, "learning_rate": 6.837304812361846e-05, "loss": 2.5939, "step": 29360 }, { "epoch": 0.38, "learning_rate": 6.836355569528403e-05, "loss": 2.5494, "step": 29365 }, { "epoch": 0.38, "learning_rate": 6.835406250182155e-05, "loss": 2.5342, "step": 29370 }, { "epoch": 0.38, "learning_rate": 6.834456854362655e-05, "loss": 2.5735, "step": 29375 }, { "epoch": 0.38, "learning_rate": 6.833507382109457e-05, "loss": 2.5542, "step": 29380 }, { "epoch": 0.38, "learning_rate": 6.832557833462128e-05, "loss": 2.5478, "step": 29385 }, { "epoch": 0.38, "learning_rate": 6.831608208460225e-05, "loss": 2.644, "step": 29390 }, { "epoch": 0.38, "learning_rate": 6.830658507143319e-05, "loss": 2.6332, "step": 29395 }, { "epoch": 0.38, "learning_rate": 6.829708729550977e-05, "loss": 2.6786, "step": 29400 }, { "epoch": 0.38, "learning_rate": 6.828758875722772e-05, "loss": 2.5449, "step": 29405 }, { "epoch": 0.38, "learning_rate": 6.827808945698284e-05, "loss": 2.5279, "step": 29410 }, { "epoch": 0.38, "learning_rate": 6.826858939517087e-05, "loss": 2.5601, "step": 29415 }, { "epoch": 0.38, "learning_rate": 6.825908857218768e-05, "loss": 2.7134, "step": 29420 }, { "epoch": 0.38, "learning_rate": 6.82495869884291e-05, "loss": 2.5279, "step": 29425 }, { "epoch": 0.38, "learning_rate": 6.824008464429103e-05, "loss": 2.5236, "step": 29430 }, { "epoch": 0.38, "learning_rate": 6.82305815401694e-05, "loss": 2.5943, "step": 29435 }, { "epoch": 0.38, "learning_rate": 6.822107767646014e-05, "loss": 2.567, "step": 29440 }, { "epoch": 0.38, "learning_rate": 6.821157305355924e-05, "loss": 2.6499, "step": 29445 }, { "epoch": 0.38, "learning_rate": 6.820206767186274e-05, "loss": 2.6378, "step": 29450 }, { "epoch": 0.38, "learning_rate": 6.819256153176666e-05, "loss": 2.6225, "step": 29455 }, { "epoch": 0.38, "learning_rate": 6.818305463366708e-05, "loss": 2.6383, "step": 29460 }, { "epoch": 0.38, "learning_rate": 6.817354697796012e-05, "loss": 2.715, "step": 29465 }, { "epoch": 0.38, "learning_rate": 6.816403856504193e-05, "loss": 2.6228, "step": 29470 }, { "epoch": 0.38, "learning_rate": 6.815452939530864e-05, "loss": 2.592, "step": 29475 }, { "epoch": 0.38, "learning_rate": 6.814501946915652e-05, "loss": 2.6702, "step": 29480 }, { "epoch": 0.38, "learning_rate": 6.813550878698177e-05, "loss": 2.5993, "step": 29485 }, { "epoch": 0.38, "learning_rate": 6.812599734918065e-05, "loss": 2.6147, "step": 29490 }, { "epoch": 0.38, "learning_rate": 6.811648515614948e-05, "loss": 2.5984, "step": 29495 }, { "epoch": 0.38, "learning_rate": 6.810697220828457e-05, "loss": 2.4701, "step": 29500 }, { "epoch": 0.38, "learning_rate": 6.809745850598231e-05, "loss": 2.59, "step": 29505 }, { "epoch": 0.38, "learning_rate": 6.808794404963907e-05, "loss": 2.684, "step": 29510 }, { "epoch": 0.38, "learning_rate": 6.807842883965128e-05, "loss": 2.6236, "step": 29515 }, { "epoch": 0.38, "learning_rate": 6.806891287641541e-05, "loss": 2.5391, "step": 29520 }, { "epoch": 0.38, "learning_rate": 6.805939616032795e-05, "loss": 2.5927, "step": 29525 }, { "epoch": 0.38, "learning_rate": 6.80498786917854e-05, "loss": 2.6326, "step": 29530 }, { "epoch": 0.38, "learning_rate": 6.804036047118431e-05, "loss": 2.6253, "step": 29535 }, { "epoch": 0.38, "learning_rate": 6.803084149892127e-05, "loss": 2.5654, "step": 29540 }, { "epoch": 0.38, "learning_rate": 6.80213217753929e-05, "loss": 2.6515, "step": 29545 }, { "epoch": 0.38, "learning_rate": 6.801180130099585e-05, "loss": 2.5074, "step": 29550 }, { "epoch": 0.38, "learning_rate": 6.800228007612676e-05, "loss": 2.5836, "step": 29555 }, { "epoch": 0.38, "learning_rate": 6.79927581011824e-05, "loss": 2.552, "step": 29560 }, { "epoch": 0.38, "learning_rate": 6.798323537655943e-05, "loss": 2.6407, "step": 29565 }, { "epoch": 0.38, "learning_rate": 6.797371190265467e-05, "loss": 2.5465, "step": 29570 }, { "epoch": 0.38, "learning_rate": 6.796418767986494e-05, "loss": 2.7176, "step": 29575 }, { "epoch": 0.38, "learning_rate": 6.795466270858702e-05, "loss": 2.5852, "step": 29580 }, { "epoch": 0.38, "learning_rate": 6.794513698921781e-05, "loss": 2.6368, "step": 29585 }, { "epoch": 0.38, "learning_rate": 6.793561052215419e-05, "loss": 2.6217, "step": 29590 }, { "epoch": 0.38, "learning_rate": 6.792608330779306e-05, "loss": 2.6291, "step": 29595 }, { "epoch": 0.38, "learning_rate": 6.791655534653143e-05, "loss": 2.6583, "step": 29600 }, { "epoch": 0.38, "learning_rate": 6.790702663876625e-05, "loss": 2.6435, "step": 29605 }, { "epoch": 0.38, "learning_rate": 6.789749718489458e-05, "loss": 2.6023, "step": 29610 }, { "epoch": 0.38, "learning_rate": 6.788796698531342e-05, "loss": 2.6146, "step": 29615 }, { "epoch": 0.38, "learning_rate": 6.787843604041988e-05, "loss": 2.6278, "step": 29620 }, { "epoch": 0.38, "learning_rate": 6.786890435061106e-05, "loss": 2.5813, "step": 29625 }, { "epoch": 0.38, "learning_rate": 6.785937191628411e-05, "loss": 2.5819, "step": 29630 }, { "epoch": 0.38, "learning_rate": 6.784983873783619e-05, "loss": 2.6978, "step": 29635 }, { "epoch": 0.38, "learning_rate": 6.784030481566454e-05, "loss": 2.5803, "step": 29640 }, { "epoch": 0.38, "learning_rate": 6.783077015016637e-05, "loss": 2.4767, "step": 29645 }, { "epoch": 0.38, "learning_rate": 6.782123474173895e-05, "loss": 2.6401, "step": 29650 }, { "epoch": 0.38, "learning_rate": 6.781169859077958e-05, "loss": 2.7644, "step": 29655 }, { "epoch": 0.38, "learning_rate": 6.780216169768558e-05, "loss": 2.6539, "step": 29660 }, { "epoch": 0.38, "learning_rate": 6.779262406285432e-05, "loss": 2.5588, "step": 29665 }, { "epoch": 0.39, "learning_rate": 6.77830856866832e-05, "loss": 2.4889, "step": 29670 }, { "epoch": 0.39, "learning_rate": 6.777354656956964e-05, "loss": 2.556, "step": 29675 }, { "epoch": 0.39, "learning_rate": 6.776400671191108e-05, "loss": 2.5333, "step": 29680 }, { "epoch": 0.39, "learning_rate": 6.7754466114105e-05, "loss": 2.7033, "step": 29685 }, { "epoch": 0.39, "learning_rate": 6.774492477654891e-05, "loss": 2.5485, "step": 29690 }, { "epoch": 0.39, "learning_rate": 6.773538269964038e-05, "loss": 2.6014, "step": 29695 }, { "epoch": 0.39, "learning_rate": 6.772583988377698e-05, "loss": 2.4726, "step": 29700 }, { "epoch": 0.39, "learning_rate": 6.771629632935632e-05, "loss": 2.6693, "step": 29705 }, { "epoch": 0.39, "learning_rate": 6.770675203677602e-05, "loss": 2.5198, "step": 29710 }, { "epoch": 0.39, "learning_rate": 6.769720700643376e-05, "loss": 2.5527, "step": 29715 }, { "epoch": 0.39, "learning_rate": 6.768766123872723e-05, "loss": 2.6427, "step": 29720 }, { "epoch": 0.39, "learning_rate": 6.767811473405418e-05, "loss": 2.6368, "step": 29725 }, { "epoch": 0.39, "learning_rate": 6.766856749281233e-05, "loss": 2.6783, "step": 29730 }, { "epoch": 0.39, "learning_rate": 6.765901951539952e-05, "loss": 2.6501, "step": 29735 }, { "epoch": 0.39, "learning_rate": 6.764947080221356e-05, "loss": 2.5831, "step": 29740 }, { "epoch": 0.39, "learning_rate": 6.763992135365227e-05, "loss": 2.6572, "step": 29745 }, { "epoch": 0.39, "learning_rate": 6.763037117011357e-05, "loss": 2.7198, "step": 29750 }, { "epoch": 0.39, "learning_rate": 6.762082025199536e-05, "loss": 2.6353, "step": 29755 }, { "epoch": 0.39, "learning_rate": 6.761126859969557e-05, "loss": 2.602, "step": 29760 }, { "epoch": 0.39, "learning_rate": 6.760171621361221e-05, "loss": 2.6175, "step": 29765 }, { "epoch": 0.39, "learning_rate": 6.759216309414325e-05, "loss": 2.5447, "step": 29770 }, { "epoch": 0.39, "learning_rate": 6.758260924168675e-05, "loss": 2.5714, "step": 29775 }, { "epoch": 0.39, "learning_rate": 6.757305465664077e-05, "loss": 2.5167, "step": 29780 }, { "epoch": 0.39, "learning_rate": 6.756349933940341e-05, "loss": 2.5725, "step": 29785 }, { "epoch": 0.39, "learning_rate": 6.755394329037277e-05, "loss": 2.6823, "step": 29790 }, { "epoch": 0.39, "learning_rate": 6.754438650994704e-05, "loss": 2.5548, "step": 29795 }, { "epoch": 0.39, "learning_rate": 6.753482899852442e-05, "loss": 2.6547, "step": 29800 }, { "epoch": 0.39, "learning_rate": 6.752527075650309e-05, "loss": 2.6297, "step": 29805 }, { "epoch": 0.39, "learning_rate": 6.751571178428132e-05, "loss": 2.6843, "step": 29810 }, { "epoch": 0.39, "learning_rate": 6.750615208225739e-05, "loss": 2.503, "step": 29815 }, { "epoch": 0.39, "learning_rate": 6.749659165082961e-05, "loss": 2.5477, "step": 29820 }, { "epoch": 0.39, "learning_rate": 6.748703049039633e-05, "loss": 2.6967, "step": 29825 }, { "epoch": 0.39, "learning_rate": 6.747746860135591e-05, "loss": 2.6173, "step": 29830 }, { "epoch": 0.39, "learning_rate": 6.746790598410676e-05, "loss": 2.7481, "step": 29835 }, { "epoch": 0.39, "learning_rate": 6.745834263904729e-05, "loss": 2.5399, "step": 29840 }, { "epoch": 0.39, "learning_rate": 6.744877856657596e-05, "loss": 2.6622, "step": 29845 }, { "epoch": 0.39, "learning_rate": 6.743921376709131e-05, "loss": 2.593, "step": 29850 }, { "epoch": 0.39, "learning_rate": 6.742964824099182e-05, "loss": 2.5521, "step": 29855 }, { "epoch": 0.39, "learning_rate": 6.742008198867606e-05, "loss": 2.5224, "step": 29860 }, { "epoch": 0.39, "learning_rate": 6.74105150105426e-05, "loss": 2.5709, "step": 29865 }, { "epoch": 0.39, "learning_rate": 6.740094730699009e-05, "loss": 2.6833, "step": 29870 }, { "epoch": 0.39, "learning_rate": 6.739137887841712e-05, "loss": 2.6508, "step": 29875 }, { "epoch": 0.39, "learning_rate": 6.73818097252224e-05, "loss": 2.4601, "step": 29880 }, { "epoch": 0.39, "learning_rate": 6.737223984780461e-05, "loss": 2.5686, "step": 29885 }, { "epoch": 0.39, "learning_rate": 6.736266924656253e-05, "loss": 2.6427, "step": 29890 }, { "epoch": 0.39, "learning_rate": 6.735309792189488e-05, "loss": 2.7488, "step": 29895 }, { "epoch": 0.39, "learning_rate": 6.734352587420046e-05, "loss": 2.5769, "step": 29900 }, { "epoch": 0.39, "learning_rate": 6.733395310387812e-05, "loss": 2.6249, "step": 29905 }, { "epoch": 0.39, "learning_rate": 6.732437961132669e-05, "loss": 2.6055, "step": 29910 }, { "epoch": 0.39, "learning_rate": 6.731480539694504e-05, "loss": 2.4335, "step": 29915 }, { "epoch": 0.39, "learning_rate": 6.730523046113215e-05, "loss": 2.5737, "step": 29920 }, { "epoch": 0.39, "learning_rate": 6.72956548042869e-05, "loss": 2.6337, "step": 29925 }, { "epoch": 0.39, "learning_rate": 6.72860784268083e-05, "loss": 2.5635, "step": 29930 }, { "epoch": 0.39, "learning_rate": 6.727650132909533e-05, "loss": 2.4933, "step": 29935 }, { "epoch": 0.39, "learning_rate": 6.726692351154704e-05, "loss": 2.6016, "step": 29940 }, { "epoch": 0.39, "learning_rate": 6.72573449745625e-05, "loss": 2.6734, "step": 29945 }, { "epoch": 0.39, "learning_rate": 6.724776571854081e-05, "loss": 2.5964, "step": 29950 }, { "epoch": 0.39, "learning_rate": 6.723818574388107e-05, "loss": 2.7498, "step": 29955 }, { "epoch": 0.39, "learning_rate": 6.722860505098248e-05, "loss": 2.4434, "step": 29960 }, { "epoch": 0.39, "learning_rate": 6.721902364024416e-05, "loss": 2.6383, "step": 29965 }, { "epoch": 0.39, "learning_rate": 6.720944151206538e-05, "loss": 2.6065, "step": 29970 }, { "epoch": 0.39, "learning_rate": 6.719985866684535e-05, "loss": 2.6353, "step": 29975 }, { "epoch": 0.39, "learning_rate": 6.719027510498338e-05, "loss": 2.6086, "step": 29980 }, { "epoch": 0.39, "learning_rate": 6.718069082687874e-05, "loss": 2.5116, "step": 29985 }, { "epoch": 0.39, "learning_rate": 6.71711058329308e-05, "loss": 2.6012, "step": 29990 }, { "epoch": 0.39, "learning_rate": 6.716152012353887e-05, "loss": 2.6804, "step": 29995 }, { "epoch": 0.39, "learning_rate": 6.71519336991024e-05, "loss": 2.5024, "step": 30000 }, { "epoch": 0.39, "learning_rate": 6.714234656002078e-05, "loss": 2.5912, "step": 30005 }, { "epoch": 0.39, "learning_rate": 6.71327587066935e-05, "loss": 2.5421, "step": 30010 }, { "epoch": 0.39, "learning_rate": 6.712317013951999e-05, "loss": 2.4325, "step": 30015 }, { "epoch": 0.39, "learning_rate": 6.71135808588998e-05, "loss": 2.6092, "step": 30020 }, { "epoch": 0.39, "learning_rate": 6.710399086523246e-05, "loss": 2.5345, "step": 30025 }, { "epoch": 0.39, "learning_rate": 6.709440015891755e-05, "loss": 2.677, "step": 30030 }, { "epoch": 0.39, "learning_rate": 6.708480874035467e-05, "loss": 2.6486, "step": 30035 }, { "epoch": 0.39, "learning_rate": 6.707521660994346e-05, "loss": 2.6602, "step": 30040 }, { "epoch": 0.39, "learning_rate": 6.706562376808357e-05, "loss": 2.5292, "step": 30045 }, { "epoch": 0.39, "learning_rate": 6.705603021517469e-05, "loss": 2.6855, "step": 30050 }, { "epoch": 0.39, "learning_rate": 6.704643595161654e-05, "loss": 2.6011, "step": 30055 }, { "epoch": 0.39, "learning_rate": 6.703684097780886e-05, "loss": 2.409, "step": 30060 }, { "epoch": 0.39, "learning_rate": 6.702724529415148e-05, "loss": 2.7107, "step": 30065 }, { "epoch": 0.39, "learning_rate": 6.701764890104416e-05, "loss": 2.6929, "step": 30070 }, { "epoch": 0.39, "learning_rate": 6.700805179888675e-05, "loss": 2.574, "step": 30075 }, { "epoch": 0.39, "learning_rate": 6.699845398807913e-05, "loss": 2.644, "step": 30080 }, { "epoch": 0.39, "learning_rate": 6.69888554690212e-05, "loss": 2.5192, "step": 30085 }, { "epoch": 0.39, "learning_rate": 6.697925624211285e-05, "loss": 2.5668, "step": 30090 }, { "epoch": 0.39, "learning_rate": 6.696965630775409e-05, "loss": 2.617, "step": 30095 }, { "epoch": 0.39, "learning_rate": 6.696005566634487e-05, "loss": 2.6278, "step": 30100 }, { "epoch": 0.39, "learning_rate": 6.695045431828524e-05, "loss": 2.4321, "step": 30105 }, { "epoch": 0.39, "learning_rate": 6.69408522639752e-05, "loss": 2.5716, "step": 30110 }, { "epoch": 0.39, "learning_rate": 6.693124950381488e-05, "loss": 2.5244, "step": 30115 }, { "epoch": 0.39, "learning_rate": 6.692164603820432e-05, "loss": 2.5486, "step": 30120 }, { "epoch": 0.39, "learning_rate": 6.69120418675437e-05, "loss": 2.6993, "step": 30125 }, { "epoch": 0.39, "learning_rate": 6.690243699223319e-05, "loss": 2.5514, "step": 30130 }, { "epoch": 0.39, "learning_rate": 6.689283141267294e-05, "loss": 2.6222, "step": 30135 }, { "epoch": 0.39, "learning_rate": 6.688322512926322e-05, "loss": 2.6768, "step": 30140 }, { "epoch": 0.39, "learning_rate": 6.687361814240424e-05, "loss": 2.5844, "step": 30145 }, { "epoch": 0.39, "learning_rate": 6.68640104524963e-05, "loss": 2.6809, "step": 30150 }, { "epoch": 0.39, "learning_rate": 6.685440205993971e-05, "loss": 2.6136, "step": 30155 }, { "epoch": 0.39, "learning_rate": 6.684479296513481e-05, "loss": 2.7323, "step": 30160 }, { "epoch": 0.39, "learning_rate": 6.683518316848199e-05, "loss": 2.591, "step": 30165 }, { "epoch": 0.39, "learning_rate": 6.682557267038159e-05, "loss": 2.6641, "step": 30170 }, { "epoch": 0.39, "learning_rate": 6.681596147123408e-05, "loss": 2.604, "step": 30175 }, { "epoch": 0.39, "learning_rate": 6.68063495714399e-05, "loss": 2.7022, "step": 30180 }, { "epoch": 0.39, "learning_rate": 6.679673697139954e-05, "loss": 2.6217, "step": 30185 }, { "epoch": 0.39, "learning_rate": 6.678712367151352e-05, "loss": 2.6923, "step": 30190 }, { "epoch": 0.39, "learning_rate": 6.677750967218239e-05, "loss": 2.7344, "step": 30195 }, { "epoch": 0.39, "learning_rate": 6.676789497380671e-05, "loss": 2.6341, "step": 30200 }, { "epoch": 0.39, "learning_rate": 6.675827957678708e-05, "loss": 2.6373, "step": 30205 }, { "epoch": 0.39, "learning_rate": 6.674866348152413e-05, "loss": 2.6155, "step": 30210 }, { "epoch": 0.39, "learning_rate": 6.673904668841854e-05, "loss": 2.7253, "step": 30215 }, { "epoch": 0.39, "learning_rate": 6.672942919787097e-05, "loss": 2.6057, "step": 30220 }, { "epoch": 0.39, "learning_rate": 6.671981101028217e-05, "loss": 2.5625, "step": 30225 }, { "epoch": 0.39, "learning_rate": 6.671019212605286e-05, "loss": 2.5826, "step": 30230 }, { "epoch": 0.39, "learning_rate": 6.670057254558383e-05, "loss": 2.6272, "step": 30235 }, { "epoch": 0.39, "learning_rate": 6.669095226927587e-05, "loss": 2.4932, "step": 30240 }, { "epoch": 0.39, "learning_rate": 6.668133129752985e-05, "loss": 2.6465, "step": 30245 }, { "epoch": 0.39, "learning_rate": 6.667170963074659e-05, "loss": 2.5657, "step": 30250 }, { "epoch": 0.39, "learning_rate": 6.666208726932703e-05, "loss": 2.655, "step": 30255 }, { "epoch": 0.39, "learning_rate": 6.665246421367204e-05, "loss": 2.6231, "step": 30260 }, { "epoch": 0.39, "learning_rate": 6.664284046418259e-05, "loss": 2.5701, "step": 30265 }, { "epoch": 0.39, "learning_rate": 6.663321602125967e-05, "loss": 2.7266, "step": 30270 }, { "epoch": 0.39, "learning_rate": 6.662359088530427e-05, "loss": 2.6583, "step": 30275 }, { "epoch": 0.39, "learning_rate": 6.661396505671745e-05, "loss": 2.5399, "step": 30280 }, { "epoch": 0.39, "learning_rate": 6.660433853590026e-05, "loss": 2.564, "step": 30285 }, { "epoch": 0.39, "learning_rate": 6.65947113232538e-05, "loss": 2.6203, "step": 30290 }, { "epoch": 0.39, "learning_rate": 6.658508341917917e-05, "loss": 2.6833, "step": 30295 }, { "epoch": 0.39, "learning_rate": 6.657545482407756e-05, "loss": 2.6674, "step": 30300 }, { "epoch": 0.39, "learning_rate": 6.656582553835013e-05, "loss": 2.6348, "step": 30305 }, { "epoch": 0.39, "learning_rate": 6.655619556239811e-05, "loss": 2.6415, "step": 30310 }, { "epoch": 0.39, "learning_rate": 6.654656489662271e-05, "loss": 2.5772, "step": 30315 }, { "epoch": 0.39, "learning_rate": 6.653693354142521e-05, "loss": 2.4975, "step": 30320 }, { "epoch": 0.39, "learning_rate": 6.65273014972069e-05, "loss": 2.6206, "step": 30325 }, { "epoch": 0.39, "learning_rate": 6.65176687643691e-05, "loss": 2.5885, "step": 30330 }, { "epoch": 0.39, "learning_rate": 6.650803534331319e-05, "loss": 2.5444, "step": 30335 }, { "epoch": 0.39, "learning_rate": 6.649840123444053e-05, "loss": 2.6364, "step": 30340 }, { "epoch": 0.39, "learning_rate": 6.648876643815255e-05, "loss": 2.5845, "step": 30345 }, { "epoch": 0.39, "learning_rate": 6.647913095485065e-05, "loss": 2.6936, "step": 30350 }, { "epoch": 0.39, "learning_rate": 6.646949478493633e-05, "loss": 2.5056, "step": 30355 }, { "epoch": 0.39, "learning_rate": 6.645985792881109e-05, "loss": 2.6465, "step": 30360 }, { "epoch": 0.39, "learning_rate": 6.645022038687642e-05, "loss": 2.627, "step": 30365 }, { "epoch": 0.39, "learning_rate": 6.644058215953393e-05, "loss": 2.6297, "step": 30370 }, { "epoch": 0.39, "learning_rate": 6.643094324718517e-05, "loss": 2.5375, "step": 30375 }, { "epoch": 0.39, "learning_rate": 6.642130365023174e-05, "loss": 2.6001, "step": 30380 }, { "epoch": 0.39, "learning_rate": 6.641166336907529e-05, "loss": 2.6071, "step": 30385 }, { "epoch": 0.39, "learning_rate": 6.640202240411747e-05, "loss": 2.7004, "step": 30390 }, { "epoch": 0.39, "learning_rate": 6.639238075576001e-05, "loss": 2.5182, "step": 30395 }, { "epoch": 0.39, "learning_rate": 6.638273842440462e-05, "loss": 2.5968, "step": 30400 }, { "epoch": 0.39, "learning_rate": 6.637309541045305e-05, "loss": 2.4705, "step": 30405 }, { "epoch": 0.39, "learning_rate": 6.63634517143071e-05, "loss": 2.5214, "step": 30410 }, { "epoch": 0.39, "learning_rate": 6.635380733636855e-05, "loss": 2.4652, "step": 30415 }, { "epoch": 0.39, "learning_rate": 6.634416227703926e-05, "loss": 2.5372, "step": 30420 }, { "epoch": 0.39, "learning_rate": 6.633451653672108e-05, "loss": 2.5718, "step": 30425 }, { "epoch": 0.39, "learning_rate": 6.632487011581592e-05, "loss": 2.5614, "step": 30430 }, { "epoch": 0.39, "learning_rate": 6.63152230147257e-05, "loss": 2.6838, "step": 30435 }, { "epoch": 0.4, "learning_rate": 6.630557523385238e-05, "loss": 2.5803, "step": 30440 }, { "epoch": 0.4, "learning_rate": 6.629592677359793e-05, "loss": 2.6366, "step": 30445 }, { "epoch": 0.4, "learning_rate": 6.628627763436436e-05, "loss": 2.6939, "step": 30450 }, { "epoch": 0.4, "learning_rate": 6.627662781655368e-05, "loss": 2.5946, "step": 30455 }, { "epoch": 0.4, "learning_rate": 6.6266977320568e-05, "loss": 2.5841, "step": 30460 }, { "epoch": 0.4, "learning_rate": 6.62573261468094e-05, "loss": 2.6686, "step": 30465 }, { "epoch": 0.4, "learning_rate": 6.624767429568e-05, "loss": 2.7153, "step": 30470 }, { "epoch": 0.4, "learning_rate": 6.623802176758194e-05, "loss": 2.7261, "step": 30475 }, { "epoch": 0.4, "learning_rate": 6.622836856291743e-05, "loss": 2.5207, "step": 30480 }, { "epoch": 0.4, "learning_rate": 6.621871468208861e-05, "loss": 2.5577, "step": 30485 }, { "epoch": 0.4, "learning_rate": 6.620906012549776e-05, "loss": 2.5609, "step": 30490 }, { "epoch": 0.4, "learning_rate": 6.619940489354716e-05, "loss": 2.5602, "step": 30495 }, { "epoch": 0.4, "learning_rate": 6.61897489866391e-05, "loss": 2.5126, "step": 30500 }, { "epoch": 0.4, "learning_rate": 6.618009240517584e-05, "loss": 2.5045, "step": 30505 }, { "epoch": 0.4, "learning_rate": 6.617043514955979e-05, "loss": 2.5982, "step": 30510 }, { "epoch": 0.4, "learning_rate": 6.616077722019326e-05, "loss": 2.5643, "step": 30515 }, { "epoch": 0.4, "learning_rate": 6.615111861747872e-05, "loss": 2.6885, "step": 30520 }, { "epoch": 0.4, "learning_rate": 6.614145934181859e-05, "loss": 2.5757, "step": 30525 }, { "epoch": 0.4, "learning_rate": 6.613179939361529e-05, "loss": 2.6474, "step": 30530 }, { "epoch": 0.4, "learning_rate": 6.612213877327135e-05, "loss": 2.5827, "step": 30535 }, { "epoch": 0.4, "learning_rate": 6.611247748118926e-05, "loss": 2.6614, "step": 30540 }, { "epoch": 0.4, "learning_rate": 6.610281551777156e-05, "loss": 2.6452, "step": 30545 }, { "epoch": 0.4, "learning_rate": 6.609315288342084e-05, "loss": 2.6219, "step": 30550 }, { "epoch": 0.4, "learning_rate": 6.608348957853968e-05, "loss": 2.5348, "step": 30555 }, { "epoch": 0.4, "learning_rate": 6.607382560353072e-05, "loss": 2.6081, "step": 30560 }, { "epoch": 0.4, "learning_rate": 6.606416095879663e-05, "loss": 2.5417, "step": 30565 }, { "epoch": 0.4, "learning_rate": 6.605449564474007e-05, "loss": 2.4033, "step": 30570 }, { "epoch": 0.4, "learning_rate": 6.604482966176375e-05, "loss": 2.5909, "step": 30575 }, { "epoch": 0.4, "learning_rate": 6.60351630102704e-05, "loss": 2.5006, "step": 30580 }, { "epoch": 0.4, "learning_rate": 6.602549569066282e-05, "loss": 2.6323, "step": 30585 }, { "epoch": 0.4, "learning_rate": 6.601582770334378e-05, "loss": 2.5353, "step": 30590 }, { "epoch": 0.4, "learning_rate": 6.600615904871612e-05, "loss": 2.6683, "step": 30595 }, { "epoch": 0.4, "learning_rate": 6.599648972718266e-05, "loss": 2.6029, "step": 30600 }, { "epoch": 0.4, "learning_rate": 6.598681973914632e-05, "loss": 2.5037, "step": 30605 }, { "epoch": 0.4, "learning_rate": 6.597714908500996e-05, "loss": 2.6133, "step": 30610 }, { "epoch": 0.4, "learning_rate": 6.596747776517653e-05, "loss": 2.6345, "step": 30615 }, { "epoch": 0.4, "learning_rate": 6.595780578004901e-05, "loss": 2.6454, "step": 30620 }, { "epoch": 0.4, "learning_rate": 6.594813313003038e-05, "loss": 2.7322, "step": 30625 }, { "epoch": 0.4, "learning_rate": 6.593845981552365e-05, "loss": 2.5043, "step": 30630 }, { "epoch": 0.4, "learning_rate": 6.592878583693185e-05, "loss": 2.5599, "step": 30635 }, { "epoch": 0.4, "learning_rate": 6.591911119465807e-05, "loss": 2.6978, "step": 30640 }, { "epoch": 0.4, "learning_rate": 6.59094358891054e-05, "loss": 2.7228, "step": 30645 }, { "epoch": 0.4, "learning_rate": 6.589975992067699e-05, "loss": 2.6618, "step": 30650 }, { "epoch": 0.4, "learning_rate": 6.589008328977599e-05, "loss": 2.51, "step": 30655 }, { "epoch": 0.4, "learning_rate": 6.588040599680556e-05, "loss": 2.4937, "step": 30660 }, { "epoch": 0.4, "learning_rate": 6.587072804216891e-05, "loss": 2.6768, "step": 30665 }, { "epoch": 0.4, "learning_rate": 6.58610494262693e-05, "loss": 2.6657, "step": 30670 }, { "epoch": 0.4, "learning_rate": 6.585137014950998e-05, "loss": 2.6596, "step": 30675 }, { "epoch": 0.4, "learning_rate": 6.584169021229424e-05, "loss": 2.5329, "step": 30680 }, { "epoch": 0.4, "learning_rate": 6.583200961502541e-05, "loss": 2.5413, "step": 30685 }, { "epoch": 0.4, "learning_rate": 6.582232835810684e-05, "loss": 2.5272, "step": 30690 }, { "epoch": 0.4, "learning_rate": 6.58126464419419e-05, "loss": 2.5122, "step": 30695 }, { "epoch": 0.4, "learning_rate": 6.580296386693399e-05, "loss": 2.6026, "step": 30700 }, { "epoch": 0.4, "learning_rate": 6.579328063348653e-05, "loss": 2.5973, "step": 30705 }, { "epoch": 0.4, "learning_rate": 6.5783596742003e-05, "loss": 2.5878, "step": 30710 }, { "epoch": 0.4, "learning_rate": 6.577391219288687e-05, "loss": 2.6547, "step": 30715 }, { "epoch": 0.4, "learning_rate": 6.576422698654167e-05, "loss": 2.5321, "step": 30720 }, { "epoch": 0.4, "learning_rate": 6.575454112337092e-05, "loss": 2.5838, "step": 30725 }, { "epoch": 0.4, "learning_rate": 6.574485460377818e-05, "loss": 2.5591, "step": 30730 }, { "epoch": 0.4, "learning_rate": 6.573516742816707e-05, "loss": 2.6444, "step": 30735 }, { "epoch": 0.4, "learning_rate": 6.572547959694118e-05, "loss": 2.5683, "step": 30740 }, { "epoch": 0.4, "learning_rate": 6.57157911105042e-05, "loss": 2.5798, "step": 30745 }, { "epoch": 0.4, "learning_rate": 6.570610196925977e-05, "loss": 2.7063, "step": 30750 }, { "epoch": 0.4, "learning_rate": 6.569641217361162e-05, "loss": 2.7063, "step": 30755 }, { "epoch": 0.4, "learning_rate": 6.568672172396348e-05, "loss": 2.4773, "step": 30760 }, { "epoch": 0.4, "learning_rate": 6.567703062071907e-05, "loss": 2.6165, "step": 30765 }, { "epoch": 0.4, "learning_rate": 6.566733886428222e-05, "loss": 2.6022, "step": 30770 }, { "epoch": 0.4, "learning_rate": 6.56576464550567e-05, "loss": 2.6792, "step": 30775 }, { "epoch": 0.4, "learning_rate": 6.56479533934464e-05, "loss": 2.5071, "step": 30780 }, { "epoch": 0.4, "learning_rate": 6.563825967985517e-05, "loss": 2.5988, "step": 30785 }, { "epoch": 0.4, "learning_rate": 6.562856531468688e-05, "loss": 2.6551, "step": 30790 }, { "epoch": 0.4, "learning_rate": 6.561887029834547e-05, "loss": 2.611, "step": 30795 }, { "epoch": 0.4, "learning_rate": 6.560917463123488e-05, "loss": 2.644, "step": 30800 }, { "epoch": 0.4, "learning_rate": 6.55994783137591e-05, "loss": 2.5953, "step": 30805 }, { "epoch": 0.4, "learning_rate": 6.558978134632213e-05, "loss": 2.523, "step": 30810 }, { "epoch": 0.4, "learning_rate": 6.558008372932797e-05, "loss": 2.7034, "step": 30815 }, { "epoch": 0.4, "learning_rate": 6.557038546318073e-05, "loss": 2.5548, "step": 30820 }, { "epoch": 0.4, "learning_rate": 6.556068654828444e-05, "loss": 2.6058, "step": 30825 }, { "epoch": 0.4, "learning_rate": 6.555098698504325e-05, "loss": 2.4926, "step": 30830 }, { "epoch": 0.4, "learning_rate": 6.554128677386126e-05, "loss": 2.5418, "step": 30835 }, { "epoch": 0.4, "learning_rate": 6.553158591514268e-05, "loss": 2.6584, "step": 30840 }, { "epoch": 0.4, "learning_rate": 6.552188440929168e-05, "loss": 2.7702, "step": 30845 }, { "epoch": 0.4, "learning_rate": 6.551218225671247e-05, "loss": 2.3814, "step": 30850 }, { "epoch": 0.4, "learning_rate": 6.550247945780931e-05, "loss": 2.6875, "step": 30855 }, { "epoch": 0.4, "learning_rate": 6.549277601298647e-05, "loss": 2.6306, "step": 30860 }, { "epoch": 0.4, "learning_rate": 6.548307192264824e-05, "loss": 2.4986, "step": 30865 }, { "epoch": 0.4, "learning_rate": 6.547336718719894e-05, "loss": 2.7016, "step": 30870 }, { "epoch": 0.4, "learning_rate": 6.546366180704296e-05, "loss": 2.5977, "step": 30875 }, { "epoch": 0.4, "learning_rate": 6.545395578258464e-05, "loss": 2.3862, "step": 30880 }, { "epoch": 0.4, "learning_rate": 6.544424911422841e-05, "loss": 2.4839, "step": 30885 }, { "epoch": 0.4, "learning_rate": 6.543454180237869e-05, "loss": 2.5764, "step": 30890 }, { "epoch": 0.4, "learning_rate": 6.542483384743996e-05, "loss": 2.6196, "step": 30895 }, { "epoch": 0.4, "learning_rate": 6.541512524981667e-05, "loss": 2.634, "step": 30900 }, { "epoch": 0.4, "learning_rate": 6.54054160099134e-05, "loss": 2.6465, "step": 30905 }, { "epoch": 0.4, "learning_rate": 6.539570612813462e-05, "loss": 2.5593, "step": 30910 }, { "epoch": 0.4, "learning_rate": 6.538599560488494e-05, "loss": 2.4729, "step": 30915 }, { "epoch": 0.4, "learning_rate": 6.537628444056894e-05, "loss": 2.6669, "step": 30920 }, { "epoch": 0.4, "learning_rate": 6.536657263559125e-05, "loss": 2.5313, "step": 30925 }, { "epoch": 0.4, "learning_rate": 6.53568601903565e-05, "loss": 2.712, "step": 30930 }, { "epoch": 0.4, "learning_rate": 6.53471471052694e-05, "loss": 2.5761, "step": 30935 }, { "epoch": 0.4, "learning_rate": 6.533743338073461e-05, "loss": 2.4807, "step": 30940 }, { "epoch": 0.4, "learning_rate": 6.532771901715688e-05, "loss": 2.6327, "step": 30945 }, { "epoch": 0.4, "learning_rate": 6.531800401494095e-05, "loss": 2.6521, "step": 30950 }, { "epoch": 0.4, "learning_rate": 6.530828837449164e-05, "loss": 2.5828, "step": 30955 }, { "epoch": 0.4, "learning_rate": 6.529857209621369e-05, "loss": 2.5807, "step": 30960 }, { "epoch": 0.4, "learning_rate": 6.528885518051199e-05, "loss": 2.5661, "step": 30965 }, { "epoch": 0.4, "learning_rate": 6.52791376277914e-05, "loss": 2.536, "step": 30970 }, { "epoch": 0.4, "learning_rate": 6.526941943845679e-05, "loss": 2.5646, "step": 30975 }, { "epoch": 0.4, "learning_rate": 6.525970061291306e-05, "loss": 2.6404, "step": 30980 }, { "epoch": 0.4, "learning_rate": 6.524998115156517e-05, "loss": 2.5024, "step": 30985 }, { "epoch": 0.4, "learning_rate": 6.52402610548181e-05, "loss": 2.6478, "step": 30990 }, { "epoch": 0.4, "learning_rate": 6.52305403230768e-05, "loss": 2.6608, "step": 30995 }, { "epoch": 0.4, "learning_rate": 6.522081895674633e-05, "loss": 2.5004, "step": 31000 }, { "epoch": 0.4, "learning_rate": 6.521109695623174e-05, "loss": 2.5404, "step": 31005 }, { "epoch": 0.4, "learning_rate": 6.520137432193804e-05, "loss": 2.6662, "step": 31010 }, { "epoch": 0.4, "learning_rate": 6.519165105427042e-05, "loss": 2.5923, "step": 31015 }, { "epoch": 0.4, "learning_rate": 6.518192715363394e-05, "loss": 2.5794, "step": 31020 }, { "epoch": 0.4, "learning_rate": 6.517220262043377e-05, "loss": 2.5782, "step": 31025 }, { "epoch": 0.4, "learning_rate": 6.51624774550751e-05, "loss": 2.6274, "step": 31030 }, { "epoch": 0.4, "learning_rate": 6.515275165796311e-05, "loss": 2.7306, "step": 31035 }, { "epoch": 0.4, "learning_rate": 6.514302522950307e-05, "loss": 2.5551, "step": 31040 }, { "epoch": 0.4, "learning_rate": 6.513329817010018e-05, "loss": 2.563, "step": 31045 }, { "epoch": 0.4, "learning_rate": 6.51235704801598e-05, "loss": 2.6488, "step": 31050 }, { "epoch": 0.4, "learning_rate": 6.511384216008716e-05, "loss": 2.673, "step": 31055 }, { "epoch": 0.4, "learning_rate": 6.510411321028764e-05, "loss": 2.5189, "step": 31060 }, { "epoch": 0.4, "learning_rate": 6.50943836311666e-05, "loss": 2.5441, "step": 31065 }, { "epoch": 0.4, "learning_rate": 6.508465342312942e-05, "loss": 2.613, "step": 31070 }, { "epoch": 0.4, "learning_rate": 6.507492258658152e-05, "loss": 2.6758, "step": 31075 }, { "epoch": 0.4, "learning_rate": 6.506519112192834e-05, "loss": 2.6128, "step": 31080 }, { "epoch": 0.4, "learning_rate": 6.505545902957534e-05, "loss": 2.6982, "step": 31085 }, { "epoch": 0.4, "learning_rate": 6.504572630992802e-05, "loss": 2.552, "step": 31090 }, { "epoch": 0.4, "learning_rate": 6.50359929633919e-05, "loss": 2.5883, "step": 31095 }, { "epoch": 0.4, "learning_rate": 6.502625899037252e-05, "loss": 2.5763, "step": 31100 }, { "epoch": 0.4, "learning_rate": 6.501652439127547e-05, "loss": 2.5418, "step": 31105 }, { "epoch": 0.4, "learning_rate": 6.500678916650632e-05, "loss": 2.6481, "step": 31110 }, { "epoch": 0.4, "learning_rate": 6.499705331647072e-05, "loss": 2.5196, "step": 31115 }, { "epoch": 0.4, "learning_rate": 6.498731684157429e-05, "loss": 2.6284, "step": 31120 }, { "epoch": 0.4, "learning_rate": 6.497757974222272e-05, "loss": 2.6287, "step": 31125 }, { "epoch": 0.4, "learning_rate": 6.496784201882172e-05, "loss": 2.633, "step": 31130 }, { "epoch": 0.4, "learning_rate": 6.495810367177701e-05, "loss": 2.5429, "step": 31135 }, { "epoch": 0.4, "learning_rate": 6.494836470149435e-05, "loss": 2.6738, "step": 31140 }, { "epoch": 0.4, "learning_rate": 6.493862510837951e-05, "loss": 2.6253, "step": 31145 }, { "epoch": 0.4, "learning_rate": 6.49288848928383e-05, "loss": 2.632, "step": 31150 }, { "epoch": 0.4, "learning_rate": 6.491914405527657e-05, "loss": 2.4182, "step": 31155 }, { "epoch": 0.4, "learning_rate": 6.490940259610015e-05, "loss": 2.7138, "step": 31160 }, { "epoch": 0.4, "learning_rate": 6.489966051571492e-05, "loss": 2.5583, "step": 31165 }, { "epoch": 0.4, "learning_rate": 6.488991781452682e-05, "loss": 2.5859, "step": 31170 }, { "epoch": 0.4, "learning_rate": 6.488017449294177e-05, "loss": 2.6224, "step": 31175 }, { "epoch": 0.4, "learning_rate": 6.487043055136573e-05, "loss": 2.5241, "step": 31180 }, { "epoch": 0.4, "learning_rate": 6.486068599020466e-05, "loss": 2.6713, "step": 31185 }, { "epoch": 0.4, "learning_rate": 6.485094080986463e-05, "loss": 2.5441, "step": 31190 }, { "epoch": 0.4, "learning_rate": 6.484119501075162e-05, "loss": 2.6112, "step": 31195 }, { "epoch": 0.4, "learning_rate": 6.483144859327174e-05, "loss": 2.7406, "step": 31200 }, { "epoch": 0.4, "learning_rate": 6.482170155783106e-05, "loss": 2.5435, "step": 31205 }, { "epoch": 0.41, "learning_rate": 6.48119539048357e-05, "loss": 2.6228, "step": 31210 }, { "epoch": 0.41, "learning_rate": 6.480220563469179e-05, "loss": 2.4851, "step": 31215 }, { "epoch": 0.41, "learning_rate": 6.479245674780552e-05, "loss": 2.5801, "step": 31220 }, { "epoch": 0.41, "learning_rate": 6.478270724458305e-05, "loss": 2.6319, "step": 31225 }, { "epoch": 0.41, "learning_rate": 6.477295712543064e-05, "loss": 2.7734, "step": 31230 }, { "epoch": 0.41, "learning_rate": 6.47632063907545e-05, "loss": 2.5877, "step": 31235 }, { "epoch": 0.41, "learning_rate": 6.475345504096092e-05, "loss": 2.5918, "step": 31240 }, { "epoch": 0.41, "learning_rate": 6.474370307645617e-05, "loss": 2.6093, "step": 31245 }, { "epoch": 0.41, "learning_rate": 6.47339504976466e-05, "loss": 2.6453, "step": 31250 }, { "epoch": 0.41, "learning_rate": 6.472419730493855e-05, "loss": 2.6443, "step": 31255 }, { "epoch": 0.41, "learning_rate": 6.47144434987384e-05, "loss": 2.6154, "step": 31260 }, { "epoch": 0.41, "learning_rate": 6.470468907945252e-05, "loss": 2.5892, "step": 31265 }, { "epoch": 0.41, "learning_rate": 6.469493404748736e-05, "loss": 2.5005, "step": 31270 }, { "epoch": 0.41, "learning_rate": 6.468517840324935e-05, "loss": 2.6054, "step": 31275 }, { "epoch": 0.41, "learning_rate": 6.467542214714497e-05, "loss": 2.5916, "step": 31280 }, { "epoch": 0.41, "learning_rate": 6.466566527958071e-05, "loss": 2.5344, "step": 31285 }, { "epoch": 0.41, "learning_rate": 6.465590780096313e-05, "loss": 2.569, "step": 31290 }, { "epoch": 0.41, "learning_rate": 6.464614971169877e-05, "loss": 2.609, "step": 31295 }, { "epoch": 0.41, "learning_rate": 6.463639101219418e-05, "loss": 2.6776, "step": 31300 }, { "epoch": 0.41, "learning_rate": 6.462663170285597e-05, "loss": 2.4703, "step": 31305 }, { "epoch": 0.41, "learning_rate": 6.461687178409078e-05, "loss": 2.5973, "step": 31310 }, { "epoch": 0.41, "learning_rate": 6.460711125630526e-05, "loss": 2.4652, "step": 31315 }, { "epoch": 0.41, "learning_rate": 6.459735011990608e-05, "loss": 2.671, "step": 31320 }, { "epoch": 0.41, "learning_rate": 6.458758837529996e-05, "loss": 2.4009, "step": 31325 }, { "epoch": 0.41, "learning_rate": 6.457782602289363e-05, "loss": 2.5622, "step": 31330 }, { "epoch": 0.41, "learning_rate": 6.456806306309382e-05, "loss": 2.6123, "step": 31335 }, { "epoch": 0.41, "learning_rate": 6.455829949630731e-05, "loss": 2.6287, "step": 31340 }, { "epoch": 0.41, "learning_rate": 6.454853532294092e-05, "loss": 2.543, "step": 31345 }, { "epoch": 0.41, "learning_rate": 6.453877054340148e-05, "loss": 2.7387, "step": 31350 }, { "epoch": 0.41, "learning_rate": 6.452900515809584e-05, "loss": 2.6433, "step": 31355 }, { "epoch": 0.41, "learning_rate": 6.451923916743087e-05, "loss": 2.4904, "step": 31360 }, { "epoch": 0.41, "learning_rate": 6.45094725718135e-05, "loss": 2.5707, "step": 31365 }, { "epoch": 0.41, "learning_rate": 6.449970537165064e-05, "loss": 2.6167, "step": 31370 }, { "epoch": 0.41, "learning_rate": 6.448993756734925e-05, "loss": 2.7305, "step": 31375 }, { "epoch": 0.41, "learning_rate": 6.448016915931632e-05, "loss": 2.5509, "step": 31380 }, { "epoch": 0.41, "learning_rate": 6.447040014795885e-05, "loss": 2.5433, "step": 31385 }, { "epoch": 0.41, "learning_rate": 6.446063053368388e-05, "loss": 2.6729, "step": 31390 }, { "epoch": 0.41, "learning_rate": 6.445086031689844e-05, "loss": 2.6254, "step": 31395 }, { "epoch": 0.41, "learning_rate": 6.444108949800965e-05, "loss": 2.6621, "step": 31400 }, { "epoch": 0.41, "learning_rate": 6.443131807742457e-05, "loss": 2.633, "step": 31405 }, { "epoch": 0.41, "learning_rate": 6.442154605555037e-05, "loss": 2.4845, "step": 31410 }, { "epoch": 0.41, "learning_rate": 6.441177343279421e-05, "loss": 2.4099, "step": 31415 }, { "epoch": 0.41, "learning_rate": 6.440200020956327e-05, "loss": 2.4738, "step": 31420 }, { "epoch": 0.41, "learning_rate": 6.439222638626472e-05, "loss": 2.6591, "step": 31425 }, { "epoch": 0.41, "learning_rate": 6.438245196330582e-05, "loss": 2.5445, "step": 31430 }, { "epoch": 0.41, "learning_rate": 6.437267694109382e-05, "loss": 2.5154, "step": 31435 }, { "epoch": 0.41, "learning_rate": 6.436290132003601e-05, "loss": 2.7138, "step": 31440 }, { "epoch": 0.41, "learning_rate": 6.43531251005397e-05, "loss": 2.5249, "step": 31445 }, { "epoch": 0.41, "learning_rate": 6.43433482830122e-05, "loss": 2.5167, "step": 31450 }, { "epoch": 0.41, "learning_rate": 6.43335708678609e-05, "loss": 2.6754, "step": 31455 }, { "epoch": 0.41, "learning_rate": 6.432379285549315e-05, "loss": 2.7297, "step": 31460 }, { "epoch": 0.41, "learning_rate": 6.431401424631637e-05, "loss": 2.5329, "step": 31465 }, { "epoch": 0.41, "learning_rate": 6.430423504073798e-05, "loss": 2.5563, "step": 31470 }, { "epoch": 0.41, "learning_rate": 6.429445523916546e-05, "loss": 2.5339, "step": 31475 }, { "epoch": 0.41, "learning_rate": 6.428467484200627e-05, "loss": 2.4595, "step": 31480 }, { "epoch": 0.41, "learning_rate": 6.427489384966794e-05, "loss": 2.4979, "step": 31485 }, { "epoch": 0.41, "learning_rate": 6.426511226255797e-05, "loss": 2.585, "step": 31490 }, { "epoch": 0.41, "learning_rate": 6.425533008108393e-05, "loss": 2.5646, "step": 31495 }, { "epoch": 0.41, "learning_rate": 6.42455473056534e-05, "loss": 2.6227, "step": 31500 }, { "epoch": 0.41, "learning_rate": 6.423576393667398e-05, "loss": 2.5446, "step": 31505 }, { "epoch": 0.41, "learning_rate": 6.42259799745533e-05, "loss": 2.7414, "step": 31510 }, { "epoch": 0.41, "learning_rate": 6.421619541969904e-05, "loss": 2.5522, "step": 31515 }, { "epoch": 0.41, "learning_rate": 6.420641027251885e-05, "loss": 2.6629, "step": 31520 }, { "epoch": 0.41, "learning_rate": 6.419662453342043e-05, "loss": 2.5875, "step": 31525 }, { "epoch": 0.41, "learning_rate": 6.418683820281153e-05, "loss": 2.6105, "step": 31530 }, { "epoch": 0.41, "learning_rate": 6.417705128109988e-05, "loss": 2.5017, "step": 31535 }, { "epoch": 0.41, "learning_rate": 6.416726376869329e-05, "loss": 2.5912, "step": 31540 }, { "epoch": 0.41, "learning_rate": 6.415747566599954e-05, "loss": 2.4852, "step": 31545 }, { "epoch": 0.41, "learning_rate": 6.414768697342646e-05, "loss": 2.5571, "step": 31550 }, { "epoch": 0.41, "learning_rate": 6.41378976913819e-05, "loss": 2.4957, "step": 31555 }, { "epoch": 0.41, "learning_rate": 6.412810782027373e-05, "loss": 2.6107, "step": 31560 }, { "epoch": 0.41, "learning_rate": 6.411831736050985e-05, "loss": 2.569, "step": 31565 }, { "epoch": 0.41, "learning_rate": 6.41085263124982e-05, "loss": 2.5005, "step": 31570 }, { "epoch": 0.41, "learning_rate": 6.409873467664673e-05, "loss": 2.5913, "step": 31575 }, { "epoch": 0.41, "learning_rate": 6.40889424533634e-05, "loss": 2.714, "step": 31580 }, { "epoch": 0.41, "learning_rate": 6.407914964305623e-05, "loss": 2.6626, "step": 31585 }, { "epoch": 0.41, "learning_rate": 6.406935624613322e-05, "loss": 2.5985, "step": 31590 }, { "epoch": 0.41, "learning_rate": 6.405956226300241e-05, "loss": 2.676, "step": 31595 }, { "epoch": 0.41, "learning_rate": 6.40497676940719e-05, "loss": 2.5371, "step": 31600 }, { "epoch": 0.41, "learning_rate": 6.403997253974977e-05, "loss": 2.5523, "step": 31605 }, { "epoch": 0.41, "learning_rate": 6.403017680044415e-05, "loss": 2.5477, "step": 31610 }, { "epoch": 0.41, "learning_rate": 6.402038047656319e-05, "loss": 2.6291, "step": 31615 }, { "epoch": 0.41, "learning_rate": 6.401058356851504e-05, "loss": 2.6566, "step": 31620 }, { "epoch": 0.41, "learning_rate": 6.40007860767079e-05, "loss": 2.697, "step": 31625 }, { "epoch": 0.41, "learning_rate": 6.399098800154997e-05, "loss": 2.742, "step": 31630 }, { "epoch": 0.41, "learning_rate": 6.398118934344955e-05, "loss": 2.6015, "step": 31635 }, { "epoch": 0.41, "learning_rate": 6.397139010281487e-05, "loss": 2.614, "step": 31640 }, { "epoch": 0.41, "learning_rate": 6.396159028005421e-05, "loss": 2.7171, "step": 31645 }, { "epoch": 0.41, "learning_rate": 6.39517898755759e-05, "loss": 2.5785, "step": 31650 }, { "epoch": 0.41, "learning_rate": 6.394198888978826e-05, "loss": 2.7244, "step": 31655 }, { "epoch": 0.41, "learning_rate": 6.393218732309967e-05, "loss": 2.5836, "step": 31660 }, { "epoch": 0.41, "learning_rate": 6.392238517591853e-05, "loss": 2.573, "step": 31665 }, { "epoch": 0.41, "learning_rate": 6.391258244865325e-05, "loss": 2.5075, "step": 31670 }, { "epoch": 0.41, "learning_rate": 6.390277914171226e-05, "loss": 2.5616, "step": 31675 }, { "epoch": 0.41, "learning_rate": 6.389297525550399e-05, "loss": 2.6692, "step": 31680 }, { "epoch": 0.41, "learning_rate": 6.388317079043695e-05, "loss": 2.6144, "step": 31685 }, { "epoch": 0.41, "learning_rate": 6.387336574691967e-05, "loss": 2.521, "step": 31690 }, { "epoch": 0.41, "learning_rate": 6.386356012536065e-05, "loss": 2.6141, "step": 31695 }, { "epoch": 0.41, "learning_rate": 6.385375392616847e-05, "loss": 2.5469, "step": 31700 }, { "epoch": 0.41, "learning_rate": 6.384394714975169e-05, "loss": 2.5443, "step": 31705 }, { "epoch": 0.41, "learning_rate": 6.383413979651894e-05, "loss": 2.5772, "step": 31710 }, { "epoch": 0.41, "learning_rate": 6.382433186687882e-05, "loss": 2.4806, "step": 31715 }, { "epoch": 0.41, "learning_rate": 6.381452336124e-05, "loss": 2.6489, "step": 31720 }, { "epoch": 0.41, "learning_rate": 6.380471428001113e-05, "loss": 2.5671, "step": 31725 }, { "epoch": 0.41, "learning_rate": 6.379490462360097e-05, "loss": 2.584, "step": 31730 }, { "epoch": 0.41, "learning_rate": 6.37850943924182e-05, "loss": 2.5778, "step": 31735 }, { "epoch": 0.41, "learning_rate": 6.377528358687159e-05, "loss": 2.5933, "step": 31740 }, { "epoch": 0.41, "learning_rate": 6.376547220736988e-05, "loss": 2.5503, "step": 31745 }, { "epoch": 0.41, "learning_rate": 6.37556602543219e-05, "loss": 2.5489, "step": 31750 }, { "epoch": 0.41, "learning_rate": 6.374584772813645e-05, "loss": 2.5244, "step": 31755 }, { "epoch": 0.41, "learning_rate": 6.37360346292224e-05, "loss": 2.5858, "step": 31760 }, { "epoch": 0.41, "learning_rate": 6.372622095798859e-05, "loss": 2.6071, "step": 31765 }, { "epoch": 0.41, "learning_rate": 6.371640671484393e-05, "loss": 2.5318, "step": 31770 }, { "epoch": 0.41, "learning_rate": 6.370659190019732e-05, "loss": 2.5982, "step": 31775 }, { "epoch": 0.41, "learning_rate": 6.369677651445771e-05, "loss": 2.5301, "step": 31780 }, { "epoch": 0.41, "learning_rate": 6.368696055803409e-05, "loss": 2.4283, "step": 31785 }, { "epoch": 0.41, "learning_rate": 6.367714403133538e-05, "loss": 2.4805, "step": 31790 }, { "epoch": 0.41, "learning_rate": 6.366732693477066e-05, "loss": 2.4763, "step": 31795 }, { "epoch": 0.41, "learning_rate": 6.365750926874893e-05, "loss": 2.5705, "step": 31800 }, { "epoch": 0.41, "learning_rate": 6.364769103367926e-05, "loss": 2.7109, "step": 31805 }, { "epoch": 0.41, "learning_rate": 6.363787222997073e-05, "loss": 2.5954, "step": 31810 }, { "epoch": 0.41, "learning_rate": 6.362805285803244e-05, "loss": 2.4723, "step": 31815 }, { "epoch": 0.41, "learning_rate": 6.361823291827351e-05, "loss": 2.6857, "step": 31820 }, { "epoch": 0.41, "learning_rate": 6.360841241110313e-05, "loss": 2.5483, "step": 31825 }, { "epoch": 0.41, "learning_rate": 6.359859133693045e-05, "loss": 2.5954, "step": 31830 }, { "epoch": 0.41, "learning_rate": 6.358876969616468e-05, "loss": 2.5086, "step": 31835 }, { "epoch": 0.41, "learning_rate": 6.357894748921502e-05, "loss": 2.6618, "step": 31840 }, { "epoch": 0.41, "learning_rate": 6.356912471649076e-05, "loss": 2.6394, "step": 31845 }, { "epoch": 0.41, "learning_rate": 6.355930137840114e-05, "loss": 2.5139, "step": 31850 }, { "epoch": 0.41, "learning_rate": 6.354947747535546e-05, "loss": 2.5899, "step": 31855 }, { "epoch": 0.41, "learning_rate": 6.353965300776305e-05, "loss": 2.4861, "step": 31860 }, { "epoch": 0.41, "learning_rate": 6.352982797603324e-05, "loss": 2.5684, "step": 31865 }, { "epoch": 0.41, "learning_rate": 6.35200023805754e-05, "loss": 2.5583, "step": 31870 }, { "epoch": 0.41, "learning_rate": 6.351017622179892e-05, "loss": 2.5661, "step": 31875 }, { "epoch": 0.41, "learning_rate": 6.350034950011322e-05, "loss": 2.5453, "step": 31880 }, { "epoch": 0.41, "learning_rate": 6.34905222159277e-05, "loss": 2.5698, "step": 31885 }, { "epoch": 0.41, "learning_rate": 6.348069436965187e-05, "loss": 2.5465, "step": 31890 }, { "epoch": 0.41, "learning_rate": 6.34708659616952e-05, "loss": 2.5896, "step": 31895 }, { "epoch": 0.41, "learning_rate": 6.346103699246718e-05, "loss": 2.4016, "step": 31900 }, { "epoch": 0.41, "learning_rate": 6.345120746237733e-05, "loss": 2.521, "step": 31905 }, { "epoch": 0.41, "learning_rate": 6.344137737183523e-05, "loss": 2.5007, "step": 31910 }, { "epoch": 0.41, "learning_rate": 6.343154672125043e-05, "loss": 2.6585, "step": 31915 }, { "epoch": 0.41, "learning_rate": 6.342171551103256e-05, "loss": 2.6737, "step": 31920 }, { "epoch": 0.41, "learning_rate": 6.341188374159124e-05, "loss": 2.6916, "step": 31925 }, { "epoch": 0.41, "learning_rate": 6.340205141333609e-05, "loss": 2.3761, "step": 31930 }, { "epoch": 0.41, "learning_rate": 6.33922185266768e-05, "loss": 2.4931, "step": 31935 }, { "epoch": 0.41, "learning_rate": 6.338238508202304e-05, "loss": 2.65, "step": 31940 }, { "epoch": 0.41, "learning_rate": 6.337255107978455e-05, "loss": 2.5966, "step": 31945 }, { "epoch": 0.41, "learning_rate": 6.336271652037107e-05, "loss": 2.6897, "step": 31950 }, { "epoch": 0.41, "learning_rate": 6.335288140419235e-05, "loss": 2.6028, "step": 31955 }, { "epoch": 0.41, "learning_rate": 6.334304573165819e-05, "loss": 2.8243, "step": 31960 }, { "epoch": 0.41, "learning_rate": 6.333320950317838e-05, "loss": 2.5196, "step": 31965 }, { "epoch": 0.41, "learning_rate": 6.332337271916276e-05, "loss": 2.5267, "step": 31970 }, { "epoch": 0.41, "learning_rate": 6.331353538002118e-05, "loss": 2.6261, "step": 31975 }, { "epoch": 0.42, "learning_rate": 6.330369748616355e-05, "loss": 2.514, "step": 31980 }, { "epoch": 0.42, "learning_rate": 6.329385903799974e-05, "loss": 2.4966, "step": 31985 }, { "epoch": 0.42, "learning_rate": 6.328402003593968e-05, "loss": 2.6898, "step": 31990 }, { "epoch": 0.42, "learning_rate": 6.327418048039329e-05, "loss": 2.6058, "step": 31995 }, { "epoch": 0.42, "learning_rate": 6.326434037177059e-05, "loss": 2.625, "step": 32000 }, { "epoch": 0.42, "learning_rate": 6.325449971048156e-05, "loss": 2.5583, "step": 32005 }, { "epoch": 0.42, "learning_rate": 6.32446584969362e-05, "loss": 2.6539, "step": 32010 }, { "epoch": 0.42, "learning_rate": 6.323481673154456e-05, "loss": 2.6645, "step": 32015 }, { "epoch": 0.42, "learning_rate": 6.322497441471672e-05, "loss": 2.6515, "step": 32020 }, { "epoch": 0.42, "learning_rate": 6.321513154686273e-05, "loss": 2.4678, "step": 32025 }, { "epoch": 0.42, "learning_rate": 6.320528812839273e-05, "loss": 2.7435, "step": 32030 }, { "epoch": 0.42, "learning_rate": 6.319544415971683e-05, "loss": 2.4793, "step": 32035 }, { "epoch": 0.42, "learning_rate": 6.318559964124519e-05, "loss": 2.7138, "step": 32040 }, { "epoch": 0.42, "learning_rate": 6.317575457338799e-05, "loss": 2.6222, "step": 32045 }, { "epoch": 0.42, "learning_rate": 6.316590895655545e-05, "loss": 2.5565, "step": 32050 }, { "epoch": 0.42, "learning_rate": 6.315606279115775e-05, "loss": 2.5809, "step": 32055 }, { "epoch": 0.42, "learning_rate": 6.314621607760518e-05, "loss": 2.6321, "step": 32060 }, { "epoch": 0.42, "learning_rate": 6.313636881630798e-05, "loss": 2.6489, "step": 32065 }, { "epoch": 0.42, "learning_rate": 6.312652100767645e-05, "loss": 2.6104, "step": 32070 }, { "epoch": 0.42, "learning_rate": 6.311667265212092e-05, "loss": 2.5475, "step": 32075 }, { "epoch": 0.42, "learning_rate": 6.310682375005169e-05, "loss": 2.6427, "step": 32080 }, { "epoch": 0.42, "learning_rate": 6.309697430187916e-05, "loss": 2.5693, "step": 32085 }, { "epoch": 0.42, "learning_rate": 6.308712430801369e-05, "loss": 2.5856, "step": 32090 }, { "epoch": 0.42, "learning_rate": 6.30772737688657e-05, "loss": 2.5213, "step": 32095 }, { "epoch": 0.42, "learning_rate": 6.30674226848456e-05, "loss": 2.5072, "step": 32100 }, { "epoch": 0.42, "learning_rate": 6.305757105636385e-05, "loss": 2.7023, "step": 32105 }, { "epoch": 0.42, "learning_rate": 6.304771888383094e-05, "loss": 2.6298, "step": 32110 }, { "epoch": 0.42, "learning_rate": 6.303786616765735e-05, "loss": 2.6955, "step": 32115 }, { "epoch": 0.42, "learning_rate": 6.302801290825359e-05, "loss": 2.4752, "step": 32120 }, { "epoch": 0.42, "learning_rate": 6.301815910603022e-05, "loss": 2.5977, "step": 32125 }, { "epoch": 0.42, "learning_rate": 6.300830476139779e-05, "loss": 2.5337, "step": 32130 }, { "epoch": 0.42, "learning_rate": 6.29984498747669e-05, "loss": 2.7005, "step": 32135 }, { "epoch": 0.42, "learning_rate": 6.298859444654814e-05, "loss": 2.4342, "step": 32140 }, { "epoch": 0.42, "learning_rate": 6.297873847715217e-05, "loss": 2.6372, "step": 32145 }, { "epoch": 0.42, "learning_rate": 6.296888196698962e-05, "loss": 2.4551, "step": 32150 }, { "epoch": 0.42, "learning_rate": 6.29590249164712e-05, "loss": 2.534, "step": 32155 }, { "epoch": 0.42, "learning_rate": 6.294916732600757e-05, "loss": 2.47, "step": 32160 }, { "epoch": 0.42, "learning_rate": 6.293930919600946e-05, "loss": 2.554, "step": 32165 }, { "epoch": 0.42, "learning_rate": 6.292945052688763e-05, "loss": 2.5341, "step": 32170 }, { "epoch": 0.42, "learning_rate": 6.291959131905283e-05, "loss": 2.7337, "step": 32175 }, { "epoch": 0.42, "learning_rate": 6.290973157291587e-05, "loss": 2.6688, "step": 32180 }, { "epoch": 0.42, "learning_rate": 6.289987128888756e-05, "loss": 2.5703, "step": 32185 }, { "epoch": 0.42, "learning_rate": 6.289001046737873e-05, "loss": 2.6631, "step": 32190 }, { "epoch": 0.42, "learning_rate": 6.28801491088002e-05, "loss": 2.4487, "step": 32195 }, { "epoch": 0.42, "learning_rate": 6.287028721356292e-05, "loss": 2.6623, "step": 32200 }, { "epoch": 0.42, "learning_rate": 6.286042478207775e-05, "loss": 2.4776, "step": 32205 }, { "epoch": 0.42, "learning_rate": 6.285056181475558e-05, "loss": 2.5646, "step": 32210 }, { "epoch": 0.42, "learning_rate": 6.284069831200742e-05, "loss": 2.4357, "step": 32215 }, { "epoch": 0.42, "learning_rate": 6.283083427424422e-05, "loss": 2.5405, "step": 32220 }, { "epoch": 0.42, "learning_rate": 6.282096970187697e-05, "loss": 2.4319, "step": 32225 }, { "epoch": 0.42, "learning_rate": 6.281110459531665e-05, "loss": 2.5502, "step": 32230 }, { "epoch": 0.42, "learning_rate": 6.280123895497434e-05, "loss": 2.5267, "step": 32235 }, { "epoch": 0.42, "learning_rate": 6.279137278126106e-05, "loss": 2.5682, "step": 32240 }, { "epoch": 0.42, "learning_rate": 6.278150607458792e-05, "loss": 2.6925, "step": 32245 }, { "epoch": 0.42, "learning_rate": 6.277163883536602e-05, "loss": 2.6475, "step": 32250 }, { "epoch": 0.42, "learning_rate": 6.276177106400647e-05, "loss": 2.6014, "step": 32255 }, { "epoch": 0.42, "learning_rate": 6.27519027609204e-05, "loss": 2.6753, "step": 32260 }, { "epoch": 0.42, "learning_rate": 6.274203392651903e-05, "loss": 2.541, "step": 32265 }, { "epoch": 0.42, "learning_rate": 6.273216456121349e-05, "loss": 2.5264, "step": 32270 }, { "epoch": 0.42, "learning_rate": 6.272229466541505e-05, "loss": 2.5328, "step": 32275 }, { "epoch": 0.42, "learning_rate": 6.271242423953492e-05, "loss": 2.6162, "step": 32280 }, { "epoch": 0.42, "learning_rate": 6.270255328398434e-05, "loss": 2.6237, "step": 32285 }, { "epoch": 0.42, "learning_rate": 6.26926817991746e-05, "loss": 2.572, "step": 32290 }, { "epoch": 0.42, "learning_rate": 6.268280978551701e-05, "loss": 2.4709, "step": 32295 }, { "epoch": 0.42, "learning_rate": 6.267293724342289e-05, "loss": 2.6751, "step": 32300 }, { "epoch": 0.42, "learning_rate": 6.266306417330359e-05, "loss": 2.4872, "step": 32305 }, { "epoch": 0.42, "learning_rate": 6.265319057557046e-05, "loss": 2.6526, "step": 32310 }, { "epoch": 0.42, "learning_rate": 6.264331645063492e-05, "loss": 2.5637, "step": 32315 }, { "epoch": 0.42, "learning_rate": 6.263344179890834e-05, "loss": 2.663, "step": 32320 }, { "epoch": 0.42, "learning_rate": 6.262356662080217e-05, "loss": 2.5547, "step": 32325 }, { "epoch": 0.42, "learning_rate": 6.261369091672787e-05, "loss": 2.5205, "step": 32330 }, { "epoch": 0.42, "learning_rate": 6.260381468709693e-05, "loss": 2.5238, "step": 32335 }, { "epoch": 0.42, "learning_rate": 6.259393793232083e-05, "loss": 2.6018, "step": 32340 }, { "epoch": 0.42, "learning_rate": 6.25840606528111e-05, "loss": 2.5726, "step": 32345 }, { "epoch": 0.42, "learning_rate": 6.257418284897927e-05, "loss": 2.5577, "step": 32350 }, { "epoch": 0.42, "learning_rate": 6.25643045212369e-05, "loss": 2.5885, "step": 32355 }, { "epoch": 0.42, "learning_rate": 6.255442566999559e-05, "loss": 2.5664, "step": 32360 }, { "epoch": 0.42, "learning_rate": 6.254454629566696e-05, "loss": 2.529, "step": 32365 }, { "epoch": 0.42, "learning_rate": 6.253466639866262e-05, "loss": 2.4948, "step": 32370 }, { "epoch": 0.42, "learning_rate": 6.252478597939424e-05, "loss": 2.5294, "step": 32375 }, { "epoch": 0.42, "learning_rate": 6.251490503827347e-05, "loss": 2.504, "step": 32380 }, { "epoch": 0.42, "learning_rate": 6.250502357571199e-05, "loss": 2.5868, "step": 32385 }, { "epoch": 0.42, "learning_rate": 6.249514159212156e-05, "loss": 2.5036, "step": 32390 }, { "epoch": 0.42, "learning_rate": 6.248525908791392e-05, "loss": 2.686, "step": 32395 }, { "epoch": 0.42, "learning_rate": 6.24753760635008e-05, "loss": 2.516, "step": 32400 }, { "epoch": 0.42, "learning_rate": 6.246549251929399e-05, "loss": 2.6074, "step": 32405 }, { "epoch": 0.42, "learning_rate": 6.24556084557053e-05, "loss": 2.557, "step": 32410 }, { "epoch": 0.42, "learning_rate": 6.244572387314655e-05, "loss": 2.6298, "step": 32415 }, { "epoch": 0.42, "learning_rate": 6.243583877202958e-05, "loss": 2.6075, "step": 32420 }, { "epoch": 0.42, "learning_rate": 6.242595315276627e-05, "loss": 2.5689, "step": 32425 }, { "epoch": 0.42, "learning_rate": 6.241606701576852e-05, "loss": 2.6256, "step": 32430 }, { "epoch": 0.42, "learning_rate": 6.240618036144821e-05, "loss": 2.8021, "step": 32435 }, { "epoch": 0.42, "learning_rate": 6.239629319021732e-05, "loss": 2.5329, "step": 32440 }, { "epoch": 0.42, "learning_rate": 6.238640550248776e-05, "loss": 2.472, "step": 32445 }, { "epoch": 0.42, "learning_rate": 6.23765172986715e-05, "loss": 2.535, "step": 32450 }, { "epoch": 0.42, "learning_rate": 6.236662857918057e-05, "loss": 2.6435, "step": 32455 }, { "epoch": 0.42, "learning_rate": 6.2356739344427e-05, "loss": 2.4947, "step": 32460 }, { "epoch": 0.42, "learning_rate": 6.23468495948228e-05, "loss": 2.6249, "step": 32465 }, { "epoch": 0.42, "learning_rate": 6.233695933078004e-05, "loss": 2.5605, "step": 32470 }, { "epoch": 0.42, "learning_rate": 6.23270685527108e-05, "loss": 2.5794, "step": 32475 }, { "epoch": 0.42, "learning_rate": 6.231717726102719e-05, "loss": 2.5463, "step": 32480 }, { "epoch": 0.42, "learning_rate": 6.230728545614133e-05, "loss": 2.5948, "step": 32485 }, { "epoch": 0.42, "learning_rate": 6.229739313846542e-05, "loss": 2.6401, "step": 32490 }, { "epoch": 0.42, "learning_rate": 6.228750030841154e-05, "loss": 2.5898, "step": 32495 }, { "epoch": 0.42, "learning_rate": 6.227760696639193e-05, "loss": 2.7162, "step": 32500 }, { "epoch": 0.42, "learning_rate": 6.22677131128188e-05, "loss": 2.644, "step": 32505 }, { "epoch": 0.42, "learning_rate": 6.225781874810439e-05, "loss": 2.4967, "step": 32510 }, { "epoch": 0.42, "learning_rate": 6.224792387266091e-05, "loss": 2.6499, "step": 32515 }, { "epoch": 0.42, "learning_rate": 6.22380284869007e-05, "loss": 2.6061, "step": 32520 }, { "epoch": 0.42, "learning_rate": 6.2228132591236e-05, "loss": 2.652, "step": 32525 }, { "epoch": 0.42, "learning_rate": 6.221823618607919e-05, "loss": 2.7094, "step": 32530 }, { "epoch": 0.42, "learning_rate": 6.220833927184255e-05, "loss": 2.4806, "step": 32535 }, { "epoch": 0.42, "learning_rate": 6.219844184893848e-05, "loss": 2.5826, "step": 32540 }, { "epoch": 0.42, "learning_rate": 6.218854391777931e-05, "loss": 2.641, "step": 32545 }, { "epoch": 0.42, "learning_rate": 6.21786454787775e-05, "loss": 2.8064, "step": 32550 }, { "epoch": 0.42, "learning_rate": 6.216874653234545e-05, "loss": 2.5519, "step": 32555 }, { "epoch": 0.42, "learning_rate": 6.215884707889562e-05, "loss": 2.5305, "step": 32560 }, { "epoch": 0.42, "learning_rate": 6.214894711884046e-05, "loss": 2.5885, "step": 32565 }, { "epoch": 0.42, "learning_rate": 6.213904665259247e-05, "loss": 2.5958, "step": 32570 }, { "epoch": 0.42, "learning_rate": 6.212914568056413e-05, "loss": 2.5707, "step": 32575 }, { "epoch": 0.42, "learning_rate": 6.211924420316797e-05, "loss": 2.6336, "step": 32580 }, { "epoch": 0.42, "learning_rate": 6.210934222081661e-05, "loss": 2.5011, "step": 32585 }, { "epoch": 0.42, "learning_rate": 6.209943973392255e-05, "loss": 2.5995, "step": 32590 }, { "epoch": 0.42, "learning_rate": 6.208953674289841e-05, "loss": 2.6272, "step": 32595 }, { "epoch": 0.42, "learning_rate": 6.207963324815679e-05, "loss": 2.6466, "step": 32600 }, { "epoch": 0.42, "learning_rate": 6.206972925011034e-05, "loss": 2.4822, "step": 32605 }, { "epoch": 0.42, "learning_rate": 6.205982474917172e-05, "loss": 2.689, "step": 32610 }, { "epoch": 0.42, "learning_rate": 6.204991974575359e-05, "loss": 2.6197, "step": 32615 }, { "epoch": 0.42, "learning_rate": 6.204001424026864e-05, "loss": 2.5673, "step": 32620 }, { "epoch": 0.42, "learning_rate": 6.203010823312961e-05, "loss": 2.5508, "step": 32625 }, { "epoch": 0.42, "learning_rate": 6.202020172474926e-05, "loss": 2.7319, "step": 32630 }, { "epoch": 0.42, "learning_rate": 6.201029471554029e-05, "loss": 2.6019, "step": 32635 }, { "epoch": 0.42, "learning_rate": 6.200038720591551e-05, "loss": 2.6013, "step": 32640 }, { "epoch": 0.42, "learning_rate": 6.199047919628773e-05, "loss": 2.7175, "step": 32645 }, { "epoch": 0.42, "learning_rate": 6.198057068706978e-05, "loss": 2.5035, "step": 32650 }, { "epoch": 0.42, "learning_rate": 6.197066167867449e-05, "loss": 2.4995, "step": 32655 }, { "epoch": 0.42, "learning_rate": 6.196075217151473e-05, "loss": 2.5818, "step": 32660 }, { "epoch": 0.42, "learning_rate": 6.195084216600337e-05, "loss": 2.663, "step": 32665 }, { "epoch": 0.42, "learning_rate": 6.194093166255333e-05, "loss": 2.57, "step": 32670 }, { "epoch": 0.42, "learning_rate": 6.193102066157754e-05, "loss": 2.5551, "step": 32675 }, { "epoch": 0.42, "learning_rate": 6.192110916348895e-05, "loss": 2.7318, "step": 32680 }, { "epoch": 0.42, "learning_rate": 6.191119716870051e-05, "loss": 2.5855, "step": 32685 }, { "epoch": 0.42, "learning_rate": 6.190128467762523e-05, "loss": 2.5468, "step": 32690 }, { "epoch": 0.42, "learning_rate": 6.18913716906761e-05, "loss": 2.4276, "step": 32695 }, { "epoch": 0.42, "learning_rate": 6.188145820826616e-05, "loss": 2.6546, "step": 32700 }, { "epoch": 0.42, "learning_rate": 6.187154423080845e-05, "loss": 2.4929, "step": 32705 }, { "epoch": 0.42, "learning_rate": 6.186162975871606e-05, "loss": 2.4845, "step": 32710 }, { "epoch": 0.42, "learning_rate": 6.185171479240208e-05, "loss": 2.509, "step": 32715 }, { "epoch": 0.42, "learning_rate": 6.184179933227963e-05, "loss": 2.5334, "step": 32720 }, { "epoch": 0.42, "learning_rate": 6.183188337876181e-05, "loss": 2.6139, "step": 32725 }, { "epoch": 0.42, "learning_rate": 6.18219669322618e-05, "loss": 2.6722, "step": 32730 }, { "epoch": 0.42, "learning_rate": 6.181204999319277e-05, "loss": 2.6424, "step": 32735 }, { "epoch": 0.42, "learning_rate": 6.18021325619679e-05, "loss": 2.5952, "step": 32740 }, { "epoch": 0.42, "learning_rate": 6.179221463900043e-05, "loss": 2.5049, "step": 32745 }, { "epoch": 0.43, "learning_rate": 6.178229622470359e-05, "loss": 2.6399, "step": 32750 }, { "epoch": 0.43, "learning_rate": 6.177237731949064e-05, "loss": 2.5539, "step": 32755 }, { "epoch": 0.43, "learning_rate": 6.176245792377482e-05, "loss": 2.5239, "step": 32760 }, { "epoch": 0.43, "learning_rate": 6.175253803796947e-05, "loss": 2.5939, "step": 32765 }, { "epoch": 0.43, "learning_rate": 6.17426176624879e-05, "loss": 2.4858, "step": 32770 }, { "epoch": 0.43, "learning_rate": 6.173269679774343e-05, "loss": 2.5605, "step": 32775 }, { "epoch": 0.43, "learning_rate": 6.172277544414943e-05, "loss": 2.5942, "step": 32780 }, { "epoch": 0.43, "learning_rate": 6.17128536021193e-05, "loss": 2.4976, "step": 32785 }, { "epoch": 0.43, "learning_rate": 6.170293127206639e-05, "loss": 2.5015, "step": 32790 }, { "epoch": 0.43, "learning_rate": 6.169300845440415e-05, "loss": 2.578, "step": 32795 }, { "epoch": 0.43, "learning_rate": 6.168308514954602e-05, "loss": 2.5211, "step": 32800 }, { "epoch": 0.43, "learning_rate": 6.167316135790548e-05, "loss": 2.6533, "step": 32805 }, { "epoch": 0.43, "learning_rate": 6.166323707989597e-05, "loss": 2.5929, "step": 32810 }, { "epoch": 0.43, "learning_rate": 6.165331231593101e-05, "loss": 2.5403, "step": 32815 }, { "epoch": 0.43, "learning_rate": 6.164338706642412e-05, "loss": 2.5658, "step": 32820 }, { "epoch": 0.43, "learning_rate": 6.163346133178885e-05, "loss": 2.4941, "step": 32825 }, { "epoch": 0.43, "learning_rate": 6.162353511243874e-05, "loss": 2.5325, "step": 32830 }, { "epoch": 0.43, "learning_rate": 6.161360840878737e-05, "loss": 2.4989, "step": 32835 }, { "epoch": 0.43, "learning_rate": 6.160368122124838e-05, "loss": 2.638, "step": 32840 }, { "epoch": 0.43, "learning_rate": 6.159375355023537e-05, "loss": 2.6226, "step": 32845 }, { "epoch": 0.43, "learning_rate": 6.158382539616195e-05, "loss": 2.5328, "step": 32850 }, { "epoch": 0.43, "learning_rate": 6.157389675944184e-05, "loss": 2.6024, "step": 32855 }, { "epoch": 0.43, "learning_rate": 6.15639676404887e-05, "loss": 2.5311, "step": 32860 }, { "epoch": 0.43, "learning_rate": 6.15540380397162e-05, "loss": 2.5203, "step": 32865 }, { "epoch": 0.43, "learning_rate": 6.154410795753811e-05, "loss": 2.4481, "step": 32870 }, { "epoch": 0.43, "learning_rate": 6.153417739436814e-05, "loss": 2.637, "step": 32875 }, { "epoch": 0.43, "learning_rate": 6.152424635062007e-05, "loss": 2.6109, "step": 32880 }, { "epoch": 0.43, "learning_rate": 6.151431482670768e-05, "loss": 2.5146, "step": 32885 }, { "epoch": 0.43, "learning_rate": 6.150438282304476e-05, "loss": 2.481, "step": 32890 }, { "epoch": 0.43, "learning_rate": 6.149445034004515e-05, "loss": 2.763, "step": 32895 }, { "epoch": 0.43, "learning_rate": 6.148451737812268e-05, "loss": 2.6187, "step": 32900 }, { "epoch": 0.43, "learning_rate": 6.147458393769123e-05, "loss": 2.6567, "step": 32905 }, { "epoch": 0.43, "learning_rate": 6.146465001916465e-05, "loss": 2.7245, "step": 32910 }, { "epoch": 0.43, "learning_rate": 6.145471562295687e-05, "loss": 2.5524, "step": 32915 }, { "epoch": 0.43, "learning_rate": 6.14447807494818e-05, "loss": 2.6094, "step": 32920 }, { "epoch": 0.43, "learning_rate": 6.143484539915341e-05, "loss": 2.6644, "step": 32925 }, { "epoch": 0.43, "learning_rate": 6.142490957238563e-05, "loss": 2.6435, "step": 32930 }, { "epoch": 0.43, "learning_rate": 6.141497326959243e-05, "loss": 2.6011, "step": 32935 }, { "epoch": 0.43, "learning_rate": 6.140503649118786e-05, "loss": 2.5921, "step": 32940 }, { "epoch": 0.43, "learning_rate": 6.139509923758589e-05, "loss": 2.499, "step": 32945 }, { "epoch": 0.43, "learning_rate": 6.13851615092006e-05, "loss": 2.4259, "step": 32950 }, { "epoch": 0.43, "learning_rate": 6.137522330644604e-05, "loss": 2.7431, "step": 32955 }, { "epoch": 0.43, "learning_rate": 6.136528462973628e-05, "loss": 2.5372, "step": 32960 }, { "epoch": 0.43, "learning_rate": 6.135534547948543e-05, "loss": 2.5283, "step": 32965 }, { "epoch": 0.43, "learning_rate": 6.13454058561076e-05, "loss": 2.7066, "step": 32970 }, { "epoch": 0.43, "learning_rate": 6.133546576001695e-05, "loss": 2.6342, "step": 32975 }, { "epoch": 0.43, "learning_rate": 6.132552519162761e-05, "loss": 2.4891, "step": 32980 }, { "epoch": 0.43, "learning_rate": 6.13155841513538e-05, "loss": 2.636, "step": 32985 }, { "epoch": 0.43, "learning_rate": 6.130564263960968e-05, "loss": 2.8164, "step": 32990 }, { "epoch": 0.43, "learning_rate": 6.129570065680951e-05, "loss": 2.6678, "step": 32995 }, { "epoch": 0.43, "learning_rate": 6.128575820336749e-05, "loss": 2.5892, "step": 33000 }, { "epoch": 0.43, "learning_rate": 6.127581527969788e-05, "loss": 2.5694, "step": 33005 }, { "epoch": 0.43, "learning_rate": 6.126587188621499e-05, "loss": 2.4619, "step": 33010 }, { "epoch": 0.43, "learning_rate": 6.125592802333309e-05, "loss": 2.5313, "step": 33015 }, { "epoch": 0.43, "learning_rate": 6.124598369146649e-05, "loss": 2.6301, "step": 33020 }, { "epoch": 0.43, "learning_rate": 6.123603889102955e-05, "loss": 2.684, "step": 33025 }, { "epoch": 0.43, "learning_rate": 6.122609362243663e-05, "loss": 2.6047, "step": 33030 }, { "epoch": 0.43, "learning_rate": 6.121614788610206e-05, "loss": 2.6589, "step": 33035 }, { "epoch": 0.43, "learning_rate": 6.12062016824403e-05, "loss": 2.5915, "step": 33040 }, { "epoch": 0.43, "learning_rate": 6.119625501186572e-05, "loss": 2.7858, "step": 33045 }, { "epoch": 0.43, "learning_rate": 6.118630787479276e-05, "loss": 2.5748, "step": 33050 }, { "epoch": 0.43, "learning_rate": 6.117636027163587e-05, "loss": 2.7101, "step": 33055 }, { "epoch": 0.43, "learning_rate": 6.116641220280954e-05, "loss": 2.4629, "step": 33060 }, { "epoch": 0.43, "learning_rate": 6.115646366872824e-05, "loss": 2.4134, "step": 33065 }, { "epoch": 0.43, "learning_rate": 6.114651466980652e-05, "loss": 2.5532, "step": 33070 }, { "epoch": 0.43, "learning_rate": 6.113656520645886e-05, "loss": 2.5254, "step": 33075 }, { "epoch": 0.43, "learning_rate": 6.112661527909984e-05, "loss": 2.4656, "step": 33080 }, { "epoch": 0.43, "learning_rate": 6.111666488814402e-05, "loss": 2.701, "step": 33085 }, { "epoch": 0.43, "learning_rate": 6.1106714034006e-05, "loss": 2.5614, "step": 33090 }, { "epoch": 0.43, "learning_rate": 6.109676271710037e-05, "loss": 2.6147, "step": 33095 }, { "epoch": 0.43, "learning_rate": 6.108681093784177e-05, "loss": 2.6973, "step": 33100 }, { "epoch": 0.43, "learning_rate": 6.107685869664485e-05, "loss": 2.5839, "step": 33105 }, { "epoch": 0.43, "learning_rate": 6.106690599392427e-05, "loss": 2.606, "step": 33110 }, { "epoch": 0.43, "learning_rate": 6.10569528300947e-05, "loss": 2.5866, "step": 33115 }, { "epoch": 0.43, "learning_rate": 6.104699920557088e-05, "loss": 2.5291, "step": 33120 }, { "epoch": 0.43, "learning_rate": 6.10370451207675e-05, "loss": 2.5288, "step": 33125 }, { "epoch": 0.43, "learning_rate": 6.102709057609931e-05, "loss": 2.5446, "step": 33130 }, { "epoch": 0.43, "learning_rate": 6.1017135571981086e-05, "loss": 2.6941, "step": 33135 }, { "epoch": 0.43, "learning_rate": 6.10071801088276e-05, "loss": 2.4121, "step": 33140 }, { "epoch": 0.43, "learning_rate": 6.099722418705366e-05, "loss": 2.4776, "step": 33145 }, { "epoch": 0.43, "learning_rate": 6.0987267807074054e-05, "loss": 2.7246, "step": 33150 }, { "epoch": 0.43, "learning_rate": 6.097731096930367e-05, "loss": 2.6039, "step": 33155 }, { "epoch": 0.43, "learning_rate": 6.096735367415731e-05, "loss": 2.6294, "step": 33160 }, { "epoch": 0.43, "learning_rate": 6.095739592204991e-05, "loss": 2.4624, "step": 33165 }, { "epoch": 0.43, "learning_rate": 6.0947437713396315e-05, "loss": 2.6058, "step": 33170 }, { "epoch": 0.43, "learning_rate": 6.0937479048611465e-05, "loss": 2.3639, "step": 33175 }, { "epoch": 0.43, "learning_rate": 6.092751992811029e-05, "loss": 2.7096, "step": 33180 }, { "epoch": 0.43, "learning_rate": 6.091756035230775e-05, "loss": 2.5038, "step": 33185 }, { "epoch": 0.43, "learning_rate": 6.0907600321618775e-05, "loss": 2.6076, "step": 33190 }, { "epoch": 0.43, "learning_rate": 6.089763983645841e-05, "loss": 2.5199, "step": 33195 }, { "epoch": 0.43, "learning_rate": 6.088767889724164e-05, "loss": 2.5626, "step": 33200 }, { "epoch": 0.43, "learning_rate": 6.08777175043835e-05, "loss": 2.7083, "step": 33205 }, { "epoch": 0.43, "learning_rate": 6.086775565829902e-05, "loss": 2.615, "step": 33210 }, { "epoch": 0.43, "learning_rate": 6.085779335940328e-05, "loss": 2.5959, "step": 33215 }, { "epoch": 0.43, "learning_rate": 6.084783060811136e-05, "loss": 2.5278, "step": 33220 }, { "epoch": 0.43, "learning_rate": 6.0837867404838366e-05, "loss": 2.5381, "step": 33225 }, { "epoch": 0.43, "learning_rate": 6.082790374999944e-05, "loss": 2.6567, "step": 33230 }, { "epoch": 0.43, "learning_rate": 6.081793964400969e-05, "loss": 2.5974, "step": 33235 }, { "epoch": 0.43, "learning_rate": 6.080797508728429e-05, "loss": 2.7028, "step": 33240 }, { "epoch": 0.43, "learning_rate": 6.079801008023841e-05, "loss": 2.558, "step": 33245 }, { "epoch": 0.43, "learning_rate": 6.0788044623287265e-05, "loss": 2.5601, "step": 33250 }, { "epoch": 0.43, "learning_rate": 6.0778078716846063e-05, "loss": 2.6023, "step": 33255 }, { "epoch": 0.43, "learning_rate": 6.0768112361330043e-05, "loss": 2.5453, "step": 33260 }, { "epoch": 0.43, "learning_rate": 6.075814555715447e-05, "loss": 2.5636, "step": 33265 }, { "epoch": 0.43, "learning_rate": 6.074817830473458e-05, "loss": 2.5779, "step": 33270 }, { "epoch": 0.43, "learning_rate": 6.073821060448569e-05, "loss": 2.6594, "step": 33275 }, { "epoch": 0.43, "learning_rate": 6.0728242456823104e-05, "loss": 2.6205, "step": 33280 }, { "epoch": 0.43, "learning_rate": 6.071827386216216e-05, "loss": 2.6035, "step": 33285 }, { "epoch": 0.43, "learning_rate": 6.0708304820918204e-05, "loss": 2.6414, "step": 33290 }, { "epoch": 0.43, "learning_rate": 6.0698335333506596e-05, "loss": 2.5453, "step": 33295 }, { "epoch": 0.43, "learning_rate": 6.068836540034271e-05, "loss": 2.5862, "step": 33300 }, { "epoch": 0.43, "learning_rate": 6.067839502184196e-05, "loss": 2.6223, "step": 33305 }, { "epoch": 0.43, "learning_rate": 6.0668424198419774e-05, "loss": 2.541, "step": 33310 }, { "epoch": 0.43, "learning_rate": 6.065845293049157e-05, "loss": 2.6424, "step": 33315 }, { "epoch": 0.43, "learning_rate": 6.064848121847284e-05, "loss": 2.6771, "step": 33320 }, { "epoch": 0.43, "learning_rate": 6.0638509062779036e-05, "loss": 2.5937, "step": 33325 }, { "epoch": 0.43, "learning_rate": 6.062853646382567e-05, "loss": 2.4862, "step": 33330 }, { "epoch": 0.43, "learning_rate": 6.061856342202823e-05, "loss": 2.6085, "step": 33335 }, { "epoch": 0.43, "learning_rate": 6.060858993780226e-05, "loss": 2.5947, "step": 33340 }, { "epoch": 0.43, "learning_rate": 6.0598616011563324e-05, "loss": 2.5328, "step": 33345 }, { "epoch": 0.43, "learning_rate": 6.0588641643727e-05, "loss": 2.6084, "step": 33350 }, { "epoch": 0.43, "learning_rate": 6.057866683470884e-05, "loss": 2.4473, "step": 33355 }, { "epoch": 0.43, "learning_rate": 6.0568691584924474e-05, "loss": 2.5249, "step": 33360 }, { "epoch": 0.43, "learning_rate": 6.055871589478953e-05, "loss": 2.5563, "step": 33365 }, { "epoch": 0.43, "learning_rate": 6.054873976471963e-05, "loss": 2.5154, "step": 33370 }, { "epoch": 0.43, "learning_rate": 6.053876319513044e-05, "loss": 2.5596, "step": 33375 }, { "epoch": 0.43, "learning_rate": 6.052878618643767e-05, "loss": 2.6582, "step": 33380 }, { "epoch": 0.43, "learning_rate": 6.051880873905698e-05, "loss": 2.6919, "step": 33385 }, { "epoch": 0.43, "learning_rate": 6.050883085340411e-05, "loss": 2.4003, "step": 33390 }, { "epoch": 0.43, "learning_rate": 6.049885252989478e-05, "loss": 2.6207, "step": 33395 }, { "epoch": 0.43, "learning_rate": 6.0488873768944745e-05, "loss": 2.637, "step": 33400 }, { "epoch": 0.43, "learning_rate": 6.047889457096977e-05, "loss": 2.5381, "step": 33405 }, { "epoch": 0.43, "learning_rate": 6.0468914936385665e-05, "loss": 2.5148, "step": 33410 }, { "epoch": 0.43, "learning_rate": 6.045893486560823e-05, "loss": 2.5698, "step": 33415 }, { "epoch": 0.43, "learning_rate": 6.044895435905328e-05, "loss": 2.3875, "step": 33420 }, { "epoch": 0.43, "learning_rate": 6.043897341713667e-05, "loss": 2.7016, "step": 33425 }, { "epoch": 0.43, "learning_rate": 6.042899204027423e-05, "loss": 2.5624, "step": 33430 }, { "epoch": 0.43, "learning_rate": 6.041901022888189e-05, "loss": 2.6835, "step": 33435 }, { "epoch": 0.43, "learning_rate": 6.040902798337551e-05, "loss": 2.6728, "step": 33440 }, { "epoch": 0.43, "learning_rate": 6.039904530417102e-05, "loss": 2.5464, "step": 33445 }, { "epoch": 0.43, "learning_rate": 6.0389062191684366e-05, "loss": 2.6883, "step": 33450 }, { "epoch": 0.43, "learning_rate": 6.037907864633148e-05, "loss": 2.5803, "step": 33455 }, { "epoch": 0.43, "learning_rate": 6.036909466852834e-05, "loss": 2.4598, "step": 33460 }, { "epoch": 0.43, "learning_rate": 6.035911025869092e-05, "loss": 2.5237, "step": 33465 }, { "epoch": 0.43, "learning_rate": 6.034912541723524e-05, "loss": 2.5393, "step": 33470 }, { "epoch": 0.43, "learning_rate": 6.0339140144577346e-05, "loss": 2.5087, "step": 33475 }, { "epoch": 0.43, "learning_rate": 6.0329154441133254e-05, "loss": 2.6146, "step": 33480 }, { "epoch": 0.43, "learning_rate": 6.031916830731902e-05, "loss": 2.6192, "step": 33485 }, { "epoch": 0.43, "learning_rate": 6.0309181743550725e-05, "loss": 2.5349, "step": 33490 }, { "epoch": 0.43, "learning_rate": 6.029919475024447e-05, "loss": 2.5284, "step": 33495 }, { "epoch": 0.43, "learning_rate": 6.0289207327816365e-05, "loss": 2.5544, "step": 33500 }, { "epoch": 0.43, "learning_rate": 6.027921947668256e-05, "loss": 2.733, "step": 33505 }, { "epoch": 0.43, "learning_rate": 6.026923119725918e-05, "loss": 2.4842, "step": 33510 }, { "epoch": 0.43, "learning_rate": 6.025924248996241e-05, "loss": 2.635, "step": 33515 }, { "epoch": 0.44, "learning_rate": 6.0249253355208414e-05, "loss": 2.5595, "step": 33520 }, { "epoch": 0.44, "learning_rate": 6.0239263793413414e-05, "loss": 2.7868, "step": 33525 }, { "epoch": 0.44, "learning_rate": 6.0229273804993613e-05, "loss": 2.6451, "step": 33530 }, { "epoch": 0.44, "learning_rate": 6.0219283390365286e-05, "loss": 2.5817, "step": 33535 }, { "epoch": 0.44, "learning_rate": 6.020929254994465e-05, "loss": 2.6352, "step": 33540 }, { "epoch": 0.44, "learning_rate": 6.0199301284148004e-05, "loss": 2.7153, "step": 33545 }, { "epoch": 0.44, "learning_rate": 6.018930959339163e-05, "loss": 2.6779, "step": 33550 }, { "epoch": 0.44, "learning_rate": 6.017931747809184e-05, "loss": 2.7041, "step": 33555 }, { "epoch": 0.44, "learning_rate": 6.016932493866494e-05, "loss": 2.4873, "step": 33560 }, { "epoch": 0.44, "learning_rate": 6.0159331975527286e-05, "loss": 2.5475, "step": 33565 }, { "epoch": 0.44, "learning_rate": 6.0149338589095275e-05, "loss": 2.6441, "step": 33570 }, { "epoch": 0.44, "learning_rate": 6.0139344779785256e-05, "loss": 2.5922, "step": 33575 }, { "epoch": 0.44, "learning_rate": 6.012935054801363e-05, "loss": 2.5309, "step": 33580 }, { "epoch": 0.44, "learning_rate": 6.0119355894196815e-05, "loss": 2.5753, "step": 33585 }, { "epoch": 0.44, "learning_rate": 6.010936081875122e-05, "loss": 2.6426, "step": 33590 }, { "epoch": 0.44, "learning_rate": 6.009936532209334e-05, "loss": 2.4658, "step": 33595 }, { "epoch": 0.44, "learning_rate": 6.008936940463961e-05, "loss": 2.6416, "step": 33600 }, { "epoch": 0.44, "learning_rate": 6.007937306680653e-05, "loss": 2.4398, "step": 33605 }, { "epoch": 0.44, "learning_rate": 6.0069376309010615e-05, "loss": 2.6283, "step": 33610 }, { "epoch": 0.44, "learning_rate": 6.005937913166836e-05, "loss": 2.6702, "step": 33615 }, { "epoch": 0.44, "learning_rate": 6.00493815351963e-05, "loss": 2.6695, "step": 33620 }, { "epoch": 0.44, "learning_rate": 6.0039383520011e-05, "loss": 2.4287, "step": 33625 }, { "epoch": 0.44, "learning_rate": 6.002938508652907e-05, "loss": 2.5287, "step": 33630 }, { "epoch": 0.44, "learning_rate": 6.0019386235167055e-05, "loss": 2.6351, "step": 33635 }, { "epoch": 0.44, "learning_rate": 6.000938696634156e-05, "loss": 2.7229, "step": 33640 }, { "epoch": 0.44, "learning_rate": 5.999938728046924e-05, "loss": 2.6142, "step": 33645 }, { "epoch": 0.44, "learning_rate": 5.9989387177966714e-05, "loss": 2.5605, "step": 33650 }, { "epoch": 0.44, "learning_rate": 5.997938665925067e-05, "loss": 2.5551, "step": 33655 }, { "epoch": 0.44, "learning_rate": 5.9969385724737735e-05, "loss": 2.5248, "step": 33660 }, { "epoch": 0.44, "learning_rate": 5.995938437484466e-05, "loss": 2.6188, "step": 33665 }, { "epoch": 0.44, "learning_rate": 5.9949382609988124e-05, "loss": 2.6644, "step": 33670 }, { "epoch": 0.44, "learning_rate": 5.993938043058488e-05, "loss": 2.6164, "step": 33675 }, { "epoch": 0.44, "learning_rate": 5.992937783705164e-05, "loss": 2.6502, "step": 33680 }, { "epoch": 0.44, "learning_rate": 5.991937482980519e-05, "loss": 2.5017, "step": 33685 }, { "epoch": 0.44, "learning_rate": 5.9909371409262305e-05, "loss": 2.5829, "step": 33690 }, { "epoch": 0.44, "learning_rate": 5.989936757583979e-05, "loss": 2.6721, "step": 33695 }, { "epoch": 0.44, "learning_rate": 5.988936332995446e-05, "loss": 2.3128, "step": 33700 }, { "epoch": 0.44, "learning_rate": 5.9879358672023147e-05, "loss": 2.6842, "step": 33705 }, { "epoch": 0.44, "learning_rate": 5.9869353602462685e-05, "loss": 2.4692, "step": 33710 }, { "epoch": 0.44, "learning_rate": 5.9859348121689974e-05, "loss": 2.6425, "step": 33715 }, { "epoch": 0.44, "learning_rate": 5.9849342230121855e-05, "loss": 2.5682, "step": 33720 }, { "epoch": 0.44, "learning_rate": 5.9839335928175265e-05, "loss": 2.6986, "step": 33725 }, { "epoch": 0.44, "learning_rate": 5.9829329216267114e-05, "loss": 2.5689, "step": 33730 }, { "epoch": 0.44, "learning_rate": 5.981932209481433e-05, "loss": 2.4844, "step": 33735 }, { "epoch": 0.44, "learning_rate": 5.980931456423386e-05, "loss": 2.6416, "step": 33740 }, { "epoch": 0.44, "learning_rate": 5.979930662494269e-05, "loss": 2.563, "step": 33745 }, { "epoch": 0.44, "learning_rate": 5.9789298277357796e-05, "loss": 2.6129, "step": 33750 }, { "epoch": 0.44, "learning_rate": 5.9779289521896174e-05, "loss": 2.7145, "step": 33755 }, { "epoch": 0.44, "learning_rate": 5.9769280358974876e-05, "loss": 2.5696, "step": 33760 }, { "epoch": 0.44, "learning_rate": 5.975927078901091e-05, "loss": 2.4766, "step": 33765 }, { "epoch": 0.44, "learning_rate": 5.9749260812421336e-05, "loss": 2.5981, "step": 33770 }, { "epoch": 0.44, "learning_rate": 5.973925042962322e-05, "loss": 2.5732, "step": 33775 }, { "epoch": 0.44, "learning_rate": 5.972923964103367e-05, "loss": 2.5279, "step": 33780 }, { "epoch": 0.44, "learning_rate": 5.971922844706976e-05, "loss": 2.5778, "step": 33785 }, { "epoch": 0.44, "learning_rate": 5.970921684814865e-05, "loss": 2.497, "step": 33790 }, { "epoch": 0.44, "learning_rate": 5.969920484468746e-05, "loss": 2.4773, "step": 33795 }, { "epoch": 0.44, "learning_rate": 5.9689192437103345e-05, "loss": 2.48, "step": 33800 }, { "epoch": 0.44, "learning_rate": 5.967917962581347e-05, "loss": 2.5284, "step": 33805 }, { "epoch": 0.44, "learning_rate": 5.966916641123505e-05, "loss": 2.4957, "step": 33810 }, { "epoch": 0.44, "learning_rate": 5.965915279378525e-05, "loss": 2.7064, "step": 33815 }, { "epoch": 0.44, "learning_rate": 5.964913877388134e-05, "loss": 2.4989, "step": 33820 }, { "epoch": 0.44, "learning_rate": 5.9639124351940545e-05, "loss": 2.525, "step": 33825 }, { "epoch": 0.44, "learning_rate": 5.96291095283801e-05, "loss": 2.5834, "step": 33830 }, { "epoch": 0.44, "learning_rate": 5.961909430361728e-05, "loss": 2.3772, "step": 33835 }, { "epoch": 0.44, "learning_rate": 5.960907867806942e-05, "loss": 2.5084, "step": 33840 }, { "epoch": 0.44, "learning_rate": 5.959906265215376e-05, "loss": 2.6413, "step": 33845 }, { "epoch": 0.44, "learning_rate": 5.958904622628768e-05, "loss": 2.5784, "step": 33850 }, { "epoch": 0.44, "learning_rate": 5.9579029400888496e-05, "loss": 2.658, "step": 33855 }, { "epoch": 0.44, "learning_rate": 5.9569012176373576e-05, "loss": 2.5623, "step": 33860 }, { "epoch": 0.44, "learning_rate": 5.955899455316026e-05, "loss": 2.6132, "step": 33865 }, { "epoch": 0.44, "learning_rate": 5.9548976531665975e-05, "loss": 2.7691, "step": 33870 }, { "epoch": 0.44, "learning_rate": 5.953895811230812e-05, "loss": 2.4796, "step": 33875 }, { "epoch": 0.44, "learning_rate": 5.9528939295504105e-05, "loss": 2.4878, "step": 33880 }, { "epoch": 0.44, "learning_rate": 5.951892008167138e-05, "loss": 2.5056, "step": 33885 }, { "epoch": 0.44, "learning_rate": 5.9508900471227416e-05, "loss": 2.6129, "step": 33890 }, { "epoch": 0.44, "learning_rate": 5.9498880464589636e-05, "loss": 2.3555, "step": 33895 }, { "epoch": 0.44, "learning_rate": 5.948886006217559e-05, "loss": 2.6967, "step": 33900 }, { "epoch": 0.44, "learning_rate": 5.9478839264402755e-05, "loss": 2.6016, "step": 33905 }, { "epoch": 0.44, "learning_rate": 5.946881807168864e-05, "loss": 2.658, "step": 33910 }, { "epoch": 0.44, "learning_rate": 5.9458796484450794e-05, "loss": 2.6406, "step": 33915 }, { "epoch": 0.44, "learning_rate": 5.9448774503106794e-05, "loss": 2.5724, "step": 33920 }, { "epoch": 0.44, "learning_rate": 5.943875212807418e-05, "loss": 2.5686, "step": 33925 }, { "epoch": 0.44, "learning_rate": 5.9428729359770565e-05, "loss": 2.5899, "step": 33930 }, { "epoch": 0.44, "learning_rate": 5.9418706198613536e-05, "loss": 2.6153, "step": 33935 }, { "epoch": 0.44, "learning_rate": 5.940868264502072e-05, "loss": 2.7747, "step": 33940 }, { "epoch": 0.44, "learning_rate": 5.939865869940976e-05, "loss": 2.63, "step": 33945 }, { "epoch": 0.44, "learning_rate": 5.9388634362198304e-05, "loss": 2.5738, "step": 33950 }, { "epoch": 0.44, "learning_rate": 5.937860963380403e-05, "loss": 2.6768, "step": 33955 }, { "epoch": 0.44, "learning_rate": 5.936858451464459e-05, "loss": 2.5448, "step": 33960 }, { "epoch": 0.44, "learning_rate": 5.935855900513773e-05, "loss": 2.4988, "step": 33965 }, { "epoch": 0.44, "learning_rate": 5.9348533105701146e-05, "loss": 2.5842, "step": 33970 }, { "epoch": 0.44, "learning_rate": 5.933850681675257e-05, "loss": 2.6997, "step": 33975 }, { "epoch": 0.44, "learning_rate": 5.9328480138709775e-05, "loss": 2.691, "step": 33980 }, { "epoch": 0.44, "learning_rate": 5.931845307199051e-05, "loss": 2.4965, "step": 33985 }, { "epoch": 0.44, "learning_rate": 5.930842561701254e-05, "loss": 2.6114, "step": 33990 }, { "epoch": 0.44, "learning_rate": 5.929839777419372e-05, "loss": 2.6618, "step": 33995 }, { "epoch": 0.44, "learning_rate": 5.9288369543951814e-05, "loss": 2.6963, "step": 34000 }, { "epoch": 0.44, "learning_rate": 5.927834092670467e-05, "loss": 2.5337, "step": 34005 }, { "epoch": 0.44, "learning_rate": 5.9268311922870145e-05, "loss": 2.5481, "step": 34010 }, { "epoch": 0.44, "learning_rate": 5.9258282532866095e-05, "loss": 2.6993, "step": 34015 }, { "epoch": 0.44, "learning_rate": 5.92482527571104e-05, "loss": 2.5735, "step": 34020 }, { "epoch": 0.44, "learning_rate": 5.9238222596020966e-05, "loss": 2.5428, "step": 34025 }, { "epoch": 0.44, "learning_rate": 5.92281920500157e-05, "loss": 2.5536, "step": 34030 }, { "epoch": 0.44, "learning_rate": 5.921816111951251e-05, "loss": 2.5198, "step": 34035 }, { "epoch": 0.44, "learning_rate": 5.920812980492937e-05, "loss": 2.6806, "step": 34040 }, { "epoch": 0.44, "learning_rate": 5.919809810668423e-05, "loss": 2.5006, "step": 34045 }, { "epoch": 0.44, "learning_rate": 5.918806602519505e-05, "loss": 2.5717, "step": 34050 }, { "epoch": 0.44, "learning_rate": 5.9178033560879866e-05, "loss": 2.5987, "step": 34055 }, { "epoch": 0.44, "learning_rate": 5.9168000714156646e-05, "loss": 2.4316, "step": 34060 }, { "epoch": 0.44, "learning_rate": 5.915796748544343e-05, "loss": 2.5047, "step": 34065 }, { "epoch": 0.44, "learning_rate": 5.914793387515824e-05, "loss": 2.6419, "step": 34070 }, { "epoch": 0.44, "learning_rate": 5.913789988371916e-05, "loss": 2.6373, "step": 34075 }, { "epoch": 0.44, "learning_rate": 5.912786551154424e-05, "loss": 2.4857, "step": 34080 }, { "epoch": 0.44, "learning_rate": 5.911783075905158e-05, "loss": 2.5319, "step": 34085 }, { "epoch": 0.44, "learning_rate": 5.910779562665929e-05, "loss": 2.406, "step": 34090 }, { "epoch": 0.44, "learning_rate": 5.9097760114785486e-05, "loss": 2.5253, "step": 34095 }, { "epoch": 0.44, "learning_rate": 5.9087724223848276e-05, "loss": 2.6214, "step": 34100 }, { "epoch": 0.44, "learning_rate": 5.907768795426585e-05, "loss": 2.6325, "step": 34105 }, { "epoch": 0.44, "learning_rate": 5.906765130645634e-05, "loss": 2.7448, "step": 34110 }, { "epoch": 0.44, "learning_rate": 5.905761428083796e-05, "loss": 2.5464, "step": 34115 }, { "epoch": 0.44, "learning_rate": 5.904757687782889e-05, "loss": 2.7056, "step": 34120 }, { "epoch": 0.44, "learning_rate": 5.903753909784735e-05, "loss": 2.6938, "step": 34125 }, { "epoch": 0.44, "learning_rate": 5.902750094131157e-05, "loss": 2.5918, "step": 34130 }, { "epoch": 0.44, "learning_rate": 5.901746240863979e-05, "loss": 2.5922, "step": 34135 }, { "epoch": 0.44, "learning_rate": 5.900742350025027e-05, "loss": 2.5029, "step": 34140 }, { "epoch": 0.44, "learning_rate": 5.89973842165613e-05, "loss": 2.5827, "step": 34145 }, { "epoch": 0.44, "learning_rate": 5.8987344557991164e-05, "loss": 2.5982, "step": 34150 }, { "epoch": 0.44, "learning_rate": 5.8977304524958176e-05, "loss": 2.5801, "step": 34155 }, { "epoch": 0.44, "learning_rate": 5.896726411788066e-05, "loss": 2.615, "step": 34160 }, { "epoch": 0.44, "learning_rate": 5.895722333717692e-05, "loss": 2.5722, "step": 34165 }, { "epoch": 0.44, "learning_rate": 5.894718218326537e-05, "loss": 2.5525, "step": 34170 }, { "epoch": 0.44, "learning_rate": 5.893714065656434e-05, "loss": 2.5811, "step": 34175 }, { "epoch": 0.44, "learning_rate": 5.892709875749223e-05, "loss": 2.6239, "step": 34180 }, { "epoch": 0.44, "learning_rate": 5.891705648646744e-05, "loss": 2.7538, "step": 34185 }, { "epoch": 0.44, "learning_rate": 5.8907013843908384e-05, "loss": 2.6162, "step": 34190 }, { "epoch": 0.44, "learning_rate": 5.889697083023349e-05, "loss": 2.6962, "step": 34195 }, { "epoch": 0.44, "learning_rate": 5.888692744586122e-05, "loss": 2.6252, "step": 34200 }, { "epoch": 0.44, "learning_rate": 5.8876883691210014e-05, "loss": 2.594, "step": 34205 }, { "epoch": 0.44, "learning_rate": 5.8866839566698385e-05, "loss": 2.5355, "step": 34210 }, { "epoch": 0.44, "learning_rate": 5.885679507274481e-05, "loss": 2.6294, "step": 34215 }, { "epoch": 0.44, "learning_rate": 5.884675020976779e-05, "loss": 2.4498, "step": 34220 }, { "epoch": 0.44, "learning_rate": 5.883670497818585e-05, "loss": 2.7378, "step": 34225 }, { "epoch": 0.44, "learning_rate": 5.882665937841755e-05, "loss": 2.5507, "step": 34230 }, { "epoch": 0.44, "learning_rate": 5.8816613410881416e-05, "loss": 2.5873, "step": 34235 }, { "epoch": 0.44, "learning_rate": 5.8806567075996043e-05, "loss": 2.6581, "step": 34240 }, { "epoch": 0.44, "learning_rate": 5.8796520374180016e-05, "loss": 2.5649, "step": 34245 }, { "epoch": 0.44, "learning_rate": 5.878647330585194e-05, "loss": 2.6367, "step": 34250 }, { "epoch": 0.44, "learning_rate": 5.877642587143039e-05, "loss": 2.6136, "step": 34255 }, { "epoch": 0.44, "learning_rate": 5.876637807133406e-05, "loss": 2.4795, "step": 34260 }, { "epoch": 0.44, "learning_rate": 5.875632990598155e-05, "loss": 2.5483, "step": 34265 }, { "epoch": 0.44, "learning_rate": 5.874628137579156e-05, "loss": 2.6165, "step": 34270 }, { "epoch": 0.44, "learning_rate": 5.873623248118274e-05, "loss": 2.3693, "step": 34275 }, { "epoch": 0.44, "learning_rate": 5.872618322257379e-05, "loss": 2.5053, "step": 34280 }, { "epoch": 0.44, "learning_rate": 5.8716133600383426e-05, "loss": 2.5706, "step": 34285 }, { "epoch": 0.45, "learning_rate": 5.870608361503035e-05, "loss": 2.6443, "step": 34290 }, { "epoch": 0.45, "learning_rate": 5.869603326693332e-05, "loss": 2.4854, "step": 34295 }, { "epoch": 0.45, "learning_rate": 5.8685982556511086e-05, "loss": 2.5173, "step": 34300 }, { "epoch": 0.45, "learning_rate": 5.867593148418242e-05, "loss": 2.6302, "step": 34305 }, { "epoch": 0.45, "learning_rate": 5.8665880050366106e-05, "loss": 2.7687, "step": 34310 }, { "epoch": 0.45, "learning_rate": 5.8655828255480924e-05, "loss": 2.5179, "step": 34315 }, { "epoch": 0.45, "learning_rate": 5.86457760999457e-05, "loss": 2.5806, "step": 34320 }, { "epoch": 0.45, "learning_rate": 5.863572358417927e-05, "loss": 2.5898, "step": 34325 }, { "epoch": 0.45, "learning_rate": 5.862567070860048e-05, "loss": 2.6678, "step": 34330 }, { "epoch": 0.45, "learning_rate": 5.861561747362817e-05, "loss": 2.5668, "step": 34335 }, { "epoch": 0.45, "learning_rate": 5.8605563879681235e-05, "loss": 2.5397, "step": 34340 }, { "epoch": 0.45, "learning_rate": 5.859550992717855e-05, "loss": 2.5726, "step": 34345 }, { "epoch": 0.45, "learning_rate": 5.8585455616539006e-05, "loss": 2.671, "step": 34350 }, { "epoch": 0.45, "learning_rate": 5.8575400948181544e-05, "loss": 2.643, "step": 34355 }, { "epoch": 0.45, "learning_rate": 5.856534592252511e-05, "loss": 2.6439, "step": 34360 }, { "epoch": 0.45, "learning_rate": 5.855529053998862e-05, "loss": 2.4932, "step": 34365 }, { "epoch": 0.45, "learning_rate": 5.854523480099106e-05, "loss": 2.8095, "step": 34370 }, { "epoch": 0.45, "learning_rate": 5.8535178705951385e-05, "loss": 2.7409, "step": 34375 }, { "epoch": 0.45, "learning_rate": 5.852512225528862e-05, "loss": 2.6618, "step": 34380 }, { "epoch": 0.45, "learning_rate": 5.851506544942174e-05, "loss": 2.4595, "step": 34385 }, { "epoch": 0.45, "learning_rate": 5.8505008288769766e-05, "loss": 2.542, "step": 34390 }, { "epoch": 0.45, "learning_rate": 5.8494950773751775e-05, "loss": 2.5934, "step": 34395 }, { "epoch": 0.45, "learning_rate": 5.84848929047868e-05, "loss": 2.3526, "step": 34400 }, { "epoch": 0.45, "learning_rate": 5.84748346822939e-05, "loss": 2.4953, "step": 34405 }, { "epoch": 0.45, "learning_rate": 5.8464776106692166e-05, "loss": 2.6418, "step": 34410 }, { "epoch": 0.45, "learning_rate": 5.8454717178400664e-05, "loss": 2.5372, "step": 34415 }, { "epoch": 0.45, "learning_rate": 5.844465789783854e-05, "loss": 2.5649, "step": 34420 }, { "epoch": 0.45, "learning_rate": 5.843459826542492e-05, "loss": 2.6179, "step": 34425 }, { "epoch": 0.45, "learning_rate": 5.842453828157893e-05, "loss": 2.7153, "step": 34430 }, { "epoch": 0.45, "learning_rate": 5.8414477946719725e-05, "loss": 2.5247, "step": 34435 }, { "epoch": 0.45, "learning_rate": 5.8404417261266485e-05, "loss": 2.563, "step": 34440 }, { "epoch": 0.45, "learning_rate": 5.839435622563838e-05, "loss": 2.5851, "step": 34445 }, { "epoch": 0.45, "learning_rate": 5.83842948402546e-05, "loss": 2.5999, "step": 34450 }, { "epoch": 0.45, "learning_rate": 5.83742331055344e-05, "loss": 2.5302, "step": 34455 }, { "epoch": 0.45, "learning_rate": 5.836417102189699e-05, "loss": 2.5893, "step": 34460 }, { "epoch": 0.45, "learning_rate": 5.835410858976159e-05, "loss": 2.6119, "step": 34465 }, { "epoch": 0.45, "learning_rate": 5.8344045809547476e-05, "loss": 2.6212, "step": 34470 }, { "epoch": 0.45, "learning_rate": 5.833398268167391e-05, "loss": 2.7035, "step": 34475 }, { "epoch": 0.45, "learning_rate": 5.832391920656018e-05, "loss": 2.5254, "step": 34480 }, { "epoch": 0.45, "learning_rate": 5.8313855384625594e-05, "loss": 2.6308, "step": 34485 }, { "epoch": 0.45, "learning_rate": 5.830379121628946e-05, "loss": 2.6313, "step": 34490 }, { "epoch": 0.45, "learning_rate": 5.829372670197112e-05, "loss": 2.5293, "step": 34495 }, { "epoch": 0.45, "learning_rate": 5.828366184208991e-05, "loss": 2.5932, "step": 34500 }, { "epoch": 0.45, "learning_rate": 5.827359663706519e-05, "loss": 2.5889, "step": 34505 }, { "epoch": 0.45, "learning_rate": 5.8263531087316304e-05, "loss": 2.4045, "step": 34510 }, { "epoch": 0.45, "learning_rate": 5.825346519326267e-05, "loss": 2.4326, "step": 34515 }, { "epoch": 0.45, "learning_rate": 5.824339895532369e-05, "loss": 2.5861, "step": 34520 }, { "epoch": 0.45, "learning_rate": 5.823333237391878e-05, "loss": 2.6338, "step": 34525 }, { "epoch": 0.45, "learning_rate": 5.8223265449467354e-05, "loss": 2.6667, "step": 34530 }, { "epoch": 0.45, "learning_rate": 5.8213198182388875e-05, "loss": 2.717, "step": 34535 }, { "epoch": 0.45, "learning_rate": 5.820313057310277e-05, "loss": 2.6831, "step": 34540 }, { "epoch": 0.45, "learning_rate": 5.819306262202854e-05, "loss": 2.6186, "step": 34545 }, { "epoch": 0.45, "learning_rate": 5.818299432958567e-05, "loss": 2.7171, "step": 34550 }, { "epoch": 0.45, "learning_rate": 5.817292569619366e-05, "loss": 2.4533, "step": 34555 }, { "epoch": 0.45, "learning_rate": 5.816285672227202e-05, "loss": 2.6003, "step": 34560 }, { "epoch": 0.45, "learning_rate": 5.815278740824027e-05, "loss": 2.5377, "step": 34565 }, { "epoch": 0.45, "learning_rate": 5.8142717754517964e-05, "loss": 2.5024, "step": 34570 }, { "epoch": 0.45, "learning_rate": 5.8132647761524675e-05, "loss": 2.5, "step": 34575 }, { "epoch": 0.45, "learning_rate": 5.812257742967995e-05, "loss": 2.7064, "step": 34580 }, { "epoch": 0.45, "learning_rate": 5.8112506759403384e-05, "loss": 2.4143, "step": 34585 }, { "epoch": 0.45, "learning_rate": 5.810243575111458e-05, "loss": 2.5839, "step": 34590 }, { "epoch": 0.45, "learning_rate": 5.809236440523316e-05, "loss": 2.5516, "step": 34595 }, { "epoch": 0.45, "learning_rate": 5.808229272217874e-05, "loss": 2.5598, "step": 34600 }, { "epoch": 0.45, "learning_rate": 5.807222070237095e-05, "loss": 2.7062, "step": 34605 }, { "epoch": 0.45, "learning_rate": 5.806214834622947e-05, "loss": 2.6127, "step": 34610 }, { "epoch": 0.45, "learning_rate": 5.805207565417398e-05, "loss": 2.597, "step": 34615 }, { "epoch": 0.45, "learning_rate": 5.8042002626624135e-05, "loss": 2.5631, "step": 34620 }, { "epoch": 0.45, "learning_rate": 5.803192926399964e-05, "loss": 2.5811, "step": 34625 }, { "epoch": 0.45, "learning_rate": 5.802185556672023e-05, "loss": 2.5256, "step": 34630 }, { "epoch": 0.45, "learning_rate": 5.801178153520559e-05, "loss": 2.5671, "step": 34635 }, { "epoch": 0.45, "learning_rate": 5.8001707169875497e-05, "loss": 2.4612, "step": 34640 }, { "epoch": 0.45, "learning_rate": 5.799163247114969e-05, "loss": 2.5947, "step": 34645 }, { "epoch": 0.45, "learning_rate": 5.7981557439447953e-05, "loss": 2.5714, "step": 34650 }, { "epoch": 0.45, "learning_rate": 5.797148207519004e-05, "loss": 2.5901, "step": 34655 }, { "epoch": 0.45, "learning_rate": 5.796140637879578e-05, "loss": 2.4689, "step": 34660 }, { "epoch": 0.45, "learning_rate": 5.795133035068494e-05, "loss": 2.5522, "step": 34665 }, { "epoch": 0.45, "learning_rate": 5.794125399127739e-05, "loss": 2.6613, "step": 34670 }, { "epoch": 0.45, "learning_rate": 5.793117730099292e-05, "loss": 2.5228, "step": 34675 }, { "epoch": 0.45, "learning_rate": 5.7921100280251425e-05, "loss": 2.6729, "step": 34680 }, { "epoch": 0.45, "learning_rate": 5.7911022929472755e-05, "loss": 2.5926, "step": 34685 }, { "epoch": 0.45, "learning_rate": 5.790094524907679e-05, "loss": 2.6364, "step": 34690 }, { "epoch": 0.45, "learning_rate": 5.7890867239483395e-05, "loss": 2.5581, "step": 34695 }, { "epoch": 0.45, "learning_rate": 5.78807889011125e-05, "loss": 2.7329, "step": 34700 }, { "epoch": 0.45, "learning_rate": 5.787071023438403e-05, "loss": 2.5624, "step": 34705 }, { "epoch": 0.45, "learning_rate": 5.7860631239717925e-05, "loss": 2.3531, "step": 34710 }, { "epoch": 0.45, "learning_rate": 5.78505519175341e-05, "loss": 2.6657, "step": 34715 }, { "epoch": 0.45, "learning_rate": 5.7840472268252556e-05, "loss": 2.6363, "step": 34720 }, { "epoch": 0.45, "learning_rate": 5.7830392292293214e-05, "loss": 2.5008, "step": 34725 }, { "epoch": 0.45, "learning_rate": 5.782031199007611e-05, "loss": 2.5794, "step": 34730 }, { "epoch": 0.45, "learning_rate": 5.781023136202123e-05, "loss": 2.6018, "step": 34735 }, { "epoch": 0.45, "learning_rate": 5.780015040854858e-05, "loss": 2.4992, "step": 34740 }, { "epoch": 0.45, "learning_rate": 5.779006913007821e-05, "loss": 2.6425, "step": 34745 }, { "epoch": 0.45, "learning_rate": 5.7779987527030144e-05, "loss": 2.5864, "step": 34750 }, { "epoch": 0.45, "learning_rate": 5.7769905599824434e-05, "loss": 2.5914, "step": 34755 }, { "epoch": 0.45, "learning_rate": 5.7759823348881174e-05, "loss": 2.5511, "step": 34760 }, { "epoch": 0.45, "learning_rate": 5.774974077462041e-05, "loss": 2.5994, "step": 34765 }, { "epoch": 0.45, "learning_rate": 5.773965787746228e-05, "loss": 2.6257, "step": 34770 }, { "epoch": 0.45, "learning_rate": 5.772957465782687e-05, "loss": 2.5634, "step": 34775 }, { "epoch": 0.45, "learning_rate": 5.7719491116134306e-05, "loss": 2.5436, "step": 34780 }, { "epoch": 0.45, "learning_rate": 5.77094072528047e-05, "loss": 2.3873, "step": 34785 }, { "epoch": 0.45, "learning_rate": 5.769932306825826e-05, "loss": 2.5689, "step": 34790 }, { "epoch": 0.45, "learning_rate": 5.7689238562915105e-05, "loss": 2.4493, "step": 34795 }, { "epoch": 0.45, "learning_rate": 5.767915373719541e-05, "loss": 2.5951, "step": 34800 }, { "epoch": 0.45, "learning_rate": 5.766906859151939e-05, "loss": 2.6702, "step": 34805 }, { "epoch": 0.45, "learning_rate": 5.7658983126307234e-05, "loss": 2.6016, "step": 34810 }, { "epoch": 0.45, "learning_rate": 5.764889734197916e-05, "loss": 2.4808, "step": 34815 }, { "epoch": 0.45, "learning_rate": 5.763881123895539e-05, "loss": 2.672, "step": 34820 }, { "epoch": 0.45, "learning_rate": 5.762872481765619e-05, "loss": 2.5868, "step": 34825 }, { "epoch": 0.45, "learning_rate": 5.761863807850179e-05, "loss": 2.697, "step": 34830 }, { "epoch": 0.45, "learning_rate": 5.760855102191247e-05, "loss": 2.5244, "step": 34835 }, { "epoch": 0.45, "learning_rate": 5.7598463648308535e-05, "loss": 2.5551, "step": 34840 }, { "epoch": 0.45, "learning_rate": 5.758837595811025e-05, "loss": 2.5644, "step": 34845 }, { "epoch": 0.45, "learning_rate": 5.757828795173793e-05, "loss": 2.487, "step": 34850 }, { "epoch": 0.45, "learning_rate": 5.756819962961191e-05, "loss": 2.7464, "step": 34855 }, { "epoch": 0.45, "learning_rate": 5.75581109921525e-05, "loss": 2.4939, "step": 34860 }, { "epoch": 0.45, "learning_rate": 5.7548022039780095e-05, "loss": 2.7309, "step": 34865 }, { "epoch": 0.45, "learning_rate": 5.753793277291503e-05, "loss": 2.6313, "step": 34870 }, { "epoch": 0.45, "learning_rate": 5.752784319197766e-05, "loss": 2.5127, "step": 34875 }, { "epoch": 0.45, "learning_rate": 5.75177532973884e-05, "loss": 2.6247, "step": 34880 }, { "epoch": 0.45, "learning_rate": 5.750766308956764e-05, "loss": 2.5003, "step": 34885 }, { "epoch": 0.45, "learning_rate": 5.749757256893582e-05, "loss": 2.6955, "step": 34890 }, { "epoch": 0.45, "learning_rate": 5.748748173591332e-05, "loss": 2.6212, "step": 34895 }, { "epoch": 0.45, "learning_rate": 5.747739059092062e-05, "loss": 2.5809, "step": 34900 }, { "epoch": 0.45, "learning_rate": 5.746729913437816e-05, "loss": 2.5322, "step": 34905 }, { "epoch": 0.45, "learning_rate": 5.745720736670639e-05, "loss": 2.5672, "step": 34910 }, { "epoch": 0.45, "learning_rate": 5.744711528832582e-05, "loss": 2.3411, "step": 34915 }, { "epoch": 0.45, "learning_rate": 5.7437022899656935e-05, "loss": 2.602, "step": 34920 }, { "epoch": 0.45, "learning_rate": 5.742693020112021e-05, "loss": 2.5559, "step": 34925 }, { "epoch": 0.45, "learning_rate": 5.7416837193136194e-05, "loss": 2.6223, "step": 34930 }, { "epoch": 0.45, "learning_rate": 5.7406743876125423e-05, "loss": 2.541, "step": 34935 }, { "epoch": 0.45, "learning_rate": 5.739665025050841e-05, "loss": 2.5805, "step": 34940 }, { "epoch": 0.45, "learning_rate": 5.7386556316705744e-05, "loss": 2.5357, "step": 34945 }, { "epoch": 0.45, "learning_rate": 5.737646207513797e-05, "loss": 2.5727, "step": 34950 }, { "epoch": 0.45, "learning_rate": 5.736636752622567e-05, "loss": 2.5863, "step": 34955 }, { "epoch": 0.45, "learning_rate": 5.7356272670389466e-05, "loss": 2.4765, "step": 34960 }, { "epoch": 0.45, "learning_rate": 5.734617750804995e-05, "loss": 2.4605, "step": 34965 }, { "epoch": 0.45, "learning_rate": 5.7336082039627724e-05, "loss": 2.4295, "step": 34970 }, { "epoch": 0.45, "learning_rate": 5.7325986265543455e-05, "loss": 2.68, "step": 34975 }, { "epoch": 0.45, "learning_rate": 5.731589018621777e-05, "loss": 2.4184, "step": 34980 }, { "epoch": 0.45, "learning_rate": 5.730579380207134e-05, "loss": 2.6275, "step": 34985 }, { "epoch": 0.45, "learning_rate": 5.72956971135248e-05, "loss": 2.6101, "step": 34990 }, { "epoch": 0.45, "learning_rate": 5.728560012099889e-05, "loss": 2.5554, "step": 34995 }, { "epoch": 0.45, "learning_rate": 5.7275502824914264e-05, "loss": 2.6527, "step": 35000 }, { "epoch": 0.45, "learning_rate": 5.726540522569166e-05, "loss": 2.651, "step": 35005 }, { "epoch": 0.45, "learning_rate": 5.725530732375178e-05, "loss": 2.5546, "step": 35010 }, { "epoch": 0.45, "learning_rate": 5.724520911951536e-05, "loss": 2.7194, "step": 35015 }, { "epoch": 0.45, "learning_rate": 5.7235110613403165e-05, "loss": 2.4234, "step": 35020 }, { "epoch": 0.45, "learning_rate": 5.722501180583594e-05, "loss": 2.6868, "step": 35025 }, { "epoch": 0.45, "learning_rate": 5.721491269723446e-05, "loss": 2.5963, "step": 35030 }, { "epoch": 0.45, "learning_rate": 5.72048132880195e-05, "loss": 2.6448, "step": 35035 }, { "epoch": 0.45, "learning_rate": 5.719471357861188e-05, "loss": 2.538, "step": 35040 }, { "epoch": 0.45, "learning_rate": 5.718461356943241e-05, "loss": 2.6377, "step": 35045 }, { "epoch": 0.45, "learning_rate": 5.717451326090188e-05, "loss": 2.5731, "step": 35050 }, { "epoch": 0.45, "learning_rate": 5.716441265344116e-05, "loss": 2.5872, "step": 35055 }, { "epoch": 0.46, "learning_rate": 5.715431174747108e-05, "loss": 2.6908, "step": 35060 }, { "epoch": 0.46, "learning_rate": 5.7144210543412505e-05, "loss": 2.5445, "step": 35065 }, { "epoch": 0.46, "learning_rate": 5.71341090416863e-05, "loss": 2.6079, "step": 35070 }, { "epoch": 0.46, "learning_rate": 5.712400724271337e-05, "loss": 2.6031, "step": 35075 }, { "epoch": 0.46, "learning_rate": 5.7113905146914594e-05, "loss": 2.6754, "step": 35080 }, { "epoch": 0.46, "learning_rate": 5.710380275471089e-05, "loss": 2.4884, "step": 35085 }, { "epoch": 0.46, "learning_rate": 5.709370006652317e-05, "loss": 2.5066, "step": 35090 }, { "epoch": 0.46, "learning_rate": 5.708359708277238e-05, "loss": 2.4706, "step": 35095 }, { "epoch": 0.46, "learning_rate": 5.7073493803879454e-05, "loss": 2.7084, "step": 35100 }, { "epoch": 0.46, "learning_rate": 5.706339023026537e-05, "loss": 2.7039, "step": 35105 }, { "epoch": 0.46, "learning_rate": 5.705328636235108e-05, "loss": 2.5036, "step": 35110 }, { "epoch": 0.46, "learning_rate": 5.7043182200557575e-05, "loss": 2.6315, "step": 35115 }, { "epoch": 0.46, "learning_rate": 5.7033077745305854e-05, "loss": 2.6419, "step": 35120 }, { "epoch": 0.46, "learning_rate": 5.702297299701691e-05, "loss": 2.611, "step": 35125 }, { "epoch": 0.46, "learning_rate": 5.7012867956111784e-05, "loss": 2.6021, "step": 35130 }, { "epoch": 0.46, "learning_rate": 5.700276262301151e-05, "loss": 2.5762, "step": 35135 }, { "epoch": 0.46, "learning_rate": 5.699265699813712e-05, "loss": 2.578, "step": 35140 }, { "epoch": 0.46, "learning_rate": 5.698255108190964e-05, "loss": 2.5852, "step": 35145 }, { "epoch": 0.46, "learning_rate": 5.697244487475021e-05, "loss": 2.5931, "step": 35150 }, { "epoch": 0.46, "learning_rate": 5.6962338377079836e-05, "loss": 2.5027, "step": 35155 }, { "epoch": 0.46, "learning_rate": 5.695223158931968e-05, "loss": 2.47, "step": 35160 }, { "epoch": 0.46, "learning_rate": 5.6942124511890806e-05, "loss": 2.4332, "step": 35165 }, { "epoch": 0.46, "learning_rate": 5.6932017145214335e-05, "loss": 2.5564, "step": 35170 }, { "epoch": 0.46, "learning_rate": 5.6921909489711386e-05, "loss": 2.4691, "step": 35175 }, { "epoch": 0.46, "learning_rate": 5.691180154580313e-05, "loss": 2.5376, "step": 35180 }, { "epoch": 0.46, "learning_rate": 5.69016933139107e-05, "loss": 2.6228, "step": 35185 }, { "epoch": 0.46, "learning_rate": 5.689158479445528e-05, "loss": 2.5049, "step": 35190 }, { "epoch": 0.46, "learning_rate": 5.688147598785802e-05, "loss": 2.5994, "step": 35195 }, { "epoch": 0.46, "learning_rate": 5.687136689454014e-05, "loss": 2.7154, "step": 35200 }, { "epoch": 0.46, "learning_rate": 5.686125751492281e-05, "loss": 2.5649, "step": 35205 }, { "epoch": 0.46, "learning_rate": 5.685114784942724e-05, "loss": 2.6337, "step": 35210 }, { "epoch": 0.46, "learning_rate": 5.684103789847468e-05, "loss": 2.5571, "step": 35215 }, { "epoch": 0.46, "learning_rate": 5.683092766248637e-05, "loss": 2.6486, "step": 35220 }, { "epoch": 0.46, "learning_rate": 5.682081714188355e-05, "loss": 2.554, "step": 35225 }, { "epoch": 0.46, "learning_rate": 5.681070633708747e-05, "loss": 2.641, "step": 35230 }, { "epoch": 0.46, "learning_rate": 5.680059524851942e-05, "loss": 2.5134, "step": 35235 }, { "epoch": 0.46, "learning_rate": 5.679048387660066e-05, "loss": 2.5729, "step": 35240 }, { "epoch": 0.46, "learning_rate": 5.678037222175252e-05, "loss": 2.5743, "step": 35245 }, { "epoch": 0.46, "learning_rate": 5.677026028439627e-05, "loss": 2.6712, "step": 35250 }, { "epoch": 0.46, "learning_rate": 5.6760148064953255e-05, "loss": 2.4914, "step": 35255 }, { "epoch": 0.46, "learning_rate": 5.675003556384481e-05, "loss": 2.574, "step": 35260 }, { "epoch": 0.46, "learning_rate": 5.6739922781492264e-05, "loss": 2.6356, "step": 35265 }, { "epoch": 0.46, "learning_rate": 5.6729809718316965e-05, "loss": 2.5072, "step": 35270 }, { "epoch": 0.46, "learning_rate": 5.671969637474029e-05, "loss": 2.5612, "step": 35275 }, { "epoch": 0.46, "learning_rate": 5.6709582751183635e-05, "loss": 2.6768, "step": 35280 }, { "epoch": 0.46, "learning_rate": 5.669946884806836e-05, "loss": 2.5459, "step": 35285 }, { "epoch": 0.46, "learning_rate": 5.6689354665815887e-05, "loss": 2.4632, "step": 35290 }, { "epoch": 0.46, "learning_rate": 5.6679240204847614e-05, "loss": 2.5286, "step": 35295 }, { "epoch": 0.46, "learning_rate": 5.666912546558498e-05, "loss": 2.5968, "step": 35300 }, { "epoch": 0.46, "learning_rate": 5.665901044844941e-05, "loss": 2.6811, "step": 35305 }, { "epoch": 0.46, "learning_rate": 5.664889515386235e-05, "loss": 2.536, "step": 35310 }, { "epoch": 0.46, "learning_rate": 5.6638779582245284e-05, "loss": 2.5256, "step": 35315 }, { "epoch": 0.46, "learning_rate": 5.662866373401965e-05, "loss": 2.5811, "step": 35320 }, { "epoch": 0.46, "learning_rate": 5.6618547609606965e-05, "loss": 2.5889, "step": 35325 }, { "epoch": 0.46, "learning_rate": 5.660843120942869e-05, "loss": 2.6094, "step": 35330 }, { "epoch": 0.46, "learning_rate": 5.6598314533906335e-05, "loss": 2.4786, "step": 35335 }, { "epoch": 0.46, "learning_rate": 5.6588197583461434e-05, "loss": 2.4953, "step": 35340 }, { "epoch": 0.46, "learning_rate": 5.6578080358515516e-05, "loss": 2.6199, "step": 35345 }, { "epoch": 0.46, "learning_rate": 5.656796285949011e-05, "loss": 2.5027, "step": 35350 }, { "epoch": 0.46, "learning_rate": 5.655784508680677e-05, "loss": 2.4989, "step": 35355 }, { "epoch": 0.46, "learning_rate": 5.654772704088707e-05, "loss": 2.6453, "step": 35360 }, { "epoch": 0.46, "learning_rate": 5.653760872215255e-05, "loss": 2.4388, "step": 35365 }, { "epoch": 0.46, "learning_rate": 5.652749013102483e-05, "loss": 2.4601, "step": 35370 }, { "epoch": 0.46, "learning_rate": 5.65173712679255e-05, "loss": 2.6022, "step": 35375 }, { "epoch": 0.46, "learning_rate": 5.6507252133276164e-05, "loss": 2.6221, "step": 35380 }, { "epoch": 0.46, "learning_rate": 5.649713272749844e-05, "loss": 2.5214, "step": 35385 }, { "epoch": 0.46, "learning_rate": 5.648701305101397e-05, "loss": 2.6235, "step": 35390 }, { "epoch": 0.46, "learning_rate": 5.647689310424437e-05, "loss": 2.4938, "step": 35395 }, { "epoch": 0.46, "learning_rate": 5.646677288761132e-05, "loss": 2.5936, "step": 35400 }, { "epoch": 0.46, "learning_rate": 5.6456652401536456e-05, "loss": 2.551, "step": 35405 }, { "epoch": 0.46, "learning_rate": 5.6446531646441505e-05, "loss": 2.6745, "step": 35410 }, { "epoch": 0.46, "learning_rate": 5.6436410622748104e-05, "loss": 2.6783, "step": 35415 }, { "epoch": 0.46, "learning_rate": 5.642628933087798e-05, "loss": 2.4509, "step": 35420 }, { "epoch": 0.46, "learning_rate": 5.6416167771252826e-05, "loss": 2.7015, "step": 35425 }, { "epoch": 0.46, "learning_rate": 5.640604594429435e-05, "loss": 2.6474, "step": 35430 }, { "epoch": 0.46, "learning_rate": 5.6395923850424314e-05, "loss": 2.6044, "step": 35435 }, { "epoch": 0.46, "learning_rate": 5.638580149006445e-05, "loss": 2.6739, "step": 35440 }, { "epoch": 0.46, "learning_rate": 5.637567886363652e-05, "loss": 2.4516, "step": 35445 }, { "epoch": 0.46, "learning_rate": 5.6365555971562266e-05, "loss": 2.5968, "step": 35450 }, { "epoch": 0.46, "learning_rate": 5.6355432814263486e-05, "loss": 2.6795, "step": 35455 }, { "epoch": 0.46, "learning_rate": 5.634530939216195e-05, "loss": 2.5031, "step": 35460 }, { "epoch": 0.46, "learning_rate": 5.633518570567946e-05, "loss": 2.5916, "step": 35465 }, { "epoch": 0.46, "learning_rate": 5.632506175523784e-05, "loss": 2.6385, "step": 35470 }, { "epoch": 0.46, "learning_rate": 5.6314937541258905e-05, "loss": 2.5212, "step": 35475 }, { "epoch": 0.46, "learning_rate": 5.6304813064164486e-05, "loss": 2.6569, "step": 35480 }, { "epoch": 0.46, "learning_rate": 5.629468832437641e-05, "loss": 2.7507, "step": 35485 }, { "epoch": 0.46, "learning_rate": 5.628456332231653e-05, "loss": 2.56, "step": 35490 }, { "epoch": 0.46, "learning_rate": 5.6274438058406745e-05, "loss": 2.5529, "step": 35495 }, { "epoch": 0.46, "learning_rate": 5.626431253306888e-05, "loss": 2.4858, "step": 35500 }, { "epoch": 0.46, "learning_rate": 5.6254186746724855e-05, "loss": 2.6144, "step": 35505 }, { "epoch": 0.46, "learning_rate": 5.6244060699796574e-05, "loss": 2.5985, "step": 35510 }, { "epoch": 0.46, "learning_rate": 5.6233934392705925e-05, "loss": 2.5988, "step": 35515 }, { "epoch": 0.46, "learning_rate": 5.622380782587482e-05, "loss": 2.6049, "step": 35520 }, { "epoch": 0.46, "learning_rate": 5.621368099972519e-05, "loss": 2.7412, "step": 35525 }, { "epoch": 0.46, "learning_rate": 5.620355391467899e-05, "loss": 2.6758, "step": 35530 }, { "epoch": 0.46, "learning_rate": 5.619342657115817e-05, "loss": 2.6275, "step": 35535 }, { "epoch": 0.46, "learning_rate": 5.6183298969584685e-05, "loss": 2.5172, "step": 35540 }, { "epoch": 0.46, "learning_rate": 5.617317111038051e-05, "loss": 2.7144, "step": 35545 }, { "epoch": 0.46, "learning_rate": 5.6163042993967616e-05, "loss": 2.6071, "step": 35550 }, { "epoch": 0.46, "learning_rate": 5.615291462076802e-05, "loss": 2.5268, "step": 35555 }, { "epoch": 0.46, "learning_rate": 5.614278599120368e-05, "loss": 2.5703, "step": 35560 }, { "epoch": 0.46, "learning_rate": 5.613265710569668e-05, "loss": 2.6266, "step": 35565 }, { "epoch": 0.46, "learning_rate": 5.6122527964669e-05, "loss": 2.5622, "step": 35570 }, { "epoch": 0.46, "learning_rate": 5.611239856854269e-05, "loss": 2.6091, "step": 35575 }, { "epoch": 0.46, "learning_rate": 5.61022689177398e-05, "loss": 2.5625, "step": 35580 }, { "epoch": 0.46, "learning_rate": 5.6092139012682365e-05, "loss": 2.6621, "step": 35585 }, { "epoch": 0.46, "learning_rate": 5.6082008853792465e-05, "loss": 2.7025, "step": 35590 }, { "epoch": 0.46, "learning_rate": 5.60718784414922e-05, "loss": 2.5266, "step": 35595 }, { "epoch": 0.46, "learning_rate": 5.6061747776203646e-05, "loss": 2.665, "step": 35600 }, { "epoch": 0.46, "learning_rate": 5.605161685834889e-05, "loss": 2.5896, "step": 35605 }, { "epoch": 0.46, "learning_rate": 5.604148568835006e-05, "loss": 2.4754, "step": 35610 }, { "epoch": 0.46, "learning_rate": 5.6031354266629256e-05, "loss": 2.5664, "step": 35615 }, { "epoch": 0.46, "learning_rate": 5.6021222593608636e-05, "loss": 2.515, "step": 35620 }, { "epoch": 0.46, "learning_rate": 5.601109066971031e-05, "loss": 2.5221, "step": 35625 }, { "epoch": 0.46, "learning_rate": 5.600095849535647e-05, "loss": 2.4788, "step": 35630 }, { "epoch": 0.46, "learning_rate": 5.599082607096926e-05, "loss": 2.5469, "step": 35635 }, { "epoch": 0.46, "learning_rate": 5.598069339697084e-05, "loss": 2.5247, "step": 35640 }, { "epoch": 0.46, "learning_rate": 5.5970560473783406e-05, "loss": 2.5607, "step": 35645 }, { "epoch": 0.46, "learning_rate": 5.596042730182915e-05, "loss": 2.5457, "step": 35650 }, { "epoch": 0.46, "learning_rate": 5.595029388153028e-05, "loss": 2.632, "step": 35655 }, { "epoch": 0.46, "learning_rate": 5.594016021330901e-05, "loss": 2.5762, "step": 35660 }, { "epoch": 0.46, "learning_rate": 5.593002629758757e-05, "loss": 2.5921, "step": 35665 }, { "epoch": 0.46, "learning_rate": 5.5919892134788175e-05, "loss": 2.7423, "step": 35670 }, { "epoch": 0.46, "learning_rate": 5.5909757725333104e-05, "loss": 2.7527, "step": 35675 }, { "epoch": 0.46, "learning_rate": 5.5899623069644566e-05, "loss": 2.6075, "step": 35680 }, { "epoch": 0.46, "learning_rate": 5.588948816814486e-05, "loss": 2.6541, "step": 35685 }, { "epoch": 0.46, "learning_rate": 5.587935302125626e-05, "loss": 2.5004, "step": 35690 }, { "epoch": 0.46, "learning_rate": 5.586921762940107e-05, "loss": 2.6156, "step": 35695 }, { "epoch": 0.46, "learning_rate": 5.585908199300155e-05, "loss": 2.5675, "step": 35700 }, { "epoch": 0.46, "learning_rate": 5.584894611248004e-05, "loss": 2.5811, "step": 35705 }, { "epoch": 0.46, "learning_rate": 5.5838809988258814e-05, "loss": 2.5072, "step": 35710 }, { "epoch": 0.46, "learning_rate": 5.582867362076024e-05, "loss": 2.5574, "step": 35715 }, { "epoch": 0.46, "learning_rate": 5.5818537010406635e-05, "loss": 2.5618, "step": 35720 }, { "epoch": 0.46, "learning_rate": 5.580840015762037e-05, "loss": 2.5806, "step": 35725 }, { "epoch": 0.46, "learning_rate": 5.579826306282377e-05, "loss": 2.5158, "step": 35730 }, { "epoch": 0.46, "learning_rate": 5.578812572643923e-05, "loss": 2.2977, "step": 35735 }, { "epoch": 0.46, "learning_rate": 5.5777988148889114e-05, "loss": 2.7023, "step": 35740 }, { "epoch": 0.46, "learning_rate": 5.5767850330595816e-05, "loss": 2.6417, "step": 35745 }, { "epoch": 0.46, "learning_rate": 5.575771227198172e-05, "loss": 2.5491, "step": 35750 }, { "epoch": 0.46, "learning_rate": 5.574757397346926e-05, "loss": 2.4836, "step": 35755 }, { "epoch": 0.46, "learning_rate": 5.5737435435480836e-05, "loss": 2.4372, "step": 35760 }, { "epoch": 0.46, "learning_rate": 5.5727296658438886e-05, "loss": 2.5002, "step": 35765 }, { "epoch": 0.46, "learning_rate": 5.5717157642765814e-05, "loss": 2.6197, "step": 35770 }, { "epoch": 0.46, "learning_rate": 5.5707018388884125e-05, "loss": 2.5357, "step": 35775 }, { "epoch": 0.46, "learning_rate": 5.569687889721623e-05, "loss": 2.5019, "step": 35780 }, { "epoch": 0.46, "learning_rate": 5.568673916818462e-05, "loss": 2.4304, "step": 35785 }, { "epoch": 0.46, "learning_rate": 5.567659920221177e-05, "loss": 2.4774, "step": 35790 }, { "epoch": 0.46, "learning_rate": 5.566645899972016e-05, "loss": 2.7419, "step": 35795 }, { "epoch": 0.46, "learning_rate": 5.5656318561132284e-05, "loss": 2.6366, "step": 35800 }, { "epoch": 0.46, "learning_rate": 5.564617788687067e-05, "loss": 2.64, "step": 35805 }, { "epoch": 0.46, "learning_rate": 5.563603697735782e-05, "loss": 2.5088, "step": 35810 }, { "epoch": 0.46, "learning_rate": 5.562589583301624e-05, "loss": 2.4503, "step": 35815 }, { "epoch": 0.46, "learning_rate": 5.561575445426851e-05, "loss": 2.625, "step": 35820 }, { "epoch": 0.46, "learning_rate": 5.5605612841537155e-05, "loss": 2.6322, "step": 35825 }, { "epoch": 0.46, "learning_rate": 5.5595470995244724e-05, "loss": 2.567, "step": 35830 }, { "epoch": 0.47, "learning_rate": 5.558532891581379e-05, "loss": 2.5858, "step": 35835 }, { "epoch": 0.47, "learning_rate": 5.557518660366694e-05, "loss": 2.5707, "step": 35840 }, { "epoch": 0.47, "learning_rate": 5.5565044059226734e-05, "loss": 2.72, "step": 35845 }, { "epoch": 0.47, "learning_rate": 5.555490128291578e-05, "loss": 2.5721, "step": 35850 }, { "epoch": 0.47, "learning_rate": 5.55447582751567e-05, "loss": 2.6884, "step": 35855 }, { "epoch": 0.47, "learning_rate": 5.553461503637207e-05, "loss": 2.5081, "step": 35860 }, { "epoch": 0.47, "learning_rate": 5.552447156698455e-05, "loss": 2.6357, "step": 35865 }, { "epoch": 0.47, "learning_rate": 5.551432786741676e-05, "loss": 2.6828, "step": 35870 }, { "epoch": 0.47, "learning_rate": 5.550418393809132e-05, "loss": 2.5414, "step": 35875 }, { "epoch": 0.47, "learning_rate": 5.549403977943093e-05, "loss": 2.5393, "step": 35880 }, { "epoch": 0.47, "learning_rate": 5.548389539185822e-05, "loss": 2.4333, "step": 35885 }, { "epoch": 0.47, "learning_rate": 5.547375077579587e-05, "loss": 2.544, "step": 35890 }, { "epoch": 0.47, "learning_rate": 5.546360593166655e-05, "loss": 2.585, "step": 35895 }, { "epoch": 0.47, "learning_rate": 5.545346085989297e-05, "loss": 2.5962, "step": 35900 }, { "epoch": 0.47, "learning_rate": 5.544331556089781e-05, "loss": 2.5353, "step": 35905 }, { "epoch": 0.47, "learning_rate": 5.54331700351038e-05, "loss": 2.432, "step": 35910 }, { "epoch": 0.47, "learning_rate": 5.5423024282933657e-05, "loss": 2.5336, "step": 35915 }, { "epoch": 0.47, "learning_rate": 5.541287830481009e-05, "loss": 2.6681, "step": 35920 }, { "epoch": 0.47, "learning_rate": 5.5402732101155844e-05, "loss": 2.63, "step": 35925 }, { "epoch": 0.47, "learning_rate": 5.539258567239368e-05, "loss": 2.5115, "step": 35930 }, { "epoch": 0.47, "learning_rate": 5.538243901894635e-05, "loss": 2.475, "step": 35935 }, { "epoch": 0.47, "learning_rate": 5.53722921412366e-05, "loss": 2.5019, "step": 35940 }, { "epoch": 0.47, "learning_rate": 5.536214503968724e-05, "loss": 2.4588, "step": 35945 }, { "epoch": 0.47, "learning_rate": 5.535199771472104e-05, "loss": 2.6084, "step": 35950 }, { "epoch": 0.47, "learning_rate": 5.5341850166760766e-05, "loss": 2.5629, "step": 35955 }, { "epoch": 0.47, "learning_rate": 5.533170239622927e-05, "loss": 2.6159, "step": 35960 }, { "epoch": 0.47, "learning_rate": 5.532155440354932e-05, "loss": 2.5268, "step": 35965 }, { "epoch": 0.47, "learning_rate": 5.531140618914377e-05, "loss": 2.4712, "step": 35970 }, { "epoch": 0.47, "learning_rate": 5.530125775343544e-05, "loss": 2.6163, "step": 35975 }, { "epoch": 0.47, "learning_rate": 5.529110909684718e-05, "loss": 2.7149, "step": 35980 }, { "epoch": 0.47, "learning_rate": 5.5280960219801816e-05, "loss": 2.5635, "step": 35985 }, { "epoch": 0.47, "learning_rate": 5.527081112272222e-05, "loss": 2.4566, "step": 35990 }, { "epoch": 0.47, "learning_rate": 5.5260661806031265e-05, "loss": 2.446, "step": 35995 }, { "epoch": 0.47, "learning_rate": 5.525051227015182e-05, "loss": 2.6337, "step": 36000 }, { "epoch": 0.47, "learning_rate": 5.524036251550678e-05, "loss": 2.6163, "step": 36005 }, { "epoch": 0.47, "learning_rate": 5.523021254251903e-05, "loss": 2.4684, "step": 36010 }, { "epoch": 0.47, "learning_rate": 5.522006235161148e-05, "loss": 2.6283, "step": 36015 }, { "epoch": 0.47, "learning_rate": 5.520991194320705e-05, "loss": 2.6125, "step": 36020 }, { "epoch": 0.47, "learning_rate": 5.519976131772866e-05, "loss": 2.5514, "step": 36025 }, { "epoch": 0.47, "learning_rate": 5.518961047559923e-05, "loss": 2.4414, "step": 36030 }, { "epoch": 0.47, "learning_rate": 5.51794594172417e-05, "loss": 2.628, "step": 36035 }, { "epoch": 0.47, "learning_rate": 5.516930814307903e-05, "loss": 2.5249, "step": 36040 }, { "epoch": 0.47, "learning_rate": 5.5159156653534184e-05, "loss": 2.4561, "step": 36045 }, { "epoch": 0.47, "learning_rate": 5.514900494903013e-05, "loss": 2.4643, "step": 36050 }, { "epoch": 0.47, "learning_rate": 5.5138853029989825e-05, "loss": 2.5522, "step": 36055 }, { "epoch": 0.47, "learning_rate": 5.512870089683626e-05, "loss": 2.4986, "step": 36060 }, { "epoch": 0.47, "learning_rate": 5.511854854999244e-05, "loss": 2.4169, "step": 36065 }, { "epoch": 0.47, "learning_rate": 5.510839598988137e-05, "loss": 2.6079, "step": 36070 }, { "epoch": 0.47, "learning_rate": 5.509824321692604e-05, "loss": 2.6686, "step": 36075 }, { "epoch": 0.47, "learning_rate": 5.5088090231549505e-05, "loss": 2.5662, "step": 36080 }, { "epoch": 0.47, "learning_rate": 5.5077937034174775e-05, "loss": 2.6261, "step": 36085 }, { "epoch": 0.47, "learning_rate": 5.506778362522489e-05, "loss": 2.6138, "step": 36090 }, { "epoch": 0.47, "learning_rate": 5.5057630005122884e-05, "loss": 2.6736, "step": 36095 }, { "epoch": 0.47, "learning_rate": 5.504747617429185e-05, "loss": 2.4496, "step": 36100 }, { "epoch": 0.47, "learning_rate": 5.503732213315482e-05, "loss": 2.5909, "step": 36105 }, { "epoch": 0.47, "learning_rate": 5.5027167882134864e-05, "loss": 2.6585, "step": 36110 }, { "epoch": 0.47, "learning_rate": 5.50170134216551e-05, "loss": 2.561, "step": 36115 }, { "epoch": 0.47, "learning_rate": 5.50068587521386e-05, "loss": 2.5167, "step": 36120 }, { "epoch": 0.47, "learning_rate": 5.499670387400846e-05, "loss": 2.6276, "step": 36125 }, { "epoch": 0.47, "learning_rate": 5.4986548787687783e-05, "loss": 2.5493, "step": 36130 }, { "epoch": 0.47, "learning_rate": 5.497639349359971e-05, "loss": 2.5836, "step": 36135 }, { "epoch": 0.47, "learning_rate": 5.496623799216734e-05, "loss": 2.5348, "step": 36140 }, { "epoch": 0.47, "learning_rate": 5.4956082283813816e-05, "loss": 2.5188, "step": 36145 }, { "epoch": 0.47, "learning_rate": 5.4945926368962297e-05, "loss": 2.6032, "step": 36150 }, { "epoch": 0.47, "learning_rate": 5.4935770248035934e-05, "loss": 2.6938, "step": 36155 }, { "epoch": 0.47, "learning_rate": 5.492561392145785e-05, "loss": 2.6023, "step": 36160 }, { "epoch": 0.47, "learning_rate": 5.491545738965126e-05, "loss": 2.5989, "step": 36165 }, { "epoch": 0.47, "learning_rate": 5.490530065303931e-05, "loss": 2.5179, "step": 36170 }, { "epoch": 0.47, "learning_rate": 5.4895143712045216e-05, "loss": 2.5568, "step": 36175 }, { "epoch": 0.47, "learning_rate": 5.488498656709216e-05, "loss": 2.6879, "step": 36180 }, { "epoch": 0.47, "learning_rate": 5.487482921860333e-05, "loss": 2.6178, "step": 36185 }, { "epoch": 0.47, "learning_rate": 5.4864671667001946e-05, "loss": 2.5193, "step": 36190 }, { "epoch": 0.47, "learning_rate": 5.4854513912711235e-05, "loss": 2.5617, "step": 36195 }, { "epoch": 0.47, "learning_rate": 5.4844355956154416e-05, "loss": 2.6284, "step": 36200 }, { "epoch": 0.47, "learning_rate": 5.483419779775474e-05, "loss": 2.5148, "step": 36205 }, { "epoch": 0.47, "learning_rate": 5.482403943793545e-05, "loss": 2.4521, "step": 36210 }, { "epoch": 0.47, "learning_rate": 5.4813880877119794e-05, "loss": 2.585, "step": 36215 }, { "epoch": 0.47, "learning_rate": 5.4803722115731025e-05, "loss": 2.6432, "step": 36220 }, { "epoch": 0.47, "learning_rate": 5.4793563154192416e-05, "loss": 2.5399, "step": 36225 }, { "epoch": 0.47, "learning_rate": 5.478340399292726e-05, "loss": 2.5633, "step": 36230 }, { "epoch": 0.47, "learning_rate": 5.477324463235886e-05, "loss": 2.555, "step": 36235 }, { "epoch": 0.47, "learning_rate": 5.476308507291047e-05, "loss": 2.6894, "step": 36240 }, { "epoch": 0.47, "learning_rate": 5.475292531500541e-05, "loss": 2.5185, "step": 36245 }, { "epoch": 0.47, "learning_rate": 5.474276535906701e-05, "loss": 2.6136, "step": 36250 }, { "epoch": 0.47, "learning_rate": 5.4732605205518564e-05, "loss": 2.5651, "step": 36255 }, { "epoch": 0.47, "learning_rate": 5.47224448547834e-05, "loss": 2.5001, "step": 36260 }, { "epoch": 0.47, "learning_rate": 5.471228430728489e-05, "loss": 2.5892, "step": 36265 }, { "epoch": 0.47, "learning_rate": 5.470212356344635e-05, "loss": 2.5572, "step": 36270 }, { "epoch": 0.47, "learning_rate": 5.469196262369114e-05, "loss": 2.4953, "step": 36275 }, { "epoch": 0.47, "learning_rate": 5.468180148844262e-05, "loss": 2.547, "step": 36280 }, { "epoch": 0.47, "learning_rate": 5.467164015812415e-05, "loss": 2.5799, "step": 36285 }, { "epoch": 0.47, "learning_rate": 5.466147863315911e-05, "loss": 2.5352, "step": 36290 }, { "epoch": 0.47, "learning_rate": 5.465131691397092e-05, "loss": 2.5113, "step": 36295 }, { "epoch": 0.47, "learning_rate": 5.4641155000982936e-05, "loss": 2.6294, "step": 36300 }, { "epoch": 0.47, "learning_rate": 5.463099289461857e-05, "loss": 2.6267, "step": 36305 }, { "epoch": 0.47, "learning_rate": 5.462083059530124e-05, "loss": 2.5117, "step": 36310 }, { "epoch": 0.47, "learning_rate": 5.461066810345434e-05, "loss": 2.6024, "step": 36315 }, { "epoch": 0.47, "learning_rate": 5.4600505419501335e-05, "loss": 2.6683, "step": 36320 }, { "epoch": 0.47, "learning_rate": 5.4590342543865625e-05, "loss": 2.4771, "step": 36325 }, { "epoch": 0.47, "learning_rate": 5.4580179476970675e-05, "loss": 2.59, "step": 36330 }, { "epoch": 0.47, "learning_rate": 5.4570016219239914e-05, "loss": 2.4655, "step": 36335 }, { "epoch": 0.47, "learning_rate": 5.455985277109682e-05, "loss": 2.4633, "step": 36340 }, { "epoch": 0.47, "learning_rate": 5.454968913296484e-05, "loss": 2.6056, "step": 36345 }, { "epoch": 0.47, "learning_rate": 5.453952530526746e-05, "loss": 2.5387, "step": 36350 }, { "epoch": 0.47, "learning_rate": 5.452936128842815e-05, "loss": 2.651, "step": 36355 }, { "epoch": 0.47, "learning_rate": 5.451919708287042e-05, "loss": 2.5243, "step": 36360 }, { "epoch": 0.47, "learning_rate": 5.4509032689017755e-05, "loss": 2.446, "step": 36365 }, { "epoch": 0.47, "learning_rate": 5.4498868107293663e-05, "loss": 2.5238, "step": 36370 }, { "epoch": 0.47, "learning_rate": 5.448870333812166e-05, "loss": 2.718, "step": 36375 }, { "epoch": 0.47, "learning_rate": 5.4478538381925246e-05, "loss": 2.7005, "step": 36380 }, { "epoch": 0.47, "learning_rate": 5.4468373239127967e-05, "loss": 2.6062, "step": 36385 }, { "epoch": 0.47, "learning_rate": 5.445820791015337e-05, "loss": 2.5793, "step": 36390 }, { "epoch": 0.47, "learning_rate": 5.444804239542498e-05, "loss": 2.5884, "step": 36395 }, { "epoch": 0.47, "learning_rate": 5.443787669536636e-05, "loss": 2.5524, "step": 36400 }, { "epoch": 0.47, "learning_rate": 5.442771081040108e-05, "loss": 2.658, "step": 36405 }, { "epoch": 0.47, "learning_rate": 5.4417544740952674e-05, "loss": 2.6729, "step": 36410 }, { "epoch": 0.47, "learning_rate": 5.4407378487444723e-05, "loss": 2.4475, "step": 36415 }, { "epoch": 0.47, "learning_rate": 5.439721205030086e-05, "loss": 2.5946, "step": 36420 }, { "epoch": 0.47, "learning_rate": 5.4387045429944616e-05, "loss": 2.5281, "step": 36425 }, { "epoch": 0.47, "learning_rate": 5.4376878626799635e-05, "loss": 2.5579, "step": 36430 }, { "epoch": 0.47, "learning_rate": 5.4366711641289484e-05, "loss": 2.6525, "step": 36435 }, { "epoch": 0.47, "learning_rate": 5.435654447383779e-05, "loss": 2.5261, "step": 36440 }, { "epoch": 0.47, "learning_rate": 5.4346377124868176e-05, "loss": 2.5787, "step": 36445 }, { "epoch": 0.47, "learning_rate": 5.433620959480426e-05, "loss": 2.5514, "step": 36450 }, { "epoch": 0.47, "learning_rate": 5.43260418840697e-05, "loss": 2.6603, "step": 36455 }, { "epoch": 0.47, "learning_rate": 5.431587399308814e-05, "loss": 2.6281, "step": 36460 }, { "epoch": 0.47, "learning_rate": 5.43057059222832e-05, "loss": 2.4689, "step": 36465 }, { "epoch": 0.47, "learning_rate": 5.429553767207858e-05, "loss": 2.7113, "step": 36470 }, { "epoch": 0.47, "learning_rate": 5.42853692428979e-05, "loss": 2.4615, "step": 36475 }, { "epoch": 0.47, "learning_rate": 5.4275200635164845e-05, "loss": 2.6335, "step": 36480 }, { "epoch": 0.47, "learning_rate": 5.426503184930314e-05, "loss": 2.7716, "step": 36485 }, { "epoch": 0.47, "learning_rate": 5.425486288573642e-05, "loss": 2.5614, "step": 36490 }, { "epoch": 0.47, "learning_rate": 5.424469374488842e-05, "loss": 2.6721, "step": 36495 }, { "epoch": 0.47, "learning_rate": 5.423452442718282e-05, "loss": 2.4811, "step": 36500 }, { "epoch": 0.47, "learning_rate": 5.422435493304332e-05, "loss": 2.6921, "step": 36505 }, { "epoch": 0.47, "learning_rate": 5.4214185262893656e-05, "loss": 2.469, "step": 36510 }, { "epoch": 0.47, "learning_rate": 5.420401541715756e-05, "loss": 2.6082, "step": 36515 }, { "epoch": 0.47, "learning_rate": 5.419384539625875e-05, "loss": 2.5723, "step": 36520 }, { "epoch": 0.47, "learning_rate": 5.418367520062097e-05, "loss": 2.4356, "step": 36525 }, { "epoch": 0.47, "learning_rate": 5.4173504830667976e-05, "loss": 2.6074, "step": 36530 }, { "epoch": 0.47, "learning_rate": 5.41633342868235e-05, "loss": 2.5817, "step": 36535 }, { "epoch": 0.47, "learning_rate": 5.4153163569511324e-05, "loss": 2.5214, "step": 36540 }, { "epoch": 0.47, "learning_rate": 5.41429926791552e-05, "loss": 2.6379, "step": 36545 }, { "epoch": 0.47, "learning_rate": 5.413282161617893e-05, "loss": 2.392, "step": 36550 }, { "epoch": 0.47, "learning_rate": 5.412265038100627e-05, "loss": 2.5151, "step": 36555 }, { "epoch": 0.47, "learning_rate": 5.411247897406103e-05, "loss": 2.5247, "step": 36560 }, { "epoch": 0.47, "learning_rate": 5.4102307395766994e-05, "loss": 2.5734, "step": 36565 }, { "epoch": 0.47, "learning_rate": 5.409213564654796e-05, "loss": 2.4544, "step": 36570 }, { "epoch": 0.47, "learning_rate": 5.408196372682776e-05, "loss": 2.5782, "step": 36575 }, { "epoch": 0.47, "learning_rate": 5.407179163703021e-05, "loss": 2.7314, "step": 36580 }, { "epoch": 0.47, "learning_rate": 5.406161937757912e-05, "loss": 2.4342, "step": 36585 }, { "epoch": 0.47, "learning_rate": 5.4051446948898344e-05, "loss": 2.549, "step": 36590 }, { "epoch": 0.47, "learning_rate": 5.4041274351411706e-05, "loss": 2.5384, "step": 36595 }, { "epoch": 0.47, "learning_rate": 5.4031101585543056e-05, "loss": 2.5273, "step": 36600 }, { "epoch": 0.48, "learning_rate": 5.402092865171624e-05, "loss": 2.6081, "step": 36605 }, { "epoch": 0.48, "learning_rate": 5.401075555035515e-05, "loss": 2.5471, "step": 36610 }, { "epoch": 0.48, "learning_rate": 5.400058228188363e-05, "loss": 2.4975, "step": 36615 }, { "epoch": 0.48, "learning_rate": 5.399040884672555e-05, "loss": 2.4371, "step": 36620 }, { "epoch": 0.48, "learning_rate": 5.398023524530481e-05, "loss": 2.534, "step": 36625 }, { "epoch": 0.48, "learning_rate": 5.397006147804528e-05, "loss": 2.572, "step": 36630 }, { "epoch": 0.48, "learning_rate": 5.3959887545370866e-05, "loss": 2.562, "step": 36635 }, { "epoch": 0.48, "learning_rate": 5.394971344770546e-05, "loss": 2.6304, "step": 36640 }, { "epoch": 0.48, "learning_rate": 5.3939539185472996e-05, "loss": 2.6885, "step": 36645 }, { "epoch": 0.48, "learning_rate": 5.3929364759097375e-05, "loss": 2.4616, "step": 36650 }, { "epoch": 0.48, "learning_rate": 5.391919016900253e-05, "loss": 2.5148, "step": 36655 }, { "epoch": 0.48, "learning_rate": 5.3909015415612365e-05, "loss": 2.6762, "step": 36660 }, { "epoch": 0.48, "learning_rate": 5.389884049935084e-05, "loss": 2.5397, "step": 36665 }, { "epoch": 0.48, "learning_rate": 5.388866542064189e-05, "loss": 2.4672, "step": 36670 }, { "epoch": 0.48, "learning_rate": 5.387849017990948e-05, "loss": 2.6219, "step": 36675 }, { "epoch": 0.48, "learning_rate": 5.386831477757755e-05, "loss": 2.4803, "step": 36680 }, { "epoch": 0.48, "learning_rate": 5.385813921407008e-05, "loss": 2.6147, "step": 36685 }, { "epoch": 0.48, "learning_rate": 5.3847963489811014e-05, "loss": 2.6253, "step": 36690 }, { "epoch": 0.48, "learning_rate": 5.383778760522435e-05, "loss": 2.4976, "step": 36695 }, { "epoch": 0.48, "learning_rate": 5.382761156073406e-05, "loss": 2.6208, "step": 36700 }, { "epoch": 0.48, "learning_rate": 5.381743535676416e-05, "loss": 2.7266, "step": 36705 }, { "epoch": 0.48, "learning_rate": 5.380725899373863e-05, "loss": 2.619, "step": 36710 }, { "epoch": 0.48, "learning_rate": 5.3797082472081464e-05, "loss": 2.5541, "step": 36715 }, { "epoch": 0.48, "learning_rate": 5.378690579221668e-05, "loss": 2.6826, "step": 36720 }, { "epoch": 0.48, "learning_rate": 5.377672895456831e-05, "loss": 2.628, "step": 36725 }, { "epoch": 0.48, "learning_rate": 5.376655195956035e-05, "loss": 2.5507, "step": 36730 }, { "epoch": 0.48, "learning_rate": 5.375637480761686e-05, "loss": 2.5935, "step": 36735 }, { "epoch": 0.48, "learning_rate": 5.374619749916185e-05, "loss": 2.5745, "step": 36740 }, { "epoch": 0.48, "learning_rate": 5.373602003461939e-05, "loss": 2.5358, "step": 36745 }, { "epoch": 0.48, "learning_rate": 5.372584241441351e-05, "loss": 2.4394, "step": 36750 }, { "epoch": 0.48, "learning_rate": 5.371566463896827e-05, "loss": 2.51, "step": 36755 }, { "epoch": 0.48, "learning_rate": 5.370548670870774e-05, "loss": 2.5756, "step": 36760 }, { "epoch": 0.48, "learning_rate": 5.369530862405597e-05, "loss": 2.5163, "step": 36765 }, { "epoch": 0.48, "learning_rate": 5.3685130385437065e-05, "loss": 2.5304, "step": 36770 }, { "epoch": 0.48, "learning_rate": 5.36749519932751e-05, "loss": 2.6287, "step": 36775 }, { "epoch": 0.48, "learning_rate": 5.366477344799414e-05, "loss": 2.5622, "step": 36780 }, { "epoch": 0.48, "learning_rate": 5.3654594750018296e-05, "loss": 2.5802, "step": 36785 }, { "epoch": 0.48, "learning_rate": 5.3644415899771684e-05, "loss": 2.659, "step": 36790 }, { "epoch": 0.48, "learning_rate": 5.363423689767837e-05, "loss": 2.4393, "step": 36795 }, { "epoch": 0.48, "learning_rate": 5.362405774416253e-05, "loss": 2.6103, "step": 36800 }, { "epoch": 0.48, "learning_rate": 5.361387843964822e-05, "loss": 2.5304, "step": 36805 }, { "epoch": 0.48, "learning_rate": 5.360369898455961e-05, "loss": 2.5549, "step": 36810 }, { "epoch": 0.48, "learning_rate": 5.359351937932081e-05, "loss": 2.4614, "step": 36815 }, { "epoch": 0.48, "learning_rate": 5.3583339624355974e-05, "loss": 2.5841, "step": 36820 }, { "epoch": 0.48, "learning_rate": 5.357315972008923e-05, "loss": 2.4368, "step": 36825 }, { "epoch": 0.48, "learning_rate": 5.3562979666944755e-05, "loss": 2.466, "step": 36830 }, { "epoch": 0.48, "learning_rate": 5.355279946534669e-05, "loss": 2.6334, "step": 36835 }, { "epoch": 0.48, "learning_rate": 5.354261911571919e-05, "loss": 2.5931, "step": 36840 }, { "epoch": 0.48, "learning_rate": 5.353243861848645e-05, "loss": 2.6399, "step": 36845 }, { "epoch": 0.48, "learning_rate": 5.352225797407262e-05, "loss": 2.5872, "step": 36850 }, { "epoch": 0.48, "learning_rate": 5.351207718290191e-05, "loss": 2.3731, "step": 36855 }, { "epoch": 0.48, "learning_rate": 5.3501896245398475e-05, "loss": 2.6085, "step": 36860 }, { "epoch": 0.48, "learning_rate": 5.3491715161986536e-05, "loss": 2.5769, "step": 36865 }, { "epoch": 0.48, "learning_rate": 5.348153393309029e-05, "loss": 2.6152, "step": 36870 }, { "epoch": 0.48, "learning_rate": 5.347135255913392e-05, "loss": 2.5308, "step": 36875 }, { "epoch": 0.48, "learning_rate": 5.3461171040541677e-05, "loss": 2.5536, "step": 36880 }, { "epoch": 0.48, "learning_rate": 5.345098937773776e-05, "loss": 2.6644, "step": 36885 }, { "epoch": 0.48, "learning_rate": 5.344080757114639e-05, "loss": 2.7269, "step": 36890 }, { "epoch": 0.48, "learning_rate": 5.3430625621191796e-05, "loss": 2.5891, "step": 36895 }, { "epoch": 0.48, "learning_rate": 5.3420443528298236e-05, "loss": 2.5406, "step": 36900 }, { "epoch": 0.48, "learning_rate": 5.341026129288993e-05, "loss": 2.5703, "step": 36905 }, { "epoch": 0.48, "learning_rate": 5.340007891539114e-05, "loss": 2.6167, "step": 36910 }, { "epoch": 0.48, "learning_rate": 5.33898963962261e-05, "loss": 2.5917, "step": 36915 }, { "epoch": 0.48, "learning_rate": 5.3379713735819096e-05, "loss": 2.6619, "step": 36920 }, { "epoch": 0.48, "learning_rate": 5.336953093459438e-05, "loss": 2.513, "step": 36925 }, { "epoch": 0.48, "learning_rate": 5.335934799297624e-05, "loss": 2.5407, "step": 36930 }, { "epoch": 0.48, "learning_rate": 5.334916491138893e-05, "loss": 2.5578, "step": 36935 }, { "epoch": 0.48, "learning_rate": 5.333898169025675e-05, "loss": 2.588, "step": 36940 }, { "epoch": 0.48, "learning_rate": 5.3328798330003993e-05, "loss": 2.6266, "step": 36945 }, { "epoch": 0.48, "learning_rate": 5.331861483105494e-05, "loss": 2.6682, "step": 36950 }, { "epoch": 0.48, "learning_rate": 5.33084311938339e-05, "loss": 2.613, "step": 36955 }, { "epoch": 0.48, "learning_rate": 5.329824741876518e-05, "loss": 2.563, "step": 36960 }, { "epoch": 0.48, "learning_rate": 5.328806350627308e-05, "loss": 2.7034, "step": 36965 }, { "epoch": 0.48, "learning_rate": 5.3277879456781954e-05, "loss": 2.623, "step": 36970 }, { "epoch": 0.48, "learning_rate": 5.326769527071609e-05, "loss": 2.6434, "step": 36975 }, { "epoch": 0.48, "learning_rate": 5.325751094849985e-05, "loss": 2.4472, "step": 36980 }, { "epoch": 0.48, "learning_rate": 5.324732649055752e-05, "loss": 2.5927, "step": 36985 }, { "epoch": 0.48, "learning_rate": 5.323714189731349e-05, "loss": 2.4992, "step": 36990 }, { "epoch": 0.48, "learning_rate": 5.322695716919209e-05, "loss": 2.5952, "step": 36995 }, { "epoch": 0.48, "learning_rate": 5.3216772306617665e-05, "loss": 2.5598, "step": 37000 }, { "epoch": 0.48, "learning_rate": 5.320658731001459e-05, "loss": 2.5872, "step": 37005 }, { "epoch": 0.48, "learning_rate": 5.3196402179807215e-05, "loss": 2.5853, "step": 37010 }, { "epoch": 0.48, "learning_rate": 5.318621691641991e-05, "loss": 2.5506, "step": 37015 }, { "epoch": 0.48, "learning_rate": 5.317603152027705e-05, "loss": 2.4839, "step": 37020 }, { "epoch": 0.48, "learning_rate": 5.316584599180303e-05, "loss": 2.5351, "step": 37025 }, { "epoch": 0.48, "learning_rate": 5.315566033142221e-05, "loss": 2.498, "step": 37030 }, { "epoch": 0.48, "learning_rate": 5.3145474539559e-05, "loss": 2.5696, "step": 37035 }, { "epoch": 0.48, "learning_rate": 5.3135288616637803e-05, "loss": 2.5116, "step": 37040 }, { "epoch": 0.48, "learning_rate": 5.3125102563082996e-05, "loss": 2.5073, "step": 37045 }, { "epoch": 0.48, "learning_rate": 5.3114916379319005e-05, "loss": 2.4949, "step": 37050 }, { "epoch": 0.48, "learning_rate": 5.310473006577025e-05, "loss": 2.5722, "step": 37055 }, { "epoch": 0.48, "learning_rate": 5.309454362286111e-05, "loss": 2.5789, "step": 37060 }, { "epoch": 0.48, "learning_rate": 5.308435705101607e-05, "loss": 2.455, "step": 37065 }, { "epoch": 0.48, "learning_rate": 5.3074170350659516e-05, "loss": 2.5174, "step": 37070 }, { "epoch": 0.48, "learning_rate": 5.3063983522215896e-05, "loss": 2.5262, "step": 37075 }, { "epoch": 0.48, "learning_rate": 5.305379656610964e-05, "loss": 2.4064, "step": 37080 }, { "epoch": 0.48, "learning_rate": 5.304360948276521e-05, "loss": 2.4668, "step": 37085 }, { "epoch": 0.48, "learning_rate": 5.303342227260704e-05, "loss": 2.5168, "step": 37090 }, { "epoch": 0.48, "learning_rate": 5.30232349360596e-05, "loss": 2.5855, "step": 37095 }, { "epoch": 0.48, "learning_rate": 5.301304747354735e-05, "loss": 2.6004, "step": 37100 }, { "epoch": 0.48, "learning_rate": 5.300285988549475e-05, "loss": 2.4828, "step": 37105 }, { "epoch": 0.48, "learning_rate": 5.2992672172326266e-05, "loss": 2.6045, "step": 37110 }, { "epoch": 0.48, "learning_rate": 5.298248433446639e-05, "loss": 2.5389, "step": 37115 }, { "epoch": 0.48, "learning_rate": 5.297229637233958e-05, "loss": 2.474, "step": 37120 }, { "epoch": 0.48, "learning_rate": 5.296210828637036e-05, "loss": 2.5723, "step": 37125 }, { "epoch": 0.48, "learning_rate": 5.29519200769832e-05, "loss": 2.5673, "step": 37130 }, { "epoch": 0.48, "learning_rate": 5.2941731744602594e-05, "loss": 2.5775, "step": 37135 }, { "epoch": 0.48, "learning_rate": 5.293154328965304e-05, "loss": 2.6001, "step": 37140 }, { "epoch": 0.48, "learning_rate": 5.2921354712559066e-05, "loss": 2.5332, "step": 37145 }, { "epoch": 0.48, "learning_rate": 5.291116601374517e-05, "loss": 2.6452, "step": 37150 }, { "epoch": 0.48, "learning_rate": 5.290097719363589e-05, "loss": 2.6843, "step": 37155 }, { "epoch": 0.48, "learning_rate": 5.289078825265573e-05, "loss": 2.5519, "step": 37160 }, { "epoch": 0.48, "learning_rate": 5.288059919122922e-05, "loss": 2.5076, "step": 37165 }, { "epoch": 0.48, "learning_rate": 5.287041000978089e-05, "loss": 2.5597, "step": 37170 }, { "epoch": 0.48, "learning_rate": 5.286022070873528e-05, "loss": 2.569, "step": 37175 }, { "epoch": 0.48, "learning_rate": 5.285003128851694e-05, "loss": 2.5028, "step": 37180 }, { "epoch": 0.48, "learning_rate": 5.283984174955042e-05, "loss": 2.5913, "step": 37185 }, { "epoch": 0.48, "learning_rate": 5.282965209226026e-05, "loss": 2.2926, "step": 37190 }, { "epoch": 0.48, "learning_rate": 5.281946231707104e-05, "loss": 2.5729, "step": 37195 }, { "epoch": 0.48, "learning_rate": 5.2809272424407294e-05, "loss": 2.561, "step": 37200 }, { "epoch": 0.48, "learning_rate": 5.2799082414693614e-05, "loss": 2.561, "step": 37205 }, { "epoch": 0.48, "learning_rate": 5.278889228835455e-05, "loss": 2.5259, "step": 37210 }, { "epoch": 0.48, "learning_rate": 5.27787020458147e-05, "loss": 2.5636, "step": 37215 }, { "epoch": 0.48, "learning_rate": 5.276851168749863e-05, "loss": 2.5529, "step": 37220 }, { "epoch": 0.48, "learning_rate": 5.275832121383095e-05, "loss": 2.6643, "step": 37225 }, { "epoch": 0.48, "learning_rate": 5.274813062523624e-05, "loss": 2.5101, "step": 37230 }, { "epoch": 0.48, "learning_rate": 5.273793992213907e-05, "loss": 2.6547, "step": 37235 }, { "epoch": 0.48, "learning_rate": 5.272774910496407e-05, "loss": 2.408, "step": 37240 }, { "epoch": 0.48, "learning_rate": 5.271755817413585e-05, "loss": 2.5323, "step": 37245 }, { "epoch": 0.48, "learning_rate": 5.270736713007902e-05, "loss": 2.554, "step": 37250 }, { "epoch": 0.48, "learning_rate": 5.269717597321818e-05, "loss": 2.6253, "step": 37255 }, { "epoch": 0.48, "learning_rate": 5.268698470397797e-05, "loss": 2.5426, "step": 37260 }, { "epoch": 0.48, "learning_rate": 5.267679332278299e-05, "loss": 2.5408, "step": 37265 }, { "epoch": 0.48, "learning_rate": 5.266660183005788e-05, "loss": 2.6288, "step": 37270 }, { "epoch": 0.48, "learning_rate": 5.265641022622728e-05, "loss": 2.685, "step": 37275 }, { "epoch": 0.48, "learning_rate": 5.2646218511715826e-05, "loss": 2.4462, "step": 37280 }, { "epoch": 0.48, "learning_rate": 5.263602668694818e-05, "loss": 2.5041, "step": 37285 }, { "epoch": 0.48, "learning_rate": 5.262583475234897e-05, "loss": 2.4318, "step": 37290 }, { "epoch": 0.48, "learning_rate": 5.2615642708342835e-05, "loss": 2.5082, "step": 37295 }, { "epoch": 0.48, "learning_rate": 5.2605450555354455e-05, "loss": 2.6919, "step": 37300 }, { "epoch": 0.48, "learning_rate": 5.259525829380848e-05, "loss": 2.5768, "step": 37305 }, { "epoch": 0.48, "learning_rate": 5.2585065924129585e-05, "loss": 2.5085, "step": 37310 }, { "epoch": 0.48, "learning_rate": 5.2574873446742446e-05, "loss": 2.5435, "step": 37315 }, { "epoch": 0.48, "learning_rate": 5.256468086207173e-05, "loss": 2.6609, "step": 37320 }, { "epoch": 0.48, "learning_rate": 5.2554488170542115e-05, "loss": 2.5344, "step": 37325 }, { "epoch": 0.48, "learning_rate": 5.254429537257829e-05, "loss": 2.5536, "step": 37330 }, { "epoch": 0.48, "learning_rate": 5.2534102468604926e-05, "loss": 2.4408, "step": 37335 }, { "epoch": 0.48, "learning_rate": 5.252390945904675e-05, "loss": 2.6236, "step": 37340 }, { "epoch": 0.48, "learning_rate": 5.2513716344328436e-05, "loss": 2.6071, "step": 37345 }, { "epoch": 0.48, "learning_rate": 5.2503523124874685e-05, "loss": 2.5102, "step": 37350 }, { "epoch": 0.48, "learning_rate": 5.249332980111022e-05, "loss": 2.4296, "step": 37355 }, { "epoch": 0.48, "learning_rate": 5.248313637345974e-05, "loss": 2.5725, "step": 37360 }, { "epoch": 0.48, "learning_rate": 5.247294284234795e-05, "loss": 2.5288, "step": 37365 }, { "epoch": 0.48, "learning_rate": 5.246274920819958e-05, "loss": 2.5413, "step": 37370 }, { "epoch": 0.49, "learning_rate": 5.245255547143937e-05, "loss": 2.5629, "step": 37375 }, { "epoch": 0.49, "learning_rate": 5.244236163249202e-05, "loss": 2.4865, "step": 37380 }, { "epoch": 0.49, "learning_rate": 5.243216769178228e-05, "loss": 2.6217, "step": 37385 }, { "epoch": 0.49, "learning_rate": 5.242197364973489e-05, "loss": 2.558, "step": 37390 }, { "epoch": 0.49, "learning_rate": 5.241177950677456e-05, "loss": 2.6913, "step": 37395 }, { "epoch": 0.49, "learning_rate": 5.240158526332606e-05, "loss": 2.5314, "step": 37400 }, { "epoch": 0.49, "learning_rate": 5.2391390919814145e-05, "loss": 2.6363, "step": 37405 }, { "epoch": 0.49, "learning_rate": 5.238119647666355e-05, "loss": 2.6393, "step": 37410 }, { "epoch": 0.49, "learning_rate": 5.2371001934299045e-05, "loss": 2.5477, "step": 37415 }, { "epoch": 0.49, "learning_rate": 5.2360807293145385e-05, "loss": 2.5417, "step": 37420 }, { "epoch": 0.49, "learning_rate": 5.2350612553627334e-05, "loss": 2.4902, "step": 37425 }, { "epoch": 0.49, "learning_rate": 5.234041771616967e-05, "loss": 2.6388, "step": 37430 }, { "epoch": 0.49, "learning_rate": 5.233022278119716e-05, "loss": 2.6011, "step": 37435 }, { "epoch": 0.49, "learning_rate": 5.232002774913458e-05, "loss": 2.551, "step": 37440 }, { "epoch": 0.49, "learning_rate": 5.230983262040672e-05, "loss": 2.6011, "step": 37445 }, { "epoch": 0.49, "learning_rate": 5.229963739543837e-05, "loss": 2.6209, "step": 37450 }, { "epoch": 0.49, "learning_rate": 5.2289442074654295e-05, "loss": 2.5873, "step": 37455 }, { "epoch": 0.49, "learning_rate": 5.2279246658479305e-05, "loss": 2.6535, "step": 37460 }, { "epoch": 0.49, "learning_rate": 5.22690511473382e-05, "loss": 2.588, "step": 37465 }, { "epoch": 0.49, "learning_rate": 5.2258855541655797e-05, "loss": 2.7279, "step": 37470 }, { "epoch": 0.49, "learning_rate": 5.224865984185686e-05, "loss": 2.5561, "step": 37475 }, { "epoch": 0.49, "learning_rate": 5.2238464048366245e-05, "loss": 2.6114, "step": 37480 }, { "epoch": 0.49, "learning_rate": 5.222826816160874e-05, "loss": 2.5545, "step": 37485 }, { "epoch": 0.49, "learning_rate": 5.221807218200915e-05, "loss": 2.6476, "step": 37490 }, { "epoch": 0.49, "learning_rate": 5.220787610999232e-05, "loss": 2.4798, "step": 37495 }, { "epoch": 0.49, "learning_rate": 5.219767994598307e-05, "loss": 2.5706, "step": 37500 }, { "epoch": 0.49, "learning_rate": 5.218748369040622e-05, "loss": 2.5376, "step": 37505 }, { "epoch": 0.49, "learning_rate": 5.217728734368662e-05, "loss": 2.6157, "step": 37510 }, { "epoch": 0.49, "learning_rate": 5.216709090624909e-05, "loss": 2.5849, "step": 37515 }, { "epoch": 0.49, "learning_rate": 5.2156894378518484e-05, "loss": 2.5653, "step": 37520 }, { "epoch": 0.49, "learning_rate": 5.214669776091962e-05, "loss": 2.6538, "step": 37525 }, { "epoch": 0.49, "learning_rate": 5.213650105387738e-05, "loss": 2.679, "step": 37530 }, { "epoch": 0.49, "learning_rate": 5.21263042578166e-05, "loss": 2.496, "step": 37535 }, { "epoch": 0.49, "learning_rate": 5.211610737316214e-05, "loss": 2.5963, "step": 37540 }, { "epoch": 0.49, "learning_rate": 5.210591040033885e-05, "loss": 2.5851, "step": 37545 }, { "epoch": 0.49, "learning_rate": 5.209571333977159e-05, "loss": 2.6155, "step": 37550 }, { "epoch": 0.49, "learning_rate": 5.208551619188524e-05, "loss": 2.6987, "step": 37555 }, { "epoch": 0.49, "learning_rate": 5.207531895710466e-05, "loss": 2.498, "step": 37560 }, { "epoch": 0.49, "learning_rate": 5.206512163585473e-05, "loss": 2.6044, "step": 37565 }, { "epoch": 0.49, "learning_rate": 5.205492422856033e-05, "loss": 2.5396, "step": 37570 }, { "epoch": 0.49, "learning_rate": 5.204472673564633e-05, "loss": 2.543, "step": 37575 }, { "epoch": 0.49, "learning_rate": 5.2034529157537615e-05, "loss": 2.5326, "step": 37580 }, { "epoch": 0.49, "learning_rate": 5.202433149465908e-05, "loss": 2.5169, "step": 37585 }, { "epoch": 0.49, "learning_rate": 5.201413374743561e-05, "loss": 2.4267, "step": 37590 }, { "epoch": 0.49, "learning_rate": 5.200393591629212e-05, "loss": 2.5908, "step": 37595 }, { "epoch": 0.49, "learning_rate": 5.1993738001653483e-05, "loss": 2.5111, "step": 37600 }, { "epoch": 0.49, "learning_rate": 5.198354000394462e-05, "loss": 2.6333, "step": 37605 }, { "epoch": 0.49, "learning_rate": 5.19733419235904e-05, "loss": 2.6169, "step": 37610 }, { "epoch": 0.49, "learning_rate": 5.1963143761015784e-05, "loss": 2.522, "step": 37615 }, { "epoch": 0.49, "learning_rate": 5.1952945516645644e-05, "loss": 2.6966, "step": 37620 }, { "epoch": 0.49, "learning_rate": 5.194274719090493e-05, "loss": 2.5957, "step": 37625 }, { "epoch": 0.49, "learning_rate": 5.1932548784218525e-05, "loss": 2.5703, "step": 37630 }, { "epoch": 0.49, "learning_rate": 5.192235029701138e-05, "loss": 2.4948, "step": 37635 }, { "epoch": 0.49, "learning_rate": 5.19121517297084e-05, "loss": 2.5783, "step": 37640 }, { "epoch": 0.49, "learning_rate": 5.190195308273452e-05, "loss": 2.6579, "step": 37645 }, { "epoch": 0.49, "learning_rate": 5.1891754356514674e-05, "loss": 2.5564, "step": 37650 }, { "epoch": 0.49, "learning_rate": 5.1881555551473816e-05, "loss": 2.6326, "step": 37655 }, { "epoch": 0.49, "learning_rate": 5.1871356668036866e-05, "loss": 2.6214, "step": 37660 }, { "epoch": 0.49, "learning_rate": 5.186115770662876e-05, "loss": 2.4953, "step": 37665 }, { "epoch": 0.49, "learning_rate": 5.1850958667674467e-05, "loss": 2.5393, "step": 37670 }, { "epoch": 0.49, "learning_rate": 5.184075955159891e-05, "loss": 2.5361, "step": 37675 }, { "epoch": 0.49, "learning_rate": 5.183056035882704e-05, "loss": 2.608, "step": 37680 }, { "epoch": 0.49, "learning_rate": 5.182036108978383e-05, "loss": 2.4813, "step": 37685 }, { "epoch": 0.49, "learning_rate": 5.1810161744894246e-05, "loss": 2.5854, "step": 37690 }, { "epoch": 0.49, "learning_rate": 5.179996232458323e-05, "loss": 2.3859, "step": 37695 }, { "epoch": 0.49, "learning_rate": 5.1789762829275755e-05, "loss": 2.3548, "step": 37700 }, { "epoch": 0.49, "learning_rate": 5.177956325939678e-05, "loss": 2.3954, "step": 37705 }, { "epoch": 0.49, "learning_rate": 5.176936361537129e-05, "loss": 2.534, "step": 37710 }, { "epoch": 0.49, "learning_rate": 5.175916389762424e-05, "loss": 2.5874, "step": 37715 }, { "epoch": 0.49, "learning_rate": 5.1748964106580635e-05, "loss": 2.4975, "step": 37720 }, { "epoch": 0.49, "learning_rate": 5.173876424266544e-05, "loss": 2.5299, "step": 37725 }, { "epoch": 0.49, "learning_rate": 5.172856430630363e-05, "loss": 2.5762, "step": 37730 }, { "epoch": 0.49, "learning_rate": 5.1718364297920194e-05, "loss": 2.3039, "step": 37735 }, { "epoch": 0.49, "learning_rate": 5.1708164217940136e-05, "loss": 2.4828, "step": 37740 }, { "epoch": 0.49, "learning_rate": 5.169796406678842e-05, "loss": 2.6067, "step": 37745 }, { "epoch": 0.49, "learning_rate": 5.168776384489007e-05, "loss": 2.6085, "step": 37750 }, { "epoch": 0.49, "learning_rate": 5.1677563552670086e-05, "loss": 2.5913, "step": 37755 }, { "epoch": 0.49, "learning_rate": 5.166736319055344e-05, "loss": 2.5204, "step": 37760 }, { "epoch": 0.49, "learning_rate": 5.165716275896515e-05, "loss": 2.4793, "step": 37765 }, { "epoch": 0.49, "learning_rate": 5.1646962258330234e-05, "loss": 2.6147, "step": 37770 }, { "epoch": 0.49, "learning_rate": 5.163676168907369e-05, "loss": 2.6719, "step": 37775 }, { "epoch": 0.49, "learning_rate": 5.1626561051620524e-05, "loss": 2.5335, "step": 37780 }, { "epoch": 0.49, "learning_rate": 5.1616360346395764e-05, "loss": 2.567, "step": 37785 }, { "epoch": 0.49, "learning_rate": 5.1606159573824444e-05, "loss": 2.5364, "step": 37790 }, { "epoch": 0.49, "learning_rate": 5.159595873433154e-05, "loss": 2.7176, "step": 37795 }, { "epoch": 0.49, "learning_rate": 5.158575782834211e-05, "loss": 2.5089, "step": 37800 }, { "epoch": 0.49, "learning_rate": 5.157555685628118e-05, "loss": 2.5296, "step": 37805 }, { "epoch": 0.49, "learning_rate": 5.1565355818573754e-05, "loss": 2.5445, "step": 37810 }, { "epoch": 0.49, "learning_rate": 5.1555154715644894e-05, "loss": 2.5534, "step": 37815 }, { "epoch": 0.49, "learning_rate": 5.154495354791963e-05, "loss": 2.6072, "step": 37820 }, { "epoch": 0.49, "learning_rate": 5.153475231582298e-05, "loss": 2.5145, "step": 37825 }, { "epoch": 0.49, "learning_rate": 5.152455101978e-05, "loss": 2.5689, "step": 37830 }, { "epoch": 0.49, "learning_rate": 5.1514349660215734e-05, "loss": 2.6447, "step": 37835 }, { "epoch": 0.49, "learning_rate": 5.1504148237555206e-05, "loss": 2.4738, "step": 37840 }, { "epoch": 0.49, "learning_rate": 5.149394675222349e-05, "loss": 2.607, "step": 37845 }, { "epoch": 0.49, "learning_rate": 5.1483745204645626e-05, "loss": 2.523, "step": 37850 }, { "epoch": 0.49, "learning_rate": 5.1473543595246676e-05, "loss": 2.7129, "step": 37855 }, { "epoch": 0.49, "learning_rate": 5.146334192445168e-05, "loss": 2.6901, "step": 37860 }, { "epoch": 0.49, "learning_rate": 5.145314019268571e-05, "loss": 2.417, "step": 37865 }, { "epoch": 0.49, "learning_rate": 5.144293840037382e-05, "loss": 2.5773, "step": 37870 }, { "epoch": 0.49, "learning_rate": 5.1432736547941065e-05, "loss": 2.7031, "step": 37875 }, { "epoch": 0.49, "learning_rate": 5.142253463581253e-05, "loss": 2.6971, "step": 37880 }, { "epoch": 0.49, "learning_rate": 5.1412332664413284e-05, "loss": 2.6502, "step": 37885 }, { "epoch": 0.49, "learning_rate": 5.140213063416838e-05, "loss": 2.4192, "step": 37890 }, { "epoch": 0.49, "learning_rate": 5.13919285455029e-05, "loss": 2.582, "step": 37895 }, { "epoch": 0.49, "learning_rate": 5.1381726398841924e-05, "loss": 2.6637, "step": 37900 }, { "epoch": 0.49, "learning_rate": 5.137152419461051e-05, "loss": 2.5823, "step": 37905 }, { "epoch": 0.49, "learning_rate": 5.136132193323377e-05, "loss": 2.6897, "step": 37910 }, { "epoch": 0.49, "learning_rate": 5.1351119615136776e-05, "loss": 2.496, "step": 37915 }, { "epoch": 0.49, "learning_rate": 5.13409172407446e-05, "loss": 2.6131, "step": 37920 }, { "epoch": 0.49, "learning_rate": 5.133071481048234e-05, "loss": 2.5193, "step": 37925 }, { "epoch": 0.49, "learning_rate": 5.1320512324775096e-05, "loss": 2.6723, "step": 37930 }, { "epoch": 0.49, "learning_rate": 5.131030978404794e-05, "loss": 2.4328, "step": 37935 }, { "epoch": 0.49, "learning_rate": 5.1300107188725974e-05, "loss": 2.5866, "step": 37940 }, { "epoch": 0.49, "learning_rate": 5.128990453923431e-05, "loss": 2.5143, "step": 37945 }, { "epoch": 0.49, "learning_rate": 5.127970183599802e-05, "loss": 2.6099, "step": 37950 }, { "epoch": 0.49, "learning_rate": 5.126949907944223e-05, "loss": 2.4702, "step": 37955 }, { "epoch": 0.49, "learning_rate": 5.125929626999204e-05, "loss": 2.5508, "step": 37960 }, { "epoch": 0.49, "learning_rate": 5.124909340807253e-05, "loss": 2.5986, "step": 37965 }, { "epoch": 0.49, "learning_rate": 5.123889049410885e-05, "loss": 2.6288, "step": 37970 }, { "epoch": 0.49, "learning_rate": 5.122868752852607e-05, "loss": 2.5111, "step": 37975 }, { "epoch": 0.49, "learning_rate": 5.121848451174932e-05, "loss": 2.5694, "step": 37980 }, { "epoch": 0.49, "learning_rate": 5.120828144420373e-05, "loss": 2.5047, "step": 37985 }, { "epoch": 0.49, "learning_rate": 5.11980783263144e-05, "loss": 2.5669, "step": 37990 }, { "epoch": 0.49, "learning_rate": 5.118787515850645e-05, "loss": 2.5395, "step": 37995 }, { "epoch": 0.49, "learning_rate": 5.117767194120498e-05, "loss": 2.5399, "step": 38000 }, { "epoch": 0.49, "learning_rate": 5.116746867483516e-05, "loss": 2.5386, "step": 38005 }, { "epoch": 0.49, "learning_rate": 5.115726535982208e-05, "loss": 2.628, "step": 38010 }, { "epoch": 0.49, "learning_rate": 5.1147061996590875e-05, "loss": 2.5584, "step": 38015 }, { "epoch": 0.49, "learning_rate": 5.1136858585566684e-05, "loss": 2.5748, "step": 38020 }, { "epoch": 0.49, "learning_rate": 5.112665512717463e-05, "loss": 2.6864, "step": 38025 }, { "epoch": 0.49, "learning_rate": 5.111645162183982e-05, "loss": 2.428, "step": 38030 }, { "epoch": 0.49, "learning_rate": 5.110624806998744e-05, "loss": 2.5099, "step": 38035 }, { "epoch": 0.49, "learning_rate": 5.109604447204258e-05, "loss": 2.5754, "step": 38040 }, { "epoch": 0.49, "learning_rate": 5.108584082843041e-05, "loss": 2.6382, "step": 38045 }, { "epoch": 0.49, "learning_rate": 5.107563713957607e-05, "loss": 2.587, "step": 38050 }, { "epoch": 0.49, "learning_rate": 5.1065433405904684e-05, "loss": 2.5284, "step": 38055 }, { "epoch": 0.49, "learning_rate": 5.105522962784139e-05, "loss": 2.5197, "step": 38060 }, { "epoch": 0.49, "learning_rate": 5.1045025805811376e-05, "loss": 2.6175, "step": 38065 }, { "epoch": 0.49, "learning_rate": 5.1034821940239754e-05, "loss": 2.4524, "step": 38070 }, { "epoch": 0.49, "learning_rate": 5.1024618031551674e-05, "loss": 2.5251, "step": 38075 }, { "epoch": 0.49, "learning_rate": 5.1014414080172315e-05, "loss": 2.6208, "step": 38080 }, { "epoch": 0.49, "learning_rate": 5.10042100865268e-05, "loss": 2.577, "step": 38085 }, { "epoch": 0.49, "learning_rate": 5.09940060510403e-05, "loss": 2.471, "step": 38090 }, { "epoch": 0.49, "learning_rate": 5.098380197413796e-05, "loss": 2.5245, "step": 38095 }, { "epoch": 0.49, "learning_rate": 5.097359785624496e-05, "loss": 2.4474, "step": 38100 }, { "epoch": 0.49, "learning_rate": 5.0963393697786435e-05, "loss": 2.4734, "step": 38105 }, { "epoch": 0.49, "learning_rate": 5.095318949918757e-05, "loss": 2.6091, "step": 38110 }, { "epoch": 0.49, "learning_rate": 5.094298526087351e-05, "loss": 2.6469, "step": 38115 }, { "epoch": 0.49, "learning_rate": 5.093278098326945e-05, "loss": 2.5998, "step": 38120 }, { "epoch": 0.49, "learning_rate": 5.0922576666800505e-05, "loss": 2.5421, "step": 38125 }, { "epoch": 0.49, "learning_rate": 5.09123723118919e-05, "loss": 2.6278, "step": 38130 }, { "epoch": 0.49, "learning_rate": 5.090216791896876e-05, "loss": 2.4732, "step": 38135 }, { "epoch": 0.49, "learning_rate": 5.089196348845629e-05, "loss": 2.5908, "step": 38140 }, { "epoch": 0.5, "learning_rate": 5.088175902077965e-05, "loss": 2.6399, "step": 38145 }, { "epoch": 0.5, "learning_rate": 5.0871554516364014e-05, "loss": 2.5813, "step": 38150 }, { "epoch": 0.5, "learning_rate": 5.0861349975634566e-05, "loss": 2.5749, "step": 38155 }, { "epoch": 0.5, "learning_rate": 5.0851145399016474e-05, "loss": 2.6077, "step": 38160 }, { "epoch": 0.5, "learning_rate": 5.084094078693491e-05, "loss": 2.5932, "step": 38165 }, { "epoch": 0.5, "learning_rate": 5.083073613981508e-05, "loss": 2.4108, "step": 38170 }, { "epoch": 0.5, "learning_rate": 5.082053145808216e-05, "loss": 2.5534, "step": 38175 }, { "epoch": 0.5, "learning_rate": 5.0810326742161305e-05, "loss": 2.6036, "step": 38180 }, { "epoch": 0.5, "learning_rate": 5.0800121992477746e-05, "loss": 2.6237, "step": 38185 }, { "epoch": 0.5, "learning_rate": 5.078991720945663e-05, "loss": 2.5942, "step": 38190 }, { "epoch": 0.5, "learning_rate": 5.077971239352315e-05, "loss": 2.6158, "step": 38195 }, { "epoch": 0.5, "learning_rate": 5.0769507545102525e-05, "loss": 2.533, "step": 38200 }, { "epoch": 0.5, "learning_rate": 5.0759302664619936e-05, "loss": 2.5725, "step": 38205 }, { "epoch": 0.5, "learning_rate": 5.074909775250055e-05, "loss": 2.5448, "step": 38210 }, { "epoch": 0.5, "learning_rate": 5.073889280916959e-05, "loss": 2.5952, "step": 38215 }, { "epoch": 0.5, "learning_rate": 5.072868783505223e-05, "loss": 2.5485, "step": 38220 }, { "epoch": 0.5, "learning_rate": 5.071848283057366e-05, "loss": 2.6182, "step": 38225 }, { "epoch": 0.5, "learning_rate": 5.070827779615911e-05, "loss": 2.5739, "step": 38230 }, { "epoch": 0.5, "learning_rate": 5.069807273223376e-05, "loss": 2.6817, "step": 38235 }, { "epoch": 0.5, "learning_rate": 5.068786763922281e-05, "loss": 2.4906, "step": 38240 }, { "epoch": 0.5, "learning_rate": 5.067766251755146e-05, "loss": 2.5203, "step": 38245 }, { "epoch": 0.5, "learning_rate": 5.06674573676449e-05, "loss": 2.5034, "step": 38250 }, { "epoch": 0.5, "learning_rate": 5.065725218992835e-05, "loss": 2.5847, "step": 38255 }, { "epoch": 0.5, "learning_rate": 5.064704698482702e-05, "loss": 2.429, "step": 38260 }, { "epoch": 0.5, "learning_rate": 5.06368417527661e-05, "loss": 2.7087, "step": 38265 }, { "epoch": 0.5, "learning_rate": 5.062663649417082e-05, "loss": 2.4826, "step": 38270 }, { "epoch": 0.5, "learning_rate": 5.0616431209466366e-05, "loss": 2.5445, "step": 38275 }, { "epoch": 0.5, "learning_rate": 5.060622589907793e-05, "loss": 2.5197, "step": 38280 }, { "epoch": 0.5, "learning_rate": 5.059602056343077e-05, "loss": 2.6987, "step": 38285 }, { "epoch": 0.5, "learning_rate": 5.058581520295006e-05, "loss": 2.4697, "step": 38290 }, { "epoch": 0.5, "learning_rate": 5.0575609818061034e-05, "loss": 2.6054, "step": 38295 }, { "epoch": 0.5, "learning_rate": 5.056540440918889e-05, "loss": 2.4632, "step": 38300 }, { "epoch": 0.5, "learning_rate": 5.055519897675884e-05, "loss": 2.4655, "step": 38305 }, { "epoch": 0.5, "learning_rate": 5.054499352119613e-05, "loss": 2.7133, "step": 38310 }, { "epoch": 0.5, "learning_rate": 5.053478804292592e-05, "loss": 2.5254, "step": 38315 }, { "epoch": 0.5, "learning_rate": 5.052458254237347e-05, "loss": 2.561, "step": 38320 }, { "epoch": 0.5, "learning_rate": 5.0514377019964e-05, "loss": 2.5236, "step": 38325 }, { "epoch": 0.5, "learning_rate": 5.0504171476122706e-05, "loss": 2.5736, "step": 38330 }, { "epoch": 0.5, "learning_rate": 5.049396591127483e-05, "loss": 2.4075, "step": 38335 }, { "epoch": 0.5, "learning_rate": 5.0483760325845575e-05, "loss": 2.5901, "step": 38340 }, { "epoch": 0.5, "learning_rate": 5.047355472026016e-05, "loss": 2.6426, "step": 38345 }, { "epoch": 0.5, "learning_rate": 5.0463349094943824e-05, "loss": 2.5113, "step": 38350 }, { "epoch": 0.5, "learning_rate": 5.0453143450321784e-05, "loss": 2.4682, "step": 38355 }, { "epoch": 0.5, "learning_rate": 5.0442937786819265e-05, "loss": 2.5874, "step": 38360 }, { "epoch": 0.5, "learning_rate": 5.043273210486149e-05, "loss": 2.5092, "step": 38365 }, { "epoch": 0.5, "learning_rate": 5.042252640487369e-05, "loss": 2.6607, "step": 38370 }, { "epoch": 0.5, "learning_rate": 5.041232068728107e-05, "loss": 2.4432, "step": 38375 }, { "epoch": 0.5, "learning_rate": 5.0402114952508886e-05, "loss": 2.5809, "step": 38380 }, { "epoch": 0.5, "learning_rate": 5.039190920098234e-05, "loss": 2.6242, "step": 38385 }, { "epoch": 0.5, "learning_rate": 5.038170343312668e-05, "loss": 2.5132, "step": 38390 }, { "epoch": 0.5, "learning_rate": 5.0371497649367125e-05, "loss": 2.495, "step": 38395 }, { "epoch": 0.5, "learning_rate": 5.036129185012891e-05, "loss": 2.4885, "step": 38400 }, { "epoch": 0.5, "learning_rate": 5.035108603583727e-05, "loss": 2.4917, "step": 38405 }, { "epoch": 0.5, "learning_rate": 5.034088020691742e-05, "loss": 2.6551, "step": 38410 }, { "epoch": 0.5, "learning_rate": 5.0330674363794584e-05, "loss": 2.5471, "step": 38415 }, { "epoch": 0.5, "learning_rate": 5.032046850689404e-05, "loss": 2.4924, "step": 38420 }, { "epoch": 0.5, "learning_rate": 5.031026263664098e-05, "loss": 2.6189, "step": 38425 }, { "epoch": 0.5, "learning_rate": 5.030005675346066e-05, "loss": 2.4841, "step": 38430 }, { "epoch": 0.5, "learning_rate": 5.0289850857778296e-05, "loss": 2.4269, "step": 38435 }, { "epoch": 0.5, "learning_rate": 5.027964495001912e-05, "loss": 2.6583, "step": 38440 }, { "epoch": 0.5, "learning_rate": 5.026943903060838e-05, "loss": 2.576, "step": 38445 }, { "epoch": 0.5, "learning_rate": 5.025923309997131e-05, "loss": 2.5202, "step": 38450 }, { "epoch": 0.5, "learning_rate": 5.024902715853316e-05, "loss": 2.4786, "step": 38455 }, { "epoch": 0.5, "learning_rate": 5.0238821206719145e-05, "loss": 2.6154, "step": 38460 }, { "epoch": 0.5, "learning_rate": 5.0228615244954505e-05, "loss": 2.6249, "step": 38465 }, { "epoch": 0.5, "learning_rate": 5.021840927366447e-05, "loss": 2.6016, "step": 38470 }, { "epoch": 0.5, "learning_rate": 5.020820329327429e-05, "loss": 2.4143, "step": 38475 }, { "epoch": 0.5, "learning_rate": 5.019799730420921e-05, "loss": 2.6476, "step": 38480 }, { "epoch": 0.5, "learning_rate": 5.0187791306894446e-05, "loss": 2.5017, "step": 38485 }, { "epoch": 0.5, "learning_rate": 5.017758530175527e-05, "loss": 2.4404, "step": 38490 }, { "epoch": 0.5, "learning_rate": 5.0167379289216885e-05, "loss": 2.5331, "step": 38495 }, { "epoch": 0.5, "learning_rate": 5.015717326970456e-05, "loss": 2.5504, "step": 38500 }, { "epoch": 0.5, "learning_rate": 5.014696724364351e-05, "loss": 2.5548, "step": 38505 }, { "epoch": 0.5, "learning_rate": 5.0136761211458974e-05, "loss": 2.6551, "step": 38510 }, { "epoch": 0.5, "learning_rate": 5.012655517357622e-05, "loss": 2.5126, "step": 38515 }, { "epoch": 0.5, "learning_rate": 5.011634913042047e-05, "loss": 2.5186, "step": 38520 }, { "epoch": 0.5, "learning_rate": 5.0106143082416965e-05, "loss": 2.5527, "step": 38525 }, { "epoch": 0.5, "learning_rate": 5.009593702999096e-05, "loss": 2.528, "step": 38530 }, { "epoch": 0.5, "learning_rate": 5.008573097356766e-05, "loss": 2.4209, "step": 38535 }, { "epoch": 0.5, "learning_rate": 5.0075524913572336e-05, "loss": 2.6637, "step": 38540 }, { "epoch": 0.5, "learning_rate": 5.006531885043023e-05, "loss": 2.7322, "step": 38545 }, { "epoch": 0.5, "learning_rate": 5.0055112784566586e-05, "loss": 2.6551, "step": 38550 }, { "epoch": 0.5, "learning_rate": 5.0044906716406625e-05, "loss": 2.4128, "step": 38555 }, { "epoch": 0.5, "learning_rate": 5.0034700646375596e-05, "loss": 2.5158, "step": 38560 }, { "epoch": 0.5, "learning_rate": 5.002449457489875e-05, "loss": 2.6112, "step": 38565 }, { "epoch": 0.5, "learning_rate": 5.001428850240131e-05, "loss": 2.5848, "step": 38570 }, { "epoch": 0.5, "learning_rate": 5.0004082429308555e-05, "loss": 2.5732, "step": 38575 }, { "epoch": 0.5, "learning_rate": 4.9993876356045675e-05, "loss": 2.533, "step": 38580 }, { "epoch": 0.5, "learning_rate": 4.9983670283037975e-05, "loss": 2.6599, "step": 38585 }, { "epoch": 0.5, "learning_rate": 4.997346421071063e-05, "loss": 2.6775, "step": 38590 }, { "epoch": 0.5, "learning_rate": 4.996325813948895e-05, "loss": 2.532, "step": 38595 }, { "epoch": 0.5, "learning_rate": 4.9953052069798113e-05, "loss": 2.5972, "step": 38600 }, { "epoch": 0.5, "learning_rate": 4.99428460020634e-05, "loss": 2.5861, "step": 38605 }, { "epoch": 0.5, "learning_rate": 4.993263993671002e-05, "loss": 2.5819, "step": 38610 }, { "epoch": 0.5, "learning_rate": 4.992243387416325e-05, "loss": 2.5413, "step": 38615 }, { "epoch": 0.5, "learning_rate": 4.991222781484833e-05, "loss": 2.5636, "step": 38620 }, { "epoch": 0.5, "learning_rate": 4.990202175919047e-05, "loss": 2.6531, "step": 38625 }, { "epoch": 0.5, "learning_rate": 4.989181570761494e-05, "loss": 2.6258, "step": 38630 }, { "epoch": 0.5, "learning_rate": 4.988160966054696e-05, "loss": 2.5903, "step": 38635 }, { "epoch": 0.5, "learning_rate": 4.9871403618411775e-05, "loss": 2.5778, "step": 38640 }, { "epoch": 0.5, "learning_rate": 4.986119758163467e-05, "loss": 2.4504, "step": 38645 }, { "epoch": 0.5, "learning_rate": 4.985099155064081e-05, "loss": 2.5223, "step": 38650 }, { "epoch": 0.5, "learning_rate": 4.98407855258555e-05, "loss": 2.6704, "step": 38655 }, { "epoch": 0.5, "learning_rate": 4.983057950770393e-05, "loss": 2.5696, "step": 38660 }, { "epoch": 0.5, "learning_rate": 4.9820373496611366e-05, "loss": 2.4681, "step": 38665 }, { "epoch": 0.5, "learning_rate": 4.981016749300304e-05, "loss": 2.5861, "step": 38670 }, { "epoch": 0.5, "learning_rate": 4.9799961497304195e-05, "loss": 2.4171, "step": 38675 }, { "epoch": 0.5, "learning_rate": 4.9789755509940085e-05, "loss": 2.692, "step": 38680 }, { "epoch": 0.5, "learning_rate": 4.9779549531335915e-05, "loss": 2.4743, "step": 38685 }, { "epoch": 0.5, "learning_rate": 4.976934356191695e-05, "loss": 2.5414, "step": 38690 }, { "epoch": 0.5, "learning_rate": 4.9759137602108414e-05, "loss": 2.495, "step": 38695 }, { "epoch": 0.5, "learning_rate": 4.974893165233554e-05, "loss": 2.5302, "step": 38700 }, { "epoch": 0.5, "learning_rate": 4.973872571302358e-05, "loss": 2.5373, "step": 38705 }, { "epoch": 0.5, "learning_rate": 4.972851978459776e-05, "loss": 2.7127, "step": 38710 }, { "epoch": 0.5, "learning_rate": 4.971831386748333e-05, "loss": 2.6204, "step": 38715 }, { "epoch": 0.5, "learning_rate": 4.97081079621055e-05, "loss": 2.6408, "step": 38720 }, { "epoch": 0.5, "learning_rate": 4.9697902068889524e-05, "loss": 2.5163, "step": 38725 }, { "epoch": 0.5, "learning_rate": 4.9687696188260626e-05, "loss": 2.6596, "step": 38730 }, { "epoch": 0.5, "learning_rate": 4.9677490320644044e-05, "loss": 2.4593, "step": 38735 }, { "epoch": 0.5, "learning_rate": 4.966728446646503e-05, "loss": 2.4329, "step": 38740 }, { "epoch": 0.5, "learning_rate": 4.965707862614878e-05, "loss": 2.6195, "step": 38745 }, { "epoch": 0.5, "learning_rate": 4.964687280012057e-05, "loss": 2.6701, "step": 38750 }, { "epoch": 0.5, "learning_rate": 4.963666698880558e-05, "loss": 2.5991, "step": 38755 }, { "epoch": 0.5, "learning_rate": 4.962646119262908e-05, "loss": 2.5232, "step": 38760 }, { "epoch": 0.5, "learning_rate": 4.961625541201628e-05, "loss": 2.517, "step": 38765 }, { "epoch": 0.5, "learning_rate": 4.960604964739242e-05, "loss": 2.6792, "step": 38770 }, { "epoch": 0.5, "learning_rate": 4.959584389918274e-05, "loss": 2.3808, "step": 38775 }, { "epoch": 0.5, "learning_rate": 4.9585638167812445e-05, "loss": 2.5998, "step": 38780 }, { "epoch": 0.5, "learning_rate": 4.9575432453706775e-05, "loss": 2.545, "step": 38785 }, { "epoch": 0.5, "learning_rate": 4.956522675729095e-05, "loss": 2.4688, "step": 38790 }, { "epoch": 0.5, "learning_rate": 4.9555021078990206e-05, "loss": 2.6224, "step": 38795 }, { "epoch": 0.5, "learning_rate": 4.954481541922977e-05, "loss": 2.5701, "step": 38800 }, { "epoch": 0.5, "learning_rate": 4.953460977843484e-05, "loss": 2.3707, "step": 38805 }, { "epoch": 0.5, "learning_rate": 4.952440415703069e-05, "loss": 2.5398, "step": 38810 }, { "epoch": 0.5, "learning_rate": 4.951419855544249e-05, "loss": 2.4992, "step": 38815 }, { "epoch": 0.5, "learning_rate": 4.950399297409549e-05, "loss": 2.4699, "step": 38820 }, { "epoch": 0.5, "learning_rate": 4.94937874134149e-05, "loss": 2.6487, "step": 38825 }, { "epoch": 0.5, "learning_rate": 4.948358187382595e-05, "loss": 2.5062, "step": 38830 }, { "epoch": 0.5, "learning_rate": 4.947337635575388e-05, "loss": 2.6189, "step": 38835 }, { "epoch": 0.5, "learning_rate": 4.9463170859623864e-05, "loss": 2.6416, "step": 38840 }, { "epoch": 0.5, "learning_rate": 4.945296538586116e-05, "loss": 2.7552, "step": 38845 }, { "epoch": 0.5, "learning_rate": 4.944275993489094e-05, "loss": 2.6236, "step": 38850 }, { "epoch": 0.5, "learning_rate": 4.943255450713846e-05, "loss": 2.5342, "step": 38855 }, { "epoch": 0.5, "learning_rate": 4.942234910302892e-05, "loss": 2.5416, "step": 38860 }, { "epoch": 0.5, "learning_rate": 4.9412143722987525e-05, "loss": 2.5359, "step": 38865 }, { "epoch": 0.5, "learning_rate": 4.940193836743953e-05, "loss": 2.5127, "step": 38870 }, { "epoch": 0.5, "learning_rate": 4.939173303681009e-05, "loss": 2.5001, "step": 38875 }, { "epoch": 0.5, "learning_rate": 4.938152773152444e-05, "loss": 2.5936, "step": 38880 }, { "epoch": 0.5, "learning_rate": 4.937132245200779e-05, "loss": 2.541, "step": 38885 }, { "epoch": 0.5, "learning_rate": 4.9361117198685344e-05, "loss": 2.5226, "step": 38890 }, { "epoch": 0.5, "learning_rate": 4.935091197198235e-05, "loss": 2.5969, "step": 38895 }, { "epoch": 0.5, "learning_rate": 4.934070677232395e-05, "loss": 2.5301, "step": 38900 }, { "epoch": 0.5, "learning_rate": 4.93305016001354e-05, "loss": 2.5073, "step": 38905 }, { "epoch": 0.5, "learning_rate": 4.932029645584187e-05, "loss": 2.6249, "step": 38910 }, { "epoch": 0.51, "learning_rate": 4.931009133986857e-05, "loss": 2.5753, "step": 38915 }, { "epoch": 0.51, "learning_rate": 4.929988625264072e-05, "loss": 2.4578, "step": 38920 }, { "epoch": 0.51, "learning_rate": 4.928968119458351e-05, "loss": 2.4722, "step": 38925 }, { "epoch": 0.51, "learning_rate": 4.927947616612215e-05, "loss": 2.5894, "step": 38930 }, { "epoch": 0.51, "learning_rate": 4.9269271167681814e-05, "loss": 2.6101, "step": 38935 }, { "epoch": 0.51, "learning_rate": 4.925906619968773e-05, "loss": 2.466, "step": 38940 }, { "epoch": 0.51, "learning_rate": 4.924886126256506e-05, "loss": 2.391, "step": 38945 }, { "epoch": 0.51, "learning_rate": 4.923865635673901e-05, "loss": 2.4648, "step": 38950 }, { "epoch": 0.51, "learning_rate": 4.922845148263479e-05, "loss": 2.5008, "step": 38955 }, { "epoch": 0.51, "learning_rate": 4.9218246640677576e-05, "loss": 2.6029, "step": 38960 }, { "epoch": 0.51, "learning_rate": 4.920804183129258e-05, "loss": 2.5983, "step": 38965 }, { "epoch": 0.51, "learning_rate": 4.9197837054904946e-05, "loss": 2.6467, "step": 38970 }, { "epoch": 0.51, "learning_rate": 4.918763231193991e-05, "loss": 2.5549, "step": 38975 }, { "epoch": 0.51, "learning_rate": 4.917742760282263e-05, "loss": 2.516, "step": 38980 }, { "epoch": 0.51, "learning_rate": 4.9167222927978295e-05, "loss": 2.606, "step": 38985 }, { "epoch": 0.51, "learning_rate": 4.9157018287832115e-05, "loss": 2.554, "step": 38990 }, { "epoch": 0.51, "learning_rate": 4.9146813682809235e-05, "loss": 2.4309, "step": 38995 }, { "epoch": 0.51, "learning_rate": 4.913660911333487e-05, "loss": 2.5968, "step": 39000 }, { "epoch": 0.51, "learning_rate": 4.9126404579834156e-05, "loss": 2.5315, "step": 39005 }, { "epoch": 0.51, "learning_rate": 4.91162000827323e-05, "loss": 2.666, "step": 39010 }, { "epoch": 0.51, "learning_rate": 4.910599562245448e-05, "loss": 2.474, "step": 39015 }, { "epoch": 0.51, "learning_rate": 4.909579119942586e-05, "loss": 2.5233, "step": 39020 }, { "epoch": 0.51, "learning_rate": 4.9085586814071634e-05, "loss": 2.5585, "step": 39025 }, { "epoch": 0.51, "learning_rate": 4.907538246681693e-05, "loss": 2.4677, "step": 39030 }, { "epoch": 0.51, "learning_rate": 4.9065178158086976e-05, "loss": 2.6523, "step": 39035 }, { "epoch": 0.51, "learning_rate": 4.905497388830689e-05, "loss": 2.5376, "step": 39040 }, { "epoch": 0.51, "learning_rate": 4.9044769657901844e-05, "loss": 2.5388, "step": 39045 }, { "epoch": 0.51, "learning_rate": 4.9034565467297036e-05, "loss": 2.4984, "step": 39050 }, { "epoch": 0.51, "learning_rate": 4.9024361316917605e-05, "loss": 2.6296, "step": 39055 }, { "epoch": 0.51, "learning_rate": 4.901415720718873e-05, "loss": 2.5495, "step": 39060 }, { "epoch": 0.51, "learning_rate": 4.9003953138535544e-05, "loss": 2.6181, "step": 39065 }, { "epoch": 0.51, "learning_rate": 4.8993749111383225e-05, "loss": 2.5693, "step": 39070 }, { "epoch": 0.51, "learning_rate": 4.8983545126156924e-05, "loss": 2.6143, "step": 39075 }, { "epoch": 0.51, "learning_rate": 4.8973341183281795e-05, "loss": 2.5821, "step": 39080 }, { "epoch": 0.51, "learning_rate": 4.8963137283183016e-05, "loss": 2.5106, "step": 39085 }, { "epoch": 0.51, "learning_rate": 4.895293342628569e-05, "loss": 2.571, "step": 39090 }, { "epoch": 0.51, "learning_rate": 4.894272961301502e-05, "loss": 2.4665, "step": 39095 }, { "epoch": 0.51, "learning_rate": 4.8932525843796104e-05, "loss": 2.621, "step": 39100 }, { "epoch": 0.51, "learning_rate": 4.8922322119054104e-05, "loss": 2.5772, "step": 39105 }, { "epoch": 0.51, "learning_rate": 4.891211843921418e-05, "loss": 2.5076, "step": 39110 }, { "epoch": 0.51, "learning_rate": 4.890191480470145e-05, "loss": 2.5767, "step": 39115 }, { "epoch": 0.51, "learning_rate": 4.8891711215941104e-05, "loss": 2.5929, "step": 39120 }, { "epoch": 0.51, "learning_rate": 4.8881507673358215e-05, "loss": 2.5541, "step": 39125 }, { "epoch": 0.51, "learning_rate": 4.887130417737795e-05, "loss": 2.6909, "step": 39130 }, { "epoch": 0.51, "learning_rate": 4.8861100728425464e-05, "loss": 2.5488, "step": 39135 }, { "epoch": 0.51, "learning_rate": 4.8850897326925846e-05, "loss": 2.7915, "step": 39140 }, { "epoch": 0.51, "learning_rate": 4.8840693973304264e-05, "loss": 2.5034, "step": 39145 }, { "epoch": 0.51, "learning_rate": 4.8830490667985814e-05, "loss": 2.4929, "step": 39150 }, { "epoch": 0.51, "learning_rate": 4.8820287411395664e-05, "loss": 2.5069, "step": 39155 }, { "epoch": 0.51, "learning_rate": 4.881008420395889e-05, "loss": 2.6168, "step": 39160 }, { "epoch": 0.51, "learning_rate": 4.879988104610065e-05, "loss": 2.5444, "step": 39165 }, { "epoch": 0.51, "learning_rate": 4.878967793824605e-05, "loss": 2.4823, "step": 39170 }, { "epoch": 0.51, "learning_rate": 4.877947488082021e-05, "loss": 2.512, "step": 39175 }, { "epoch": 0.51, "learning_rate": 4.8769271874248266e-05, "loss": 2.4483, "step": 39180 }, { "epoch": 0.51, "learning_rate": 4.87590689189553e-05, "loss": 2.5774, "step": 39185 }, { "epoch": 0.51, "learning_rate": 4.874886601536645e-05, "loss": 2.4992, "step": 39190 }, { "epoch": 0.51, "learning_rate": 4.87386631639068e-05, "loss": 2.5244, "step": 39195 }, { "epoch": 0.51, "learning_rate": 4.872846036500146e-05, "loss": 2.4658, "step": 39200 }, { "epoch": 0.51, "learning_rate": 4.871825761907557e-05, "loss": 2.5538, "step": 39205 }, { "epoch": 0.51, "learning_rate": 4.870805492655419e-05, "loss": 2.555, "step": 39210 }, { "epoch": 0.51, "learning_rate": 4.869785228786247e-05, "loss": 2.5949, "step": 39215 }, { "epoch": 0.51, "learning_rate": 4.8687649703425455e-05, "loss": 2.3738, "step": 39220 }, { "epoch": 0.51, "learning_rate": 4.867744717366827e-05, "loss": 2.5369, "step": 39225 }, { "epoch": 0.51, "learning_rate": 4.866724469901602e-05, "loss": 2.6033, "step": 39230 }, { "epoch": 0.51, "learning_rate": 4.8657042279893764e-05, "loss": 2.726, "step": 39235 }, { "epoch": 0.51, "learning_rate": 4.8646839916726625e-05, "loss": 2.4958, "step": 39240 }, { "epoch": 0.51, "learning_rate": 4.863663760993966e-05, "loss": 2.4539, "step": 39245 }, { "epoch": 0.51, "learning_rate": 4.8626435359957996e-05, "loss": 2.4707, "step": 39250 }, { "epoch": 0.51, "learning_rate": 4.861623316720666e-05, "loss": 2.4965, "step": 39255 }, { "epoch": 0.51, "learning_rate": 4.860603103211077e-05, "loss": 2.5049, "step": 39260 }, { "epoch": 0.51, "learning_rate": 4.859582895509541e-05, "loss": 2.4907, "step": 39265 }, { "epoch": 0.51, "learning_rate": 4.858562693658562e-05, "loss": 2.558, "step": 39270 }, { "epoch": 0.51, "learning_rate": 4.8575424977006516e-05, "loss": 2.513, "step": 39275 }, { "epoch": 0.51, "learning_rate": 4.856522307678313e-05, "loss": 2.6152, "step": 39280 }, { "epoch": 0.51, "learning_rate": 4.8555021236340545e-05, "loss": 2.5245, "step": 39285 }, { "epoch": 0.51, "learning_rate": 4.854481945610384e-05, "loss": 2.6988, "step": 39290 }, { "epoch": 0.51, "learning_rate": 4.853461773649805e-05, "loss": 2.602, "step": 39295 }, { "epoch": 0.51, "learning_rate": 4.8524416077948264e-05, "loss": 2.4758, "step": 39300 }, { "epoch": 0.51, "learning_rate": 4.851421448087952e-05, "loss": 2.6262, "step": 39305 }, { "epoch": 0.51, "learning_rate": 4.8504012945716895e-05, "loss": 2.5935, "step": 39310 }, { "epoch": 0.51, "learning_rate": 4.8493811472885406e-05, "loss": 2.5004, "step": 39315 }, { "epoch": 0.51, "learning_rate": 4.848361006281013e-05, "loss": 2.6516, "step": 39320 }, { "epoch": 0.51, "learning_rate": 4.847340871591612e-05, "loss": 2.4873, "step": 39325 }, { "epoch": 0.51, "learning_rate": 4.846320743262839e-05, "loss": 2.5345, "step": 39330 }, { "epoch": 0.51, "learning_rate": 4.8453006213372026e-05, "loss": 2.5777, "step": 39335 }, { "epoch": 0.51, "learning_rate": 4.844280505857202e-05, "loss": 2.5323, "step": 39340 }, { "epoch": 0.51, "learning_rate": 4.843260396865344e-05, "loss": 2.6975, "step": 39345 }, { "epoch": 0.51, "learning_rate": 4.842240294404133e-05, "loss": 2.4545, "step": 39350 }, { "epoch": 0.51, "learning_rate": 4.841220198516069e-05, "loss": 2.5084, "step": 39355 }, { "epoch": 0.51, "learning_rate": 4.840200109243657e-05, "loss": 2.5553, "step": 39360 }, { "epoch": 0.51, "learning_rate": 4.839180026629398e-05, "loss": 2.6243, "step": 39365 }, { "epoch": 0.51, "learning_rate": 4.838159950715797e-05, "loss": 2.4903, "step": 39370 }, { "epoch": 0.51, "learning_rate": 4.837139881545352e-05, "loss": 2.4931, "step": 39375 }, { "epoch": 0.51, "learning_rate": 4.836119819160568e-05, "loss": 2.5659, "step": 39380 }, { "epoch": 0.51, "learning_rate": 4.8350997636039476e-05, "loss": 2.5215, "step": 39385 }, { "epoch": 0.51, "learning_rate": 4.834079714917987e-05, "loss": 2.5529, "step": 39390 }, { "epoch": 0.51, "learning_rate": 4.833059673145192e-05, "loss": 2.5732, "step": 39395 }, { "epoch": 0.51, "learning_rate": 4.8320396383280594e-05, "loss": 2.5626, "step": 39400 }, { "epoch": 0.51, "learning_rate": 4.8310196105090944e-05, "loss": 2.5059, "step": 39405 }, { "epoch": 0.51, "learning_rate": 4.829999589730791e-05, "loss": 2.6023, "step": 39410 }, { "epoch": 0.51, "learning_rate": 4.828979576035653e-05, "loss": 2.5203, "step": 39415 }, { "epoch": 0.51, "learning_rate": 4.8279595694661814e-05, "loss": 2.4787, "step": 39420 }, { "epoch": 0.51, "learning_rate": 4.8269395700648695e-05, "loss": 2.3798, "step": 39425 }, { "epoch": 0.51, "learning_rate": 4.825919577874221e-05, "loss": 2.5287, "step": 39430 }, { "epoch": 0.51, "learning_rate": 4.824899592936732e-05, "loss": 2.5675, "step": 39435 }, { "epoch": 0.51, "learning_rate": 4.8238796152949016e-05, "loss": 2.6012, "step": 39440 }, { "epoch": 0.51, "learning_rate": 4.822859644991231e-05, "loss": 2.565, "step": 39445 }, { "epoch": 0.51, "learning_rate": 4.821839682068211e-05, "loss": 2.5068, "step": 39450 }, { "epoch": 0.51, "learning_rate": 4.820819726568344e-05, "loss": 2.5652, "step": 39455 }, { "epoch": 0.51, "learning_rate": 4.8197997785341254e-05, "loss": 2.5477, "step": 39460 }, { "epoch": 0.51, "learning_rate": 4.818779838008054e-05, "loss": 2.5476, "step": 39465 }, { "epoch": 0.51, "learning_rate": 4.817759905032622e-05, "loss": 2.5451, "step": 39470 }, { "epoch": 0.51, "learning_rate": 4.8167399796503284e-05, "loss": 2.5519, "step": 39475 }, { "epoch": 0.51, "learning_rate": 4.81572006190367e-05, "loss": 2.6119, "step": 39480 }, { "epoch": 0.51, "learning_rate": 4.8147001518351395e-05, "loss": 2.6113, "step": 39485 }, { "epoch": 0.51, "learning_rate": 4.8136802494872333e-05, "loss": 2.4714, "step": 39490 }, { "epoch": 0.51, "learning_rate": 4.8126603549024465e-05, "loss": 2.5674, "step": 39495 }, { "epoch": 0.51, "learning_rate": 4.8116404681232716e-05, "loss": 2.5662, "step": 39500 }, { "epoch": 0.51, "learning_rate": 4.810620589192208e-05, "loss": 2.5515, "step": 39505 }, { "epoch": 0.51, "learning_rate": 4.8096007181517433e-05, "loss": 2.4491, "step": 39510 }, { "epoch": 0.51, "learning_rate": 4.8085808550443746e-05, "loss": 2.4817, "step": 39515 }, { "epoch": 0.51, "learning_rate": 4.807560999912594e-05, "loss": 2.4334, "step": 39520 }, { "epoch": 0.51, "learning_rate": 4.8065411527988954e-05, "loss": 2.7105, "step": 39525 }, { "epoch": 0.51, "learning_rate": 4.805521313745768e-05, "loss": 2.577, "step": 39530 }, { "epoch": 0.51, "learning_rate": 4.804501482795708e-05, "loss": 2.6298, "step": 39535 }, { "epoch": 0.51, "learning_rate": 4.803481659991207e-05, "loss": 2.6089, "step": 39540 }, { "epoch": 0.51, "learning_rate": 4.802461845374753e-05, "loss": 2.5568, "step": 39545 }, { "epoch": 0.51, "learning_rate": 4.8014420389888405e-05, "loss": 2.461, "step": 39550 }, { "epoch": 0.51, "learning_rate": 4.800422240875958e-05, "loss": 2.4917, "step": 39555 }, { "epoch": 0.51, "learning_rate": 4.799402451078597e-05, "loss": 2.5203, "step": 39560 }, { "epoch": 0.51, "learning_rate": 4.7983826696392506e-05, "loss": 2.5754, "step": 39565 }, { "epoch": 0.51, "learning_rate": 4.7973628966004025e-05, "loss": 2.5272, "step": 39570 }, { "epoch": 0.51, "learning_rate": 4.7963431320045484e-05, "loss": 2.6604, "step": 39575 }, { "epoch": 0.51, "learning_rate": 4.7953233758941714e-05, "loss": 2.6333, "step": 39580 }, { "epoch": 0.51, "learning_rate": 4.794303628311764e-05, "loss": 2.5333, "step": 39585 }, { "epoch": 0.51, "learning_rate": 4.793283889299814e-05, "loss": 2.5028, "step": 39590 }, { "epoch": 0.51, "learning_rate": 4.7922641589008077e-05, "loss": 2.6163, "step": 39595 }, { "epoch": 0.51, "learning_rate": 4.7912444371572374e-05, "loss": 2.501, "step": 39600 }, { "epoch": 0.51, "learning_rate": 4.790224724111584e-05, "loss": 2.6099, "step": 39605 }, { "epoch": 0.51, "learning_rate": 4.789205019806339e-05, "loss": 2.4486, "step": 39610 }, { "epoch": 0.51, "learning_rate": 4.788185324283987e-05, "loss": 2.577, "step": 39615 }, { "epoch": 0.51, "learning_rate": 4.787165637587017e-05, "loss": 2.5896, "step": 39620 }, { "epoch": 0.51, "learning_rate": 4.78614595975791e-05, "loss": 2.4911, "step": 39625 }, { "epoch": 0.51, "learning_rate": 4.7851262908391536e-05, "loss": 2.6749, "step": 39630 }, { "epoch": 0.51, "learning_rate": 4.784106630873236e-05, "loss": 2.4563, "step": 39635 }, { "epoch": 0.51, "learning_rate": 4.783086979902637e-05, "loss": 2.4801, "step": 39640 }, { "epoch": 0.51, "learning_rate": 4.782067337969844e-05, "loss": 2.5698, "step": 39645 }, { "epoch": 0.51, "learning_rate": 4.78104770511734e-05, "loss": 2.4779, "step": 39650 }, { "epoch": 0.51, "learning_rate": 4.780028081387608e-05, "loss": 2.5079, "step": 39655 }, { "epoch": 0.51, "learning_rate": 4.779008466823134e-05, "loss": 2.6503, "step": 39660 }, { "epoch": 0.51, "learning_rate": 4.777988861466397e-05, "loss": 2.563, "step": 39665 }, { "epoch": 0.51, "learning_rate": 4.776969265359883e-05, "loss": 2.6864, "step": 39670 }, { "epoch": 0.51, "learning_rate": 4.7759496785460704e-05, "loss": 2.6366, "step": 39675 }, { "epoch": 0.51, "learning_rate": 4.7749301010674434e-05, "loss": 2.463, "step": 39680 }, { "epoch": 0.52, "learning_rate": 4.7739105329664815e-05, "loss": 2.461, "step": 39685 }, { "epoch": 0.52, "learning_rate": 4.772890974285668e-05, "loss": 2.6499, "step": 39690 }, { "epoch": 0.52, "learning_rate": 4.7718714250674826e-05, "loss": 2.5922, "step": 39695 }, { "epoch": 0.52, "learning_rate": 4.770851885354404e-05, "loss": 2.549, "step": 39700 }, { "epoch": 0.52, "learning_rate": 4.769832355188913e-05, "loss": 2.6224, "step": 39705 }, { "epoch": 0.52, "learning_rate": 4.768812834613488e-05, "loss": 2.495, "step": 39710 }, { "epoch": 0.52, "learning_rate": 4.76779332367061e-05, "loss": 2.499, "step": 39715 }, { "epoch": 0.52, "learning_rate": 4.766773822402755e-05, "loss": 2.4978, "step": 39720 }, { "epoch": 0.52, "learning_rate": 4.765754330852402e-05, "loss": 2.4923, "step": 39725 }, { "epoch": 0.52, "learning_rate": 4.764734849062031e-05, "loss": 2.4921, "step": 39730 }, { "epoch": 0.52, "learning_rate": 4.7637153770741154e-05, "loss": 2.5241, "step": 39735 }, { "epoch": 0.52, "learning_rate": 4.762695914931135e-05, "loss": 2.6192, "step": 39740 }, { "epoch": 0.52, "learning_rate": 4.7616764626755635e-05, "loss": 2.5266, "step": 39745 }, { "epoch": 0.52, "learning_rate": 4.760657020349879e-05, "loss": 2.5922, "step": 39750 }, { "epoch": 0.52, "learning_rate": 4.759637587996559e-05, "loss": 2.6519, "step": 39755 }, { "epoch": 0.52, "learning_rate": 4.758618165658074e-05, "loss": 2.6483, "step": 39760 }, { "epoch": 0.52, "learning_rate": 4.757598753376904e-05, "loss": 2.6101, "step": 39765 }, { "epoch": 0.52, "learning_rate": 4.756579351195518e-05, "loss": 2.5483, "step": 39770 }, { "epoch": 0.52, "learning_rate": 4.7555599591563934e-05, "loss": 2.671, "step": 39775 }, { "epoch": 0.52, "learning_rate": 4.7545405773020036e-05, "loss": 2.5626, "step": 39780 }, { "epoch": 0.52, "learning_rate": 4.7535212056748204e-05, "loss": 2.4451, "step": 39785 }, { "epoch": 0.52, "learning_rate": 4.7525018443173194e-05, "loss": 2.5651, "step": 39790 }, { "epoch": 0.52, "learning_rate": 4.751482493271968e-05, "loss": 2.424, "step": 39795 }, { "epoch": 0.52, "learning_rate": 4.750463152581242e-05, "loss": 2.3738, "step": 39800 }, { "epoch": 0.52, "learning_rate": 4.749443822287612e-05, "loss": 2.6145, "step": 39805 }, { "epoch": 0.52, "learning_rate": 4.748424502433547e-05, "loss": 2.5819, "step": 39810 }, { "epoch": 0.52, "learning_rate": 4.7474051930615224e-05, "loss": 2.5129, "step": 39815 }, { "epoch": 0.52, "learning_rate": 4.7463858942140026e-05, "loss": 2.4528, "step": 39820 }, { "epoch": 0.52, "learning_rate": 4.745366605933462e-05, "loss": 2.653, "step": 39825 }, { "epoch": 0.52, "learning_rate": 4.744347328262365e-05, "loss": 2.609, "step": 39830 }, { "epoch": 0.52, "learning_rate": 4.743328061243184e-05, "loss": 2.5328, "step": 39835 }, { "epoch": 0.52, "learning_rate": 4.742308804918385e-05, "loss": 2.6753, "step": 39840 }, { "epoch": 0.52, "learning_rate": 4.741289559330438e-05, "loss": 2.5283, "step": 39845 }, { "epoch": 0.52, "learning_rate": 4.740270324521812e-05, "loss": 2.5483, "step": 39850 }, { "epoch": 0.52, "learning_rate": 4.7392511005349685e-05, "loss": 2.4103, "step": 39855 }, { "epoch": 0.52, "learning_rate": 4.7382318874123796e-05, "loss": 2.6013, "step": 39860 }, { "epoch": 0.52, "learning_rate": 4.737212685196507e-05, "loss": 2.5232, "step": 39865 }, { "epoch": 0.52, "learning_rate": 4.736193493929818e-05, "loss": 2.6449, "step": 39870 }, { "epoch": 0.52, "learning_rate": 4.7351743136547796e-05, "loss": 2.5805, "step": 39875 }, { "epoch": 0.52, "learning_rate": 4.734155144413854e-05, "loss": 2.5761, "step": 39880 }, { "epoch": 0.52, "learning_rate": 4.7331359862495087e-05, "loss": 2.496, "step": 39885 }, { "epoch": 0.52, "learning_rate": 4.732116839204203e-05, "loss": 2.5379, "step": 39890 }, { "epoch": 0.52, "learning_rate": 4.731097703320404e-05, "loss": 2.5135, "step": 39895 }, { "epoch": 0.52, "learning_rate": 4.730078578640572e-05, "loss": 2.5897, "step": 39900 }, { "epoch": 0.52, "learning_rate": 4.72905946520717e-05, "loss": 2.512, "step": 39905 }, { "epoch": 0.52, "learning_rate": 4.728040363062664e-05, "loss": 2.5113, "step": 39910 }, { "epoch": 0.52, "learning_rate": 4.727021272249508e-05, "loss": 2.641, "step": 39915 }, { "epoch": 0.52, "learning_rate": 4.726002192810171e-05, "loss": 2.5128, "step": 39920 }, { "epoch": 0.52, "learning_rate": 4.7249831247871054e-05, "loss": 2.5751, "step": 39925 }, { "epoch": 0.52, "learning_rate": 4.723964068222777e-05, "loss": 2.5261, "step": 39930 }, { "epoch": 0.52, "learning_rate": 4.722945023159644e-05, "loss": 2.5505, "step": 39935 }, { "epoch": 0.52, "learning_rate": 4.7219259896401644e-05, "loss": 2.5579, "step": 39940 }, { "epoch": 0.52, "learning_rate": 4.7209069677068004e-05, "loss": 2.695, "step": 39945 }, { "epoch": 0.52, "learning_rate": 4.719887957402004e-05, "loss": 2.6338, "step": 39950 }, { "epoch": 0.52, "learning_rate": 4.71886895876824e-05, "loss": 2.693, "step": 39955 }, { "epoch": 0.52, "learning_rate": 4.717849971847958e-05, "loss": 2.5343, "step": 39960 }, { "epoch": 0.52, "learning_rate": 4.71683099668362e-05, "loss": 2.5245, "step": 39965 }, { "epoch": 0.52, "learning_rate": 4.715812033317681e-05, "loss": 2.5677, "step": 39970 }, { "epoch": 0.52, "learning_rate": 4.714793081792595e-05, "loss": 2.4752, "step": 39975 }, { "epoch": 0.52, "learning_rate": 4.7137741421508206e-05, "loss": 2.5064, "step": 39980 }, { "epoch": 0.52, "learning_rate": 4.712755214434809e-05, "loss": 2.3754, "step": 39985 }, { "epoch": 0.52, "learning_rate": 4.711736298687016e-05, "loss": 2.4425, "step": 39990 }, { "epoch": 0.52, "learning_rate": 4.710717394949896e-05, "loss": 2.6217, "step": 39995 }, { "epoch": 0.52, "learning_rate": 4.7096985032658994e-05, "loss": 2.5805, "step": 40000 }, { "epoch": 0.52, "learning_rate": 4.708679623677484e-05, "loss": 2.5903, "step": 40005 }, { "epoch": 0.52, "learning_rate": 4.707660756227096e-05, "loss": 2.6064, "step": 40010 }, { "epoch": 0.52, "learning_rate": 4.706641900957193e-05, "loss": 2.4619, "step": 40015 }, { "epoch": 0.52, "learning_rate": 4.70562305791022e-05, "loss": 2.5968, "step": 40020 }, { "epoch": 0.52, "learning_rate": 4.704604227128632e-05, "loss": 2.5799, "step": 40025 }, { "epoch": 0.52, "learning_rate": 4.7035854086548785e-05, "loss": 2.4573, "step": 40030 }, { "epoch": 0.52, "learning_rate": 4.702566602531408e-05, "loss": 2.4729, "step": 40035 }, { "epoch": 0.52, "learning_rate": 4.701547808800672e-05, "loss": 2.5444, "step": 40040 }, { "epoch": 0.52, "learning_rate": 4.7005290275051156e-05, "loss": 2.5336, "step": 40045 }, { "epoch": 0.52, "learning_rate": 4.6995102586871906e-05, "loss": 2.4731, "step": 40050 }, { "epoch": 0.52, "learning_rate": 4.69849150238934e-05, "loss": 2.5048, "step": 40055 }, { "epoch": 0.52, "learning_rate": 4.697472758654015e-05, "loss": 2.5976, "step": 40060 }, { "epoch": 0.52, "learning_rate": 4.696454027523661e-05, "loss": 2.4987, "step": 40065 }, { "epoch": 0.52, "learning_rate": 4.695435309040723e-05, "loss": 2.5233, "step": 40070 }, { "epoch": 0.52, "learning_rate": 4.6944166032476494e-05, "loss": 2.5441, "step": 40075 }, { "epoch": 0.52, "learning_rate": 4.69339791018688e-05, "loss": 2.5736, "step": 40080 }, { "epoch": 0.52, "learning_rate": 4.692379229900863e-05, "loss": 2.5923, "step": 40085 }, { "epoch": 0.52, "learning_rate": 4.691360562432043e-05, "loss": 2.572, "step": 40090 }, { "epoch": 0.52, "learning_rate": 4.69034190782286e-05, "loss": 2.5536, "step": 40095 }, { "epoch": 0.52, "learning_rate": 4.689323266115761e-05, "loss": 2.5288, "step": 40100 }, { "epoch": 0.52, "learning_rate": 4.6883046373531844e-05, "loss": 2.4225, "step": 40105 }, { "epoch": 0.52, "learning_rate": 4.6872860215775755e-05, "loss": 2.5145, "step": 40110 }, { "epoch": 0.52, "learning_rate": 4.686267418831371e-05, "loss": 2.5847, "step": 40115 }, { "epoch": 0.52, "learning_rate": 4.6852488291570146e-05, "loss": 2.5459, "step": 40120 }, { "epoch": 0.52, "learning_rate": 4.684230252596947e-05, "loss": 2.5703, "step": 40125 }, { "epoch": 0.52, "learning_rate": 4.683211689193605e-05, "loss": 2.5068, "step": 40130 }, { "epoch": 0.52, "learning_rate": 4.6821931389894325e-05, "loss": 2.5149, "step": 40135 }, { "epoch": 0.52, "learning_rate": 4.681174602026862e-05, "loss": 2.4685, "step": 40140 }, { "epoch": 0.52, "learning_rate": 4.6801560783483345e-05, "loss": 2.4801, "step": 40145 }, { "epoch": 0.52, "learning_rate": 4.679137567996289e-05, "loss": 2.5419, "step": 40150 }, { "epoch": 0.52, "learning_rate": 4.6781190710131584e-05, "loss": 2.6344, "step": 40155 }, { "epoch": 0.52, "learning_rate": 4.6771005874413826e-05, "loss": 2.5559, "step": 40160 }, { "epoch": 0.52, "learning_rate": 4.676082117323394e-05, "loss": 2.5614, "step": 40165 }, { "epoch": 0.52, "learning_rate": 4.675063660701632e-05, "loss": 2.5177, "step": 40170 }, { "epoch": 0.52, "learning_rate": 4.6740452176185265e-05, "loss": 2.435, "step": 40175 }, { "epoch": 0.52, "learning_rate": 4.6730267881165134e-05, "loss": 2.4936, "step": 40180 }, { "epoch": 0.52, "learning_rate": 4.672008372238028e-05, "loss": 2.5029, "step": 40185 }, { "epoch": 0.52, "learning_rate": 4.6709899700254994e-05, "loss": 2.4572, "step": 40190 }, { "epoch": 0.52, "learning_rate": 4.669971581521365e-05, "loss": 2.5616, "step": 40195 }, { "epoch": 0.52, "learning_rate": 4.6689532067680516e-05, "loss": 2.5434, "step": 40200 }, { "epoch": 0.52, "learning_rate": 4.667934845807992e-05, "loss": 2.5377, "step": 40205 }, { "epoch": 0.52, "learning_rate": 4.6669164986836194e-05, "loss": 2.5085, "step": 40210 }, { "epoch": 0.52, "learning_rate": 4.66589816543736e-05, "loss": 2.6121, "step": 40215 }, { "epoch": 0.52, "learning_rate": 4.664879846111646e-05, "loss": 2.5342, "step": 40220 }, { "epoch": 0.52, "learning_rate": 4.663861540748903e-05, "loss": 2.5703, "step": 40225 }, { "epoch": 0.52, "learning_rate": 4.662843249391564e-05, "loss": 2.4072, "step": 40230 }, { "epoch": 0.52, "learning_rate": 4.661824972082052e-05, "loss": 2.6761, "step": 40235 }, { "epoch": 0.52, "learning_rate": 4.660806708862796e-05, "loss": 2.5963, "step": 40240 }, { "epoch": 0.52, "learning_rate": 4.6597884597762257e-05, "loss": 2.4851, "step": 40245 }, { "epoch": 0.52, "learning_rate": 4.6587702248647606e-05, "loss": 2.6456, "step": 40250 }, { "epoch": 0.52, "learning_rate": 4.657752004170831e-05, "loss": 2.5468, "step": 40255 }, { "epoch": 0.52, "learning_rate": 4.656733797736859e-05, "loss": 2.3167, "step": 40260 }, { "epoch": 0.52, "learning_rate": 4.6557156056052725e-05, "loss": 2.618, "step": 40265 }, { "epoch": 0.52, "learning_rate": 4.6546974278184894e-05, "loss": 2.6153, "step": 40270 }, { "epoch": 0.52, "learning_rate": 4.653679264418937e-05, "loss": 2.5773, "step": 40275 }, { "epoch": 0.52, "learning_rate": 4.6526611154490366e-05, "loss": 2.5704, "step": 40280 }, { "epoch": 0.52, "learning_rate": 4.6516429809512085e-05, "loss": 2.5985, "step": 40285 }, { "epoch": 0.52, "learning_rate": 4.6506248609678774e-05, "loss": 2.6433, "step": 40290 }, { "epoch": 0.52, "learning_rate": 4.6496067555414594e-05, "loss": 2.55, "step": 40295 }, { "epoch": 0.52, "learning_rate": 4.6485886647143766e-05, "loss": 2.5518, "step": 40300 }, { "epoch": 0.52, "learning_rate": 4.6475705885290505e-05, "loss": 2.5747, "step": 40305 }, { "epoch": 0.52, "learning_rate": 4.6465525270278956e-05, "loss": 2.5524, "step": 40310 }, { "epoch": 0.52, "learning_rate": 4.645534480253333e-05, "loss": 2.573, "step": 40315 }, { "epoch": 0.52, "learning_rate": 4.6445164482477775e-05, "loss": 2.5192, "step": 40320 }, { "epoch": 0.52, "learning_rate": 4.64349843105365e-05, "loss": 2.564, "step": 40325 }, { "epoch": 0.52, "learning_rate": 4.642480428713363e-05, "loss": 2.511, "step": 40330 }, { "epoch": 0.52, "learning_rate": 4.6414624412693344e-05, "loss": 2.6071, "step": 40335 }, { "epoch": 0.52, "learning_rate": 4.6404444687639784e-05, "loss": 2.4886, "step": 40340 }, { "epoch": 0.52, "learning_rate": 4.639426511239709e-05, "loss": 2.519, "step": 40345 }, { "epoch": 0.52, "learning_rate": 4.6384085687389416e-05, "loss": 2.4298, "step": 40350 }, { "epoch": 0.52, "learning_rate": 4.637390641304087e-05, "loss": 2.6202, "step": 40355 }, { "epoch": 0.52, "learning_rate": 4.636372728977558e-05, "loss": 2.4187, "step": 40360 }, { "epoch": 0.52, "learning_rate": 4.635354831801771e-05, "loss": 2.5496, "step": 40365 }, { "epoch": 0.52, "learning_rate": 4.634336949819131e-05, "loss": 2.5108, "step": 40370 }, { "epoch": 0.52, "learning_rate": 4.633319083072052e-05, "loss": 2.528, "step": 40375 }, { "epoch": 0.52, "learning_rate": 4.6323012316029425e-05, "loss": 2.6509, "step": 40380 }, { "epoch": 0.52, "learning_rate": 4.631283395454215e-05, "loss": 2.6031, "step": 40385 }, { "epoch": 0.52, "learning_rate": 4.630265574668274e-05, "loss": 2.6572, "step": 40390 }, { "epoch": 0.52, "learning_rate": 4.629247769287529e-05, "loss": 2.5986, "step": 40395 }, { "epoch": 0.52, "learning_rate": 4.628229979354391e-05, "loss": 2.6807, "step": 40400 }, { "epoch": 0.52, "learning_rate": 4.627212204911261e-05, "loss": 2.6192, "step": 40405 }, { "epoch": 0.52, "learning_rate": 4.626194446000549e-05, "loss": 2.4282, "step": 40410 }, { "epoch": 0.52, "learning_rate": 4.6251767026646585e-05, "loss": 2.5301, "step": 40415 }, { "epoch": 0.52, "learning_rate": 4.6241589749459954e-05, "loss": 2.5328, "step": 40420 }, { "epoch": 0.52, "learning_rate": 4.6231412628869656e-05, "loss": 2.5353, "step": 40425 }, { "epoch": 0.52, "learning_rate": 4.622123566529969e-05, "loss": 2.521, "step": 40430 }, { "epoch": 0.52, "learning_rate": 4.6211058859174115e-05, "loss": 2.4544, "step": 40435 }, { "epoch": 0.52, "learning_rate": 4.620088221091694e-05, "loss": 2.5619, "step": 40440 }, { "epoch": 0.52, "learning_rate": 4.6190705720952186e-05, "loss": 2.5096, "step": 40445 }, { "epoch": 0.52, "learning_rate": 4.618052938970385e-05, "loss": 2.5845, "step": 40450 }, { "epoch": 0.53, "learning_rate": 4.617035321759593e-05, "loss": 2.5649, "step": 40455 }, { "epoch": 0.53, "learning_rate": 4.6160177205052476e-05, "loss": 2.5589, "step": 40460 }, { "epoch": 0.53, "learning_rate": 4.615000135249741e-05, "loss": 2.6862, "step": 40465 }, { "epoch": 0.53, "learning_rate": 4.613982566035475e-05, "loss": 2.5052, "step": 40470 }, { "epoch": 0.53, "learning_rate": 4.6129650129048454e-05, "loss": 2.5369, "step": 40475 }, { "epoch": 0.53, "learning_rate": 4.611947475900252e-05, "loss": 2.5072, "step": 40480 }, { "epoch": 0.53, "learning_rate": 4.610929955064088e-05, "loss": 2.5013, "step": 40485 }, { "epoch": 0.53, "learning_rate": 4.609912450438749e-05, "loss": 2.5423, "step": 40490 }, { "epoch": 0.53, "learning_rate": 4.6088949620666346e-05, "loss": 2.5874, "step": 40495 }, { "epoch": 0.53, "learning_rate": 4.607877489990132e-05, "loss": 2.5935, "step": 40500 }, { "epoch": 0.53, "learning_rate": 4.60686003425164e-05, "loss": 2.6206, "step": 40505 }, { "epoch": 0.53, "learning_rate": 4.60584259489355e-05, "loss": 2.5271, "step": 40510 }, { "epoch": 0.53, "learning_rate": 4.6048251719582526e-05, "loss": 2.7003, "step": 40515 }, { "epoch": 0.53, "learning_rate": 4.603807765488143e-05, "loss": 2.5344, "step": 40520 }, { "epoch": 0.53, "learning_rate": 4.6027903755256075e-05, "loss": 2.5211, "step": 40525 }, { "epoch": 0.53, "learning_rate": 4.6017730021130396e-05, "loss": 2.5474, "step": 40530 }, { "epoch": 0.53, "learning_rate": 4.6007556452928266e-05, "loss": 2.655, "step": 40535 }, { "epoch": 0.53, "learning_rate": 4.59973830510736e-05, "loss": 2.6531, "step": 40540 }, { "epoch": 0.53, "learning_rate": 4.598720981599024e-05, "loss": 2.6041, "step": 40545 }, { "epoch": 0.53, "learning_rate": 4.597703674810209e-05, "loss": 2.5385, "step": 40550 }, { "epoch": 0.53, "learning_rate": 4.596686384783302e-05, "loss": 2.6251, "step": 40555 }, { "epoch": 0.53, "learning_rate": 4.5956691115606853e-05, "loss": 2.4861, "step": 40560 }, { "epoch": 0.53, "learning_rate": 4.594651855184748e-05, "loss": 2.4587, "step": 40565 }, { "epoch": 0.53, "learning_rate": 4.593634615697873e-05, "loss": 2.5917, "step": 40570 }, { "epoch": 0.53, "learning_rate": 4.592617393142443e-05, "loss": 2.4898, "step": 40575 }, { "epoch": 0.53, "learning_rate": 4.591600187560846e-05, "loss": 2.5581, "step": 40580 }, { "epoch": 0.53, "learning_rate": 4.590582998995459e-05, "loss": 2.5346, "step": 40585 }, { "epoch": 0.53, "learning_rate": 4.589565827488667e-05, "loss": 2.6415, "step": 40590 }, { "epoch": 0.53, "learning_rate": 4.588548673082848e-05, "loss": 2.5546, "step": 40595 }, { "epoch": 0.53, "learning_rate": 4.587531535820385e-05, "loss": 2.4, "step": 40600 }, { "epoch": 0.53, "learning_rate": 4.586514415743656e-05, "loss": 2.4, "step": 40605 }, { "epoch": 0.53, "learning_rate": 4.58549731289504e-05, "loss": 2.6127, "step": 40610 }, { "epoch": 0.53, "learning_rate": 4.584480227316919e-05, "loss": 2.5839, "step": 40615 }, { "epoch": 0.53, "learning_rate": 4.5834631590516644e-05, "loss": 2.6376, "step": 40620 }, { "epoch": 0.53, "learning_rate": 4.5824461081416564e-05, "loss": 2.533, "step": 40625 }, { "epoch": 0.53, "learning_rate": 4.5814290746292695e-05, "loss": 2.4265, "step": 40630 }, { "epoch": 0.53, "learning_rate": 4.58041205855688e-05, "loss": 2.544, "step": 40635 }, { "epoch": 0.53, "learning_rate": 4.5793950599668656e-05, "loss": 2.6053, "step": 40640 }, { "epoch": 0.53, "learning_rate": 4.578378078901593e-05, "loss": 2.4631, "step": 40645 }, { "epoch": 0.53, "learning_rate": 4.577361115403443e-05, "loss": 2.5841, "step": 40650 }, { "epoch": 0.53, "learning_rate": 4.5763441695147805e-05, "loss": 2.6415, "step": 40655 }, { "epoch": 0.53, "learning_rate": 4.575327241277983e-05, "loss": 2.5929, "step": 40660 }, { "epoch": 0.53, "learning_rate": 4.574310330735417e-05, "loss": 2.6024, "step": 40665 }, { "epoch": 0.53, "learning_rate": 4.5732934379294554e-05, "loss": 2.3878, "step": 40670 }, { "epoch": 0.53, "learning_rate": 4.57227656290247e-05, "loss": 2.543, "step": 40675 }, { "epoch": 0.53, "learning_rate": 4.571259705696823e-05, "loss": 2.5509, "step": 40680 }, { "epoch": 0.53, "learning_rate": 4.570242866354889e-05, "loss": 2.5332, "step": 40685 }, { "epoch": 0.53, "learning_rate": 4.569226044919029e-05, "loss": 2.5384, "step": 40690 }, { "epoch": 0.53, "learning_rate": 4.568209241431614e-05, "loss": 2.5881, "step": 40695 }, { "epoch": 0.53, "learning_rate": 4.5671924559350077e-05, "loss": 2.4954, "step": 40700 }, { "epoch": 0.53, "learning_rate": 4.5661756884715746e-05, "loss": 2.5352, "step": 40705 }, { "epoch": 0.53, "learning_rate": 4.565158939083682e-05, "loss": 2.4612, "step": 40710 }, { "epoch": 0.53, "learning_rate": 4.56414220781369e-05, "loss": 2.4515, "step": 40715 }, { "epoch": 0.53, "learning_rate": 4.563125494703963e-05, "loss": 2.5562, "step": 40720 }, { "epoch": 0.53, "learning_rate": 4.5621087997968615e-05, "loss": 2.4613, "step": 40725 }, { "epoch": 0.53, "learning_rate": 4.561092123134747e-05, "loss": 2.4758, "step": 40730 }, { "epoch": 0.53, "learning_rate": 4.560075464759983e-05, "loss": 2.3907, "step": 40735 }, { "epoch": 0.53, "learning_rate": 4.559058824714925e-05, "loss": 2.641, "step": 40740 }, { "epoch": 0.53, "learning_rate": 4.5580422030419354e-05, "loss": 2.4181, "step": 40745 }, { "epoch": 0.53, "learning_rate": 4.5570255997833675e-05, "loss": 2.624, "step": 40750 }, { "epoch": 0.53, "learning_rate": 4.556009014981584e-05, "loss": 2.5498, "step": 40755 }, { "epoch": 0.53, "learning_rate": 4.5549924486789375e-05, "loss": 2.4977, "step": 40760 }, { "epoch": 0.53, "learning_rate": 4.5539759009177855e-05, "loss": 2.7218, "step": 40765 }, { "epoch": 0.53, "learning_rate": 4.552959371740485e-05, "loss": 2.5534, "step": 40770 }, { "epoch": 0.53, "learning_rate": 4.5519428611893857e-05, "loss": 2.6378, "step": 40775 }, { "epoch": 0.53, "learning_rate": 4.550926369306847e-05, "loss": 2.4599, "step": 40780 }, { "epoch": 0.53, "learning_rate": 4.5499098961352147e-05, "loss": 2.6063, "step": 40785 }, { "epoch": 0.53, "learning_rate": 4.548893441716845e-05, "loss": 2.4891, "step": 40790 }, { "epoch": 0.53, "learning_rate": 4.547877006094089e-05, "loss": 2.5584, "step": 40795 }, { "epoch": 0.53, "learning_rate": 4.546860589309296e-05, "loss": 2.5732, "step": 40800 }, { "epoch": 0.53, "learning_rate": 4.545844191404818e-05, "loss": 2.4311, "step": 40805 }, { "epoch": 0.53, "learning_rate": 4.5448278124229995e-05, "loss": 2.6149, "step": 40810 }, { "epoch": 0.53, "learning_rate": 4.543811452406191e-05, "loss": 2.5228, "step": 40815 }, { "epoch": 0.53, "learning_rate": 4.54279511139674e-05, "loss": 2.4378, "step": 40820 }, { "epoch": 0.53, "learning_rate": 4.541778789436992e-05, "loss": 2.5518, "step": 40825 }, { "epoch": 0.53, "learning_rate": 4.540762486569295e-05, "loss": 2.3612, "step": 40830 }, { "epoch": 0.53, "learning_rate": 4.53974620283599e-05, "loss": 2.4901, "step": 40835 }, { "epoch": 0.53, "learning_rate": 4.538729938279425e-05, "loss": 2.5991, "step": 40840 }, { "epoch": 0.53, "learning_rate": 4.53771369294194e-05, "loss": 2.5615, "step": 40845 }, { "epoch": 0.53, "learning_rate": 4.5366974668658776e-05, "loss": 2.5769, "step": 40850 }, { "epoch": 0.53, "learning_rate": 4.535681260093582e-05, "loss": 2.6817, "step": 40855 }, { "epoch": 0.53, "learning_rate": 4.534665072667391e-05, "loss": 2.7036, "step": 40860 }, { "epoch": 0.53, "learning_rate": 4.533648904629649e-05, "loss": 2.4022, "step": 40865 }, { "epoch": 0.53, "learning_rate": 4.5326327560226894e-05, "loss": 2.4951, "step": 40870 }, { "epoch": 0.53, "learning_rate": 4.531616626888857e-05, "loss": 2.6371, "step": 40875 }, { "epoch": 0.53, "learning_rate": 4.530600517270483e-05, "loss": 2.5834, "step": 40880 }, { "epoch": 0.53, "learning_rate": 4.5295844272099076e-05, "loss": 2.4875, "step": 40885 }, { "epoch": 0.53, "learning_rate": 4.5285683567494666e-05, "loss": 2.5735, "step": 40890 }, { "epoch": 0.53, "learning_rate": 4.527552305931495e-05, "loss": 2.6343, "step": 40895 }, { "epoch": 0.53, "learning_rate": 4.526536274798329e-05, "loss": 2.4411, "step": 40900 }, { "epoch": 0.53, "learning_rate": 4.525520263392298e-05, "loss": 2.7544, "step": 40905 }, { "epoch": 0.53, "learning_rate": 4.524504271755738e-05, "loss": 2.4784, "step": 40910 }, { "epoch": 0.53, "learning_rate": 4.5234882999309786e-05, "loss": 2.5371, "step": 40915 }, { "epoch": 0.53, "learning_rate": 4.522472347960352e-05, "loss": 2.5871, "step": 40920 }, { "epoch": 0.53, "learning_rate": 4.5214564158861904e-05, "loss": 2.5923, "step": 40925 }, { "epoch": 0.53, "learning_rate": 4.5204405037508195e-05, "loss": 2.7052, "step": 40930 }, { "epoch": 0.53, "learning_rate": 4.5194246115965716e-05, "loss": 2.5453, "step": 40935 }, { "epoch": 0.53, "learning_rate": 4.5184087394657706e-05, "loss": 2.5741, "step": 40940 }, { "epoch": 0.53, "learning_rate": 4.517392887400745e-05, "loss": 2.5153, "step": 40945 }, { "epoch": 0.53, "learning_rate": 4.516377055443822e-05, "loss": 2.5025, "step": 40950 }, { "epoch": 0.53, "learning_rate": 4.515361243637325e-05, "loss": 2.6195, "step": 40955 }, { "epoch": 0.53, "learning_rate": 4.514345452023581e-05, "loss": 2.6031, "step": 40960 }, { "epoch": 0.53, "learning_rate": 4.51332968064491e-05, "loss": 2.4863, "step": 40965 }, { "epoch": 0.53, "learning_rate": 4.512313929543639e-05, "loss": 2.5074, "step": 40970 }, { "epoch": 0.53, "learning_rate": 4.511298198762085e-05, "loss": 2.5055, "step": 40975 }, { "epoch": 0.53, "learning_rate": 4.510282488342571e-05, "loss": 2.5357, "step": 40980 }, { "epoch": 0.53, "learning_rate": 4.509266798327419e-05, "loss": 2.5104, "step": 40985 }, { "epoch": 0.53, "learning_rate": 4.5082511287589455e-05, "loss": 2.5314, "step": 40990 }, { "epoch": 0.53, "learning_rate": 4.507235479679473e-05, "loss": 2.5184, "step": 40995 }, { "epoch": 0.53, "learning_rate": 4.506219851131314e-05, "loss": 2.6327, "step": 41000 }, { "epoch": 0.53, "learning_rate": 4.505204243156787e-05, "loss": 2.5305, "step": 41005 }, { "epoch": 0.53, "learning_rate": 4.50418865579821e-05, "loss": 2.5854, "step": 41010 }, { "epoch": 0.53, "learning_rate": 4.5031730890978954e-05, "loss": 2.5919, "step": 41015 }, { "epoch": 0.53, "learning_rate": 4.502157543098161e-05, "loss": 2.4208, "step": 41020 }, { "epoch": 0.53, "learning_rate": 4.5011420178413154e-05, "loss": 2.4655, "step": 41025 }, { "epoch": 0.53, "learning_rate": 4.5001265133696754e-05, "loss": 2.4786, "step": 41030 }, { "epoch": 0.53, "learning_rate": 4.4991110297255484e-05, "loss": 2.5342, "step": 41035 }, { "epoch": 0.53, "learning_rate": 4.498095566951247e-05, "loss": 2.5373, "step": 41040 }, { "epoch": 0.53, "learning_rate": 4.497080125089082e-05, "loss": 2.504, "step": 41045 }, { "epoch": 0.53, "learning_rate": 4.4960647041813605e-05, "loss": 2.5214, "step": 41050 }, { "epoch": 0.53, "learning_rate": 4.495049304270394e-05, "loss": 2.5603, "step": 41055 }, { "epoch": 0.53, "learning_rate": 4.4940339253984856e-05, "loss": 2.5283, "step": 41060 }, { "epoch": 0.53, "learning_rate": 4.4930185676079436e-05, "loss": 2.4783, "step": 41065 }, { "epoch": 0.53, "learning_rate": 4.4920032309410745e-05, "loss": 2.5176, "step": 41070 }, { "epoch": 0.53, "learning_rate": 4.4909879154401805e-05, "loss": 2.641, "step": 41075 }, { "epoch": 0.53, "learning_rate": 4.489972621147567e-05, "loss": 2.478, "step": 41080 }, { "epoch": 0.53, "learning_rate": 4.4889573481055345e-05, "loss": 2.3777, "step": 41085 }, { "epoch": 0.53, "learning_rate": 4.48794209635639e-05, "loss": 2.5927, "step": 41090 }, { "epoch": 0.53, "learning_rate": 4.4869268659424284e-05, "loss": 2.5807, "step": 41095 }, { "epoch": 0.53, "learning_rate": 4.485911656905953e-05, "loss": 2.6567, "step": 41100 }, { "epoch": 0.53, "learning_rate": 4.4848964692892634e-05, "loss": 2.4754, "step": 41105 }, { "epoch": 0.53, "learning_rate": 4.483881303134657e-05, "loss": 2.6923, "step": 41110 }, { "epoch": 0.53, "learning_rate": 4.482866158484434e-05, "loss": 2.5676, "step": 41115 }, { "epoch": 0.53, "learning_rate": 4.481851035380886e-05, "loss": 2.5871, "step": 41120 }, { "epoch": 0.53, "learning_rate": 4.480835933866313e-05, "loss": 2.5746, "step": 41125 }, { "epoch": 0.53, "learning_rate": 4.479820853983006e-05, "loss": 2.4721, "step": 41130 }, { "epoch": 0.53, "learning_rate": 4.478805795773261e-05, "loss": 2.6836, "step": 41135 }, { "epoch": 0.53, "learning_rate": 4.477790759279373e-05, "loss": 2.7248, "step": 41140 }, { "epoch": 0.53, "learning_rate": 4.47677574454363e-05, "loss": 2.5143, "step": 41145 }, { "epoch": 0.53, "learning_rate": 4.4757607516083276e-05, "loss": 2.5898, "step": 41150 }, { "epoch": 0.53, "learning_rate": 4.4747457805157516e-05, "loss": 2.4849, "step": 41155 }, { "epoch": 0.53, "learning_rate": 4.4737308313081935e-05, "loss": 2.6694, "step": 41160 }, { "epoch": 0.53, "learning_rate": 4.472715904027943e-05, "loss": 2.4422, "step": 41165 }, { "epoch": 0.53, "learning_rate": 4.471700998717285e-05, "loss": 2.5194, "step": 41170 }, { "epoch": 0.53, "learning_rate": 4.4706861154185086e-05, "loss": 2.506, "step": 41175 }, { "epoch": 0.53, "learning_rate": 4.469671254173897e-05, "loss": 2.4684, "step": 41180 }, { "epoch": 0.53, "learning_rate": 4.468656415025738e-05, "loss": 2.5473, "step": 41185 }, { "epoch": 0.53, "learning_rate": 4.467641598016312e-05, "loss": 2.5667, "step": 41190 }, { "epoch": 0.53, "learning_rate": 4.4666268031879036e-05, "loss": 2.4125, "step": 41195 }, { "epoch": 0.53, "learning_rate": 4.4656120305827956e-05, "loss": 2.5661, "step": 41200 }, { "epoch": 0.53, "learning_rate": 4.464597280243268e-05, "loss": 2.5175, "step": 41205 }, { "epoch": 0.53, "learning_rate": 4.463582552211603e-05, "loss": 2.5493, "step": 41210 }, { "epoch": 0.53, "learning_rate": 4.462567846530075e-05, "loss": 2.4364, "step": 41215 }, { "epoch": 0.53, "learning_rate": 4.461553163240967e-05, "loss": 2.5778, "step": 41220 }, { "epoch": 0.54, "learning_rate": 4.460538502386556e-05, "loss": 2.4413, "step": 41225 }, { "epoch": 0.54, "learning_rate": 4.459523864009115e-05, "loss": 2.6471, "step": 41230 }, { "epoch": 0.54, "learning_rate": 4.4585092481509234e-05, "loss": 2.5981, "step": 41235 }, { "epoch": 0.54, "learning_rate": 4.4574946548542526e-05, "loss": 2.5585, "step": 41240 }, { "epoch": 0.54, "learning_rate": 4.45648008416138e-05, "loss": 2.5279, "step": 41245 }, { "epoch": 0.54, "learning_rate": 4.455465536114573e-05, "loss": 2.4801, "step": 41250 }, { "epoch": 0.54, "learning_rate": 4.454451010756107e-05, "loss": 2.4285, "step": 41255 }, { "epoch": 0.54, "learning_rate": 4.4534365081282524e-05, "loss": 2.6069, "step": 41260 }, { "epoch": 0.54, "learning_rate": 4.452422028273279e-05, "loss": 2.6231, "step": 41265 }, { "epoch": 0.54, "learning_rate": 4.4514075712334556e-05, "loss": 2.6271, "step": 41270 }, { "epoch": 0.54, "learning_rate": 4.450393137051049e-05, "loss": 2.6063, "step": 41275 }, { "epoch": 0.54, "learning_rate": 4.449378725768326e-05, "loss": 2.5088, "step": 41280 }, { "epoch": 0.54, "learning_rate": 4.448364337427557e-05, "loss": 2.4454, "step": 41285 }, { "epoch": 0.54, "learning_rate": 4.447349972071e-05, "loss": 2.6049, "step": 41290 }, { "epoch": 0.54, "learning_rate": 4.446335629740926e-05, "loss": 2.5737, "step": 41295 }, { "epoch": 0.54, "learning_rate": 4.4453213104795925e-05, "loss": 2.4674, "step": 41300 }, { "epoch": 0.54, "learning_rate": 4.444307014329267e-05, "loss": 2.6284, "step": 41305 }, { "epoch": 0.54, "learning_rate": 4.443292741332206e-05, "loss": 2.5386, "step": 41310 }, { "epoch": 0.54, "learning_rate": 4.442278491530671e-05, "loss": 2.5216, "step": 41315 }, { "epoch": 0.54, "learning_rate": 4.4412642649669246e-05, "loss": 2.5751, "step": 41320 }, { "epoch": 0.54, "learning_rate": 4.44025006168322e-05, "loss": 2.6272, "step": 41325 }, { "epoch": 0.54, "learning_rate": 4.4392358817218184e-05, "loss": 2.5208, "step": 41330 }, { "epoch": 0.54, "learning_rate": 4.4382217251249735e-05, "loss": 2.6261, "step": 41335 }, { "epoch": 0.54, "learning_rate": 4.437207591934945e-05, "loss": 2.3634, "step": 41340 }, { "epoch": 0.54, "learning_rate": 4.436193482193981e-05, "loss": 2.5578, "step": 41345 }, { "epoch": 0.54, "learning_rate": 4.435179395944339e-05, "loss": 2.6101, "step": 41350 }, { "epoch": 0.54, "learning_rate": 4.434165333228273e-05, "loss": 2.4575, "step": 41355 }, { "epoch": 0.54, "learning_rate": 4.43315129408803e-05, "loss": 2.5095, "step": 41360 }, { "epoch": 0.54, "learning_rate": 4.4321372785658663e-05, "loss": 2.5967, "step": 41365 }, { "epoch": 0.54, "learning_rate": 4.431123286704025e-05, "loss": 2.4288, "step": 41370 }, { "epoch": 0.54, "learning_rate": 4.430109318544757e-05, "loss": 2.5007, "step": 41375 }, { "epoch": 0.54, "learning_rate": 4.4290953741303135e-05, "loss": 2.5566, "step": 41380 }, { "epoch": 0.54, "learning_rate": 4.428081453502936e-05, "loss": 2.4288, "step": 41385 }, { "epoch": 0.54, "learning_rate": 4.4270675567048735e-05, "loss": 2.4246, "step": 41390 }, { "epoch": 0.54, "learning_rate": 4.4260536837783686e-05, "loss": 2.5449, "step": 41395 }, { "epoch": 0.54, "learning_rate": 4.425039834765667e-05, "loss": 2.4506, "step": 41400 }, { "epoch": 0.54, "learning_rate": 4.424026009709008e-05, "loss": 2.4849, "step": 41405 }, { "epoch": 0.54, "learning_rate": 4.4230122086506345e-05, "loss": 2.499, "step": 41410 }, { "epoch": 0.54, "learning_rate": 4.421998431632791e-05, "loss": 2.5528, "step": 41415 }, { "epoch": 0.54, "learning_rate": 4.420984678697711e-05, "loss": 2.4679, "step": 41420 }, { "epoch": 0.54, "learning_rate": 4.4199709498876366e-05, "loss": 2.6595, "step": 41425 }, { "epoch": 0.54, "learning_rate": 4.418957245244805e-05, "loss": 2.6064, "step": 41430 }, { "epoch": 0.54, "learning_rate": 4.417943564811451e-05, "loss": 2.5582, "step": 41435 }, { "epoch": 0.54, "learning_rate": 4.4169299086298144e-05, "loss": 2.513, "step": 41440 }, { "epoch": 0.54, "learning_rate": 4.415916276742125e-05, "loss": 2.5709, "step": 41445 }, { "epoch": 0.54, "learning_rate": 4.414902669190619e-05, "loss": 2.5405, "step": 41450 }, { "epoch": 0.54, "learning_rate": 4.413889086017528e-05, "loss": 2.659, "step": 41455 }, { "epoch": 0.54, "learning_rate": 4.412875527265085e-05, "loss": 2.5561, "step": 41460 }, { "epoch": 0.54, "learning_rate": 4.411861992975518e-05, "loss": 2.5078, "step": 41465 }, { "epoch": 0.54, "learning_rate": 4.410848483191057e-05, "loss": 2.469, "step": 41470 }, { "epoch": 0.54, "learning_rate": 4.4098349979539344e-05, "loss": 2.5461, "step": 41475 }, { "epoch": 0.54, "learning_rate": 4.408821537306372e-05, "loss": 2.5812, "step": 41480 }, { "epoch": 0.54, "learning_rate": 4.4078081012906e-05, "loss": 2.6235, "step": 41485 }, { "epoch": 0.54, "learning_rate": 4.406794689948841e-05, "loss": 2.5158, "step": 41490 }, { "epoch": 0.54, "learning_rate": 4.405781303323321e-05, "loss": 2.5195, "step": 41495 }, { "epoch": 0.54, "learning_rate": 4.4047679414562655e-05, "loss": 2.4352, "step": 41500 }, { "epoch": 0.54, "learning_rate": 4.4037546043898925e-05, "loss": 2.4997, "step": 41505 }, { "epoch": 0.54, "learning_rate": 4.402741292166427e-05, "loss": 2.6576, "step": 41510 }, { "epoch": 0.54, "learning_rate": 4.401728004828086e-05, "loss": 2.4959, "step": 41515 }, { "epoch": 0.54, "learning_rate": 4.4007147424170914e-05, "loss": 2.398, "step": 41520 }, { "epoch": 0.54, "learning_rate": 4.399701504975659e-05, "loss": 2.5381, "step": 41525 }, { "epoch": 0.54, "learning_rate": 4.398688292546007e-05, "loss": 2.5174, "step": 41530 }, { "epoch": 0.54, "learning_rate": 4.3976751051703536e-05, "loss": 2.5787, "step": 41535 }, { "epoch": 0.54, "learning_rate": 4.39666194289091e-05, "loss": 2.4632, "step": 41540 }, { "epoch": 0.54, "learning_rate": 4.3956488057498926e-05, "loss": 2.5385, "step": 41545 }, { "epoch": 0.54, "learning_rate": 4.394635693789513e-05, "loss": 2.5629, "step": 41550 }, { "epoch": 0.54, "learning_rate": 4.3936226070519856e-05, "loss": 2.5362, "step": 41555 }, { "epoch": 0.54, "learning_rate": 4.392609545579518e-05, "loss": 2.5881, "step": 41560 }, { "epoch": 0.54, "learning_rate": 4.3915965094143215e-05, "loss": 2.6016, "step": 41565 }, { "epoch": 0.54, "learning_rate": 4.390583498598607e-05, "loss": 2.5127, "step": 41570 }, { "epoch": 0.54, "learning_rate": 4.389570513174577e-05, "loss": 2.4814, "step": 41575 }, { "epoch": 0.54, "learning_rate": 4.388557553184442e-05, "loss": 2.4935, "step": 41580 }, { "epoch": 0.54, "learning_rate": 4.3875446186704076e-05, "loss": 2.5602, "step": 41585 }, { "epoch": 0.54, "learning_rate": 4.3865317096746756e-05, "loss": 2.5119, "step": 41590 }, { "epoch": 0.54, "learning_rate": 4.385518826239454e-05, "loss": 2.5187, "step": 41595 }, { "epoch": 0.54, "learning_rate": 4.38450596840694e-05, "loss": 2.5053, "step": 41600 }, { "epoch": 0.54, "learning_rate": 4.383493136219339e-05, "loss": 2.5265, "step": 41605 }, { "epoch": 0.54, "learning_rate": 4.382480329718848e-05, "loss": 2.6733, "step": 41610 }, { "epoch": 0.54, "learning_rate": 4.381467548947668e-05, "loss": 2.6379, "step": 41615 }, { "epoch": 0.54, "learning_rate": 4.380454793947996e-05, "loss": 2.6916, "step": 41620 }, { "epoch": 0.54, "learning_rate": 4.37944206476203e-05, "loss": 2.4295, "step": 41625 }, { "epoch": 0.54, "learning_rate": 4.378429361431968e-05, "loss": 2.4328, "step": 41630 }, { "epoch": 0.54, "learning_rate": 4.377416684e-05, "loss": 2.5597, "step": 41635 }, { "epoch": 0.54, "learning_rate": 4.3764040325083235e-05, "loss": 2.3853, "step": 41640 }, { "epoch": 0.54, "learning_rate": 4.375391406999129e-05, "loss": 2.4602, "step": 41645 }, { "epoch": 0.54, "learning_rate": 4.3743788075146086e-05, "loss": 2.4671, "step": 41650 }, { "epoch": 0.54, "learning_rate": 4.373366234096956e-05, "loss": 2.5164, "step": 41655 }, { "epoch": 0.54, "learning_rate": 4.3723536867883565e-05, "loss": 2.6434, "step": 41660 }, { "epoch": 0.54, "learning_rate": 4.371341165631002e-05, "loss": 2.5249, "step": 41665 }, { "epoch": 0.54, "learning_rate": 4.370328670667075e-05, "loss": 2.3176, "step": 41670 }, { "epoch": 0.54, "learning_rate": 4.369316201938766e-05, "loss": 2.5237, "step": 41675 }, { "epoch": 0.54, "learning_rate": 4.368303759488258e-05, "loss": 2.4463, "step": 41680 }, { "epoch": 0.54, "learning_rate": 4.3672913433577343e-05, "loss": 2.4499, "step": 41685 }, { "epoch": 0.54, "learning_rate": 4.366278953589382e-05, "loss": 2.6002, "step": 41690 }, { "epoch": 0.54, "learning_rate": 4.3652665902253784e-05, "loss": 2.5429, "step": 41695 }, { "epoch": 0.54, "learning_rate": 4.364254253307907e-05, "loss": 2.6951, "step": 41700 }, { "epoch": 0.54, "learning_rate": 4.363241942879144e-05, "loss": 2.5663, "step": 41705 }, { "epoch": 0.54, "learning_rate": 4.3622296589812704e-05, "loss": 2.4867, "step": 41710 }, { "epoch": 0.54, "learning_rate": 4.361217401656464e-05, "loss": 2.4919, "step": 41715 }, { "epoch": 0.54, "learning_rate": 4.3602051709468996e-05, "loss": 2.7056, "step": 41720 }, { "epoch": 0.54, "learning_rate": 4.359192966894755e-05, "loss": 2.6073, "step": 41725 }, { "epoch": 0.54, "learning_rate": 4.3581807895422004e-05, "loss": 2.5266, "step": 41730 }, { "epoch": 0.54, "learning_rate": 4.357168638931412e-05, "loss": 2.6185, "step": 41735 }, { "epoch": 0.54, "learning_rate": 4.356156515104559e-05, "loss": 2.5055, "step": 41740 }, { "epoch": 0.54, "learning_rate": 4.355144418103814e-05, "loss": 2.5327, "step": 41745 }, { "epoch": 0.54, "learning_rate": 4.354132347971347e-05, "loss": 2.4607, "step": 41750 }, { "epoch": 0.54, "learning_rate": 4.353120304749324e-05, "loss": 2.5207, "step": 41755 }, { "epoch": 0.54, "learning_rate": 4.352108288479916e-05, "loss": 2.5685, "step": 41760 }, { "epoch": 0.54, "learning_rate": 4.3510962992052855e-05, "loss": 2.4896, "step": 41765 }, { "epoch": 0.54, "learning_rate": 4.3500843369675996e-05, "loss": 2.4126, "step": 41770 }, { "epoch": 0.54, "learning_rate": 4.349072401809021e-05, "loss": 2.5481, "step": 41775 }, { "epoch": 0.54, "learning_rate": 4.348060493771714e-05, "loss": 2.6216, "step": 41780 }, { "epoch": 0.54, "learning_rate": 4.347048612897842e-05, "loss": 2.5315, "step": 41785 }, { "epoch": 0.54, "learning_rate": 4.3460367592295606e-05, "loss": 2.3418, "step": 41790 }, { "epoch": 0.54, "learning_rate": 4.3450249328090345e-05, "loss": 2.5973, "step": 41795 }, { "epoch": 0.54, "learning_rate": 4.344013133678418e-05, "loss": 2.6442, "step": 41800 }, { "epoch": 0.54, "learning_rate": 4.343001361879869e-05, "loss": 2.5586, "step": 41805 }, { "epoch": 0.54, "learning_rate": 4.341989617455546e-05, "loss": 2.5326, "step": 41810 }, { "epoch": 0.54, "learning_rate": 4.3409779004476015e-05, "loss": 2.5115, "step": 41815 }, { "epoch": 0.54, "learning_rate": 4.339966210898192e-05, "loss": 2.6835, "step": 41820 }, { "epoch": 0.54, "learning_rate": 4.338954548849466e-05, "loss": 2.3532, "step": 41825 }, { "epoch": 0.54, "learning_rate": 4.3379429143435786e-05, "loss": 2.5389, "step": 41830 }, { "epoch": 0.54, "learning_rate": 4.336931307422678e-05, "loss": 2.4731, "step": 41835 }, { "epoch": 0.54, "learning_rate": 4.3359197281289133e-05, "loss": 2.508, "step": 41840 }, { "epoch": 0.54, "learning_rate": 4.3349081765044355e-05, "loss": 2.5636, "step": 41845 }, { "epoch": 0.54, "learning_rate": 4.333896652591388e-05, "loss": 2.5982, "step": 41850 }, { "epoch": 0.54, "learning_rate": 4.33288515643192e-05, "loss": 2.5495, "step": 41855 }, { "epoch": 0.54, "learning_rate": 4.331873688068171e-05, "loss": 2.6061, "step": 41860 }, { "epoch": 0.54, "learning_rate": 4.330862247542288e-05, "loss": 2.4849, "step": 41865 }, { "epoch": 0.54, "learning_rate": 4.329850834896413e-05, "loss": 2.6003, "step": 41870 }, { "epoch": 0.54, "learning_rate": 4.328839450172686e-05, "loss": 2.4938, "step": 41875 }, { "epoch": 0.54, "learning_rate": 4.3278280934132506e-05, "loss": 2.6547, "step": 41880 }, { "epoch": 0.54, "learning_rate": 4.326816764660239e-05, "loss": 2.5324, "step": 41885 }, { "epoch": 0.54, "learning_rate": 4.3258054639557945e-05, "loss": 2.5921, "step": 41890 }, { "epoch": 0.54, "learning_rate": 4.324794191342051e-05, "loss": 2.5629, "step": 41895 }, { "epoch": 0.54, "learning_rate": 4.323782946861143e-05, "loss": 2.4485, "step": 41900 }, { "epoch": 0.54, "learning_rate": 4.3227717305552065e-05, "loss": 2.4408, "step": 41905 }, { "epoch": 0.54, "learning_rate": 4.3217605424663734e-05, "loss": 2.5983, "step": 41910 }, { "epoch": 0.54, "learning_rate": 4.320749382636777e-05, "loss": 2.568, "step": 41915 }, { "epoch": 0.54, "learning_rate": 4.319738251108545e-05, "loss": 2.6374, "step": 41920 }, { "epoch": 0.54, "learning_rate": 4.318727147923808e-05, "loss": 2.4989, "step": 41925 }, { "epoch": 0.54, "learning_rate": 4.317716073124695e-05, "loss": 2.5724, "step": 41930 }, { "epoch": 0.54, "learning_rate": 4.316705026753332e-05, "loss": 2.6689, "step": 41935 }, { "epoch": 0.54, "learning_rate": 4.3156940088518476e-05, "loss": 2.6837, "step": 41940 }, { "epoch": 0.54, "learning_rate": 4.3146830194623614e-05, "loss": 2.4741, "step": 41945 }, { "epoch": 0.54, "learning_rate": 4.3136720586270024e-05, "loss": 2.5642, "step": 41950 }, { "epoch": 0.54, "learning_rate": 4.312661126387888e-05, "loss": 2.4589, "step": 41955 }, { "epoch": 0.54, "learning_rate": 4.311650222787141e-05, "loss": 2.4863, "step": 41960 }, { "epoch": 0.54, "learning_rate": 4.310639347866882e-05, "loss": 2.5937, "step": 41965 }, { "epoch": 0.54, "learning_rate": 4.30962850166923e-05, "loss": 2.5545, "step": 41970 }, { "epoch": 0.54, "learning_rate": 4.308617684236302e-05, "loss": 2.5036, "step": 41975 }, { "epoch": 0.54, "learning_rate": 4.3076068956102125e-05, "loss": 2.515, "step": 41980 }, { "epoch": 0.54, "learning_rate": 4.30659613583308e-05, "loss": 2.5639, "step": 41985 }, { "epoch": 0.54, "learning_rate": 4.3055854049470156e-05, "loss": 2.5771, "step": 41990 }, { "epoch": 0.55, "learning_rate": 4.304574702994132e-05, "loss": 2.5361, "step": 41995 }, { "epoch": 0.55, "learning_rate": 4.303564030016544e-05, "loss": 2.441, "step": 42000 }, { "epoch": 0.55, "learning_rate": 4.302553386056357e-05, "loss": 2.6409, "step": 42005 }, { "epoch": 0.55, "learning_rate": 4.3015427711556846e-05, "loss": 2.6064, "step": 42010 }, { "epoch": 0.55, "learning_rate": 4.300532185356631e-05, "loss": 2.5446, "step": 42015 }, { "epoch": 0.55, "learning_rate": 4.299521628701304e-05, "loss": 2.5653, "step": 42020 }, { "epoch": 0.55, "learning_rate": 4.298511101231811e-05, "loss": 2.599, "step": 42025 }, { "epoch": 0.55, "learning_rate": 4.297500602990253e-05, "loss": 2.5399, "step": 42030 }, { "epoch": 0.55, "learning_rate": 4.2964901340187367e-05, "loss": 2.4851, "step": 42035 }, { "epoch": 0.55, "learning_rate": 4.2954796943593605e-05, "loss": 2.4538, "step": 42040 }, { "epoch": 0.55, "learning_rate": 4.2944692840542277e-05, "loss": 2.5192, "step": 42045 }, { "epoch": 0.55, "learning_rate": 4.293458903145434e-05, "loss": 2.4756, "step": 42050 }, { "epoch": 0.55, "learning_rate": 4.2924485516750804e-05, "loss": 2.584, "step": 42055 }, { "epoch": 0.55, "learning_rate": 4.291438229685263e-05, "loss": 2.4295, "step": 42060 }, { "epoch": 0.55, "learning_rate": 4.290427937218078e-05, "loss": 2.5138, "step": 42065 }, { "epoch": 0.55, "learning_rate": 4.28941767431562e-05, "loss": 2.6349, "step": 42070 }, { "epoch": 0.55, "learning_rate": 4.28840744101998e-05, "loss": 2.5659, "step": 42075 }, { "epoch": 0.55, "learning_rate": 4.2873972373732505e-05, "loss": 2.4832, "step": 42080 }, { "epoch": 0.55, "learning_rate": 4.2863870634175254e-05, "loss": 2.6902, "step": 42085 }, { "epoch": 0.55, "learning_rate": 4.285376919194891e-05, "loss": 2.5143, "step": 42090 }, { "epoch": 0.55, "learning_rate": 4.284366804747437e-05, "loss": 2.5697, "step": 42095 }, { "epoch": 0.55, "learning_rate": 4.2833567201172486e-05, "loss": 2.5145, "step": 42100 }, { "epoch": 0.55, "learning_rate": 4.282346665346415e-05, "loss": 2.5962, "step": 42105 }, { "epoch": 0.55, "learning_rate": 4.2813366404770163e-05, "loss": 2.511, "step": 42110 }, { "epoch": 0.55, "learning_rate": 4.280326645551138e-05, "loss": 2.6066, "step": 42115 }, { "epoch": 0.55, "learning_rate": 4.2793166806108634e-05, "loss": 2.4951, "step": 42120 }, { "epoch": 0.55, "learning_rate": 4.278306745698271e-05, "loss": 2.4534, "step": 42125 }, { "epoch": 0.55, "learning_rate": 4.2772968408554434e-05, "loss": 2.3935, "step": 42130 }, { "epoch": 0.55, "learning_rate": 4.276286966124454e-05, "loss": 2.5529, "step": 42135 }, { "epoch": 0.55, "learning_rate": 4.275277121547383e-05, "loss": 2.658, "step": 42140 }, { "epoch": 0.55, "learning_rate": 4.274267307166307e-05, "loss": 2.4808, "step": 42145 }, { "epoch": 0.55, "learning_rate": 4.2732575230232984e-05, "loss": 2.5607, "step": 42150 }, { "epoch": 0.55, "learning_rate": 4.272247769160432e-05, "loss": 2.4939, "step": 42155 }, { "epoch": 0.55, "learning_rate": 4.2712380456197776e-05, "loss": 2.5436, "step": 42160 }, { "epoch": 0.55, "learning_rate": 4.270228352443409e-05, "loss": 2.4742, "step": 42165 }, { "epoch": 0.55, "learning_rate": 4.2692186896733926e-05, "loss": 2.622, "step": 42170 }, { "epoch": 0.55, "learning_rate": 4.2682090573517974e-05, "loss": 2.5318, "step": 42175 }, { "epoch": 0.55, "learning_rate": 4.2671994555206926e-05, "loss": 2.6161, "step": 42180 }, { "epoch": 0.55, "learning_rate": 4.266189884222141e-05, "loss": 2.6484, "step": 42185 }, { "epoch": 0.55, "learning_rate": 4.265180343498209e-05, "loss": 2.5263, "step": 42190 }, { "epoch": 0.55, "learning_rate": 4.2641708333909574e-05, "loss": 2.3355, "step": 42195 }, { "epoch": 0.55, "learning_rate": 4.263161353942451e-05, "loss": 2.524, "step": 42200 }, { "epoch": 0.55, "learning_rate": 4.262151905194748e-05, "loss": 2.497, "step": 42205 }, { "epoch": 0.55, "learning_rate": 4.261142487189907e-05, "loss": 2.5119, "step": 42210 }, { "epoch": 0.55, "learning_rate": 4.2601330999699886e-05, "loss": 2.5165, "step": 42215 }, { "epoch": 0.55, "learning_rate": 4.259123743577047e-05, "loss": 2.6135, "step": 42220 }, { "epoch": 0.55, "learning_rate": 4.258114418053142e-05, "loss": 2.5819, "step": 42225 }, { "epoch": 0.55, "learning_rate": 4.257105123440321e-05, "loss": 2.6253, "step": 42230 }, { "epoch": 0.55, "learning_rate": 4.256095859780642e-05, "loss": 2.4627, "step": 42235 }, { "epoch": 0.55, "learning_rate": 4.255086627116156e-05, "loss": 2.631, "step": 42240 }, { "epoch": 0.55, "learning_rate": 4.254077425488911e-05, "loss": 2.4747, "step": 42245 }, { "epoch": 0.55, "learning_rate": 4.2530682549409564e-05, "loss": 2.4905, "step": 42250 }, { "epoch": 0.55, "learning_rate": 4.252059115514341e-05, "loss": 2.4158, "step": 42255 }, { "epoch": 0.55, "learning_rate": 4.251050007251113e-05, "loss": 2.5573, "step": 42260 }, { "epoch": 0.55, "learning_rate": 4.250040930193313e-05, "loss": 2.4989, "step": 42265 }, { "epoch": 0.55, "learning_rate": 4.2490318843829866e-05, "loss": 2.6586, "step": 42270 }, { "epoch": 0.55, "learning_rate": 4.248022869862178e-05, "loss": 2.4935, "step": 42275 }, { "epoch": 0.55, "learning_rate": 4.247013886672927e-05, "loss": 2.4052, "step": 42280 }, { "epoch": 0.55, "learning_rate": 4.2460049348572744e-05, "loss": 2.588, "step": 42285 }, { "epoch": 0.55, "learning_rate": 4.2449960144572565e-05, "loss": 2.5941, "step": 42290 }, { "epoch": 0.55, "learning_rate": 4.243987125514911e-05, "loss": 2.5972, "step": 42295 }, { "epoch": 0.55, "learning_rate": 4.242978268072279e-05, "loss": 2.5843, "step": 42300 }, { "epoch": 0.55, "learning_rate": 4.2419694421713866e-05, "loss": 2.5519, "step": 42305 }, { "epoch": 0.55, "learning_rate": 4.240960647854274e-05, "loss": 2.5456, "step": 42310 }, { "epoch": 0.55, "learning_rate": 4.239951885162969e-05, "loss": 2.5201, "step": 42315 }, { "epoch": 0.55, "learning_rate": 4.2389431541395056e-05, "loss": 2.5252, "step": 42320 }, { "epoch": 0.55, "learning_rate": 4.23793445482591e-05, "loss": 2.5429, "step": 42325 }, { "epoch": 0.55, "learning_rate": 4.236925787264212e-05, "loss": 2.5615, "step": 42330 }, { "epoch": 0.55, "learning_rate": 4.2359171514964393e-05, "loss": 2.5077, "step": 42335 }, { "epoch": 0.55, "learning_rate": 4.234908547564614e-05, "loss": 2.4985, "step": 42340 }, { "epoch": 0.55, "learning_rate": 4.233899975510763e-05, "loss": 2.507, "step": 42345 }, { "epoch": 0.55, "learning_rate": 4.2328914353769076e-05, "loss": 2.5934, "step": 42350 }, { "epoch": 0.55, "learning_rate": 4.23188292720507e-05, "loss": 2.5051, "step": 42355 }, { "epoch": 0.55, "learning_rate": 4.230874451037271e-05, "loss": 2.3722, "step": 42360 }, { "epoch": 0.55, "learning_rate": 4.229866006915528e-05, "loss": 2.5015, "step": 42365 }, { "epoch": 0.55, "learning_rate": 4.2288575948818584e-05, "loss": 2.5283, "step": 42370 }, { "epoch": 0.55, "learning_rate": 4.2278492149782784e-05, "loss": 2.5428, "step": 42375 }, { "epoch": 0.55, "learning_rate": 4.2268408672468054e-05, "loss": 2.5542, "step": 42380 }, { "epoch": 0.55, "learning_rate": 4.225832551729447e-05, "loss": 2.4589, "step": 42385 }, { "epoch": 0.55, "learning_rate": 4.224824268468219e-05, "loss": 2.5979, "step": 42390 }, { "epoch": 0.55, "learning_rate": 4.223816017505135e-05, "loss": 2.5425, "step": 42395 }, { "epoch": 0.55, "learning_rate": 4.222807798882198e-05, "loss": 2.4272, "step": 42400 }, { "epoch": 0.55, "learning_rate": 4.22179961264142e-05, "loss": 2.4488, "step": 42405 }, { "epoch": 0.55, "learning_rate": 4.220791458824806e-05, "loss": 2.4859, "step": 42410 }, { "epoch": 0.55, "learning_rate": 4.219783337474365e-05, "loss": 2.5008, "step": 42415 }, { "epoch": 0.55, "learning_rate": 4.218775248632094e-05, "loss": 2.4718, "step": 42420 }, { "epoch": 0.55, "learning_rate": 4.217767192340001e-05, "loss": 2.5884, "step": 42425 }, { "epoch": 0.55, "learning_rate": 4.2167591686400875e-05, "loss": 2.5506, "step": 42430 }, { "epoch": 0.55, "learning_rate": 4.21575117757435e-05, "loss": 2.5628, "step": 42435 }, { "epoch": 0.55, "learning_rate": 4.214743219184789e-05, "loss": 2.4852, "step": 42440 }, { "epoch": 0.55, "learning_rate": 4.213735293513401e-05, "loss": 2.5361, "step": 42445 }, { "epoch": 0.55, "learning_rate": 4.212727400602182e-05, "loss": 2.5153, "step": 42450 }, { "epoch": 0.55, "learning_rate": 4.211719540493129e-05, "loss": 2.5881, "step": 42455 }, { "epoch": 0.55, "learning_rate": 4.21071171322823e-05, "loss": 2.5539, "step": 42460 }, { "epoch": 0.55, "learning_rate": 4.209703918849481e-05, "loss": 2.6209, "step": 42465 }, { "epoch": 0.55, "learning_rate": 4.208696157398869e-05, "loss": 2.4979, "step": 42470 }, { "epoch": 0.55, "learning_rate": 4.207688428918388e-05, "loss": 2.6627, "step": 42475 }, { "epoch": 0.55, "learning_rate": 4.206680733450019e-05, "loss": 2.7272, "step": 42480 }, { "epoch": 0.55, "learning_rate": 4.205673071035752e-05, "loss": 2.6111, "step": 42485 }, { "epoch": 0.55, "learning_rate": 4.204665441717573e-05, "loss": 2.5521, "step": 42490 }, { "epoch": 0.55, "learning_rate": 4.2036578455374626e-05, "loss": 2.5687, "step": 42495 }, { "epoch": 0.55, "learning_rate": 4.202650282537405e-05, "loss": 2.5341, "step": 42500 }, { "epoch": 0.55, "learning_rate": 4.2016427527593784e-05, "loss": 2.557, "step": 42505 }, { "epoch": 0.55, "learning_rate": 4.2006352562453635e-05, "loss": 2.4311, "step": 42510 }, { "epoch": 0.55, "learning_rate": 4.199627793037341e-05, "loss": 2.3774, "step": 42515 }, { "epoch": 0.55, "learning_rate": 4.198620363177282e-05, "loss": 2.5235, "step": 42520 }, { "epoch": 0.55, "learning_rate": 4.1976129667071676e-05, "loss": 2.5836, "step": 42525 }, { "epoch": 0.55, "learning_rate": 4.196605603668965e-05, "loss": 2.5914, "step": 42530 }, { "epoch": 0.55, "learning_rate": 4.195598274104652e-05, "loss": 2.5767, "step": 42535 }, { "epoch": 0.55, "learning_rate": 4.1945909780561954e-05, "loss": 2.5263, "step": 42540 }, { "epoch": 0.55, "learning_rate": 4.1935837155655674e-05, "loss": 2.6766, "step": 42545 }, { "epoch": 0.55, "learning_rate": 4.192576486674739e-05, "loss": 2.5498, "step": 42550 }, { "epoch": 0.55, "learning_rate": 4.19156929142567e-05, "loss": 2.3976, "step": 42555 }, { "epoch": 0.55, "learning_rate": 4.19056212986033e-05, "loss": 2.6022, "step": 42560 }, { "epoch": 0.55, "learning_rate": 4.189555002020683e-05, "loss": 2.6118, "step": 42565 }, { "epoch": 0.55, "learning_rate": 4.188547907948689e-05, "loss": 2.6984, "step": 42570 }, { "epoch": 0.55, "learning_rate": 4.187540847686315e-05, "loss": 2.408, "step": 42575 }, { "epoch": 0.55, "learning_rate": 4.186533821275513e-05, "loss": 2.6188, "step": 42580 }, { "epoch": 0.55, "learning_rate": 4.185526828758248e-05, "loss": 2.6426, "step": 42585 }, { "epoch": 0.55, "learning_rate": 4.184519870176473e-05, "loss": 2.4918, "step": 42590 }, { "epoch": 0.55, "learning_rate": 4.183512945572145e-05, "loss": 2.4698, "step": 42595 }, { "epoch": 0.55, "learning_rate": 4.182506054987215e-05, "loss": 2.4766, "step": 42600 }, { "epoch": 0.55, "learning_rate": 4.18149919846364e-05, "loss": 2.475, "step": 42605 }, { "epoch": 0.55, "learning_rate": 4.1804923760433715e-05, "loss": 2.5651, "step": 42610 }, { "epoch": 0.55, "learning_rate": 4.1794855877683545e-05, "loss": 2.4658, "step": 42615 }, { "epoch": 0.55, "learning_rate": 4.1784788336805434e-05, "loss": 2.507, "step": 42620 }, { "epoch": 0.55, "learning_rate": 4.1774721138218785e-05, "loss": 2.5482, "step": 42625 }, { "epoch": 0.55, "learning_rate": 4.1764654282343116e-05, "loss": 2.5084, "step": 42630 }, { "epoch": 0.55, "learning_rate": 4.1754587769597825e-05, "loss": 2.6389, "step": 42635 }, { "epoch": 0.55, "learning_rate": 4.1744521600402354e-05, "loss": 2.5362, "step": 42640 }, { "epoch": 0.55, "learning_rate": 4.173445577517614e-05, "loss": 2.6281, "step": 42645 }, { "epoch": 0.55, "learning_rate": 4.172439029433854e-05, "loss": 2.5898, "step": 42650 }, { "epoch": 0.55, "learning_rate": 4.1714325158308963e-05, "loss": 2.6419, "step": 42655 }, { "epoch": 0.55, "learning_rate": 4.170426036750676e-05, "loss": 2.5587, "step": 42660 }, { "epoch": 0.55, "learning_rate": 4.169419592235131e-05, "loss": 2.5514, "step": 42665 }, { "epoch": 0.55, "learning_rate": 4.168413182326196e-05, "loss": 2.4352, "step": 42670 }, { "epoch": 0.55, "learning_rate": 4.1674068070658e-05, "loss": 2.5345, "step": 42675 }, { "epoch": 0.55, "learning_rate": 4.1664004664958774e-05, "loss": 2.4719, "step": 42680 }, { "epoch": 0.55, "learning_rate": 4.1653941606583546e-05, "loss": 2.4879, "step": 42685 }, { "epoch": 0.55, "learning_rate": 4.164387889595164e-05, "loss": 2.519, "step": 42690 }, { "epoch": 0.55, "learning_rate": 4.163381653348229e-05, "loss": 2.489, "step": 42695 }, { "epoch": 0.55, "learning_rate": 4.162375451959476e-05, "loss": 2.6565, "step": 42700 }, { "epoch": 0.55, "learning_rate": 4.161369285470832e-05, "loss": 2.5003, "step": 42705 }, { "epoch": 0.55, "learning_rate": 4.160363153924214e-05, "loss": 2.5009, "step": 42710 }, { "epoch": 0.55, "learning_rate": 4.1593570573615495e-05, "loss": 2.6806, "step": 42715 }, { "epoch": 0.55, "learning_rate": 4.158350995824751e-05, "loss": 2.6476, "step": 42720 }, { "epoch": 0.55, "learning_rate": 4.1573449693557406e-05, "loss": 2.6309, "step": 42725 }, { "epoch": 0.55, "learning_rate": 4.156338977996436e-05, "loss": 2.5641, "step": 42730 }, { "epoch": 0.55, "learning_rate": 4.15533302178875e-05, "loss": 2.6267, "step": 42735 }, { "epoch": 0.55, "learning_rate": 4.154327100774599e-05, "loss": 2.5849, "step": 42740 }, { "epoch": 0.55, "learning_rate": 4.153321214995892e-05, "loss": 2.5834, "step": 42745 }, { "epoch": 0.55, "learning_rate": 4.1523153644945415e-05, "loss": 2.5169, "step": 42750 }, { "epoch": 0.55, "learning_rate": 4.1513095493124564e-05, "loss": 2.525, "step": 42755 }, { "epoch": 0.55, "learning_rate": 4.1503037694915446e-05, "loss": 2.4385, "step": 42760 }, { "epoch": 0.55, "learning_rate": 4.149298025073715e-05, "loss": 2.5657, "step": 42765 }, { "epoch": 0.56, "learning_rate": 4.148292316100868e-05, "loss": 2.485, "step": 42770 }, { "epoch": 0.56, "learning_rate": 4.147286642614912e-05, "loss": 2.5168, "step": 42775 }, { "epoch": 0.56, "learning_rate": 4.146281004657744e-05, "loss": 2.4834, "step": 42780 }, { "epoch": 0.56, "learning_rate": 4.1452754022712665e-05, "loss": 2.6258, "step": 42785 }, { "epoch": 0.56, "learning_rate": 4.14426983549738e-05, "loss": 2.5931, "step": 42790 }, { "epoch": 0.56, "learning_rate": 4.14326430437798e-05, "loss": 2.5749, "step": 42795 }, { "epoch": 0.56, "learning_rate": 4.1422588089549644e-05, "loss": 2.555, "step": 42800 }, { "epoch": 0.56, "learning_rate": 4.1412533492702254e-05, "loss": 2.4538, "step": 42805 }, { "epoch": 0.56, "learning_rate": 4.140247925365658e-05, "loss": 2.4587, "step": 42810 }, { "epoch": 0.56, "learning_rate": 4.1392425372831535e-05, "loss": 2.6016, "step": 42815 }, { "epoch": 0.56, "learning_rate": 4.1382371850646e-05, "loss": 2.5306, "step": 42820 }, { "epoch": 0.56, "learning_rate": 4.137231868751889e-05, "loss": 2.5141, "step": 42825 }, { "epoch": 0.56, "learning_rate": 4.136226588386905e-05, "loss": 2.5149, "step": 42830 }, { "epoch": 0.56, "learning_rate": 4.1352213440115374e-05, "loss": 2.5161, "step": 42835 }, { "epoch": 0.56, "learning_rate": 4.134216135667665e-05, "loss": 2.5058, "step": 42840 }, { "epoch": 0.56, "learning_rate": 4.1332109633971745e-05, "loss": 2.4396, "step": 42845 }, { "epoch": 0.56, "learning_rate": 4.132205827241944e-05, "loss": 2.5446, "step": 42850 }, { "epoch": 0.56, "learning_rate": 4.1312007272438545e-05, "loss": 2.3871, "step": 42855 }, { "epoch": 0.56, "learning_rate": 4.130195663444787e-05, "loss": 2.426, "step": 42860 }, { "epoch": 0.56, "learning_rate": 4.129190635886613e-05, "loss": 2.4892, "step": 42865 }, { "epoch": 0.56, "learning_rate": 4.1281856446112116e-05, "loss": 2.5793, "step": 42870 }, { "epoch": 0.56, "learning_rate": 4.1271806896604524e-05, "loss": 2.5578, "step": 42875 }, { "epoch": 0.56, "learning_rate": 4.126175771076209e-05, "loss": 2.5702, "step": 42880 }, { "epoch": 0.56, "learning_rate": 4.1251708889003544e-05, "loss": 2.6669, "step": 42885 }, { "epoch": 0.56, "learning_rate": 4.124166043174754e-05, "loss": 2.6558, "step": 42890 }, { "epoch": 0.56, "learning_rate": 4.1231612339412796e-05, "loss": 2.4835, "step": 42895 }, { "epoch": 0.56, "learning_rate": 4.122156461241792e-05, "loss": 2.3282, "step": 42900 }, { "epoch": 0.56, "learning_rate": 4.121151725118159e-05, "loss": 2.532, "step": 42905 }, { "epoch": 0.56, "learning_rate": 4.120147025612242e-05, "loss": 2.5323, "step": 42910 }, { "epoch": 0.56, "learning_rate": 4.119142362765904e-05, "loss": 2.6142, "step": 42915 }, { "epoch": 0.56, "learning_rate": 4.1181377366210035e-05, "loss": 2.4597, "step": 42920 }, { "epoch": 0.56, "learning_rate": 4.117133147219398e-05, "loss": 2.5992, "step": 42925 }, { "epoch": 0.56, "learning_rate": 4.116128594602948e-05, "loss": 2.56, "step": 42930 }, { "epoch": 0.56, "learning_rate": 4.1151240788135036e-05, "loss": 2.5387, "step": 42935 }, { "epoch": 0.56, "learning_rate": 4.1141195998929216e-05, "loss": 2.5762, "step": 42940 }, { "epoch": 0.56, "learning_rate": 4.1131151578830545e-05, "loss": 2.415, "step": 42945 }, { "epoch": 0.56, "learning_rate": 4.1121107528257506e-05, "loss": 2.5247, "step": 42950 }, { "epoch": 0.56, "learning_rate": 4.111106384762864e-05, "loss": 2.6635, "step": 42955 }, { "epoch": 0.56, "learning_rate": 4.110102053736236e-05, "loss": 2.4876, "step": 42960 }, { "epoch": 0.56, "learning_rate": 4.109097759787717e-05, "loss": 2.6285, "step": 42965 }, { "epoch": 0.56, "learning_rate": 4.1080935029591486e-05, "loss": 2.5754, "step": 42970 }, { "epoch": 0.56, "learning_rate": 4.1070892832923755e-05, "loss": 2.5941, "step": 42975 }, { "epoch": 0.56, "learning_rate": 4.106085100829239e-05, "loss": 2.5477, "step": 42980 }, { "epoch": 0.56, "learning_rate": 4.1050809556115776e-05, "loss": 2.58, "step": 42985 }, { "epoch": 0.56, "learning_rate": 4.104076847681233e-05, "loss": 2.4515, "step": 42990 }, { "epoch": 0.56, "learning_rate": 4.1030727770800376e-05, "loss": 2.491, "step": 42995 }, { "epoch": 0.56, "learning_rate": 4.102068743849828e-05, "loss": 2.6461, "step": 43000 }, { "epoch": 0.56, "learning_rate": 4.10106474803244e-05, "loss": 2.5186, "step": 43005 }, { "epoch": 0.56, "learning_rate": 4.1000607896697024e-05, "loss": 2.6581, "step": 43010 }, { "epoch": 0.56, "learning_rate": 4.0990568688034495e-05, "loss": 2.5703, "step": 43015 }, { "epoch": 0.56, "learning_rate": 4.098052985475506e-05, "loss": 2.5366, "step": 43020 }, { "epoch": 0.56, "learning_rate": 4.097049139727703e-05, "loss": 2.651, "step": 43025 }, { "epoch": 0.56, "learning_rate": 4.0960453316018635e-05, "loss": 2.6676, "step": 43030 }, { "epoch": 0.56, "learning_rate": 4.095041561139813e-05, "loss": 2.4759, "step": 43035 }, { "epoch": 0.56, "learning_rate": 4.094037828383374e-05, "loss": 2.5794, "step": 43040 }, { "epoch": 0.56, "learning_rate": 4.093034133374367e-05, "loss": 2.4876, "step": 43045 }, { "epoch": 0.56, "learning_rate": 4.092030476154614e-05, "loss": 2.6524, "step": 43050 }, { "epoch": 0.56, "learning_rate": 4.0910268567659295e-05, "loss": 2.5804, "step": 43055 }, { "epoch": 0.56, "learning_rate": 4.090023275250133e-05, "loss": 2.6714, "step": 43060 }, { "epoch": 0.56, "learning_rate": 4.0890197316490366e-05, "loss": 2.5341, "step": 43065 }, { "epoch": 0.56, "learning_rate": 4.0880162260044534e-05, "loss": 2.6335, "step": 43070 }, { "epoch": 0.56, "learning_rate": 4.0870127583581985e-05, "loss": 2.6053, "step": 43075 }, { "epoch": 0.56, "learning_rate": 4.0860093287520787e-05, "loss": 2.4527, "step": 43080 }, { "epoch": 0.56, "learning_rate": 4.085005937227905e-05, "loss": 2.4766, "step": 43085 }, { "epoch": 0.56, "learning_rate": 4.0840025838274807e-05, "loss": 2.6996, "step": 43090 }, { "epoch": 0.56, "learning_rate": 4.082999268592614e-05, "loss": 2.549, "step": 43095 }, { "epoch": 0.56, "learning_rate": 4.0819959915651086e-05, "loss": 2.513, "step": 43100 }, { "epoch": 0.56, "learning_rate": 4.080992752786765e-05, "loss": 2.5069, "step": 43105 }, { "epoch": 0.56, "learning_rate": 4.079989552299386e-05, "loss": 2.6365, "step": 43110 }, { "epoch": 0.56, "learning_rate": 4.078986390144768e-05, "loss": 2.5063, "step": 43115 }, { "epoch": 0.56, "learning_rate": 4.07798326636471e-05, "loss": 2.5283, "step": 43120 }, { "epoch": 0.56, "learning_rate": 4.0769801810010065e-05, "loss": 2.3855, "step": 43125 }, { "epoch": 0.56, "learning_rate": 4.0759771340954515e-05, "loss": 2.6074, "step": 43130 }, { "epoch": 0.56, "learning_rate": 4.07497412568984e-05, "loss": 2.5171, "step": 43135 }, { "epoch": 0.56, "learning_rate": 4.07397115582596e-05, "loss": 2.3725, "step": 43140 }, { "epoch": 0.56, "learning_rate": 4.0729682245456035e-05, "loss": 2.6363, "step": 43145 }, { "epoch": 0.56, "learning_rate": 4.071965331890555e-05, "loss": 2.5239, "step": 43150 }, { "epoch": 0.56, "learning_rate": 4.070962477902602e-05, "loss": 2.6584, "step": 43155 }, { "epoch": 0.56, "learning_rate": 4.069959662623532e-05, "loss": 2.5899, "step": 43160 }, { "epoch": 0.56, "learning_rate": 4.0689568860951233e-05, "loss": 2.46, "step": 43165 }, { "epoch": 0.56, "learning_rate": 4.0679541483591595e-05, "loss": 2.4279, "step": 43170 }, { "epoch": 0.56, "learning_rate": 4.066951449457419e-05, "loss": 2.545, "step": 43175 }, { "epoch": 0.56, "learning_rate": 4.065948789431683e-05, "loss": 2.477, "step": 43180 }, { "epoch": 0.56, "learning_rate": 4.064946168323723e-05, "loss": 2.4639, "step": 43185 }, { "epoch": 0.56, "learning_rate": 4.063943586175316e-05, "loss": 2.5122, "step": 43190 }, { "epoch": 0.56, "learning_rate": 4.062941043028237e-05, "loss": 2.6227, "step": 43195 }, { "epoch": 0.56, "learning_rate": 4.061938538924255e-05, "loss": 2.5471, "step": 43200 }, { "epoch": 0.56, "learning_rate": 4.060936073905143e-05, "loss": 2.5434, "step": 43205 }, { "epoch": 0.56, "learning_rate": 4.059933648012665e-05, "loss": 2.4134, "step": 43210 }, { "epoch": 0.56, "learning_rate": 4.0589312612885896e-05, "loss": 2.5887, "step": 43215 }, { "epoch": 0.56, "learning_rate": 4.0579289137746845e-05, "loss": 2.5624, "step": 43220 }, { "epoch": 0.56, "learning_rate": 4.056926605512708e-05, "loss": 2.5101, "step": 43225 }, { "epoch": 0.56, "learning_rate": 4.055924336544426e-05, "loss": 2.4866, "step": 43230 }, { "epoch": 0.56, "learning_rate": 4.054922106911596e-05, "loss": 2.4294, "step": 43235 }, { "epoch": 0.56, "learning_rate": 4.05391991665598e-05, "loss": 2.509, "step": 43240 }, { "epoch": 0.56, "learning_rate": 4.0529177658193296e-05, "loss": 2.6903, "step": 43245 }, { "epoch": 0.56, "learning_rate": 4.051915654443403e-05, "loss": 2.5162, "step": 43250 }, { "epoch": 0.56, "learning_rate": 4.050913582569956e-05, "loss": 2.6368, "step": 43255 }, { "epoch": 0.56, "learning_rate": 4.0499115502407355e-05, "loss": 2.7046, "step": 43260 }, { "epoch": 0.56, "learning_rate": 4.048909557497495e-05, "loss": 2.6293, "step": 43265 }, { "epoch": 0.56, "learning_rate": 4.047907604381982e-05, "loss": 2.4581, "step": 43270 }, { "epoch": 0.56, "learning_rate": 4.046905690935946e-05, "loss": 2.5377, "step": 43275 }, { "epoch": 0.56, "learning_rate": 4.0459038172011274e-05, "loss": 2.6344, "step": 43280 }, { "epoch": 0.56, "learning_rate": 4.044901983219273e-05, "loss": 2.4609, "step": 43285 }, { "epoch": 0.56, "learning_rate": 4.043900189032126e-05, "loss": 2.489, "step": 43290 }, { "epoch": 0.56, "learning_rate": 4.042898434681422e-05, "loss": 2.4678, "step": 43295 }, { "epoch": 0.56, "learning_rate": 4.041896720208907e-05, "loss": 2.4823, "step": 43300 }, { "epoch": 0.56, "learning_rate": 4.040895045656311e-05, "loss": 2.702, "step": 43305 }, { "epoch": 0.56, "learning_rate": 4.039893411065372e-05, "loss": 2.4167, "step": 43310 }, { "epoch": 0.56, "learning_rate": 4.038891816477826e-05, "loss": 2.5271, "step": 43315 }, { "epoch": 0.56, "learning_rate": 4.0378902619354e-05, "loss": 2.5849, "step": 43320 }, { "epoch": 0.56, "learning_rate": 4.036888747479829e-05, "loss": 2.5031, "step": 43325 }, { "epoch": 0.56, "learning_rate": 4.035887273152838e-05, "loss": 2.4873, "step": 43330 }, { "epoch": 0.56, "learning_rate": 4.034885838996158e-05, "loss": 2.5566, "step": 43335 }, { "epoch": 0.56, "learning_rate": 4.0338844450515115e-05, "loss": 2.6784, "step": 43340 }, { "epoch": 0.56, "learning_rate": 4.0328830913606215e-05, "loss": 2.5019, "step": 43345 }, { "epoch": 0.56, "learning_rate": 4.031881777965214e-05, "loss": 2.5515, "step": 43350 }, { "epoch": 0.56, "learning_rate": 4.030880504907003e-05, "loss": 2.37, "step": 43355 }, { "epoch": 0.56, "learning_rate": 4.0298792722277136e-05, "loss": 2.4454, "step": 43360 }, { "epoch": 0.56, "learning_rate": 4.028878079969057e-05, "loss": 2.4211, "step": 43365 }, { "epoch": 0.56, "learning_rate": 4.027876928172752e-05, "loss": 2.4471, "step": 43370 }, { "epoch": 0.56, "learning_rate": 4.0268758168805143e-05, "loss": 2.6054, "step": 43375 }, { "epoch": 0.56, "learning_rate": 4.02587474613405e-05, "loss": 2.4688, "step": 43380 }, { "epoch": 0.56, "learning_rate": 4.024873715975074e-05, "loss": 2.6193, "step": 43385 }, { "epoch": 0.56, "learning_rate": 4.0238727264452914e-05, "loss": 2.511, "step": 43390 }, { "epoch": 0.56, "learning_rate": 4.0228717775864124e-05, "loss": 2.5032, "step": 43395 }, { "epoch": 0.56, "learning_rate": 4.021870869440139e-05, "loss": 2.4686, "step": 43400 }, { "epoch": 0.56, "learning_rate": 4.020870002048175e-05, "loss": 2.5525, "step": 43405 }, { "epoch": 0.56, "learning_rate": 4.019869175452225e-05, "loss": 2.5246, "step": 43410 }, { "epoch": 0.56, "learning_rate": 4.0188683896939855e-05, "loss": 2.6182, "step": 43415 }, { "epoch": 0.56, "learning_rate": 4.0178676448151576e-05, "loss": 2.4765, "step": 43420 }, { "epoch": 0.56, "learning_rate": 4.016866940857435e-05, "loss": 2.465, "step": 43425 }, { "epoch": 0.56, "learning_rate": 4.0158662778625145e-05, "loss": 2.5566, "step": 43430 }, { "epoch": 0.56, "learning_rate": 4.0148656558720906e-05, "loss": 2.4537, "step": 43435 }, { "epoch": 0.56, "learning_rate": 4.013865074927852e-05, "loss": 2.3636, "step": 43440 }, { "epoch": 0.56, "learning_rate": 4.012864535071492e-05, "loss": 2.5171, "step": 43445 }, { "epoch": 0.56, "learning_rate": 4.011864036344694e-05, "loss": 2.5653, "step": 43450 }, { "epoch": 0.56, "learning_rate": 4.010863578789147e-05, "loss": 2.4167, "step": 43455 }, { "epoch": 0.56, "learning_rate": 4.009863162446535e-05, "loss": 2.4867, "step": 43460 }, { "epoch": 0.56, "learning_rate": 4.008862787358541e-05, "loss": 2.5473, "step": 43465 }, { "epoch": 0.56, "learning_rate": 4.0078624535668486e-05, "loss": 2.5464, "step": 43470 }, { "epoch": 0.56, "learning_rate": 4.006862161113133e-05, "loss": 2.6208, "step": 43475 }, { "epoch": 0.56, "learning_rate": 4.005861910039076e-05, "loss": 2.5354, "step": 43480 }, { "epoch": 0.56, "learning_rate": 4.0048617003863495e-05, "loss": 2.4471, "step": 43485 }, { "epoch": 0.56, "learning_rate": 4.003861532196633e-05, "loss": 2.4404, "step": 43490 }, { "epoch": 0.56, "learning_rate": 4.0028614055115936e-05, "loss": 2.4196, "step": 43495 }, { "epoch": 0.56, "learning_rate": 4.001861320372905e-05, "loss": 2.5882, "step": 43500 }, { "epoch": 0.56, "learning_rate": 4.000861276822238e-05, "loss": 2.4315, "step": 43505 }, { "epoch": 0.56, "learning_rate": 3.999861274901256e-05, "loss": 2.4726, "step": 43510 }, { "epoch": 0.56, "learning_rate": 3.998861314651628e-05, "loss": 2.5247, "step": 43515 }, { "epoch": 0.56, "learning_rate": 3.9978613961150145e-05, "loss": 2.461, "step": 43520 }, { "epoch": 0.56, "learning_rate": 3.996861519333081e-05, "loss": 2.5254, "step": 43525 }, { "epoch": 0.56, "learning_rate": 3.995861684347488e-05, "loss": 2.6675, "step": 43530 }, { "epoch": 0.56, "learning_rate": 3.9948618911998905e-05, "loss": 2.5129, "step": 43535 }, { "epoch": 0.57, "learning_rate": 3.993862139931951e-05, "loss": 2.607, "step": 43540 }, { "epoch": 0.57, "learning_rate": 3.9928624305853184e-05, "loss": 2.3862, "step": 43545 }, { "epoch": 0.57, "learning_rate": 3.991862763201651e-05, "loss": 2.5695, "step": 43550 }, { "epoch": 0.57, "learning_rate": 3.990863137822597e-05, "loss": 2.4666, "step": 43555 }, { "epoch": 0.57, "learning_rate": 3.989863554489809e-05, "loss": 2.5141, "step": 43560 }, { "epoch": 0.57, "learning_rate": 3.988864013244937e-05, "loss": 2.597, "step": 43565 }, { "epoch": 0.57, "learning_rate": 3.987864514129622e-05, "loss": 2.4594, "step": 43570 }, { "epoch": 0.57, "learning_rate": 3.986865057185512e-05, "loss": 2.4378, "step": 43575 }, { "epoch": 0.57, "learning_rate": 3.985865642454249e-05, "loss": 2.5489, "step": 43580 }, { "epoch": 0.57, "learning_rate": 3.984866269977475e-05, "loss": 2.4071, "step": 43585 }, { "epoch": 0.57, "learning_rate": 3.983866939796831e-05, "loss": 2.5005, "step": 43590 }, { "epoch": 0.57, "learning_rate": 3.982867651953951e-05, "loss": 2.612, "step": 43595 }, { "epoch": 0.57, "learning_rate": 3.981868406490474e-05, "loss": 2.6285, "step": 43600 }, { "epoch": 0.57, "learning_rate": 3.9808692034480315e-05, "loss": 2.5827, "step": 43605 }, { "epoch": 0.57, "learning_rate": 3.9798700428682584e-05, "loss": 2.5419, "step": 43610 }, { "epoch": 0.57, "learning_rate": 3.978870924792782e-05, "loss": 2.5917, "step": 43615 }, { "epoch": 0.57, "learning_rate": 3.977871849263234e-05, "loss": 2.4413, "step": 43620 }, { "epoch": 0.57, "learning_rate": 3.976872816321243e-05, "loss": 2.5165, "step": 43625 }, { "epoch": 0.57, "learning_rate": 3.975873826008429e-05, "loss": 2.5604, "step": 43630 }, { "epoch": 0.57, "learning_rate": 3.97487487836642e-05, "loss": 2.5387, "step": 43635 }, { "epoch": 0.57, "learning_rate": 3.9738759734368364e-05, "loss": 2.5974, "step": 43640 }, { "epoch": 0.57, "learning_rate": 3.972877111261296e-05, "loss": 2.52, "step": 43645 }, { "epoch": 0.57, "learning_rate": 3.971878291881421e-05, "loss": 2.6094, "step": 43650 }, { "epoch": 0.57, "learning_rate": 3.970879515338824e-05, "loss": 2.5703, "step": 43655 }, { "epoch": 0.57, "learning_rate": 3.969880781675124e-05, "loss": 2.5577, "step": 43660 }, { "epoch": 0.57, "learning_rate": 3.968882090931928e-05, "loss": 2.681, "step": 43665 }, { "epoch": 0.57, "learning_rate": 3.967883443150852e-05, "loss": 2.4464, "step": 43670 }, { "epoch": 0.57, "learning_rate": 3.9668848383735016e-05, "loss": 2.3558, "step": 43675 }, { "epoch": 0.57, "learning_rate": 3.965886276641486e-05, "loss": 2.582, "step": 43680 }, { "epoch": 0.57, "learning_rate": 3.964887757996413e-05, "loss": 2.4352, "step": 43685 }, { "epoch": 0.57, "learning_rate": 3.963889282479883e-05, "loss": 2.5531, "step": 43690 }, { "epoch": 0.57, "learning_rate": 3.962890850133501e-05, "loss": 2.6673, "step": 43695 }, { "epoch": 0.57, "learning_rate": 3.961892460998863e-05, "loss": 2.5331, "step": 43700 }, { "epoch": 0.57, "learning_rate": 3.960894115117571e-05, "loss": 2.4527, "step": 43705 }, { "epoch": 0.57, "learning_rate": 3.95989581253122e-05, "loss": 2.3887, "step": 43710 }, { "epoch": 0.57, "learning_rate": 3.9588975532814056e-05, "loss": 2.5299, "step": 43715 }, { "epoch": 0.57, "learning_rate": 3.9578993374097227e-05, "loss": 2.5574, "step": 43720 }, { "epoch": 0.57, "learning_rate": 3.9569011649577584e-05, "loss": 2.6742, "step": 43725 }, { "epoch": 0.57, "learning_rate": 3.9559030359671054e-05, "loss": 2.4923, "step": 43730 }, { "epoch": 0.57, "learning_rate": 3.95490495047935e-05, "loss": 2.437, "step": 43735 }, { "epoch": 0.57, "learning_rate": 3.953906908536078e-05, "loss": 2.6521, "step": 43740 }, { "epoch": 0.57, "learning_rate": 3.9529089101788746e-05, "loss": 2.516, "step": 43745 }, { "epoch": 0.57, "learning_rate": 3.9519109554493196e-05, "loss": 2.4494, "step": 43750 }, { "epoch": 0.57, "learning_rate": 3.950913044388997e-05, "loss": 2.4742, "step": 43755 }, { "epoch": 0.57, "learning_rate": 3.949915177039481e-05, "loss": 2.6225, "step": 43760 }, { "epoch": 0.57, "learning_rate": 3.948917353442351e-05, "loss": 2.4497, "step": 43765 }, { "epoch": 0.57, "learning_rate": 3.947919573639181e-05, "loss": 2.4413, "step": 43770 }, { "epoch": 0.57, "learning_rate": 3.9469218376715444e-05, "loss": 2.6096, "step": 43775 }, { "epoch": 0.57, "learning_rate": 3.9459241455810135e-05, "loss": 2.609, "step": 43780 }, { "epoch": 0.57, "learning_rate": 3.944926497409156e-05, "loss": 2.5393, "step": 43785 }, { "epoch": 0.57, "learning_rate": 3.943928893197541e-05, "loss": 2.48, "step": 43790 }, { "epoch": 0.57, "learning_rate": 3.9429313329877314e-05, "loss": 2.5835, "step": 43795 }, { "epoch": 0.57, "learning_rate": 3.941933816821294e-05, "loss": 2.6044, "step": 43800 }, { "epoch": 0.57, "learning_rate": 3.94093634473979e-05, "loss": 2.4676, "step": 43805 }, { "epoch": 0.57, "learning_rate": 3.939938916784779e-05, "loss": 2.564, "step": 43810 }, { "epoch": 0.57, "learning_rate": 3.9389415329978226e-05, "loss": 2.5384, "step": 43815 }, { "epoch": 0.57, "learning_rate": 3.9379441934204716e-05, "loss": 2.5344, "step": 43820 }, { "epoch": 0.57, "learning_rate": 3.936946898094286e-05, "loss": 2.5512, "step": 43825 }, { "epoch": 0.57, "learning_rate": 3.935949647060815e-05, "loss": 2.6111, "step": 43830 }, { "epoch": 0.57, "learning_rate": 3.934952440361611e-05, "loss": 2.5414, "step": 43835 }, { "epoch": 0.57, "learning_rate": 3.933955278038226e-05, "loss": 2.5259, "step": 43840 }, { "epoch": 0.57, "learning_rate": 3.932958160132202e-05, "loss": 2.3497, "step": 43845 }, { "epoch": 0.57, "learning_rate": 3.9319610866850905e-05, "loss": 2.5259, "step": 43850 }, { "epoch": 0.57, "learning_rate": 3.930964057738429e-05, "loss": 2.4182, "step": 43855 }, { "epoch": 0.57, "learning_rate": 3.929967073333762e-05, "loss": 2.3927, "step": 43860 }, { "epoch": 0.57, "learning_rate": 3.928970133512631e-05, "loss": 2.4998, "step": 43865 }, { "epoch": 0.57, "learning_rate": 3.927973238316571e-05, "loss": 2.5757, "step": 43870 }, { "epoch": 0.57, "learning_rate": 3.926976387787123e-05, "loss": 2.5633, "step": 43875 }, { "epoch": 0.57, "learning_rate": 3.9259795819658156e-05, "loss": 2.5679, "step": 43880 }, { "epoch": 0.57, "learning_rate": 3.924982820894186e-05, "loss": 2.4834, "step": 43885 }, { "epoch": 0.57, "learning_rate": 3.9239861046137604e-05, "loss": 2.4761, "step": 43890 }, { "epoch": 0.57, "learning_rate": 3.9229894331660696e-05, "loss": 2.5084, "step": 43895 }, { "epoch": 0.57, "learning_rate": 3.921992806592643e-05, "loss": 2.5283, "step": 43900 }, { "epoch": 0.57, "learning_rate": 3.9209962249350015e-05, "loss": 2.4962, "step": 43905 }, { "epoch": 0.57, "learning_rate": 3.9199996882346726e-05, "loss": 2.4948, "step": 43910 }, { "epoch": 0.57, "learning_rate": 3.9190031965331724e-05, "loss": 2.3995, "step": 43915 }, { "epoch": 0.57, "learning_rate": 3.9180067498720244e-05, "loss": 2.5883, "step": 43920 }, { "epoch": 0.57, "learning_rate": 3.9170103482927433e-05, "loss": 2.4636, "step": 43925 }, { "epoch": 0.57, "learning_rate": 3.916013991836847e-05, "loss": 2.6738, "step": 43930 }, { "epoch": 0.57, "learning_rate": 3.9150176805458494e-05, "loss": 2.4623, "step": 43935 }, { "epoch": 0.57, "learning_rate": 3.91402141446126e-05, "loss": 2.4544, "step": 43940 }, { "epoch": 0.57, "learning_rate": 3.913025193624592e-05, "loss": 2.5826, "step": 43945 }, { "epoch": 0.57, "learning_rate": 3.91202901807735e-05, "loss": 2.4506, "step": 43950 }, { "epoch": 0.57, "learning_rate": 3.911032887861042e-05, "loss": 2.5513, "step": 43955 }, { "epoch": 0.57, "learning_rate": 3.910036803017173e-05, "loss": 2.5311, "step": 43960 }, { "epoch": 0.57, "learning_rate": 3.909040763587243e-05, "loss": 2.5496, "step": 43965 }, { "epoch": 0.57, "learning_rate": 3.908044769612758e-05, "loss": 2.4892, "step": 43970 }, { "epoch": 0.57, "learning_rate": 3.907048821135209e-05, "loss": 2.4281, "step": 43975 }, { "epoch": 0.57, "learning_rate": 3.9060529181961e-05, "loss": 2.5381, "step": 43980 }, { "epoch": 0.57, "learning_rate": 3.90505706083692e-05, "loss": 2.4319, "step": 43985 }, { "epoch": 0.57, "learning_rate": 3.9040612490991646e-05, "loss": 2.4996, "step": 43990 }, { "epoch": 0.57, "learning_rate": 3.903065483024326e-05, "loss": 2.6448, "step": 43995 }, { "epoch": 0.57, "learning_rate": 3.902069762653891e-05, "loss": 2.4226, "step": 44000 }, { "epoch": 0.57, "learning_rate": 3.9010740880293504e-05, "loss": 2.6317, "step": 44005 }, { "epoch": 0.57, "learning_rate": 3.900078459192185e-05, "loss": 2.5489, "step": 44010 }, { "epoch": 0.57, "learning_rate": 3.8990828761838796e-05, "loss": 2.5071, "step": 44015 }, { "epoch": 0.57, "learning_rate": 3.898087339045918e-05, "loss": 2.4691, "step": 44020 }, { "epoch": 0.57, "learning_rate": 3.8970918478197776e-05, "loss": 2.3152, "step": 44025 }, { "epoch": 0.57, "learning_rate": 3.896096402546939e-05, "loss": 2.5785, "step": 44030 }, { "epoch": 0.57, "learning_rate": 3.895101003268874e-05, "loss": 2.4776, "step": 44035 }, { "epoch": 0.57, "learning_rate": 3.894105650027059e-05, "loss": 2.6324, "step": 44040 }, { "epoch": 0.57, "learning_rate": 3.893110342862965e-05, "loss": 2.721, "step": 44045 }, { "epoch": 0.57, "learning_rate": 3.892115081818062e-05, "loss": 2.4659, "step": 44050 }, { "epoch": 0.57, "learning_rate": 3.891119866933819e-05, "loss": 2.4757, "step": 44055 }, { "epoch": 0.57, "learning_rate": 3.8901246982517004e-05, "loss": 2.6005, "step": 44060 }, { "epoch": 0.57, "learning_rate": 3.889129575813175e-05, "loss": 2.5838, "step": 44065 }, { "epoch": 0.57, "learning_rate": 3.888134499659699e-05, "loss": 2.4665, "step": 44070 }, { "epoch": 0.57, "learning_rate": 3.8871394698327354e-05, "loss": 2.4794, "step": 44075 }, { "epoch": 0.57, "learning_rate": 3.8861444863737454e-05, "loss": 2.6006, "step": 44080 }, { "epoch": 0.57, "learning_rate": 3.885149549324181e-05, "loss": 2.4705, "step": 44085 }, { "epoch": 0.57, "learning_rate": 3.8841546587255006e-05, "loss": 2.6388, "step": 44090 }, { "epoch": 0.57, "learning_rate": 3.883159814619154e-05, "loss": 2.5732, "step": 44095 }, { "epoch": 0.57, "learning_rate": 3.882165017046595e-05, "loss": 2.4665, "step": 44100 }, { "epoch": 0.57, "learning_rate": 3.881170266049269e-05, "loss": 2.4124, "step": 44105 }, { "epoch": 0.57, "learning_rate": 3.880175561668624e-05, "loss": 2.5151, "step": 44110 }, { "epoch": 0.57, "learning_rate": 3.879180903946107e-05, "loss": 2.7035, "step": 44115 }, { "epoch": 0.57, "learning_rate": 3.878186292923158e-05, "loss": 2.6189, "step": 44120 }, { "epoch": 0.57, "learning_rate": 3.877191728641221e-05, "loss": 2.6009, "step": 44125 }, { "epoch": 0.57, "learning_rate": 3.876197211141732e-05, "loss": 2.4924, "step": 44130 }, { "epoch": 0.57, "learning_rate": 3.875202740466132e-05, "loss": 2.5605, "step": 44135 }, { "epoch": 0.57, "learning_rate": 3.8742083166558515e-05, "loss": 2.5143, "step": 44140 }, { "epoch": 0.57, "learning_rate": 3.873213939752326e-05, "loss": 2.437, "step": 44145 }, { "epoch": 0.57, "learning_rate": 3.8722196097969886e-05, "loss": 2.3095, "step": 44150 }, { "epoch": 0.57, "learning_rate": 3.871225326831265e-05, "loss": 2.5728, "step": 44155 }, { "epoch": 0.57, "learning_rate": 3.870231090896588e-05, "loss": 2.4927, "step": 44160 }, { "epoch": 0.57, "learning_rate": 3.8692369020343764e-05, "loss": 2.6174, "step": 44165 }, { "epoch": 0.57, "learning_rate": 3.8682427602860563e-05, "loss": 2.4703, "step": 44170 }, { "epoch": 0.57, "learning_rate": 3.8672486656930525e-05, "loss": 2.5129, "step": 44175 }, { "epoch": 0.57, "learning_rate": 3.866254618296779e-05, "loss": 2.5938, "step": 44180 }, { "epoch": 0.57, "learning_rate": 3.8652606181386576e-05, "loss": 2.5793, "step": 44185 }, { "epoch": 0.57, "learning_rate": 3.864266665260101e-05, "loss": 2.5697, "step": 44190 }, { "epoch": 0.57, "learning_rate": 3.863272759702526e-05, "loss": 2.4995, "step": 44195 }, { "epoch": 0.57, "learning_rate": 3.86227890150734e-05, "loss": 2.5462, "step": 44200 }, { "epoch": 0.57, "learning_rate": 3.861285090715956e-05, "loss": 2.4341, "step": 44205 }, { "epoch": 0.57, "learning_rate": 3.860291327369781e-05, "loss": 2.4597, "step": 44210 }, { "epoch": 0.57, "learning_rate": 3.85929761151022e-05, "loss": 2.4305, "step": 44215 }, { "epoch": 0.57, "learning_rate": 3.858303943178678e-05, "loss": 2.5969, "step": 44220 }, { "epoch": 0.57, "learning_rate": 3.8573103224165555e-05, "loss": 2.5979, "step": 44225 }, { "epoch": 0.57, "learning_rate": 3.8563167492652516e-05, "loss": 2.6384, "step": 44230 }, { "epoch": 0.57, "learning_rate": 3.855323223766167e-05, "loss": 2.5886, "step": 44235 }, { "epoch": 0.57, "learning_rate": 3.854329745960695e-05, "loss": 2.5589, "step": 44240 }, { "epoch": 0.57, "learning_rate": 3.85333631589023e-05, "loss": 2.5376, "step": 44245 }, { "epoch": 0.57, "learning_rate": 3.8523429335961636e-05, "loss": 2.5088, "step": 44250 }, { "epoch": 0.57, "learning_rate": 3.851349599119888e-05, "loss": 2.5236, "step": 44255 }, { "epoch": 0.57, "learning_rate": 3.8503563125027864e-05, "loss": 2.4985, "step": 44260 }, { "epoch": 0.57, "learning_rate": 3.849363073786248e-05, "loss": 2.427, "step": 44265 }, { "epoch": 0.57, "learning_rate": 3.8483698830116574e-05, "loss": 2.6068, "step": 44270 }, { "epoch": 0.57, "learning_rate": 3.847376740220394e-05, "loss": 2.5105, "step": 44275 }, { "epoch": 0.57, "learning_rate": 3.846383645453839e-05, "loss": 2.4096, "step": 44280 }, { "epoch": 0.57, "learning_rate": 3.845390598753369e-05, "loss": 2.5707, "step": 44285 }, { "epoch": 0.57, "learning_rate": 3.844397600160361e-05, "loss": 2.3985, "step": 44290 }, { "epoch": 0.57, "learning_rate": 3.8434046497161907e-05, "loss": 2.6734, "step": 44295 }, { "epoch": 0.57, "learning_rate": 3.842411747462226e-05, "loss": 2.5246, "step": 44300 }, { "epoch": 0.57, "learning_rate": 3.8414188934398395e-05, "loss": 2.5113, "step": 44305 }, { "epoch": 0.58, "learning_rate": 3.840426087690397e-05, "loss": 2.654, "step": 44310 }, { "epoch": 0.58, "learning_rate": 3.839433330255268e-05, "loss": 2.5043, "step": 44315 }, { "epoch": 0.58, "learning_rate": 3.8384406211758116e-05, "loss": 2.5984, "step": 44320 }, { "epoch": 0.58, "learning_rate": 3.8374479604933915e-05, "loss": 2.4707, "step": 44325 }, { "epoch": 0.58, "learning_rate": 3.8364553482493704e-05, "loss": 2.5048, "step": 44330 }, { "epoch": 0.58, "learning_rate": 3.835462784485101e-05, "loss": 2.5188, "step": 44335 }, { "epoch": 0.58, "learning_rate": 3.834470269241943e-05, "loss": 2.4237, "step": 44340 }, { "epoch": 0.58, "learning_rate": 3.833477802561247e-05, "loss": 2.5502, "step": 44345 }, { "epoch": 0.58, "learning_rate": 3.832485384484369e-05, "loss": 2.4464, "step": 44350 }, { "epoch": 0.58, "learning_rate": 3.831493015052653e-05, "loss": 2.433, "step": 44355 }, { "epoch": 0.58, "learning_rate": 3.83050069430745e-05, "loss": 2.5581, "step": 44360 }, { "epoch": 0.58, "learning_rate": 3.829508422290108e-05, "loss": 2.4696, "step": 44365 }, { "epoch": 0.58, "learning_rate": 3.828516199041965e-05, "loss": 2.4705, "step": 44370 }, { "epoch": 0.58, "learning_rate": 3.827524024604366e-05, "loss": 2.5721, "step": 44375 }, { "epoch": 0.58, "learning_rate": 3.826531899018649e-05, "loss": 2.6063, "step": 44380 }, { "epoch": 0.58, "learning_rate": 3.8255398223261535e-05, "loss": 2.6784, "step": 44385 }, { "epoch": 0.58, "learning_rate": 3.8245477945682154e-05, "loss": 2.5316, "step": 44390 }, { "epoch": 0.58, "learning_rate": 3.823555815786164e-05, "loss": 2.4797, "step": 44395 }, { "epoch": 0.58, "learning_rate": 3.822563886021334e-05, "loss": 2.4432, "step": 44400 }, { "epoch": 0.58, "learning_rate": 3.8215720053150534e-05, "loss": 2.5392, "step": 44405 }, { "epoch": 0.58, "learning_rate": 3.8205801737086514e-05, "loss": 2.5177, "step": 44410 }, { "epoch": 0.58, "learning_rate": 3.819588391243451e-05, "loss": 2.4924, "step": 44415 }, { "epoch": 0.58, "learning_rate": 3.818596657960774e-05, "loss": 2.5731, "step": 44420 }, { "epoch": 0.58, "learning_rate": 3.817604973901948e-05, "loss": 2.5729, "step": 44425 }, { "epoch": 0.58, "learning_rate": 3.816613339108285e-05, "loss": 2.5092, "step": 44430 }, { "epoch": 0.58, "learning_rate": 3.8156217536211055e-05, "loss": 2.5, "step": 44435 }, { "epoch": 0.58, "learning_rate": 3.814630217481723e-05, "loss": 2.5202, "step": 44440 }, { "epoch": 0.58, "learning_rate": 3.813638730731451e-05, "loss": 2.4821, "step": 44445 }, { "epoch": 0.58, "learning_rate": 3.8126472934116023e-05, "loss": 2.5507, "step": 44450 }, { "epoch": 0.58, "learning_rate": 3.8116559055634826e-05, "loss": 2.471, "step": 44455 }, { "epoch": 0.58, "learning_rate": 3.8106645672284014e-05, "loss": 2.4429, "step": 44460 }, { "epoch": 0.58, "learning_rate": 3.8096732784476615e-05, "loss": 2.5276, "step": 44465 }, { "epoch": 0.58, "learning_rate": 3.8086820392625654e-05, "loss": 2.5527, "step": 44470 }, { "epoch": 0.58, "learning_rate": 3.8076908497144145e-05, "loss": 2.4868, "step": 44475 }, { "epoch": 0.58, "learning_rate": 3.806699709844506e-05, "loss": 2.6871, "step": 44480 }, { "epoch": 0.58, "learning_rate": 3.805708619694141e-05, "loss": 2.6359, "step": 44485 }, { "epoch": 0.58, "learning_rate": 3.8047175793046065e-05, "loss": 2.569, "step": 44490 }, { "epoch": 0.58, "learning_rate": 3.8037265887171996e-05, "loss": 2.5079, "step": 44495 }, { "epoch": 0.58, "learning_rate": 3.802735647973209e-05, "loss": 2.4956, "step": 44500 }, { "epoch": 0.58, "learning_rate": 3.8017447571139234e-05, "loss": 2.4815, "step": 44505 }, { "epoch": 0.58, "learning_rate": 3.8007539161806297e-05, "loss": 2.4987, "step": 44510 }, { "epoch": 0.58, "learning_rate": 3.799763125214609e-05, "loss": 2.456, "step": 44515 }, { "epoch": 0.58, "learning_rate": 3.7987723842571474e-05, "loss": 2.3969, "step": 44520 }, { "epoch": 0.58, "learning_rate": 3.79778169334952e-05, "loss": 2.3962, "step": 44525 }, { "epoch": 0.58, "learning_rate": 3.796791052533008e-05, "loss": 2.4739, "step": 44530 }, { "epoch": 0.58, "learning_rate": 3.795800461848884e-05, "loss": 2.5569, "step": 44535 }, { "epoch": 0.58, "learning_rate": 3.794809921338424e-05, "loss": 2.4834, "step": 44540 }, { "epoch": 0.58, "learning_rate": 3.793819431042901e-05, "loss": 2.4603, "step": 44545 }, { "epoch": 0.58, "learning_rate": 3.792828991003579e-05, "loss": 2.5751, "step": 44550 }, { "epoch": 0.58, "learning_rate": 3.79183860126173e-05, "loss": 2.498, "step": 44555 }, { "epoch": 0.58, "learning_rate": 3.790848261858616e-05, "loss": 2.5479, "step": 44560 }, { "epoch": 0.58, "learning_rate": 3.7898579728355045e-05, "loss": 2.3973, "step": 44565 }, { "epoch": 0.58, "learning_rate": 3.788867734233651e-05, "loss": 2.5699, "step": 44570 }, { "epoch": 0.58, "learning_rate": 3.787877546094316e-05, "loss": 2.5438, "step": 44575 }, { "epoch": 0.58, "learning_rate": 3.7868874084587605e-05, "loss": 2.5902, "step": 44580 }, { "epoch": 0.58, "learning_rate": 3.785897321368233e-05, "loss": 2.4726, "step": 44585 }, { "epoch": 0.58, "learning_rate": 3.784907284863989e-05, "loss": 2.5318, "step": 44590 }, { "epoch": 0.58, "learning_rate": 3.783917298987279e-05, "loss": 2.523, "step": 44595 }, { "epoch": 0.58, "learning_rate": 3.782927363779351e-05, "loss": 2.4514, "step": 44600 }, { "epoch": 0.58, "learning_rate": 3.7819374792814526e-05, "loss": 2.598, "step": 44605 }, { "epoch": 0.58, "learning_rate": 3.780947645534825e-05, "loss": 2.3356, "step": 44610 }, { "epoch": 0.58, "learning_rate": 3.7799578625807135e-05, "loss": 2.5521, "step": 44615 }, { "epoch": 0.58, "learning_rate": 3.778968130460354e-05, "loss": 2.4172, "step": 44620 }, { "epoch": 0.58, "learning_rate": 3.777978449214988e-05, "loss": 2.4945, "step": 44625 }, { "epoch": 0.58, "learning_rate": 3.776988818885849e-05, "loss": 2.5232, "step": 44630 }, { "epoch": 0.58, "learning_rate": 3.7759992395141706e-05, "loss": 2.4992, "step": 44635 }, { "epoch": 0.58, "learning_rate": 3.775009711141187e-05, "loss": 2.5236, "step": 44640 }, { "epoch": 0.58, "learning_rate": 3.7740202338081234e-05, "loss": 2.5869, "step": 44645 }, { "epoch": 0.58, "learning_rate": 3.773030807556209e-05, "loss": 2.5193, "step": 44650 }, { "epoch": 0.58, "learning_rate": 3.772041432426668e-05, "loss": 2.5123, "step": 44655 }, { "epoch": 0.58, "learning_rate": 3.7710521084607236e-05, "loss": 2.5793, "step": 44660 }, { "epoch": 0.58, "learning_rate": 3.7700628356995994e-05, "loss": 2.5184, "step": 44665 }, { "epoch": 0.58, "learning_rate": 3.7690736141845086e-05, "loss": 2.6662, "step": 44670 }, { "epoch": 0.58, "learning_rate": 3.768084443956673e-05, "loss": 2.5394, "step": 44675 }, { "epoch": 0.58, "learning_rate": 3.7670953250573024e-05, "loss": 2.4697, "step": 44680 }, { "epoch": 0.58, "learning_rate": 3.766106257527612e-05, "loss": 2.4436, "step": 44685 }, { "epoch": 0.58, "learning_rate": 3.7651172414088095e-05, "loss": 2.5542, "step": 44690 }, { "epoch": 0.58, "learning_rate": 3.764128276742105e-05, "loss": 2.4732, "step": 44695 }, { "epoch": 0.58, "learning_rate": 3.7631393635687054e-05, "loss": 2.5414, "step": 44700 }, { "epoch": 0.58, "learning_rate": 3.76215050192981e-05, "loss": 2.5046, "step": 44705 }, { "epoch": 0.58, "learning_rate": 3.761161691866625e-05, "loss": 2.414, "step": 44710 }, { "epoch": 0.58, "learning_rate": 3.760172933420345e-05, "loss": 2.6542, "step": 44715 }, { "epoch": 0.58, "learning_rate": 3.75918422663217e-05, "loss": 2.4581, "step": 44720 }, { "epoch": 0.58, "learning_rate": 3.758195571543295e-05, "loss": 2.5686, "step": 44725 }, { "epoch": 0.58, "learning_rate": 3.757206968194913e-05, "loss": 2.5702, "step": 44730 }, { "epoch": 0.58, "learning_rate": 3.7562184166282156e-05, "loss": 2.4445, "step": 44735 }, { "epoch": 0.58, "learning_rate": 3.7552299168843875e-05, "loss": 2.5924, "step": 44740 }, { "epoch": 0.58, "learning_rate": 3.754241469004619e-05, "loss": 2.4799, "step": 44745 }, { "epoch": 0.58, "learning_rate": 3.753253073030093e-05, "loss": 2.5009, "step": 44750 }, { "epoch": 0.58, "learning_rate": 3.75226472900199e-05, "loss": 2.5251, "step": 44755 }, { "epoch": 0.58, "learning_rate": 3.751276436961494e-05, "loss": 2.5619, "step": 44760 }, { "epoch": 0.58, "learning_rate": 3.750288196949779e-05, "loss": 2.4821, "step": 44765 }, { "epoch": 0.58, "learning_rate": 3.7493000090080234e-05, "loss": 2.5539, "step": 44770 }, { "epoch": 0.58, "learning_rate": 3.748311873177397e-05, "loss": 2.6841, "step": 44775 }, { "epoch": 0.58, "learning_rate": 3.747323789499073e-05, "loss": 2.5931, "step": 44780 }, { "epoch": 0.58, "learning_rate": 3.7463357580142224e-05, "loss": 2.4449, "step": 44785 }, { "epoch": 0.58, "learning_rate": 3.745347778764008e-05, "loss": 2.5348, "step": 44790 }, { "epoch": 0.58, "learning_rate": 3.7443598517896e-05, "loss": 2.5682, "step": 44795 }, { "epoch": 0.58, "learning_rate": 3.743371977132154e-05, "loss": 2.5511, "step": 44800 }, { "epoch": 0.58, "learning_rate": 3.742384154832838e-05, "loss": 2.5257, "step": 44805 }, { "epoch": 0.58, "learning_rate": 3.741396384932804e-05, "loss": 2.6064, "step": 44810 }, { "epoch": 0.58, "learning_rate": 3.74040866747321e-05, "loss": 2.5682, "step": 44815 }, { "epoch": 0.58, "learning_rate": 3.73942100249521e-05, "loss": 2.5992, "step": 44820 }, { "epoch": 0.58, "learning_rate": 3.738433390039956e-05, "loss": 2.4069, "step": 44825 }, { "epoch": 0.58, "learning_rate": 3.737445830148599e-05, "loss": 2.6105, "step": 44830 }, { "epoch": 0.58, "learning_rate": 3.7364583228622824e-05, "loss": 2.7062, "step": 44835 }, { "epoch": 0.58, "learning_rate": 3.735470868222154e-05, "loss": 2.5932, "step": 44840 }, { "epoch": 0.58, "learning_rate": 3.734483466269355e-05, "loss": 2.4662, "step": 44845 }, { "epoch": 0.58, "learning_rate": 3.733496117045028e-05, "loss": 2.6553, "step": 44850 }, { "epoch": 0.58, "learning_rate": 3.732508820590311e-05, "loss": 2.5434, "step": 44855 }, { "epoch": 0.58, "learning_rate": 3.7315215769463383e-05, "loss": 2.6038, "step": 44860 }, { "epoch": 0.58, "learning_rate": 3.730534386154248e-05, "loss": 2.5563, "step": 44865 }, { "epoch": 0.58, "learning_rate": 3.729547248255166e-05, "loss": 2.6859, "step": 44870 }, { "epoch": 0.58, "learning_rate": 3.728560163290227e-05, "loss": 2.5012, "step": 44875 }, { "epoch": 0.58, "learning_rate": 3.727573131300557e-05, "loss": 2.5634, "step": 44880 }, { "epoch": 0.58, "learning_rate": 3.72658615232728e-05, "loss": 2.5396, "step": 44885 }, { "epoch": 0.58, "learning_rate": 3.725599226411522e-05, "loss": 2.4519, "step": 44890 }, { "epoch": 0.58, "learning_rate": 3.7246123535944e-05, "loss": 2.5991, "step": 44895 }, { "epoch": 0.58, "learning_rate": 3.723625533917038e-05, "loss": 2.5514, "step": 44900 }, { "epoch": 0.58, "learning_rate": 3.7226387674205454e-05, "loss": 2.5804, "step": 44905 }, { "epoch": 0.58, "learning_rate": 3.72165205414604e-05, "loss": 2.5044, "step": 44910 }, { "epoch": 0.58, "learning_rate": 3.720665394134635e-05, "loss": 2.5561, "step": 44915 }, { "epoch": 0.58, "learning_rate": 3.719678787427438e-05, "loss": 2.5951, "step": 44920 }, { "epoch": 0.58, "learning_rate": 3.718692234065559e-05, "loss": 2.6174, "step": 44925 }, { "epoch": 0.58, "learning_rate": 3.7177057340901e-05, "loss": 2.4407, "step": 44930 }, { "epoch": 0.58, "learning_rate": 3.716719287542167e-05, "loss": 2.5002, "step": 44935 }, { "epoch": 0.58, "learning_rate": 3.7157328944628586e-05, "loss": 2.6008, "step": 44940 }, { "epoch": 0.58, "learning_rate": 3.7147465548932746e-05, "loss": 2.5114, "step": 44945 }, { "epoch": 0.58, "learning_rate": 3.7137602688745136e-05, "loss": 2.5654, "step": 44950 }, { "epoch": 0.58, "learning_rate": 3.7127740364476654e-05, "loss": 2.5995, "step": 44955 }, { "epoch": 0.58, "learning_rate": 3.711787857653825e-05, "loss": 2.6614, "step": 44960 }, { "epoch": 0.58, "learning_rate": 3.7108017325340806e-05, "loss": 2.5632, "step": 44965 }, { "epoch": 0.58, "learning_rate": 3.70981566112952e-05, "loss": 2.66, "step": 44970 }, { "epoch": 0.58, "learning_rate": 3.7088296434812286e-05, "loss": 2.5439, "step": 44975 }, { "epoch": 0.58, "learning_rate": 3.7078436796302896e-05, "loss": 2.366, "step": 44980 }, { "epoch": 0.58, "learning_rate": 3.7068577696177846e-05, "loss": 2.5277, "step": 44985 }, { "epoch": 0.58, "learning_rate": 3.70587191348479e-05, "loss": 2.5221, "step": 44990 }, { "epoch": 0.58, "learning_rate": 3.704886111272382e-05, "loss": 2.616, "step": 44995 }, { "epoch": 0.58, "learning_rate": 3.703900363021638e-05, "loss": 2.5391, "step": 45000 }, { "epoch": 0.58, "learning_rate": 3.702914668773626e-05, "loss": 2.5476, "step": 45005 }, { "epoch": 0.58, "learning_rate": 3.701929028569418e-05, "loss": 2.5328, "step": 45010 }, { "epoch": 0.58, "learning_rate": 3.700943442450079e-05, "loss": 2.5176, "step": 45015 }, { "epoch": 0.58, "learning_rate": 3.699957910456678e-05, "loss": 2.5634, "step": 45020 }, { "epoch": 0.58, "learning_rate": 3.698972432630272e-05, "loss": 2.5943, "step": 45025 }, { "epoch": 0.58, "learning_rate": 3.697987009011925e-05, "loss": 2.5039, "step": 45030 }, { "epoch": 0.58, "learning_rate": 3.697001639642697e-05, "loss": 2.4162, "step": 45035 }, { "epoch": 0.58, "learning_rate": 3.6960163245636395e-05, "loss": 2.5272, "step": 45040 }, { "epoch": 0.58, "learning_rate": 3.6950310638158104e-05, "loss": 2.5052, "step": 45045 }, { "epoch": 0.58, "learning_rate": 3.694045857440257e-05, "loss": 2.469, "step": 45050 }, { "epoch": 0.58, "learning_rate": 3.693060705478034e-05, "loss": 2.4409, "step": 45055 }, { "epoch": 0.58, "learning_rate": 3.6920756079701816e-05, "loss": 2.5969, "step": 45060 }, { "epoch": 0.58, "learning_rate": 3.6910905649577485e-05, "loss": 2.4325, "step": 45065 }, { "epoch": 0.58, "learning_rate": 3.690105576481778e-05, "loss": 2.3498, "step": 45070 }, { "epoch": 0.58, "learning_rate": 3.689120642583307e-05, "loss": 2.48, "step": 45075 }, { "epoch": 0.59, "learning_rate": 3.688135763303378e-05, "loss": 2.5936, "step": 45080 }, { "epoch": 0.59, "learning_rate": 3.687150938683021e-05, "loss": 2.5832, "step": 45085 }, { "epoch": 0.59, "learning_rate": 3.686166168763271e-05, "loss": 2.5863, "step": 45090 }, { "epoch": 0.59, "learning_rate": 3.685181453585163e-05, "loss": 2.6599, "step": 45095 }, { "epoch": 0.59, "learning_rate": 3.6841967931897206e-05, "loss": 2.4449, "step": 45100 }, { "epoch": 0.59, "learning_rate": 3.6832121876179724e-05, "loss": 2.5659, "step": 45105 }, { "epoch": 0.59, "learning_rate": 3.682227636910942e-05, "loss": 2.479, "step": 45110 }, { "epoch": 0.59, "learning_rate": 3.6812431411096536e-05, "loss": 2.4782, "step": 45115 }, { "epoch": 0.59, "learning_rate": 3.6802587002551226e-05, "loss": 2.5922, "step": 45120 }, { "epoch": 0.59, "learning_rate": 3.679274314388369e-05, "loss": 2.4171, "step": 45125 }, { "epoch": 0.59, "learning_rate": 3.6782899835504084e-05, "loss": 2.5361, "step": 45130 }, { "epoch": 0.59, "learning_rate": 3.6773057077822505e-05, "loss": 2.4383, "step": 45135 }, { "epoch": 0.59, "learning_rate": 3.676321487124911e-05, "loss": 2.5365, "step": 45140 }, { "epoch": 0.59, "learning_rate": 3.675337321619391e-05, "loss": 2.6426, "step": 45145 }, { "epoch": 0.59, "learning_rate": 3.674353211306701e-05, "loss": 2.6566, "step": 45150 }, { "epoch": 0.59, "learning_rate": 3.6733691562278454e-05, "loss": 2.491, "step": 45155 }, { "epoch": 0.59, "learning_rate": 3.672385156423822e-05, "loss": 2.6605, "step": 45160 }, { "epoch": 0.59, "learning_rate": 3.6714012119356315e-05, "loss": 2.6089, "step": 45165 }, { "epoch": 0.59, "learning_rate": 3.6704173228042695e-05, "loss": 2.5076, "step": 45170 }, { "epoch": 0.59, "learning_rate": 3.669433489070733e-05, "loss": 2.5845, "step": 45175 }, { "epoch": 0.59, "learning_rate": 3.668449710776011e-05, "loss": 2.4864, "step": 45180 }, { "epoch": 0.59, "learning_rate": 3.667465987961093e-05, "loss": 2.4252, "step": 45185 }, { "epoch": 0.59, "learning_rate": 3.6664823206669694e-05, "loss": 2.6748, "step": 45190 }, { "epoch": 0.59, "learning_rate": 3.6654987089346226e-05, "loss": 2.5156, "step": 45195 }, { "epoch": 0.59, "learning_rate": 3.664515152805037e-05, "loss": 2.4603, "step": 45200 }, { "epoch": 0.59, "learning_rate": 3.663531652319191e-05, "loss": 2.3721, "step": 45205 }, { "epoch": 0.59, "learning_rate": 3.662548207518063e-05, "loss": 2.3496, "step": 45210 }, { "epoch": 0.59, "learning_rate": 3.6615648184426334e-05, "loss": 2.5435, "step": 45215 }, { "epoch": 0.59, "learning_rate": 3.660581485133869e-05, "loss": 2.5329, "step": 45220 }, { "epoch": 0.59, "learning_rate": 3.659598207632745e-05, "loss": 2.4711, "step": 45225 }, { "epoch": 0.59, "learning_rate": 3.658614985980229e-05, "loss": 2.588, "step": 45230 }, { "epoch": 0.59, "learning_rate": 3.657631820217289e-05, "loss": 2.5342, "step": 45235 }, { "epoch": 0.59, "learning_rate": 3.6566487103848856e-05, "loss": 2.5278, "step": 45240 }, { "epoch": 0.59, "learning_rate": 3.655665656523983e-05, "loss": 2.4165, "step": 45245 }, { "epoch": 0.59, "learning_rate": 3.6546826586755435e-05, "loss": 2.3992, "step": 45250 }, { "epoch": 0.59, "learning_rate": 3.653699716880519e-05, "loss": 2.5526, "step": 45255 }, { "epoch": 0.59, "learning_rate": 3.652716831179867e-05, "loss": 2.6522, "step": 45260 }, { "epoch": 0.59, "learning_rate": 3.651734001614539e-05, "loss": 2.5453, "step": 45265 }, { "epoch": 0.59, "learning_rate": 3.650751228225488e-05, "loss": 2.4529, "step": 45270 }, { "epoch": 0.59, "learning_rate": 3.649768511053657e-05, "loss": 2.4864, "step": 45275 }, { "epoch": 0.59, "learning_rate": 3.648785850139995e-05, "loss": 2.6344, "step": 45280 }, { "epoch": 0.59, "learning_rate": 3.647803245525445e-05, "loss": 2.4766, "step": 45285 }, { "epoch": 0.59, "learning_rate": 3.6468206972509475e-05, "loss": 2.5499, "step": 45290 }, { "epoch": 0.59, "learning_rate": 3.6458382053574394e-05, "loss": 2.4788, "step": 45295 }, { "epoch": 0.59, "learning_rate": 3.644855769885858e-05, "loss": 2.5281, "step": 45300 }, { "epoch": 0.59, "learning_rate": 3.643873390877136e-05, "loss": 2.6691, "step": 45305 }, { "epoch": 0.59, "learning_rate": 3.642891068372208e-05, "loss": 2.5651, "step": 45310 }, { "epoch": 0.59, "learning_rate": 3.641908802411999e-05, "loss": 2.528, "step": 45315 }, { "epoch": 0.59, "learning_rate": 3.640926593037438e-05, "loss": 2.3641, "step": 45320 }, { "epoch": 0.59, "learning_rate": 3.639944440289448e-05, "loss": 2.562, "step": 45325 }, { "epoch": 0.59, "learning_rate": 3.6389623442089525e-05, "loss": 2.4715, "step": 45330 }, { "epoch": 0.59, "learning_rate": 3.63798030483687e-05, "loss": 2.4508, "step": 45335 }, { "epoch": 0.59, "learning_rate": 3.6369983222141166e-05, "loss": 2.4129, "step": 45340 }, { "epoch": 0.59, "learning_rate": 3.6360163963816114e-05, "loss": 2.5324, "step": 45345 }, { "epoch": 0.59, "learning_rate": 3.6350345273802614e-05, "loss": 2.5469, "step": 45350 }, { "epoch": 0.59, "learning_rate": 3.634052715250981e-05, "loss": 2.5157, "step": 45355 }, { "epoch": 0.59, "learning_rate": 3.633070960034675e-05, "loss": 2.4554, "step": 45360 }, { "epoch": 0.59, "learning_rate": 3.63208926177225e-05, "loss": 2.5888, "step": 45365 }, { "epoch": 0.59, "learning_rate": 3.631107620504612e-05, "loss": 2.5043, "step": 45370 }, { "epoch": 0.59, "learning_rate": 3.630126036272656e-05, "loss": 2.4402, "step": 45375 }, { "epoch": 0.59, "learning_rate": 3.629144509117285e-05, "loss": 2.469, "step": 45380 }, { "epoch": 0.59, "learning_rate": 3.628163039079391e-05, "loss": 2.6941, "step": 45385 }, { "epoch": 0.59, "learning_rate": 3.627181626199871e-05, "loss": 2.6096, "step": 45390 }, { "epoch": 0.59, "learning_rate": 3.626200270519614e-05, "loss": 2.6481, "step": 45395 }, { "epoch": 0.59, "learning_rate": 3.625218972079509e-05, "loss": 2.5547, "step": 45400 }, { "epoch": 0.59, "learning_rate": 3.6242377309204445e-05, "loss": 2.4843, "step": 45405 }, { "epoch": 0.59, "learning_rate": 3.6232565470833e-05, "loss": 2.4039, "step": 45410 }, { "epoch": 0.59, "learning_rate": 3.6222754206089624e-05, "loss": 2.5801, "step": 45415 }, { "epoch": 0.59, "learning_rate": 3.6212943515383056e-05, "loss": 2.6076, "step": 45420 }, { "epoch": 0.59, "learning_rate": 3.6203133399122104e-05, "loss": 2.6099, "step": 45425 }, { "epoch": 0.59, "learning_rate": 3.619332385771551e-05, "loss": 2.4555, "step": 45430 }, { "epoch": 0.59, "learning_rate": 3.618351489157197e-05, "loss": 2.4929, "step": 45435 }, { "epoch": 0.59, "learning_rate": 3.617370650110021e-05, "loss": 2.5945, "step": 45440 }, { "epoch": 0.59, "learning_rate": 3.6163898686708864e-05, "loss": 2.6539, "step": 45445 }, { "epoch": 0.59, "learning_rate": 3.6154091448806616e-05, "loss": 2.5981, "step": 45450 }, { "epoch": 0.59, "learning_rate": 3.614428478780206e-05, "loss": 2.5407, "step": 45455 }, { "epoch": 0.59, "learning_rate": 3.613447870410381e-05, "loss": 2.3631, "step": 45460 }, { "epoch": 0.59, "learning_rate": 3.6124673198120474e-05, "loss": 2.4468, "step": 45465 }, { "epoch": 0.59, "learning_rate": 3.611486827026055e-05, "loss": 2.6707, "step": 45470 }, { "epoch": 0.59, "learning_rate": 3.61050639209326e-05, "loss": 2.4245, "step": 45475 }, { "epoch": 0.59, "learning_rate": 3.609526015054511e-05, "loss": 2.592, "step": 45480 }, { "epoch": 0.59, "learning_rate": 3.608545695950658e-05, "loss": 2.4398, "step": 45485 }, { "epoch": 0.59, "learning_rate": 3.607565434822544e-05, "loss": 2.6023, "step": 45490 }, { "epoch": 0.59, "learning_rate": 3.606585231711013e-05, "loss": 2.5523, "step": 45495 }, { "epoch": 0.59, "learning_rate": 3.605605086656909e-05, "loss": 2.5651, "step": 45500 }, { "epoch": 0.59, "learning_rate": 3.604624999701065e-05, "loss": 2.4523, "step": 45505 }, { "epoch": 0.59, "learning_rate": 3.60364497088432e-05, "loss": 2.4512, "step": 45510 }, { "epoch": 0.59, "learning_rate": 3.602665000247506e-05, "loss": 2.614, "step": 45515 }, { "epoch": 0.59, "learning_rate": 3.601685087831455e-05, "loss": 2.4972, "step": 45520 }, { "epoch": 0.59, "learning_rate": 3.600705233676998e-05, "loss": 2.4814, "step": 45525 }, { "epoch": 0.59, "learning_rate": 3.599725437824956e-05, "loss": 2.5005, "step": 45530 }, { "epoch": 0.59, "learning_rate": 3.598745700316157e-05, "loss": 2.4042, "step": 45535 }, { "epoch": 0.59, "learning_rate": 3.5977660211914196e-05, "loss": 2.5169, "step": 45540 }, { "epoch": 0.59, "learning_rate": 3.596786400491565e-05, "loss": 2.591, "step": 45545 }, { "epoch": 0.59, "learning_rate": 3.5958068382574075e-05, "loss": 2.5052, "step": 45550 }, { "epoch": 0.59, "learning_rate": 3.594827334529761e-05, "loss": 2.5037, "step": 45555 }, { "epoch": 0.59, "learning_rate": 3.593847889349441e-05, "loss": 2.5005, "step": 45560 }, { "epoch": 0.59, "learning_rate": 3.5928685027572514e-05, "loss": 2.454, "step": 45565 }, { "epoch": 0.59, "learning_rate": 3.591889174794003e-05, "loss": 2.6664, "step": 45570 }, { "epoch": 0.59, "learning_rate": 3.590909905500497e-05, "loss": 2.5406, "step": 45575 }, { "epoch": 0.59, "learning_rate": 3.589930694917537e-05, "loss": 2.6217, "step": 45580 }, { "epoch": 0.59, "learning_rate": 3.588951543085924e-05, "loss": 2.5417, "step": 45585 }, { "epoch": 0.59, "learning_rate": 3.5879724500464504e-05, "loss": 2.5132, "step": 45590 }, { "epoch": 0.59, "learning_rate": 3.586993415839915e-05, "loss": 2.4638, "step": 45595 }, { "epoch": 0.59, "learning_rate": 3.586014440507107e-05, "loss": 2.6547, "step": 45600 }, { "epoch": 0.59, "learning_rate": 3.5850355240888176e-05, "loss": 2.6864, "step": 45605 }, { "epoch": 0.59, "learning_rate": 3.5840566666258326e-05, "loss": 2.4333, "step": 45610 }, { "epoch": 0.59, "learning_rate": 3.583077868158936e-05, "loss": 2.4754, "step": 45615 }, { "epoch": 0.59, "learning_rate": 3.582099128728915e-05, "loss": 2.5233, "step": 45620 }, { "epoch": 0.59, "learning_rate": 3.5811204483765424e-05, "loss": 2.5354, "step": 45625 }, { "epoch": 0.59, "learning_rate": 3.580141827142602e-05, "loss": 2.4231, "step": 45630 }, { "epoch": 0.59, "learning_rate": 3.579163265067862e-05, "loss": 2.5409, "step": 45635 }, { "epoch": 0.59, "learning_rate": 3.578184762193099e-05, "loss": 2.4479, "step": 45640 }, { "epoch": 0.59, "learning_rate": 3.577206318559083e-05, "loss": 2.5239, "step": 45645 }, { "epoch": 0.59, "learning_rate": 3.576227934206579e-05, "loss": 2.5645, "step": 45650 }, { "epoch": 0.59, "learning_rate": 3.5752496091763554e-05, "loss": 2.4729, "step": 45655 }, { "epoch": 0.59, "learning_rate": 3.5742713435091716e-05, "loss": 2.5404, "step": 45660 }, { "epoch": 0.59, "learning_rate": 3.5732931372457886e-05, "loss": 2.5433, "step": 45665 }, { "epoch": 0.59, "learning_rate": 3.572314990426963e-05, "loss": 2.5802, "step": 45670 }, { "epoch": 0.59, "learning_rate": 3.571336903093451e-05, "loss": 2.5585, "step": 45675 }, { "epoch": 0.59, "learning_rate": 3.570358875286007e-05, "loss": 2.5434, "step": 45680 }, { "epoch": 0.59, "learning_rate": 3.569380907045378e-05, "loss": 2.6094, "step": 45685 }, { "epoch": 0.59, "learning_rate": 3.5684029984123134e-05, "loss": 2.5277, "step": 45690 }, { "epoch": 0.59, "learning_rate": 3.567425149427556e-05, "loss": 2.5246, "step": 45695 }, { "epoch": 0.59, "learning_rate": 3.5664473601318505e-05, "loss": 2.6234, "step": 45700 }, { "epoch": 0.59, "learning_rate": 3.5654696305659366e-05, "loss": 2.5504, "step": 45705 }, { "epoch": 0.59, "learning_rate": 3.564491960770551e-05, "loss": 2.6197, "step": 45710 }, { "epoch": 0.59, "learning_rate": 3.5635143507864324e-05, "loss": 2.5831, "step": 45715 }, { "epoch": 0.59, "learning_rate": 3.562536800654309e-05, "loss": 2.5667, "step": 45720 }, { "epoch": 0.59, "learning_rate": 3.5615593104149144e-05, "loss": 2.4871, "step": 45725 }, { "epoch": 0.59, "learning_rate": 3.560581880108973e-05, "loss": 2.5861, "step": 45730 }, { "epoch": 0.59, "learning_rate": 3.559604509777212e-05, "loss": 2.5977, "step": 45735 }, { "epoch": 0.59, "learning_rate": 3.558627199460355e-05, "loss": 2.5791, "step": 45740 }, { "epoch": 0.59, "learning_rate": 3.557649949199119e-05, "loss": 2.4738, "step": 45745 }, { "epoch": 0.59, "learning_rate": 3.556672759034227e-05, "loss": 2.4515, "step": 45750 }, { "epoch": 0.59, "learning_rate": 3.555695629006388e-05, "loss": 2.5894, "step": 45755 }, { "epoch": 0.59, "learning_rate": 3.554718559156319e-05, "loss": 2.3858, "step": 45760 }, { "epoch": 0.59, "learning_rate": 3.553741549524729e-05, "loss": 2.4275, "step": 45765 }, { "epoch": 0.59, "learning_rate": 3.552764600152323e-05, "loss": 2.5618, "step": 45770 }, { "epoch": 0.59, "learning_rate": 3.551787711079813e-05, "loss": 2.4991, "step": 45775 }, { "epoch": 0.59, "learning_rate": 3.5508108823478935e-05, "loss": 2.6275, "step": 45780 }, { "epoch": 0.59, "learning_rate": 3.5498341139972714e-05, "loss": 2.4018, "step": 45785 }, { "epoch": 0.59, "learning_rate": 3.548857406068639e-05, "loss": 2.3742, "step": 45790 }, { "epoch": 0.59, "learning_rate": 3.547880758602693e-05, "loss": 2.5784, "step": 45795 }, { "epoch": 0.59, "learning_rate": 3.5469041716401284e-05, "loss": 2.4157, "step": 45800 }, { "epoch": 0.59, "learning_rate": 3.545927645221633e-05, "loss": 2.6065, "step": 45805 }, { "epoch": 0.59, "learning_rate": 3.544951179387896e-05, "loss": 2.598, "step": 45810 }, { "epoch": 0.59, "learning_rate": 3.543974774179599e-05, "loss": 2.4822, "step": 45815 }, { "epoch": 0.59, "learning_rate": 3.5429984296374295e-05, "loss": 2.5784, "step": 45820 }, { "epoch": 0.59, "learning_rate": 3.542022145802063e-05, "loss": 2.3309, "step": 45825 }, { "epoch": 0.59, "learning_rate": 3.541045922714178e-05, "loss": 2.4781, "step": 45830 }, { "epoch": 0.59, "learning_rate": 3.5400697604144515e-05, "loss": 2.4773, "step": 45835 }, { "epoch": 0.59, "learning_rate": 3.539093658943552e-05, "loss": 2.431, "step": 45840 }, { "epoch": 0.59, "learning_rate": 3.5381176183421556e-05, "loss": 2.5035, "step": 45845 }, { "epoch": 0.6, "learning_rate": 3.537141638650923e-05, "loss": 2.4831, "step": 45850 }, { "epoch": 0.6, "learning_rate": 3.536165719910521e-05, "loss": 2.5883, "step": 45855 }, { "epoch": 0.6, "learning_rate": 3.535189862161614e-05, "loss": 2.5919, "step": 45860 }, { "epoch": 0.6, "learning_rate": 3.534214065444859e-05, "loss": 2.2724, "step": 45865 }, { "epoch": 0.6, "learning_rate": 3.533238329800916e-05, "loss": 2.5488, "step": 45870 }, { "epoch": 0.6, "learning_rate": 3.532262655270437e-05, "loss": 2.5574, "step": 45875 }, { "epoch": 0.6, "learning_rate": 3.531287041894076e-05, "loss": 2.6814, "step": 45880 }, { "epoch": 0.6, "learning_rate": 3.53031148971248e-05, "loss": 2.5424, "step": 45885 }, { "epoch": 0.6, "learning_rate": 3.5293359987662966e-05, "loss": 2.3699, "step": 45890 }, { "epoch": 0.6, "learning_rate": 3.528360569096172e-05, "loss": 2.3439, "step": 45895 }, { "epoch": 0.6, "learning_rate": 3.527385200742746e-05, "loss": 2.5948, "step": 45900 }, { "epoch": 0.6, "learning_rate": 3.5264098937466604e-05, "loss": 2.5618, "step": 45905 }, { "epoch": 0.6, "learning_rate": 3.525434648148549e-05, "loss": 2.5005, "step": 45910 }, { "epoch": 0.6, "learning_rate": 3.524459463989049e-05, "loss": 2.5773, "step": 45915 }, { "epoch": 0.6, "learning_rate": 3.523484341308789e-05, "loss": 2.6027, "step": 45920 }, { "epoch": 0.6, "learning_rate": 3.522509280148399e-05, "loss": 2.575, "step": 45925 }, { "epoch": 0.6, "learning_rate": 3.521534280548506e-05, "loss": 2.5987, "step": 45930 }, { "epoch": 0.6, "learning_rate": 3.520559342549734e-05, "loss": 2.502, "step": 45935 }, { "epoch": 0.6, "learning_rate": 3.5195844661927056e-05, "loss": 2.4966, "step": 45940 }, { "epoch": 0.6, "learning_rate": 3.518609651518036e-05, "loss": 2.395, "step": 45945 }, { "epoch": 0.6, "learning_rate": 3.517634898566343e-05, "loss": 2.611, "step": 45950 }, { "epoch": 0.6, "learning_rate": 3.5166602073782426e-05, "loss": 2.4634, "step": 45955 }, { "epoch": 0.6, "learning_rate": 3.515685577994343e-05, "loss": 2.4495, "step": 45960 }, { "epoch": 0.6, "learning_rate": 3.514711010455256e-05, "loss": 2.5762, "step": 45965 }, { "epoch": 0.6, "learning_rate": 3.513736504801582e-05, "loss": 2.6109, "step": 45970 }, { "epoch": 0.6, "learning_rate": 3.5127620610739304e-05, "loss": 2.5001, "step": 45975 }, { "epoch": 0.6, "learning_rate": 3.511787679312897e-05, "loss": 2.5645, "step": 45980 }, { "epoch": 0.6, "learning_rate": 3.510813359559082e-05, "loss": 2.5812, "step": 45985 }, { "epoch": 0.6, "learning_rate": 3.5098391018530816e-05, "loss": 2.5456, "step": 45990 }, { "epoch": 0.6, "learning_rate": 3.508864906235488e-05, "loss": 2.4443, "step": 45995 }, { "epoch": 0.6, "learning_rate": 3.507890772746894e-05, "loss": 2.62, "step": 46000 }, { "epoch": 0.6, "learning_rate": 3.506916701427883e-05, "loss": 2.5579, "step": 46005 }, { "epoch": 0.6, "learning_rate": 3.505942692319043e-05, "loss": 2.361, "step": 46010 }, { "epoch": 0.6, "learning_rate": 3.504968745460957e-05, "loss": 2.5794, "step": 46015 }, { "epoch": 0.6, "learning_rate": 3.503994860894203e-05, "loss": 2.4036, "step": 46020 }, { "epoch": 0.6, "learning_rate": 3.503021038659361e-05, "loss": 2.5557, "step": 46025 }, { "epoch": 0.6, "learning_rate": 3.5020472787970036e-05, "loss": 2.4642, "step": 46030 }, { "epoch": 0.6, "learning_rate": 3.5010735813477055e-05, "loss": 2.5983, "step": 46035 }, { "epoch": 0.6, "learning_rate": 3.500099946352033e-05, "loss": 2.574, "step": 46040 }, { "epoch": 0.6, "learning_rate": 3.499126373850556e-05, "loss": 2.4737, "step": 46045 }, { "epoch": 0.6, "learning_rate": 3.498152863883838e-05, "loss": 2.5576, "step": 46050 }, { "epoch": 0.6, "learning_rate": 3.49717941649244e-05, "loss": 2.5287, "step": 46055 }, { "epoch": 0.6, "learning_rate": 3.496206031716925e-05, "loss": 2.5771, "step": 46060 }, { "epoch": 0.6, "learning_rate": 3.4952327095978436e-05, "loss": 2.6138, "step": 46065 }, { "epoch": 0.6, "learning_rate": 3.4942594501757534e-05, "loss": 2.522, "step": 46070 }, { "epoch": 0.6, "learning_rate": 3.493286253491208e-05, "loss": 2.6456, "step": 46075 }, { "epoch": 0.6, "learning_rate": 3.492313119584751e-05, "loss": 2.6025, "step": 46080 }, { "epoch": 0.6, "learning_rate": 3.491340048496932e-05, "loss": 2.5893, "step": 46085 }, { "epoch": 0.6, "learning_rate": 3.490367040268293e-05, "loss": 2.4562, "step": 46090 }, { "epoch": 0.6, "learning_rate": 3.489394094939378e-05, "loss": 2.5836, "step": 46095 }, { "epoch": 0.6, "learning_rate": 3.48842121255072e-05, "loss": 2.6914, "step": 46100 }, { "epoch": 0.6, "learning_rate": 3.4874483931428586e-05, "loss": 2.5288, "step": 46105 }, { "epoch": 0.6, "learning_rate": 3.4864756367563264e-05, "loss": 2.6905, "step": 46110 }, { "epoch": 0.6, "learning_rate": 3.485502943431655e-05, "loss": 2.5792, "step": 46115 }, { "epoch": 0.6, "learning_rate": 3.484530313209369e-05, "loss": 2.5396, "step": 46120 }, { "epoch": 0.6, "learning_rate": 3.483557746129994e-05, "loss": 2.6889, "step": 46125 }, { "epoch": 0.6, "learning_rate": 3.4825852422340565e-05, "loss": 2.5413, "step": 46130 }, { "epoch": 0.6, "learning_rate": 3.481612801562072e-05, "loss": 2.5499, "step": 46135 }, { "epoch": 0.6, "learning_rate": 3.480640424154559e-05, "loss": 2.4474, "step": 46140 }, { "epoch": 0.6, "learning_rate": 3.479668110052035e-05, "loss": 2.546, "step": 46145 }, { "epoch": 0.6, "learning_rate": 3.478695859295007e-05, "loss": 2.5224, "step": 46150 }, { "epoch": 0.6, "learning_rate": 3.4777236719239895e-05, "loss": 2.6347, "step": 46155 }, { "epoch": 0.6, "learning_rate": 3.476751547979486e-05, "loss": 2.4706, "step": 46160 }, { "epoch": 0.6, "learning_rate": 3.475779487502e-05, "loss": 2.5826, "step": 46165 }, { "epoch": 0.6, "learning_rate": 3.474807490532037e-05, "loss": 2.3628, "step": 46170 }, { "epoch": 0.6, "learning_rate": 3.473835557110091e-05, "loss": 2.5261, "step": 46175 }, { "epoch": 0.6, "learning_rate": 3.472863687276662e-05, "loss": 2.5651, "step": 46180 }, { "epoch": 0.6, "learning_rate": 3.4718918810722406e-05, "loss": 2.5563, "step": 46185 }, { "epoch": 0.6, "learning_rate": 3.470920138537321e-05, "loss": 2.4916, "step": 46190 }, { "epoch": 0.6, "learning_rate": 3.469948459712388e-05, "loss": 2.5231, "step": 46195 }, { "epoch": 0.6, "learning_rate": 3.468976844637927e-05, "loss": 2.4913, "step": 46200 }, { "epoch": 0.6, "learning_rate": 3.4680052933544246e-05, "loss": 2.6175, "step": 46205 }, { "epoch": 0.6, "learning_rate": 3.467033805902358e-05, "loss": 2.5268, "step": 46210 }, { "epoch": 0.6, "learning_rate": 3.4660623823222066e-05, "loss": 2.6103, "step": 46215 }, { "epoch": 0.6, "learning_rate": 3.465091022654443e-05, "loss": 2.5401, "step": 46220 }, { "epoch": 0.6, "learning_rate": 3.464119726939541e-05, "loss": 2.5516, "step": 46225 }, { "epoch": 0.6, "learning_rate": 3.463148495217971e-05, "loss": 2.6056, "step": 46230 }, { "epoch": 0.6, "learning_rate": 3.4621773275301985e-05, "loss": 2.5446, "step": 46235 }, { "epoch": 0.6, "learning_rate": 3.4612062239166884e-05, "loss": 2.6261, "step": 46240 }, { "epoch": 0.6, "learning_rate": 3.460235184417901e-05, "loss": 2.6448, "step": 46245 }, { "epoch": 0.6, "learning_rate": 3.4592642090742985e-05, "loss": 2.5386, "step": 46250 }, { "epoch": 0.6, "learning_rate": 3.4582932979263326e-05, "loss": 2.5475, "step": 46255 }, { "epoch": 0.6, "learning_rate": 3.4573224510144595e-05, "loss": 2.5139, "step": 46260 }, { "epoch": 0.6, "learning_rate": 3.456351668379132e-05, "loss": 2.3605, "step": 46265 }, { "epoch": 0.6, "learning_rate": 3.4553809500607936e-05, "loss": 2.4791, "step": 46270 }, { "epoch": 0.6, "learning_rate": 3.454410296099894e-05, "loss": 2.587, "step": 46275 }, { "epoch": 0.6, "learning_rate": 3.453439706536873e-05, "loss": 2.5428, "step": 46280 }, { "epoch": 0.6, "learning_rate": 3.4524691814121726e-05, "loss": 2.5145, "step": 46285 }, { "epoch": 0.6, "learning_rate": 3.4514987207662306e-05, "loss": 2.5853, "step": 46290 }, { "epoch": 0.6, "learning_rate": 3.4505283246394807e-05, "loss": 2.3234, "step": 46295 }, { "epoch": 0.6, "learning_rate": 3.4495579930723555e-05, "loss": 2.5691, "step": 46300 }, { "epoch": 0.6, "learning_rate": 3.4485877261052835e-05, "loss": 2.5681, "step": 46305 }, { "epoch": 0.6, "learning_rate": 3.447617523778695e-05, "loss": 2.3899, "step": 46310 }, { "epoch": 0.6, "learning_rate": 3.4466473861330076e-05, "loss": 2.59, "step": 46315 }, { "epoch": 0.6, "learning_rate": 3.445677313208647e-05, "loss": 2.64, "step": 46320 }, { "epoch": 0.6, "learning_rate": 3.444707305046033e-05, "loss": 2.4366, "step": 46325 }, { "epoch": 0.6, "learning_rate": 3.4437373616855785e-05, "loss": 2.5603, "step": 46330 }, { "epoch": 0.6, "learning_rate": 3.442767483167698e-05, "loss": 2.6317, "step": 46335 }, { "epoch": 0.6, "learning_rate": 3.441797669532802e-05, "loss": 2.6672, "step": 46340 }, { "epoch": 0.6, "learning_rate": 3.4408279208212994e-05, "loss": 2.7115, "step": 46345 }, { "epoch": 0.6, "learning_rate": 3.439858237073593e-05, "loss": 2.542, "step": 46350 }, { "epoch": 0.6, "learning_rate": 3.4388886183300864e-05, "loss": 2.4008, "step": 46355 }, { "epoch": 0.6, "learning_rate": 3.4379190646311804e-05, "loss": 2.5871, "step": 46360 }, { "epoch": 0.6, "learning_rate": 3.4369495760172697e-05, "loss": 2.5725, "step": 46365 }, { "epoch": 0.6, "learning_rate": 3.435980152528751e-05, "loss": 2.5832, "step": 46370 }, { "epoch": 0.6, "learning_rate": 3.435010794206014e-05, "loss": 2.4396, "step": 46375 }, { "epoch": 0.6, "learning_rate": 3.434041501089448e-05, "loss": 2.4327, "step": 46380 }, { "epoch": 0.6, "learning_rate": 3.433072273219441e-05, "loss": 2.5463, "step": 46385 }, { "epoch": 0.6, "learning_rate": 3.432103110636374e-05, "loss": 2.6585, "step": 46390 }, { "epoch": 0.6, "learning_rate": 3.431134013380629e-05, "loss": 2.5111, "step": 46395 }, { "epoch": 0.6, "learning_rate": 3.430164981492583e-05, "loss": 2.386, "step": 46400 }, { "epoch": 0.6, "learning_rate": 3.4291960150126134e-05, "loss": 2.5974, "step": 46405 }, { "epoch": 0.6, "learning_rate": 3.4282271139810895e-05, "loss": 2.5823, "step": 46410 }, { "epoch": 0.6, "learning_rate": 3.4272582784383834e-05, "loss": 2.6288, "step": 46415 }, { "epoch": 0.6, "learning_rate": 3.4262895084248634e-05, "loss": 2.6006, "step": 46420 }, { "epoch": 0.6, "learning_rate": 3.42532080398089e-05, "loss": 2.551, "step": 46425 }, { "epoch": 0.6, "learning_rate": 3.424352165146828e-05, "loss": 2.5763, "step": 46430 }, { "epoch": 0.6, "learning_rate": 3.423383591963034e-05, "loss": 2.3834, "step": 46435 }, { "epoch": 0.6, "learning_rate": 3.422415084469866e-05, "loss": 2.5681, "step": 46440 }, { "epoch": 0.6, "learning_rate": 3.4214466427076786e-05, "loss": 2.46, "step": 46445 }, { "epoch": 0.6, "learning_rate": 3.420478266716818e-05, "loss": 2.56, "step": 46450 }, { "epoch": 0.6, "learning_rate": 3.419509956537638e-05, "loss": 2.5669, "step": 46455 }, { "epoch": 0.6, "learning_rate": 3.418541712210478e-05, "loss": 2.455, "step": 46460 }, { "epoch": 0.6, "learning_rate": 3.417573533775684e-05, "loss": 2.6135, "step": 46465 }, { "epoch": 0.6, "learning_rate": 3.416605421273594e-05, "loss": 2.6035, "step": 46470 }, { "epoch": 0.6, "learning_rate": 3.415637374744546e-05, "loss": 2.3932, "step": 46475 }, { "epoch": 0.6, "learning_rate": 3.414669394228875e-05, "loss": 2.501, "step": 46480 }, { "epoch": 0.6, "learning_rate": 3.413701479766911e-05, "loss": 2.6801, "step": 46485 }, { "epoch": 0.6, "learning_rate": 3.4127336313989834e-05, "loss": 2.4097, "step": 46490 }, { "epoch": 0.6, "learning_rate": 3.411765849165417e-05, "loss": 2.4999, "step": 46495 }, { "epoch": 0.6, "learning_rate": 3.4107981331065356e-05, "loss": 2.501, "step": 46500 }, { "epoch": 0.6, "learning_rate": 3.4098304832626614e-05, "loss": 2.4582, "step": 46505 }, { "epoch": 0.6, "learning_rate": 3.40886289967411e-05, "loss": 2.5096, "step": 46510 }, { "epoch": 0.6, "learning_rate": 3.407895382381198e-05, "loss": 2.5777, "step": 46515 }, { "epoch": 0.6, "learning_rate": 3.406927931424235e-05, "loss": 2.57, "step": 46520 }, { "epoch": 0.6, "learning_rate": 3.405960546843533e-05, "loss": 2.623, "step": 46525 }, { "epoch": 0.6, "learning_rate": 3.404993228679396e-05, "loss": 2.5256, "step": 46530 }, { "epoch": 0.6, "learning_rate": 3.40402597697213e-05, "loss": 2.4455, "step": 46535 }, { "epoch": 0.6, "learning_rate": 3.4030587917620374e-05, "loss": 2.5221, "step": 46540 }, { "epoch": 0.6, "learning_rate": 3.402091673089412e-05, "loss": 2.5802, "step": 46545 }, { "epoch": 0.6, "learning_rate": 3.401124620994555e-05, "loss": 2.4779, "step": 46550 }, { "epoch": 0.6, "learning_rate": 3.4001576355177534e-05, "loss": 2.406, "step": 46555 }, { "epoch": 0.6, "learning_rate": 3.399190716699301e-05, "loss": 2.4698, "step": 46560 }, { "epoch": 0.6, "learning_rate": 3.398223864579483e-05, "loss": 2.6146, "step": 46565 }, { "epoch": 0.6, "learning_rate": 3.397257079198586e-05, "loss": 2.6579, "step": 46570 }, { "epoch": 0.6, "learning_rate": 3.396290360596891e-05, "loss": 2.5779, "step": 46575 }, { "epoch": 0.6, "learning_rate": 3.395323708814675e-05, "loss": 2.5123, "step": 46580 }, { "epoch": 0.6, "learning_rate": 3.394357123892217e-05, "loss": 2.4408, "step": 46585 }, { "epoch": 0.6, "learning_rate": 3.393390605869787e-05, "loss": 2.3888, "step": 46590 }, { "epoch": 0.6, "learning_rate": 3.392424154787658e-05, "loss": 2.5544, "step": 46595 }, { "epoch": 0.6, "learning_rate": 3.391457770686098e-05, "loss": 2.4719, "step": 46600 }, { "epoch": 0.6, "learning_rate": 3.39049145360537e-05, "loss": 2.4834, "step": 46605 }, { "epoch": 0.6, "learning_rate": 3.3895252035857394e-05, "loss": 2.5407, "step": 46610 }, { "epoch": 0.6, "learning_rate": 3.388559020667461e-05, "loss": 2.6044, "step": 46615 }, { "epoch": 0.61, "learning_rate": 3.3875929048907945e-05, "loss": 2.5442, "step": 46620 }, { "epoch": 0.61, "learning_rate": 3.386626856295993e-05, "loss": 2.6129, "step": 46625 }, { "epoch": 0.61, "learning_rate": 3.385660874923305e-05, "loss": 2.4157, "step": 46630 }, { "epoch": 0.61, "learning_rate": 3.384694960812985e-05, "loss": 2.5149, "step": 46635 }, { "epoch": 0.61, "learning_rate": 3.383729114005272e-05, "loss": 2.4302, "step": 46640 }, { "epoch": 0.61, "learning_rate": 3.3827633345404117e-05, "loss": 2.5424, "step": 46645 }, { "epoch": 0.61, "learning_rate": 3.3817976224586424e-05, "loss": 2.4683, "step": 46650 }, { "epoch": 0.61, "learning_rate": 3.380831977800202e-05, "loss": 2.5845, "step": 46655 }, { "epoch": 0.61, "learning_rate": 3.379866400605325e-05, "loss": 2.503, "step": 46660 }, { "epoch": 0.61, "learning_rate": 3.3789008909142404e-05, "loss": 2.4503, "step": 46665 }, { "epoch": 0.61, "learning_rate": 3.377935448767181e-05, "loss": 2.4523, "step": 46670 }, { "epoch": 0.61, "learning_rate": 3.376970074204368e-05, "loss": 2.5303, "step": 46675 }, { "epoch": 0.61, "learning_rate": 3.376004767266027e-05, "loss": 2.5727, "step": 46680 }, { "epoch": 0.61, "learning_rate": 3.375039527992376e-05, "loss": 2.4962, "step": 46685 }, { "epoch": 0.61, "learning_rate": 3.374074356423634e-05, "loss": 2.4459, "step": 46690 }, { "epoch": 0.61, "learning_rate": 3.373109252600016e-05, "loss": 2.6119, "step": 46695 }, { "epoch": 0.61, "learning_rate": 3.372144216561732e-05, "loss": 2.4879, "step": 46700 }, { "epoch": 0.61, "learning_rate": 3.3711792483489926e-05, "loss": 2.588, "step": 46705 }, { "epoch": 0.61, "learning_rate": 3.370214348002e-05, "loss": 2.5129, "step": 46710 }, { "epoch": 0.61, "learning_rate": 3.3692495155609605e-05, "loss": 2.3996, "step": 46715 }, { "epoch": 0.61, "learning_rate": 3.3682847510660745e-05, "loss": 2.4828, "step": 46720 }, { "epoch": 0.61, "learning_rate": 3.367320054557538e-05, "loss": 2.6807, "step": 46725 }, { "epoch": 0.61, "learning_rate": 3.3663554260755476e-05, "loss": 2.3346, "step": 46730 }, { "epoch": 0.61, "learning_rate": 3.365390865660292e-05, "loss": 2.585, "step": 46735 }, { "epoch": 0.61, "learning_rate": 3.364426373351964e-05, "loss": 2.5222, "step": 46740 }, { "epoch": 0.61, "learning_rate": 3.363461949190746e-05, "loss": 2.5377, "step": 46745 }, { "epoch": 0.61, "learning_rate": 3.3624975932168224e-05, "loss": 2.6176, "step": 46750 }, { "epoch": 0.61, "learning_rate": 3.361533305470376e-05, "loss": 2.754, "step": 46755 }, { "epoch": 0.61, "learning_rate": 3.3605690859915805e-05, "loss": 2.5754, "step": 46760 }, { "epoch": 0.61, "learning_rate": 3.359604934820616e-05, "loss": 2.5857, "step": 46765 }, { "epoch": 0.61, "learning_rate": 3.358640851997649e-05, "loss": 2.441, "step": 46770 }, { "epoch": 0.61, "learning_rate": 3.357676837562851e-05, "loss": 2.5098, "step": 46775 }, { "epoch": 0.61, "learning_rate": 3.356712891556387e-05, "loss": 2.615, "step": 46780 }, { "epoch": 0.61, "learning_rate": 3.355749014018421e-05, "loss": 2.5013, "step": 46785 }, { "epoch": 0.61, "learning_rate": 3.354785204989117e-05, "loss": 2.5589, "step": 46790 }, { "epoch": 0.61, "learning_rate": 3.353821464508626e-05, "loss": 2.4832, "step": 46795 }, { "epoch": 0.61, "learning_rate": 3.35285779261711e-05, "loss": 2.5358, "step": 46800 }, { "epoch": 0.61, "learning_rate": 3.351894189354714e-05, "loss": 2.49, "step": 46805 }, { "epoch": 0.61, "learning_rate": 3.3509306547615905e-05, "loss": 2.5229, "step": 46810 }, { "epoch": 0.61, "learning_rate": 3.349967188877887e-05, "loss": 2.5811, "step": 46815 }, { "epoch": 0.61, "learning_rate": 3.349003791743744e-05, "loss": 2.4143, "step": 46820 }, { "epoch": 0.61, "learning_rate": 3.348040463399306e-05, "loss": 2.7187, "step": 46825 }, { "epoch": 0.61, "learning_rate": 3.347077203884705e-05, "loss": 2.3824, "step": 46830 }, { "epoch": 0.61, "learning_rate": 3.3461140132400804e-05, "loss": 2.6382, "step": 46835 }, { "epoch": 0.61, "learning_rate": 3.345150891505562e-05, "loss": 2.6039, "step": 46840 }, { "epoch": 0.61, "learning_rate": 3.3441878387212786e-05, "loss": 2.5079, "step": 46845 }, { "epoch": 0.61, "learning_rate": 3.343224854927358e-05, "loss": 2.4146, "step": 46850 }, { "epoch": 0.61, "learning_rate": 3.342261940163921e-05, "loss": 2.4872, "step": 46855 }, { "epoch": 0.61, "learning_rate": 3.341299094471092e-05, "loss": 2.4902, "step": 46860 }, { "epoch": 0.61, "learning_rate": 3.340336317888983e-05, "loss": 2.4975, "step": 46865 }, { "epoch": 0.61, "learning_rate": 3.339373610457713e-05, "loss": 2.6009, "step": 46870 }, { "epoch": 0.61, "learning_rate": 3.338410972217393e-05, "loss": 2.3369, "step": 46875 }, { "epoch": 0.61, "learning_rate": 3.33744840320813e-05, "loss": 2.6365, "step": 46880 }, { "epoch": 0.61, "learning_rate": 3.3364859034700335e-05, "loss": 2.4829, "step": 46885 }, { "epoch": 0.61, "learning_rate": 3.3355234730432027e-05, "loss": 2.4788, "step": 46890 }, { "epoch": 0.61, "learning_rate": 3.334561111967741e-05, "loss": 2.6256, "step": 46895 }, { "epoch": 0.61, "learning_rate": 3.333598820283742e-05, "loss": 2.5875, "step": 46900 }, { "epoch": 0.61, "learning_rate": 3.332636598031302e-05, "loss": 2.6626, "step": 46905 }, { "epoch": 0.61, "learning_rate": 3.331674445250515e-05, "loss": 2.5294, "step": 46910 }, { "epoch": 0.61, "learning_rate": 3.330712361981466e-05, "loss": 2.5128, "step": 46915 }, { "epoch": 0.61, "learning_rate": 3.329750348264244e-05, "loss": 2.4466, "step": 46920 }, { "epoch": 0.61, "learning_rate": 3.328788404138928e-05, "loss": 2.6497, "step": 46925 }, { "epoch": 0.61, "learning_rate": 3.327826529645601e-05, "loss": 2.5797, "step": 46930 }, { "epoch": 0.61, "learning_rate": 3.326864724824339e-05, "loss": 2.4361, "step": 46935 }, { "epoch": 0.61, "learning_rate": 3.325902989715217e-05, "loss": 2.5193, "step": 46940 }, { "epoch": 0.61, "learning_rate": 3.324941324358305e-05, "loss": 2.4455, "step": 46945 }, { "epoch": 0.61, "learning_rate": 3.323979728793671e-05, "loss": 2.616, "step": 46950 }, { "epoch": 0.61, "learning_rate": 3.323018203061384e-05, "loss": 2.5378, "step": 46955 }, { "epoch": 0.61, "learning_rate": 3.322056747201501e-05, "loss": 2.5704, "step": 46960 }, { "epoch": 0.61, "learning_rate": 3.321095361254084e-05, "loss": 2.4625, "step": 46965 }, { "epoch": 0.61, "learning_rate": 3.320134045259192e-05, "loss": 2.5213, "step": 46970 }, { "epoch": 0.61, "learning_rate": 3.319172799256876e-05, "loss": 2.4357, "step": 46975 }, { "epoch": 0.61, "learning_rate": 3.3182116232871894e-05, "loss": 2.6105, "step": 46980 }, { "epoch": 0.61, "learning_rate": 3.317250517390177e-05, "loss": 2.6241, "step": 46985 }, { "epoch": 0.61, "learning_rate": 3.316289481605887e-05, "loss": 2.3802, "step": 46990 }, { "epoch": 0.61, "learning_rate": 3.315328515974357e-05, "loss": 2.622, "step": 46995 }, { "epoch": 0.61, "learning_rate": 3.31436762053563e-05, "loss": 2.5372, "step": 47000 }, { "epoch": 0.61, "learning_rate": 3.313406795329741e-05, "loss": 2.5627, "step": 47005 }, { "epoch": 0.61, "learning_rate": 3.312446040396724e-05, "loss": 2.5917, "step": 47010 }, { "epoch": 0.61, "learning_rate": 3.311485355776611e-05, "loss": 2.5352, "step": 47015 }, { "epoch": 0.61, "learning_rate": 3.310524741509425e-05, "loss": 2.4212, "step": 47020 }, { "epoch": 0.61, "learning_rate": 3.3095641976351935e-05, "loss": 2.437, "step": 47025 }, { "epoch": 0.61, "learning_rate": 3.308603724193937e-05, "loss": 2.5467, "step": 47030 }, { "epoch": 0.61, "learning_rate": 3.3076433212256764e-05, "loss": 2.5016, "step": 47035 }, { "epoch": 0.61, "learning_rate": 3.306682988770426e-05, "loss": 2.5831, "step": 47040 }, { "epoch": 0.61, "learning_rate": 3.305722726868197e-05, "loss": 2.6389, "step": 47045 }, { "epoch": 0.61, "learning_rate": 3.304762535559003e-05, "loss": 2.5957, "step": 47050 }, { "epoch": 0.61, "learning_rate": 3.303802414882846e-05, "loss": 2.6776, "step": 47055 }, { "epoch": 0.61, "learning_rate": 3.302842364879733e-05, "loss": 2.4665, "step": 47060 }, { "epoch": 0.61, "learning_rate": 3.301882385589665e-05, "loss": 2.5927, "step": 47065 }, { "epoch": 0.61, "learning_rate": 3.300922477052639e-05, "loss": 2.4518, "step": 47070 }, { "epoch": 0.61, "learning_rate": 3.2999626393086537e-05, "loss": 2.6246, "step": 47075 }, { "epoch": 0.61, "learning_rate": 3.299002872397696e-05, "loss": 2.5006, "step": 47080 }, { "epoch": 0.61, "learning_rate": 3.298043176359758e-05, "loss": 2.6734, "step": 47085 }, { "epoch": 0.61, "learning_rate": 3.297083551234827e-05, "loss": 2.5288, "step": 47090 }, { "epoch": 0.61, "learning_rate": 3.296123997062883e-05, "loss": 2.5251, "step": 47095 }, { "epoch": 0.61, "learning_rate": 3.2951645138839096e-05, "loss": 2.476, "step": 47100 }, { "epoch": 0.61, "learning_rate": 3.2942051017378816e-05, "loss": 2.5137, "step": 47105 }, { "epoch": 0.61, "learning_rate": 3.293245760664777e-05, "loss": 2.4883, "step": 47110 }, { "epoch": 0.61, "learning_rate": 3.292286490704562e-05, "loss": 2.5838, "step": 47115 }, { "epoch": 0.61, "learning_rate": 3.29132729189721e-05, "loss": 2.5995, "step": 47120 }, { "epoch": 0.61, "learning_rate": 3.2903681642826845e-05, "loss": 2.473, "step": 47125 }, { "epoch": 0.61, "learning_rate": 3.289409107900948e-05, "loss": 2.3668, "step": 47130 }, { "epoch": 0.61, "learning_rate": 3.288450122791962e-05, "loss": 2.4777, "step": 47135 }, { "epoch": 0.61, "learning_rate": 3.28749120899568e-05, "loss": 2.4746, "step": 47140 }, { "epoch": 0.61, "learning_rate": 3.286532366552058e-05, "loss": 2.5931, "step": 47145 }, { "epoch": 0.61, "learning_rate": 3.285573595501047e-05, "loss": 2.4229, "step": 47150 }, { "epoch": 0.61, "learning_rate": 3.2846148958825916e-05, "loss": 2.4015, "step": 47155 }, { "epoch": 0.61, "learning_rate": 3.283656267736641e-05, "loss": 2.5455, "step": 47160 }, { "epoch": 0.61, "learning_rate": 3.2826977111031335e-05, "loss": 2.5861, "step": 47165 }, { "epoch": 0.61, "learning_rate": 3.28173922602201e-05, "loss": 2.5742, "step": 47170 }, { "epoch": 0.61, "learning_rate": 3.2807808125332046e-05, "loss": 2.5902, "step": 47175 }, { "epoch": 0.61, "learning_rate": 3.279822470676651e-05, "loss": 2.51, "step": 47180 }, { "epoch": 0.61, "learning_rate": 3.278864200492281e-05, "loss": 2.5076, "step": 47185 }, { "epoch": 0.61, "learning_rate": 3.277906002020017e-05, "loss": 2.5149, "step": 47190 }, { "epoch": 0.61, "learning_rate": 3.2769478752997875e-05, "loss": 2.5504, "step": 47195 }, { "epoch": 0.61, "learning_rate": 3.27598982037151e-05, "loss": 2.5418, "step": 47200 }, { "epoch": 0.61, "learning_rate": 3.275031837275105e-05, "loss": 2.5262, "step": 47205 }, { "epoch": 0.61, "learning_rate": 3.274073926050485e-05, "loss": 2.5419, "step": 47210 }, { "epoch": 0.61, "learning_rate": 3.273116086737563e-05, "loss": 2.5206, "step": 47215 }, { "epoch": 0.61, "learning_rate": 3.2721583193762495e-05, "loss": 2.4749, "step": 47220 }, { "epoch": 0.61, "learning_rate": 3.2712006240064476e-05, "loss": 2.4265, "step": 47225 }, { "epoch": 0.61, "learning_rate": 3.270243000668063e-05, "loss": 2.4442, "step": 47230 }, { "epoch": 0.61, "learning_rate": 3.269285449400993e-05, "loss": 2.4606, "step": 47235 }, { "epoch": 0.61, "learning_rate": 3.268327970245136e-05, "loss": 2.5011, "step": 47240 }, { "epoch": 0.61, "learning_rate": 3.267370563240387e-05, "loss": 2.5917, "step": 47245 }, { "epoch": 0.61, "learning_rate": 3.2664132284266336e-05, "loss": 2.5139, "step": 47250 }, { "epoch": 0.61, "learning_rate": 3.265455965843767e-05, "loss": 2.435, "step": 47255 }, { "epoch": 0.61, "learning_rate": 3.2644987755316695e-05, "loss": 2.5491, "step": 47260 }, { "epoch": 0.61, "learning_rate": 3.263541657530227e-05, "loss": 2.4859, "step": 47265 }, { "epoch": 0.61, "learning_rate": 3.2625846118793126e-05, "loss": 2.5545, "step": 47270 }, { "epoch": 0.61, "learning_rate": 3.261627638618806e-05, "loss": 2.5189, "step": 47275 }, { "epoch": 0.61, "learning_rate": 3.2606707377885806e-05, "loss": 2.4524, "step": 47280 }, { "epoch": 0.61, "learning_rate": 3.259713909428503e-05, "loss": 2.6012, "step": 47285 }, { "epoch": 0.61, "learning_rate": 3.2587571535784436e-05, "loss": 2.6411, "step": 47290 }, { "epoch": 0.61, "learning_rate": 3.257800470278262e-05, "loss": 2.5901, "step": 47295 }, { "epoch": 0.61, "learning_rate": 3.2568438595678226e-05, "loss": 2.6216, "step": 47300 }, { "epoch": 0.61, "learning_rate": 3.255887321486983e-05, "loss": 2.4472, "step": 47305 }, { "epoch": 0.61, "learning_rate": 3.2549308560755956e-05, "loss": 2.5893, "step": 47310 }, { "epoch": 0.61, "learning_rate": 3.253974463373513e-05, "loss": 2.5224, "step": 47315 }, { "epoch": 0.61, "learning_rate": 3.253018143420585e-05, "loss": 2.5591, "step": 47320 }, { "epoch": 0.61, "learning_rate": 3.252061896256657e-05, "loss": 2.4904, "step": 47325 }, { "epoch": 0.61, "learning_rate": 3.25110572192157e-05, "loss": 2.4553, "step": 47330 }, { "epoch": 0.61, "learning_rate": 3.250149620455164e-05, "loss": 2.4851, "step": 47335 }, { "epoch": 0.61, "learning_rate": 3.249193591897278e-05, "loss": 2.5083, "step": 47340 }, { "epoch": 0.61, "learning_rate": 3.248237636287741e-05, "loss": 2.5823, "step": 47345 }, { "epoch": 0.61, "learning_rate": 3.247281753666388e-05, "loss": 2.4896, "step": 47350 }, { "epoch": 0.61, "learning_rate": 3.246325944073043e-05, "loss": 2.5444, "step": 47355 }, { "epoch": 0.61, "learning_rate": 3.2453702075475314e-05, "loss": 2.5211, "step": 47360 }, { "epoch": 0.61, "learning_rate": 3.244414544129677e-05, "loss": 2.5159, "step": 47365 }, { "epoch": 0.61, "learning_rate": 3.243458953859293e-05, "loss": 2.4357, "step": 47370 }, { "epoch": 0.61, "learning_rate": 3.242503436776201e-05, "loss": 2.5715, "step": 47375 }, { "epoch": 0.61, "learning_rate": 3.2415479929202066e-05, "loss": 2.5416, "step": 47380 }, { "epoch": 0.61, "learning_rate": 3.2405926223311236e-05, "loss": 2.4194, "step": 47385 }, { "epoch": 0.62, "learning_rate": 3.2396373250487544e-05, "loss": 2.5486, "step": 47390 }, { "epoch": 0.62, "learning_rate": 3.238682101112904e-05, "loss": 2.5958, "step": 47395 }, { "epoch": 0.62, "learning_rate": 3.237726950563376e-05, "loss": 2.5339, "step": 47400 }, { "epoch": 0.62, "learning_rate": 3.2367718734399596e-05, "loss": 2.5354, "step": 47405 }, { "epoch": 0.62, "learning_rate": 3.2358168697824553e-05, "loss": 2.372, "step": 47410 }, { "epoch": 0.62, "learning_rate": 3.23486193963065e-05, "loss": 2.5725, "step": 47415 }, { "epoch": 0.62, "learning_rate": 3.2339070830243346e-05, "loss": 2.5516, "step": 47420 }, { "epoch": 0.62, "learning_rate": 3.23295230000329e-05, "loss": 2.4576, "step": 47425 }, { "epoch": 0.62, "learning_rate": 3.231997590607299e-05, "loss": 2.5071, "step": 47430 }, { "epoch": 0.62, "learning_rate": 3.2310429548761436e-05, "loss": 2.5221, "step": 47435 }, { "epoch": 0.62, "learning_rate": 3.2300883928495936e-05, "loss": 2.6712, "step": 47440 }, { "epoch": 0.62, "learning_rate": 3.229133904567425e-05, "loss": 2.5965, "step": 47445 }, { "epoch": 0.62, "learning_rate": 3.228179490069406e-05, "loss": 2.5667, "step": 47450 }, { "epoch": 0.62, "learning_rate": 3.227225149395303e-05, "loss": 2.4081, "step": 47455 }, { "epoch": 0.62, "learning_rate": 3.226270882584881e-05, "loss": 2.6451, "step": 47460 }, { "epoch": 0.62, "learning_rate": 3.225316689677896e-05, "loss": 2.571, "step": 47465 }, { "epoch": 0.62, "learning_rate": 3.22436257071411e-05, "loss": 2.516, "step": 47470 }, { "epoch": 0.62, "learning_rate": 3.223408525733271e-05, "loss": 2.585, "step": 47475 }, { "epoch": 0.62, "learning_rate": 3.222454554775135e-05, "loss": 2.3366, "step": 47480 }, { "epoch": 0.62, "learning_rate": 3.221500657879447e-05, "loss": 2.4704, "step": 47485 }, { "epoch": 0.62, "learning_rate": 3.220546835085952e-05, "loss": 2.4882, "step": 47490 }, { "epoch": 0.62, "learning_rate": 3.2195930864343946e-05, "loss": 2.6204, "step": 47495 }, { "epoch": 0.62, "learning_rate": 3.218639411964508e-05, "loss": 2.576, "step": 47500 }, { "epoch": 0.62, "learning_rate": 3.2176858117160315e-05, "loss": 2.5349, "step": 47505 }, { "epoch": 0.62, "learning_rate": 3.216732285728695e-05, "loss": 2.5552, "step": 47510 }, { "epoch": 0.62, "learning_rate": 3.215778834042229e-05, "loss": 2.5088, "step": 47515 }, { "epoch": 0.62, "learning_rate": 3.2148254566963624e-05, "loss": 2.5159, "step": 47520 }, { "epoch": 0.62, "learning_rate": 3.213872153730812e-05, "loss": 2.4657, "step": 47525 }, { "epoch": 0.62, "learning_rate": 3.2129189251853037e-05, "loss": 2.5319, "step": 47530 }, { "epoch": 0.62, "learning_rate": 3.21196577109955e-05, "loss": 2.5368, "step": 47535 }, { "epoch": 0.62, "learning_rate": 3.211012691513267e-05, "loss": 2.5455, "step": 47540 }, { "epoch": 0.62, "learning_rate": 3.210059686466163e-05, "loss": 2.5609, "step": 47545 }, { "epoch": 0.62, "learning_rate": 3.209106755997947e-05, "loss": 2.5944, "step": 47550 }, { "epoch": 0.62, "learning_rate": 3.2081539001483264e-05, "loss": 2.5337, "step": 47555 }, { "epoch": 0.62, "learning_rate": 3.2072011189569976e-05, "loss": 2.5019, "step": 47560 }, { "epoch": 0.62, "learning_rate": 3.206248412463662e-05, "loss": 2.5295, "step": 47565 }, { "epoch": 0.62, "learning_rate": 3.205295780708012e-05, "loss": 2.5863, "step": 47570 }, { "epoch": 0.62, "learning_rate": 3.20434322372974e-05, "loss": 2.5512, "step": 47575 }, { "epoch": 0.62, "learning_rate": 3.2033907415685374e-05, "loss": 2.6226, "step": 47580 }, { "epoch": 0.62, "learning_rate": 3.202438334264087e-05, "loss": 2.4879, "step": 47585 }, { "epoch": 0.62, "learning_rate": 3.2014860018560756e-05, "loss": 2.4414, "step": 47590 }, { "epoch": 0.62, "learning_rate": 3.2005337443841766e-05, "loss": 2.4702, "step": 47595 }, { "epoch": 0.62, "learning_rate": 3.199581561888071e-05, "loss": 2.6102, "step": 47600 }, { "epoch": 0.62, "learning_rate": 3.19862945440743e-05, "loss": 2.4286, "step": 47605 }, { "epoch": 0.62, "learning_rate": 3.197677421981924e-05, "loss": 2.4703, "step": 47610 }, { "epoch": 0.62, "learning_rate": 3.196725464651221e-05, "loss": 2.5134, "step": 47615 }, { "epoch": 0.62, "learning_rate": 3.1957735824549836e-05, "loss": 2.6145, "step": 47620 }, { "epoch": 0.62, "learning_rate": 3.194821775432875e-05, "loss": 2.5254, "step": 47625 }, { "epoch": 0.62, "learning_rate": 3.193870043624548e-05, "loss": 2.4973, "step": 47630 }, { "epoch": 0.62, "learning_rate": 3.192918387069661e-05, "loss": 2.51, "step": 47635 }, { "epoch": 0.62, "learning_rate": 3.191966805807863e-05, "loss": 2.5557, "step": 47640 }, { "epoch": 0.62, "learning_rate": 3.1910152998788034e-05, "loss": 2.488, "step": 47645 }, { "epoch": 0.62, "learning_rate": 3.190063869322129e-05, "loss": 2.5357, "step": 47650 }, { "epoch": 0.62, "learning_rate": 3.189112514177478e-05, "loss": 2.4366, "step": 47655 }, { "epoch": 0.62, "learning_rate": 3.1881612344844924e-05, "loss": 2.624, "step": 47660 }, { "epoch": 0.62, "learning_rate": 3.187210030282806e-05, "loss": 2.5296, "step": 47665 }, { "epoch": 0.62, "learning_rate": 3.1862589016120506e-05, "loss": 2.4462, "step": 47670 }, { "epoch": 0.62, "learning_rate": 3.185307848511858e-05, "loss": 2.521, "step": 47675 }, { "epoch": 0.62, "learning_rate": 3.184356871021852e-05, "loss": 2.577, "step": 47680 }, { "epoch": 0.62, "learning_rate": 3.1834059691816574e-05, "loss": 2.567, "step": 47685 }, { "epoch": 0.62, "learning_rate": 3.1824551430308925e-05, "loss": 2.4875, "step": 47690 }, { "epoch": 0.62, "learning_rate": 3.181504392609176e-05, "loss": 2.4128, "step": 47695 }, { "epoch": 0.62, "learning_rate": 3.1805537179561187e-05, "loss": 2.5672, "step": 47700 }, { "epoch": 0.62, "learning_rate": 3.179603119111332e-05, "loss": 2.4888, "step": 47705 }, { "epoch": 0.62, "learning_rate": 3.1786525961144263e-05, "loss": 2.5272, "step": 47710 }, { "epoch": 0.62, "learning_rate": 3.177702149005001e-05, "loss": 2.4199, "step": 47715 }, { "epoch": 0.62, "learning_rate": 3.176751777822662e-05, "loss": 2.6203, "step": 47720 }, { "epoch": 0.62, "learning_rate": 3.175801482607001e-05, "loss": 2.4615, "step": 47725 }, { "epoch": 0.62, "learning_rate": 3.174851263397616e-05, "loss": 2.6572, "step": 47730 }, { "epoch": 0.62, "learning_rate": 3.1739011202341e-05, "loss": 2.5942, "step": 47735 }, { "epoch": 0.62, "learning_rate": 3.172951053156037e-05, "loss": 2.6331, "step": 47740 }, { "epoch": 0.62, "learning_rate": 3.172001062203017e-05, "loss": 2.4267, "step": 47745 }, { "epoch": 0.62, "learning_rate": 3.171051147414618e-05, "loss": 2.413, "step": 47750 }, { "epoch": 0.62, "learning_rate": 3.170101308830421e-05, "loss": 2.3901, "step": 47755 }, { "epoch": 0.62, "learning_rate": 3.1691515464900004e-05, "loss": 2.5763, "step": 47760 }, { "epoch": 0.62, "learning_rate": 3.1682018604329285e-05, "loss": 2.5967, "step": 47765 }, { "epoch": 0.62, "learning_rate": 3.1672522506987754e-05, "loss": 2.54, "step": 47770 }, { "epoch": 0.62, "learning_rate": 3.166302717327106e-05, "loss": 2.5603, "step": 47775 }, { "epoch": 0.62, "learning_rate": 3.165353260357485e-05, "loss": 2.5741, "step": 47780 }, { "epoch": 0.62, "learning_rate": 3.1644038798294707e-05, "loss": 2.4175, "step": 47785 }, { "epoch": 0.62, "learning_rate": 3.163454575782618e-05, "loss": 2.5793, "step": 47790 }, { "epoch": 0.62, "learning_rate": 3.162505348256485e-05, "loss": 2.4736, "step": 47795 }, { "epoch": 0.62, "learning_rate": 3.161556197290616e-05, "loss": 2.6232, "step": 47800 }, { "epoch": 0.62, "learning_rate": 3.1606071229245635e-05, "loss": 2.5615, "step": 47805 }, { "epoch": 0.62, "learning_rate": 3.1596581251978664e-05, "loss": 2.5703, "step": 47810 }, { "epoch": 0.62, "learning_rate": 3.158709204150069e-05, "loss": 2.5599, "step": 47815 }, { "epoch": 0.62, "learning_rate": 3.157760359820705e-05, "loss": 2.5474, "step": 47820 }, { "epoch": 0.62, "learning_rate": 3.156811592249311e-05, "loss": 2.6082, "step": 47825 }, { "epoch": 0.62, "learning_rate": 3.1558629014754175e-05, "loss": 2.7077, "step": 47830 }, { "epoch": 0.62, "learning_rate": 3.154914287538552e-05, "loss": 2.6877, "step": 47835 }, { "epoch": 0.62, "learning_rate": 3.153965750478241e-05, "loss": 2.6164, "step": 47840 }, { "epoch": 0.62, "learning_rate": 3.153017290334001e-05, "loss": 2.4715, "step": 47845 }, { "epoch": 0.62, "learning_rate": 3.152068907145356e-05, "loss": 2.4258, "step": 47850 }, { "epoch": 0.62, "learning_rate": 3.151120600951816e-05, "loss": 2.4703, "step": 47855 }, { "epoch": 0.62, "learning_rate": 3.150172371792896e-05, "loss": 2.5686, "step": 47860 }, { "epoch": 0.62, "learning_rate": 3.149224219708104e-05, "loss": 2.6129, "step": 47865 }, { "epoch": 0.62, "learning_rate": 3.1482761447369426e-05, "loss": 2.4888, "step": 47870 }, { "epoch": 0.62, "learning_rate": 3.147328146918918e-05, "loss": 2.5174, "step": 47875 }, { "epoch": 0.62, "learning_rate": 3.146380226293525e-05, "loss": 2.5828, "step": 47880 }, { "epoch": 0.62, "learning_rate": 3.145432382900262e-05, "loss": 2.4615, "step": 47885 }, { "epoch": 0.62, "learning_rate": 3.1444846167786215e-05, "loss": 2.475, "step": 47890 }, { "epoch": 0.62, "learning_rate": 3.1435369279680897e-05, "loss": 2.5338, "step": 47895 }, { "epoch": 0.62, "learning_rate": 3.142589316508158e-05, "loss": 2.5198, "step": 47900 }, { "epoch": 0.62, "learning_rate": 3.1416417824383035e-05, "loss": 2.4417, "step": 47905 }, { "epoch": 0.62, "learning_rate": 3.14069432579801e-05, "loss": 2.4186, "step": 47910 }, { "epoch": 0.62, "learning_rate": 3.139746946626751e-05, "loss": 2.5174, "step": 47915 }, { "epoch": 0.62, "learning_rate": 3.138799644964e-05, "loss": 2.5394, "step": 47920 }, { "epoch": 0.62, "learning_rate": 3.137852420849229e-05, "loss": 2.5101, "step": 47925 }, { "epoch": 0.62, "learning_rate": 3.136905274321902e-05, "loss": 2.6073, "step": 47930 }, { "epoch": 0.62, "learning_rate": 3.1359582054214846e-05, "loss": 2.4691, "step": 47935 }, { "epoch": 0.62, "learning_rate": 3.135011214187434e-05, "loss": 2.4614, "step": 47940 }, { "epoch": 0.62, "learning_rate": 3.1340643006592105e-05, "loss": 2.4948, "step": 47945 }, { "epoch": 0.62, "learning_rate": 3.1331174648762665e-05, "loss": 2.4682, "step": 47950 }, { "epoch": 0.62, "learning_rate": 3.132170706878051e-05, "loss": 2.591, "step": 47955 }, { "epoch": 0.62, "learning_rate": 3.131224026704015e-05, "loss": 2.6358, "step": 47960 }, { "epoch": 0.62, "learning_rate": 3.130277424393598e-05, "loss": 2.6084, "step": 47965 }, { "epoch": 0.62, "learning_rate": 3.129330899986244e-05, "loss": 2.4873, "step": 47970 }, { "epoch": 0.62, "learning_rate": 3.128384453521388e-05, "loss": 2.4395, "step": 47975 }, { "epoch": 0.62, "learning_rate": 3.127438085038465e-05, "loss": 2.4437, "step": 47980 }, { "epoch": 0.62, "learning_rate": 3.126491794576908e-05, "loss": 2.4769, "step": 47985 }, { "epoch": 0.62, "learning_rate": 3.125545582176142e-05, "loss": 2.7249, "step": 47990 }, { "epoch": 0.62, "learning_rate": 3.124599447875593e-05, "loss": 2.364, "step": 47995 }, { "epoch": 0.62, "learning_rate": 3.123653391714681e-05, "loss": 2.5245, "step": 48000 } ], "logging_steps": 5, "max_steps": 77054, "num_train_epochs": 1, "save_steps": 1000, "total_flos": 6.925319084703744e+18, "trial_name": null, "trial_params": null }