{ "best_metric": null, "best_model_checkpoint": null, "epoch": 1.0, "eval_steps": 500, "global_step": 74635, "is_hyper_param_search": false, "is_local_process_zero": true, "is_world_process_zero": true, "log_history": [ { "epoch": 0.0, "learning_rate": 4.999999944631254e-05, "loss": 1.1175, "step": 5 }, { "epoch": 0.0, "learning_rate": 4.999999778525017e-05, "loss": 1.2963, "step": 10 }, { "epoch": 0.0, "learning_rate": 4.9999995016812976e-05, "loss": 1.2087, "step": 15 }, { "epoch": 0.0, "learning_rate": 4.999999114100106e-05, "loss": 0.9386, "step": 20 }, { "epoch": 0.0, "learning_rate": 4.9999986157814616e-05, "loss": 1.9483, "step": 25 }, { "epoch": 0.0, "learning_rate": 4.999998137395594e-05, "loss": 1.1969, "step": 30 }, { "epoch": 0.0, "learning_rate": 4.999997439749592e-05, "loss": 0.7181, "step": 35 }, { "epoch": 0.0, "learning_rate": 4.9999966313662104e-05, "loss": 0.5784, "step": 40 }, { "epoch": 0.0, "learning_rate": 4.999995712245485e-05, "loss": 0.6916, "step": 45 }, { "epoch": 0.0, "learning_rate": 4.9999946823874566e-05, "loss": 0.5323, "step": 50 }, { "epoch": 0.0, "learning_rate": 4.999993541792172e-05, "loss": 0.3696, "step": 55 }, { "epoch": 0.0, "learning_rate": 4.9999922904596794e-05, "loss": 0.8375, "step": 60 }, { "epoch": 0.0, "learning_rate": 4.999990928390035e-05, "loss": 0.4259, "step": 65 }, { "epoch": 0.0, "learning_rate": 4.999989455583301e-05, "loss": 1.3398, "step": 70 }, { "epoch": 0.0, "learning_rate": 4.99998787203954e-05, "loss": 1.2475, "step": 75 }, { "epoch": 0.0, "learning_rate": 4.999986177758823e-05, "loss": 0.8862, "step": 80 }, { "epoch": 0.0, "learning_rate": 4.9999843727412264e-05, "loss": 0.5089, "step": 85 }, { "epoch": 0.0, "learning_rate": 4.9999824569868284e-05, "loss": 0.5924, "step": 90 }, { "epoch": 0.0, "learning_rate": 4.9999804304957156e-05, "loss": 0.7195, "step": 95 }, { "epoch": 0.0, "learning_rate": 4.999978293267975e-05, "loss": 0.6065, "step": 100 }, { "epoch": 0.0, "learning_rate": 4.999976045303705e-05, "loss": 1.3779, "step": 105 }, { "epoch": 0.0, "learning_rate": 4.999973686603002e-05, "loss": 0.7869, "step": 110 }, { "epoch": 0.0, "learning_rate": 4.999971217165972e-05, "loss": 1.0238, "step": 115 }, { "epoch": 0.0, "learning_rate": 4.999968636992724e-05, "loss": 1.3405, "step": 120 }, { "epoch": 0.0, "learning_rate": 4.999965946083371e-05, "loss": 0.9579, "step": 125 }, { "epoch": 0.0, "learning_rate": 4.999963144438036e-05, "loss": 0.7728, "step": 130 }, { "epoch": 0.0, "learning_rate": 4.999960232056838e-05, "loss": 0.5664, "step": 135 }, { "epoch": 0.0, "learning_rate": 4.999957208939911e-05, "loss": 0.5849, "step": 140 }, { "epoch": 0.0, "learning_rate": 4.9999540750873854e-05, "loss": 0.649, "step": 145 }, { "epoch": 0.0, "learning_rate": 4.9999508304994016e-05, "loss": 0.4769, "step": 150 }, { "epoch": 0.0, "learning_rate": 4.999947475176102e-05, "loss": 1.5452, "step": 155 }, { "epoch": 0.0, "learning_rate": 4.9999440091176365e-05, "loss": 1.3779, "step": 160 }, { "epoch": 0.0, "learning_rate": 4.999940432324158e-05, "loss": 0.7738, "step": 165 }, { "epoch": 0.0, "learning_rate": 4.9999367447958264e-05, "loss": 0.3997, "step": 170 }, { "epoch": 0.0, "learning_rate": 4.9999329465328026e-05, "loss": 0.3091, "step": 175 }, { "epoch": 0.0, "learning_rate": 4.999929037535257e-05, "loss": 0.3844, "step": 180 }, { "epoch": 0.0, "learning_rate": 4.999925017803361e-05, "loss": 1.5298, "step": 185 }, { "epoch": 0.0, "learning_rate": 4.999920887337293e-05, "loss": 0.6153, "step": 190 }, { "epoch": 0.0, "learning_rate": 4.999916646137237e-05, "loss": 0.4478, "step": 195 }, { "epoch": 0.0, "learning_rate": 4.9999122942033805e-05, "loss": 1.5006, "step": 200 }, { "epoch": 0.0, "learning_rate": 4.999907831535916e-05, "loss": 1.6409, "step": 205 }, { "epoch": 0.0, "learning_rate": 4.9999032581350405e-05, "loss": 1.0176, "step": 210 }, { "epoch": 0.0, "learning_rate": 4.999898574000958e-05, "loss": 0.7179, "step": 215 }, { "epoch": 0.0, "learning_rate": 4.999893779133875e-05, "loss": 0.9579, "step": 220 }, { "epoch": 0.0, "learning_rate": 4.9998888735340046e-05, "loss": 0.3466, "step": 225 }, { "epoch": 0.0, "learning_rate": 4.9998838572015624e-05, "loss": 0.8621, "step": 230 }, { "epoch": 0.0, "learning_rate": 4.9998787301367734e-05, "loss": 0.3484, "step": 235 }, { "epoch": 0.0, "learning_rate": 4.9998734923398625e-05, "loss": 0.8321, "step": 240 }, { "epoch": 0.0, "learning_rate": 4.999868143811062e-05, "loss": 1.185, "step": 245 }, { "epoch": 0.0, "learning_rate": 4.9998626845506096e-05, "loss": 0.8132, "step": 250 }, { "epoch": 0.0, "learning_rate": 4.999857114558747e-05, "loss": 1.5201, "step": 255 }, { "epoch": 0.0, "learning_rate": 4.99985143383572e-05, "loss": 0.5482, "step": 260 }, { "epoch": 0.0, "learning_rate": 4.9998456423817806e-05, "loss": 1.1555, "step": 265 }, { "epoch": 0.0, "learning_rate": 4.999839740197186e-05, "loss": 1.1159, "step": 270 }, { "epoch": 0.0, "learning_rate": 4.999833727282198e-05, "loss": 0.8639, "step": 275 }, { "epoch": 0.0, "learning_rate": 4.9998276036370815e-05, "loss": 0.2065, "step": 280 }, { "epoch": 0.0, "learning_rate": 4.9998213692621085e-05, "loss": 1.0141, "step": 285 }, { "epoch": 0.0, "learning_rate": 4.9998150241575547e-05, "loss": 0.4898, "step": 290 }, { "epoch": 0.0, "learning_rate": 4.999808568323702e-05, "loss": 0.6492, "step": 295 }, { "epoch": 0.0, "learning_rate": 4.999802001760835e-05, "loss": 0.4761, "step": 300 }, { "epoch": 0.0, "learning_rate": 4.9997953244692466e-05, "loss": 1.2785, "step": 305 }, { "epoch": 0.0, "learning_rate": 4.99978853644923e-05, "loss": 1.0514, "step": 310 }, { "epoch": 0.0, "learning_rate": 4.999781637701088e-05, "loss": 1.0728, "step": 315 }, { "epoch": 0.0, "learning_rate": 4.9997746282251256e-05, "loss": 1.3544, "step": 320 }, { "epoch": 0.0, "learning_rate": 4.999767508021653e-05, "loss": 0.89, "step": 325 }, { "epoch": 0.0, "learning_rate": 4.999760277090986e-05, "loss": 1.1254, "step": 330 }, { "epoch": 0.0, "learning_rate": 4.999752935433445e-05, "loss": 0.9848, "step": 335 }, { "epoch": 0.0, "learning_rate": 4.999745483049354e-05, "loss": 1.0444, "step": 340 }, { "epoch": 0.0, "learning_rate": 4.9997379199390444e-05, "loss": 1.5312, "step": 345 }, { "epoch": 0.0, "learning_rate": 4.999730246102851e-05, "loss": 1.3145, "step": 350 }, { "epoch": 0.0, "learning_rate": 4.9997224615411126e-05, "loss": 0.9997, "step": 355 }, { "epoch": 0.0, "learning_rate": 4.999714566254176e-05, "loss": 1.1849, "step": 360 }, { "epoch": 0.0, "learning_rate": 4.9997065602423886e-05, "loss": 0.8012, "step": 365 }, { "epoch": 0.0, "learning_rate": 4.9996984435061064e-05, "loss": 0.798, "step": 370 }, { "epoch": 0.01, "learning_rate": 4.9996902160456895e-05, "loss": 1.2059, "step": 375 }, { "epoch": 0.01, "learning_rate": 4.9996818778615004e-05, "loss": 0.4677, "step": 380 }, { "epoch": 0.01, "learning_rate": 4.999673428953911e-05, "loss": 0.8789, "step": 385 }, { "epoch": 0.01, "learning_rate": 4.999664869323294e-05, "loss": 0.9632, "step": 390 }, { "epoch": 0.01, "learning_rate": 4.9996561989700274e-05, "loss": 0.4468, "step": 395 }, { "epoch": 0.01, "learning_rate": 4.999647417894498e-05, "loss": 1.0921, "step": 400 }, { "epoch": 0.01, "learning_rate": 4.9996385260970926e-05, "loss": 1.1251, "step": 405 }, { "epoch": 0.01, "learning_rate": 4.999629523578206e-05, "loss": 0.4541, "step": 410 }, { "epoch": 0.01, "learning_rate": 4.999620410338237e-05, "loss": 1.0725, "step": 415 }, { "epoch": 0.01, "learning_rate": 4.9996111863775886e-05, "loss": 0.8562, "step": 420 }, { "epoch": 0.01, "learning_rate": 4.99960185169667e-05, "loss": 0.581, "step": 425 }, { "epoch": 0.01, "learning_rate": 4.999592406295894e-05, "loss": 0.3293, "step": 430 }, { "epoch": 0.01, "learning_rate": 4.99958285017568e-05, "loss": 0.4994, "step": 435 }, { "epoch": 0.01, "learning_rate": 4.999573183336451e-05, "loss": 0.8315, "step": 440 }, { "epoch": 0.01, "learning_rate": 4.999563405778634e-05, "loss": 0.3814, "step": 445 }, { "epoch": 0.01, "learning_rate": 4.999553517502664e-05, "loss": 0.5276, "step": 450 }, { "epoch": 0.01, "learning_rate": 4.999543518508978e-05, "loss": 0.7973, "step": 455 }, { "epoch": 0.01, "learning_rate": 4.9995334087980186e-05, "loss": 0.8772, "step": 460 }, { "epoch": 0.01, "learning_rate": 4.999523188370234e-05, "loss": 0.3978, "step": 465 }, { "epoch": 0.01, "learning_rate": 4.9995128572260773e-05, "loss": 0.5971, "step": 470 }, { "epoch": 0.01, "learning_rate": 4.9995024153660054e-05, "loss": 1.174, "step": 475 }, { "epoch": 0.01, "learning_rate": 4.9994918627904806e-05, "loss": 0.4168, "step": 480 }, { "epoch": 0.01, "learning_rate": 4.999481199499971e-05, "loss": 1.0939, "step": 485 }, { "epoch": 0.01, "learning_rate": 4.99947042549495e-05, "loss": 0.5027, "step": 490 }, { "epoch": 0.01, "learning_rate": 4.999459540775892e-05, "loss": 0.5189, "step": 495 }, { "epoch": 0.01, "learning_rate": 4.999448545343281e-05, "loss": 0.867, "step": 500 }, { "epoch": 0.01, "learning_rate": 4.999437439197605e-05, "loss": 0.8078, "step": 505 }, { "epoch": 0.01, "learning_rate": 4.999426222339354e-05, "loss": 1.3523, "step": 510 }, { "epoch": 0.01, "learning_rate": 4.999414894769025e-05, "loss": 1.3141, "step": 515 }, { "epoch": 0.01, "learning_rate": 4.9994034564871205e-05, "loss": 1.7203, "step": 520 }, { "epoch": 0.01, "learning_rate": 4.999391907494148e-05, "loss": 0.6086, "step": 525 }, { "epoch": 0.01, "learning_rate": 4.999380247790617e-05, "loss": 0.6749, "step": 530 }, { "epoch": 0.01, "learning_rate": 4.999368477377046e-05, "loss": 0.6562, "step": 535 }, { "epoch": 0.01, "learning_rate": 4.999356596253954e-05, "loss": 1.6794, "step": 540 }, { "epoch": 0.01, "learning_rate": 4.99934460442187e-05, "loss": 0.5717, "step": 545 }, { "epoch": 0.01, "learning_rate": 4.999332501881323e-05, "loss": 0.6799, "step": 550 }, { "epoch": 0.01, "learning_rate": 4.9993202886328506e-05, "loss": 1.6856, "step": 555 }, { "epoch": 0.01, "learning_rate": 4.9993079646769934e-05, "loss": 0.8249, "step": 560 }, { "epoch": 0.01, "learning_rate": 4.9992955300142965e-05, "loss": 1.228, "step": 565 }, { "epoch": 0.01, "learning_rate": 4.99928298464531e-05, "loss": 1.2413, "step": 570 }, { "epoch": 0.01, "learning_rate": 4.999270328570593e-05, "loss": 0.8926, "step": 575 }, { "epoch": 0.01, "learning_rate": 4.999257561790702e-05, "loss": 1.0096, "step": 580 }, { "epoch": 0.01, "learning_rate": 4.9992446843062055e-05, "loss": 0.5719, "step": 585 }, { "epoch": 0.01, "learning_rate": 4.9992316961176725e-05, "loss": 0.9341, "step": 590 }, { "epoch": 0.01, "learning_rate": 4.999218597225679e-05, "loss": 0.4394, "step": 595 }, { "epoch": 0.01, "learning_rate": 4.999205387630804e-05, "loss": 1.0186, "step": 600 }, { "epoch": 0.01, "learning_rate": 4.9991920673336346e-05, "loss": 1.0815, "step": 605 }, { "epoch": 0.01, "learning_rate": 4.999178636334759e-05, "loss": 0.3498, "step": 610 }, { "epoch": 0.01, "learning_rate": 4.999165094634773e-05, "loss": 0.859, "step": 615 }, { "epoch": 0.01, "learning_rate": 4.999151442234275e-05, "loss": 1.0441, "step": 620 }, { "epoch": 0.01, "learning_rate": 4.9991376791338727e-05, "loss": 1.0832, "step": 625 }, { "epoch": 0.01, "learning_rate": 4.999123805334174e-05, "loss": 0.8298, "step": 630 }, { "epoch": 0.01, "learning_rate": 4.9991098208357926e-05, "loss": 1.0205, "step": 635 }, { "epoch": 0.01, "learning_rate": 4.999095725639349e-05, "loss": 0.8987, "step": 640 }, { "epoch": 0.01, "learning_rate": 4.999081519745468e-05, "loss": 0.8961, "step": 645 }, { "epoch": 0.01, "learning_rate": 4.999067203154777e-05, "loss": 1.5879, "step": 650 }, { "epoch": 0.01, "learning_rate": 4.999052775867912e-05, "loss": 0.4529, "step": 655 }, { "epoch": 0.01, "learning_rate": 4.999038237885511e-05, "loss": 1.0315, "step": 660 }, { "epoch": 0.01, "learning_rate": 4.999023589208219e-05, "loss": 1.0413, "step": 665 }, { "epoch": 0.01, "learning_rate": 4.9990088298366835e-05, "loss": 1.4792, "step": 670 }, { "epoch": 0.01, "learning_rate": 4.9989939597715596e-05, "loss": 0.8857, "step": 675 }, { "epoch": 0.01, "learning_rate": 4.998978979013505e-05, "loss": 1.3394, "step": 680 }, { "epoch": 0.01, "learning_rate": 4.998963887563184e-05, "loss": 0.6586, "step": 685 }, { "epoch": 0.01, "learning_rate": 4.9989486854212644e-05, "loss": 0.8019, "step": 690 }, { "epoch": 0.01, "learning_rate": 4.99893337258842e-05, "loss": 0.9601, "step": 695 }, { "epoch": 0.01, "learning_rate": 4.998917949065328e-05, "loss": 0.4579, "step": 700 }, { "epoch": 0.01, "learning_rate": 4.9989024148526744e-05, "loss": 1.2467, "step": 705 }, { "epoch": 0.01, "learning_rate": 4.998886769951144e-05, "loss": 1.1879, "step": 710 }, { "epoch": 0.01, "learning_rate": 4.998871014361431e-05, "loss": 0.6006, "step": 715 }, { "epoch": 0.01, "learning_rate": 4.998855148084235e-05, "loss": 0.4459, "step": 720 }, { "epoch": 0.01, "learning_rate": 4.998839171120257e-05, "loss": 1.0295, "step": 725 }, { "epoch": 0.01, "learning_rate": 4.9988230834702044e-05, "loss": 1.2731, "step": 730 }, { "epoch": 0.01, "learning_rate": 4.9988068851347905e-05, "loss": 0.9354, "step": 735 }, { "epoch": 0.01, "learning_rate": 4.9987905761147327e-05, "loss": 0.9916, "step": 740 }, { "epoch": 0.01, "learning_rate": 4.998774156410753e-05, "loss": 0.8256, "step": 745 }, { "epoch": 0.01, "learning_rate": 4.99875762602358e-05, "loss": 0.555, "step": 750 }, { "epoch": 0.01, "learning_rate": 4.9987409849539446e-05, "loss": 0.4985, "step": 755 }, { "epoch": 0.01, "learning_rate": 4.9987242332025846e-05, "loss": 0.8432, "step": 760 }, { "epoch": 0.01, "learning_rate": 4.998707370770241e-05, "loss": 0.5412, "step": 765 }, { "epoch": 0.01, "learning_rate": 4.9986903976576624e-05, "loss": 1.242, "step": 770 }, { "epoch": 0.01, "learning_rate": 4.9986733138656004e-05, "loss": 0.5827, "step": 775 }, { "epoch": 0.01, "learning_rate": 4.99865611939481e-05, "loss": 1.6726, "step": 780 }, { "epoch": 0.01, "learning_rate": 4.998638814246054e-05, "loss": 1.0135, "step": 785 }, { "epoch": 0.01, "learning_rate": 4.998621398420099e-05, "loss": 1.6161, "step": 790 }, { "epoch": 0.01, "learning_rate": 4.998603871917716e-05, "loss": 0.5247, "step": 795 }, { "epoch": 0.01, "learning_rate": 4.998586234739682e-05, "loss": 0.5473, "step": 800 }, { "epoch": 0.01, "learning_rate": 4.998568486886778e-05, "loss": 0.9008, "step": 805 }, { "epoch": 0.01, "learning_rate": 4.9985506283597894e-05, "loss": 0.8078, "step": 810 }, { "epoch": 0.01, "learning_rate": 4.998532659159508e-05, "loss": 0.5772, "step": 815 }, { "epoch": 0.01, "learning_rate": 4.998514579286729e-05, "loss": 1.8732, "step": 820 }, { "epoch": 0.01, "learning_rate": 4.998496388742256e-05, "loss": 1.0388, "step": 825 }, { "epoch": 0.01, "learning_rate": 4.99847808752689e-05, "loss": 1.3867, "step": 830 }, { "epoch": 0.01, "learning_rate": 4.9984596756414454e-05, "loss": 0.3347, "step": 835 }, { "epoch": 0.01, "learning_rate": 4.998441153086736e-05, "loss": 1.0324, "step": 840 }, { "epoch": 0.01, "learning_rate": 4.9984225198635836e-05, "loss": 1.425, "step": 845 }, { "epoch": 0.01, "learning_rate": 4.998403775972812e-05, "loss": 0.8445, "step": 850 }, { "epoch": 0.01, "learning_rate": 4.998384921415253e-05, "loss": 0.5355, "step": 855 }, { "epoch": 0.01, "learning_rate": 4.9983659561917403e-05, "loss": 0.5849, "step": 860 }, { "epoch": 0.01, "learning_rate": 4.998346880303115e-05, "loss": 1.014, "step": 865 }, { "epoch": 0.01, "learning_rate": 4.998327693750222e-05, "loss": 0.4799, "step": 870 }, { "epoch": 0.01, "learning_rate": 4.998308396533911e-05, "loss": 0.7285, "step": 875 }, { "epoch": 0.01, "learning_rate": 4.998288988655036e-05, "loss": 0.4578, "step": 880 }, { "epoch": 0.01, "learning_rate": 4.9982694701144575e-05, "loss": 0.9269, "step": 885 }, { "epoch": 0.01, "learning_rate": 4.9982498409130404e-05, "loss": 1.3201, "step": 890 }, { "epoch": 0.01, "learning_rate": 4.998230101051653e-05, "loss": 1.0175, "step": 895 }, { "epoch": 0.01, "learning_rate": 4.998210250531171e-05, "loss": 1.2112, "step": 900 }, { "epoch": 0.01, "learning_rate": 4.9981902893524724e-05, "loss": 0.4092, "step": 905 }, { "epoch": 0.01, "learning_rate": 4.998170217516442e-05, "loss": 0.5984, "step": 910 }, { "epoch": 0.01, "learning_rate": 4.99815003502397e-05, "loss": 0.6566, "step": 915 }, { "epoch": 0.01, "learning_rate": 4.998129741875949e-05, "loss": 0.5821, "step": 920 }, { "epoch": 0.01, "learning_rate": 4.998109338073278e-05, "loss": 0.5089, "step": 925 }, { "epoch": 0.01, "learning_rate": 4.99808882361686e-05, "loss": 0.5211, "step": 930 }, { "epoch": 0.01, "learning_rate": 4.9980681985076064e-05, "loss": 1.2705, "step": 935 }, { "epoch": 0.01, "learning_rate": 4.998047462746428e-05, "loss": 0.9202, "step": 940 }, { "epoch": 0.01, "learning_rate": 4.9980266163342444e-05, "loss": 1.2903, "step": 945 }, { "epoch": 0.01, "learning_rate": 4.9980056592719795e-05, "loss": 0.2625, "step": 950 }, { "epoch": 0.01, "learning_rate": 4.99798459156056e-05, "loss": 1.1078, "step": 955 }, { "epoch": 0.01, "learning_rate": 4.997963413200921e-05, "loss": 0.5878, "step": 960 }, { "epoch": 0.01, "learning_rate": 4.997942124193999e-05, "loss": 0.8494, "step": 965 }, { "epoch": 0.01, "learning_rate": 4.9979207245407376e-05, "loss": 0.6503, "step": 970 }, { "epoch": 0.01, "learning_rate": 4.9978992142420853e-05, "loss": 0.2577, "step": 975 }, { "epoch": 0.01, "learning_rate": 4.9978775932989954e-05, "loss": 0.8531, "step": 980 }, { "epoch": 0.01, "learning_rate": 4.9978558617124225e-05, "loss": 0.253, "step": 985 }, { "epoch": 0.01, "learning_rate": 4.997834019483333e-05, "loss": 0.5543, "step": 990 }, { "epoch": 0.01, "learning_rate": 4.997812066612692e-05, "loss": 0.6569, "step": 995 }, { "epoch": 0.01, "learning_rate": 4.997790003101472e-05, "loss": 0.3126, "step": 1000 }, { "epoch": 0.01, "learning_rate": 4.9977678289506524e-05, "loss": 1.2859, "step": 1005 }, { "epoch": 0.01, "learning_rate": 4.997745544161213e-05, "loss": 1.2787, "step": 1010 }, { "epoch": 0.01, "learning_rate": 4.997723148734143e-05, "loss": 1.5152, "step": 1015 }, { "epoch": 0.01, "learning_rate": 4.9977006426704315e-05, "loss": 1.0104, "step": 1020 }, { "epoch": 0.01, "learning_rate": 4.9976780259710775e-05, "loss": 0.4115, "step": 1025 }, { "epoch": 0.01, "learning_rate": 4.997655298637083e-05, "loss": 0.827, "step": 1030 }, { "epoch": 0.01, "learning_rate": 4.9976324606694535e-05, "loss": 0.6862, "step": 1035 }, { "epoch": 0.01, "learning_rate": 4.997609512069202e-05, "loss": 0.5471, "step": 1040 }, { "epoch": 0.01, "learning_rate": 4.997586452837344e-05, "loss": 0.5487, "step": 1045 }, { "epoch": 0.01, "learning_rate": 4.997563282974901e-05, "loss": 1.0812, "step": 1050 }, { "epoch": 0.01, "learning_rate": 4.9975400024829e-05, "loss": 0.3919, "step": 1055 }, { "epoch": 0.01, "learning_rate": 4.9975166113623706e-05, "loss": 1.5837, "step": 1060 }, { "epoch": 0.01, "learning_rate": 4.9974931096143504e-05, "loss": 0.8271, "step": 1065 }, { "epoch": 0.01, "learning_rate": 4.997469497239881e-05, "loss": 0.6542, "step": 1070 }, { "epoch": 0.01, "learning_rate": 4.997445774240007e-05, "loss": 0.9562, "step": 1075 }, { "epoch": 0.01, "learning_rate": 4.9974219406157786e-05, "loss": 0.8433, "step": 1080 }, { "epoch": 0.01, "learning_rate": 4.9973979963682525e-05, "loss": 1.4215, "step": 1085 }, { "epoch": 0.01, "learning_rate": 4.99737394149849e-05, "loss": 1.2069, "step": 1090 }, { "epoch": 0.01, "learning_rate": 4.997349776007556e-05, "loss": 0.9409, "step": 1095 }, { "epoch": 0.01, "learning_rate": 4.9973254998965205e-05, "loss": 0.9299, "step": 1100 }, { "epoch": 0.01, "learning_rate": 4.9973011131664584e-05, "loss": 0.4862, "step": 1105 }, { "epoch": 0.01, "learning_rate": 4.997276615818451e-05, "loss": 1.0234, "step": 1110 }, { "epoch": 0.01, "learning_rate": 4.9972520078535835e-05, "loss": 0.9295, "step": 1115 }, { "epoch": 0.02, "learning_rate": 4.997227289272945e-05, "loss": 1.0981, "step": 1120 }, { "epoch": 0.02, "learning_rate": 4.997202460077631e-05, "loss": 0.3906, "step": 1125 }, { "epoch": 0.02, "learning_rate": 4.997177520268741e-05, "loss": 1.3166, "step": 1130 }, { "epoch": 0.02, "learning_rate": 4.99715246984738e-05, "loss": 0.5201, "step": 1135 }, { "epoch": 0.02, "learning_rate": 4.997127308814657e-05, "loss": 0.8628, "step": 1140 }, { "epoch": 0.02, "learning_rate": 4.997102037171687e-05, "loss": 1.0946, "step": 1145 }, { "epoch": 0.02, "learning_rate": 4.99707665491959e-05, "loss": 0.4313, "step": 1150 }, { "epoch": 0.02, "learning_rate": 4.997051162059489e-05, "loss": 0.7298, "step": 1155 }, { "epoch": 0.02, "learning_rate": 4.997025558592514e-05, "loss": 0.6291, "step": 1160 }, { "epoch": 0.02, "learning_rate": 4.9969998445197995e-05, "loss": 0.458, "step": 1165 }, { "epoch": 0.02, "learning_rate": 4.9969740198424833e-05, "loss": 0.5658, "step": 1170 }, { "epoch": 0.02, "learning_rate": 4.99694808456171e-05, "loss": 0.7582, "step": 1175 }, { "epoch": 0.02, "learning_rate": 4.996922038678629e-05, "loss": 0.7076, "step": 1180 }, { "epoch": 0.02, "learning_rate": 4.9968958821943934e-05, "loss": 1.3329, "step": 1185 }, { "epoch": 0.02, "learning_rate": 4.9968696151101615e-05, "loss": 0.5785, "step": 1190 }, { "epoch": 0.02, "learning_rate": 4.996843237427097e-05, "loss": 1.2699, "step": 1195 }, { "epoch": 0.02, "learning_rate": 4.996816749146368e-05, "loss": 0.9656, "step": 1200 }, { "epoch": 0.02, "learning_rate": 4.996790150269149e-05, "loss": 1.2149, "step": 1205 }, { "epoch": 0.02, "learning_rate": 4.996763440796617e-05, "loss": 0.6695, "step": 1210 }, { "epoch": 0.02, "learning_rate": 4.996736620729956e-05, "loss": 0.8939, "step": 1215 }, { "epoch": 0.02, "learning_rate": 4.9967096900703523e-05, "loss": 0.6298, "step": 1220 }, { "epoch": 0.02, "learning_rate": 4.996682648819001e-05, "loss": 0.9118, "step": 1225 }, { "epoch": 0.02, "learning_rate": 4.996655496977099e-05, "loss": 0.4705, "step": 1230 }, { "epoch": 0.02, "learning_rate": 4.9966282345458485e-05, "loss": 0.6012, "step": 1235 }, { "epoch": 0.02, "learning_rate": 4.996600861526457e-05, "loss": 0.8986, "step": 1240 }, { "epoch": 0.02, "learning_rate": 4.9965733779201375e-05, "loss": 1.1022, "step": 1245 }, { "epoch": 0.02, "learning_rate": 4.996545783728108e-05, "loss": 0.4112, "step": 1250 }, { "epoch": 0.02, "learning_rate": 4.99651807895159e-05, "loss": 0.5566, "step": 1255 }, { "epoch": 0.02, "learning_rate": 4.9964902635918095e-05, "loss": 1.1704, "step": 1260 }, { "epoch": 0.02, "learning_rate": 4.996462337650002e-05, "loss": 0.3849, "step": 1265 }, { "epoch": 0.02, "learning_rate": 4.9964343011274005e-05, "loss": 1.2727, "step": 1270 }, { "epoch": 0.02, "learning_rate": 4.99640615402525e-05, "loss": 0.9498, "step": 1275 }, { "epoch": 0.02, "learning_rate": 4.996377896344795e-05, "loss": 0.4641, "step": 1280 }, { "epoch": 0.02, "learning_rate": 4.996349528087289e-05, "loss": 0.684, "step": 1285 }, { "epoch": 0.02, "learning_rate": 4.996321049253988e-05, "loss": 1.2562, "step": 1290 }, { "epoch": 0.02, "learning_rate": 4.996292459846152e-05, "loss": 1.0132, "step": 1295 }, { "epoch": 0.02, "learning_rate": 4.996263759865049e-05, "loss": 0.9469, "step": 1300 }, { "epoch": 0.02, "learning_rate": 4.9962349493119504e-05, "loss": 1.2261, "step": 1305 }, { "epoch": 0.02, "learning_rate": 4.9962060281881314e-05, "loss": 0.8299, "step": 1310 }, { "epoch": 0.02, "learning_rate": 4.996176996494874e-05, "loss": 0.9838, "step": 1315 }, { "epoch": 0.02, "learning_rate": 4.996147854233463e-05, "loss": 1.1255, "step": 1320 }, { "epoch": 0.02, "learning_rate": 4.99611860140519e-05, "loss": 0.2614, "step": 1325 }, { "epoch": 0.02, "learning_rate": 4.9960892380113505e-05, "loss": 0.7404, "step": 1330 }, { "epoch": 0.02, "learning_rate": 4.9960597640532457e-05, "loss": 1.1008, "step": 1335 }, { "epoch": 0.02, "learning_rate": 4.996030179532181e-05, "loss": 0.7277, "step": 1340 }, { "epoch": 0.02, "learning_rate": 4.9960004844494654e-05, "loss": 1.3166, "step": 1345 }, { "epoch": 0.02, "learning_rate": 4.9959706788064165e-05, "loss": 0.6078, "step": 1350 }, { "epoch": 0.02, "learning_rate": 4.995940762604353e-05, "loss": 1.6196, "step": 1355 }, { "epoch": 0.02, "learning_rate": 4.9959107358446013e-05, "loss": 0.7914, "step": 1360 }, { "epoch": 0.02, "learning_rate": 4.995880598528489e-05, "loss": 0.9917, "step": 1365 }, { "epoch": 0.02, "learning_rate": 4.995850350657354e-05, "loss": 0.9428, "step": 1370 }, { "epoch": 0.02, "learning_rate": 4.995819992232535e-05, "loss": 0.8594, "step": 1375 }, { "epoch": 0.02, "learning_rate": 4.995789523255376e-05, "loss": 0.7691, "step": 1380 }, { "epoch": 0.02, "learning_rate": 4.9957589437272276e-05, "loss": 0.2984, "step": 1385 }, { "epoch": 0.02, "learning_rate": 4.9957282536494434e-05, "loss": 1.196, "step": 1390 }, { "epoch": 0.02, "learning_rate": 4.9956974530233835e-05, "loss": 0.5889, "step": 1395 }, { "epoch": 0.02, "learning_rate": 4.995666541850412e-05, "loss": 0.9657, "step": 1400 }, { "epoch": 0.02, "learning_rate": 4.9956355201318974e-05, "loss": 1.0957, "step": 1405 }, { "epoch": 0.02, "learning_rate": 4.995604387869216e-05, "loss": 1.2781, "step": 1410 }, { "epoch": 0.02, "learning_rate": 4.9955731450637444e-05, "loss": 0.2913, "step": 1415 }, { "epoch": 0.02, "learning_rate": 4.995541791716867e-05, "loss": 0.4179, "step": 1420 }, { "epoch": 0.02, "learning_rate": 4.995510327829974e-05, "loss": 0.94, "step": 1425 }, { "epoch": 0.02, "learning_rate": 4.995478753404458e-05, "loss": 0.6625, "step": 1430 }, { "epoch": 0.02, "learning_rate": 4.995447068441717e-05, "loss": 1.4036, "step": 1435 }, { "epoch": 0.02, "learning_rate": 4.9954152729431556e-05, "loss": 0.4726, "step": 1440 }, { "epoch": 0.02, "learning_rate": 4.995383366910182e-05, "loss": 1.3347, "step": 1445 }, { "epoch": 0.02, "learning_rate": 4.995351350344209e-05, "loss": 0.9503, "step": 1450 }, { "epoch": 0.02, "learning_rate": 4.995319223246655e-05, "loss": 0.8173, "step": 1455 }, { "epoch": 0.02, "learning_rate": 4.995286985618943e-05, "loss": 1.5933, "step": 1460 }, { "epoch": 0.02, "learning_rate": 4.995254637462501e-05, "loss": 1.1265, "step": 1465 }, { "epoch": 0.02, "learning_rate": 4.9952221787787624e-05, "loss": 0.8779, "step": 1470 }, { "epoch": 0.02, "learning_rate": 4.9951896095691644e-05, "loss": 0.395, "step": 1475 }, { "epoch": 0.02, "learning_rate": 4.99515692983515e-05, "loss": 0.7555, "step": 1480 }, { "epoch": 0.02, "learning_rate": 4.9951241395781656e-05, "loss": 0.9592, "step": 1485 }, { "epoch": 0.02, "learning_rate": 4.995091238799665e-05, "loss": 0.7174, "step": 1490 }, { "epoch": 0.02, "learning_rate": 4.995058227501105e-05, "loss": 1.0637, "step": 1495 }, { "epoch": 0.02, "learning_rate": 4.995025105683948e-05, "loss": 0.578, "step": 1500 }, { "epoch": 0.02, "learning_rate": 4.9949918733496614e-05, "loss": 0.6913, "step": 1505 }, { "epoch": 0.02, "learning_rate": 4.994958530499716e-05, "loss": 0.545, "step": 1510 }, { "epoch": 0.02, "learning_rate": 4.99492507713559e-05, "loss": 1.279, "step": 1515 }, { "epoch": 0.02, "learning_rate": 4.994891513258765e-05, "loss": 0.9076, "step": 1520 }, { "epoch": 0.02, "learning_rate": 4.994857838870728e-05, "loss": 0.8357, "step": 1525 }, { "epoch": 0.02, "learning_rate": 4.99482405397297e-05, "loss": 0.5646, "step": 1530 }, { "epoch": 0.02, "learning_rate": 4.9947901585669865e-05, "loss": 1.1263, "step": 1535 }, { "epoch": 0.02, "learning_rate": 4.994756152654281e-05, "loss": 0.4438, "step": 1540 }, { "epoch": 0.02, "learning_rate": 4.994722036236358e-05, "loss": 1.1512, "step": 1545 }, { "epoch": 0.02, "learning_rate": 4.99468780931473e-05, "loss": 0.8834, "step": 1550 }, { "epoch": 0.02, "learning_rate": 4.9946534718909124e-05, "loss": 0.7894, "step": 1555 }, { "epoch": 0.02, "learning_rate": 4.994619023966427e-05, "loss": 0.4945, "step": 1560 }, { "epoch": 0.02, "learning_rate": 4.994584465542798e-05, "loss": 0.8794, "step": 1565 }, { "epoch": 0.02, "learning_rate": 4.994549796621558e-05, "loss": 0.716, "step": 1570 }, { "epoch": 0.02, "learning_rate": 4.9945150172042414e-05, "loss": 0.918, "step": 1575 }, { "epoch": 0.02, "learning_rate": 4.994480127292389e-05, "loss": 1.2396, "step": 1580 }, { "epoch": 0.02, "learning_rate": 4.994445126887547e-05, "loss": 1.1982, "step": 1585 }, { "epoch": 0.02, "learning_rate": 4.994410015991265e-05, "loss": 1.7369, "step": 1590 }, { "epoch": 0.02, "learning_rate": 4.9943747946050986e-05, "loss": 0.8866, "step": 1595 }, { "epoch": 0.02, "learning_rate": 4.994339462730608e-05, "loss": 0.8461, "step": 1600 }, { "epoch": 0.02, "learning_rate": 4.994304020369358e-05, "loss": 0.6142, "step": 1605 }, { "epoch": 0.02, "learning_rate": 4.994268467522918e-05, "loss": 1.8143, "step": 1610 }, { "epoch": 0.02, "learning_rate": 4.9942328041928633e-05, "loss": 0.5012, "step": 1615 }, { "epoch": 0.02, "learning_rate": 4.9941970303807735e-05, "loss": 1.0357, "step": 1620 }, { "epoch": 0.02, "learning_rate": 4.994161146088233e-05, "loss": 0.5546, "step": 1625 }, { "epoch": 0.02, "learning_rate": 4.994125151316833e-05, "loss": 0.8161, "step": 1630 }, { "epoch": 0.02, "learning_rate": 4.994089046068166e-05, "loss": 0.2373, "step": 1635 }, { "epoch": 0.02, "learning_rate": 4.99405283034383e-05, "loss": 0.6655, "step": 1640 }, { "epoch": 0.02, "learning_rate": 4.994016504145433e-05, "loss": 0.7921, "step": 1645 }, { "epoch": 0.02, "learning_rate": 4.9939800674745815e-05, "loss": 0.6118, "step": 1650 }, { "epoch": 0.02, "learning_rate": 4.9939435203328904e-05, "loss": 1.139, "step": 1655 }, { "epoch": 0.02, "learning_rate": 4.9939068627219776e-05, "loss": 0.6861, "step": 1660 }, { "epoch": 0.02, "learning_rate": 4.993870094643468e-05, "loss": 0.638, "step": 1665 }, { "epoch": 0.02, "learning_rate": 4.9938332160989884e-05, "loss": 0.5028, "step": 1670 }, { "epoch": 0.02, "learning_rate": 4.993796227090175e-05, "loss": 0.5536, "step": 1675 }, { "epoch": 0.02, "learning_rate": 4.993759127618665e-05, "loss": 0.2113, "step": 1680 }, { "epoch": 0.02, "learning_rate": 4.9937219176861e-05, "loss": 0.9614, "step": 1685 }, { "epoch": 0.02, "learning_rate": 4.993684597294131e-05, "loss": 0.9976, "step": 1690 }, { "epoch": 0.02, "learning_rate": 4.993647166444409e-05, "loss": 0.2613, "step": 1695 }, { "epoch": 0.02, "learning_rate": 4.9936096251385935e-05, "loss": 0.792, "step": 1700 }, { "epoch": 0.02, "learning_rate": 4.993571973378346e-05, "loss": 1.2821, "step": 1705 }, { "epoch": 0.02, "learning_rate": 4.993534211165335e-05, "loss": 0.7822, "step": 1710 }, { "epoch": 0.02, "learning_rate": 4.993496338501234e-05, "loss": 1.8109, "step": 1715 }, { "epoch": 0.02, "learning_rate": 4.99345835538772e-05, "loss": 0.8169, "step": 1720 }, { "epoch": 0.02, "learning_rate": 4.993420261826475e-05, "loss": 1.2367, "step": 1725 }, { "epoch": 0.02, "learning_rate": 4.993382057819186e-05, "loss": 0.914, "step": 1730 }, { "epoch": 0.02, "learning_rate": 4.9933437433675455e-05, "loss": 1.0807, "step": 1735 }, { "epoch": 0.02, "learning_rate": 4.9933053184732515e-05, "loss": 1.421, "step": 1740 }, { "epoch": 0.02, "learning_rate": 4.9932667831380056e-05, "loss": 0.7569, "step": 1745 }, { "epoch": 0.02, "learning_rate": 4.993228137363515e-05, "loss": 0.5558, "step": 1750 }, { "epoch": 0.02, "learning_rate": 4.993189381151491e-05, "loss": 1.1531, "step": 1755 }, { "epoch": 0.02, "learning_rate": 4.99315051450365e-05, "loss": 0.7702, "step": 1760 }, { "epoch": 0.02, "learning_rate": 4.993111537421714e-05, "loss": 0.6939, "step": 1765 }, { "epoch": 0.02, "learning_rate": 4.99307244990741e-05, "loss": 0.4104, "step": 1770 }, { "epoch": 0.02, "learning_rate": 4.993033251962469e-05, "loss": 0.3486, "step": 1775 }, { "epoch": 0.02, "learning_rate": 4.992993943588626e-05, "loss": 0.7353, "step": 1780 }, { "epoch": 0.02, "learning_rate": 4.992954524787625e-05, "loss": 0.2444, "step": 1785 }, { "epoch": 0.02, "learning_rate": 4.99291499556121e-05, "loss": 0.5504, "step": 1790 }, { "epoch": 0.02, "learning_rate": 4.992875355911132e-05, "loss": 0.5027, "step": 1795 }, { "epoch": 0.02, "learning_rate": 4.992835605839147e-05, "loss": 0.891, "step": 1800 }, { "epoch": 0.02, "learning_rate": 4.9927957453470164e-05, "loss": 0.622, "step": 1805 }, { "epoch": 0.02, "learning_rate": 4.992755774436505e-05, "loss": 0.8561, "step": 1810 }, { "epoch": 0.02, "learning_rate": 4.992715693109383e-05, "loss": 1.2842, "step": 1815 }, { "epoch": 0.02, "learning_rate": 4.992675501367428e-05, "loss": 1.2458, "step": 1820 }, { "epoch": 0.02, "learning_rate": 4.992635199212418e-05, "loss": 1.4007, "step": 1825 }, { "epoch": 0.02, "learning_rate": 4.992594786646139e-05, "loss": 1.0679, "step": 1830 }, { "epoch": 0.02, "learning_rate": 4.99255426367038e-05, "loss": 1.0209, "step": 1835 }, { "epoch": 0.02, "learning_rate": 4.992513630286938e-05, "loss": 0.3619, "step": 1840 }, { "epoch": 0.02, "learning_rate": 4.9924728864976124e-05, "loss": 0.5408, "step": 1845 }, { "epoch": 0.02, "learning_rate": 4.992432032304206e-05, "loss": 1.5902, "step": 1850 }, { "epoch": 0.02, "learning_rate": 4.992391067708531e-05, "loss": 1.463, "step": 1855 }, { "epoch": 0.02, "learning_rate": 4.9923499927124007e-05, "loss": 0.7185, "step": 1860 }, { "epoch": 0.02, "learning_rate": 4.992308807317634e-05, "loss": 0.7497, "step": 1865 }, { "epoch": 0.03, "learning_rate": 4.992267511526055e-05, "loss": 1.0309, "step": 1870 }, { "epoch": 0.03, "learning_rate": 4.992226105339495e-05, "loss": 0.3684, "step": 1875 }, { "epoch": 0.03, "learning_rate": 4.992184588759786e-05, "loss": 0.7907, "step": 1880 }, { "epoch": 0.03, "learning_rate": 4.9921429617887684e-05, "loss": 0.7616, "step": 1885 }, { "epoch": 0.03, "learning_rate": 4.992101224428285e-05, "loss": 0.3511, "step": 1890 }, { "epoch": 0.03, "learning_rate": 4.992059376680185e-05, "loss": 0.6516, "step": 1895 }, { "epoch": 0.03, "learning_rate": 4.992017418546322e-05, "loss": 0.567, "step": 1900 }, { "epoch": 0.03, "learning_rate": 4.991975350028555e-05, "loss": 1.0473, "step": 1905 }, { "epoch": 0.03, "learning_rate": 4.991933171128746e-05, "loss": 0.306, "step": 1910 }, { "epoch": 0.03, "learning_rate": 4.991890881848765e-05, "loss": 0.3976, "step": 1915 }, { "epoch": 0.03, "learning_rate": 4.9918484821904844e-05, "loss": 0.4893, "step": 1920 }, { "epoch": 0.03, "learning_rate": 4.991805972155782e-05, "loss": 1.1616, "step": 1925 }, { "epoch": 0.03, "learning_rate": 4.991763351746541e-05, "loss": 1.3054, "step": 1930 }, { "epoch": 0.03, "learning_rate": 4.9917206209646496e-05, "loss": 1.4177, "step": 1935 }, { "epoch": 0.03, "learning_rate": 4.9916777798120006e-05, "loss": 0.5165, "step": 1940 }, { "epoch": 0.03, "learning_rate": 4.991634828290491e-05, "loss": 1.7427, "step": 1945 }, { "epoch": 0.03, "learning_rate": 4.991591766402024e-05, "loss": 0.287, "step": 1950 }, { "epoch": 0.03, "learning_rate": 4.9915485941485075e-05, "loss": 0.8183, "step": 1955 }, { "epoch": 0.03, "learning_rate": 4.991505311531852e-05, "loss": 1.0476, "step": 1960 }, { "epoch": 0.03, "learning_rate": 4.9914619185539765e-05, "loss": 0.6414, "step": 1965 }, { "epoch": 0.03, "learning_rate": 4.991418415216802e-05, "loss": 0.8021, "step": 1970 }, { "epoch": 0.03, "learning_rate": 4.991374801522256e-05, "loss": 0.4192, "step": 1975 }, { "epoch": 0.03, "learning_rate": 4.99133107747227e-05, "loss": 0.699, "step": 1980 }, { "epoch": 0.03, "learning_rate": 4.991287243068782e-05, "loss": 0.7809, "step": 1985 }, { "epoch": 0.03, "learning_rate": 4.991243298313732e-05, "loss": 0.7769, "step": 1990 }, { "epoch": 0.03, "learning_rate": 4.9911992432090674e-05, "loss": 0.9924, "step": 1995 }, { "epoch": 0.03, "learning_rate": 4.9911550777567384e-05, "loss": 0.9471, "step": 2000 }, { "epoch": 0.03, "learning_rate": 4.991110801958704e-05, "loss": 0.4096, "step": 2005 }, { "epoch": 0.03, "learning_rate": 4.991066415816922e-05, "loss": 1.2013, "step": 2010 }, { "epoch": 0.03, "learning_rate": 4.991021919333361e-05, "loss": 1.0866, "step": 2015 }, { "epoch": 0.03, "learning_rate": 4.990977312509991e-05, "loss": 0.4902, "step": 2020 }, { "epoch": 0.03, "learning_rate": 4.990932595348789e-05, "loss": 0.4152, "step": 2025 }, { "epoch": 0.03, "learning_rate": 4.990887767851734e-05, "loss": 0.72, "step": 2030 }, { "epoch": 0.03, "learning_rate": 4.990842830020812e-05, "loss": 1.2541, "step": 2035 }, { "epoch": 0.03, "learning_rate": 4.990797781858014e-05, "loss": 1.145, "step": 2040 }, { "epoch": 0.03, "learning_rate": 4.9907526233653355e-05, "loss": 1.3577, "step": 2045 }, { "epoch": 0.03, "learning_rate": 4.990707354544777e-05, "loss": 0.4055, "step": 2050 }, { "epoch": 0.03, "learning_rate": 4.990661975398343e-05, "loss": 0.8183, "step": 2055 }, { "epoch": 0.03, "learning_rate": 4.9906164859280435e-05, "loss": 0.9741, "step": 2060 }, { "epoch": 0.03, "learning_rate": 4.9905708861358945e-05, "loss": 0.8818, "step": 2065 }, { "epoch": 0.03, "learning_rate": 4.9905251760239145e-05, "loss": 0.7496, "step": 2070 }, { "epoch": 0.03, "learning_rate": 4.99047935559413e-05, "loss": 1.0609, "step": 2075 }, { "epoch": 0.03, "learning_rate": 4.990433424848568e-05, "loss": 0.2517, "step": 2080 }, { "epoch": 0.03, "learning_rate": 4.9903873837892657e-05, "loss": 0.7865, "step": 2085 }, { "epoch": 0.03, "learning_rate": 4.9903412324182616e-05, "loss": 1.1957, "step": 2090 }, { "epoch": 0.03, "learning_rate": 4.990294970737599e-05, "loss": 0.9885, "step": 2095 }, { "epoch": 0.03, "learning_rate": 4.9902485987493274e-05, "loss": 0.6151, "step": 2100 }, { "epoch": 0.03, "learning_rate": 4.990202116455502e-05, "loss": 0.644, "step": 2105 }, { "epoch": 0.03, "learning_rate": 4.9901555238581805e-05, "loss": 1.039, "step": 2110 }, { "epoch": 0.03, "learning_rate": 4.9901088209594274e-05, "loss": 0.5855, "step": 2115 }, { "epoch": 0.03, "learning_rate": 4.99006200776131e-05, "loss": 1.0015, "step": 2120 }, { "epoch": 0.03, "learning_rate": 4.990015084265904e-05, "loss": 0.5825, "step": 2125 }, { "epoch": 0.03, "learning_rate": 4.9899680504752874e-05, "loss": 0.3583, "step": 2130 }, { "epoch": 0.03, "learning_rate": 4.989920906391543e-05, "loss": 0.8008, "step": 2135 }, { "epoch": 0.03, "learning_rate": 4.989873652016759e-05, "loss": 1.0115, "step": 2140 }, { "epoch": 0.03, "learning_rate": 4.989826287353028e-05, "loss": 0.9514, "step": 2145 }, { "epoch": 0.03, "learning_rate": 4.989778812402449e-05, "loss": 0.7021, "step": 2150 }, { "epoch": 0.03, "learning_rate": 4.989731227167125e-05, "loss": 0.6597, "step": 2155 }, { "epoch": 0.03, "learning_rate": 4.9896835316491634e-05, "loss": 0.6834, "step": 2160 }, { "epoch": 0.03, "learning_rate": 4.989635725850676e-05, "loss": 0.4437, "step": 2165 }, { "epoch": 0.03, "learning_rate": 4.9895878097737815e-05, "loss": 1.0334, "step": 2170 }, { "epoch": 0.03, "learning_rate": 4.9895397834206024e-05, "loss": 0.5497, "step": 2175 }, { "epoch": 0.03, "learning_rate": 4.989491646793265e-05, "loss": 1.0403, "step": 2180 }, { "epoch": 0.03, "learning_rate": 4.989443399893903e-05, "loss": 0.366, "step": 2185 }, { "epoch": 0.03, "learning_rate": 4.9893950427246526e-05, "loss": 0.5615, "step": 2190 }, { "epoch": 0.03, "learning_rate": 4.989346575287656e-05, "loss": 0.7266, "step": 2195 }, { "epoch": 0.03, "learning_rate": 4.989297997585059e-05, "loss": 1.197, "step": 2200 }, { "epoch": 0.03, "learning_rate": 4.989249309619015e-05, "loss": 0.9577, "step": 2205 }, { "epoch": 0.03, "learning_rate": 4.989200511391679e-05, "loss": 0.3421, "step": 2210 }, { "epoch": 0.03, "learning_rate": 4.9891516029052145e-05, "loss": 0.9852, "step": 2215 }, { "epoch": 0.03, "learning_rate": 4.989102584161787e-05, "loss": 1.2119, "step": 2220 }, { "epoch": 0.03, "learning_rate": 4.989053455163567e-05, "loss": 0.9544, "step": 2225 }, { "epoch": 0.03, "learning_rate": 4.989004215912731e-05, "loss": 0.7582, "step": 2230 }, { "epoch": 0.03, "learning_rate": 4.9889548664114605e-05, "loss": 0.6777, "step": 2235 }, { "epoch": 0.03, "learning_rate": 4.9889054066619416e-05, "loss": 0.6517, "step": 2240 }, { "epoch": 0.03, "learning_rate": 4.988855836666365e-05, "loss": 1.2618, "step": 2245 }, { "epoch": 0.03, "learning_rate": 4.9888061564269254e-05, "loss": 0.4411, "step": 2250 }, { "epoch": 0.03, "learning_rate": 4.9887563659458245e-05, "loss": 0.6538, "step": 2255 }, { "epoch": 0.03, "learning_rate": 4.988706465225268e-05, "loss": 0.3968, "step": 2260 }, { "epoch": 0.03, "learning_rate": 4.988656454267465e-05, "loss": 0.9654, "step": 2265 }, { "epoch": 0.03, "learning_rate": 4.988606333074632e-05, "loss": 1.8523, "step": 2270 }, { "epoch": 0.03, "learning_rate": 4.988556101648988e-05, "loss": 0.699, "step": 2275 }, { "epoch": 0.03, "learning_rate": 4.988505759992759e-05, "loss": 0.5273, "step": 2280 }, { "epoch": 0.03, "learning_rate": 4.988455308108174e-05, "loss": 0.4947, "step": 2285 }, { "epoch": 0.03, "learning_rate": 4.988404745997468e-05, "loss": 0.4026, "step": 2290 }, { "epoch": 0.03, "learning_rate": 4.988354073662882e-05, "loss": 0.7474, "step": 2295 }, { "epoch": 0.03, "learning_rate": 4.988303291106658e-05, "loss": 0.4164, "step": 2300 }, { "epoch": 0.03, "learning_rate": 4.988252398331048e-05, "loss": 0.5982, "step": 2305 }, { "epoch": 0.03, "learning_rate": 4.9882013953383047e-05, "loss": 0.2961, "step": 2310 }, { "epoch": 0.03, "learning_rate": 4.988150282130687e-05, "loss": 0.9195, "step": 2315 }, { "epoch": 0.03, "learning_rate": 4.98809905871046e-05, "loss": 0.2701, "step": 2320 }, { "epoch": 0.03, "learning_rate": 4.988047725079893e-05, "loss": 0.7474, "step": 2325 }, { "epoch": 0.03, "learning_rate": 4.987996281241258e-05, "loss": 0.9411, "step": 2330 }, { "epoch": 0.03, "learning_rate": 4.987944727196835e-05, "loss": 0.4647, "step": 2335 }, { "epoch": 0.03, "learning_rate": 4.9878930629489086e-05, "loss": 0.5357, "step": 2340 }, { "epoch": 0.03, "learning_rate": 4.987841288499765e-05, "loss": 0.8839, "step": 2345 }, { "epoch": 0.03, "learning_rate": 4.9877997895971154e-05, "loss": 1.7563, "step": 2350 }, { "epoch": 0.03, "learning_rate": 4.9877478167915653e-05, "loss": 0.7657, "step": 2355 }, { "epoch": 0.03, "learning_rate": 4.9877061592067706e-05, "loss": 1.4684, "step": 2360 }, { "epoch": 0.03, "learning_rate": 4.9876539880522735e-05, "loss": 1.1712, "step": 2365 }, { "epoch": 0.03, "learning_rate": 4.987601706707149e-05, "loss": 0.8255, "step": 2370 }, { "epoch": 0.03, "learning_rate": 4.987549315173715e-05, "loss": 1.178, "step": 2375 }, { "epoch": 0.03, "learning_rate": 4.98749681345429e-05, "loss": 1.2578, "step": 2380 }, { "epoch": 0.03, "learning_rate": 4.987444201551202e-05, "loss": 1.6248, "step": 2385 }, { "epoch": 0.03, "learning_rate": 4.98739147946678e-05, "loss": 0.919, "step": 2390 }, { "epoch": 0.03, "learning_rate": 4.987338647203358e-05, "loss": 0.655, "step": 2395 }, { "epoch": 0.03, "learning_rate": 4.987285704763279e-05, "loss": 0.6527, "step": 2400 }, { "epoch": 0.03, "learning_rate": 4.987232652148886e-05, "loss": 1.0444, "step": 2405 }, { "epoch": 0.03, "learning_rate": 4.987179489362531e-05, "loss": 1.234, "step": 2410 }, { "epoch": 0.03, "learning_rate": 4.987126216406567e-05, "loss": 1.36, "step": 2415 }, { "epoch": 0.03, "learning_rate": 4.987072833283354e-05, "loss": 0.9785, "step": 2420 }, { "epoch": 0.03, "learning_rate": 4.987019339995257e-05, "loss": 0.9738, "step": 2425 }, { "epoch": 0.03, "learning_rate": 4.986965736544645e-05, "loss": 0.459, "step": 2430 }, { "epoch": 0.03, "learning_rate": 4.9869120229338936e-05, "loss": 0.6921, "step": 2435 }, { "epoch": 0.03, "learning_rate": 4.986858199165381e-05, "loss": 0.7319, "step": 2440 }, { "epoch": 0.03, "learning_rate": 4.986804265241491e-05, "loss": 1.0496, "step": 2445 }, { "epoch": 0.03, "learning_rate": 4.986750221164613e-05, "loss": 0.4351, "step": 2450 }, { "epoch": 0.03, "learning_rate": 4.986696066937142e-05, "loss": 0.6981, "step": 2455 }, { "epoch": 0.03, "learning_rate": 4.9866418025614754e-05, "loss": 0.4266, "step": 2460 }, { "epoch": 0.03, "learning_rate": 4.986587428040017e-05, "loss": 0.5965, "step": 2465 }, { "epoch": 0.03, "learning_rate": 4.986532943375175e-05, "loss": 0.5691, "step": 2470 }, { "epoch": 0.03, "learning_rate": 4.986478348569364e-05, "loss": 0.9082, "step": 2475 }, { "epoch": 0.03, "learning_rate": 4.986423643625002e-05, "loss": 0.8509, "step": 2480 }, { "epoch": 0.03, "learning_rate": 4.986368828544512e-05, "loss": 0.32, "step": 2485 }, { "epoch": 0.03, "learning_rate": 4.986313903330321e-05, "loss": 0.283, "step": 2490 }, { "epoch": 0.03, "learning_rate": 4.986258867984863e-05, "loss": 0.8743, "step": 2495 }, { "epoch": 0.03, "learning_rate": 4.9862037225105754e-05, "loss": 0.9107, "step": 2500 }, { "epoch": 0.03, "learning_rate": 4.986148466909901e-05, "loss": 1.0217, "step": 2505 }, { "epoch": 0.03, "learning_rate": 4.986093101185287e-05, "loss": 1.0811, "step": 2510 }, { "epoch": 0.03, "learning_rate": 4.9860376253391874e-05, "loss": 0.1914, "step": 2515 }, { "epoch": 0.03, "learning_rate": 4.985982039374057e-05, "loss": 0.803, "step": 2520 }, { "epoch": 0.03, "learning_rate": 4.98592634329236e-05, "loss": 0.877, "step": 2525 }, { "epoch": 0.03, "learning_rate": 4.985870537096562e-05, "loss": 0.6571, "step": 2530 }, { "epoch": 0.03, "learning_rate": 4.985814620789136e-05, "loss": 0.7564, "step": 2535 }, { "epoch": 0.03, "learning_rate": 4.985758594372558e-05, "loss": 0.4985, "step": 2540 }, { "epoch": 0.03, "learning_rate": 4.9857024578493104e-05, "loss": 0.6987, "step": 2545 }, { "epoch": 0.03, "learning_rate": 4.9856462112218796e-05, "loss": 0.4647, "step": 2550 }, { "epoch": 0.03, "learning_rate": 4.9855898544927574e-05, "loss": 0.235, "step": 2555 }, { "epoch": 0.03, "learning_rate": 4.9855333876644386e-05, "loss": 0.4087, "step": 2560 }, { "epoch": 0.03, "learning_rate": 4.985476810739426e-05, "loss": 0.7464, "step": 2565 }, { "epoch": 0.03, "learning_rate": 4.985420123720225e-05, "loss": 0.3383, "step": 2570 }, { "epoch": 0.03, "learning_rate": 4.9853633266093466e-05, "loss": 0.7762, "step": 2575 }, { "epoch": 0.03, "learning_rate": 4.9853064194093074e-05, "loss": 1.346, "step": 2580 }, { "epoch": 0.03, "learning_rate": 4.985249402122627e-05, "loss": 1.0055, "step": 2585 }, { "epoch": 0.03, "learning_rate": 4.9851922747518316e-05, "loss": 1.5706, "step": 2590 }, { "epoch": 0.03, "learning_rate": 4.985135037299451e-05, "loss": 1.0129, "step": 2595 }, { "epoch": 0.03, "learning_rate": 4.985077689768021e-05, "loss": 0.7317, "step": 2600 }, { "epoch": 0.03, "learning_rate": 4.9850202321600824e-05, "loss": 0.9799, "step": 2605 }, { "epoch": 0.03, "learning_rate": 4.984962664478179e-05, "loss": 1.0148, "step": 2610 }, { "epoch": 0.04, "learning_rate": 4.984904986724862e-05, "loss": 1.2287, "step": 2615 }, { "epoch": 0.04, "learning_rate": 4.9848471989026856e-05, "loss": 0.5616, "step": 2620 }, { "epoch": 0.04, "learning_rate": 4.984789301014209e-05, "loss": 0.7716, "step": 2625 }, { "epoch": 0.04, "learning_rate": 4.984731293061998e-05, "loss": 1.3306, "step": 2630 }, { "epoch": 0.04, "learning_rate": 4.984673175048621e-05, "loss": 1.0681, "step": 2635 }, { "epoch": 0.04, "learning_rate": 4.984614946976654e-05, "loss": 0.8964, "step": 2640 }, { "epoch": 0.04, "learning_rate": 4.984556608848673e-05, "loss": 0.5652, "step": 2645 }, { "epoch": 0.04, "learning_rate": 4.9844981606672653e-05, "loss": 0.7767, "step": 2650 }, { "epoch": 0.04, "learning_rate": 4.984439602435018e-05, "loss": 0.4719, "step": 2655 }, { "epoch": 0.04, "learning_rate": 4.984380934154526e-05, "loss": 0.7617, "step": 2660 }, { "epoch": 0.04, "learning_rate": 4.984322155828388e-05, "loss": 0.8898, "step": 2665 }, { "epoch": 0.04, "learning_rate": 4.984263267459206e-05, "loss": 1.2053, "step": 2670 }, { "epoch": 0.04, "learning_rate": 4.98420426904959e-05, "loss": 0.6988, "step": 2675 }, { "epoch": 0.04, "learning_rate": 4.984145160602154e-05, "loss": 1.0365, "step": 2680 }, { "epoch": 0.04, "learning_rate": 4.984085942119515e-05, "loss": 0.8006, "step": 2685 }, { "epoch": 0.04, "learning_rate": 4.9840266136042956e-05, "loss": 0.7906, "step": 2690 }, { "epoch": 0.04, "learning_rate": 4.9839671750591244e-05, "loss": 1.0152, "step": 2695 }, { "epoch": 0.04, "learning_rate": 4.983907626486634e-05, "loss": 0.5343, "step": 2700 }, { "epoch": 0.04, "learning_rate": 4.983847967889463e-05, "loss": 0.5788, "step": 2705 }, { "epoch": 0.04, "learning_rate": 4.983788199270253e-05, "loss": 0.8525, "step": 2710 }, { "epoch": 0.04, "learning_rate": 4.983728320631652e-05, "loss": 0.4533, "step": 2715 }, { "epoch": 0.04, "learning_rate": 4.9836683319763113e-05, "loss": 1.1049, "step": 2720 }, { "epoch": 0.04, "learning_rate": 4.98360823330689e-05, "loss": 0.781, "step": 2725 }, { "epoch": 0.04, "learning_rate": 4.9835480246260484e-05, "loss": 0.9969, "step": 2730 }, { "epoch": 0.04, "learning_rate": 4.9834877059364545e-05, "loss": 0.8607, "step": 2735 }, { "epoch": 0.04, "learning_rate": 4.9834272772407795e-05, "loss": 0.4459, "step": 2740 }, { "epoch": 0.04, "learning_rate": 4.9833667385417006e-05, "loss": 1.1628, "step": 2745 }, { "epoch": 0.04, "learning_rate": 4.983306089841898e-05, "loss": 1.2639, "step": 2750 }, { "epoch": 0.04, "learning_rate": 4.983245331144061e-05, "loss": 0.8062, "step": 2755 }, { "epoch": 0.04, "learning_rate": 4.983184462450878e-05, "loss": 0.6399, "step": 2760 }, { "epoch": 0.04, "learning_rate": 4.983123483765046e-05, "loss": 0.8879, "step": 2765 }, { "epoch": 0.04, "learning_rate": 4.983062395089267e-05, "loss": 1.0355, "step": 2770 }, { "epoch": 0.04, "learning_rate": 4.9830011964262455e-05, "loss": 0.2408, "step": 2775 }, { "epoch": 0.04, "learning_rate": 4.9829398877786934e-05, "loss": 1.1693, "step": 2780 }, { "epoch": 0.04, "learning_rate": 4.9828784691493266e-05, "loss": 1.5412, "step": 2785 }, { "epoch": 0.04, "learning_rate": 4.982816940540865e-05, "loss": 0.7459, "step": 2790 }, { "epoch": 0.04, "learning_rate": 4.982755301956034e-05, "loss": 0.5666, "step": 2795 }, { "epoch": 0.04, "learning_rate": 4.982693553397564e-05, "loss": 0.6943, "step": 2800 }, { "epoch": 0.04, "learning_rate": 4.982631694868189e-05, "loss": 1.1842, "step": 2805 }, { "epoch": 0.04, "learning_rate": 4.9825697263706515e-05, "loss": 0.5255, "step": 2810 }, { "epoch": 0.04, "learning_rate": 4.982507647907694e-05, "loss": 0.7996, "step": 2815 }, { "epoch": 0.04, "learning_rate": 4.982445459482068e-05, "loss": 0.989, "step": 2820 }, { "epoch": 0.04, "learning_rate": 4.982383161096528e-05, "loss": 0.3268, "step": 2825 }, { "epoch": 0.04, "learning_rate": 4.982320752753832e-05, "loss": 0.9517, "step": 2830 }, { "epoch": 0.04, "learning_rate": 4.982258234456745e-05, "loss": 0.6922, "step": 2835 }, { "epoch": 0.04, "learning_rate": 4.982195606208037e-05, "loss": 0.843, "step": 2840 }, { "epoch": 0.04, "learning_rate": 4.982132868010482e-05, "loss": 0.6083, "step": 2845 }, { "epoch": 0.04, "learning_rate": 4.982070019866858e-05, "loss": 0.9425, "step": 2850 }, { "epoch": 0.04, "learning_rate": 4.98200706177995e-05, "loss": 1.0912, "step": 2855 }, { "epoch": 0.04, "learning_rate": 4.981943993752546e-05, "loss": 0.5367, "step": 2860 }, { "epoch": 0.04, "learning_rate": 4.9818808157874405e-05, "loss": 0.467, "step": 2865 }, { "epoch": 0.04, "learning_rate": 4.981817527887431e-05, "loss": 0.5148, "step": 2870 }, { "epoch": 0.04, "learning_rate": 4.98175413005532e-05, "loss": 0.5565, "step": 2875 }, { "epoch": 0.04, "learning_rate": 4.9816906222939184e-05, "loss": 0.6018, "step": 2880 }, { "epoch": 0.04, "learning_rate": 4.9816270046060375e-05, "loss": 1.1111, "step": 2885 }, { "epoch": 0.04, "learning_rate": 4.981563276994495e-05, "loss": 1.4529, "step": 2890 }, { "epoch": 0.04, "learning_rate": 4.9814994394621144e-05, "loss": 1.3564, "step": 2895 }, { "epoch": 0.04, "learning_rate": 4.9814354920117236e-05, "loss": 0.567, "step": 2900 }, { "epoch": 0.04, "learning_rate": 4.981371434646154e-05, "loss": 0.6069, "step": 2905 }, { "epoch": 0.04, "learning_rate": 4.981307267368244e-05, "loss": 0.8488, "step": 2910 }, { "epoch": 0.04, "learning_rate": 4.9812429901808356e-05, "loss": 0.6717, "step": 2915 }, { "epoch": 0.04, "learning_rate": 4.9811786030867756e-05, "loss": 0.6891, "step": 2920 }, { "epoch": 0.04, "learning_rate": 4.9811141060889174e-05, "loss": 0.6973, "step": 2925 }, { "epoch": 0.04, "learning_rate": 4.9810494991901166e-05, "loss": 0.6652, "step": 2930 }, { "epoch": 0.04, "learning_rate": 4.9809847823932354e-05, "loss": 0.9278, "step": 2935 }, { "epoch": 0.04, "learning_rate": 4.98091995570114e-05, "loss": 0.6717, "step": 2940 }, { "epoch": 0.04, "learning_rate": 4.980855019116702e-05, "loss": 0.8417, "step": 2945 }, { "epoch": 0.04, "learning_rate": 4.9807899726427983e-05, "loss": 0.5613, "step": 2950 }, { "epoch": 0.04, "learning_rate": 4.9807248162823095e-05, "loss": 0.9351, "step": 2955 }, { "epoch": 0.04, "learning_rate": 4.980659550038123e-05, "loss": 0.7545, "step": 2960 }, { "epoch": 0.04, "learning_rate": 4.980594173913128e-05, "loss": 0.4632, "step": 2965 }, { "epoch": 0.04, "learning_rate": 4.980528687910221e-05, "loss": 0.7313, "step": 2970 }, { "epoch": 0.04, "learning_rate": 4.9804630920323025e-05, "loss": 0.3477, "step": 2975 }, { "epoch": 0.04, "learning_rate": 4.980397386282279e-05, "loss": 0.2059, "step": 2980 }, { "epoch": 0.04, "learning_rate": 4.98033157066306e-05, "loss": 1.294, "step": 2985 }, { "epoch": 0.04, "learning_rate": 4.980265645177562e-05, "loss": 0.2295, "step": 2990 }, { "epoch": 0.04, "learning_rate": 4.980199609828704e-05, "loss": 0.5236, "step": 2995 }, { "epoch": 0.04, "learning_rate": 4.980133464619411e-05, "loss": 1.1881, "step": 3000 }, { "epoch": 0.04, "learning_rate": 4.980067209552612e-05, "loss": 0.2714, "step": 3005 }, { "epoch": 0.04, "learning_rate": 4.9800008446312454e-05, "loss": 1.1401, "step": 3010 }, { "epoch": 0.04, "learning_rate": 4.979934369858247e-05, "loss": 1.0933, "step": 3015 }, { "epoch": 0.04, "learning_rate": 4.979867785236563e-05, "loss": 0.2539, "step": 3020 }, { "epoch": 0.04, "learning_rate": 4.9798010907691423e-05, "loss": 0.6935, "step": 3025 }, { "epoch": 0.04, "learning_rate": 4.979734286458939e-05, "loss": 1.021, "step": 3030 }, { "epoch": 0.04, "learning_rate": 4.979667372308914e-05, "loss": 1.0689, "step": 3035 }, { "epoch": 0.04, "learning_rate": 4.9796003483220286e-05, "loss": 0.5021, "step": 3040 }, { "epoch": 0.04, "learning_rate": 4.979533214501253e-05, "loss": 1.1022, "step": 3045 }, { "epoch": 0.04, "learning_rate": 4.979465970849561e-05, "loss": 0.6277, "step": 3050 }, { "epoch": 0.04, "learning_rate": 4.9793986173699305e-05, "loss": 1.3499, "step": 3055 }, { "epoch": 0.04, "learning_rate": 4.979331154065345e-05, "loss": 0.9102, "step": 3060 }, { "epoch": 0.04, "learning_rate": 4.979263580938794e-05, "loss": 0.4307, "step": 3065 }, { "epoch": 0.04, "learning_rate": 4.979195897993269e-05, "loss": 1.3121, "step": 3070 }, { "epoch": 0.04, "learning_rate": 4.979128105231769e-05, "loss": 0.9159, "step": 3075 }, { "epoch": 0.04, "learning_rate": 4.9790602026572965e-05, "loss": 0.1863, "step": 3080 }, { "epoch": 0.04, "learning_rate": 4.9789921902728596e-05, "loss": 1.3423, "step": 3085 }, { "epoch": 0.04, "learning_rate": 4.978924068081471e-05, "loss": 0.832, "step": 3090 }, { "epoch": 0.04, "learning_rate": 4.978855836086147e-05, "loss": 1.265, "step": 3095 }, { "epoch": 0.04, "learning_rate": 4.978787494289911e-05, "loss": 0.7418, "step": 3100 }, { "epoch": 0.04, "learning_rate": 4.978719042695791e-05, "loss": 0.2473, "step": 3105 }, { "epoch": 0.04, "learning_rate": 4.9786504813068166e-05, "loss": 1.0325, "step": 3110 }, { "epoch": 0.04, "learning_rate": 4.978581810126027e-05, "loss": 0.6214, "step": 3115 }, { "epoch": 0.04, "learning_rate": 4.978513029156463e-05, "loss": 0.9682, "step": 3120 }, { "epoch": 0.04, "learning_rate": 4.9784441384011714e-05, "loss": 0.2062, "step": 3125 }, { "epoch": 0.04, "learning_rate": 4.978375137863204e-05, "loss": 0.4427, "step": 3130 }, { "epoch": 0.04, "learning_rate": 4.978306027545616e-05, "loss": 0.9781, "step": 3135 }, { "epoch": 0.04, "learning_rate": 4.978236807451471e-05, "loss": 0.8505, "step": 3140 }, { "epoch": 0.04, "learning_rate": 4.9781674775838324e-05, "loss": 0.7987, "step": 3145 }, { "epoch": 0.04, "learning_rate": 4.978098037945773e-05, "loss": 0.254, "step": 3150 }, { "epoch": 0.04, "learning_rate": 4.978028488540368e-05, "loss": 1.5854, "step": 3155 }, { "epoch": 0.04, "learning_rate": 4.977958829370698e-05, "loss": 0.9271, "step": 3160 }, { "epoch": 0.04, "learning_rate": 4.977889060439849e-05, "loss": 0.8002, "step": 3165 }, { "epoch": 0.04, "learning_rate": 4.977819181750911e-05, "loss": 0.3987, "step": 3170 }, { "epoch": 0.04, "learning_rate": 4.9777491933069795e-05, "loss": 0.6166, "step": 3175 }, { "epoch": 0.04, "learning_rate": 4.977679095111154e-05, "loss": 0.6864, "step": 3180 }, { "epoch": 0.04, "learning_rate": 4.9776088871665404e-05, "loss": 0.988, "step": 3185 }, { "epoch": 0.04, "learning_rate": 4.9775385694762475e-05, "loss": 0.2027, "step": 3190 }, { "epoch": 0.04, "learning_rate": 4.977468142043392e-05, "loss": 0.4261, "step": 3195 }, { "epoch": 0.04, "learning_rate": 4.9773976048710916e-05, "loss": 0.8661, "step": 3200 }, { "epoch": 0.04, "learning_rate": 4.9773269579624715e-05, "loss": 0.6245, "step": 3205 }, { "epoch": 0.04, "learning_rate": 4.97725620132066e-05, "loss": 0.6725, "step": 3210 }, { "epoch": 0.04, "learning_rate": 4.977185334948793e-05, "loss": 0.4991, "step": 3215 }, { "epoch": 0.04, "learning_rate": 4.977114358850008e-05, "loss": 1.0742, "step": 3220 }, { "epoch": 0.04, "learning_rate": 4.9770432730274505e-05, "loss": 0.766, "step": 3225 }, { "epoch": 0.04, "learning_rate": 4.9769720774842674e-05, "loss": 0.437, "step": 3230 }, { "epoch": 0.04, "learning_rate": 4.976900772223613e-05, "loss": 0.7723, "step": 3235 }, { "epoch": 0.04, "learning_rate": 4.9768293572486465e-05, "loss": 0.5197, "step": 3240 }, { "epoch": 0.04, "learning_rate": 4.976757832562531e-05, "loss": 1.1187, "step": 3245 }, { "epoch": 0.04, "learning_rate": 4.976686198168433e-05, "loss": 0.99, "step": 3250 }, { "epoch": 0.04, "learning_rate": 4.976614454069528e-05, "loss": 0.3075, "step": 3255 }, { "epoch": 0.04, "learning_rate": 4.976542600268993e-05, "loss": 1.4992, "step": 3260 }, { "epoch": 0.04, "learning_rate": 4.97647063677001e-05, "loss": 1.1848, "step": 3265 }, { "epoch": 0.04, "learning_rate": 4.9763985635757674e-05, "loss": 0.8167, "step": 3270 }, { "epoch": 0.04, "learning_rate": 4.976326380689457e-05, "loss": 1.353, "step": 3275 }, { "epoch": 0.04, "learning_rate": 4.9762540881142774e-05, "loss": 0.4374, "step": 3280 }, { "epoch": 0.04, "learning_rate": 4.976181685853429e-05, "loss": 0.7247, "step": 3285 }, { "epoch": 0.04, "learning_rate": 4.9761091739101206e-05, "loss": 0.8045, "step": 3290 }, { "epoch": 0.04, "learning_rate": 4.976036552287563e-05, "loss": 0.8334, "step": 3295 }, { "epoch": 0.04, "learning_rate": 4.975963820988974e-05, "loss": 0.3525, "step": 3300 }, { "epoch": 0.04, "learning_rate": 4.9758909800175735e-05, "loss": 0.7553, "step": 3305 }, { "epoch": 0.04, "learning_rate": 4.97581802937659e-05, "loss": 1.2237, "step": 3310 }, { "epoch": 0.04, "learning_rate": 4.975744969069254e-05, "loss": 0.7046, "step": 3315 }, { "epoch": 0.04, "learning_rate": 4.975671799098801e-05, "loss": 0.1562, "step": 3320 }, { "epoch": 0.04, "learning_rate": 4.975598519468473e-05, "loss": 1.1846, "step": 3325 }, { "epoch": 0.04, "learning_rate": 4.975525130181515e-05, "loss": 1.3198, "step": 3330 }, { "epoch": 0.04, "learning_rate": 4.975451631241179e-05, "loss": 0.2697, "step": 3335 }, { "epoch": 0.04, "learning_rate": 4.9753780226507205e-05, "loss": 0.8931, "step": 3340 }, { "epoch": 0.04, "learning_rate": 4.975304304413399e-05, "loss": 1.5062, "step": 3345 }, { "epoch": 0.04, "learning_rate": 4.975230476532481e-05, "loss": 0.6078, "step": 3350 }, { "epoch": 0.04, "learning_rate": 4.975156539011235e-05, "loss": 0.8941, "step": 3355 }, { "epoch": 0.05, "learning_rate": 4.9750824918529376e-05, "loss": 0.7903, "step": 3360 }, { "epoch": 0.05, "learning_rate": 4.9750083350608685e-05, "loss": 1.2815, "step": 3365 }, { "epoch": 0.05, "learning_rate": 4.974934068638312e-05, "loss": 0.6684, "step": 3370 }, { "epoch": 0.05, "learning_rate": 4.9748596925885585e-05, "loss": 0.594, "step": 3375 }, { "epoch": 0.05, "learning_rate": 4.974785206914901e-05, "loss": 0.2848, "step": 3380 }, { "epoch": 0.05, "learning_rate": 4.97471061162064e-05, "loss": 0.6103, "step": 3385 }, { "epoch": 0.05, "learning_rate": 4.97463590670908e-05, "loss": 1.8821, "step": 3390 }, { "epoch": 0.05, "learning_rate": 4.974561092183529e-05, "loss": 0.6497, "step": 3395 }, { "epoch": 0.05, "learning_rate": 4.974486168047302e-05, "loss": 0.6983, "step": 3400 }, { "epoch": 0.05, "learning_rate": 4.974411134303717e-05, "loss": 1.3707, "step": 3405 }, { "epoch": 0.05, "learning_rate": 4.974335990956098e-05, "loss": 0.5377, "step": 3410 }, { "epoch": 0.05, "learning_rate": 4.974260738007773e-05, "loss": 0.5527, "step": 3415 }, { "epoch": 0.05, "learning_rate": 4.9741853754620755e-05, "loss": 0.7997, "step": 3420 }, { "epoch": 0.05, "learning_rate": 4.974109903322344e-05, "loss": 1.3219, "step": 3425 }, { "epoch": 0.05, "learning_rate": 4.9740343215919215e-05, "loss": 0.1655, "step": 3430 }, { "epoch": 0.05, "learning_rate": 4.973958630274156e-05, "loss": 0.6577, "step": 3435 }, { "epoch": 0.05, "learning_rate": 4.973882829372399e-05, "loss": 0.6486, "step": 3440 }, { "epoch": 0.05, "learning_rate": 4.97380691889001e-05, "loss": 1.0772, "step": 3445 }, { "epoch": 0.05, "learning_rate": 4.9737308988303505e-05, "loss": 1.3685, "step": 3450 }, { "epoch": 0.05, "learning_rate": 4.9736547691967875e-05, "loss": 0.9558, "step": 3455 }, { "epoch": 0.05, "learning_rate": 4.973578529992694e-05, "loss": 0.3955, "step": 3460 }, { "epoch": 0.05, "learning_rate": 4.973502181221447e-05, "loss": 0.8326, "step": 3465 }, { "epoch": 0.05, "learning_rate": 4.973425722886427e-05, "loss": 0.623, "step": 3470 }, { "epoch": 0.05, "learning_rate": 4.973349154991022e-05, "loss": 0.7513, "step": 3475 }, { "epoch": 0.05, "learning_rate": 4.973272477538622e-05, "loss": 1.2407, "step": 3480 }, { "epoch": 0.05, "learning_rate": 4.973195690532626e-05, "loss": 0.4089, "step": 3485 }, { "epoch": 0.05, "learning_rate": 4.973118793976434e-05, "loss": 0.6868, "step": 3490 }, { "epoch": 0.05, "learning_rate": 4.973041787873451e-05, "loss": 0.8174, "step": 3495 }, { "epoch": 0.05, "learning_rate": 4.972964672227091e-05, "loss": 1.1905, "step": 3500 }, { "epoch": 0.05, "learning_rate": 4.972887447040766e-05, "loss": 1.0471, "step": 3505 }, { "epoch": 0.05, "learning_rate": 4.972810112317899e-05, "loss": 1.4952, "step": 3510 }, { "epoch": 0.05, "learning_rate": 4.9727326680619154e-05, "loss": 0.7131, "step": 3515 }, { "epoch": 0.05, "learning_rate": 4.972655114276245e-05, "loss": 0.4358, "step": 3520 }, { "epoch": 0.05, "learning_rate": 4.972577450964324e-05, "loss": 1.1582, "step": 3525 }, { "epoch": 0.05, "learning_rate": 4.9724996781295904e-05, "loss": 0.5165, "step": 3530 }, { "epoch": 0.05, "learning_rate": 4.972421795775492e-05, "loss": 1.2324, "step": 3535 }, { "epoch": 0.05, "learning_rate": 4.972343803905477e-05, "loss": 0.9332, "step": 3540 }, { "epoch": 0.05, "learning_rate": 4.972265702523e-05, "loss": 0.4642, "step": 3545 }, { "epoch": 0.05, "learning_rate": 4.9721874916315206e-05, "loss": 0.6453, "step": 3550 }, { "epoch": 0.05, "learning_rate": 4.9721091712345035e-05, "loss": 0.4429, "step": 3555 }, { "epoch": 0.05, "learning_rate": 4.972030741335417e-05, "loss": 1.71, "step": 3560 }, { "epoch": 0.05, "learning_rate": 4.971952201937737e-05, "loss": 0.9299, "step": 3565 }, { "epoch": 0.05, "learning_rate": 4.97187355304494e-05, "loss": 0.4922, "step": 3570 }, { "epoch": 0.05, "learning_rate": 4.971794794660512e-05, "loss": 1.2144, "step": 3575 }, { "epoch": 0.05, "learning_rate": 4.97171592678794e-05, "loss": 1.3294, "step": 3580 }, { "epoch": 0.05, "learning_rate": 4.9716369494307184e-05, "loss": 0.7824, "step": 3585 }, { "epoch": 0.05, "learning_rate": 4.9715578625923455e-05, "loss": 0.3279, "step": 3590 }, { "epoch": 0.05, "learning_rate": 4.9714786662763236e-05, "loss": 0.3672, "step": 3595 }, { "epoch": 0.05, "learning_rate": 4.9713993604861606e-05, "loss": 1.2012, "step": 3600 }, { "epoch": 0.05, "learning_rate": 4.9713199452253714e-05, "loss": 1.5225, "step": 3605 }, { "epoch": 0.05, "learning_rate": 4.97124042049747e-05, "loss": 0.6093, "step": 3610 }, { "epoch": 0.05, "learning_rate": 4.971160786305984e-05, "loss": 0.8438, "step": 3615 }, { "epoch": 0.05, "learning_rate": 4.9710810426544365e-05, "loss": 0.4272, "step": 3620 }, { "epoch": 0.05, "learning_rate": 4.971001189546361e-05, "loss": 0.8822, "step": 3625 }, { "epoch": 0.05, "learning_rate": 4.9709212269852955e-05, "loss": 0.862, "step": 3630 }, { "epoch": 0.05, "learning_rate": 4.9708411549747805e-05, "loss": 0.6941, "step": 3635 }, { "epoch": 0.05, "learning_rate": 4.9707609735183645e-05, "loss": 1.0584, "step": 3640 }, { "epoch": 0.05, "learning_rate": 4.970680682619597e-05, "loss": 0.4967, "step": 3645 }, { "epoch": 0.05, "learning_rate": 4.970600282282037e-05, "loss": 1.015, "step": 3650 }, { "epoch": 0.05, "learning_rate": 4.970519772509244e-05, "loss": 0.3541, "step": 3655 }, { "epoch": 0.05, "learning_rate": 4.970439153304784e-05, "loss": 0.9704, "step": 3660 }, { "epoch": 0.05, "learning_rate": 4.97035842467223e-05, "loss": 0.8816, "step": 3665 }, { "epoch": 0.05, "learning_rate": 4.9702775866151565e-05, "loss": 0.9495, "step": 3670 }, { "epoch": 0.05, "learning_rate": 4.970196639137144e-05, "loss": 0.601, "step": 3675 }, { "epoch": 0.05, "learning_rate": 4.970115582241778e-05, "loss": 0.7744, "step": 3680 }, { "epoch": 0.05, "learning_rate": 4.970034415932649e-05, "loss": 0.5664, "step": 3685 }, { "epoch": 0.05, "learning_rate": 4.969953140213353e-05, "loss": 1.1389, "step": 3690 }, { "epoch": 0.05, "learning_rate": 4.9698717550874896e-05, "loss": 0.4188, "step": 3695 }, { "epoch": 0.05, "learning_rate": 4.969790260558664e-05, "loss": 1.0433, "step": 3700 }, { "epoch": 0.05, "learning_rate": 4.969708656630486e-05, "loss": 0.501, "step": 3705 }, { "epoch": 0.05, "learning_rate": 4.96962694330657e-05, "loss": 1.2308, "step": 3710 }, { "epoch": 0.05, "learning_rate": 4.969545120590535e-05, "loss": 0.5618, "step": 3715 }, { "epoch": 0.05, "learning_rate": 4.9694631884860065e-05, "loss": 0.6735, "step": 3720 }, { "epoch": 0.05, "learning_rate": 4.969381146996613e-05, "loss": 0.5196, "step": 3725 }, { "epoch": 0.05, "learning_rate": 4.9692989961259884e-05, "loss": 0.2278, "step": 3730 }, { "epoch": 0.05, "learning_rate": 4.969216735877772e-05, "loss": 1.0927, "step": 3735 }, { "epoch": 0.05, "learning_rate": 4.969134366255608e-05, "loss": 0.6376, "step": 3740 }, { "epoch": 0.05, "learning_rate": 4.969051887263143e-05, "loss": 1.1881, "step": 3745 }, { "epoch": 0.05, "learning_rate": 4.968969298904032e-05, "loss": 0.9272, "step": 3750 }, { "epoch": 0.05, "learning_rate": 4.968886601181933e-05, "loss": 0.9346, "step": 3755 }, { "epoch": 0.05, "learning_rate": 4.96880379410051e-05, "loss": 0.7099, "step": 3760 }, { "epoch": 0.05, "learning_rate": 4.968720877663429e-05, "loss": 0.6478, "step": 3765 }, { "epoch": 0.05, "learning_rate": 4.968637851874363e-05, "loss": 1.0572, "step": 3770 }, { "epoch": 0.05, "learning_rate": 4.9685547167369915e-05, "loss": 0.88, "step": 3775 }, { "epoch": 0.05, "learning_rate": 4.968471472254995e-05, "loss": 1.2131, "step": 3780 }, { "epoch": 0.05, "learning_rate": 4.9683881184320626e-05, "loss": 0.6165, "step": 3785 }, { "epoch": 0.05, "learning_rate": 4.9683046552718845e-05, "loss": 0.6915, "step": 3790 }, { "epoch": 0.05, "learning_rate": 4.96822108277816e-05, "loss": 1.1321, "step": 3795 }, { "epoch": 0.05, "learning_rate": 4.968137400954589e-05, "loss": 0.9788, "step": 3800 }, { "epoch": 0.05, "learning_rate": 4.9680536098048785e-05, "loss": 0.7479, "step": 3805 }, { "epoch": 0.05, "learning_rate": 4.967969709332741e-05, "loss": 1.2326, "step": 3810 }, { "epoch": 0.05, "learning_rate": 4.967885699541892e-05, "loss": 1.3747, "step": 3815 }, { "epoch": 0.05, "learning_rate": 4.967801580436052e-05, "loss": 0.9349, "step": 3820 }, { "epoch": 0.05, "learning_rate": 4.9677173520189495e-05, "loss": 0.7903, "step": 3825 }, { "epoch": 0.05, "learning_rate": 4.967633014294313e-05, "loss": 0.892, "step": 3830 }, { "epoch": 0.05, "learning_rate": 4.9675485672658795e-05, "loss": 0.7944, "step": 3835 }, { "epoch": 0.05, "learning_rate": 4.967464010937389e-05, "loss": 1.0728, "step": 3840 }, { "epoch": 0.05, "learning_rate": 4.967379345312588e-05, "loss": 0.8028, "step": 3845 }, { "epoch": 0.05, "learning_rate": 4.967294570395224e-05, "loss": 0.8058, "step": 3850 }, { "epoch": 0.05, "learning_rate": 4.967209686189056e-05, "loss": 1.5739, "step": 3855 }, { "epoch": 0.05, "learning_rate": 4.967124692697841e-05, "loss": 0.3856, "step": 3860 }, { "epoch": 0.05, "learning_rate": 4.9670395899253454e-05, "loss": 0.6281, "step": 3865 }, { "epoch": 0.05, "learning_rate": 4.966954377875338e-05, "loss": 0.7387, "step": 3870 }, { "epoch": 0.05, "learning_rate": 4.966869056551593e-05, "loss": 0.5523, "step": 3875 }, { "epoch": 0.05, "learning_rate": 4.96678362595789e-05, "loss": 0.7693, "step": 3880 }, { "epoch": 0.05, "learning_rate": 4.966698086098014e-05, "loss": 1.0, "step": 3885 }, { "epoch": 0.05, "learning_rate": 4.966612436975753e-05, "loss": 0.6566, "step": 3890 }, { "epoch": 0.05, "learning_rate": 4.9665266785949004e-05, "loss": 0.6631, "step": 3895 }, { "epoch": 0.05, "learning_rate": 4.9664408109592565e-05, "loss": 0.5425, "step": 3900 }, { "epoch": 0.05, "learning_rate": 4.966354834072624e-05, "loss": 1.1694, "step": 3905 }, { "epoch": 0.05, "learning_rate": 4.96626874793881e-05, "loss": 0.5426, "step": 3910 }, { "epoch": 0.05, "learning_rate": 4.96618255256163e-05, "loss": 0.8268, "step": 3915 }, { "epoch": 0.05, "learning_rate": 4.9660962479449e-05, "loss": 0.5539, "step": 3920 }, { "epoch": 0.05, "learning_rate": 4.966009834092444e-05, "loss": 1.1335, "step": 3925 }, { "epoch": 0.05, "learning_rate": 4.96592331100809e-05, "loss": 0.8021, "step": 3930 }, { "epoch": 0.05, "learning_rate": 4.9658366786956694e-05, "loss": 1.338, "step": 3935 }, { "epoch": 0.05, "learning_rate": 4.96574993715902e-05, "loss": 0.9685, "step": 3940 }, { "epoch": 0.05, "learning_rate": 4.965663086401985e-05, "loss": 0.5646, "step": 3945 }, { "epoch": 0.05, "learning_rate": 4.96557612642841e-05, "loss": 1.3559, "step": 3950 }, { "epoch": 0.05, "learning_rate": 4.965489057242147e-05, "loss": 1.2648, "step": 3955 }, { "epoch": 0.05, "learning_rate": 4.965401878847054e-05, "loss": 0.8787, "step": 3960 }, { "epoch": 0.05, "learning_rate": 4.965314591246991e-05, "loss": 0.8779, "step": 3965 }, { "epoch": 0.05, "learning_rate": 4.9652271944458256e-05, "loss": 0.6939, "step": 3970 }, { "epoch": 0.05, "learning_rate": 4.965139688447429e-05, "loss": 0.6098, "step": 3975 }, { "epoch": 0.05, "learning_rate": 4.965052073255676e-05, "loss": 0.5506, "step": 3980 }, { "epoch": 0.05, "learning_rate": 4.964964348874449e-05, "loss": 0.3134, "step": 3985 }, { "epoch": 0.05, "learning_rate": 4.964876515307634e-05, "loss": 0.8846, "step": 3990 }, { "epoch": 0.05, "learning_rate": 4.964788572559119e-05, "loss": 0.5929, "step": 3995 }, { "epoch": 0.05, "learning_rate": 4.9647005206328025e-05, "loss": 0.7639, "step": 4000 }, { "epoch": 0.05, "learning_rate": 4.964612359532583e-05, "loss": 0.9997, "step": 4005 }, { "epoch": 0.05, "learning_rate": 4.9645240892623655e-05, "loss": 0.5324, "step": 4010 }, { "epoch": 0.05, "learning_rate": 4.964435709826062e-05, "loss": 0.5297, "step": 4015 }, { "epoch": 0.05, "learning_rate": 4.9643472212275845e-05, "loss": 0.2765, "step": 4020 }, { "epoch": 0.05, "learning_rate": 4.964258623470855e-05, "loss": 1.5651, "step": 4025 }, { "epoch": 0.05, "learning_rate": 4.964169916559795e-05, "loss": 0.5073, "step": 4030 }, { "epoch": 0.05, "learning_rate": 4.964081100498337e-05, "loss": 0.8853, "step": 4035 }, { "epoch": 0.05, "learning_rate": 4.963992175290413e-05, "loss": 0.5929, "step": 4040 }, { "epoch": 0.05, "learning_rate": 4.963903140939962e-05, "loss": 0.5431, "step": 4045 }, { "epoch": 0.05, "learning_rate": 4.963813997450929e-05, "loss": 0.5493, "step": 4050 }, { "epoch": 0.05, "learning_rate": 4.9637247448272626e-05, "loss": 0.4897, "step": 4055 }, { "epoch": 0.05, "learning_rate": 4.963635383072915e-05, "loss": 0.9978, "step": 4060 }, { "epoch": 0.05, "learning_rate": 4.963545912191845e-05, "loss": 0.4768, "step": 4065 }, { "epoch": 0.05, "learning_rate": 4.963456332188016e-05, "loss": 0.8546, "step": 4070 }, { "epoch": 0.05, "learning_rate": 4.963366643065396e-05, "loss": 1.5385, "step": 4075 }, { "epoch": 0.05, "learning_rate": 4.963276844827958e-05, "loss": 0.7996, "step": 4080 }, { "epoch": 0.05, "learning_rate": 4.963186937479678e-05, "loss": 1.2318, "step": 4085 }, { "epoch": 0.05, "learning_rate": 4.9630969210245404e-05, "loss": 1.387, "step": 4090 }, { "epoch": 0.05, "learning_rate": 4.963006795466531e-05, "loss": 1.3987, "step": 4095 }, { "epoch": 0.05, "learning_rate": 4.9629165608096425e-05, "loss": 0.5505, "step": 4100 }, { "epoch": 0.06, "learning_rate": 4.962826217057873e-05, "loss": 0.5635, "step": 4105 }, { "epoch": 0.06, "learning_rate": 4.9627357642152226e-05, "loss": 0.8504, "step": 4110 }, { "epoch": 0.06, "learning_rate": 4.9626452022856986e-05, "loss": 0.7243, "step": 4115 }, { "epoch": 0.06, "learning_rate": 4.962554531273313e-05, "loss": 0.6964, "step": 4120 }, { "epoch": 0.06, "learning_rate": 4.9624637511820804e-05, "loss": 0.5984, "step": 4125 }, { "epoch": 0.06, "learning_rate": 4.9623728620160235e-05, "loss": 0.6149, "step": 4130 }, { "epoch": 0.06, "learning_rate": 4.962281863779168e-05, "loss": 0.9798, "step": 4135 }, { "epoch": 0.06, "learning_rate": 4.962190756475543e-05, "loss": 0.8481, "step": 4140 }, { "epoch": 0.06, "learning_rate": 4.9620995401091864e-05, "loss": 1.0338, "step": 4145 }, { "epoch": 0.06, "learning_rate": 4.9620082146841374e-05, "loss": 1.171, "step": 4150 }, { "epoch": 0.06, "learning_rate": 4.961916780204442e-05, "loss": 0.8918, "step": 4155 }, { "epoch": 0.06, "learning_rate": 4.961825236674149e-05, "loss": 1.0609, "step": 4160 }, { "epoch": 0.06, "learning_rate": 4.961733584097315e-05, "loss": 0.524, "step": 4165 }, { "epoch": 0.06, "learning_rate": 4.961641822477999e-05, "loss": 0.2458, "step": 4170 }, { "epoch": 0.06, "learning_rate": 4.9615499518202645e-05, "loss": 0.5365, "step": 4175 }, { "epoch": 0.06, "learning_rate": 4.9614579721281826e-05, "loss": 0.7457, "step": 4180 }, { "epoch": 0.06, "learning_rate": 4.961365883405826e-05, "loss": 1.0368, "step": 4185 }, { "epoch": 0.06, "learning_rate": 4.961273685657276e-05, "loss": 0.8769, "step": 4190 }, { "epoch": 0.06, "learning_rate": 4.961181378886614e-05, "loss": 1.4468, "step": 4195 }, { "epoch": 0.06, "learning_rate": 4.9610889630979304e-05, "loss": 0.7384, "step": 4200 }, { "epoch": 0.06, "learning_rate": 4.960996438295318e-05, "loss": 1.5492, "step": 4205 }, { "epoch": 0.06, "learning_rate": 4.960903804482875e-05, "loss": 0.6691, "step": 4210 }, { "epoch": 0.06, "learning_rate": 4.960811061664705e-05, "loss": 0.9146, "step": 4215 }, { "epoch": 0.06, "learning_rate": 4.960718209844917e-05, "loss": 0.5556, "step": 4220 }, { "epoch": 0.06, "learning_rate": 4.960625249027622e-05, "loss": 0.5529, "step": 4225 }, { "epoch": 0.06, "learning_rate": 4.9605321792169385e-05, "loss": 0.5236, "step": 4230 }, { "epoch": 0.06, "learning_rate": 4.960439000416989e-05, "loss": 0.7544, "step": 4235 }, { "epoch": 0.06, "learning_rate": 4.960345712631902e-05, "loss": 1.026, "step": 4240 }, { "epoch": 0.06, "learning_rate": 4.9602523158658075e-05, "loss": 0.6147, "step": 4245 }, { "epoch": 0.06, "learning_rate": 4.9601588101228443e-05, "loss": 0.6293, "step": 4250 }, { "epoch": 0.06, "learning_rate": 4.960065195407153e-05, "loss": 0.8561, "step": 4255 }, { "epoch": 0.06, "learning_rate": 4.959971471722882e-05, "loss": 0.563, "step": 4260 }, { "epoch": 0.06, "learning_rate": 4.9598776390741806e-05, "loss": 1.3912, "step": 4265 }, { "epoch": 0.06, "learning_rate": 4.959783697465207e-05, "loss": 0.5504, "step": 4270 }, { "epoch": 0.06, "learning_rate": 4.959689646900121e-05, "loss": 0.6368, "step": 4275 }, { "epoch": 0.06, "learning_rate": 4.9595954873830886e-05, "loss": 0.424, "step": 4280 }, { "epoch": 0.06, "learning_rate": 4.959501218918282e-05, "loss": 0.7319, "step": 4285 }, { "epoch": 0.06, "learning_rate": 4.959406841509875e-05, "loss": 0.6301, "step": 4290 }, { "epoch": 0.06, "learning_rate": 4.95931235516205e-05, "loss": 1.2872, "step": 4295 }, { "epoch": 0.06, "learning_rate": 4.9592177598789904e-05, "loss": 0.6805, "step": 4300 }, { "epoch": 0.06, "learning_rate": 4.959123055664887e-05, "loss": 0.2626, "step": 4305 }, { "epoch": 0.06, "learning_rate": 4.9590282425239355e-05, "loss": 0.9996, "step": 4310 }, { "epoch": 0.06, "learning_rate": 4.958933320460335e-05, "loss": 0.7985, "step": 4315 }, { "epoch": 0.06, "learning_rate": 4.958838289478289e-05, "loss": 0.7577, "step": 4320 }, { "epoch": 0.06, "learning_rate": 4.958743149582009e-05, "loss": 0.7785, "step": 4325 }, { "epoch": 0.06, "learning_rate": 4.958647900775708e-05, "loss": 0.8803, "step": 4330 }, { "epoch": 0.06, "learning_rate": 4.958552543063605e-05, "loss": 0.5642, "step": 4335 }, { "epoch": 0.06, "learning_rate": 4.958457076449925e-05, "loss": 1.0093, "step": 4340 }, { "epoch": 0.06, "learning_rate": 4.9583615009388945e-05, "loss": 1.145, "step": 4345 }, { "epoch": 0.06, "learning_rate": 4.958265816534749e-05, "loss": 0.2417, "step": 4350 }, { "epoch": 0.06, "learning_rate": 4.958170023241726e-05, "loss": 0.5464, "step": 4355 }, { "epoch": 0.06, "learning_rate": 4.9580741210640685e-05, "loss": 0.9662, "step": 4360 }, { "epoch": 0.06, "learning_rate": 4.957978110006025e-05, "loss": 1.1097, "step": 4365 }, { "epoch": 0.06, "learning_rate": 4.9578819900718484e-05, "loss": 0.9485, "step": 4370 }, { "epoch": 0.06, "learning_rate": 4.9577857612657956e-05, "loss": 0.3633, "step": 4375 }, { "epoch": 0.06, "learning_rate": 4.95768942359213e-05, "loss": 0.7004, "step": 4380 }, { "epoch": 0.06, "learning_rate": 4.957592977055118e-05, "loss": 0.7473, "step": 4385 }, { "epoch": 0.06, "learning_rate": 4.9574964216590316e-05, "loss": 1.1594, "step": 4390 }, { "epoch": 0.06, "learning_rate": 4.957399757408149e-05, "loss": 0.5809, "step": 4395 }, { "epoch": 0.06, "learning_rate": 4.957302984306751e-05, "loss": 1.1134, "step": 4400 }, { "epoch": 0.06, "learning_rate": 4.957206102359124e-05, "loss": 1.1025, "step": 4405 }, { "epoch": 0.06, "learning_rate": 4.95710911156956e-05, "loss": 1.0843, "step": 4410 }, { "epoch": 0.06, "learning_rate": 4.9570120119423544e-05, "loss": 1.2057, "step": 4415 }, { "epoch": 0.06, "learning_rate": 4.956914803481809e-05, "loss": 1.0412, "step": 4420 }, { "epoch": 0.06, "learning_rate": 4.95681748619223e-05, "loss": 0.2909, "step": 4425 }, { "epoch": 0.06, "learning_rate": 4.956720060077926e-05, "loss": 0.6218, "step": 4430 }, { "epoch": 0.06, "learning_rate": 4.956622525143215e-05, "loss": 0.3591, "step": 4435 }, { "epoch": 0.06, "learning_rate": 4.9565248813924166e-05, "loss": 1.0478, "step": 4440 }, { "epoch": 0.06, "learning_rate": 4.956427128829855e-05, "loss": 1.3519, "step": 4445 }, { "epoch": 0.06, "learning_rate": 4.9563292674598606e-05, "loss": 1.1688, "step": 4450 }, { "epoch": 0.06, "learning_rate": 4.956231297286768e-05, "loss": 0.8875, "step": 4455 }, { "epoch": 0.06, "learning_rate": 4.956133218314918e-05, "loss": 0.7535, "step": 4460 }, { "epoch": 0.06, "learning_rate": 4.956035030548653e-05, "loss": 0.5925, "step": 4465 }, { "epoch": 0.06, "learning_rate": 4.9559367339923234e-05, "loss": 0.7007, "step": 4470 }, { "epoch": 0.06, "learning_rate": 4.955838328650284e-05, "loss": 0.7225, "step": 4475 }, { "epoch": 0.06, "learning_rate": 4.9557398145268924e-05, "loss": 0.8764, "step": 4480 }, { "epoch": 0.06, "learning_rate": 4.955641191626512e-05, "loss": 0.7212, "step": 4485 }, { "epoch": 0.06, "learning_rate": 4.955542459953513e-05, "loss": 1.1364, "step": 4490 }, { "epoch": 0.06, "learning_rate": 4.955443619512268e-05, "loss": 0.5095, "step": 4495 }, { "epoch": 0.06, "learning_rate": 4.955344670307154e-05, "loss": 0.7547, "step": 4500 }, { "epoch": 0.06, "learning_rate": 4.955245612342555e-05, "loss": 0.3087, "step": 4505 }, { "epoch": 0.06, "learning_rate": 4.955146445622858e-05, "loss": 1.3824, "step": 4510 }, { "epoch": 0.06, "learning_rate": 4.955047170152457e-05, "loss": 0.5836, "step": 4515 }, { "epoch": 0.06, "learning_rate": 4.954947785935749e-05, "loss": 0.9102, "step": 4520 }, { "epoch": 0.06, "learning_rate": 4.954848292977134e-05, "loss": 0.5472, "step": 4525 }, { "epoch": 0.06, "learning_rate": 4.954748691281023e-05, "loss": 1.354, "step": 4530 }, { "epoch": 0.06, "learning_rate": 4.9546489808518245e-05, "loss": 0.5045, "step": 4535 }, { "epoch": 0.06, "learning_rate": 4.954549161693957e-05, "loss": 0.9128, "step": 4540 }, { "epoch": 0.06, "learning_rate": 4.9544492338118406e-05, "loss": 1.0513, "step": 4545 }, { "epoch": 0.06, "learning_rate": 4.954349197209902e-05, "loss": 1.147, "step": 4550 }, { "epoch": 0.06, "learning_rate": 4.954249051892574e-05, "loss": 0.5977, "step": 4555 }, { "epoch": 0.06, "learning_rate": 4.9541487978642905e-05, "loss": 0.7018, "step": 4560 }, { "epoch": 0.06, "learning_rate": 4.954048435129493e-05, "loss": 0.4513, "step": 4565 }, { "epoch": 0.06, "learning_rate": 4.953947963692627e-05, "loss": 0.5538, "step": 4570 }, { "epoch": 0.06, "learning_rate": 4.9538473835581434e-05, "loss": 0.2304, "step": 4575 }, { "epoch": 0.06, "learning_rate": 4.953746694730497e-05, "loss": 0.7455, "step": 4580 }, { "epoch": 0.06, "learning_rate": 4.953645897214146e-05, "loss": 0.8419, "step": 4585 }, { "epoch": 0.06, "learning_rate": 4.953544991013559e-05, "loss": 0.8252, "step": 4590 }, { "epoch": 0.06, "learning_rate": 4.953443976133203e-05, "loss": 1.2297, "step": 4595 }, { "epoch": 0.06, "learning_rate": 4.953342852577553e-05, "loss": 0.763, "step": 4600 }, { "epoch": 0.06, "learning_rate": 4.953241620351088e-05, "loss": 1.1741, "step": 4605 }, { "epoch": 0.06, "learning_rate": 4.953140279458293e-05, "loss": 0.6655, "step": 4610 }, { "epoch": 0.06, "learning_rate": 4.9530388299036556e-05, "loss": 0.9325, "step": 4615 }, { "epoch": 0.06, "learning_rate": 4.9529372716916697e-05, "loss": 1.155, "step": 4620 }, { "epoch": 0.06, "learning_rate": 4.9528356048268353e-05, "loss": 0.8223, "step": 4625 }, { "epoch": 0.06, "learning_rate": 4.952733829313655e-05, "loss": 0.4771, "step": 4630 }, { "epoch": 0.06, "learning_rate": 4.952631945156636e-05, "loss": 0.3619, "step": 4635 }, { "epoch": 0.06, "learning_rate": 4.9525299523602926e-05, "loss": 0.2216, "step": 4640 }, { "epoch": 0.06, "learning_rate": 4.952427850929142e-05, "loss": 0.5658, "step": 4645 }, { "epoch": 0.06, "learning_rate": 4.952325640867705e-05, "loss": 0.5298, "step": 4650 }, { "epoch": 0.06, "learning_rate": 4.952223322180513e-05, "loss": 0.5541, "step": 4655 }, { "epoch": 0.06, "learning_rate": 4.952120894872095e-05, "loss": 0.3783, "step": 4660 }, { "epoch": 0.06, "learning_rate": 4.952018358946989e-05, "loss": 0.7742, "step": 4665 }, { "epoch": 0.06, "learning_rate": 4.951915714409736e-05, "loss": 0.9107, "step": 4670 }, { "epoch": 0.06, "learning_rate": 4.951812961264884e-05, "loss": 0.5942, "step": 4675 }, { "epoch": 0.06, "learning_rate": 4.951710099516984e-05, "loss": 0.7492, "step": 4680 }, { "epoch": 0.06, "learning_rate": 4.951607129170592e-05, "loss": 1.096, "step": 4685 }, { "epoch": 0.06, "learning_rate": 4.9515040502302686e-05, "loss": 0.291, "step": 4690 }, { "epoch": 0.06, "learning_rate": 4.9514008627005815e-05, "loss": 0.7473, "step": 4695 }, { "epoch": 0.06, "learning_rate": 4.951297566586099e-05, "loss": 1.2531, "step": 4700 }, { "epoch": 0.06, "learning_rate": 4.9511941618913986e-05, "loss": 1.1285, "step": 4705 }, { "epoch": 0.06, "learning_rate": 4.95109064862106e-05, "loss": 0.2516, "step": 4710 }, { "epoch": 0.06, "learning_rate": 4.950987026779667e-05, "loss": 0.806, "step": 4715 }, { "epoch": 0.06, "learning_rate": 4.950883296371811e-05, "loss": 0.391, "step": 4720 }, { "epoch": 0.06, "learning_rate": 4.950779457402087e-05, "loss": 0.5749, "step": 4725 }, { "epoch": 0.06, "learning_rate": 4.950675509875093e-05, "loss": 0.4852, "step": 4730 }, { "epoch": 0.06, "learning_rate": 4.950571453795435e-05, "loss": 0.9534, "step": 4735 }, { "epoch": 0.06, "learning_rate": 4.9504672891677205e-05, "loss": 0.8782, "step": 4740 }, { "epoch": 0.06, "learning_rate": 4.9503630159965655e-05, "loss": 1.8923, "step": 4745 }, { "epoch": 0.06, "learning_rate": 4.950258634286586e-05, "loss": 1.1646, "step": 4750 }, { "epoch": 0.06, "learning_rate": 4.950154144042409e-05, "loss": 0.7057, "step": 4755 }, { "epoch": 0.06, "learning_rate": 4.9500495452686606e-05, "loss": 0.7829, "step": 4760 }, { "epoch": 0.06, "learning_rate": 4.9499448379699744e-05, "loss": 0.6613, "step": 4765 }, { "epoch": 0.06, "learning_rate": 4.949840022150989e-05, "loss": 0.4131, "step": 4770 }, { "epoch": 0.06, "learning_rate": 4.949735097816346e-05, "loss": 0.2849, "step": 4775 }, { "epoch": 0.06, "learning_rate": 4.949630064970695e-05, "loss": 0.4401, "step": 4780 }, { "epoch": 0.06, "learning_rate": 4.949524923618686e-05, "loss": 0.7941, "step": 4785 }, { "epoch": 0.06, "learning_rate": 4.9494196737649776e-05, "loss": 0.9288, "step": 4790 }, { "epoch": 0.06, "learning_rate": 4.9493143154142324e-05, "loss": 0.9473, "step": 4795 }, { "epoch": 0.06, "learning_rate": 4.949208848571116e-05, "loss": 1.4367, "step": 4800 }, { "epoch": 0.06, "learning_rate": 4.949124396985256e-05, "loss": 1.5272, "step": 4805 }, { "epoch": 0.06, "learning_rate": 4.949018734867648e-05, "loss": 1.073, "step": 4810 }, { "epoch": 0.06, "learning_rate": 4.948912964270763e-05, "loss": 0.5946, "step": 4815 }, { "epoch": 0.06, "learning_rate": 4.948807085199284e-05, "loss": 0.4268, "step": 4820 }, { "epoch": 0.06, "learning_rate": 4.948701097657904e-05, "loss": 0.5821, "step": 4825 }, { "epoch": 0.06, "learning_rate": 4.948595001651314e-05, "loss": 1.0033, "step": 4830 }, { "epoch": 0.06, "learning_rate": 4.948488797184216e-05, "loss": 0.663, "step": 4835 }, { "epoch": 0.06, "learning_rate": 4.9483824842613144e-05, "loss": 1.0686, "step": 4840 }, { "epoch": 0.06, "learning_rate": 4.9482760628873165e-05, "loss": 1.0782, "step": 4845 }, { "epoch": 0.06, "learning_rate": 4.948169533066938e-05, "loss": 0.4974, "step": 4850 }, { "epoch": 0.07, "learning_rate": 4.948062894804897e-05, "loss": 1.0377, "step": 4855 }, { "epoch": 0.07, "learning_rate": 4.947956148105917e-05, "loss": 0.5624, "step": 4860 }, { "epoch": 0.07, "learning_rate": 4.947849292974726e-05, "loss": 0.4404, "step": 4865 }, { "epoch": 0.07, "learning_rate": 4.9477423294160575e-05, "loss": 0.6222, "step": 4870 }, { "epoch": 0.07, "learning_rate": 4.94763525743465e-05, "loss": 0.3875, "step": 4875 }, { "epoch": 0.07, "learning_rate": 4.947528077035245e-05, "loss": 0.5085, "step": 4880 }, { "epoch": 0.07, "learning_rate": 4.947420788222592e-05, "loss": 0.5763, "step": 4885 }, { "epoch": 0.07, "learning_rate": 4.947313391001441e-05, "loss": 1.0699, "step": 4890 }, { "epoch": 0.07, "learning_rate": 4.947205885376551e-05, "loss": 1.2184, "step": 4895 }, { "epoch": 0.07, "learning_rate": 4.947098271352683e-05, "loss": 1.0638, "step": 4900 }, { "epoch": 0.07, "learning_rate": 4.9469905489346044e-05, "loss": 0.9528, "step": 4905 }, { "epoch": 0.07, "learning_rate": 4.946882718127086e-05, "loss": 1.5389, "step": 4910 }, { "epoch": 0.07, "learning_rate": 4.946774778934904e-05, "loss": 0.6596, "step": 4915 }, { "epoch": 0.07, "learning_rate": 4.946666731362841e-05, "loss": 1.3197, "step": 4920 }, { "epoch": 0.07, "learning_rate": 4.9465585754156816e-05, "loss": 0.5777, "step": 4925 }, { "epoch": 0.07, "learning_rate": 4.9464503110982175e-05, "loss": 0.9238, "step": 4930 }, { "epoch": 0.07, "learning_rate": 4.946341938415243e-05, "loss": 0.5639, "step": 4935 }, { "epoch": 0.07, "learning_rate": 4.9462334573715604e-05, "loss": 1.0064, "step": 4940 }, { "epoch": 0.07, "learning_rate": 4.9461248679719727e-05, "loss": 1.5447, "step": 4945 }, { "epoch": 0.07, "learning_rate": 4.946016170221292e-05, "loss": 1.2077, "step": 4950 }, { "epoch": 0.07, "learning_rate": 4.945907364124331e-05, "loss": 1.0827, "step": 4955 }, { "epoch": 0.07, "learning_rate": 4.945798449685911e-05, "loss": 1.4197, "step": 4960 }, { "epoch": 0.07, "learning_rate": 4.9456894269108555e-05, "loss": 0.3804, "step": 4965 }, { "epoch": 0.07, "learning_rate": 4.945580295803993e-05, "loss": 0.4386, "step": 4970 }, { "epoch": 0.07, "learning_rate": 4.945471056370159e-05, "loss": 0.4593, "step": 4975 }, { "epoch": 0.07, "learning_rate": 4.945361708614192e-05, "loss": 0.6048, "step": 4980 }, { "epoch": 0.07, "learning_rate": 4.945252252540934e-05, "loss": 0.8124, "step": 4985 }, { "epoch": 0.07, "learning_rate": 4.945142688155235e-05, "loss": 0.6763, "step": 4990 }, { "epoch": 0.07, "learning_rate": 4.945033015461947e-05, "loss": 1.3459, "step": 4995 }, { "epoch": 0.07, "learning_rate": 4.9449232344659294e-05, "loss": 0.6308, "step": 5000 }, { "epoch": 0.07, "learning_rate": 4.944813345172044e-05, "loss": 1.2369, "step": 5005 }, { "epoch": 0.07, "learning_rate": 4.9447033475851576e-05, "loss": 0.5001, "step": 5010 }, { "epoch": 0.07, "learning_rate": 4.944593241710144e-05, "loss": 1.0378, "step": 5015 }, { "epoch": 0.07, "learning_rate": 4.944483027551879e-05, "loss": 0.6398, "step": 5020 }, { "epoch": 0.07, "learning_rate": 4.9443727051152465e-05, "loss": 0.6699, "step": 5025 }, { "epoch": 0.07, "learning_rate": 4.944262274405131e-05, "loss": 1.0138, "step": 5030 }, { "epoch": 0.07, "learning_rate": 4.9441517354264257e-05, "loss": 1.3351, "step": 5035 }, { "epoch": 0.07, "learning_rate": 4.944041088184026e-05, "loss": 0.8636, "step": 5040 }, { "epoch": 0.07, "learning_rate": 4.943930332682832e-05, "loss": 0.6586, "step": 5045 }, { "epoch": 0.07, "learning_rate": 4.943819468927752e-05, "loss": 1.2399, "step": 5050 }, { "epoch": 0.07, "learning_rate": 4.9437084969236956e-05, "loss": 1.2593, "step": 5055 }, { "epoch": 0.07, "learning_rate": 4.9435974166755784e-05, "loss": 0.9656, "step": 5060 }, { "epoch": 0.07, "learning_rate": 4.9434862281883206e-05, "loss": 0.3828, "step": 5065 }, { "epoch": 0.07, "learning_rate": 4.9433749314668466e-05, "loss": 0.5869, "step": 5070 }, { "epoch": 0.07, "learning_rate": 4.943263526516087e-05, "loss": 1.2778, "step": 5075 }, { "epoch": 0.07, "learning_rate": 4.943152013340977e-05, "loss": 0.7616, "step": 5080 }, { "epoch": 0.07, "learning_rate": 4.943040391946455e-05, "loss": 1.4096, "step": 5085 }, { "epoch": 0.07, "learning_rate": 4.942928662337467e-05, "loss": 0.6835, "step": 5090 }, { "epoch": 0.07, "learning_rate": 4.94281682451896e-05, "loss": 0.5815, "step": 5095 }, { "epoch": 0.07, "learning_rate": 4.942704878495889e-05, "loss": 0.5383, "step": 5100 }, { "epoch": 0.07, "learning_rate": 4.942592824273211e-05, "loss": 1.2244, "step": 5105 }, { "epoch": 0.07, "learning_rate": 4.942480661855892e-05, "loss": 1.258, "step": 5110 }, { "epoch": 0.07, "learning_rate": 4.942368391248899e-05, "loss": 0.8661, "step": 5115 }, { "epoch": 0.07, "learning_rate": 4.9422560124572045e-05, "loss": 1.2328, "step": 5120 }, { "epoch": 0.07, "learning_rate": 4.942143525485787e-05, "loss": 1.1205, "step": 5125 }, { "epoch": 0.07, "learning_rate": 4.9420309303396295e-05, "loss": 1.2581, "step": 5130 }, { "epoch": 0.07, "learning_rate": 4.941918227023719e-05, "loss": 0.2682, "step": 5135 }, { "epoch": 0.07, "learning_rate": 4.941805415543047e-05, "loss": 0.7995, "step": 5140 }, { "epoch": 0.07, "learning_rate": 4.941692495902611e-05, "loss": 1.3602, "step": 5145 }, { "epoch": 0.07, "learning_rate": 4.941579468107413e-05, "loss": 0.2352, "step": 5150 }, { "epoch": 0.07, "learning_rate": 4.94146633216246e-05, "loss": 0.6922, "step": 5155 }, { "epoch": 0.07, "learning_rate": 4.941353088072762e-05, "loss": 0.7593, "step": 5160 }, { "epoch": 0.07, "learning_rate": 4.941239735843336e-05, "loss": 0.9613, "step": 5165 }, { "epoch": 0.07, "learning_rate": 4.941126275479203e-05, "loss": 1.379, "step": 5170 }, { "epoch": 0.07, "learning_rate": 4.941012706985388e-05, "loss": 1.3141, "step": 5175 }, { "epoch": 0.07, "learning_rate": 4.940899030366923e-05, "loss": 0.9473, "step": 5180 }, { "epoch": 0.07, "learning_rate": 4.940785245628842e-05, "loss": 0.8657, "step": 5185 }, { "epoch": 0.07, "learning_rate": 4.940671352776185e-05, "loss": 0.7301, "step": 5190 }, { "epoch": 0.07, "learning_rate": 4.940557351813999e-05, "loss": 0.7924, "step": 5195 }, { "epoch": 0.07, "learning_rate": 4.94044324274733e-05, "loss": 0.7377, "step": 5200 }, { "epoch": 0.07, "learning_rate": 4.9403290255812354e-05, "loss": 1.1139, "step": 5205 }, { "epoch": 0.07, "learning_rate": 4.9402147003207735e-05, "loss": 0.8094, "step": 5210 }, { "epoch": 0.07, "learning_rate": 4.940100266971009e-05, "loss": 0.6073, "step": 5215 }, { "epoch": 0.07, "learning_rate": 4.9399857255370097e-05, "loss": 1.0039, "step": 5220 }, { "epoch": 0.07, "learning_rate": 4.939871076023849e-05, "loss": 0.9739, "step": 5225 }, { "epoch": 0.07, "learning_rate": 4.939756318436607e-05, "loss": 1.181, "step": 5230 }, { "epoch": 0.07, "learning_rate": 4.939641452780365e-05, "loss": 0.4648, "step": 5235 }, { "epoch": 0.07, "learning_rate": 4.9395264790602114e-05, "loss": 0.4583, "step": 5240 }, { "epoch": 0.07, "learning_rate": 4.9394113972812404e-05, "loss": 0.571, "step": 5245 }, { "epoch": 0.07, "learning_rate": 4.9392962074485484e-05, "loss": 1.4392, "step": 5250 }, { "epoch": 0.07, "learning_rate": 4.939180909567237e-05, "loss": 0.4656, "step": 5255 }, { "epoch": 0.07, "learning_rate": 4.939065503642415e-05, "loss": 0.4398, "step": 5260 }, { "epoch": 0.07, "learning_rate": 4.938949989679193e-05, "loss": 0.4025, "step": 5265 }, { "epoch": 0.07, "learning_rate": 4.9388343676826874e-05, "loss": 0.5695, "step": 5270 }, { "epoch": 0.07, "learning_rate": 4.938718637658022e-05, "loss": 0.5405, "step": 5275 }, { "epoch": 0.07, "learning_rate": 4.93860279961032e-05, "loss": 1.0506, "step": 5280 }, { "epoch": 0.07, "learning_rate": 4.938486853544715e-05, "loss": 0.9756, "step": 5285 }, { "epoch": 0.07, "learning_rate": 4.938370799466341e-05, "loss": 0.2166, "step": 5290 }, { "epoch": 0.07, "learning_rate": 4.9382546373803394e-05, "loss": 0.4422, "step": 5295 }, { "epoch": 0.07, "learning_rate": 4.9381383672918564e-05, "loss": 0.284, "step": 5300 }, { "epoch": 0.07, "learning_rate": 4.938021989206041e-05, "loss": 1.0823, "step": 5305 }, { "epoch": 0.07, "learning_rate": 4.9379055031280486e-05, "loss": 1.2403, "step": 5310 }, { "epoch": 0.07, "learning_rate": 4.937788909063038e-05, "loss": 0.3603, "step": 5315 }, { "epoch": 0.07, "learning_rate": 4.937672207016175e-05, "loss": 0.343, "step": 5320 }, { "epoch": 0.07, "learning_rate": 4.9375553969926295e-05, "loss": 1.3681, "step": 5325 }, { "epoch": 0.07, "learning_rate": 4.937438478997573e-05, "loss": 0.6706, "step": 5330 }, { "epoch": 0.07, "learning_rate": 4.9373214530361876e-05, "loss": 0.3843, "step": 5335 }, { "epoch": 0.07, "learning_rate": 4.937204319113654e-05, "loss": 0.8672, "step": 5340 }, { "epoch": 0.07, "learning_rate": 4.937087077235163e-05, "loss": 0.7624, "step": 5345 }, { "epoch": 0.07, "learning_rate": 4.936969727405907e-05, "loss": 0.6919, "step": 5350 }, { "epoch": 0.07, "learning_rate": 4.936852269631083e-05, "loss": 0.5557, "step": 5355 }, { "epoch": 0.07, "learning_rate": 4.936734703915895e-05, "loss": 0.8234, "step": 5360 }, { "epoch": 0.07, "learning_rate": 4.9366170302655504e-05, "loss": 0.8622, "step": 5365 }, { "epoch": 0.07, "learning_rate": 4.9364992486852614e-05, "loss": 0.5652, "step": 5370 }, { "epoch": 0.07, "learning_rate": 4.9363813591802444e-05, "loss": 0.7132, "step": 5375 }, { "epoch": 0.07, "learning_rate": 4.9362633617557225e-05, "loss": 1.8639, "step": 5380 }, { "epoch": 0.07, "learning_rate": 4.936145256416922e-05, "loss": 0.7416, "step": 5385 }, { "epoch": 0.07, "learning_rate": 4.936027043169074e-05, "loss": 0.4663, "step": 5390 }, { "epoch": 0.07, "learning_rate": 4.935908722017416e-05, "loss": 1.1528, "step": 5395 }, { "epoch": 0.07, "learning_rate": 4.935790292967187e-05, "loss": 0.3635, "step": 5400 }, { "epoch": 0.07, "learning_rate": 4.935671756023634e-05, "loss": 0.4986, "step": 5405 }, { "epoch": 0.07, "learning_rate": 4.935553111192008e-05, "loss": 0.4764, "step": 5410 }, { "epoch": 0.07, "learning_rate": 4.935434358477563e-05, "loss": 0.2827, "step": 5415 }, { "epoch": 0.07, "learning_rate": 4.935315497885561e-05, "loss": 0.7427, "step": 5420 }, { "epoch": 0.07, "learning_rate": 4.9351965294212654e-05, "loss": 0.3166, "step": 5425 }, { "epoch": 0.07, "learning_rate": 4.9350774530899466e-05, "loss": 0.6791, "step": 5430 }, { "epoch": 0.07, "learning_rate": 4.934958268896879e-05, "loss": 1.007, "step": 5435 }, { "epoch": 0.07, "learning_rate": 4.934838976847342e-05, "loss": 0.5546, "step": 5440 }, { "epoch": 0.07, "learning_rate": 4.934719576946619e-05, "loss": 0.508, "step": 5445 }, { "epoch": 0.07, "learning_rate": 4.9346000692e-05, "loss": 0.6777, "step": 5450 }, { "epoch": 0.07, "learning_rate": 4.934480453612776e-05, "loss": 1.8958, "step": 5455 }, { "epoch": 0.07, "learning_rate": 4.93436073019025e-05, "loss": 0.4605, "step": 5460 }, { "epoch": 0.07, "learning_rate": 4.9342408989377206e-05, "loss": 0.5934, "step": 5465 }, { "epoch": 0.07, "learning_rate": 4.934120959860497e-05, "loss": 1.3238, "step": 5470 }, { "epoch": 0.07, "learning_rate": 4.934000912963894e-05, "loss": 0.7274, "step": 5475 }, { "epoch": 0.07, "learning_rate": 4.933880758253227e-05, "loss": 0.6163, "step": 5480 }, { "epoch": 0.07, "learning_rate": 4.9337604957338176e-05, "loss": 0.4487, "step": 5485 }, { "epoch": 0.07, "learning_rate": 4.9336401254109945e-05, "loss": 1.1427, "step": 5490 }, { "epoch": 0.07, "learning_rate": 4.93351964729009e-05, "loss": 0.4089, "step": 5495 }, { "epoch": 0.07, "learning_rate": 4.933399061376439e-05, "loss": 0.3037, "step": 5500 }, { "epoch": 0.07, "learning_rate": 4.933278367675383e-05, "loss": 1.0067, "step": 5505 }, { "epoch": 0.07, "learning_rate": 4.933157566192269e-05, "loss": 0.343, "step": 5510 }, { "epoch": 0.07, "learning_rate": 4.933036656932447e-05, "loss": 0.5222, "step": 5515 }, { "epoch": 0.07, "learning_rate": 4.932915639901274e-05, "loss": 1.1745, "step": 5520 }, { "epoch": 0.07, "learning_rate": 4.93279451510411e-05, "loss": 0.6292, "step": 5525 }, { "epoch": 0.07, "learning_rate": 4.932673282546318e-05, "loss": 0.765, "step": 5530 }, { "epoch": 0.07, "learning_rate": 4.932551942233272e-05, "loss": 0.8477, "step": 5535 }, { "epoch": 0.07, "learning_rate": 4.932430494170344e-05, "loss": 0.493, "step": 5540 }, { "epoch": 0.07, "learning_rate": 4.932308938362914e-05, "loss": 0.8588, "step": 5545 }, { "epoch": 0.07, "learning_rate": 4.932187274816365e-05, "loss": 0.4241, "step": 5550 }, { "epoch": 0.07, "learning_rate": 4.9320655035360895e-05, "loss": 0.2881, "step": 5555 }, { "epoch": 0.07, "learning_rate": 4.9319436245274794e-05, "loss": 0.8029, "step": 5560 }, { "epoch": 0.07, "learning_rate": 4.9318216377959324e-05, "loss": 1.9187, "step": 5565 }, { "epoch": 0.07, "learning_rate": 4.931699543346854e-05, "loss": 0.8799, "step": 5570 }, { "epoch": 0.07, "learning_rate": 4.93157734118565e-05, "loss": 0.8142, "step": 5575 }, { "epoch": 0.07, "learning_rate": 4.9314550313177354e-05, "loss": 0.7785, "step": 5580 }, { "epoch": 0.07, "learning_rate": 4.931332613748527e-05, "loss": 0.9401, "step": 5585 }, { "epoch": 0.07, "learning_rate": 4.9312100884834474e-05, "loss": 0.6881, "step": 5590 }, { "epoch": 0.07, "learning_rate": 4.9310874555279236e-05, "loss": 0.9349, "step": 5595 }, { "epoch": 0.08, "learning_rate": 4.9309647148873875e-05, "loss": 0.7266, "step": 5600 }, { "epoch": 0.08, "learning_rate": 4.930841866567277e-05, "loss": 0.6857, "step": 5605 }, { "epoch": 0.08, "learning_rate": 4.930718910573033e-05, "loss": 1.0948, "step": 5610 }, { "epoch": 0.08, "learning_rate": 4.930595846910101e-05, "loss": 0.4666, "step": 5615 }, { "epoch": 0.08, "learning_rate": 4.9304726755839334e-05, "loss": 0.7403, "step": 5620 }, { "epoch": 0.08, "learning_rate": 4.930349396599986e-05, "loss": 0.5009, "step": 5625 }, { "epoch": 0.08, "learning_rate": 4.930226009963718e-05, "loss": 0.9285, "step": 5630 }, { "epoch": 0.08, "learning_rate": 4.930102515680596e-05, "loss": 0.418, "step": 5635 }, { "epoch": 0.08, "learning_rate": 4.9299789137560904e-05, "loss": 0.897, "step": 5640 }, { "epoch": 0.08, "learning_rate": 4.929855204195676e-05, "loss": 0.5968, "step": 5645 }, { "epoch": 0.08, "learning_rate": 4.929731387004831e-05, "loss": 0.7023, "step": 5650 }, { "epoch": 0.08, "learning_rate": 4.929607462189042e-05, "loss": 0.7224, "step": 5655 }, { "epoch": 0.08, "learning_rate": 4.9294834297537976e-05, "loss": 0.3094, "step": 5660 }, { "epoch": 0.08, "learning_rate": 4.929359289704591e-05, "loss": 0.6856, "step": 5665 }, { "epoch": 0.08, "learning_rate": 4.929235042046922e-05, "loss": 1.0851, "step": 5670 }, { "epoch": 0.08, "learning_rate": 4.9291106867862934e-05, "loss": 0.5618, "step": 5675 }, { "epoch": 0.08, "learning_rate": 4.928986223928214e-05, "loss": 0.4987, "step": 5680 }, { "epoch": 0.08, "learning_rate": 4.928861653478196e-05, "loss": 0.6692, "step": 5685 }, { "epoch": 0.08, "learning_rate": 4.928736975441759e-05, "loss": 0.8234, "step": 5690 }, { "epoch": 0.08, "learning_rate": 4.928612189824424e-05, "loss": 1.2215, "step": 5695 }, { "epoch": 0.08, "learning_rate": 4.92848729663172e-05, "loss": 1.3212, "step": 5700 }, { "epoch": 0.08, "learning_rate": 4.928362295869177e-05, "loss": 0.9183, "step": 5705 }, { "epoch": 0.08, "learning_rate": 4.9282371875423325e-05, "loss": 0.4754, "step": 5710 }, { "epoch": 0.08, "learning_rate": 4.9281119716567305e-05, "loss": 1.5195, "step": 5715 }, { "epoch": 0.08, "learning_rate": 4.927986648217914e-05, "loss": 1.101, "step": 5720 }, { "epoch": 0.08, "learning_rate": 4.9278612172314364e-05, "loss": 1.108, "step": 5725 }, { "epoch": 0.08, "learning_rate": 4.927735678702853e-05, "loss": 0.1931, "step": 5730 }, { "epoch": 0.08, "learning_rate": 4.927610032637725e-05, "loss": 0.7402, "step": 5735 }, { "epoch": 0.08, "learning_rate": 4.9274842790416174e-05, "loss": 0.6257, "step": 5740 }, { "epoch": 0.08, "learning_rate": 4.9273584179201e-05, "loss": 1.0822, "step": 5745 }, { "epoch": 0.08, "learning_rate": 4.9272324492787484e-05, "loss": 1.1728, "step": 5750 }, { "epoch": 0.08, "learning_rate": 4.927106373123142e-05, "loss": 0.3904, "step": 5755 }, { "epoch": 0.08, "learning_rate": 4.9269801894588673e-05, "loss": 0.6569, "step": 5760 }, { "epoch": 0.08, "learning_rate": 4.926853898291511e-05, "loss": 0.6806, "step": 5765 }, { "epoch": 0.08, "learning_rate": 4.9267274996266685e-05, "loss": 1.0489, "step": 5770 }, { "epoch": 0.08, "learning_rate": 4.9266009934699384e-05, "loss": 0.5691, "step": 5775 }, { "epoch": 0.08, "learning_rate": 4.9264743798269234e-05, "loss": 0.7168, "step": 5780 }, { "epoch": 0.08, "learning_rate": 4.926347658703233e-05, "loss": 0.5124, "step": 5785 }, { "epoch": 0.08, "learning_rate": 4.92622083010448e-05, "loss": 0.9391, "step": 5790 }, { "epoch": 0.08, "learning_rate": 4.9260938940362824e-05, "loss": 0.6711, "step": 5795 }, { "epoch": 0.08, "learning_rate": 4.925966850504263e-05, "loss": 1.6487, "step": 5800 }, { "epoch": 0.08, "learning_rate": 4.9258396995140485e-05, "loss": 0.7966, "step": 5805 }, { "epoch": 0.08, "learning_rate": 4.925712441071271e-05, "loss": 0.3572, "step": 5810 }, { "epoch": 0.08, "learning_rate": 4.925585075181568e-05, "loss": 0.9409, "step": 5815 }, { "epoch": 0.08, "learning_rate": 4.9254576018505815e-05, "loss": 0.3735, "step": 5820 }, { "epoch": 0.08, "learning_rate": 4.925330021083957e-05, "loss": 0.5839, "step": 5825 }, { "epoch": 0.08, "learning_rate": 4.9252023328873456e-05, "loss": 0.1645, "step": 5830 }, { "epoch": 0.08, "learning_rate": 4.925074537266404e-05, "loss": 1.1899, "step": 5835 }, { "epoch": 0.08, "learning_rate": 4.924946634226794e-05, "loss": 0.3501, "step": 5840 }, { "epoch": 0.08, "learning_rate": 4.924818623774178e-05, "loss": 0.5667, "step": 5845 }, { "epoch": 0.08, "learning_rate": 4.924690505914229e-05, "loss": 0.8983, "step": 5850 }, { "epoch": 0.08, "learning_rate": 4.92456228065262e-05, "loss": 0.4867, "step": 5855 }, { "epoch": 0.08, "learning_rate": 4.924433947995033e-05, "loss": 1.2927, "step": 5860 }, { "epoch": 0.08, "learning_rate": 4.9243055079471504e-05, "loss": 0.7365, "step": 5865 }, { "epoch": 0.08, "learning_rate": 4.924176960514662e-05, "loss": 0.8537, "step": 5870 }, { "epoch": 0.08, "learning_rate": 4.924048305703263e-05, "loss": 0.9171, "step": 5875 }, { "epoch": 0.08, "learning_rate": 4.9239195435186495e-05, "loss": 1.2398, "step": 5880 }, { "epoch": 0.08, "learning_rate": 4.923790673966528e-05, "loss": 0.5193, "step": 5885 }, { "epoch": 0.08, "learning_rate": 4.923661697052605e-05, "loss": 1.034, "step": 5890 }, { "epoch": 0.08, "learning_rate": 4.923532612782594e-05, "loss": 0.8478, "step": 5895 }, { "epoch": 0.08, "learning_rate": 4.923403421162213e-05, "loss": 1.065, "step": 5900 }, { "epoch": 0.08, "learning_rate": 4.923274122197185e-05, "loss": 0.8, "step": 5905 }, { "epoch": 0.08, "learning_rate": 4.9231447158932356e-05, "loss": 0.9991, "step": 5910 }, { "epoch": 0.08, "learning_rate": 4.9230152022560984e-05, "loss": 0.2925, "step": 5915 }, { "epoch": 0.08, "learning_rate": 4.92288558129151e-05, "loss": 0.3514, "step": 5920 }, { "epoch": 0.08, "learning_rate": 4.922755853005211e-05, "loss": 0.8416, "step": 5925 }, { "epoch": 0.08, "learning_rate": 4.922626017402948e-05, "loss": 0.8616, "step": 5930 }, { "epoch": 0.08, "learning_rate": 4.9224960744904736e-05, "loss": 0.9168, "step": 5935 }, { "epoch": 0.08, "learning_rate": 4.9223660242735416e-05, "loss": 0.6734, "step": 5940 }, { "epoch": 0.08, "learning_rate": 4.922235866757914e-05, "loss": 0.2439, "step": 5945 }, { "epoch": 0.08, "learning_rate": 4.922105601949355e-05, "loss": 0.9016, "step": 5950 }, { "epoch": 0.08, "learning_rate": 4.921975229853636e-05, "loss": 0.6212, "step": 5955 }, { "epoch": 0.08, "learning_rate": 4.921844750476531e-05, "loss": 1.0316, "step": 5960 }, { "epoch": 0.08, "learning_rate": 4.9217141638238186e-05, "loss": 0.5187, "step": 5965 }, { "epoch": 0.08, "learning_rate": 4.921583469901285e-05, "loss": 1.097, "step": 5970 }, { "epoch": 0.08, "learning_rate": 4.921452668714719e-05, "loss": 1.2541, "step": 5975 }, { "epoch": 0.08, "learning_rate": 4.921321760269913e-05, "loss": 0.745, "step": 5980 }, { "epoch": 0.08, "learning_rate": 4.921190744572667e-05, "loss": 0.4876, "step": 5985 }, { "epoch": 0.08, "learning_rate": 4.921059621628783e-05, "loss": 0.3747, "step": 5990 }, { "epoch": 0.08, "learning_rate": 4.9209283914440714e-05, "loss": 1.3669, "step": 5995 }, { "epoch": 0.08, "learning_rate": 4.9207970540243426e-05, "loss": 1.1131, "step": 6000 }, { "epoch": 0.08, "learning_rate": 4.920665609375416e-05, "loss": 1.4159, "step": 6005 }, { "epoch": 0.08, "learning_rate": 4.920534057503112e-05, "loss": 0.7648, "step": 6010 }, { "epoch": 0.08, "learning_rate": 4.920402398413259e-05, "loss": 1.0631, "step": 6015 }, { "epoch": 0.08, "learning_rate": 4.920270632111689e-05, "loss": 1.6565, "step": 6020 }, { "epoch": 0.08, "learning_rate": 4.920138758604238e-05, "loss": 1.0828, "step": 6025 }, { "epoch": 0.08, "learning_rate": 4.920006777896749e-05, "loss": 0.7259, "step": 6030 }, { "epoch": 0.08, "learning_rate": 4.9198746899950646e-05, "loss": 0.6315, "step": 6035 }, { "epoch": 0.08, "learning_rate": 4.9197424949050385e-05, "loss": 0.5332, "step": 6040 }, { "epoch": 0.08, "learning_rate": 4.919610192632526e-05, "loss": 0.937, "step": 6045 }, { "epoch": 0.08, "learning_rate": 4.919477783183386e-05, "loss": 0.5215, "step": 6050 }, { "epoch": 0.08, "learning_rate": 4.919345266563484e-05, "loss": 0.9191, "step": 6055 }, { "epoch": 0.08, "learning_rate": 4.919212642778692e-05, "loss": 1.0527, "step": 6060 }, { "epoch": 0.08, "learning_rate": 4.919079911834882e-05, "loss": 0.7205, "step": 6065 }, { "epoch": 0.08, "learning_rate": 4.918947073737934e-05, "loss": 0.5126, "step": 6070 }, { "epoch": 0.08, "learning_rate": 4.918814128493732e-05, "loss": 1.0779, "step": 6075 }, { "epoch": 0.08, "learning_rate": 4.918681076108166e-05, "loss": 0.5877, "step": 6080 }, { "epoch": 0.08, "learning_rate": 4.918547916587128e-05, "loss": 0.812, "step": 6085 }, { "epoch": 0.08, "learning_rate": 4.918414649936517e-05, "loss": 1.0673, "step": 6090 }, { "epoch": 0.08, "learning_rate": 4.918281276162235e-05, "loss": 0.5139, "step": 6095 }, { "epoch": 0.08, "learning_rate": 4.918147795270193e-05, "loss": 0.4643, "step": 6100 }, { "epoch": 0.08, "learning_rate": 4.9180142072662994e-05, "loss": 0.6529, "step": 6105 }, { "epoch": 0.08, "learning_rate": 4.917880512156474e-05, "loss": 0.3821, "step": 6110 }, { "epoch": 0.08, "learning_rate": 4.917746709946638e-05, "loss": 1.2349, "step": 6115 }, { "epoch": 0.08, "learning_rate": 4.9176128006427186e-05, "loss": 0.3874, "step": 6120 }, { "epoch": 0.08, "learning_rate": 4.917478784250647e-05, "loss": 0.7871, "step": 6125 }, { "epoch": 0.08, "learning_rate": 4.9173446607763594e-05, "loss": 1.05, "step": 6130 }, { "epoch": 0.08, "learning_rate": 4.917210430225797e-05, "loss": 0.5467, "step": 6135 }, { "epoch": 0.08, "learning_rate": 4.917076092604905e-05, "loss": 0.8975, "step": 6140 }, { "epoch": 0.08, "learning_rate": 4.916941647919635e-05, "loss": 1.5522, "step": 6145 }, { "epoch": 0.08, "learning_rate": 4.916807096175942e-05, "loss": 0.56, "step": 6150 }, { "epoch": 0.08, "learning_rate": 4.9166724373797846e-05, "loss": 0.769, "step": 6155 }, { "epoch": 0.08, "learning_rate": 4.916537671537129e-05, "loss": 1.176, "step": 6160 }, { "epoch": 0.08, "learning_rate": 4.916402798653944e-05, "loss": 0.3801, "step": 6165 }, { "epoch": 0.08, "learning_rate": 4.916267818736203e-05, "loss": 0.6563, "step": 6170 }, { "epoch": 0.08, "learning_rate": 4.916132731789887e-05, "loss": 0.466, "step": 6175 }, { "epoch": 0.08, "learning_rate": 4.915997537820978e-05, "loss": 0.4605, "step": 6180 }, { "epoch": 0.08, "learning_rate": 4.915862236835466e-05, "loss": 0.8179, "step": 6185 }, { "epoch": 0.08, "learning_rate": 4.915726828839342e-05, "loss": 1.0004, "step": 6190 }, { "epoch": 0.08, "learning_rate": 4.9155913138386044e-05, "loss": 0.6179, "step": 6195 }, { "epoch": 0.08, "learning_rate": 4.915455691839258e-05, "loss": 0.668, "step": 6200 }, { "epoch": 0.08, "learning_rate": 4.915319962847307e-05, "loss": 0.4948, "step": 6205 }, { "epoch": 0.08, "learning_rate": 4.915184126868766e-05, "loss": 0.6054, "step": 6210 }, { "epoch": 0.08, "learning_rate": 4.9150481839096504e-05, "loss": 0.7317, "step": 6215 }, { "epoch": 0.08, "learning_rate": 4.914912133975983e-05, "loss": 1.0232, "step": 6220 }, { "epoch": 0.08, "learning_rate": 4.91477597707379e-05, "loss": 0.7809, "step": 6225 }, { "epoch": 0.08, "learning_rate": 4.914639713209101e-05, "loss": 0.3897, "step": 6230 }, { "epoch": 0.08, "learning_rate": 4.914503342387953e-05, "loss": 1.039, "step": 6235 }, { "epoch": 0.08, "learning_rate": 4.914366864616386e-05, "loss": 1.1445, "step": 6240 }, { "epoch": 0.08, "learning_rate": 4.9142302799004455e-05, "loss": 0.7065, "step": 6245 }, { "epoch": 0.08, "learning_rate": 4.9140935882461826e-05, "loss": 0.7869, "step": 6250 }, { "epoch": 0.08, "learning_rate": 4.913956789659651e-05, "loss": 0.3144, "step": 6255 }, { "epoch": 0.08, "learning_rate": 4.91381988414691e-05, "loss": 1.1093, "step": 6260 }, { "epoch": 0.08, "learning_rate": 4.913682871714023e-05, "loss": 0.9388, "step": 6265 }, { "epoch": 0.08, "learning_rate": 4.913545752367061e-05, "loss": 1.1091, "step": 6270 }, { "epoch": 0.08, "learning_rate": 4.9134085261120966e-05, "loss": 0.9619, "step": 6275 }, { "epoch": 0.08, "learning_rate": 4.913271192955209e-05, "loss": 0.5497, "step": 6280 }, { "epoch": 0.08, "learning_rate": 4.9131337529024805e-05, "loss": 0.6709, "step": 6285 }, { "epoch": 0.08, "learning_rate": 4.912996205959999e-05, "loss": 0.5715, "step": 6290 }, { "epoch": 0.08, "learning_rate": 4.912858552133857e-05, "loss": 0.6043, "step": 6295 }, { "epoch": 0.08, "learning_rate": 4.912720791430153e-05, "loss": 0.5407, "step": 6300 }, { "epoch": 0.08, "learning_rate": 4.912582923854988e-05, "loss": 0.4415, "step": 6305 }, { "epoch": 0.08, "learning_rate": 4.912444949414469e-05, "loss": 0.7032, "step": 6310 }, { "epoch": 0.08, "learning_rate": 4.912306868114709e-05, "loss": 0.6514, "step": 6315 }, { "epoch": 0.08, "learning_rate": 4.9121686799618214e-05, "loss": 0.8998, "step": 6320 }, { "epoch": 0.08, "learning_rate": 4.9120303849619304e-05, "loss": 0.4265, "step": 6325 }, { "epoch": 0.08, "learning_rate": 4.91189198312116e-05, "loss": 1.47, "step": 6330 }, { "epoch": 0.08, "learning_rate": 4.911753474445641e-05, "loss": 1.1257, "step": 6335 }, { "epoch": 0.08, "learning_rate": 4.9116148589415086e-05, "loss": 0.7904, "step": 6340 }, { "epoch": 0.09, "learning_rate": 4.911476136614903e-05, "loss": 0.289, "step": 6345 }, { "epoch": 0.09, "learning_rate": 4.911337307471968e-05, "loss": 0.2885, "step": 6350 }, { "epoch": 0.09, "learning_rate": 4.911198371518855e-05, "loss": 0.7973, "step": 6355 }, { "epoch": 0.09, "learning_rate": 4.911059328761717e-05, "loss": 0.9484, "step": 6360 }, { "epoch": 0.09, "learning_rate": 4.910920179206712e-05, "loss": 1.0592, "step": 6365 }, { "epoch": 0.09, "learning_rate": 4.9107809228600046e-05, "loss": 0.524, "step": 6370 }, { "epoch": 0.09, "learning_rate": 4.9106415597277635e-05, "loss": 0.3374, "step": 6375 }, { "epoch": 0.09, "learning_rate": 4.910502089816161e-05, "loss": 1.0328, "step": 6380 }, { "epoch": 0.09, "learning_rate": 4.910362513131376e-05, "loss": 1.0723, "step": 6385 }, { "epoch": 0.09, "learning_rate": 4.91022282967959e-05, "loss": 0.9935, "step": 6390 }, { "epoch": 0.09, "learning_rate": 4.9100830394669904e-05, "loss": 0.7047, "step": 6395 }, { "epoch": 0.09, "learning_rate": 4.9099431424997695e-05, "loss": 2.1917, "step": 6400 }, { "epoch": 0.09, "learning_rate": 4.9098031387841236e-05, "loss": 0.551, "step": 6405 }, { "epoch": 0.09, "learning_rate": 4.909663028326255e-05, "loss": 0.8098, "step": 6410 }, { "epoch": 0.09, "learning_rate": 4.90952281113237e-05, "loss": 1.122, "step": 6415 }, { "epoch": 0.09, "learning_rate": 4.909382487208678e-05, "loss": 0.4967, "step": 6420 }, { "epoch": 0.09, "learning_rate": 4.9092420565613954e-05, "loss": 0.5201, "step": 6425 }, { "epoch": 0.09, "learning_rate": 4.909101519196743e-05, "loss": 0.8304, "step": 6430 }, { "epoch": 0.09, "learning_rate": 4.908960875120946e-05, "loss": 0.2138, "step": 6435 }, { "epoch": 0.09, "learning_rate": 4.9088201243402335e-05, "loss": 0.3229, "step": 6440 }, { "epoch": 0.09, "learning_rate": 4.908679266860841e-05, "loss": 0.6076, "step": 6445 }, { "epoch": 0.09, "learning_rate": 4.908538302689007e-05, "loss": 0.3777, "step": 6450 }, { "epoch": 0.09, "learning_rate": 4.9083972318309753e-05, "loss": 1.2985, "step": 6455 }, { "epoch": 0.09, "learning_rate": 4.908256054292996e-05, "loss": 0.7037, "step": 6460 }, { "epoch": 0.09, "learning_rate": 4.90811477008132e-05, "loss": 0.9845, "step": 6465 }, { "epoch": 0.09, "learning_rate": 4.907973379202209e-05, "loss": 1.1756, "step": 6470 }, { "epoch": 0.09, "learning_rate": 4.907831881661923e-05, "loss": 0.9815, "step": 6475 }, { "epoch": 0.09, "learning_rate": 4.90769027746673e-05, "loss": 1.2536, "step": 6480 }, { "epoch": 0.09, "learning_rate": 4.9075485666229035e-05, "loss": 0.6892, "step": 6485 }, { "epoch": 0.09, "learning_rate": 4.90740674913672e-05, "loss": 0.5818, "step": 6490 }, { "epoch": 0.09, "learning_rate": 4.9072648250144624e-05, "loss": 0.6855, "step": 6495 }, { "epoch": 0.09, "learning_rate": 4.907122794262415e-05, "loss": 1.3387, "step": 6500 }, { "epoch": 0.09, "learning_rate": 4.9069806568868715e-05, "loss": 0.7801, "step": 6505 }, { "epoch": 0.09, "learning_rate": 4.906838412894126e-05, "loss": 0.1881, "step": 6510 }, { "epoch": 0.09, "learning_rate": 4.90669606229048e-05, "loss": 0.8438, "step": 6515 }, { "epoch": 0.09, "learning_rate": 4.906553605082238e-05, "loss": 0.961, "step": 6520 }, { "epoch": 0.09, "learning_rate": 4.906411041275711e-05, "loss": 0.7045, "step": 6525 }, { "epoch": 0.09, "learning_rate": 4.906268370877215e-05, "loss": 0.9502, "step": 6530 }, { "epoch": 0.09, "learning_rate": 4.906125593893067e-05, "loss": 0.6143, "step": 6535 }, { "epoch": 0.09, "learning_rate": 4.905982710329594e-05, "loss": 0.5577, "step": 6540 }, { "epoch": 0.09, "learning_rate": 4.905839720193123e-05, "loss": 0.5937, "step": 6545 }, { "epoch": 0.09, "learning_rate": 4.9056966234899883e-05, "loss": 1.3914, "step": 6550 }, { "epoch": 0.09, "learning_rate": 4.9055534202265286e-05, "loss": 0.7212, "step": 6555 }, { "epoch": 0.09, "learning_rate": 4.905410110409087e-05, "loss": 0.998, "step": 6560 }, { "epoch": 0.09, "learning_rate": 4.905266694044011e-05, "loss": 0.9038, "step": 6565 }, { "epoch": 0.09, "learning_rate": 4.905123171137654e-05, "loss": 0.3152, "step": 6570 }, { "epoch": 0.09, "learning_rate": 4.904979541696373e-05, "loss": 0.9448, "step": 6575 }, { "epoch": 0.09, "learning_rate": 4.90483580572653e-05, "loss": 0.9352, "step": 6580 }, { "epoch": 0.09, "learning_rate": 4.904691963234491e-05, "loss": 1.0754, "step": 6585 }, { "epoch": 0.09, "learning_rate": 4.90454801422663e-05, "loss": 0.7662, "step": 6590 }, { "epoch": 0.09, "learning_rate": 4.9044039587093206e-05, "loss": 0.9574, "step": 6595 }, { "epoch": 0.09, "learning_rate": 4.9042597966889446e-05, "loss": 0.8656, "step": 6600 }, { "epoch": 0.09, "learning_rate": 4.904115528171887e-05, "loss": 0.5652, "step": 6605 }, { "epoch": 0.09, "learning_rate": 4.903971153164541e-05, "loss": 0.6213, "step": 6610 }, { "epoch": 0.09, "learning_rate": 4.903826671673298e-05, "loss": 0.7779, "step": 6615 }, { "epoch": 0.09, "learning_rate": 4.9036820837045595e-05, "loss": 0.7958, "step": 6620 }, { "epoch": 0.09, "learning_rate": 4.9035373892647306e-05, "loss": 1.2004, "step": 6625 }, { "epoch": 0.09, "learning_rate": 4.903392588360219e-05, "loss": 1.099, "step": 6630 }, { "epoch": 0.09, "learning_rate": 4.9032476809974405e-05, "loss": 0.6193, "step": 6635 }, { "epoch": 0.09, "learning_rate": 4.903102667182812e-05, "loss": 1.1691, "step": 6640 }, { "epoch": 0.09, "learning_rate": 4.902957546922758e-05, "loss": 1.3608, "step": 6645 }, { "epoch": 0.09, "learning_rate": 4.902812320223707e-05, "loss": 1.093, "step": 6650 }, { "epoch": 0.09, "learning_rate": 4.902666987092091e-05, "loss": 0.7023, "step": 6655 }, { "epoch": 0.09, "learning_rate": 4.9025215475343466e-05, "loss": 0.4569, "step": 6660 }, { "epoch": 0.09, "learning_rate": 4.902376001556918e-05, "loss": 0.5557, "step": 6665 }, { "epoch": 0.09, "learning_rate": 4.9022303491662505e-05, "loss": 0.8535, "step": 6670 }, { "epoch": 0.09, "learning_rate": 4.902084590368796e-05, "loss": 1.0275, "step": 6675 }, { "epoch": 0.09, "learning_rate": 4.901938725171012e-05, "loss": 1.0458, "step": 6680 }, { "epoch": 0.09, "learning_rate": 4.9017927535793595e-05, "loss": 1.0597, "step": 6685 }, { "epoch": 0.09, "learning_rate": 4.9016466756003036e-05, "loss": 0.8567, "step": 6690 }, { "epoch": 0.09, "learning_rate": 4.901500491240315e-05, "loss": 0.9145, "step": 6695 }, { "epoch": 0.09, "learning_rate": 4.9013542005058687e-05, "loss": 0.5113, "step": 6700 }, { "epoch": 0.09, "learning_rate": 4.901207803403446e-05, "loss": 0.5969, "step": 6705 }, { "epoch": 0.09, "learning_rate": 4.901061299939529e-05, "loss": 1.0862, "step": 6710 }, { "epoch": 0.09, "learning_rate": 4.9009146901206095e-05, "loss": 0.5365, "step": 6715 }, { "epoch": 0.09, "learning_rate": 4.90076797395318e-05, "loss": 0.4696, "step": 6720 }, { "epoch": 0.09, "learning_rate": 4.9006211514437405e-05, "loss": 1.1453, "step": 6725 }, { "epoch": 0.09, "learning_rate": 4.900474222598793e-05, "loss": 0.7627, "step": 6730 }, { "epoch": 0.09, "learning_rate": 4.900327187424848e-05, "loss": 0.9849, "step": 6735 }, { "epoch": 0.09, "learning_rate": 4.9001800459284157e-05, "loss": 0.2499, "step": 6740 }, { "epoch": 0.09, "learning_rate": 4.900032798116016e-05, "loss": 0.6465, "step": 6745 }, { "epoch": 0.09, "learning_rate": 4.89988544399417e-05, "loss": 0.9543, "step": 6750 }, { "epoch": 0.09, "learning_rate": 4.899737983569405e-05, "loss": 0.8135, "step": 6755 }, { "epoch": 0.09, "learning_rate": 4.899590416848253e-05, "loss": 0.4647, "step": 6760 }, { "epoch": 0.09, "learning_rate": 4.8994427438372503e-05, "loss": 0.3564, "step": 6765 }, { "epoch": 0.09, "learning_rate": 4.899294964542938e-05, "loss": 0.6206, "step": 6770 }, { "epoch": 0.09, "learning_rate": 4.899147078971862e-05, "loss": 0.5936, "step": 6775 }, { "epoch": 0.09, "learning_rate": 4.8989990871305736e-05, "loss": 0.8982, "step": 6780 }, { "epoch": 0.09, "learning_rate": 4.8988509890256264e-05, "loss": 0.9293, "step": 6785 }, { "epoch": 0.09, "learning_rate": 4.898702784663582e-05, "loss": 0.4235, "step": 6790 }, { "epoch": 0.09, "learning_rate": 4.898554474051005e-05, "loss": 0.1645, "step": 6795 }, { "epoch": 0.09, "learning_rate": 4.898406057194463e-05, "loss": 0.9189, "step": 6800 }, { "epoch": 0.09, "learning_rate": 4.898257534100533e-05, "loss": 0.7283, "step": 6805 }, { "epoch": 0.09, "learning_rate": 4.8981089047757914e-05, "loss": 0.9502, "step": 6810 }, { "epoch": 0.09, "learning_rate": 4.8979601692268234e-05, "loss": 0.9239, "step": 6815 }, { "epoch": 0.09, "learning_rate": 4.897811327460216e-05, "loss": 1.0526, "step": 6820 }, { "epoch": 0.09, "learning_rate": 4.8976623794825635e-05, "loss": 1.0882, "step": 6825 }, { "epoch": 0.09, "learning_rate": 4.8975133253004616e-05, "loss": 0.4821, "step": 6830 }, { "epoch": 0.09, "learning_rate": 4.897364164920514e-05, "loss": 0.9757, "step": 6835 }, { "epoch": 0.09, "learning_rate": 4.8972148983493285e-05, "loss": 1.0293, "step": 6840 }, { "epoch": 0.09, "learning_rate": 4.897065525593515e-05, "loss": 0.8841, "step": 6845 }, { "epoch": 0.09, "learning_rate": 4.896916046659691e-05, "loss": 0.8063, "step": 6850 }, { "epoch": 0.09, "learning_rate": 4.8967664615544776e-05, "loss": 0.6729, "step": 6855 }, { "epoch": 0.09, "learning_rate": 4.8966167702845e-05, "loss": 0.8555, "step": 6860 }, { "epoch": 0.09, "learning_rate": 4.896466972856391e-05, "loss": 0.8237, "step": 6865 }, { "epoch": 0.09, "learning_rate": 4.896317069276782e-05, "loss": 0.6233, "step": 6870 }, { "epoch": 0.09, "learning_rate": 4.896167059552317e-05, "loss": 0.176, "step": 6875 }, { "epoch": 0.09, "learning_rate": 4.896016943689638e-05, "loss": 0.5396, "step": 6880 }, { "epoch": 0.09, "learning_rate": 4.8958667216953956e-05, "loss": 1.341, "step": 6885 }, { "epoch": 0.09, "learning_rate": 4.895716393576244e-05, "loss": 0.8875, "step": 6890 }, { "epoch": 0.09, "learning_rate": 4.895565959338841e-05, "loss": 0.5139, "step": 6895 }, { "epoch": 0.09, "learning_rate": 4.8954154189898506e-05, "loss": 0.3881, "step": 6900 }, { "epoch": 0.09, "learning_rate": 4.8952647725359414e-05, "loss": 1.0058, "step": 6905 }, { "epoch": 0.09, "learning_rate": 4.895114019983785e-05, "loss": 0.7627, "step": 6910 }, { "epoch": 0.09, "learning_rate": 4.8949631613400614e-05, "loss": 0.8786, "step": 6915 }, { "epoch": 0.09, "learning_rate": 4.89481219661145e-05, "loss": 0.3067, "step": 6920 }, { "epoch": 0.09, "learning_rate": 4.8946611258046405e-05, "loss": 1.4111, "step": 6925 }, { "epoch": 0.09, "learning_rate": 4.894509948926322e-05, "loss": 0.8964, "step": 6930 }, { "epoch": 0.09, "learning_rate": 4.894358665983193e-05, "loss": 0.502, "step": 6935 }, { "epoch": 0.09, "learning_rate": 4.894207276981953e-05, "loss": 0.2979, "step": 6940 }, { "epoch": 0.09, "learning_rate": 4.8940557819293085e-05, "loss": 0.392, "step": 6945 }, { "epoch": 0.09, "learning_rate": 4.8939041808319705e-05, "loss": 0.5543, "step": 6950 }, { "epoch": 0.09, "learning_rate": 4.8937524736966534e-05, "loss": 0.4294, "step": 6955 }, { "epoch": 0.09, "learning_rate": 4.893600660530077e-05, "loss": 0.4191, "step": 6960 }, { "epoch": 0.09, "learning_rate": 4.893448741338966e-05, "loss": 0.563, "step": 6965 }, { "epoch": 0.09, "learning_rate": 4.89329671613005e-05, "loss": 0.8604, "step": 6970 }, { "epoch": 0.09, "learning_rate": 4.893144584910063e-05, "loss": 0.3763, "step": 6975 }, { "epoch": 0.09, "learning_rate": 4.892992347685744e-05, "loss": 0.4038, "step": 6980 }, { "epoch": 0.09, "learning_rate": 4.892840004463835e-05, "loss": 1.1034, "step": 6985 }, { "epoch": 0.09, "learning_rate": 4.892687555251085e-05, "loss": 0.8447, "step": 6990 }, { "epoch": 0.09, "learning_rate": 4.892535000054246e-05, "loss": 0.6206, "step": 6995 }, { "epoch": 0.09, "learning_rate": 4.892382338880077e-05, "loss": 1.0937, "step": 7000 }, { "epoch": 0.09, "learning_rate": 4.8922295717353386e-05, "loss": 0.492, "step": 7005 }, { "epoch": 0.09, "learning_rate": 4.8920766986267974e-05, "loss": 1.1292, "step": 7010 }, { "epoch": 0.09, "learning_rate": 4.891923719561227e-05, "loss": 1.2954, "step": 7015 }, { "epoch": 0.09, "learning_rate": 4.891770634545401e-05, "loss": 1.02, "step": 7020 }, { "epoch": 0.09, "learning_rate": 4.891617443586102e-05, "loss": 0.6541, "step": 7025 }, { "epoch": 0.09, "learning_rate": 4.8914641466901155e-05, "loss": 1.1827, "step": 7030 }, { "epoch": 0.09, "learning_rate": 4.891310743864232e-05, "loss": 0.4747, "step": 7035 }, { "epoch": 0.09, "learning_rate": 4.891157235115244e-05, "loss": 0.8445, "step": 7040 }, { "epoch": 0.09, "learning_rate": 4.891003620449954e-05, "loss": 0.2168, "step": 7045 }, { "epoch": 0.09, "learning_rate": 4.8908498998751655e-05, "loss": 1.1441, "step": 7050 }, { "epoch": 0.09, "learning_rate": 4.890696073397687e-05, "loss": 0.3412, "step": 7055 }, { "epoch": 0.09, "learning_rate": 4.890542141024334e-05, "loss": 0.7782, "step": 7060 }, { "epoch": 0.09, "learning_rate": 4.890388102761922e-05, "loss": 0.8981, "step": 7065 }, { "epoch": 0.09, "learning_rate": 4.8902339586172774e-05, "loss": 1.1688, "step": 7070 }, { "epoch": 0.09, "learning_rate": 4.8900797085972255e-05, "loss": 1.4676, "step": 7075 }, { "epoch": 0.09, "learning_rate": 4.8899253527086e-05, "loss": 0.5691, "step": 7080 }, { "epoch": 0.09, "learning_rate": 4.889770890958237e-05, "loss": 1.4128, "step": 7085 }, { "epoch": 0.09, "learning_rate": 4.88961632335298e-05, "loss": 1.0709, "step": 7090 }, { "epoch": 0.1, "learning_rate": 4.8894616498996747e-05, "loss": 0.7907, "step": 7095 }, { "epoch": 0.1, "learning_rate": 4.889306870605173e-05, "loss": 0.755, "step": 7100 }, { "epoch": 0.1, "learning_rate": 4.889151985476329e-05, "loss": 0.8179, "step": 7105 }, { "epoch": 0.1, "learning_rate": 4.888996994520005e-05, "loss": 0.729, "step": 7110 }, { "epoch": 0.1, "learning_rate": 4.888841897743066e-05, "loss": 0.4536, "step": 7115 }, { "epoch": 0.1, "learning_rate": 4.888686695152383e-05, "loss": 1.2975, "step": 7120 }, { "epoch": 0.1, "learning_rate": 4.8885313867548275e-05, "loss": 0.5321, "step": 7125 }, { "epoch": 0.1, "learning_rate": 4.888407063860461e-05, "loss": 0.6051, "step": 7130 }, { "epoch": 0.1, "learning_rate": 4.888251565027879e-05, "loss": 0.7746, "step": 7135 }, { "epoch": 0.1, "learning_rate": 4.8880959604077006e-05, "loss": 0.8193, "step": 7140 }, { "epoch": 0.1, "learning_rate": 4.887940250006819e-05, "loss": 0.6303, "step": 7145 }, { "epoch": 0.1, "learning_rate": 4.88778443383213e-05, "loss": 0.9084, "step": 7150 }, { "epoch": 0.1, "learning_rate": 4.887628511890537e-05, "loss": 0.5742, "step": 7155 }, { "epoch": 0.1, "learning_rate": 4.887472484188946e-05, "loss": 0.4738, "step": 7160 }, { "epoch": 0.1, "learning_rate": 4.887316350734268e-05, "loss": 1.1326, "step": 7165 }, { "epoch": 0.1, "learning_rate": 4.887160111533418e-05, "loss": 0.4216, "step": 7170 }, { "epoch": 0.1, "learning_rate": 4.887003766593319e-05, "loss": 0.7859, "step": 7175 }, { "epoch": 0.1, "learning_rate": 4.886847315920894e-05, "loss": 1.0532, "step": 7180 }, { "epoch": 0.1, "learning_rate": 4.8866907595230744e-05, "loss": 0.5639, "step": 7185 }, { "epoch": 0.1, "learning_rate": 4.8865340974067944e-05, "loss": 1.0241, "step": 7190 }, { "epoch": 0.1, "learning_rate": 4.886377329578993e-05, "loss": 0.3737, "step": 7195 }, { "epoch": 0.1, "learning_rate": 4.886220456046615e-05, "loss": 0.6213, "step": 7200 }, { "epoch": 0.1, "learning_rate": 4.886063476816608e-05, "loss": 1.0708, "step": 7205 }, { "epoch": 0.1, "learning_rate": 4.885906391895927e-05, "loss": 0.9963, "step": 7210 }, { "epoch": 0.1, "learning_rate": 4.885749201291528e-05, "loss": 0.9707, "step": 7215 }, { "epoch": 0.1, "learning_rate": 4.885591905010376e-05, "loss": 0.8626, "step": 7220 }, { "epoch": 0.1, "learning_rate": 4.885434503059437e-05, "loss": 0.8117, "step": 7225 }, { "epoch": 0.1, "learning_rate": 4.885276995445683e-05, "loss": 0.9073, "step": 7230 }, { "epoch": 0.1, "learning_rate": 4.885119382176092e-05, "loss": 1.0541, "step": 7235 }, { "epoch": 0.1, "learning_rate": 4.884961663257645e-05, "loss": 0.5725, "step": 7240 }, { "epoch": 0.1, "learning_rate": 4.884803838697327e-05, "loss": 0.4595, "step": 7245 }, { "epoch": 0.1, "learning_rate": 4.88464590850213e-05, "loss": 1.0779, "step": 7250 }, { "epoch": 0.1, "learning_rate": 4.88448787267905e-05, "loss": 0.3651, "step": 7255 }, { "epoch": 0.1, "learning_rate": 4.884329731235085e-05, "loss": 0.6814, "step": 7260 }, { "epoch": 0.1, "learning_rate": 4.884171484177242e-05, "loss": 0.7214, "step": 7265 }, { "epoch": 0.1, "learning_rate": 4.8840131315125304e-05, "loss": 1.6515, "step": 7270 }, { "epoch": 0.1, "learning_rate": 4.883854673247964e-05, "loss": 0.7906, "step": 7275 }, { "epoch": 0.1, "learning_rate": 4.883696109390561e-05, "loss": 1.3654, "step": 7280 }, { "epoch": 0.1, "learning_rate": 4.8835374399473456e-05, "loss": 0.862, "step": 7285 }, { "epoch": 0.1, "learning_rate": 4.8833786649253466e-05, "loss": 0.1899, "step": 7290 }, { "epoch": 0.1, "learning_rate": 4.8832197843315965e-05, "loss": 1.6223, "step": 7295 }, { "epoch": 0.1, "learning_rate": 4.883060798173132e-05, "loss": 0.1249, "step": 7300 }, { "epoch": 0.1, "learning_rate": 4.882901706456997e-05, "loss": 0.747, "step": 7305 }, { "epoch": 0.1, "learning_rate": 4.882742509190237e-05, "loss": 0.7647, "step": 7310 }, { "epoch": 0.1, "learning_rate": 4.882583206379905e-05, "loss": 0.4934, "step": 7315 }, { "epoch": 0.1, "learning_rate": 4.8824237980330556e-05, "loss": 0.5093, "step": 7320 }, { "epoch": 0.1, "learning_rate": 4.8822642841567515e-05, "loss": 1.1398, "step": 7325 }, { "epoch": 0.1, "learning_rate": 4.882104664758058e-05, "loss": 0.6909, "step": 7330 }, { "epoch": 0.1, "learning_rate": 4.8819449398440446e-05, "loss": 0.9084, "step": 7335 }, { "epoch": 0.1, "learning_rate": 4.881785109421787e-05, "loss": 0.6221, "step": 7340 }, { "epoch": 0.1, "learning_rate": 4.8816251734983656e-05, "loss": 1.2407, "step": 7345 }, { "epoch": 0.1, "learning_rate": 4.881465132080863e-05, "loss": 0.1764, "step": 7350 }, { "epoch": 0.1, "learning_rate": 4.881304985176369e-05, "loss": 0.8759, "step": 7355 }, { "epoch": 0.1, "learning_rate": 4.881144732791978e-05, "loss": 0.8509, "step": 7360 }, { "epoch": 0.1, "learning_rate": 4.8809843749347876e-05, "loss": 0.2417, "step": 7365 }, { "epoch": 0.1, "learning_rate": 4.880823911611901e-05, "loss": 0.6007, "step": 7370 }, { "epoch": 0.1, "learning_rate": 4.880663342830426e-05, "loss": 0.8648, "step": 7375 }, { "epoch": 0.1, "learning_rate": 4.880502668597475e-05, "loss": 0.9826, "step": 7380 }, { "epoch": 0.1, "learning_rate": 4.880341888920166e-05, "loss": 0.7356, "step": 7385 }, { "epoch": 0.1, "learning_rate": 4.8801810038056186e-05, "loss": 0.7851, "step": 7390 }, { "epoch": 0.1, "learning_rate": 4.880020013260961e-05, "loss": 1.1215, "step": 7395 }, { "epoch": 0.1, "learning_rate": 4.879858917293323e-05, "loss": 0.4687, "step": 7400 }, { "epoch": 0.1, "learning_rate": 4.879697715909842e-05, "loss": 0.685, "step": 7405 }, { "epoch": 0.1, "learning_rate": 4.879536409117656e-05, "loss": 0.638, "step": 7410 }, { "epoch": 0.1, "learning_rate": 4.8793749969239135e-05, "loss": 1.0507, "step": 7415 }, { "epoch": 0.1, "learning_rate": 4.8792134793357604e-05, "loss": 0.2795, "step": 7420 }, { "epoch": 0.1, "learning_rate": 4.8790518563603535e-05, "loss": 0.4304, "step": 7425 }, { "epoch": 0.1, "learning_rate": 4.878890128004852e-05, "loss": 1.4203, "step": 7430 }, { "epoch": 0.1, "learning_rate": 4.878728294276419e-05, "loss": 1.3231, "step": 7435 }, { "epoch": 0.1, "learning_rate": 4.878566355182223e-05, "loss": 0.6085, "step": 7440 }, { "epoch": 0.1, "learning_rate": 4.8784043107294365e-05, "loss": 0.4365, "step": 7445 }, { "epoch": 0.1, "learning_rate": 4.878242160925238e-05, "loss": 0.9645, "step": 7450 }, { "epoch": 0.1, "learning_rate": 4.8780799057768104e-05, "loss": 0.5794, "step": 7455 }, { "epoch": 0.1, "learning_rate": 4.877917545291339e-05, "loss": 1.4299, "step": 7460 }, { "epoch": 0.1, "learning_rate": 4.8777550794760174e-05, "loss": 1.6564, "step": 7465 }, { "epoch": 0.1, "learning_rate": 4.877592508338041e-05, "loss": 1.4123, "step": 7470 }, { "epoch": 0.1, "learning_rate": 4.877429831884611e-05, "loss": 0.6599, "step": 7475 }, { "epoch": 0.1, "learning_rate": 4.877267050122934e-05, "loss": 0.4659, "step": 7480 }, { "epoch": 0.1, "learning_rate": 4.87710416306022e-05, "loss": 0.4718, "step": 7485 }, { "epoch": 0.1, "learning_rate": 4.876941170703683e-05, "loss": 1.4195, "step": 7490 }, { "epoch": 0.1, "learning_rate": 4.876778073060544e-05, "loss": 0.1854, "step": 7495 }, { "epoch": 0.1, "learning_rate": 4.8766148701380264e-05, "loss": 0.2831, "step": 7500 }, { "epoch": 0.1, "learning_rate": 4.876451561943361e-05, "loss": 0.8843, "step": 7505 }, { "epoch": 0.1, "learning_rate": 4.87628814848378e-05, "loss": 1.1949, "step": 7510 }, { "epoch": 0.1, "learning_rate": 4.876124629766522e-05, "loss": 0.6792, "step": 7515 }, { "epoch": 0.1, "learning_rate": 4.87596100579883e-05, "loss": 0.3922, "step": 7520 }, { "epoch": 0.1, "learning_rate": 4.875797276587952e-05, "loss": 0.547, "step": 7525 }, { "epoch": 0.1, "learning_rate": 4.8756334421411406e-05, "loss": 1.019, "step": 7530 }, { "epoch": 0.1, "learning_rate": 4.8754695024656535e-05, "loss": 1.2159, "step": 7535 }, { "epoch": 0.1, "learning_rate": 4.875305457568751e-05, "loss": 0.6001, "step": 7540 }, { "epoch": 0.1, "learning_rate": 4.875141307457699e-05, "loss": 0.4924, "step": 7545 }, { "epoch": 0.1, "learning_rate": 4.874977052139771e-05, "loss": 1.333, "step": 7550 }, { "epoch": 0.1, "learning_rate": 4.8748126916222406e-05, "loss": 1.3698, "step": 7555 }, { "epoch": 0.1, "learning_rate": 4.874648225912388e-05, "loss": 1.7691, "step": 7560 }, { "epoch": 0.1, "learning_rate": 4.8744836550175e-05, "loss": 0.3318, "step": 7565 }, { "epoch": 0.1, "learning_rate": 4.8743189789448653e-05, "loss": 1.1436, "step": 7570 }, { "epoch": 0.1, "learning_rate": 4.874154197701778e-05, "loss": 1.0626, "step": 7575 }, { "epoch": 0.1, "learning_rate": 4.873989311295537e-05, "loss": 1.2681, "step": 7580 }, { "epoch": 0.1, "learning_rate": 4.873824319733446e-05, "loss": 0.9659, "step": 7585 }, { "epoch": 0.1, "learning_rate": 4.873659223022814e-05, "loss": 0.5289, "step": 7590 }, { "epoch": 0.1, "learning_rate": 4.873494021170953e-05, "loss": 0.8104, "step": 7595 }, { "epoch": 0.1, "learning_rate": 4.8733287141851816e-05, "loss": 0.5341, "step": 7600 }, { "epoch": 0.1, "learning_rate": 4.873163302072822e-05, "loss": 0.1798, "step": 7605 }, { "epoch": 0.1, "learning_rate": 4.8729977848412e-05, "loss": 1.0615, "step": 7610 }, { "epoch": 0.1, "learning_rate": 4.8728321624976473e-05, "loss": 0.4426, "step": 7615 }, { "epoch": 0.1, "learning_rate": 4.8726664350495014e-05, "loss": 0.9316, "step": 7620 }, { "epoch": 0.1, "learning_rate": 4.8725006025041026e-05, "loss": 0.9473, "step": 7625 }, { "epoch": 0.1, "learning_rate": 4.872334664868796e-05, "loss": 1.0107, "step": 7630 }, { "epoch": 0.1, "learning_rate": 4.872168622150932e-05, "loss": 0.2689, "step": 7635 }, { "epoch": 0.1, "learning_rate": 4.872002474357866e-05, "loss": 0.1721, "step": 7640 }, { "epoch": 0.1, "learning_rate": 4.871836221496957e-05, "loss": 0.7516, "step": 7645 }, { "epoch": 0.1, "learning_rate": 4.87166986357557e-05, "loss": 0.8698, "step": 7650 }, { "epoch": 0.1, "learning_rate": 4.8715034006010725e-05, "loss": 0.6428, "step": 7655 }, { "epoch": 0.1, "learning_rate": 4.871336832580838e-05, "loss": 0.376, "step": 7660 }, { "epoch": 0.1, "learning_rate": 4.8711701595222465e-05, "loss": 0.5898, "step": 7665 }, { "epoch": 0.1, "learning_rate": 4.8710033814326786e-05, "loss": 0.8958, "step": 7670 }, { "epoch": 0.1, "learning_rate": 4.870836498319523e-05, "loss": 0.447, "step": 7675 }, { "epoch": 0.1, "learning_rate": 4.8706695101901715e-05, "loss": 1.3484, "step": 7680 }, { "epoch": 0.1, "learning_rate": 4.870502417052021e-05, "loss": 0.8393, "step": 7685 }, { "epoch": 0.1, "learning_rate": 4.870335218912472e-05, "loss": 0.5213, "step": 7690 }, { "epoch": 0.1, "learning_rate": 4.870167915778931e-05, "loss": 0.5845, "step": 7695 }, { "epoch": 0.1, "learning_rate": 4.870000507658811e-05, "loss": 1.1215, "step": 7700 }, { "epoch": 0.1, "learning_rate": 4.869832994559523e-05, "loss": 0.7863, "step": 7705 }, { "epoch": 0.1, "learning_rate": 4.86966537648849e-05, "loss": 0.3112, "step": 7710 }, { "epoch": 0.1, "learning_rate": 4.869497653453136e-05, "loss": 0.7528, "step": 7715 }, { "epoch": 0.1, "learning_rate": 4.86932982546089e-05, "loss": 0.8334, "step": 7720 }, { "epoch": 0.1, "learning_rate": 4.8691618925191865e-05, "loss": 0.8385, "step": 7725 }, { "epoch": 0.1, "learning_rate": 4.868993854635463e-05, "loss": 0.3347, "step": 7730 }, { "epoch": 0.1, "learning_rate": 4.8688257118171635e-05, "loss": 0.7236, "step": 7735 }, { "epoch": 0.1, "learning_rate": 4.868657464071736e-05, "loss": 1.0137, "step": 7740 }, { "epoch": 0.1, "learning_rate": 4.8684891114066336e-05, "loss": 0.8674, "step": 7745 }, { "epoch": 0.1, "learning_rate": 4.868320653829312e-05, "loss": 1.7813, "step": 7750 }, { "epoch": 0.1, "learning_rate": 4.868152091347234e-05, "loss": 0.6112, "step": 7755 }, { "epoch": 0.1, "learning_rate": 4.867983423967866e-05, "loss": 0.4669, "step": 7760 }, { "epoch": 0.1, "learning_rate": 4.8678146516986786e-05, "loss": 0.7684, "step": 7765 }, { "epoch": 0.1, "learning_rate": 4.8676457745471484e-05, "loss": 0.68, "step": 7770 }, { "epoch": 0.1, "learning_rate": 4.867476792520754e-05, "loss": 0.4264, "step": 7775 }, { "epoch": 0.1, "learning_rate": 4.867307705626983e-05, "loss": 0.7833, "step": 7780 }, { "epoch": 0.1, "learning_rate": 4.867138513873324e-05, "loss": 0.7541, "step": 7785 }, { "epoch": 0.1, "learning_rate": 4.866969217267271e-05, "loss": 0.321, "step": 7790 }, { "epoch": 0.1, "learning_rate": 4.8667998158163233e-05, "loss": 1.2606, "step": 7795 }, { "epoch": 0.1, "learning_rate": 4.866630309527984e-05, "loss": 0.3086, "step": 7800 }, { "epoch": 0.1, "learning_rate": 4.866460698409763e-05, "loss": 0.2283, "step": 7805 }, { "epoch": 0.1, "learning_rate": 4.866290982469172e-05, "loss": 0.6873, "step": 7810 }, { "epoch": 0.1, "learning_rate": 4.866121161713727e-05, "loss": 1.073, "step": 7815 }, { "epoch": 0.1, "learning_rate": 4.865951236150953e-05, "loss": 0.354, "step": 7820 }, { "epoch": 0.1, "learning_rate": 4.865781205788376e-05, "loss": 0.7297, "step": 7825 }, { "epoch": 0.1, "learning_rate": 4.865611070633527e-05, "loss": 0.941, "step": 7830 }, { "epoch": 0.1, "learning_rate": 4.865440830693941e-05, "loss": 0.7969, "step": 7835 }, { "epoch": 0.11, "learning_rate": 4.865270485977162e-05, "loss": 0.9956, "step": 7840 }, { "epoch": 0.11, "learning_rate": 4.865100036490733e-05, "loss": 0.8341, "step": 7845 }, { "epoch": 0.11, "learning_rate": 4.8649294822422045e-05, "loss": 0.4742, "step": 7850 }, { "epoch": 0.11, "learning_rate": 4.8647588232391314e-05, "loss": 0.7922, "step": 7855 }, { "epoch": 0.11, "learning_rate": 4.864588059489073e-05, "loss": 0.8657, "step": 7860 }, { "epoch": 0.11, "learning_rate": 4.864417190999593e-05, "loss": 0.5717, "step": 7865 }, { "epoch": 0.11, "learning_rate": 4.86424621777826e-05, "loss": 0.3545, "step": 7870 }, { "epoch": 0.11, "learning_rate": 4.8640751398326476e-05, "loss": 1.6149, "step": 7875 }, { "epoch": 0.11, "learning_rate": 4.8639039571703336e-05, "loss": 0.9805, "step": 7880 }, { "epoch": 0.11, "learning_rate": 4.863732669798902e-05, "loss": 0.4073, "step": 7885 }, { "epoch": 0.11, "learning_rate": 4.8635612777259366e-05, "loss": 1.5369, "step": 7890 }, { "epoch": 0.11, "learning_rate": 4.863389780959032e-05, "loss": 0.8681, "step": 7895 }, { "epoch": 0.11, "learning_rate": 4.8632181795057826e-05, "loss": 0.554, "step": 7900 }, { "epoch": 0.11, "learning_rate": 4.863046473373792e-05, "loss": 0.783, "step": 7905 }, { "epoch": 0.11, "learning_rate": 4.862874662570664e-05, "loss": 0.7614, "step": 7910 }, { "epoch": 0.11, "learning_rate": 4.86270274710401e-05, "loss": 0.4963, "step": 7915 }, { "epoch": 0.11, "learning_rate": 4.862530726981445e-05, "loss": 1.2092, "step": 7920 }, { "epoch": 0.11, "learning_rate": 4.8623586022105874e-05, "loss": 0.695, "step": 7925 }, { "epoch": 0.11, "learning_rate": 4.862186372799061e-05, "loss": 1.4519, "step": 7930 }, { "epoch": 0.11, "learning_rate": 4.862014038754498e-05, "loss": 0.6458, "step": 7935 }, { "epoch": 0.11, "learning_rate": 4.861841600084529e-05, "loss": 0.6815, "step": 7940 }, { "epoch": 0.11, "learning_rate": 4.861669056796793e-05, "loss": 0.4795, "step": 7945 }, { "epoch": 0.11, "learning_rate": 4.861496408898933e-05, "loss": 0.3405, "step": 7950 }, { "epoch": 0.11, "learning_rate": 4.861323656398597e-05, "loss": 0.4824, "step": 7955 }, { "epoch": 0.11, "learning_rate": 4.861150799303434e-05, "loss": 0.649, "step": 7960 }, { "epoch": 0.11, "learning_rate": 4.8609778376211056e-05, "loss": 1.3521, "step": 7965 }, { "epoch": 0.11, "learning_rate": 4.86080477135927e-05, "loss": 0.7583, "step": 7970 }, { "epoch": 0.11, "learning_rate": 4.860631600525593e-05, "loss": 0.6176, "step": 7975 }, { "epoch": 0.11, "learning_rate": 4.860458325127746e-05, "loss": 0.8255, "step": 7980 }, { "epoch": 0.11, "learning_rate": 4.8602849451734044e-05, "loss": 0.4943, "step": 7985 }, { "epoch": 0.11, "learning_rate": 4.860111460670248e-05, "loss": 0.5879, "step": 7990 }, { "epoch": 0.11, "learning_rate": 4.859937871625961e-05, "loss": 0.3241, "step": 7995 }, { "epoch": 0.11, "learning_rate": 4.859764178048234e-05, "loss": 0.6548, "step": 8000 }, { "epoch": 0.11, "learning_rate": 4.859590379944757e-05, "loss": 0.9802, "step": 8005 }, { "epoch": 0.11, "learning_rate": 4.859416477323233e-05, "loss": 0.343, "step": 8010 }, { "epoch": 0.11, "learning_rate": 4.8592424701913616e-05, "loss": 0.4643, "step": 8015 }, { "epoch": 0.11, "learning_rate": 4.859068358556852e-05, "loss": 1.4744, "step": 8020 }, { "epoch": 0.11, "learning_rate": 4.8588941424274165e-05, "loss": 0.7589, "step": 8025 }, { "epoch": 0.11, "learning_rate": 4.8587198218107713e-05, "loss": 1.2637, "step": 8030 }, { "epoch": 0.11, "learning_rate": 4.858545396714638e-05, "loss": 1.1327, "step": 8035 }, { "epoch": 0.11, "learning_rate": 4.8583708671467434e-05, "loss": 1.2629, "step": 8040 }, { "epoch": 0.11, "learning_rate": 4.858196233114819e-05, "loss": 1.0462, "step": 8045 }, { "epoch": 0.11, "learning_rate": 4.858021494626598e-05, "loss": 1.0307, "step": 8050 }, { "epoch": 0.11, "learning_rate": 4.857846651689821e-05, "loss": 0.634, "step": 8055 }, { "epoch": 0.11, "learning_rate": 4.8576717043122344e-05, "loss": 0.767, "step": 8060 }, { "epoch": 0.11, "learning_rate": 4.857496652501586e-05, "loss": 0.4698, "step": 8065 }, { "epoch": 0.11, "learning_rate": 4.85732149626563e-05, "loss": 1.0879, "step": 8070 }, { "epoch": 0.11, "learning_rate": 4.857146235612125e-05, "loss": 0.5888, "step": 8075 }, { "epoch": 0.11, "learning_rate": 4.856970870548834e-05, "loss": 0.4813, "step": 8080 }, { "epoch": 0.11, "learning_rate": 4.856795401083525e-05, "loss": 1.1441, "step": 8085 }, { "epoch": 0.11, "learning_rate": 4.8566198272239714e-05, "loss": 0.6225, "step": 8090 }, { "epoch": 0.11, "learning_rate": 4.8564441489779486e-05, "loss": 1.4356, "step": 8095 }, { "epoch": 0.11, "learning_rate": 4.856268366353238e-05, "loss": 0.5217, "step": 8100 }, { "epoch": 0.11, "learning_rate": 4.856092479357628e-05, "loss": 0.6796, "step": 8105 }, { "epoch": 0.11, "learning_rate": 4.8559164879989084e-05, "loss": 0.5883, "step": 8110 }, { "epoch": 0.11, "learning_rate": 4.8557403922848744e-05, "loss": 1.5383, "step": 8115 }, { "epoch": 0.11, "learning_rate": 4.8555641922233256e-05, "loss": 0.6446, "step": 8120 }, { "epoch": 0.11, "learning_rate": 4.855387887822068e-05, "loss": 0.4643, "step": 8125 }, { "epoch": 0.11, "learning_rate": 4.8552114790889114e-05, "loss": 0.2003, "step": 8130 }, { "epoch": 0.11, "learning_rate": 4.8550349660316686e-05, "loss": 0.7641, "step": 8135 }, { "epoch": 0.11, "learning_rate": 4.8548583486581585e-05, "loss": 0.4089, "step": 8140 }, { "epoch": 0.11, "learning_rate": 4.854681626976205e-05, "loss": 0.6486, "step": 8145 }, { "epoch": 0.11, "learning_rate": 4.854504800993634e-05, "loss": 1.4724, "step": 8150 }, { "epoch": 0.11, "learning_rate": 4.854327870718281e-05, "loss": 0.642, "step": 8155 }, { "epoch": 0.11, "learning_rate": 4.854150836157981e-05, "loss": 1.1589, "step": 8160 }, { "epoch": 0.11, "learning_rate": 4.853973697320577e-05, "loss": 0.714, "step": 8165 }, { "epoch": 0.11, "learning_rate": 4.8537964542139145e-05, "loss": 1.499, "step": 8170 }, { "epoch": 0.11, "learning_rate": 4.853619106845845e-05, "loss": 1.0502, "step": 8175 }, { "epoch": 0.11, "learning_rate": 4.853441655224224e-05, "loss": 0.7377, "step": 8180 }, { "epoch": 0.11, "learning_rate": 4.853264099356911e-05, "loss": 0.7446, "step": 8185 }, { "epoch": 0.11, "learning_rate": 4.853086439251772e-05, "loss": 0.2988, "step": 8190 }, { "epoch": 0.11, "learning_rate": 4.852908674916675e-05, "loss": 1.0258, "step": 8195 }, { "epoch": 0.11, "learning_rate": 4.8527308063594956e-05, "loss": 0.2716, "step": 8200 }, { "epoch": 0.11, "learning_rate": 4.852552833588111e-05, "loss": 0.3534, "step": 8205 }, { "epoch": 0.11, "learning_rate": 4.852374756610406e-05, "loss": 0.3901, "step": 8210 }, { "epoch": 0.11, "learning_rate": 4.852196575434268e-05, "loss": 0.4565, "step": 8215 }, { "epoch": 0.11, "learning_rate": 4.852018290067589e-05, "loss": 1.5893, "step": 8220 }, { "epoch": 0.11, "learning_rate": 4.8518399005182666e-05, "loss": 0.8702, "step": 8225 }, { "epoch": 0.11, "learning_rate": 4.8516614067942024e-05, "loss": 0.3411, "step": 8230 }, { "epoch": 0.11, "learning_rate": 4.851482808903304e-05, "loss": 0.9008, "step": 8235 }, { "epoch": 0.11, "learning_rate": 4.85130410685348e-05, "loss": 0.4474, "step": 8240 }, { "epoch": 0.11, "learning_rate": 4.851125300652647e-05, "loss": 0.6568, "step": 8245 }, { "epoch": 0.11, "learning_rate": 4.850946390308726e-05, "loss": 0.7353, "step": 8250 }, { "epoch": 0.11, "learning_rate": 4.8507673758296416e-05, "loss": 0.5601, "step": 8255 }, { "epoch": 0.11, "learning_rate": 4.850588257223323e-05, "loss": 0.3112, "step": 8260 }, { "epoch": 0.11, "learning_rate": 4.850409034497704e-05, "loss": 0.521, "step": 8265 }, { "epoch": 0.11, "learning_rate": 4.8502297076607235e-05, "loss": 0.6592, "step": 8270 }, { "epoch": 0.11, "learning_rate": 4.850050276720325e-05, "loss": 0.8109, "step": 8275 }, { "epoch": 0.11, "learning_rate": 4.849870741684456e-05, "loss": 0.2925, "step": 8280 }, { "epoch": 0.11, "learning_rate": 4.849691102561069e-05, "loss": 1.1379, "step": 8285 }, { "epoch": 0.11, "learning_rate": 4.849511359358121e-05, "loss": 0.5226, "step": 8290 }, { "epoch": 0.11, "learning_rate": 4.849331512083575e-05, "loss": 0.6932, "step": 8295 }, { "epoch": 0.11, "learning_rate": 4.849151560745395e-05, "loss": 0.8763, "step": 8300 }, { "epoch": 0.11, "learning_rate": 4.848971505351554e-05, "loss": 1.2361, "step": 8305 }, { "epoch": 0.11, "learning_rate": 4.848791345910027e-05, "loss": 0.6727, "step": 8310 }, { "epoch": 0.11, "learning_rate": 4.848611082428794e-05, "loss": 0.977, "step": 8315 }, { "epoch": 0.11, "learning_rate": 4.84843071491584e-05, "loss": 0.4884, "step": 8320 }, { "epoch": 0.11, "learning_rate": 4.848250243379154e-05, "loss": 0.9695, "step": 8325 }, { "epoch": 0.11, "learning_rate": 4.84806966782673e-05, "loss": 0.6767, "step": 8330 }, { "epoch": 0.11, "learning_rate": 4.847888988266567e-05, "loss": 1.451, "step": 8335 }, { "epoch": 0.11, "learning_rate": 4.847708204706667e-05, "loss": 0.961, "step": 8340 }, { "epoch": 0.11, "learning_rate": 4.8475273171550395e-05, "loss": 0.8234, "step": 8345 }, { "epoch": 0.11, "learning_rate": 4.847346325619696e-05, "loss": 0.9766, "step": 8350 }, { "epoch": 0.11, "learning_rate": 4.847165230108654e-05, "loss": 0.4269, "step": 8355 }, { "epoch": 0.11, "learning_rate": 4.846984030629934e-05, "loss": 0.7891, "step": 8360 }, { "epoch": 0.11, "learning_rate": 4.846802727191564e-05, "loss": 0.3904, "step": 8365 }, { "epoch": 0.11, "learning_rate": 4.846621319801574e-05, "loss": 0.8136, "step": 8370 }, { "epoch": 0.11, "learning_rate": 4.846439808467998e-05, "loss": 0.5813, "step": 8375 }, { "epoch": 0.11, "learning_rate": 4.846258193198878e-05, "loss": 0.7563, "step": 8380 }, { "epoch": 0.11, "learning_rate": 4.846076474002258e-05, "loss": 0.5251, "step": 8385 }, { "epoch": 0.11, "learning_rate": 4.845894650886188e-05, "loss": 1.1477, "step": 8390 }, { "epoch": 0.11, "learning_rate": 4.845712723858721e-05, "loss": 0.4476, "step": 8395 }, { "epoch": 0.11, "learning_rate": 4.845530692927914e-05, "loss": 1.1135, "step": 8400 }, { "epoch": 0.11, "learning_rate": 4.845348558101833e-05, "loss": 0.6341, "step": 8405 }, { "epoch": 0.11, "learning_rate": 4.845166319388544e-05, "loss": 0.7908, "step": 8410 }, { "epoch": 0.11, "learning_rate": 4.84498397679612e-05, "loss": 0.7353, "step": 8415 }, { "epoch": 0.11, "learning_rate": 4.844801530332636e-05, "loss": 0.9096, "step": 8420 }, { "epoch": 0.11, "learning_rate": 4.8446189800061765e-05, "loss": 0.7596, "step": 8425 }, { "epoch": 0.11, "learning_rate": 4.8444363258248255e-05, "loss": 0.904, "step": 8430 }, { "epoch": 0.11, "learning_rate": 4.844253567796674e-05, "loss": 1.0719, "step": 8435 }, { "epoch": 0.11, "learning_rate": 4.8440707059298165e-05, "loss": 0.826, "step": 8440 }, { "epoch": 0.11, "learning_rate": 4.8438877402323545e-05, "loss": 0.7115, "step": 8445 }, { "epoch": 0.11, "learning_rate": 4.8437046707123924e-05, "loss": 0.8424, "step": 8450 }, { "epoch": 0.11, "learning_rate": 4.8435214973780374e-05, "loss": 0.6097, "step": 8455 }, { "epoch": 0.11, "learning_rate": 4.843338220237405e-05, "loss": 1.146, "step": 8460 }, { "epoch": 0.11, "learning_rate": 4.843154839298612e-05, "loss": 0.958, "step": 8465 }, { "epoch": 0.11, "learning_rate": 4.842971354569783e-05, "loss": 0.3508, "step": 8470 }, { "epoch": 0.11, "learning_rate": 4.8427877660590446e-05, "loss": 0.7967, "step": 8475 }, { "epoch": 0.11, "learning_rate": 4.842604073774528e-05, "loss": 0.8018, "step": 8480 }, { "epoch": 0.11, "learning_rate": 4.842420277724371e-05, "loss": 0.8104, "step": 8485 }, { "epoch": 0.11, "learning_rate": 4.842236377916715e-05, "loss": 0.6958, "step": 8490 }, { "epoch": 0.11, "learning_rate": 4.842052374359705e-05, "loss": 0.9201, "step": 8495 }, { "epoch": 0.11, "learning_rate": 4.841868267061491e-05, "loss": 0.453, "step": 8500 }, { "epoch": 0.11, "learning_rate": 4.841684056030229e-05, "loss": 1.0491, "step": 8505 }, { "epoch": 0.11, "learning_rate": 4.8414997412740786e-05, "loss": 0.6824, "step": 8510 }, { "epoch": 0.11, "learning_rate": 4.8413153228012044e-05, "loss": 0.767, "step": 8515 }, { "epoch": 0.11, "learning_rate": 4.841130800619774e-05, "loss": 0.5233, "step": 8520 }, { "epoch": 0.11, "learning_rate": 4.8409461747379614e-05, "loss": 0.8583, "step": 8525 }, { "epoch": 0.11, "learning_rate": 4.8407614451639443e-05, "loss": 0.3751, "step": 8530 }, { "epoch": 0.11, "learning_rate": 4.8405766119059056e-05, "loss": 0.5378, "step": 8535 }, { "epoch": 0.11, "learning_rate": 4.840391674972034e-05, "loss": 0.6692, "step": 8540 }, { "epoch": 0.11, "learning_rate": 4.840206634370519e-05, "loss": 0.8044, "step": 8545 }, { "epoch": 0.11, "learning_rate": 4.8400214901095567e-05, "loss": 1.1925, "step": 8550 }, { "epoch": 0.11, "learning_rate": 4.83983624219735e-05, "loss": 1.1147, "step": 8555 }, { "epoch": 0.11, "learning_rate": 4.839650890642104e-05, "loss": 0.7444, "step": 8560 }, { "epoch": 0.11, "learning_rate": 4.839465435452029e-05, "loss": 1.6644, "step": 8565 }, { "epoch": 0.11, "learning_rate": 4.8392798766353374e-05, "loss": 0.6879, "step": 8570 }, { "epoch": 0.11, "learning_rate": 4.839094214200252e-05, "loss": 0.8096, "step": 8575 }, { "epoch": 0.11, "learning_rate": 4.838908448154994e-05, "loss": 0.4424, "step": 8580 }, { "epoch": 0.12, "learning_rate": 4.838722578507793e-05, "loss": 1.039, "step": 8585 }, { "epoch": 0.12, "learning_rate": 4.838536605266882e-05, "loss": 0.8154, "step": 8590 }, { "epoch": 0.12, "learning_rate": 4.838350528440498e-05, "loss": 0.4551, "step": 8595 }, { "epoch": 0.12, "learning_rate": 4.838164348036885e-05, "loss": 0.2672, "step": 8600 }, { "epoch": 0.12, "learning_rate": 4.837978064064289e-05, "loss": 1.1779, "step": 8605 }, { "epoch": 0.12, "learning_rate": 4.8377916765309616e-05, "loss": 0.3263, "step": 8610 }, { "epoch": 0.12, "learning_rate": 4.837605185445158e-05, "loss": 1.3868, "step": 8615 }, { "epoch": 0.12, "learning_rate": 4.837418590815139e-05, "loss": 1.2777, "step": 8620 }, { "epoch": 0.12, "learning_rate": 4.837231892649171e-05, "loss": 0.477, "step": 8625 }, { "epoch": 0.12, "learning_rate": 4.837045090955522e-05, "loss": 0.4254, "step": 8630 }, { "epoch": 0.12, "learning_rate": 4.8368581857424684e-05, "loss": 0.6005, "step": 8635 }, { "epoch": 0.12, "learning_rate": 4.836671177018287e-05, "loss": 1.3037, "step": 8640 }, { "epoch": 0.12, "learning_rate": 4.8364840647912636e-05, "loss": 1.0103, "step": 8645 }, { "epoch": 0.12, "learning_rate": 4.836296849069684e-05, "loss": 1.1736, "step": 8650 }, { "epoch": 0.12, "learning_rate": 4.836109529861843e-05, "loss": 0.8066, "step": 8655 }, { "epoch": 0.12, "learning_rate": 4.835922107176036e-05, "loss": 0.7338, "step": 8660 }, { "epoch": 0.12, "learning_rate": 4.835734581020567e-05, "loss": 0.4902, "step": 8665 }, { "epoch": 0.12, "learning_rate": 4.835546951403741e-05, "loss": 0.3613, "step": 8670 }, { "epoch": 0.12, "learning_rate": 4.83535921833387e-05, "loss": 0.9843, "step": 8675 }, { "epoch": 0.12, "learning_rate": 4.835171381819268e-05, "loss": 0.7265, "step": 8680 }, { "epoch": 0.12, "learning_rate": 4.8349834418682574e-05, "loss": 1.0773, "step": 8685 }, { "epoch": 0.12, "learning_rate": 4.83479539848916e-05, "loss": 0.9802, "step": 8690 }, { "epoch": 0.12, "learning_rate": 4.834607251690309e-05, "loss": 1.1262, "step": 8695 }, { "epoch": 0.12, "learning_rate": 4.834419001480036e-05, "loss": 0.8751, "step": 8700 }, { "epoch": 0.12, "learning_rate": 4.834230647866679e-05, "loss": 0.436, "step": 8705 }, { "epoch": 0.12, "learning_rate": 4.834042190858583e-05, "loss": 0.8112, "step": 8710 }, { "epoch": 0.12, "learning_rate": 4.8338536304640946e-05, "loss": 0.9533, "step": 8715 }, { "epoch": 0.12, "learning_rate": 4.833664966691566e-05, "loss": 0.5943, "step": 8720 }, { "epoch": 0.12, "learning_rate": 4.833476199549355e-05, "loss": 0.9189, "step": 8725 }, { "epoch": 0.12, "learning_rate": 4.8332873290458215e-05, "loss": 0.2124, "step": 8730 }, { "epoch": 0.12, "learning_rate": 4.8330983551893325e-05, "loss": 1.3537, "step": 8735 }, { "epoch": 0.12, "learning_rate": 4.83290927798826e-05, "loss": 0.6253, "step": 8740 }, { "epoch": 0.12, "learning_rate": 4.832720097450976e-05, "loss": 0.5891, "step": 8745 }, { "epoch": 0.12, "learning_rate": 4.832530813585863e-05, "loss": 0.8435, "step": 8750 }, { "epoch": 0.12, "learning_rate": 4.832341426401303e-05, "loss": 1.0243, "step": 8755 }, { "epoch": 0.12, "learning_rate": 4.8321519359056867e-05, "loss": 0.8024, "step": 8760 }, { "epoch": 0.12, "learning_rate": 4.831962342107407e-05, "loss": 1.4014, "step": 8765 }, { "epoch": 0.12, "learning_rate": 4.8317726450148624e-05, "loss": 0.5386, "step": 8770 }, { "epoch": 0.12, "learning_rate": 4.831582844636455e-05, "loss": 0.3792, "step": 8775 }, { "epoch": 0.12, "learning_rate": 4.8313929409805915e-05, "loss": 1.4474, "step": 8780 }, { "epoch": 0.12, "learning_rate": 4.8312029340556854e-05, "loss": 0.7258, "step": 8785 }, { "epoch": 0.12, "learning_rate": 4.831012823870151e-05, "loss": 0.5759, "step": 8790 }, { "epoch": 0.12, "learning_rate": 4.8308226104324105e-05, "loss": 0.6566, "step": 8795 }, { "epoch": 0.12, "learning_rate": 4.830632293750889e-05, "loss": 0.7254, "step": 8800 }, { "epoch": 0.12, "learning_rate": 4.830441873834017e-05, "loss": 0.7362, "step": 8805 }, { "epoch": 0.12, "learning_rate": 4.830251350690228e-05, "loss": 0.8416, "step": 8810 }, { "epoch": 0.12, "learning_rate": 4.830060724327963e-05, "loss": 0.6707, "step": 8815 }, { "epoch": 0.12, "learning_rate": 4.8298699947556645e-05, "loss": 0.214, "step": 8820 }, { "epoch": 0.12, "learning_rate": 4.829679161981781e-05, "loss": 0.5847, "step": 8825 }, { "epoch": 0.12, "learning_rate": 4.829488226014766e-05, "loss": 0.1229, "step": 8830 }, { "epoch": 0.12, "learning_rate": 4.829297186863076e-05, "loss": 0.8375, "step": 8835 }, { "epoch": 0.12, "learning_rate": 4.829106044535174e-05, "loss": 1.1516, "step": 8840 }, { "epoch": 0.12, "learning_rate": 4.828914799039527e-05, "loss": 0.3745, "step": 8845 }, { "epoch": 0.12, "learning_rate": 4.8287234503846057e-05, "loss": 1.331, "step": 8850 }, { "epoch": 0.12, "learning_rate": 4.828531998578885e-05, "loss": 0.6824, "step": 8855 }, { "epoch": 0.12, "learning_rate": 4.8283404436308464e-05, "loss": 0.7021, "step": 8860 }, { "epoch": 0.12, "learning_rate": 4.8281487855489744e-05, "loss": 1.3055, "step": 8865 }, { "epoch": 0.12, "learning_rate": 4.827957024341758e-05, "loss": 1.6496, "step": 8870 }, { "epoch": 0.12, "learning_rate": 4.827765160017693e-05, "loss": 1.0607, "step": 8875 }, { "epoch": 0.12, "learning_rate": 4.8275731925852765e-05, "loss": 0.3206, "step": 8880 }, { "epoch": 0.12, "learning_rate": 4.827381122053011e-05, "loss": 0.7973, "step": 8885 }, { "epoch": 0.12, "learning_rate": 4.827188948429407e-05, "loss": 0.6887, "step": 8890 }, { "epoch": 0.12, "learning_rate": 4.826996671722974e-05, "loss": 0.811, "step": 8895 }, { "epoch": 0.12, "learning_rate": 4.8268042919422295e-05, "loss": 0.2693, "step": 8900 }, { "epoch": 0.12, "learning_rate": 4.826611809095697e-05, "loss": 0.7161, "step": 8905 }, { "epoch": 0.12, "learning_rate": 4.8264192231919006e-05, "loss": 0.7449, "step": 8910 }, { "epoch": 0.12, "learning_rate": 4.826226534239371e-05, "loss": 0.8695, "step": 8915 }, { "epoch": 0.12, "learning_rate": 4.826033742246643e-05, "loss": 1.2223, "step": 8920 }, { "epoch": 0.12, "learning_rate": 4.825840847222258e-05, "loss": 0.4582, "step": 8925 }, { "epoch": 0.12, "learning_rate": 4.8256478491747594e-05, "loss": 1.23, "step": 8930 }, { "epoch": 0.12, "learning_rate": 4.825454748112695e-05, "loss": 1.0588, "step": 8935 }, { "epoch": 0.12, "learning_rate": 4.8252615440446196e-05, "loss": 0.889, "step": 8940 }, { "epoch": 0.12, "learning_rate": 4.8250682369790915e-05, "loss": 0.5093, "step": 8945 }, { "epoch": 0.12, "learning_rate": 4.824874826924671e-05, "loss": 0.4253, "step": 8950 }, { "epoch": 0.12, "learning_rate": 4.824681313889927e-05, "loss": 0.9195, "step": 8955 }, { "epoch": 0.12, "learning_rate": 4.824487697883432e-05, "loss": 0.9349, "step": 8960 }, { "epoch": 0.12, "learning_rate": 4.82429397891376e-05, "loss": 0.7329, "step": 8965 }, { "epoch": 0.12, "learning_rate": 4.824100156989493e-05, "loss": 0.8638, "step": 8970 }, { "epoch": 0.12, "learning_rate": 4.823906232119216e-05, "loss": 1.2509, "step": 8975 }, { "epoch": 0.12, "learning_rate": 4.823712204311519e-05, "loss": 0.7642, "step": 8980 }, { "epoch": 0.12, "learning_rate": 4.8235180735749976e-05, "loss": 0.1447, "step": 8985 }, { "epoch": 0.12, "learning_rate": 4.8233238399182486e-05, "loss": 0.5316, "step": 8990 }, { "epoch": 0.12, "learning_rate": 4.823129503349877e-05, "loss": 1.0117, "step": 8995 }, { "epoch": 0.12, "learning_rate": 4.822935063878491e-05, "loss": 0.9659, "step": 9000 }, { "epoch": 0.12, "learning_rate": 4.822740521512702e-05, "loss": 0.8155, "step": 9005 }, { "epoch": 0.12, "learning_rate": 4.822545876261129e-05, "loss": 1.1388, "step": 9010 }, { "epoch": 0.12, "learning_rate": 4.822351128132393e-05, "loss": 1.8259, "step": 9015 }, { "epoch": 0.12, "learning_rate": 4.8221562771351206e-05, "loss": 0.6872, "step": 9020 }, { "epoch": 0.12, "learning_rate": 4.8219613232779416e-05, "loss": 1.1732, "step": 9025 }, { "epoch": 0.12, "learning_rate": 4.821766266569493e-05, "loss": 1.5334, "step": 9030 }, { "epoch": 0.12, "learning_rate": 4.821571107018414e-05, "loss": 1.3901, "step": 9035 }, { "epoch": 0.12, "learning_rate": 4.8213758446333496e-05, "loss": 0.5799, "step": 9040 }, { "epoch": 0.12, "learning_rate": 4.8211804794229485e-05, "loss": 0.4994, "step": 9045 }, { "epoch": 0.12, "learning_rate": 4.820985011395865e-05, "loss": 0.898, "step": 9050 }, { "epoch": 0.12, "learning_rate": 4.820789440560757e-05, "loss": 0.9534, "step": 9055 }, { "epoch": 0.12, "learning_rate": 4.820593766926287e-05, "loss": 0.9222, "step": 9060 }, { "epoch": 0.12, "learning_rate": 4.820397990501123e-05, "loss": 0.7966, "step": 9065 }, { "epoch": 0.12, "learning_rate": 4.820202111293937e-05, "loss": 0.9057, "step": 9070 }, { "epoch": 0.12, "learning_rate": 4.820006129313404e-05, "loss": 0.6672, "step": 9075 }, { "epoch": 0.12, "learning_rate": 4.819810044568207e-05, "loss": 1.3912, "step": 9080 }, { "epoch": 0.12, "learning_rate": 4.81961385706703e-05, "loss": 1.3842, "step": 9085 }, { "epoch": 0.12, "learning_rate": 4.8194175668185645e-05, "loss": 0.9908, "step": 9090 }, { "epoch": 0.12, "learning_rate": 4.819221173831504e-05, "loss": 0.636, "step": 9095 }, { "epoch": 0.12, "learning_rate": 4.8190246781145484e-05, "loss": 0.8566, "step": 9100 }, { "epoch": 0.12, "learning_rate": 4.818828079676401e-05, "loss": 0.7639, "step": 9105 }, { "epoch": 0.12, "learning_rate": 4.818631378525771e-05, "loss": 0.4931, "step": 9110 }, { "epoch": 0.12, "learning_rate": 4.81843457467137e-05, "loss": 1.2962, "step": 9115 }, { "epoch": 0.12, "learning_rate": 4.818237668121917e-05, "loss": 0.9621, "step": 9120 }, { "epoch": 0.12, "learning_rate": 4.8180406588861317e-05, "loss": 1.3108, "step": 9125 }, { "epoch": 0.12, "learning_rate": 4.817843546972743e-05, "loss": 1.7516, "step": 9130 }, { "epoch": 0.12, "learning_rate": 4.817646332390481e-05, "loss": 1.0579, "step": 9135 }, { "epoch": 0.12, "learning_rate": 4.817449015148081e-05, "loss": 0.8059, "step": 9140 }, { "epoch": 0.12, "learning_rate": 4.817251595254283e-05, "loss": 0.504, "step": 9145 }, { "epoch": 0.12, "learning_rate": 4.8170540727178326e-05, "loss": 0.3782, "step": 9150 }, { "epoch": 0.12, "learning_rate": 4.816856447547479e-05, "loss": 0.4365, "step": 9155 }, { "epoch": 0.12, "learning_rate": 4.8166587197519754e-05, "loss": 1.3224, "step": 9160 }, { "epoch": 0.12, "learning_rate": 4.8164608893400796e-05, "loss": 0.4961, "step": 9165 }, { "epoch": 0.12, "learning_rate": 4.816262956320556e-05, "loss": 1.1164, "step": 9170 }, { "epoch": 0.12, "learning_rate": 4.816064920702172e-05, "loss": 0.6284, "step": 9175 }, { "epoch": 0.12, "learning_rate": 4.815866782493698e-05, "loss": 0.6002, "step": 9180 }, { "epoch": 0.12, "learning_rate": 4.8156685417039116e-05, "loss": 0.8208, "step": 9185 }, { "epoch": 0.12, "learning_rate": 4.815470198341594e-05, "loss": 0.2013, "step": 9190 }, { "epoch": 0.12, "learning_rate": 4.815271752415531e-05, "loss": 0.7123, "step": 9195 }, { "epoch": 0.12, "learning_rate": 4.8150732039345115e-05, "loss": 0.5541, "step": 9200 }, { "epoch": 0.12, "learning_rate": 4.814874552907331e-05, "loss": 0.4822, "step": 9205 }, { "epoch": 0.12, "learning_rate": 4.8146757993427895e-05, "loss": 0.4125, "step": 9210 }, { "epoch": 0.12, "learning_rate": 4.8144769432496895e-05, "loss": 0.6628, "step": 9215 }, { "epoch": 0.12, "learning_rate": 4.81427798463684e-05, "loss": 0.6073, "step": 9220 }, { "epoch": 0.12, "learning_rate": 4.8140789235130534e-05, "loss": 1.1483, "step": 9225 }, { "epoch": 0.12, "learning_rate": 4.8138797598871476e-05, "loss": 0.3568, "step": 9230 }, { "epoch": 0.12, "learning_rate": 4.8136804937679446e-05, "loss": 1.0957, "step": 9235 }, { "epoch": 0.12, "learning_rate": 4.813481125164271e-05, "loss": 1.0944, "step": 9240 }, { "epoch": 0.12, "learning_rate": 4.813281654084957e-05, "loss": 0.8015, "step": 9245 }, { "epoch": 0.12, "learning_rate": 4.813082080538839e-05, "loss": 1.2426, "step": 9250 }, { "epoch": 0.12, "learning_rate": 4.812882404534757e-05, "loss": 0.8696, "step": 9255 }, { "epoch": 0.12, "learning_rate": 4.8126826260815545e-05, "loss": 0.839, "step": 9260 }, { "epoch": 0.12, "learning_rate": 4.8124827451880826e-05, "loss": 0.8043, "step": 9265 }, { "epoch": 0.12, "learning_rate": 4.8122827618631936e-05, "loss": 0.2996, "step": 9270 }, { "epoch": 0.12, "learning_rate": 4.812082676115747e-05, "loss": 0.9579, "step": 9275 }, { "epoch": 0.12, "learning_rate": 4.811882487954604e-05, "loss": 1.1807, "step": 9280 }, { "epoch": 0.12, "learning_rate": 4.811682197388633e-05, "loss": 1.3747, "step": 9285 }, { "epoch": 0.12, "learning_rate": 4.811481804426705e-05, "loss": 0.12, "step": 9290 }, { "epoch": 0.12, "learning_rate": 4.811281309077698e-05, "loss": 1.2675, "step": 9295 }, { "epoch": 0.12, "learning_rate": 4.811080711350492e-05, "loss": 0.904, "step": 9300 }, { "epoch": 0.12, "learning_rate": 4.810880011253972e-05, "loss": 0.8039, "step": 9305 }, { "epoch": 0.12, "learning_rate": 4.810679208797029e-05, "loss": 0.4748, "step": 9310 }, { "epoch": 0.12, "learning_rate": 4.810478303988556e-05, "loss": 0.7057, "step": 9315 }, { "epoch": 0.12, "learning_rate": 4.8102772968374543e-05, "loss": 0.7347, "step": 9320 }, { "epoch": 0.12, "learning_rate": 4.810076187352626e-05, "loss": 1.4841, "step": 9325 }, { "epoch": 0.13, "learning_rate": 4.809874975542979e-05, "loss": 1.2959, "step": 9330 }, { "epoch": 0.13, "learning_rate": 4.809673661417427e-05, "loss": 0.4903, "step": 9335 }, { "epoch": 0.13, "learning_rate": 4.8094722449848863e-05, "loss": 0.3061, "step": 9340 }, { "epoch": 0.13, "learning_rate": 4.809270726254279e-05, "loss": 1.1026, "step": 9345 }, { "epoch": 0.13, "learning_rate": 4.809069105234532e-05, "loss": 1.0478, "step": 9350 }, { "epoch": 0.13, "learning_rate": 4.8088673819345756e-05, "loss": 0.6622, "step": 9355 }, { "epoch": 0.13, "learning_rate": 4.808665556363345e-05, "loss": 1.5507, "step": 9360 }, { "epoch": 0.13, "learning_rate": 4.8084636285297795e-05, "loss": 0.8836, "step": 9365 }, { "epoch": 0.13, "learning_rate": 4.8082615984428244e-05, "loss": 0.6043, "step": 9370 }, { "epoch": 0.13, "learning_rate": 4.808059466111429e-05, "loss": 0.5939, "step": 9375 }, { "epoch": 0.13, "learning_rate": 4.807857231544546e-05, "loss": 0.498, "step": 9380 }, { "epoch": 0.13, "learning_rate": 4.807654894751133e-05, "loss": 1.0658, "step": 9385 }, { "epoch": 0.13, "learning_rate": 4.807452455740153e-05, "loss": 1.2436, "step": 9390 }, { "epoch": 0.13, "learning_rate": 4.807249914520573e-05, "loss": 0.5976, "step": 9395 }, { "epoch": 0.13, "learning_rate": 4.807047271101365e-05, "loss": 0.933, "step": 9400 }, { "epoch": 0.13, "learning_rate": 4.806844525491504e-05, "loss": 0.4744, "step": 9405 }, { "epoch": 0.13, "learning_rate": 4.806641677699972e-05, "loss": 0.3847, "step": 9410 }, { "epoch": 0.13, "learning_rate": 4.8064387277357535e-05, "loss": 0.9937, "step": 9415 }, { "epoch": 0.13, "learning_rate": 4.8062356756078375e-05, "loss": 1.1117, "step": 9420 }, { "epoch": 0.13, "learning_rate": 4.8060325213252186e-05, "loss": 0.699, "step": 9425 }, { "epoch": 0.13, "learning_rate": 4.8058292648968975e-05, "loss": 0.095, "step": 9430 }, { "epoch": 0.13, "learning_rate": 4.805625906331874e-05, "loss": 0.712, "step": 9435 }, { "epoch": 0.13, "learning_rate": 4.8054224456391574e-05, "loss": 0.8682, "step": 9440 }, { "epoch": 0.13, "learning_rate": 4.805218882827761e-05, "loss": 0.3967, "step": 9445 }, { "epoch": 0.13, "learning_rate": 4.8050152179067005e-05, "loss": 0.8945, "step": 9450 }, { "epoch": 0.13, "learning_rate": 4.804811450884997e-05, "loss": 0.6007, "step": 9455 }, { "epoch": 0.13, "learning_rate": 4.804607581771678e-05, "loss": 0.9019, "step": 9460 }, { "epoch": 0.13, "learning_rate": 4.8044036105757716e-05, "loss": 1.3697, "step": 9465 }, { "epoch": 0.13, "learning_rate": 4.8041995373063144e-05, "loss": 1.0051, "step": 9470 }, { "epoch": 0.13, "learning_rate": 4.803995361972344e-05, "loss": 0.7595, "step": 9475 }, { "epoch": 0.13, "learning_rate": 4.803791084582907e-05, "loss": 0.6735, "step": 9480 }, { "epoch": 0.13, "learning_rate": 4.80358670514705e-05, "loss": 0.6559, "step": 9485 }, { "epoch": 0.13, "learning_rate": 4.803382223673827e-05, "loss": 0.5342, "step": 9490 }, { "epoch": 0.13, "learning_rate": 4.803177640172294e-05, "loss": 0.9688, "step": 9495 }, { "epoch": 0.13, "learning_rate": 4.802972954651514e-05, "loss": 0.4012, "step": 9500 }, { "epoch": 0.13, "learning_rate": 4.8027681671205545e-05, "loss": 0.676, "step": 9505 }, { "epoch": 0.13, "learning_rate": 4.802563277588485e-05, "loss": 0.6984, "step": 9510 }, { "epoch": 0.13, "learning_rate": 4.802358286064382e-05, "loss": 0.4982, "step": 9515 }, { "epoch": 0.13, "learning_rate": 4.802153192557325e-05, "loss": 1.1633, "step": 9520 }, { "epoch": 0.13, "learning_rate": 4.801947997076398e-05, "loss": 0.8125, "step": 9525 }, { "epoch": 0.13, "learning_rate": 4.801742699630692e-05, "loss": 0.5945, "step": 9530 }, { "epoch": 0.13, "learning_rate": 4.801537300229299e-05, "loss": 1.5168, "step": 9535 }, { "epoch": 0.13, "learning_rate": 4.801331798881319e-05, "loss": 1.0967, "step": 9540 }, { "epoch": 0.13, "learning_rate": 4.801126195595853e-05, "loss": 0.7929, "step": 9545 }, { "epoch": 0.13, "learning_rate": 4.800920490382008e-05, "loss": 1.5165, "step": 9550 }, { "epoch": 0.13, "learning_rate": 4.8007146832488974e-05, "loss": 0.6962, "step": 9555 }, { "epoch": 0.13, "learning_rate": 4.800508774205636e-05, "loss": 0.8863, "step": 9560 }, { "epoch": 0.13, "learning_rate": 4.800302763261345e-05, "loss": 0.8116, "step": 9565 }, { "epoch": 0.13, "learning_rate": 4.80009665042515e-05, "loss": 0.5576, "step": 9570 }, { "epoch": 0.13, "learning_rate": 4.7998904357061795e-05, "loss": 0.3793, "step": 9575 }, { "epoch": 0.13, "learning_rate": 4.7996841191135695e-05, "loss": 0.2126, "step": 9580 }, { "epoch": 0.13, "learning_rate": 4.7994777006564574e-05, "loss": 0.3458, "step": 9585 }, { "epoch": 0.13, "learning_rate": 4.799271180343988e-05, "loss": 0.6577, "step": 9590 }, { "epoch": 0.13, "learning_rate": 4.799064558185307e-05, "loss": 0.2613, "step": 9595 }, { "epoch": 0.13, "learning_rate": 4.7988991871352415e-05, "loss": 0.8633, "step": 9600 }, { "epoch": 0.13, "learning_rate": 4.79869238167645e-05, "loss": 0.5466, "step": 9605 }, { "epoch": 0.13, "learning_rate": 4.7984854743970846e-05, "loss": 0.2218, "step": 9610 }, { "epoch": 0.13, "learning_rate": 4.798278465306313e-05, "loss": 0.5906, "step": 9615 }, { "epoch": 0.13, "learning_rate": 4.798071354413302e-05, "loss": 0.6741, "step": 9620 }, { "epoch": 0.13, "learning_rate": 4.7978641417272276e-05, "loss": 0.6727, "step": 9625 }, { "epoch": 0.13, "learning_rate": 4.797656827257268e-05, "loss": 0.9533, "step": 9630 }, { "epoch": 0.13, "learning_rate": 4.797449411012604e-05, "loss": 0.5159, "step": 9635 }, { "epoch": 0.13, "learning_rate": 4.797241893002427e-05, "loss": 0.5652, "step": 9640 }, { "epoch": 0.13, "learning_rate": 4.797034273235926e-05, "loss": 1.0334, "step": 9645 }, { "epoch": 0.13, "learning_rate": 4.796826551722299e-05, "loss": 0.4861, "step": 9650 }, { "epoch": 0.13, "learning_rate": 4.796618728470745e-05, "loss": 0.8191, "step": 9655 }, { "epoch": 0.13, "learning_rate": 4.796410803490472e-05, "loss": 1.0752, "step": 9660 }, { "epoch": 0.13, "learning_rate": 4.796202776790689e-05, "loss": 1.3562, "step": 9665 }, { "epoch": 0.13, "learning_rate": 4.7959946483806104e-05, "loss": 0.7741, "step": 9670 }, { "epoch": 0.13, "learning_rate": 4.795786418269455e-05, "loss": 1.1642, "step": 9675 }, { "epoch": 0.13, "learning_rate": 4.795578086466447e-05, "loss": 0.83, "step": 9680 }, { "epoch": 0.13, "learning_rate": 4.795369652980815e-05, "loss": 0.426, "step": 9685 }, { "epoch": 0.13, "learning_rate": 4.7951611178217894e-05, "loss": 0.3527, "step": 9690 }, { "epoch": 0.13, "learning_rate": 4.794952480998609e-05, "loss": 0.5081, "step": 9695 }, { "epoch": 0.13, "learning_rate": 4.794743742520515e-05, "loss": 0.7866, "step": 9700 }, { "epoch": 0.13, "learning_rate": 4.794534902396753e-05, "loss": 0.2226, "step": 9705 }, { "epoch": 0.13, "learning_rate": 4.7943259606365754e-05, "loss": 0.6263, "step": 9710 }, { "epoch": 0.13, "learning_rate": 4.7941169172492354e-05, "loss": 0.6831, "step": 9715 }, { "epoch": 0.13, "learning_rate": 4.7939077722439924e-05, "loss": 1.0099, "step": 9720 }, { "epoch": 0.13, "learning_rate": 4.7936985256301115e-05, "loss": 1.3413, "step": 9725 }, { "epoch": 0.13, "learning_rate": 4.793489177416861e-05, "loss": 0.6958, "step": 9730 }, { "epoch": 0.13, "learning_rate": 4.7932797276135134e-05, "loss": 0.7534, "step": 9735 }, { "epoch": 0.13, "learning_rate": 4.7930701762293475e-05, "loss": 0.8695, "step": 9740 }, { "epoch": 0.13, "learning_rate": 4.7928605232736445e-05, "loss": 1.0328, "step": 9745 }, { "epoch": 0.13, "learning_rate": 4.792650768755691e-05, "loss": 0.5269, "step": 9750 }, { "epoch": 0.13, "learning_rate": 4.792440912684778e-05, "loss": 1.004, "step": 9755 }, { "epoch": 0.13, "learning_rate": 4.792230955070201e-05, "loss": 0.8288, "step": 9760 }, { "epoch": 0.13, "learning_rate": 4.792020895921262e-05, "loss": 0.7183, "step": 9765 }, { "epoch": 0.13, "learning_rate": 4.7918107352472626e-05, "loss": 0.3115, "step": 9770 }, { "epoch": 0.13, "learning_rate": 4.791600473057514e-05, "loss": 0.818, "step": 9775 }, { "epoch": 0.13, "learning_rate": 4.791390109361328e-05, "loss": 0.3933, "step": 9780 }, { "epoch": 0.13, "learning_rate": 4.7911796441680235e-05, "loss": 0.4678, "step": 9785 }, { "epoch": 0.13, "learning_rate": 4.790969077486924e-05, "loss": 0.2995, "step": 9790 }, { "epoch": 0.13, "learning_rate": 4.790758409327355e-05, "loss": 0.1256, "step": 9795 }, { "epoch": 0.13, "learning_rate": 4.790547639698649e-05, "loss": 0.7906, "step": 9800 }, { "epoch": 0.13, "learning_rate": 4.7903367686101426e-05, "loss": 0.3111, "step": 9805 }, { "epoch": 0.13, "learning_rate": 4.7901257960711746e-05, "loss": 0.71, "step": 9810 }, { "epoch": 0.13, "learning_rate": 4.7899147220910914e-05, "loss": 0.7001, "step": 9815 }, { "epoch": 0.13, "learning_rate": 4.7897035466792425e-05, "loss": 1.4315, "step": 9820 }, { "epoch": 0.13, "learning_rate": 4.7894922698449804e-05, "loss": 0.8372, "step": 9825 }, { "epoch": 0.13, "learning_rate": 4.789280891597666e-05, "loss": 1.0255, "step": 9830 }, { "epoch": 0.13, "learning_rate": 4.78906941194666e-05, "loss": 1.1903, "step": 9835 }, { "epoch": 0.13, "learning_rate": 4.788857830901331e-05, "loss": 1.0766, "step": 9840 }, { "epoch": 0.13, "learning_rate": 4.788646148471051e-05, "loss": 1.4223, "step": 9845 }, { "epoch": 0.13, "learning_rate": 4.788434364665197e-05, "loss": 0.7248, "step": 9850 }, { "epoch": 0.13, "learning_rate": 4.788222479493148e-05, "loss": 1.0411, "step": 9855 }, { "epoch": 0.13, "learning_rate": 4.788010492964292e-05, "loss": 0.5936, "step": 9860 }, { "epoch": 0.13, "learning_rate": 4.787798405088018e-05, "loss": 0.3401, "step": 9865 }, { "epoch": 0.13, "learning_rate": 4.7875862158737196e-05, "loss": 0.7232, "step": 9870 }, { "epoch": 0.13, "learning_rate": 4.7873739253307956e-05, "loss": 0.6645, "step": 9875 }, { "epoch": 0.13, "learning_rate": 4.78716153346865e-05, "loss": 0.7399, "step": 9880 }, { "epoch": 0.13, "learning_rate": 4.786949040296692e-05, "loss": 1.0137, "step": 9885 }, { "epoch": 0.13, "learning_rate": 4.7867364458243324e-05, "loss": 0.641, "step": 9890 }, { "epoch": 0.13, "learning_rate": 4.786523750060988e-05, "loss": 0.4651, "step": 9895 }, { "epoch": 0.13, "learning_rate": 4.786310953016081e-05, "loss": 1.1009, "step": 9900 }, { "epoch": 0.13, "learning_rate": 4.7860980546990364e-05, "loss": 0.5898, "step": 9905 }, { "epoch": 0.13, "learning_rate": 4.7858850551192847e-05, "loss": 0.4341, "step": 9910 }, { "epoch": 0.13, "learning_rate": 4.7856719542862614e-05, "loss": 0.6001, "step": 9915 }, { "epoch": 0.13, "learning_rate": 4.785458752209406e-05, "loss": 1.3792, "step": 9920 }, { "epoch": 0.13, "learning_rate": 4.7852454488981614e-05, "loss": 0.388, "step": 9925 }, { "epoch": 0.13, "learning_rate": 4.785032044361976e-05, "loss": 0.5962, "step": 9930 }, { "epoch": 0.13, "learning_rate": 4.7848185386103014e-05, "loss": 0.8759, "step": 9935 }, { "epoch": 0.13, "learning_rate": 4.7846049316525977e-05, "loss": 1.1187, "step": 9940 }, { "epoch": 0.13, "learning_rate": 4.784391223498325e-05, "loss": 0.929, "step": 9945 }, { "epoch": 0.13, "learning_rate": 4.784177414156949e-05, "loss": 0.8253, "step": 9950 }, { "epoch": 0.13, "learning_rate": 4.783963503637941e-05, "loss": 0.9294, "step": 9955 }, { "epoch": 0.13, "learning_rate": 4.7837494919507764e-05, "loss": 0.5894, "step": 9960 }, { "epoch": 0.13, "learning_rate": 4.783535379104934e-05, "loss": 0.9567, "step": 9965 }, { "epoch": 0.13, "learning_rate": 4.7833211651098985e-05, "loss": 0.5116, "step": 9970 }, { "epoch": 0.13, "learning_rate": 4.783106849975159e-05, "loss": 1.1773, "step": 9975 }, { "epoch": 0.13, "learning_rate": 4.7828924337102075e-05, "loss": 0.3304, "step": 9980 }, { "epoch": 0.13, "learning_rate": 4.7826779163245424e-05, "loss": 0.5927, "step": 9985 }, { "epoch": 0.13, "learning_rate": 4.782463297827666e-05, "loss": 0.4952, "step": 9990 }, { "epoch": 0.13, "learning_rate": 4.7822485782290835e-05, "loss": 1.0959, "step": 9995 }, { "epoch": 0.13, "learning_rate": 4.782033757538308e-05, "loss": 0.6686, "step": 10000 }, { "epoch": 0.13, "learning_rate": 4.7818188357648525e-05, "loss": 0.5324, "step": 10005 }, { "epoch": 0.13, "learning_rate": 4.7816038129182385e-05, "loss": 0.9648, "step": 10010 }, { "epoch": 0.13, "learning_rate": 4.78138868900799e-05, "loss": 0.9519, "step": 10015 }, { "epoch": 0.13, "learning_rate": 4.781173464043636e-05, "loss": 0.1964, "step": 10020 }, { "epoch": 0.13, "learning_rate": 4.78095813803471e-05, "loss": 1.6336, "step": 10025 }, { "epoch": 0.13, "learning_rate": 4.78074271099075e-05, "loss": 0.8705, "step": 10030 }, { "epoch": 0.13, "learning_rate": 4.7805271829212975e-05, "loss": 0.4373, "step": 10035 }, { "epoch": 0.13, "learning_rate": 4.7803115538359e-05, "loss": 1.2123, "step": 10040 }, { "epoch": 0.13, "learning_rate": 4.780095823744109e-05, "loss": 0.369, "step": 10045 }, { "epoch": 0.13, "learning_rate": 4.7798799926554804e-05, "loss": 0.5521, "step": 10050 }, { "epoch": 0.13, "learning_rate": 4.779664060579573e-05, "loss": 1.0541, "step": 10055 }, { "epoch": 0.13, "learning_rate": 4.7794480275259534e-05, "loss": 0.9843, "step": 10060 }, { "epoch": 0.13, "learning_rate": 4.779231893504189e-05, "loss": 0.5914, "step": 10065 }, { "epoch": 0.13, "learning_rate": 4.779015658523855e-05, "loss": 0.5511, "step": 10070 }, { "epoch": 0.13, "learning_rate": 4.778799322594529e-05, "loss": 1.119, "step": 10075 }, { "epoch": 0.14, "learning_rate": 4.778582885725793e-05, "loss": 1.2106, "step": 10080 }, { "epoch": 0.14, "learning_rate": 4.7783663479272356e-05, "loss": 0.723, "step": 10085 }, { "epoch": 0.14, "learning_rate": 4.778149709208446e-05, "loss": 0.7142, "step": 10090 }, { "epoch": 0.14, "learning_rate": 4.777932969579022e-05, "loss": 0.9893, "step": 10095 }, { "epoch": 0.14, "learning_rate": 4.777716129048564e-05, "loss": 0.7353, "step": 10100 }, { "epoch": 0.14, "learning_rate": 4.777499187626676e-05, "loss": 0.685, "step": 10105 }, { "epoch": 0.14, "learning_rate": 4.777282145322968e-05, "loss": 1.0527, "step": 10110 }, { "epoch": 0.14, "learning_rate": 4.777065002147054e-05, "loss": 0.4958, "step": 10115 }, { "epoch": 0.14, "learning_rate": 4.7768477581085526e-05, "loss": 1.1132, "step": 10120 }, { "epoch": 0.14, "learning_rate": 4.776630413217085e-05, "loss": 0.7657, "step": 10125 }, { "epoch": 0.14, "learning_rate": 4.776412967482281e-05, "loss": 0.8644, "step": 10130 }, { "epoch": 0.14, "learning_rate": 4.77619542091377e-05, "loss": 0.7478, "step": 10135 }, { "epoch": 0.14, "learning_rate": 4.77597777352119e-05, "loss": 0.7706, "step": 10140 }, { "epoch": 0.14, "learning_rate": 4.775760025314181e-05, "loss": 0.4555, "step": 10145 }, { "epoch": 0.14, "learning_rate": 4.775542176302388e-05, "loss": 0.8833, "step": 10150 }, { "epoch": 0.14, "learning_rate": 4.775324226495461e-05, "loss": 0.6524, "step": 10155 }, { "epoch": 0.14, "learning_rate": 4.775106175903054e-05, "loss": 0.8154, "step": 10160 }, { "epoch": 0.14, "learning_rate": 4.774888024534825e-05, "loss": 0.7918, "step": 10165 }, { "epoch": 0.14, "learning_rate": 4.7746697724004366e-05, "loss": 0.7544, "step": 10170 }, { "epoch": 0.14, "learning_rate": 4.774451419509558e-05, "loss": 0.994, "step": 10175 }, { "epoch": 0.14, "learning_rate": 4.774232965871861e-05, "loss": 0.5328, "step": 10180 }, { "epoch": 0.14, "learning_rate": 4.7740144114970195e-05, "loss": 1.1567, "step": 10185 }, { "epoch": 0.14, "learning_rate": 4.7737957563947176e-05, "loss": 0.7956, "step": 10190 }, { "epoch": 0.14, "learning_rate": 4.773577000574638e-05, "loss": 0.6007, "step": 10195 }, { "epoch": 0.14, "learning_rate": 4.773358144046472e-05, "loss": 0.9387, "step": 10200 }, { "epoch": 0.14, "learning_rate": 4.7731391868199146e-05, "loss": 1.2307, "step": 10205 }, { "epoch": 0.14, "learning_rate": 4.772920128904662e-05, "loss": 0.5043, "step": 10210 }, { "epoch": 0.14, "learning_rate": 4.77270097031042e-05, "loss": 0.2984, "step": 10215 }, { "epoch": 0.14, "learning_rate": 4.772481711046893e-05, "loss": 1.0094, "step": 10220 }, { "epoch": 0.14, "learning_rate": 4.772262351123797e-05, "loss": 1.7482, "step": 10225 }, { "epoch": 0.14, "learning_rate": 4.772042890550846e-05, "loss": 1.0971, "step": 10230 }, { "epoch": 0.14, "learning_rate": 4.771823329337761e-05, "loss": 1.5578, "step": 10235 }, { "epoch": 0.14, "learning_rate": 4.771603667494269e-05, "loss": 0.6284, "step": 10240 }, { "epoch": 0.14, "learning_rate": 4.771383905030099e-05, "loss": 0.5875, "step": 10245 }, { "epoch": 0.14, "learning_rate": 4.771164041954984e-05, "loss": 0.6786, "step": 10250 }, { "epoch": 0.14, "learning_rate": 4.7709440782786654e-05, "loss": 0.8102, "step": 10255 }, { "epoch": 0.14, "learning_rate": 4.770724014010886e-05, "loss": 1.0403, "step": 10260 }, { "epoch": 0.14, "learning_rate": 4.770503849161391e-05, "loss": 1.2341, "step": 10265 }, { "epoch": 0.14, "learning_rate": 4.770283583739935e-05, "loss": 0.4445, "step": 10270 }, { "epoch": 0.14, "learning_rate": 4.7700632177562754e-05, "loss": 1.0748, "step": 10275 }, { "epoch": 0.14, "learning_rate": 4.76984275122017e-05, "loss": 0.6405, "step": 10280 }, { "epoch": 0.14, "learning_rate": 4.769622184141388e-05, "loss": 1.2489, "step": 10285 }, { "epoch": 0.14, "learning_rate": 4.769401516529698e-05, "loss": 0.3974, "step": 10290 }, { "epoch": 0.14, "learning_rate": 4.769180748394874e-05, "loss": 1.2375, "step": 10295 }, { "epoch": 0.14, "learning_rate": 4.768959879746694e-05, "loss": 0.3164, "step": 10300 }, { "epoch": 0.14, "learning_rate": 4.768738910594943e-05, "loss": 0.7714, "step": 10305 }, { "epoch": 0.14, "learning_rate": 4.768517840949409e-05, "loss": 0.744, "step": 10310 }, { "epoch": 0.14, "learning_rate": 4.768296670819884e-05, "loss": 0.6641, "step": 10315 }, { "epoch": 0.14, "learning_rate": 4.7680754002161635e-05, "loss": 1.2144, "step": 10320 }, { "epoch": 0.14, "learning_rate": 4.76785402914805e-05, "loss": 1.183, "step": 10325 }, { "epoch": 0.14, "learning_rate": 4.7676325576253486e-05, "loss": 0.4724, "step": 10330 }, { "epoch": 0.14, "learning_rate": 4.76741098565787e-05, "loss": 0.8067, "step": 10335 }, { "epoch": 0.14, "learning_rate": 4.767189313255428e-05, "loss": 0.8402, "step": 10340 }, { "epoch": 0.14, "learning_rate": 4.766967540427841e-05, "loss": 0.6562, "step": 10345 }, { "epoch": 0.14, "learning_rate": 4.766745667184934e-05, "loss": 0.3731, "step": 10350 }, { "epoch": 0.14, "learning_rate": 4.766523693536534e-05, "loss": 1.4322, "step": 10355 }, { "epoch": 0.14, "learning_rate": 4.7663016194924736e-05, "loss": 0.7137, "step": 10360 }, { "epoch": 0.14, "learning_rate": 4.76607944506259e-05, "loss": 1.0227, "step": 10365 }, { "epoch": 0.14, "learning_rate": 4.765857170256722e-05, "loss": 0.7119, "step": 10370 }, { "epoch": 0.14, "learning_rate": 4.7656347950847184e-05, "loss": 0.7348, "step": 10375 }, { "epoch": 0.14, "learning_rate": 4.765412319556428e-05, "loss": 1.1485, "step": 10380 }, { "epoch": 0.14, "learning_rate": 4.765189743681705e-05, "loss": 0.5319, "step": 10385 }, { "epoch": 0.14, "learning_rate": 4.76496706747041e-05, "loss": 0.791, "step": 10390 }, { "epoch": 0.14, "learning_rate": 4.764744290932403e-05, "loss": 0.4282, "step": 10395 }, { "epoch": 0.14, "learning_rate": 4.764521414077555e-05, "loss": 1.7415, "step": 10400 }, { "epoch": 0.14, "learning_rate": 4.7642984369157376e-05, "loss": 0.309, "step": 10405 }, { "epoch": 0.14, "learning_rate": 4.7640753594568277e-05, "loss": 0.9659, "step": 10410 }, { "epoch": 0.14, "learning_rate": 4.763852181710705e-05, "loss": 0.798, "step": 10415 }, { "epoch": 0.14, "learning_rate": 4.763628903687257e-05, "loss": 1.1751, "step": 10420 }, { "epoch": 0.14, "learning_rate": 4.7634055253963736e-05, "loss": 0.5747, "step": 10425 }, { "epoch": 0.14, "learning_rate": 4.7631820468479485e-05, "loss": 0.5774, "step": 10430 }, { "epoch": 0.14, "learning_rate": 4.762958468051881e-05, "loss": 0.273, "step": 10435 }, { "epoch": 0.14, "learning_rate": 4.762734789018075e-05, "loss": 0.9676, "step": 10440 }, { "epoch": 0.14, "learning_rate": 4.762511009756437e-05, "loss": 0.4925, "step": 10445 }, { "epoch": 0.14, "learning_rate": 4.762287130276882e-05, "loss": 0.57, "step": 10450 }, { "epoch": 0.14, "learning_rate": 4.7620631505893234e-05, "loss": 0.9788, "step": 10455 }, { "epoch": 0.14, "learning_rate": 4.761839070703685e-05, "loss": 0.6179, "step": 10460 }, { "epoch": 0.14, "learning_rate": 4.7616148906298905e-05, "loss": 0.4654, "step": 10465 }, { "epoch": 0.14, "learning_rate": 4.761390610377872e-05, "loss": 0.77, "step": 10470 }, { "epoch": 0.14, "learning_rate": 4.761166229957562e-05, "loss": 0.8135, "step": 10475 }, { "epoch": 0.14, "learning_rate": 4.7609417493789e-05, "loss": 1.1477, "step": 10480 }, { "epoch": 0.14, "learning_rate": 4.76071716865183e-05, "loss": 1.134, "step": 10485 }, { "epoch": 0.14, "learning_rate": 4.760492487786299e-05, "loss": 0.7811, "step": 10490 }, { "epoch": 0.14, "learning_rate": 4.7602677067922604e-05, "loss": 1.3194, "step": 10495 }, { "epoch": 0.14, "learning_rate": 4.7600428256796695e-05, "loss": 0.3124, "step": 10500 }, { "epoch": 0.14, "learning_rate": 4.759817844458489e-05, "loss": 0.7561, "step": 10505 }, { "epoch": 0.14, "learning_rate": 4.7595927631386826e-05, "loss": 0.9677, "step": 10510 }, { "epoch": 0.14, "learning_rate": 4.7593675817302216e-05, "loss": 0.423, "step": 10515 }, { "epoch": 0.14, "learning_rate": 4.75914230024308e-05, "loss": 0.4467, "step": 10520 }, { "epoch": 0.14, "learning_rate": 4.7589169186872365e-05, "loss": 0.4003, "step": 10525 }, { "epoch": 0.14, "learning_rate": 4.7586914370726746e-05, "loss": 1.2682, "step": 10530 }, { "epoch": 0.14, "learning_rate": 4.7584658554093816e-05, "loss": 1.1048, "step": 10535 }, { "epoch": 0.14, "learning_rate": 4.75824017370735e-05, "loss": 0.842, "step": 10540 }, { "epoch": 0.14, "learning_rate": 4.758014391976577e-05, "loss": 1.2344, "step": 10545 }, { "epoch": 0.14, "learning_rate": 4.7577885102270625e-05, "loss": 0.6664, "step": 10550 }, { "epoch": 0.14, "learning_rate": 4.757562528468812e-05, "loss": 0.1736, "step": 10555 }, { "epoch": 0.14, "learning_rate": 4.757336446711836e-05, "loss": 0.6526, "step": 10560 }, { "epoch": 0.14, "learning_rate": 4.7571102649661485e-05, "loss": 0.6032, "step": 10565 }, { "epoch": 0.14, "learning_rate": 4.756883983241768e-05, "loss": 0.6401, "step": 10570 }, { "epoch": 0.14, "learning_rate": 4.7566576015487185e-05, "loss": 0.202, "step": 10575 }, { "epoch": 0.14, "learning_rate": 4.756431119897027e-05, "loss": 1.2508, "step": 10580 }, { "epoch": 0.14, "learning_rate": 4.7562045382967244e-05, "loss": 0.8815, "step": 10585 }, { "epoch": 0.14, "learning_rate": 4.7559778567578494e-05, "loss": 0.8895, "step": 10590 }, { "epoch": 0.14, "learning_rate": 4.755751075290441e-05, "loss": 1.9446, "step": 10595 }, { "epoch": 0.14, "learning_rate": 4.7555241939045446e-05, "loss": 1.7407, "step": 10600 }, { "epoch": 0.14, "learning_rate": 4.755297212610211e-05, "loss": 0.9629, "step": 10605 }, { "epoch": 0.14, "learning_rate": 4.7550701314174943e-05, "loss": 0.8277, "step": 10610 }, { "epoch": 0.14, "learning_rate": 4.754842950336452e-05, "loss": 0.5351, "step": 10615 }, { "epoch": 0.14, "learning_rate": 4.7546156693771485e-05, "loss": 1.0266, "step": 10620 }, { "epoch": 0.14, "learning_rate": 4.754388288549649e-05, "loss": 0.4748, "step": 10625 }, { "epoch": 0.14, "learning_rate": 4.754160807864027e-05, "loss": 0.4828, "step": 10630 }, { "epoch": 0.14, "learning_rate": 4.753933227330359e-05, "loss": 1.0082, "step": 10635 }, { "epoch": 0.14, "learning_rate": 4.7537055469587246e-05, "loss": 0.611, "step": 10640 }, { "epoch": 0.14, "learning_rate": 4.7534777667592095e-05, "loss": 0.5213, "step": 10645 }, { "epoch": 0.14, "learning_rate": 4.753249886741903e-05, "loss": 0.5762, "step": 10650 }, { "epoch": 0.14, "learning_rate": 4.7530219069168995e-05, "loss": 1.3051, "step": 10655 }, { "epoch": 0.14, "learning_rate": 4.752793827294297e-05, "loss": 0.541, "step": 10660 }, { "epoch": 0.14, "learning_rate": 4.752565647884199e-05, "loss": 0.828, "step": 10665 }, { "epoch": 0.14, "learning_rate": 4.7523373686967104e-05, "loss": 0.8232, "step": 10670 }, { "epoch": 0.14, "learning_rate": 4.752108989741945e-05, "loss": 0.4555, "step": 10675 }, { "epoch": 0.14, "learning_rate": 4.7518805110300193e-05, "loss": 0.8456, "step": 10680 }, { "epoch": 0.14, "learning_rate": 4.751651932571052e-05, "loss": 0.4662, "step": 10685 }, { "epoch": 0.14, "learning_rate": 4.751423254375168e-05, "loss": 0.5457, "step": 10690 }, { "epoch": 0.14, "learning_rate": 4.751194476452499e-05, "loss": 1.0297, "step": 10695 }, { "epoch": 0.14, "learning_rate": 4.750965598813176e-05, "loss": 0.3155, "step": 10700 }, { "epoch": 0.14, "learning_rate": 4.7507366214673384e-05, "loss": 0.3117, "step": 10705 }, { "epoch": 0.14, "learning_rate": 4.750507544425128e-05, "loss": 0.8371, "step": 10710 }, { "epoch": 0.14, "learning_rate": 4.7502783676966935e-05, "loss": 1.0471, "step": 10715 }, { "epoch": 0.14, "learning_rate": 4.750049091292184e-05, "loss": 0.8249, "step": 10720 }, { "epoch": 0.14, "learning_rate": 4.749819715221757e-05, "loss": 0.622, "step": 10725 }, { "epoch": 0.14, "learning_rate": 4.749590239495572e-05, "loss": 0.5835, "step": 10730 }, { "epoch": 0.14, "learning_rate": 4.749360664123794e-05, "loss": 1.0733, "step": 10735 }, { "epoch": 0.14, "learning_rate": 4.7491309891165913e-05, "loss": 1.4486, "step": 10740 }, { "epoch": 0.14, "learning_rate": 4.7489012144841385e-05, "loss": 0.2968, "step": 10745 }, { "epoch": 0.14, "learning_rate": 4.7486713402366125e-05, "loss": 0.982, "step": 10750 }, { "epoch": 0.14, "learning_rate": 4.748441366384195e-05, "loss": 0.6264, "step": 10755 }, { "epoch": 0.14, "learning_rate": 4.748211292937075e-05, "loss": 1.01, "step": 10760 }, { "epoch": 0.14, "learning_rate": 4.747981119905441e-05, "loss": 0.8098, "step": 10765 }, { "epoch": 0.14, "learning_rate": 4.74775084729949e-05, "loss": 0.9644, "step": 10770 }, { "epoch": 0.14, "learning_rate": 4.747520475129422e-05, "loss": 1.3363, "step": 10775 }, { "epoch": 0.14, "learning_rate": 4.74729000340544e-05, "loss": 0.518, "step": 10780 }, { "epoch": 0.14, "learning_rate": 4.747059432137755e-05, "loss": 0.6329, "step": 10785 }, { "epoch": 0.14, "learning_rate": 4.746828761336578e-05, "loss": 0.4461, "step": 10790 }, { "epoch": 0.14, "learning_rate": 4.746597991012128e-05, "loss": 0.46, "step": 10795 }, { "epoch": 0.14, "learning_rate": 4.7463671211746255e-05, "loss": 0.154, "step": 10800 }, { "epoch": 0.14, "learning_rate": 4.7461361518342984e-05, "loss": 0.4736, "step": 10805 }, { "epoch": 0.14, "learning_rate": 4.745905083001377e-05, "loss": 0.6889, "step": 10810 }, { "epoch": 0.14, "learning_rate": 4.7456739146860953e-05, "loss": 0.5073, "step": 10815 }, { "epoch": 0.14, "learning_rate": 4.745442646898695e-05, "loss": 0.6079, "step": 10820 }, { "epoch": 0.15, "learning_rate": 4.745211279649418e-05, "loss": 0.5972, "step": 10825 }, { "epoch": 0.15, "learning_rate": 4.744979812948515e-05, "loss": 1.3442, "step": 10830 }, { "epoch": 0.15, "learning_rate": 4.744748246806238e-05, "loss": 1.0254, "step": 10835 }, { "epoch": 0.15, "learning_rate": 4.744516581232842e-05, "loss": 0.8014, "step": 10840 }, { "epoch": 0.15, "learning_rate": 4.744284816238591e-05, "loss": 0.7941, "step": 10845 }, { "epoch": 0.15, "learning_rate": 4.744052951833751e-05, "loss": 0.6458, "step": 10850 }, { "epoch": 0.15, "learning_rate": 4.7438209880285916e-05, "loss": 0.8467, "step": 10855 }, { "epoch": 0.15, "learning_rate": 4.743588924833387e-05, "loss": 0.4801, "step": 10860 }, { "epoch": 0.15, "learning_rate": 4.743356762258419e-05, "loss": 1.4848, "step": 10865 }, { "epoch": 0.15, "learning_rate": 4.743124500313969e-05, "loss": 0.8278, "step": 10870 }, { "epoch": 0.15, "learning_rate": 4.742892139010325e-05, "loss": 1.0828, "step": 10875 }, { "epoch": 0.15, "learning_rate": 4.7426596783577806e-05, "loss": 1.0107, "step": 10880 }, { "epoch": 0.15, "learning_rate": 4.742427118366632e-05, "loss": 1.0178, "step": 10885 }, { "epoch": 0.15, "learning_rate": 4.7421944590471805e-05, "loss": 0.5589, "step": 10890 }, { "epoch": 0.15, "learning_rate": 4.7419617004097324e-05, "loss": 0.917, "step": 10895 }, { "epoch": 0.15, "learning_rate": 4.7417288424645966e-05, "loss": 0.6427, "step": 10900 }, { "epoch": 0.15, "learning_rate": 4.741495885222088e-05, "loss": 0.6122, "step": 10905 }, { "epoch": 0.15, "learning_rate": 4.741262828692525e-05, "loss": 0.8567, "step": 10910 }, { "epoch": 0.15, "learning_rate": 4.741029672886232e-05, "loss": 0.6807, "step": 10915 }, { "epoch": 0.15, "learning_rate": 4.7407964178135365e-05, "loss": 0.7875, "step": 10920 }, { "epoch": 0.15, "learning_rate": 4.74056306348477e-05, "loss": 0.5909, "step": 10925 }, { "epoch": 0.15, "learning_rate": 4.740329609910268e-05, "loss": 1.5102, "step": 10930 }, { "epoch": 0.15, "learning_rate": 4.7400960571003734e-05, "loss": 0.518, "step": 10935 }, { "epoch": 0.15, "learning_rate": 4.7398624050654294e-05, "loss": 0.26, "step": 10940 }, { "epoch": 0.15, "learning_rate": 4.739628653815788e-05, "loss": 0.3743, "step": 10945 }, { "epoch": 0.15, "learning_rate": 4.7393948033618e-05, "loss": 0.5365, "step": 10950 }, { "epoch": 0.15, "learning_rate": 4.739160853713826e-05, "loss": 0.5195, "step": 10955 }, { "epoch": 0.15, "learning_rate": 4.738926804882229e-05, "loss": 0.9785, "step": 10960 }, { "epoch": 0.15, "learning_rate": 4.738692656877375e-05, "loss": 1.2768, "step": 10965 }, { "epoch": 0.15, "learning_rate": 4.7384584097096366e-05, "loss": 0.9448, "step": 10970 }, { "epoch": 0.15, "learning_rate": 4.738224063389389e-05, "loss": 0.4233, "step": 10975 }, { "epoch": 0.15, "learning_rate": 4.7379896179270125e-05, "loss": 0.5075, "step": 10980 }, { "epoch": 0.15, "learning_rate": 4.737755073332893e-05, "loss": 1.3353, "step": 10985 }, { "epoch": 0.15, "learning_rate": 4.737520429617418e-05, "loss": 0.4456, "step": 10990 }, { "epoch": 0.15, "learning_rate": 4.7372856867909824e-05, "loss": 0.7047, "step": 10995 }, { "epoch": 0.15, "learning_rate": 4.737050844863984e-05, "loss": 1.1544, "step": 11000 }, { "epoch": 0.15, "learning_rate": 4.736815903846824e-05, "loss": 0.9892, "step": 11005 }, { "epoch": 0.15, "learning_rate": 4.73658086374991e-05, "loss": 0.3335, "step": 11010 }, { "epoch": 0.15, "learning_rate": 4.736345724583654e-05, "loss": 0.9449, "step": 11015 }, { "epoch": 0.15, "learning_rate": 4.736110486358469e-05, "loss": 0.9536, "step": 11020 }, { "epoch": 0.15, "learning_rate": 4.735875149084778e-05, "loss": 0.888, "step": 11025 }, { "epoch": 0.15, "learning_rate": 4.7356397127730025e-05, "loss": 0.6724, "step": 11030 }, { "epoch": 0.15, "learning_rate": 4.735404177433573e-05, "loss": 0.5485, "step": 11035 }, { "epoch": 0.15, "learning_rate": 4.735168543076921e-05, "loss": 0.7831, "step": 11040 }, { "epoch": 0.15, "learning_rate": 4.734932809713485e-05, "loss": 1.1672, "step": 11045 }, { "epoch": 0.15, "learning_rate": 4.734696977353707e-05, "loss": 0.5772, "step": 11050 }, { "epoch": 0.15, "learning_rate": 4.7344610460080326e-05, "loss": 0.2092, "step": 11055 }, { "epoch": 0.15, "learning_rate": 4.7342250156869125e-05, "loss": 0.7579, "step": 11060 }, { "epoch": 0.15, "learning_rate": 4.733988886400801e-05, "loss": 0.2174, "step": 11065 }, { "epoch": 0.15, "learning_rate": 4.733752658160159e-05, "loss": 1.2513, "step": 11070 }, { "epoch": 0.15, "learning_rate": 4.733516330975449e-05, "loss": 0.5521, "step": 11075 }, { "epoch": 0.15, "learning_rate": 4.7332799048571396e-05, "loss": 0.8567, "step": 11080 }, { "epoch": 0.15, "learning_rate": 4.7330433798157026e-05, "loss": 0.5805, "step": 11085 }, { "epoch": 0.15, "learning_rate": 4.7328067558616163e-05, "loss": 1.1747, "step": 11090 }, { "epoch": 0.15, "learning_rate": 4.7325700330053605e-05, "loss": 1.2024, "step": 11095 }, { "epoch": 0.15, "learning_rate": 4.732333211257421e-05, "loss": 1.0597, "step": 11100 }, { "epoch": 0.15, "learning_rate": 4.7320962906282894e-05, "loss": 0.7227, "step": 11105 }, { "epoch": 0.15, "learning_rate": 4.731859271128459e-05, "loss": 0.5641, "step": 11110 }, { "epoch": 0.15, "learning_rate": 4.731622152768428e-05, "loss": 0.7796, "step": 11115 }, { "epoch": 0.15, "learning_rate": 4.7313849355586994e-05, "loss": 0.6174, "step": 11120 }, { "epoch": 0.15, "learning_rate": 4.731147619509783e-05, "loss": 0.9136, "step": 11125 }, { "epoch": 0.15, "learning_rate": 4.730910204632188e-05, "loss": 0.2762, "step": 11130 }, { "epoch": 0.15, "learning_rate": 4.7306726909364316e-05, "loss": 0.5945, "step": 11135 }, { "epoch": 0.15, "learning_rate": 4.7304350784330355e-05, "loss": 1.0562, "step": 11140 }, { "epoch": 0.15, "learning_rate": 4.730197367132523e-05, "loss": 0.3967, "step": 11145 }, { "epoch": 0.15, "learning_rate": 4.729959557045425e-05, "loss": 0.3012, "step": 11150 }, { "epoch": 0.15, "learning_rate": 4.729721648182275e-05, "loss": 0.8563, "step": 11155 }, { "epoch": 0.15, "learning_rate": 4.7294836405536104e-05, "loss": 1.7121, "step": 11160 }, { "epoch": 0.15, "learning_rate": 4.729245534169975e-05, "loss": 0.5286, "step": 11165 }, { "epoch": 0.15, "learning_rate": 4.729007329041915e-05, "loss": 0.5413, "step": 11170 }, { "epoch": 0.15, "learning_rate": 4.728769025179981e-05, "loss": 0.7856, "step": 11175 }, { "epoch": 0.15, "learning_rate": 4.728530622594729e-05, "loss": 0.7514, "step": 11180 }, { "epoch": 0.15, "learning_rate": 4.72829212129672e-05, "loss": 0.5114, "step": 11185 }, { "epoch": 0.15, "learning_rate": 4.728053521296518e-05, "loss": 1.1072, "step": 11190 }, { "epoch": 0.15, "learning_rate": 4.727814822604691e-05, "loss": 1.015, "step": 11195 }, { "epoch": 0.15, "learning_rate": 4.727576025231814e-05, "loss": 0.6481, "step": 11200 }, { "epoch": 0.15, "learning_rate": 4.727337129188463e-05, "loss": 0.7051, "step": 11205 }, { "epoch": 0.15, "learning_rate": 4.7270981344852195e-05, "loss": 0.5636, "step": 11210 }, { "epoch": 0.15, "learning_rate": 4.726859041132671e-05, "loss": 0.9688, "step": 11215 }, { "epoch": 0.15, "learning_rate": 4.726619849141407e-05, "loss": 1.2316, "step": 11220 }, { "epoch": 0.15, "learning_rate": 4.7263805585220234e-05, "loss": 0.2036, "step": 11225 }, { "epoch": 0.15, "learning_rate": 4.726141169285119e-05, "loss": 0.2478, "step": 11230 }, { "epoch": 0.15, "learning_rate": 4.725901681441298e-05, "loss": 1.1319, "step": 11235 }, { "epoch": 0.15, "learning_rate": 4.725662095001169e-05, "loss": 0.9345, "step": 11240 }, { "epoch": 0.15, "learning_rate": 4.725422409975343e-05, "loss": 0.1828, "step": 11245 }, { "epoch": 0.15, "learning_rate": 4.725182626374438e-05, "loss": 0.4511, "step": 11250 }, { "epoch": 0.15, "learning_rate": 4.724942744209076e-05, "loss": 1.1881, "step": 11255 }, { "epoch": 0.15, "learning_rate": 4.72470276348988e-05, "loss": 0.9072, "step": 11260 }, { "epoch": 0.15, "learning_rate": 4.7244626842274814e-05, "loss": 1.0133, "step": 11265 }, { "epoch": 0.15, "learning_rate": 4.7242225064325154e-05, "loss": 0.9189, "step": 11270 }, { "epoch": 0.15, "learning_rate": 4.723982230115619e-05, "loss": 0.7869, "step": 11275 }, { "epoch": 0.15, "learning_rate": 4.723741855287436e-05, "loss": 1.0067, "step": 11280 }, { "epoch": 0.15, "learning_rate": 4.7235013819586145e-05, "loss": 0.4006, "step": 11285 }, { "epoch": 0.15, "learning_rate": 4.723260810139805e-05, "loss": 0.8101, "step": 11290 }, { "epoch": 0.15, "learning_rate": 4.7230201398416655e-05, "loss": 1.0192, "step": 11295 }, { "epoch": 0.15, "learning_rate": 4.7227793710748534e-05, "loss": 0.622, "step": 11300 }, { "epoch": 0.15, "learning_rate": 4.722538503850036e-05, "loss": 0.4516, "step": 11305 }, { "epoch": 0.15, "learning_rate": 4.722297538177882e-05, "loss": 0.9, "step": 11310 }, { "epoch": 0.15, "learning_rate": 4.722056474069065e-05, "loss": 1.0423, "step": 11315 }, { "epoch": 0.15, "learning_rate": 4.721815311534263e-05, "loss": 0.9686, "step": 11320 }, { "epoch": 0.15, "learning_rate": 4.7215740505841576e-05, "loss": 0.6616, "step": 11325 }, { "epoch": 0.15, "learning_rate": 4.7213326912294364e-05, "loss": 0.4445, "step": 11330 }, { "epoch": 0.15, "learning_rate": 4.72109123348079e-05, "loss": 1.0013, "step": 11335 }, { "epoch": 0.15, "learning_rate": 4.720849677348914e-05, "loss": 0.9841, "step": 11340 }, { "epoch": 0.15, "learning_rate": 4.720608022844507e-05, "loss": 0.4283, "step": 11345 }, { "epoch": 0.15, "learning_rate": 4.720366269978275e-05, "loss": 0.9828, "step": 11350 }, { "epoch": 0.15, "learning_rate": 4.720124418760924e-05, "loss": 0.7449, "step": 11355 }, { "epoch": 0.15, "learning_rate": 4.719882469203168e-05, "loss": 0.9491, "step": 11360 }, { "epoch": 0.15, "learning_rate": 4.719640421315726e-05, "loss": 0.6613, "step": 11365 }, { "epoch": 0.15, "learning_rate": 4.719398275109317e-05, "loss": 0.4105, "step": 11370 }, { "epoch": 0.15, "learning_rate": 4.719156030594668e-05, "loss": 0.5717, "step": 11375 }, { "epoch": 0.15, "learning_rate": 4.7189136877825086e-05, "loss": 0.7141, "step": 11380 }, { "epoch": 0.15, "learning_rate": 4.718671246683574e-05, "loss": 0.9024, "step": 11385 }, { "epoch": 0.15, "learning_rate": 4.718428707308603e-05, "loss": 0.6936, "step": 11390 }, { "epoch": 0.15, "learning_rate": 4.718186069668338e-05, "loss": 0.6997, "step": 11395 }, { "epoch": 0.15, "learning_rate": 4.717943333773528e-05, "loss": 0.968, "step": 11400 }, { "epoch": 0.15, "learning_rate": 4.717700499634924e-05, "loss": 0.3095, "step": 11405 }, { "epoch": 0.15, "learning_rate": 4.7174575672632826e-05, "loss": 1.1099, "step": 11410 }, { "epoch": 0.15, "learning_rate": 4.7172145366693646e-05, "loss": 1.0479, "step": 11415 }, { "epoch": 0.15, "learning_rate": 4.716971407863935e-05, "loss": 0.692, "step": 11420 }, { "epoch": 0.15, "learning_rate": 4.716728180857764e-05, "loss": 0.382, "step": 11425 }, { "epoch": 0.15, "learning_rate": 4.7164848556616226e-05, "loss": 1.1458, "step": 11430 }, { "epoch": 0.15, "learning_rate": 4.7162414322862924e-05, "loss": 1.0735, "step": 11435 }, { "epoch": 0.15, "learning_rate": 4.715997910742554e-05, "loss": 0.9454, "step": 11440 }, { "epoch": 0.15, "learning_rate": 4.715754291041194e-05, "loss": 0.2914, "step": 11445 }, { "epoch": 0.15, "learning_rate": 4.715510573193005e-05, "loss": 1.0318, "step": 11450 }, { "epoch": 0.15, "learning_rate": 4.7152667572087804e-05, "loss": 0.4941, "step": 11455 }, { "epoch": 0.15, "learning_rate": 4.715022843099322e-05, "loss": 0.3833, "step": 11460 }, { "epoch": 0.15, "learning_rate": 4.7147788308754314e-05, "loss": 0.7025, "step": 11465 }, { "epoch": 0.15, "learning_rate": 4.714534720547921e-05, "loss": 0.5362, "step": 11470 }, { "epoch": 0.15, "learning_rate": 4.7142905121275995e-05, "loss": 1.2728, "step": 11475 }, { "epoch": 0.15, "learning_rate": 4.714046205625287e-05, "loss": 0.43, "step": 11480 }, { "epoch": 0.15, "learning_rate": 4.713801801051804e-05, "loss": 1.028, "step": 11485 }, { "epoch": 0.15, "learning_rate": 4.7135572984179765e-05, "loss": 0.8458, "step": 11490 }, { "epoch": 0.15, "learning_rate": 4.7133126977346346e-05, "loss": 0.3482, "step": 11495 }, { "epoch": 0.15, "learning_rate": 4.7130679990126135e-05, "loss": 1.2089, "step": 11500 }, { "epoch": 0.15, "learning_rate": 4.712823202262752e-05, "loss": 0.5194, "step": 11505 }, { "epoch": 0.15, "learning_rate": 4.7125783074958915e-05, "loss": 0.1843, "step": 11510 }, { "epoch": 0.15, "learning_rate": 4.712333314722882e-05, "loss": 0.5577, "step": 11515 }, { "epoch": 0.15, "learning_rate": 4.712088223954575e-05, "loss": 1.015, "step": 11520 }, { "epoch": 0.15, "learning_rate": 4.711843035201826e-05, "loss": 0.8109, "step": 11525 }, { "epoch": 0.15, "learning_rate": 4.711597748475497e-05, "loss": 0.756, "step": 11530 }, { "epoch": 0.15, "learning_rate": 4.711352363786451e-05, "loss": 0.8037, "step": 11535 }, { "epoch": 0.15, "learning_rate": 4.711106881145558e-05, "loss": 0.4477, "step": 11540 }, { "epoch": 0.15, "learning_rate": 4.7108613005636923e-05, "loss": 1.3553, "step": 11545 }, { "epoch": 0.15, "learning_rate": 4.710615622051732e-05, "loss": 1.1123, "step": 11550 }, { "epoch": 0.15, "learning_rate": 4.710369845620559e-05, "loss": 0.4254, "step": 11555 }, { "epoch": 0.15, "learning_rate": 4.71012397128106e-05, "loss": 0.9754, "step": 11560 }, { "epoch": 0.15, "learning_rate": 4.7098779990441256e-05, "loss": 1.0303, "step": 11565 }, { "epoch": 0.16, "learning_rate": 4.7096319289206515e-05, "loss": 0.6403, "step": 11570 }, { "epoch": 0.16, "learning_rate": 4.709385760921538e-05, "loss": 0.7508, "step": 11575 }, { "epoch": 0.16, "learning_rate": 4.7091394950576875e-05, "loss": 0.8289, "step": 11580 }, { "epoch": 0.16, "learning_rate": 4.70889313134001e-05, "loss": 0.8083, "step": 11585 }, { "epoch": 0.16, "learning_rate": 4.7086466697794176e-05, "loss": 0.2857, "step": 11590 }, { "epoch": 0.16, "learning_rate": 4.708400110386827e-05, "loss": 0.8453, "step": 11595 }, { "epoch": 0.16, "learning_rate": 4.70815345317316e-05, "loss": 0.636, "step": 11600 }, { "epoch": 0.16, "learning_rate": 4.707906698149341e-05, "loss": 0.2677, "step": 11605 }, { "epoch": 0.16, "learning_rate": 4.7076598453263034e-05, "loss": 1.0412, "step": 11610 }, { "epoch": 0.16, "learning_rate": 4.707412894714977e-05, "loss": 0.8344, "step": 11615 }, { "epoch": 0.16, "learning_rate": 4.707165846326304e-05, "loss": 0.6991, "step": 11620 }, { "epoch": 0.16, "learning_rate": 4.706918700171226e-05, "loss": 1.3357, "step": 11625 }, { "epoch": 0.16, "learning_rate": 4.706671456260689e-05, "loss": 0.3491, "step": 11630 }, { "epoch": 0.16, "learning_rate": 4.7064241146056474e-05, "loss": 0.7174, "step": 11635 }, { "epoch": 0.16, "learning_rate": 4.706176675217056e-05, "loss": 0.5807, "step": 11640 }, { "epoch": 0.16, "learning_rate": 4.7059291381058744e-05, "loss": 0.4976, "step": 11645 }, { "epoch": 0.16, "learning_rate": 4.7056815032830686e-05, "loss": 0.4809, "step": 11650 }, { "epoch": 0.16, "learning_rate": 4.7054337707596066e-05, "loss": 1.2348, "step": 11655 }, { "epoch": 0.16, "learning_rate": 4.705185940546461e-05, "loss": 1.0117, "step": 11660 }, { "epoch": 0.16, "learning_rate": 4.704938012654612e-05, "loss": 0.9202, "step": 11665 }, { "epoch": 0.16, "learning_rate": 4.7046899870950395e-05, "loss": 1.2833, "step": 11670 }, { "epoch": 0.16, "learning_rate": 4.7044418638787304e-05, "loss": 0.6552, "step": 11675 }, { "epoch": 0.16, "learning_rate": 4.704193643016675e-05, "loss": 0.1913, "step": 11680 }, { "epoch": 0.16, "learning_rate": 4.7039453245198685e-05, "loss": 0.3526, "step": 11685 }, { "epoch": 0.16, "learning_rate": 4.70369690839931e-05, "loss": 0.4972, "step": 11690 }, { "epoch": 0.16, "learning_rate": 4.703448394666003e-05, "loss": 0.9935, "step": 11695 }, { "epoch": 0.16, "learning_rate": 4.703199783330956e-05, "loss": 0.2902, "step": 11700 }, { "epoch": 0.16, "learning_rate": 4.702951074405181e-05, "loss": 0.5028, "step": 11705 }, { "epoch": 0.16, "learning_rate": 4.7027022678996934e-05, "loss": 0.1238, "step": 11710 }, { "epoch": 0.16, "learning_rate": 4.702453363825516e-05, "loss": 0.982, "step": 11715 }, { "epoch": 0.16, "learning_rate": 4.702204362193673e-05, "loss": 0.8326, "step": 11720 }, { "epoch": 0.16, "learning_rate": 4.7019552630151945e-05, "loss": 0.4706, "step": 11725 }, { "epoch": 0.16, "learning_rate": 4.701706066301113e-05, "loss": 0.1009, "step": 11730 }, { "epoch": 0.16, "learning_rate": 4.701456772062468e-05, "loss": 0.4743, "step": 11735 }, { "epoch": 0.16, "learning_rate": 4.7012073803103016e-05, "loss": 0.5488, "step": 11740 }, { "epoch": 0.16, "learning_rate": 4.70095789105566e-05, "loss": 0.6157, "step": 11745 }, { "epoch": 0.16, "learning_rate": 4.700708304309596e-05, "loss": 0.2852, "step": 11750 }, { "epoch": 0.16, "learning_rate": 4.700458620083162e-05, "loss": 0.6695, "step": 11755 }, { "epoch": 0.16, "learning_rate": 4.7002088383874216e-05, "loss": 0.2726, "step": 11760 }, { "epoch": 0.16, "learning_rate": 4.699958959233436e-05, "loss": 0.9301, "step": 11765 }, { "epoch": 0.16, "learning_rate": 4.699708982632275e-05, "loss": 1.0945, "step": 11770 }, { "epoch": 0.16, "learning_rate": 4.699458908595011e-05, "loss": 0.2481, "step": 11775 }, { "epoch": 0.16, "learning_rate": 4.69920873713272e-05, "loss": 0.9625, "step": 11780 }, { "epoch": 0.16, "learning_rate": 4.698958468256485e-05, "loss": 0.8037, "step": 11785 }, { "epoch": 0.16, "learning_rate": 4.698708101977391e-05, "loss": 0.8268, "step": 11790 }, { "epoch": 0.16, "learning_rate": 4.698457638306527e-05, "loss": 1.0628, "step": 11795 }, { "epoch": 0.16, "learning_rate": 4.698207077254989e-05, "loss": 0.8318, "step": 11800 }, { "epoch": 0.16, "learning_rate": 4.697956418833874e-05, "loss": 1.1315, "step": 11805 }, { "epoch": 0.16, "learning_rate": 4.6977056630542874e-05, "loss": 1.0291, "step": 11810 }, { "epoch": 0.16, "learning_rate": 4.697454809927333e-05, "loss": 0.3041, "step": 11815 }, { "epoch": 0.16, "learning_rate": 4.6972038594641247e-05, "loss": 0.6612, "step": 11820 }, { "epoch": 0.16, "learning_rate": 4.6969528116757774e-05, "loss": 0.5398, "step": 11825 }, { "epoch": 0.16, "learning_rate": 4.696701666573411e-05, "loss": 0.6127, "step": 11830 }, { "epoch": 0.16, "learning_rate": 4.696450424168152e-05, "loss": 1.4573, "step": 11835 }, { "epoch": 0.16, "learning_rate": 4.6961990844711265e-05, "loss": 0.4817, "step": 11840 }, { "epoch": 0.16, "learning_rate": 4.695947647493469e-05, "loss": 1.1725, "step": 11845 }, { "epoch": 0.16, "learning_rate": 4.695696113246317e-05, "loss": 0.4965, "step": 11850 }, { "epoch": 0.16, "learning_rate": 4.695444481740812e-05, "loss": 0.7147, "step": 11855 }, { "epoch": 0.16, "learning_rate": 4.6951927529881e-05, "loss": 1.2485, "step": 11860 }, { "epoch": 0.16, "learning_rate": 4.69494092699933e-05, "loss": 1.5091, "step": 11865 }, { "epoch": 0.16, "learning_rate": 4.6946890037856595e-05, "loss": 0.8794, "step": 11870 }, { "epoch": 0.16, "learning_rate": 4.694436983358245e-05, "loss": 0.5897, "step": 11875 }, { "epoch": 0.16, "learning_rate": 4.6941848657282507e-05, "loss": 0.2892, "step": 11880 }, { "epoch": 0.16, "learning_rate": 4.693932650906844e-05, "loss": 0.423, "step": 11885 }, { "epoch": 0.16, "learning_rate": 4.6936803389051966e-05, "loss": 0.667, "step": 11890 }, { "epoch": 0.16, "learning_rate": 4.693427929734485e-05, "loss": 0.1647, "step": 11895 }, { "epoch": 0.16, "learning_rate": 4.69317542340589e-05, "loss": 0.4423, "step": 11900 }, { "epoch": 0.16, "learning_rate": 4.692922819930595e-05, "loss": 0.8466, "step": 11905 }, { "epoch": 0.16, "learning_rate": 4.6926701193197904e-05, "loss": 1.0056, "step": 11910 }, { "epoch": 0.16, "learning_rate": 4.692417321584669e-05, "loss": 0.9829, "step": 11915 }, { "epoch": 0.16, "learning_rate": 4.6921644267364285e-05, "loss": 0.9561, "step": 11920 }, { "epoch": 0.16, "learning_rate": 4.691911434786271e-05, "loss": 0.6149, "step": 11925 }, { "epoch": 0.16, "learning_rate": 4.6916583457454025e-05, "loss": 0.6837, "step": 11930 }, { "epoch": 0.16, "learning_rate": 4.691405159625034e-05, "loss": 1.1159, "step": 11935 }, { "epoch": 0.16, "learning_rate": 4.69115187643638e-05, "loss": 0.9828, "step": 11940 }, { "epoch": 0.16, "learning_rate": 4.6908984961906604e-05, "loss": 0.8798, "step": 11945 }, { "epoch": 0.16, "learning_rate": 4.690695722120539e-05, "loss": 1.024, "step": 11950 }, { "epoch": 0.16, "learning_rate": 4.690442167200386e-05, "loss": 0.4456, "step": 11955 }, { "epoch": 0.16, "learning_rate": 4.690188515254603e-05, "loss": 0.7875, "step": 11960 }, { "epoch": 0.16, "learning_rate": 4.689934766294427e-05, "loss": 0.887, "step": 11965 }, { "epoch": 0.16, "learning_rate": 4.6896809203310966e-05, "loss": 0.3602, "step": 11970 }, { "epoch": 0.16, "learning_rate": 4.689426977375855e-05, "loss": 0.9683, "step": 11975 }, { "epoch": 0.16, "learning_rate": 4.689172937439953e-05, "loss": 0.1873, "step": 11980 }, { "epoch": 0.16, "learning_rate": 4.688918800534641e-05, "loss": 0.5291, "step": 11985 }, { "epoch": 0.16, "learning_rate": 4.688664566671177e-05, "loss": 0.3676, "step": 11990 }, { "epoch": 0.16, "learning_rate": 4.688410235860823e-05, "loss": 0.9044, "step": 11995 }, { "epoch": 0.16, "learning_rate": 4.6881558081148427e-05, "loss": 0.3896, "step": 12000 }, { "epoch": 0.16, "learning_rate": 4.687901283444508e-05, "loss": 0.9752, "step": 12005 }, { "epoch": 0.16, "learning_rate": 4.6876466618610914e-05, "loss": 1.4053, "step": 12010 }, { "epoch": 0.16, "learning_rate": 4.6873919433758725e-05, "loss": 1.0232, "step": 12015 }, { "epoch": 0.16, "learning_rate": 4.6871371280001344e-05, "loss": 1.0489, "step": 12020 }, { "epoch": 0.16, "learning_rate": 4.686882215745162e-05, "loss": 0.5473, "step": 12025 }, { "epoch": 0.16, "learning_rate": 4.686627206622249e-05, "loss": 0.6435, "step": 12030 }, { "epoch": 0.16, "learning_rate": 4.686372100642691e-05, "loss": 0.6418, "step": 12035 }, { "epoch": 0.16, "learning_rate": 4.6861168978177856e-05, "loss": 0.2262, "step": 12040 }, { "epoch": 0.16, "learning_rate": 4.685861598158838e-05, "loss": 0.6707, "step": 12045 }, { "epoch": 0.16, "learning_rate": 4.685606201677159e-05, "loss": 0.6567, "step": 12050 }, { "epoch": 0.16, "learning_rate": 4.685350708384058e-05, "loss": 0.782, "step": 12055 }, { "epoch": 0.16, "learning_rate": 4.685095118290854e-05, "loss": 1.4865, "step": 12060 }, { "epoch": 0.16, "learning_rate": 4.684839431408868e-05, "loss": 1.2122, "step": 12065 }, { "epoch": 0.16, "learning_rate": 4.6845836477494254e-05, "loss": 0.5383, "step": 12070 }, { "epoch": 0.16, "learning_rate": 4.6843277673238574e-05, "loss": 1.0972, "step": 12075 }, { "epoch": 0.16, "learning_rate": 4.684071790143496e-05, "loss": 0.4715, "step": 12080 }, { "epoch": 0.16, "learning_rate": 4.683815716219681e-05, "loss": 0.7425, "step": 12085 }, { "epoch": 0.16, "learning_rate": 4.683559545563755e-05, "loss": 0.768, "step": 12090 }, { "epoch": 0.16, "learning_rate": 4.683303278187065e-05, "loss": 1.1929, "step": 12095 }, { "epoch": 0.16, "learning_rate": 4.6830469141009634e-05, "loss": 1.0675, "step": 12100 }, { "epoch": 0.16, "learning_rate": 4.682790453316804e-05, "loss": 1.361, "step": 12105 }, { "epoch": 0.16, "learning_rate": 4.6825338958459485e-05, "loss": 0.8366, "step": 12110 }, { "epoch": 0.16, "learning_rate": 4.68227724169976e-05, "loss": 0.8037, "step": 12115 }, { "epoch": 0.16, "learning_rate": 4.6820204908896073e-05, "loss": 0.51, "step": 12120 }, { "epoch": 0.16, "learning_rate": 4.6817636434268624e-05, "loss": 0.5793, "step": 12125 }, { "epoch": 0.16, "learning_rate": 4.681506699322904e-05, "loss": 0.5033, "step": 12130 }, { "epoch": 0.16, "learning_rate": 4.681249658589112e-05, "loss": 0.5338, "step": 12135 }, { "epoch": 0.16, "learning_rate": 4.680992521236873e-05, "loss": 0.4118, "step": 12140 }, { "epoch": 0.16, "learning_rate": 4.680735287277576e-05, "loss": 0.7635, "step": 12145 }, { "epoch": 0.16, "learning_rate": 4.680477956722616e-05, "loss": 0.342, "step": 12150 }, { "epoch": 0.16, "learning_rate": 4.680220529583391e-05, "loss": 1.0542, "step": 12155 }, { "epoch": 0.16, "learning_rate": 4.679963005871304e-05, "loss": 0.9692, "step": 12160 }, { "epoch": 0.16, "learning_rate": 4.679705385597762e-05, "loss": 0.1899, "step": 12165 }, { "epoch": 0.16, "learning_rate": 4.6794476687741756e-05, "loss": 0.9283, "step": 12170 }, { "epoch": 0.16, "learning_rate": 4.679189855411962e-05, "loss": 0.672, "step": 12175 }, { "epoch": 0.16, "learning_rate": 4.678931945522539e-05, "loss": 0.9737, "step": 12180 }, { "epoch": 0.16, "learning_rate": 4.678673939117331e-05, "loss": 0.6227, "step": 12185 }, { "epoch": 0.16, "learning_rate": 4.678415836207768e-05, "loss": 0.9507, "step": 12190 }, { "epoch": 0.16, "learning_rate": 4.678157636805282e-05, "loss": 1.1241, "step": 12195 }, { "epoch": 0.16, "learning_rate": 4.677899340921309e-05, "loss": 1.0279, "step": 12200 }, { "epoch": 0.16, "learning_rate": 4.677640948567291e-05, "loss": 1.279, "step": 12205 }, { "epoch": 0.16, "learning_rate": 4.677382459754673e-05, "loss": 1.0877, "step": 12210 }, { "epoch": 0.16, "learning_rate": 4.6771238744949066e-05, "loss": 0.534, "step": 12215 }, { "epoch": 0.16, "learning_rate": 4.6768651927994434e-05, "loss": 0.9342, "step": 12220 }, { "epoch": 0.16, "learning_rate": 4.676606414679743e-05, "loss": 0.793, "step": 12225 }, { "epoch": 0.16, "learning_rate": 4.676347540147267e-05, "loss": 0.779, "step": 12230 }, { "epoch": 0.16, "learning_rate": 4.676088569213483e-05, "loss": 0.6378, "step": 12235 }, { "epoch": 0.16, "learning_rate": 4.675829501889862e-05, "loss": 1.2125, "step": 12240 }, { "epoch": 0.16, "learning_rate": 4.67557033818788e-05, "loss": 0.5785, "step": 12245 }, { "epoch": 0.16, "learning_rate": 4.6753110781190154e-05, "loss": 0.6681, "step": 12250 }, { "epoch": 0.16, "learning_rate": 4.675051721694753e-05, "loss": 0.8711, "step": 12255 }, { "epoch": 0.16, "learning_rate": 4.674792268926581e-05, "loss": 0.663, "step": 12260 }, { "epoch": 0.16, "learning_rate": 4.6745327198259915e-05, "loss": 0.8935, "step": 12265 }, { "epoch": 0.16, "learning_rate": 4.674273074404482e-05, "loss": 1.0768, "step": 12270 }, { "epoch": 0.16, "learning_rate": 4.674013332673552e-05, "loss": 0.835, "step": 12275 }, { "epoch": 0.16, "learning_rate": 4.6737534946447074e-05, "loss": 0.365, "step": 12280 }, { "epoch": 0.16, "learning_rate": 4.673493560329458e-05, "loss": 0.6624, "step": 12285 }, { "epoch": 0.16, "learning_rate": 4.673233529739318e-05, "loss": 0.6389, "step": 12290 }, { "epoch": 0.16, "learning_rate": 4.6729734028858054e-05, "loss": 1.0726, "step": 12295 }, { "epoch": 0.16, "learning_rate": 4.6727131797804416e-05, "loss": 0.4213, "step": 12300 }, { "epoch": 0.16, "learning_rate": 4.672452860434754e-05, "loss": 0.7518, "step": 12305 }, { "epoch": 0.16, "learning_rate": 4.6721924448602726e-05, "loss": 0.9185, "step": 12310 }, { "epoch": 0.17, "learning_rate": 4.671931933068533e-05, "loss": 0.8911, "step": 12315 }, { "epoch": 0.17, "learning_rate": 4.671671325071075e-05, "loss": 0.6617, "step": 12320 }, { "epoch": 0.17, "learning_rate": 4.671410620879441e-05, "loss": 1.2891, "step": 12325 }, { "epoch": 0.17, "learning_rate": 4.6711498205051805e-05, "loss": 0.5566, "step": 12330 }, { "epoch": 0.17, "learning_rate": 4.670888923959845e-05, "loss": 0.2104, "step": 12335 }, { "epoch": 0.17, "learning_rate": 4.6706279312549906e-05, "loss": 0.5424, "step": 12340 }, { "epoch": 0.17, "learning_rate": 4.670366842402178e-05, "loss": 1.2632, "step": 12345 }, { "epoch": 0.17, "learning_rate": 4.670105657412972e-05, "loss": 0.6569, "step": 12350 }, { "epoch": 0.17, "learning_rate": 4.669844376298942e-05, "loss": 1.117, "step": 12355 }, { "epoch": 0.17, "learning_rate": 4.6695829990716624e-05, "loss": 1.2668, "step": 12360 }, { "epoch": 0.17, "learning_rate": 4.669321525742709e-05, "loss": 0.664, "step": 12365 }, { "epoch": 0.17, "learning_rate": 4.669059956323666e-05, "loss": 0.6287, "step": 12370 }, { "epoch": 0.17, "learning_rate": 4.668798290826117e-05, "loss": 0.5492, "step": 12375 }, { "epoch": 0.17, "learning_rate": 4.6685365292616554e-05, "loss": 1.3283, "step": 12380 }, { "epoch": 0.17, "learning_rate": 4.668274671641874e-05, "loss": 0.7913, "step": 12385 }, { "epoch": 0.17, "learning_rate": 4.668012717978371e-05, "loss": 0.9303, "step": 12390 }, { "epoch": 0.17, "learning_rate": 4.6677506682827524e-05, "loss": 0.6117, "step": 12395 }, { "epoch": 0.17, "learning_rate": 4.667488522566623e-05, "loss": 0.658, "step": 12400 }, { "epoch": 0.17, "learning_rate": 4.6672262808415956e-05, "loss": 1.0393, "step": 12405 }, { "epoch": 0.17, "learning_rate": 4.666963943119287e-05, "loss": 0.5362, "step": 12410 }, { "epoch": 0.17, "learning_rate": 4.666701509411316e-05, "loss": 0.7081, "step": 12415 }, { "epoch": 0.17, "learning_rate": 4.666438979729308e-05, "loss": 0.9033, "step": 12420 }, { "epoch": 0.17, "learning_rate": 4.6661763540848914e-05, "loss": 1.0875, "step": 12425 }, { "epoch": 0.17, "learning_rate": 4.6659136324897004e-05, "loss": 0.4264, "step": 12430 }, { "epoch": 0.17, "learning_rate": 4.66565081495537e-05, "loss": 0.3569, "step": 12435 }, { "epoch": 0.17, "learning_rate": 4.6653879014935434e-05, "loss": 0.882, "step": 12440 }, { "epoch": 0.17, "learning_rate": 4.665124892115866e-05, "loss": 0.4113, "step": 12445 }, { "epoch": 0.17, "learning_rate": 4.664861786833987e-05, "loss": 0.6891, "step": 12450 }, { "epoch": 0.17, "learning_rate": 4.6645985856595616e-05, "loss": 1.0638, "step": 12455 }, { "epoch": 0.17, "learning_rate": 4.6643352886042484e-05, "loss": 0.8383, "step": 12460 }, { "epoch": 0.17, "learning_rate": 4.664071895679709e-05, "loss": 0.7372, "step": 12465 }, { "epoch": 0.17, "learning_rate": 4.663808406897612e-05, "loss": 0.1486, "step": 12470 }, { "epoch": 0.17, "learning_rate": 4.6635448222696274e-05, "loss": 1.2106, "step": 12475 }, { "epoch": 0.17, "learning_rate": 4.663281141807431e-05, "loss": 0.8072, "step": 12480 }, { "epoch": 0.17, "learning_rate": 4.6630173655227025e-05, "loss": 1.2409, "step": 12485 }, { "epoch": 0.17, "learning_rate": 4.662753493427127e-05, "loss": 1.6416, "step": 12490 }, { "epoch": 0.17, "learning_rate": 4.66248952553239e-05, "loss": 0.2931, "step": 12495 }, { "epoch": 0.17, "learning_rate": 4.662225461850186e-05, "loss": 0.5317, "step": 12500 }, { "epoch": 0.17, "learning_rate": 4.661961302392213e-05, "loss": 0.1499, "step": 12505 }, { "epoch": 0.17, "learning_rate": 4.661697047170168e-05, "loss": 1.579, "step": 12510 }, { "epoch": 0.17, "learning_rate": 4.6614326961957595e-05, "loss": 0.6083, "step": 12515 }, { "epoch": 0.17, "learning_rate": 4.661168249480695e-05, "loss": 0.6829, "step": 12520 }, { "epoch": 0.17, "learning_rate": 4.66090370703669e-05, "loss": 0.5665, "step": 12525 }, { "epoch": 0.17, "learning_rate": 4.6606390688754617e-05, "loss": 0.8083, "step": 12530 }, { "epoch": 0.17, "learning_rate": 4.6603743350087316e-05, "loss": 0.5652, "step": 12535 }, { "epoch": 0.17, "learning_rate": 4.660109505448226e-05, "loss": 0.7459, "step": 12540 }, { "epoch": 0.17, "learning_rate": 4.6598445802056766e-05, "loss": 0.8913, "step": 12545 }, { "epoch": 0.17, "learning_rate": 4.659579559292817e-05, "loss": 0.7731, "step": 12550 }, { "epoch": 0.17, "learning_rate": 4.6593144427213874e-05, "loss": 1.2302, "step": 12555 }, { "epoch": 0.17, "learning_rate": 4.659049230503131e-05, "loss": 1.2579, "step": 12560 }, { "epoch": 0.17, "learning_rate": 4.658783922649794e-05, "loss": 0.712, "step": 12565 }, { "epoch": 0.17, "learning_rate": 4.658518519173131e-05, "loss": 0.8817, "step": 12570 }, { "epoch": 0.17, "learning_rate": 4.658253020084895e-05, "loss": 0.7088, "step": 12575 }, { "epoch": 0.17, "learning_rate": 4.6579874253968484e-05, "loss": 0.4824, "step": 12580 }, { "epoch": 0.17, "learning_rate": 4.657721735120754e-05, "loss": 0.4775, "step": 12585 }, { "epoch": 0.17, "learning_rate": 4.657455949268382e-05, "loss": 0.9116, "step": 12590 }, { "epoch": 0.17, "learning_rate": 4.6571900678515045e-05, "loss": 0.5638, "step": 12595 }, { "epoch": 0.17, "learning_rate": 4.6569240908819004e-05, "loss": 0.4199, "step": 12600 }, { "epoch": 0.17, "learning_rate": 4.6566580183713485e-05, "loss": 0.5037, "step": 12605 }, { "epoch": 0.17, "learning_rate": 4.656391850331636e-05, "loss": 0.7074, "step": 12610 }, { "epoch": 0.17, "learning_rate": 4.6561255867745526e-05, "loss": 1.1767, "step": 12615 }, { "epoch": 0.17, "learning_rate": 4.655859227711893e-05, "loss": 1.0695, "step": 12620 }, { "epoch": 0.17, "learning_rate": 4.6555927731554547e-05, "loss": 0.586, "step": 12625 }, { "epoch": 0.17, "learning_rate": 4.6553262231170405e-05, "loss": 1.4298, "step": 12630 }, { "epoch": 0.17, "learning_rate": 4.6550595776084574e-05, "loss": 0.7506, "step": 12635 }, { "epoch": 0.17, "learning_rate": 4.654792836641516e-05, "loss": 0.1762, "step": 12640 }, { "epoch": 0.17, "learning_rate": 4.654526000228033e-05, "loss": 0.7795, "step": 12645 }, { "epoch": 0.17, "learning_rate": 4.6542590683798256e-05, "loss": 0.9445, "step": 12650 }, { "epoch": 0.17, "learning_rate": 4.65399204110872e-05, "loss": 0.5661, "step": 12655 }, { "epoch": 0.17, "learning_rate": 4.653724918426543e-05, "loss": 0.7014, "step": 12660 }, { "epoch": 0.17, "learning_rate": 4.653457700345127e-05, "loss": 0.9582, "step": 12665 }, { "epoch": 0.17, "learning_rate": 4.653190386876308e-05, "loss": 0.696, "step": 12670 }, { "epoch": 0.17, "learning_rate": 4.6529229780319265e-05, "loss": 0.9747, "step": 12675 }, { "epoch": 0.17, "learning_rate": 4.6526554738238284e-05, "loss": 0.267, "step": 12680 }, { "epoch": 0.17, "learning_rate": 4.652387874263861e-05, "loss": 0.6697, "step": 12685 }, { "epoch": 0.17, "learning_rate": 4.6521201793638816e-05, "loss": 0.9019, "step": 12690 }, { "epoch": 0.17, "learning_rate": 4.6518523891357424e-05, "loss": 0.9419, "step": 12695 }, { "epoch": 0.17, "learning_rate": 4.651584503591309e-05, "loss": 0.3028, "step": 12700 }, { "epoch": 0.17, "learning_rate": 4.6513165227424455e-05, "loss": 0.7799, "step": 12705 }, { "epoch": 0.17, "learning_rate": 4.651048446601023e-05, "loss": 0.7573, "step": 12710 }, { "epoch": 0.17, "learning_rate": 4.6507802751789155e-05, "loss": 0.4158, "step": 12715 }, { "epoch": 0.17, "learning_rate": 4.650512008488002e-05, "loss": 1.0618, "step": 12720 }, { "epoch": 0.17, "learning_rate": 4.650243646540165e-05, "loss": 0.3953, "step": 12725 }, { "epoch": 0.17, "learning_rate": 4.649975189347292e-05, "loss": 0.8016, "step": 12730 }, { "epoch": 0.17, "learning_rate": 4.649706636921274e-05, "loss": 1.0255, "step": 12735 }, { "epoch": 0.17, "learning_rate": 4.649437989274007e-05, "loss": 1.2339, "step": 12740 }, { "epoch": 0.17, "learning_rate": 4.64916924641739e-05, "loss": 0.3667, "step": 12745 }, { "epoch": 0.17, "learning_rate": 4.648900408363327e-05, "loss": 0.2223, "step": 12750 }, { "epoch": 0.17, "learning_rate": 4.648631475123727e-05, "loss": 0.7048, "step": 12755 }, { "epoch": 0.17, "learning_rate": 4.6483624467105015e-05, "loss": 0.4658, "step": 12760 }, { "epoch": 0.17, "learning_rate": 4.648093323135568e-05, "loss": 0.5817, "step": 12765 }, { "epoch": 0.17, "learning_rate": 4.647824104410846e-05, "loss": 0.4684, "step": 12770 }, { "epoch": 0.17, "learning_rate": 4.647554790548263e-05, "loss": 0.55, "step": 12775 }, { "epoch": 0.17, "learning_rate": 4.647285381559745e-05, "loss": 0.3121, "step": 12780 }, { "epoch": 0.17, "learning_rate": 4.647015877457228e-05, "loss": 0.7024, "step": 12785 }, { "epoch": 0.17, "learning_rate": 4.6467462782526494e-05, "loss": 0.6697, "step": 12790 }, { "epoch": 0.17, "learning_rate": 4.646476583957949e-05, "loss": 0.5003, "step": 12795 }, { "epoch": 0.17, "learning_rate": 4.646206794585076e-05, "loss": 0.2137, "step": 12800 }, { "epoch": 0.17, "learning_rate": 4.645936910145978e-05, "loss": 0.531, "step": 12805 }, { "epoch": 0.17, "learning_rate": 4.6456669306526106e-05, "loss": 0.922, "step": 12810 }, { "epoch": 0.17, "learning_rate": 4.6453968561169335e-05, "loss": 0.6136, "step": 12815 }, { "epoch": 0.17, "learning_rate": 4.645126686550908e-05, "loss": 0.3381, "step": 12820 }, { "epoch": 0.17, "learning_rate": 4.644856421966503e-05, "loss": 1.2706, "step": 12825 }, { "epoch": 0.17, "learning_rate": 4.644586062375688e-05, "loss": 1.0474, "step": 12830 }, { "epoch": 0.17, "learning_rate": 4.6443156077904394e-05, "loss": 0.6312, "step": 12835 }, { "epoch": 0.17, "learning_rate": 4.644045058222737e-05, "loss": 1.284, "step": 12840 }, { "epoch": 0.17, "learning_rate": 4.643774413684565e-05, "loss": 1.0817, "step": 12845 }, { "epoch": 0.17, "learning_rate": 4.6435036741879116e-05, "loss": 0.3759, "step": 12850 }, { "epoch": 0.17, "learning_rate": 4.643232839744769e-05, "loss": 0.7769, "step": 12855 }, { "epoch": 0.17, "learning_rate": 4.642961910367134e-05, "loss": 0.8713, "step": 12860 }, { "epoch": 0.17, "learning_rate": 4.642690886067007e-05, "loss": 0.567, "step": 12865 }, { "epoch": 0.17, "learning_rate": 4.642419766856394e-05, "loss": 0.9766, "step": 12870 }, { "epoch": 0.17, "learning_rate": 4.6421485527473025e-05, "loss": 1.0517, "step": 12875 }, { "epoch": 0.17, "learning_rate": 4.6418772437517474e-05, "loss": 0.7167, "step": 12880 }, { "epoch": 0.17, "learning_rate": 4.6416058398817456e-05, "loss": 1.2484, "step": 12885 }, { "epoch": 0.17, "learning_rate": 4.6413343411493196e-05, "loss": 0.6528, "step": 12890 }, { "epoch": 0.17, "learning_rate": 4.6410627475664944e-05, "loss": 0.9746, "step": 12895 }, { "epoch": 0.17, "learning_rate": 4.640791059145302e-05, "loss": 1.0548, "step": 12900 }, { "epoch": 0.17, "learning_rate": 4.640519275897776e-05, "loss": 0.5903, "step": 12905 }, { "epoch": 0.17, "learning_rate": 4.640247397835953e-05, "loss": 1.007, "step": 12910 }, { "epoch": 0.17, "learning_rate": 4.639975424971879e-05, "loss": 0.6337, "step": 12915 }, { "epoch": 0.17, "learning_rate": 4.639703357317599e-05, "loss": 1.66, "step": 12920 }, { "epoch": 0.17, "learning_rate": 4.639431194885165e-05, "loss": 0.9766, "step": 12925 }, { "epoch": 0.17, "learning_rate": 4.639158937686632e-05, "loss": 0.7997, "step": 12930 }, { "epoch": 0.17, "learning_rate": 4.63888658573406e-05, "loss": 0.8345, "step": 12935 }, { "epoch": 0.17, "learning_rate": 4.638614139039513e-05, "loss": 0.5946, "step": 12940 }, { "epoch": 0.17, "learning_rate": 4.638341597615059e-05, "loss": 0.6638, "step": 12945 }, { "epoch": 0.17, "learning_rate": 4.63806896147277e-05, "loss": 0.8419, "step": 12950 }, { "epoch": 0.17, "learning_rate": 4.637796230624722e-05, "loss": 0.5723, "step": 12955 }, { "epoch": 0.17, "learning_rate": 4.637523405082996e-05, "loss": 0.5237, "step": 12960 }, { "epoch": 0.17, "learning_rate": 4.6372504848596775e-05, "loss": 0.1727, "step": 12965 }, { "epoch": 0.17, "learning_rate": 4.636977469966855e-05, "loss": 0.6477, "step": 12970 }, { "epoch": 0.17, "learning_rate": 4.63670436041662e-05, "loss": 0.662, "step": 12975 }, { "epoch": 0.17, "learning_rate": 4.636431156221073e-05, "loss": 1.2313, "step": 12980 }, { "epoch": 0.17, "learning_rate": 4.636157857392313e-05, "loss": 0.5946, "step": 12985 }, { "epoch": 0.17, "learning_rate": 4.6358844639424475e-05, "loss": 0.7728, "step": 12990 }, { "epoch": 0.17, "learning_rate": 4.635610975883585e-05, "loss": 0.5783, "step": 12995 }, { "epoch": 0.17, "learning_rate": 4.635337393227841e-05, "loss": 1.4554, "step": 13000 }, { "epoch": 0.17, "learning_rate": 4.635063715987333e-05, "loss": 0.2031, "step": 13005 }, { "epoch": 0.17, "learning_rate": 4.634789944174184e-05, "loss": 0.5008, "step": 13010 }, { "epoch": 0.17, "learning_rate": 4.6345160778005205e-05, "loss": 1.4743, "step": 13015 }, { "epoch": 0.17, "learning_rate": 4.6342421168784735e-05, "loss": 0.8591, "step": 13020 }, { "epoch": 0.17, "learning_rate": 4.6339680614201776e-05, "loss": 1.2511, "step": 13025 }, { "epoch": 0.17, "learning_rate": 4.633693911437773e-05, "loss": 1.1588, "step": 13030 }, { "epoch": 0.17, "learning_rate": 4.633419666943402e-05, "loss": 1.3622, "step": 13035 }, { "epoch": 0.17, "learning_rate": 4.6331453279492134e-05, "loss": 0.6777, "step": 13040 }, { "epoch": 0.17, "learning_rate": 4.6328708944673584e-05, "loss": 0.7861, "step": 13045 }, { "epoch": 0.17, "learning_rate": 4.632596366509993e-05, "loss": 0.5241, "step": 13050 }, { "epoch": 0.17, "learning_rate": 4.6323217440892776e-05, "loss": 1.0394, "step": 13055 }, { "epoch": 0.17, "learning_rate": 4.6320470272173766e-05, "loss": 0.3779, "step": 13060 }, { "epoch": 0.18, "learning_rate": 4.6317722159064594e-05, "loss": 0.9405, "step": 13065 }, { "epoch": 0.18, "learning_rate": 4.631497310168697e-05, "loss": 0.9758, "step": 13070 }, { "epoch": 0.18, "learning_rate": 4.631222310016268e-05, "loss": 0.6904, "step": 13075 }, { "epoch": 0.18, "learning_rate": 4.630947215461352e-05, "loss": 0.5894, "step": 13080 }, { "epoch": 0.18, "learning_rate": 4.6306720265161357e-05, "loss": 0.6796, "step": 13085 }, { "epoch": 0.18, "learning_rate": 4.630396743192808e-05, "loss": 0.5004, "step": 13090 }, { "epoch": 0.18, "learning_rate": 4.630121365503562e-05, "loss": 0.244, "step": 13095 }, { "epoch": 0.18, "learning_rate": 4.629845893460597e-05, "loss": 1.3299, "step": 13100 }, { "epoch": 0.18, "learning_rate": 4.629570327076114e-05, "loss": 0.3116, "step": 13105 }, { "epoch": 0.18, "learning_rate": 4.62929466636232e-05, "loss": 0.5522, "step": 13110 }, { "epoch": 0.18, "learning_rate": 4.629018911331424e-05, "loss": 0.7905, "step": 13115 }, { "epoch": 0.18, "learning_rate": 4.628743061995642e-05, "loss": 1.4632, "step": 13120 }, { "epoch": 0.18, "learning_rate": 4.628467118367191e-05, "loss": 1.3437, "step": 13125 }, { "epoch": 0.18, "learning_rate": 4.6281910804582965e-05, "loss": 1.2456, "step": 13130 }, { "epoch": 0.18, "learning_rate": 4.627914948281183e-05, "loss": 0.3127, "step": 13135 }, { "epoch": 0.18, "learning_rate": 4.627638721848083e-05, "loss": 0.5661, "step": 13140 }, { "epoch": 0.18, "learning_rate": 4.627362401171233e-05, "loss": 0.7411, "step": 13145 }, { "epoch": 0.18, "learning_rate": 4.62708598626287e-05, "loss": 1.2937, "step": 13150 }, { "epoch": 0.18, "learning_rate": 4.62680947713524e-05, "loss": 0.9996, "step": 13155 }, { "epoch": 0.18, "learning_rate": 4.62653287380059e-05, "loss": 0.7, "step": 13160 }, { "epoch": 0.18, "learning_rate": 4.6262561762711725e-05, "loss": 0.4241, "step": 13165 }, { "epoch": 0.18, "learning_rate": 4.625979384559244e-05, "loss": 0.7083, "step": 13170 }, { "epoch": 0.18, "learning_rate": 4.625702498677064e-05, "loss": 0.4458, "step": 13175 }, { "epoch": 0.18, "learning_rate": 4.6254255186368985e-05, "loss": 0.4896, "step": 13180 }, { "epoch": 0.18, "learning_rate": 4.625148444451016e-05, "loss": 0.7331, "step": 13185 }, { "epoch": 0.18, "learning_rate": 4.624871276131688e-05, "loss": 0.7423, "step": 13190 }, { "epoch": 0.18, "learning_rate": 4.624594013691194e-05, "loss": 0.4418, "step": 13195 }, { "epoch": 0.18, "learning_rate": 4.624316657141814e-05, "loss": 0.8792, "step": 13200 }, { "epoch": 0.18, "learning_rate": 4.624039206495833e-05, "loss": 1.1821, "step": 13205 }, { "epoch": 0.18, "learning_rate": 4.623761661765542e-05, "loss": 1.1319, "step": 13210 }, { "epoch": 0.18, "learning_rate": 4.623484022963235e-05, "loss": 0.7324, "step": 13215 }, { "epoch": 0.18, "learning_rate": 4.623206290101208e-05, "loss": 0.9034, "step": 13220 }, { "epoch": 0.18, "learning_rate": 4.6229284631917645e-05, "loss": 0.8237, "step": 13225 }, { "epoch": 0.18, "learning_rate": 4.622650542247211e-05, "loss": 0.6984, "step": 13230 }, { "epoch": 0.18, "learning_rate": 4.622372527279858e-05, "loss": 0.4705, "step": 13235 }, { "epoch": 0.18, "learning_rate": 4.62209441830202e-05, "loss": 0.3434, "step": 13240 }, { "epoch": 0.18, "learning_rate": 4.621816215326015e-05, "loss": 0.711, "step": 13245 }, { "epoch": 0.18, "learning_rate": 4.621537918364167e-05, "loss": 0.6912, "step": 13250 }, { "epoch": 0.18, "learning_rate": 4.621259527428804e-05, "loss": 1.4875, "step": 13255 }, { "epoch": 0.18, "learning_rate": 4.620981042532255e-05, "loss": 0.2486, "step": 13260 }, { "epoch": 0.18, "learning_rate": 4.620702463686858e-05, "loss": 0.2033, "step": 13265 }, { "epoch": 0.18, "learning_rate": 4.6204237909049496e-05, "loss": 0.9884, "step": 13270 }, { "epoch": 0.18, "learning_rate": 4.620145024198877e-05, "loss": 1.0656, "step": 13275 }, { "epoch": 0.18, "learning_rate": 4.619866163580986e-05, "loss": 0.6722, "step": 13280 }, { "epoch": 0.18, "learning_rate": 4.619587209063629e-05, "loss": 1.2039, "step": 13285 }, { "epoch": 0.18, "learning_rate": 4.619308160659164e-05, "loss": 1.2649, "step": 13290 }, { "epoch": 0.18, "learning_rate": 4.6190290183799485e-05, "loss": 1.0172, "step": 13295 }, { "epoch": 0.18, "learning_rate": 4.6187497822383485e-05, "loss": 0.5736, "step": 13300 }, { "epoch": 0.18, "learning_rate": 4.618470452246734e-05, "loss": 1.8482, "step": 13305 }, { "epoch": 0.18, "learning_rate": 4.618191028417477e-05, "loss": 1.1588, "step": 13310 }, { "epoch": 0.18, "learning_rate": 4.6179115107629536e-05, "loss": 0.8935, "step": 13315 }, { "epoch": 0.18, "learning_rate": 4.6176318992955456e-05, "loss": 1.0254, "step": 13320 }, { "epoch": 0.18, "learning_rate": 4.617352194027639e-05, "loss": 0.8657, "step": 13325 }, { "epoch": 0.18, "learning_rate": 4.6170723949716235e-05, "loss": 0.4469, "step": 13330 }, { "epoch": 0.18, "learning_rate": 4.6167925021398916e-05, "loss": 0.9791, "step": 13335 }, { "epoch": 0.18, "learning_rate": 4.616512515544842e-05, "loss": 1.2732, "step": 13340 }, { "epoch": 0.18, "learning_rate": 4.616232435198877e-05, "loss": 0.6509, "step": 13345 }, { "epoch": 0.18, "learning_rate": 4.615952261114402e-05, "loss": 0.5573, "step": 13350 }, { "epoch": 0.18, "learning_rate": 4.615671993303827e-05, "loss": 0.6284, "step": 13355 }, { "epoch": 0.18, "learning_rate": 4.615391631779568e-05, "loss": 0.5664, "step": 13360 }, { "epoch": 0.18, "learning_rate": 4.6151111765540425e-05, "loss": 0.5944, "step": 13365 }, { "epoch": 0.18, "learning_rate": 4.6148306276396734e-05, "loss": 0.6937, "step": 13370 }, { "epoch": 0.18, "learning_rate": 4.614549985048887e-05, "loss": 0.1838, "step": 13375 }, { "epoch": 0.18, "learning_rate": 4.6142692487941155e-05, "loss": 0.4727, "step": 13380 }, { "epoch": 0.18, "learning_rate": 4.6139884188877944e-05, "loss": 0.7947, "step": 13385 }, { "epoch": 0.18, "learning_rate": 4.613707495342361e-05, "loss": 0.4572, "step": 13390 }, { "epoch": 0.18, "learning_rate": 4.613426478170261e-05, "loss": 1.1099, "step": 13395 }, { "epoch": 0.18, "learning_rate": 4.613145367383941e-05, "loss": 0.4736, "step": 13400 }, { "epoch": 0.18, "learning_rate": 4.6128641629958525e-05, "loss": 2.2276, "step": 13405 }, { "epoch": 0.18, "learning_rate": 4.6125828650184525e-05, "loss": 1.4006, "step": 13410 }, { "epoch": 0.18, "learning_rate": 4.6123014734642e-05, "loss": 1.227, "step": 13415 }, { "epoch": 0.18, "learning_rate": 4.61201998834556e-05, "loss": 0.5059, "step": 13420 }, { "epoch": 0.18, "learning_rate": 4.6117384096750003e-05, "loss": 0.8636, "step": 13425 }, { "epoch": 0.18, "learning_rate": 4.611456737464994e-05, "loss": 0.4791, "step": 13430 }, { "epoch": 0.18, "learning_rate": 4.611174971728018e-05, "loss": 0.6988, "step": 13435 }, { "epoch": 0.18, "learning_rate": 4.610893112476552e-05, "loss": 1.3564, "step": 13440 }, { "epoch": 0.18, "learning_rate": 4.6106111597230814e-05, "loss": 1.151, "step": 13445 }, { "epoch": 0.18, "learning_rate": 4.610329113480096e-05, "loss": 0.7608, "step": 13450 }, { "epoch": 0.18, "learning_rate": 4.6100469737600883e-05, "loss": 0.3429, "step": 13455 }, { "epoch": 0.18, "learning_rate": 4.609764740575556e-05, "loss": 0.3412, "step": 13460 }, { "epoch": 0.18, "learning_rate": 4.609482413939e-05, "loss": 1.1663, "step": 13465 }, { "epoch": 0.18, "learning_rate": 4.6091999938629277e-05, "loss": 0.4037, "step": 13470 }, { "epoch": 0.18, "learning_rate": 4.608917480359847e-05, "loss": 0.6408, "step": 13475 }, { "epoch": 0.18, "learning_rate": 4.608634873442272e-05, "loss": 0.9766, "step": 13480 }, { "epoch": 0.18, "learning_rate": 4.608352173122722e-05, "loss": 0.9354, "step": 13485 }, { "epoch": 0.18, "learning_rate": 4.608069379413718e-05, "loss": 1.1187, "step": 13490 }, { "epoch": 0.18, "learning_rate": 4.607786492327787e-05, "loss": 0.612, "step": 13495 }, { "epoch": 0.18, "learning_rate": 4.607503511877459e-05, "loss": 0.6058, "step": 13500 }, { "epoch": 0.18, "learning_rate": 4.6072204380752694e-05, "loss": 0.8133, "step": 13505 }, { "epoch": 0.18, "learning_rate": 4.6069372709337564e-05, "loss": 0.8106, "step": 13510 }, { "epoch": 0.18, "learning_rate": 4.606654010465463e-05, "loss": 0.5791, "step": 13515 }, { "epoch": 0.18, "learning_rate": 4.606370656682936e-05, "loss": 1.2481, "step": 13520 }, { "epoch": 0.18, "learning_rate": 4.6060872095987266e-05, "loss": 1.3482, "step": 13525 }, { "epoch": 0.18, "learning_rate": 4.60580366922539e-05, "loss": 0.4452, "step": 13530 }, { "epoch": 0.18, "learning_rate": 4.605520035575487e-05, "loss": 0.7676, "step": 13535 }, { "epoch": 0.18, "learning_rate": 4.605236308661579e-05, "loss": 0.5987, "step": 13540 }, { "epoch": 0.18, "learning_rate": 4.604952488496235e-05, "loss": 0.9509, "step": 13545 }, { "epoch": 0.18, "learning_rate": 4.604668575092027e-05, "loss": 0.9804, "step": 13550 }, { "epoch": 0.18, "learning_rate": 4.604384568461529e-05, "loss": 0.4331, "step": 13555 }, { "epoch": 0.18, "learning_rate": 4.604100468617324e-05, "loss": 0.562, "step": 13560 }, { "epoch": 0.18, "learning_rate": 4.603816275571995e-05, "loss": 0.6704, "step": 13565 }, { "epoch": 0.18, "learning_rate": 4.603531989338129e-05, "loss": 0.7474, "step": 13570 }, { "epoch": 0.18, "learning_rate": 4.6032476099283196e-05, "loss": 0.4902, "step": 13575 }, { "epoch": 0.18, "learning_rate": 4.6029631373551635e-05, "loss": 0.6413, "step": 13580 }, { "epoch": 0.18, "learning_rate": 4.602678571631261e-05, "loss": 0.5501, "step": 13585 }, { "epoch": 0.18, "learning_rate": 4.6023939127692173e-05, "loss": 1.1852, "step": 13590 }, { "epoch": 0.18, "learning_rate": 4.602109160781641e-05, "loss": 1.1965, "step": 13595 }, { "epoch": 0.18, "learning_rate": 4.601824315681146e-05, "loss": 0.6098, "step": 13600 }, { "epoch": 0.18, "learning_rate": 4.601539377480348e-05, "loss": 0.7346, "step": 13605 }, { "epoch": 0.18, "learning_rate": 4.60125434619187e-05, "loss": 0.9876, "step": 13610 }, { "epoch": 0.18, "learning_rate": 4.600969221828337e-05, "loss": 0.4229, "step": 13615 }, { "epoch": 0.18, "learning_rate": 4.600684004402378e-05, "loss": 0.4305, "step": 13620 }, { "epoch": 0.18, "learning_rate": 4.600398693926627e-05, "loss": 0.6589, "step": 13625 }, { "epoch": 0.18, "learning_rate": 4.6001132904137215e-05, "loss": 0.5071, "step": 13630 }, { "epoch": 0.18, "learning_rate": 4.599827793876304e-05, "loss": 1.2795, "step": 13635 }, { "epoch": 0.18, "learning_rate": 4.59954220432702e-05, "loss": 0.668, "step": 13640 }, { "epoch": 0.18, "learning_rate": 4.5992565217785196e-05, "loss": 0.8412, "step": 13645 }, { "epoch": 0.18, "learning_rate": 4.598970746243459e-05, "loss": 0.3823, "step": 13650 }, { "epoch": 0.18, "learning_rate": 4.598684877734494e-05, "loss": 0.5009, "step": 13655 }, { "epoch": 0.18, "learning_rate": 4.598398916264289e-05, "loss": 0.572, "step": 13660 }, { "epoch": 0.18, "learning_rate": 4.598112861845509e-05, "loss": 0.6788, "step": 13665 }, { "epoch": 0.18, "learning_rate": 4.597826714490827e-05, "loss": 0.3199, "step": 13670 }, { "epoch": 0.18, "learning_rate": 4.5975404742129155e-05, "loss": 0.8458, "step": 13675 }, { "epoch": 0.18, "learning_rate": 4.597254141024456e-05, "loss": 0.6381, "step": 13680 }, { "epoch": 0.18, "learning_rate": 4.596967714938129e-05, "loss": 1.5563, "step": 13685 }, { "epoch": 0.18, "learning_rate": 4.596681195966624e-05, "loss": 0.5971, "step": 13690 }, { "epoch": 0.18, "learning_rate": 4.596394584122631e-05, "loss": 1.36, "step": 13695 }, { "epoch": 0.18, "learning_rate": 4.596107879418845e-05, "loss": 0.364, "step": 13700 }, { "epoch": 0.18, "learning_rate": 4.5958210818679675e-05, "loss": 0.8758, "step": 13705 }, { "epoch": 0.18, "learning_rate": 4.595534191482701e-05, "loss": 0.6704, "step": 13710 }, { "epoch": 0.18, "learning_rate": 4.595247208275753e-05, "loss": 0.6088, "step": 13715 }, { "epoch": 0.18, "learning_rate": 4.594960132259836e-05, "loss": 0.582, "step": 13720 }, { "epoch": 0.18, "learning_rate": 4.594672963447666e-05, "loss": 0.1835, "step": 13725 }, { "epoch": 0.18, "learning_rate": 4.594385701851963e-05, "loss": 0.9911, "step": 13730 }, { "epoch": 0.18, "learning_rate": 4.594098347485452e-05, "loss": 0.555, "step": 13735 }, { "epoch": 0.18, "learning_rate": 4.5938109003608595e-05, "loss": 0.8049, "step": 13740 }, { "epoch": 0.18, "learning_rate": 4.59352336049092e-05, "loss": 0.4782, "step": 13745 }, { "epoch": 0.18, "learning_rate": 4.5932357278883684e-05, "loss": 1.2912, "step": 13750 }, { "epoch": 0.18, "learning_rate": 4.592948002565947e-05, "loss": 1.5407, "step": 13755 }, { "epoch": 0.18, "learning_rate": 4.592660184536399e-05, "loss": 0.7843, "step": 13760 }, { "epoch": 0.18, "learning_rate": 4.592372273812475e-05, "loss": 0.5546, "step": 13765 }, { "epoch": 0.18, "learning_rate": 4.592084270406927e-05, "loss": 0.7925, "step": 13770 }, { "epoch": 0.18, "learning_rate": 4.591796174332511e-05, "loss": 1.0635, "step": 13775 }, { "epoch": 0.18, "learning_rate": 4.5915079856019905e-05, "loss": 1.2646, "step": 13780 }, { "epoch": 0.18, "learning_rate": 4.591219704228129e-05, "loss": 1.2944, "step": 13785 }, { "epoch": 0.18, "learning_rate": 4.590931330223697e-05, "loss": 1.561, "step": 13790 }, { "epoch": 0.18, "learning_rate": 4.590642863601467e-05, "loss": 0.4118, "step": 13795 }, { "epoch": 0.18, "learning_rate": 4.5903543043742194e-05, "loss": 0.6498, "step": 13800 }, { "epoch": 0.18, "learning_rate": 4.590065652554732e-05, "loss": 0.9006, "step": 13805 }, { "epoch": 0.19, "learning_rate": 4.589776908155793e-05, "loss": 0.6969, "step": 13810 }, { "epoch": 0.19, "learning_rate": 4.589488071190191e-05, "loss": 0.6714, "step": 13815 }, { "epoch": 0.19, "learning_rate": 4.589199141670722e-05, "loss": 0.9817, "step": 13820 }, { "epoch": 0.19, "learning_rate": 4.5889101196101826e-05, "loss": 0.9778, "step": 13825 }, { "epoch": 0.19, "learning_rate": 4.5886210050213755e-05, "loss": 0.4388, "step": 13830 }, { "epoch": 0.19, "learning_rate": 4.588331797917106e-05, "loss": 0.8128, "step": 13835 }, { "epoch": 0.19, "learning_rate": 4.5880424983101866e-05, "loss": 0.7553, "step": 13840 }, { "epoch": 0.19, "learning_rate": 4.58775310621343e-05, "loss": 0.6685, "step": 13845 }, { "epoch": 0.19, "learning_rate": 4.587463621639656e-05, "loss": 0.8006, "step": 13850 }, { "epoch": 0.19, "learning_rate": 4.5871740446016866e-05, "loss": 1.3575, "step": 13855 }, { "epoch": 0.19, "learning_rate": 4.586884375112348e-05, "loss": 0.586, "step": 13860 }, { "epoch": 0.19, "learning_rate": 4.586594613184473e-05, "loss": 0.7046, "step": 13865 }, { "epoch": 0.19, "learning_rate": 4.586304758830895e-05, "loss": 1.1134, "step": 13870 }, { "epoch": 0.19, "learning_rate": 4.586014812064454e-05, "loss": 0.6912, "step": 13875 }, { "epoch": 0.19, "learning_rate": 4.5857247728979926e-05, "loss": 1.0933, "step": 13880 }, { "epoch": 0.19, "learning_rate": 4.585434641344358e-05, "loss": 0.79, "step": 13885 }, { "epoch": 0.19, "learning_rate": 4.585144417416403e-05, "loss": 0.7743, "step": 13890 }, { "epoch": 0.19, "learning_rate": 4.5848541011269806e-05, "loss": 1.5712, "step": 13895 }, { "epoch": 0.19, "learning_rate": 4.5845636924889524e-05, "loss": 0.2003, "step": 13900 }, { "epoch": 0.19, "learning_rate": 4.584273191515182e-05, "loss": 0.7495, "step": 13905 }, { "epoch": 0.19, "learning_rate": 4.583982598218535e-05, "loss": 0.6801, "step": 13910 }, { "epoch": 0.19, "learning_rate": 4.583691912611886e-05, "loss": 0.5045, "step": 13915 }, { "epoch": 0.19, "learning_rate": 4.583401134708109e-05, "loss": 1.1784, "step": 13920 }, { "epoch": 0.19, "learning_rate": 4.5831102645200854e-05, "loss": 1.1538, "step": 13925 }, { "epoch": 0.19, "learning_rate": 4.582819302060698e-05, "loss": 0.8408, "step": 13930 }, { "epoch": 0.19, "learning_rate": 4.582528247342835e-05, "loss": 0.7348, "step": 13935 }, { "epoch": 0.19, "learning_rate": 4.58223710037939e-05, "loss": 0.5944, "step": 13940 }, { "epoch": 0.19, "learning_rate": 4.581945861183258e-05, "loss": 0.7709, "step": 13945 }, { "epoch": 0.19, "learning_rate": 4.5816545297673406e-05, "loss": 1.2936, "step": 13950 }, { "epoch": 0.19, "learning_rate": 4.581363106144542e-05, "loss": 0.649, "step": 13955 }, { "epoch": 0.19, "learning_rate": 4.581071590327769e-05, "loss": 0.4065, "step": 13960 }, { "epoch": 0.19, "learning_rate": 4.580779982329937e-05, "loss": 0.5196, "step": 13965 }, { "epoch": 0.19, "learning_rate": 4.5804882821639614e-05, "loss": 0.4359, "step": 13970 }, { "epoch": 0.19, "learning_rate": 4.5801964898427635e-05, "loss": 0.7308, "step": 13975 }, { "epoch": 0.19, "learning_rate": 4.5799046053792676e-05, "loss": 0.3825, "step": 13980 }, { "epoch": 0.19, "learning_rate": 4.579612628786403e-05, "loss": 1.2404, "step": 13985 }, { "epoch": 0.19, "learning_rate": 4.579320560077104e-05, "loss": 1.509, "step": 13990 }, { "epoch": 0.19, "learning_rate": 4.5790283992643055e-05, "loss": 1.0061, "step": 13995 }, { "epoch": 0.19, "learning_rate": 4.57873614636095e-05, "loss": 0.4341, "step": 14000 }, { "epoch": 0.19, "learning_rate": 4.578443801379983e-05, "loss": 0.9833, "step": 14005 }, { "epoch": 0.19, "learning_rate": 4.5781513643343544e-05, "loss": 0.4704, "step": 14010 }, { "epoch": 0.19, "learning_rate": 4.577858835237017e-05, "loss": 0.3411, "step": 14015 }, { "epoch": 0.19, "learning_rate": 4.5775662141009273e-05, "loss": 0.7438, "step": 14020 }, { "epoch": 0.19, "learning_rate": 4.577273500939049e-05, "loss": 0.4194, "step": 14025 }, { "epoch": 0.19, "learning_rate": 4.576980695764346e-05, "loss": 0.5737, "step": 14030 }, { "epoch": 0.19, "learning_rate": 4.5766877985897894e-05, "loss": 0.818, "step": 14035 }, { "epoch": 0.19, "learning_rate": 4.576394809428353e-05, "loss": 0.6711, "step": 14040 }, { "epoch": 0.19, "learning_rate": 4.5761017282930144e-05, "loss": 0.997, "step": 14045 }, { "epoch": 0.19, "learning_rate": 4.5758085551967554e-05, "loss": 0.736, "step": 14050 }, { "epoch": 0.19, "learning_rate": 4.575515290152562e-05, "loss": 0.3033, "step": 14055 }, { "epoch": 0.19, "learning_rate": 4.575221933173426e-05, "loss": 0.9445, "step": 14060 }, { "epoch": 0.19, "learning_rate": 4.574928484272339e-05, "loss": 0.8746, "step": 14065 }, { "epoch": 0.19, "learning_rate": 4.5746349434623014e-05, "loss": 0.6076, "step": 14070 }, { "epoch": 0.19, "learning_rate": 4.5743413107563144e-05, "loss": 0.9588, "step": 14075 }, { "epoch": 0.19, "learning_rate": 4.574047586167385e-05, "loss": 1.1822, "step": 14080 }, { "epoch": 0.19, "learning_rate": 4.573753769708524e-05, "loss": 0.5702, "step": 14085 }, { "epoch": 0.19, "learning_rate": 4.573459861392746e-05, "loss": 0.2937, "step": 14090 }, { "epoch": 0.19, "learning_rate": 4.573165861233069e-05, "loss": 0.9546, "step": 14095 }, { "epoch": 0.19, "learning_rate": 4.5728717692425156e-05, "loss": 0.7121, "step": 14100 }, { "epoch": 0.19, "learning_rate": 4.5725775854341134e-05, "loss": 0.9317, "step": 14105 }, { "epoch": 0.19, "learning_rate": 4.572283309820893e-05, "loss": 0.9515, "step": 14110 }, { "epoch": 0.19, "learning_rate": 4.571988942415889e-05, "loss": 0.7628, "step": 14115 }, { "epoch": 0.19, "learning_rate": 4.5716944832321404e-05, "loss": 0.618, "step": 14120 }, { "epoch": 0.19, "learning_rate": 4.5713999322826916e-05, "loss": 1.053, "step": 14125 }, { "epoch": 0.19, "learning_rate": 4.571105289580588e-05, "loss": 0.6214, "step": 14130 }, { "epoch": 0.19, "learning_rate": 4.570810555138882e-05, "loss": 1.0088, "step": 14135 }, { "epoch": 0.19, "learning_rate": 4.570515728970628e-05, "loss": 0.328, "step": 14140 }, { "epoch": 0.19, "learning_rate": 4.570220811088886e-05, "loss": 1.0372, "step": 14145 }, { "epoch": 0.19, "learning_rate": 4.569925801506718e-05, "loss": 0.6943, "step": 14150 }, { "epoch": 0.19, "learning_rate": 4.5696307002371934e-05, "loss": 0.591, "step": 14155 }, { "epoch": 0.19, "learning_rate": 4.569335507293382e-05, "loss": 0.653, "step": 14160 }, { "epoch": 0.19, "learning_rate": 4.5690402226883614e-05, "loss": 0.8624, "step": 14165 }, { "epoch": 0.19, "learning_rate": 4.56874484643521e-05, "loss": 1.4963, "step": 14170 }, { "epoch": 0.19, "learning_rate": 4.5684493785470105e-05, "loss": 0.7467, "step": 14175 }, { "epoch": 0.19, "learning_rate": 4.5681538190368524e-05, "loss": 1.2953, "step": 14180 }, { "epoch": 0.19, "learning_rate": 4.567858167917826e-05, "loss": 0.1397, "step": 14185 }, { "epoch": 0.19, "learning_rate": 4.567562425203029e-05, "loss": 0.7994, "step": 14190 }, { "epoch": 0.19, "learning_rate": 4.567266590905559e-05, "loss": 0.6985, "step": 14195 }, { "epoch": 0.19, "learning_rate": 4.5669706650385227e-05, "loss": 0.4495, "step": 14200 }, { "epoch": 0.19, "learning_rate": 4.5666746476150254e-05, "loss": 0.1981, "step": 14205 }, { "epoch": 0.19, "learning_rate": 4.566378538648181e-05, "loss": 0.9353, "step": 14210 }, { "epoch": 0.19, "learning_rate": 4.566082338151105e-05, "loss": 0.5835, "step": 14215 }, { "epoch": 0.19, "learning_rate": 4.5657860461369176e-05, "loss": 0.4881, "step": 14220 }, { "epoch": 0.19, "learning_rate": 4.565548946642067e-05, "loss": 0.5836, "step": 14225 }, { "epoch": 0.19, "learning_rate": 4.565252489930155e-05, "loss": 1.4356, "step": 14230 }, { "epoch": 0.19, "learning_rate": 4.5649559417378905e-05, "loss": 0.7744, "step": 14235 }, { "epoch": 0.19, "learning_rate": 4.564659302078408e-05, "loss": 0.7864, "step": 14240 }, { "epoch": 0.19, "learning_rate": 4.564362570964847e-05, "loss": 0.7042, "step": 14245 }, { "epoch": 0.19, "learning_rate": 4.5640657484103535e-05, "loss": 0.9638, "step": 14250 }, { "epoch": 0.19, "learning_rate": 4.5637688344280715e-05, "loss": 0.9064, "step": 14255 }, { "epoch": 0.19, "learning_rate": 4.5634718290311565e-05, "loss": 0.7537, "step": 14260 }, { "epoch": 0.19, "learning_rate": 4.5631747322327615e-05, "loss": 0.7493, "step": 14265 }, { "epoch": 0.19, "learning_rate": 4.562877544046048e-05, "loss": 1.7855, "step": 14270 }, { "epoch": 0.19, "learning_rate": 4.56258026448418e-05, "loss": 0.4999, "step": 14275 }, { "epoch": 0.19, "learning_rate": 4.562282893560325e-05, "loss": 0.561, "step": 14280 }, { "epoch": 0.19, "learning_rate": 4.561985431287654e-05, "loss": 0.7022, "step": 14285 }, { "epoch": 0.19, "learning_rate": 4.5616878776793445e-05, "loss": 0.9849, "step": 14290 }, { "epoch": 0.19, "learning_rate": 4.5613902327485766e-05, "loss": 0.3251, "step": 14295 }, { "epoch": 0.19, "learning_rate": 4.561092496508535e-05, "loss": 0.5838, "step": 14300 }, { "epoch": 0.19, "learning_rate": 4.560794668972407e-05, "loss": 0.4488, "step": 14305 }, { "epoch": 0.19, "learning_rate": 4.560496750153384e-05, "loss": 0.5132, "step": 14310 }, { "epoch": 0.19, "learning_rate": 4.560198740064664e-05, "loss": 0.8225, "step": 14315 }, { "epoch": 0.19, "learning_rate": 4.5599006387194466e-05, "loss": 1.1273, "step": 14320 }, { "epoch": 0.19, "learning_rate": 4.559602446130936e-05, "loss": 0.4345, "step": 14325 }, { "epoch": 0.19, "learning_rate": 4.5593041623123414e-05, "loss": 1.6583, "step": 14330 }, { "epoch": 0.19, "learning_rate": 4.559005787276874e-05, "loss": 1.2889, "step": 14335 }, { "epoch": 0.19, "learning_rate": 4.5587073210377514e-05, "loss": 0.7112, "step": 14340 }, { "epoch": 0.19, "learning_rate": 4.558408763608194e-05, "loss": 0.5495, "step": 14345 }, { "epoch": 0.19, "learning_rate": 4.558110115001426e-05, "loss": 0.3485, "step": 14350 }, { "epoch": 0.19, "learning_rate": 4.5578113752306765e-05, "loss": 0.6939, "step": 14355 }, { "epoch": 0.19, "learning_rate": 4.557512544309178e-05, "loss": 0.7419, "step": 14360 }, { "epoch": 0.19, "learning_rate": 4.557213622250167e-05, "loss": 0.8604, "step": 14365 }, { "epoch": 0.19, "learning_rate": 4.556914609066885e-05, "loss": 1.3456, "step": 14370 }, { "epoch": 0.19, "learning_rate": 4.556615504772576e-05, "loss": 0.9493, "step": 14375 }, { "epoch": 0.19, "learning_rate": 4.556316309380489e-05, "loss": 0.8359, "step": 14380 }, { "epoch": 0.19, "learning_rate": 4.556017022903877e-05, "loss": 1.0775, "step": 14385 }, { "epoch": 0.19, "learning_rate": 4.5557176453559966e-05, "loss": 0.5147, "step": 14390 }, { "epoch": 0.19, "learning_rate": 4.555418176750109e-05, "loss": 0.8104, "step": 14395 }, { "epoch": 0.19, "learning_rate": 4.555118617099479e-05, "loss": 1.1449, "step": 14400 }, { "epoch": 0.19, "learning_rate": 4.5548189664173755e-05, "loss": 0.3518, "step": 14405 }, { "epoch": 0.19, "learning_rate": 4.554519224717073e-05, "loss": 0.5145, "step": 14410 }, { "epoch": 0.19, "learning_rate": 4.554219392011846e-05, "loss": 0.3994, "step": 14415 }, { "epoch": 0.19, "learning_rate": 4.5539194683149775e-05, "loss": 0.1813, "step": 14420 }, { "epoch": 0.19, "learning_rate": 4.5536194536397515e-05, "loss": 1.5593, "step": 14425 }, { "epoch": 0.19, "learning_rate": 4.553319347999458e-05, "loss": 1.3112, "step": 14430 }, { "epoch": 0.19, "learning_rate": 4.553019151407389e-05, "loss": 0.2851, "step": 14435 }, { "epoch": 0.19, "learning_rate": 4.552718863876844e-05, "loss": 0.7389, "step": 14440 }, { "epoch": 0.19, "learning_rate": 4.5524184854211216e-05, "loss": 0.5712, "step": 14445 }, { "epoch": 0.19, "learning_rate": 4.552118016053529e-05, "loss": 0.3326, "step": 14450 }, { "epoch": 0.19, "learning_rate": 4.551817455787374e-05, "loss": 0.8624, "step": 14455 }, { "epoch": 0.19, "learning_rate": 4.551516804635971e-05, "loss": 0.713, "step": 14460 }, { "epoch": 0.19, "learning_rate": 4.551216062612637e-05, "loss": 0.6249, "step": 14465 }, { "epoch": 0.19, "learning_rate": 4.5509152297306935e-05, "loss": 1.0909, "step": 14470 }, { "epoch": 0.19, "learning_rate": 4.550614306003465e-05, "loss": 0.5801, "step": 14475 }, { "epoch": 0.19, "learning_rate": 4.550313291444283e-05, "loss": 0.8084, "step": 14480 }, { "epoch": 0.19, "learning_rate": 4.5500121860664776e-05, "loss": 0.9832, "step": 14485 }, { "epoch": 0.19, "learning_rate": 4.54971098988339e-05, "loss": 0.4703, "step": 14490 }, { "epoch": 0.19, "learning_rate": 4.5494097029083595e-05, "loss": 1.2995, "step": 14495 }, { "epoch": 0.19, "learning_rate": 4.549108325154732e-05, "loss": 0.9241, "step": 14500 }, { "epoch": 0.19, "learning_rate": 4.5488068566358566e-05, "loss": 0.3002, "step": 14505 }, { "epoch": 0.19, "learning_rate": 4.548505297365087e-05, "loss": 0.2603, "step": 14510 }, { "epoch": 0.19, "learning_rate": 4.548203647355782e-05, "loss": 0.4805, "step": 14515 }, { "epoch": 0.19, "learning_rate": 4.547901906621302e-05, "loss": 0.5598, "step": 14520 }, { "epoch": 0.19, "learning_rate": 4.5476000751750126e-05, "loss": 1.2359, "step": 14525 }, { "epoch": 0.19, "learning_rate": 4.547298153030284e-05, "loss": 0.992, "step": 14530 }, { "epoch": 0.19, "learning_rate": 4.546996140200489e-05, "loss": 0.8876, "step": 14535 }, { "epoch": 0.19, "learning_rate": 4.546694036699006e-05, "loss": 1.1075, "step": 14540 }, { "epoch": 0.19, "learning_rate": 4.546391842539217e-05, "loss": 0.7793, "step": 14545 }, { "epoch": 0.19, "learning_rate": 4.546089557734507e-05, "loss": 0.248, "step": 14550 }, { "epoch": 0.2, "learning_rate": 4.545787182298266e-05, "loss": 0.4955, "step": 14555 }, { "epoch": 0.2, "learning_rate": 4.545484716243887e-05, "loss": 0.3746, "step": 14560 }, { "epoch": 0.2, "learning_rate": 4.5451821595847686e-05, "loss": 0.878, "step": 14565 }, { "epoch": 0.2, "learning_rate": 4.544879512334312e-05, "loss": 0.6054, "step": 14570 }, { "epoch": 0.2, "learning_rate": 4.5445767745059234e-05, "loss": 0.8131, "step": 14575 }, { "epoch": 0.2, "learning_rate": 4.544273946113012e-05, "loss": 0.6505, "step": 14580 }, { "epoch": 0.2, "learning_rate": 4.543971027168993e-05, "loss": 0.4443, "step": 14585 }, { "epoch": 0.2, "learning_rate": 4.543668017687282e-05, "loss": 1.4024, "step": 14590 }, { "epoch": 0.2, "learning_rate": 4.543364917681303e-05, "loss": 0.902, "step": 14595 }, { "epoch": 0.2, "learning_rate": 4.5430617271644806e-05, "loss": 0.5431, "step": 14600 }, { "epoch": 0.2, "learning_rate": 4.542758446150244e-05, "loss": 0.9085, "step": 14605 }, { "epoch": 0.2, "learning_rate": 4.5424550746520286e-05, "loss": 1.0691, "step": 14610 }, { "epoch": 0.2, "learning_rate": 4.542151612683271e-05, "loss": 0.7161, "step": 14615 }, { "epoch": 0.2, "learning_rate": 4.541848060257414e-05, "loss": 0.4904, "step": 14620 }, { "epoch": 0.2, "learning_rate": 4.5415444173879024e-05, "loss": 1.0111, "step": 14625 }, { "epoch": 0.2, "learning_rate": 4.541240684088187e-05, "loss": 0.8713, "step": 14630 }, { "epoch": 0.2, "learning_rate": 4.540936860371721e-05, "loss": 0.5312, "step": 14635 }, { "epoch": 0.2, "learning_rate": 4.540632946251963e-05, "loss": 0.951, "step": 14640 }, { "epoch": 0.2, "learning_rate": 4.540328941742374e-05, "loss": 1.2207, "step": 14645 }, { "epoch": 0.2, "learning_rate": 4.540024846856421e-05, "loss": 1.0532, "step": 14650 }, { "epoch": 0.2, "learning_rate": 4.539720661607573e-05, "loss": 0.9931, "step": 14655 }, { "epoch": 0.2, "learning_rate": 4.5394163860093035e-05, "loss": 0.927, "step": 14660 }, { "epoch": 0.2, "learning_rate": 4.5391120200750916e-05, "loss": 0.9679, "step": 14665 }, { "epoch": 0.2, "learning_rate": 4.538807563818418e-05, "loss": 0.8307, "step": 14670 }, { "epoch": 0.2, "learning_rate": 4.53850301725277e-05, "loss": 1.2087, "step": 14675 }, { "epoch": 0.2, "learning_rate": 4.5381983803916355e-05, "loss": 0.4409, "step": 14680 }, { "epoch": 0.2, "learning_rate": 4.5378936532485106e-05, "loss": 1.2046, "step": 14685 }, { "epoch": 0.2, "learning_rate": 4.5375888358368914e-05, "loss": 0.2511, "step": 14690 }, { "epoch": 0.2, "learning_rate": 4.53728392817028e-05, "loss": 0.3749, "step": 14695 }, { "epoch": 0.2, "learning_rate": 4.536978930262184e-05, "loss": 0.7088, "step": 14700 }, { "epoch": 0.2, "learning_rate": 4.536673842126112e-05, "loss": 0.8267, "step": 14705 }, { "epoch": 0.2, "learning_rate": 4.5363686637755774e-05, "loss": 0.4977, "step": 14710 }, { "epoch": 0.2, "learning_rate": 4.5360633952240996e-05, "loss": 0.9509, "step": 14715 }, { "epoch": 0.2, "learning_rate": 4.535758036485198e-05, "loss": 0.903, "step": 14720 }, { "epoch": 0.2, "learning_rate": 4.535452587572401e-05, "loss": 1.0293, "step": 14725 }, { "epoch": 0.2, "learning_rate": 4.5351470484992376e-05, "loss": 0.9387, "step": 14730 }, { "epoch": 0.2, "learning_rate": 4.53484141927924e-05, "loss": 1.0991, "step": 14735 }, { "epoch": 0.2, "learning_rate": 4.5345356999259494e-05, "loss": 0.8871, "step": 14740 }, { "epoch": 0.2, "learning_rate": 4.5342298904529045e-05, "loss": 0.3899, "step": 14745 }, { "epoch": 0.2, "learning_rate": 4.533923990873653e-05, "loss": 0.6049, "step": 14750 }, { "epoch": 0.2, "learning_rate": 4.533618001201744e-05, "loss": 0.4461, "step": 14755 }, { "epoch": 0.2, "learning_rate": 4.5333119214507306e-05, "loss": 1.091, "step": 14760 }, { "epoch": 0.2, "learning_rate": 4.533005751634172e-05, "loss": 0.6745, "step": 14765 }, { "epoch": 0.2, "learning_rate": 4.5326994917656296e-05, "loss": 0.3092, "step": 14770 }, { "epoch": 0.2, "learning_rate": 4.532393141858669e-05, "loss": 0.7487, "step": 14775 }, { "epoch": 0.2, "learning_rate": 4.5320867019268595e-05, "loss": 0.8244, "step": 14780 }, { "epoch": 0.2, "learning_rate": 4.531780171983776e-05, "loss": 0.6707, "step": 14785 }, { "epoch": 0.2, "learning_rate": 4.531473552042995e-05, "loss": 2.0487, "step": 14790 }, { "epoch": 0.2, "learning_rate": 4.5311668421180995e-05, "loss": 0.8277, "step": 14795 }, { "epoch": 0.2, "learning_rate": 4.5308600422226736e-05, "loss": 0.6854, "step": 14800 }, { "epoch": 0.2, "learning_rate": 4.530553152370308e-05, "loss": 1.1655, "step": 14805 }, { "epoch": 0.2, "learning_rate": 4.530246172574597e-05, "loss": 0.5875, "step": 14810 }, { "epoch": 0.2, "learning_rate": 4.5299391028491374e-05, "loss": 1.1003, "step": 14815 }, { "epoch": 0.2, "learning_rate": 4.529631943207531e-05, "loss": 0.6487, "step": 14820 }, { "epoch": 0.2, "learning_rate": 4.529324693663383e-05, "loss": 0.5208, "step": 14825 }, { "epoch": 0.2, "learning_rate": 4.529017354230304e-05, "loss": 0.6733, "step": 14830 }, { "epoch": 0.2, "learning_rate": 4.528709924921907e-05, "loss": 1.0024, "step": 14835 }, { "epoch": 0.2, "learning_rate": 4.5284024057518085e-05, "loss": 0.6416, "step": 14840 }, { "epoch": 0.2, "learning_rate": 4.5280947967336316e-05, "loss": 0.6439, "step": 14845 }, { "epoch": 0.2, "learning_rate": 4.527787097881003e-05, "loss": 0.7553, "step": 14850 }, { "epoch": 0.2, "learning_rate": 4.527479309207549e-05, "loss": 0.4533, "step": 14855 }, { "epoch": 0.2, "learning_rate": 4.5271714307269056e-05, "loss": 0.6862, "step": 14860 }, { "epoch": 0.2, "learning_rate": 4.52686346245271e-05, "loss": 0.9095, "step": 14865 }, { "epoch": 0.2, "learning_rate": 4.526555404398601e-05, "loss": 0.7529, "step": 14870 }, { "epoch": 0.2, "learning_rate": 4.526247256578228e-05, "loss": 1.081, "step": 14875 }, { "epoch": 0.2, "learning_rate": 4.5259390190052376e-05, "loss": 0.7424, "step": 14880 }, { "epoch": 0.2, "learning_rate": 4.525630691693284e-05, "loss": 0.5804, "step": 14885 }, { "epoch": 0.2, "learning_rate": 4.525322274656026e-05, "loss": 0.6492, "step": 14890 }, { "epoch": 0.2, "learning_rate": 4.5250137679071223e-05, "loss": 0.5241, "step": 14895 }, { "epoch": 0.2, "learning_rate": 4.5247051714602404e-05, "loss": 0.4515, "step": 14900 }, { "epoch": 0.2, "learning_rate": 4.524396485329048e-05, "loss": 1.1368, "step": 14905 }, { "epoch": 0.2, "learning_rate": 4.524087709527219e-05, "loss": 1.3259, "step": 14910 }, { "epoch": 0.2, "learning_rate": 4.5237788440684317e-05, "loss": 0.4861, "step": 14915 }, { "epoch": 0.2, "learning_rate": 4.523469888966365e-05, "loss": 1.1418, "step": 14920 }, { "epoch": 0.2, "learning_rate": 4.523160844234706e-05, "loss": 0.8653, "step": 14925 }, { "epoch": 0.2, "learning_rate": 4.522851709887143e-05, "loss": 0.8564, "step": 14930 }, { "epoch": 0.2, "learning_rate": 4.522542485937369e-05, "loss": 1.1363, "step": 14935 }, { "epoch": 0.2, "learning_rate": 4.5222331723990814e-05, "loss": 0.4073, "step": 14940 }, { "epoch": 0.2, "learning_rate": 4.521923769285981e-05, "loss": 0.8011, "step": 14945 }, { "epoch": 0.2, "learning_rate": 4.521614276611774e-05, "loss": 0.639, "step": 14950 }, { "epoch": 0.2, "learning_rate": 4.521304694390167e-05, "loss": 0.8468, "step": 14955 }, { "epoch": 0.2, "learning_rate": 4.520995022634875e-05, "loss": 0.7858, "step": 14960 }, { "epoch": 0.2, "learning_rate": 4.520685261359614e-05, "loss": 1.0908, "step": 14965 }, { "epoch": 0.2, "learning_rate": 4.520375410578106e-05, "loss": 0.3786, "step": 14970 }, { "epoch": 0.2, "learning_rate": 4.520065470304074e-05, "loss": 0.768, "step": 14975 }, { "epoch": 0.2, "learning_rate": 4.519755440551248e-05, "loss": 1.4481, "step": 14980 }, { "epoch": 0.2, "learning_rate": 4.51944532133336e-05, "loss": 0.7942, "step": 14985 }, { "epoch": 0.2, "learning_rate": 4.5191351126641476e-05, "loss": 0.9493, "step": 14990 }, { "epoch": 0.2, "learning_rate": 4.518824814557352e-05, "loss": 0.7031, "step": 14995 }, { "epoch": 0.2, "learning_rate": 4.5185144270267155e-05, "loss": 0.4496, "step": 15000 }, { "epoch": 0.2, "learning_rate": 4.5182039500859894e-05, "loss": 0.5582, "step": 15005 }, { "epoch": 0.2, "learning_rate": 4.517893383748924e-05, "loss": 0.6622, "step": 15010 }, { "epoch": 0.2, "learning_rate": 4.517582728029278e-05, "loss": 0.7996, "step": 15015 }, { "epoch": 0.2, "learning_rate": 4.51727198294081e-05, "loss": 0.7093, "step": 15020 }, { "epoch": 0.2, "learning_rate": 4.516961148497285e-05, "loss": 0.7797, "step": 15025 }, { "epoch": 0.2, "learning_rate": 4.516650224712473e-05, "loss": 0.7865, "step": 15030 }, { "epoch": 0.2, "learning_rate": 4.516339211600143e-05, "loss": 0.4436, "step": 15035 }, { "epoch": 0.2, "learning_rate": 4.516028109174075e-05, "loss": 1.47, "step": 15040 }, { "epoch": 0.2, "learning_rate": 4.5157169174480476e-05, "loss": 0.4248, "step": 15045 }, { "epoch": 0.2, "learning_rate": 4.515405636435844e-05, "loss": 1.0409, "step": 15050 }, { "epoch": 0.2, "learning_rate": 4.515094266151255e-05, "loss": 1.0565, "step": 15055 }, { "epoch": 0.2, "learning_rate": 4.51478280660807e-05, "loss": 0.7247, "step": 15060 }, { "epoch": 0.2, "learning_rate": 4.5144712578200866e-05, "loss": 0.5318, "step": 15065 }, { "epoch": 0.2, "learning_rate": 4.514159619801105e-05, "loss": 0.7138, "step": 15070 }, { "epoch": 0.2, "learning_rate": 4.513847892564928e-05, "loss": 0.8176, "step": 15075 }, { "epoch": 0.2, "learning_rate": 4.513536076125365e-05, "loss": 1.2685, "step": 15080 }, { "epoch": 0.2, "learning_rate": 4.5132241704962266e-05, "loss": 0.9256, "step": 15085 }, { "epoch": 0.2, "learning_rate": 4.5129121756913296e-05, "loss": 0.9111, "step": 15090 }, { "epoch": 0.2, "learning_rate": 4.512600091724494e-05, "loss": 1.082, "step": 15095 }, { "epoch": 0.2, "learning_rate": 4.5122879186095426e-05, "loss": 1.3532, "step": 15100 }, { "epoch": 0.2, "learning_rate": 4.511975656360303e-05, "loss": 0.4885, "step": 15105 }, { "epoch": 0.2, "learning_rate": 4.511663304990608e-05, "loss": 0.485, "step": 15110 }, { "epoch": 0.2, "learning_rate": 4.511350864514292e-05, "loss": 0.5999, "step": 15115 }, { "epoch": 0.2, "learning_rate": 4.511038334945197e-05, "loss": 0.6006, "step": 15120 }, { "epoch": 0.2, "learning_rate": 4.510725716297163e-05, "loss": 0.6764, "step": 15125 }, { "epoch": 0.2, "learning_rate": 4.510413008584039e-05, "loss": 0.3215, "step": 15130 }, { "epoch": 0.2, "learning_rate": 4.510100211819678e-05, "loss": 0.5175, "step": 15135 }, { "epoch": 0.2, "learning_rate": 4.509787326017932e-05, "loss": 1.3509, "step": 15140 }, { "epoch": 0.2, "learning_rate": 4.5094743511926626e-05, "loss": 0.3794, "step": 15145 }, { "epoch": 0.2, "learning_rate": 4.509161287357734e-05, "loss": 0.9836, "step": 15150 }, { "epoch": 0.2, "learning_rate": 4.5088481345270106e-05, "loss": 0.4954, "step": 15155 }, { "epoch": 0.2, "learning_rate": 4.508534892714365e-05, "loss": 0.4553, "step": 15160 }, { "epoch": 0.2, "learning_rate": 4.508221561933672e-05, "loss": 0.8731, "step": 15165 }, { "epoch": 0.2, "learning_rate": 4.50790814219881e-05, "loss": 0.4922, "step": 15170 }, { "epoch": 0.2, "learning_rate": 4.507594633523663e-05, "loss": 0.8416, "step": 15175 }, { "epoch": 0.2, "learning_rate": 4.5072810359221185e-05, "loss": 0.4411, "step": 15180 }, { "epoch": 0.2, "learning_rate": 4.5069673494080646e-05, "loss": 0.4622, "step": 15185 }, { "epoch": 0.2, "learning_rate": 4.5066535739953985e-05, "loss": 0.6284, "step": 15190 }, { "epoch": 0.2, "learning_rate": 4.506339709698018e-05, "loss": 0.6619, "step": 15195 }, { "epoch": 0.2, "learning_rate": 4.506025756529826e-05, "loss": 0.4603, "step": 15200 }, { "epoch": 0.2, "learning_rate": 4.505711714504728e-05, "loss": 1.4014, "step": 15205 }, { "epoch": 0.2, "learning_rate": 4.505397583636636e-05, "loss": 0.2935, "step": 15210 }, { "epoch": 0.2, "learning_rate": 4.505083363939464e-05, "loss": 1.2458, "step": 15215 }, { "epoch": 0.2, "learning_rate": 4.5047690554271295e-05, "loss": 0.5605, "step": 15220 }, { "epoch": 0.2, "learning_rate": 4.5044546581135554e-05, "loss": 0.7611, "step": 15225 }, { "epoch": 0.2, "learning_rate": 4.5041401720126685e-05, "loss": 1.4991, "step": 15230 }, { "epoch": 0.2, "learning_rate": 4.503825597138398e-05, "loss": 0.6877, "step": 15235 }, { "epoch": 0.2, "learning_rate": 4.503510933504678e-05, "loss": 0.8282, "step": 15240 }, { "epoch": 0.2, "learning_rate": 4.503196181125447e-05, "loss": 1.6741, "step": 15245 }, { "epoch": 0.2, "learning_rate": 4.5028813400146476e-05, "loss": 0.9444, "step": 15250 }, { "epoch": 0.2, "learning_rate": 4.5025664101862244e-05, "loss": 0.9185, "step": 15255 }, { "epoch": 0.2, "learning_rate": 4.502251391654128e-05, "loss": 0.9019, "step": 15260 }, { "epoch": 0.2, "learning_rate": 4.5019362844323107e-05, "loss": 0.2846, "step": 15265 }, { "epoch": 0.2, "learning_rate": 4.501621088534732e-05, "loss": 0.3701, "step": 15270 }, { "epoch": 0.2, "learning_rate": 4.5013058039753536e-05, "loss": 0.6199, "step": 15275 }, { "epoch": 0.2, "learning_rate": 4.500990430768139e-05, "loss": 0.3217, "step": 15280 }, { "epoch": 0.2, "learning_rate": 4.500674968927061e-05, "loss": 1.2058, "step": 15285 }, { "epoch": 0.2, "learning_rate": 4.5003594184660895e-05, "loss": 0.7786, "step": 15290 }, { "epoch": 0.2, "learning_rate": 4.5000437793992034e-05, "loss": 0.7481, "step": 15295 }, { "epoch": 0.2, "learning_rate": 4.499728051740384e-05, "loss": 0.8081, "step": 15300 }, { "epoch": 0.21, "learning_rate": 4.499412235503616e-05, "loss": 0.2455, "step": 15305 }, { "epoch": 0.21, "learning_rate": 4.4990963307028886e-05, "loss": 0.6767, "step": 15310 }, { "epoch": 0.21, "learning_rate": 4.498780337352195e-05, "loss": 0.6922, "step": 15315 }, { "epoch": 0.21, "learning_rate": 4.498464255465533e-05, "loss": 0.4338, "step": 15320 }, { "epoch": 0.21, "learning_rate": 4.498148085056901e-05, "loss": 0.5865, "step": 15325 }, { "epoch": 0.21, "learning_rate": 4.497831826140306e-05, "loss": 0.8072, "step": 15330 }, { "epoch": 0.21, "learning_rate": 4.4975154787297565e-05, "loss": 0.5173, "step": 15335 }, { "epoch": 0.21, "learning_rate": 4.497199042839264e-05, "loss": 0.7919, "step": 15340 }, { "epoch": 0.21, "learning_rate": 4.4968825184828454e-05, "loss": 0.9477, "step": 15345 }, { "epoch": 0.21, "learning_rate": 4.4965659056745214e-05, "loss": 0.7418, "step": 15350 }, { "epoch": 0.21, "learning_rate": 4.496249204428316e-05, "loss": 0.9969, "step": 15355 }, { "epoch": 0.21, "learning_rate": 4.495932414758258e-05, "loss": 1.0321, "step": 15360 }, { "epoch": 0.21, "learning_rate": 4.49561553667838e-05, "loss": 0.4034, "step": 15365 }, { "epoch": 0.21, "learning_rate": 4.495298570202716e-05, "loss": 0.6045, "step": 15370 }, { "epoch": 0.21, "learning_rate": 4.494981515345309e-05, "loss": 1.089, "step": 15375 }, { "epoch": 0.21, "learning_rate": 4.494664372120201e-05, "loss": 0.5011, "step": 15380 }, { "epoch": 0.21, "learning_rate": 4.49434714054144e-05, "loss": 1.1007, "step": 15385 }, { "epoch": 0.21, "learning_rate": 4.494029820623078e-05, "loss": 0.5664, "step": 15390 }, { "epoch": 0.21, "learning_rate": 4.493712412379171e-05, "loss": 0.5734, "step": 15395 }, { "epoch": 0.21, "learning_rate": 4.493394915823779e-05, "loss": 1.287, "step": 15400 }, { "epoch": 0.21, "learning_rate": 4.493077330970964e-05, "loss": 0.9043, "step": 15405 }, { "epoch": 0.21, "learning_rate": 4.492759657834794e-05, "loss": 0.4827, "step": 15410 }, { "epoch": 0.21, "learning_rate": 4.492441896429341e-05, "loss": 0.5567, "step": 15415 }, { "epoch": 0.21, "learning_rate": 4.492124046768681e-05, "loss": 0.6398, "step": 15420 }, { "epoch": 0.21, "learning_rate": 4.4918061088668906e-05, "loss": 0.8698, "step": 15425 }, { "epoch": 0.21, "learning_rate": 4.491488082738055e-05, "loss": 0.7955, "step": 15430 }, { "epoch": 0.21, "learning_rate": 4.49116996839626e-05, "loss": 0.7695, "step": 15435 }, { "epoch": 0.21, "learning_rate": 4.490851765855597e-05, "loss": 0.436, "step": 15440 }, { "epoch": 0.21, "learning_rate": 4.490533475130161e-05, "loss": 0.4736, "step": 15445 }, { "epoch": 0.21, "learning_rate": 4.49021509623405e-05, "loss": 0.1419, "step": 15450 }, { "epoch": 0.21, "learning_rate": 4.489896629181367e-05, "loss": 1.2868, "step": 15455 }, { "epoch": 0.21, "learning_rate": 4.489578073986218e-05, "loss": 0.8855, "step": 15460 }, { "epoch": 0.21, "learning_rate": 4.489259430662715e-05, "loss": 0.7092, "step": 15465 }, { "epoch": 0.21, "learning_rate": 4.4889406992249706e-05, "loss": 0.2406, "step": 15470 }, { "epoch": 0.21, "learning_rate": 4.488621879687103e-05, "loss": 0.3113, "step": 15475 }, { "epoch": 0.21, "learning_rate": 4.488302972063236e-05, "loss": 0.6926, "step": 15480 }, { "epoch": 0.21, "learning_rate": 4.4879839763674934e-05, "loss": 0.5444, "step": 15485 }, { "epoch": 0.21, "learning_rate": 4.487664892614007e-05, "loss": 1.2118, "step": 15490 }, { "epoch": 0.21, "learning_rate": 4.48734572081691e-05, "loss": 0.4382, "step": 15495 }, { "epoch": 0.21, "learning_rate": 4.487026460990339e-05, "loss": 0.8273, "step": 15500 }, { "epoch": 0.21, "learning_rate": 4.486707113148437e-05, "loss": 0.4626, "step": 15505 }, { "epoch": 0.21, "learning_rate": 4.48638767730535e-05, "loss": 1.1271, "step": 15510 }, { "epoch": 0.21, "learning_rate": 4.486068153475225e-05, "loss": 1.1857, "step": 15515 }, { "epoch": 0.21, "learning_rate": 4.485748541672218e-05, "loss": 1.0611, "step": 15520 }, { "epoch": 0.21, "learning_rate": 4.485428841910484e-05, "loss": 1.3626, "step": 15525 }, { "epoch": 0.21, "learning_rate": 4.4851090542041856e-05, "loss": 0.1662, "step": 15530 }, { "epoch": 0.21, "learning_rate": 4.484789178567488e-05, "loss": 1.2181, "step": 15535 }, { "epoch": 0.21, "learning_rate": 4.484469215014558e-05, "loss": 0.7812, "step": 15540 }, { "epoch": 0.21, "learning_rate": 4.4841491635595705e-05, "loss": 0.2887, "step": 15545 }, { "epoch": 0.21, "learning_rate": 4.483829024216701e-05, "loss": 0.4269, "step": 15550 }, { "epoch": 0.21, "learning_rate": 4.483508797000131e-05, "loss": 1.0119, "step": 15555 }, { "epoch": 0.21, "learning_rate": 4.4831884819240444e-05, "loss": 1.2295, "step": 15560 }, { "epoch": 0.21, "learning_rate": 4.4828680790026293e-05, "loss": 0.9327, "step": 15565 }, { "epoch": 0.21, "learning_rate": 4.482547588250079e-05, "loss": 0.4663, "step": 15570 }, { "epoch": 0.21, "learning_rate": 4.482227009680588e-05, "loss": 0.9207, "step": 15575 }, { "epoch": 0.21, "learning_rate": 4.481906343308357e-05, "loss": 0.778, "step": 15580 }, { "epoch": 0.21, "learning_rate": 4.4815855891475915e-05, "loss": 0.6855, "step": 15585 }, { "epoch": 0.21, "learning_rate": 4.481264747212498e-05, "loss": 0.7318, "step": 15590 }, { "epoch": 0.21, "learning_rate": 4.480943817517287e-05, "loss": 0.6333, "step": 15595 }, { "epoch": 0.21, "learning_rate": 4.4806228000761755e-05, "loss": 0.3865, "step": 15600 }, { "epoch": 0.21, "learning_rate": 4.480301694903383e-05, "loss": 0.5956, "step": 15605 }, { "epoch": 0.21, "learning_rate": 4.479980502013132e-05, "loss": 0.5576, "step": 15610 }, { "epoch": 0.21, "learning_rate": 4.479659221419651e-05, "loss": 0.4362, "step": 15615 }, { "epoch": 0.21, "learning_rate": 4.4793378531371696e-05, "loss": 0.5401, "step": 15620 }, { "epoch": 0.21, "learning_rate": 4.479016397179925e-05, "loss": 0.9102, "step": 15625 }, { "epoch": 0.21, "learning_rate": 4.4786948535621536e-05, "loss": 0.6168, "step": 15630 }, { "epoch": 0.21, "learning_rate": 4.4783732222980993e-05, "loss": 0.7033, "step": 15635 }, { "epoch": 0.21, "learning_rate": 4.478051503402009e-05, "loss": 0.6686, "step": 15640 }, { "epoch": 0.21, "learning_rate": 4.477729696888133e-05, "loss": 0.7361, "step": 15645 }, { "epoch": 0.21, "learning_rate": 4.4774078027707256e-05, "loss": 1.0751, "step": 15650 }, { "epoch": 0.21, "learning_rate": 4.477085821064045e-05, "loss": 1.0183, "step": 15655 }, { "epoch": 0.21, "learning_rate": 4.4767637517823546e-05, "loss": 1.2056, "step": 15660 }, { "epoch": 0.21, "learning_rate": 4.4764415949399185e-05, "loss": 0.5005, "step": 15665 }, { "epoch": 0.21, "learning_rate": 4.476119350551008e-05, "loss": 0.3177, "step": 15670 }, { "epoch": 0.21, "learning_rate": 4.475797018629896e-05, "loss": 1.0138, "step": 15675 }, { "epoch": 0.21, "learning_rate": 4.4754745991908605e-05, "loss": 0.3521, "step": 15680 }, { "epoch": 0.21, "learning_rate": 4.4751520922481846e-05, "loss": 1.1953, "step": 15685 }, { "epoch": 0.21, "learning_rate": 4.474829497816151e-05, "loss": 1.4224, "step": 15690 }, { "epoch": 0.21, "learning_rate": 4.4745068159090506e-05, "loss": 0.6991, "step": 15695 }, { "epoch": 0.21, "learning_rate": 4.474184046541177e-05, "loss": 0.3599, "step": 15700 }, { "epoch": 0.21, "learning_rate": 4.4738611897268265e-05, "loss": 0.752, "step": 15705 }, { "epoch": 0.21, "learning_rate": 4.4735382454803e-05, "loss": 0.9566, "step": 15710 }, { "epoch": 0.21, "learning_rate": 4.473215213815902e-05, "loss": 0.7253, "step": 15715 }, { "epoch": 0.21, "learning_rate": 4.4728920947479426e-05, "loss": 0.7946, "step": 15720 }, { "epoch": 0.21, "learning_rate": 4.472568888290733e-05, "loss": 0.7455, "step": 15725 }, { "epoch": 0.21, "learning_rate": 4.472245594458591e-05, "loss": 0.5897, "step": 15730 }, { "epoch": 0.21, "learning_rate": 4.471922213265835e-05, "loss": 0.7691, "step": 15735 }, { "epoch": 0.21, "learning_rate": 4.47159874472679e-05, "loss": 0.6987, "step": 15740 }, { "epoch": 0.21, "learning_rate": 4.4712751888557846e-05, "loss": 0.9502, "step": 15745 }, { "epoch": 0.21, "learning_rate": 4.47095154566715e-05, "loss": 1.1784, "step": 15750 }, { "epoch": 0.21, "learning_rate": 4.470627815175223e-05, "loss": 1.5017, "step": 15755 }, { "epoch": 0.21, "learning_rate": 4.470303997394342e-05, "loss": 0.1549, "step": 15760 }, { "epoch": 0.21, "learning_rate": 4.469980092338851e-05, "loss": 0.5994, "step": 15765 }, { "epoch": 0.21, "learning_rate": 4.469656100023098e-05, "loss": 1.2348, "step": 15770 }, { "epoch": 0.21, "learning_rate": 4.469332020461433e-05, "loss": 0.9684, "step": 15775 }, { "epoch": 0.21, "learning_rate": 4.469007853668212e-05, "loss": 1.1518, "step": 15780 }, { "epoch": 0.21, "learning_rate": 4.468683599657794e-05, "loss": 0.7375, "step": 15785 }, { "epoch": 0.21, "learning_rate": 4.4683592584445414e-05, "loss": 0.7283, "step": 15790 }, { "epoch": 0.21, "learning_rate": 4.468034830042821e-05, "loss": 0.7422, "step": 15795 }, { "epoch": 0.21, "learning_rate": 4.467710314467003e-05, "loss": 0.9713, "step": 15800 }, { "epoch": 0.21, "learning_rate": 4.467385711731462e-05, "loss": 1.1408, "step": 15805 }, { "epoch": 0.21, "learning_rate": 4.4670610218505775e-05, "loss": 1.0537, "step": 15810 }, { "epoch": 0.21, "learning_rate": 4.466736244838731e-05, "loss": 0.7138, "step": 15815 }, { "epoch": 0.21, "learning_rate": 4.466411380710307e-05, "loss": 1.2561, "step": 15820 }, { "epoch": 0.21, "learning_rate": 4.466086429479697e-05, "loss": 0.6558, "step": 15825 }, { "epoch": 0.21, "learning_rate": 4.465761391161293e-05, "loss": 0.5846, "step": 15830 }, { "epoch": 0.21, "learning_rate": 4.465436265769495e-05, "loss": 1.0302, "step": 15835 }, { "epoch": 0.21, "learning_rate": 4.465111053318703e-05, "loss": 0.4802, "step": 15840 }, { "epoch": 0.21, "learning_rate": 4.464785753823322e-05, "loss": 0.8332, "step": 15845 }, { "epoch": 0.21, "learning_rate": 4.464460367297762e-05, "loss": 0.5919, "step": 15850 }, { "epoch": 0.21, "learning_rate": 4.464134893756436e-05, "loss": 0.7233, "step": 15855 }, { "epoch": 0.21, "learning_rate": 4.46380933321376e-05, "loss": 0.4503, "step": 15860 }, { "epoch": 0.21, "learning_rate": 4.4634836856841555e-05, "loss": 0.6906, "step": 15865 }, { "epoch": 0.21, "learning_rate": 4.463157951182046e-05, "loss": 0.3532, "step": 15870 }, { "epoch": 0.21, "learning_rate": 4.4628321297218615e-05, "loss": 0.2849, "step": 15875 }, { "epoch": 0.21, "learning_rate": 4.462506221318033e-05, "loss": 0.9067, "step": 15880 }, { "epoch": 0.21, "learning_rate": 4.462180225984997e-05, "loss": 1.1045, "step": 15885 }, { "epoch": 0.21, "learning_rate": 4.461854143737194e-05, "loss": 0.7564, "step": 15890 }, { "epoch": 0.21, "learning_rate": 4.4615279745890656e-05, "loss": 0.7854, "step": 15895 }, { "epoch": 0.21, "learning_rate": 4.461201718555062e-05, "loss": 0.7783, "step": 15900 }, { "epoch": 0.21, "learning_rate": 4.460875375649635e-05, "loss": 0.7912, "step": 15905 }, { "epoch": 0.21, "learning_rate": 4.4605489458872376e-05, "loss": 0.4024, "step": 15910 }, { "epoch": 0.21, "learning_rate": 4.4602224292823305e-05, "loss": 0.4775, "step": 15915 }, { "epoch": 0.21, "learning_rate": 4.459895825849377e-05, "loss": 0.5464, "step": 15920 }, { "epoch": 0.21, "learning_rate": 4.459569135602843e-05, "loss": 1.0582, "step": 15925 }, { "epoch": 0.21, "learning_rate": 4.4592423585571996e-05, "loss": 0.3691, "step": 15930 }, { "epoch": 0.21, "learning_rate": 4.458915494726922e-05, "loss": 0.3974, "step": 15935 }, { "epoch": 0.21, "learning_rate": 4.458588544126487e-05, "loss": 0.9062, "step": 15940 }, { "epoch": 0.21, "learning_rate": 4.4582615067703794e-05, "loss": 0.7866, "step": 15945 }, { "epoch": 0.21, "learning_rate": 4.457934382673083e-05, "loss": 0.8666, "step": 15950 }, { "epoch": 0.21, "learning_rate": 4.457607171849089e-05, "loss": 0.9613, "step": 15955 }, { "epoch": 0.21, "learning_rate": 4.457279874312891e-05, "loss": 0.8252, "step": 15960 }, { "epoch": 0.21, "learning_rate": 4.456952490078986e-05, "loss": 0.8249, "step": 15965 }, { "epoch": 0.21, "learning_rate": 4.4566250191618765e-05, "loss": 1.0184, "step": 15970 }, { "epoch": 0.21, "learning_rate": 4.456297461576068e-05, "loss": 1.2609, "step": 15975 }, { "epoch": 0.21, "learning_rate": 4.4559698173360676e-05, "loss": 1.0142, "step": 15980 }, { "epoch": 0.21, "learning_rate": 4.455642086456391e-05, "loss": 0.6197, "step": 15985 }, { "epoch": 0.21, "learning_rate": 4.455314268951552e-05, "loss": 0.536, "step": 15990 }, { "epoch": 0.21, "learning_rate": 4.454986364836074e-05, "loss": 0.2093, "step": 15995 }, { "epoch": 0.21, "learning_rate": 4.454658374124481e-05, "loss": 0.5247, "step": 16000 }, { "epoch": 0.21, "learning_rate": 4.4543302968313005e-05, "loss": 0.6272, "step": 16005 }, { "epoch": 0.21, "learning_rate": 4.454002132971065e-05, "loss": 0.688, "step": 16010 }, { "epoch": 0.21, "learning_rate": 4.453673882558311e-05, "loss": 1.0652, "step": 16015 }, { "epoch": 0.21, "learning_rate": 4.4533455456075776e-05, "loss": 1.6326, "step": 16020 }, { "epoch": 0.21, "learning_rate": 4.453017122133409e-05, "loss": 0.7918, "step": 16025 }, { "epoch": 0.21, "learning_rate": 4.452688612150352e-05, "loss": 0.7861, "step": 16030 }, { "epoch": 0.21, "learning_rate": 4.4523600156729584e-05, "loss": 1.2545, "step": 16035 }, { "epoch": 0.21, "learning_rate": 4.452031332715784e-05, "loss": 1.3703, "step": 16040 }, { "epoch": 0.21, "learning_rate": 4.451702563293387e-05, "loss": 0.3448, "step": 16045 }, { "epoch": 0.22, "learning_rate": 4.451373707420331e-05, "loss": 0.4775, "step": 16050 }, { "epoch": 0.22, "learning_rate": 4.451044765111182e-05, "loss": 0.4627, "step": 16055 }, { "epoch": 0.22, "learning_rate": 4.45071573638051e-05, "loss": 0.3306, "step": 16060 }, { "epoch": 0.22, "learning_rate": 4.4503866212428904e-05, "loss": 0.6368, "step": 16065 }, { "epoch": 0.22, "learning_rate": 4.450057419712901e-05, "loss": 0.5365, "step": 16070 }, { "epoch": 0.22, "learning_rate": 4.4497281318051236e-05, "loss": 0.6118, "step": 16075 }, { "epoch": 0.22, "learning_rate": 4.4493987575341447e-05, "loss": 0.535, "step": 16080 }, { "epoch": 0.22, "learning_rate": 4.449069296914553e-05, "loss": 1.2247, "step": 16085 }, { "epoch": 0.22, "learning_rate": 4.4487397499609416e-05, "loss": 0.3995, "step": 16090 }, { "epoch": 0.22, "learning_rate": 4.4484101166879097e-05, "loss": 1.0037, "step": 16095 }, { "epoch": 0.22, "learning_rate": 4.4480803971100564e-05, "loss": 0.5037, "step": 16100 }, { "epoch": 0.22, "learning_rate": 4.447750591241988e-05, "loss": 0.2647, "step": 16105 }, { "epoch": 0.22, "learning_rate": 4.4474206990983125e-05, "loss": 0.6166, "step": 16110 }, { "epoch": 0.22, "learning_rate": 4.447090720693643e-05, "loss": 0.3635, "step": 16115 }, { "epoch": 0.22, "learning_rate": 4.4467606560425943e-05, "loss": 0.6967, "step": 16120 }, { "epoch": 0.22, "learning_rate": 4.4464305051597894e-05, "loss": 0.9609, "step": 16125 }, { "epoch": 0.22, "learning_rate": 4.44610026805985e-05, "loss": 1.0944, "step": 16130 }, { "epoch": 0.22, "learning_rate": 4.4457699447574056e-05, "loss": 0.5438, "step": 16135 }, { "epoch": 0.22, "learning_rate": 4.445439535267086e-05, "loss": 0.8048, "step": 16140 }, { "epoch": 0.22, "learning_rate": 4.445109039603528e-05, "loss": 0.7781, "step": 16145 }, { "epoch": 0.22, "learning_rate": 4.444778457781371e-05, "loss": 0.4673, "step": 16150 }, { "epoch": 0.22, "learning_rate": 4.444447789815257e-05, "loss": 0.821, "step": 16155 }, { "epoch": 0.22, "learning_rate": 4.444117035719835e-05, "loss": 1.2544, "step": 16160 }, { "epoch": 0.22, "learning_rate": 4.443786195509753e-05, "loss": 0.2771, "step": 16165 }, { "epoch": 0.22, "learning_rate": 4.443455269199668e-05, "loss": 0.679, "step": 16170 }, { "epoch": 0.22, "learning_rate": 4.443124256804236e-05, "loss": 0.427, "step": 16175 }, { "epoch": 0.22, "learning_rate": 4.4427931583381223e-05, "loss": 0.8322, "step": 16180 }, { "epoch": 0.22, "learning_rate": 4.44246197381599e-05, "loss": 1.748, "step": 16185 }, { "epoch": 0.22, "learning_rate": 4.44213070325251e-05, "loss": 0.5883, "step": 16190 }, { "epoch": 0.22, "learning_rate": 4.441799346662357e-05, "loss": 0.7671, "step": 16195 }, { "epoch": 0.22, "learning_rate": 4.4414679040602066e-05, "loss": 0.5161, "step": 16200 }, { "epoch": 0.22, "learning_rate": 4.4411363754607414e-05, "loss": 0.8463, "step": 16205 }, { "epoch": 0.22, "learning_rate": 4.440804760878646e-05, "loss": 1.0345, "step": 16210 }, { "epoch": 0.22, "learning_rate": 4.440473060328609e-05, "loss": 0.7761, "step": 16215 }, { "epoch": 0.22, "learning_rate": 4.440141273825323e-05, "loss": 0.6392, "step": 16220 }, { "epoch": 0.22, "learning_rate": 4.4398094013834855e-05, "loss": 0.5274, "step": 16225 }, { "epoch": 0.22, "learning_rate": 4.4394774430177953e-05, "loss": 0.5278, "step": 16230 }, { "epoch": 0.22, "learning_rate": 4.439145398742958e-05, "loss": 1.0112, "step": 16235 }, { "epoch": 0.22, "learning_rate": 4.4388132685736804e-05, "loss": 0.5874, "step": 16240 }, { "epoch": 0.22, "learning_rate": 4.438481052524675e-05, "loss": 0.5517, "step": 16245 }, { "epoch": 0.22, "learning_rate": 4.438148750610657e-05, "loss": 0.8237, "step": 16250 }, { "epoch": 0.22, "learning_rate": 4.437816362846345e-05, "loss": 0.9046, "step": 16255 }, { "epoch": 0.22, "learning_rate": 4.437483889246463e-05, "loss": 0.6384, "step": 16260 }, { "epoch": 0.22, "learning_rate": 4.437151329825737e-05, "loss": 0.4651, "step": 16265 }, { "epoch": 0.22, "learning_rate": 4.436818684598899e-05, "loss": 0.6566, "step": 16270 }, { "epoch": 0.22, "learning_rate": 4.4364859535806826e-05, "loss": 0.1717, "step": 16275 }, { "epoch": 0.22, "learning_rate": 4.436153136785827e-05, "loss": 1.1772, "step": 16280 }, { "epoch": 0.22, "learning_rate": 4.435820234229073e-05, "loss": 0.5973, "step": 16285 }, { "epoch": 0.22, "learning_rate": 4.435487245925167e-05, "loss": 0.2354, "step": 16290 }, { "epoch": 0.22, "learning_rate": 4.4351541718888595e-05, "loss": 0.7333, "step": 16295 }, { "epoch": 0.22, "learning_rate": 4.4348210121349034e-05, "loss": 0.4763, "step": 16300 }, { "epoch": 0.22, "learning_rate": 4.434487766678056e-05, "loss": 0.4738, "step": 16305 }, { "epoch": 0.22, "learning_rate": 4.434154435533079e-05, "loss": 0.8983, "step": 16310 }, { "epoch": 0.22, "learning_rate": 4.433821018714736e-05, "loss": 0.8976, "step": 16315 }, { "epoch": 0.22, "learning_rate": 4.4334875162377964e-05, "loss": 1.1985, "step": 16320 }, { "epoch": 0.22, "learning_rate": 4.433153928117034e-05, "loss": 0.955, "step": 16325 }, { "epoch": 0.22, "learning_rate": 4.432820254367222e-05, "loss": 0.6763, "step": 16330 }, { "epoch": 0.22, "learning_rate": 4.432486495003144e-05, "loss": 1.1933, "step": 16335 }, { "epoch": 0.22, "learning_rate": 4.432152650039581e-05, "loss": 0.9028, "step": 16340 }, { "epoch": 0.22, "learning_rate": 4.431818719491322e-05, "loss": 0.5178, "step": 16345 }, { "epoch": 0.22, "learning_rate": 4.431484703373159e-05, "loss": 1.4662, "step": 16350 }, { "epoch": 0.22, "learning_rate": 4.431150601699886e-05, "loss": 0.7025, "step": 16355 }, { "epoch": 0.22, "learning_rate": 4.430816414486303e-05, "loss": 0.665, "step": 16360 }, { "epoch": 0.22, "learning_rate": 4.430482141747213e-05, "loss": 0.6091, "step": 16365 }, { "epoch": 0.22, "learning_rate": 4.4301477834974206e-05, "loss": 0.472, "step": 16370 }, { "epoch": 0.22, "learning_rate": 4.4298133397517386e-05, "loss": 0.8731, "step": 16375 }, { "epoch": 0.22, "learning_rate": 4.4294788105249795e-05, "loss": 0.6806, "step": 16380 }, { "epoch": 0.22, "learning_rate": 4.4291441958319625e-05, "loss": 0.9489, "step": 16385 }, { "epoch": 0.22, "learning_rate": 4.428809495687508e-05, "loss": 0.3828, "step": 16390 }, { "epoch": 0.22, "learning_rate": 4.4284747101064436e-05, "loss": 0.347, "step": 16395 }, { "epoch": 0.22, "learning_rate": 4.4281398391035966e-05, "loss": 0.6774, "step": 16400 }, { "epoch": 0.22, "learning_rate": 4.4278048826938015e-05, "loss": 0.4817, "step": 16405 }, { "epoch": 0.22, "learning_rate": 4.4274698408918944e-05, "loss": 0.7774, "step": 16410 }, { "epoch": 0.22, "learning_rate": 4.427134713712716e-05, "loss": 1.0989, "step": 16415 }, { "epoch": 0.22, "learning_rate": 4.426799501171111e-05, "loss": 0.8767, "step": 16420 }, { "epoch": 0.22, "learning_rate": 4.426464203281927e-05, "loss": 0.5939, "step": 16425 }, { "epoch": 0.22, "learning_rate": 4.426128820060017e-05, "loss": 1.1092, "step": 16430 }, { "epoch": 0.22, "learning_rate": 4.425793351520237e-05, "loss": 1.2554, "step": 16435 }, { "epoch": 0.22, "learning_rate": 4.4254577976774446e-05, "loss": 1.1698, "step": 16440 }, { "epoch": 0.22, "learning_rate": 4.425122158546506e-05, "loss": 0.5357, "step": 16445 }, { "epoch": 0.22, "learning_rate": 4.424786434142286e-05, "loss": 0.8205, "step": 16450 }, { "epoch": 0.22, "learning_rate": 4.424450624479657e-05, "loss": 0.5119, "step": 16455 }, { "epoch": 0.22, "learning_rate": 4.424114729573493e-05, "loss": 0.8426, "step": 16460 }, { "epoch": 0.22, "learning_rate": 4.423778749438672e-05, "loss": 0.643, "step": 16465 }, { "epoch": 0.22, "learning_rate": 4.423442684090077e-05, "loss": 0.7211, "step": 16470 }, { "epoch": 0.22, "learning_rate": 4.4231065335425937e-05, "loss": 0.4802, "step": 16475 }, { "epoch": 0.22, "learning_rate": 4.422837551771413e-05, "loss": 0.756, "step": 16480 }, { "epoch": 0.22, "learning_rate": 4.4225012479034554e-05, "loss": 1.2354, "step": 16485 }, { "epoch": 0.22, "learning_rate": 4.422164858878311e-05, "loss": 1.3758, "step": 16490 }, { "epoch": 0.22, "learning_rate": 4.42182838471088e-05, "loss": 1.0235, "step": 16495 }, { "epoch": 0.22, "learning_rate": 4.421491825416065e-05, "loss": 1.5519, "step": 16500 }, { "epoch": 0.22, "learning_rate": 4.421155181008776e-05, "loss": 0.4996, "step": 16505 }, { "epoch": 0.22, "learning_rate": 4.420818451503923e-05, "loss": 0.3878, "step": 16510 }, { "epoch": 0.22, "learning_rate": 4.420481636916423e-05, "loss": 1.4082, "step": 16515 }, { "epoch": 0.22, "learning_rate": 4.420144737261194e-05, "loss": 0.8516, "step": 16520 }, { "epoch": 0.22, "learning_rate": 4.419807752553159e-05, "loss": 0.6332, "step": 16525 }, { "epoch": 0.22, "learning_rate": 4.419470682807245e-05, "loss": 1.4508, "step": 16530 }, { "epoch": 0.22, "learning_rate": 4.419133528038384e-05, "loss": 1.3998, "step": 16535 }, { "epoch": 0.22, "learning_rate": 4.418796288261507e-05, "loss": 0.8081, "step": 16540 }, { "epoch": 0.22, "learning_rate": 4.418458963491555e-05, "loss": 1.3121, "step": 16545 }, { "epoch": 0.22, "learning_rate": 4.418121553743468e-05, "loss": 0.3166, "step": 16550 }, { "epoch": 0.22, "learning_rate": 4.4177840590321925e-05, "loss": 0.6992, "step": 16555 }, { "epoch": 0.22, "learning_rate": 4.417446479372677e-05, "loss": 0.9031, "step": 16560 }, { "epoch": 0.22, "learning_rate": 4.4171088147798754e-05, "loss": 0.7025, "step": 16565 }, { "epoch": 0.22, "learning_rate": 4.416771065268745e-05, "loss": 0.7169, "step": 16570 }, { "epoch": 0.22, "learning_rate": 4.416433230854246e-05, "loss": 0.786, "step": 16575 }, { "epoch": 0.22, "learning_rate": 4.416095311551341e-05, "loss": 0.5093, "step": 16580 }, { "epoch": 0.22, "learning_rate": 4.4157573073750005e-05, "loss": 0.7724, "step": 16585 }, { "epoch": 0.22, "learning_rate": 4.4154192183401955e-05, "loss": 2.1743, "step": 16590 }, { "epoch": 0.22, "learning_rate": 4.415081044461901e-05, "loss": 0.9582, "step": 16595 }, { "epoch": 0.22, "learning_rate": 4.414742785755098e-05, "loss": 0.5349, "step": 16600 }, { "epoch": 0.22, "learning_rate": 4.414404442234769e-05, "loss": 0.4601, "step": 16605 }, { "epoch": 0.22, "learning_rate": 4.4140660139158995e-05, "loss": 1.0737, "step": 16610 }, { "epoch": 0.22, "learning_rate": 4.4137275008134816e-05, "loss": 0.8279, "step": 16615 }, { "epoch": 0.22, "learning_rate": 4.41338890294251e-05, "loss": 1.0597, "step": 16620 }, { "epoch": 0.22, "learning_rate": 4.4130502203179825e-05, "loss": 1.189, "step": 16625 }, { "epoch": 0.22, "learning_rate": 4.4127114529549005e-05, "loss": 0.1502, "step": 16630 }, { "epoch": 0.22, "learning_rate": 4.4123726008682694e-05, "loss": 0.77, "step": 16635 }, { "epoch": 0.22, "learning_rate": 4.412033664073101e-05, "loss": 0.9626, "step": 16640 }, { "epoch": 0.22, "learning_rate": 4.411694642584406e-05, "loss": 1.0951, "step": 16645 }, { "epoch": 0.22, "learning_rate": 4.411355536417202e-05, "loss": 0.6967, "step": 16650 }, { "epoch": 0.22, "learning_rate": 4.4110163455865104e-05, "loss": 0.5844, "step": 16655 }, { "epoch": 0.22, "learning_rate": 4.410677070107355e-05, "loss": 0.4233, "step": 16660 }, { "epoch": 0.22, "learning_rate": 4.4103377099947644e-05, "loss": 0.5834, "step": 16665 }, { "epoch": 0.22, "learning_rate": 4.4099982652637705e-05, "loss": 0.374, "step": 16670 }, { "epoch": 0.22, "learning_rate": 4.409658735929408e-05, "loss": 0.777, "step": 16675 }, { "epoch": 0.22, "learning_rate": 4.4093191220067185e-05, "loss": 0.9588, "step": 16680 }, { "epoch": 0.22, "learning_rate": 4.4089794235107435e-05, "loss": 0.4634, "step": 16685 }, { "epoch": 0.22, "learning_rate": 4.40863964045653e-05, "loss": 0.6191, "step": 16690 }, { "epoch": 0.22, "learning_rate": 4.408299772859129e-05, "loss": 1.0737, "step": 16695 }, { "epoch": 0.22, "learning_rate": 4.407959820733595e-05, "loss": 0.9552, "step": 16700 }, { "epoch": 0.22, "learning_rate": 4.407619784094987e-05, "loss": 0.8247, "step": 16705 }, { "epoch": 0.22, "learning_rate": 4.407279662958365e-05, "loss": 1.1727, "step": 16710 }, { "epoch": 0.22, "learning_rate": 4.406939457338796e-05, "loss": 0.7497, "step": 16715 }, { "epoch": 0.22, "learning_rate": 4.4065991672513494e-05, "loss": 1.2724, "step": 16720 }, { "epoch": 0.22, "learning_rate": 4.4062587927110986e-05, "loss": 0.8318, "step": 16725 }, { "epoch": 0.22, "learning_rate": 4.405918333733119e-05, "loss": 0.1893, "step": 16730 }, { "epoch": 0.22, "learning_rate": 4.405577790332493e-05, "loss": 0.9307, "step": 16735 }, { "epoch": 0.22, "learning_rate": 4.405237162524304e-05, "loss": 1.2756, "step": 16740 }, { "epoch": 0.22, "learning_rate": 4.40489645032364e-05, "loss": 0.5386, "step": 16745 }, { "epoch": 0.22, "learning_rate": 4.4045556537455934e-05, "loss": 0.7127, "step": 16750 }, { "epoch": 0.22, "learning_rate": 4.40421477280526e-05, "loss": 0.6637, "step": 16755 }, { "epoch": 0.22, "learning_rate": 4.403873807517738e-05, "loss": 0.3164, "step": 16760 }, { "epoch": 0.22, "learning_rate": 4.40353275789813e-05, "loss": 1.1424, "step": 16765 }, { "epoch": 0.22, "learning_rate": 4.4031916239615454e-05, "loss": 0.5716, "step": 16770 }, { "epoch": 0.22, "learning_rate": 4.402850405723094e-05, "loss": 0.9515, "step": 16775 }, { "epoch": 0.22, "learning_rate": 4.402509103197887e-05, "loss": 0.4894, "step": 16780 }, { "epoch": 0.22, "learning_rate": 4.4021677164010464e-05, "loss": 1.0955, "step": 16785 }, { "epoch": 0.22, "learning_rate": 4.4018262453476925e-05, "loss": 0.4591, "step": 16790 }, { "epoch": 0.23, "learning_rate": 4.401484690052949e-05, "loss": 0.7535, "step": 16795 }, { "epoch": 0.23, "learning_rate": 4.401143050531947e-05, "loss": 0.3957, "step": 16800 }, { "epoch": 0.23, "learning_rate": 4.4008013267998194e-05, "loss": 0.3011, "step": 16805 }, { "epoch": 0.23, "learning_rate": 4.4004595188717025e-05, "loss": 1.4709, "step": 16810 }, { "epoch": 0.23, "learning_rate": 4.400117626762736e-05, "loss": 0.8275, "step": 16815 }, { "epoch": 0.23, "learning_rate": 4.399775650488065e-05, "loss": 0.768, "step": 16820 }, { "epoch": 0.23, "learning_rate": 4.399433590062837e-05, "loss": 0.9996, "step": 16825 }, { "epoch": 0.23, "learning_rate": 4.399091445502204e-05, "loss": 0.9765, "step": 16830 }, { "epoch": 0.23, "learning_rate": 4.39874921682132e-05, "loss": 0.669, "step": 16835 }, { "epoch": 0.23, "learning_rate": 4.398406904035345e-05, "loss": 0.777, "step": 16840 }, { "epoch": 0.23, "learning_rate": 4.3980645071594416e-05, "loss": 0.565, "step": 16845 }, { "epoch": 0.23, "learning_rate": 4.397722026208777e-05, "loss": 0.998, "step": 16850 }, { "epoch": 0.23, "learning_rate": 4.39737946119852e-05, "loss": 1.004, "step": 16855 }, { "epoch": 0.23, "learning_rate": 4.397036812143845e-05, "loss": 0.549, "step": 16860 }, { "epoch": 0.23, "learning_rate": 4.39669407905993e-05, "loss": 0.6632, "step": 16865 }, { "epoch": 0.23, "learning_rate": 4.3963512619619556e-05, "loss": 0.5405, "step": 16870 }, { "epoch": 0.23, "learning_rate": 4.396008360865108e-05, "loss": 0.3932, "step": 16875 }, { "epoch": 0.23, "learning_rate": 4.3956653757845755e-05, "loss": 0.9186, "step": 16880 }, { "epoch": 0.23, "learning_rate": 4.395322306735551e-05, "loss": 1.1996, "step": 16885 }, { "epoch": 0.23, "learning_rate": 4.39497915373323e-05, "loss": 0.9258, "step": 16890 }, { "epoch": 0.23, "learning_rate": 4.394635916792812e-05, "loss": 0.5641, "step": 16895 }, { "epoch": 0.23, "learning_rate": 4.3942925959295025e-05, "loss": 0.9959, "step": 16900 }, { "epoch": 0.23, "learning_rate": 4.393949191158507e-05, "loss": 0.2688, "step": 16905 }, { "epoch": 0.23, "learning_rate": 4.3936057024950375e-05, "loss": 0.4613, "step": 16910 }, { "epoch": 0.23, "learning_rate": 4.3932621299543096e-05, "loss": 0.3953, "step": 16915 }, { "epoch": 0.23, "learning_rate": 4.3929184735515404e-05, "loss": 0.1197, "step": 16920 }, { "epoch": 0.23, "learning_rate": 4.392574733301953e-05, "loss": 0.4445, "step": 16925 }, { "epoch": 0.23, "learning_rate": 4.392230909220773e-05, "loss": 1.0641, "step": 16930 }, { "epoch": 0.23, "learning_rate": 4.39188700132323e-05, "loss": 0.4497, "step": 16935 }, { "epoch": 0.23, "learning_rate": 4.391543009624559e-05, "loss": 0.5784, "step": 16940 }, { "epoch": 0.23, "learning_rate": 4.391198934139994e-05, "loss": 1.2013, "step": 16945 }, { "epoch": 0.23, "learning_rate": 4.3908547748847785e-05, "loss": 0.4292, "step": 16950 }, { "epoch": 0.23, "learning_rate": 4.390510531874156e-05, "loss": 1.3107, "step": 16955 }, { "epoch": 0.23, "learning_rate": 4.3901662051233746e-05, "loss": 1.4472, "step": 16960 }, { "epoch": 0.23, "learning_rate": 4.389821794647687e-05, "loss": 0.732, "step": 16965 }, { "epoch": 0.23, "learning_rate": 4.389477300462348e-05, "loss": 0.5575, "step": 16970 }, { "epoch": 0.23, "learning_rate": 4.389132722582618e-05, "loss": 1.5479, "step": 16975 }, { "epoch": 0.23, "learning_rate": 4.3887880610237584e-05, "loss": 1.272, "step": 16980 }, { "epoch": 0.23, "learning_rate": 4.388443315801038e-05, "loss": 0.4242, "step": 16985 }, { "epoch": 0.23, "learning_rate": 4.388098486929726e-05, "loss": 1.0793, "step": 16990 }, { "epoch": 0.23, "learning_rate": 4.3877535744250965e-05, "loss": 0.888, "step": 16995 }, { "epoch": 0.23, "learning_rate": 4.387408578302428e-05, "loss": 0.7501, "step": 17000 }, { "epoch": 0.23, "learning_rate": 4.387063498577002e-05, "loss": 0.6483, "step": 17005 }, { "epoch": 0.23, "learning_rate": 4.386718335264104e-05, "loss": 0.7826, "step": 17010 }, { "epoch": 0.23, "learning_rate": 4.386373088379022e-05, "loss": 1.226, "step": 17015 }, { "epoch": 0.23, "learning_rate": 4.3860277579370497e-05, "loss": 0.344, "step": 17020 }, { "epoch": 0.23, "learning_rate": 4.3856823439534835e-05, "loss": 1.1155, "step": 17025 }, { "epoch": 0.23, "learning_rate": 4.385336846443623e-05, "loss": 0.3864, "step": 17030 }, { "epoch": 0.23, "learning_rate": 4.384991265422772e-05, "loss": 0.4538, "step": 17035 }, { "epoch": 0.23, "learning_rate": 4.3846456009062386e-05, "loss": 0.6774, "step": 17040 }, { "epoch": 0.23, "learning_rate": 4.384299852909334e-05, "loss": 0.4395, "step": 17045 }, { "epoch": 0.23, "learning_rate": 4.383954021447372e-05, "loss": 0.9562, "step": 17050 }, { "epoch": 0.23, "learning_rate": 4.3836081065356723e-05, "loss": 1.3035, "step": 17055 }, { "epoch": 0.23, "learning_rate": 4.3832621081895565e-05, "loss": 0.6077, "step": 17060 }, { "epoch": 0.23, "learning_rate": 4.382916026424351e-05, "loss": 0.8135, "step": 17065 }, { "epoch": 0.23, "learning_rate": 4.382569861255386e-05, "loss": 0.3368, "step": 17070 }, { "epoch": 0.23, "learning_rate": 4.382223612697994e-05, "loss": 0.5989, "step": 17075 }, { "epoch": 0.23, "learning_rate": 4.381877280767513e-05, "loss": 0.3217, "step": 17080 }, { "epoch": 0.23, "learning_rate": 4.381530865479283e-05, "loss": 0.4081, "step": 17085 }, { "epoch": 0.23, "learning_rate": 4.3811843668486476e-05, "loss": 0.9971, "step": 17090 }, { "epoch": 0.23, "learning_rate": 4.3808377848909575e-05, "loss": 0.6868, "step": 17095 }, { "epoch": 0.23, "learning_rate": 4.3804911196215624e-05, "loss": 1.0917, "step": 17100 }, { "epoch": 0.23, "learning_rate": 4.380144371055819e-05, "loss": 0.2878, "step": 17105 }, { "epoch": 0.23, "learning_rate": 4.379797539209085e-05, "loss": 0.2069, "step": 17110 }, { "epoch": 0.23, "learning_rate": 4.3794506240967245e-05, "loss": 0.2206, "step": 17115 }, { "epoch": 0.23, "learning_rate": 4.3791036257341044e-05, "loss": 0.3328, "step": 17120 }, { "epoch": 0.23, "learning_rate": 4.378756544136595e-05, "loss": 0.6117, "step": 17125 }, { "epoch": 0.23, "learning_rate": 4.378409379319569e-05, "loss": 0.7118, "step": 17130 }, { "epoch": 0.23, "learning_rate": 4.378062131298406e-05, "loss": 0.9586, "step": 17135 }, { "epoch": 0.23, "learning_rate": 4.377714800088485e-05, "loss": 0.6187, "step": 17140 }, { "epoch": 0.23, "learning_rate": 4.377367385705192e-05, "loss": 1.0268, "step": 17145 }, { "epoch": 0.23, "learning_rate": 4.377019888163917e-05, "loss": 0.6239, "step": 17150 }, { "epoch": 0.23, "learning_rate": 4.376672307480051e-05, "loss": 0.3919, "step": 17155 }, { "epoch": 0.23, "learning_rate": 4.376324643668991e-05, "loss": 0.967, "step": 17160 }, { "epoch": 0.23, "learning_rate": 4.3759768967461354e-05, "loss": 0.4043, "step": 17165 }, { "epoch": 0.23, "learning_rate": 4.375629066726889e-05, "loss": 0.6374, "step": 17170 }, { "epoch": 0.23, "learning_rate": 4.3752811536266583e-05, "loss": 0.6904, "step": 17175 }, { "epoch": 0.23, "learning_rate": 4.374933157460854e-05, "loss": 0.4648, "step": 17180 }, { "epoch": 0.23, "learning_rate": 4.374585078244891e-05, "loss": 0.3013, "step": 17185 }, { "epoch": 0.23, "learning_rate": 4.3742369159941876e-05, "loss": 1.358, "step": 17190 }, { "epoch": 0.23, "learning_rate": 4.373888670724165e-05, "loss": 1.0724, "step": 17195 }, { "epoch": 0.23, "learning_rate": 4.373540342450249e-05, "loss": 0.6966, "step": 17200 }, { "epoch": 0.23, "learning_rate": 4.373191931187869e-05, "loss": 1.2914, "step": 17205 }, { "epoch": 0.23, "learning_rate": 4.372843436952458e-05, "loss": 0.5306, "step": 17210 }, { "epoch": 0.23, "learning_rate": 4.3724948597594514e-05, "loss": 0.2797, "step": 17215 }, { "epoch": 0.23, "learning_rate": 4.3721461996242915e-05, "loss": 0.7621, "step": 17220 }, { "epoch": 0.23, "learning_rate": 4.37179745656242e-05, "loss": 1.0058, "step": 17225 }, { "epoch": 0.23, "learning_rate": 4.371448630589287e-05, "loss": 0.5684, "step": 17230 }, { "epoch": 0.23, "learning_rate": 4.3710997217203406e-05, "loss": 0.7507, "step": 17235 }, { "epoch": 0.23, "learning_rate": 4.370750729971038e-05, "loss": 0.7905, "step": 17240 }, { "epoch": 0.23, "learning_rate": 4.3704016553568365e-05, "loss": 0.4137, "step": 17245 }, { "epoch": 0.23, "learning_rate": 4.3700524978931995e-05, "loss": 0.6523, "step": 17250 }, { "epoch": 0.23, "learning_rate": 4.369703257595593e-05, "loss": 0.9015, "step": 17255 }, { "epoch": 0.23, "learning_rate": 4.3693539344794855e-05, "loss": 0.5817, "step": 17260 }, { "epoch": 0.23, "learning_rate": 4.3690045285603504e-05, "loss": 0.3827, "step": 17265 }, { "epoch": 0.23, "learning_rate": 4.368655039853665e-05, "loss": 0.3379, "step": 17270 }, { "epoch": 0.23, "learning_rate": 4.36830546837491e-05, "loss": 0.8931, "step": 17275 }, { "epoch": 0.23, "learning_rate": 4.3679558141395704e-05, "loss": 0.2533, "step": 17280 }, { "epoch": 0.23, "learning_rate": 4.3676060771631325e-05, "loss": 0.6594, "step": 17285 }, { "epoch": 0.23, "learning_rate": 4.3672562574610884e-05, "loss": 0.6213, "step": 17290 }, { "epoch": 0.23, "learning_rate": 4.366906355048935e-05, "loss": 1.1123, "step": 17295 }, { "epoch": 0.23, "learning_rate": 4.36655636994217e-05, "loss": 0.2224, "step": 17300 }, { "epoch": 0.23, "learning_rate": 4.366206302156294e-05, "loss": 0.75, "step": 17305 }, { "epoch": 0.23, "learning_rate": 4.365856151706816e-05, "loss": 0.4089, "step": 17310 }, { "epoch": 0.23, "learning_rate": 4.3655059186092464e-05, "loss": 0.5262, "step": 17315 }, { "epoch": 0.23, "learning_rate": 4.3651556028790955e-05, "loss": 0.7827, "step": 17320 }, { "epoch": 0.23, "learning_rate": 4.364805204531883e-05, "loss": 1.4069, "step": 17325 }, { "epoch": 0.23, "learning_rate": 4.36445472358313e-05, "loss": 0.2256, "step": 17330 }, { "epoch": 0.23, "learning_rate": 4.36410416004836e-05, "loss": 0.6668, "step": 17335 }, { "epoch": 0.23, "learning_rate": 4.363753513943102e-05, "loss": 0.1938, "step": 17340 }, { "epoch": 0.23, "learning_rate": 4.3634027852828865e-05, "loss": 0.4035, "step": 17345 }, { "epoch": 0.23, "learning_rate": 4.36305197408325e-05, "loss": 0.354, "step": 17350 }, { "epoch": 0.23, "learning_rate": 4.362701080359732e-05, "loss": 1.0317, "step": 17355 }, { "epoch": 0.23, "learning_rate": 4.3623501041278744e-05, "loss": 0.9178, "step": 17360 }, { "epoch": 0.23, "learning_rate": 4.361999045403225e-05, "loss": 1.0767, "step": 17365 }, { "epoch": 0.23, "learning_rate": 4.361647904201333e-05, "loss": 1.0767, "step": 17370 }, { "epoch": 0.23, "learning_rate": 4.361296680537752e-05, "loss": 0.8039, "step": 17375 }, { "epoch": 0.23, "learning_rate": 4.3609453744280405e-05, "loss": 1.0541, "step": 17380 }, { "epoch": 0.23, "learning_rate": 4.3605939858877573e-05, "loss": 0.525, "step": 17385 }, { "epoch": 0.23, "learning_rate": 4.360242514932471e-05, "loss": 0.8894, "step": 17390 }, { "epoch": 0.23, "learning_rate": 4.359890961577746e-05, "loss": 0.444, "step": 17395 }, { "epoch": 0.23, "learning_rate": 4.359539325839157e-05, "loss": 0.3529, "step": 17400 }, { "epoch": 0.23, "learning_rate": 4.359187607732279e-05, "loss": 1.2688, "step": 17405 }, { "epoch": 0.23, "learning_rate": 4.358835807272691e-05, "loss": 0.2744, "step": 17410 }, { "epoch": 0.23, "learning_rate": 4.3584839244759755e-05, "loss": 0.8456, "step": 17415 }, { "epoch": 0.23, "learning_rate": 4.358131959357721e-05, "loss": 0.3601, "step": 17420 }, { "epoch": 0.23, "learning_rate": 4.3577799119335164e-05, "loss": 0.5003, "step": 17425 }, { "epoch": 0.23, "learning_rate": 4.357427782218955e-05, "loss": 0.8432, "step": 17430 }, { "epoch": 0.23, "learning_rate": 4.3570755702296365e-05, "loss": 0.6826, "step": 17435 }, { "epoch": 0.23, "learning_rate": 4.356723275981159e-05, "loss": 0.5142, "step": 17440 }, { "epoch": 0.23, "learning_rate": 4.3563708994891316e-05, "loss": 0.4161, "step": 17445 }, { "epoch": 0.23, "learning_rate": 4.3560184407691594e-05, "loss": 0.8959, "step": 17450 }, { "epoch": 0.23, "learning_rate": 4.355665899836856e-05, "loss": 0.7315, "step": 17455 }, { "epoch": 0.23, "learning_rate": 4.355313276707836e-05, "loss": 0.1083, "step": 17460 }, { "epoch": 0.23, "learning_rate": 4.3549605713977205e-05, "loss": 0.8927, "step": 17465 }, { "epoch": 0.23, "learning_rate": 4.354607783922131e-05, "loss": 1.0717, "step": 17470 }, { "epoch": 0.23, "learning_rate": 4.354254914296696e-05, "loss": 0.5829, "step": 17475 }, { "epoch": 0.23, "learning_rate": 4.353901962537044e-05, "loss": 0.7445, "step": 17480 }, { "epoch": 0.23, "learning_rate": 4.3535489286588095e-05, "loss": 0.1948, "step": 17485 }, { "epoch": 0.23, "learning_rate": 4.353195812677632e-05, "loss": 0.3076, "step": 17490 }, { "epoch": 0.23, "learning_rate": 4.352842614609149e-05, "loss": 0.6207, "step": 17495 }, { "epoch": 0.23, "learning_rate": 4.35248933446901e-05, "loss": 0.836, "step": 17500 }, { "epoch": 0.23, "learning_rate": 4.35213597227286e-05, "loss": 1.0267, "step": 17505 }, { "epoch": 0.23, "learning_rate": 4.351782528036352e-05, "loss": 1.0156, "step": 17510 }, { "epoch": 0.23, "learning_rate": 4.351429001775143e-05, "loss": 0.9593, "step": 17515 }, { "epoch": 0.23, "learning_rate": 4.3510753935048915e-05, "loss": 0.9173, "step": 17520 }, { "epoch": 0.23, "learning_rate": 4.3507217032412606e-05, "loss": 0.3085, "step": 17525 }, { "epoch": 0.23, "learning_rate": 4.350367930999917e-05, "loss": 0.8361, "step": 17530 }, { "epoch": 0.23, "learning_rate": 4.350014076796531e-05, "loss": 0.3056, "step": 17535 }, { "epoch": 0.24, "learning_rate": 4.3496601406467776e-05, "loss": 1.4952, "step": 17540 }, { "epoch": 0.24, "learning_rate": 4.3493061225663325e-05, "loss": 0.9276, "step": 17545 }, { "epoch": 0.24, "learning_rate": 4.348952022570878e-05, "loss": 0.3868, "step": 17550 }, { "epoch": 0.24, "learning_rate": 4.3485978406761e-05, "loss": 0.6271, "step": 17555 }, { "epoch": 0.24, "learning_rate": 4.3482435768976847e-05, "loss": 0.8674, "step": 17560 }, { "epoch": 0.24, "learning_rate": 4.347889231251326e-05, "loss": 0.6332, "step": 17565 }, { "epoch": 0.24, "learning_rate": 4.347534803752718e-05, "loss": 0.9128, "step": 17570 }, { "epoch": 0.24, "learning_rate": 4.3471802944175624e-05, "loss": 0.4781, "step": 17575 }, { "epoch": 0.24, "learning_rate": 4.3468257032615614e-05, "loss": 1.0613, "step": 17580 }, { "epoch": 0.24, "learning_rate": 4.3464710303004195e-05, "loss": 0.7805, "step": 17585 }, { "epoch": 0.24, "learning_rate": 4.3461162755498494e-05, "loss": 0.4644, "step": 17590 }, { "epoch": 0.24, "learning_rate": 4.345761439025564e-05, "loss": 0.5486, "step": 17595 }, { "epoch": 0.24, "learning_rate": 4.345406520743282e-05, "loss": 0.426, "step": 17600 }, { "epoch": 0.24, "learning_rate": 4.3450515207187215e-05, "loss": 0.9279, "step": 17605 }, { "epoch": 0.24, "learning_rate": 4.3446964389676105e-05, "loss": 0.7245, "step": 17610 }, { "epoch": 0.24, "learning_rate": 4.3443412755056754e-05, "loss": 0.5891, "step": 17615 }, { "epoch": 0.24, "learning_rate": 4.343986030348649e-05, "loss": 0.7575, "step": 17620 }, { "epoch": 0.24, "learning_rate": 4.343630703512266e-05, "loss": 0.8771, "step": 17625 }, { "epoch": 0.24, "learning_rate": 4.343275295012267e-05, "loss": 1.0907, "step": 17630 }, { "epoch": 0.24, "learning_rate": 4.342919804864394e-05, "loss": 1.0772, "step": 17635 }, { "epoch": 0.24, "learning_rate": 4.342564233084393e-05, "loss": 0.7045, "step": 17640 }, { "epoch": 0.24, "learning_rate": 4.3422085796880145e-05, "loss": 0.4122, "step": 17645 }, { "epoch": 0.24, "learning_rate": 4.341852844691012e-05, "loss": 0.5572, "step": 17650 }, { "epoch": 0.24, "learning_rate": 4.3414970281091436e-05, "loss": 0.473, "step": 17655 }, { "epoch": 0.24, "learning_rate": 4.3411411299581695e-05, "loss": 0.919, "step": 17660 }, { "epoch": 0.24, "learning_rate": 4.340785150253854e-05, "loss": 1.0978, "step": 17665 }, { "epoch": 0.24, "learning_rate": 4.3404290890119656e-05, "loss": 0.5091, "step": 17670 }, { "epoch": 0.24, "learning_rate": 4.340072946248277e-05, "loss": 0.47, "step": 17675 }, { "epoch": 0.24, "learning_rate": 4.339716721978561e-05, "loss": 0.6923, "step": 17680 }, { "epoch": 0.24, "learning_rate": 4.339360416218599e-05, "loss": 1.1209, "step": 17685 }, { "epoch": 0.24, "learning_rate": 4.339004028984172e-05, "loss": 1.153, "step": 17690 }, { "epoch": 0.24, "learning_rate": 4.338647560291067e-05, "loss": 0.6266, "step": 17695 }, { "epoch": 0.24, "learning_rate": 4.3382910101550734e-05, "loss": 0.2248, "step": 17700 }, { "epoch": 0.24, "learning_rate": 4.337934378591984e-05, "loss": 0.6524, "step": 17705 }, { "epoch": 0.24, "learning_rate": 4.337577665617598e-05, "loss": 1.1029, "step": 17710 }, { "epoch": 0.24, "learning_rate": 4.3372208712477135e-05, "loss": 0.9421, "step": 17715 }, { "epoch": 0.24, "learning_rate": 4.336863995498136e-05, "loss": 0.4951, "step": 17720 }, { "epoch": 0.24, "learning_rate": 4.336507038384673e-05, "loss": 0.8548, "step": 17725 }, { "epoch": 0.24, "learning_rate": 4.336149999923136e-05, "loss": 0.9969, "step": 17730 }, { "epoch": 0.24, "learning_rate": 4.33579288012934e-05, "loss": 0.9276, "step": 17735 }, { "epoch": 0.24, "learning_rate": 4.335435679019104e-05, "loss": 0.4524, "step": 17740 }, { "epoch": 0.24, "learning_rate": 4.33507839660825e-05, "loss": 0.474, "step": 17745 }, { "epoch": 0.24, "learning_rate": 4.334721032912602e-05, "loss": 1.0934, "step": 17750 }, { "epoch": 0.24, "learning_rate": 4.3343635879479925e-05, "loss": 0.6729, "step": 17755 }, { "epoch": 0.24, "learning_rate": 4.334006061730253e-05, "loss": 1.1192, "step": 17760 }, { "epoch": 0.24, "learning_rate": 4.33364845427522e-05, "loss": 0.4075, "step": 17765 }, { "epoch": 0.24, "learning_rate": 4.3332907655987335e-05, "loss": 1.28, "step": 17770 }, { "epoch": 0.24, "learning_rate": 4.3329329957166385e-05, "loss": 0.7273, "step": 17775 }, { "epoch": 0.24, "learning_rate": 4.332575144644781e-05, "loss": 0.284, "step": 17780 }, { "epoch": 0.24, "learning_rate": 4.3322172123990126e-05, "loss": 0.9285, "step": 17785 }, { "epoch": 0.24, "learning_rate": 4.3318591989951886e-05, "loss": 0.5944, "step": 17790 }, { "epoch": 0.24, "learning_rate": 4.331501104449166e-05, "loss": 0.7583, "step": 17795 }, { "epoch": 0.24, "learning_rate": 4.331142928776808e-05, "loss": 0.2545, "step": 17800 }, { "epoch": 0.24, "learning_rate": 4.3307846719939785e-05, "loss": 1.3767, "step": 17805 }, { "epoch": 0.24, "learning_rate": 4.3304263341165474e-05, "loss": 1.4947, "step": 17810 }, { "epoch": 0.24, "learning_rate": 4.3300679151603874e-05, "loss": 0.7355, "step": 17815 }, { "epoch": 0.24, "learning_rate": 4.329709415141374e-05, "loss": 0.4119, "step": 17820 }, { "epoch": 0.24, "learning_rate": 4.3293508340753864e-05, "loss": 0.3776, "step": 17825 }, { "epoch": 0.24, "learning_rate": 4.32899217197831e-05, "loss": 0.7098, "step": 17830 }, { "epoch": 0.24, "learning_rate": 4.32863342886603e-05, "loss": 0.5923, "step": 17835 }, { "epoch": 0.24, "learning_rate": 4.328274604754438e-05, "loss": 0.8138, "step": 17840 }, { "epoch": 0.24, "learning_rate": 4.327915699659427e-05, "loss": 0.3587, "step": 17845 }, { "epoch": 0.24, "learning_rate": 4.3275567135968953e-05, "loss": 0.8663, "step": 17850 }, { "epoch": 0.24, "learning_rate": 4.327197646582743e-05, "loss": 0.5408, "step": 17855 }, { "epoch": 0.24, "learning_rate": 4.326838498632878e-05, "loss": 0.5085, "step": 17860 }, { "epoch": 0.24, "learning_rate": 4.326479269763207e-05, "loss": 0.5642, "step": 17865 }, { "epoch": 0.24, "learning_rate": 4.326119959989641e-05, "loss": 0.5153, "step": 17870 }, { "epoch": 0.24, "learning_rate": 4.325760569328097e-05, "loss": 0.5488, "step": 17875 }, { "epoch": 0.24, "learning_rate": 4.325401097794493e-05, "loss": 0.5496, "step": 17880 }, { "epoch": 0.24, "learning_rate": 4.3250415454047535e-05, "loss": 0.9666, "step": 17885 }, { "epoch": 0.24, "learning_rate": 4.3246819121748036e-05, "loss": 0.4063, "step": 17890 }, { "epoch": 0.24, "learning_rate": 4.3243221981205735e-05, "loss": 0.8853, "step": 17895 }, { "epoch": 0.24, "learning_rate": 4.3239624032579975e-05, "loss": 1.1293, "step": 17900 }, { "epoch": 0.24, "learning_rate": 4.3236025276030113e-05, "loss": 0.3431, "step": 17905 }, { "epoch": 0.24, "learning_rate": 4.323242571171556e-05, "loss": 0.6612, "step": 17910 }, { "epoch": 0.24, "learning_rate": 4.322882533979576e-05, "loss": 1.1584, "step": 17915 }, { "epoch": 0.24, "learning_rate": 4.322522416043021e-05, "loss": 0.3423, "step": 17920 }, { "epoch": 0.24, "learning_rate": 4.322162217377839e-05, "loss": 1.0146, "step": 17925 }, { "epoch": 0.24, "learning_rate": 4.3218019379999875e-05, "loss": 0.7754, "step": 17930 }, { "epoch": 0.24, "learning_rate": 4.321441577925425e-05, "loss": 1.0013, "step": 17935 }, { "epoch": 0.24, "learning_rate": 4.3210811371701123e-05, "loss": 0.8207, "step": 17940 }, { "epoch": 0.24, "learning_rate": 4.320720615750016e-05, "loss": 0.8214, "step": 17945 }, { "epoch": 0.24, "learning_rate": 4.320360013681104e-05, "loss": 0.4731, "step": 17950 }, { "epoch": 0.24, "learning_rate": 4.319999330979352e-05, "loss": 0.4874, "step": 17955 }, { "epoch": 0.24, "learning_rate": 4.319638567660734e-05, "loss": 1.0523, "step": 17960 }, { "epoch": 0.24, "learning_rate": 4.3192777237412305e-05, "loss": 1.0279, "step": 17965 }, { "epoch": 0.24, "learning_rate": 4.318916799236826e-05, "loss": 0.4347, "step": 17970 }, { "epoch": 0.24, "learning_rate": 4.318555794163507e-05, "loss": 1.0727, "step": 17975 }, { "epoch": 0.24, "learning_rate": 4.318194708537264e-05, "loss": 0.6077, "step": 17980 }, { "epoch": 0.24, "learning_rate": 4.3178335423740926e-05, "loss": 0.8332, "step": 17985 }, { "epoch": 0.24, "learning_rate": 4.317472295689988e-05, "loss": 0.4535, "step": 17990 }, { "epoch": 0.24, "learning_rate": 4.3171109685009546e-05, "loss": 0.6591, "step": 17995 }, { "epoch": 0.24, "learning_rate": 4.316749560822996e-05, "loss": 0.4505, "step": 18000 }, { "epoch": 0.24, "learning_rate": 4.3163880726721194e-05, "loss": 1.3163, "step": 18005 }, { "epoch": 0.24, "learning_rate": 4.31602650406434e-05, "loss": 1.1105, "step": 18010 }, { "epoch": 0.24, "learning_rate": 4.3156648550156706e-05, "loss": 0.5322, "step": 18015 }, { "epoch": 0.24, "learning_rate": 4.315303125542132e-05, "loss": 1.2623, "step": 18020 }, { "epoch": 0.24, "learning_rate": 4.3149413156597465e-05, "loss": 0.9977, "step": 18025 }, { "epoch": 0.24, "learning_rate": 4.31457942538454e-05, "loss": 0.7949, "step": 18030 }, { "epoch": 0.24, "learning_rate": 4.3142174547325434e-05, "loss": 0.8252, "step": 18035 }, { "epoch": 0.24, "learning_rate": 4.31385540371979e-05, "loss": 1.4925, "step": 18040 }, { "epoch": 0.24, "learning_rate": 4.313493272362317e-05, "loss": 0.9028, "step": 18045 }, { "epoch": 0.24, "learning_rate": 4.313131060676164e-05, "loss": 0.295, "step": 18050 }, { "epoch": 0.24, "learning_rate": 4.3127687686773766e-05, "loss": 0.2885, "step": 18055 }, { "epoch": 0.24, "learning_rate": 4.312406396382001e-05, "loss": 0.7056, "step": 18060 }, { "epoch": 0.24, "learning_rate": 4.312043943806089e-05, "loss": 0.6132, "step": 18065 }, { "epoch": 0.24, "learning_rate": 4.3116814109656965e-05, "loss": 0.905, "step": 18070 }, { "epoch": 0.24, "learning_rate": 4.311318797876881e-05, "loss": 0.5143, "step": 18075 }, { "epoch": 0.24, "learning_rate": 4.3109561045557035e-05, "loss": 1.3693, "step": 18080 }, { "epoch": 0.24, "learning_rate": 4.3105933310182314e-05, "loss": 0.7393, "step": 18085 }, { "epoch": 0.24, "learning_rate": 4.310230477280532e-05, "loss": 0.7877, "step": 18090 }, { "epoch": 0.24, "learning_rate": 4.30986754335868e-05, "loss": 1.0846, "step": 18095 }, { "epoch": 0.24, "learning_rate": 4.3095045292687495e-05, "loss": 0.7998, "step": 18100 }, { "epoch": 0.24, "learning_rate": 4.309141435026822e-05, "loss": 0.9253, "step": 18105 }, { "epoch": 0.24, "learning_rate": 4.308778260648978e-05, "loss": 0.6463, "step": 18110 }, { "epoch": 0.24, "learning_rate": 4.308415006151307e-05, "loss": 0.2275, "step": 18115 }, { "epoch": 0.24, "learning_rate": 4.308051671549899e-05, "loss": 1.0878, "step": 18120 }, { "epoch": 0.24, "learning_rate": 4.3076882568608466e-05, "loss": 0.6364, "step": 18125 }, { "epoch": 0.24, "learning_rate": 4.307324762100249e-05, "loss": 0.5943, "step": 18130 }, { "epoch": 0.24, "learning_rate": 4.306961187284205e-05, "loss": 0.6869, "step": 18135 }, { "epoch": 0.24, "learning_rate": 4.306597532428821e-05, "loss": 0.9188, "step": 18140 }, { "epoch": 0.24, "learning_rate": 4.3062337975502045e-05, "loss": 1.0699, "step": 18145 }, { "epoch": 0.24, "learning_rate": 4.3058699826644667e-05, "loss": 1.199, "step": 18150 }, { "epoch": 0.24, "learning_rate": 4.305506087787723e-05, "loss": 1.2551, "step": 18155 }, { "epoch": 0.24, "learning_rate": 4.305142112936092e-05, "loss": 1.3043, "step": 18160 }, { "epoch": 0.24, "learning_rate": 4.304778058125697e-05, "loss": 0.5756, "step": 18165 }, { "epoch": 0.24, "learning_rate": 4.304413923372663e-05, "loss": 0.7215, "step": 18170 }, { "epoch": 0.24, "learning_rate": 4.3040497086931195e-05, "loss": 1.0527, "step": 18175 }, { "epoch": 0.24, "learning_rate": 4.303685414103199e-05, "loss": 0.859, "step": 18180 }, { "epoch": 0.24, "learning_rate": 4.3033210396190385e-05, "loss": 1.314, "step": 18185 }, { "epoch": 0.24, "learning_rate": 4.302956585256777e-05, "loss": 0.862, "step": 18190 }, { "epoch": 0.24, "learning_rate": 4.302592051032559e-05, "loss": 0.7438, "step": 18195 }, { "epoch": 0.24, "learning_rate": 4.3022274369625316e-05, "loss": 0.4413, "step": 18200 }, { "epoch": 0.24, "learning_rate": 4.301862743062844e-05, "loss": 0.5867, "step": 18205 }, { "epoch": 0.24, "learning_rate": 4.3014979693496526e-05, "loss": 0.24, "step": 18210 }, { "epoch": 0.24, "learning_rate": 4.3011331158391133e-05, "loss": 1.1374, "step": 18215 }, { "epoch": 0.24, "learning_rate": 4.300768182547388e-05, "loss": 1.1778, "step": 18220 }, { "epoch": 0.24, "learning_rate": 4.30040316949064e-05, "loss": 0.4194, "step": 18225 }, { "epoch": 0.24, "learning_rate": 4.3000380766850404e-05, "loss": 0.4362, "step": 18230 }, { "epoch": 0.24, "learning_rate": 4.2996729041467576e-05, "loss": 1.2057, "step": 18235 }, { "epoch": 0.24, "learning_rate": 4.299307651891969e-05, "loss": 1.1675, "step": 18240 }, { "epoch": 0.24, "learning_rate": 4.298942319936854e-05, "loss": 1.0142, "step": 18245 }, { "epoch": 0.24, "learning_rate": 4.2985769082975937e-05, "loss": 0.513, "step": 18250 }, { "epoch": 0.24, "learning_rate": 4.2982114169903745e-05, "loss": 1.1792, "step": 18255 }, { "epoch": 0.24, "learning_rate": 4.2978458460313855e-05, "loss": 0.244, "step": 18260 }, { "epoch": 0.24, "learning_rate": 4.297480195436819e-05, "loss": 0.752, "step": 18265 }, { "epoch": 0.24, "learning_rate": 4.297114465222874e-05, "loss": 0.8179, "step": 18270 }, { "epoch": 0.24, "learning_rate": 4.296748655405748e-05, "loss": 0.7085, "step": 18275 }, { "epoch": 0.24, "learning_rate": 4.296382766001645e-05, "loss": 0.3675, "step": 18280 }, { "epoch": 0.24, "learning_rate": 4.2960167970267736e-05, "loss": 0.5194, "step": 18285 }, { "epoch": 0.25, "learning_rate": 4.2956507484973424e-05, "loss": 0.5168, "step": 18290 }, { "epoch": 0.25, "learning_rate": 4.2952846204295665e-05, "loss": 0.5012, "step": 18295 }, { "epoch": 0.25, "learning_rate": 4.294918412839664e-05, "loss": 0.8818, "step": 18300 }, { "epoch": 0.25, "learning_rate": 4.294552125743855e-05, "loss": 0.9045, "step": 18305 }, { "epoch": 0.25, "learning_rate": 4.2941857591583645e-05, "loss": 0.5258, "step": 18310 }, { "epoch": 0.25, "learning_rate": 4.293819313099421e-05, "loss": 0.6715, "step": 18315 }, { "epoch": 0.25, "learning_rate": 4.293452787583256e-05, "loss": 0.5052, "step": 18320 }, { "epoch": 0.25, "learning_rate": 4.293086182626106e-05, "loss": 0.7893, "step": 18325 }, { "epoch": 0.25, "learning_rate": 4.2927194982442075e-05, "loss": 1.2106, "step": 18330 }, { "epoch": 0.25, "learning_rate": 4.292352734453804e-05, "loss": 0.5821, "step": 18335 }, { "epoch": 0.25, "learning_rate": 4.291985891271142e-05, "loss": 1.1604, "step": 18340 }, { "epoch": 0.25, "learning_rate": 4.291618968712469e-05, "loss": 1.01, "step": 18345 }, { "epoch": 0.25, "learning_rate": 4.291251966794039e-05, "loss": 0.7776, "step": 18350 }, { "epoch": 0.25, "learning_rate": 4.2908848855321086e-05, "loss": 0.5424, "step": 18355 }, { "epoch": 0.25, "learning_rate": 4.290517724942937e-05, "loss": 0.9854, "step": 18360 }, { "epoch": 0.25, "learning_rate": 4.290150485042789e-05, "loss": 0.9099, "step": 18365 }, { "epoch": 0.25, "learning_rate": 4.289783165847929e-05, "loss": 0.6894, "step": 18370 }, { "epoch": 0.25, "learning_rate": 4.289415767374629e-05, "loss": 0.6603, "step": 18375 }, { "epoch": 0.25, "learning_rate": 4.289048289639164e-05, "loss": 0.7987, "step": 18380 }, { "epoch": 0.25, "learning_rate": 4.288680732657808e-05, "loss": 0.7456, "step": 18385 }, { "epoch": 0.25, "learning_rate": 4.288313096446845e-05, "loss": 0.2847, "step": 18390 }, { "epoch": 0.25, "learning_rate": 4.287945381022559e-05, "loss": 1.4594, "step": 18395 }, { "epoch": 0.25, "learning_rate": 4.287577586401237e-05, "loss": 0.8811, "step": 18400 }, { "epoch": 0.25, "learning_rate": 4.28720971259917e-05, "loss": 0.2254, "step": 18405 }, { "epoch": 0.25, "learning_rate": 4.2868417596326554e-05, "loss": 0.1954, "step": 18410 }, { "epoch": 0.25, "learning_rate": 4.2864737275179894e-05, "loss": 1.0516, "step": 18415 }, { "epoch": 0.25, "learning_rate": 4.286105616271475e-05, "loss": 0.581, "step": 18420 }, { "epoch": 0.25, "learning_rate": 4.285737425909417e-05, "loss": 1.0659, "step": 18425 }, { "epoch": 0.25, "learning_rate": 4.285369156448125e-05, "loss": 1.1183, "step": 18430 }, { "epoch": 0.25, "learning_rate": 4.285000807903912e-05, "loss": 0.3144, "step": 18435 }, { "epoch": 0.25, "learning_rate": 4.284632380293092e-05, "loss": 0.9505, "step": 18440 }, { "epoch": 0.25, "learning_rate": 4.2842638736319865e-05, "loss": 0.9383, "step": 18445 }, { "epoch": 0.25, "learning_rate": 4.283895287936917e-05, "loss": 0.3803, "step": 18450 }, { "epoch": 0.25, "learning_rate": 4.2835266232242116e-05, "loss": 0.3335, "step": 18455 }, { "epoch": 0.25, "learning_rate": 4.283157879510199e-05, "loss": 0.4905, "step": 18460 }, { "epoch": 0.25, "learning_rate": 4.2827890568112136e-05, "loss": 0.3449, "step": 18465 }, { "epoch": 0.25, "learning_rate": 4.282420155143592e-05, "loss": 1.3037, "step": 18470 }, { "epoch": 0.25, "learning_rate": 4.282051174523675e-05, "loss": 0.9986, "step": 18475 }, { "epoch": 0.25, "learning_rate": 4.281682114967806e-05, "loss": 0.9735, "step": 18480 }, { "epoch": 0.25, "learning_rate": 4.281312976492332e-05, "loss": 0.7552, "step": 18485 }, { "epoch": 0.25, "learning_rate": 4.280943759113606e-05, "loss": 0.7342, "step": 18490 }, { "epoch": 0.25, "learning_rate": 4.28057446284798e-05, "loss": 0.9237, "step": 18495 }, { "epoch": 0.25, "learning_rate": 4.280205087711814e-05, "loss": 0.4585, "step": 18500 }, { "epoch": 0.25, "learning_rate": 4.279835633721469e-05, "loss": 0.1411, "step": 18505 }, { "epoch": 0.25, "learning_rate": 4.279466100893309e-05, "loss": 0.6192, "step": 18510 }, { "epoch": 0.25, "learning_rate": 4.2790964892437036e-05, "loss": 1.201, "step": 18515 }, { "epoch": 0.25, "learning_rate": 4.2787267987890236e-05, "loss": 0.5654, "step": 18520 }, { "epoch": 0.25, "learning_rate": 4.278357029545646e-05, "loss": 0.5809, "step": 18525 }, { "epoch": 0.25, "learning_rate": 4.277987181529948e-05, "loss": 0.5807, "step": 18530 }, { "epoch": 0.25, "learning_rate": 4.277617254758314e-05, "loss": 1.0638, "step": 18535 }, { "epoch": 0.25, "learning_rate": 4.277247249247128e-05, "loss": 0.4517, "step": 18540 }, { "epoch": 0.25, "learning_rate": 4.2768771650127796e-05, "loss": 0.5972, "step": 18545 }, { "epoch": 0.25, "learning_rate": 4.276507002071663e-05, "loss": 0.6047, "step": 18550 }, { "epoch": 0.25, "learning_rate": 4.276136760440174e-05, "loss": 0.7515, "step": 18555 }, { "epoch": 0.25, "learning_rate": 4.275766440134711e-05, "loss": 0.4053, "step": 18560 }, { "epoch": 0.25, "learning_rate": 4.27539604117168e-05, "loss": 0.7946, "step": 18565 }, { "epoch": 0.25, "learning_rate": 4.275025563567485e-05, "loss": 0.533, "step": 18570 }, { "epoch": 0.25, "learning_rate": 4.274655007338539e-05, "loss": 0.8039, "step": 18575 }, { "epoch": 0.25, "learning_rate": 4.2742843725012536e-05, "loss": 0.3668, "step": 18580 }, { "epoch": 0.25, "learning_rate": 4.2739136590720476e-05, "loss": 0.3489, "step": 18585 }, { "epoch": 0.25, "learning_rate": 4.2735428670673404e-05, "loss": 0.6032, "step": 18590 }, { "epoch": 0.25, "learning_rate": 4.2731719965035575e-05, "loss": 0.8428, "step": 18595 }, { "epoch": 0.25, "learning_rate": 4.272801047397126e-05, "loss": 1.3151, "step": 18600 }, { "epoch": 0.25, "learning_rate": 4.272430019764477e-05, "loss": 0.3561, "step": 18605 }, { "epoch": 0.25, "learning_rate": 4.272058913622046e-05, "loss": 0.4527, "step": 18610 }, { "epoch": 0.25, "learning_rate": 4.27168772898627e-05, "loss": 0.4988, "step": 18615 }, { "epoch": 0.25, "learning_rate": 4.27131646587359e-05, "loss": 0.155, "step": 18620 }, { "epoch": 0.25, "learning_rate": 4.270945124300454e-05, "loss": 0.7773, "step": 18625 }, { "epoch": 0.25, "learning_rate": 4.270573704283308e-05, "loss": 1.4714, "step": 18630 }, { "epoch": 0.25, "learning_rate": 4.270202205838605e-05, "loss": 0.9636, "step": 18635 }, { "epoch": 0.25, "learning_rate": 4.2698306289828e-05, "loss": 0.4038, "step": 18640 }, { "epoch": 0.25, "learning_rate": 4.269458973732352e-05, "loss": 0.7973, "step": 18645 }, { "epoch": 0.25, "learning_rate": 4.269087240103724e-05, "loss": 0.4447, "step": 18650 }, { "epoch": 0.25, "learning_rate": 4.268715428113382e-05, "loss": 0.9155, "step": 18655 }, { "epoch": 0.25, "learning_rate": 4.268343537777795e-05, "loss": 0.4085, "step": 18660 }, { "epoch": 0.25, "learning_rate": 4.2679715691134356e-05, "loss": 1.6902, "step": 18665 }, { "epoch": 0.25, "learning_rate": 4.2675995221367814e-05, "loss": 1.0022, "step": 18670 }, { "epoch": 0.25, "learning_rate": 4.2672273968643115e-05, "loss": 1.4089, "step": 18675 }, { "epoch": 0.25, "learning_rate": 4.266855193312508e-05, "loss": 0.3322, "step": 18680 }, { "epoch": 0.25, "learning_rate": 4.2664829114978595e-05, "loss": 0.3171, "step": 18685 }, { "epoch": 0.25, "learning_rate": 4.2661105514368554e-05, "loss": 1.537, "step": 18690 }, { "epoch": 0.25, "learning_rate": 4.26573811314599e-05, "loss": 0.616, "step": 18695 }, { "epoch": 0.25, "learning_rate": 4.2653655966417584e-05, "loss": 0.9909, "step": 18700 }, { "epoch": 0.25, "learning_rate": 4.264993001940664e-05, "loss": 0.2878, "step": 18705 }, { "epoch": 0.25, "learning_rate": 4.264620329059209e-05, "loss": 1.232, "step": 18710 }, { "epoch": 0.25, "learning_rate": 4.264247578013901e-05, "loss": 1.0527, "step": 18715 }, { "epoch": 0.25, "learning_rate": 4.263874748821253e-05, "loss": 0.7228, "step": 18720 }, { "epoch": 0.25, "learning_rate": 4.263501841497777e-05, "loss": 0.61, "step": 18725 }, { "epoch": 0.25, "learning_rate": 4.263128856059992e-05, "loss": 1.7003, "step": 18730 }, { "epoch": 0.25, "learning_rate": 4.2627557925244196e-05, "loss": 1.2878, "step": 18735 }, { "epoch": 0.25, "learning_rate": 4.2623826509075835e-05, "loss": 1.1825, "step": 18740 }, { "epoch": 0.25, "learning_rate": 4.262009431226014e-05, "loss": 1.024, "step": 18745 }, { "epoch": 0.25, "learning_rate": 4.261636133496242e-05, "loss": 0.4118, "step": 18750 }, { "epoch": 0.25, "learning_rate": 4.261262757734801e-05, "loss": 0.7002, "step": 18755 }, { "epoch": 0.25, "learning_rate": 4.260889303958232e-05, "loss": 0.2908, "step": 18760 }, { "epoch": 0.25, "learning_rate": 4.260515772183077e-05, "loss": 0.7677, "step": 18765 }, { "epoch": 0.25, "learning_rate": 4.2601421624258795e-05, "loss": 1.081, "step": 18770 }, { "epoch": 0.25, "learning_rate": 4.2597684747031916e-05, "loss": 2.0616, "step": 18775 }, { "epoch": 0.25, "learning_rate": 4.259394709031562e-05, "loss": 0.335, "step": 18780 }, { "epoch": 0.25, "learning_rate": 4.259020865427551e-05, "loss": 0.7836, "step": 18785 }, { "epoch": 0.25, "learning_rate": 4.2586469439077145e-05, "loss": 0.5744, "step": 18790 }, { "epoch": 0.25, "learning_rate": 4.258272944488617e-05, "loss": 0.9429, "step": 18795 }, { "epoch": 0.25, "learning_rate": 4.2578988671868235e-05, "loss": 1.5664, "step": 18800 }, { "epoch": 0.25, "learning_rate": 4.257524712018906e-05, "loss": 0.4746, "step": 18805 }, { "epoch": 0.25, "learning_rate": 4.257150479001436e-05, "loss": 0.9952, "step": 18810 }, { "epoch": 0.25, "learning_rate": 4.25677616815099e-05, "loss": 0.9556, "step": 18815 }, { "epoch": 0.25, "learning_rate": 4.256401779484149e-05, "loss": 0.458, "step": 18820 }, { "epoch": 0.25, "learning_rate": 4.256027313017496e-05, "loss": 0.5751, "step": 18825 }, { "epoch": 0.25, "learning_rate": 4.2556527687676186e-05, "loss": 0.8037, "step": 18830 }, { "epoch": 0.25, "learning_rate": 4.255278146751106e-05, "loss": 1.0943, "step": 18835 }, { "epoch": 0.25, "learning_rate": 4.254903446984553e-05, "loss": 0.249, "step": 18840 }, { "epoch": 0.25, "learning_rate": 4.254528669484558e-05, "loss": 0.4573, "step": 18845 }, { "epoch": 0.25, "learning_rate": 4.254153814267719e-05, "loss": 0.7566, "step": 18850 }, { "epoch": 0.25, "learning_rate": 4.253778881350643e-05, "loss": 1.3264, "step": 18855 }, { "epoch": 0.25, "learning_rate": 4.253403870749936e-05, "loss": 1.2029, "step": 18860 }, { "epoch": 0.25, "learning_rate": 4.253028782482209e-05, "loss": 1.3095, "step": 18865 }, { "epoch": 0.25, "learning_rate": 4.2526536165640774e-05, "loss": 1.7969, "step": 18870 }, { "epoch": 0.25, "learning_rate": 4.2522783730121596e-05, "loss": 0.6019, "step": 18875 }, { "epoch": 0.25, "learning_rate": 4.251903051843075e-05, "loss": 0.6915, "step": 18880 }, { "epoch": 0.25, "learning_rate": 4.2515276530734504e-05, "loss": 0.9655, "step": 18885 }, { "epoch": 0.25, "learning_rate": 4.251152176719913e-05, "loss": 0.6872, "step": 18890 }, { "epoch": 0.25, "learning_rate": 4.250776622799095e-05, "loss": 1.188, "step": 18895 }, { "epoch": 0.25, "learning_rate": 4.250400991327632e-05, "loss": 0.9502, "step": 18900 }, { "epoch": 0.25, "learning_rate": 4.250025282322162e-05, "loss": 1.1958, "step": 18905 }, { "epoch": 0.25, "learning_rate": 4.249649495799327e-05, "loss": 1.4021, "step": 18910 }, { "epoch": 0.25, "learning_rate": 4.249273631775772e-05, "loss": 0.3684, "step": 18915 }, { "epoch": 0.25, "learning_rate": 4.248897690268147e-05, "loss": 0.7474, "step": 18920 }, { "epoch": 0.25, "learning_rate": 4.248521671293104e-05, "loss": 0.7445, "step": 18925 }, { "epoch": 0.25, "learning_rate": 4.248145574867298e-05, "loss": 0.8741, "step": 18930 }, { "epoch": 0.25, "learning_rate": 4.247769401007389e-05, "loss": 0.3796, "step": 18935 }, { "epoch": 0.25, "learning_rate": 4.247393149730039e-05, "loss": 0.6476, "step": 18940 }, { "epoch": 0.25, "learning_rate": 4.247016821051915e-05, "loss": 0.4631, "step": 18945 }, { "epoch": 0.25, "learning_rate": 4.2466404149896854e-05, "loss": 0.6586, "step": 18950 }, { "epoch": 0.25, "learning_rate": 4.2462639315600237e-05, "loss": 0.6385, "step": 18955 }, { "epoch": 0.25, "learning_rate": 4.245887370779605e-05, "loss": 0.2975, "step": 18960 }, { "epoch": 0.25, "learning_rate": 4.245510732665112e-05, "loss": 0.5142, "step": 18965 }, { "epoch": 0.25, "learning_rate": 4.2451340172332256e-05, "loss": 0.4999, "step": 18970 }, { "epoch": 0.25, "learning_rate": 4.2447572245006326e-05, "loss": 0.6427, "step": 18975 }, { "epoch": 0.25, "learning_rate": 4.244380354484023e-05, "loss": 0.8982, "step": 18980 }, { "epoch": 0.25, "learning_rate": 4.244003407200091e-05, "loss": 0.4071, "step": 18985 }, { "epoch": 0.25, "learning_rate": 4.243626382665533e-05, "loss": 1.6473, "step": 18990 }, { "epoch": 0.25, "learning_rate": 4.2432492808970494e-05, "loss": 0.4629, "step": 18995 }, { "epoch": 0.25, "learning_rate": 4.242872101911344e-05, "loss": 1.0945, "step": 19000 }, { "epoch": 0.25, "learning_rate": 4.2424948457251233e-05, "loss": 0.4301, "step": 19005 }, { "epoch": 0.25, "learning_rate": 4.242117512355098e-05, "loss": 0.8349, "step": 19010 }, { "epoch": 0.25, "learning_rate": 4.2417401018179835e-05, "loss": 0.0931, "step": 19015 }, { "epoch": 0.25, "learning_rate": 4.241362614130496e-05, "loss": 1.1967, "step": 19020 }, { "epoch": 0.25, "learning_rate": 4.240985049309356e-05, "loss": 1.0761, "step": 19025 }, { "epoch": 0.25, "learning_rate": 4.2406074073712876e-05, "loss": 0.5494, "step": 19030 }, { "epoch": 0.26, "learning_rate": 4.240229688333021e-05, "loss": 0.6987, "step": 19035 }, { "epoch": 0.26, "learning_rate": 4.2398518922112836e-05, "loss": 0.7908, "step": 19040 }, { "epoch": 0.26, "learning_rate": 4.2394740190228115e-05, "loss": 0.4836, "step": 19045 }, { "epoch": 0.26, "learning_rate": 4.239096068784344e-05, "loss": 0.5518, "step": 19050 }, { "epoch": 0.26, "learning_rate": 4.238718041512619e-05, "loss": 0.7591, "step": 19055 }, { "epoch": 0.26, "learning_rate": 4.238339937224385e-05, "loss": 0.4287, "step": 19060 }, { "epoch": 0.26, "learning_rate": 4.2379617559363885e-05, "loss": 1.1934, "step": 19065 }, { "epoch": 0.26, "learning_rate": 4.23758349766538e-05, "loss": 0.78, "step": 19070 }, { "epoch": 0.26, "learning_rate": 4.2372051624281164e-05, "loss": 0.8953, "step": 19075 }, { "epoch": 0.26, "learning_rate": 4.2368267502413536e-05, "loss": 0.9789, "step": 19080 }, { "epoch": 0.26, "learning_rate": 4.2364482611218556e-05, "loss": 0.7889, "step": 19085 }, { "epoch": 0.26, "learning_rate": 4.236069695086388e-05, "loss": 0.9881, "step": 19090 }, { "epoch": 0.26, "learning_rate": 4.235691052151717e-05, "loss": 0.8542, "step": 19095 }, { "epoch": 0.26, "learning_rate": 4.2353123323346156e-05, "loss": 0.5153, "step": 19100 }, { "epoch": 0.26, "learning_rate": 4.23493353565186e-05, "loss": 0.604, "step": 19105 }, { "epoch": 0.26, "learning_rate": 4.2345546621202283e-05, "loss": 0.5554, "step": 19110 }, { "epoch": 0.26, "learning_rate": 4.2341757117565026e-05, "loss": 1.0698, "step": 19115 }, { "epoch": 0.26, "learning_rate": 4.233796684577468e-05, "loss": 0.9957, "step": 19120 }, { "epoch": 0.26, "learning_rate": 4.233417580599915e-05, "loss": 0.2804, "step": 19125 }, { "epoch": 0.26, "learning_rate": 4.233038399840635e-05, "loss": 0.7219, "step": 19130 }, { "epoch": 0.26, "learning_rate": 4.232659142316424e-05, "loss": 0.705, "step": 19135 }, { "epoch": 0.26, "learning_rate": 4.232279808044081e-05, "loss": 1.2885, "step": 19140 }, { "epoch": 0.26, "learning_rate": 4.231900397040409e-05, "loss": 0.949, "step": 19145 }, { "epoch": 0.26, "learning_rate": 4.2315209093222145e-05, "loss": 0.6361, "step": 19150 }, { "epoch": 0.26, "learning_rate": 4.2311413449063053e-05, "loss": 0.5225, "step": 19155 }, { "epoch": 0.26, "learning_rate": 4.230761703809496e-05, "loss": 0.2326, "step": 19160 }, { "epoch": 0.26, "learning_rate": 4.230381986048601e-05, "loss": 0.9506, "step": 19165 }, { "epoch": 0.26, "learning_rate": 4.230002191640441e-05, "loss": 0.7788, "step": 19170 }, { "epoch": 0.26, "learning_rate": 4.2296223206018396e-05, "loss": 1.2332, "step": 19175 }, { "epoch": 0.26, "learning_rate": 4.2292423729496214e-05, "loss": 1.1326, "step": 19180 }, { "epoch": 0.26, "learning_rate": 4.2288623487006184e-05, "loss": 0.5077, "step": 19185 }, { "epoch": 0.26, "learning_rate": 4.228482247871662e-05, "loss": 0.8116, "step": 19190 }, { "epoch": 0.26, "learning_rate": 4.2281020704795894e-05, "loss": 0.6726, "step": 19195 }, { "epoch": 0.26, "learning_rate": 4.22772181654124e-05, "loss": 0.3158, "step": 19200 }, { "epoch": 0.26, "learning_rate": 4.2273414860734585e-05, "loss": 0.5959, "step": 19205 }, { "epoch": 0.26, "learning_rate": 4.2269610790930906e-05, "loss": 0.5094, "step": 19210 }, { "epoch": 0.26, "learning_rate": 4.2265805956169854e-05, "loss": 0.5731, "step": 19215 }, { "epoch": 0.26, "learning_rate": 4.226200035661998e-05, "loss": 0.8674, "step": 19220 }, { "epoch": 0.26, "learning_rate": 4.2258193992449865e-05, "loss": 0.6422, "step": 19225 }, { "epoch": 0.26, "learning_rate": 4.225438686382809e-05, "loss": 0.6416, "step": 19230 }, { "epoch": 0.26, "learning_rate": 4.225057897092329e-05, "loss": 0.5477, "step": 19235 }, { "epoch": 0.26, "learning_rate": 4.224677031390415e-05, "loss": 0.7737, "step": 19240 }, { "epoch": 0.26, "learning_rate": 4.224296089293937e-05, "loss": 0.3011, "step": 19245 }, { "epoch": 0.26, "learning_rate": 4.223915070819767e-05, "loss": 0.4468, "step": 19250 }, { "epoch": 0.26, "learning_rate": 4.223533975984785e-05, "loss": 0.6065, "step": 19255 }, { "epoch": 0.26, "learning_rate": 4.223152804805871e-05, "loss": 1.2158, "step": 19260 }, { "epoch": 0.26, "learning_rate": 4.222771557299907e-05, "loss": 0.7538, "step": 19265 }, { "epoch": 0.26, "learning_rate": 4.222390233483783e-05, "loss": 1.5002, "step": 19270 }, { "epoch": 0.26, "learning_rate": 4.2220088333743876e-05, "loss": 0.6033, "step": 19275 }, { "epoch": 0.26, "learning_rate": 4.221627356988617e-05, "loss": 0.818, "step": 19280 }, { "epoch": 0.26, "learning_rate": 4.221245804343367e-05, "loss": 0.7626, "step": 19285 }, { "epoch": 0.26, "learning_rate": 4.220864175455539e-05, "loss": 0.4788, "step": 19290 }, { "epoch": 0.26, "learning_rate": 4.220482470342037e-05, "loss": 0.5058, "step": 19295 }, { "epoch": 0.26, "learning_rate": 4.220100689019769e-05, "loss": 0.8164, "step": 19300 }, { "epoch": 0.26, "learning_rate": 4.2197188315056456e-05, "loss": 0.8423, "step": 19305 }, { "epoch": 0.26, "learning_rate": 4.219336897816581e-05, "loss": 0.4184, "step": 19310 }, { "epoch": 0.26, "learning_rate": 4.218954887969495e-05, "loss": 0.2382, "step": 19315 }, { "epoch": 0.26, "learning_rate": 4.218572801981306e-05, "loss": 0.9956, "step": 19320 }, { "epoch": 0.26, "learning_rate": 4.2181906398689396e-05, "loss": 0.8584, "step": 19325 }, { "epoch": 0.26, "learning_rate": 4.2178084016493234e-05, "loss": 0.979, "step": 19330 }, { "epoch": 0.26, "learning_rate": 4.21742608733939e-05, "loss": 0.9888, "step": 19335 }, { "epoch": 0.26, "learning_rate": 4.2170436969560726e-05, "loss": 1.0631, "step": 19340 }, { "epoch": 0.26, "learning_rate": 4.216661230516309e-05, "loss": 1.0433, "step": 19345 }, { "epoch": 0.26, "learning_rate": 4.216278688037042e-05, "loss": 0.8179, "step": 19350 }, { "epoch": 0.26, "learning_rate": 4.2158960695352146e-05, "loss": 0.6118, "step": 19355 }, { "epoch": 0.26, "learning_rate": 4.215513375027775e-05, "loss": 0.5644, "step": 19360 }, { "epoch": 0.26, "learning_rate": 4.215130604531677e-05, "loss": 1.5479, "step": 19365 }, { "epoch": 0.26, "learning_rate": 4.214747758063873e-05, "loss": 1.1391, "step": 19370 }, { "epoch": 0.26, "learning_rate": 4.2143648356413215e-05, "loss": 1.054, "step": 19375 }, { "epoch": 0.26, "learning_rate": 4.2139818372809844e-05, "loss": 0.3271, "step": 19380 }, { "epoch": 0.26, "learning_rate": 4.2135987629998273e-05, "loss": 0.3832, "step": 19385 }, { "epoch": 0.26, "learning_rate": 4.213215612814818e-05, "loss": 1.2266, "step": 19390 }, { "epoch": 0.26, "learning_rate": 4.2128323867429274e-05, "loss": 0.7176, "step": 19395 }, { "epoch": 0.26, "learning_rate": 4.212449084801132e-05, "loss": 0.7963, "step": 19400 }, { "epoch": 0.26, "learning_rate": 4.2120657070064086e-05, "loss": 1.5484, "step": 19405 }, { "epoch": 0.26, "learning_rate": 4.2116822533757395e-05, "loss": 1.2203, "step": 19410 }, { "epoch": 0.26, "learning_rate": 4.21129872392611e-05, "loss": 1.0104, "step": 19415 }, { "epoch": 0.26, "learning_rate": 4.210991845788171e-05, "loss": 0.9467, "step": 19420 }, { "epoch": 0.26, "learning_rate": 4.210608179907225e-05, "loss": 1.2062, "step": 19425 }, { "epoch": 0.26, "learning_rate": 4.210224438254895e-05, "loss": 0.611, "step": 19430 }, { "epoch": 0.26, "learning_rate": 4.209840620848179e-05, "loss": 0.2206, "step": 19435 }, { "epoch": 0.26, "learning_rate": 4.209456727704077e-05, "loss": 0.8861, "step": 19440 }, { "epoch": 0.26, "learning_rate": 4.209072758839594e-05, "loss": 0.5298, "step": 19445 }, { "epoch": 0.26, "learning_rate": 4.2086887142717384e-05, "loss": 0.3733, "step": 19450 }, { "epoch": 0.26, "learning_rate": 4.208304594017521e-05, "loss": 0.4574, "step": 19455 }, { "epoch": 0.26, "learning_rate": 4.207920398093956e-05, "loss": 0.6719, "step": 19460 }, { "epoch": 0.26, "learning_rate": 4.2075361265180625e-05, "loss": 0.7156, "step": 19465 }, { "epoch": 0.26, "learning_rate": 4.2071517793068605e-05, "loss": 0.7062, "step": 19470 }, { "epoch": 0.26, "learning_rate": 4.2067673564773756e-05, "loss": 1.158, "step": 19475 }, { "epoch": 0.26, "learning_rate": 4.206382858046636e-05, "loss": 0.2354, "step": 19480 }, { "epoch": 0.26, "learning_rate": 4.205998284031671e-05, "loss": 0.953, "step": 19485 }, { "epoch": 0.26, "learning_rate": 4.205613634449518e-05, "loss": 0.809, "step": 19490 }, { "epoch": 0.26, "learning_rate": 4.205228909317214e-05, "loss": 0.478, "step": 19495 }, { "epoch": 0.26, "learning_rate": 4.2048441086518e-05, "loss": 0.4081, "step": 19500 }, { "epoch": 0.26, "learning_rate": 4.2044592324703215e-05, "loss": 0.6818, "step": 19505 }, { "epoch": 0.26, "learning_rate": 4.204074280789826e-05, "loss": 1.0993, "step": 19510 }, { "epoch": 0.26, "learning_rate": 4.2036892536273644e-05, "loss": 0.8806, "step": 19515 }, { "epoch": 0.26, "learning_rate": 4.203304150999993e-05, "loss": 0.5775, "step": 19520 }, { "epoch": 0.26, "learning_rate": 4.202918972924769e-05, "loss": 0.2503, "step": 19525 }, { "epoch": 0.26, "learning_rate": 4.202533719418753e-05, "loss": 0.9831, "step": 19530 }, { "epoch": 0.26, "learning_rate": 4.202148390499011e-05, "loss": 0.272, "step": 19535 }, { "epoch": 0.26, "learning_rate": 4.2017629861826115e-05, "loss": 0.8105, "step": 19540 }, { "epoch": 0.26, "learning_rate": 4.201377506486624e-05, "loss": 0.441, "step": 19545 }, { "epoch": 0.26, "learning_rate": 4.200991951428127e-05, "loss": 1.3764, "step": 19550 }, { "epoch": 0.26, "learning_rate": 4.200606321024195e-05, "loss": 0.695, "step": 19555 }, { "epoch": 0.26, "learning_rate": 4.200220615291911e-05, "loss": 0.4461, "step": 19560 }, { "epoch": 0.26, "learning_rate": 4.1998348342483595e-05, "loss": 0.9564, "step": 19565 }, { "epoch": 0.26, "learning_rate": 4.199448977910629e-05, "loss": 0.765, "step": 19570 }, { "epoch": 0.26, "learning_rate": 4.199063046295811e-05, "loss": 0.943, "step": 19575 }, { "epoch": 0.26, "learning_rate": 4.198677039421e-05, "loss": 1.1662, "step": 19580 }, { "epoch": 0.26, "learning_rate": 4.1982909573032946e-05, "loss": 1.1854, "step": 19585 }, { "epoch": 0.26, "learning_rate": 4.1979047999597955e-05, "loss": 0.6693, "step": 19590 }, { "epoch": 0.26, "learning_rate": 4.197518567407609e-05, "loss": 0.7134, "step": 19595 }, { "epoch": 0.26, "learning_rate": 4.197132259663841e-05, "loss": 0.834, "step": 19600 }, { "epoch": 0.26, "learning_rate": 4.196745876745606e-05, "loss": 0.3296, "step": 19605 }, { "epoch": 0.26, "learning_rate": 4.196359418670016e-05, "loss": 0.1742, "step": 19610 }, { "epoch": 0.26, "learning_rate": 4.1959728854541915e-05, "loss": 0.5732, "step": 19615 }, { "epoch": 0.26, "learning_rate": 4.195586277115252e-05, "loss": 0.7262, "step": 19620 }, { "epoch": 0.26, "learning_rate": 4.195199593670323e-05, "loss": 1.2381, "step": 19625 }, { "epoch": 0.26, "learning_rate": 4.1948128351365335e-05, "loss": 0.8095, "step": 19630 }, { "epoch": 0.26, "learning_rate": 4.194426001531014e-05, "loss": 0.9091, "step": 19635 }, { "epoch": 0.26, "learning_rate": 4.1940390928708995e-05, "loss": 1.407, "step": 19640 }, { "epoch": 0.26, "learning_rate": 4.193652109173328e-05, "loss": 0.8103, "step": 19645 }, { "epoch": 0.26, "learning_rate": 4.1932650504554415e-05, "loss": 0.4757, "step": 19650 }, { "epoch": 0.26, "learning_rate": 4.192877916734385e-05, "loss": 0.4639, "step": 19655 }, { "epoch": 0.26, "learning_rate": 4.192490708027304e-05, "loss": 0.8762, "step": 19660 }, { "epoch": 0.26, "learning_rate": 4.1921034243513536e-05, "loss": 0.6656, "step": 19665 }, { "epoch": 0.26, "learning_rate": 4.191716065723686e-05, "loss": 0.4865, "step": 19670 }, { "epoch": 0.26, "learning_rate": 4.1913286321614614e-05, "loss": 0.2536, "step": 19675 }, { "epoch": 0.26, "learning_rate": 4.190941123681838e-05, "loss": 0.8254, "step": 19680 }, { "epoch": 0.26, "learning_rate": 4.190553540301984e-05, "loss": 1.2534, "step": 19685 }, { "epoch": 0.26, "learning_rate": 4.1901658820390655e-05, "loss": 0.3575, "step": 19690 }, { "epoch": 0.26, "learning_rate": 4.1897781489102525e-05, "loss": 0.8149, "step": 19695 }, { "epoch": 0.26, "learning_rate": 4.1893903409327225e-05, "loss": 0.6631, "step": 19700 }, { "epoch": 0.26, "learning_rate": 4.189002458123652e-05, "loss": 1.4508, "step": 19705 }, { "epoch": 0.26, "learning_rate": 4.1886145005002226e-05, "loss": 0.3563, "step": 19710 }, { "epoch": 0.26, "learning_rate": 4.1882264680796184e-05, "loss": 0.7305, "step": 19715 }, { "epoch": 0.26, "learning_rate": 4.187838360879027e-05, "loss": 0.4373, "step": 19720 }, { "epoch": 0.26, "learning_rate": 4.1874501789156416e-05, "loss": 1.2118, "step": 19725 }, { "epoch": 0.26, "learning_rate": 4.187061922206655e-05, "loss": 0.8281, "step": 19730 }, { "epoch": 0.26, "learning_rate": 4.186673590769264e-05, "loss": 0.5604, "step": 19735 }, { "epoch": 0.26, "learning_rate": 4.1862851846206725e-05, "loss": 0.5046, "step": 19740 }, { "epoch": 0.26, "learning_rate": 4.185896703778083e-05, "loss": 0.567, "step": 19745 }, { "epoch": 0.26, "learning_rate": 4.185508148258703e-05, "loss": 0.7693, "step": 19750 }, { "epoch": 0.26, "learning_rate": 4.1851195180797465e-05, "loss": 0.6202, "step": 19755 }, { "epoch": 0.26, "learning_rate": 4.184730813258424e-05, "loss": 0.6146, "step": 19760 }, { "epoch": 0.26, "learning_rate": 4.1843420338119555e-05, "loss": 0.5952, "step": 19765 }, { "epoch": 0.26, "learning_rate": 4.183953179757562e-05, "loss": 0.9218, "step": 19770 }, { "epoch": 0.26, "learning_rate": 4.1835642511124656e-05, "loss": 0.9157, "step": 19775 }, { "epoch": 0.27, "learning_rate": 4.183175247893896e-05, "loss": 0.8689, "step": 19780 }, { "epoch": 0.27, "learning_rate": 4.182786170119085e-05, "loss": 0.4252, "step": 19785 }, { "epoch": 0.27, "learning_rate": 4.182397017805264e-05, "loss": 0.3602, "step": 19790 }, { "epoch": 0.27, "learning_rate": 4.182007790969672e-05, "loss": 1.0693, "step": 19795 }, { "epoch": 0.27, "learning_rate": 4.181618489629549e-05, "loss": 0.8727, "step": 19800 }, { "epoch": 0.27, "learning_rate": 4.181229113802141e-05, "loss": 0.5072, "step": 19805 }, { "epoch": 0.27, "learning_rate": 4.180839663504694e-05, "loss": 0.2412, "step": 19810 }, { "epoch": 0.27, "learning_rate": 4.180450138754459e-05, "loss": 0.8084, "step": 19815 }, { "epoch": 0.27, "learning_rate": 4.1800605395686896e-05, "loss": 0.5599, "step": 19820 }, { "epoch": 0.27, "learning_rate": 4.179670865964643e-05, "loss": 0.9471, "step": 19825 }, { "epoch": 0.27, "learning_rate": 4.17928111795958e-05, "loss": 0.3286, "step": 19830 }, { "epoch": 0.27, "learning_rate": 4.178891295570766e-05, "loss": 0.9903, "step": 19835 }, { "epoch": 0.27, "learning_rate": 4.1785013988154656e-05, "loss": 0.6238, "step": 19840 }, { "epoch": 0.27, "learning_rate": 4.178111427710951e-05, "loss": 0.4965, "step": 19845 }, { "epoch": 0.27, "learning_rate": 4.1777213822744954e-05, "loss": 0.3951, "step": 19850 }, { "epoch": 0.27, "learning_rate": 4.177331262523376e-05, "loss": 1.022, "step": 19855 }, { "epoch": 0.27, "learning_rate": 4.1769410684748734e-05, "loss": 1.0618, "step": 19860 }, { "epoch": 0.27, "learning_rate": 4.1765508001462704e-05, "loss": 0.9394, "step": 19865 }, { "epoch": 0.27, "learning_rate": 4.176160457554855e-05, "loss": 1.2078, "step": 19870 }, { "epoch": 0.27, "learning_rate": 4.1757700407179155e-05, "loss": 0.5624, "step": 19875 }, { "epoch": 0.27, "learning_rate": 4.175379549652749e-05, "loss": 0.6883, "step": 19880 }, { "epoch": 0.27, "learning_rate": 4.1749889843766485e-05, "loss": 0.8004, "step": 19885 }, { "epoch": 0.27, "learning_rate": 4.174598344906916e-05, "loss": 0.492, "step": 19890 }, { "epoch": 0.27, "learning_rate": 4.174207631260855e-05, "loss": 0.1238, "step": 19895 }, { "epoch": 0.27, "learning_rate": 4.173816843455771e-05, "loss": 1.2187, "step": 19900 }, { "epoch": 0.27, "learning_rate": 4.1734259815089755e-05, "loss": 1.6869, "step": 19905 }, { "epoch": 0.27, "learning_rate": 4.173035045437781e-05, "loss": 0.5554, "step": 19910 }, { "epoch": 0.27, "learning_rate": 4.172644035259503e-05, "loss": 0.5359, "step": 19915 }, { "epoch": 0.27, "learning_rate": 4.172252950991463e-05, "loss": 0.4747, "step": 19920 }, { "epoch": 0.27, "learning_rate": 4.171861792650983e-05, "loss": 0.834, "step": 19925 }, { "epoch": 0.27, "learning_rate": 4.171470560255389e-05, "loss": 0.4444, "step": 19930 }, { "epoch": 0.27, "learning_rate": 4.171079253822012e-05, "loss": 0.7813, "step": 19935 }, { "epoch": 0.27, "learning_rate": 4.1706878733681845e-05, "loss": 0.6353, "step": 19940 }, { "epoch": 0.27, "learning_rate": 4.170296418911242e-05, "loss": 0.5658, "step": 19945 }, { "epoch": 0.27, "learning_rate": 4.169904890468525e-05, "loss": 0.8125, "step": 19950 }, { "epoch": 0.27, "learning_rate": 4.169513288057374e-05, "loss": 0.4032, "step": 19955 }, { "epoch": 0.27, "learning_rate": 4.169121611695138e-05, "loss": 0.97, "step": 19960 }, { "epoch": 0.27, "learning_rate": 4.168729861399164e-05, "loss": 1.2625, "step": 19965 }, { "epoch": 0.27, "learning_rate": 4.1683380371868064e-05, "loss": 0.6207, "step": 19970 }, { "epoch": 0.27, "learning_rate": 4.16794613907542e-05, "loss": 0.2654, "step": 19975 }, { "epoch": 0.27, "learning_rate": 4.167554167082365e-05, "loss": 0.6433, "step": 19980 }, { "epoch": 0.27, "learning_rate": 4.167162121225001e-05, "loss": 0.3757, "step": 19985 }, { "epoch": 0.27, "learning_rate": 4.1667700015206966e-05, "loss": 1.0294, "step": 19990 }, { "epoch": 0.27, "learning_rate": 4.16637780798682e-05, "loss": 1.1439, "step": 19995 }, { "epoch": 0.27, "learning_rate": 4.1659855406407425e-05, "loss": 0.7575, "step": 20000 }, { "epoch": 0.27, "learning_rate": 4.165593199499841e-05, "loss": 0.7503, "step": 20005 }, { "epoch": 0.27, "learning_rate": 4.165200784581493e-05, "loss": 0.5921, "step": 20010 }, { "epoch": 0.27, "learning_rate": 4.164808295903081e-05, "loss": 1.1687, "step": 20015 }, { "epoch": 0.27, "learning_rate": 4.16441573348199e-05, "loss": 0.5808, "step": 20020 }, { "epoch": 0.27, "learning_rate": 4.1640230973356084e-05, "loss": 0.9014, "step": 20025 }, { "epoch": 0.27, "learning_rate": 4.16363038748133e-05, "loss": 0.7926, "step": 20030 }, { "epoch": 0.27, "learning_rate": 4.1632376039365476e-05, "loss": 0.9864, "step": 20035 }, { "epoch": 0.27, "learning_rate": 4.162844746718659e-05, "loss": 0.2423, "step": 20040 }, { "epoch": 0.27, "learning_rate": 4.162451815845069e-05, "loss": 0.4583, "step": 20045 }, { "epoch": 0.27, "learning_rate": 4.1620588113331795e-05, "loss": 0.479, "step": 20050 }, { "epoch": 0.27, "learning_rate": 4.1616657332003996e-05, "loss": 0.6811, "step": 20055 }, { "epoch": 0.27, "learning_rate": 4.161272581464141e-05, "loss": 0.852, "step": 20060 }, { "epoch": 0.27, "learning_rate": 4.160879356141818e-05, "loss": 0.5519, "step": 20065 }, { "epoch": 0.27, "learning_rate": 4.160486057250849e-05, "loss": 0.843, "step": 20070 }, { "epoch": 0.27, "learning_rate": 4.160092684808654e-05, "loss": 0.2829, "step": 20075 }, { "epoch": 0.27, "learning_rate": 4.159699238832659e-05, "loss": 1.555, "step": 20080 }, { "epoch": 0.27, "learning_rate": 4.1593057193402906e-05, "loss": 0.4936, "step": 20085 }, { "epoch": 0.27, "learning_rate": 4.158912126348981e-05, "loss": 0.778, "step": 20090 }, { "epoch": 0.27, "learning_rate": 4.158518459876162e-05, "loss": 0.9395, "step": 20095 }, { "epoch": 0.27, "learning_rate": 4.158124719939274e-05, "loss": 0.846, "step": 20100 }, { "epoch": 0.27, "learning_rate": 4.157730906555755e-05, "loss": 1.1097, "step": 20105 }, { "epoch": 0.27, "learning_rate": 4.157337019743051e-05, "loss": 0.3419, "step": 20110 }, { "epoch": 0.27, "learning_rate": 4.1569430595186075e-05, "loss": 0.5743, "step": 20115 }, { "epoch": 0.27, "learning_rate": 4.156549025899876e-05, "loss": 0.7229, "step": 20120 }, { "epoch": 0.27, "learning_rate": 4.1561549189043116e-05, "loss": 1.0813, "step": 20125 }, { "epoch": 0.27, "learning_rate": 4.155760738549369e-05, "loss": 0.7565, "step": 20130 }, { "epoch": 0.27, "learning_rate": 4.1553664848525084e-05, "loss": 0.8755, "step": 20135 }, { "epoch": 0.27, "learning_rate": 4.154972157831195e-05, "loss": 0.6024, "step": 20140 }, { "epoch": 0.27, "learning_rate": 4.1545777575028945e-05, "loss": 0.186, "step": 20145 }, { "epoch": 0.27, "learning_rate": 4.154183283885076e-05, "loss": 0.7825, "step": 20150 }, { "epoch": 0.27, "learning_rate": 4.153788736995214e-05, "loss": 0.5114, "step": 20155 }, { "epoch": 0.27, "learning_rate": 4.153394116850786e-05, "loss": 0.9017, "step": 20160 }, { "epoch": 0.27, "learning_rate": 4.1529994234692685e-05, "loss": 0.3643, "step": 20165 }, { "epoch": 0.27, "learning_rate": 4.1526046568681476e-05, "loss": 0.5316, "step": 20170 }, { "epoch": 0.27, "learning_rate": 4.152209817064907e-05, "loss": 0.7246, "step": 20175 }, { "epoch": 0.27, "learning_rate": 4.151814904077038e-05, "loss": 1.487, "step": 20180 }, { "epoch": 0.27, "learning_rate": 4.151419917922032e-05, "loss": 1.2959, "step": 20185 }, { "epoch": 0.27, "learning_rate": 4.151024858617385e-05, "loss": 0.6696, "step": 20190 }, { "epoch": 0.27, "learning_rate": 4.150629726180598e-05, "loss": 0.8379, "step": 20195 }, { "epoch": 0.27, "learning_rate": 4.150234520629171e-05, "loss": 0.9612, "step": 20200 }, { "epoch": 0.27, "learning_rate": 4.149839241980611e-05, "loss": 1.1374, "step": 20205 }, { "epoch": 0.27, "learning_rate": 4.149443890252426e-05, "loss": 0.7092, "step": 20210 }, { "epoch": 0.27, "learning_rate": 4.149048465462128e-05, "loss": 0.9865, "step": 20215 }, { "epoch": 0.27, "learning_rate": 4.148652967627235e-05, "loss": 0.6659, "step": 20220 }, { "epoch": 0.27, "learning_rate": 4.148257396765262e-05, "loss": 0.516, "step": 20225 }, { "epoch": 0.27, "learning_rate": 4.1478617528937326e-05, "loss": 0.9571, "step": 20230 }, { "epoch": 0.27, "learning_rate": 4.147466036030171e-05, "loss": 0.8166, "step": 20235 }, { "epoch": 0.27, "learning_rate": 4.147070246192107e-05, "loss": 0.597, "step": 20240 }, { "epoch": 0.27, "learning_rate": 4.14667438339707e-05, "loss": 0.3444, "step": 20245 }, { "epoch": 0.27, "learning_rate": 4.146278447662597e-05, "loss": 0.5193, "step": 20250 }, { "epoch": 0.27, "learning_rate": 4.1458824390062246e-05, "loss": 0.5131, "step": 20255 }, { "epoch": 0.27, "learning_rate": 4.145486357445493e-05, "loss": 0.9646, "step": 20260 }, { "epoch": 0.27, "learning_rate": 4.1450902029979497e-05, "loss": 1.1023, "step": 20265 }, { "epoch": 0.27, "learning_rate": 4.14469397568114e-05, "loss": 1.4001, "step": 20270 }, { "epoch": 0.27, "learning_rate": 4.144297675512614e-05, "loss": 1.0197, "step": 20275 }, { "epoch": 0.27, "learning_rate": 4.143901302509929e-05, "loss": 0.4603, "step": 20280 }, { "epoch": 0.27, "learning_rate": 4.143504856690639e-05, "loss": 0.6951, "step": 20285 }, { "epoch": 0.27, "learning_rate": 4.1431083380723065e-05, "loss": 1.0495, "step": 20290 }, { "epoch": 0.27, "learning_rate": 4.1427117466724954e-05, "loss": 0.5706, "step": 20295 }, { "epoch": 0.27, "learning_rate": 4.1423150825087716e-05, "loss": 0.8855, "step": 20300 }, { "epoch": 0.27, "learning_rate": 4.141918345598706e-05, "loss": 0.7466, "step": 20305 }, { "epoch": 0.27, "learning_rate": 4.141521535959873e-05, "loss": 0.5163, "step": 20310 }, { "epoch": 0.27, "learning_rate": 4.1411246536098455e-05, "loss": 0.6364, "step": 20315 }, { "epoch": 0.27, "learning_rate": 4.1407276985662086e-05, "loss": 1.6519, "step": 20320 }, { "epoch": 0.27, "learning_rate": 4.1403306708465425e-05, "loss": 0.4959, "step": 20325 }, { "epoch": 0.27, "learning_rate": 4.1399335704684335e-05, "loss": 0.7384, "step": 20330 }, { "epoch": 0.27, "learning_rate": 4.1395363974494715e-05, "loss": 0.753, "step": 20335 }, { "epoch": 0.27, "learning_rate": 4.1391391518072496e-05, "loss": 1.0961, "step": 20340 }, { "epoch": 0.27, "learning_rate": 4.138741833559364e-05, "loss": 0.6568, "step": 20345 }, { "epoch": 0.27, "learning_rate": 4.1383444427234136e-05, "loss": 0.5273, "step": 20350 }, { "epoch": 0.27, "learning_rate": 4.137946979317e-05, "loss": 1.4852, "step": 20355 }, { "epoch": 0.27, "learning_rate": 4.137549443357731e-05, "loss": 0.5835, "step": 20360 }, { "epoch": 0.27, "learning_rate": 4.137151834863213e-05, "loss": 0.4334, "step": 20365 }, { "epoch": 0.27, "learning_rate": 4.136754153851059e-05, "loss": 0.6915, "step": 20370 }, { "epoch": 0.27, "learning_rate": 4.1363564003388857e-05, "loss": 0.9843, "step": 20375 }, { "epoch": 0.27, "learning_rate": 4.135958574344308e-05, "loss": 0.2397, "step": 20380 }, { "epoch": 0.27, "learning_rate": 4.135560675884952e-05, "loss": 0.7401, "step": 20385 }, { "epoch": 0.27, "learning_rate": 4.1351627049784395e-05, "loss": 1.0392, "step": 20390 }, { "epoch": 0.27, "learning_rate": 4.1347646616423995e-05, "loss": 1.0514, "step": 20395 }, { "epoch": 0.27, "learning_rate": 4.134366545894465e-05, "loss": 0.5038, "step": 20400 }, { "epoch": 0.27, "learning_rate": 4.133968357752267e-05, "loss": 0.5505, "step": 20405 }, { "epoch": 0.27, "learning_rate": 4.1335700972334455e-05, "loss": 0.9105, "step": 20410 }, { "epoch": 0.27, "learning_rate": 4.1331717643556425e-05, "loss": 0.322, "step": 20415 }, { "epoch": 0.27, "learning_rate": 4.1327733591365e-05, "loss": 1.2261, "step": 20420 }, { "epoch": 0.27, "learning_rate": 4.1323748815936664e-05, "loss": 0.7845, "step": 20425 }, { "epoch": 0.27, "learning_rate": 4.131976331744792e-05, "loss": 0.3483, "step": 20430 }, { "epoch": 0.27, "learning_rate": 4.13157770960753e-05, "loss": 0.2605, "step": 20435 }, { "epoch": 0.27, "learning_rate": 4.1311790151995386e-05, "loss": 0.8255, "step": 20440 }, { "epoch": 0.27, "learning_rate": 4.130780248538478e-05, "loss": 0.3779, "step": 20445 }, { "epoch": 0.27, "learning_rate": 4.13038140964201e-05, "loss": 1.2754, "step": 20450 }, { "epoch": 0.27, "learning_rate": 4.129982498527802e-05, "loss": 0.6292, "step": 20455 }, { "epoch": 0.27, "learning_rate": 4.129583515213525e-05, "loss": 0.4177, "step": 20460 }, { "epoch": 0.27, "learning_rate": 4.12918445971685e-05, "loss": 0.77, "step": 20465 }, { "epoch": 0.27, "learning_rate": 4.1287853320554536e-05, "loss": 0.4551, "step": 20470 }, { "epoch": 0.27, "learning_rate": 4.1283861322470166e-05, "loss": 0.2144, "step": 20475 }, { "epoch": 0.27, "learning_rate": 4.127986860309219e-05, "loss": 1.0236, "step": 20480 }, { "epoch": 0.27, "learning_rate": 4.1275875162597495e-05, "loss": 1.2017, "step": 20485 }, { "epoch": 0.27, "learning_rate": 4.127188100116295e-05, "loss": 0.9935, "step": 20490 }, { "epoch": 0.27, "learning_rate": 4.126788611896548e-05, "loss": 0.7543, "step": 20495 }, { "epoch": 0.27, "learning_rate": 4.126389051618205e-05, "loss": 0.7702, "step": 20500 }, { "epoch": 0.27, "learning_rate": 4.1259894192989625e-05, "loss": 0.6041, "step": 20505 }, { "epoch": 0.27, "learning_rate": 4.125589714956524e-05, "loss": 0.719, "step": 20510 }, { "epoch": 0.27, "learning_rate": 4.1251899386085926e-05, "loss": 0.3887, "step": 20515 }, { "epoch": 0.27, "learning_rate": 4.124790090272879e-05, "loss": 0.991, "step": 20520 }, { "epoch": 0.28, "learning_rate": 4.1243901699670915e-05, "loss": 0.8095, "step": 20525 }, { "epoch": 0.28, "learning_rate": 4.1239901777089473e-05, "loss": 0.9865, "step": 20530 }, { "epoch": 0.28, "learning_rate": 4.123590113516162e-05, "loss": 0.7833, "step": 20535 }, { "epoch": 0.28, "learning_rate": 4.1231899774064574e-05, "loss": 0.3803, "step": 20540 }, { "epoch": 0.28, "learning_rate": 4.122789769397558e-05, "loss": 0.2496, "step": 20545 }, { "epoch": 0.28, "learning_rate": 4.12238948950719e-05, "loss": 0.8946, "step": 20550 }, { "epoch": 0.28, "learning_rate": 4.121989137753084e-05, "loss": 0.1046, "step": 20555 }, { "epoch": 0.28, "learning_rate": 4.121588714152973e-05, "loss": 1.0393, "step": 20560 }, { "epoch": 0.28, "learning_rate": 4.121188218724595e-05, "loss": 1.2554, "step": 20565 }, { "epoch": 0.28, "learning_rate": 4.1207876514856905e-05, "loss": 0.953, "step": 20570 }, { "epoch": 0.28, "learning_rate": 4.1203870124540005e-05, "loss": 0.9678, "step": 20575 }, { "epoch": 0.28, "learning_rate": 4.119986301647273e-05, "loss": 0.5449, "step": 20580 }, { "epoch": 0.28, "learning_rate": 4.1195855190832566e-05, "loss": 0.6506, "step": 20585 }, { "epoch": 0.28, "learning_rate": 4.1191846647797036e-05, "loss": 0.8751, "step": 20590 }, { "epoch": 0.28, "learning_rate": 4.118783738754372e-05, "loss": 0.3897, "step": 20595 }, { "epoch": 0.28, "learning_rate": 4.118382741025019e-05, "loss": 0.5927, "step": 20600 }, { "epoch": 0.28, "learning_rate": 4.117981671609405e-05, "loss": 0.5458, "step": 20605 }, { "epoch": 0.28, "learning_rate": 4.1175805305252995e-05, "loss": 1.4906, "step": 20610 }, { "epoch": 0.28, "learning_rate": 4.117179317790468e-05, "loss": 1.0008, "step": 20615 }, { "epoch": 0.28, "learning_rate": 4.116778033422685e-05, "loss": 0.6083, "step": 20620 }, { "epoch": 0.28, "learning_rate": 4.1163766774397217e-05, "loss": 0.795, "step": 20625 }, { "epoch": 0.28, "learning_rate": 4.1159752498593585e-05, "loss": 0.5984, "step": 20630 }, { "epoch": 0.28, "learning_rate": 4.1155737506993764e-05, "loss": 0.8027, "step": 20635 }, { "epoch": 0.28, "learning_rate": 4.11517217997756e-05, "loss": 0.9183, "step": 20640 }, { "epoch": 0.28, "learning_rate": 4.114770537711695e-05, "loss": 0.3347, "step": 20645 }, { "epoch": 0.28, "learning_rate": 4.114368823919575e-05, "loss": 0.7326, "step": 20650 }, { "epoch": 0.28, "learning_rate": 4.113967038618993e-05, "loss": 0.3998, "step": 20655 }, { "epoch": 0.28, "learning_rate": 4.1135651818277445e-05, "loss": 0.6544, "step": 20660 }, { "epoch": 0.28, "learning_rate": 4.113163253563631e-05, "loss": 0.7179, "step": 20665 }, { "epoch": 0.28, "learning_rate": 4.112761253844456e-05, "loss": 0.4696, "step": 20670 }, { "epoch": 0.28, "learning_rate": 4.112359182688026e-05, "loss": 0.7733, "step": 20675 }, { "epoch": 0.28, "learning_rate": 4.11195704011215e-05, "loss": 0.6885, "step": 20680 }, { "epoch": 0.28, "learning_rate": 4.111554826134641e-05, "loss": 0.4521, "step": 20685 }, { "epoch": 0.28, "learning_rate": 4.1111525407733176e-05, "loss": 0.3516, "step": 20690 }, { "epoch": 0.28, "learning_rate": 4.110750184045995e-05, "loss": 0.617, "step": 20695 }, { "epoch": 0.28, "learning_rate": 4.110428247292597e-05, "loss": 0.5476, "step": 20700 }, { "epoch": 0.28, "learning_rate": 4.110025762151394e-05, "loss": 1.1937, "step": 20705 }, { "epoch": 0.28, "learning_rate": 4.1096232056941053e-05, "loss": 1.1015, "step": 20710 }, { "epoch": 0.28, "learning_rate": 4.1092205779385616e-05, "loss": 1.0593, "step": 20715 }, { "epoch": 0.28, "learning_rate": 4.1088178789025967e-05, "loss": 0.6828, "step": 20720 }, { "epoch": 0.28, "learning_rate": 4.1084151086040477e-05, "loss": 0.2803, "step": 20725 }, { "epoch": 0.28, "learning_rate": 4.1080122670607565e-05, "loss": 0.4392, "step": 20730 }, { "epoch": 0.28, "learning_rate": 4.107609354290567e-05, "loss": 1.0222, "step": 20735 }, { "epoch": 0.28, "learning_rate": 4.1072063703113255e-05, "loss": 0.3278, "step": 20740 }, { "epoch": 0.28, "learning_rate": 4.106803315140882e-05, "loss": 0.7894, "step": 20745 }, { "epoch": 0.28, "learning_rate": 4.1064001887970905e-05, "loss": 0.4302, "step": 20750 }, { "epoch": 0.28, "learning_rate": 4.105996991297807e-05, "loss": 0.8167, "step": 20755 }, { "epoch": 0.28, "learning_rate": 4.105593722660892e-05, "loss": 0.8834, "step": 20760 }, { "epoch": 0.28, "learning_rate": 4.105190382904207e-05, "loss": 0.5599, "step": 20765 }, { "epoch": 0.28, "learning_rate": 4.104786972045619e-05, "loss": 0.31, "step": 20770 }, { "epoch": 0.28, "learning_rate": 4.104383490102996e-05, "loss": 0.4624, "step": 20775 }, { "epoch": 0.28, "learning_rate": 4.103979937094211e-05, "loss": 1.1878, "step": 20780 }, { "epoch": 0.28, "learning_rate": 4.10357631303714e-05, "loss": 1.2796, "step": 20785 }, { "epoch": 0.28, "learning_rate": 4.10317261794966e-05, "loss": 1.078, "step": 20790 }, { "epoch": 0.28, "learning_rate": 4.1027688518496535e-05, "loss": 1.1738, "step": 20795 }, { "epoch": 0.28, "learning_rate": 4.102365014755005e-05, "loss": 1.6886, "step": 20800 }, { "epoch": 0.28, "learning_rate": 4.1019611066836035e-05, "loss": 0.9421, "step": 20805 }, { "epoch": 0.28, "learning_rate": 4.1015571276533396e-05, "loss": 0.5958, "step": 20810 }, { "epoch": 0.28, "learning_rate": 4.101153077682106e-05, "loss": 1.0673, "step": 20815 }, { "epoch": 0.28, "learning_rate": 4.100748956787802e-05, "loss": 1.4847, "step": 20820 }, { "epoch": 0.28, "learning_rate": 4.1003447649883274e-05, "loss": 0.5074, "step": 20825 }, { "epoch": 0.28, "learning_rate": 4.0999405023015857e-05, "loss": 0.5327, "step": 20830 }, { "epoch": 0.28, "learning_rate": 4.0995361687454844e-05, "loss": 0.5336, "step": 20835 }, { "epoch": 0.28, "learning_rate": 4.099131764337933e-05, "loss": 1.0735, "step": 20840 }, { "epoch": 0.28, "learning_rate": 4.0987272890968455e-05, "loss": 0.526, "step": 20845 }, { "epoch": 0.28, "learning_rate": 4.098322743040136e-05, "loss": 0.6411, "step": 20850 }, { "epoch": 0.28, "learning_rate": 4.097918126185726e-05, "loss": 0.6167, "step": 20855 }, { "epoch": 0.28, "learning_rate": 4.097513438551537e-05, "loss": 0.7149, "step": 20860 }, { "epoch": 0.28, "learning_rate": 4.097108680155494e-05, "loss": 0.8221, "step": 20865 }, { "epoch": 0.28, "learning_rate": 4.096703851015527e-05, "loss": 0.4826, "step": 20870 }, { "epoch": 0.28, "learning_rate": 4.0962989511495676e-05, "loss": 1.3608, "step": 20875 }, { "epoch": 0.28, "learning_rate": 4.095893980575551e-05, "loss": 0.1253, "step": 20880 }, { "epoch": 0.28, "learning_rate": 4.0954889393114143e-05, "loss": 1.8665, "step": 20885 }, { "epoch": 0.28, "learning_rate": 4.0950838273751004e-05, "loss": 1.4047, "step": 20890 }, { "epoch": 0.28, "learning_rate": 4.094678644784552e-05, "loss": 0.6072, "step": 20895 }, { "epoch": 0.28, "learning_rate": 4.094273391557718e-05, "loss": 1.0253, "step": 20900 }, { "epoch": 0.28, "learning_rate": 4.09386806771255e-05, "loss": 1.0778, "step": 20905 }, { "epoch": 0.28, "learning_rate": 4.093462673266998e-05, "loss": 0.9608, "step": 20910 }, { "epoch": 0.28, "learning_rate": 4.093057208239023e-05, "loss": 0.3532, "step": 20915 }, { "epoch": 0.28, "learning_rate": 4.0926516726465836e-05, "loss": 1.2641, "step": 20920 }, { "epoch": 0.28, "learning_rate": 4.092246066507642e-05, "loss": 1.2772, "step": 20925 }, { "epoch": 0.28, "learning_rate": 4.091840389840166e-05, "loss": 1.0556, "step": 20930 }, { "epoch": 0.28, "learning_rate": 4.0914346426621244e-05, "loss": 0.5213, "step": 20935 }, { "epoch": 0.28, "learning_rate": 4.091028824991488e-05, "loss": 0.5805, "step": 20940 }, { "epoch": 0.28, "learning_rate": 4.0906229368462365e-05, "loss": 1.085, "step": 20945 }, { "epoch": 0.28, "learning_rate": 4.0902169782443464e-05, "loss": 0.9699, "step": 20950 }, { "epoch": 0.28, "learning_rate": 4.0898109492037995e-05, "loss": 0.5032, "step": 20955 }, { "epoch": 0.28, "learning_rate": 4.0894048497425814e-05, "loss": 0.5649, "step": 20960 }, { "epoch": 0.28, "learning_rate": 4.0889986798786796e-05, "loss": 0.4614, "step": 20965 }, { "epoch": 0.28, "learning_rate": 4.088592439630086e-05, "loss": 1.0119, "step": 20970 }, { "epoch": 0.28, "learning_rate": 4.0881861290147943e-05, "loss": 0.4387, "step": 20975 }, { "epoch": 0.28, "learning_rate": 4.087779748050803e-05, "loss": 0.4526, "step": 20980 }, { "epoch": 0.28, "learning_rate": 4.0873732967561116e-05, "loss": 0.9752, "step": 20985 }, { "epoch": 0.28, "learning_rate": 4.0869667751487254e-05, "loss": 1.0436, "step": 20990 }, { "epoch": 0.28, "learning_rate": 4.0865601832466494e-05, "loss": 0.5092, "step": 20995 }, { "epoch": 0.28, "learning_rate": 4.086153521067896e-05, "loss": 0.5872, "step": 21000 }, { "epoch": 0.28, "learning_rate": 4.085746788630476e-05, "loss": 0.3203, "step": 21005 }, { "epoch": 0.28, "learning_rate": 4.085339985952407e-05, "loss": 0.4527, "step": 21010 }, { "epoch": 0.28, "learning_rate": 4.084933113051707e-05, "loss": 0.7394, "step": 21015 }, { "epoch": 0.28, "learning_rate": 4.0845261699464e-05, "loss": 0.5765, "step": 21020 }, { "epoch": 0.28, "learning_rate": 4.08411915665451e-05, "loss": 0.5461, "step": 21025 }, { "epoch": 0.28, "learning_rate": 4.083712073194067e-05, "loss": 1.3199, "step": 21030 }, { "epoch": 0.28, "learning_rate": 4.083304919583102e-05, "loss": 0.8582, "step": 21035 }, { "epoch": 0.28, "learning_rate": 4.082897695839651e-05, "loss": 0.8615, "step": 21040 }, { "epoch": 0.28, "learning_rate": 4.08249040198175e-05, "loss": 0.8796, "step": 21045 }, { "epoch": 0.28, "learning_rate": 4.0820830380274414e-05, "loss": 0.963, "step": 21050 }, { "epoch": 0.28, "learning_rate": 4.08167560399477e-05, "loss": 1.1994, "step": 21055 }, { "epoch": 0.28, "learning_rate": 4.0812680999017805e-05, "loss": 0.5702, "step": 21060 }, { "epoch": 0.28, "learning_rate": 4.080860525766527e-05, "loss": 0.6692, "step": 21065 }, { "epoch": 0.28, "learning_rate": 4.0804528816070595e-05, "loss": 0.6453, "step": 21070 }, { "epoch": 0.28, "learning_rate": 4.0800451674414364e-05, "loss": 0.4708, "step": 21075 }, { "epoch": 0.28, "learning_rate": 4.079637383287718e-05, "loss": 0.2351, "step": 21080 }, { "epoch": 0.28, "learning_rate": 4.079229529163965e-05, "loss": 0.4116, "step": 21085 }, { "epoch": 0.28, "learning_rate": 4.078821605088244e-05, "loss": 0.9698, "step": 21090 }, { "epoch": 0.28, "learning_rate": 4.0784136110786265e-05, "loss": 1.328, "step": 21095 }, { "epoch": 0.28, "learning_rate": 4.078005547153181e-05, "loss": 0.9003, "step": 21100 }, { "epoch": 0.28, "learning_rate": 4.077597413329985e-05, "loss": 0.8001, "step": 21105 }, { "epoch": 0.28, "learning_rate": 4.0771892096271156e-05, "loss": 0.3958, "step": 21110 }, { "epoch": 0.28, "learning_rate": 4.076780936062655e-05, "loss": 0.5997, "step": 21115 }, { "epoch": 0.28, "learning_rate": 4.076372592654688e-05, "loss": 0.8712, "step": 21120 }, { "epoch": 0.28, "learning_rate": 4.0759641794213e-05, "loss": 0.5388, "step": 21125 }, { "epoch": 0.28, "learning_rate": 4.0755556963805844e-05, "loss": 0.3528, "step": 21130 }, { "epoch": 0.28, "learning_rate": 4.0751471435506325e-05, "loss": 0.6828, "step": 21135 }, { "epoch": 0.28, "learning_rate": 4.0747385209495434e-05, "loss": 1.0102, "step": 21140 }, { "epoch": 0.28, "learning_rate": 4.074329828595416e-05, "loss": 0.7189, "step": 21145 }, { "epoch": 0.28, "learning_rate": 4.073921066506353e-05, "loss": 0.5082, "step": 21150 }, { "epoch": 0.28, "learning_rate": 4.073512234700461e-05, "loss": 1.0705, "step": 21155 }, { "epoch": 0.28, "learning_rate": 4.073103333195848e-05, "loss": 0.3786, "step": 21160 }, { "epoch": 0.28, "learning_rate": 4.0726943620106284e-05, "loss": 0.7188, "step": 21165 }, { "epoch": 0.28, "learning_rate": 4.072285321162916e-05, "loss": 0.7166, "step": 21170 }, { "epoch": 0.28, "learning_rate": 4.07187621067083e-05, "loss": 0.146, "step": 21175 }, { "epoch": 0.28, "learning_rate": 4.071467030552492e-05, "loss": 0.2259, "step": 21180 }, { "epoch": 0.28, "learning_rate": 4.0710577808260265e-05, "loss": 0.5746, "step": 21185 }, { "epoch": 0.28, "learning_rate": 4.0706484615095604e-05, "loss": 0.4891, "step": 21190 }, { "epoch": 0.28, "learning_rate": 4.070239072621226e-05, "loss": 1.3258, "step": 21195 }, { "epoch": 0.28, "learning_rate": 4.0698296141791545e-05, "loss": 0.6446, "step": 21200 }, { "epoch": 0.28, "learning_rate": 4.069420086201487e-05, "loss": 1.2107, "step": 21205 }, { "epoch": 0.28, "learning_rate": 4.06901048870636e-05, "loss": 1.0811, "step": 21210 }, { "epoch": 0.28, "learning_rate": 4.0686008217119174e-05, "loss": 0.8944, "step": 21215 }, { "epoch": 0.28, "learning_rate": 4.068191085236307e-05, "loss": 0.8935, "step": 21220 }, { "epoch": 0.28, "learning_rate": 4.0677812792976766e-05, "loss": 1.1864, "step": 21225 }, { "epoch": 0.28, "learning_rate": 4.067371403914179e-05, "loss": 0.4467, "step": 21230 }, { "epoch": 0.28, "learning_rate": 4.066961459103969e-05, "loss": 0.8847, "step": 21235 }, { "epoch": 0.28, "learning_rate": 4.066551444885206e-05, "loss": 0.7177, "step": 21240 }, { "epoch": 0.28, "learning_rate": 4.066141361276051e-05, "loss": 1.0495, "step": 21245 }, { "epoch": 0.28, "learning_rate": 4.065731208294669e-05, "loss": 0.3786, "step": 21250 }, { "epoch": 0.28, "learning_rate": 4.0653209859592274e-05, "loss": 1.0393, "step": 21255 }, { "epoch": 0.28, "learning_rate": 4.0649106942878974e-05, "loss": 0.9964, "step": 21260 }, { "epoch": 0.28, "learning_rate": 4.064500333298853e-05, "loss": 0.4425, "step": 21265 }, { "epoch": 0.28, "learning_rate": 4.06408990301027e-05, "loss": 1.1593, "step": 21270 }, { "epoch": 0.29, "learning_rate": 4.0636794034403294e-05, "loss": 1.0041, "step": 21275 }, { "epoch": 0.29, "learning_rate": 4.063268834607214e-05, "loss": 0.6444, "step": 21280 }, { "epoch": 0.29, "learning_rate": 4.06285819652911e-05, "loss": 0.8062, "step": 21285 }, { "epoch": 0.29, "learning_rate": 4.062447489224207e-05, "loss": 0.4539, "step": 21290 }, { "epoch": 0.29, "learning_rate": 4.0620367127106975e-05, "loss": 0.6481, "step": 21295 }, { "epoch": 0.29, "learning_rate": 4.061625867006775e-05, "loss": 1.2297, "step": 21300 }, { "epoch": 0.29, "learning_rate": 4.06121495213064e-05, "loss": 0.8961, "step": 21305 }, { "epoch": 0.29, "learning_rate": 4.060803968100492e-05, "loss": 0.4411, "step": 21310 }, { "epoch": 0.29, "learning_rate": 4.060392914934538e-05, "loss": 1.8296, "step": 21315 }, { "epoch": 0.29, "learning_rate": 4.0599817926509836e-05, "loss": 0.8948, "step": 21320 }, { "epoch": 0.29, "learning_rate": 4.05957060126804e-05, "loss": 1.3188, "step": 21325 }, { "epoch": 0.29, "learning_rate": 4.059159340803922e-05, "loss": 1.2612, "step": 21330 }, { "epoch": 0.29, "learning_rate": 4.0587480112768447e-05, "loss": 0.7933, "step": 21335 }, { "epoch": 0.29, "learning_rate": 4.058336612705028e-05, "loss": 0.7644, "step": 21340 }, { "epoch": 0.29, "learning_rate": 4.057925145106697e-05, "loss": 0.3653, "step": 21345 }, { "epoch": 0.29, "learning_rate": 4.057513608500075e-05, "loss": 0.7089, "step": 21350 }, { "epoch": 0.29, "learning_rate": 4.057102002903392e-05, "loss": 0.7181, "step": 21355 }, { "epoch": 0.29, "learning_rate": 4.056690328334881e-05, "loss": 0.4829, "step": 21360 }, { "epoch": 0.29, "learning_rate": 4.056278584812776e-05, "loss": 1.1643, "step": 21365 }, { "epoch": 0.29, "learning_rate": 4.055866772355315e-05, "loss": 0.4314, "step": 21370 }, { "epoch": 0.29, "learning_rate": 4.055454890980741e-05, "loss": 1.0225, "step": 21375 }, { "epoch": 0.29, "learning_rate": 4.055042940707296e-05, "loss": 0.1406, "step": 21380 }, { "epoch": 0.29, "learning_rate": 4.054630921553228e-05, "loss": 0.4497, "step": 21385 }, { "epoch": 0.29, "learning_rate": 4.054218833536789e-05, "loss": 0.2159, "step": 21390 }, { "epoch": 0.29, "learning_rate": 4.053806676676231e-05, "loss": 0.4503, "step": 21395 }, { "epoch": 0.29, "learning_rate": 4.05339445098981e-05, "loss": 0.657, "step": 21400 }, { "epoch": 0.29, "learning_rate": 4.052982156495786e-05, "loss": 0.846, "step": 21405 }, { "epoch": 0.29, "learning_rate": 4.0525697932124226e-05, "loss": 1.1251, "step": 21410 }, { "epoch": 0.29, "learning_rate": 4.0521573611579846e-05, "loss": 1.1924, "step": 21415 }, { "epoch": 0.29, "learning_rate": 4.05174486035074e-05, "loss": 0.9431, "step": 21420 }, { "epoch": 0.29, "learning_rate": 4.0513322908089614e-05, "loss": 0.2047, "step": 21425 }, { "epoch": 0.29, "learning_rate": 4.050919652550924e-05, "loss": 0.8371, "step": 21430 }, { "epoch": 0.29, "learning_rate": 4.050506945594904e-05, "loss": 0.5119, "step": 21435 }, { "epoch": 0.29, "learning_rate": 4.050094169959184e-05, "loss": 0.7513, "step": 21440 }, { "epoch": 0.29, "learning_rate": 4.049681325662047e-05, "loss": 0.7512, "step": 21445 }, { "epoch": 0.29, "learning_rate": 4.04926841272178e-05, "loss": 0.6708, "step": 21450 }, { "epoch": 0.29, "learning_rate": 4.0488554311566736e-05, "loss": 0.8151, "step": 21455 }, { "epoch": 0.29, "learning_rate": 4.048442380985019e-05, "loss": 1.1085, "step": 21460 }, { "epoch": 0.29, "learning_rate": 4.048029262225115e-05, "loss": 0.9362, "step": 21465 }, { "epoch": 0.29, "learning_rate": 4.0476160748952584e-05, "loss": 0.6961, "step": 21470 }, { "epoch": 0.29, "learning_rate": 4.047202819013752e-05, "loss": 0.9229, "step": 21475 }, { "epoch": 0.29, "learning_rate": 4.046789494598902e-05, "loss": 0.5353, "step": 21480 }, { "epoch": 0.29, "learning_rate": 4.046376101669015e-05, "loss": 1.0881, "step": 21485 }, { "epoch": 0.29, "learning_rate": 4.045962640242403e-05, "loss": 0.6544, "step": 21490 }, { "epoch": 0.29, "learning_rate": 4.045549110337381e-05, "loss": 0.6928, "step": 21495 }, { "epoch": 0.29, "learning_rate": 4.0451355119722646e-05, "loss": 0.4382, "step": 21500 }, { "epoch": 0.29, "learning_rate": 4.044721845165375e-05, "loss": 1.1284, "step": 21505 }, { "epoch": 0.29, "learning_rate": 4.0443081099350365e-05, "loss": 0.6674, "step": 21510 }, { "epoch": 0.29, "learning_rate": 4.043894306299574e-05, "loss": 1.0816, "step": 21515 }, { "epoch": 0.29, "learning_rate": 4.043480434277318e-05, "loss": 1.0221, "step": 21520 }, { "epoch": 0.29, "learning_rate": 4.0430664938866003e-05, "loss": 0.7431, "step": 21525 }, { "epoch": 0.29, "learning_rate": 4.042652485145757e-05, "loss": 0.5741, "step": 21530 }, { "epoch": 0.29, "learning_rate": 4.042238408073126e-05, "loss": 0.6068, "step": 21535 }, { "epoch": 0.29, "learning_rate": 4.04182426268705e-05, "loss": 0.5956, "step": 21540 }, { "epoch": 0.29, "learning_rate": 4.041410049005871e-05, "loss": 0.2545, "step": 21545 }, { "epoch": 0.29, "learning_rate": 4.0409957670479395e-05, "loss": 0.4006, "step": 21550 }, { "epoch": 0.29, "learning_rate": 4.040581416831604e-05, "loss": 0.6665, "step": 21555 }, { "epoch": 0.29, "learning_rate": 4.0401669983752195e-05, "loss": 0.7716, "step": 21560 }, { "epoch": 0.29, "learning_rate": 4.0397525116971424e-05, "loss": 1.4558, "step": 21565 }, { "epoch": 0.29, "learning_rate": 4.039337956815731e-05, "loss": 0.9787, "step": 21570 }, { "epoch": 0.29, "learning_rate": 4.03892333374935e-05, "loss": 1.1303, "step": 21575 }, { "epoch": 0.29, "learning_rate": 4.038508642516366e-05, "loss": 0.6742, "step": 21580 }, { "epoch": 0.29, "learning_rate": 4.0380938831351436e-05, "loss": 0.7049, "step": 21585 }, { "epoch": 0.29, "learning_rate": 4.0376790556240575e-05, "loss": 0.9314, "step": 21590 }, { "epoch": 0.29, "learning_rate": 4.037264160001483e-05, "loss": 0.7844, "step": 21595 }, { "epoch": 0.29, "learning_rate": 4.0368491962857954e-05, "loss": 0.2905, "step": 21600 }, { "epoch": 0.29, "learning_rate": 4.0364341644953784e-05, "loss": 1.0449, "step": 21605 }, { "epoch": 0.29, "learning_rate": 4.036019064648614e-05, "loss": 0.2528, "step": 21610 }, { "epoch": 0.29, "learning_rate": 4.0356038967638894e-05, "loss": 0.9752, "step": 21615 }, { "epoch": 0.29, "learning_rate": 4.035188660859595e-05, "loss": 1.0618, "step": 21620 }, { "epoch": 0.29, "learning_rate": 4.0347733569541224e-05, "loss": 0.7407, "step": 21625 }, { "epoch": 0.29, "learning_rate": 4.034357985065869e-05, "loss": 1.0345, "step": 21630 }, { "epoch": 0.29, "learning_rate": 4.033942545213232e-05, "loss": 1.1567, "step": 21635 }, { "epoch": 0.29, "learning_rate": 4.033527037414615e-05, "loss": 1.1227, "step": 21640 }, { "epoch": 0.29, "learning_rate": 4.0331114616884225e-05, "loss": 1.0773, "step": 21645 }, { "epoch": 0.29, "learning_rate": 4.032695818053062e-05, "loss": 0.7789, "step": 21650 }, { "epoch": 0.29, "learning_rate": 4.032280106526945e-05, "loss": 0.7218, "step": 21655 }, { "epoch": 0.29, "learning_rate": 4.031864327128485e-05, "loss": 0.5885, "step": 21660 }, { "epoch": 0.29, "learning_rate": 4.031448479876098e-05, "loss": 0.4771, "step": 21665 }, { "epoch": 0.29, "learning_rate": 4.031032564788205e-05, "loss": 0.2811, "step": 21670 }, { "epoch": 0.29, "learning_rate": 4.0306165818832294e-05, "loss": 0.3743, "step": 21675 }, { "epoch": 0.29, "learning_rate": 4.030200531179597e-05, "loss": 0.1943, "step": 21680 }, { "epoch": 0.29, "learning_rate": 4.029784412695736e-05, "loss": 0.6793, "step": 21685 }, { "epoch": 0.29, "learning_rate": 4.0293682264500784e-05, "loss": 1.4318, "step": 21690 }, { "epoch": 0.29, "learning_rate": 4.0289519724610604e-05, "loss": 0.9931, "step": 21695 }, { "epoch": 0.29, "learning_rate": 4.028535650747119e-05, "loss": 0.2591, "step": 21700 }, { "epoch": 0.29, "learning_rate": 4.028119261326695e-05, "loss": 0.9784, "step": 21705 }, { "epoch": 0.29, "learning_rate": 4.027702804218233e-05, "loss": 1.672, "step": 21710 }, { "epoch": 0.29, "learning_rate": 4.02728627944018e-05, "loss": 0.4849, "step": 21715 }, { "epoch": 0.29, "learning_rate": 4.0268696870109843e-05, "loss": 0.4278, "step": 21720 }, { "epoch": 0.29, "learning_rate": 4.026453026949101e-05, "loss": 0.4859, "step": 21725 }, { "epoch": 0.29, "learning_rate": 4.026036299272985e-05, "loss": 0.5917, "step": 21730 }, { "epoch": 0.29, "learning_rate": 4.0256195040010945e-05, "loss": 0.5303, "step": 21735 }, { "epoch": 0.29, "learning_rate": 4.025202641151894e-05, "loss": 0.3759, "step": 21740 }, { "epoch": 0.29, "learning_rate": 4.0247857107438466e-05, "loss": 0.5542, "step": 21745 }, { "epoch": 0.29, "learning_rate": 4.02436871279542e-05, "loss": 0.917, "step": 21750 }, { "epoch": 0.29, "learning_rate": 4.023951647325086e-05, "loss": 0.3804, "step": 21755 }, { "epoch": 0.29, "learning_rate": 4.023534514351317e-05, "loss": 0.4097, "step": 21760 }, { "epoch": 0.29, "learning_rate": 4.023117313892592e-05, "loss": 0.7227, "step": 21765 }, { "epoch": 0.29, "learning_rate": 4.0227000459673904e-05, "loss": 0.714, "step": 21770 }, { "epoch": 0.29, "learning_rate": 4.022282710594193e-05, "loss": 1.0733, "step": 21775 }, { "epoch": 0.29, "learning_rate": 4.021865307791489e-05, "loss": 0.7489, "step": 21780 }, { "epoch": 0.29, "learning_rate": 4.021447837577764e-05, "loss": 0.846, "step": 21785 }, { "epoch": 0.29, "learning_rate": 4.0210302999715124e-05, "loss": 0.886, "step": 21790 }, { "epoch": 0.29, "learning_rate": 4.0206126949912274e-05, "loss": 1.0981, "step": 21795 }, { "epoch": 0.29, "learning_rate": 4.020195022655408e-05, "loss": 0.744, "step": 21800 }, { "epoch": 0.29, "learning_rate": 4.019777282982554e-05, "loss": 0.3824, "step": 21805 }, { "epoch": 0.29, "learning_rate": 4.01935947599117e-05, "loss": 0.8872, "step": 21810 }, { "epoch": 0.29, "learning_rate": 4.0189416016997616e-05, "loss": 1.0278, "step": 21815 }, { "epoch": 0.29, "learning_rate": 4.018523660126839e-05, "loss": 0.5564, "step": 21820 }, { "epoch": 0.29, "learning_rate": 4.0181056512909167e-05, "loss": 0.3068, "step": 21825 }, { "epoch": 0.29, "learning_rate": 4.017687575210508e-05, "loss": 1.2407, "step": 21830 }, { "epoch": 0.29, "learning_rate": 4.017269431904132e-05, "loss": 0.8122, "step": 21835 }, { "epoch": 0.29, "learning_rate": 4.0168512213903114e-05, "loss": 0.6063, "step": 21840 }, { "epoch": 0.29, "learning_rate": 4.0164329436875705e-05, "loss": 0.8949, "step": 21845 }, { "epoch": 0.29, "learning_rate": 4.016014598814436e-05, "loss": 1.0302, "step": 21850 }, { "epoch": 0.29, "learning_rate": 4.01559618678944e-05, "loss": 0.3605, "step": 21855 }, { "epoch": 0.29, "learning_rate": 4.0151777076311144e-05, "loss": 0.652, "step": 21860 }, { "epoch": 0.29, "learning_rate": 4.014759161357997e-05, "loss": 1.0497, "step": 21865 }, { "epoch": 0.29, "learning_rate": 4.0143405479886265e-05, "loss": 0.9595, "step": 21870 }, { "epoch": 0.29, "learning_rate": 4.013921867541546e-05, "loss": 0.3731, "step": 21875 }, { "epoch": 0.29, "learning_rate": 4.0135031200353005e-05, "loss": 0.9256, "step": 21880 }, { "epoch": 0.29, "learning_rate": 4.013084305488439e-05, "loss": 0.7764, "step": 21885 }, { "epoch": 0.29, "learning_rate": 4.0126654239195115e-05, "loss": 0.6406, "step": 21890 }, { "epoch": 0.29, "learning_rate": 4.012246475347075e-05, "loss": 1.1587, "step": 21895 }, { "epoch": 0.29, "learning_rate": 4.0118274597896834e-05, "loss": 0.671, "step": 21900 }, { "epoch": 0.29, "learning_rate": 4.0114083772659e-05, "loss": 0.5117, "step": 21905 }, { "epoch": 0.29, "learning_rate": 4.010989227794286e-05, "loss": 1.046, "step": 21910 }, { "epoch": 0.29, "learning_rate": 4.0105700113934095e-05, "loss": 0.4859, "step": 21915 }, { "epoch": 0.29, "learning_rate": 4.010150728081838e-05, "loss": 0.6781, "step": 21920 }, { "epoch": 0.29, "learning_rate": 4.009731377878144e-05, "loss": 0.715, "step": 21925 }, { "epoch": 0.29, "learning_rate": 4.0093119608009034e-05, "loss": 0.5375, "step": 21930 }, { "epoch": 0.29, "learning_rate": 4.0088924768686934e-05, "loss": 0.4675, "step": 21935 }, { "epoch": 0.29, "learning_rate": 4.0084729261000957e-05, "loss": 0.9249, "step": 21940 }, { "epoch": 0.29, "learning_rate": 4.008053308513694e-05, "loss": 0.7757, "step": 21945 }, { "epoch": 0.29, "learning_rate": 4.007633624128076e-05, "loss": 0.8106, "step": 21950 }, { "epoch": 0.29, "learning_rate": 4.00721387296183e-05, "loss": 0.8872, "step": 21955 }, { "epoch": 0.29, "learning_rate": 4.006794055033549e-05, "loss": 0.5327, "step": 21960 }, { "epoch": 0.29, "learning_rate": 4.006374170361831e-05, "loss": 1.2999, "step": 21965 }, { "epoch": 0.29, "learning_rate": 4.005954218965273e-05, "loss": 0.6721, "step": 21970 }, { "epoch": 0.29, "learning_rate": 4.005534200862477e-05, "loss": 0.2676, "step": 21975 }, { "epoch": 0.29, "learning_rate": 4.0051141160720476e-05, "loss": 0.7062, "step": 21980 }, { "epoch": 0.29, "learning_rate": 4.004693964612594e-05, "loss": 0.263, "step": 21985 }, { "epoch": 0.29, "learning_rate": 4.0042737465027244e-05, "loss": 0.5731, "step": 21990 }, { "epoch": 0.29, "learning_rate": 4.0038534617610536e-05, "loss": 0.6074, "step": 21995 }, { "epoch": 0.29, "learning_rate": 4.003433110406197e-05, "loss": 1.0001, "step": 22000 }, { "epoch": 0.29, "learning_rate": 4.003012692456777e-05, "loss": 0.6938, "step": 22005 }, { "epoch": 0.29, "learning_rate": 4.002592207931413e-05, "loss": 0.9872, "step": 22010 }, { "epoch": 0.29, "learning_rate": 4.0021716568487315e-05, "loss": 0.7418, "step": 22015 }, { "epoch": 0.3, "learning_rate": 4.0017510392273604e-05, "loss": 0.6606, "step": 22020 }, { "epoch": 0.3, "learning_rate": 4.001330355085932e-05, "loss": 0.8532, "step": 22025 }, { "epoch": 0.3, "learning_rate": 4.000909604443079e-05, "loss": 0.6041, "step": 22030 }, { "epoch": 0.3, "learning_rate": 4.00048878731744e-05, "loss": 0.5085, "step": 22035 }, { "epoch": 0.3, "learning_rate": 4.0000679037276545e-05, "loss": 1.0331, "step": 22040 }, { "epoch": 0.3, "learning_rate": 3.999646953692365e-05, "loss": 1.2481, "step": 22045 }, { "epoch": 0.3, "learning_rate": 3.9992259372302186e-05, "loss": 1.0923, "step": 22050 }, { "epoch": 0.3, "learning_rate": 3.9988048543598636e-05, "loss": 1.5041, "step": 22055 }, { "epoch": 0.3, "learning_rate": 3.9983837050999504e-05, "loss": 0.8073, "step": 22060 }, { "epoch": 0.3, "learning_rate": 3.997962489469137e-05, "loss": 0.4985, "step": 22065 }, { "epoch": 0.3, "learning_rate": 3.997541207486079e-05, "loss": 0.2061, "step": 22070 }, { "epoch": 0.3, "learning_rate": 3.9971198591694366e-05, "loss": 0.2178, "step": 22075 }, { "epoch": 0.3, "learning_rate": 3.996698444537874e-05, "loss": 0.7986, "step": 22080 }, { "epoch": 0.3, "learning_rate": 3.996276963610059e-05, "loss": 0.3017, "step": 22085 }, { "epoch": 0.3, "learning_rate": 3.99585541640466e-05, "loss": 1.0275, "step": 22090 }, { "epoch": 0.3, "learning_rate": 3.995433802940349e-05, "loss": 0.1595, "step": 22095 }, { "epoch": 0.3, "learning_rate": 3.995012123235803e-05, "loss": 0.6246, "step": 22100 }, { "epoch": 0.3, "learning_rate": 3.9945903773096994e-05, "loss": 0.8941, "step": 22105 }, { "epoch": 0.3, "learning_rate": 3.9941685651807184e-05, "loss": 1.4313, "step": 22110 }, { "epoch": 0.3, "learning_rate": 3.993746686867545e-05, "loss": 0.6656, "step": 22115 }, { "epoch": 0.3, "learning_rate": 3.993324742388867e-05, "loss": 0.7044, "step": 22120 }, { "epoch": 0.3, "learning_rate": 3.9929027317633734e-05, "loss": 1.1123, "step": 22125 }, { "epoch": 0.3, "learning_rate": 3.992480655009757e-05, "loss": 0.6851, "step": 22130 }, { "epoch": 0.3, "learning_rate": 3.9920585121467145e-05, "loss": 1.1064, "step": 22135 }, { "epoch": 0.3, "learning_rate": 3.991636303192946e-05, "loss": 0.1724, "step": 22140 }, { "epoch": 0.3, "learning_rate": 3.991214028167149e-05, "loss": 0.9882, "step": 22145 }, { "epoch": 0.3, "learning_rate": 3.990791687088033e-05, "loss": 0.8487, "step": 22150 }, { "epoch": 0.3, "learning_rate": 3.990369279974303e-05, "loss": 0.4197, "step": 22155 }, { "epoch": 0.3, "learning_rate": 3.98994680684467e-05, "loss": 0.5099, "step": 22160 }, { "epoch": 0.3, "learning_rate": 3.9895242677178466e-05, "loss": 0.5551, "step": 22165 }, { "epoch": 0.3, "learning_rate": 3.989101662612551e-05, "loss": 0.1028, "step": 22170 }, { "epoch": 0.3, "learning_rate": 3.988678991547501e-05, "loss": 0.6365, "step": 22175 }, { "epoch": 0.3, "learning_rate": 3.988256254541419e-05, "loss": 0.818, "step": 22180 }, { "epoch": 0.3, "learning_rate": 3.987833451613031e-05, "loss": 0.5957, "step": 22185 }, { "epoch": 0.3, "learning_rate": 3.987410582781064e-05, "loss": 0.4597, "step": 22190 }, { "epoch": 0.3, "learning_rate": 3.98698764806425e-05, "loss": 0.6791, "step": 22195 }, { "epoch": 0.3, "learning_rate": 3.986564647481322e-05, "loss": 0.3104, "step": 22200 }, { "epoch": 0.3, "learning_rate": 3.986141581051017e-05, "loss": 0.7553, "step": 22205 }, { "epoch": 0.3, "learning_rate": 3.985718448792075e-05, "loss": 0.9636, "step": 22210 }, { "epoch": 0.3, "learning_rate": 3.985295250723239e-05, "loss": 0.2839, "step": 22215 }, { "epoch": 0.3, "learning_rate": 3.9848719868632534e-05, "loss": 0.59, "step": 22220 }, { "epoch": 0.3, "learning_rate": 3.984448657230868e-05, "loss": 0.8386, "step": 22225 }, { "epoch": 0.3, "learning_rate": 3.9840252618448334e-05, "loss": 1.0364, "step": 22230 }, { "epoch": 0.3, "learning_rate": 3.983601800723904e-05, "loss": 1.3607, "step": 22235 }, { "epoch": 0.3, "learning_rate": 3.9831782738868376e-05, "loss": 0.675, "step": 22240 }, { "epoch": 0.3, "learning_rate": 3.982754681352392e-05, "loss": 1.1474, "step": 22245 }, { "epoch": 0.3, "learning_rate": 3.982331023139334e-05, "loss": 0.586, "step": 22250 }, { "epoch": 0.3, "learning_rate": 3.981907299266427e-05, "loss": 0.6812, "step": 22255 }, { "epoch": 0.3, "learning_rate": 3.981483509752439e-05, "loss": 1.3801, "step": 22260 }, { "epoch": 0.3, "learning_rate": 3.981059654616145e-05, "loss": 0.8029, "step": 22265 }, { "epoch": 0.3, "learning_rate": 3.9806357338763165e-05, "loss": 0.6292, "step": 22270 }, { "epoch": 0.3, "learning_rate": 3.9802117475517333e-05, "loss": 0.4263, "step": 22275 }, { "epoch": 0.3, "learning_rate": 3.9797876956611745e-05, "loss": 0.745, "step": 22280 }, { "epoch": 0.3, "learning_rate": 3.979363578223424e-05, "loss": 0.4271, "step": 22285 }, { "epoch": 0.3, "learning_rate": 3.978939395257268e-05, "loss": 0.5103, "step": 22290 }, { "epoch": 0.3, "learning_rate": 3.9785151467814954e-05, "loss": 0.9572, "step": 22295 }, { "epoch": 0.3, "learning_rate": 3.978090832814899e-05, "loss": 0.9933, "step": 22300 }, { "epoch": 0.3, "learning_rate": 3.977666453376273e-05, "loss": 0.7518, "step": 22305 }, { "epoch": 0.3, "learning_rate": 3.977242008484417e-05, "loss": 0.3555, "step": 22310 }, { "epoch": 0.3, "learning_rate": 3.9768174981581284e-05, "loss": 1.3843, "step": 22315 }, { "epoch": 0.3, "learning_rate": 3.976392922416214e-05, "loss": 0.4011, "step": 22320 }, { "epoch": 0.3, "learning_rate": 3.975968281277479e-05, "loss": 0.2862, "step": 22325 }, { "epoch": 0.3, "learning_rate": 3.975543574760734e-05, "loss": 0.1036, "step": 22330 }, { "epoch": 0.3, "learning_rate": 3.9751188028847896e-05, "loss": 0.3543, "step": 22335 }, { "epoch": 0.3, "learning_rate": 3.9746939656684624e-05, "loss": 1.262, "step": 22340 }, { "epoch": 0.3, "learning_rate": 3.97426906313057e-05, "loss": 0.6031, "step": 22345 }, { "epoch": 0.3, "learning_rate": 3.9738440952899335e-05, "loss": 0.9469, "step": 22350 }, { "epoch": 0.3, "learning_rate": 3.9734190621653766e-05, "loss": 1.2565, "step": 22355 }, { "epoch": 0.3, "learning_rate": 3.9729939637757276e-05, "loss": 0.6685, "step": 22360 }, { "epoch": 0.3, "learning_rate": 3.9725688001398145e-05, "loss": 0.6323, "step": 22365 }, { "epoch": 0.3, "learning_rate": 3.972143571276471e-05, "loss": 0.5902, "step": 22370 }, { "epoch": 0.3, "learning_rate": 3.971718277204532e-05, "loss": 1.4259, "step": 22375 }, { "epoch": 0.3, "learning_rate": 3.971292917942836e-05, "loss": 1.0357, "step": 22380 }, { "epoch": 0.3, "learning_rate": 3.970867493510224e-05, "loss": 0.5136, "step": 22385 }, { "epoch": 0.3, "learning_rate": 3.970442003925541e-05, "loss": 0.3465, "step": 22390 }, { "epoch": 0.3, "learning_rate": 3.970016449207634e-05, "loss": 0.8861, "step": 22395 }, { "epoch": 0.3, "learning_rate": 3.969590829375352e-05, "loss": 0.7157, "step": 22400 }, { "epoch": 0.3, "learning_rate": 3.969165144447549e-05, "loss": 0.7834, "step": 22405 }, { "epoch": 0.3, "learning_rate": 3.9687393944430796e-05, "loss": 0.551, "step": 22410 }, { "epoch": 0.3, "learning_rate": 3.968313579380802e-05, "loss": 0.4506, "step": 22415 }, { "epoch": 0.3, "learning_rate": 3.96788769927958e-05, "loss": 0.4334, "step": 22420 }, { "epoch": 0.3, "learning_rate": 3.9674617541582764e-05, "loss": 0.9521, "step": 22425 }, { "epoch": 0.3, "learning_rate": 3.9670357440357584e-05, "loss": 0.4355, "step": 22430 }, { "epoch": 0.3, "learning_rate": 3.966609668930896e-05, "loss": 0.4039, "step": 22435 }, { "epoch": 0.3, "learning_rate": 3.9661835288625626e-05, "loss": 0.5199, "step": 22440 }, { "epoch": 0.3, "learning_rate": 3.965757323849634e-05, "loss": 0.7971, "step": 22445 }, { "epoch": 0.3, "learning_rate": 3.965331053910989e-05, "loss": 0.518, "step": 22450 }, { "epoch": 0.3, "learning_rate": 3.964904719065508e-05, "loss": 0.7205, "step": 22455 }, { "epoch": 0.3, "learning_rate": 3.9644783193320786e-05, "loss": 0.7089, "step": 22460 }, { "epoch": 0.3, "learning_rate": 3.9640518547295855e-05, "loss": 1.0885, "step": 22465 }, { "epoch": 0.3, "learning_rate": 3.963625325276919e-05, "loss": 0.8469, "step": 22470 }, { "epoch": 0.3, "learning_rate": 3.9631987309929735e-05, "loss": 0.4406, "step": 22475 }, { "epoch": 0.3, "learning_rate": 3.9627720718966446e-05, "loss": 1.1304, "step": 22480 }, { "epoch": 0.3, "learning_rate": 3.96234534800683e-05, "loss": 0.9597, "step": 22485 }, { "epoch": 0.3, "learning_rate": 3.961918559342433e-05, "loss": 0.7992, "step": 22490 }, { "epoch": 0.3, "learning_rate": 3.9614917059223574e-05, "loss": 0.9946, "step": 22495 }, { "epoch": 0.3, "learning_rate": 3.9610647877655104e-05, "loss": 0.4357, "step": 22500 }, { "epoch": 0.3, "learning_rate": 3.9606378048908035e-05, "loss": 1.3725, "step": 22505 }, { "epoch": 0.3, "learning_rate": 3.9602107573171485e-05, "loss": 0.72, "step": 22510 }, { "epoch": 0.3, "learning_rate": 3.959783645063463e-05, "loss": 1.1411, "step": 22515 }, { "epoch": 0.3, "learning_rate": 3.959356468148665e-05, "loss": 0.2, "step": 22520 }, { "epoch": 0.3, "learning_rate": 3.958929226591675e-05, "loss": 1.1359, "step": 22525 }, { "epoch": 0.3, "learning_rate": 3.958501920411422e-05, "loss": 1.0295, "step": 22530 }, { "epoch": 0.3, "learning_rate": 3.958074549626828e-05, "loss": 0.692, "step": 22535 }, { "epoch": 0.3, "learning_rate": 3.957647114256826e-05, "loss": 1.3146, "step": 22540 }, { "epoch": 0.3, "learning_rate": 3.9572196143203506e-05, "loss": 1.5299, "step": 22545 }, { "epoch": 0.3, "learning_rate": 3.956792049836335e-05, "loss": 0.1665, "step": 22550 }, { "epoch": 0.3, "learning_rate": 3.956364420823721e-05, "loss": 0.3838, "step": 22555 }, { "epoch": 0.3, "learning_rate": 3.955936727301449e-05, "loss": 0.7809, "step": 22560 }, { "epoch": 0.3, "learning_rate": 3.955508969288463e-05, "loss": 0.503, "step": 22565 }, { "epoch": 0.3, "learning_rate": 3.955081146803712e-05, "loss": 0.3653, "step": 22570 }, { "epoch": 0.3, "learning_rate": 3.954653259866146e-05, "loss": 0.9347, "step": 22575 }, { "epoch": 0.3, "learning_rate": 3.9542253084947166e-05, "loss": 0.7696, "step": 22580 }, { "epoch": 0.3, "learning_rate": 3.9537972927083825e-05, "loss": 1.2646, "step": 22585 }, { "epoch": 0.3, "learning_rate": 3.953369212526101e-05, "loss": 0.1685, "step": 22590 }, { "epoch": 0.3, "learning_rate": 3.9529410679668346e-05, "loss": 0.2128, "step": 22595 }, { "epoch": 0.3, "learning_rate": 3.952512859049548e-05, "loss": 0.3584, "step": 22600 }, { "epoch": 0.3, "learning_rate": 3.952084585793208e-05, "loss": 0.7732, "step": 22605 }, { "epoch": 0.3, "learning_rate": 3.951656248216785e-05, "loss": 0.6626, "step": 22610 }, { "epoch": 0.3, "learning_rate": 3.951227846339254e-05, "loss": 0.8291, "step": 22615 }, { "epoch": 0.3, "learning_rate": 3.950799380179588e-05, "loss": 0.6809, "step": 22620 }, { "epoch": 0.3, "learning_rate": 3.9503708497567686e-05, "loss": 0.2661, "step": 22625 }, { "epoch": 0.3, "learning_rate": 3.9499422550897764e-05, "loss": 0.9161, "step": 22630 }, { "epoch": 0.3, "learning_rate": 3.949513596197596e-05, "loss": 0.4863, "step": 22635 }, { "epoch": 0.3, "learning_rate": 3.949084873099215e-05, "loss": 1.1035, "step": 22640 }, { "epoch": 0.3, "learning_rate": 3.9486560858136234e-05, "loss": 0.6728, "step": 22645 }, { "epoch": 0.3, "learning_rate": 3.9482272343598146e-05, "loss": 0.8411, "step": 22650 }, { "epoch": 0.3, "learning_rate": 3.947798318756786e-05, "loss": 0.1972, "step": 22655 }, { "epoch": 0.3, "learning_rate": 3.947369339023533e-05, "loss": 0.6743, "step": 22660 }, { "epoch": 0.3, "learning_rate": 3.9469402951790605e-05, "loss": 1.1642, "step": 22665 }, { "epoch": 0.3, "learning_rate": 3.946511187242371e-05, "loss": 1.5916, "step": 22670 }, { "epoch": 0.3, "learning_rate": 3.946082015232473e-05, "loss": 0.7315, "step": 22675 }, { "epoch": 0.3, "learning_rate": 3.945652779168376e-05, "loss": 0.4939, "step": 22680 }, { "epoch": 0.3, "learning_rate": 3.945223479069093e-05, "loss": 0.4564, "step": 22685 }, { "epoch": 0.3, "learning_rate": 3.944794114953641e-05, "loss": 0.4943, "step": 22690 }, { "epoch": 0.3, "learning_rate": 3.9443646868410374e-05, "loss": 0.1228, "step": 22695 }, { "epoch": 0.3, "learning_rate": 3.9439351947503035e-05, "loss": 0.7159, "step": 22700 }, { "epoch": 0.3, "learning_rate": 3.943505638700465e-05, "loss": 0.9455, "step": 22705 }, { "epoch": 0.3, "learning_rate": 3.9430760187105484e-05, "loss": 1.2416, "step": 22710 }, { "epoch": 0.3, "learning_rate": 3.942646334799582e-05, "loss": 0.3849, "step": 22715 }, { "epoch": 0.3, "learning_rate": 3.942216586986602e-05, "loss": 0.895, "step": 22720 }, { "epoch": 0.3, "learning_rate": 3.941786775290642e-05, "loss": 0.1486, "step": 22725 }, { "epoch": 0.3, "learning_rate": 3.941356899730741e-05, "loss": 1.4329, "step": 22730 }, { "epoch": 0.3, "learning_rate": 3.9409269603259404e-05, "loss": 0.4382, "step": 22735 }, { "epoch": 0.3, "learning_rate": 3.940496957095284e-05, "loss": 0.8633, "step": 22740 }, { "epoch": 0.3, "learning_rate": 3.9400668900578185e-05, "loss": 0.8805, "step": 22745 }, { "epoch": 0.3, "learning_rate": 3.939636759232594e-05, "loss": 1.0227, "step": 22750 }, { "epoch": 0.3, "learning_rate": 3.939206564638665e-05, "loss": 1.4777, "step": 22755 }, { "epoch": 0.3, "learning_rate": 3.938776306295084e-05, "loss": 1.1568, "step": 22760 }, { "epoch": 0.31, "learning_rate": 3.938345984220911e-05, "loss": 0.3405, "step": 22765 }, { "epoch": 0.31, "learning_rate": 3.937915598435206e-05, "loss": 0.4206, "step": 22770 }, { "epoch": 0.31, "learning_rate": 3.937485148957034e-05, "loss": 1.4142, "step": 22775 }, { "epoch": 0.31, "learning_rate": 3.937054635805462e-05, "loss": 0.776, "step": 22780 }, { "epoch": 0.31, "learning_rate": 3.936624058999559e-05, "loss": 0.2718, "step": 22785 }, { "epoch": 0.31, "learning_rate": 3.936193418558396e-05, "loss": 0.7292, "step": 22790 }, { "epoch": 0.31, "learning_rate": 3.9357627145010514e-05, "loss": 0.6293, "step": 22795 }, { "epoch": 0.31, "learning_rate": 3.9353319468466e-05, "loss": 0.6224, "step": 22800 }, { "epoch": 0.31, "learning_rate": 3.934901115614125e-05, "loss": 0.6621, "step": 22805 }, { "epoch": 0.31, "learning_rate": 3.9344702208227094e-05, "loss": 0.6936, "step": 22810 }, { "epoch": 0.31, "learning_rate": 3.9340392624914385e-05, "loss": 0.9742, "step": 22815 }, { "epoch": 0.31, "learning_rate": 3.933608240639403e-05, "loss": 0.3422, "step": 22820 }, { "epoch": 0.31, "learning_rate": 3.9331771552856943e-05, "loss": 0.5568, "step": 22825 }, { "epoch": 0.31, "learning_rate": 3.932746006449408e-05, "loss": 0.3732, "step": 22830 }, { "epoch": 0.31, "learning_rate": 3.932314794149642e-05, "loss": 0.1079, "step": 22835 }, { "epoch": 0.31, "learning_rate": 3.931883518405495e-05, "loss": 0.5324, "step": 22840 }, { "epoch": 0.31, "learning_rate": 3.931452179236072e-05, "loss": 0.7583, "step": 22845 }, { "epoch": 0.31, "learning_rate": 3.931020776660479e-05, "loss": 1.2035, "step": 22850 }, { "epoch": 0.31, "learning_rate": 3.930589310697824e-05, "loss": 0.5492, "step": 22855 }, { "epoch": 0.31, "learning_rate": 3.930157781367221e-05, "loss": 0.9856, "step": 22860 }, { "epoch": 0.31, "learning_rate": 3.9297261886877825e-05, "loss": 0.7993, "step": 22865 }, { "epoch": 0.31, "learning_rate": 3.9292945326786254e-05, "loss": 0.6334, "step": 22870 }, { "epoch": 0.31, "learning_rate": 3.928862813358873e-05, "loss": 1.0093, "step": 22875 }, { "epoch": 0.31, "learning_rate": 3.928431030747645e-05, "loss": 0.5187, "step": 22880 }, { "epoch": 0.31, "learning_rate": 3.927999184864069e-05, "loss": 0.558, "step": 22885 }, { "epoch": 0.31, "learning_rate": 3.927567275727273e-05, "loss": 0.8676, "step": 22890 }, { "epoch": 0.31, "learning_rate": 3.927135303356389e-05, "loss": 0.7516, "step": 22895 }, { "epoch": 0.31, "learning_rate": 3.926703267770551e-05, "loss": 0.9682, "step": 22900 }, { "epoch": 0.31, "learning_rate": 3.9262711689888945e-05, "loss": 1.0728, "step": 22905 }, { "epoch": 0.31, "learning_rate": 3.9258390070305614e-05, "loss": 0.7652, "step": 22910 }, { "epoch": 0.31, "learning_rate": 3.925406781914693e-05, "loss": 0.3757, "step": 22915 }, { "epoch": 0.31, "learning_rate": 3.924974493660436e-05, "loss": 0.6992, "step": 22920 }, { "epoch": 0.31, "learning_rate": 3.924542142286938e-05, "loss": 1.5635, "step": 22925 }, { "epoch": 0.31, "learning_rate": 3.92410972781335e-05, "loss": 0.4817, "step": 22930 }, { "epoch": 0.31, "learning_rate": 3.9236772502588246e-05, "loss": 0.4374, "step": 22935 }, { "epoch": 0.31, "learning_rate": 3.92324470964252e-05, "loss": 1.1886, "step": 22940 }, { "epoch": 0.31, "learning_rate": 3.9228121059835955e-05, "loss": 1.1457, "step": 22945 }, { "epoch": 0.31, "learning_rate": 3.922379439301212e-05, "loss": 0.9873, "step": 22950 }, { "epoch": 0.31, "learning_rate": 3.921946709614536e-05, "loss": 1.3863, "step": 22955 }, { "epoch": 0.31, "learning_rate": 3.921513916942734e-05, "loss": 0.9121, "step": 22960 }, { "epoch": 0.31, "learning_rate": 3.921081061304977e-05, "loss": 1.6099, "step": 22965 }, { "epoch": 0.31, "learning_rate": 3.920648142720439e-05, "loss": 0.6618, "step": 22970 }, { "epoch": 0.31, "learning_rate": 3.920215161208295e-05, "loss": 0.0683, "step": 22975 }, { "epoch": 0.31, "learning_rate": 3.9197821167877244e-05, "loss": 0.8287, "step": 22980 }, { "epoch": 0.31, "learning_rate": 3.919349009477909e-05, "loss": 0.477, "step": 22985 }, { "epoch": 0.31, "learning_rate": 3.918915839298034e-05, "loss": 0.6129, "step": 22990 }, { "epoch": 0.31, "learning_rate": 3.918482606267286e-05, "loss": 0.805, "step": 22995 }, { "epoch": 0.31, "learning_rate": 3.918049310404854e-05, "loss": 0.8305, "step": 23000 }, { "epoch": 0.31, "learning_rate": 3.9176159517299325e-05, "loss": 0.0966, "step": 23005 }, { "epoch": 0.31, "learning_rate": 3.917182530261716e-05, "loss": 0.1906, "step": 23010 }, { "epoch": 0.31, "learning_rate": 3.916749046019404e-05, "loss": 0.9898, "step": 23015 }, { "epoch": 0.31, "learning_rate": 3.916315499022196e-05, "loss": 0.572, "step": 23020 }, { "epoch": 0.31, "learning_rate": 3.9158818892892976e-05, "loss": 1.0124, "step": 23025 }, { "epoch": 0.31, "learning_rate": 3.915448216839915e-05, "loss": 0.6669, "step": 23030 }, { "epoch": 0.31, "learning_rate": 3.915014481693258e-05, "loss": 0.9218, "step": 23035 }, { "epoch": 0.31, "learning_rate": 3.914580683868539e-05, "loss": 0.4342, "step": 23040 }, { "epoch": 0.31, "learning_rate": 3.914146823384971e-05, "loss": 0.8934, "step": 23045 }, { "epoch": 0.31, "learning_rate": 3.9137129002617746e-05, "loss": 0.3451, "step": 23050 }, { "epoch": 0.31, "learning_rate": 3.9132789145181694e-05, "loss": 0.649, "step": 23055 }, { "epoch": 0.31, "learning_rate": 3.912844866173377e-05, "loss": 0.8214, "step": 23060 }, { "epoch": 0.31, "learning_rate": 3.912410755246627e-05, "loss": 0.1025, "step": 23065 }, { "epoch": 0.31, "learning_rate": 3.911976581757146e-05, "loss": 0.1215, "step": 23070 }, { "epoch": 0.31, "learning_rate": 3.911542345724167e-05, "loss": 0.7339, "step": 23075 }, { "epoch": 0.31, "learning_rate": 3.911108047166924e-05, "loss": 0.3155, "step": 23080 }, { "epoch": 0.31, "learning_rate": 3.910673686104652e-05, "loss": 1.1439, "step": 23085 }, { "epoch": 0.31, "learning_rate": 3.9102392625565956e-05, "loss": 0.7883, "step": 23090 }, { "epoch": 0.31, "learning_rate": 3.909804776541993e-05, "loss": 0.8768, "step": 23095 }, { "epoch": 0.31, "learning_rate": 3.909370228080092e-05, "loss": 0.4122, "step": 23100 }, { "epoch": 0.31, "learning_rate": 3.9089356171901425e-05, "loss": 1.1863, "step": 23105 }, { "epoch": 0.31, "learning_rate": 3.9085009438913934e-05, "loss": 0.8494, "step": 23110 }, { "epoch": 0.31, "learning_rate": 3.9080662082030976e-05, "loss": 1.787, "step": 23115 }, { "epoch": 0.31, "learning_rate": 3.907631410144515e-05, "loss": 0.1161, "step": 23120 }, { "epoch": 0.31, "learning_rate": 3.9071965497349014e-05, "loss": 0.6746, "step": 23125 }, { "epoch": 0.31, "learning_rate": 3.906761626993521e-05, "loss": 0.7762, "step": 23130 }, { "epoch": 0.31, "learning_rate": 3.906326641939639e-05, "loss": 0.9024, "step": 23135 }, { "epoch": 0.31, "learning_rate": 3.905891594592522e-05, "loss": 0.9609, "step": 23140 }, { "epoch": 0.31, "learning_rate": 3.90545648497144e-05, "loss": 0.4082, "step": 23145 }, { "epoch": 0.31, "learning_rate": 3.9050213130956684e-05, "loss": 0.7051, "step": 23150 }, { "epoch": 0.31, "learning_rate": 3.9045860789844815e-05, "loss": 0.4714, "step": 23155 }, { "epoch": 0.31, "learning_rate": 3.904150782657158e-05, "loss": 0.5372, "step": 23160 }, { "epoch": 0.31, "learning_rate": 3.903715424132979e-05, "loss": 0.5082, "step": 23165 }, { "epoch": 0.31, "learning_rate": 3.903280003431229e-05, "loss": 0.7979, "step": 23170 }, { "epoch": 0.31, "learning_rate": 3.9028445205711964e-05, "loss": 0.6081, "step": 23175 }, { "epoch": 0.31, "learning_rate": 3.902408975572169e-05, "loss": 0.2541, "step": 23180 }, { "epoch": 0.31, "learning_rate": 3.901973368453441e-05, "loss": 0.5501, "step": 23185 }, { "epoch": 0.31, "learning_rate": 3.901537699234306e-05, "loss": 1.3347, "step": 23190 }, { "epoch": 0.31, "learning_rate": 3.9011019679340625e-05, "loss": 0.1708, "step": 23195 }, { "epoch": 0.31, "learning_rate": 3.9006661745720116e-05, "loss": 0.8576, "step": 23200 }, { "epoch": 0.31, "learning_rate": 3.900230319167456e-05, "loss": 0.7581, "step": 23205 }, { "epoch": 0.31, "learning_rate": 3.899794401739703e-05, "loss": 0.415, "step": 23210 }, { "epoch": 0.31, "learning_rate": 3.89935842230806e-05, "loss": 0.8994, "step": 23215 }, { "epoch": 0.31, "learning_rate": 3.898922380891841e-05, "loss": 0.4507, "step": 23220 }, { "epoch": 0.31, "learning_rate": 3.8984862775103576e-05, "loss": 0.4953, "step": 23225 }, { "epoch": 0.31, "learning_rate": 3.898050112182929e-05, "loss": 0.1799, "step": 23230 }, { "epoch": 0.31, "learning_rate": 3.897613884928876e-05, "loss": 0.6384, "step": 23235 }, { "epoch": 0.31, "learning_rate": 3.8971775957675186e-05, "loss": 1.0754, "step": 23240 }, { "epoch": 0.31, "learning_rate": 3.896741244718184e-05, "loss": 0.7074, "step": 23245 }, { "epoch": 0.31, "learning_rate": 3.896304831800199e-05, "loss": 0.711, "step": 23250 }, { "epoch": 0.31, "learning_rate": 3.8958683570328964e-05, "loss": 1.9548, "step": 23255 }, { "epoch": 0.31, "learning_rate": 3.895431820435609e-05, "loss": 0.374, "step": 23260 }, { "epoch": 0.31, "learning_rate": 3.894995222027672e-05, "loss": 0.6753, "step": 23265 }, { "epoch": 0.31, "learning_rate": 3.894558561828427e-05, "loss": 0.4215, "step": 23270 }, { "epoch": 0.31, "learning_rate": 3.894121839857214e-05, "loss": 1.0601, "step": 23275 }, { "epoch": 0.31, "learning_rate": 3.893685056133377e-05, "loss": 1.2408, "step": 23280 }, { "epoch": 0.31, "learning_rate": 3.893248210676266e-05, "loss": 0.4244, "step": 23285 }, { "epoch": 0.31, "learning_rate": 3.892811303505229e-05, "loss": 1.0237, "step": 23290 }, { "epoch": 0.31, "learning_rate": 3.892374334639619e-05, "loss": 1.3952, "step": 23295 }, { "epoch": 0.31, "learning_rate": 3.8919373040987916e-05, "loss": 0.7455, "step": 23300 }, { "epoch": 0.31, "learning_rate": 3.891500211902106e-05, "loss": 0.6963, "step": 23305 }, { "epoch": 0.31, "learning_rate": 3.891063058068922e-05, "loss": 0.3887, "step": 23310 }, { "epoch": 0.31, "learning_rate": 3.890625842618604e-05, "loss": 0.4984, "step": 23315 }, { "epoch": 0.31, "learning_rate": 3.890188565570517e-05, "loss": 0.0766, "step": 23320 }, { "epoch": 0.31, "learning_rate": 3.889751226944033e-05, "loss": 0.9138, "step": 23325 }, { "epoch": 0.31, "learning_rate": 3.8893138267585215e-05, "loss": 0.6254, "step": 23330 }, { "epoch": 0.31, "learning_rate": 3.888876365033358e-05, "loss": 1.0063, "step": 23335 }, { "epoch": 0.31, "learning_rate": 3.8884388417879216e-05, "loss": 0.6483, "step": 23340 }, { "epoch": 0.31, "learning_rate": 3.8880012570415886e-05, "loss": 0.9824, "step": 23345 }, { "epoch": 0.31, "learning_rate": 3.8875636108137447e-05, "loss": 0.7633, "step": 23350 }, { "epoch": 0.31, "learning_rate": 3.8871259031237745e-05, "loss": 0.4989, "step": 23355 }, { "epoch": 0.31, "learning_rate": 3.886688133991066e-05, "loss": 0.4342, "step": 23360 }, { "epoch": 0.31, "learning_rate": 3.8862503034350104e-05, "loss": 0.7018, "step": 23365 }, { "epoch": 0.31, "learning_rate": 3.8858124114750026e-05, "loss": 0.923, "step": 23370 }, { "epoch": 0.31, "learning_rate": 3.885374458130437e-05, "loss": 0.9624, "step": 23375 }, { "epoch": 0.31, "learning_rate": 3.884936443420715e-05, "loss": 0.7618, "step": 23380 }, { "epoch": 0.31, "learning_rate": 3.8844983673652355e-05, "loss": 1.2416, "step": 23385 }, { "epoch": 0.31, "learning_rate": 3.884060229983405e-05, "loss": 0.5916, "step": 23390 }, { "epoch": 0.31, "learning_rate": 3.883622031294631e-05, "loss": 0.0869, "step": 23395 }, { "epoch": 0.31, "learning_rate": 3.883183771318324e-05, "loss": 0.7152, "step": 23400 }, { "epoch": 0.31, "learning_rate": 3.8827454500738944e-05, "loss": 0.5328, "step": 23405 }, { "epoch": 0.31, "learning_rate": 3.88230706758076e-05, "loss": 0.9879, "step": 23410 }, { "epoch": 0.31, "learning_rate": 3.8818686238583374e-05, "loss": 1.0609, "step": 23415 }, { "epoch": 0.31, "learning_rate": 3.881430118926048e-05, "loss": 0.5349, "step": 23420 }, { "epoch": 0.31, "learning_rate": 3.880991552803316e-05, "loss": 0.3948, "step": 23425 }, { "epoch": 0.31, "learning_rate": 3.880552925509566e-05, "loss": 0.8813, "step": 23430 }, { "epoch": 0.31, "learning_rate": 3.8801142370642283e-05, "loss": 1.1901, "step": 23435 }, { "epoch": 0.31, "learning_rate": 3.879675487486735e-05, "loss": 0.2451, "step": 23440 }, { "epoch": 0.31, "learning_rate": 3.87923667679652e-05, "loss": 0.5081, "step": 23445 }, { "epoch": 0.31, "learning_rate": 3.8787978050130203e-05, "loss": 0.4217, "step": 23450 }, { "epoch": 0.31, "learning_rate": 3.878358872155675e-05, "loss": 0.7806, "step": 23455 }, { "epoch": 0.31, "learning_rate": 3.877919878243928e-05, "loss": 0.5808, "step": 23460 }, { "epoch": 0.31, "learning_rate": 3.877480823297224e-05, "loss": 0.6996, "step": 23465 }, { "epoch": 0.31, "learning_rate": 3.877041707335011e-05, "loss": 1.1667, "step": 23470 }, { "epoch": 0.31, "learning_rate": 3.8766025303767383e-05, "loss": 0.9691, "step": 23475 }, { "epoch": 0.31, "learning_rate": 3.876163292441861e-05, "loss": 1.0553, "step": 23480 }, { "epoch": 0.31, "learning_rate": 3.875723993549835e-05, "loss": 0.6593, "step": 23485 }, { "epoch": 0.31, "learning_rate": 3.8752846337201186e-05, "loss": 0.3731, "step": 23490 }, { "epoch": 0.31, "learning_rate": 3.874845212972173e-05, "loss": 0.5581, "step": 23495 }, { "epoch": 0.31, "learning_rate": 3.874405731325463e-05, "loss": 0.3325, "step": 23500 }, { "epoch": 0.31, "learning_rate": 3.873966188799455e-05, "loss": 0.6524, "step": 23505 }, { "epoch": 0.31, "learning_rate": 3.8735265854136185e-05, "loss": 0.8873, "step": 23510 }, { "epoch": 0.32, "learning_rate": 3.873086921187425e-05, "loss": 0.44, "step": 23515 }, { "epoch": 0.32, "learning_rate": 3.8726471961403507e-05, "loss": 0.8117, "step": 23520 }, { "epoch": 0.32, "learning_rate": 3.8722074102918734e-05, "loss": 1.1221, "step": 23525 }, { "epoch": 0.32, "learning_rate": 3.871767563661471e-05, "loss": 0.875, "step": 23530 }, { "epoch": 0.32, "learning_rate": 3.87132765626863e-05, "loss": 0.2997, "step": 23535 }, { "epoch": 0.32, "learning_rate": 3.8708876881328335e-05, "loss": 0.6645, "step": 23540 }, { "epoch": 0.32, "learning_rate": 3.8704476592735716e-05, "loss": 0.4537, "step": 23545 }, { "epoch": 0.32, "learning_rate": 3.870007569710334e-05, "loss": 0.9502, "step": 23550 }, { "epoch": 0.32, "learning_rate": 3.8695674194626154e-05, "loss": 0.898, "step": 23555 }, { "epoch": 0.32, "learning_rate": 3.8691272085499116e-05, "loss": 0.5563, "step": 23560 }, { "epoch": 0.32, "learning_rate": 3.868686936991722e-05, "loss": 1.2297, "step": 23565 }, { "epoch": 0.32, "learning_rate": 3.868246604807548e-05, "loss": 1.2051, "step": 23570 }, { "epoch": 0.32, "learning_rate": 3.8678062120168945e-05, "loss": 1.1428, "step": 23575 }, { "epoch": 0.32, "learning_rate": 3.8673657586392694e-05, "loss": 0.9051, "step": 23580 }, { "epoch": 0.32, "learning_rate": 3.8669252446941815e-05, "loss": 0.6665, "step": 23585 }, { "epoch": 0.32, "learning_rate": 3.8664846702011436e-05, "loss": 0.4815, "step": 23590 }, { "epoch": 0.32, "learning_rate": 3.866044035179671e-05, "loss": 0.4965, "step": 23595 }, { "epoch": 0.32, "learning_rate": 3.8656033396492823e-05, "loss": 0.2381, "step": 23600 }, { "epoch": 0.32, "learning_rate": 3.865162583629498e-05, "loss": 0.8256, "step": 23605 }, { "epoch": 0.32, "learning_rate": 3.8647217671398394e-05, "loss": 1.2712, "step": 23610 }, { "epoch": 0.32, "learning_rate": 3.864280890199835e-05, "loss": 0.766, "step": 23615 }, { "epoch": 0.32, "learning_rate": 3.863839952829012e-05, "loss": 0.3761, "step": 23620 }, { "epoch": 0.32, "learning_rate": 3.863398955046903e-05, "loss": 0.7984, "step": 23625 }, { "epoch": 0.32, "learning_rate": 3.8629578968730406e-05, "loss": 0.4039, "step": 23630 }, { "epoch": 0.32, "learning_rate": 3.862516778326962e-05, "loss": 1.1564, "step": 23635 }, { "epoch": 0.32, "learning_rate": 3.862075599428207e-05, "loss": 0.4095, "step": 23640 }, { "epoch": 0.32, "learning_rate": 3.861634360196317e-05, "loss": 1.1131, "step": 23645 }, { "epoch": 0.32, "learning_rate": 3.8611930606508364e-05, "loss": 0.1361, "step": 23650 }, { "epoch": 0.32, "learning_rate": 3.860751700811314e-05, "loss": 0.5455, "step": 23655 }, { "epoch": 0.32, "learning_rate": 3.860310280697298e-05, "loss": 0.1449, "step": 23660 }, { "epoch": 0.32, "learning_rate": 3.8598688003283426e-05, "loss": 0.9088, "step": 23665 }, { "epoch": 0.32, "learning_rate": 3.8594272597240025e-05, "loss": 0.369, "step": 23670 }, { "epoch": 0.32, "learning_rate": 3.858985658903835e-05, "loss": 0.8861, "step": 23675 }, { "epoch": 0.32, "learning_rate": 3.858543997887402e-05, "loss": 0.4745, "step": 23680 }, { "epoch": 0.32, "learning_rate": 3.8581022766942664e-05, "loss": 1.4327, "step": 23685 }, { "epoch": 0.32, "learning_rate": 3.857660495343994e-05, "loss": 0.5411, "step": 23690 }, { "epoch": 0.32, "learning_rate": 3.857218653856155e-05, "loss": 1.4805, "step": 23695 }, { "epoch": 0.32, "learning_rate": 3.856776752250319e-05, "loss": 0.4888, "step": 23700 }, { "epoch": 0.32, "learning_rate": 3.85633479054606e-05, "loss": 0.8763, "step": 23705 }, { "epoch": 0.32, "learning_rate": 3.855892768762957e-05, "loss": 1.2174, "step": 23710 }, { "epoch": 0.32, "learning_rate": 3.855450686920585e-05, "loss": 0.885, "step": 23715 }, { "epoch": 0.32, "learning_rate": 3.855008545038531e-05, "loss": 0.8236, "step": 23720 }, { "epoch": 0.32, "learning_rate": 3.8545663431363764e-05, "loss": 0.4047, "step": 23725 }, { "epoch": 0.32, "learning_rate": 3.85412408123371e-05, "loss": 1.4284, "step": 23730 }, { "epoch": 0.32, "learning_rate": 3.853681759350121e-05, "loss": 0.8037, "step": 23735 }, { "epoch": 0.32, "learning_rate": 3.853239377505201e-05, "loss": 0.3374, "step": 23740 }, { "epoch": 0.32, "learning_rate": 3.852796935718549e-05, "loss": 0.3545, "step": 23745 }, { "epoch": 0.32, "learning_rate": 3.8523544340097584e-05, "loss": 0.766, "step": 23750 }, { "epoch": 0.32, "learning_rate": 3.851911872398433e-05, "loss": 0.3855, "step": 23755 }, { "epoch": 0.32, "learning_rate": 3.851469250904175e-05, "loss": 0.8166, "step": 23760 }, { "epoch": 0.32, "learning_rate": 3.851026569546591e-05, "loss": 1.6127, "step": 23765 }, { "epoch": 0.32, "learning_rate": 3.8505838283452885e-05, "loss": 0.4721, "step": 23770 }, { "epoch": 0.32, "learning_rate": 3.850141027319879e-05, "loss": 1.0772, "step": 23775 }, { "epoch": 0.32, "learning_rate": 3.8496981664899765e-05, "loss": 0.3821, "step": 23780 }, { "epoch": 0.32, "learning_rate": 3.8492552458751974e-05, "loss": 0.8276, "step": 23785 }, { "epoch": 0.32, "learning_rate": 3.8488122654951606e-05, "loss": 0.3016, "step": 23790 }, { "epoch": 0.32, "learning_rate": 3.8483692253694896e-05, "loss": 0.2645, "step": 23795 }, { "epoch": 0.32, "learning_rate": 3.847926125517807e-05, "loss": 0.5956, "step": 23800 }, { "epoch": 0.32, "learning_rate": 3.84748296595974e-05, "loss": 0.8768, "step": 23805 }, { "epoch": 0.32, "learning_rate": 3.84703974671492e-05, "loss": 1.1143, "step": 23810 }, { "epoch": 0.32, "learning_rate": 3.846596467802978e-05, "loss": 0.8881, "step": 23815 }, { "epoch": 0.32, "learning_rate": 3.8461531292435485e-05, "loss": 0.3966, "step": 23820 }, { "epoch": 0.32, "learning_rate": 3.84570973105627e-05, "loss": 0.6174, "step": 23825 }, { "epoch": 0.32, "learning_rate": 3.845266273260783e-05, "loss": 0.5989, "step": 23830 }, { "epoch": 0.32, "learning_rate": 3.84482275587673e-05, "loss": 1.7389, "step": 23835 }, { "epoch": 0.32, "learning_rate": 3.844379178923757e-05, "loss": 0.593, "step": 23840 }, { "epoch": 0.32, "learning_rate": 3.843935542421513e-05, "loss": 1.1879, "step": 23845 }, { "epoch": 0.32, "learning_rate": 3.8434918463896475e-05, "loss": 0.7496, "step": 23850 }, { "epoch": 0.32, "learning_rate": 3.8430480908478136e-05, "loss": 0.8239, "step": 23855 }, { "epoch": 0.32, "learning_rate": 3.842604275815669e-05, "loss": 1.0711, "step": 23860 }, { "epoch": 0.32, "learning_rate": 3.842160401312872e-05, "loss": 0.6918, "step": 23865 }, { "epoch": 0.32, "learning_rate": 3.841716467359083e-05, "loss": 0.8704, "step": 23870 }, { "epoch": 0.32, "learning_rate": 3.841272473973968e-05, "loss": 0.8752, "step": 23875 }, { "epoch": 0.32, "learning_rate": 3.8408284211771924e-05, "loss": 0.3563, "step": 23880 }, { "epoch": 0.32, "learning_rate": 3.8403843089884254e-05, "loss": 0.607, "step": 23885 }, { "epoch": 0.32, "learning_rate": 3.8399401374273386e-05, "loss": 1.1755, "step": 23890 }, { "epoch": 0.32, "learning_rate": 3.8394959065136084e-05, "loss": 0.3341, "step": 23895 }, { "epoch": 0.32, "learning_rate": 3.83905161626691e-05, "loss": 0.483, "step": 23900 }, { "epoch": 0.32, "learning_rate": 3.838607266706924e-05, "loss": 0.5369, "step": 23905 }, { "epoch": 0.32, "learning_rate": 3.838162857853334e-05, "loss": 0.5859, "step": 23910 }, { "epoch": 0.32, "learning_rate": 3.837718389725823e-05, "loss": 0.8818, "step": 23915 }, { "epoch": 0.32, "learning_rate": 3.8372738623440796e-05, "loss": 0.5662, "step": 23920 }, { "epoch": 0.32, "learning_rate": 3.8368292757277956e-05, "loss": 0.2573, "step": 23925 }, { "epoch": 0.32, "learning_rate": 3.836384629896661e-05, "loss": 0.6653, "step": 23930 }, { "epoch": 0.32, "learning_rate": 3.835939924870374e-05, "loss": 1.3079, "step": 23935 }, { "epoch": 0.32, "learning_rate": 3.835495160668631e-05, "loss": 0.7263, "step": 23940 }, { "epoch": 0.32, "learning_rate": 3.8350503373111345e-05, "loss": 0.916, "step": 23945 }, { "epoch": 0.32, "learning_rate": 3.834605454817587e-05, "loss": 0.7341, "step": 23950 }, { "epoch": 0.32, "learning_rate": 3.834160513207694e-05, "loss": 0.8241, "step": 23955 }, { "epoch": 0.32, "learning_rate": 3.833715512501166e-05, "loss": 0.7049, "step": 23960 }, { "epoch": 0.32, "learning_rate": 3.833270452717712e-05, "loss": 0.937, "step": 23965 }, { "epoch": 0.32, "learning_rate": 3.8328253338770483e-05, "loss": 0.9856, "step": 23970 }, { "epoch": 0.32, "learning_rate": 3.8323801559988894e-05, "loss": 0.9845, "step": 23975 }, { "epoch": 0.32, "learning_rate": 3.831934919102955e-05, "loss": 1.1249, "step": 23980 }, { "epoch": 0.32, "learning_rate": 3.831489623208968e-05, "loss": 0.8142, "step": 23985 }, { "epoch": 0.32, "learning_rate": 3.831044268336652e-05, "loss": 0.7838, "step": 23990 }, { "epoch": 0.32, "learning_rate": 3.830598854505732e-05, "loss": 0.248, "step": 23995 }, { "epoch": 0.32, "learning_rate": 3.8301533817359414e-05, "loss": 0.7938, "step": 24000 }, { "epoch": 0.32, "learning_rate": 3.8297078500470104e-05, "loss": 0.7034, "step": 24005 }, { "epoch": 0.32, "learning_rate": 3.829262259458674e-05, "loss": 1.0375, "step": 24010 }, { "epoch": 0.32, "learning_rate": 3.8288166099906686e-05, "loss": 0.6956, "step": 24015 }, { "epoch": 0.32, "learning_rate": 3.828370901662736e-05, "loss": 1.4967, "step": 24020 }, { "epoch": 0.32, "learning_rate": 3.8279251344946176e-05, "loss": 0.8592, "step": 24025 }, { "epoch": 0.32, "learning_rate": 3.82747930850606e-05, "loss": 0.7223, "step": 24030 }, { "epoch": 0.32, "learning_rate": 3.82703342371681e-05, "loss": 1.0507, "step": 24035 }, { "epoch": 0.32, "learning_rate": 3.826587480146617e-05, "loss": 0.721, "step": 24040 }, { "epoch": 0.32, "learning_rate": 3.8261414778152375e-05, "loss": 0.8075, "step": 24045 }, { "epoch": 0.32, "learning_rate": 3.825695416742423e-05, "loss": 1.013, "step": 24050 }, { "epoch": 0.32, "learning_rate": 3.825249296947935e-05, "loss": 0.2566, "step": 24055 }, { "epoch": 0.32, "learning_rate": 3.824803118451533e-05, "loss": 0.8262, "step": 24060 }, { "epoch": 0.32, "learning_rate": 3.8243568812729793e-05, "loss": 0.9719, "step": 24065 }, { "epoch": 0.32, "learning_rate": 3.823910585432043e-05, "loss": 0.4145, "step": 24070 }, { "epoch": 0.32, "learning_rate": 3.82346423094849e-05, "loss": 0.5976, "step": 24075 }, { "epoch": 0.32, "learning_rate": 3.8230178178420936e-05, "loss": 0.6936, "step": 24080 }, { "epoch": 0.32, "learning_rate": 3.822571346132626e-05, "loss": 0.6088, "step": 24085 }, { "epoch": 0.32, "learning_rate": 3.822124815839865e-05, "loss": 1.0675, "step": 24090 }, { "epoch": 0.32, "learning_rate": 3.8216782269835885e-05, "loss": 0.867, "step": 24095 }, { "epoch": 0.32, "learning_rate": 3.821231579583579e-05, "loss": 0.8633, "step": 24100 }, { "epoch": 0.32, "learning_rate": 3.82078487365962e-05, "loss": 0.7463, "step": 24105 }, { "epoch": 0.32, "learning_rate": 3.820338109231499e-05, "loss": 0.4903, "step": 24110 }, { "epoch": 0.32, "learning_rate": 3.819891286319006e-05, "loss": 0.8759, "step": 24115 }, { "epoch": 0.32, "learning_rate": 3.8194444049419306e-05, "loss": 0.8537, "step": 24120 }, { "epoch": 0.32, "learning_rate": 3.8189974651200706e-05, "loss": 0.6817, "step": 24125 }, { "epoch": 0.32, "learning_rate": 3.818550466873221e-05, "loss": 1.1874, "step": 24130 }, { "epoch": 0.32, "learning_rate": 3.818103410221182e-05, "loss": 0.3722, "step": 24135 }, { "epoch": 0.32, "learning_rate": 3.8176562951837566e-05, "loss": 0.4252, "step": 24140 }, { "epoch": 0.32, "learning_rate": 3.817209121780749e-05, "loss": 0.3457, "step": 24145 }, { "epoch": 0.32, "learning_rate": 3.816761890031967e-05, "loss": 0.6843, "step": 24150 }, { "epoch": 0.32, "learning_rate": 3.8163145999572214e-05, "loss": 0.9472, "step": 24155 }, { "epoch": 0.32, "learning_rate": 3.8158672515763235e-05, "loss": 0.2857, "step": 24160 }, { "epoch": 0.32, "learning_rate": 3.81541984490909e-05, "loss": 0.1666, "step": 24165 }, { "epoch": 0.32, "learning_rate": 3.8149723799753385e-05, "loss": 1.5101, "step": 24170 }, { "epoch": 0.32, "learning_rate": 3.8145248567948886e-05, "loss": 0.7303, "step": 24175 }, { "epoch": 0.32, "learning_rate": 3.814077275387564e-05, "loss": 0.6192, "step": 24180 }, { "epoch": 0.32, "learning_rate": 3.81362963577319e-05, "loss": 0.8788, "step": 24185 }, { "epoch": 0.32, "learning_rate": 3.813181937971596e-05, "loss": 0.589, "step": 24190 }, { "epoch": 0.32, "learning_rate": 3.812734182002611e-05, "loss": 1.1872, "step": 24195 }, { "epoch": 0.32, "learning_rate": 3.8122863678860694e-05, "loss": 1.6408, "step": 24200 }, { "epoch": 0.32, "learning_rate": 3.8118384956418064e-05, "loss": 0.6828, "step": 24205 }, { "epoch": 0.32, "learning_rate": 3.811390565289661e-05, "loss": 0.8469, "step": 24210 }, { "epoch": 0.32, "learning_rate": 3.8109425768494744e-05, "loss": 0.823, "step": 24215 }, { "epoch": 0.32, "learning_rate": 3.8104945303410906e-05, "loss": 0.8629, "step": 24220 }, { "epoch": 0.32, "learning_rate": 3.810046425784355e-05, "loss": 0.9353, "step": 24225 }, { "epoch": 0.32, "learning_rate": 3.809598263199117e-05, "loss": 1.1871, "step": 24230 }, { "epoch": 0.32, "learning_rate": 3.809150042605227e-05, "loss": 0.5899, "step": 24235 }, { "epoch": 0.32, "learning_rate": 3.80870176402254e-05, "loss": 0.6751, "step": 24240 }, { "epoch": 0.32, "learning_rate": 3.8082534274709115e-05, "loss": 0.8383, "step": 24245 }, { "epoch": 0.32, "learning_rate": 3.807805032970202e-05, "loss": 0.2457, "step": 24250 }, { "epoch": 0.32, "learning_rate": 3.807356580540272e-05, "loss": 1.7371, "step": 24255 }, { "epoch": 0.33, "learning_rate": 3.806908070200986e-05, "loss": 0.9853, "step": 24260 }, { "epoch": 0.33, "learning_rate": 3.80645950197221e-05, "loss": 0.66, "step": 24265 }, { "epoch": 0.33, "learning_rate": 3.8060108758738145e-05, "loss": 1.0308, "step": 24270 }, { "epoch": 0.33, "learning_rate": 3.8055621919256715e-05, "loss": 0.7236, "step": 24275 }, { "epoch": 0.33, "learning_rate": 3.805113450147655e-05, "loss": 0.4188, "step": 24280 }, { "epoch": 0.33, "learning_rate": 3.804664650559641e-05, "loss": 0.6186, "step": 24285 }, { "epoch": 0.33, "learning_rate": 3.8042157931815106e-05, "loss": 0.9247, "step": 24290 }, { "epoch": 0.33, "learning_rate": 3.803766878033145e-05, "loss": 0.9918, "step": 24295 }, { "epoch": 0.33, "learning_rate": 3.8033179051344294e-05, "loss": 0.7281, "step": 24300 }, { "epoch": 0.33, "learning_rate": 3.802868874505251e-05, "loss": 0.6478, "step": 24305 }, { "epoch": 0.33, "learning_rate": 3.8024197861655e-05, "loss": 0.365, "step": 24310 }, { "epoch": 0.33, "learning_rate": 3.801970640135067e-05, "loss": 0.7387, "step": 24315 }, { "epoch": 0.33, "learning_rate": 3.801521436433849e-05, "loss": 0.3411, "step": 24320 }, { "epoch": 0.33, "learning_rate": 3.801072175081743e-05, "loss": 0.7468, "step": 24325 }, { "epoch": 0.33, "learning_rate": 3.8006228560986484e-05, "loss": 0.5464, "step": 24330 }, { "epoch": 0.33, "learning_rate": 3.8001734795044686e-05, "loss": 0.6094, "step": 24335 }, { "epoch": 0.33, "learning_rate": 3.799724045319107e-05, "loss": 0.3446, "step": 24340 }, { "epoch": 0.33, "learning_rate": 3.7992745535624736e-05, "loss": 1.2662, "step": 24345 }, { "epoch": 0.33, "learning_rate": 3.798825004254477e-05, "loss": 0.5556, "step": 24350 }, { "epoch": 0.33, "learning_rate": 3.7983753974150304e-05, "loss": 0.4311, "step": 24355 }, { "epoch": 0.33, "learning_rate": 3.7979257330640497e-05, "loss": 1.0037, "step": 24360 }, { "epoch": 0.33, "learning_rate": 3.797476011221452e-05, "loss": 0.4782, "step": 24365 }, { "epoch": 0.33, "learning_rate": 3.797026231907158e-05, "loss": 1.0164, "step": 24370 }, { "epoch": 0.33, "learning_rate": 3.7965763951410914e-05, "loss": 0.5538, "step": 24375 }, { "epoch": 0.33, "learning_rate": 3.796126500943177e-05, "loss": 0.9348, "step": 24380 }, { "epoch": 0.33, "learning_rate": 3.795676549333342e-05, "loss": 0.1577, "step": 24385 }, { "epoch": 0.33, "learning_rate": 3.795226540331519e-05, "loss": 0.9627, "step": 24390 }, { "epoch": 0.33, "learning_rate": 3.7947764739576394e-05, "loss": 0.6241, "step": 24395 }, { "epoch": 0.33, "learning_rate": 3.7943263502316394e-05, "loss": 0.2312, "step": 24400 }, { "epoch": 0.33, "learning_rate": 3.793876169173458e-05, "loss": 1.1381, "step": 24405 }, { "epoch": 0.33, "learning_rate": 3.793425930803034e-05, "loss": 1.0315, "step": 24410 }, { "epoch": 0.33, "learning_rate": 3.792975635140314e-05, "loss": 0.6693, "step": 24415 }, { "epoch": 0.33, "learning_rate": 3.792525282205242e-05, "loss": 0.3914, "step": 24420 }, { "epoch": 0.33, "learning_rate": 3.792074872017764e-05, "loss": 0.9577, "step": 24425 }, { "epoch": 0.33, "learning_rate": 3.791624404597835e-05, "loss": 0.4765, "step": 24430 }, { "epoch": 0.33, "learning_rate": 3.791173879965406e-05, "loss": 0.7258, "step": 24435 }, { "epoch": 0.33, "learning_rate": 3.790723298140434e-05, "loss": 0.7476, "step": 24440 }, { "epoch": 0.33, "learning_rate": 3.790272659142877e-05, "loss": 0.2048, "step": 24445 }, { "epoch": 0.33, "learning_rate": 3.7898219629926966e-05, "loss": 1.2109, "step": 24450 }, { "epoch": 0.33, "learning_rate": 3.7893712097098564e-05, "loss": 0.5894, "step": 24455 }, { "epoch": 0.33, "learning_rate": 3.788920399314321e-05, "loss": 1.2562, "step": 24460 }, { "epoch": 0.33, "learning_rate": 3.78846953182606e-05, "loss": 0.6419, "step": 24465 }, { "epoch": 0.33, "learning_rate": 3.788018607265046e-05, "loss": 0.5339, "step": 24470 }, { "epoch": 0.33, "learning_rate": 3.787567625651251e-05, "loss": 1.0746, "step": 24475 }, { "epoch": 0.33, "learning_rate": 3.787116587004651e-05, "loss": 0.4565, "step": 24480 }, { "epoch": 0.33, "learning_rate": 3.786665491345226e-05, "loss": 0.8327, "step": 24485 }, { "epoch": 0.33, "learning_rate": 3.786214338692957e-05, "loss": 0.4971, "step": 24490 }, { "epoch": 0.33, "learning_rate": 3.7857631290678275e-05, "loss": 0.8128, "step": 24495 }, { "epoch": 0.33, "learning_rate": 3.785311862489823e-05, "loss": 0.4459, "step": 24500 }, { "epoch": 0.33, "learning_rate": 3.784860538978934e-05, "loss": 0.4915, "step": 24505 }, { "epoch": 0.33, "learning_rate": 3.784409158555151e-05, "loss": 1.0629, "step": 24510 }, { "epoch": 0.33, "learning_rate": 3.783957721238468e-05, "loss": 0.9988, "step": 24515 }, { "epoch": 0.33, "learning_rate": 3.783506227048881e-05, "loss": 0.8574, "step": 24520 }, { "epoch": 0.33, "learning_rate": 3.7830546760063896e-05, "loss": 0.1478, "step": 24525 }, { "epoch": 0.33, "learning_rate": 3.782603068130996e-05, "loss": 0.6352, "step": 24530 }, { "epoch": 0.33, "learning_rate": 3.7821514034427006e-05, "loss": 0.872, "step": 24535 }, { "epoch": 0.33, "learning_rate": 3.781699681961514e-05, "loss": 0.4606, "step": 24540 }, { "epoch": 0.33, "learning_rate": 3.7812479037074436e-05, "loss": 0.309, "step": 24545 }, { "epoch": 0.33, "learning_rate": 3.7807960687005e-05, "loss": 0.4212, "step": 24550 }, { "epoch": 0.33, "learning_rate": 3.7803441769607004e-05, "loss": 0.9931, "step": 24555 }, { "epoch": 0.33, "learning_rate": 3.7798922285080575e-05, "loss": 0.3635, "step": 24560 }, { "epoch": 0.33, "learning_rate": 3.779440223362593e-05, "loss": 0.7206, "step": 24565 }, { "epoch": 0.33, "learning_rate": 3.7789881615443254e-05, "loss": 0.6232, "step": 24570 }, { "epoch": 0.33, "learning_rate": 3.778536043073282e-05, "loss": 0.5903, "step": 24575 }, { "epoch": 0.33, "learning_rate": 3.7780838679694887e-05, "loss": 0.1123, "step": 24580 }, { "epoch": 0.33, "learning_rate": 3.777631636252974e-05, "loss": 0.8093, "step": 24585 }, { "epoch": 0.33, "learning_rate": 3.777179347943769e-05, "loss": 0.1892, "step": 24590 }, { "epoch": 0.33, "learning_rate": 3.776727003061909e-05, "loss": 0.6841, "step": 24595 }, { "epoch": 0.33, "learning_rate": 3.77627460162743e-05, "loss": 0.6524, "step": 24600 }, { "epoch": 0.33, "learning_rate": 3.77582214366037e-05, "loss": 1.0141, "step": 24605 }, { "epoch": 0.33, "learning_rate": 3.7753696291807736e-05, "loss": 0.6354, "step": 24610 }, { "epoch": 0.33, "learning_rate": 3.7749170582086814e-05, "loss": 0.7018, "step": 24615 }, { "epoch": 0.33, "learning_rate": 3.774464430764143e-05, "loss": 0.6539, "step": 24620 }, { "epoch": 0.33, "learning_rate": 3.774011746867205e-05, "loss": 1.0639, "step": 24625 }, { "epoch": 0.33, "learning_rate": 3.773559006537921e-05, "loss": 0.8795, "step": 24630 }, { "epoch": 0.33, "learning_rate": 3.773106209796345e-05, "loss": 0.998, "step": 24635 }, { "epoch": 0.33, "learning_rate": 3.7726533566625335e-05, "loss": 0.282, "step": 24640 }, { "epoch": 0.33, "learning_rate": 3.7722004471565434e-05, "loss": 0.5552, "step": 24645 }, { "epoch": 0.33, "learning_rate": 3.7717474812984386e-05, "loss": 0.2324, "step": 24650 }, { "epoch": 0.33, "learning_rate": 3.771294459108283e-05, "loss": 0.5787, "step": 24655 }, { "epoch": 0.33, "learning_rate": 3.770841380606143e-05, "loss": 0.5955, "step": 24660 }, { "epoch": 0.33, "learning_rate": 3.770388245812088e-05, "loss": 1.0356, "step": 24665 }, { "epoch": 0.33, "learning_rate": 3.769935054746189e-05, "loss": 0.9986, "step": 24670 }, { "epoch": 0.33, "learning_rate": 3.76948180742852e-05, "loss": 0.5599, "step": 24675 }, { "epoch": 0.33, "learning_rate": 3.769028503879158e-05, "loss": 1.1153, "step": 24680 }, { "epoch": 0.33, "learning_rate": 3.7685751441181824e-05, "loss": 0.4767, "step": 24685 }, { "epoch": 0.33, "learning_rate": 3.7681217281656745e-05, "loss": 1.2054, "step": 24690 }, { "epoch": 0.33, "learning_rate": 3.7676682560417186e-05, "loss": 1.3261, "step": 24695 }, { "epoch": 0.33, "learning_rate": 3.7672147277664e-05, "loss": 0.298, "step": 24700 }, { "epoch": 0.33, "learning_rate": 3.7667611433598085e-05, "loss": 0.8418, "step": 24705 }, { "epoch": 0.33, "learning_rate": 3.766307502842037e-05, "loss": 1.1357, "step": 24710 }, { "epoch": 0.33, "learning_rate": 3.7658538062331775e-05, "loss": 1.1904, "step": 24715 }, { "epoch": 0.33, "learning_rate": 3.7654000535533276e-05, "loss": 0.538, "step": 24720 }, { "epoch": 0.33, "learning_rate": 3.764946244822585e-05, "loss": 1.4292, "step": 24725 }, { "epoch": 0.33, "learning_rate": 3.7644923800610526e-05, "loss": 0.9699, "step": 24730 }, { "epoch": 0.33, "learning_rate": 3.764038459288833e-05, "loss": 1.1509, "step": 24735 }, { "epoch": 0.33, "learning_rate": 3.763584482526035e-05, "loss": 1.4271, "step": 24740 }, { "epoch": 0.33, "learning_rate": 3.763130449792766e-05, "loss": 0.4773, "step": 24745 }, { "epoch": 0.33, "learning_rate": 3.7626763611091367e-05, "loss": 0.8146, "step": 24750 }, { "epoch": 0.33, "learning_rate": 3.7622222164952606e-05, "loss": 0.5348, "step": 24755 }, { "epoch": 0.33, "learning_rate": 3.761768015971255e-05, "loss": 0.6908, "step": 24760 }, { "epoch": 0.33, "learning_rate": 3.76131375955724e-05, "loss": 0.4882, "step": 24765 }, { "epoch": 0.33, "learning_rate": 3.760859447273336e-05, "loss": 1.3658, "step": 24770 }, { "epoch": 0.33, "learning_rate": 3.760405079139665e-05, "loss": 0.5717, "step": 24775 }, { "epoch": 0.33, "learning_rate": 3.759950655176355e-05, "loss": 0.6347, "step": 24780 }, { "epoch": 0.33, "learning_rate": 3.759496175403535e-05, "loss": 0.3313, "step": 24785 }, { "epoch": 0.33, "learning_rate": 3.759041639841334e-05, "loss": 0.9695, "step": 24790 }, { "epoch": 0.33, "learning_rate": 3.7585870485098886e-05, "loss": 0.9392, "step": 24795 }, { "epoch": 0.33, "learning_rate": 3.7581324014293326e-05, "loss": 0.9624, "step": 24800 }, { "epoch": 0.33, "learning_rate": 3.7576776986198065e-05, "loss": 1.0712, "step": 24805 }, { "epoch": 0.33, "learning_rate": 3.757222940101449e-05, "loss": 1.2983, "step": 24810 }, { "epoch": 0.33, "learning_rate": 3.7567681258944055e-05, "loss": 0.2944, "step": 24815 }, { "epoch": 0.33, "learning_rate": 3.756313256018822e-05, "loss": 1.053, "step": 24820 }, { "epoch": 0.33, "learning_rate": 3.755858330494846e-05, "loss": 0.8827, "step": 24825 }, { "epoch": 0.33, "learning_rate": 3.755403349342629e-05, "loss": 0.7918, "step": 24830 }, { "epoch": 0.33, "learning_rate": 3.755039324382064e-05, "loss": 1.1005, "step": 24835 }, { "epoch": 0.33, "learning_rate": 3.754584243149801e-05, "loss": 0.6088, "step": 24840 }, { "epoch": 0.33, "learning_rate": 3.754129106345732e-05, "loss": 0.444, "step": 24845 }, { "epoch": 0.33, "learning_rate": 3.753673913990018e-05, "loss": 0.3033, "step": 24850 }, { "epoch": 0.33, "learning_rate": 3.753218666102821e-05, "loss": 0.9081, "step": 24855 }, { "epoch": 0.33, "learning_rate": 3.752763362704308e-05, "loss": 0.5393, "step": 24860 }, { "epoch": 0.33, "learning_rate": 3.752308003814645e-05, "loss": 0.495, "step": 24865 }, { "epoch": 0.33, "learning_rate": 3.751852589454002e-05, "loss": 1.1215, "step": 24870 }, { "epoch": 0.33, "learning_rate": 3.7513971196425525e-05, "loss": 0.463, "step": 24875 }, { "epoch": 0.33, "learning_rate": 3.750941594400471e-05, "loss": 0.669, "step": 24880 }, { "epoch": 0.33, "learning_rate": 3.750486013747936e-05, "loss": 0.6337, "step": 24885 }, { "epoch": 0.33, "learning_rate": 3.7500303777051253e-05, "loss": 0.8088, "step": 24890 }, { "epoch": 0.33, "learning_rate": 3.7495746862922235e-05, "loss": 0.9268, "step": 24895 }, { "epoch": 0.33, "learning_rate": 3.7491189395294136e-05, "loss": 0.3662, "step": 24900 }, { "epoch": 0.33, "learning_rate": 3.748663137436884e-05, "loss": 0.7655, "step": 24905 }, { "epoch": 0.33, "learning_rate": 3.748207280034825e-05, "loss": 0.8145, "step": 24910 }, { "epoch": 0.33, "learning_rate": 3.747751367343428e-05, "loss": 0.8155, "step": 24915 }, { "epoch": 0.33, "learning_rate": 3.747295399382887e-05, "loss": 0.697, "step": 24920 }, { "epoch": 0.33, "learning_rate": 3.7468393761734e-05, "loss": 0.7679, "step": 24925 }, { "epoch": 0.33, "learning_rate": 3.746383297735166e-05, "loss": 0.9302, "step": 24930 }, { "epoch": 0.33, "learning_rate": 3.745927164088389e-05, "loss": 0.3735, "step": 24935 }, { "epoch": 0.33, "learning_rate": 3.745470975253271e-05, "loss": 0.8814, "step": 24940 }, { "epoch": 0.33, "learning_rate": 3.745014731250019e-05, "loss": 0.2171, "step": 24945 }, { "epoch": 0.33, "learning_rate": 3.744558432098844e-05, "loss": 1.0741, "step": 24950 }, { "epoch": 0.33, "learning_rate": 3.744102077819955e-05, "loss": 0.9237, "step": 24955 }, { "epoch": 0.33, "learning_rate": 3.7436456684335705e-05, "loss": 0.5488, "step": 24960 }, { "epoch": 0.33, "learning_rate": 3.743189203959903e-05, "loss": 0.6115, "step": 24965 }, { "epoch": 0.33, "learning_rate": 3.742732684419173e-05, "loss": 1.061, "step": 24970 }, { "epoch": 0.33, "learning_rate": 3.742276109831603e-05, "loss": 1.1368, "step": 24975 }, { "epoch": 0.33, "learning_rate": 3.741819480217417e-05, "loss": 0.8326, "step": 24980 }, { "epoch": 0.33, "learning_rate": 3.7413627955968395e-05, "loss": 1.0239, "step": 24985 }, { "epoch": 0.33, "learning_rate": 3.740906055990101e-05, "loss": 0.4666, "step": 24990 }, { "epoch": 0.33, "learning_rate": 3.740449261417432e-05, "loss": 0.8337, "step": 24995 }, { "epoch": 0.33, "learning_rate": 3.739992411899067e-05, "loss": 0.4585, "step": 25000 }, { "epoch": 0.34, "learning_rate": 3.7395355074552406e-05, "loss": 0.6289, "step": 25005 }, { "epoch": 0.34, "learning_rate": 3.739078548106193e-05, "loss": 0.6248, "step": 25010 }, { "epoch": 0.34, "learning_rate": 3.738621533872165e-05, "loss": 1.0946, "step": 25015 }, { "epoch": 0.34, "learning_rate": 3.738164464773399e-05, "loss": 0.738, "step": 25020 }, { "epoch": 0.34, "learning_rate": 3.737707340830143e-05, "loss": 1.1827, "step": 25025 }, { "epoch": 0.34, "learning_rate": 3.737250162062642e-05, "loss": 0.9645, "step": 25030 }, { "epoch": 0.34, "learning_rate": 3.7367929284911496e-05, "loss": 0.6003, "step": 25035 }, { "epoch": 0.34, "learning_rate": 3.736335640135918e-05, "loss": 0.8383, "step": 25040 }, { "epoch": 0.34, "learning_rate": 3.7358782970172025e-05, "loss": 0.4712, "step": 25045 }, { "epoch": 0.34, "learning_rate": 3.735420899155261e-05, "loss": 0.6935, "step": 25050 }, { "epoch": 0.34, "learning_rate": 3.734963446570355e-05, "loss": 0.6709, "step": 25055 }, { "epoch": 0.34, "learning_rate": 3.734505939282746e-05, "loss": 1.224, "step": 25060 }, { "epoch": 0.34, "learning_rate": 3.7340483773127e-05, "loss": 1.3794, "step": 25065 }, { "epoch": 0.34, "learning_rate": 3.733590760680485e-05, "loss": 0.9546, "step": 25070 }, { "epoch": 0.34, "learning_rate": 3.73313308940637e-05, "loss": 0.7895, "step": 25075 }, { "epoch": 0.34, "learning_rate": 3.7326753635106294e-05, "loss": 0.2234, "step": 25080 }, { "epoch": 0.34, "learning_rate": 3.732217583013536e-05, "loss": 0.4479, "step": 25085 }, { "epoch": 0.34, "learning_rate": 3.7317597479353694e-05, "loss": 0.4634, "step": 25090 }, { "epoch": 0.34, "learning_rate": 3.731301858296408e-05, "loss": 1.3039, "step": 25095 }, { "epoch": 0.34, "learning_rate": 3.730843914116934e-05, "loss": 0.6297, "step": 25100 }, { "epoch": 0.34, "learning_rate": 3.7303859154172324e-05, "loss": 0.427, "step": 25105 }, { "epoch": 0.34, "learning_rate": 3.72992786221759e-05, "loss": 0.5462, "step": 25110 }, { "epoch": 0.34, "learning_rate": 3.729469754538296e-05, "loss": 0.4477, "step": 25115 }, { "epoch": 0.34, "learning_rate": 3.729011592399643e-05, "loss": 0.5978, "step": 25120 }, { "epoch": 0.34, "learning_rate": 3.728553375821926e-05, "loss": 0.4483, "step": 25125 }, { "epoch": 0.34, "learning_rate": 3.72809510482544e-05, "loss": 0.3721, "step": 25130 }, { "epoch": 0.34, "learning_rate": 3.7276367794304846e-05, "loss": 0.4586, "step": 25135 }, { "epoch": 0.34, "learning_rate": 3.727178399657362e-05, "loss": 1.1228, "step": 25140 }, { "epoch": 0.34, "learning_rate": 3.7267199655263745e-05, "loss": 0.4032, "step": 25145 }, { "epoch": 0.34, "learning_rate": 3.7262614770578306e-05, "loss": 0.6571, "step": 25150 }, { "epoch": 0.34, "learning_rate": 3.725802934272039e-05, "loss": 1.3769, "step": 25155 }, { "epoch": 0.34, "learning_rate": 3.7253443371893084e-05, "loss": 1.2996, "step": 25160 }, { "epoch": 0.34, "learning_rate": 3.7248856858299544e-05, "loss": 0.9573, "step": 25165 }, { "epoch": 0.34, "learning_rate": 3.7244269802142925e-05, "loss": 0.4322, "step": 25170 }, { "epoch": 0.34, "learning_rate": 3.72396822036264e-05, "loss": 0.839, "step": 25175 }, { "epoch": 0.34, "learning_rate": 3.72350940629532e-05, "loss": 0.7183, "step": 25180 }, { "epoch": 0.34, "learning_rate": 3.723050538032654e-05, "loss": 0.5896, "step": 25185 }, { "epoch": 0.34, "learning_rate": 3.722591615594968e-05, "loss": 0.1468, "step": 25190 }, { "epoch": 0.34, "learning_rate": 3.722132639002589e-05, "loss": 0.5002, "step": 25195 }, { "epoch": 0.34, "learning_rate": 3.7216736082758484e-05, "loss": 0.9318, "step": 25200 }, { "epoch": 0.34, "learning_rate": 3.72121452343508e-05, "loss": 0.3283, "step": 25205 }, { "epoch": 0.34, "learning_rate": 3.720755384500617e-05, "loss": 1.2072, "step": 25210 }, { "epoch": 0.34, "learning_rate": 3.7202961914927974e-05, "loss": 0.3451, "step": 25215 }, { "epoch": 0.34, "learning_rate": 3.719836944431962e-05, "loss": 1.1923, "step": 25220 }, { "epoch": 0.34, "learning_rate": 3.719377643338452e-05, "loss": 0.1333, "step": 25225 }, { "epoch": 0.34, "learning_rate": 3.718918288232614e-05, "loss": 0.5606, "step": 25230 }, { "epoch": 0.34, "learning_rate": 3.718458879134792e-05, "loss": 1.001, "step": 25235 }, { "epoch": 0.34, "learning_rate": 3.717999416065339e-05, "loss": 0.8902, "step": 25240 }, { "epoch": 0.34, "learning_rate": 3.7175398990446045e-05, "loss": 1.0169, "step": 25245 }, { "epoch": 0.34, "learning_rate": 3.717080328092944e-05, "loss": 1.4466, "step": 25250 }, { "epoch": 0.34, "learning_rate": 3.7166207032307133e-05, "loss": 0.5957, "step": 25255 }, { "epoch": 0.34, "learning_rate": 3.716161024478273e-05, "loss": 1.1676, "step": 25260 }, { "epoch": 0.34, "learning_rate": 3.715701291855983e-05, "loss": 0.6203, "step": 25265 }, { "epoch": 0.34, "learning_rate": 3.715241505384208e-05, "loss": 0.656, "step": 25270 }, { "epoch": 0.34, "learning_rate": 3.7147816650833134e-05, "loss": 0.864, "step": 25275 }, { "epoch": 0.34, "learning_rate": 3.7143217709736686e-05, "loss": 0.6704, "step": 25280 }, { "epoch": 0.34, "learning_rate": 3.713861823075645e-05, "loss": 1.1392, "step": 25285 }, { "epoch": 0.34, "learning_rate": 3.7134018214096146e-05, "loss": 0.7649, "step": 25290 }, { "epoch": 0.34, "learning_rate": 3.7129417659959545e-05, "loss": 1.0141, "step": 25295 }, { "epoch": 0.34, "learning_rate": 3.712481656855042e-05, "loss": 0.8766, "step": 25300 }, { "epoch": 0.34, "learning_rate": 3.712021494007258e-05, "loss": 0.8754, "step": 25305 }, { "epoch": 0.34, "learning_rate": 3.711561277472985e-05, "loss": 0.921, "step": 25310 }, { "epoch": 0.34, "learning_rate": 3.711101007272609e-05, "loss": 0.4608, "step": 25315 }, { "epoch": 0.34, "learning_rate": 3.710640683426518e-05, "loss": 1.5622, "step": 25320 }, { "epoch": 0.34, "learning_rate": 3.7101803059551e-05, "loss": 0.1663, "step": 25325 }, { "epoch": 0.34, "learning_rate": 3.70971987487875e-05, "loss": 1.0434, "step": 25330 }, { "epoch": 0.34, "learning_rate": 3.7092593902178606e-05, "loss": 0.8344, "step": 25335 }, { "epoch": 0.34, "learning_rate": 3.7087988519928313e-05, "loss": 0.4787, "step": 25340 }, { "epoch": 0.34, "learning_rate": 3.70833826022406e-05, "loss": 0.8972, "step": 25345 }, { "epoch": 0.34, "learning_rate": 3.707877614931948e-05, "loss": 0.576, "step": 25350 }, { "epoch": 0.34, "learning_rate": 3.707416916136901e-05, "loss": 0.5048, "step": 25355 }, { "epoch": 0.34, "learning_rate": 3.7069561638593245e-05, "loss": 1.0268, "step": 25360 }, { "epoch": 0.34, "learning_rate": 3.706495358119629e-05, "loss": 0.7044, "step": 25365 }, { "epoch": 0.34, "learning_rate": 3.7060344989382243e-05, "loss": 0.4992, "step": 25370 }, { "epoch": 0.34, "learning_rate": 3.705573586335526e-05, "loss": 0.7311, "step": 25375 }, { "epoch": 0.34, "learning_rate": 3.705112620331948e-05, "loss": 0.8018, "step": 25380 }, { "epoch": 0.34, "learning_rate": 3.704651600947911e-05, "loss": 0.2323, "step": 25385 }, { "epoch": 0.34, "learning_rate": 3.704190528203833e-05, "loss": 0.3862, "step": 25390 }, { "epoch": 0.34, "learning_rate": 3.70372940212014e-05, "loss": 0.3348, "step": 25395 }, { "epoch": 0.34, "learning_rate": 3.703268222717257e-05, "loss": 1.0167, "step": 25400 }, { "epoch": 0.34, "learning_rate": 3.702806990015611e-05, "loss": 1.1389, "step": 25405 }, { "epoch": 0.34, "learning_rate": 3.7023457040356334e-05, "loss": 0.9082, "step": 25410 }, { "epoch": 0.34, "learning_rate": 3.701884364797755e-05, "loss": 1.3794, "step": 25415 }, { "epoch": 0.34, "learning_rate": 3.701422972322413e-05, "loss": 0.8392, "step": 25420 }, { "epoch": 0.34, "learning_rate": 3.700961526630044e-05, "loss": 0.7394, "step": 25425 }, { "epoch": 0.34, "learning_rate": 3.7005000277410875e-05, "loss": 1.3816, "step": 25430 }, { "epoch": 0.34, "learning_rate": 3.700038475675986e-05, "loss": 0.5372, "step": 25435 }, { "epoch": 0.34, "learning_rate": 3.699576870455182e-05, "loss": 0.294, "step": 25440 }, { "epoch": 0.34, "learning_rate": 3.699115212099125e-05, "loss": 0.6846, "step": 25445 }, { "epoch": 0.34, "learning_rate": 3.698653500628264e-05, "loss": 0.5982, "step": 25450 }, { "epoch": 0.34, "learning_rate": 3.698191736063048e-05, "loss": 0.1264, "step": 25455 }, { "epoch": 0.34, "learning_rate": 3.6977299184239336e-05, "loss": 0.6333, "step": 25460 }, { "epoch": 0.34, "learning_rate": 3.6972680477313757e-05, "loss": 0.4548, "step": 25465 }, { "epoch": 0.34, "learning_rate": 3.696806124005833e-05, "loss": 0.2762, "step": 25470 }, { "epoch": 0.34, "learning_rate": 3.6963441472677654e-05, "loss": 0.8023, "step": 25475 }, { "epoch": 0.34, "learning_rate": 3.695882117537638e-05, "loss": 1.5941, "step": 25480 }, { "epoch": 0.34, "learning_rate": 3.6954200348359165e-05, "loss": 1.2286, "step": 25485 }, { "epoch": 0.34, "learning_rate": 3.694957899183067e-05, "loss": 0.3596, "step": 25490 }, { "epoch": 0.34, "learning_rate": 3.6944957105995604e-05, "loss": 0.6267, "step": 25495 }, { "epoch": 0.34, "learning_rate": 3.69403346910587e-05, "loss": 0.7976, "step": 25500 }, { "epoch": 0.34, "learning_rate": 3.693571174722471e-05, "loss": 0.7497, "step": 25505 }, { "epoch": 0.34, "learning_rate": 3.693108827469839e-05, "loss": 0.9906, "step": 25510 }, { "epoch": 0.34, "learning_rate": 3.692646427368456e-05, "loss": 1.0564, "step": 25515 }, { "epoch": 0.34, "learning_rate": 3.6921839744388034e-05, "loss": 0.677, "step": 25520 }, { "epoch": 0.34, "learning_rate": 3.6917214687013635e-05, "loss": 0.8574, "step": 25525 }, { "epoch": 0.34, "learning_rate": 3.691258910176625e-05, "loss": 0.9662, "step": 25530 }, { "epoch": 0.34, "learning_rate": 3.690796298885077e-05, "loss": 1.1573, "step": 25535 }, { "epoch": 0.34, "learning_rate": 3.690333634847211e-05, "loss": 0.6715, "step": 25540 }, { "epoch": 0.34, "learning_rate": 3.689870918083518e-05, "loss": 0.9348, "step": 25545 }, { "epoch": 0.34, "learning_rate": 3.689408148614497e-05, "loss": 0.6911, "step": 25550 }, { "epoch": 0.34, "learning_rate": 3.6889453264606457e-05, "loss": 0.7139, "step": 25555 }, { "epoch": 0.34, "learning_rate": 3.6884824516424646e-05, "loss": 0.7431, "step": 25560 }, { "epoch": 0.34, "learning_rate": 3.688019524180457e-05, "loss": 0.5012, "step": 25565 }, { "epoch": 0.34, "learning_rate": 3.687556544095127e-05, "loss": 0.5865, "step": 25570 }, { "epoch": 0.34, "learning_rate": 3.687093511406984e-05, "loss": 0.4076, "step": 25575 }, { "epoch": 0.34, "learning_rate": 3.686630426136537e-05, "loss": 0.8633, "step": 25580 }, { "epoch": 0.34, "learning_rate": 3.686167288304298e-05, "loss": 0.8297, "step": 25585 }, { "epoch": 0.34, "learning_rate": 3.6857040979307834e-05, "loss": 0.1928, "step": 25590 }, { "epoch": 0.34, "learning_rate": 3.6852408550365094e-05, "loss": 0.6029, "step": 25595 }, { "epoch": 0.34, "learning_rate": 3.6847775596419935e-05, "loss": 0.3816, "step": 25600 }, { "epoch": 0.34, "learning_rate": 3.68431421176776e-05, "loss": 0.3201, "step": 25605 }, { "epoch": 0.34, "learning_rate": 3.683850811434332e-05, "loss": 0.856, "step": 25610 }, { "epoch": 0.34, "learning_rate": 3.683387358662235e-05, "loss": 0.3841, "step": 25615 }, { "epoch": 0.34, "learning_rate": 3.682923853471999e-05, "loss": 1.528, "step": 25620 }, { "epoch": 0.34, "learning_rate": 3.682460295884154e-05, "loss": 1.1839, "step": 25625 }, { "epoch": 0.34, "learning_rate": 3.681996685919233e-05, "loss": 0.4279, "step": 25630 }, { "epoch": 0.34, "learning_rate": 3.681533023597773e-05, "loss": 0.7809, "step": 25635 }, { "epoch": 0.34, "learning_rate": 3.681069308940311e-05, "loss": 0.47, "step": 25640 }, { "epoch": 0.34, "learning_rate": 3.6806055419673875e-05, "loss": 1.0999, "step": 25645 }, { "epoch": 0.34, "learning_rate": 3.680141722699544e-05, "loss": 0.5059, "step": 25650 }, { "epoch": 0.34, "learning_rate": 3.679677851157327e-05, "loss": 0.4826, "step": 25655 }, { "epoch": 0.34, "learning_rate": 3.679213927361283e-05, "loss": 0.7933, "step": 25660 }, { "epoch": 0.34, "learning_rate": 3.678749951331961e-05, "loss": 0.5034, "step": 25665 }, { "epoch": 0.34, "learning_rate": 3.678285923089913e-05, "loss": 0.5572, "step": 25670 }, { "epoch": 0.34, "learning_rate": 3.6778218426556945e-05, "loss": 0.4526, "step": 25675 }, { "epoch": 0.34, "learning_rate": 3.677357710049859e-05, "loss": 0.6359, "step": 25680 }, { "epoch": 0.34, "learning_rate": 3.6768935252929685e-05, "loss": 0.59, "step": 25685 }, { "epoch": 0.34, "learning_rate": 3.6764292884055823e-05, "loss": 0.5881, "step": 25690 }, { "epoch": 0.34, "learning_rate": 3.675964999408264e-05, "loss": 0.4125, "step": 25695 }, { "epoch": 0.34, "learning_rate": 3.67550065832158e-05, "loss": 1.1515, "step": 25700 }, { "epoch": 0.34, "learning_rate": 3.675036265166097e-05, "loss": 1.1213, "step": 25705 }, { "epoch": 0.34, "learning_rate": 3.6745718199623865e-05, "loss": 0.879, "step": 25710 }, { "epoch": 0.34, "learning_rate": 3.6741073227310194e-05, "loss": 0.5256, "step": 25715 }, { "epoch": 0.34, "learning_rate": 3.6736427734925735e-05, "loss": 1.5103, "step": 25720 }, { "epoch": 0.34, "learning_rate": 3.6731781722676226e-05, "loss": 0.9926, "step": 25725 }, { "epoch": 0.34, "learning_rate": 3.672713519076749e-05, "loss": 1.397, "step": 25730 }, { "epoch": 0.34, "learning_rate": 3.672248813940533e-05, "loss": 0.1354, "step": 25735 }, { "epoch": 0.34, "learning_rate": 3.67178405687956e-05, "loss": 0.7646, "step": 25740 }, { "epoch": 0.34, "learning_rate": 3.671319247914414e-05, "loss": 0.7609, "step": 25745 }, { "epoch": 0.35, "learning_rate": 3.670854387065686e-05, "loss": 0.8245, "step": 25750 }, { "epoch": 0.35, "learning_rate": 3.6703894743539666e-05, "loss": 0.9402, "step": 25755 }, { "epoch": 0.35, "learning_rate": 3.6699245097998485e-05, "loss": 0.4963, "step": 25760 }, { "epoch": 0.35, "learning_rate": 3.6694594934239275e-05, "loss": 0.9692, "step": 25765 }, { "epoch": 0.35, "learning_rate": 3.668994425246801e-05, "loss": 0.5942, "step": 25770 }, { "epoch": 0.35, "learning_rate": 3.668529305289071e-05, "loss": 1.1582, "step": 25775 }, { "epoch": 0.35, "learning_rate": 3.668064133571337e-05, "loss": 0.687, "step": 25780 }, { "epoch": 0.35, "learning_rate": 3.667598910114207e-05, "loss": 0.6307, "step": 25785 }, { "epoch": 0.35, "learning_rate": 3.6671336349382863e-05, "loss": 1.3139, "step": 25790 }, { "epoch": 0.35, "learning_rate": 3.6666683080641846e-05, "loss": 0.579, "step": 25795 }, { "epoch": 0.35, "learning_rate": 3.666202929512513e-05, "loss": 0.4161, "step": 25800 }, { "epoch": 0.35, "learning_rate": 3.6657374993038864e-05, "loss": 0.8353, "step": 25805 }, { "epoch": 0.35, "learning_rate": 3.665272017458921e-05, "loss": 0.5216, "step": 25810 }, { "epoch": 0.35, "learning_rate": 3.664806483998234e-05, "loss": 0.6245, "step": 25815 }, { "epoch": 0.35, "learning_rate": 3.6643408989424475e-05, "loss": 0.7449, "step": 25820 }, { "epoch": 0.35, "learning_rate": 3.663875262312184e-05, "loss": 0.4683, "step": 25825 }, { "epoch": 0.35, "learning_rate": 3.6634095741280696e-05, "loss": 0.9496, "step": 25830 }, { "epoch": 0.35, "learning_rate": 3.66294383441073e-05, "loss": 1.4436, "step": 25835 }, { "epoch": 0.35, "learning_rate": 3.6624780431807985e-05, "loss": 0.6321, "step": 25840 }, { "epoch": 0.35, "learning_rate": 3.662012200458904e-05, "loss": 0.5718, "step": 25845 }, { "epoch": 0.35, "learning_rate": 3.661546306265684e-05, "loss": 0.4895, "step": 25850 }, { "epoch": 0.35, "learning_rate": 3.661080360621771e-05, "loss": 0.6625, "step": 25855 }, { "epoch": 0.35, "learning_rate": 3.6606143635478086e-05, "loss": 0.4645, "step": 25860 }, { "epoch": 0.35, "learning_rate": 3.660148315064437e-05, "loss": 0.8321, "step": 25865 }, { "epoch": 0.35, "learning_rate": 3.659682215192298e-05, "loss": 0.7821, "step": 25870 }, { "epoch": 0.35, "learning_rate": 3.659216063952038e-05, "loss": 0.7061, "step": 25875 }, { "epoch": 0.35, "learning_rate": 3.6587498613643064e-05, "loss": 0.7197, "step": 25880 }, { "epoch": 0.35, "learning_rate": 3.658283607449753e-05, "loss": 1.8254, "step": 25885 }, { "epoch": 0.35, "learning_rate": 3.65781730222903e-05, "loss": 0.9511, "step": 25890 }, { "epoch": 0.35, "learning_rate": 3.657350945722794e-05, "loss": 0.8292, "step": 25895 }, { "epoch": 0.35, "learning_rate": 3.6568845379517006e-05, "loss": 0.5741, "step": 25900 }, { "epoch": 0.35, "learning_rate": 3.6564180789364095e-05, "loss": 0.0676, "step": 25905 }, { "epoch": 0.35, "learning_rate": 3.655951568697583e-05, "loss": 0.5319, "step": 25910 }, { "epoch": 0.35, "learning_rate": 3.655485007255884e-05, "loss": 1.6935, "step": 25915 }, { "epoch": 0.35, "learning_rate": 3.655018394631982e-05, "loss": 0.6139, "step": 25920 }, { "epoch": 0.35, "learning_rate": 3.654551730846543e-05, "loss": 0.8873, "step": 25925 }, { "epoch": 0.35, "learning_rate": 3.654085015920238e-05, "loss": 0.6035, "step": 25930 }, { "epoch": 0.35, "learning_rate": 3.65361824987374e-05, "loss": 0.5518, "step": 25935 }, { "epoch": 0.35, "learning_rate": 3.6531514327277247e-05, "loss": 0.3816, "step": 25940 }, { "epoch": 0.35, "learning_rate": 3.652684564502871e-05, "loss": 0.4501, "step": 25945 }, { "epoch": 0.35, "learning_rate": 3.6522176452198576e-05, "loss": 0.3587, "step": 25950 }, { "epoch": 0.35, "learning_rate": 3.651750674899366e-05, "loss": 0.4657, "step": 25955 }, { "epoch": 0.35, "learning_rate": 3.651283653562083e-05, "loss": 0.3683, "step": 25960 }, { "epoch": 0.35, "learning_rate": 3.6508165812286925e-05, "loss": 0.7415, "step": 25965 }, { "epoch": 0.35, "learning_rate": 3.650349457919885e-05, "loss": 0.6527, "step": 25970 }, { "epoch": 0.35, "learning_rate": 3.649882283656352e-05, "loss": 1.2408, "step": 25975 }, { "epoch": 0.35, "learning_rate": 3.649415058458787e-05, "loss": 1.1006, "step": 25980 }, { "epoch": 0.35, "learning_rate": 3.6489477823478845e-05, "loss": 1.1943, "step": 25985 }, { "epoch": 0.35, "learning_rate": 3.648480455344343e-05, "loss": 0.6399, "step": 25990 }, { "epoch": 0.35, "learning_rate": 3.6480130774688634e-05, "loss": 0.65, "step": 25995 }, { "epoch": 0.35, "learning_rate": 3.647545648742148e-05, "loss": 0.5918, "step": 26000 }, { "epoch": 0.35, "learning_rate": 3.647078169184901e-05, "loss": 0.7159, "step": 26005 }, { "epoch": 0.35, "learning_rate": 3.64661063881783e-05, "loss": 0.4211, "step": 26010 }, { "epoch": 0.35, "learning_rate": 3.646143057661644e-05, "loss": 0.9223, "step": 26015 }, { "epoch": 0.35, "learning_rate": 3.645675425737054e-05, "loss": 0.9391, "step": 26020 }, { "epoch": 0.35, "learning_rate": 3.6452077430647746e-05, "loss": 0.5509, "step": 26025 }, { "epoch": 0.35, "learning_rate": 3.6447400096655214e-05, "loss": 0.8542, "step": 26030 }, { "epoch": 0.35, "learning_rate": 3.6442722255600136e-05, "loss": 1.0352, "step": 26035 }, { "epoch": 0.35, "learning_rate": 3.64380439076897e-05, "loss": 0.9971, "step": 26040 }, { "epoch": 0.35, "learning_rate": 3.643336505313114e-05, "loss": 0.5534, "step": 26045 }, { "epoch": 0.35, "learning_rate": 3.6428685692131714e-05, "loss": 1.1888, "step": 26050 }, { "epoch": 0.35, "learning_rate": 3.642400582489868e-05, "loss": 0.5516, "step": 26055 }, { "epoch": 0.35, "learning_rate": 3.6419325451639344e-05, "loss": 0.9723, "step": 26060 }, { "epoch": 0.35, "learning_rate": 3.641464457256102e-05, "loss": 0.7129, "step": 26065 }, { "epoch": 0.35, "learning_rate": 3.640996318787105e-05, "loss": 1.3546, "step": 26070 }, { "epoch": 0.35, "learning_rate": 3.640528129777679e-05, "loss": 0.8021, "step": 26075 }, { "epoch": 0.35, "learning_rate": 3.640059890248562e-05, "loss": 1.0214, "step": 26080 }, { "epoch": 0.35, "learning_rate": 3.639591600220497e-05, "loss": 0.8388, "step": 26085 }, { "epoch": 0.35, "learning_rate": 3.639123259714224e-05, "loss": 0.6178, "step": 26090 }, { "epoch": 0.35, "learning_rate": 3.63865486875049e-05, "loss": 0.3919, "step": 26095 }, { "epoch": 0.35, "learning_rate": 3.638186427350041e-05, "loss": 1.1609, "step": 26100 }, { "epoch": 0.35, "learning_rate": 3.637717935533629e-05, "loss": 0.4439, "step": 26105 }, { "epoch": 0.35, "learning_rate": 3.637249393322003e-05, "loss": 0.3028, "step": 26110 }, { "epoch": 0.35, "learning_rate": 3.6367808007359195e-05, "loss": 0.9115, "step": 26115 }, { "epoch": 0.35, "learning_rate": 3.6363121577961325e-05, "loss": 0.6691, "step": 26120 }, { "epoch": 0.35, "learning_rate": 3.635843464523402e-05, "loss": 0.4499, "step": 26125 }, { "epoch": 0.35, "learning_rate": 3.635374720938489e-05, "loss": 0.3682, "step": 26130 }, { "epoch": 0.35, "learning_rate": 3.634905927062155e-05, "loss": 0.9254, "step": 26135 }, { "epoch": 0.35, "learning_rate": 3.634437082915168e-05, "loss": 0.9871, "step": 26140 }, { "epoch": 0.35, "learning_rate": 3.633968188518292e-05, "loss": 0.6867, "step": 26145 }, { "epoch": 0.35, "learning_rate": 3.633499243892299e-05, "loss": 0.3516, "step": 26150 }, { "epoch": 0.35, "learning_rate": 3.6330302490579595e-05, "loss": 0.5371, "step": 26155 }, { "epoch": 0.35, "learning_rate": 3.632561204036049e-05, "loss": 0.404, "step": 26160 }, { "epoch": 0.35, "learning_rate": 3.632092108847342e-05, "loss": 0.2862, "step": 26165 }, { "epoch": 0.35, "learning_rate": 3.63162296351262e-05, "loss": 0.6461, "step": 26170 }, { "epoch": 0.35, "learning_rate": 3.6311537680526606e-05, "loss": 0.7399, "step": 26175 }, { "epoch": 0.35, "learning_rate": 3.6306845224882496e-05, "loss": 0.8609, "step": 26180 }, { "epoch": 0.35, "learning_rate": 3.63021522684017e-05, "loss": 0.9501, "step": 26185 }, { "epoch": 0.35, "learning_rate": 3.62974588112921e-05, "loss": 0.7248, "step": 26190 }, { "epoch": 0.35, "learning_rate": 3.62927648537616e-05, "loss": 1.6832, "step": 26195 }, { "epoch": 0.35, "learning_rate": 3.628807039601811e-05, "loss": 0.2546, "step": 26200 }, { "epoch": 0.35, "learning_rate": 3.6283375438269576e-05, "loss": 0.6694, "step": 26205 }, { "epoch": 0.35, "learning_rate": 3.627867998072396e-05, "loss": 1.1886, "step": 26210 }, { "epoch": 0.35, "learning_rate": 3.627398402358924e-05, "loss": 1.1765, "step": 26215 }, { "epoch": 0.35, "learning_rate": 3.626928756707343e-05, "loss": 1.42, "step": 26220 }, { "epoch": 0.35, "learning_rate": 3.626459061138457e-05, "loss": 0.7918, "step": 26225 }, { "epoch": 0.35, "learning_rate": 3.6259893156730696e-05, "loss": 0.9894, "step": 26230 }, { "epoch": 0.35, "learning_rate": 3.625519520331988e-05, "loss": 0.988, "step": 26235 }, { "epoch": 0.35, "learning_rate": 3.625049675136023e-05, "loss": 0.3355, "step": 26240 }, { "epoch": 0.35, "learning_rate": 3.624579780105986e-05, "loss": 0.9665, "step": 26245 }, { "epoch": 0.35, "learning_rate": 3.62410983526269e-05, "loss": 0.3727, "step": 26250 }, { "epoch": 0.35, "learning_rate": 3.623639840626953e-05, "loss": 0.3487, "step": 26255 }, { "epoch": 0.35, "learning_rate": 3.623169796219592e-05, "loss": 0.5174, "step": 26260 }, { "epoch": 0.35, "learning_rate": 3.622699702061428e-05, "loss": 0.7892, "step": 26265 }, { "epoch": 0.35, "learning_rate": 3.622229558173284e-05, "loss": 0.4766, "step": 26270 }, { "epoch": 0.35, "learning_rate": 3.621759364575985e-05, "loss": 1.034, "step": 26275 }, { "epoch": 0.35, "learning_rate": 3.6212891212903583e-05, "loss": 1.0407, "step": 26280 }, { "epoch": 0.35, "learning_rate": 3.620818828337233e-05, "loss": 1.3402, "step": 26285 }, { "epoch": 0.35, "learning_rate": 3.62034848573744e-05, "loss": 0.9117, "step": 26290 }, { "epoch": 0.35, "learning_rate": 3.619878093511815e-05, "loss": 1.3666, "step": 26295 }, { "epoch": 0.35, "learning_rate": 3.619407651681193e-05, "loss": 0.4851, "step": 26300 }, { "epoch": 0.35, "learning_rate": 3.618937160266412e-05, "loss": 1.0405, "step": 26305 }, { "epoch": 0.35, "learning_rate": 3.618466619288313e-05, "loss": 0.9162, "step": 26310 }, { "epoch": 0.35, "learning_rate": 3.617996028767738e-05, "loss": 0.4314, "step": 26315 }, { "epoch": 0.35, "learning_rate": 3.617525388725532e-05, "loss": 0.4532, "step": 26320 }, { "epoch": 0.35, "learning_rate": 3.6170546991825425e-05, "loss": 0.932, "step": 26325 }, { "epoch": 0.35, "learning_rate": 3.616583960159618e-05, "loss": 0.6391, "step": 26330 }, { "epoch": 0.35, "learning_rate": 3.61611317167761e-05, "loss": 1.1319, "step": 26335 }, { "epoch": 0.35, "learning_rate": 3.615642333757373e-05, "loss": 0.5531, "step": 26340 }, { "epoch": 0.35, "learning_rate": 3.61517144641976e-05, "loss": 1.0274, "step": 26345 }, { "epoch": 0.35, "learning_rate": 3.614700509685633e-05, "loss": 0.9217, "step": 26350 }, { "epoch": 0.35, "learning_rate": 3.6142295235758496e-05, "loss": 0.2014, "step": 26355 }, { "epoch": 0.35, "learning_rate": 3.613758488111272e-05, "loss": 0.5293, "step": 26360 }, { "epoch": 0.35, "learning_rate": 3.613287403312766e-05, "loss": 0.5018, "step": 26365 }, { "epoch": 0.35, "learning_rate": 3.612816269201197e-05, "loss": 0.2083, "step": 26370 }, { "epoch": 0.35, "learning_rate": 3.6123450857974354e-05, "loss": 0.4089, "step": 26375 }, { "epoch": 0.35, "learning_rate": 3.6118738531223504e-05, "loss": 0.4858, "step": 26380 }, { "epoch": 0.35, "learning_rate": 3.611402571196817e-05, "loss": 0.4087, "step": 26385 }, { "epoch": 0.35, "learning_rate": 3.61093124004171e-05, "loss": 0.564, "step": 26390 }, { "epoch": 0.35, "learning_rate": 3.610459859677906e-05, "loss": 0.9541, "step": 26395 }, { "epoch": 0.35, "learning_rate": 3.609988430126286e-05, "loss": 0.7324, "step": 26400 }, { "epoch": 0.35, "learning_rate": 3.609516951407732e-05, "loss": 0.9133, "step": 26405 }, { "epoch": 0.35, "learning_rate": 3.609045423543127e-05, "loss": 0.9995, "step": 26410 }, { "epoch": 0.35, "learning_rate": 3.60857384655336e-05, "loss": 0.3894, "step": 26415 }, { "epoch": 0.35, "learning_rate": 3.608102220459316e-05, "loss": 0.4962, "step": 26420 }, { "epoch": 0.35, "learning_rate": 3.607630545281887e-05, "loss": 0.509, "step": 26425 }, { "epoch": 0.35, "learning_rate": 3.607158821041967e-05, "loss": 0.6231, "step": 26430 }, { "epoch": 0.35, "learning_rate": 3.6066870477604504e-05, "loss": 0.5876, "step": 26435 }, { "epoch": 0.35, "learning_rate": 3.606215225458233e-05, "loss": 0.5014, "step": 26440 }, { "epoch": 0.35, "learning_rate": 3.605743354156217e-05, "loss": 0.3262, "step": 26445 }, { "epoch": 0.35, "learning_rate": 3.6052714338753005e-05, "loss": 0.3089, "step": 26450 }, { "epoch": 0.35, "learning_rate": 3.60479946463639e-05, "loss": 0.7378, "step": 26455 }, { "epoch": 0.35, "learning_rate": 3.6043274464603904e-05, "loss": 0.8143, "step": 26460 }, { "epoch": 0.35, "learning_rate": 3.603855379368209e-05, "loss": 0.8192, "step": 26465 }, { "epoch": 0.35, "learning_rate": 3.6033832633807576e-05, "loss": 1.2463, "step": 26470 }, { "epoch": 0.35, "learning_rate": 3.6029110985189474e-05, "loss": 0.1497, "step": 26475 }, { "epoch": 0.35, "learning_rate": 3.6024388848036926e-05, "loss": 0.5135, "step": 26480 }, { "epoch": 0.35, "learning_rate": 3.601966622255911e-05, "loss": 1.2019, "step": 26485 }, { "epoch": 0.35, "learning_rate": 3.6014943108965216e-05, "loss": 1.2265, "step": 26490 }, { "epoch": 0.35, "learning_rate": 3.601021950746444e-05, "loss": 0.7158, "step": 26495 }, { "epoch": 0.36, "learning_rate": 3.600549541826602e-05, "loss": 0.7894, "step": 26500 }, { "epoch": 0.36, "learning_rate": 3.6000770841579214e-05, "loss": 1.1744, "step": 26505 }, { "epoch": 0.36, "learning_rate": 3.5996045777613293e-05, "loss": 1.2237, "step": 26510 }, { "epoch": 0.36, "learning_rate": 3.599132022657757e-05, "loss": 0.627, "step": 26515 }, { "epoch": 0.36, "learning_rate": 3.5986594188681335e-05, "loss": 0.8804, "step": 26520 }, { "epoch": 0.36, "learning_rate": 3.598186766413395e-05, "loss": 0.8367, "step": 26525 }, { "epoch": 0.36, "learning_rate": 3.597714065314476e-05, "loss": 0.7179, "step": 26530 }, { "epoch": 0.36, "learning_rate": 3.597241315592316e-05, "loss": 0.8129, "step": 26535 }, { "epoch": 0.36, "learning_rate": 3.5967685172678546e-05, "loss": 0.5557, "step": 26540 }, { "epoch": 0.36, "learning_rate": 3.5962956703620356e-05, "loss": 0.4957, "step": 26545 }, { "epoch": 0.36, "learning_rate": 3.595822774895802e-05, "loss": 0.5288, "step": 26550 }, { "epoch": 0.36, "learning_rate": 3.595444423573394e-05, "loss": 0.9559, "step": 26555 }, { "epoch": 0.36, "learning_rate": 3.594971440751205e-05, "loss": 0.9123, "step": 26560 }, { "epoch": 0.36, "learning_rate": 3.5944984094272584e-05, "loss": 0.4674, "step": 26565 }, { "epoch": 0.36, "learning_rate": 3.594025329622507e-05, "loss": 0.2576, "step": 26570 }, { "epoch": 0.36, "learning_rate": 3.593552201357908e-05, "loss": 0.3848, "step": 26575 }, { "epoch": 0.36, "learning_rate": 3.593079024654416e-05, "loss": 0.3784, "step": 26580 }, { "epoch": 0.36, "learning_rate": 3.5926057995329935e-05, "loss": 0.3355, "step": 26585 }, { "epoch": 0.36, "learning_rate": 3.592132526014599e-05, "loss": 1.2201, "step": 26590 }, { "epoch": 0.36, "learning_rate": 3.591659204120197e-05, "loss": 0.4852, "step": 26595 }, { "epoch": 0.36, "learning_rate": 3.5911858338707546e-05, "loss": 0.7287, "step": 26600 }, { "epoch": 0.36, "learning_rate": 3.590712415287239e-05, "loss": 0.4553, "step": 26605 }, { "epoch": 0.36, "learning_rate": 3.5902389483906196e-05, "loss": 0.4179, "step": 26610 }, { "epoch": 0.36, "learning_rate": 3.5897654332018695e-05, "loss": 0.9915, "step": 26615 }, { "epoch": 0.36, "learning_rate": 3.589291869741961e-05, "loss": 0.7967, "step": 26620 }, { "epoch": 0.36, "learning_rate": 3.5888182580318736e-05, "loss": 0.6751, "step": 26625 }, { "epoch": 0.36, "learning_rate": 3.588344598092584e-05, "loss": 0.6398, "step": 26630 }, { "epoch": 0.36, "learning_rate": 3.587870889945074e-05, "loss": 0.2999, "step": 26635 }, { "epoch": 0.36, "learning_rate": 3.587397133610326e-05, "loss": 0.4966, "step": 26640 }, { "epoch": 0.36, "learning_rate": 3.586923329109325e-05, "loss": 0.6976, "step": 26645 }, { "epoch": 0.36, "learning_rate": 3.586449476463058e-05, "loss": 0.8115, "step": 26650 }, { "epoch": 0.36, "learning_rate": 3.585975575692515e-05, "loss": 0.2324, "step": 26655 }, { "epoch": 0.36, "learning_rate": 3.585501626818687e-05, "loss": 0.3011, "step": 26660 }, { "epoch": 0.36, "learning_rate": 3.5850276298625666e-05, "loss": 1.4015, "step": 26665 }, { "epoch": 0.36, "learning_rate": 3.5845535848451514e-05, "loss": 0.8469, "step": 26670 }, { "epoch": 0.36, "learning_rate": 3.584079491787438e-05, "loss": 0.7024, "step": 26675 }, { "epoch": 0.36, "learning_rate": 3.583605350710426e-05, "loss": 0.8288, "step": 26680 }, { "epoch": 0.36, "learning_rate": 3.583131161635119e-05, "loss": 0.7614, "step": 26685 }, { "epoch": 0.36, "learning_rate": 3.582656924582519e-05, "loss": 0.8502, "step": 26690 }, { "epoch": 0.36, "learning_rate": 3.5821826395736355e-05, "loss": 1.183, "step": 26695 }, { "epoch": 0.36, "learning_rate": 3.5817083066294734e-05, "loss": 0.6774, "step": 26700 }, { "epoch": 0.36, "learning_rate": 3.5812339257710455e-05, "loss": 1.0444, "step": 26705 }, { "epoch": 0.36, "learning_rate": 3.5807594970193634e-05, "loss": 0.6386, "step": 26710 }, { "epoch": 0.36, "learning_rate": 3.580285020395443e-05, "loss": 0.614, "step": 26715 }, { "epoch": 0.36, "learning_rate": 3.579810495920301e-05, "loss": 1.0423, "step": 26720 }, { "epoch": 0.36, "learning_rate": 3.5793359236149557e-05, "loss": 0.3723, "step": 26725 }, { "epoch": 0.36, "learning_rate": 3.578861303500429e-05, "loss": 1.5825, "step": 26730 }, { "epoch": 0.36, "learning_rate": 3.5783866355977436e-05, "loss": 0.5901, "step": 26735 }, { "epoch": 0.36, "learning_rate": 3.577911919927926e-05, "loss": 1.2933, "step": 26740 }, { "epoch": 0.36, "learning_rate": 3.577437156512002e-05, "loss": 0.7702, "step": 26745 }, { "epoch": 0.36, "learning_rate": 3.576962345371003e-05, "loss": 0.3028, "step": 26750 }, { "epoch": 0.36, "learning_rate": 3.576487486525959e-05, "loss": 0.5622, "step": 26755 }, { "epoch": 0.36, "learning_rate": 3.576012579997905e-05, "loss": 0.5063, "step": 26760 }, { "epoch": 0.36, "learning_rate": 3.5755376258078777e-05, "loss": 0.5232, "step": 26765 }, { "epoch": 0.36, "learning_rate": 3.575062623976914e-05, "loss": 0.8166, "step": 26770 }, { "epoch": 0.36, "learning_rate": 3.574587574526054e-05, "loss": 1.2654, "step": 26775 }, { "epoch": 0.36, "learning_rate": 3.574112477476341e-05, "loss": 0.6519, "step": 26780 }, { "epoch": 0.36, "learning_rate": 3.5736373328488184e-05, "loss": 0.1109, "step": 26785 }, { "epoch": 0.36, "learning_rate": 3.573162140664533e-05, "loss": 1.3798, "step": 26790 }, { "epoch": 0.36, "learning_rate": 3.5726869009445346e-05, "loss": 0.5884, "step": 26795 }, { "epoch": 0.36, "learning_rate": 3.5722116137098725e-05, "loss": 0.9327, "step": 26800 }, { "epoch": 0.36, "learning_rate": 3.5717362789816e-05, "loss": 1.3185, "step": 26805 }, { "epoch": 0.36, "learning_rate": 3.571260896780772e-05, "loss": 0.6561, "step": 26810 }, { "epoch": 0.36, "learning_rate": 3.570785467128445e-05, "loss": 0.4103, "step": 26815 }, { "epoch": 0.36, "learning_rate": 3.57030999004568e-05, "loss": 0.6356, "step": 26820 }, { "epoch": 0.36, "learning_rate": 3.569834465553536e-05, "loss": 0.5268, "step": 26825 }, { "epoch": 0.36, "learning_rate": 3.569358893673078e-05, "loss": 0.4067, "step": 26830 }, { "epoch": 0.36, "learning_rate": 3.568883274425371e-05, "loss": 0.6636, "step": 26835 }, { "epoch": 0.36, "learning_rate": 3.568407607831482e-05, "loss": 0.8749, "step": 26840 }, { "epoch": 0.36, "learning_rate": 3.567931893912481e-05, "loss": 0.4932, "step": 26845 }, { "epoch": 0.36, "learning_rate": 3.5674561326894394e-05, "loss": 0.5239, "step": 26850 }, { "epoch": 0.36, "learning_rate": 3.566980324183432e-05, "loss": 0.2593, "step": 26855 }, { "epoch": 0.36, "learning_rate": 3.566504468415535e-05, "loss": 0.7366, "step": 26860 }, { "epoch": 0.36, "learning_rate": 3.566028565406824e-05, "loss": 0.9911, "step": 26865 }, { "epoch": 0.36, "learning_rate": 3.5655526151783814e-05, "loss": 0.8148, "step": 26870 }, { "epoch": 0.36, "learning_rate": 3.565076617751289e-05, "loss": 0.7483, "step": 26875 }, { "epoch": 0.36, "learning_rate": 3.564600573146631e-05, "loss": 0.8011, "step": 26880 }, { "epoch": 0.36, "learning_rate": 3.564124481385493e-05, "loss": 0.5418, "step": 26885 }, { "epoch": 0.36, "learning_rate": 3.5636483424889646e-05, "loss": 0.2303, "step": 26890 }, { "epoch": 0.36, "learning_rate": 3.563172156478135e-05, "loss": 0.6319, "step": 26895 }, { "epoch": 0.36, "learning_rate": 3.562695923374099e-05, "loss": 0.9214, "step": 26900 }, { "epoch": 0.36, "learning_rate": 3.562219643197949e-05, "loss": 0.9045, "step": 26905 }, { "epoch": 0.36, "learning_rate": 3.561743315970784e-05, "loss": 1.1255, "step": 26910 }, { "epoch": 0.36, "learning_rate": 3.5612669417137015e-05, "loss": 0.8647, "step": 26915 }, { "epoch": 0.36, "learning_rate": 3.560790520447802e-05, "loss": 1.4159, "step": 26920 }, { "epoch": 0.36, "learning_rate": 3.56031405219419e-05, "loss": 0.822, "step": 26925 }, { "epoch": 0.36, "learning_rate": 3.55983753697397e-05, "loss": 0.7975, "step": 26930 }, { "epoch": 0.36, "learning_rate": 3.559360974808249e-05, "loss": 1.2258, "step": 26935 }, { "epoch": 0.36, "learning_rate": 3.558884365718137e-05, "loss": 0.7869, "step": 26940 }, { "epoch": 0.36, "learning_rate": 3.5584077097247454e-05, "loss": 1.2144, "step": 26945 }, { "epoch": 0.36, "learning_rate": 3.557931006849187e-05, "loss": 0.7817, "step": 26950 }, { "epoch": 0.36, "learning_rate": 3.557454257112578e-05, "loss": 0.7054, "step": 26955 }, { "epoch": 0.36, "learning_rate": 3.556977460536035e-05, "loss": 0.5785, "step": 26960 }, { "epoch": 0.36, "learning_rate": 3.556500617140679e-05, "loss": 1.237, "step": 26965 }, { "epoch": 0.36, "learning_rate": 3.556023726947631e-05, "loss": 0.5291, "step": 26970 }, { "epoch": 0.36, "learning_rate": 3.555546789978015e-05, "loss": 0.7406, "step": 26975 }, { "epoch": 0.36, "learning_rate": 3.5550698062529564e-05, "loss": 1.4706, "step": 26980 }, { "epoch": 0.36, "learning_rate": 3.5545927757935844e-05, "loss": 0.4556, "step": 26985 }, { "epoch": 0.36, "learning_rate": 3.5541156986210283e-05, "loss": 0.7256, "step": 26990 }, { "epoch": 0.36, "learning_rate": 3.55363857475642e-05, "loss": 0.9043, "step": 26995 }, { "epoch": 0.36, "learning_rate": 3.553161404220894e-05, "loss": 0.4806, "step": 27000 }, { "epoch": 0.36, "learning_rate": 3.552684187035587e-05, "loss": 0.4908, "step": 27005 }, { "epoch": 0.36, "learning_rate": 3.5522069232216365e-05, "loss": 1.2424, "step": 27010 }, { "epoch": 0.36, "learning_rate": 3.551729612800184e-05, "loss": 0.3123, "step": 27015 }, { "epoch": 0.36, "learning_rate": 3.5512522557923705e-05, "loss": 0.5672, "step": 27020 }, { "epoch": 0.36, "learning_rate": 3.550774852219342e-05, "loss": 0.6169, "step": 27025 }, { "epoch": 0.36, "learning_rate": 3.550297402102244e-05, "loss": 0.8161, "step": 27030 }, { "epoch": 0.36, "learning_rate": 3.549819905462225e-05, "loss": 0.5842, "step": 27035 }, { "epoch": 0.36, "learning_rate": 3.549342362320437e-05, "loss": 0.7297, "step": 27040 }, { "epoch": 0.36, "learning_rate": 3.548864772698033e-05, "loss": 0.9277, "step": 27045 }, { "epoch": 0.36, "learning_rate": 3.548387136616165e-05, "loss": 0.5882, "step": 27050 }, { "epoch": 0.36, "learning_rate": 3.5479094540959924e-05, "loss": 0.9084, "step": 27055 }, { "epoch": 0.36, "learning_rate": 3.547431725158674e-05, "loss": 1.0114, "step": 27060 }, { "epoch": 0.36, "learning_rate": 3.5469539498253704e-05, "loss": 1.3494, "step": 27065 }, { "epoch": 0.36, "learning_rate": 3.546476128117244e-05, "loss": 1.1549, "step": 27070 }, { "epoch": 0.36, "learning_rate": 3.5459982600554606e-05, "loss": 1.0997, "step": 27075 }, { "epoch": 0.36, "learning_rate": 3.5455203456611874e-05, "loss": 0.8618, "step": 27080 }, { "epoch": 0.36, "learning_rate": 3.545042384955593e-05, "loss": 0.0825, "step": 27085 }, { "epoch": 0.36, "learning_rate": 3.5445643779598495e-05, "loss": 0.4421, "step": 27090 }, { "epoch": 0.36, "learning_rate": 3.54408632469513e-05, "loss": 1.4398, "step": 27095 }, { "epoch": 0.36, "learning_rate": 3.5436082251826095e-05, "loss": 1.5708, "step": 27100 }, { "epoch": 0.36, "learning_rate": 3.5431300794434655e-05, "loss": 0.9465, "step": 27105 }, { "epoch": 0.36, "learning_rate": 3.542651887498878e-05, "loss": 0.6775, "step": 27110 }, { "epoch": 0.36, "learning_rate": 3.542173649370028e-05, "loss": 0.9839, "step": 27115 }, { "epoch": 0.36, "learning_rate": 3.5416953650780985e-05, "loss": 0.651, "step": 27120 }, { "epoch": 0.36, "learning_rate": 3.541217034644277e-05, "loss": 0.2243, "step": 27125 }, { "epoch": 0.36, "learning_rate": 3.540738658089749e-05, "loss": 0.258, "step": 27130 }, { "epoch": 0.36, "learning_rate": 3.540260235435706e-05, "loss": 0.8341, "step": 27135 }, { "epoch": 0.36, "learning_rate": 3.539781766703337e-05, "loss": 0.3246, "step": 27140 }, { "epoch": 0.36, "learning_rate": 3.5393032519138395e-05, "loss": 0.799, "step": 27145 }, { "epoch": 0.36, "learning_rate": 3.5388246910884066e-05, "loss": 0.4785, "step": 27150 }, { "epoch": 0.36, "learning_rate": 3.5383460842482376e-05, "loss": 0.5415, "step": 27155 }, { "epoch": 0.36, "learning_rate": 3.5378674314145306e-05, "loss": 0.8006, "step": 27160 }, { "epoch": 0.36, "learning_rate": 3.5373887326084884e-05, "loss": 0.7167, "step": 27165 }, { "epoch": 0.36, "learning_rate": 3.536909987851317e-05, "loss": 0.9454, "step": 27170 }, { "epoch": 0.36, "learning_rate": 3.536431197164219e-05, "loss": 0.4842, "step": 27175 }, { "epoch": 0.36, "learning_rate": 3.535952360568405e-05, "loss": 1.0965, "step": 27180 }, { "epoch": 0.36, "learning_rate": 3.535473478085084e-05, "loss": 0.7922, "step": 27185 }, { "epoch": 0.36, "learning_rate": 3.534994549735469e-05, "loss": 0.4982, "step": 27190 }, { "epoch": 0.36, "learning_rate": 3.5345155755407725e-05, "loss": 0.3794, "step": 27195 }, { "epoch": 0.36, "learning_rate": 3.534036555522211e-05, "loss": 0.8957, "step": 27200 }, { "epoch": 0.36, "learning_rate": 3.5335574897010036e-05, "loss": 0.3869, "step": 27205 }, { "epoch": 0.36, "learning_rate": 3.533078378098371e-05, "loss": 0.347, "step": 27210 }, { "epoch": 0.36, "learning_rate": 3.532599220735534e-05, "loss": 0.3976, "step": 27215 }, { "epoch": 0.36, "learning_rate": 3.5321200176337165e-05, "loss": 0.4415, "step": 27220 }, { "epoch": 0.36, "learning_rate": 3.5316407688141464e-05, "loss": 0.3603, "step": 27225 }, { "epoch": 0.36, "learning_rate": 3.5311614742980514e-05, "loss": 0.7458, "step": 27230 }, { "epoch": 0.36, "learning_rate": 3.530682134106663e-05, "loss": 0.7052, "step": 27235 }, { "epoch": 0.36, "learning_rate": 3.530202748261211e-05, "loss": 0.6889, "step": 27240 }, { "epoch": 0.37, "learning_rate": 3.5297233167829314e-05, "loss": 0.4984, "step": 27245 }, { "epoch": 0.37, "learning_rate": 3.529243839693061e-05, "loss": 0.7056, "step": 27250 }, { "epoch": 0.37, "learning_rate": 3.5287643170128365e-05, "loss": 1.494, "step": 27255 }, { "epoch": 0.37, "learning_rate": 3.5282847487635007e-05, "loss": 1.3827, "step": 27260 }, { "epoch": 0.37, "learning_rate": 3.527805134966294e-05, "loss": 0.3802, "step": 27265 }, { "epoch": 0.37, "learning_rate": 3.527325475642462e-05, "loss": 0.6674, "step": 27270 }, { "epoch": 0.37, "learning_rate": 3.526845770813251e-05, "loss": 0.9448, "step": 27275 }, { "epoch": 0.37, "learning_rate": 3.526366020499911e-05, "loss": 0.5735, "step": 27280 }, { "epoch": 0.37, "learning_rate": 3.525886224723689e-05, "loss": 0.7558, "step": 27285 }, { "epoch": 0.37, "learning_rate": 3.5254063835058406e-05, "loss": 0.6964, "step": 27290 }, { "epoch": 0.37, "learning_rate": 3.5249264968676185e-05, "loss": 0.5992, "step": 27295 }, { "epoch": 0.37, "learning_rate": 3.524446564830281e-05, "loss": 0.4577, "step": 27300 }, { "epoch": 0.37, "learning_rate": 3.5239665874150854e-05, "loss": 1.1597, "step": 27305 }, { "epoch": 0.37, "learning_rate": 3.523486564643292e-05, "loss": 0.7086, "step": 27310 }, { "epoch": 0.37, "learning_rate": 3.5230064965361656e-05, "loss": 0.677, "step": 27315 }, { "epoch": 0.37, "learning_rate": 3.522526383114969e-05, "loss": 0.1747, "step": 27320 }, { "epoch": 0.37, "learning_rate": 3.522046224400969e-05, "loss": 0.9482, "step": 27325 }, { "epoch": 0.37, "learning_rate": 3.521566020415434e-05, "loss": 1.4685, "step": 27330 }, { "epoch": 0.37, "learning_rate": 3.521085771179635e-05, "loss": 0.4057, "step": 27335 }, { "epoch": 0.37, "learning_rate": 3.520605476714845e-05, "loss": 0.2727, "step": 27340 }, { "epoch": 0.37, "learning_rate": 3.520125137042339e-05, "loss": 0.7599, "step": 27345 }, { "epoch": 0.37, "learning_rate": 3.519644752183392e-05, "loss": 0.383, "step": 27350 }, { "epoch": 0.37, "learning_rate": 3.519164322159284e-05, "loss": 0.9041, "step": 27355 }, { "epoch": 0.37, "learning_rate": 3.5186838469912944e-05, "loss": 0.5179, "step": 27360 }, { "epoch": 0.37, "learning_rate": 3.518203326700707e-05, "loss": 1.4313, "step": 27365 }, { "epoch": 0.37, "learning_rate": 3.517722761308807e-05, "loss": 0.8923, "step": 27370 }, { "epoch": 0.37, "learning_rate": 3.5172421508368805e-05, "loss": 0.7582, "step": 27375 }, { "epoch": 0.37, "learning_rate": 3.516761495306214e-05, "loss": 0.9101, "step": 27380 }, { "epoch": 0.37, "learning_rate": 3.516280794738101e-05, "loss": 0.867, "step": 27385 }, { "epoch": 0.37, "learning_rate": 3.515800049153833e-05, "loss": 0.6096, "step": 27390 }, { "epoch": 0.37, "learning_rate": 3.515319258574705e-05, "loss": 0.2764, "step": 27395 }, { "epoch": 0.37, "learning_rate": 3.514838423022013e-05, "loss": 0.2707, "step": 27400 }, { "epoch": 0.37, "learning_rate": 3.514357542517056e-05, "loss": 1.1255, "step": 27405 }, { "epoch": 0.37, "learning_rate": 3.5138766170811346e-05, "loss": 0.2205, "step": 27410 }, { "epoch": 0.37, "learning_rate": 3.513395646735551e-05, "loss": 1.3319, "step": 27415 }, { "epoch": 0.37, "learning_rate": 3.51291463150161e-05, "loss": 0.9089, "step": 27420 }, { "epoch": 0.37, "learning_rate": 3.512433571400619e-05, "loss": 0.7845, "step": 27425 }, { "epoch": 0.37, "learning_rate": 3.511952466453886e-05, "loss": 1.1362, "step": 27430 }, { "epoch": 0.37, "learning_rate": 3.5114713166827205e-05, "loss": 0.8806, "step": 27435 }, { "epoch": 0.37, "learning_rate": 3.5109901221084364e-05, "loss": 0.8177, "step": 27440 }, { "epoch": 0.37, "learning_rate": 3.510508882752348e-05, "loss": 0.4456, "step": 27445 }, { "epoch": 0.37, "learning_rate": 3.510027598635771e-05, "loss": 0.427, "step": 27450 }, { "epoch": 0.37, "learning_rate": 3.509546269780025e-05, "loss": 0.5484, "step": 27455 }, { "epoch": 0.37, "learning_rate": 3.509064896206429e-05, "loss": 0.8768, "step": 27460 }, { "epoch": 0.37, "learning_rate": 3.508583477936307e-05, "loss": 0.7989, "step": 27465 }, { "epoch": 0.37, "learning_rate": 3.5081020149909815e-05, "loss": 0.2523, "step": 27470 }, { "epoch": 0.37, "learning_rate": 3.507620507391781e-05, "loss": 0.8702, "step": 27475 }, { "epoch": 0.37, "learning_rate": 3.507138955160033e-05, "loss": 1.4561, "step": 27480 }, { "epoch": 0.37, "learning_rate": 3.506657358317068e-05, "loss": 0.8696, "step": 27485 }, { "epoch": 0.37, "learning_rate": 3.506175716884218e-05, "loss": 0.6198, "step": 27490 }, { "epoch": 0.37, "learning_rate": 3.5056940308828174e-05, "loss": 1.1696, "step": 27495 }, { "epoch": 0.37, "learning_rate": 3.505212300334203e-05, "loss": 0.9714, "step": 27500 }, { "epoch": 0.37, "learning_rate": 3.5047305252597117e-05, "loss": 0.6284, "step": 27505 }, { "epoch": 0.37, "learning_rate": 3.5042487056806854e-05, "loss": 0.3249, "step": 27510 }, { "epoch": 0.37, "learning_rate": 3.5037668416184655e-05, "loss": 0.2515, "step": 27515 }, { "epoch": 0.37, "learning_rate": 3.503284933094396e-05, "loss": 0.3658, "step": 27520 }, { "epoch": 0.37, "learning_rate": 3.502802980129823e-05, "loss": 0.8739, "step": 27525 }, { "epoch": 0.37, "learning_rate": 3.502320982746095e-05, "loss": 0.588, "step": 27530 }, { "epoch": 0.37, "learning_rate": 3.5018389409645625e-05, "loss": 1.0338, "step": 27535 }, { "epoch": 0.37, "learning_rate": 3.501356854806577e-05, "loss": 0.7838, "step": 27540 }, { "epoch": 0.37, "learning_rate": 3.5008747242934915e-05, "loss": 0.4108, "step": 27545 }, { "epoch": 0.37, "learning_rate": 3.500392549446663e-05, "loss": 0.5252, "step": 27550 }, { "epoch": 0.37, "learning_rate": 3.4999103302874496e-05, "loss": 1.1259, "step": 27555 }, { "epoch": 0.37, "learning_rate": 3.4994280668372106e-05, "loss": 0.6462, "step": 27560 }, { "epoch": 0.37, "learning_rate": 3.4989457591173096e-05, "loss": 0.642, "step": 27565 }, { "epoch": 0.37, "learning_rate": 3.498463407149108e-05, "loss": 0.4451, "step": 27570 }, { "epoch": 0.37, "learning_rate": 3.497981010953973e-05, "loss": 0.7039, "step": 27575 }, { "epoch": 0.37, "learning_rate": 3.4974985705532714e-05, "loss": 0.3621, "step": 27580 }, { "epoch": 0.37, "learning_rate": 3.497016085968374e-05, "loss": 0.2736, "step": 27585 }, { "epoch": 0.37, "learning_rate": 3.496533557220651e-05, "loss": 0.5726, "step": 27590 }, { "epoch": 0.37, "learning_rate": 3.496050984331478e-05, "loss": 0.7999, "step": 27595 }, { "epoch": 0.37, "learning_rate": 3.4955683673222296e-05, "loss": 0.1556, "step": 27600 }, { "epoch": 0.37, "learning_rate": 3.495085706214282e-05, "loss": 1.0622, "step": 27605 }, { "epoch": 0.37, "learning_rate": 3.494603001029017e-05, "loss": 0.6763, "step": 27610 }, { "epoch": 0.37, "learning_rate": 3.494120251787814e-05, "loss": 0.6148, "step": 27615 }, { "epoch": 0.37, "learning_rate": 3.493637458512058e-05, "loss": 0.4799, "step": 27620 }, { "epoch": 0.37, "learning_rate": 3.493154621223134e-05, "loss": 1.0011, "step": 27625 }, { "epoch": 0.37, "learning_rate": 3.4926717399424274e-05, "loss": 0.4827, "step": 27630 }, { "epoch": 0.37, "learning_rate": 3.492188814691329e-05, "loss": 1.0707, "step": 27635 }, { "epoch": 0.37, "learning_rate": 3.491705845491231e-05, "loss": 0.6045, "step": 27640 }, { "epoch": 0.37, "learning_rate": 3.4912228323635254e-05, "loss": 0.6119, "step": 27645 }, { "epoch": 0.37, "learning_rate": 3.4907397753296076e-05, "loss": 0.3591, "step": 27650 }, { "epoch": 0.37, "learning_rate": 3.490256674410873e-05, "loss": 0.9201, "step": 27655 }, { "epoch": 0.37, "learning_rate": 3.489773529628722e-05, "loss": 0.4915, "step": 27660 }, { "epoch": 0.37, "learning_rate": 3.489290341004556e-05, "loss": 0.7616, "step": 27665 }, { "epoch": 0.37, "learning_rate": 3.4888071085597764e-05, "loss": 1.0784, "step": 27670 }, { "epoch": 0.37, "learning_rate": 3.48832383231579e-05, "loss": 0.72, "step": 27675 }, { "epoch": 0.37, "learning_rate": 3.487840512294001e-05, "loss": 0.1326, "step": 27680 }, { "epoch": 0.37, "learning_rate": 3.487357148515819e-05, "loss": 0.572, "step": 27685 }, { "epoch": 0.37, "learning_rate": 3.486873741002656e-05, "loss": 0.5757, "step": 27690 }, { "epoch": 0.37, "learning_rate": 3.4863902897759225e-05, "loss": 1.0244, "step": 27695 }, { "epoch": 0.37, "learning_rate": 3.4859067948570354e-05, "loss": 0.5718, "step": 27700 }, { "epoch": 0.37, "learning_rate": 3.485423256267409e-05, "loss": 0.7706, "step": 27705 }, { "epoch": 0.37, "learning_rate": 3.484939674028461e-05, "loss": 0.471, "step": 27710 }, { "epoch": 0.37, "learning_rate": 3.484456048161614e-05, "loss": 0.6466, "step": 27715 }, { "epoch": 0.37, "learning_rate": 3.4839723786882895e-05, "loss": 1.4377, "step": 27720 }, { "epoch": 0.37, "learning_rate": 3.48348866562991e-05, "loss": 0.6565, "step": 27725 }, { "epoch": 0.37, "learning_rate": 3.4830049090079045e-05, "loss": 0.2955, "step": 27730 }, { "epoch": 0.37, "learning_rate": 3.4825211088436985e-05, "loss": 0.4882, "step": 27735 }, { "epoch": 0.37, "learning_rate": 3.482037265158722e-05, "loss": 0.4105, "step": 27740 }, { "epoch": 0.37, "learning_rate": 3.481553377974409e-05, "loss": 0.6449, "step": 27745 }, { "epoch": 0.37, "learning_rate": 3.4810694473121913e-05, "loss": 0.9783, "step": 27750 }, { "epoch": 0.37, "learning_rate": 3.480585473193505e-05, "loss": 0.3067, "step": 27755 }, { "epoch": 0.37, "learning_rate": 3.480101455639789e-05, "loss": 1.1219, "step": 27760 }, { "epoch": 0.37, "learning_rate": 3.4796173946724805e-05, "loss": 0.5413, "step": 27765 }, { "epoch": 0.37, "learning_rate": 3.479133290313023e-05, "loss": 0.3446, "step": 27770 }, { "epoch": 0.37, "learning_rate": 3.4786491425828594e-05, "loss": 1.0713, "step": 27775 }, { "epoch": 0.37, "learning_rate": 3.4781649515034345e-05, "loss": 0.6934, "step": 27780 }, { "epoch": 0.37, "learning_rate": 3.477680717096195e-05, "loss": 0.7674, "step": 27785 }, { "epoch": 0.37, "learning_rate": 3.477196439382593e-05, "loss": 0.441, "step": 27790 }, { "epoch": 0.37, "learning_rate": 3.476712118384075e-05, "loss": 0.3061, "step": 27795 }, { "epoch": 0.37, "learning_rate": 3.476227754122098e-05, "loss": 0.7092, "step": 27800 }, { "epoch": 0.37, "learning_rate": 3.475743346618115e-05, "loss": 0.3691, "step": 27805 }, { "epoch": 0.37, "learning_rate": 3.4752588958935836e-05, "loss": 0.6727, "step": 27810 }, { "epoch": 0.37, "learning_rate": 3.474774401969962e-05, "loss": 1.0525, "step": 27815 }, { "epoch": 0.37, "learning_rate": 3.474289864868711e-05, "loss": 1.1674, "step": 27820 }, { "epoch": 0.37, "learning_rate": 3.473805284611293e-05, "loss": 0.9569, "step": 27825 }, { "epoch": 0.37, "learning_rate": 3.4733206612191726e-05, "loss": 1.2965, "step": 27830 }, { "epoch": 0.37, "learning_rate": 3.4728359947138166e-05, "loss": 0.121, "step": 27835 }, { "epoch": 0.37, "learning_rate": 3.4723512851166936e-05, "loss": 1.2553, "step": 27840 }, { "epoch": 0.37, "learning_rate": 3.471866532449272e-05, "loss": 0.8018, "step": 27845 }, { "epoch": 0.37, "learning_rate": 3.471381736733026e-05, "loss": 0.569, "step": 27850 }, { "epoch": 0.37, "learning_rate": 3.470896897989428e-05, "loss": 0.6604, "step": 27855 }, { "epoch": 0.37, "learning_rate": 3.470412016239955e-05, "loss": 0.6249, "step": 27860 }, { "epoch": 0.37, "learning_rate": 3.4699270915060846e-05, "loss": 0.8432, "step": 27865 }, { "epoch": 0.37, "learning_rate": 3.469442123809297e-05, "loss": 1.2025, "step": 27870 }, { "epoch": 0.37, "learning_rate": 3.468957113171072e-05, "loss": 0.718, "step": 27875 }, { "epoch": 0.37, "learning_rate": 3.4684720596128945e-05, "loss": 1.4424, "step": 27880 }, { "epoch": 0.37, "learning_rate": 3.4679869631562506e-05, "loss": 0.5538, "step": 27885 }, { "epoch": 0.37, "learning_rate": 3.4675018238226267e-05, "loss": 0.9815, "step": 27890 }, { "epoch": 0.37, "learning_rate": 3.4670166416335124e-05, "loss": 0.1881, "step": 27895 }, { "epoch": 0.37, "learning_rate": 3.466531416610399e-05, "loss": 0.6507, "step": 27900 }, { "epoch": 0.37, "learning_rate": 3.466046148774778e-05, "loss": 0.427, "step": 27905 }, { "epoch": 0.37, "learning_rate": 3.465560838148147e-05, "loss": 1.3976, "step": 27910 }, { "epoch": 0.37, "learning_rate": 3.465075484752001e-05, "loss": 0.8575, "step": 27915 }, { "epoch": 0.37, "learning_rate": 3.464590088607839e-05, "loss": 0.9161, "step": 27920 }, { "epoch": 0.37, "learning_rate": 3.464104649737162e-05, "loss": 1.1168, "step": 27925 }, { "epoch": 0.37, "learning_rate": 3.463619168161472e-05, "loss": 1.4219, "step": 27930 }, { "epoch": 0.37, "learning_rate": 3.463133643902273e-05, "loss": 1.0959, "step": 27935 }, { "epoch": 0.37, "learning_rate": 3.462648076981073e-05, "loss": 0.5543, "step": 27940 }, { "epoch": 0.37, "learning_rate": 3.462162467419379e-05, "loss": 0.4687, "step": 27945 }, { "epoch": 0.37, "learning_rate": 3.461676815238701e-05, "loss": 0.3834, "step": 27950 }, { "epoch": 0.37, "learning_rate": 3.4611911204605514e-05, "loss": 0.4506, "step": 27955 }, { "epoch": 0.37, "learning_rate": 3.460705383106443e-05, "loss": 1.4748, "step": 27960 }, { "epoch": 0.37, "learning_rate": 3.460219603197894e-05, "loss": 0.8141, "step": 27965 }, { "epoch": 0.37, "learning_rate": 3.459733780756419e-05, "loss": 0.7977, "step": 27970 }, { "epoch": 0.37, "learning_rate": 3.45924791580354e-05, "loss": 1.2865, "step": 27975 }, { "epoch": 0.37, "learning_rate": 3.458762008360777e-05, "loss": 0.6799, "step": 27980 }, { "epoch": 0.37, "learning_rate": 3.458276058449653e-05, "loss": 0.7511, "step": 27985 }, { "epoch": 0.38, "learning_rate": 3.457790066091694e-05, "loss": 0.3962, "step": 27990 }, { "epoch": 0.38, "learning_rate": 3.4573040313084274e-05, "loss": 1.506, "step": 27995 }, { "epoch": 0.38, "learning_rate": 3.4568179541213804e-05, "loss": 0.7768, "step": 28000 }, { "epoch": 0.38, "learning_rate": 3.456331834552086e-05, "loss": 0.6403, "step": 28005 }, { "epoch": 0.38, "learning_rate": 3.4558456726220744e-05, "loss": 0.8152, "step": 28010 }, { "epoch": 0.38, "learning_rate": 3.455359468352882e-05, "loss": 0.8796, "step": 28015 }, { "epoch": 0.38, "learning_rate": 3.454873221766045e-05, "loss": 1.3432, "step": 28020 }, { "epoch": 0.38, "learning_rate": 3.4543869328831e-05, "loss": 0.9553, "step": 28025 }, { "epoch": 0.38, "learning_rate": 3.45390060172559e-05, "loss": 0.7619, "step": 28030 }, { "epoch": 0.38, "learning_rate": 3.453414228315056e-05, "loss": 1.152, "step": 28035 }, { "epoch": 0.38, "learning_rate": 3.45292781267304e-05, "loss": 0.8928, "step": 28040 }, { "epoch": 0.38, "learning_rate": 3.45244135482109e-05, "loss": 0.1314, "step": 28045 }, { "epoch": 0.38, "learning_rate": 3.451954854780753e-05, "loss": 0.4182, "step": 28050 }, { "epoch": 0.38, "learning_rate": 3.451468312573578e-05, "loss": 1.2363, "step": 28055 }, { "epoch": 0.38, "learning_rate": 3.450981728221117e-05, "loss": 0.7973, "step": 28060 }, { "epoch": 0.38, "learning_rate": 3.4504951017449226e-05, "loss": 0.7718, "step": 28065 }, { "epoch": 0.38, "learning_rate": 3.45000843316655e-05, "loss": 0.5202, "step": 28070 }, { "epoch": 0.38, "learning_rate": 3.449521722507558e-05, "loss": 0.483, "step": 28075 }, { "epoch": 0.38, "learning_rate": 3.449034969789504e-05, "loss": 0.8839, "step": 28080 }, { "epoch": 0.38, "learning_rate": 3.4485481750339476e-05, "loss": 0.8203, "step": 28085 }, { "epoch": 0.38, "learning_rate": 3.448061338262454e-05, "loss": 0.4125, "step": 28090 }, { "epoch": 0.38, "learning_rate": 3.447574459496584e-05, "loss": 0.9979, "step": 28095 }, { "epoch": 0.38, "learning_rate": 3.447087538757907e-05, "loss": 0.9415, "step": 28100 }, { "epoch": 0.38, "learning_rate": 3.446600576067991e-05, "loss": 1.1704, "step": 28105 }, { "epoch": 0.38, "learning_rate": 3.446113571448404e-05, "loss": 0.2442, "step": 28110 }, { "epoch": 0.38, "learning_rate": 3.44562652492072e-05, "loss": 0.8485, "step": 28115 }, { "epoch": 0.38, "learning_rate": 3.4451394365065105e-05, "loss": 0.5164, "step": 28120 }, { "epoch": 0.38, "learning_rate": 3.444652306227353e-05, "loss": 0.7217, "step": 28125 }, { "epoch": 0.38, "learning_rate": 3.444165134104825e-05, "loss": 1.6135, "step": 28130 }, { "epoch": 0.38, "learning_rate": 3.443677920160504e-05, "loss": 0.4842, "step": 28135 }, { "epoch": 0.38, "learning_rate": 3.443190664415973e-05, "loss": 0.8017, "step": 28140 }, { "epoch": 0.38, "learning_rate": 3.442703366892814e-05, "loss": 0.9178, "step": 28145 }, { "epoch": 0.38, "learning_rate": 3.4422160276126115e-05, "loss": 0.6249, "step": 28150 }, { "epoch": 0.38, "learning_rate": 3.441728646596953e-05, "loss": 0.9479, "step": 28155 }, { "epoch": 0.38, "learning_rate": 3.441241223867427e-05, "loss": 0.2174, "step": 28160 }, { "epoch": 0.38, "learning_rate": 3.4407537594456233e-05, "loss": 1.1724, "step": 28165 }, { "epoch": 0.38, "learning_rate": 3.440266253353135e-05, "loss": 0.6087, "step": 28170 }, { "epoch": 0.38, "learning_rate": 3.439778705611555e-05, "loss": 0.2042, "step": 28175 }, { "epoch": 0.38, "learning_rate": 3.43929111624248e-05, "loss": 0.9718, "step": 28180 }, { "epoch": 0.38, "learning_rate": 3.438803485267509e-05, "loss": 0.996, "step": 28185 }, { "epoch": 0.38, "learning_rate": 3.438315812708239e-05, "loss": 0.4475, "step": 28190 }, { "epoch": 0.38, "learning_rate": 3.437828098586273e-05, "loss": 1.0813, "step": 28195 }, { "epoch": 0.38, "learning_rate": 3.4373403429232144e-05, "loss": 0.3438, "step": 28200 }, { "epoch": 0.38, "learning_rate": 3.436852545740668e-05, "loss": 1.1956, "step": 28205 }, { "epoch": 0.38, "learning_rate": 3.43636470706024e-05, "loss": 1.1659, "step": 28210 }, { "epoch": 0.38, "learning_rate": 3.4358768269035404e-05, "loss": 0.6251, "step": 28215 }, { "epoch": 0.38, "learning_rate": 3.435388905292179e-05, "loss": 0.3434, "step": 28220 }, { "epoch": 0.38, "learning_rate": 3.43490094224777e-05, "loss": 0.6239, "step": 28225 }, { "epoch": 0.38, "learning_rate": 3.434412937791924e-05, "loss": 0.9236, "step": 28230 }, { "epoch": 0.38, "learning_rate": 3.4339248919462615e-05, "loss": 0.8803, "step": 28235 }, { "epoch": 0.38, "learning_rate": 3.433436804732398e-05, "loss": 1.001, "step": 28240 }, { "epoch": 0.38, "learning_rate": 3.432948676171955e-05, "loss": 0.832, "step": 28245 }, { "epoch": 0.38, "learning_rate": 3.432460506286552e-05, "loss": 1.1343, "step": 28250 }, { "epoch": 0.38, "learning_rate": 3.4319722950978137e-05, "loss": 0.4289, "step": 28255 }, { "epoch": 0.38, "learning_rate": 3.431484042627364e-05, "loss": 0.2884, "step": 28260 }, { "epoch": 0.38, "learning_rate": 3.4309957488968326e-05, "loss": 0.3306, "step": 28265 }, { "epoch": 0.38, "learning_rate": 3.4305074139278475e-05, "loss": 0.7029, "step": 28270 }, { "epoch": 0.38, "learning_rate": 3.4300190377420385e-05, "loss": 0.286, "step": 28275 }, { "epoch": 0.38, "learning_rate": 3.429530620361039e-05, "loss": 0.9147, "step": 28280 }, { "epoch": 0.38, "learning_rate": 3.4290421618064834e-05, "loss": 1.6882, "step": 28285 }, { "epoch": 0.38, "learning_rate": 3.428553662100007e-05, "loss": 0.3975, "step": 28290 }, { "epoch": 0.38, "learning_rate": 3.4280651212632495e-05, "loss": 0.8318, "step": 28295 }, { "epoch": 0.38, "learning_rate": 3.427576539317851e-05, "loss": 0.4107, "step": 28300 }, { "epoch": 0.38, "learning_rate": 3.427087916285451e-05, "loss": 0.7668, "step": 28305 }, { "epoch": 0.38, "learning_rate": 3.426599252187695e-05, "loss": 0.9263, "step": 28310 }, { "epoch": 0.38, "learning_rate": 3.4261105470462275e-05, "loss": 0.8719, "step": 28315 }, { "epoch": 0.38, "learning_rate": 3.425621800882696e-05, "loss": 1.1211, "step": 28320 }, { "epoch": 0.38, "learning_rate": 3.42513301371875e-05, "loss": 0.6204, "step": 28325 }, { "epoch": 0.38, "learning_rate": 3.424644185576039e-05, "loss": 0.4214, "step": 28330 }, { "epoch": 0.38, "learning_rate": 3.424155316476217e-05, "loss": 0.7415, "step": 28335 }, { "epoch": 0.38, "learning_rate": 3.423666406440937e-05, "loss": 0.6513, "step": 28340 }, { "epoch": 0.38, "learning_rate": 3.4231774554918574e-05, "loss": 0.749, "step": 28345 }, { "epoch": 0.38, "learning_rate": 3.422688463650634e-05, "loss": 0.2095, "step": 28350 }, { "epoch": 0.38, "learning_rate": 3.422199430938929e-05, "loss": 0.3515, "step": 28355 }, { "epoch": 0.38, "learning_rate": 3.421710357378402e-05, "loss": 1.1351, "step": 28360 }, { "epoch": 0.38, "learning_rate": 3.421221242990717e-05, "loss": 0.8, "step": 28365 }, { "epoch": 0.38, "learning_rate": 3.420732087797539e-05, "loss": 0.7593, "step": 28370 }, { "epoch": 0.38, "learning_rate": 3.420242891820537e-05, "loss": 0.7895, "step": 28375 }, { "epoch": 0.38, "learning_rate": 3.4197536550813793e-05, "loss": 0.9663, "step": 28380 }, { "epoch": 0.38, "learning_rate": 3.4192643776017345e-05, "loss": 0.3777, "step": 28385 }, { "epoch": 0.38, "learning_rate": 3.418775059403278e-05, "loss": 0.7461, "step": 28390 }, { "epoch": 0.38, "learning_rate": 3.418285700507682e-05, "loss": 0.6838, "step": 28395 }, { "epoch": 0.38, "learning_rate": 3.417796300936623e-05, "loss": 0.5115, "step": 28400 }, { "epoch": 0.38, "learning_rate": 3.417306860711781e-05, "loss": 1.0015, "step": 28405 }, { "epoch": 0.38, "learning_rate": 3.4168173798548336e-05, "loss": 0.4654, "step": 28410 }, { "epoch": 0.38, "learning_rate": 3.416327858387462e-05, "loss": 0.7506, "step": 28415 }, { "epoch": 0.38, "learning_rate": 3.415838296331352e-05, "loss": 0.5852, "step": 28420 }, { "epoch": 0.38, "learning_rate": 3.4153486937081866e-05, "loss": 1.1624, "step": 28425 }, { "epoch": 0.38, "learning_rate": 3.414859050539653e-05, "loss": 0.5844, "step": 28430 }, { "epoch": 0.38, "learning_rate": 3.4143693668474415e-05, "loss": 1.5724, "step": 28435 }, { "epoch": 0.38, "learning_rate": 3.413879642653241e-05, "loss": 0.9944, "step": 28440 }, { "epoch": 0.38, "learning_rate": 3.4133898779787445e-05, "loss": 1.0879, "step": 28445 }, { "epoch": 0.38, "learning_rate": 3.412900072845645e-05, "loss": 0.1671, "step": 28450 }, { "epoch": 0.38, "learning_rate": 3.41241022727564e-05, "loss": 0.2137, "step": 28455 }, { "epoch": 0.38, "learning_rate": 3.411920341290427e-05, "loss": 0.2811, "step": 28460 }, { "epoch": 0.38, "learning_rate": 3.4114304149117044e-05, "loss": 0.3483, "step": 28465 }, { "epoch": 0.38, "learning_rate": 3.410940448161174e-05, "loss": 0.3529, "step": 28470 }, { "epoch": 0.38, "learning_rate": 3.410450441060539e-05, "loss": 0.3021, "step": 28475 }, { "epoch": 0.38, "learning_rate": 3.409960393631505e-05, "loss": 0.4065, "step": 28480 }, { "epoch": 0.38, "learning_rate": 3.4094703058957775e-05, "loss": 0.9493, "step": 28485 }, { "epoch": 0.38, "learning_rate": 3.4089801778750656e-05, "loss": 0.4623, "step": 28490 }, { "epoch": 0.38, "learning_rate": 3.408490009591079e-05, "loss": 0.5875, "step": 28495 }, { "epoch": 0.38, "learning_rate": 3.407999801065531e-05, "loss": 0.1622, "step": 28500 }, { "epoch": 0.38, "learning_rate": 3.407509552320133e-05, "loss": 0.6368, "step": 28505 }, { "epoch": 0.38, "learning_rate": 3.4070192633766025e-05, "loss": 1.1708, "step": 28510 }, { "epoch": 0.38, "learning_rate": 3.406528934256656e-05, "loss": 0.1508, "step": 28515 }, { "epoch": 0.38, "learning_rate": 3.4060385649820146e-05, "loss": 0.7735, "step": 28520 }, { "epoch": 0.38, "learning_rate": 3.4055481555743955e-05, "loss": 0.9622, "step": 28525 }, { "epoch": 0.38, "learning_rate": 3.4050577060555245e-05, "loss": 0.4384, "step": 28530 }, { "epoch": 0.38, "learning_rate": 3.404567216447124e-05, "loss": 1.5791, "step": 28535 }, { "epoch": 0.38, "learning_rate": 3.4040766867709226e-05, "loss": 1.3708, "step": 28540 }, { "epoch": 0.38, "learning_rate": 3.403586117048646e-05, "loss": 0.2727, "step": 28545 }, { "epoch": 0.38, "learning_rate": 3.4030955073020254e-05, "loss": 0.4575, "step": 28550 }, { "epoch": 0.38, "learning_rate": 3.4026048575527914e-05, "loss": 0.7073, "step": 28555 }, { "epoch": 0.38, "learning_rate": 3.402114167822678e-05, "loss": 1.3812, "step": 28560 }, { "epoch": 0.38, "learning_rate": 3.40162343813342e-05, "loss": 0.1977, "step": 28565 }, { "epoch": 0.38, "learning_rate": 3.4011326685067544e-05, "loss": 0.3769, "step": 28570 }, { "epoch": 0.38, "learning_rate": 3.400641858964421e-05, "loss": 0.6675, "step": 28575 }, { "epoch": 0.38, "learning_rate": 3.4001510095281574e-05, "loss": 0.5605, "step": 28580 }, { "epoch": 0.38, "learning_rate": 3.399660120219707e-05, "loss": 0.3806, "step": 28585 }, { "epoch": 0.38, "learning_rate": 3.3991691910608154e-05, "loss": 0.6052, "step": 28590 }, { "epoch": 0.38, "learning_rate": 3.398678222073227e-05, "loss": 0.7078, "step": 28595 }, { "epoch": 0.38, "learning_rate": 3.398187213278689e-05, "loss": 0.6076, "step": 28600 }, { "epoch": 0.38, "learning_rate": 3.3976961646989505e-05, "loss": 0.5151, "step": 28605 }, { "epoch": 0.38, "learning_rate": 3.3972050763557636e-05, "loss": 0.7162, "step": 28610 }, { "epoch": 0.38, "learning_rate": 3.3967139482708805e-05, "loss": 0.4684, "step": 28615 }, { "epoch": 0.38, "learning_rate": 3.396222780466055e-05, "loss": 0.3921, "step": 28620 }, { "epoch": 0.38, "learning_rate": 3.395731572963044e-05, "loss": 1.0612, "step": 28625 }, { "epoch": 0.38, "learning_rate": 3.395240325783606e-05, "loss": 0.0659, "step": 28630 }, { "epoch": 0.38, "learning_rate": 3.3947490389495e-05, "loss": 0.7463, "step": 28635 }, { "epoch": 0.38, "learning_rate": 3.394257712482488e-05, "loss": 0.8236, "step": 28640 }, { "epoch": 0.38, "learning_rate": 3.393766346404333e-05, "loss": 0.8926, "step": 28645 }, { "epoch": 0.38, "learning_rate": 3.3932749407368e-05, "loss": 0.964, "step": 28650 }, { "epoch": 0.38, "learning_rate": 3.392783495501657e-05, "loss": 0.2472, "step": 28655 }, { "epoch": 0.38, "learning_rate": 3.392292010720671e-05, "loss": 1.0122, "step": 28660 }, { "epoch": 0.38, "learning_rate": 3.391800486415613e-05, "loss": 1.0614, "step": 28665 }, { "epoch": 0.38, "learning_rate": 3.391308922608255e-05, "loss": 1.0059, "step": 28670 }, { "epoch": 0.38, "learning_rate": 3.3908173193203703e-05, "loss": 0.4913, "step": 28675 }, { "epoch": 0.38, "learning_rate": 3.390325676573736e-05, "loss": 0.4589, "step": 28680 }, { "epoch": 0.38, "learning_rate": 3.3898339943901275e-05, "loss": 0.4443, "step": 28685 }, { "epoch": 0.38, "learning_rate": 3.389342272791325e-05, "loss": 1.383, "step": 28690 }, { "epoch": 0.38, "learning_rate": 3.3888505117991086e-05, "loss": 0.2684, "step": 28695 }, { "epoch": 0.38, "learning_rate": 3.388358711435262e-05, "loss": 0.9642, "step": 28700 }, { "epoch": 0.38, "learning_rate": 3.387866871721569e-05, "loss": 0.2602, "step": 28705 }, { "epoch": 0.38, "learning_rate": 3.387374992679815e-05, "loss": 0.5734, "step": 28710 }, { "epoch": 0.38, "learning_rate": 3.386883074331788e-05, "loss": 0.4162, "step": 28715 }, { "epoch": 0.38, "learning_rate": 3.386391116699278e-05, "loss": 0.4784, "step": 28720 }, { "epoch": 0.38, "learning_rate": 3.385899119804076e-05, "loss": 0.6102, "step": 28725 }, { "epoch": 0.38, "learning_rate": 3.385407083667975e-05, "loss": 0.9703, "step": 28730 }, { "epoch": 0.39, "learning_rate": 3.38491500831277e-05, "loss": 0.6475, "step": 28735 }, { "epoch": 0.39, "learning_rate": 3.3844228937602576e-05, "loss": 0.7719, "step": 28740 }, { "epoch": 0.39, "learning_rate": 3.383930740032234e-05, "loss": 0.2504, "step": 28745 }, { "epoch": 0.39, "learning_rate": 3.383438547150501e-05, "loss": 0.4521, "step": 28750 }, { "epoch": 0.39, "learning_rate": 3.382946315136862e-05, "loss": 0.644, "step": 28755 }, { "epoch": 0.39, "learning_rate": 3.382454044013117e-05, "loss": 0.6331, "step": 28760 }, { "epoch": 0.39, "learning_rate": 3.381961733801073e-05, "loss": 1.2654, "step": 28765 }, { "epoch": 0.39, "learning_rate": 3.3814693845225366e-05, "loss": 0.4646, "step": 28770 }, { "epoch": 0.39, "learning_rate": 3.3809769961993165e-05, "loss": 0.8296, "step": 28775 }, { "epoch": 0.39, "learning_rate": 3.380484568853222e-05, "loss": 0.32, "step": 28780 }, { "epoch": 0.39, "learning_rate": 3.379992102506067e-05, "loss": 0.708, "step": 28785 }, { "epoch": 0.39, "learning_rate": 3.379499597179664e-05, "loss": 0.7375, "step": 28790 }, { "epoch": 0.39, "learning_rate": 3.3790070528958284e-05, "loss": 0.5657, "step": 28795 }, { "epoch": 0.39, "learning_rate": 3.378514469676378e-05, "loss": 0.6553, "step": 28800 }, { "epoch": 0.39, "learning_rate": 3.378021847543132e-05, "loss": 1.3686, "step": 28805 }, { "epoch": 0.39, "learning_rate": 3.377529186517911e-05, "loss": 0.5797, "step": 28810 }, { "epoch": 0.39, "learning_rate": 3.3770364866225365e-05, "loss": 0.4759, "step": 28815 }, { "epoch": 0.39, "learning_rate": 3.376543747878834e-05, "loss": 0.7944, "step": 28820 }, { "epoch": 0.39, "learning_rate": 3.376050970308628e-05, "loss": 0.7431, "step": 28825 }, { "epoch": 0.39, "learning_rate": 3.375558153933747e-05, "loss": 0.8104, "step": 28830 }, { "epoch": 0.39, "learning_rate": 3.37506529877602e-05, "loss": 0.8516, "step": 28835 }, { "epoch": 0.39, "learning_rate": 3.374572404857278e-05, "loss": 0.7407, "step": 28840 }, { "epoch": 0.39, "learning_rate": 3.374079472199355e-05, "loss": 0.5854, "step": 28845 }, { "epoch": 0.39, "learning_rate": 3.373586500824083e-05, "loss": 0.7857, "step": 28850 }, { "epoch": 0.39, "learning_rate": 3.3730934907533e-05, "loss": 0.9432, "step": 28855 }, { "epoch": 0.39, "learning_rate": 3.372600442008842e-05, "loss": 1.1684, "step": 28860 }, { "epoch": 0.39, "learning_rate": 3.3721073546125513e-05, "loss": 1.4259, "step": 28865 }, { "epoch": 0.39, "learning_rate": 3.371614228586267e-05, "loss": 0.2701, "step": 28870 }, { "epoch": 0.39, "learning_rate": 3.371121063951834e-05, "loss": 1.2121, "step": 28875 }, { "epoch": 0.39, "learning_rate": 3.3706278607310954e-05, "loss": 0.0926, "step": 28880 }, { "epoch": 0.39, "learning_rate": 3.3701346189458984e-05, "loss": 1.0226, "step": 28885 }, { "epoch": 0.39, "learning_rate": 3.36964133861809e-05, "loss": 1.0177, "step": 28890 }, { "epoch": 0.39, "learning_rate": 3.369148019769522e-05, "loss": 0.9941, "step": 28895 }, { "epoch": 0.39, "learning_rate": 3.3686546624220445e-05, "loss": 1.1144, "step": 28900 }, { "epoch": 0.39, "learning_rate": 3.3681612665975114e-05, "loss": 1.1327, "step": 28905 }, { "epoch": 0.39, "learning_rate": 3.367667832317777e-05, "loss": 0.324, "step": 28910 }, { "epoch": 0.39, "learning_rate": 3.367174359604699e-05, "loss": 0.325, "step": 28915 }, { "epoch": 0.39, "learning_rate": 3.366680848480135e-05, "loss": 0.5545, "step": 28920 }, { "epoch": 0.39, "learning_rate": 3.3661872989659445e-05, "loss": 0.4879, "step": 28925 }, { "epoch": 0.39, "learning_rate": 3.365693711083991e-05, "loss": 0.3052, "step": 28930 }, { "epoch": 0.39, "learning_rate": 3.365200084856137e-05, "loss": 0.3303, "step": 28935 }, { "epoch": 0.39, "learning_rate": 3.364706420304248e-05, "loss": 0.7165, "step": 28940 }, { "epoch": 0.39, "learning_rate": 3.3642127174501894e-05, "loss": 0.4207, "step": 28945 }, { "epoch": 0.39, "learning_rate": 3.3637189763158315e-05, "loss": 0.3072, "step": 28950 }, { "epoch": 0.39, "learning_rate": 3.3632251969230446e-05, "loss": 0.3284, "step": 28955 }, { "epoch": 0.39, "learning_rate": 3.3627313792936996e-05, "loss": 1.3824, "step": 28960 }, { "epoch": 0.39, "learning_rate": 3.3622375234496704e-05, "loss": 1.3489, "step": 28965 }, { "epoch": 0.39, "learning_rate": 3.361743629412832e-05, "loss": 0.7809, "step": 28970 }, { "epoch": 0.39, "learning_rate": 3.361249697205063e-05, "loss": 0.623, "step": 28975 }, { "epoch": 0.39, "learning_rate": 3.3607557268482416e-05, "loss": 0.6836, "step": 28980 }, { "epoch": 0.39, "learning_rate": 3.360261718364247e-05, "loss": 1.0901, "step": 28985 }, { "epoch": 0.39, "learning_rate": 3.359767671774962e-05, "loss": 0.6563, "step": 28990 }, { "epoch": 0.39, "learning_rate": 3.35927358710227e-05, "loss": 0.6111, "step": 28995 }, { "epoch": 0.39, "learning_rate": 3.358779464368058e-05, "loss": 0.1306, "step": 29000 }, { "epoch": 0.39, "learning_rate": 3.3582853035942106e-05, "loss": 0.2729, "step": 29005 }, { "epoch": 0.39, "learning_rate": 3.357791104802619e-05, "loss": 0.5707, "step": 29010 }, { "epoch": 0.39, "learning_rate": 3.357296868015173e-05, "loss": 0.292, "step": 29015 }, { "epoch": 0.39, "learning_rate": 3.3568025932537646e-05, "loss": 0.5725, "step": 29020 }, { "epoch": 0.39, "learning_rate": 3.3563082805402865e-05, "loss": 1.1768, "step": 29025 }, { "epoch": 0.39, "learning_rate": 3.355813929896637e-05, "loss": 0.6732, "step": 29030 }, { "epoch": 0.39, "learning_rate": 3.355319541344712e-05, "loss": 0.6021, "step": 29035 }, { "epoch": 0.39, "learning_rate": 3.35482511490641e-05, "loss": 0.4956, "step": 29040 }, { "epoch": 0.39, "learning_rate": 3.354330650603632e-05, "loss": 0.2411, "step": 29045 }, { "epoch": 0.39, "learning_rate": 3.3538361484582796e-05, "loss": 0.4038, "step": 29050 }, { "epoch": 0.39, "learning_rate": 3.353341608492258e-05, "loss": 1.2434, "step": 29055 }, { "epoch": 0.39, "learning_rate": 3.352847030727472e-05, "loss": 1.4178, "step": 29060 }, { "epoch": 0.39, "learning_rate": 3.35235241518583e-05, "loss": 0.8906, "step": 29065 }, { "epoch": 0.39, "learning_rate": 3.3518577618892394e-05, "loss": 0.9236, "step": 29070 }, { "epoch": 0.39, "learning_rate": 3.351363070859612e-05, "loss": 0.5978, "step": 29075 }, { "epoch": 0.39, "learning_rate": 3.350868342118859e-05, "loss": 0.8784, "step": 29080 }, { "epoch": 0.39, "learning_rate": 3.350373575688897e-05, "loss": 0.5106, "step": 29085 }, { "epoch": 0.39, "learning_rate": 3.349878771591638e-05, "loss": 1.1496, "step": 29090 }, { "epoch": 0.39, "learning_rate": 3.349383929849002e-05, "loss": 0.5959, "step": 29095 }, { "epoch": 0.39, "learning_rate": 3.348889050482907e-05, "loss": 0.9355, "step": 29100 }, { "epoch": 0.39, "learning_rate": 3.348394133515275e-05, "loss": 0.2771, "step": 29105 }, { "epoch": 0.39, "learning_rate": 3.3478991789680256e-05, "loss": 1.3261, "step": 29110 }, { "epoch": 0.39, "learning_rate": 3.347404186863085e-05, "loss": 1.0836, "step": 29115 }, { "epoch": 0.39, "learning_rate": 3.346909157222379e-05, "loss": 0.832, "step": 29120 }, { "epoch": 0.39, "learning_rate": 3.346414090067834e-05, "loss": 0.7346, "step": 29125 }, { "epoch": 0.39, "learning_rate": 3.345918985421379e-05, "loss": 1.8845, "step": 29130 }, { "epoch": 0.39, "learning_rate": 3.345423843304945e-05, "loss": 0.9217, "step": 29135 }, { "epoch": 0.39, "learning_rate": 3.3449286637404646e-05, "loss": 0.2504, "step": 29140 }, { "epoch": 0.39, "learning_rate": 3.3444334467498714e-05, "loss": 1.0635, "step": 29145 }, { "epoch": 0.39, "learning_rate": 3.343938192355101e-05, "loss": 0.8236, "step": 29150 }, { "epoch": 0.39, "learning_rate": 3.343442900578091e-05, "loss": 0.9458, "step": 29155 }, { "epoch": 0.39, "learning_rate": 3.3429475714407795e-05, "loss": 0.7844, "step": 29160 }, { "epoch": 0.39, "learning_rate": 3.342452204965108e-05, "loss": 1.2279, "step": 29165 }, { "epoch": 0.39, "learning_rate": 3.341956801173019e-05, "loss": 0.2365, "step": 29170 }, { "epoch": 0.39, "learning_rate": 3.341461360086455e-05, "loss": 0.3234, "step": 29175 }, { "epoch": 0.39, "learning_rate": 3.340965881727363e-05, "loss": 0.8499, "step": 29180 }, { "epoch": 0.39, "learning_rate": 3.3404703661176894e-05, "loss": 0.3925, "step": 29185 }, { "epoch": 0.39, "learning_rate": 3.339974813279384e-05, "loss": 0.7084, "step": 29190 }, { "epoch": 0.39, "learning_rate": 3.3394792232343955e-05, "loss": 0.7065, "step": 29195 }, { "epoch": 0.39, "learning_rate": 3.338983596004678e-05, "loss": 0.9241, "step": 29200 }, { "epoch": 0.39, "learning_rate": 3.338487931612184e-05, "loss": 0.5671, "step": 29205 }, { "epoch": 0.39, "learning_rate": 3.337992230078869e-05, "loss": 0.5129, "step": 29210 }, { "epoch": 0.39, "learning_rate": 3.337496491426691e-05, "loss": 0.5361, "step": 29215 }, { "epoch": 0.39, "learning_rate": 3.3370007156776095e-05, "loss": 0.5069, "step": 29220 }, { "epoch": 0.39, "learning_rate": 3.336504902853582e-05, "loss": 0.4724, "step": 29225 }, { "epoch": 0.39, "learning_rate": 3.336009052976574e-05, "loss": 0.7252, "step": 29230 }, { "epoch": 0.39, "learning_rate": 3.335513166068546e-05, "loss": 1.028, "step": 29235 }, { "epoch": 0.39, "learning_rate": 3.335017242151465e-05, "loss": 0.7033, "step": 29240 }, { "epoch": 0.39, "learning_rate": 3.334521281247297e-05, "loss": 0.84, "step": 29245 }, { "epoch": 0.39, "learning_rate": 3.3340252833780126e-05, "loss": 0.5622, "step": 29250 }, { "epoch": 0.39, "learning_rate": 3.33352924856558e-05, "loss": 0.3037, "step": 29255 }, { "epoch": 0.39, "learning_rate": 3.333033176831972e-05, "loss": 0.5303, "step": 29260 }, { "epoch": 0.39, "learning_rate": 3.332537068199161e-05, "loss": 0.9292, "step": 29265 }, { "epoch": 0.39, "learning_rate": 3.332040922689123e-05, "loss": 0.6512, "step": 29270 }, { "epoch": 0.39, "learning_rate": 3.3315447403238354e-05, "loss": 0.8902, "step": 29275 }, { "epoch": 0.39, "learning_rate": 3.331048521125275e-05, "loss": 1.0781, "step": 29280 }, { "epoch": 0.39, "learning_rate": 3.3305522651154235e-05, "loss": 1.3355, "step": 29285 }, { "epoch": 0.39, "learning_rate": 3.330055972316262e-05, "loss": 1.267, "step": 29290 }, { "epoch": 0.39, "learning_rate": 3.329559642749773e-05, "loss": 0.9328, "step": 29295 }, { "epoch": 0.39, "learning_rate": 3.3290632764379415e-05, "loss": 0.9355, "step": 29300 }, { "epoch": 0.39, "learning_rate": 3.3285668734027556e-05, "loss": 0.7931, "step": 29305 }, { "epoch": 0.39, "learning_rate": 3.328070433666202e-05, "loss": 0.3538, "step": 29310 }, { "epoch": 0.39, "learning_rate": 3.327573957250271e-05, "loss": 0.3549, "step": 29315 }, { "epoch": 0.39, "learning_rate": 3.3270774441769534e-05, "loss": 1.3672, "step": 29320 }, { "epoch": 0.39, "learning_rate": 3.326580894468243e-05, "loss": 0.7692, "step": 29325 }, { "epoch": 0.39, "learning_rate": 3.326084308146134e-05, "loss": 0.3305, "step": 29330 }, { "epoch": 0.39, "learning_rate": 3.325587685232623e-05, "loss": 0.7581, "step": 29335 }, { "epoch": 0.39, "learning_rate": 3.325091025749708e-05, "loss": 0.3159, "step": 29340 }, { "epoch": 0.39, "learning_rate": 3.324594329719389e-05, "loss": 0.781, "step": 29345 }, { "epoch": 0.39, "learning_rate": 3.324097597163666e-05, "loss": 0.8436, "step": 29350 }, { "epoch": 0.39, "learning_rate": 3.323600828104542e-05, "loss": 0.1523, "step": 29355 }, { "epoch": 0.39, "learning_rate": 3.323104022564022e-05, "loss": 0.2475, "step": 29360 }, { "epoch": 0.39, "learning_rate": 3.3226071805641115e-05, "loss": 0.4073, "step": 29365 }, { "epoch": 0.39, "learning_rate": 3.322110302126818e-05, "loss": 0.8285, "step": 29370 }, { "epoch": 0.39, "learning_rate": 3.3216133872741514e-05, "loss": 0.6165, "step": 29375 }, { "epoch": 0.39, "learning_rate": 3.3211164360281215e-05, "loss": 0.5049, "step": 29380 }, { "epoch": 0.39, "learning_rate": 3.320619448410742e-05, "loss": 0.8151, "step": 29385 }, { "epoch": 0.39, "learning_rate": 3.320122424444027e-05, "loss": 1.2445, "step": 29390 }, { "epoch": 0.39, "learning_rate": 3.3196253641499905e-05, "loss": 1.4142, "step": 29395 }, { "epoch": 0.39, "learning_rate": 3.319128267550651e-05, "loss": 0.1424, "step": 29400 }, { "epoch": 0.39, "learning_rate": 3.318631134668028e-05, "loss": 0.6583, "step": 29405 }, { "epoch": 0.39, "learning_rate": 3.31813396552414e-05, "loss": 0.6153, "step": 29410 }, { "epoch": 0.39, "learning_rate": 3.317636760141011e-05, "loss": 0.5148, "step": 29415 }, { "epoch": 0.39, "learning_rate": 3.317139518540664e-05, "loss": 0.5307, "step": 29420 }, { "epoch": 0.39, "learning_rate": 3.316642240745124e-05, "loss": 0.9607, "step": 29425 }, { "epoch": 0.39, "learning_rate": 3.316144926776419e-05, "loss": 0.4406, "step": 29430 }, { "epoch": 0.39, "learning_rate": 3.315647576656576e-05, "loss": 1.6862, "step": 29435 }, { "epoch": 0.39, "learning_rate": 3.3151501904076265e-05, "loss": 0.3164, "step": 29440 }, { "epoch": 0.39, "learning_rate": 3.3146527680516006e-05, "loss": 1.165, "step": 29445 }, { "epoch": 0.39, "learning_rate": 3.314155309610534e-05, "loss": 0.6961, "step": 29450 }, { "epoch": 0.39, "learning_rate": 3.31365781510646e-05, "loss": 0.6942, "step": 29455 }, { "epoch": 0.39, "learning_rate": 3.313160284561415e-05, "loss": 1.3986, "step": 29460 }, { "epoch": 0.39, "learning_rate": 3.312662717997437e-05, "loss": 0.3105, "step": 29465 }, { "epoch": 0.39, "learning_rate": 3.3121651154365674e-05, "loss": 0.8238, "step": 29470 }, { "epoch": 0.39, "learning_rate": 3.311667476900846e-05, "loss": 0.7647, "step": 29475 }, { "epoch": 0.39, "learning_rate": 3.3111698024123164e-05, "loss": 1.6622, "step": 29480 }, { "epoch": 0.4, "learning_rate": 3.310672091993021e-05, "loss": 0.3306, "step": 29485 }, { "epoch": 0.4, "learning_rate": 3.3101743456650085e-05, "loss": 0.9432, "step": 29490 }, { "epoch": 0.4, "learning_rate": 3.309676563450326e-05, "loss": 0.6261, "step": 29495 }, { "epoch": 0.4, "learning_rate": 3.309178745371022e-05, "loss": 1.9708, "step": 29500 }, { "epoch": 0.4, "learning_rate": 3.308680891449148e-05, "loss": 0.8313, "step": 29505 }, { "epoch": 0.4, "learning_rate": 3.308183001706757e-05, "loss": 1.2397, "step": 29510 }, { "epoch": 0.4, "learning_rate": 3.307685076165902e-05, "loss": 0.4819, "step": 29515 }, { "epoch": 0.4, "learning_rate": 3.307187114848638e-05, "loss": 1.3507, "step": 29520 }, { "epoch": 0.4, "learning_rate": 3.306689117777023e-05, "loss": 0.4562, "step": 29525 }, { "epoch": 0.4, "learning_rate": 3.306191084973116e-05, "loss": 0.8266, "step": 29530 }, { "epoch": 0.4, "learning_rate": 3.305693016458978e-05, "loss": 0.6202, "step": 29535 }, { "epoch": 0.4, "learning_rate": 3.305194912256669e-05, "loss": 0.8815, "step": 29540 }, { "epoch": 0.4, "learning_rate": 3.3046967723882536e-05, "loss": 1.0484, "step": 29545 }, { "epoch": 0.4, "learning_rate": 3.3041985968757984e-05, "loss": 1.0679, "step": 29550 }, { "epoch": 0.4, "learning_rate": 3.303700385741367e-05, "loss": 0.4711, "step": 29555 }, { "epoch": 0.4, "learning_rate": 3.30320213900703e-05, "loss": 0.5751, "step": 29560 }, { "epoch": 0.4, "learning_rate": 3.302703856694858e-05, "loss": 0.5511, "step": 29565 }, { "epoch": 0.4, "learning_rate": 3.302205538826919e-05, "loss": 0.5109, "step": 29570 }, { "epoch": 0.4, "learning_rate": 3.301707185425288e-05, "loss": 0.3941, "step": 29575 }, { "epoch": 0.4, "learning_rate": 3.3012087965120405e-05, "loss": 0.1925, "step": 29580 }, { "epoch": 0.4, "learning_rate": 3.300710372109251e-05, "loss": 0.7095, "step": 29585 }, { "epoch": 0.4, "learning_rate": 3.300211912238998e-05, "loss": 0.7967, "step": 29590 }, { "epoch": 0.4, "learning_rate": 3.29971341692336e-05, "loss": 0.6007, "step": 29595 }, { "epoch": 0.4, "learning_rate": 3.299214886184419e-05, "loss": 0.256, "step": 29600 }, { "epoch": 0.4, "learning_rate": 3.2987163200442575e-05, "loss": 0.8446, "step": 29605 }, { "epoch": 0.4, "learning_rate": 3.298217718524958e-05, "loss": 1.0538, "step": 29610 }, { "epoch": 0.4, "learning_rate": 3.297719081648607e-05, "loss": 0.5219, "step": 29615 }, { "epoch": 0.4, "learning_rate": 3.297220409437293e-05, "loss": 1.6243, "step": 29620 }, { "epoch": 0.4, "learning_rate": 3.2967217019131017e-05, "loss": 0.5145, "step": 29625 }, { "epoch": 0.4, "learning_rate": 3.296222959098125e-05, "loss": 0.5984, "step": 29630 }, { "epoch": 0.4, "learning_rate": 3.295724181014454e-05, "loss": 0.8585, "step": 29635 }, { "epoch": 0.4, "learning_rate": 3.295225367684184e-05, "loss": 0.2072, "step": 29640 }, { "epoch": 0.4, "learning_rate": 3.294726519129408e-05, "loss": 0.6553, "step": 29645 }, { "epoch": 0.4, "learning_rate": 3.294227635372223e-05, "loss": 0.7474, "step": 29650 }, { "epoch": 0.4, "learning_rate": 3.2937287164347274e-05, "loss": 0.796, "step": 29655 }, { "epoch": 0.4, "learning_rate": 3.293229762339021e-05, "loss": 0.8461, "step": 29660 }, { "epoch": 0.4, "learning_rate": 3.2927307731072034e-05, "loss": 1.4099, "step": 29665 }, { "epoch": 0.4, "learning_rate": 3.292231748761379e-05, "loss": 0.4744, "step": 29670 }, { "epoch": 0.4, "learning_rate": 3.291732689323652e-05, "loss": 1.1943, "step": 29675 }, { "epoch": 0.4, "learning_rate": 3.291233594816127e-05, "loss": 1.0616, "step": 29680 }, { "epoch": 0.4, "learning_rate": 3.290734465260912e-05, "loss": 0.9337, "step": 29685 }, { "epoch": 0.4, "learning_rate": 3.290235300680117e-05, "loss": 0.5438, "step": 29690 }, { "epoch": 0.4, "learning_rate": 3.2897361010958514e-05, "loss": 1.0176, "step": 29695 }, { "epoch": 0.4, "learning_rate": 3.2892368665302275e-05, "loss": 0.6641, "step": 29700 }, { "epoch": 0.4, "learning_rate": 3.2887375970053584e-05, "loss": 1.0159, "step": 29705 }, { "epoch": 0.4, "learning_rate": 3.28823829254336e-05, "loss": 0.3, "step": 29710 }, { "epoch": 0.4, "learning_rate": 3.287738953166349e-05, "loss": 0.1519, "step": 29715 }, { "epoch": 0.4, "learning_rate": 3.287239578896442e-05, "loss": 0.7483, "step": 29720 }, { "epoch": 0.4, "learning_rate": 3.286740169755762e-05, "loss": 0.1816, "step": 29725 }, { "epoch": 0.4, "learning_rate": 3.2862407257664276e-05, "loss": 0.2385, "step": 29730 }, { "epoch": 0.4, "learning_rate": 3.2857412469505614e-05, "loss": 0.7116, "step": 29735 }, { "epoch": 0.4, "learning_rate": 3.28524173333029e-05, "loss": 0.7599, "step": 29740 }, { "epoch": 0.4, "learning_rate": 3.2847421849277385e-05, "loss": 0.7105, "step": 29745 }, { "epoch": 0.4, "learning_rate": 3.284242601765033e-05, "loss": 1.2231, "step": 29750 }, { "epoch": 0.4, "learning_rate": 3.283742983864305e-05, "loss": 0.3408, "step": 29755 }, { "epoch": 0.4, "learning_rate": 3.283243331247683e-05, "loss": 0.1321, "step": 29760 }, { "epoch": 0.4, "learning_rate": 3.282743643937299e-05, "loss": 1.0587, "step": 29765 }, { "epoch": 0.4, "learning_rate": 3.282243921955289e-05, "loss": 0.6495, "step": 29770 }, { "epoch": 0.4, "learning_rate": 3.281744165323786e-05, "loss": 0.3766, "step": 29775 }, { "epoch": 0.4, "learning_rate": 3.281244374064928e-05, "loss": 0.7919, "step": 29780 }, { "epoch": 0.4, "learning_rate": 3.280744548200853e-05, "loss": 0.9986, "step": 29785 }, { "epoch": 0.4, "learning_rate": 3.280244687753699e-05, "loss": 0.4981, "step": 29790 }, { "epoch": 0.4, "learning_rate": 3.279744792745609e-05, "loss": 0.9357, "step": 29795 }, { "epoch": 0.4, "learning_rate": 3.279244863198727e-05, "loss": 0.1097, "step": 29800 }, { "epoch": 0.4, "learning_rate": 3.278744899135195e-05, "loss": 0.6034, "step": 29805 }, { "epoch": 0.4, "learning_rate": 3.27824490057716e-05, "loss": 0.5475, "step": 29810 }, { "epoch": 0.4, "learning_rate": 3.277744867546769e-05, "loss": 0.4091, "step": 29815 }, { "epoch": 0.4, "learning_rate": 3.277244800066172e-05, "loss": 0.661, "step": 29820 }, { "epoch": 0.4, "learning_rate": 3.2767446981575186e-05, "loss": 0.5762, "step": 29825 }, { "epoch": 0.4, "learning_rate": 3.27624456184296e-05, "loss": 0.352, "step": 29830 }, { "epoch": 0.4, "learning_rate": 3.275744391144653e-05, "loss": 0.8846, "step": 29835 }, { "epoch": 0.4, "learning_rate": 3.275244186084749e-05, "loss": 1.0609, "step": 29840 }, { "epoch": 0.4, "learning_rate": 3.274743946685405e-05, "loss": 1.2, "step": 29845 }, { "epoch": 0.4, "learning_rate": 3.274243672968782e-05, "loss": 0.4488, "step": 29850 }, { "epoch": 0.4, "learning_rate": 3.273743364957037e-05, "loss": 0.6856, "step": 29855 }, { "epoch": 0.4, "learning_rate": 3.273243022672331e-05, "loss": 1.1594, "step": 29860 }, { "epoch": 0.4, "learning_rate": 3.272742646136829e-05, "loss": 1.2273, "step": 29865 }, { "epoch": 0.4, "learning_rate": 3.2722422353726926e-05, "loss": 0.6822, "step": 29870 }, { "epoch": 0.4, "learning_rate": 3.271741790402088e-05, "loss": 1.1331, "step": 29875 }, { "epoch": 0.4, "learning_rate": 3.2712413112471844e-05, "loss": 0.7756, "step": 29880 }, { "epoch": 0.4, "learning_rate": 3.270740797930148e-05, "loss": 0.2217, "step": 29885 }, { "epoch": 0.4, "learning_rate": 3.270240250473151e-05, "loss": 0.8358, "step": 29890 }, { "epoch": 0.4, "learning_rate": 3.2697396688983645e-05, "loss": 0.6998, "step": 29895 }, { "epoch": 0.4, "learning_rate": 3.26923905322796e-05, "loss": 0.2707, "step": 29900 }, { "epoch": 0.4, "learning_rate": 3.268738403484116e-05, "loss": 0.6503, "step": 29905 }, { "epoch": 0.4, "learning_rate": 3.268237719689005e-05, "loss": 0.8045, "step": 29910 }, { "epoch": 0.4, "learning_rate": 3.2677370018648065e-05, "loss": 0.1975, "step": 29915 }, { "epoch": 0.4, "learning_rate": 3.267236250033701e-05, "loss": 1.3179, "step": 29920 }, { "epoch": 0.4, "learning_rate": 3.2667354642178665e-05, "loss": 0.7669, "step": 29925 }, { "epoch": 0.4, "learning_rate": 3.266234644439487e-05, "loss": 1.1352, "step": 29930 }, { "epoch": 0.4, "learning_rate": 3.2657337907207467e-05, "loss": 0.9384, "step": 29935 }, { "epoch": 0.4, "learning_rate": 3.26523290308383e-05, "loss": 0.6942, "step": 29940 }, { "epoch": 0.4, "learning_rate": 3.264731981550924e-05, "loss": 0.2737, "step": 29945 }, { "epoch": 0.4, "learning_rate": 3.264231026144218e-05, "loss": 1.1165, "step": 29950 }, { "epoch": 0.4, "learning_rate": 3.263730036885899e-05, "loss": 0.7503, "step": 29955 }, { "epoch": 0.4, "learning_rate": 3.2632290137981615e-05, "loss": 0.6554, "step": 29960 }, { "epoch": 0.4, "learning_rate": 3.2627279569031965e-05, "loss": 0.5958, "step": 29965 }, { "epoch": 0.4, "learning_rate": 3.2622268662231995e-05, "loss": 0.4408, "step": 29970 }, { "epoch": 0.4, "learning_rate": 3.261725741780365e-05, "loss": 0.9872, "step": 29975 }, { "epoch": 0.4, "learning_rate": 3.261224583596891e-05, "loss": 0.6927, "step": 29980 }, { "epoch": 0.4, "learning_rate": 3.2607233916949756e-05, "loss": 0.6329, "step": 29985 }, { "epoch": 0.4, "learning_rate": 3.260222166096821e-05, "loss": 1.2735, "step": 29990 }, { "epoch": 0.4, "learning_rate": 3.259720906824627e-05, "loss": 0.3883, "step": 29995 }, { "epoch": 0.4, "learning_rate": 3.259219613900598e-05, "loss": 0.5028, "step": 30000 }, { "epoch": 0.4, "learning_rate": 3.258718287346938e-05, "loss": 0.6, "step": 30005 }, { "epoch": 0.4, "learning_rate": 3.2582169271858534e-05, "loss": 0.5745, "step": 30010 }, { "epoch": 0.4, "learning_rate": 3.257715533439552e-05, "loss": 0.9878, "step": 30015 }, { "epoch": 0.4, "learning_rate": 3.257214106130244e-05, "loss": 0.6634, "step": 30020 }, { "epoch": 0.4, "learning_rate": 3.25671264528014e-05, "loss": 0.5303, "step": 30025 }, { "epoch": 0.4, "learning_rate": 3.25621115091145e-05, "loss": 0.4611, "step": 30030 }, { "epoch": 0.4, "learning_rate": 3.25570962304639e-05, "loss": 0.468, "step": 30035 }, { "epoch": 0.4, "learning_rate": 3.255208061707174e-05, "loss": 0.123, "step": 30040 }, { "epoch": 0.4, "learning_rate": 3.254706466916019e-05, "loss": 1.0365, "step": 30045 }, { "epoch": 0.4, "learning_rate": 3.2542048386951436e-05, "loss": 0.3339, "step": 30050 }, { "epoch": 0.4, "learning_rate": 3.2537031770667664e-05, "loss": 1.0082, "step": 30055 }, { "epoch": 0.4, "learning_rate": 3.2532014820531093e-05, "loss": 0.5138, "step": 30060 }, { "epoch": 0.4, "learning_rate": 3.2526997536763946e-05, "loss": 0.9841, "step": 30065 }, { "epoch": 0.4, "learning_rate": 3.2521979919588475e-05, "loss": 0.7426, "step": 30070 }, { "epoch": 0.4, "learning_rate": 3.251696196922692e-05, "loss": 0.4212, "step": 30075 }, { "epoch": 0.4, "learning_rate": 3.2511943685901545e-05, "loss": 0.5152, "step": 30080 }, { "epoch": 0.4, "learning_rate": 3.250692506983466e-05, "loss": 0.3495, "step": 30085 }, { "epoch": 0.4, "learning_rate": 3.250190612124854e-05, "loss": 0.6338, "step": 30090 }, { "epoch": 0.4, "learning_rate": 3.2496886840365516e-05, "loss": 1.0662, "step": 30095 }, { "epoch": 0.4, "learning_rate": 3.249186722740791e-05, "loss": 1.0578, "step": 30100 }, { "epoch": 0.4, "learning_rate": 3.2486847282598066e-05, "loss": 0.1877, "step": 30105 }, { "epoch": 0.4, "learning_rate": 3.248182700615834e-05, "loss": 1.5111, "step": 30110 }, { "epoch": 0.4, "learning_rate": 3.247680639831111e-05, "loss": 1.0192, "step": 30115 }, { "epoch": 0.4, "learning_rate": 3.2471785459278756e-05, "loss": 0.9749, "step": 30120 }, { "epoch": 0.4, "learning_rate": 3.24667641892837e-05, "loss": 0.8003, "step": 30125 }, { "epoch": 0.4, "learning_rate": 3.246174258854834e-05, "loss": 0.6971, "step": 30130 }, { "epoch": 0.4, "learning_rate": 3.2456720657295106e-05, "loss": 0.6415, "step": 30135 }, { "epoch": 0.4, "learning_rate": 3.245169839574646e-05, "loss": 0.6535, "step": 30140 }, { "epoch": 0.4, "learning_rate": 3.244667580412485e-05, "loss": 0.8255, "step": 30145 }, { "epoch": 0.4, "learning_rate": 3.2441652882652756e-05, "loss": 1.2864, "step": 30150 }, { "epoch": 0.4, "learning_rate": 3.243662963155267e-05, "loss": 0.677, "step": 30155 }, { "epoch": 0.4, "learning_rate": 3.2431606051047104e-05, "loss": 0.8703, "step": 30160 }, { "epoch": 0.4, "learning_rate": 3.242658214135856e-05, "loss": 0.1324, "step": 30165 }, { "epoch": 0.4, "learning_rate": 3.242155790270958e-05, "loss": 0.3075, "step": 30170 }, { "epoch": 0.4, "learning_rate": 3.241653333532271e-05, "loss": 0.8154, "step": 30175 }, { "epoch": 0.4, "learning_rate": 3.241150843942053e-05, "loss": 0.926, "step": 30180 }, { "epoch": 0.4, "learning_rate": 3.2406483215225606e-05, "loss": 1.0035, "step": 30185 }, { "epoch": 0.4, "learning_rate": 3.240145766296051e-05, "loss": 0.7105, "step": 30190 }, { "epoch": 0.4, "learning_rate": 3.2396431782847886e-05, "loss": 0.6863, "step": 30195 }, { "epoch": 0.4, "learning_rate": 3.239140557511033e-05, "loss": 1.5834, "step": 30200 }, { "epoch": 0.4, "learning_rate": 3.238637903997048e-05, "loss": 0.8231, "step": 30205 }, { "epoch": 0.4, "learning_rate": 3.2381352177650995e-05, "loss": 1.3525, "step": 30210 }, { "epoch": 0.4, "learning_rate": 3.2376324988374546e-05, "loss": 0.5155, "step": 30215 }, { "epoch": 0.4, "learning_rate": 3.237129747236379e-05, "loss": 1.3863, "step": 30220 }, { "epoch": 0.4, "learning_rate": 3.236626962984144e-05, "loss": 1.0388, "step": 30225 }, { "epoch": 0.41, "learning_rate": 3.236124146103019e-05, "loss": 0.6342, "step": 30230 }, { "epoch": 0.41, "learning_rate": 3.2356212966152776e-05, "loss": 0.5613, "step": 30235 }, { "epoch": 0.41, "learning_rate": 3.235118414543193e-05, "loss": 0.6573, "step": 30240 }, { "epoch": 0.41, "learning_rate": 3.2346154999090404e-05, "loss": 0.6402, "step": 30245 }, { "epoch": 0.41, "learning_rate": 3.2341125527350966e-05, "loss": 0.3512, "step": 30250 }, { "epoch": 0.41, "learning_rate": 3.233609573043639e-05, "loss": 0.2672, "step": 30255 }, { "epoch": 0.41, "learning_rate": 3.233106560856947e-05, "loss": 0.684, "step": 30260 }, { "epoch": 0.41, "learning_rate": 3.2326035161973026e-05, "loss": 0.8482, "step": 30265 }, { "epoch": 0.41, "learning_rate": 3.232100439086988e-05, "loss": 0.8224, "step": 30270 }, { "epoch": 0.41, "learning_rate": 3.2315973295482856e-05, "loss": 0.599, "step": 30275 }, { "epoch": 0.41, "learning_rate": 3.2310941876034815e-05, "loss": 0.7283, "step": 30280 }, { "epoch": 0.41, "learning_rate": 3.230591013274862e-05, "loss": 0.8375, "step": 30285 }, { "epoch": 0.41, "learning_rate": 3.230087806584717e-05, "loss": 0.4957, "step": 30290 }, { "epoch": 0.41, "learning_rate": 3.229584567555334e-05, "loss": 0.3967, "step": 30295 }, { "epoch": 0.41, "learning_rate": 3.229081296209005e-05, "loss": 0.5243, "step": 30300 }, { "epoch": 0.41, "learning_rate": 3.228577992568022e-05, "loss": 0.8884, "step": 30305 }, { "epoch": 0.41, "learning_rate": 3.2280746566546786e-05, "loss": 0.6799, "step": 30310 }, { "epoch": 0.41, "learning_rate": 3.22757128849127e-05, "loss": 0.6722, "step": 30315 }, { "epoch": 0.41, "learning_rate": 3.2270678881000936e-05, "loss": 0.986, "step": 30320 }, { "epoch": 0.41, "learning_rate": 3.226564455503448e-05, "loss": 0.7173, "step": 30325 }, { "epoch": 0.41, "learning_rate": 3.226060990723631e-05, "loss": 1.0774, "step": 30330 }, { "epoch": 0.41, "learning_rate": 3.2255574937829443e-05, "loss": 0.4013, "step": 30335 }, { "epoch": 0.41, "learning_rate": 3.22505396470369e-05, "loss": 0.914, "step": 30340 }, { "epoch": 0.41, "learning_rate": 3.224550403508174e-05, "loss": 0.8656, "step": 30345 }, { "epoch": 0.41, "learning_rate": 3.224046810218699e-05, "loss": 1.1124, "step": 30350 }, { "epoch": 0.41, "learning_rate": 3.2235431848575724e-05, "loss": 0.3451, "step": 30355 }, { "epoch": 0.41, "learning_rate": 3.2230395274471034e-05, "loss": 0.7184, "step": 30360 }, { "epoch": 0.41, "learning_rate": 3.2225358380095996e-05, "loss": 0.517, "step": 30365 }, { "epoch": 0.41, "learning_rate": 3.2220321165673733e-05, "loss": 0.7479, "step": 30370 }, { "epoch": 0.41, "learning_rate": 3.221528363142737e-05, "loss": 1.3136, "step": 30375 }, { "epoch": 0.41, "learning_rate": 3.2210245777580035e-05, "loss": 1.5373, "step": 30380 }, { "epoch": 0.41, "learning_rate": 3.2205207604354884e-05, "loss": 0.8639, "step": 30385 }, { "epoch": 0.41, "learning_rate": 3.220016911197508e-05, "loss": 1.2509, "step": 30390 }, { "epoch": 0.41, "learning_rate": 3.21951303006638e-05, "loss": 0.6764, "step": 30395 }, { "epoch": 0.41, "learning_rate": 3.219009117064425e-05, "loss": 0.6176, "step": 30400 }, { "epoch": 0.41, "learning_rate": 3.218505172213964e-05, "loss": 0.8382, "step": 30405 }, { "epoch": 0.41, "learning_rate": 3.2180011955373174e-05, "loss": 0.8089, "step": 30410 }, { "epoch": 0.41, "learning_rate": 3.217497187056811e-05, "loss": 0.8125, "step": 30415 }, { "epoch": 0.41, "learning_rate": 3.216993146794767e-05, "loss": 1.084, "step": 30420 }, { "epoch": 0.41, "learning_rate": 3.2164890747735146e-05, "loss": 1.2753, "step": 30425 }, { "epoch": 0.41, "learning_rate": 3.21598497101538e-05, "loss": 0.9153, "step": 30430 }, { "epoch": 0.41, "learning_rate": 3.2154808355426945e-05, "loss": 0.6046, "step": 30435 }, { "epoch": 0.41, "learning_rate": 3.2149766683777866e-05, "loss": 0.6375, "step": 30440 }, { "epoch": 0.41, "learning_rate": 3.214472469542989e-05, "loss": 0.8265, "step": 30445 }, { "epoch": 0.41, "learning_rate": 3.2139682390606354e-05, "loss": 1.0059, "step": 30450 }, { "epoch": 0.41, "learning_rate": 3.2134639769530614e-05, "loss": 1.0906, "step": 30455 }, { "epoch": 0.41, "learning_rate": 3.212959683242602e-05, "loss": 0.6255, "step": 30460 }, { "epoch": 0.41, "learning_rate": 3.212455357951596e-05, "loss": 0.9004, "step": 30465 }, { "epoch": 0.41, "learning_rate": 3.211951001102381e-05, "loss": 1.3826, "step": 30470 }, { "epoch": 0.41, "learning_rate": 3.211446612717299e-05, "loss": 0.431, "step": 30475 }, { "epoch": 0.41, "learning_rate": 3.210942192818691e-05, "loss": 1.1597, "step": 30480 }, { "epoch": 0.41, "learning_rate": 3.210437741428901e-05, "loss": 1.1295, "step": 30485 }, { "epoch": 0.41, "learning_rate": 3.209933258570274e-05, "loss": 1.1086, "step": 30490 }, { "epoch": 0.41, "learning_rate": 3.209428744265154e-05, "loss": 0.6624, "step": 30495 }, { "epoch": 0.41, "learning_rate": 3.20892419853589e-05, "loss": 0.7061, "step": 30500 }, { "epoch": 0.41, "learning_rate": 3.2084196214048305e-05, "loss": 0.9133, "step": 30505 }, { "epoch": 0.41, "learning_rate": 3.207915012894327e-05, "loss": 1.1287, "step": 30510 }, { "epoch": 0.41, "learning_rate": 3.2074103730267294e-05, "loss": 0.3077, "step": 30515 }, { "epoch": 0.41, "learning_rate": 3.206905701824391e-05, "loss": 0.5792, "step": 30520 }, { "epoch": 0.41, "learning_rate": 3.2064009993096665e-05, "loss": 0.8353, "step": 30525 }, { "epoch": 0.41, "learning_rate": 3.205896265504912e-05, "loss": 0.4275, "step": 30530 }, { "epoch": 0.41, "learning_rate": 3.2053915004324844e-05, "loss": 0.3596, "step": 30535 }, { "epoch": 0.41, "learning_rate": 3.2048867041147424e-05, "loss": 0.6465, "step": 30540 }, { "epoch": 0.41, "learning_rate": 3.204381876574046e-05, "loss": 1.227, "step": 30545 }, { "epoch": 0.41, "learning_rate": 3.203877017832756e-05, "loss": 0.9774, "step": 30550 }, { "epoch": 0.41, "learning_rate": 3.203372127913236e-05, "loss": 1.1531, "step": 30555 }, { "epoch": 0.41, "learning_rate": 3.202867206837849e-05, "loss": 0.9975, "step": 30560 }, { "epoch": 0.41, "learning_rate": 3.202362254628961e-05, "loss": 0.5979, "step": 30565 }, { "epoch": 0.41, "learning_rate": 3.201857271308939e-05, "loss": 0.3522, "step": 30570 }, { "epoch": 0.41, "learning_rate": 3.201352256900152e-05, "loss": 0.9167, "step": 30575 }, { "epoch": 0.41, "learning_rate": 3.200847211424968e-05, "loss": 0.444, "step": 30580 }, { "epoch": 0.41, "learning_rate": 3.200342134905759e-05, "loss": 0.5936, "step": 30585 }, { "epoch": 0.41, "learning_rate": 3.199837027364897e-05, "loss": 0.4294, "step": 30590 }, { "epoch": 0.41, "learning_rate": 3.199331888824756e-05, "loss": 1.0548, "step": 30595 }, { "epoch": 0.41, "learning_rate": 3.198826719307711e-05, "loss": 0.6605, "step": 30600 }, { "epoch": 0.41, "learning_rate": 3.198321518836138e-05, "loss": 0.7041, "step": 30605 }, { "epoch": 0.41, "learning_rate": 3.197816287432416e-05, "loss": 0.3789, "step": 30610 }, { "epoch": 0.41, "learning_rate": 3.197311025118923e-05, "loss": 0.6984, "step": 30615 }, { "epoch": 0.41, "learning_rate": 3.19680573191804e-05, "loss": 0.4393, "step": 30620 }, { "epoch": 0.41, "learning_rate": 3.1963004078521496e-05, "loss": 0.5215, "step": 30625 }, { "epoch": 0.41, "learning_rate": 3.195795052943634e-05, "loss": 0.9913, "step": 30630 }, { "epoch": 0.41, "learning_rate": 3.19528966721488e-05, "loss": 0.8676, "step": 30635 }, { "epoch": 0.41, "learning_rate": 3.1947842506882704e-05, "loss": 0.6775, "step": 30640 }, { "epoch": 0.41, "learning_rate": 3.194278803386195e-05, "loss": 1.0698, "step": 30645 }, { "epoch": 0.41, "learning_rate": 3.193773325331042e-05, "loss": 0.3991, "step": 30650 }, { "epoch": 0.41, "learning_rate": 3.193267816545202e-05, "loss": 0.888, "step": 30655 }, { "epoch": 0.41, "learning_rate": 3.192762277051066e-05, "loss": 0.3815, "step": 30660 }, { "epoch": 0.41, "learning_rate": 3.192256706871026e-05, "loss": 0.7575, "step": 30665 }, { "epoch": 0.41, "learning_rate": 3.1917511060274774e-05, "loss": 1.1909, "step": 30670 }, { "epoch": 0.41, "learning_rate": 3.191245474542816e-05, "loss": 0.9041, "step": 30675 }, { "epoch": 0.41, "learning_rate": 3.1907398124394385e-05, "loss": 0.5639, "step": 30680 }, { "epoch": 0.41, "learning_rate": 3.190234119739742e-05, "loss": 0.5903, "step": 30685 }, { "epoch": 0.41, "learning_rate": 3.189728396466127e-05, "loss": 0.7554, "step": 30690 }, { "epoch": 0.41, "learning_rate": 3.189222642640996e-05, "loss": 0.8798, "step": 30695 }, { "epoch": 0.41, "learning_rate": 3.188716858286749e-05, "loss": 1.135, "step": 30700 }, { "epoch": 0.41, "learning_rate": 3.1882110434257914e-05, "loss": 0.4576, "step": 30705 }, { "epoch": 0.41, "learning_rate": 3.187705198080527e-05, "loss": 0.9089, "step": 30710 }, { "epoch": 0.41, "learning_rate": 3.187199322273363e-05, "loss": 0.7039, "step": 30715 }, { "epoch": 0.41, "learning_rate": 3.186693416026707e-05, "loss": 1.1944, "step": 30720 }, { "epoch": 0.41, "learning_rate": 3.1861874793629684e-05, "loss": 1.5006, "step": 30725 }, { "epoch": 0.41, "learning_rate": 3.1856815123045567e-05, "loss": 0.7739, "step": 30730 }, { "epoch": 0.41, "learning_rate": 3.1851755148738846e-05, "loss": 0.499, "step": 30735 }, { "epoch": 0.41, "learning_rate": 3.1846694870933654e-05, "loss": 1.1664, "step": 30740 }, { "epoch": 0.41, "learning_rate": 3.184163428985413e-05, "loss": 0.3864, "step": 30745 }, { "epoch": 0.41, "learning_rate": 3.183657340572444e-05, "loss": 0.504, "step": 30750 }, { "epoch": 0.41, "learning_rate": 3.1832524480375196e-05, "loss": 0.6495, "step": 30755 }, { "epoch": 0.41, "learning_rate": 3.182746305132011e-05, "loss": 0.3792, "step": 30760 }, { "epoch": 0.41, "learning_rate": 3.182240131984257e-05, "loss": 0.7403, "step": 30765 }, { "epoch": 0.41, "learning_rate": 3.1817339286166786e-05, "loss": 1.0269, "step": 30770 }, { "epoch": 0.41, "learning_rate": 3.181227695051697e-05, "loss": 0.4211, "step": 30775 }, { "epoch": 0.41, "learning_rate": 3.180721431311738e-05, "loss": 0.607, "step": 30780 }, { "epoch": 0.41, "learning_rate": 3.180215137419223e-05, "loss": 1.049, "step": 30785 }, { "epoch": 0.41, "learning_rate": 3.1797088133965824e-05, "loss": 0.7357, "step": 30790 }, { "epoch": 0.41, "learning_rate": 3.1792024592662416e-05, "loss": 0.4576, "step": 30795 }, { "epoch": 0.41, "learning_rate": 3.1786960750506295e-05, "loss": 0.5515, "step": 30800 }, { "epoch": 0.41, "learning_rate": 3.178189660772176e-05, "loss": 0.4008, "step": 30805 }, { "epoch": 0.41, "learning_rate": 3.1776832164533146e-05, "loss": 1.6337, "step": 30810 }, { "epoch": 0.41, "learning_rate": 3.1771767421164754e-05, "loss": 1.3445, "step": 30815 }, { "epoch": 0.41, "learning_rate": 3.176670237784096e-05, "loss": 1.6009, "step": 30820 }, { "epoch": 0.41, "learning_rate": 3.17616370347861e-05, "loss": 0.8343, "step": 30825 }, { "epoch": 0.41, "learning_rate": 3.175657139222453e-05, "loss": 0.5076, "step": 30830 }, { "epoch": 0.41, "learning_rate": 3.175150545038067e-05, "loss": 0.5452, "step": 30835 }, { "epoch": 0.41, "learning_rate": 3.174643920947888e-05, "loss": 0.8567, "step": 30840 }, { "epoch": 0.41, "learning_rate": 3.17413726697436e-05, "loss": 1.2108, "step": 30845 }, { "epoch": 0.41, "learning_rate": 3.173630583139923e-05, "loss": 0.6971, "step": 30850 }, { "epoch": 0.41, "learning_rate": 3.1731238694670215e-05, "loss": 1.2636, "step": 30855 }, { "epoch": 0.41, "learning_rate": 3.172617125978099e-05, "loss": 0.5658, "step": 30860 }, { "epoch": 0.41, "learning_rate": 3.172110352695604e-05, "loss": 1.1492, "step": 30865 }, { "epoch": 0.41, "learning_rate": 3.171603549641982e-05, "loss": 0.8568, "step": 30870 }, { "epoch": 0.41, "learning_rate": 3.1710967168396836e-05, "loss": 0.7315, "step": 30875 }, { "epoch": 0.41, "learning_rate": 3.1705898543111575e-05, "loss": 0.4679, "step": 30880 }, { "epoch": 0.41, "learning_rate": 3.1700829620788556e-05, "loss": 0.5489, "step": 30885 }, { "epoch": 0.41, "learning_rate": 3.169576040165231e-05, "loss": 0.9364, "step": 30890 }, { "epoch": 0.41, "learning_rate": 3.169069088592737e-05, "loss": 0.6285, "step": 30895 }, { "epoch": 0.41, "learning_rate": 3.1685621073838306e-05, "loss": 0.3764, "step": 30900 }, { "epoch": 0.41, "learning_rate": 3.168055096560967e-05, "loss": 0.7061, "step": 30905 }, { "epoch": 0.41, "learning_rate": 3.167548056146605e-05, "loss": 0.2545, "step": 30910 }, { "epoch": 0.41, "learning_rate": 3.167040986163203e-05, "loss": 0.8169, "step": 30915 }, { "epoch": 0.41, "learning_rate": 3.166533886633224e-05, "loss": 1.7627, "step": 30920 }, { "epoch": 0.41, "learning_rate": 3.166026757579127e-05, "loss": 0.5939, "step": 30925 }, { "epoch": 0.41, "learning_rate": 3.1655195990233775e-05, "loss": 0.638, "step": 30930 }, { "epoch": 0.41, "learning_rate": 3.165012410988439e-05, "loss": 0.428, "step": 30935 }, { "epoch": 0.41, "learning_rate": 3.164505193496777e-05, "loss": 1.3914, "step": 30940 }, { "epoch": 0.41, "learning_rate": 3.1639979465708606e-05, "loss": 0.5733, "step": 30945 }, { "epoch": 0.41, "learning_rate": 3.163490670233156e-05, "loss": 0.7168, "step": 30950 }, { "epoch": 0.41, "learning_rate": 3.1629833645061346e-05, "loss": 0.5082, "step": 30955 }, { "epoch": 0.41, "learning_rate": 3.162476029412267e-05, "loss": 0.6515, "step": 30960 }, { "epoch": 0.41, "learning_rate": 3.161968664974025e-05, "loss": 0.6402, "step": 30965 }, { "epoch": 0.41, "learning_rate": 3.1614612712138824e-05, "loss": 1.3404, "step": 30970 }, { "epoch": 0.42, "learning_rate": 3.1609538481543164e-05, "loss": 0.6304, "step": 30975 }, { "epoch": 0.42, "learning_rate": 3.1604463958178e-05, "loss": 0.4017, "step": 30980 }, { "epoch": 0.42, "learning_rate": 3.159938914226813e-05, "loss": 0.811, "step": 30985 }, { "epoch": 0.42, "learning_rate": 3.159431403403834e-05, "loss": 0.4456, "step": 30990 }, { "epoch": 0.42, "learning_rate": 3.158923863371342e-05, "loss": 1.2377, "step": 30995 }, { "epoch": 0.42, "learning_rate": 3.15841629415182e-05, "loss": 0.7143, "step": 31000 }, { "epoch": 0.42, "learning_rate": 3.157908695767749e-05, "loss": 1.1555, "step": 31005 }, { "epoch": 0.42, "learning_rate": 3.157401068241616e-05, "loss": 0.8483, "step": 31010 }, { "epoch": 0.42, "learning_rate": 3.156893411595904e-05, "loss": 0.6444, "step": 31015 }, { "epoch": 0.42, "learning_rate": 3.1563857258530997e-05, "loss": 0.6583, "step": 31020 }, { "epoch": 0.42, "learning_rate": 3.155878011035692e-05, "loss": 0.914, "step": 31025 }, { "epoch": 0.42, "learning_rate": 3.1553702671661695e-05, "loss": 0.3096, "step": 31030 }, { "epoch": 0.42, "learning_rate": 3.154862494267022e-05, "loss": 0.7695, "step": 31035 }, { "epoch": 0.42, "learning_rate": 3.1543546923607436e-05, "loss": 0.6905, "step": 31040 }, { "epoch": 0.42, "learning_rate": 3.153846861469825e-05, "loss": 0.4239, "step": 31045 }, { "epoch": 0.42, "learning_rate": 3.153339001616762e-05, "loss": 0.5653, "step": 31050 }, { "epoch": 0.42, "learning_rate": 3.1528311128240495e-05, "loss": 0.5674, "step": 31055 }, { "epoch": 0.42, "learning_rate": 3.152323195114184e-05, "loss": 0.565, "step": 31060 }, { "epoch": 0.42, "learning_rate": 3.1518152485096665e-05, "loss": 1.0833, "step": 31065 }, { "epoch": 0.42, "learning_rate": 3.151307273032993e-05, "loss": 0.5371, "step": 31070 }, { "epoch": 0.42, "learning_rate": 3.150799268706666e-05, "loss": 0.7849, "step": 31075 }, { "epoch": 0.42, "learning_rate": 3.150291235553187e-05, "loss": 1.6721, "step": 31080 }, { "epoch": 0.42, "learning_rate": 3.14978317359506e-05, "loss": 0.9079, "step": 31085 }, { "epoch": 0.42, "learning_rate": 3.1492750828547884e-05, "loss": 1.457, "step": 31090 }, { "epoch": 0.42, "learning_rate": 3.14876696335488e-05, "loss": 0.8844, "step": 31095 }, { "epoch": 0.42, "learning_rate": 3.1482588151178396e-05, "loss": 1.0555, "step": 31100 }, { "epoch": 0.42, "learning_rate": 3.147750638166177e-05, "loss": 0.7152, "step": 31105 }, { "epoch": 0.42, "learning_rate": 3.1472424325224025e-05, "loss": 0.7312, "step": 31110 }, { "epoch": 0.42, "learning_rate": 3.146734198209026e-05, "loss": 0.796, "step": 31115 }, { "epoch": 0.42, "learning_rate": 3.14622593524856e-05, "loss": 0.139, "step": 31120 }, { "epoch": 0.42, "learning_rate": 3.145717643663518e-05, "loss": 0.823, "step": 31125 }, { "epoch": 0.42, "learning_rate": 3.1452093234764144e-05, "loss": 1.1425, "step": 31130 }, { "epoch": 0.42, "learning_rate": 3.144700974709765e-05, "loss": 0.5653, "step": 31135 }, { "epoch": 0.42, "learning_rate": 3.1441925973860894e-05, "loss": 0.9816, "step": 31140 }, { "epoch": 0.42, "learning_rate": 3.1436841915279045e-05, "loss": 1.1799, "step": 31145 }, { "epoch": 0.42, "learning_rate": 3.14317575715773e-05, "loss": 0.8003, "step": 31150 }, { "epoch": 0.42, "learning_rate": 3.142667294298086e-05, "loss": 0.5645, "step": 31155 }, { "epoch": 0.42, "learning_rate": 3.1421588029714964e-05, "loss": 0.1845, "step": 31160 }, { "epoch": 0.42, "learning_rate": 3.1416502832004853e-05, "loss": 0.7281, "step": 31165 }, { "epoch": 0.42, "learning_rate": 3.1411417350075765e-05, "loss": 0.7885, "step": 31170 }, { "epoch": 0.42, "learning_rate": 3.140633158415296e-05, "loss": 1.5627, "step": 31175 }, { "epoch": 0.42, "learning_rate": 3.140124553446171e-05, "loss": 0.6175, "step": 31180 }, { "epoch": 0.42, "learning_rate": 3.139615920122732e-05, "loss": 0.5819, "step": 31185 }, { "epoch": 0.42, "learning_rate": 3.1391072584675065e-05, "loss": 0.6986, "step": 31190 }, { "epoch": 0.42, "learning_rate": 3.138598568503028e-05, "loss": 0.7183, "step": 31195 }, { "epoch": 0.42, "learning_rate": 3.1380898502518265e-05, "loss": 0.7293, "step": 31200 }, { "epoch": 0.42, "learning_rate": 3.137581103736438e-05, "loss": 0.757, "step": 31205 }, { "epoch": 0.42, "learning_rate": 3.137072328979395e-05, "loss": 1.0087, "step": 31210 }, { "epoch": 0.42, "learning_rate": 3.136563526003236e-05, "loss": 1.0705, "step": 31215 }, { "epoch": 0.42, "learning_rate": 3.136054694830497e-05, "loss": 0.8145, "step": 31220 }, { "epoch": 0.42, "learning_rate": 3.135545835483718e-05, "loss": 0.599, "step": 31225 }, { "epoch": 0.42, "learning_rate": 3.135036947985437e-05, "loss": 0.296, "step": 31230 }, { "epoch": 0.42, "learning_rate": 3.1345280323581966e-05, "loss": 1.1437, "step": 31235 }, { "epoch": 0.42, "learning_rate": 3.1340190886245377e-05, "loss": 0.5081, "step": 31240 }, { "epoch": 0.42, "learning_rate": 3.133510116807007e-05, "loss": 0.7734, "step": 31245 }, { "epoch": 0.42, "learning_rate": 3.133001116928146e-05, "loss": 0.738, "step": 31250 }, { "epoch": 0.42, "learning_rate": 3.132492089010504e-05, "loss": 0.9485, "step": 31255 }, { "epoch": 0.42, "learning_rate": 3.131983033076625e-05, "loss": 1.2341, "step": 31260 }, { "epoch": 0.42, "learning_rate": 3.13147394914906e-05, "loss": 0.2593, "step": 31265 }, { "epoch": 0.42, "learning_rate": 3.130964837250358e-05, "loss": 1.1979, "step": 31270 }, { "epoch": 0.42, "learning_rate": 3.130455697403071e-05, "loss": 0.7077, "step": 31275 }, { "epoch": 0.42, "learning_rate": 3.1299465296297504e-05, "loss": 1.3887, "step": 31280 }, { "epoch": 0.42, "learning_rate": 3.1294373339529494e-05, "loss": 1.1176, "step": 31285 }, { "epoch": 0.42, "learning_rate": 3.128928110395224e-05, "loss": 0.2596, "step": 31290 }, { "epoch": 0.42, "learning_rate": 3.128418858979129e-05, "loss": 0.5462, "step": 31295 }, { "epoch": 0.42, "learning_rate": 3.127909579727223e-05, "loss": 0.4901, "step": 31300 }, { "epoch": 0.42, "learning_rate": 3.1274002726620645e-05, "loss": 0.1371, "step": 31305 }, { "epoch": 0.42, "learning_rate": 3.1268909378062124e-05, "loss": 0.7791, "step": 31310 }, { "epoch": 0.42, "learning_rate": 3.126381575182228e-05, "loss": 0.4245, "step": 31315 }, { "epoch": 0.42, "learning_rate": 3.1258721848126735e-05, "loss": 1.2318, "step": 31320 }, { "epoch": 0.42, "learning_rate": 3.125362766720111e-05, "loss": 1.2233, "step": 31325 }, { "epoch": 0.42, "learning_rate": 3.1248533209271085e-05, "loss": 0.6145, "step": 31330 }, { "epoch": 0.42, "learning_rate": 3.1243438474562295e-05, "loss": 0.9678, "step": 31335 }, { "epoch": 0.42, "learning_rate": 3.1238343463300405e-05, "loss": 0.7884, "step": 31340 }, { "epoch": 0.42, "learning_rate": 3.123324817571112e-05, "loss": 1.6241, "step": 31345 }, { "epoch": 0.42, "learning_rate": 3.1228152612020114e-05, "loss": 0.9047, "step": 31350 }, { "epoch": 0.42, "learning_rate": 3.122305677245312e-05, "loss": 0.5267, "step": 31355 }, { "epoch": 0.42, "learning_rate": 3.121796065723583e-05, "loss": 0.8395, "step": 31360 }, { "epoch": 0.42, "learning_rate": 3.1212864266594e-05, "loss": 1.0435, "step": 31365 }, { "epoch": 0.42, "learning_rate": 3.120776760075337e-05, "loss": 0.9985, "step": 31370 }, { "epoch": 0.42, "learning_rate": 3.1202670659939676e-05, "loss": 1.8042, "step": 31375 }, { "epoch": 0.42, "learning_rate": 3.1197573444378706e-05, "loss": 0.4487, "step": 31380 }, { "epoch": 0.42, "learning_rate": 3.119247595429625e-05, "loss": 0.7588, "step": 31385 }, { "epoch": 0.42, "learning_rate": 3.118737818991808e-05, "loss": 1.1406, "step": 31390 }, { "epoch": 0.42, "learning_rate": 3.118228015147001e-05, "loss": 1.1463, "step": 31395 }, { "epoch": 0.42, "learning_rate": 3.117718183917787e-05, "loss": 0.6479, "step": 31400 }, { "epoch": 0.42, "learning_rate": 3.117208325326746e-05, "loss": 0.2711, "step": 31405 }, { "epoch": 0.42, "learning_rate": 3.116698439396465e-05, "loss": 0.7172, "step": 31410 }, { "epoch": 0.42, "learning_rate": 3.116188526149528e-05, "loss": 0.6584, "step": 31415 }, { "epoch": 0.42, "learning_rate": 3.115678585608523e-05, "loss": 0.4037, "step": 31420 }, { "epoch": 0.42, "learning_rate": 3.115168617796035e-05, "loss": 0.2291, "step": 31425 }, { "epoch": 0.42, "learning_rate": 3.1146586227346556e-05, "loss": 0.8248, "step": 31430 }, { "epoch": 0.42, "learning_rate": 3.114148600446975e-05, "loss": 0.8688, "step": 31435 }, { "epoch": 0.42, "learning_rate": 3.113638550955583e-05, "loss": 0.1966, "step": 31440 }, { "epoch": 0.42, "learning_rate": 3.113128474283074e-05, "loss": 0.654, "step": 31445 }, { "epoch": 0.42, "learning_rate": 3.11261837045204e-05, "loss": 0.8078, "step": 31450 }, { "epoch": 0.42, "learning_rate": 3.112108239485078e-05, "loss": 1.0863, "step": 31455 }, { "epoch": 0.42, "learning_rate": 3.111598081404782e-05, "loss": 0.5363, "step": 31460 }, { "epoch": 0.42, "learning_rate": 3.111087896233752e-05, "loss": 0.944, "step": 31465 }, { "epoch": 0.42, "learning_rate": 3.110577683994585e-05, "loss": 0.9981, "step": 31470 }, { "epoch": 0.42, "learning_rate": 3.110067444709881e-05, "loss": 0.6486, "step": 31475 }, { "epoch": 0.42, "learning_rate": 3.109557178402241e-05, "loss": 0.7593, "step": 31480 }, { "epoch": 0.42, "learning_rate": 3.109046885094268e-05, "loss": 0.4353, "step": 31485 }, { "epoch": 0.42, "learning_rate": 3.1085365648085647e-05, "loss": 0.3819, "step": 31490 }, { "epoch": 0.42, "learning_rate": 3.108026217567737e-05, "loss": 0.9846, "step": 31495 }, { "epoch": 0.42, "learning_rate": 3.1075158433943885e-05, "loss": 0.2463, "step": 31500 }, { "epoch": 0.42, "learning_rate": 3.1070054423111273e-05, "loss": 0.5602, "step": 31505 }, { "epoch": 0.42, "learning_rate": 3.1064950143405624e-05, "loss": 0.8174, "step": 31510 }, { "epoch": 0.42, "learning_rate": 3.105984559505302e-05, "loss": 0.5463, "step": 31515 }, { "epoch": 0.42, "learning_rate": 3.1054740778279576e-05, "loss": 0.3886, "step": 31520 }, { "epoch": 0.42, "learning_rate": 3.104963569331141e-05, "loss": 0.7683, "step": 31525 }, { "epoch": 0.42, "learning_rate": 3.1044530340374646e-05, "loss": 0.5209, "step": 31530 }, { "epoch": 0.42, "learning_rate": 3.1039424719695434e-05, "loss": 1.0454, "step": 31535 }, { "epoch": 0.42, "learning_rate": 3.1034318831499906e-05, "loss": 0.4643, "step": 31540 }, { "epoch": 0.42, "learning_rate": 3.102921267601425e-05, "loss": 0.552, "step": 31545 }, { "epoch": 0.42, "learning_rate": 3.102410625346464e-05, "loss": 0.7378, "step": 31550 }, { "epoch": 0.42, "learning_rate": 3.1018999564077254e-05, "loss": 0.7618, "step": 31555 }, { "epoch": 0.42, "learning_rate": 3.10138926080783e-05, "loss": 1.3617, "step": 31560 }, { "epoch": 0.42, "learning_rate": 3.100878538569399e-05, "loss": 0.6859, "step": 31565 }, { "epoch": 0.42, "learning_rate": 3.100367789715055e-05, "loss": 0.6857, "step": 31570 }, { "epoch": 0.42, "learning_rate": 3.099857014267422e-05, "loss": 0.6539, "step": 31575 }, { "epoch": 0.42, "learning_rate": 3.099346212249124e-05, "loss": 0.4741, "step": 31580 }, { "epoch": 0.42, "learning_rate": 3.098835383682787e-05, "loss": 0.9952, "step": 31585 }, { "epoch": 0.42, "learning_rate": 3.098324528591038e-05, "loss": 0.6749, "step": 31590 }, { "epoch": 0.42, "learning_rate": 3.097813646996506e-05, "loss": 0.4291, "step": 31595 }, { "epoch": 0.42, "learning_rate": 3.097302738921821e-05, "loss": 1.0875, "step": 31600 }, { "epoch": 0.42, "learning_rate": 3.096791804389612e-05, "loss": 0.8577, "step": 31605 }, { "epoch": 0.42, "learning_rate": 3.096280843422512e-05, "loss": 0.3405, "step": 31610 }, { "epoch": 0.42, "learning_rate": 3.0957698560431534e-05, "loss": 0.5521, "step": 31615 }, { "epoch": 0.42, "learning_rate": 3.0952588422741716e-05, "loss": 0.7059, "step": 31620 }, { "epoch": 0.42, "learning_rate": 3.0947478021382e-05, "loss": 0.1288, "step": 31625 }, { "epoch": 0.42, "learning_rate": 3.094236735657877e-05, "loss": 0.64, "step": 31630 }, { "epoch": 0.42, "learning_rate": 3.093725642855839e-05, "loss": 0.4562, "step": 31635 }, { "epoch": 0.42, "learning_rate": 3.093214523754725e-05, "loss": 1.1634, "step": 31640 }, { "epoch": 0.42, "learning_rate": 3.0927033783771764e-05, "loss": 0.6518, "step": 31645 }, { "epoch": 0.42, "learning_rate": 3.092192206745833e-05, "loss": 1.3601, "step": 31650 }, { "epoch": 0.42, "learning_rate": 3.091681008883336e-05, "loss": 0.7011, "step": 31655 }, { "epoch": 0.42, "learning_rate": 3.0911697848123325e-05, "loss": 0.4593, "step": 31660 }, { "epoch": 0.42, "learning_rate": 3.0906585345554645e-05, "loss": 0.7243, "step": 31665 }, { "epoch": 0.42, "learning_rate": 3.090147258135377e-05, "loss": 0.7748, "step": 31670 }, { "epoch": 0.42, "learning_rate": 3.08963595557472e-05, "loss": 0.6619, "step": 31675 }, { "epoch": 0.42, "learning_rate": 3.089124626896139e-05, "loss": 0.1145, "step": 31680 }, { "epoch": 0.42, "learning_rate": 3.0886132721222855e-05, "loss": 1.1827, "step": 31685 }, { "epoch": 0.42, "learning_rate": 3.088101891275808e-05, "loss": 1.308, "step": 31690 }, { "epoch": 0.42, "learning_rate": 3.087590484379359e-05, "loss": 0.3808, "step": 31695 }, { "epoch": 0.42, "learning_rate": 3.0870790514555916e-05, "loss": 0.8751, "step": 31700 }, { "epoch": 0.42, "learning_rate": 3.086567592527159e-05, "loss": 0.3444, "step": 31705 }, { "epoch": 0.42, "learning_rate": 3.0860561076167155e-05, "loss": 0.8356, "step": 31710 }, { "epoch": 0.42, "learning_rate": 3.08554459674692e-05, "loss": 1.3133, "step": 31715 }, { "epoch": 0.43, "learning_rate": 3.0850330599404275e-05, "loss": 1.2862, "step": 31720 }, { "epoch": 0.43, "learning_rate": 3.084521497219897e-05, "loss": 0.5604, "step": 31725 }, { "epoch": 0.43, "learning_rate": 3.0840099086079886e-05, "loss": 1.1012, "step": 31730 }, { "epoch": 0.43, "learning_rate": 3.0834982941273626e-05, "loss": 0.2909, "step": 31735 }, { "epoch": 0.43, "learning_rate": 3.082986653800682e-05, "loss": 0.8013, "step": 31740 }, { "epoch": 0.43, "learning_rate": 3.08247498765061e-05, "loss": 1.0208, "step": 31745 }, { "epoch": 0.43, "learning_rate": 3.0819632956998085e-05, "loss": 0.4628, "step": 31750 }, { "epoch": 0.43, "learning_rate": 3.0814515779709456e-05, "loss": 0.2335, "step": 31755 }, { "epoch": 0.43, "learning_rate": 3.080939834486686e-05, "loss": 0.757, "step": 31760 }, { "epoch": 0.43, "learning_rate": 3.080428065269698e-05, "loss": 0.927, "step": 31765 }, { "epoch": 0.43, "learning_rate": 3.079916270342651e-05, "loss": 0.4836, "step": 31770 }, { "epoch": 0.43, "learning_rate": 3.079404449728215e-05, "loss": 0.5037, "step": 31775 }, { "epoch": 0.43, "learning_rate": 3.0788926034490596e-05, "loss": 0.1767, "step": 31780 }, { "epoch": 0.43, "learning_rate": 3.078380731527857e-05, "loss": 0.5121, "step": 31785 }, { "epoch": 0.43, "learning_rate": 3.0778688339872835e-05, "loss": 0.7692, "step": 31790 }, { "epoch": 0.43, "learning_rate": 3.0773569108500104e-05, "loss": 1.2527, "step": 31795 }, { "epoch": 0.43, "learning_rate": 3.076844962138716e-05, "loss": 0.6812, "step": 31800 }, { "epoch": 0.43, "learning_rate": 3.076332987876074e-05, "loss": 0.936, "step": 31805 }, { "epoch": 0.43, "learning_rate": 3.075820988084765e-05, "loss": 0.9028, "step": 31810 }, { "epoch": 0.43, "learning_rate": 3.075308962787466e-05, "loss": 0.8654, "step": 31815 }, { "epoch": 0.43, "learning_rate": 3.074796912006859e-05, "loss": 0.514, "step": 31820 }, { "epoch": 0.43, "learning_rate": 3.074284835765624e-05, "loss": 0.7184, "step": 31825 }, { "epoch": 0.43, "learning_rate": 3.0737727340864445e-05, "loss": 0.6686, "step": 31830 }, { "epoch": 0.43, "learning_rate": 3.073260606992002e-05, "loss": 0.5561, "step": 31835 }, { "epoch": 0.43, "learning_rate": 3.0727484545049835e-05, "loss": 0.561, "step": 31840 }, { "epoch": 0.43, "learning_rate": 3.0722362766480736e-05, "loss": 1.4597, "step": 31845 }, { "epoch": 0.43, "learning_rate": 3.07172407344396e-05, "loss": 0.8439, "step": 31850 }, { "epoch": 0.43, "learning_rate": 3.07121184491533e-05, "loss": 1.0316, "step": 31855 }, { "epoch": 0.43, "learning_rate": 3.0706995910848723e-05, "loss": 0.5932, "step": 31860 }, { "epoch": 0.43, "learning_rate": 3.070187311975279e-05, "loss": 0.8035, "step": 31865 }, { "epoch": 0.43, "learning_rate": 3.069675007609239e-05, "loss": 0.8308, "step": 31870 }, { "epoch": 0.43, "learning_rate": 3.069162678009446e-05, "loss": 1.1505, "step": 31875 }, { "epoch": 0.43, "learning_rate": 3.068650323198595e-05, "loss": 0.2454, "step": 31880 }, { "epoch": 0.43, "learning_rate": 3.068137943199379e-05, "loss": 0.4211, "step": 31885 }, { "epoch": 0.43, "learning_rate": 3.0676255380344946e-05, "loss": 1.0163, "step": 31890 }, { "epoch": 0.43, "learning_rate": 3.067113107726638e-05, "loss": 0.822, "step": 31895 }, { "epoch": 0.43, "learning_rate": 3.066600652298509e-05, "loss": 1.2192, "step": 31900 }, { "epoch": 0.43, "learning_rate": 3.066088171772805e-05, "loss": 1.699, "step": 31905 }, { "epoch": 0.43, "learning_rate": 3.0655756661722276e-05, "loss": 0.673, "step": 31910 }, { "epoch": 0.43, "learning_rate": 3.065063135519477e-05, "loss": 0.75, "step": 31915 }, { "epoch": 0.43, "learning_rate": 3.064550579837257e-05, "loss": 0.7511, "step": 31920 }, { "epoch": 0.43, "learning_rate": 3.06403799914827e-05, "loss": 0.5492, "step": 31925 }, { "epoch": 0.43, "learning_rate": 3.0635253934752214e-05, "loss": 1.0041, "step": 31930 }, { "epoch": 0.43, "learning_rate": 3.0630127628408184e-05, "loss": 1.374, "step": 31935 }, { "epoch": 0.43, "learning_rate": 3.062500107267766e-05, "loss": 0.3574, "step": 31940 }, { "epoch": 0.43, "learning_rate": 3.061987426778772e-05, "loss": 0.3054, "step": 31945 }, { "epoch": 0.43, "learning_rate": 3.0614747213965475e-05, "loss": 1.162, "step": 31950 }, { "epoch": 0.43, "learning_rate": 3.060961991143802e-05, "loss": 0.2015, "step": 31955 }, { "epoch": 0.43, "learning_rate": 3.0604492360432454e-05, "loss": 0.4379, "step": 31960 }, { "epoch": 0.43, "learning_rate": 3.059936456117593e-05, "loss": 0.3214, "step": 31965 }, { "epoch": 0.43, "learning_rate": 3.059423651389556e-05, "loss": 0.3714, "step": 31970 }, { "epoch": 0.43, "learning_rate": 3.0589108218818504e-05, "loss": 0.9074, "step": 31975 }, { "epoch": 0.43, "learning_rate": 3.058397967617191e-05, "loss": 0.842, "step": 31980 }, { "epoch": 0.43, "learning_rate": 3.0578850886182955e-05, "loss": 0.4051, "step": 31985 }, { "epoch": 0.43, "learning_rate": 3.0573721849078816e-05, "loss": 0.3325, "step": 31990 }, { "epoch": 0.43, "learning_rate": 3.056859256508668e-05, "loss": 0.2897, "step": 31995 }, { "epoch": 0.43, "learning_rate": 3.056346303443376e-05, "loss": 0.7755, "step": 32000 }, { "epoch": 0.43, "learning_rate": 3.055833325734725e-05, "loss": 0.8347, "step": 32005 }, { "epoch": 0.43, "learning_rate": 3.055320323405439e-05, "loss": 0.4618, "step": 32010 }, { "epoch": 0.43, "learning_rate": 3.054807296478241e-05, "loss": 1.0508, "step": 32015 }, { "epoch": 0.43, "learning_rate": 3.0542942449758554e-05, "loss": 1.2662, "step": 32020 }, { "epoch": 0.43, "learning_rate": 3.053781168921007e-05, "loss": 0.5777, "step": 32025 }, { "epoch": 0.43, "learning_rate": 3.0532680683364246e-05, "loss": 0.4011, "step": 32030 }, { "epoch": 0.43, "learning_rate": 3.052754943244834e-05, "loss": 0.8899, "step": 32035 }, { "epoch": 0.43, "learning_rate": 3.052241793668965e-05, "loss": 0.8876, "step": 32040 }, { "epoch": 0.43, "learning_rate": 3.051728619631547e-05, "loss": 0.4835, "step": 32045 }, { "epoch": 0.43, "learning_rate": 3.051215421155312e-05, "loss": 0.8011, "step": 32050 }, { "epoch": 0.43, "learning_rate": 3.0507021982629903e-05, "loss": 0.7181, "step": 32055 }, { "epoch": 0.43, "learning_rate": 3.050188950977317e-05, "loss": 0.5867, "step": 32060 }, { "epoch": 0.43, "learning_rate": 3.0496756793210257e-05, "loss": 0.6674, "step": 32065 }, { "epoch": 0.43, "learning_rate": 3.0491623833168513e-05, "loss": 0.9988, "step": 32070 }, { "epoch": 0.43, "learning_rate": 3.0486490629875315e-05, "loss": 0.4609, "step": 32075 }, { "epoch": 0.43, "learning_rate": 3.0481357183558025e-05, "loss": 0.895, "step": 32080 }, { "epoch": 0.43, "learning_rate": 3.047622349444403e-05, "loss": 0.6589, "step": 32085 }, { "epoch": 0.43, "learning_rate": 3.0471089562760742e-05, "loss": 1.101, "step": 32090 }, { "epoch": 0.43, "learning_rate": 3.0465955388735545e-05, "loss": 0.7476, "step": 32095 }, { "epoch": 0.43, "learning_rate": 3.046082097259588e-05, "loss": 0.3924, "step": 32100 }, { "epoch": 0.43, "learning_rate": 3.0455686314569164e-05, "loss": 0.6519, "step": 32105 }, { "epoch": 0.43, "learning_rate": 3.045055141488283e-05, "loss": 0.7781, "step": 32110 }, { "epoch": 0.43, "learning_rate": 3.0445416273764344e-05, "loss": 0.8874, "step": 32115 }, { "epoch": 0.43, "learning_rate": 3.044028089144116e-05, "loss": 0.9719, "step": 32120 }, { "epoch": 0.43, "learning_rate": 3.0435145268140747e-05, "loss": 0.6723, "step": 32125 }, { "epoch": 0.43, "learning_rate": 3.0430009404090593e-05, "loss": 0.4244, "step": 32130 }, { "epoch": 0.43, "learning_rate": 3.0424873299518182e-05, "loss": 0.9896, "step": 32135 }, { "epoch": 0.43, "learning_rate": 3.0419736954651022e-05, "loss": 0.9806, "step": 32140 }, { "epoch": 0.43, "learning_rate": 3.041460036971664e-05, "loss": 0.8687, "step": 32145 }, { "epoch": 0.43, "learning_rate": 3.040946354494254e-05, "loss": 0.7986, "step": 32150 }, { "epoch": 0.43, "learning_rate": 3.0404326480556273e-05, "loss": 1.0886, "step": 32155 }, { "epoch": 0.43, "learning_rate": 3.039918917678538e-05, "loss": 0.6853, "step": 32160 }, { "epoch": 0.43, "learning_rate": 3.039405163385741e-05, "loss": 0.3615, "step": 32165 }, { "epoch": 0.43, "learning_rate": 3.0388913851999944e-05, "loss": 0.8351, "step": 32170 }, { "epoch": 0.43, "learning_rate": 3.038377583144056e-05, "loss": 0.7374, "step": 32175 }, { "epoch": 0.43, "learning_rate": 3.0378637572406833e-05, "loss": 0.7098, "step": 32180 }, { "epoch": 0.43, "learning_rate": 3.037349907512637e-05, "loss": 0.9512, "step": 32185 }, { "epoch": 0.43, "learning_rate": 3.0368360339826785e-05, "loss": 0.5835, "step": 32190 }, { "epoch": 0.43, "learning_rate": 3.036322136673569e-05, "loss": 1.012, "step": 32195 }, { "epoch": 0.43, "learning_rate": 3.0358082156080726e-05, "loss": 0.1373, "step": 32200 }, { "epoch": 0.43, "learning_rate": 3.0352942708089515e-05, "loss": 0.3828, "step": 32205 }, { "epoch": 0.43, "learning_rate": 3.0347803022989734e-05, "loss": 0.9864, "step": 32210 }, { "epoch": 0.43, "learning_rate": 3.0342663101009034e-05, "loss": 1.1146, "step": 32215 }, { "epoch": 0.43, "learning_rate": 3.033752294237508e-05, "loss": 0.5442, "step": 32220 }, { "epoch": 0.43, "learning_rate": 3.0332382547315562e-05, "loss": 0.6417, "step": 32225 }, { "epoch": 0.43, "learning_rate": 3.0327241916058186e-05, "loss": 0.407, "step": 32230 }, { "epoch": 0.43, "learning_rate": 3.032210104883063e-05, "loss": 0.2885, "step": 32235 }, { "epoch": 0.43, "learning_rate": 3.0316959945860634e-05, "loss": 0.9336, "step": 32240 }, { "epoch": 0.43, "learning_rate": 3.0311818607375908e-05, "loss": 0.4513, "step": 32245 }, { "epoch": 0.43, "learning_rate": 3.0306677033604185e-05, "loss": 0.6582, "step": 32250 }, { "epoch": 0.43, "learning_rate": 3.030153522477323e-05, "loss": 0.1106, "step": 32255 }, { "epoch": 0.43, "learning_rate": 3.0296393181110777e-05, "loss": 1.4252, "step": 32260 }, { "epoch": 0.43, "learning_rate": 3.0291250902844615e-05, "loss": 1.0108, "step": 32265 }, { "epoch": 0.43, "learning_rate": 3.0286108390202505e-05, "loss": 0.9683, "step": 32270 }, { "epoch": 0.43, "learning_rate": 3.028096564341223e-05, "loss": 0.249, "step": 32275 }, { "epoch": 0.43, "learning_rate": 3.0275822662701603e-05, "loss": 2.1821, "step": 32280 }, { "epoch": 0.43, "learning_rate": 3.027067944829843e-05, "loss": 0.3936, "step": 32285 }, { "epoch": 0.43, "learning_rate": 3.0265536000430515e-05, "loss": 0.7174, "step": 32290 }, { "epoch": 0.43, "learning_rate": 3.026039231932571e-05, "loss": 0.9531, "step": 32295 }, { "epoch": 0.43, "learning_rate": 3.0255248405211833e-05, "loss": 0.8019, "step": 32300 }, { "epoch": 0.43, "learning_rate": 3.0250104258316746e-05, "loss": 0.4124, "step": 32305 }, { "epoch": 0.43, "learning_rate": 3.0244959878868312e-05, "loss": 0.1825, "step": 32310 }, { "epoch": 0.43, "learning_rate": 3.0239815267094383e-05, "loss": 0.7698, "step": 32315 }, { "epoch": 0.43, "learning_rate": 3.0234670423222867e-05, "loss": 0.3062, "step": 32320 }, { "epoch": 0.43, "learning_rate": 3.022952534748163e-05, "loss": 1.0488, "step": 32325 }, { "epoch": 0.43, "learning_rate": 3.022438004009858e-05, "loss": 0.5016, "step": 32330 }, { "epoch": 0.43, "learning_rate": 3.0219234501301637e-05, "loss": 0.4056, "step": 32335 }, { "epoch": 0.43, "learning_rate": 3.0214088731318712e-05, "loss": 0.4062, "step": 32340 }, { "epoch": 0.43, "learning_rate": 3.0208942730377743e-05, "loss": 0.7744, "step": 32345 }, { "epoch": 0.43, "learning_rate": 3.020379649870667e-05, "loss": 0.6777, "step": 32350 }, { "epoch": 0.43, "learning_rate": 3.019865003653345e-05, "loss": 1.0205, "step": 32355 }, { "epoch": 0.43, "learning_rate": 3.0193503344086033e-05, "loss": 0.4855, "step": 32360 }, { "epoch": 0.43, "learning_rate": 3.018835642159241e-05, "loss": 0.1932, "step": 32365 }, { "epoch": 0.43, "learning_rate": 3.0183209269280543e-05, "loss": 1.0105, "step": 32370 }, { "epoch": 0.43, "learning_rate": 3.017806188737845e-05, "loss": 0.8595, "step": 32375 }, { "epoch": 0.43, "learning_rate": 3.017291427611412e-05, "loss": 0.4924, "step": 32380 }, { "epoch": 0.43, "learning_rate": 3.016776643571555e-05, "loss": 0.9898, "step": 32385 }, { "epoch": 0.43, "learning_rate": 3.0162618366410787e-05, "loss": 0.5702, "step": 32390 }, { "epoch": 0.43, "learning_rate": 3.0157470068427867e-05, "loss": 0.834, "step": 32395 }, { "epoch": 0.43, "learning_rate": 3.0152321541994814e-05, "loss": 0.5641, "step": 32400 }, { "epoch": 0.43, "learning_rate": 3.0147172787339705e-05, "loss": 0.9924, "step": 32405 }, { "epoch": 0.43, "learning_rate": 3.0142023804690583e-05, "loss": 0.6643, "step": 32410 }, { "epoch": 0.43, "learning_rate": 3.0136874594275532e-05, "loss": 0.5091, "step": 32415 }, { "epoch": 0.43, "learning_rate": 3.0131725156322637e-05, "loss": 1.2748, "step": 32420 }, { "epoch": 0.43, "learning_rate": 3.0126575491059988e-05, "loss": 0.6775, "step": 32425 }, { "epoch": 0.43, "learning_rate": 3.0121425598715702e-05, "loss": 1.2364, "step": 32430 }, { "epoch": 0.43, "learning_rate": 3.011627547951788e-05, "loss": 0.8466, "step": 32435 }, { "epoch": 0.43, "learning_rate": 3.011112513369464e-05, "loss": 0.7778, "step": 32440 }, { "epoch": 0.43, "learning_rate": 3.010597456147413e-05, "loss": 0.7403, "step": 32445 }, { "epoch": 0.43, "learning_rate": 3.0100823763084502e-05, "loss": 0.632, "step": 32450 }, { "epoch": 0.43, "learning_rate": 3.0095672738753887e-05, "loss": 0.6648, "step": 32455 }, { "epoch": 0.43, "learning_rate": 3.0090521488710475e-05, "loss": 1.3186, "step": 32460 }, { "epoch": 0.43, "learning_rate": 3.0085370013182417e-05, "loss": 0.1911, "step": 32465 }, { "epoch": 0.44, "learning_rate": 3.008021831239791e-05, "loss": 1.0123, "step": 32470 }, { "epoch": 0.44, "learning_rate": 3.0075066386585156e-05, "loss": 0.4745, "step": 32475 }, { "epoch": 0.44, "learning_rate": 3.006991423597234e-05, "loss": 1.2885, "step": 32480 }, { "epoch": 0.44, "learning_rate": 3.00647618607877e-05, "loss": 0.4859, "step": 32485 }, { "epoch": 0.44, "learning_rate": 3.0059609261259443e-05, "loss": 0.8082, "step": 32490 }, { "epoch": 0.44, "learning_rate": 3.0054456437615803e-05, "loss": 0.9251, "step": 32495 }, { "epoch": 0.44, "learning_rate": 3.0049303390085027e-05, "loss": 0.4251, "step": 32500 }, { "epoch": 0.44, "learning_rate": 3.004415011889538e-05, "loss": 1.0495, "step": 32505 }, { "epoch": 0.44, "learning_rate": 3.003899662427511e-05, "loss": 0.7633, "step": 32510 }, { "epoch": 0.44, "learning_rate": 3.0033842906452507e-05, "loss": 0.6916, "step": 32515 }, { "epoch": 0.44, "learning_rate": 3.0028688965655842e-05, "loss": 0.5862, "step": 32520 }, { "epoch": 0.44, "learning_rate": 3.0023534802113412e-05, "loss": 0.7878, "step": 32525 }, { "epoch": 0.44, "learning_rate": 3.0018380416053526e-05, "loss": 0.4363, "step": 32530 }, { "epoch": 0.44, "learning_rate": 3.0013225807704494e-05, "loss": 0.3853, "step": 32535 }, { "epoch": 0.44, "learning_rate": 3.000807097729464e-05, "loss": 0.7542, "step": 32540 }, { "epoch": 0.44, "learning_rate": 3.00029159250523e-05, "loss": 0.8269, "step": 32545 }, { "epoch": 0.44, "learning_rate": 2.9997760651205804e-05, "loss": 0.7499, "step": 32550 }, { "epoch": 0.44, "learning_rate": 2.999260515598351e-05, "loss": 0.6203, "step": 32555 }, { "epoch": 0.44, "learning_rate": 2.99874494396138e-05, "loss": 0.7466, "step": 32560 }, { "epoch": 0.44, "learning_rate": 2.9982293502325022e-05, "loss": 0.3791, "step": 32565 }, { "epoch": 0.44, "learning_rate": 2.9977137344345567e-05, "loss": 0.4652, "step": 32570 }, { "epoch": 0.44, "learning_rate": 2.997198096590383e-05, "loss": 0.8247, "step": 32575 }, { "epoch": 0.44, "learning_rate": 2.996682436722821e-05, "loss": 0.693, "step": 32580 }, { "epoch": 0.44, "learning_rate": 2.9961667548547117e-05, "loss": 0.938, "step": 32585 }, { "epoch": 0.44, "learning_rate": 2.9956510510088974e-05, "loss": 0.7006, "step": 32590 }, { "epoch": 0.44, "learning_rate": 2.995135325208222e-05, "loss": 0.9593, "step": 32595 }, { "epoch": 0.44, "learning_rate": 2.994619577475528e-05, "loss": 1.0408, "step": 32600 }, { "epoch": 0.44, "learning_rate": 2.9941038078336613e-05, "loss": 0.5453, "step": 32605 }, { "epoch": 0.44, "learning_rate": 2.9935880163054674e-05, "loss": 0.9291, "step": 32610 }, { "epoch": 0.44, "learning_rate": 2.993072202913795e-05, "loss": 0.3723, "step": 32615 }, { "epoch": 0.44, "learning_rate": 2.9925563676814892e-05, "loss": 1.1431, "step": 32620 }, { "epoch": 0.44, "learning_rate": 2.992040510631402e-05, "loss": 0.3961, "step": 32625 }, { "epoch": 0.44, "learning_rate": 2.991524631786381e-05, "loss": 0.8114, "step": 32630 }, { "epoch": 0.44, "learning_rate": 2.9910087311692774e-05, "loss": 0.4783, "step": 32635 }, { "epoch": 0.44, "learning_rate": 2.9904928088029443e-05, "loss": 0.6216, "step": 32640 }, { "epoch": 0.44, "learning_rate": 2.9899768647102333e-05, "loss": 0.1622, "step": 32645 }, { "epoch": 0.44, "learning_rate": 2.9894608989139982e-05, "loss": 0.9935, "step": 32650 }, { "epoch": 0.44, "learning_rate": 2.988944911437095e-05, "loss": 0.5156, "step": 32655 }, { "epoch": 0.44, "learning_rate": 2.988428902302377e-05, "loss": 1.0722, "step": 32660 }, { "epoch": 0.44, "learning_rate": 2.9879128715327025e-05, "loss": 1.4635, "step": 32665 }, { "epoch": 0.44, "learning_rate": 2.9873968191509296e-05, "loss": 0.5941, "step": 32670 }, { "epoch": 0.44, "learning_rate": 2.986880745179915e-05, "loss": 0.6152, "step": 32675 }, { "epoch": 0.44, "learning_rate": 2.9863646496425196e-05, "loss": 0.8262, "step": 32680 }, { "epoch": 0.44, "learning_rate": 2.985848532561603e-05, "loss": 0.5473, "step": 32685 }, { "epoch": 0.44, "learning_rate": 2.9853323939600276e-05, "loss": 0.6767, "step": 32690 }, { "epoch": 0.44, "learning_rate": 2.984816233860655e-05, "loss": 0.3208, "step": 32695 }, { "epoch": 0.44, "learning_rate": 2.9843000522863486e-05, "loss": 0.2027, "step": 32700 }, { "epoch": 0.44, "learning_rate": 2.983783849259973e-05, "loss": 0.9766, "step": 32705 }, { "epoch": 0.44, "learning_rate": 2.9832676248043933e-05, "loss": 1.0535, "step": 32710 }, { "epoch": 0.44, "learning_rate": 2.982751378942475e-05, "loss": 1.3302, "step": 32715 }, { "epoch": 0.44, "learning_rate": 2.982235111697086e-05, "loss": 0.7295, "step": 32720 }, { "epoch": 0.44, "learning_rate": 2.9817188230910943e-05, "loss": 0.7566, "step": 32725 }, { "epoch": 0.44, "learning_rate": 2.981202513147368e-05, "loss": 0.8256, "step": 32730 }, { "epoch": 0.44, "learning_rate": 2.9806861818887788e-05, "loss": 0.6868, "step": 32735 }, { "epoch": 0.44, "learning_rate": 2.9801698293381958e-05, "loss": 0.6647, "step": 32740 }, { "epoch": 0.44, "learning_rate": 2.9796534555184914e-05, "loss": 0.6999, "step": 32745 }, { "epoch": 0.44, "learning_rate": 2.9791370604525394e-05, "loss": 0.5997, "step": 32750 }, { "epoch": 0.44, "learning_rate": 2.9786206441632116e-05, "loss": 0.9036, "step": 32755 }, { "epoch": 0.44, "learning_rate": 2.9781042066733843e-05, "loss": 0.9272, "step": 32760 }, { "epoch": 0.44, "learning_rate": 2.9775877480059332e-05, "loss": 0.6734, "step": 32765 }, { "epoch": 0.44, "learning_rate": 2.9770712681837327e-05, "loss": 0.9743, "step": 32770 }, { "epoch": 0.44, "learning_rate": 2.976554767229663e-05, "loss": 1.3876, "step": 32775 }, { "epoch": 0.44, "learning_rate": 2.976038245166601e-05, "loss": 0.5711, "step": 32780 }, { "epoch": 0.44, "learning_rate": 2.9755217020174254e-05, "loss": 1.3044, "step": 32785 }, { "epoch": 0.44, "learning_rate": 2.9750051378050185e-05, "loss": 1.2027, "step": 32790 }, { "epoch": 0.44, "learning_rate": 2.9744885525522598e-05, "loss": 0.6846, "step": 32795 }, { "epoch": 0.44, "learning_rate": 2.9739719462820315e-05, "loss": 0.7373, "step": 32800 }, { "epoch": 0.44, "learning_rate": 2.973455319017218e-05, "loss": 0.6147, "step": 32805 }, { "epoch": 0.44, "learning_rate": 2.972938670780702e-05, "loss": 0.2762, "step": 32810 }, { "epoch": 0.44, "learning_rate": 2.9724220015953697e-05, "loss": 0.592, "step": 32815 }, { "epoch": 0.44, "learning_rate": 2.9719053114841062e-05, "loss": 0.6174, "step": 32820 }, { "epoch": 0.44, "learning_rate": 2.9713886004697965e-05, "loss": 0.8851, "step": 32825 }, { "epoch": 0.44, "learning_rate": 2.970871868575332e-05, "loss": 0.6855, "step": 32830 }, { "epoch": 0.44, "learning_rate": 2.9703551158235987e-05, "loss": 0.6365, "step": 32835 }, { "epoch": 0.44, "learning_rate": 2.9698383422374863e-05, "loss": 0.5121, "step": 32840 }, { "epoch": 0.44, "learning_rate": 2.9693215478398872e-05, "loss": 0.6581, "step": 32845 }, { "epoch": 0.44, "learning_rate": 2.9688047326536906e-05, "loss": 0.8765, "step": 32850 }, { "epoch": 0.44, "learning_rate": 2.9682878967017895e-05, "loss": 1.1568, "step": 32855 }, { "epoch": 0.44, "learning_rate": 2.967771040007078e-05, "loss": 0.1901, "step": 32860 }, { "epoch": 0.44, "learning_rate": 2.967254162592449e-05, "loss": 0.5027, "step": 32865 }, { "epoch": 0.44, "learning_rate": 2.966737264480799e-05, "loss": 0.9884, "step": 32870 }, { "epoch": 0.44, "learning_rate": 2.9662203456950226e-05, "loss": 0.5987, "step": 32875 }, { "epoch": 0.44, "learning_rate": 2.965703406258017e-05, "loss": 0.7785, "step": 32880 }, { "epoch": 0.44, "learning_rate": 2.965186446192681e-05, "loss": 0.5895, "step": 32885 }, { "epoch": 0.44, "learning_rate": 2.9646694655219127e-05, "loss": 1.0935, "step": 32890 }, { "epoch": 0.44, "learning_rate": 2.9641524642686113e-05, "loss": 1.3356, "step": 32895 }, { "epoch": 0.44, "learning_rate": 2.9636354424556783e-05, "loss": 1.1783, "step": 32900 }, { "epoch": 0.44, "learning_rate": 2.963118400106014e-05, "loss": 0.7325, "step": 32905 }, { "epoch": 0.44, "learning_rate": 2.9626013372425214e-05, "loss": 0.4162, "step": 32910 }, { "epoch": 0.44, "learning_rate": 2.962084253888105e-05, "loss": 0.7417, "step": 32915 }, { "epoch": 0.44, "learning_rate": 2.961567150065667e-05, "loss": 0.4493, "step": 32920 }, { "epoch": 0.44, "learning_rate": 2.9610500257981137e-05, "loss": 0.5261, "step": 32925 }, { "epoch": 0.44, "learning_rate": 2.9605328811083516e-05, "loss": 1.1349, "step": 32930 }, { "epoch": 0.44, "learning_rate": 2.9600157160192847e-05, "loss": 0.7555, "step": 32935 }, { "epoch": 0.44, "learning_rate": 2.9594985305538248e-05, "loss": 0.572, "step": 32940 }, { "epoch": 0.44, "learning_rate": 2.9589813247348784e-05, "loss": 0.8451, "step": 32945 }, { "epoch": 0.44, "learning_rate": 2.958464098585355e-05, "loss": 0.9089, "step": 32950 }, { "epoch": 0.44, "learning_rate": 2.9579468521281666e-05, "loss": 0.791, "step": 32955 }, { "epoch": 0.44, "learning_rate": 2.9574295853862234e-05, "loss": 0.3818, "step": 32960 }, { "epoch": 0.44, "learning_rate": 2.9569122983824372e-05, "loss": 0.882, "step": 32965 }, { "epoch": 0.44, "learning_rate": 2.9563949911397227e-05, "loss": 0.6199, "step": 32970 }, { "epoch": 0.44, "learning_rate": 2.955877663680993e-05, "loss": 1.0227, "step": 32975 }, { "epoch": 0.44, "learning_rate": 2.9553603160291643e-05, "loss": 0.7893, "step": 32980 }, { "epoch": 0.44, "learning_rate": 2.954842948207151e-05, "loss": 1.7309, "step": 32985 }, { "epoch": 0.44, "learning_rate": 2.9543255602378704e-05, "loss": 1.0507, "step": 32990 }, { "epoch": 0.44, "learning_rate": 2.9538081521442412e-05, "loss": 0.3383, "step": 32995 }, { "epoch": 0.44, "learning_rate": 2.953290723949181e-05, "loss": 1.3812, "step": 33000 }, { "epoch": 0.44, "learning_rate": 2.9527732756756087e-05, "loss": 0.8223, "step": 33005 }, { "epoch": 0.44, "learning_rate": 2.952255807346446e-05, "loss": 0.6931, "step": 33010 }, { "epoch": 0.44, "learning_rate": 2.9517383189846138e-05, "loss": 0.4911, "step": 33015 }, { "epoch": 0.44, "learning_rate": 2.9512208106130335e-05, "loss": 0.4238, "step": 33020 }, { "epoch": 0.44, "learning_rate": 2.9507032822546293e-05, "loss": 0.5249, "step": 33025 }, { "epoch": 0.44, "learning_rate": 2.950185733932324e-05, "loss": 0.5744, "step": 33030 }, { "epoch": 0.44, "learning_rate": 2.9496681656690434e-05, "loss": 0.7896, "step": 33035 }, { "epoch": 0.44, "learning_rate": 2.9491505774877122e-05, "loss": 1.0834, "step": 33040 }, { "epoch": 0.44, "learning_rate": 2.948632969411257e-05, "loss": 0.6696, "step": 33045 }, { "epoch": 0.44, "learning_rate": 2.9481153414626066e-05, "loss": 1.1583, "step": 33050 }, { "epoch": 0.44, "learning_rate": 2.9475976936646883e-05, "loss": 0.7264, "step": 33055 }, { "epoch": 0.44, "learning_rate": 2.9470800260404314e-05, "loss": 0.6986, "step": 33060 }, { "epoch": 0.44, "learning_rate": 2.946562338612766e-05, "loss": 0.8618, "step": 33065 }, { "epoch": 0.44, "learning_rate": 2.9460446314046226e-05, "loss": 0.7652, "step": 33070 }, { "epoch": 0.44, "learning_rate": 2.9455269044389332e-05, "loss": 1.0437, "step": 33075 }, { "epoch": 0.44, "learning_rate": 2.9450091577386317e-05, "loss": 0.5365, "step": 33080 }, { "epoch": 0.44, "learning_rate": 2.9444913913266515e-05, "loss": 0.8266, "step": 33085 }, { "epoch": 0.44, "learning_rate": 2.9439736052259247e-05, "loss": 1.2161, "step": 33090 }, { "epoch": 0.44, "learning_rate": 2.9434557994593893e-05, "loss": 0.447, "step": 33095 }, { "epoch": 0.44, "learning_rate": 2.9429379740499803e-05, "loss": 0.4436, "step": 33100 }, { "epoch": 0.44, "learning_rate": 2.942420129020635e-05, "loss": 0.6294, "step": 33105 }, { "epoch": 0.44, "learning_rate": 2.9419022643942918e-05, "loss": 0.5553, "step": 33110 }, { "epoch": 0.44, "learning_rate": 2.9413843801938886e-05, "loss": 1.7091, "step": 33115 }, { "epoch": 0.44, "learning_rate": 2.9408664764423654e-05, "loss": 1.5007, "step": 33120 }, { "epoch": 0.44, "learning_rate": 2.940348553162663e-05, "loss": 0.3825, "step": 33125 }, { "epoch": 0.44, "learning_rate": 2.9398306103777222e-05, "loss": 0.8451, "step": 33130 }, { "epoch": 0.44, "learning_rate": 2.939312648110487e-05, "loss": 0.5127, "step": 33135 }, { "epoch": 0.44, "learning_rate": 2.938794666383899e-05, "loss": 0.5255, "step": 33140 }, { "epoch": 0.44, "learning_rate": 2.9382766652209016e-05, "loss": 1.2148, "step": 33145 }, { "epoch": 0.44, "learning_rate": 2.9377586446444412e-05, "loss": 0.7345, "step": 33150 }, { "epoch": 0.44, "learning_rate": 2.9372406046774626e-05, "loss": 0.7583, "step": 33155 }, { "epoch": 0.44, "learning_rate": 2.9367225453429124e-05, "loss": 0.3655, "step": 33160 }, { "epoch": 0.44, "learning_rate": 2.9362044666637394e-05, "loss": 0.7311, "step": 33165 }, { "epoch": 0.44, "learning_rate": 2.93568636866289e-05, "loss": 0.69, "step": 33170 }, { "epoch": 0.44, "learning_rate": 2.9351682513633145e-05, "loss": 0.7298, "step": 33175 }, { "epoch": 0.44, "learning_rate": 2.9346501147879617e-05, "loss": 0.5914, "step": 33180 }, { "epoch": 0.44, "learning_rate": 2.9341319589597837e-05, "loss": 0.738, "step": 33185 }, { "epoch": 0.44, "learning_rate": 2.9336137839017325e-05, "loss": 1.0838, "step": 33190 }, { "epoch": 0.44, "learning_rate": 2.9330955896367596e-05, "loss": 0.6033, "step": 33195 }, { "epoch": 0.44, "learning_rate": 2.9325773761878183e-05, "loss": 0.3833, "step": 33200 }, { "epoch": 0.44, "learning_rate": 2.932059143577863e-05, "loss": 0.4289, "step": 33205 }, { "epoch": 0.44, "learning_rate": 2.9315408918298504e-05, "loss": 0.2807, "step": 33210 }, { "epoch": 0.45, "learning_rate": 2.9310226209667347e-05, "loss": 0.9983, "step": 33215 }, { "epoch": 0.45, "learning_rate": 2.9305043310114733e-05, "loss": 0.3758, "step": 33220 }, { "epoch": 0.45, "learning_rate": 2.9299860219870235e-05, "loss": 0.8688, "step": 33225 }, { "epoch": 0.45, "learning_rate": 2.9294676939163447e-05, "loss": 0.7514, "step": 33230 }, { "epoch": 0.45, "learning_rate": 2.928949346822395e-05, "loss": 1.3314, "step": 33235 }, { "epoch": 0.45, "learning_rate": 2.928430980728135e-05, "loss": 0.5217, "step": 33240 }, { "epoch": 0.45, "learning_rate": 2.927912595656527e-05, "loss": 1.0729, "step": 33245 }, { "epoch": 0.45, "learning_rate": 2.9273941916305314e-05, "loss": 0.7283, "step": 33250 }, { "epoch": 0.45, "learning_rate": 2.9268757686731107e-05, "loss": 0.3143, "step": 33255 }, { "epoch": 0.45, "learning_rate": 2.9263573268072292e-05, "loss": 0.5851, "step": 33260 }, { "epoch": 0.45, "learning_rate": 2.9258388660558506e-05, "loss": 1.8663, "step": 33265 }, { "epoch": 0.45, "learning_rate": 2.925320386441942e-05, "loss": 0.5692, "step": 33270 }, { "epoch": 0.45, "learning_rate": 2.9248018879884674e-05, "loss": 0.4971, "step": 33275 }, { "epoch": 0.45, "learning_rate": 2.9242833707183943e-05, "loss": 0.9812, "step": 33280 }, { "epoch": 0.45, "learning_rate": 2.923764834654691e-05, "loss": 1.0016, "step": 33285 }, { "epoch": 0.45, "learning_rate": 2.9232462798203247e-05, "loss": 0.5077, "step": 33290 }, { "epoch": 0.45, "learning_rate": 2.9227277062382656e-05, "loss": 0.9219, "step": 33295 }, { "epoch": 0.45, "learning_rate": 2.922209113931485e-05, "loss": 0.682, "step": 33300 }, { "epoch": 0.45, "learning_rate": 2.9216905029229523e-05, "loss": 1.5977, "step": 33305 }, { "epoch": 0.45, "learning_rate": 2.9211718732356402e-05, "loss": 0.5841, "step": 33310 }, { "epoch": 0.45, "learning_rate": 2.9206532248925206e-05, "loss": 0.489, "step": 33315 }, { "epoch": 0.45, "learning_rate": 2.920134557916568e-05, "loss": 0.6783, "step": 33320 }, { "epoch": 0.45, "learning_rate": 2.9196158723307565e-05, "loss": 0.3824, "step": 33325 }, { "epoch": 0.45, "learning_rate": 2.919097168158061e-05, "loss": 0.8721, "step": 33330 }, { "epoch": 0.45, "learning_rate": 2.918578445421457e-05, "loss": 0.6602, "step": 33335 }, { "epoch": 0.45, "learning_rate": 2.9180597041439235e-05, "loss": 0.988, "step": 33340 }, { "epoch": 0.45, "learning_rate": 2.9175409443484347e-05, "loss": 1.011, "step": 33345 }, { "epoch": 0.45, "learning_rate": 2.9170221660579723e-05, "loss": 1.1225, "step": 33350 }, { "epoch": 0.45, "learning_rate": 2.9165033692955136e-05, "loss": 0.4721, "step": 33355 }, { "epoch": 0.45, "learning_rate": 2.91598455408404e-05, "loss": 0.3193, "step": 33360 }, { "epoch": 0.45, "learning_rate": 2.9154657204465313e-05, "loss": 1.3145, "step": 33365 }, { "epoch": 0.45, "learning_rate": 2.9149468684059693e-05, "loss": 0.4056, "step": 33370 }, { "epoch": 0.45, "learning_rate": 2.9144279979853372e-05, "loss": 1.0971, "step": 33375 }, { "epoch": 0.45, "learning_rate": 2.913909109207618e-05, "loss": 1.2984, "step": 33380 }, { "epoch": 0.45, "learning_rate": 2.913390202095797e-05, "loss": 0.3864, "step": 33385 }, { "epoch": 0.45, "learning_rate": 2.9128712766728573e-05, "loss": 0.8357, "step": 33390 }, { "epoch": 0.45, "learning_rate": 2.9123523329617856e-05, "loss": 0.7631, "step": 33395 }, { "epoch": 0.45, "learning_rate": 2.9118333709855683e-05, "loss": 0.6078, "step": 33400 }, { "epoch": 0.45, "learning_rate": 2.911314390767193e-05, "loss": 0.2971, "step": 33405 }, { "epoch": 0.45, "learning_rate": 2.9107953923296488e-05, "loss": 0.5986, "step": 33410 }, { "epoch": 0.45, "learning_rate": 2.9102763756959234e-05, "loss": 0.9629, "step": 33415 }, { "epoch": 0.45, "learning_rate": 2.9097573408890068e-05, "loss": 0.7854, "step": 33420 }, { "epoch": 0.45, "learning_rate": 2.9092382879318903e-05, "loss": 0.9043, "step": 33425 }, { "epoch": 0.45, "learning_rate": 2.9087192168475642e-05, "loss": 0.727, "step": 33430 }, { "epoch": 0.45, "learning_rate": 2.9082001276590226e-05, "loss": 0.6863, "step": 33435 }, { "epoch": 0.45, "learning_rate": 2.9076810203892574e-05, "loss": 0.8636, "step": 33440 }, { "epoch": 0.45, "learning_rate": 2.9071618950612616e-05, "loss": 1.3623, "step": 33445 }, { "epoch": 0.45, "learning_rate": 2.9066427516980322e-05, "loss": 1.0693, "step": 33450 }, { "epoch": 0.45, "learning_rate": 2.906123590322562e-05, "loss": 0.8931, "step": 33455 }, { "epoch": 0.45, "learning_rate": 2.905604410957849e-05, "loss": 0.5343, "step": 33460 }, { "epoch": 0.45, "learning_rate": 2.90508521362689e-05, "loss": 0.525, "step": 33465 }, { "epoch": 0.45, "learning_rate": 2.9045659983526828e-05, "loss": 0.9324, "step": 33470 }, { "epoch": 0.45, "learning_rate": 2.9040467651582254e-05, "loss": 0.6056, "step": 33475 }, { "epoch": 0.45, "learning_rate": 2.9035275140665174e-05, "loss": 0.4031, "step": 33480 }, { "epoch": 0.45, "learning_rate": 2.9030082451005592e-05, "loss": 0.6877, "step": 33485 }, { "epoch": 0.45, "learning_rate": 2.9024889582833532e-05, "loss": 0.4827, "step": 33490 }, { "epoch": 0.45, "learning_rate": 2.9019696536378994e-05, "loss": 1.1538, "step": 33495 }, { "epoch": 0.45, "learning_rate": 2.9014503311872005e-05, "loss": 1.5126, "step": 33500 }, { "epoch": 0.45, "learning_rate": 2.9009309909542605e-05, "loss": 0.5089, "step": 33505 }, { "epoch": 0.45, "learning_rate": 2.9004116329620835e-05, "loss": 0.9556, "step": 33510 }, { "epoch": 0.45, "learning_rate": 2.899892257233674e-05, "loss": 0.4007, "step": 33515 }, { "epoch": 0.45, "learning_rate": 2.899372863792038e-05, "loss": 0.3009, "step": 33520 }, { "epoch": 0.45, "learning_rate": 2.898853452660183e-05, "loss": 0.1545, "step": 33525 }, { "epoch": 0.45, "learning_rate": 2.8983340238611147e-05, "loss": 0.5035, "step": 33530 }, { "epoch": 0.45, "learning_rate": 2.8978145774178423e-05, "loss": 0.4765, "step": 33535 }, { "epoch": 0.45, "learning_rate": 2.897295113353374e-05, "loss": 0.5694, "step": 33540 }, { "epoch": 0.45, "learning_rate": 2.8967756316907203e-05, "loss": 0.5794, "step": 33545 }, { "epoch": 0.45, "learning_rate": 2.896256132452891e-05, "loss": 1.0251, "step": 33550 }, { "epoch": 0.45, "learning_rate": 2.8957366156628967e-05, "loss": 0.8477, "step": 33555 }, { "epoch": 0.45, "learning_rate": 2.895217081343751e-05, "loss": 0.727, "step": 33560 }, { "epoch": 0.45, "learning_rate": 2.8946975295184654e-05, "loss": 1.054, "step": 33565 }, { "epoch": 0.45, "learning_rate": 2.8941779602100537e-05, "loss": 1.1238, "step": 33570 }, { "epoch": 0.45, "learning_rate": 2.8936583734415313e-05, "loss": 1.2799, "step": 33575 }, { "epoch": 0.45, "learning_rate": 2.8931387692359114e-05, "loss": 0.4684, "step": 33580 }, { "epoch": 0.45, "learning_rate": 2.8926191476162112e-05, "loss": 0.8296, "step": 33585 }, { "epoch": 0.45, "learning_rate": 2.8920995086054464e-05, "loss": 0.6713, "step": 33590 }, { "epoch": 0.45, "learning_rate": 2.8915798522266353e-05, "loss": 0.8053, "step": 33595 }, { "epoch": 0.45, "learning_rate": 2.8910601785027964e-05, "loss": 0.5691, "step": 33600 }, { "epoch": 0.45, "learning_rate": 2.8905404874569474e-05, "loss": 0.839, "step": 33605 }, { "epoch": 0.45, "learning_rate": 2.8900207791121086e-05, "loss": 0.2757, "step": 33610 }, { "epoch": 0.45, "learning_rate": 2.8895010534913013e-05, "loss": 0.309, "step": 33615 }, { "epoch": 0.45, "learning_rate": 2.888981310617545e-05, "loss": 0.6537, "step": 33620 }, { "epoch": 0.45, "learning_rate": 2.888461550513863e-05, "loss": 0.951, "step": 33625 }, { "epoch": 0.45, "learning_rate": 2.8879417732032778e-05, "loss": 0.2602, "step": 33630 }, { "epoch": 0.45, "learning_rate": 2.887421978708813e-05, "loss": 1.1163, "step": 33635 }, { "epoch": 0.45, "learning_rate": 2.8869021670534925e-05, "loss": 0.3727, "step": 33640 }, { "epoch": 0.45, "learning_rate": 2.886382338260341e-05, "loss": 1.0103, "step": 33645 }, { "epoch": 0.45, "learning_rate": 2.885862492352386e-05, "loss": 0.6615, "step": 33650 }, { "epoch": 0.45, "learning_rate": 2.885342629352652e-05, "loss": 0.3485, "step": 33655 }, { "epoch": 0.45, "learning_rate": 2.8848227492841685e-05, "loss": 0.6585, "step": 33660 }, { "epoch": 0.45, "learning_rate": 2.884302852169961e-05, "loss": 1.0564, "step": 33665 }, { "epoch": 0.45, "learning_rate": 2.8837829380330607e-05, "loss": 0.8673, "step": 33670 }, { "epoch": 0.45, "learning_rate": 2.883263006896496e-05, "loss": 0.2439, "step": 33675 }, { "epoch": 0.45, "learning_rate": 2.8827430587832978e-05, "loss": 0.6893, "step": 33680 }, { "epoch": 0.45, "learning_rate": 2.8822230937164966e-05, "loss": 0.8689, "step": 33685 }, { "epoch": 0.45, "learning_rate": 2.881703111719125e-05, "loss": 0.316, "step": 33690 }, { "epoch": 0.45, "learning_rate": 2.881183112814215e-05, "loss": 0.3139, "step": 33695 }, { "epoch": 0.45, "learning_rate": 2.8806630970247993e-05, "loss": 0.3613, "step": 33700 }, { "epoch": 0.45, "learning_rate": 2.8801430643739135e-05, "loss": 0.5373, "step": 33705 }, { "epoch": 0.45, "learning_rate": 2.8796230148845914e-05, "loss": 0.8202, "step": 33710 }, { "epoch": 0.45, "learning_rate": 2.8791029485798693e-05, "loss": 0.8863, "step": 33715 }, { "epoch": 0.45, "learning_rate": 2.878582865482783e-05, "loss": 0.5873, "step": 33720 }, { "epoch": 0.45, "learning_rate": 2.8780627656163696e-05, "loss": 1.3712, "step": 33725 }, { "epoch": 0.45, "learning_rate": 2.877542649003667e-05, "loss": 0.3685, "step": 33730 }, { "epoch": 0.45, "learning_rate": 2.8770225156677144e-05, "loss": 0.5218, "step": 33735 }, { "epoch": 0.45, "learning_rate": 2.8765023656315503e-05, "loss": 1.1655, "step": 33740 }, { "epoch": 0.45, "learning_rate": 2.875982198918215e-05, "loss": 0.4554, "step": 33745 }, { "epoch": 0.45, "learning_rate": 2.8755660535554667e-05, "loss": 0.5406, "step": 33750 }, { "epoch": 0.45, "learning_rate": 2.875045856881286e-05, "loss": 0.4816, "step": 33755 }, { "epoch": 0.45, "learning_rate": 2.8745256435944507e-05, "loss": 0.815, "step": 33760 }, { "epoch": 0.45, "learning_rate": 2.874005413718003e-05, "loss": 0.2759, "step": 33765 }, { "epoch": 0.45, "learning_rate": 2.8734851672749868e-05, "loss": 1.1077, "step": 33770 }, { "epoch": 0.45, "learning_rate": 2.872964904288446e-05, "loss": 0.6303, "step": 33775 }, { "epoch": 0.45, "learning_rate": 2.8724446247814252e-05, "loss": 1.216, "step": 33780 }, { "epoch": 0.45, "learning_rate": 2.8719243287769715e-05, "loss": 0.1588, "step": 33785 }, { "epoch": 0.45, "learning_rate": 2.8714040162981305e-05, "loss": 0.9416, "step": 33790 }, { "epoch": 0.45, "learning_rate": 2.8708836873679496e-05, "loss": 0.4566, "step": 33795 }, { "epoch": 0.45, "learning_rate": 2.8703633420094766e-05, "loss": 0.4457, "step": 33800 }, { "epoch": 0.45, "learning_rate": 2.8698429802457603e-05, "loss": 0.395, "step": 33805 }, { "epoch": 0.45, "learning_rate": 2.869322602099851e-05, "loss": 0.3165, "step": 33810 }, { "epoch": 0.45, "learning_rate": 2.868802207594798e-05, "loss": 0.8538, "step": 33815 }, { "epoch": 0.45, "learning_rate": 2.8682817967536512e-05, "loss": 0.6268, "step": 33820 }, { "epoch": 0.45, "learning_rate": 2.8677613695994647e-05, "loss": 0.7271, "step": 33825 }, { "epoch": 0.45, "learning_rate": 2.867240926155289e-05, "loss": 0.8078, "step": 33830 }, { "epoch": 0.45, "learning_rate": 2.866720466444177e-05, "loss": 0.5944, "step": 33835 }, { "epoch": 0.45, "learning_rate": 2.8661999904891828e-05, "loss": 0.5989, "step": 33840 }, { "epoch": 0.45, "learning_rate": 2.865679498313362e-05, "loss": 1.0426, "step": 33845 }, { "epoch": 0.45, "learning_rate": 2.8651589899397678e-05, "loss": 0.9079, "step": 33850 }, { "epoch": 0.45, "learning_rate": 2.8646384653914582e-05, "loss": 0.8713, "step": 33855 }, { "epoch": 0.45, "learning_rate": 2.8641179246914883e-05, "loss": 0.7869, "step": 33860 }, { "epoch": 0.45, "learning_rate": 2.8635973678629158e-05, "loss": 0.1346, "step": 33865 }, { "epoch": 0.45, "learning_rate": 2.863076794928799e-05, "loss": 0.2991, "step": 33870 }, { "epoch": 0.45, "learning_rate": 2.862556205912197e-05, "loss": 0.4022, "step": 33875 }, { "epoch": 0.45, "learning_rate": 2.8620356008361687e-05, "loss": 0.903, "step": 33880 }, { "epoch": 0.45, "learning_rate": 2.8615149797237744e-05, "loss": 0.2529, "step": 33885 }, { "epoch": 0.45, "learning_rate": 2.860994342598075e-05, "loss": 0.6956, "step": 33890 }, { "epoch": 0.45, "learning_rate": 2.8604736894821322e-05, "loss": 0.4007, "step": 33895 }, { "epoch": 0.45, "learning_rate": 2.859953020399009e-05, "loss": 0.4598, "step": 33900 }, { "epoch": 0.45, "learning_rate": 2.8594323353717667e-05, "loss": 0.4835, "step": 33905 }, { "epoch": 0.45, "learning_rate": 2.8589116344234712e-05, "loss": 0.5128, "step": 33910 }, { "epoch": 0.45, "learning_rate": 2.858390917577185e-05, "loss": 0.5377, "step": 33915 }, { "epoch": 0.45, "learning_rate": 2.8578701848559742e-05, "loss": 0.7927, "step": 33920 }, { "epoch": 0.45, "learning_rate": 2.857349436282905e-05, "loss": 0.8419, "step": 33925 }, { "epoch": 0.45, "learning_rate": 2.8568286718810432e-05, "loss": 1.1954, "step": 33930 }, { "epoch": 0.45, "learning_rate": 2.856307891673457e-05, "loss": 0.5184, "step": 33935 }, { "epoch": 0.45, "learning_rate": 2.8557870956832132e-05, "loss": 0.976, "step": 33940 }, { "epoch": 0.45, "learning_rate": 2.855266283933381e-05, "loss": 0.7111, "step": 33945 }, { "epoch": 0.45, "learning_rate": 2.85474545644703e-05, "loss": 0.7651, "step": 33950 }, { "epoch": 0.45, "learning_rate": 2.85422461324723e-05, "loss": 0.9065, "step": 33955 }, { "epoch": 0.46, "learning_rate": 2.8537037543570515e-05, "loss": 0.4065, "step": 33960 }, { "epoch": 0.46, "learning_rate": 2.853182879799567e-05, "loss": 0.8239, "step": 33965 }, { "epoch": 0.46, "learning_rate": 2.852661989597847e-05, "loss": 1.2257, "step": 33970 }, { "epoch": 0.46, "learning_rate": 2.8521410837749647e-05, "loss": 0.3479, "step": 33975 }, { "epoch": 0.46, "learning_rate": 2.8516201623539952e-05, "loss": 0.4383, "step": 33980 }, { "epoch": 0.46, "learning_rate": 2.851099225358011e-05, "loss": 0.4716, "step": 33985 }, { "epoch": 0.46, "learning_rate": 2.8505782728100883e-05, "loss": 1.0529, "step": 33990 }, { "epoch": 0.46, "learning_rate": 2.8500573047333017e-05, "loss": 0.3909, "step": 33995 }, { "epoch": 0.46, "learning_rate": 2.8495363211507275e-05, "loss": 0.9135, "step": 34000 }, { "epoch": 0.46, "learning_rate": 2.8490153220854427e-05, "loss": 0.3605, "step": 34005 }, { "epoch": 0.46, "learning_rate": 2.848494307560526e-05, "loss": 0.7266, "step": 34010 }, { "epoch": 0.46, "learning_rate": 2.847973277599054e-05, "loss": 0.9081, "step": 34015 }, { "epoch": 0.46, "learning_rate": 2.8474522322241078e-05, "loss": 0.3825, "step": 34020 }, { "epoch": 0.46, "learning_rate": 2.846931171458765e-05, "loss": 0.344, "step": 34025 }, { "epoch": 0.46, "learning_rate": 2.8464100953261068e-05, "loss": 0.2751, "step": 34030 }, { "epoch": 0.46, "learning_rate": 2.8458890038492154e-05, "loss": 1.3295, "step": 34035 }, { "epoch": 0.46, "learning_rate": 2.8453678970511704e-05, "loss": 0.6124, "step": 34040 }, { "epoch": 0.46, "learning_rate": 2.844846774955056e-05, "loss": 0.623, "step": 34045 }, { "epoch": 0.46, "learning_rate": 2.8443256375839556e-05, "loss": 0.5233, "step": 34050 }, { "epoch": 0.46, "learning_rate": 2.8438044849609508e-05, "loss": 0.8362, "step": 34055 }, { "epoch": 0.46, "learning_rate": 2.843283317109127e-05, "loss": 0.8784, "step": 34060 }, { "epoch": 0.46, "learning_rate": 2.8427621340515708e-05, "loss": 0.3388, "step": 34065 }, { "epoch": 0.46, "learning_rate": 2.842240935811366e-05, "loss": 0.2889, "step": 34070 }, { "epoch": 0.46, "learning_rate": 2.841719722411601e-05, "loss": 1.0134, "step": 34075 }, { "epoch": 0.46, "learning_rate": 2.8411984938753606e-05, "loss": 1.1694, "step": 34080 }, { "epoch": 0.46, "learning_rate": 2.8406772502257345e-05, "loss": 0.3786, "step": 34085 }, { "epoch": 0.46, "learning_rate": 2.8401559914858105e-05, "loss": 0.3402, "step": 34090 }, { "epoch": 0.46, "learning_rate": 2.8396347176786774e-05, "loss": 0.51, "step": 34095 }, { "epoch": 0.46, "learning_rate": 2.8391134288274263e-05, "loss": 0.4076, "step": 34100 }, { "epoch": 0.46, "learning_rate": 2.8385921249551467e-05, "loss": 1.1659, "step": 34105 }, { "epoch": 0.46, "learning_rate": 2.838070806084929e-05, "loss": 0.9322, "step": 34110 }, { "epoch": 0.46, "learning_rate": 2.8375494722398666e-05, "loss": 0.7129, "step": 34115 }, { "epoch": 0.46, "learning_rate": 2.8370281234430517e-05, "loss": 0.3793, "step": 34120 }, { "epoch": 0.46, "learning_rate": 2.8365067597175765e-05, "loss": 0.5087, "step": 34125 }, { "epoch": 0.46, "learning_rate": 2.8359853810865356e-05, "loss": 0.3166, "step": 34130 }, { "epoch": 0.46, "learning_rate": 2.8354639875730228e-05, "loss": 0.3872, "step": 34135 }, { "epoch": 0.46, "learning_rate": 2.8349425792001334e-05, "loss": 1.2204, "step": 34140 }, { "epoch": 0.46, "learning_rate": 2.8344211559909638e-05, "loss": 0.9735, "step": 34145 }, { "epoch": 0.46, "learning_rate": 2.83389971796861e-05, "loss": 0.3299, "step": 34150 }, { "epoch": 0.46, "learning_rate": 2.833378265156169e-05, "loss": 0.7304, "step": 34155 }, { "epoch": 0.46, "learning_rate": 2.8328567975767395e-05, "loss": 1.009, "step": 34160 }, { "epoch": 0.46, "learning_rate": 2.8323353152534176e-05, "loss": 0.3847, "step": 34165 }, { "epoch": 0.46, "learning_rate": 2.8318138182093052e-05, "loss": 0.8106, "step": 34170 }, { "epoch": 0.46, "learning_rate": 2.8312923064675e-05, "loss": 0.502, "step": 34175 }, { "epoch": 0.46, "learning_rate": 2.8307707800511034e-05, "loss": 0.5695, "step": 34180 }, { "epoch": 0.46, "learning_rate": 2.830249238983216e-05, "loss": 0.4583, "step": 34185 }, { "epoch": 0.46, "learning_rate": 2.829727683286939e-05, "loss": 0.1845, "step": 34190 }, { "epoch": 0.46, "learning_rate": 2.8292061129853752e-05, "loss": 0.604, "step": 34195 }, { "epoch": 0.46, "learning_rate": 2.8286845281016284e-05, "loss": 0.4652, "step": 34200 }, { "epoch": 0.46, "learning_rate": 2.8281629286588007e-05, "loss": 0.7149, "step": 34205 }, { "epoch": 0.46, "learning_rate": 2.8276413146799973e-05, "loss": 0.8032, "step": 34210 }, { "epoch": 0.46, "learning_rate": 2.827119686188323e-05, "loss": 0.7497, "step": 34215 }, { "epoch": 0.46, "learning_rate": 2.826598043206882e-05, "loss": 0.6502, "step": 34220 }, { "epoch": 0.46, "learning_rate": 2.826076385758783e-05, "loss": 0.6959, "step": 34225 }, { "epoch": 0.46, "learning_rate": 2.8255547138671314e-05, "loss": 0.4598, "step": 34230 }, { "epoch": 0.46, "learning_rate": 2.8250330275550336e-05, "loss": 1.1661, "step": 34235 }, { "epoch": 0.46, "learning_rate": 2.824511326845599e-05, "loss": 0.4928, "step": 34240 }, { "epoch": 0.46, "learning_rate": 2.8239896117619367e-05, "loss": 0.5086, "step": 34245 }, { "epoch": 0.46, "learning_rate": 2.8234678823271548e-05, "loss": 0.5247, "step": 34250 }, { "epoch": 0.46, "learning_rate": 2.8229461385643646e-05, "loss": 1.2427, "step": 34255 }, { "epoch": 0.46, "learning_rate": 2.822424380496676e-05, "loss": 0.8456, "step": 34260 }, { "epoch": 0.46, "learning_rate": 2.8219026081472e-05, "loss": 0.6173, "step": 34265 }, { "epoch": 0.46, "learning_rate": 2.8213808215390496e-05, "loss": 0.3394, "step": 34270 }, { "epoch": 0.46, "learning_rate": 2.820859020695335e-05, "loss": 0.7046, "step": 34275 }, { "epoch": 0.46, "learning_rate": 2.8203372056391725e-05, "loss": 0.3285, "step": 34280 }, { "epoch": 0.46, "learning_rate": 2.8198153763936747e-05, "loss": 0.5327, "step": 34285 }, { "epoch": 0.46, "learning_rate": 2.8192935329819547e-05, "loss": 0.2654, "step": 34290 }, { "epoch": 0.46, "learning_rate": 2.8187716754271288e-05, "loss": 0.4617, "step": 34295 }, { "epoch": 0.46, "learning_rate": 2.8182498037523124e-05, "loss": 0.3174, "step": 34300 }, { "epoch": 0.46, "learning_rate": 2.8177279179806214e-05, "loss": 0.9286, "step": 34305 }, { "epoch": 0.46, "learning_rate": 2.8172060181351744e-05, "loss": 0.6534, "step": 34310 }, { "epoch": 0.46, "learning_rate": 2.8166841042390873e-05, "loss": 0.7082, "step": 34315 }, { "epoch": 0.46, "learning_rate": 2.8161621763154784e-05, "loss": 0.733, "step": 34320 }, { "epoch": 0.46, "learning_rate": 2.815640234387467e-05, "loss": 0.7666, "step": 34325 }, { "epoch": 0.46, "learning_rate": 2.8151182784781714e-05, "loss": 1.655, "step": 34330 }, { "epoch": 0.46, "learning_rate": 2.8145963086107137e-05, "loss": 1.2149, "step": 34335 }, { "epoch": 0.46, "learning_rate": 2.8140743248082134e-05, "loss": 1.5432, "step": 34340 }, { "epoch": 0.46, "learning_rate": 2.8135523270937913e-05, "loss": 0.4579, "step": 34345 }, { "epoch": 0.46, "learning_rate": 2.8130303154905703e-05, "loss": 0.5999, "step": 34350 }, { "epoch": 0.46, "learning_rate": 2.8125082900216716e-05, "loss": 1.0415, "step": 34355 }, { "epoch": 0.46, "learning_rate": 2.811986250710219e-05, "loss": 0.8211, "step": 34360 }, { "epoch": 0.46, "learning_rate": 2.8114641975793372e-05, "loss": 0.3838, "step": 34365 }, { "epoch": 0.46, "learning_rate": 2.8109421306521494e-05, "loss": 1.4947, "step": 34370 }, { "epoch": 0.46, "learning_rate": 2.8104200499517804e-05, "loss": 0.9842, "step": 34375 }, { "epoch": 0.46, "learning_rate": 2.809897955501356e-05, "loss": 1.1224, "step": 34380 }, { "epoch": 0.46, "learning_rate": 2.809375847324003e-05, "loss": 0.6272, "step": 34385 }, { "epoch": 0.46, "learning_rate": 2.8088537254428475e-05, "loss": 0.24, "step": 34390 }, { "epoch": 0.46, "learning_rate": 2.8083315898810174e-05, "loss": 0.9894, "step": 34395 }, { "epoch": 0.46, "learning_rate": 2.80780944066164e-05, "loss": 0.7764, "step": 34400 }, { "epoch": 0.46, "learning_rate": 2.807287277807845e-05, "loss": 1.7066, "step": 34405 }, { "epoch": 0.46, "learning_rate": 2.8067651013427605e-05, "loss": 0.692, "step": 34410 }, { "epoch": 0.46, "learning_rate": 2.806242911289516e-05, "loss": 1.228, "step": 34415 }, { "epoch": 0.46, "learning_rate": 2.805720707671244e-05, "loss": 0.758, "step": 34420 }, { "epoch": 0.46, "learning_rate": 2.8051984905110735e-05, "loss": 0.904, "step": 34425 }, { "epoch": 0.46, "learning_rate": 2.8046762598321363e-05, "loss": 0.522, "step": 34430 }, { "epoch": 0.46, "learning_rate": 2.804154015657565e-05, "loss": 0.7881, "step": 34435 }, { "epoch": 0.46, "learning_rate": 2.8036317580104925e-05, "loss": 1.0323, "step": 34440 }, { "epoch": 0.46, "learning_rate": 2.8031094869140528e-05, "loss": 0.9363, "step": 34445 }, { "epoch": 0.46, "learning_rate": 2.8025872023913792e-05, "loss": 0.9685, "step": 34450 }, { "epoch": 0.46, "learning_rate": 2.8020649044656056e-05, "loss": 0.7638, "step": 34455 }, { "epoch": 0.46, "learning_rate": 2.801542593159869e-05, "loss": 0.5511, "step": 34460 }, { "epoch": 0.46, "learning_rate": 2.801020268497303e-05, "loss": 0.6062, "step": 34465 }, { "epoch": 0.46, "learning_rate": 2.8004979305010455e-05, "loss": 0.8416, "step": 34470 }, { "epoch": 0.46, "learning_rate": 2.7999755791942327e-05, "loss": 0.7804, "step": 34475 }, { "epoch": 0.46, "learning_rate": 2.7994532146000035e-05, "loss": 1.0278, "step": 34480 }, { "epoch": 0.46, "learning_rate": 2.798930836741494e-05, "loss": 0.6618, "step": 34485 }, { "epoch": 0.46, "learning_rate": 2.798408445641844e-05, "loss": 0.3006, "step": 34490 }, { "epoch": 0.46, "learning_rate": 2.7978860413241925e-05, "loss": 1.1579, "step": 34495 }, { "epoch": 0.46, "learning_rate": 2.7973636238116806e-05, "loss": 0.6094, "step": 34500 }, { "epoch": 0.46, "learning_rate": 2.7968411931274475e-05, "loss": 1.1326, "step": 34505 }, { "epoch": 0.46, "learning_rate": 2.7963187492946343e-05, "loss": 0.5648, "step": 34510 }, { "epoch": 0.46, "learning_rate": 2.7957962923363835e-05, "loss": 1.0248, "step": 34515 }, { "epoch": 0.46, "learning_rate": 2.7952738222758364e-05, "loss": 1.1548, "step": 34520 }, { "epoch": 0.46, "learning_rate": 2.7947513391361357e-05, "loss": 0.8149, "step": 34525 }, { "epoch": 0.46, "learning_rate": 2.7942288429404256e-05, "loss": 0.3477, "step": 34530 }, { "epoch": 0.46, "learning_rate": 2.7937063337118502e-05, "loss": 1.678, "step": 34535 }, { "epoch": 0.46, "learning_rate": 2.7931838114735532e-05, "loss": 0.6079, "step": 34540 }, { "epoch": 0.46, "learning_rate": 2.7926612762486798e-05, "loss": 0.9692, "step": 34545 }, { "epoch": 0.46, "learning_rate": 2.792138728060376e-05, "loss": 1.2368, "step": 34550 }, { "epoch": 0.46, "learning_rate": 2.7916161669317885e-05, "loss": 0.4626, "step": 34555 }, { "epoch": 0.46, "learning_rate": 2.7910935928860643e-05, "loss": 0.8452, "step": 34560 }, { "epoch": 0.46, "learning_rate": 2.7905710059463492e-05, "loss": 0.7557, "step": 34565 }, { "epoch": 0.46, "learning_rate": 2.790048406135793e-05, "loss": 0.2713, "step": 34570 }, { "epoch": 0.46, "learning_rate": 2.7895257934775426e-05, "loss": 1.0497, "step": 34575 }, { "epoch": 0.46, "learning_rate": 2.7890031679947483e-05, "loss": 0.3019, "step": 34580 }, { "epoch": 0.46, "learning_rate": 2.78848052971056e-05, "loss": 0.6914, "step": 34585 }, { "epoch": 0.46, "learning_rate": 2.7879578786481275e-05, "loss": 0.2827, "step": 34590 }, { "epoch": 0.46, "learning_rate": 2.787435214830601e-05, "loss": 0.5055, "step": 34595 }, { "epoch": 0.46, "learning_rate": 2.7869125382811322e-05, "loss": 0.4872, "step": 34600 }, { "epoch": 0.46, "learning_rate": 2.7863898490228735e-05, "loss": 0.593, "step": 34605 }, { "epoch": 0.46, "learning_rate": 2.7858671470789778e-05, "loss": 1.181, "step": 34610 }, { "epoch": 0.46, "learning_rate": 2.785344432472598e-05, "loss": 0.6644, "step": 34615 }, { "epoch": 0.46, "learning_rate": 2.7848217052268867e-05, "loss": 0.5988, "step": 34620 }, { "epoch": 0.46, "learning_rate": 2.7842989653649987e-05, "loss": 0.4228, "step": 34625 }, { "epoch": 0.46, "learning_rate": 2.7837762129100885e-05, "loss": 0.3991, "step": 34630 }, { "epoch": 0.46, "learning_rate": 2.7832534478853124e-05, "loss": 0.8296, "step": 34635 }, { "epoch": 0.46, "learning_rate": 2.7827306703138255e-05, "loss": 0.852, "step": 34640 }, { "epoch": 0.46, "learning_rate": 2.7822078802187844e-05, "loss": 0.9549, "step": 34645 }, { "epoch": 0.46, "learning_rate": 2.7816850776233462e-05, "loss": 0.7864, "step": 34650 }, { "epoch": 0.46, "learning_rate": 2.781162262550668e-05, "loss": 1.1308, "step": 34655 }, { "epoch": 0.46, "learning_rate": 2.7806394350239073e-05, "loss": 0.4029, "step": 34660 }, { "epoch": 0.46, "learning_rate": 2.780116595066225e-05, "loss": 0.8889, "step": 34665 }, { "epoch": 0.46, "learning_rate": 2.779593742700779e-05, "loss": 0.6554, "step": 34670 }, { "epoch": 0.46, "learning_rate": 2.779070877950728e-05, "loss": 0.5692, "step": 34675 }, { "epoch": 0.46, "learning_rate": 2.778548000839234e-05, "loss": 1.0515, "step": 34680 }, { "epoch": 0.46, "learning_rate": 2.778025111389457e-05, "loss": 1.3051, "step": 34685 }, { "epoch": 0.46, "learning_rate": 2.777502209624558e-05, "loss": 0.8445, "step": 34690 }, { "epoch": 0.46, "learning_rate": 2.7769792955677e-05, "loss": 0.4602, "step": 34695 }, { "epoch": 0.46, "learning_rate": 2.7764563692420443e-05, "loss": 1.0582, "step": 34700 }, { "epoch": 0.46, "learning_rate": 2.7759334306707547e-05, "loss": 0.4034, "step": 34705 }, { "epoch": 0.47, "learning_rate": 2.7754104798769942e-05, "loss": 0.7194, "step": 34710 }, { "epoch": 0.47, "learning_rate": 2.7748875168839277e-05, "loss": 0.6576, "step": 34715 }, { "epoch": 0.47, "learning_rate": 2.7743645417147195e-05, "loss": 0.6726, "step": 34720 }, { "epoch": 0.47, "learning_rate": 2.773841554392535e-05, "loss": 0.833, "step": 34725 }, { "epoch": 0.47, "learning_rate": 2.7733185549405393e-05, "loss": 0.719, "step": 34730 }, { "epoch": 0.47, "learning_rate": 2.7727955433818993e-05, "loss": 1.0307, "step": 34735 }, { "epoch": 0.47, "learning_rate": 2.772272519739781e-05, "loss": 0.267, "step": 34740 }, { "epoch": 0.47, "learning_rate": 2.771749484037352e-05, "loss": 0.697, "step": 34745 }, { "epoch": 0.47, "learning_rate": 2.7712264362977806e-05, "loss": 0.5841, "step": 34750 }, { "epoch": 0.47, "learning_rate": 2.7707033765442357e-05, "loss": 1.0985, "step": 34755 }, { "epoch": 0.47, "learning_rate": 2.7701803047998848e-05, "loss": 1.2969, "step": 34760 }, { "epoch": 0.47, "learning_rate": 2.7696572210878978e-05, "loss": 0.7109, "step": 34765 }, { "epoch": 0.47, "learning_rate": 2.7691341254314452e-05, "loss": 0.74, "step": 34770 }, { "epoch": 0.47, "learning_rate": 2.7686110178536978e-05, "loss": 0.6457, "step": 34775 }, { "epoch": 0.47, "learning_rate": 2.768087898377826e-05, "loss": 0.8556, "step": 34780 }, { "epoch": 0.47, "learning_rate": 2.767564767027001e-05, "loss": 0.94, "step": 34785 }, { "epoch": 0.47, "learning_rate": 2.7670416238243957e-05, "loss": 0.6126, "step": 34790 }, { "epoch": 0.47, "learning_rate": 2.766518468793182e-05, "loss": 0.8038, "step": 34795 }, { "epoch": 0.47, "learning_rate": 2.7659953019565337e-05, "loss": 0.5529, "step": 34800 }, { "epoch": 0.47, "learning_rate": 2.765472123337625e-05, "loss": 1.191, "step": 34805 }, { "epoch": 0.47, "learning_rate": 2.7649489329596288e-05, "loss": 1.4047, "step": 34810 }, { "epoch": 0.47, "learning_rate": 2.7644257308457207e-05, "loss": 0.1754, "step": 34815 }, { "epoch": 0.47, "learning_rate": 2.7639025170190748e-05, "loss": 0.7301, "step": 34820 }, { "epoch": 0.47, "learning_rate": 2.7633792915028677e-05, "loss": 1.1189, "step": 34825 }, { "epoch": 0.47, "learning_rate": 2.7628560543202763e-05, "loss": 1.0979, "step": 34830 }, { "epoch": 0.47, "learning_rate": 2.7623328054944768e-05, "loss": 0.6182, "step": 34835 }, { "epoch": 0.47, "learning_rate": 2.761809545048646e-05, "loss": 0.6236, "step": 34840 }, { "epoch": 0.47, "learning_rate": 2.7612862730059626e-05, "loss": 0.7934, "step": 34845 }, { "epoch": 0.47, "learning_rate": 2.7607629893896037e-05, "loss": 0.2462, "step": 34850 }, { "epoch": 0.47, "learning_rate": 2.7602396942227488e-05, "loss": 0.7182, "step": 34855 }, { "epoch": 0.47, "learning_rate": 2.7597163875285785e-05, "loss": 0.5928, "step": 34860 }, { "epoch": 0.47, "learning_rate": 2.7591930693302713e-05, "loss": 0.5096, "step": 34865 }, { "epoch": 0.47, "learning_rate": 2.7586697396510068e-05, "loss": 0.7841, "step": 34870 }, { "epoch": 0.47, "learning_rate": 2.7581463985139676e-05, "loss": 0.235, "step": 34875 }, { "epoch": 0.47, "learning_rate": 2.7576230459423346e-05, "loss": 0.4345, "step": 34880 }, { "epoch": 0.47, "learning_rate": 2.757099681959289e-05, "loss": 0.3601, "step": 34885 }, { "epoch": 0.47, "learning_rate": 2.7565763065880147e-05, "loss": 0.6932, "step": 34890 }, { "epoch": 0.47, "learning_rate": 2.7560529198516927e-05, "loss": 0.105, "step": 34895 }, { "epoch": 0.47, "learning_rate": 2.7555295217735077e-05, "loss": 0.9916, "step": 34900 }, { "epoch": 0.47, "learning_rate": 2.7550061123766434e-05, "loss": 0.5223, "step": 34905 }, { "epoch": 0.47, "learning_rate": 2.7544826916842837e-05, "loss": 0.2305, "step": 34910 }, { "epoch": 0.47, "learning_rate": 2.753959259719614e-05, "loss": 0.5414, "step": 34915 }, { "epoch": 0.47, "learning_rate": 2.75343581650582e-05, "loss": 0.7972, "step": 34920 }, { "epoch": 0.47, "learning_rate": 2.7529123620660868e-05, "loss": 1.3059, "step": 34925 }, { "epoch": 0.47, "learning_rate": 2.752388896423601e-05, "loss": 0.8331, "step": 34930 }, { "epoch": 0.47, "learning_rate": 2.75186541960155e-05, "loss": 0.9245, "step": 34935 }, { "epoch": 0.47, "learning_rate": 2.7513419316231215e-05, "loss": 1.0226, "step": 34940 }, { "epoch": 0.47, "learning_rate": 2.7508184325115028e-05, "loss": 1.0013, "step": 34945 }, { "epoch": 0.47, "learning_rate": 2.7502949222898815e-05, "loss": 0.8321, "step": 34950 }, { "epoch": 0.47, "learning_rate": 2.749771400981448e-05, "loss": 0.1905, "step": 34955 }, { "epoch": 0.47, "learning_rate": 2.7492478686093904e-05, "loss": 0.7879, "step": 34960 }, { "epoch": 0.47, "learning_rate": 2.7487243251968996e-05, "loss": 0.2489, "step": 34965 }, { "epoch": 0.47, "learning_rate": 2.7482007707671658e-05, "loss": 0.7653, "step": 34970 }, { "epoch": 0.47, "learning_rate": 2.7476772053433797e-05, "loss": 0.8005, "step": 34975 }, { "epoch": 0.47, "learning_rate": 2.7471536289487314e-05, "loss": 0.1577, "step": 34980 }, { "epoch": 0.47, "learning_rate": 2.7466300416064144e-05, "loss": 1.1973, "step": 34985 }, { "epoch": 0.47, "learning_rate": 2.7461064433396207e-05, "loss": 0.3165, "step": 34990 }, { "epoch": 0.47, "learning_rate": 2.7455828341715424e-05, "loss": 0.726, "step": 34995 }, { "epoch": 0.47, "learning_rate": 2.7450592141253734e-05, "loss": 0.7324, "step": 35000 }, { "epoch": 0.47, "learning_rate": 2.7445355832243068e-05, "loss": 1.4008, "step": 35005 }, { "epoch": 0.47, "learning_rate": 2.7440119414915373e-05, "loss": 0.7914, "step": 35010 }, { "epoch": 0.47, "learning_rate": 2.74348828895026e-05, "loss": 0.6969, "step": 35015 }, { "epoch": 0.47, "learning_rate": 2.7429646256236697e-05, "loss": 0.3026, "step": 35020 }, { "epoch": 0.47, "learning_rate": 2.742440951534962e-05, "loss": 0.8442, "step": 35025 }, { "epoch": 0.47, "learning_rate": 2.7419172667073327e-05, "loss": 0.2617, "step": 35030 }, { "epoch": 0.47, "learning_rate": 2.7413935711639787e-05, "loss": 1.0494, "step": 35035 }, { "epoch": 0.47, "learning_rate": 2.740869864928097e-05, "loss": 0.5912, "step": 35040 }, { "epoch": 0.47, "learning_rate": 2.740346148022886e-05, "loss": 1.0207, "step": 35045 }, { "epoch": 0.47, "learning_rate": 2.7398224204715422e-05, "loss": 0.5414, "step": 35050 }, { "epoch": 0.47, "learning_rate": 2.739298682297266e-05, "loss": 0.4752, "step": 35055 }, { "epoch": 0.47, "learning_rate": 2.7387749335232543e-05, "loss": 0.2777, "step": 35060 }, { "epoch": 0.47, "learning_rate": 2.7382511741727078e-05, "loss": 0.7578, "step": 35065 }, { "epoch": 0.47, "learning_rate": 2.7377274042688267e-05, "loss": 1.3144, "step": 35070 }, { "epoch": 0.47, "learning_rate": 2.7372036238348102e-05, "loss": 0.6332, "step": 35075 }, { "epoch": 0.47, "learning_rate": 2.736679832893861e-05, "loss": 0.4873, "step": 35080 }, { "epoch": 0.47, "learning_rate": 2.7361560314691788e-05, "loss": 0.7606, "step": 35085 }, { "epoch": 0.47, "learning_rate": 2.7356322195839656e-05, "loss": 0.8697, "step": 35090 }, { "epoch": 0.47, "learning_rate": 2.7351083972614238e-05, "loss": 0.6018, "step": 35095 }, { "epoch": 0.47, "learning_rate": 2.7345845645247563e-05, "loss": 0.7327, "step": 35100 }, { "epoch": 0.47, "learning_rate": 2.7340607213971666e-05, "loss": 0.8222, "step": 35105 }, { "epoch": 0.47, "learning_rate": 2.7335368679018573e-05, "loss": 0.8445, "step": 35110 }, { "epoch": 0.47, "learning_rate": 2.7330130040620332e-05, "loss": 0.519, "step": 35115 }, { "epoch": 0.47, "learning_rate": 2.7324891299008985e-05, "loss": 0.28, "step": 35120 }, { "epoch": 0.47, "learning_rate": 2.7319652454416595e-05, "loss": 0.8141, "step": 35125 }, { "epoch": 0.47, "learning_rate": 2.73144135070752e-05, "loss": 0.75, "step": 35130 }, { "epoch": 0.47, "learning_rate": 2.7309174457216867e-05, "loss": 0.2599, "step": 35135 }, { "epoch": 0.47, "learning_rate": 2.7303935305073658e-05, "loss": 0.7482, "step": 35140 }, { "epoch": 0.47, "learning_rate": 2.7298696050877636e-05, "loss": 1.4217, "step": 35145 }, { "epoch": 0.47, "learning_rate": 2.729345669486088e-05, "loss": 0.5303, "step": 35150 }, { "epoch": 0.47, "learning_rate": 2.728821723725547e-05, "loss": 0.7826, "step": 35155 }, { "epoch": 0.47, "learning_rate": 2.728297767829348e-05, "loss": 0.3527, "step": 35160 }, { "epoch": 0.47, "learning_rate": 2.727773801820701e-05, "loss": 0.8037, "step": 35165 }, { "epoch": 0.47, "learning_rate": 2.727249825722813e-05, "loss": 0.7466, "step": 35170 }, { "epoch": 0.47, "learning_rate": 2.7267258395588948e-05, "loss": 0.8376, "step": 35175 }, { "epoch": 0.47, "learning_rate": 2.7262018433521563e-05, "loss": 1.0592, "step": 35180 }, { "epoch": 0.47, "learning_rate": 2.725677837125808e-05, "loss": 0.6709, "step": 35185 }, { "epoch": 0.47, "learning_rate": 2.7251538209030607e-05, "loss": 0.7447, "step": 35190 }, { "epoch": 0.47, "learning_rate": 2.7246297947071254e-05, "loss": 1.0953, "step": 35195 }, { "epoch": 0.47, "learning_rate": 2.7241057585612133e-05, "loss": 1.0367, "step": 35200 }, { "epoch": 0.47, "learning_rate": 2.7235817124885376e-05, "loss": 0.551, "step": 35205 }, { "epoch": 0.47, "learning_rate": 2.723057656512311e-05, "loss": 0.6006, "step": 35210 }, { "epoch": 0.47, "learning_rate": 2.722533590655746e-05, "loss": 0.5759, "step": 35215 }, { "epoch": 0.47, "learning_rate": 2.7220095149420566e-05, "loss": 0.8436, "step": 35220 }, { "epoch": 0.47, "learning_rate": 2.721485429394456e-05, "loss": 0.6422, "step": 35225 }, { "epoch": 0.47, "learning_rate": 2.7209613340361582e-05, "loss": 0.1159, "step": 35230 }, { "epoch": 0.47, "learning_rate": 2.7204372288903795e-05, "loss": 0.4892, "step": 35235 }, { "epoch": 0.47, "learning_rate": 2.719913113980334e-05, "loss": 0.2063, "step": 35240 }, { "epoch": 0.47, "learning_rate": 2.7193889893292385e-05, "loss": 0.6493, "step": 35245 }, { "epoch": 0.47, "learning_rate": 2.7188648549603078e-05, "loss": 0.898, "step": 35250 }, { "epoch": 0.47, "learning_rate": 2.718340710896759e-05, "loss": 1.0098, "step": 35255 }, { "epoch": 0.47, "learning_rate": 2.7178165571618085e-05, "loss": 0.8085, "step": 35260 }, { "epoch": 0.47, "learning_rate": 2.7172923937786752e-05, "loss": 0.6724, "step": 35265 }, { "epoch": 0.47, "learning_rate": 2.716768220770576e-05, "loss": 0.4473, "step": 35270 }, { "epoch": 0.47, "learning_rate": 2.7162440381607285e-05, "loss": 0.5622, "step": 35275 }, { "epoch": 0.47, "learning_rate": 2.7157198459723516e-05, "loss": 0.3418, "step": 35280 }, { "epoch": 0.47, "learning_rate": 2.7151956442286652e-05, "loss": 0.4098, "step": 35285 }, { "epoch": 0.47, "learning_rate": 2.7146714329528882e-05, "loss": 0.9976, "step": 35290 }, { "epoch": 0.47, "learning_rate": 2.714147212168241e-05, "loss": 0.5481, "step": 35295 }, { "epoch": 0.47, "learning_rate": 2.7136229818979435e-05, "loss": 1.2609, "step": 35300 }, { "epoch": 0.47, "learning_rate": 2.713098742165217e-05, "loss": 0.2191, "step": 35305 }, { "epoch": 0.47, "learning_rate": 2.7125744929932818e-05, "loss": 1.2333, "step": 35310 }, { "epoch": 0.47, "learning_rate": 2.7120502344053593e-05, "loss": 0.3979, "step": 35315 }, { "epoch": 0.47, "learning_rate": 2.711525966424674e-05, "loss": 0.5367, "step": 35320 }, { "epoch": 0.47, "learning_rate": 2.711001689074445e-05, "loss": 0.4688, "step": 35325 }, { "epoch": 0.47, "learning_rate": 2.7104774023778977e-05, "loss": 0.3047, "step": 35330 }, { "epoch": 0.47, "learning_rate": 2.7099531063582544e-05, "loss": 0.6496, "step": 35335 }, { "epoch": 0.47, "learning_rate": 2.709428801038738e-05, "loss": 0.8811, "step": 35340 }, { "epoch": 0.47, "learning_rate": 2.708904486442575e-05, "loss": 1.0703, "step": 35345 }, { "epoch": 0.47, "learning_rate": 2.7083801625929873e-05, "loss": 0.5937, "step": 35350 }, { "epoch": 0.47, "learning_rate": 2.7078558295132012e-05, "loss": 0.5458, "step": 35355 }, { "epoch": 0.47, "learning_rate": 2.707331487226442e-05, "loss": 0.6337, "step": 35360 }, { "epoch": 0.47, "learning_rate": 2.7068071357559343e-05, "loss": 1.3482, "step": 35365 }, { "epoch": 0.47, "learning_rate": 2.7062827751249054e-05, "loss": 1.323, "step": 35370 }, { "epoch": 0.47, "learning_rate": 2.705758405356582e-05, "loss": 0.7142, "step": 35375 }, { "epoch": 0.47, "learning_rate": 2.7052340264741904e-05, "loss": 0.5896, "step": 35380 }, { "epoch": 0.47, "learning_rate": 2.7047096385009586e-05, "loss": 1.1756, "step": 35385 }, { "epoch": 0.47, "learning_rate": 2.704185241460113e-05, "loss": 0.2298, "step": 35390 }, { "epoch": 0.47, "learning_rate": 2.7036608353748833e-05, "loss": 0.6434, "step": 35395 }, { "epoch": 0.47, "learning_rate": 2.703136420268497e-05, "loss": 0.682, "step": 35400 }, { "epoch": 0.47, "learning_rate": 2.7026119961641845e-05, "loss": 0.0984, "step": 35405 }, { "epoch": 0.47, "learning_rate": 2.7020875630851737e-05, "loss": 1.1802, "step": 35410 }, { "epoch": 0.47, "learning_rate": 2.701563121054695e-05, "loss": 0.686, "step": 35415 }, { "epoch": 0.47, "learning_rate": 2.7010386700959784e-05, "loss": 0.7556, "step": 35420 }, { "epoch": 0.47, "learning_rate": 2.700514210232254e-05, "loss": 0.7717, "step": 35425 }, { "epoch": 0.47, "learning_rate": 2.6999897414867536e-05, "loss": 0.9362, "step": 35430 }, { "epoch": 0.47, "learning_rate": 2.6994652638827078e-05, "loss": 0.5535, "step": 35435 }, { "epoch": 0.47, "learning_rate": 2.6989407774433494e-05, "loss": 0.9749, "step": 35440 }, { "epoch": 0.47, "learning_rate": 2.698416282191909e-05, "loss": 0.4998, "step": 35445 }, { "epoch": 0.47, "learning_rate": 2.6978917781516206e-05, "loss": 0.661, "step": 35450 }, { "epoch": 0.48, "learning_rate": 2.697367265345716e-05, "loss": 0.458, "step": 35455 }, { "epoch": 0.48, "learning_rate": 2.696842743797429e-05, "loss": 0.8293, "step": 35460 }, { "epoch": 0.48, "learning_rate": 2.696318213529994e-05, "loss": 0.5271, "step": 35465 }, { "epoch": 0.48, "learning_rate": 2.695793674566644e-05, "loss": 0.4082, "step": 35470 }, { "epoch": 0.48, "learning_rate": 2.695269126930613e-05, "loss": 0.3627, "step": 35475 }, { "epoch": 0.48, "learning_rate": 2.694744570645137e-05, "loss": 1.0271, "step": 35480 }, { "epoch": 0.48, "learning_rate": 2.694220005733451e-05, "loss": 0.1909, "step": 35485 }, { "epoch": 0.48, "learning_rate": 2.69369543221879e-05, "loss": 0.4474, "step": 35490 }, { "epoch": 0.48, "learning_rate": 2.6931708501243907e-05, "loss": 0.7366, "step": 35495 }, { "epoch": 0.48, "learning_rate": 2.692646259473489e-05, "loss": 0.6857, "step": 35500 }, { "epoch": 0.48, "learning_rate": 2.6921216602893216e-05, "loss": 1.0765, "step": 35505 }, { "epoch": 0.48, "learning_rate": 2.691597052595126e-05, "loss": 0.5656, "step": 35510 }, { "epoch": 0.48, "learning_rate": 2.6910724364141397e-05, "loss": 1.7076, "step": 35515 }, { "epoch": 0.48, "learning_rate": 2.6905478117696002e-05, "loss": 0.8773, "step": 35520 }, { "epoch": 0.48, "learning_rate": 2.6900231786847464e-05, "loss": 0.896, "step": 35525 }, { "epoch": 0.48, "learning_rate": 2.6894985371828156e-05, "loss": 0.7847, "step": 35530 }, { "epoch": 0.48, "learning_rate": 2.688973887287048e-05, "loss": 0.1989, "step": 35535 }, { "epoch": 0.48, "learning_rate": 2.688449229020683e-05, "loss": 0.7026, "step": 35540 }, { "epoch": 0.48, "learning_rate": 2.6879245624069594e-05, "loss": 0.2385, "step": 35545 }, { "epoch": 0.48, "learning_rate": 2.687399887469118e-05, "loss": 0.6003, "step": 35550 }, { "epoch": 0.48, "learning_rate": 2.686875204230399e-05, "loss": 0.1849, "step": 35555 }, { "epoch": 0.48, "learning_rate": 2.6863505127140433e-05, "loss": 0.6743, "step": 35560 }, { "epoch": 0.48, "learning_rate": 2.685825812943292e-05, "loss": 2.0351, "step": 35565 }, { "epoch": 0.48, "learning_rate": 2.6853011049413875e-05, "loss": 0.6908, "step": 35570 }, { "epoch": 0.48, "learning_rate": 2.684776388731571e-05, "loss": 0.5314, "step": 35575 }, { "epoch": 0.48, "learning_rate": 2.6842516643370848e-05, "loss": 0.6982, "step": 35580 }, { "epoch": 0.48, "learning_rate": 2.6837269317811715e-05, "loss": 1.2443, "step": 35585 }, { "epoch": 0.48, "learning_rate": 2.6832021910870735e-05, "loss": 0.4236, "step": 35590 }, { "epoch": 0.48, "learning_rate": 2.6826774422780366e-05, "loss": 0.9684, "step": 35595 }, { "epoch": 0.48, "learning_rate": 2.6821526853773017e-05, "loss": 0.7109, "step": 35600 }, { "epoch": 0.48, "learning_rate": 2.6816279204081146e-05, "loss": 0.5613, "step": 35605 }, { "epoch": 0.48, "learning_rate": 2.6811031473937187e-05, "loss": 1.0708, "step": 35610 }, { "epoch": 0.48, "learning_rate": 2.6805783663573597e-05, "loss": 0.8863, "step": 35615 }, { "epoch": 0.48, "learning_rate": 2.680053577322283e-05, "loss": 0.7908, "step": 35620 }, { "epoch": 0.48, "learning_rate": 2.679528780311733e-05, "loss": 0.8871, "step": 35625 }, { "epoch": 0.48, "learning_rate": 2.6790039753489565e-05, "loss": 0.4631, "step": 35630 }, { "epoch": 0.48, "learning_rate": 2.6784791624572e-05, "loss": 0.5115, "step": 35635 }, { "epoch": 0.48, "learning_rate": 2.6779543416597086e-05, "loss": 0.382, "step": 35640 }, { "epoch": 0.48, "learning_rate": 2.67742951297973e-05, "loss": 1.2644, "step": 35645 }, { "epoch": 0.48, "learning_rate": 2.676904676440512e-05, "loss": 0.4408, "step": 35650 }, { "epoch": 0.48, "learning_rate": 2.6763798320653017e-05, "loss": 0.6246, "step": 35655 }, { "epoch": 0.48, "learning_rate": 2.675854979877348e-05, "loss": 0.1332, "step": 35660 }, { "epoch": 0.48, "learning_rate": 2.6753301198998976e-05, "loss": 0.9984, "step": 35665 }, { "epoch": 0.48, "learning_rate": 2.6748052521562002e-05, "loss": 1.323, "step": 35670 }, { "epoch": 0.48, "learning_rate": 2.6742803766695046e-05, "loss": 0.6969, "step": 35675 }, { "epoch": 0.48, "learning_rate": 2.6737554934630605e-05, "loss": 1.0189, "step": 35680 }, { "epoch": 0.48, "learning_rate": 2.6732306025601172e-05, "loss": 0.9645, "step": 35685 }, { "epoch": 0.48, "learning_rate": 2.6727057039839255e-05, "loss": 0.6301, "step": 35690 }, { "epoch": 0.48, "learning_rate": 2.6721807977577334e-05, "loss": 0.779, "step": 35695 }, { "epoch": 0.48, "learning_rate": 2.671655883904795e-05, "loss": 1.0248, "step": 35700 }, { "epoch": 0.48, "learning_rate": 2.6711309624483593e-05, "loss": 0.6954, "step": 35705 }, { "epoch": 0.48, "learning_rate": 2.6706060334116777e-05, "loss": 0.5961, "step": 35710 }, { "epoch": 0.48, "learning_rate": 2.670081096818003e-05, "loss": 0.5519, "step": 35715 }, { "epoch": 0.48, "learning_rate": 2.6695561526905853e-05, "loss": 0.3171, "step": 35720 }, { "epoch": 0.48, "learning_rate": 2.669031201052679e-05, "loss": 0.6134, "step": 35725 }, { "epoch": 0.48, "learning_rate": 2.668506241927537e-05, "loss": 0.6288, "step": 35730 }, { "epoch": 0.48, "learning_rate": 2.6679812753384105e-05, "loss": 1.0592, "step": 35735 }, { "epoch": 0.48, "learning_rate": 2.6674563013085547e-05, "loss": 0.5168, "step": 35740 }, { "epoch": 0.48, "learning_rate": 2.6669313198612222e-05, "loss": 1.0178, "step": 35745 }, { "epoch": 0.48, "learning_rate": 2.6664063310196662e-05, "loss": 1.276, "step": 35750 }, { "epoch": 0.48, "learning_rate": 2.6658813348071437e-05, "loss": 0.8894, "step": 35755 }, { "epoch": 0.48, "learning_rate": 2.6653563312469076e-05, "loss": 1.0932, "step": 35760 }, { "epoch": 0.48, "learning_rate": 2.664831320362213e-05, "loss": 0.4398, "step": 35765 }, { "epoch": 0.48, "learning_rate": 2.664306302176316e-05, "loss": 0.4652, "step": 35770 }, { "epoch": 0.48, "learning_rate": 2.663781276712471e-05, "loss": 0.8349, "step": 35775 }, { "epoch": 0.48, "learning_rate": 2.663256243993935e-05, "loss": 0.1945, "step": 35780 }, { "epoch": 0.48, "learning_rate": 2.662731204043965e-05, "loss": 0.7336, "step": 35785 }, { "epoch": 0.48, "learning_rate": 2.662206156885816e-05, "loss": 0.2386, "step": 35790 }, { "epoch": 0.48, "learning_rate": 2.6616811025427457e-05, "loss": 1.0715, "step": 35795 }, { "epoch": 0.48, "learning_rate": 2.661156041038012e-05, "loss": 0.176, "step": 35800 }, { "epoch": 0.48, "learning_rate": 2.6606309723948707e-05, "loss": 0.9027, "step": 35805 }, { "epoch": 0.48, "learning_rate": 2.6601058966365822e-05, "loss": 0.83, "step": 35810 }, { "epoch": 0.48, "learning_rate": 2.6595808137864037e-05, "loss": 0.638, "step": 35815 }, { "epoch": 0.48, "learning_rate": 2.659055723867593e-05, "loss": 1.9227, "step": 35820 }, { "epoch": 0.48, "learning_rate": 2.6585306269034094e-05, "loss": 1.3688, "step": 35825 }, { "epoch": 0.48, "learning_rate": 2.658005522917112e-05, "loss": 1.3189, "step": 35830 }, { "epoch": 0.48, "learning_rate": 2.6574804119319596e-05, "loss": 0.3515, "step": 35835 }, { "epoch": 0.48, "learning_rate": 2.6569552939712144e-05, "loss": 0.6331, "step": 35840 }, { "epoch": 0.48, "learning_rate": 2.656430169058134e-05, "loss": 0.6119, "step": 35845 }, { "epoch": 0.48, "learning_rate": 2.65590503721598e-05, "loss": 0.367, "step": 35850 }, { "epoch": 0.48, "learning_rate": 2.655379898468013e-05, "loss": 0.7225, "step": 35855 }, { "epoch": 0.48, "learning_rate": 2.6548547528374928e-05, "loss": 0.8208, "step": 35860 }, { "epoch": 0.48, "learning_rate": 2.654329600347683e-05, "loss": 0.9492, "step": 35865 }, { "epoch": 0.48, "learning_rate": 2.653804441021844e-05, "loss": 1.1493, "step": 35870 }, { "epoch": 0.48, "learning_rate": 2.6532792748832365e-05, "loss": 0.8168, "step": 35875 }, { "epoch": 0.48, "learning_rate": 2.652754101955125e-05, "loss": 0.7309, "step": 35880 }, { "epoch": 0.48, "learning_rate": 2.6522289222607704e-05, "loss": 0.2334, "step": 35885 }, { "epoch": 0.48, "learning_rate": 2.6517037358234365e-05, "loss": 0.6492, "step": 35890 }, { "epoch": 0.48, "learning_rate": 2.651178542666386e-05, "loss": 0.5227, "step": 35895 }, { "epoch": 0.48, "learning_rate": 2.650653342812882e-05, "loss": 0.135, "step": 35900 }, { "epoch": 0.48, "learning_rate": 2.6502331781242662e-05, "loss": 1.5258, "step": 35905 }, { "epoch": 0.48, "learning_rate": 2.6497079662757724e-05, "loss": 0.8831, "step": 35910 }, { "epoch": 0.48, "learning_rate": 2.6491827477959635e-05, "loss": 0.5219, "step": 35915 }, { "epoch": 0.48, "learning_rate": 2.6486575227081056e-05, "loss": 0.6212, "step": 35920 }, { "epoch": 0.48, "learning_rate": 2.6481322910354634e-05, "loss": 0.4404, "step": 35925 }, { "epoch": 0.48, "learning_rate": 2.647607052801302e-05, "loss": 1.3804, "step": 35930 }, { "epoch": 0.48, "learning_rate": 2.6470818080288857e-05, "loss": 1.2636, "step": 35935 }, { "epoch": 0.48, "learning_rate": 2.6465565567414812e-05, "loss": 0.8521, "step": 35940 }, { "epoch": 0.48, "learning_rate": 2.646031298962355e-05, "loss": 0.1883, "step": 35945 }, { "epoch": 0.48, "learning_rate": 2.645506034714773e-05, "loss": 1.1481, "step": 35950 }, { "epoch": 0.48, "learning_rate": 2.6449807640220015e-05, "loss": 0.8056, "step": 35955 }, { "epoch": 0.48, "learning_rate": 2.6444554869073075e-05, "loss": 0.4028, "step": 35960 }, { "epoch": 0.48, "learning_rate": 2.643930203393958e-05, "loss": 0.5561, "step": 35965 }, { "epoch": 0.48, "learning_rate": 2.6434049135052202e-05, "loss": 0.2901, "step": 35970 }, { "epoch": 0.48, "learning_rate": 2.6428796172643623e-05, "loss": 0.6144, "step": 35975 }, { "epoch": 0.48, "learning_rate": 2.642354314694652e-05, "loss": 0.4836, "step": 35980 }, { "epoch": 0.48, "learning_rate": 2.641829005819359e-05, "loss": 1.5051, "step": 35985 }, { "epoch": 0.48, "learning_rate": 2.6413036906617495e-05, "loss": 0.5223, "step": 35990 }, { "epoch": 0.48, "learning_rate": 2.6407783692450934e-05, "loss": 0.8882, "step": 35995 }, { "epoch": 0.48, "learning_rate": 2.640253041592659e-05, "loss": 1.3775, "step": 36000 }, { "epoch": 0.48, "learning_rate": 2.6397277077277183e-05, "loss": 0.6507, "step": 36005 }, { "epoch": 0.48, "learning_rate": 2.6392023676735384e-05, "loss": 0.3002, "step": 36010 }, { "epoch": 0.48, "learning_rate": 2.63867702145339e-05, "loss": 1.2059, "step": 36015 }, { "epoch": 0.48, "learning_rate": 2.6381516690905434e-05, "loss": 1.0015, "step": 36020 }, { "epoch": 0.48, "learning_rate": 2.6376263106082686e-05, "loss": 0.7145, "step": 36025 }, { "epoch": 0.48, "learning_rate": 2.6371009460298368e-05, "loss": 0.5025, "step": 36030 }, { "epoch": 0.48, "learning_rate": 2.63657557537852e-05, "loss": 0.3984, "step": 36035 }, { "epoch": 0.48, "learning_rate": 2.6360501986775883e-05, "loss": 0.3017, "step": 36040 }, { "epoch": 0.48, "learning_rate": 2.635524815950312e-05, "loss": 0.4292, "step": 36045 }, { "epoch": 0.48, "learning_rate": 2.6349994272199652e-05, "loss": 0.591, "step": 36050 }, { "epoch": 0.48, "learning_rate": 2.6344740325098192e-05, "loss": 0.4909, "step": 36055 }, { "epoch": 0.48, "learning_rate": 2.6339486318431468e-05, "loss": 0.8839, "step": 36060 }, { "epoch": 0.48, "learning_rate": 2.6334232252432193e-05, "loss": 0.3984, "step": 36065 }, { "epoch": 0.48, "learning_rate": 2.632897812733311e-05, "loss": 0.2062, "step": 36070 }, { "epoch": 0.48, "learning_rate": 2.6323723943366946e-05, "loss": 0.7523, "step": 36075 }, { "epoch": 0.48, "learning_rate": 2.6318469700766428e-05, "loss": 0.6568, "step": 36080 }, { "epoch": 0.48, "learning_rate": 2.6313215399764296e-05, "loss": 0.7073, "step": 36085 }, { "epoch": 0.48, "learning_rate": 2.6307961040593298e-05, "loss": 0.5899, "step": 36090 }, { "epoch": 0.48, "learning_rate": 2.6302706623486175e-05, "loss": 0.8564, "step": 36095 }, { "epoch": 0.48, "learning_rate": 2.6297452148675657e-05, "loss": 0.9962, "step": 36100 }, { "epoch": 0.48, "learning_rate": 2.62921976163945e-05, "loss": 0.5816, "step": 36105 }, { "epoch": 0.48, "learning_rate": 2.6286943026875456e-05, "loss": 0.1179, "step": 36110 }, { "epoch": 0.48, "learning_rate": 2.6281688380351265e-05, "loss": 1.7359, "step": 36115 }, { "epoch": 0.48, "learning_rate": 2.62764336770547e-05, "loss": 2.0633, "step": 36120 }, { "epoch": 0.48, "learning_rate": 2.6271178917218507e-05, "loss": 0.2301, "step": 36125 }, { "epoch": 0.48, "learning_rate": 2.626592410107545e-05, "loss": 0.7604, "step": 36130 }, { "epoch": 0.48, "learning_rate": 2.6260669228858286e-05, "loss": 0.8685, "step": 36135 }, { "epoch": 0.48, "learning_rate": 2.625541430079978e-05, "loss": 0.2433, "step": 36140 }, { "epoch": 0.48, "learning_rate": 2.6250159317132706e-05, "loss": 0.5956, "step": 36145 }, { "epoch": 0.48, "learning_rate": 2.6244904278089832e-05, "loss": 0.8025, "step": 36150 }, { "epoch": 0.48, "learning_rate": 2.623964918390392e-05, "loss": 0.3619, "step": 36155 }, { "epoch": 0.48, "learning_rate": 2.6234394034807746e-05, "loss": 0.893, "step": 36160 }, { "epoch": 0.48, "learning_rate": 2.62291388310341e-05, "loss": 0.5136, "step": 36165 }, { "epoch": 0.48, "learning_rate": 2.622388357281575e-05, "loss": 1.3192, "step": 36170 }, { "epoch": 0.48, "learning_rate": 2.621862826038548e-05, "loss": 0.4505, "step": 36175 }, { "epoch": 0.48, "learning_rate": 2.6213372893976074e-05, "loss": 0.5428, "step": 36180 }, { "epoch": 0.48, "learning_rate": 2.6208117473820328e-05, "loss": 1.0918, "step": 36185 }, { "epoch": 0.48, "learning_rate": 2.620286200015101e-05, "loss": 0.7618, "step": 36190 }, { "epoch": 0.48, "learning_rate": 2.6197606473200924e-05, "loss": 0.3883, "step": 36195 }, { "epoch": 0.49, "learning_rate": 2.619235089320287e-05, "loss": 0.247, "step": 36200 }, { "epoch": 0.49, "learning_rate": 2.618709526038964e-05, "loss": 0.4012, "step": 36205 }, { "epoch": 0.49, "learning_rate": 2.6181839574994016e-05, "loss": 0.3241, "step": 36210 }, { "epoch": 0.49, "learning_rate": 2.6176583837248815e-05, "loss": 0.291, "step": 36215 }, { "epoch": 0.49, "learning_rate": 2.6171328047386846e-05, "loss": 0.8127, "step": 36220 }, { "epoch": 0.49, "learning_rate": 2.616607220564089e-05, "loss": 0.1299, "step": 36225 }, { "epoch": 0.49, "learning_rate": 2.616081631224378e-05, "loss": 0.8927, "step": 36230 }, { "epoch": 0.49, "learning_rate": 2.615556036742831e-05, "loss": 0.6108, "step": 36235 }, { "epoch": 0.49, "learning_rate": 2.61503043714273e-05, "loss": 0.5121, "step": 36240 }, { "epoch": 0.49, "learning_rate": 2.6145048324473554e-05, "loss": 1.3796, "step": 36245 }, { "epoch": 0.49, "learning_rate": 2.6139792226799897e-05, "loss": 0.4198, "step": 36250 }, { "epoch": 0.49, "learning_rate": 2.6134536078639156e-05, "loss": 0.6239, "step": 36255 }, { "epoch": 0.49, "learning_rate": 2.612927988022414e-05, "loss": 1.1708, "step": 36260 }, { "epoch": 0.49, "learning_rate": 2.612402363178767e-05, "loss": 1.2554, "step": 36265 }, { "epoch": 0.49, "learning_rate": 2.6118767333562572e-05, "loss": 0.9203, "step": 36270 }, { "epoch": 0.49, "learning_rate": 2.611351098578169e-05, "loss": 0.307, "step": 36275 }, { "epoch": 0.49, "learning_rate": 2.6108254588677832e-05, "loss": 0.4363, "step": 36280 }, { "epoch": 0.49, "learning_rate": 2.610299814248385e-05, "loss": 0.3212, "step": 36285 }, { "epoch": 0.49, "learning_rate": 2.6097741647432562e-05, "loss": 0.5182, "step": 36290 }, { "epoch": 0.49, "learning_rate": 2.609248510375681e-05, "loss": 0.619, "step": 36295 }, { "epoch": 0.49, "learning_rate": 2.6087228511689432e-05, "loss": 0.1276, "step": 36300 }, { "epoch": 0.49, "learning_rate": 2.6081971871463274e-05, "loss": 0.4333, "step": 36305 }, { "epoch": 0.49, "learning_rate": 2.6076715183311172e-05, "loss": 0.7369, "step": 36310 }, { "epoch": 0.49, "learning_rate": 2.6071458447465986e-05, "loss": 0.5211, "step": 36315 }, { "epoch": 0.49, "learning_rate": 2.6066201664160534e-05, "loss": 0.9926, "step": 36320 }, { "epoch": 0.49, "learning_rate": 2.606094483362769e-05, "loss": 0.866, "step": 36325 }, { "epoch": 0.49, "learning_rate": 2.60556879561003e-05, "loss": 0.7775, "step": 36330 }, { "epoch": 0.49, "learning_rate": 2.6050431031811205e-05, "loss": 0.6922, "step": 36335 }, { "epoch": 0.49, "learning_rate": 2.6045174060993282e-05, "loss": 0.6787, "step": 36340 }, { "epoch": 0.49, "learning_rate": 2.6039917043879374e-05, "loss": 0.348, "step": 36345 }, { "epoch": 0.49, "learning_rate": 2.603465998070234e-05, "loss": 0.4494, "step": 36350 }, { "epoch": 0.49, "learning_rate": 2.6029402871695047e-05, "loss": 0.2235, "step": 36355 }, { "epoch": 0.49, "learning_rate": 2.6024145717090358e-05, "loss": 0.6191, "step": 36360 }, { "epoch": 0.49, "learning_rate": 2.6018888517121136e-05, "loss": 0.3382, "step": 36365 }, { "epoch": 0.49, "learning_rate": 2.6013631272020256e-05, "loss": 0.4372, "step": 36370 }, { "epoch": 0.49, "learning_rate": 2.6008373982020572e-05, "loss": 0.564, "step": 36375 }, { "epoch": 0.49, "learning_rate": 2.6003116647354968e-05, "loss": 0.5463, "step": 36380 }, { "epoch": 0.49, "learning_rate": 2.599785926825632e-05, "loss": 0.4921, "step": 36385 }, { "epoch": 0.49, "learning_rate": 2.599260184495749e-05, "loss": 0.7228, "step": 36390 }, { "epoch": 0.49, "learning_rate": 2.5987344377691376e-05, "loss": 0.4734, "step": 36395 }, { "epoch": 0.49, "learning_rate": 2.5982086866690835e-05, "loss": 0.4722, "step": 36400 }, { "epoch": 0.49, "learning_rate": 2.597682931218876e-05, "loss": 0.5475, "step": 36405 }, { "epoch": 0.49, "learning_rate": 2.5971571714418035e-05, "loss": 0.7852, "step": 36410 }, { "epoch": 0.49, "learning_rate": 2.5966314073611548e-05, "loss": 0.1556, "step": 36415 }, { "epoch": 0.49, "learning_rate": 2.596105639000218e-05, "loss": 0.5674, "step": 36420 }, { "epoch": 0.49, "learning_rate": 2.5955798663822822e-05, "loss": 0.9462, "step": 36425 }, { "epoch": 0.49, "learning_rate": 2.5950540895306362e-05, "loss": 0.5282, "step": 36430 }, { "epoch": 0.49, "learning_rate": 2.5945283084685694e-05, "loss": 0.5981, "step": 36435 }, { "epoch": 0.49, "learning_rate": 2.594002523219372e-05, "loss": 0.4455, "step": 36440 }, { "epoch": 0.49, "learning_rate": 2.5934767338063325e-05, "loss": 0.5951, "step": 36445 }, { "epoch": 0.49, "learning_rate": 2.5929509402527418e-05, "loss": 0.9489, "step": 36450 }, { "epoch": 0.49, "learning_rate": 2.5924251425818897e-05, "loss": 0.7327, "step": 36455 }, { "epoch": 0.49, "learning_rate": 2.5918993408170657e-05, "loss": 1.1373, "step": 36460 }, { "epoch": 0.49, "learning_rate": 2.591373534981561e-05, "loss": 0.8936, "step": 36465 }, { "epoch": 0.49, "learning_rate": 2.590847725098665e-05, "loss": 1.0354, "step": 36470 }, { "epoch": 0.49, "learning_rate": 2.5903219111916703e-05, "loss": 0.579, "step": 36475 }, { "epoch": 0.49, "learning_rate": 2.5897960932838668e-05, "loss": 0.3588, "step": 36480 }, { "epoch": 0.49, "learning_rate": 2.589270271398545e-05, "loss": 0.4196, "step": 36485 }, { "epoch": 0.49, "learning_rate": 2.5887444455589965e-05, "loss": 0.5637, "step": 36490 }, { "epoch": 0.49, "learning_rate": 2.588218615788514e-05, "loss": 0.7326, "step": 36495 }, { "epoch": 0.49, "learning_rate": 2.5876927821103876e-05, "loss": 0.9441, "step": 36500 }, { "epoch": 0.49, "learning_rate": 2.5871669445479096e-05, "loss": 1.2902, "step": 36505 }, { "epoch": 0.49, "learning_rate": 2.586641103124372e-05, "loss": 0.6253, "step": 36510 }, { "epoch": 0.49, "learning_rate": 2.586115257863067e-05, "loss": 0.5878, "step": 36515 }, { "epoch": 0.49, "learning_rate": 2.5855894087872873e-05, "loss": 0.6999, "step": 36520 }, { "epoch": 0.49, "learning_rate": 2.5850635559203246e-05, "loss": 0.6219, "step": 36525 }, { "epoch": 0.49, "learning_rate": 2.5845376992854723e-05, "loss": 0.7782, "step": 36530 }, { "epoch": 0.49, "learning_rate": 2.584011838906023e-05, "loss": 0.6931, "step": 36535 }, { "epoch": 0.49, "learning_rate": 2.5834859748052692e-05, "loss": 0.6626, "step": 36540 }, { "epoch": 0.49, "learning_rate": 2.582960107006504e-05, "loss": 0.575, "step": 36545 }, { "epoch": 0.49, "learning_rate": 2.5824342355330217e-05, "loss": 1.2521, "step": 36550 }, { "epoch": 0.49, "learning_rate": 2.5819083604081145e-05, "loss": 0.8117, "step": 36555 }, { "epoch": 0.49, "learning_rate": 2.5813824816550775e-05, "loss": 0.6011, "step": 36560 }, { "epoch": 0.49, "learning_rate": 2.5808565992972035e-05, "loss": 0.8637, "step": 36565 }, { "epoch": 0.49, "learning_rate": 2.5803307133577858e-05, "loss": 0.5821, "step": 36570 }, { "epoch": 0.49, "learning_rate": 2.5798048238601206e-05, "loss": 1.0694, "step": 36575 }, { "epoch": 0.49, "learning_rate": 2.5792789308275e-05, "loss": 0.1757, "step": 36580 }, { "epoch": 0.49, "learning_rate": 2.57875303428322e-05, "loss": 1.0495, "step": 36585 }, { "epoch": 0.49, "learning_rate": 2.5782271342505747e-05, "loss": 1.0154, "step": 36590 }, { "epoch": 0.49, "learning_rate": 2.5777012307528586e-05, "loss": 1.0474, "step": 36595 }, { "epoch": 0.49, "learning_rate": 2.577175323813366e-05, "loss": 0.5606, "step": 36600 }, { "epoch": 0.49, "learning_rate": 2.5766494134553936e-05, "loss": 0.3461, "step": 36605 }, { "epoch": 0.49, "learning_rate": 2.576123499702235e-05, "loss": 0.816, "step": 36610 }, { "epoch": 0.49, "learning_rate": 2.5755975825771865e-05, "loss": 0.7188, "step": 36615 }, { "epoch": 0.49, "learning_rate": 2.575071662103543e-05, "loss": 0.5347, "step": 36620 }, { "epoch": 0.49, "learning_rate": 2.5745457383046007e-05, "loss": 0.6839, "step": 36625 }, { "epoch": 0.49, "learning_rate": 2.5740198112036552e-05, "loss": 0.7259, "step": 36630 }, { "epoch": 0.49, "learning_rate": 2.5734938808240018e-05, "loss": 0.8595, "step": 36635 }, { "epoch": 0.49, "learning_rate": 2.5729679471889378e-05, "loss": 0.8019, "step": 36640 }, { "epoch": 0.49, "learning_rate": 2.572442010321759e-05, "loss": 0.3449, "step": 36645 }, { "epoch": 0.49, "learning_rate": 2.5719160702457613e-05, "loss": 0.8208, "step": 36650 }, { "epoch": 0.49, "learning_rate": 2.5713901269842404e-05, "loss": 1.1301, "step": 36655 }, { "epoch": 0.49, "learning_rate": 2.5708641805604954e-05, "loss": 0.5584, "step": 36660 }, { "epoch": 0.49, "learning_rate": 2.5703382309978215e-05, "loss": 1.1542, "step": 36665 }, { "epoch": 0.49, "learning_rate": 2.5698122783195155e-05, "loss": 0.1895, "step": 36670 }, { "epoch": 0.49, "learning_rate": 2.569286322548875e-05, "loss": 0.5199, "step": 36675 }, { "epoch": 0.49, "learning_rate": 2.5687603637091968e-05, "loss": 0.8502, "step": 36680 }, { "epoch": 0.49, "learning_rate": 2.5682344018237785e-05, "loss": 0.6591, "step": 36685 }, { "epoch": 0.49, "learning_rate": 2.5677084369159176e-05, "loss": 0.4834, "step": 36690 }, { "epoch": 0.49, "learning_rate": 2.5671824690089126e-05, "loss": 1.0447, "step": 36695 }, { "epoch": 0.49, "learning_rate": 2.5666564981260592e-05, "loss": 1.1534, "step": 36700 }, { "epoch": 0.49, "learning_rate": 2.566130524290657e-05, "loss": 0.9103, "step": 36705 }, { "epoch": 0.49, "learning_rate": 2.5656045475260025e-05, "loss": 0.8903, "step": 36710 }, { "epoch": 0.49, "learning_rate": 2.565078567855396e-05, "loss": 1.3932, "step": 36715 }, { "epoch": 0.49, "learning_rate": 2.564552585302134e-05, "loss": 0.337, "step": 36720 }, { "epoch": 0.49, "learning_rate": 2.5640265998895153e-05, "loss": 1.2305, "step": 36725 }, { "epoch": 0.49, "learning_rate": 2.5635006116408382e-05, "loss": 1.0536, "step": 36730 }, { "epoch": 0.49, "learning_rate": 2.562974620579402e-05, "loss": 0.5222, "step": 36735 }, { "epoch": 0.49, "learning_rate": 2.5624486267285058e-05, "loss": 1.1434, "step": 36740 }, { "epoch": 0.49, "learning_rate": 2.5619226301114468e-05, "loss": 0.462, "step": 36745 }, { "epoch": 0.49, "learning_rate": 2.5613966307515257e-05, "loss": 0.5764, "step": 36750 }, { "epoch": 0.49, "learning_rate": 2.560870628672042e-05, "loss": 0.3396, "step": 36755 }, { "epoch": 0.49, "learning_rate": 2.5603446238962925e-05, "loss": 0.9929, "step": 36760 }, { "epoch": 0.49, "learning_rate": 2.559818616447578e-05, "loss": 0.8914, "step": 36765 }, { "epoch": 0.49, "learning_rate": 2.5592926063491985e-05, "loss": 0.6204, "step": 36770 }, { "epoch": 0.49, "learning_rate": 2.558766593624453e-05, "loss": 0.2002, "step": 36775 }, { "epoch": 0.49, "learning_rate": 2.558240578296642e-05, "loss": 0.8704, "step": 36780 }, { "epoch": 0.49, "learning_rate": 2.557714560389064e-05, "loss": 0.8756, "step": 36785 }, { "epoch": 0.49, "learning_rate": 2.55718853992502e-05, "loss": 0.539, "step": 36790 }, { "epoch": 0.49, "learning_rate": 2.5566625169278096e-05, "loss": 0.5855, "step": 36795 }, { "epoch": 0.49, "learning_rate": 2.5561364914207336e-05, "loss": 0.2922, "step": 36800 }, { "epoch": 0.49, "learning_rate": 2.5556104634270917e-05, "loss": 1.2798, "step": 36805 }, { "epoch": 0.49, "learning_rate": 2.5550844329701852e-05, "loss": 0.6257, "step": 36810 }, { "epoch": 0.49, "learning_rate": 2.5545584000733125e-05, "loss": 0.8184, "step": 36815 }, { "epoch": 0.49, "learning_rate": 2.554032364759776e-05, "loss": 0.973, "step": 36820 }, { "epoch": 0.49, "learning_rate": 2.553506327052877e-05, "loss": 0.583, "step": 36825 }, { "epoch": 0.49, "learning_rate": 2.552980286975914e-05, "loss": 1.2014, "step": 36830 }, { "epoch": 0.49, "learning_rate": 2.5524542445521903e-05, "loss": 1.0428, "step": 36835 }, { "epoch": 0.49, "learning_rate": 2.551928199805006e-05, "loss": 0.7208, "step": 36840 }, { "epoch": 0.49, "learning_rate": 2.5514021527576613e-05, "loss": 0.4786, "step": 36845 }, { "epoch": 0.49, "learning_rate": 2.5508761034334594e-05, "loss": 0.4354, "step": 36850 }, { "epoch": 0.49, "learning_rate": 2.5503500518557e-05, "loss": 0.766, "step": 36855 }, { "epoch": 0.49, "learning_rate": 2.549823998047686e-05, "loss": 0.7158, "step": 36860 }, { "epoch": 0.49, "learning_rate": 2.549297942032718e-05, "loss": 0.8767, "step": 36865 }, { "epoch": 0.49, "learning_rate": 2.5487718838340972e-05, "loss": 1.2458, "step": 36870 }, { "epoch": 0.49, "learning_rate": 2.5482458234751262e-05, "loss": 0.4757, "step": 36875 }, { "epoch": 0.49, "learning_rate": 2.5477197609791066e-05, "loss": 1.1301, "step": 36880 }, { "epoch": 0.49, "learning_rate": 2.54719369636934e-05, "loss": 1.2874, "step": 36885 }, { "epoch": 0.49, "learning_rate": 2.5466676296691293e-05, "loss": 1.3394, "step": 36890 }, { "epoch": 0.49, "learning_rate": 2.5461415609017757e-05, "loss": 0.5673, "step": 36895 }, { "epoch": 0.49, "learning_rate": 2.5456154900905814e-05, "loss": 1.5496, "step": 36900 }, { "epoch": 0.49, "learning_rate": 2.5450894172588503e-05, "loss": 0.5496, "step": 36905 }, { "epoch": 0.49, "learning_rate": 2.5445633424298827e-05, "loss": 0.5147, "step": 36910 }, { "epoch": 0.49, "learning_rate": 2.5440372656269823e-05, "loss": 0.6738, "step": 36915 }, { "epoch": 0.49, "learning_rate": 2.5435111868734517e-05, "loss": 0.8045, "step": 36920 }, { "epoch": 0.49, "learning_rate": 2.5429851061925926e-05, "loss": 0.8749, "step": 36925 }, { "epoch": 0.49, "learning_rate": 2.5424590236077078e-05, "loss": 0.2462, "step": 36930 }, { "epoch": 0.49, "learning_rate": 2.541932939142102e-05, "loss": 0.6845, "step": 36935 }, { "epoch": 0.49, "learning_rate": 2.5414068528190756e-05, "loss": 0.7638, "step": 36940 }, { "epoch": 0.5, "learning_rate": 2.5408807646619337e-05, "loss": 0.4905, "step": 36945 }, { "epoch": 0.5, "learning_rate": 2.5403546746939776e-05, "loss": 0.8215, "step": 36950 }, { "epoch": 0.5, "learning_rate": 2.5398285829385117e-05, "loss": 0.6558, "step": 36955 }, { "epoch": 0.5, "learning_rate": 2.5393024894188387e-05, "loss": 0.5155, "step": 36960 }, { "epoch": 0.5, "learning_rate": 2.5387763941582627e-05, "loss": 0.8596, "step": 36965 }, { "epoch": 0.5, "learning_rate": 2.5382502971800858e-05, "loss": 1.1737, "step": 36970 }, { "epoch": 0.5, "learning_rate": 2.5377241985076126e-05, "loss": 1.1919, "step": 36975 }, { "epoch": 0.5, "learning_rate": 2.5371980981641457e-05, "loss": 0.2212, "step": 36980 }, { "epoch": 0.5, "learning_rate": 2.536671996172989e-05, "loss": 0.3806, "step": 36985 }, { "epoch": 0.5, "learning_rate": 2.5361458925574466e-05, "loss": 1.1917, "step": 36990 }, { "epoch": 0.5, "learning_rate": 2.5356197873408216e-05, "loss": 0.6693, "step": 36995 }, { "epoch": 0.5, "learning_rate": 2.5350936805464192e-05, "loss": 0.659, "step": 37000 }, { "epoch": 0.5, "learning_rate": 2.5345675721975416e-05, "loss": 0.369, "step": 37005 }, { "epoch": 0.5, "learning_rate": 2.534041462317493e-05, "loss": 0.481, "step": 37010 }, { "epoch": 0.5, "learning_rate": 2.533515350929579e-05, "loss": 0.3277, "step": 37015 }, { "epoch": 0.5, "learning_rate": 2.532989238057102e-05, "loss": 0.6016, "step": 37020 }, { "epoch": 0.5, "learning_rate": 2.532463123723367e-05, "loss": 0.9939, "step": 37025 }, { "epoch": 0.5, "learning_rate": 2.531937007951678e-05, "loss": 0.7595, "step": 37030 }, { "epoch": 0.5, "learning_rate": 2.5314108907653395e-05, "loss": 1.0733, "step": 37035 }, { "epoch": 0.5, "learning_rate": 2.530884772187655e-05, "loss": 0.1739, "step": 37040 }, { "epoch": 0.5, "learning_rate": 2.5303586522419304e-05, "loss": 0.7931, "step": 37045 }, { "epoch": 0.5, "learning_rate": 2.5298325309514685e-05, "loss": 0.9156, "step": 37050 }, { "epoch": 0.5, "learning_rate": 2.5293064083395755e-05, "loss": 0.278, "step": 37055 }, { "epoch": 0.5, "learning_rate": 2.528780284429555e-05, "loss": 0.6727, "step": 37060 }, { "epoch": 0.5, "learning_rate": 2.5282541592447118e-05, "loss": 1.07, "step": 37065 }, { "epoch": 0.5, "learning_rate": 2.527728032808351e-05, "loss": 1.1991, "step": 37070 }, { "epoch": 0.5, "learning_rate": 2.5272019051437766e-05, "loss": 0.946, "step": 37075 }, { "epoch": 0.5, "learning_rate": 2.5266757762742943e-05, "loss": 0.5167, "step": 37080 }, { "epoch": 0.5, "learning_rate": 2.5261496462232087e-05, "loss": 0.6962, "step": 37085 }, { "epoch": 0.5, "learning_rate": 2.5256235150138236e-05, "loss": 0.4583, "step": 37090 }, { "epoch": 0.5, "learning_rate": 2.525097382669446e-05, "loss": 0.3043, "step": 37095 }, { "epoch": 0.5, "learning_rate": 2.52457124921338e-05, "loss": 0.7101, "step": 37100 }, { "epoch": 0.5, "learning_rate": 2.5240451146689297e-05, "loss": 0.8512, "step": 37105 }, { "epoch": 0.5, "learning_rate": 2.5235189790594022e-05, "loss": 1.1243, "step": 37110 }, { "epoch": 0.5, "learning_rate": 2.5229928424081008e-05, "loss": 0.5671, "step": 37115 }, { "epoch": 0.5, "learning_rate": 2.522466704738331e-05, "loss": 0.8169, "step": 37120 }, { "epoch": 0.5, "learning_rate": 2.5219405660733998e-05, "loss": 0.746, "step": 37125 }, { "epoch": 0.5, "learning_rate": 2.52141442643661e-05, "loss": 0.6457, "step": 37130 }, { "epoch": 0.5, "learning_rate": 2.5208882858512696e-05, "loss": 0.8701, "step": 37135 }, { "epoch": 0.5, "learning_rate": 2.520362144340682e-05, "loss": 0.2474, "step": 37140 }, { "epoch": 0.5, "learning_rate": 2.5198360019281526e-05, "loss": 1.0413, "step": 37145 }, { "epoch": 0.5, "learning_rate": 2.519309858636989e-05, "loss": 0.7128, "step": 37150 }, { "epoch": 0.5, "learning_rate": 2.5187837144904946e-05, "loss": 0.5753, "step": 37155 }, { "epoch": 0.5, "learning_rate": 2.5182575695119753e-05, "loss": 0.5199, "step": 37160 }, { "epoch": 0.5, "learning_rate": 2.5177314237247374e-05, "loss": 0.5302, "step": 37165 }, { "epoch": 0.5, "learning_rate": 2.517205277152086e-05, "loss": 0.8846, "step": 37170 }, { "epoch": 0.5, "learning_rate": 2.5166791298173263e-05, "loss": 0.6217, "step": 37175 }, { "epoch": 0.5, "learning_rate": 2.5161529817437656e-05, "loss": 0.3644, "step": 37180 }, { "epoch": 0.5, "learning_rate": 2.5156268329547076e-05, "loss": 0.7063, "step": 37185 }, { "epoch": 0.5, "learning_rate": 2.51510068347346e-05, "loss": 0.4418, "step": 37190 }, { "epoch": 0.5, "learning_rate": 2.5145745333233277e-05, "loss": 0.3925, "step": 37195 }, { "epoch": 0.5, "learning_rate": 2.5140483825276155e-05, "loss": 1.0577, "step": 37200 }, { "epoch": 0.5, "learning_rate": 2.5135222311096312e-05, "loss": 0.8187, "step": 37205 }, { "epoch": 0.5, "learning_rate": 2.5129960790926798e-05, "loss": 0.6272, "step": 37210 }, { "epoch": 0.5, "learning_rate": 2.5124699265000662e-05, "loss": 0.7523, "step": 37215 }, { "epoch": 0.5, "learning_rate": 2.5119437733550983e-05, "loss": 0.5116, "step": 37220 }, { "epoch": 0.5, "learning_rate": 2.51141761968108e-05, "loss": 0.3006, "step": 37225 }, { "epoch": 0.5, "learning_rate": 2.510891465501318e-05, "loss": 0.9562, "step": 37230 }, { "epoch": 0.5, "learning_rate": 2.51036531083912e-05, "loss": 0.3392, "step": 37235 }, { "epoch": 0.5, "learning_rate": 2.50983915571779e-05, "loss": 0.4805, "step": 37240 }, { "epoch": 0.5, "learning_rate": 2.509313000160634e-05, "loss": 0.393, "step": 37245 }, { "epoch": 0.5, "learning_rate": 2.5087868441909594e-05, "loss": 1.1392, "step": 37250 }, { "epoch": 0.5, "learning_rate": 2.5082606878320707e-05, "loss": 0.3178, "step": 37255 }, { "epoch": 0.5, "learning_rate": 2.507734531107276e-05, "loss": 0.6283, "step": 37260 }, { "epoch": 0.5, "learning_rate": 2.50720837403988e-05, "loss": 0.7545, "step": 37265 }, { "epoch": 0.5, "learning_rate": 2.5066822166531884e-05, "loss": 1.149, "step": 37270 }, { "epoch": 0.5, "learning_rate": 2.506156058970509e-05, "loss": 0.8366, "step": 37275 }, { "epoch": 0.5, "learning_rate": 2.5056299010151463e-05, "loss": 0.7571, "step": 37280 }, { "epoch": 0.5, "learning_rate": 2.5051037428104068e-05, "loss": 1.3128, "step": 37285 }, { "epoch": 0.5, "learning_rate": 2.5045775843795975e-05, "loss": 1.0509, "step": 37290 }, { "epoch": 0.5, "learning_rate": 2.5040514257460242e-05, "loss": 0.5436, "step": 37295 }, { "epoch": 0.5, "learning_rate": 2.5035252669329934e-05, "loss": 1.2501, "step": 37300 }, { "epoch": 0.5, "learning_rate": 2.50299910796381e-05, "loss": 0.4486, "step": 37305 }, { "epoch": 0.5, "learning_rate": 2.5024729488617814e-05, "loss": 0.9053, "step": 37310 }, { "epoch": 0.5, "learning_rate": 2.501946789650214e-05, "loss": 0.8061, "step": 37315 }, { "epoch": 0.5, "learning_rate": 2.5014206303524134e-05, "loss": 0.564, "step": 37320 }, { "epoch": 0.5, "learning_rate": 2.500894470991686e-05, "loss": 0.5257, "step": 37325 }, { "epoch": 0.5, "learning_rate": 2.500368311591338e-05, "loss": 0.8179, "step": 37330 }, { "epoch": 0.5, "learning_rate": 2.499842152174675e-05, "loss": 0.82, "step": 37335 }, { "epoch": 0.5, "learning_rate": 2.499315992765004e-05, "loss": 0.9337, "step": 37340 }, { "epoch": 0.5, "learning_rate": 2.4987898333856315e-05, "loss": 0.2594, "step": 37345 }, { "epoch": 0.5, "learning_rate": 2.498263674059864e-05, "loss": 0.3818, "step": 37350 }, { "epoch": 0.5, "learning_rate": 2.4977375148110064e-05, "loss": 0.5352, "step": 37355 }, { "epoch": 0.5, "learning_rate": 2.4972113556623652e-05, "loss": 1.0266, "step": 37360 }, { "epoch": 0.5, "learning_rate": 2.4966851966372475e-05, "loss": 0.6726, "step": 37365 }, { "epoch": 0.5, "learning_rate": 2.4961590377589586e-05, "loss": 0.6192, "step": 37370 }, { "epoch": 0.5, "learning_rate": 2.495632879050805e-05, "loss": 0.4963, "step": 37375 }, { "epoch": 0.5, "learning_rate": 2.495106720536094e-05, "loss": 1.3332, "step": 37380 }, { "epoch": 0.5, "learning_rate": 2.49458056223813e-05, "loss": 0.2106, "step": 37385 }, { "epoch": 0.5, "learning_rate": 2.49405440418022e-05, "loss": 0.6772, "step": 37390 }, { "epoch": 0.5, "learning_rate": 2.4935282463856708e-05, "loss": 0.746, "step": 37395 }, { "epoch": 0.5, "learning_rate": 2.493002088877787e-05, "loss": 0.5256, "step": 37400 }, { "epoch": 0.5, "learning_rate": 2.4924759316798755e-05, "loss": 0.8574, "step": 37405 }, { "epoch": 0.5, "learning_rate": 2.491949774815244e-05, "loss": 1.2086, "step": 37410 }, { "epoch": 0.5, "learning_rate": 2.4914236183071956e-05, "loss": 0.8749, "step": 37415 }, { "epoch": 0.5, "learning_rate": 2.4908974621790387e-05, "loss": 1.4146, "step": 37420 }, { "epoch": 0.5, "learning_rate": 2.4903713064540796e-05, "loss": 0.8176, "step": 37425 }, { "epoch": 0.5, "learning_rate": 2.4898451511556223e-05, "loss": 0.555, "step": 37430 }, { "epoch": 0.5, "learning_rate": 2.4893189963069736e-05, "loss": 0.7988, "step": 37435 }, { "epoch": 0.5, "learning_rate": 2.4887928419314407e-05, "loss": 0.5325, "step": 37440 }, { "epoch": 0.5, "learning_rate": 2.488266688052329e-05, "loss": 1.1411, "step": 37445 }, { "epoch": 0.5, "learning_rate": 2.487740534692944e-05, "loss": 0.4176, "step": 37450 }, { "epoch": 0.5, "learning_rate": 2.4872143818765916e-05, "loss": 0.9254, "step": 37455 }, { "epoch": 0.5, "learning_rate": 2.4866882296265794e-05, "loss": 0.4366, "step": 37460 }, { "epoch": 0.5, "learning_rate": 2.486162077966211e-05, "loss": 0.9037, "step": 37465 }, { "epoch": 0.5, "learning_rate": 2.485635926918793e-05, "loss": 0.5071, "step": 37470 }, { "epoch": 0.5, "learning_rate": 2.4851097765076325e-05, "loss": 1.112, "step": 37475 }, { "epoch": 0.5, "learning_rate": 2.4845836267560337e-05, "loss": 1.0544, "step": 37480 }, { "epoch": 0.5, "learning_rate": 2.484057477687303e-05, "loss": 0.3204, "step": 37485 }, { "epoch": 0.5, "learning_rate": 2.4835313293247477e-05, "loss": 0.4959, "step": 37490 }, { "epoch": 0.5, "learning_rate": 2.483005181691671e-05, "loss": 1.0898, "step": 37495 }, { "epoch": 0.5, "learning_rate": 2.4824790348113793e-05, "loss": 0.6285, "step": 37500 }, { "epoch": 0.5, "learning_rate": 2.4819528887071797e-05, "loss": 0.2287, "step": 37505 }, { "epoch": 0.5, "learning_rate": 2.4814267434023762e-05, "loss": 0.4968, "step": 37510 }, { "epoch": 0.5, "learning_rate": 2.4809005989202748e-05, "loss": 1.4394, "step": 37515 }, { "epoch": 0.5, "learning_rate": 2.480374455284182e-05, "loss": 0.509, "step": 37520 }, { "epoch": 0.5, "learning_rate": 2.479848312517402e-05, "loss": 0.2179, "step": 37525 }, { "epoch": 0.5, "learning_rate": 2.4793221706432413e-05, "loss": 0.5496, "step": 37530 }, { "epoch": 0.5, "learning_rate": 2.4787960296850056e-05, "loss": 0.6418, "step": 37535 }, { "epoch": 0.5, "learning_rate": 2.4782698896659988e-05, "loss": 0.3724, "step": 37540 }, { "epoch": 0.5, "learning_rate": 2.4777437506095273e-05, "loss": 0.2209, "step": 37545 }, { "epoch": 0.5, "learning_rate": 2.477217612538896e-05, "loss": 0.7603, "step": 37550 }, { "epoch": 0.5, "learning_rate": 2.476691475477412e-05, "loss": 0.7523, "step": 37555 }, { "epoch": 0.5, "learning_rate": 2.4761653394483774e-05, "loss": 0.5997, "step": 37560 }, { "epoch": 0.5, "learning_rate": 2.4756392044750994e-05, "loss": 0.6036, "step": 37565 }, { "epoch": 0.5, "learning_rate": 2.4751130705808838e-05, "loss": 0.9249, "step": 37570 }, { "epoch": 0.5, "learning_rate": 2.4745869377890337e-05, "loss": 0.9749, "step": 37575 }, { "epoch": 0.5, "learning_rate": 2.4740608061228553e-05, "loss": 1.2645, "step": 37580 }, { "epoch": 0.5, "learning_rate": 2.4735346756056536e-05, "loss": 1.1356, "step": 37585 }, { "epoch": 0.5, "learning_rate": 2.4730085462607327e-05, "loss": 0.5473, "step": 37590 }, { "epoch": 0.5, "learning_rate": 2.4724824181113984e-05, "loss": 0.6941, "step": 37595 }, { "epoch": 0.5, "learning_rate": 2.4719562911809564e-05, "loss": 0.856, "step": 37600 }, { "epoch": 0.5, "learning_rate": 2.4714301654927095e-05, "loss": 0.6797, "step": 37605 }, { "epoch": 0.5, "learning_rate": 2.470904041069963e-05, "loss": 0.3386, "step": 37610 }, { "epoch": 0.5, "learning_rate": 2.4703779179360224e-05, "loss": 0.5892, "step": 37615 }, { "epoch": 0.5, "learning_rate": 2.4698517961141916e-05, "loss": 0.7645, "step": 37620 }, { "epoch": 0.5, "learning_rate": 2.4693256756277754e-05, "loss": 1.1059, "step": 37625 }, { "epoch": 0.5, "learning_rate": 2.468799556500079e-05, "loss": 0.6099, "step": 37630 }, { "epoch": 0.5, "learning_rate": 2.468273438754405e-05, "loss": 0.9904, "step": 37635 }, { "epoch": 0.5, "learning_rate": 2.4677473224140593e-05, "loss": 1.2925, "step": 37640 }, { "epoch": 0.5, "learning_rate": 2.467221207502347e-05, "loss": 1.2725, "step": 37645 }, { "epoch": 0.5, "learning_rate": 2.46669509404257e-05, "loss": 0.218, "step": 37650 }, { "epoch": 0.5, "learning_rate": 2.466168982058034e-05, "loss": 0.653, "step": 37655 }, { "epoch": 0.5, "learning_rate": 2.465642871572043e-05, "loss": 0.3429, "step": 37660 }, { "epoch": 0.5, "learning_rate": 2.4651167626079007e-05, "loss": 0.5374, "step": 37665 }, { "epoch": 0.5, "learning_rate": 2.464590655188911e-05, "loss": 0.6538, "step": 37670 }, { "epoch": 0.5, "learning_rate": 2.4640645493383785e-05, "loss": 1.0777, "step": 37675 }, { "epoch": 0.5, "learning_rate": 2.4635384450796075e-05, "loss": 0.4285, "step": 37680 }, { "epoch": 0.5, "learning_rate": 2.4630123424359e-05, "loss": 0.9556, "step": 37685 }, { "epoch": 0.5, "learning_rate": 2.4624862414305605e-05, "loss": 0.3573, "step": 37690 }, { "epoch": 0.51, "learning_rate": 2.4619601420868937e-05, "loss": 0.8813, "step": 37695 }, { "epoch": 0.51, "learning_rate": 2.4614340444282013e-05, "loss": 0.7945, "step": 37700 }, { "epoch": 0.51, "learning_rate": 2.4609079484777885e-05, "loss": 0.6729, "step": 37705 }, { "epoch": 0.51, "learning_rate": 2.4603818542589586e-05, "loss": 0.4104, "step": 37710 }, { "epoch": 0.51, "learning_rate": 2.459855761795013e-05, "loss": 0.2179, "step": 37715 }, { "epoch": 0.51, "learning_rate": 2.459329671109256e-05, "loss": 0.9847, "step": 37720 }, { "epoch": 0.51, "learning_rate": 2.458803582224993e-05, "loss": 0.6144, "step": 37725 }, { "epoch": 0.51, "learning_rate": 2.458277495165524e-05, "loss": 0.5593, "step": 37730 }, { "epoch": 0.51, "learning_rate": 2.457751409954153e-05, "loss": 0.8575, "step": 37735 }, { "epoch": 0.51, "learning_rate": 2.4572253266141838e-05, "loss": 0.8651, "step": 37740 }, { "epoch": 0.51, "learning_rate": 2.4566992451689184e-05, "loss": 0.4214, "step": 37745 }, { "epoch": 0.51, "learning_rate": 2.4561731656416596e-05, "loss": 0.3229, "step": 37750 }, { "epoch": 0.51, "learning_rate": 2.4556470880557114e-05, "loss": 1.2583, "step": 37755 }, { "epoch": 0.51, "learning_rate": 2.4551210124343742e-05, "loss": 1.2089, "step": 37760 }, { "epoch": 0.51, "learning_rate": 2.454594938800952e-05, "loss": 0.7758, "step": 37765 }, { "epoch": 0.51, "learning_rate": 2.454068867178747e-05, "loss": 0.7959, "step": 37770 }, { "epoch": 0.51, "learning_rate": 2.4535427975910605e-05, "loss": 0.6021, "step": 37775 }, { "epoch": 0.51, "learning_rate": 2.453016730061196e-05, "loss": 0.6233, "step": 37780 }, { "epoch": 0.51, "learning_rate": 2.4524906646124555e-05, "loss": 0.9891, "step": 37785 }, { "epoch": 0.51, "learning_rate": 2.451964601268142e-05, "loss": 1.4271, "step": 37790 }, { "epoch": 0.51, "learning_rate": 2.451438540051555e-05, "loss": 0.9364, "step": 37795 }, { "epoch": 0.51, "learning_rate": 2.4509124809859976e-05, "loss": 0.5818, "step": 37800 }, { "epoch": 0.51, "learning_rate": 2.4503864240947723e-05, "loss": 0.3979, "step": 37805 }, { "epoch": 0.51, "learning_rate": 2.44986036940118e-05, "loss": 1.3187, "step": 37810 }, { "epoch": 0.51, "learning_rate": 2.4493343169285222e-05, "loss": 0.2968, "step": 37815 }, { "epoch": 0.51, "learning_rate": 2.448808266700102e-05, "loss": 0.3662, "step": 37820 }, { "epoch": 0.51, "learning_rate": 2.4482822187392184e-05, "loss": 0.269, "step": 37825 }, { "epoch": 0.51, "learning_rate": 2.447756173069173e-05, "loss": 0.7704, "step": 37830 }, { "epoch": 0.51, "learning_rate": 2.4472301297132696e-05, "loss": 0.8247, "step": 37835 }, { "epoch": 0.51, "learning_rate": 2.4467040886948064e-05, "loss": 0.8756, "step": 37840 }, { "epoch": 0.51, "learning_rate": 2.446178050037085e-05, "loss": 1.2698, "step": 37845 }, { "epoch": 0.51, "learning_rate": 2.445652013763408e-05, "loss": 1.0313, "step": 37850 }, { "epoch": 0.51, "learning_rate": 2.4451259798970738e-05, "loss": 0.3654, "step": 37855 }, { "epoch": 0.51, "learning_rate": 2.4445999484613844e-05, "loss": 0.4023, "step": 37860 }, { "epoch": 0.51, "learning_rate": 2.444073919479641e-05, "loss": 0.4325, "step": 37865 }, { "epoch": 0.51, "learning_rate": 2.443547892975142e-05, "loss": 0.433, "step": 37870 }, { "epoch": 0.51, "learning_rate": 2.4430218689711893e-05, "loss": 0.4698, "step": 37875 }, { "epoch": 0.51, "learning_rate": 2.442495847491083e-05, "loss": 0.4228, "step": 37880 }, { "epoch": 0.51, "learning_rate": 2.4419698285581228e-05, "loss": 0.6602, "step": 37885 }, { "epoch": 0.51, "learning_rate": 2.4414438121956083e-05, "loss": 0.3982, "step": 37890 }, { "epoch": 0.51, "learning_rate": 2.4409177984268406e-05, "loss": 0.5178, "step": 37895 }, { "epoch": 0.51, "learning_rate": 2.4403917872751194e-05, "loss": 0.9369, "step": 37900 }, { "epoch": 0.51, "learning_rate": 2.439865778763743e-05, "loss": 0.3927, "step": 37905 }, { "epoch": 0.51, "learning_rate": 2.439339772916012e-05, "loss": 0.771, "step": 37910 }, { "epoch": 0.51, "learning_rate": 2.4388137697552258e-05, "loss": 0.711, "step": 37915 }, { "epoch": 0.51, "learning_rate": 2.438287769304683e-05, "loss": 0.7596, "step": 37920 }, { "epoch": 0.51, "learning_rate": 2.4377617715876833e-05, "loss": 0.7272, "step": 37925 }, { "epoch": 0.51, "learning_rate": 2.4372357766275267e-05, "loss": 1.1963, "step": 37930 }, { "epoch": 0.51, "learning_rate": 2.43670978444751e-05, "loss": 0.5492, "step": 37935 }, { "epoch": 0.51, "learning_rate": 2.4361837950709332e-05, "loss": 0.8511, "step": 37940 }, { "epoch": 0.51, "learning_rate": 2.4356578085210962e-05, "loss": 0.6573, "step": 37945 }, { "epoch": 0.51, "learning_rate": 2.4351318248212957e-05, "loss": 0.2249, "step": 37950 }, { "epoch": 0.51, "learning_rate": 2.4346058439948305e-05, "loss": 0.4561, "step": 37955 }, { "epoch": 0.51, "learning_rate": 2.434079866065e-05, "loss": 0.6506, "step": 37960 }, { "epoch": 0.51, "learning_rate": 2.4335538910551008e-05, "loss": 0.1786, "step": 37965 }, { "epoch": 0.51, "learning_rate": 2.4330279189884318e-05, "loss": 1.1554, "step": 37970 }, { "epoch": 0.51, "learning_rate": 2.4325019498882925e-05, "loss": 0.222, "step": 37975 }, { "epoch": 0.51, "learning_rate": 2.4319759837779778e-05, "loss": 0.8565, "step": 37980 }, { "epoch": 0.51, "learning_rate": 2.4314500206807867e-05, "loss": 0.7181, "step": 37985 }, { "epoch": 0.51, "learning_rate": 2.4309240606200173e-05, "loss": 0.5513, "step": 37990 }, { "epoch": 0.51, "learning_rate": 2.4303981036189657e-05, "loss": 0.4183, "step": 37995 }, { "epoch": 0.51, "learning_rate": 2.4298721497009303e-05, "loss": 0.5932, "step": 38000 }, { "epoch": 0.51, "learning_rate": 2.4293461988892074e-05, "loss": 1.0238, "step": 38005 }, { "epoch": 0.51, "learning_rate": 2.4288202512070957e-05, "loss": 0.3933, "step": 38010 }, { "epoch": 0.51, "learning_rate": 2.4282943066778897e-05, "loss": 1.0421, "step": 38015 }, { "epoch": 0.51, "learning_rate": 2.427768365324887e-05, "loss": 0.51, "step": 38020 }, { "epoch": 0.51, "learning_rate": 2.4272424271713852e-05, "loss": 0.5596, "step": 38025 }, { "epoch": 0.51, "learning_rate": 2.4267164922406793e-05, "loss": 0.6023, "step": 38030 }, { "epoch": 0.51, "learning_rate": 2.426190560556066e-05, "loss": 1.4555, "step": 38035 }, { "epoch": 0.51, "learning_rate": 2.4256646321408427e-05, "loss": 0.7674, "step": 38040 }, { "epoch": 0.51, "learning_rate": 2.425138707018303e-05, "loss": 0.5437, "step": 38045 }, { "epoch": 0.51, "learning_rate": 2.424612785211744e-05, "loss": 0.552, "step": 38050 }, { "epoch": 0.51, "learning_rate": 2.424086866744463e-05, "loss": 0.3452, "step": 38055 }, { "epoch": 0.51, "learning_rate": 2.423560951639753e-05, "loss": 0.5829, "step": 38060 }, { "epoch": 0.51, "learning_rate": 2.4230350399209102e-05, "loss": 0.659, "step": 38065 }, { "epoch": 0.51, "learning_rate": 2.4225091316112304e-05, "loss": 0.8471, "step": 38070 }, { "epoch": 0.51, "learning_rate": 2.4219832267340084e-05, "loss": 0.9057, "step": 38075 }, { "epoch": 0.51, "learning_rate": 2.4214573253125388e-05, "loss": 0.5773, "step": 38080 }, { "epoch": 0.51, "learning_rate": 2.420931427370118e-05, "loss": 0.9841, "step": 38085 }, { "epoch": 0.51, "learning_rate": 2.4204055329300383e-05, "loss": 0.7691, "step": 38090 }, { "epoch": 0.51, "learning_rate": 2.419879642015595e-05, "loss": 1.6291, "step": 38095 }, { "epoch": 0.51, "learning_rate": 2.4193537546500835e-05, "loss": 1.065, "step": 38100 }, { "epoch": 0.51, "learning_rate": 2.418827870856797e-05, "loss": 0.6637, "step": 38105 }, { "epoch": 0.51, "learning_rate": 2.4183019906590294e-05, "loss": 1.2468, "step": 38110 }, { "epoch": 0.51, "learning_rate": 2.4177761140800746e-05, "loss": 1.3584, "step": 38115 }, { "epoch": 0.51, "learning_rate": 2.4172502411432283e-05, "loss": 0.8139, "step": 38120 }, { "epoch": 0.51, "learning_rate": 2.416724371871781e-05, "loss": 0.6682, "step": 38125 }, { "epoch": 0.51, "learning_rate": 2.416198506289027e-05, "loss": 0.6547, "step": 38130 }, { "epoch": 0.51, "learning_rate": 2.415672644418261e-05, "loss": 0.1514, "step": 38135 }, { "epoch": 0.51, "learning_rate": 2.4151467862827744e-05, "loss": 1.1166, "step": 38140 }, { "epoch": 0.51, "learning_rate": 2.4146209319058603e-05, "loss": 0.8159, "step": 38145 }, { "epoch": 0.51, "learning_rate": 2.414095081310813e-05, "loss": 1.0514, "step": 38150 }, { "epoch": 0.51, "learning_rate": 2.413569234520922e-05, "loss": 1.3945, "step": 38155 }, { "epoch": 0.51, "learning_rate": 2.4130433915594825e-05, "loss": 1.2118, "step": 38160 }, { "epoch": 0.51, "learning_rate": 2.4125175524497867e-05, "loss": 0.9443, "step": 38165 }, { "epoch": 0.51, "learning_rate": 2.4119917172151243e-05, "loss": 0.9561, "step": 38170 }, { "epoch": 0.51, "learning_rate": 2.411465885878789e-05, "loss": 0.8431, "step": 38175 }, { "epoch": 0.51, "learning_rate": 2.4109400584640724e-05, "loss": 0.6373, "step": 38180 }, { "epoch": 0.51, "learning_rate": 2.410414234994265e-05, "loss": 0.3351, "step": 38185 }, { "epoch": 0.51, "learning_rate": 2.409888415492659e-05, "loss": 1.1625, "step": 38190 }, { "epoch": 0.51, "learning_rate": 2.4093625999825457e-05, "loss": 0.6324, "step": 38195 }, { "epoch": 0.51, "learning_rate": 2.4088367884872156e-05, "loss": 0.7076, "step": 38200 }, { "epoch": 0.51, "learning_rate": 2.4083109810299593e-05, "loss": 0.7242, "step": 38205 }, { "epoch": 0.51, "learning_rate": 2.4077851776340683e-05, "loss": 0.6831, "step": 38210 }, { "epoch": 0.51, "learning_rate": 2.4072593783228325e-05, "loss": 0.7249, "step": 38215 }, { "epoch": 0.51, "learning_rate": 2.406733583119542e-05, "loss": 1.539, "step": 38220 }, { "epoch": 0.51, "learning_rate": 2.406207792047487e-05, "loss": 0.4346, "step": 38225 }, { "epoch": 0.51, "learning_rate": 2.405682005129959e-05, "loss": 1.7841, "step": 38230 }, { "epoch": 0.51, "learning_rate": 2.4051562223902448e-05, "loss": 1.1738, "step": 38235 }, { "epoch": 0.51, "learning_rate": 2.4046304438516358e-05, "loss": 0.8718, "step": 38240 }, { "epoch": 0.51, "learning_rate": 2.4041046695374217e-05, "loss": 0.3524, "step": 38245 }, { "epoch": 0.51, "learning_rate": 2.40357889947089e-05, "loss": 0.8079, "step": 38250 }, { "epoch": 0.51, "learning_rate": 2.4030531336753308e-05, "loss": 0.4427, "step": 38255 }, { "epoch": 0.51, "learning_rate": 2.4025273721740336e-05, "loss": 0.2539, "step": 38260 }, { "epoch": 0.51, "learning_rate": 2.4020016149902854e-05, "loss": 0.7998, "step": 38265 }, { "epoch": 0.51, "learning_rate": 2.4014758621473753e-05, "loss": 0.8662, "step": 38270 }, { "epoch": 0.51, "learning_rate": 2.400950113668593e-05, "loss": 0.5434, "step": 38275 }, { "epoch": 0.51, "learning_rate": 2.4004243695772237e-05, "loss": 0.4813, "step": 38280 }, { "epoch": 0.51, "learning_rate": 2.399898629896557e-05, "loss": 0.4916, "step": 38285 }, { "epoch": 0.51, "learning_rate": 2.3993728946498807e-05, "loss": 1.6411, "step": 38290 }, { "epoch": 0.51, "learning_rate": 2.398847163860481e-05, "loss": 0.6163, "step": 38295 }, { "epoch": 0.51, "learning_rate": 2.398321437551646e-05, "loss": 0.3575, "step": 38300 }, { "epoch": 0.51, "learning_rate": 2.3977957157466636e-05, "loss": 0.4277, "step": 38305 }, { "epoch": 0.51, "learning_rate": 2.3972699984688187e-05, "loss": 0.696, "step": 38310 }, { "epoch": 0.51, "learning_rate": 2.3967442857413992e-05, "loss": 0.3126, "step": 38315 }, { "epoch": 0.51, "learning_rate": 2.3962185775876913e-05, "loss": 0.5208, "step": 38320 }, { "epoch": 0.51, "learning_rate": 2.395692874030981e-05, "loss": 1.4788, "step": 38325 }, { "epoch": 0.51, "learning_rate": 2.3951671750945544e-05, "loss": 0.9846, "step": 38330 }, { "epoch": 0.51, "learning_rate": 2.3946414808016983e-05, "loss": 1.2002, "step": 38335 }, { "epoch": 0.51, "learning_rate": 2.394115791175697e-05, "loss": 0.2322, "step": 38340 }, { "epoch": 0.51, "learning_rate": 2.393590106239836e-05, "loss": 0.6539, "step": 38345 }, { "epoch": 0.51, "learning_rate": 2.393064426017401e-05, "loss": 0.4884, "step": 38350 }, { "epoch": 0.51, "learning_rate": 2.392538750531678e-05, "loss": 0.4404, "step": 38355 }, { "epoch": 0.51, "learning_rate": 2.3920130798059495e-05, "loss": 0.6928, "step": 38360 }, { "epoch": 0.51, "learning_rate": 2.3914874138635017e-05, "loss": 1.0976, "step": 38365 }, { "epoch": 0.51, "learning_rate": 2.390961752727619e-05, "loss": 0.6931, "step": 38370 }, { "epoch": 0.51, "learning_rate": 2.3904360964215847e-05, "loss": 1.1595, "step": 38375 }, { "epoch": 0.51, "learning_rate": 2.389910444968683e-05, "loss": 1.1554, "step": 38380 }, { "epoch": 0.51, "learning_rate": 2.389384798392199e-05, "loss": 0.5338, "step": 38385 }, { "epoch": 0.51, "learning_rate": 2.388859156715414e-05, "loss": 1.3922, "step": 38390 }, { "epoch": 0.51, "learning_rate": 2.3883335199616126e-05, "loss": 0.2615, "step": 38395 }, { "epoch": 0.51, "learning_rate": 2.387807888154078e-05, "loss": 1.1222, "step": 38400 }, { "epoch": 0.51, "learning_rate": 2.387282261316092e-05, "loss": 0.2788, "step": 38405 }, { "epoch": 0.51, "learning_rate": 2.386756639470938e-05, "loss": 0.7547, "step": 38410 }, { "epoch": 0.51, "learning_rate": 2.3862310226418992e-05, "loss": 0.4903, "step": 38415 }, { "epoch": 0.51, "learning_rate": 2.3857054108522562e-05, "loss": 0.7678, "step": 38420 }, { "epoch": 0.51, "learning_rate": 2.3851798041252916e-05, "loss": 0.7026, "step": 38425 }, { "epoch": 0.51, "learning_rate": 2.3846542024842878e-05, "loss": 0.2344, "step": 38430 }, { "epoch": 0.51, "learning_rate": 2.384128605952525e-05, "loss": 0.4998, "step": 38435 }, { "epoch": 0.52, "learning_rate": 2.3836030145532853e-05, "loss": 0.7238, "step": 38440 }, { "epoch": 0.52, "learning_rate": 2.383077428309851e-05, "loss": 0.6133, "step": 38445 }, { "epoch": 0.52, "learning_rate": 2.3825518472455005e-05, "loss": 0.6155, "step": 38450 }, { "epoch": 0.52, "learning_rate": 2.3820262713835155e-05, "loss": 0.5564, "step": 38455 }, { "epoch": 0.52, "learning_rate": 2.3815007007471763e-05, "loss": 0.3559, "step": 38460 }, { "epoch": 0.52, "learning_rate": 2.3809751353597644e-05, "loss": 0.3453, "step": 38465 }, { "epoch": 0.52, "learning_rate": 2.380449575244558e-05, "loss": 0.9931, "step": 38470 }, { "epoch": 0.52, "learning_rate": 2.379924020424837e-05, "loss": 0.7, "step": 38475 }, { "epoch": 0.52, "learning_rate": 2.3793984709238816e-05, "loss": 0.854, "step": 38480 }, { "epoch": 0.52, "learning_rate": 2.37887292676497e-05, "loss": 0.5152, "step": 38485 }, { "epoch": 0.52, "learning_rate": 2.378347387971382e-05, "loss": 0.5724, "step": 38490 }, { "epoch": 0.52, "learning_rate": 2.3778218545663972e-05, "loss": 0.2359, "step": 38495 }, { "epoch": 0.52, "learning_rate": 2.3772963265732917e-05, "loss": 0.1013, "step": 38500 }, { "epoch": 0.52, "learning_rate": 2.3767708040153453e-05, "loss": 0.9424, "step": 38505 }, { "epoch": 0.52, "learning_rate": 2.3762452869158363e-05, "loss": 0.3542, "step": 38510 }, { "epoch": 0.52, "learning_rate": 2.3757197752980413e-05, "loss": 0.3745, "step": 38515 }, { "epoch": 0.52, "learning_rate": 2.3751942691852385e-05, "loss": 0.9158, "step": 38520 }, { "epoch": 0.52, "learning_rate": 2.3746687686007063e-05, "loss": 0.4726, "step": 38525 }, { "epoch": 0.52, "learning_rate": 2.3741432735677195e-05, "loss": 0.1777, "step": 38530 }, { "epoch": 0.52, "learning_rate": 2.3736177841095563e-05, "loss": 0.3113, "step": 38535 }, { "epoch": 0.52, "learning_rate": 2.3730923002494935e-05, "loss": 0.4562, "step": 38540 }, { "epoch": 0.52, "learning_rate": 2.3725668220108062e-05, "loss": 0.4882, "step": 38545 }, { "epoch": 0.52, "learning_rate": 2.3720413494167708e-05, "loss": 0.6757, "step": 38550 }, { "epoch": 0.52, "learning_rate": 2.371515882490665e-05, "loss": 0.9579, "step": 38555 }, { "epoch": 0.52, "learning_rate": 2.3709904212557618e-05, "loss": 0.2685, "step": 38560 }, { "epoch": 0.52, "learning_rate": 2.3704649657353374e-05, "loss": 0.8056, "step": 38565 }, { "epoch": 0.52, "learning_rate": 2.3699395159526663e-05, "loss": 0.8258, "step": 38570 }, { "epoch": 0.52, "learning_rate": 2.3694140719310255e-05, "loss": 0.104, "step": 38575 }, { "epoch": 0.52, "learning_rate": 2.3688886336936873e-05, "loss": 0.7142, "step": 38580 }, { "epoch": 0.52, "learning_rate": 2.3683632012639265e-05, "loss": 0.6946, "step": 38585 }, { "epoch": 0.52, "learning_rate": 2.367837774665018e-05, "loss": 0.3504, "step": 38590 }, { "epoch": 0.52, "learning_rate": 2.367312353920234e-05, "loss": 0.9015, "step": 38595 }, { "epoch": 0.52, "learning_rate": 2.3667869390528494e-05, "loss": 1.0516, "step": 38600 }, { "epoch": 0.52, "learning_rate": 2.366261530086138e-05, "loss": 0.9847, "step": 38605 }, { "epoch": 0.52, "learning_rate": 2.3657361270433705e-05, "loss": 0.5348, "step": 38610 }, { "epoch": 0.52, "learning_rate": 2.3652107299478205e-05, "loss": 1.2234, "step": 38615 }, { "epoch": 0.52, "learning_rate": 2.3646853388227618e-05, "loss": 1.1324, "step": 38620 }, { "epoch": 0.52, "learning_rate": 2.364159953691465e-05, "loss": 0.6406, "step": 38625 }, { "epoch": 0.52, "learning_rate": 2.3636345745772028e-05, "loss": 0.9789, "step": 38630 }, { "epoch": 0.52, "learning_rate": 2.3631092015032473e-05, "loss": 0.5293, "step": 38635 }, { "epoch": 0.52, "learning_rate": 2.362583834492869e-05, "loss": 0.3614, "step": 38640 }, { "epoch": 0.52, "learning_rate": 2.362058473569339e-05, "loss": 0.5108, "step": 38645 }, { "epoch": 0.52, "learning_rate": 2.361533118755929e-05, "loss": 0.6401, "step": 38650 }, { "epoch": 0.52, "learning_rate": 2.3610077700759085e-05, "loss": 0.7737, "step": 38655 }, { "epoch": 0.52, "learning_rate": 2.3604824275525486e-05, "loss": 0.6432, "step": 38660 }, { "epoch": 0.52, "learning_rate": 2.35995709120912e-05, "loss": 0.5402, "step": 38665 }, { "epoch": 0.52, "learning_rate": 2.359431761068891e-05, "loss": 0.8475, "step": 38670 }, { "epoch": 0.52, "learning_rate": 2.358906437155131e-05, "loss": 0.5995, "step": 38675 }, { "epoch": 0.52, "learning_rate": 2.3583811194911103e-05, "loss": 0.7669, "step": 38680 }, { "epoch": 0.52, "learning_rate": 2.3578558081000988e-05, "loss": 0.874, "step": 38685 }, { "epoch": 0.52, "learning_rate": 2.3573305030053627e-05, "loss": 0.652, "step": 38690 }, { "epoch": 0.52, "learning_rate": 2.3568052042301717e-05, "loss": 0.5594, "step": 38695 }, { "epoch": 0.52, "learning_rate": 2.3562799117977942e-05, "loss": 0.8967, "step": 38700 }, { "epoch": 0.52, "learning_rate": 2.355754625731497e-05, "loss": 0.5131, "step": 38705 }, { "epoch": 0.52, "learning_rate": 2.3552293460545487e-05, "loss": 0.6533, "step": 38710 }, { "epoch": 0.52, "learning_rate": 2.3547040727902167e-05, "loss": 0.4662, "step": 38715 }, { "epoch": 0.52, "learning_rate": 2.3541788059617665e-05, "loss": 1.2458, "step": 38720 }, { "epoch": 0.52, "learning_rate": 2.3536535455924655e-05, "loss": 1.175, "step": 38725 }, { "epoch": 0.52, "learning_rate": 2.353128291705581e-05, "loss": 0.7933, "step": 38730 }, { "epoch": 0.52, "learning_rate": 2.3526030443243776e-05, "loss": 0.8087, "step": 38735 }, { "epoch": 0.52, "learning_rate": 2.3520778034721222e-05, "loss": 0.8038, "step": 38740 }, { "epoch": 0.52, "learning_rate": 2.351552569172081e-05, "loss": 0.7731, "step": 38745 }, { "epoch": 0.52, "learning_rate": 2.3510273414475173e-05, "loss": 0.811, "step": 38750 }, { "epoch": 0.52, "learning_rate": 2.350502120321697e-05, "loss": 0.8245, "step": 38755 }, { "epoch": 0.52, "learning_rate": 2.3499769058178854e-05, "loss": 0.4295, "step": 38760 }, { "epoch": 0.52, "learning_rate": 2.3494516979593462e-05, "loss": 0.3387, "step": 38765 }, { "epoch": 0.52, "learning_rate": 2.3489264967693435e-05, "loss": 0.3031, "step": 38770 }, { "epoch": 0.52, "learning_rate": 2.348401302271142e-05, "loss": 0.7128, "step": 38775 }, { "epoch": 0.52, "learning_rate": 2.3478761144880032e-05, "loss": 0.8443, "step": 38780 }, { "epoch": 0.52, "learning_rate": 2.347350933443191e-05, "loss": 0.9685, "step": 38785 }, { "epoch": 0.52, "learning_rate": 2.3468257591599695e-05, "loss": 0.4832, "step": 38790 }, { "epoch": 0.52, "learning_rate": 2.3463005916616015e-05, "loss": 0.1587, "step": 38795 }, { "epoch": 0.52, "learning_rate": 2.3457754309713476e-05, "loss": 0.8147, "step": 38800 }, { "epoch": 0.52, "learning_rate": 2.3452502771124702e-05, "loss": 0.9173, "step": 38805 }, { "epoch": 0.52, "learning_rate": 2.344725130108232e-05, "loss": 0.7473, "step": 38810 }, { "epoch": 0.52, "learning_rate": 2.344199989981893e-05, "loss": 0.4108, "step": 38815 }, { "epoch": 0.52, "learning_rate": 2.3436748567567152e-05, "loss": 0.5376, "step": 38820 }, { "epoch": 0.52, "learning_rate": 2.3431497304559603e-05, "loss": 1.0624, "step": 38825 }, { "epoch": 0.52, "learning_rate": 2.3426246111028867e-05, "loss": 1.1831, "step": 38830 }, { "epoch": 0.52, "learning_rate": 2.342099498720755e-05, "loss": 0.7619, "step": 38835 }, { "epoch": 0.52, "learning_rate": 2.3415743933328262e-05, "loss": 0.7584, "step": 38840 }, { "epoch": 0.52, "learning_rate": 2.3410492949623593e-05, "loss": 1.9373, "step": 38845 }, { "epoch": 0.52, "learning_rate": 2.340524203632613e-05, "loss": 0.6057, "step": 38850 }, { "epoch": 0.52, "learning_rate": 2.3399991193668474e-05, "loss": 0.4378, "step": 38855 }, { "epoch": 0.52, "learning_rate": 2.3394740421883195e-05, "loss": 0.6896, "step": 38860 }, { "epoch": 0.52, "learning_rate": 2.3389489721202883e-05, "loss": 0.7261, "step": 38865 }, { "epoch": 0.52, "learning_rate": 2.3384239091860126e-05, "loss": 0.9049, "step": 38870 }, { "epoch": 0.52, "learning_rate": 2.3378988534087492e-05, "loss": 1.2836, "step": 38875 }, { "epoch": 0.52, "learning_rate": 2.3373738048117553e-05, "loss": 0.6457, "step": 38880 }, { "epoch": 0.52, "learning_rate": 2.3368487634182895e-05, "loss": 1.104, "step": 38885 }, { "epoch": 0.52, "learning_rate": 2.3363237292516054e-05, "loss": 0.5388, "step": 38890 }, { "epoch": 0.52, "learning_rate": 2.335798702334962e-05, "loss": 0.7264, "step": 38895 }, { "epoch": 0.52, "learning_rate": 2.3352736826916155e-05, "loss": 0.4649, "step": 38900 }, { "epoch": 0.52, "learning_rate": 2.3347486703448196e-05, "loss": 0.4435, "step": 38905 }, { "epoch": 0.52, "learning_rate": 2.3342236653178314e-05, "loss": 0.8546, "step": 38910 }, { "epoch": 0.52, "learning_rate": 2.333698667633905e-05, "loss": 0.6094, "step": 38915 }, { "epoch": 0.52, "learning_rate": 2.3331736773162964e-05, "loss": 1.3266, "step": 38920 }, { "epoch": 0.52, "learning_rate": 2.3326486943882582e-05, "loss": 0.7208, "step": 38925 }, { "epoch": 0.52, "learning_rate": 2.3321237188730465e-05, "loss": 0.3943, "step": 38930 }, { "epoch": 0.52, "learning_rate": 2.3315987507939146e-05, "loss": 0.5379, "step": 38935 }, { "epoch": 0.52, "learning_rate": 2.3310737901741147e-05, "loss": 0.8378, "step": 38940 }, { "epoch": 0.52, "learning_rate": 2.3305488370369008e-05, "loss": 0.559, "step": 38945 }, { "epoch": 0.52, "learning_rate": 2.330023891405526e-05, "loss": 0.41, "step": 38950 }, { "epoch": 0.52, "learning_rate": 2.3294989533032423e-05, "loss": 0.4747, "step": 38955 }, { "epoch": 0.52, "learning_rate": 2.328974022753302e-05, "loss": 0.4278, "step": 38960 }, { "epoch": 0.52, "learning_rate": 2.3284490997789575e-05, "loss": 0.8696, "step": 38965 }, { "epoch": 0.52, "learning_rate": 2.3279241844034587e-05, "loss": 0.8173, "step": 38970 }, { "epoch": 0.52, "learning_rate": 2.327399276650058e-05, "loss": 0.741, "step": 38975 }, { "epoch": 0.52, "learning_rate": 2.3268743765420063e-05, "loss": 0.1779, "step": 38980 }, { "epoch": 0.52, "learning_rate": 2.3263494841025527e-05, "loss": 0.1854, "step": 38985 }, { "epoch": 0.52, "learning_rate": 2.3258245993549484e-05, "loss": 0.5166, "step": 38990 }, { "epoch": 0.52, "learning_rate": 2.325299722322444e-05, "loss": 0.8561, "step": 38995 }, { "epoch": 0.52, "learning_rate": 2.3247748530282865e-05, "loss": 0.5426, "step": 39000 }, { "epoch": 0.52, "learning_rate": 2.324249991495727e-05, "loss": 1.1173, "step": 39005 }, { "epoch": 0.52, "learning_rate": 2.3237251377480143e-05, "loss": 1.0467, "step": 39010 }, { "epoch": 0.52, "learning_rate": 2.3232002918083954e-05, "loss": 0.3956, "step": 39015 }, { "epoch": 0.52, "learning_rate": 2.322675453700119e-05, "loss": 0.9034, "step": 39020 }, { "epoch": 0.52, "learning_rate": 2.3221506234464325e-05, "loss": 0.8905, "step": 39025 }, { "epoch": 0.52, "learning_rate": 2.3216258010705848e-05, "loss": 0.7188, "step": 39030 }, { "epoch": 0.52, "learning_rate": 2.3211009865958204e-05, "loss": 0.5064, "step": 39035 }, { "epoch": 0.52, "learning_rate": 2.3205761800453878e-05, "loss": 0.7692, "step": 39040 }, { "epoch": 0.52, "learning_rate": 2.320051381442534e-05, "loss": 0.4401, "step": 39045 }, { "epoch": 0.52, "learning_rate": 2.3195265908105025e-05, "loss": 0.9518, "step": 39050 }, { "epoch": 0.52, "learning_rate": 2.31900180817254e-05, "loss": 0.406, "step": 39055 }, { "epoch": 0.52, "learning_rate": 2.3184770335518925e-05, "loss": 0.6314, "step": 39060 }, { "epoch": 0.52, "learning_rate": 2.317952266971804e-05, "loss": 0.3568, "step": 39065 }, { "epoch": 0.52, "learning_rate": 2.317427508455519e-05, "loss": 0.2852, "step": 39070 }, { "epoch": 0.52, "learning_rate": 2.3169027580262833e-05, "loss": 0.8881, "step": 39075 }, { "epoch": 0.52, "learning_rate": 2.3163780157073385e-05, "loss": 0.2617, "step": 39080 }, { "epoch": 0.52, "learning_rate": 2.3158532815219284e-05, "loss": 0.8681, "step": 39085 }, { "epoch": 0.52, "learning_rate": 2.3153285554932974e-05, "loss": 1.1024, "step": 39090 }, { "epoch": 0.52, "learning_rate": 2.3148038376446873e-05, "loss": 0.4819, "step": 39095 }, { "epoch": 0.52, "learning_rate": 2.3142791279993402e-05, "loss": 0.2659, "step": 39100 }, { "epoch": 0.52, "learning_rate": 2.3137544265804994e-05, "loss": 1.0152, "step": 39105 }, { "epoch": 0.52, "learning_rate": 2.3132297334114054e-05, "loss": 1.1714, "step": 39110 }, { "epoch": 0.52, "learning_rate": 2.3127050485152995e-05, "loss": 0.7283, "step": 39115 }, { "epoch": 0.52, "learning_rate": 2.3121803719154246e-05, "loss": 1.0149, "step": 39120 }, { "epoch": 0.52, "learning_rate": 2.311655703635018e-05, "loss": 0.514, "step": 39125 }, { "epoch": 0.52, "learning_rate": 2.3111310436973212e-05, "loss": 1.0799, "step": 39130 }, { "epoch": 0.52, "learning_rate": 2.3106063921255745e-05, "loss": 0.6161, "step": 39135 }, { "epoch": 0.52, "learning_rate": 2.3100817489430183e-05, "loss": 0.3909, "step": 39140 }, { "epoch": 0.52, "learning_rate": 2.309557114172889e-05, "loss": 0.4798, "step": 39145 }, { "epoch": 0.52, "learning_rate": 2.3090324878384273e-05, "loss": 0.8104, "step": 39150 }, { "epoch": 0.52, "learning_rate": 2.308507869962872e-05, "loss": 0.9164, "step": 39155 }, { "epoch": 0.52, "learning_rate": 2.307983260569459e-05, "loss": 1.1971, "step": 39160 }, { "epoch": 0.52, "learning_rate": 2.307458659681427e-05, "loss": 1.283, "step": 39165 }, { "epoch": 0.52, "learning_rate": 2.3069340673220135e-05, "loss": 0.9611, "step": 39170 }, { "epoch": 0.52, "learning_rate": 2.3064094835144544e-05, "loss": 0.7942, "step": 39175 }, { "epoch": 0.52, "learning_rate": 2.305884908281987e-05, "loss": 0.4939, "step": 39180 }, { "epoch": 0.53, "learning_rate": 2.3053603416478477e-05, "loss": 0.6254, "step": 39185 }, { "epoch": 0.53, "learning_rate": 2.304835783635271e-05, "loss": 0.3386, "step": 39190 }, { "epoch": 0.53, "learning_rate": 2.3043112342674923e-05, "loss": 0.6897, "step": 39195 }, { "epoch": 0.53, "learning_rate": 2.3037866935677475e-05, "loss": 1.0176, "step": 39200 }, { "epoch": 0.53, "learning_rate": 2.3032621615592698e-05, "loss": 0.7552, "step": 39205 }, { "epoch": 0.53, "learning_rate": 2.3027376382652945e-05, "loss": 1.1839, "step": 39210 }, { "epoch": 0.53, "learning_rate": 2.302213123709055e-05, "loss": 0.7974, "step": 39215 }, { "epoch": 0.53, "learning_rate": 2.3016886179137844e-05, "loss": 0.3218, "step": 39220 }, { "epoch": 0.53, "learning_rate": 2.301164120902716e-05, "loss": 0.7673, "step": 39225 }, { "epoch": 0.53, "learning_rate": 2.300639632699083e-05, "loss": 0.6215, "step": 39230 }, { "epoch": 0.53, "learning_rate": 2.300115153326116e-05, "loss": 0.5753, "step": 39235 }, { "epoch": 0.53, "learning_rate": 2.299590682807048e-05, "loss": 0.6883, "step": 39240 }, { "epoch": 0.53, "learning_rate": 2.29906622116511e-05, "loss": 0.7505, "step": 39245 }, { "epoch": 0.53, "learning_rate": 2.2985417684235337e-05, "loss": 0.7679, "step": 39250 }, { "epoch": 0.53, "learning_rate": 2.2980173246055485e-05, "loss": 1.1465, "step": 39255 }, { "epoch": 0.53, "learning_rate": 2.2974928897343854e-05, "loss": 0.7732, "step": 39260 }, { "epoch": 0.53, "learning_rate": 2.2969684638332754e-05, "loss": 0.6617, "step": 39265 }, { "epoch": 0.53, "learning_rate": 2.2964440469254453e-05, "loss": 0.7939, "step": 39270 }, { "epoch": 0.53, "learning_rate": 2.295919639034126e-05, "loss": 0.1926, "step": 39275 }, { "epoch": 0.53, "learning_rate": 2.2953952401825457e-05, "loss": 0.9925, "step": 39280 }, { "epoch": 0.53, "learning_rate": 2.2948708503939326e-05, "loss": 0.6818, "step": 39285 }, { "epoch": 0.53, "learning_rate": 2.2943464696915144e-05, "loss": 1.1997, "step": 39290 }, { "epoch": 0.53, "learning_rate": 2.29382209809852e-05, "loss": 0.8852, "step": 39295 }, { "epoch": 0.53, "learning_rate": 2.293297735638174e-05, "loss": 0.3427, "step": 39300 }, { "epoch": 0.53, "learning_rate": 2.2927733823337032e-05, "loss": 0.4789, "step": 39305 }, { "epoch": 0.53, "learning_rate": 2.292249038208337e-05, "loss": 0.4065, "step": 39310 }, { "epoch": 0.53, "learning_rate": 2.291724703285298e-05, "loss": 0.1847, "step": 39315 }, { "epoch": 0.53, "learning_rate": 2.2912003775878126e-05, "loss": 1.3539, "step": 39320 }, { "epoch": 0.53, "learning_rate": 2.290676061139106e-05, "loss": 0.7514, "step": 39325 }, { "epoch": 0.53, "learning_rate": 2.2901517539624027e-05, "loss": 0.9581, "step": 39330 }, { "epoch": 0.53, "learning_rate": 2.2896274560809268e-05, "loss": 0.953, "step": 39335 }, { "epoch": 0.53, "learning_rate": 2.289103167517903e-05, "loss": 1.1468, "step": 39340 }, { "epoch": 0.53, "learning_rate": 2.2885788882965526e-05, "loss": 1.6703, "step": 39345 }, { "epoch": 0.53, "learning_rate": 2.2880546184401e-05, "loss": 0.544, "step": 39350 }, { "epoch": 0.53, "learning_rate": 2.2875303579717673e-05, "loss": 0.7609, "step": 39355 }, { "epoch": 0.53, "learning_rate": 2.2870061069147775e-05, "loss": 0.8719, "step": 39360 }, { "epoch": 0.53, "learning_rate": 2.286481865292351e-05, "loss": 0.6179, "step": 39365 }, { "epoch": 0.53, "learning_rate": 2.2859576331277098e-05, "loss": 0.8628, "step": 39370 }, { "epoch": 0.53, "learning_rate": 2.2854334104440757e-05, "loss": 0.1989, "step": 39375 }, { "epoch": 0.53, "learning_rate": 2.2849091972646666e-05, "loss": 1.247, "step": 39380 }, { "epoch": 0.53, "learning_rate": 2.2843849936127044e-05, "loss": 0.2819, "step": 39385 }, { "epoch": 0.53, "learning_rate": 2.2838607995114087e-05, "loss": 0.3792, "step": 39390 }, { "epoch": 0.53, "learning_rate": 2.2833366149839973e-05, "loss": 1.2848, "step": 39395 }, { "epoch": 0.53, "learning_rate": 2.2828124400536905e-05, "loss": 0.7338, "step": 39400 }, { "epoch": 0.53, "learning_rate": 2.282288274743707e-05, "loss": 0.9719, "step": 39405 }, { "epoch": 0.53, "learning_rate": 2.2817641190772625e-05, "loss": 0.8611, "step": 39410 }, { "epoch": 0.53, "learning_rate": 2.2812399730775753e-05, "loss": 0.5335, "step": 39415 }, { "epoch": 0.53, "learning_rate": 2.2807158367678648e-05, "loss": 0.8522, "step": 39420 }, { "epoch": 0.53, "learning_rate": 2.2801917101713443e-05, "loss": 0.7237, "step": 39425 }, { "epoch": 0.53, "learning_rate": 2.2796675933112314e-05, "loss": 1.0174, "step": 39430 }, { "epoch": 0.53, "learning_rate": 2.2791434862107423e-05, "loss": 0.6814, "step": 39435 }, { "epoch": 0.53, "learning_rate": 2.2786193888930913e-05, "loss": 0.4004, "step": 39440 }, { "epoch": 0.53, "learning_rate": 2.278095301381494e-05, "loss": 0.4642, "step": 39445 }, { "epoch": 0.53, "learning_rate": 2.2775712236991656e-05, "loss": 0.7005, "step": 39450 }, { "epoch": 0.53, "learning_rate": 2.2770471558693183e-05, "loss": 1.3007, "step": 39455 }, { "epoch": 0.53, "learning_rate": 2.2765230979151668e-05, "loss": 0.9651, "step": 39460 }, { "epoch": 0.53, "learning_rate": 2.2759990498599234e-05, "loss": 0.2273, "step": 39465 }, { "epoch": 0.53, "learning_rate": 2.2754750117268026e-05, "loss": 0.5973, "step": 39470 }, { "epoch": 0.53, "learning_rate": 2.2749509835390145e-05, "loss": 1.0963, "step": 39475 }, { "epoch": 0.53, "learning_rate": 2.274426965319772e-05, "loss": 0.9251, "step": 39480 }, { "epoch": 0.53, "learning_rate": 2.273902957092288e-05, "loss": 0.8444, "step": 39485 }, { "epoch": 0.53, "learning_rate": 2.2733789588797703e-05, "loss": 0.6466, "step": 39490 }, { "epoch": 0.53, "learning_rate": 2.2728549707054314e-05, "loss": 0.3211, "step": 39495 }, { "epoch": 0.53, "learning_rate": 2.272330992592481e-05, "loss": 0.486, "step": 39500 }, { "epoch": 0.53, "learning_rate": 2.2718070245641286e-05, "loss": 0.7807, "step": 39505 }, { "epoch": 0.53, "learning_rate": 2.2712830666435832e-05, "loss": 1.2066, "step": 39510 }, { "epoch": 0.53, "learning_rate": 2.2707591188540543e-05, "loss": 0.6852, "step": 39515 }, { "epoch": 0.53, "learning_rate": 2.2702351812187483e-05, "loss": 1.0491, "step": 39520 }, { "epoch": 0.53, "learning_rate": 2.269711253760875e-05, "loss": 0.271, "step": 39525 }, { "epoch": 0.53, "learning_rate": 2.269187336503642e-05, "loss": 0.5583, "step": 39530 }, { "epoch": 0.53, "learning_rate": 2.2686634294702543e-05, "loss": 0.5099, "step": 39535 }, { "epoch": 0.53, "learning_rate": 2.2681395326839195e-05, "loss": 0.9831, "step": 39540 }, { "epoch": 0.53, "learning_rate": 2.2676156461678436e-05, "loss": 0.7835, "step": 39545 }, { "epoch": 0.53, "learning_rate": 2.2670917699452316e-05, "loss": 0.8053, "step": 39550 }, { "epoch": 0.53, "learning_rate": 2.266567904039289e-05, "loss": 0.3774, "step": 39555 }, { "epoch": 0.53, "learning_rate": 2.2660440484732216e-05, "loss": 1.3786, "step": 39560 }, { "epoch": 0.53, "learning_rate": 2.265520203270231e-05, "loss": 0.7054, "step": 39565 }, { "epoch": 0.53, "learning_rate": 2.2649963684535223e-05, "loss": 0.7743, "step": 39570 }, { "epoch": 0.53, "learning_rate": 2.2644725440463e-05, "loss": 0.902, "step": 39575 }, { "epoch": 0.53, "learning_rate": 2.2639487300717645e-05, "loss": 1.6931, "step": 39580 }, { "epoch": 0.53, "learning_rate": 2.2634249265531197e-05, "loss": 0.6086, "step": 39585 }, { "epoch": 0.53, "learning_rate": 2.262901133513567e-05, "loss": 1.4188, "step": 39590 }, { "epoch": 0.53, "learning_rate": 2.262377350976309e-05, "loss": 1.2299, "step": 39595 }, { "epoch": 0.53, "learning_rate": 2.2618535789645445e-05, "loss": 1.1117, "step": 39600 }, { "epoch": 0.53, "learning_rate": 2.261329817501475e-05, "loss": 0.3743, "step": 39605 }, { "epoch": 0.53, "learning_rate": 2.260806066610301e-05, "loss": 0.7092, "step": 39610 }, { "epoch": 0.53, "learning_rate": 2.2602823263142213e-05, "loss": 0.6547, "step": 39615 }, { "epoch": 0.53, "learning_rate": 2.259758596636435e-05, "loss": 0.5808, "step": 39620 }, { "epoch": 0.53, "learning_rate": 2.259234877600142e-05, "loss": 0.4995, "step": 39625 }, { "epoch": 0.53, "learning_rate": 2.258711169228538e-05, "loss": 1.3907, "step": 39630 }, { "epoch": 0.53, "learning_rate": 2.2581874715448226e-05, "loss": 1.8984, "step": 39635 }, { "epoch": 0.53, "learning_rate": 2.2576637845721938e-05, "loss": 0.6919, "step": 39640 }, { "epoch": 0.53, "learning_rate": 2.2571401083338455e-05, "loss": 0.9683, "step": 39645 }, { "epoch": 0.53, "learning_rate": 2.2566164428529756e-05, "loss": 0.2091, "step": 39650 }, { "epoch": 0.53, "learning_rate": 2.2560927881527798e-05, "loss": 0.0479, "step": 39655 }, { "epoch": 0.53, "learning_rate": 2.2555691442564534e-05, "loss": 0.9002, "step": 39660 }, { "epoch": 0.53, "learning_rate": 2.2550455111871908e-05, "loss": 0.6067, "step": 39665 }, { "epoch": 0.53, "learning_rate": 2.2545218889681874e-05, "loss": 0.6462, "step": 39670 }, { "epoch": 0.53, "learning_rate": 2.2539982776226355e-05, "loss": 0.8712, "step": 39675 }, { "epoch": 0.53, "learning_rate": 2.253474677173729e-05, "loss": 0.9311, "step": 39680 }, { "epoch": 0.53, "learning_rate": 2.2529510876446613e-05, "loss": 0.8338, "step": 39685 }, { "epoch": 0.53, "learning_rate": 2.2524275090586246e-05, "loss": 0.6485, "step": 39690 }, { "epoch": 0.53, "learning_rate": 2.25190394143881e-05, "loss": 0.7903, "step": 39695 }, { "epoch": 0.53, "learning_rate": 2.2514850952542244e-05, "loss": 0.5974, "step": 39700 }, { "epoch": 0.53, "learning_rate": 2.250961547432053e-05, "loss": 1.186, "step": 39705 }, { "epoch": 0.53, "learning_rate": 2.2504380106410394e-05, "loss": 1.0289, "step": 39710 }, { "epoch": 0.53, "learning_rate": 2.249914484904374e-05, "loss": 1.0075, "step": 39715 }, { "epoch": 0.53, "learning_rate": 2.249390970245245e-05, "loss": 0.7312, "step": 39720 }, { "epoch": 0.53, "learning_rate": 2.2488674666868422e-05, "loss": 1.3593, "step": 39725 }, { "epoch": 0.53, "learning_rate": 2.2483439742523555e-05, "loss": 1.1346, "step": 39730 }, { "epoch": 0.53, "learning_rate": 2.2478204929649707e-05, "loss": 0.5247, "step": 39735 }, { "epoch": 0.53, "learning_rate": 2.2472970228478763e-05, "loss": 0.7597, "step": 39740 }, { "epoch": 0.53, "learning_rate": 2.246773563924259e-05, "loss": 0.4985, "step": 39745 }, { "epoch": 0.53, "learning_rate": 2.2462501162173077e-05, "loss": 0.8121, "step": 39750 }, { "epoch": 0.53, "learning_rate": 2.2457266797502058e-05, "loss": 0.5718, "step": 39755 }, { "epoch": 0.53, "learning_rate": 2.2452032545461397e-05, "loss": 0.4992, "step": 39760 }, { "epoch": 0.53, "learning_rate": 2.2446798406282953e-05, "loss": 0.5492, "step": 39765 }, { "epoch": 0.53, "learning_rate": 2.2441564380198562e-05, "loss": 0.8892, "step": 39770 }, { "epoch": 0.53, "learning_rate": 2.2436330467440068e-05, "loss": 0.7089, "step": 39775 }, { "epoch": 0.53, "learning_rate": 2.243109666823932e-05, "loss": 0.6376, "step": 39780 }, { "epoch": 0.53, "learning_rate": 2.242586298282813e-05, "loss": 0.2166, "step": 39785 }, { "epoch": 0.53, "learning_rate": 2.2420629411438325e-05, "loss": 0.7294, "step": 39790 }, { "epoch": 0.53, "learning_rate": 2.2415395954301744e-05, "loss": 0.9705, "step": 39795 }, { "epoch": 0.53, "learning_rate": 2.2410162611650186e-05, "loss": 0.3651, "step": 39800 }, { "epoch": 0.53, "learning_rate": 2.2404929383715465e-05, "loss": 1.3771, "step": 39805 }, { "epoch": 0.53, "learning_rate": 2.2399696270729403e-05, "loss": 0.8491, "step": 39810 }, { "epoch": 0.53, "learning_rate": 2.2394463272923773e-05, "loss": 1.2571, "step": 39815 }, { "epoch": 0.53, "learning_rate": 2.238923039053039e-05, "loss": 0.4509, "step": 39820 }, { "epoch": 0.53, "learning_rate": 2.2383997623781042e-05, "loss": 1.4584, "step": 39825 }, { "epoch": 0.53, "learning_rate": 2.2378764972907506e-05, "loss": 0.5724, "step": 39830 }, { "epoch": 0.53, "learning_rate": 2.2373532438141567e-05, "loss": 1.2909, "step": 39835 }, { "epoch": 0.53, "learning_rate": 2.2368300019715018e-05, "loss": 1.2248, "step": 39840 }, { "epoch": 0.53, "learning_rate": 2.2363067717859592e-05, "loss": 0.5655, "step": 39845 }, { "epoch": 0.53, "learning_rate": 2.2357835532807082e-05, "loss": 0.5506, "step": 39850 }, { "epoch": 0.53, "learning_rate": 2.235260346478923e-05, "loss": 0.564, "step": 39855 }, { "epoch": 0.53, "learning_rate": 2.2347371514037817e-05, "loss": 0.559, "step": 39860 }, { "epoch": 0.53, "learning_rate": 2.234213968078456e-05, "loss": 0.7027, "step": 39865 }, { "epoch": 0.53, "learning_rate": 2.233690796526123e-05, "loss": 0.7863, "step": 39870 }, { "epoch": 0.53, "learning_rate": 2.233167636769955e-05, "loss": 0.599, "step": 39875 }, { "epoch": 0.53, "learning_rate": 2.2326444888331256e-05, "loss": 0.2654, "step": 39880 }, { "epoch": 0.53, "learning_rate": 2.2321213527388074e-05, "loss": 0.5656, "step": 39885 }, { "epoch": 0.53, "learning_rate": 2.2315982285101748e-05, "loss": 0.8611, "step": 39890 }, { "epoch": 0.53, "learning_rate": 2.2310751161703962e-05, "loss": 0.8166, "step": 39895 }, { "epoch": 0.53, "learning_rate": 2.230552015742645e-05, "loss": 0.9061, "step": 39900 }, { "epoch": 0.53, "learning_rate": 2.2300289272500918e-05, "loss": 0.5843, "step": 39905 }, { "epoch": 0.53, "learning_rate": 2.229505850715906e-05, "loss": 0.5346, "step": 39910 }, { "epoch": 0.53, "learning_rate": 2.2289827861632582e-05, "loss": 0.7084, "step": 39915 }, { "epoch": 0.53, "learning_rate": 2.2284597336153175e-05, "loss": 0.8035, "step": 39920 }, { "epoch": 0.53, "learning_rate": 2.2279366930952515e-05, "loss": 0.4581, "step": 39925 }, { "epoch": 0.54, "learning_rate": 2.227413664626229e-05, "loss": 0.511, "step": 39930 }, { "epoch": 0.54, "learning_rate": 2.2268906482314176e-05, "loss": 0.6989, "step": 39935 }, { "epoch": 0.54, "learning_rate": 2.2263676439339838e-05, "loss": 0.5207, "step": 39940 }, { "epoch": 0.54, "learning_rate": 2.2258446517570944e-05, "loss": 0.4812, "step": 39945 }, { "epoch": 0.54, "learning_rate": 2.2253216717239168e-05, "loss": 0.6702, "step": 39950 }, { "epoch": 0.54, "learning_rate": 2.2247987038576136e-05, "loss": 0.2732, "step": 39955 }, { "epoch": 0.54, "learning_rate": 2.224275748181351e-05, "loss": 0.8165, "step": 39960 }, { "epoch": 0.54, "learning_rate": 2.2237528047182925e-05, "loss": 0.7017, "step": 39965 }, { "epoch": 0.54, "learning_rate": 2.223229873491605e-05, "loss": 1.1226, "step": 39970 }, { "epoch": 0.54, "learning_rate": 2.2227069545244478e-05, "loss": 0.5512, "step": 39975 }, { "epoch": 0.54, "learning_rate": 2.2221840478399856e-05, "loss": 0.4555, "step": 39980 }, { "epoch": 0.54, "learning_rate": 2.2216611534613806e-05, "loss": 0.6393, "step": 39985 }, { "epoch": 0.54, "learning_rate": 2.2211382714117933e-05, "loss": 0.9897, "step": 39990 }, { "epoch": 0.54, "learning_rate": 2.220615401714386e-05, "loss": 0.9421, "step": 39995 }, { "epoch": 0.54, "learning_rate": 2.2200925443923196e-05, "loss": 0.093, "step": 40000 }, { "epoch": 0.54, "learning_rate": 2.2195696994687518e-05, "loss": 0.594, "step": 40005 }, { "epoch": 0.54, "learning_rate": 2.2190468669668435e-05, "loss": 0.6355, "step": 40010 }, { "epoch": 0.54, "learning_rate": 2.218524046909754e-05, "loss": 0.4339, "step": 40015 }, { "epoch": 0.54, "learning_rate": 2.2180012393206406e-05, "loss": 0.5296, "step": 40020 }, { "epoch": 0.54, "learning_rate": 2.2174784442226614e-05, "loss": 0.2728, "step": 40025 }, { "epoch": 0.54, "learning_rate": 2.2169556616389747e-05, "loss": 0.6196, "step": 40030 }, { "epoch": 0.54, "learning_rate": 2.216432891592735e-05, "loss": 0.709, "step": 40035 }, { "epoch": 0.54, "learning_rate": 2.2159101341071e-05, "loss": 1.1129, "step": 40040 }, { "epoch": 0.54, "learning_rate": 2.215387389205225e-05, "loss": 0.9812, "step": 40045 }, { "epoch": 0.54, "learning_rate": 2.2148646569102642e-05, "loss": 0.4539, "step": 40050 }, { "epoch": 0.54, "learning_rate": 2.2143419372453727e-05, "loss": 1.3383, "step": 40055 }, { "epoch": 0.54, "learning_rate": 2.2138192302337056e-05, "loss": 1.3979, "step": 40060 }, { "epoch": 0.54, "learning_rate": 2.2132965358984138e-05, "loss": 0.5555, "step": 40065 }, { "epoch": 0.54, "learning_rate": 2.2127738542626503e-05, "loss": 0.8512, "step": 40070 }, { "epoch": 0.54, "learning_rate": 2.2122511853495687e-05, "loss": 0.6843, "step": 40075 }, { "epoch": 0.54, "learning_rate": 2.2117285291823208e-05, "loss": 0.5701, "step": 40080 }, { "epoch": 0.54, "learning_rate": 2.2112058857840566e-05, "loss": 1.0665, "step": 40085 }, { "epoch": 0.54, "learning_rate": 2.210683255177926e-05, "loss": 1.0836, "step": 40090 }, { "epoch": 0.54, "learning_rate": 2.210160637387081e-05, "loss": 1.4088, "step": 40095 }, { "epoch": 0.54, "learning_rate": 2.209638032434669e-05, "loss": 0.9429, "step": 40100 }, { "epoch": 0.54, "learning_rate": 2.2091154403438395e-05, "loss": 0.5527, "step": 40105 }, { "epoch": 0.54, "learning_rate": 2.2085928611377415e-05, "loss": 0.4841, "step": 40110 }, { "epoch": 0.54, "learning_rate": 2.2080702948395214e-05, "loss": 0.7739, "step": 40115 }, { "epoch": 0.54, "learning_rate": 2.207547741472326e-05, "loss": 1.0935, "step": 40120 }, { "epoch": 0.54, "learning_rate": 2.2070252010593038e-05, "loss": 0.925, "step": 40125 }, { "epoch": 0.54, "learning_rate": 2.2065026736235987e-05, "loss": 0.7207, "step": 40130 }, { "epoch": 0.54, "learning_rate": 2.205980159188357e-05, "loss": 0.7099, "step": 40135 }, { "epoch": 0.54, "learning_rate": 2.2054576577767243e-05, "loss": 1.411, "step": 40140 }, { "epoch": 0.54, "learning_rate": 2.2049351694118427e-05, "loss": 0.3133, "step": 40145 }, { "epoch": 0.54, "learning_rate": 2.2044126941168566e-05, "loss": 0.7647, "step": 40150 }, { "epoch": 0.54, "learning_rate": 2.20389023191491e-05, "loss": 0.2903, "step": 40155 }, { "epoch": 0.54, "learning_rate": 2.2033677828291445e-05, "loss": 1.1076, "step": 40160 }, { "epoch": 0.54, "learning_rate": 2.2028453468827023e-05, "loss": 0.921, "step": 40165 }, { "epoch": 0.54, "learning_rate": 2.2023229240987256e-05, "loss": 0.2541, "step": 40170 }, { "epoch": 0.54, "learning_rate": 2.2018005145003528e-05, "loss": 0.4771, "step": 40175 }, { "epoch": 0.54, "learning_rate": 2.201278118110725e-05, "loss": 1.1008, "step": 40180 }, { "epoch": 0.54, "learning_rate": 2.2007557349529838e-05, "loss": 0.2357, "step": 40185 }, { "epoch": 0.54, "learning_rate": 2.2002333650502653e-05, "loss": 0.5524, "step": 40190 }, { "epoch": 0.54, "learning_rate": 2.1997110084257092e-05, "loss": 0.6252, "step": 40195 }, { "epoch": 0.54, "learning_rate": 2.199188665102453e-05, "loss": 0.7718, "step": 40200 }, { "epoch": 0.54, "learning_rate": 2.1986663351036345e-05, "loss": 0.4512, "step": 40205 }, { "epoch": 0.54, "learning_rate": 2.198144018452389e-05, "loss": 0.6309, "step": 40210 }, { "epoch": 0.54, "learning_rate": 2.197621715171854e-05, "loss": 0.3974, "step": 40215 }, { "epoch": 0.54, "learning_rate": 2.1970994252851648e-05, "loss": 0.9394, "step": 40220 }, { "epoch": 0.54, "learning_rate": 2.196577148815455e-05, "loss": 0.8769, "step": 40225 }, { "epoch": 0.54, "learning_rate": 2.1960548857858593e-05, "loss": 0.8343, "step": 40230 }, { "epoch": 0.54, "learning_rate": 2.195532636219512e-05, "loss": 0.389, "step": 40235 }, { "epoch": 0.54, "learning_rate": 2.1950104001395456e-05, "loss": 0.3205, "step": 40240 }, { "epoch": 0.54, "learning_rate": 2.194488177569092e-05, "loss": 0.8284, "step": 40245 }, { "epoch": 0.54, "learning_rate": 2.1939659685312854e-05, "loss": 0.6614, "step": 40250 }, { "epoch": 0.54, "learning_rate": 2.1934437730492543e-05, "loss": 1.3935, "step": 40255 }, { "epoch": 0.54, "learning_rate": 2.19292159114613e-05, "loss": 0.8467, "step": 40260 }, { "epoch": 0.54, "learning_rate": 2.1923994228450436e-05, "loss": 0.6248, "step": 40265 }, { "epoch": 0.54, "learning_rate": 2.1918772681691236e-05, "loss": 0.4923, "step": 40270 }, { "epoch": 0.54, "learning_rate": 2.191355127141499e-05, "loss": 0.4398, "step": 40275 }, { "epoch": 0.54, "learning_rate": 2.1908329997852992e-05, "loss": 1.2534, "step": 40280 }, { "epoch": 0.54, "learning_rate": 2.190310886123649e-05, "loss": 0.9327, "step": 40285 }, { "epoch": 0.54, "learning_rate": 2.1897887861796783e-05, "loss": 0.5238, "step": 40290 }, { "epoch": 0.54, "learning_rate": 2.189266699976513e-05, "loss": 0.5665, "step": 40295 }, { "epoch": 0.54, "learning_rate": 2.1887446275372772e-05, "loss": 0.2463, "step": 40300 }, { "epoch": 0.54, "learning_rate": 2.1882225688850975e-05, "loss": 0.8502, "step": 40305 }, { "epoch": 0.54, "learning_rate": 2.187700524043098e-05, "loss": 0.8139, "step": 40310 }, { "epoch": 0.54, "learning_rate": 2.1871784930344037e-05, "loss": 0.8159, "step": 40315 }, { "epoch": 0.54, "learning_rate": 2.1866564758821367e-05, "loss": 1.2015, "step": 40320 }, { "epoch": 0.54, "learning_rate": 2.18613447260942e-05, "loss": 0.8331, "step": 40325 }, { "epoch": 0.54, "learning_rate": 2.185612483239377e-05, "loss": 0.5036, "step": 40330 }, { "epoch": 0.54, "learning_rate": 2.185090507795127e-05, "loss": 1.2827, "step": 40335 }, { "epoch": 0.54, "learning_rate": 2.184568546299792e-05, "loss": 1.0168, "step": 40340 }, { "epoch": 0.54, "learning_rate": 2.1840465987764937e-05, "loss": 0.7146, "step": 40345 }, { "epoch": 0.54, "learning_rate": 2.183524665248349e-05, "loss": 0.4825, "step": 40350 }, { "epoch": 0.54, "learning_rate": 2.1830027457384784e-05, "loss": 0.8018, "step": 40355 }, { "epoch": 0.54, "learning_rate": 2.1824808402700016e-05, "loss": 0.6993, "step": 40360 }, { "epoch": 0.54, "learning_rate": 2.181958948866034e-05, "loss": 1.025, "step": 40365 }, { "epoch": 0.54, "learning_rate": 2.181437071549694e-05, "loss": 1.7122, "step": 40370 }, { "epoch": 0.54, "learning_rate": 2.1809152083440985e-05, "loss": 0.7185, "step": 40375 }, { "epoch": 0.54, "learning_rate": 2.180393359272362e-05, "loss": 1.4574, "step": 40380 }, { "epoch": 0.54, "learning_rate": 2.1798715243576013e-05, "loss": 0.8535, "step": 40385 }, { "epoch": 0.54, "learning_rate": 2.179349703622931e-05, "loss": 0.9845, "step": 40390 }, { "epoch": 0.54, "learning_rate": 2.1788278970914635e-05, "loss": 0.8865, "step": 40395 }, { "epoch": 0.54, "learning_rate": 2.1783061047863136e-05, "loss": 0.8595, "step": 40400 }, { "epoch": 0.54, "learning_rate": 2.1777843267305954e-05, "loss": 0.9254, "step": 40405 }, { "epoch": 0.54, "learning_rate": 2.1772625629474182e-05, "loss": 0.4092, "step": 40410 }, { "epoch": 0.54, "learning_rate": 2.176740813459895e-05, "loss": 0.9535, "step": 40415 }, { "epoch": 0.54, "learning_rate": 2.1762190782911363e-05, "loss": 0.7829, "step": 40420 }, { "epoch": 0.54, "learning_rate": 2.175697357464253e-05, "loss": 0.4733, "step": 40425 }, { "epoch": 0.54, "learning_rate": 2.1751756510023542e-05, "loss": 0.8166, "step": 40430 }, { "epoch": 0.54, "learning_rate": 2.1746539589285486e-05, "loss": 0.846, "step": 40435 }, { "epoch": 0.54, "learning_rate": 2.1741322812659464e-05, "loss": 0.7247, "step": 40440 }, { "epoch": 0.54, "learning_rate": 2.1736106180376527e-05, "loss": 0.4092, "step": 40445 }, { "epoch": 0.54, "learning_rate": 2.1730889692667758e-05, "loss": 1.1577, "step": 40450 }, { "epoch": 0.54, "learning_rate": 2.1725673349764224e-05, "loss": 0.4357, "step": 40455 }, { "epoch": 0.54, "learning_rate": 2.1720457151896977e-05, "loss": 0.9055, "step": 40460 }, { "epoch": 0.54, "learning_rate": 2.1715241099297066e-05, "loss": 0.7857, "step": 40465 }, { "epoch": 0.54, "learning_rate": 2.171002519219556e-05, "loss": 0.6968, "step": 40470 }, { "epoch": 0.54, "learning_rate": 2.1704809430823465e-05, "loss": 0.6414, "step": 40475 }, { "epoch": 0.54, "learning_rate": 2.1699593815411824e-05, "loss": 0.3472, "step": 40480 }, { "epoch": 0.54, "learning_rate": 2.1694378346191673e-05, "loss": 0.3679, "step": 40485 }, { "epoch": 0.54, "learning_rate": 2.1689163023394018e-05, "loss": 1.3506, "step": 40490 }, { "epoch": 0.54, "learning_rate": 2.168394784724988e-05, "loss": 1.4142, "step": 40495 }, { "epoch": 0.54, "learning_rate": 2.167873281799026e-05, "loss": 1.0995, "step": 40500 }, { "epoch": 0.54, "learning_rate": 2.1673517935846163e-05, "loss": 0.2636, "step": 40505 }, { "epoch": 0.54, "learning_rate": 2.1668303201048578e-05, "loss": 0.6602, "step": 40510 }, { "epoch": 0.54, "learning_rate": 2.1663088613828504e-05, "loss": 0.7995, "step": 40515 }, { "epoch": 0.54, "learning_rate": 2.1657874174416898e-05, "loss": 0.8921, "step": 40520 }, { "epoch": 0.54, "learning_rate": 2.1652659883044744e-05, "loss": 0.4332, "step": 40525 }, { "epoch": 0.54, "learning_rate": 2.1647445739943014e-05, "loss": 0.8387, "step": 40530 }, { "epoch": 0.54, "learning_rate": 2.1642231745342673e-05, "loss": 0.7704, "step": 40535 }, { "epoch": 0.54, "learning_rate": 2.163701789947466e-05, "loss": 1.1287, "step": 40540 }, { "epoch": 0.54, "learning_rate": 2.1631804202569928e-05, "loss": 0.5718, "step": 40545 }, { "epoch": 0.54, "learning_rate": 2.162659065485943e-05, "loss": 0.4294, "step": 40550 }, { "epoch": 0.54, "learning_rate": 2.162137725657408e-05, "loss": 0.7082, "step": 40555 }, { "epoch": 0.54, "learning_rate": 2.1616164007944813e-05, "loss": 0.3093, "step": 40560 }, { "epoch": 0.54, "learning_rate": 2.161095090920256e-05, "loss": 0.3825, "step": 40565 }, { "epoch": 0.54, "learning_rate": 2.1605737960578222e-05, "loss": 0.5389, "step": 40570 }, { "epoch": 0.54, "learning_rate": 2.1600525162302706e-05, "loss": 0.7158, "step": 40575 }, { "epoch": 0.54, "learning_rate": 2.159531251460693e-05, "loss": 0.5659, "step": 40580 }, { "epoch": 0.54, "learning_rate": 2.159010001772177e-05, "loss": 0.5985, "step": 40585 }, { "epoch": 0.54, "learning_rate": 2.158488767187812e-05, "loss": 0.4782, "step": 40590 }, { "epoch": 0.54, "learning_rate": 2.157967547730686e-05, "loss": 0.4415, "step": 40595 }, { "epoch": 0.54, "learning_rate": 2.1574463434238868e-05, "loss": 0.7301, "step": 40600 }, { "epoch": 0.54, "learning_rate": 2.1569251542905e-05, "loss": 1.2419, "step": 40605 }, { "epoch": 0.54, "learning_rate": 2.156403980353614e-05, "loss": 0.5321, "step": 40610 }, { "epoch": 0.54, "learning_rate": 2.1558828216363115e-05, "loss": 0.7913, "step": 40615 }, { "epoch": 0.54, "learning_rate": 2.1553616781616786e-05, "loss": 0.5371, "step": 40620 }, { "epoch": 0.54, "learning_rate": 2.1548405499528003e-05, "loss": 0.1949, "step": 40625 }, { "epoch": 0.54, "learning_rate": 2.1543194370327576e-05, "loss": 0.3596, "step": 40630 }, { "epoch": 0.54, "learning_rate": 2.153798339424635e-05, "loss": 0.879, "step": 40635 }, { "epoch": 0.54, "learning_rate": 2.1532772571515134e-05, "loss": 0.5476, "step": 40640 }, { "epoch": 0.54, "learning_rate": 2.1527561902364755e-05, "loss": 0.3708, "step": 40645 }, { "epoch": 0.54, "learning_rate": 2.1522351387026005e-05, "loss": 0.9433, "step": 40650 }, { "epoch": 0.54, "learning_rate": 2.151714102572969e-05, "loss": 1.1373, "step": 40655 }, { "epoch": 0.54, "learning_rate": 2.1511930818706616e-05, "loss": 0.3557, "step": 40660 }, { "epoch": 0.54, "learning_rate": 2.1506720766187542e-05, "loss": 0.6202, "step": 40665 }, { "epoch": 0.54, "learning_rate": 2.1501510868403265e-05, "loss": 0.6737, "step": 40670 }, { "epoch": 0.54, "learning_rate": 2.1496301125584563e-05, "loss": 0.2933, "step": 40675 }, { "epoch": 0.55, "learning_rate": 2.149109153796218e-05, "loss": 0.1842, "step": 40680 }, { "epoch": 0.55, "learning_rate": 2.148588210576689e-05, "loss": 0.576, "step": 40685 }, { "epoch": 0.55, "learning_rate": 2.1480672829229452e-05, "loss": 0.9606, "step": 40690 }, { "epoch": 0.55, "learning_rate": 2.1475463708580594e-05, "loss": 0.4606, "step": 40695 }, { "epoch": 0.55, "learning_rate": 2.1470254744051055e-05, "loss": 1.0248, "step": 40700 }, { "epoch": 0.55, "learning_rate": 2.1465045935871587e-05, "loss": 0.9026, "step": 40705 }, { "epoch": 0.55, "learning_rate": 2.145983728427289e-05, "loss": 0.9886, "step": 40710 }, { "epoch": 0.55, "learning_rate": 2.1454628789485684e-05, "loss": 0.5913, "step": 40715 }, { "epoch": 0.55, "learning_rate": 2.1449420451740695e-05, "loss": 0.3061, "step": 40720 }, { "epoch": 0.55, "learning_rate": 2.1444212271268613e-05, "loss": 0.4997, "step": 40725 }, { "epoch": 0.55, "learning_rate": 2.1439004248300136e-05, "loss": 0.434, "step": 40730 }, { "epoch": 0.55, "learning_rate": 2.1433796383065972e-05, "loss": 1.126, "step": 40735 }, { "epoch": 0.55, "learning_rate": 2.142858867579677e-05, "loss": 0.7776, "step": 40740 }, { "epoch": 0.55, "learning_rate": 2.1423381126723224e-05, "loss": 1.0911, "step": 40745 }, { "epoch": 0.55, "learning_rate": 2.141817373607601e-05, "loss": 1.3896, "step": 40750 }, { "epoch": 0.55, "learning_rate": 2.141296650408577e-05, "loss": 0.9619, "step": 40755 }, { "epoch": 0.55, "learning_rate": 2.140775943098317e-05, "loss": 0.6997, "step": 40760 }, { "epoch": 0.55, "learning_rate": 2.1402552516998854e-05, "loss": 0.783, "step": 40765 }, { "epoch": 0.55, "learning_rate": 2.139734576236348e-05, "loss": 0.9878, "step": 40770 }, { "epoch": 0.55, "learning_rate": 2.139213916730765e-05, "loss": 0.9636, "step": 40775 }, { "epoch": 0.55, "learning_rate": 2.1386932732062005e-05, "loss": 0.7481, "step": 40780 }, { "epoch": 0.55, "learning_rate": 2.1381726456857175e-05, "loss": 0.6062, "step": 40785 }, { "epoch": 0.55, "learning_rate": 2.137652034192375e-05, "loss": 0.3017, "step": 40790 }, { "epoch": 0.55, "learning_rate": 2.137131438749235e-05, "loss": 0.9077, "step": 40795 }, { "epoch": 0.55, "learning_rate": 2.1366108593793576e-05, "loss": 1.2066, "step": 40800 }, { "epoch": 0.55, "learning_rate": 2.1360902961058005e-05, "loss": 0.8259, "step": 40805 }, { "epoch": 0.55, "learning_rate": 2.135569748951622e-05, "loss": 0.3358, "step": 40810 }, { "epoch": 0.55, "learning_rate": 2.1350492179398817e-05, "loss": 0.8626, "step": 40815 }, { "epoch": 0.55, "learning_rate": 2.134528703093635e-05, "loss": 1.0799, "step": 40820 }, { "epoch": 0.55, "learning_rate": 2.1340082044359376e-05, "loss": 1.1772, "step": 40825 }, { "epoch": 0.55, "learning_rate": 2.1334877219898462e-05, "loss": 0.6481, "step": 40830 }, { "epoch": 0.55, "learning_rate": 2.1329672557784152e-05, "loss": 0.4473, "step": 40835 }, { "epoch": 0.55, "learning_rate": 2.132446805824698e-05, "loss": 0.3794, "step": 40840 }, { "epoch": 0.55, "learning_rate": 2.13192637215175e-05, "loss": 0.772, "step": 40845 }, { "epoch": 0.55, "learning_rate": 2.131405954782621e-05, "loss": 1.1706, "step": 40850 }, { "epoch": 0.55, "learning_rate": 2.1308855537403644e-05, "loss": 0.4547, "step": 40855 }, { "epoch": 0.55, "learning_rate": 2.1303651690480313e-05, "loss": 1.1771, "step": 40860 }, { "epoch": 0.55, "learning_rate": 2.1298448007286717e-05, "loss": 0.0776, "step": 40865 }, { "epoch": 0.55, "learning_rate": 2.1293244488053356e-05, "loss": 1.5006, "step": 40870 }, { "epoch": 0.55, "learning_rate": 2.1288041133010718e-05, "loss": 0.3583, "step": 40875 }, { "epoch": 0.55, "learning_rate": 2.12828379423893e-05, "loss": 0.4558, "step": 40880 }, { "epoch": 0.55, "learning_rate": 2.1277634916419556e-05, "loss": 0.5257, "step": 40885 }, { "epoch": 0.55, "learning_rate": 2.127243205533196e-05, "loss": 0.6123, "step": 40890 }, { "epoch": 0.55, "learning_rate": 2.1267229359356982e-05, "loss": 0.6637, "step": 40895 }, { "epoch": 0.55, "learning_rate": 2.1262026828725064e-05, "loss": 1.2094, "step": 40900 }, { "epoch": 0.55, "learning_rate": 2.1256824463666654e-05, "loss": 1.2015, "step": 40905 }, { "epoch": 0.55, "learning_rate": 2.125162226441221e-05, "loss": 0.3555, "step": 40910 }, { "epoch": 0.55, "learning_rate": 2.1246420231192125e-05, "loss": 0.6477, "step": 40915 }, { "epoch": 0.55, "learning_rate": 2.124121836423685e-05, "loss": 1.0049, "step": 40920 }, { "epoch": 0.55, "learning_rate": 2.1236016663776812e-05, "loss": 0.8484, "step": 40925 }, { "epoch": 0.55, "learning_rate": 2.123081513004239e-05, "loss": 0.2513, "step": 40930 }, { "epoch": 0.55, "learning_rate": 2.122561376326401e-05, "loss": 0.851, "step": 40935 }, { "epoch": 0.55, "learning_rate": 2.1220412563672055e-05, "loss": 0.9733, "step": 40940 }, { "epoch": 0.55, "learning_rate": 2.121521153149691e-05, "loss": 0.4753, "step": 40945 }, { "epoch": 0.55, "learning_rate": 2.121001066696896e-05, "loss": 0.4078, "step": 40950 }, { "epoch": 0.55, "learning_rate": 2.120480997031859e-05, "loss": 0.7972, "step": 40955 }, { "epoch": 0.55, "learning_rate": 2.1199609441776143e-05, "loss": 0.8433, "step": 40960 }, { "epoch": 0.55, "learning_rate": 2.119440908157198e-05, "loss": 0.2465, "step": 40965 }, { "epoch": 0.55, "learning_rate": 2.1189208889936463e-05, "loss": 0.8, "step": 40970 }, { "epoch": 0.55, "learning_rate": 2.1184008867099918e-05, "loss": 0.802, "step": 40975 }, { "epoch": 0.55, "learning_rate": 2.1178809013292694e-05, "loss": 1.1767, "step": 40980 }, { "epoch": 0.55, "learning_rate": 2.1173609328745113e-05, "loss": 0.5137, "step": 40985 }, { "epoch": 0.55, "learning_rate": 2.1168409813687507e-05, "loss": 0.578, "step": 40990 }, { "epoch": 0.55, "learning_rate": 2.1163210468350166e-05, "loss": 0.6696, "step": 40995 }, { "epoch": 0.55, "learning_rate": 2.1158011292963407e-05, "loss": 1.1505, "step": 41000 }, { "epoch": 0.55, "learning_rate": 2.115281228775753e-05, "loss": 0.7022, "step": 41005 }, { "epoch": 0.55, "learning_rate": 2.1147613452962818e-05, "loss": 1.2963, "step": 41010 }, { "epoch": 0.55, "learning_rate": 2.114241478880956e-05, "loss": 0.4299, "step": 41015 }, { "epoch": 0.55, "learning_rate": 2.1137216295528035e-05, "loss": 0.9534, "step": 41020 }, { "epoch": 0.55, "learning_rate": 2.113201797334849e-05, "loss": 0.407, "step": 41025 }, { "epoch": 0.55, "learning_rate": 2.1126819822501197e-05, "loss": 0.8435, "step": 41030 }, { "epoch": 0.55, "learning_rate": 2.1121621843216425e-05, "loss": 0.6917, "step": 41035 }, { "epoch": 0.55, "learning_rate": 2.1116424035724393e-05, "loss": 0.716, "step": 41040 }, { "epoch": 0.55, "learning_rate": 2.1111226400255346e-05, "loss": 1.0818, "step": 41045 }, { "epoch": 0.55, "learning_rate": 2.110602893703952e-05, "loss": 0.7418, "step": 41050 }, { "epoch": 0.55, "learning_rate": 2.1100831646307123e-05, "loss": 0.9556, "step": 41055 }, { "epoch": 0.55, "learning_rate": 2.1095634528288376e-05, "loss": 0.9536, "step": 41060 }, { "epoch": 0.55, "learning_rate": 2.1090437583213502e-05, "loss": 0.7507, "step": 41065 }, { "epoch": 0.55, "learning_rate": 2.1085240811312672e-05, "loss": 0.7218, "step": 41070 }, { "epoch": 0.55, "learning_rate": 2.1080044212816088e-05, "loss": 0.512, "step": 41075 }, { "epoch": 0.55, "learning_rate": 2.1074847787953943e-05, "loss": 0.8789, "step": 41080 }, { "epoch": 0.55, "learning_rate": 2.1069651536956393e-05, "loss": 0.8943, "step": 41085 }, { "epoch": 0.55, "learning_rate": 2.1064455460053624e-05, "loss": 0.6302, "step": 41090 }, { "epoch": 0.55, "learning_rate": 2.1059259557475782e-05, "loss": 0.8251, "step": 41095 }, { "epoch": 0.55, "learning_rate": 2.105406382945304e-05, "loss": 0.379, "step": 41100 }, { "epoch": 0.55, "learning_rate": 2.1048868276215523e-05, "loss": 0.3916, "step": 41105 }, { "epoch": 0.55, "learning_rate": 2.104367289799337e-05, "loss": 0.7251, "step": 41110 }, { "epoch": 0.55, "learning_rate": 2.103847769501672e-05, "loss": 0.5583, "step": 41115 }, { "epoch": 0.55, "learning_rate": 2.1033282667515686e-05, "loss": 1.0691, "step": 41120 }, { "epoch": 0.55, "learning_rate": 2.1028087815720383e-05, "loss": 0.9314, "step": 41125 }, { "epoch": 0.55, "learning_rate": 2.1022893139860924e-05, "loss": 0.6637, "step": 41130 }, { "epoch": 0.55, "learning_rate": 2.1017698640167398e-05, "loss": 0.4869, "step": 41135 }, { "epoch": 0.55, "learning_rate": 2.1012504316869903e-05, "loss": 0.8049, "step": 41140 }, { "epoch": 0.55, "learning_rate": 2.1007310170198523e-05, "loss": 1.0503, "step": 41145 }, { "epoch": 0.55, "learning_rate": 2.100211620038332e-05, "loss": 0.7807, "step": 41150 }, { "epoch": 0.55, "learning_rate": 2.0996922407654368e-05, "loss": 0.6888, "step": 41155 }, { "epoch": 0.55, "learning_rate": 2.099172879224173e-05, "loss": 0.952, "step": 41160 }, { "epoch": 0.55, "learning_rate": 2.098653535437545e-05, "loss": 0.4726, "step": 41165 }, { "epoch": 0.55, "learning_rate": 2.0981342094285575e-05, "loss": 0.9121, "step": 41170 }, { "epoch": 0.55, "learning_rate": 2.097614901220215e-05, "loss": 0.3679, "step": 41175 }, { "epoch": 0.55, "learning_rate": 2.0970956108355185e-05, "loss": 0.6308, "step": 41180 }, { "epoch": 0.55, "learning_rate": 2.0965763382974706e-05, "loss": 0.2115, "step": 41185 }, { "epoch": 0.55, "learning_rate": 2.096057083629073e-05, "loss": 0.1853, "step": 41190 }, { "epoch": 0.55, "learning_rate": 2.0955378468533255e-05, "loss": 0.2314, "step": 41195 }, { "epoch": 0.55, "learning_rate": 2.095018627993228e-05, "loss": 0.4218, "step": 41200 }, { "epoch": 0.55, "learning_rate": 2.094499427071779e-05, "loss": 0.7691, "step": 41205 }, { "epoch": 0.55, "learning_rate": 2.0939802441119778e-05, "loss": 0.2815, "step": 41210 }, { "epoch": 0.55, "learning_rate": 2.0934610791368194e-05, "loss": 0.825, "step": 41215 }, { "epoch": 0.55, "learning_rate": 2.0929419321693015e-05, "loss": 0.9764, "step": 41220 }, { "epoch": 0.55, "learning_rate": 2.09242280323242e-05, "loss": 0.624, "step": 41225 }, { "epoch": 0.55, "learning_rate": 2.091903692349169e-05, "loss": 1.148, "step": 41230 }, { "epoch": 0.55, "learning_rate": 2.0913845995425424e-05, "loss": 0.3669, "step": 41235 }, { "epoch": 0.55, "learning_rate": 2.0908655248355348e-05, "loss": 0.8137, "step": 41240 }, { "epoch": 0.55, "learning_rate": 2.0903464682511365e-05, "loss": 0.8255, "step": 41245 }, { "epoch": 0.55, "learning_rate": 2.0898274298123405e-05, "loss": 0.9852, "step": 41250 }, { "epoch": 0.55, "learning_rate": 2.0893084095421383e-05, "loss": 0.9134, "step": 41255 }, { "epoch": 0.55, "learning_rate": 2.088789407463518e-05, "loss": 0.1732, "step": 41260 }, { "epoch": 0.55, "learning_rate": 2.08827042359947e-05, "loss": 0.6607, "step": 41265 }, { "epoch": 0.55, "learning_rate": 2.0877514579729823e-05, "loss": 0.4656, "step": 41270 }, { "epoch": 0.55, "learning_rate": 2.0872325106070424e-05, "loss": 0.3713, "step": 41275 }, { "epoch": 0.55, "learning_rate": 2.0867135815246374e-05, "loss": 1.5124, "step": 41280 }, { "epoch": 0.55, "learning_rate": 2.0861946707487542e-05, "loss": 0.7735, "step": 41285 }, { "epoch": 0.55, "learning_rate": 2.0856757783023757e-05, "loss": 0.6471, "step": 41290 }, { "epoch": 0.55, "learning_rate": 2.0851569042084873e-05, "loss": 0.7493, "step": 41295 }, { "epoch": 0.55, "learning_rate": 2.0846380484900734e-05, "loss": 1.0654, "step": 41300 }, { "epoch": 0.55, "learning_rate": 2.0841192111701153e-05, "loss": 0.7901, "step": 41305 }, { "epoch": 0.55, "learning_rate": 2.0836003922715954e-05, "loss": 0.9565, "step": 41310 }, { "epoch": 0.55, "learning_rate": 2.0830815918174955e-05, "loss": 0.8504, "step": 41315 }, { "epoch": 0.55, "learning_rate": 2.0825628098307958e-05, "loss": 1.028, "step": 41320 }, { "epoch": 0.55, "learning_rate": 2.0820440463344743e-05, "loss": 0.8016, "step": 41325 }, { "epoch": 0.55, "learning_rate": 2.08152530135151e-05, "loss": 0.747, "step": 41330 }, { "epoch": 0.55, "learning_rate": 2.0810065749048833e-05, "loss": 0.9241, "step": 41335 }, { "epoch": 0.55, "learning_rate": 2.0804878670175678e-05, "loss": 0.4534, "step": 41340 }, { "epoch": 0.55, "learning_rate": 2.079969177712541e-05, "loss": 0.9986, "step": 41345 }, { "epoch": 0.55, "learning_rate": 2.079450507012779e-05, "loss": 0.541, "step": 41350 }, { "epoch": 0.55, "learning_rate": 2.078931854941255e-05, "loss": 0.9566, "step": 41355 }, { "epoch": 0.55, "learning_rate": 2.078413221520943e-05, "loss": 0.8142, "step": 41360 }, { "epoch": 0.55, "learning_rate": 2.0778946067748176e-05, "loss": 0.769, "step": 41365 }, { "epoch": 0.55, "learning_rate": 2.077376010725848e-05, "loss": 0.4833, "step": 41370 }, { "epoch": 0.55, "learning_rate": 2.076857433397007e-05, "loss": 0.2988, "step": 41375 }, { "epoch": 0.55, "learning_rate": 2.0763388748112654e-05, "loss": 0.6917, "step": 41380 }, { "epoch": 0.55, "learning_rate": 2.0758203349915913e-05, "loss": 0.5861, "step": 41385 }, { "epoch": 0.55, "learning_rate": 2.0753018139609544e-05, "loss": 0.1773, "step": 41390 }, { "epoch": 0.55, "learning_rate": 2.0747833117423237e-05, "loss": 0.6717, "step": 41395 }, { "epoch": 0.55, "learning_rate": 2.074264828358664e-05, "loss": 1.085, "step": 41400 }, { "epoch": 0.55, "learning_rate": 2.073746363832942e-05, "loss": 0.9209, "step": 41405 }, { "epoch": 0.55, "learning_rate": 2.0732279181881247e-05, "loss": 1.0821, "step": 41410 }, { "epoch": 0.55, "learning_rate": 2.0727094914471746e-05, "loss": 0.2719, "step": 41415 }, { "epoch": 0.55, "learning_rate": 2.0721910836330567e-05, "loss": 0.7509, "step": 41420 }, { "epoch": 0.56, "learning_rate": 2.071672694768734e-05, "loss": 0.6744, "step": 41425 }, { "epoch": 0.56, "learning_rate": 2.0711543248771677e-05, "loss": 1.254, "step": 41430 }, { "epoch": 0.56, "learning_rate": 2.0706359739813193e-05, "loss": 1.3438, "step": 41435 }, { "epoch": 0.56, "learning_rate": 2.0701176421041483e-05, "loss": 1.4743, "step": 41440 }, { "epoch": 0.56, "learning_rate": 2.069599329268617e-05, "loss": 0.925, "step": 41445 }, { "epoch": 0.56, "learning_rate": 2.069081035497681e-05, "loss": 0.5309, "step": 41450 }, { "epoch": 0.56, "learning_rate": 2.0685627608142993e-05, "loss": 0.9611, "step": 41455 }, { "epoch": 0.56, "learning_rate": 2.0680445052414293e-05, "loss": 0.4118, "step": 41460 }, { "epoch": 0.56, "learning_rate": 2.0675262688020263e-05, "loss": 0.7483, "step": 41465 }, { "epoch": 0.56, "learning_rate": 2.067008051519046e-05, "loss": 0.3899, "step": 41470 }, { "epoch": 0.56, "learning_rate": 2.066489853415444e-05, "loss": 0.6933, "step": 41475 }, { "epoch": 0.56, "learning_rate": 2.0659716745141716e-05, "loss": 1.0061, "step": 41480 }, { "epoch": 0.56, "learning_rate": 2.0654535148381825e-05, "loss": 0.3179, "step": 41485 }, { "epoch": 0.56, "learning_rate": 2.0649353744104293e-05, "loss": 0.4413, "step": 41490 }, { "epoch": 0.56, "learning_rate": 2.0644172532538618e-05, "loss": 0.307, "step": 41495 }, { "epoch": 0.56, "learning_rate": 2.0638991513914312e-05, "loss": 0.1504, "step": 41500 }, { "epoch": 0.56, "learning_rate": 2.0633810688460874e-05, "loss": 1.1803, "step": 41505 }, { "epoch": 0.56, "learning_rate": 2.0628630056407766e-05, "loss": 0.6698, "step": 41510 }, { "epoch": 0.56, "learning_rate": 2.062344961798448e-05, "loss": 0.2754, "step": 41515 }, { "epoch": 0.56, "learning_rate": 2.0618269373420486e-05, "loss": 0.6829, "step": 41520 }, { "epoch": 0.56, "learning_rate": 2.0613089322945227e-05, "loss": 0.7031, "step": 41525 }, { "epoch": 0.56, "learning_rate": 2.0607909466788173e-05, "loss": 0.1354, "step": 41530 }, { "epoch": 0.56, "learning_rate": 2.060272980517876e-05, "loss": 0.5056, "step": 41535 }, { "epoch": 0.56, "learning_rate": 2.059755033834641e-05, "loss": 1.1282, "step": 41540 }, { "epoch": 0.56, "learning_rate": 2.059237106652055e-05, "loss": 0.5498, "step": 41545 }, { "epoch": 0.56, "learning_rate": 2.0587191989930604e-05, "loss": 0.4394, "step": 41550 }, { "epoch": 0.56, "learning_rate": 2.0582013108805993e-05, "loss": 0.5428, "step": 41555 }, { "epoch": 0.56, "learning_rate": 2.0576834423376082e-05, "loss": 0.4927, "step": 41560 }, { "epoch": 0.56, "learning_rate": 2.057165593387028e-05, "loss": 0.7639, "step": 41565 }, { "epoch": 0.56, "learning_rate": 2.056647764051797e-05, "loss": 0.7662, "step": 41570 }, { "epoch": 0.56, "learning_rate": 2.0561299543548516e-05, "loss": 0.9168, "step": 41575 }, { "epoch": 0.56, "learning_rate": 2.0556121643191282e-05, "loss": 0.5184, "step": 41580 }, { "epoch": 0.56, "learning_rate": 2.0550943939675645e-05, "loss": 0.3449, "step": 41585 }, { "epoch": 0.56, "learning_rate": 2.054576643323092e-05, "loss": 0.5415, "step": 41590 }, { "epoch": 0.56, "learning_rate": 2.0540589124086455e-05, "loss": 0.7054, "step": 41595 }, { "epoch": 0.56, "learning_rate": 2.0535412012471594e-05, "loss": 1.7067, "step": 41600 }, { "epoch": 0.56, "learning_rate": 2.0530235098615636e-05, "loss": 0.9149, "step": 41605 }, { "epoch": 0.56, "learning_rate": 2.05250583827479e-05, "loss": 0.6174, "step": 41610 }, { "epoch": 0.56, "learning_rate": 2.0519881865097705e-05, "loss": 0.2873, "step": 41615 }, { "epoch": 0.56, "learning_rate": 2.0514705545894312e-05, "loss": 1.5334, "step": 41620 }, { "epoch": 0.56, "learning_rate": 2.0509529425367034e-05, "loss": 0.3442, "step": 41625 }, { "epoch": 0.56, "learning_rate": 2.0504353503745135e-05, "loss": 0.4352, "step": 41630 }, { "epoch": 0.56, "learning_rate": 2.0499177781257883e-05, "loss": 0.6188, "step": 41635 }, { "epoch": 0.56, "learning_rate": 2.0494002258134537e-05, "loss": 1.2057, "step": 41640 }, { "epoch": 0.56, "learning_rate": 2.048882693460436e-05, "loss": 1.3596, "step": 41645 }, { "epoch": 0.56, "learning_rate": 2.048365181089657e-05, "loss": 0.7263, "step": 41650 }, { "epoch": 0.56, "learning_rate": 2.0478476887240407e-05, "loss": 0.8485, "step": 41655 }, { "epoch": 0.56, "learning_rate": 2.0473302163865098e-05, "loss": 0.9242, "step": 41660 }, { "epoch": 0.56, "learning_rate": 2.046812764099987e-05, "loss": 0.5554, "step": 41665 }, { "epoch": 0.56, "learning_rate": 2.0462953318873903e-05, "loss": 0.2346, "step": 41670 }, { "epoch": 0.56, "learning_rate": 2.0457779197716408e-05, "loss": 0.55, "step": 41675 }, { "epoch": 0.56, "learning_rate": 2.0452605277756576e-05, "loss": 0.8535, "step": 41680 }, { "epoch": 0.56, "learning_rate": 2.0447431559223574e-05, "loss": 0.697, "step": 41685 }, { "epoch": 0.56, "learning_rate": 2.044225804234658e-05, "loss": 0.3618, "step": 41690 }, { "epoch": 0.56, "learning_rate": 2.043708472735476e-05, "loss": 1.1012, "step": 41695 }, { "epoch": 0.56, "learning_rate": 2.043191161447725e-05, "loss": 0.0778, "step": 41700 }, { "epoch": 0.56, "learning_rate": 2.0426738703943203e-05, "loss": 0.7504, "step": 41705 }, { "epoch": 0.56, "learning_rate": 2.0421565995981755e-05, "loss": 0.7334, "step": 41710 }, { "epoch": 0.56, "learning_rate": 2.0416393490822027e-05, "loss": 0.2833, "step": 41715 }, { "epoch": 0.56, "learning_rate": 2.0411221188693133e-05, "loss": 0.5289, "step": 41720 }, { "epoch": 0.56, "learning_rate": 2.0406049089824193e-05, "loss": 1.0568, "step": 41725 }, { "epoch": 0.56, "learning_rate": 2.040087719444429e-05, "loss": 0.5189, "step": 41730 }, { "epoch": 0.56, "learning_rate": 2.0395705502782514e-05, "loss": 0.9266, "step": 41735 }, { "epoch": 0.56, "learning_rate": 2.0390534015067958e-05, "loss": 0.9451, "step": 41740 }, { "epoch": 0.56, "learning_rate": 2.0385362731529677e-05, "loss": 0.8129, "step": 41745 }, { "epoch": 0.56, "learning_rate": 2.038019165239674e-05, "loss": 0.7919, "step": 41750 }, { "epoch": 0.56, "learning_rate": 2.0375020777898215e-05, "loss": 0.8159, "step": 41755 }, { "epoch": 0.56, "learning_rate": 2.0369850108263112e-05, "loss": 0.5165, "step": 41760 }, { "epoch": 0.56, "learning_rate": 2.036467964372049e-05, "loss": 0.8094, "step": 41765 }, { "epoch": 0.56, "learning_rate": 2.0359509384499377e-05, "loss": 0.5144, "step": 41770 }, { "epoch": 0.56, "learning_rate": 2.0354339330828788e-05, "loss": 0.1571, "step": 41775 }, { "epoch": 0.56, "learning_rate": 2.0349169482937712e-05, "loss": 0.5352, "step": 41780 }, { "epoch": 0.56, "learning_rate": 2.0343999841055166e-05, "loss": 0.5747, "step": 41785 }, { "epoch": 0.56, "learning_rate": 2.0338830405410133e-05, "loss": 0.3268, "step": 41790 }, { "epoch": 0.56, "learning_rate": 2.0333661176231593e-05, "loss": 0.4895, "step": 41795 }, { "epoch": 0.56, "learning_rate": 2.032849215374852e-05, "loss": 0.2772, "step": 41800 }, { "epoch": 0.56, "learning_rate": 2.032332333818988e-05, "loss": 0.568, "step": 41805 }, { "epoch": 0.56, "learning_rate": 2.031815472978461e-05, "loss": 0.284, "step": 41810 }, { "epoch": 0.56, "learning_rate": 2.0312986328761664e-05, "loss": 1.0624, "step": 41815 }, { "epoch": 0.56, "learning_rate": 2.0307818135349978e-05, "loss": 0.451, "step": 41820 }, { "epoch": 0.56, "learning_rate": 2.0302650149778472e-05, "loss": 0.3846, "step": 41825 }, { "epoch": 0.56, "learning_rate": 2.029748237227606e-05, "loss": 1.3429, "step": 41830 }, { "epoch": 0.56, "learning_rate": 2.029231480307167e-05, "loss": 0.6758, "step": 41835 }, { "epoch": 0.56, "learning_rate": 2.0287147442394168e-05, "loss": 0.8833, "step": 41840 }, { "epoch": 0.56, "learning_rate": 2.0281980290472455e-05, "loss": 0.4358, "step": 41845 }, { "epoch": 0.56, "learning_rate": 2.027681334753542e-05, "loss": 0.3049, "step": 41850 }, { "epoch": 0.56, "learning_rate": 2.027164661381192e-05, "loss": 0.6699, "step": 41855 }, { "epoch": 0.56, "learning_rate": 2.0266480089530815e-05, "loss": 1.1397, "step": 41860 }, { "epoch": 0.56, "learning_rate": 2.0261313774920974e-05, "loss": 0.8273, "step": 41865 }, { "epoch": 0.56, "learning_rate": 2.025614767021121e-05, "loss": 1.7512, "step": 41870 }, { "epoch": 0.56, "learning_rate": 2.0250981775630378e-05, "loss": 0.9665, "step": 41875 }, { "epoch": 0.56, "learning_rate": 2.0245816091407295e-05, "loss": 0.4744, "step": 41880 }, { "epoch": 0.56, "learning_rate": 2.0240650617770786e-05, "loss": 1.2586, "step": 41885 }, { "epoch": 0.56, "learning_rate": 2.023548535494963e-05, "loss": 0.9402, "step": 41890 }, { "epoch": 0.56, "learning_rate": 2.0230320303172638e-05, "loss": 0.2325, "step": 41895 }, { "epoch": 0.56, "learning_rate": 2.02251554626686e-05, "loss": 0.6468, "step": 41900 }, { "epoch": 0.56, "learning_rate": 2.021999083366628e-05, "loss": 1.1122, "step": 41905 }, { "epoch": 0.56, "learning_rate": 2.0214826416394454e-05, "loss": 0.8127, "step": 41910 }, { "epoch": 0.56, "learning_rate": 2.020966221108189e-05, "loss": 0.9836, "step": 41915 }, { "epoch": 0.56, "learning_rate": 2.0204498217957316e-05, "loss": 0.8101, "step": 41920 }, { "epoch": 0.56, "learning_rate": 2.0199334437249478e-05, "loss": 0.6713, "step": 41925 }, { "epoch": 0.56, "learning_rate": 2.0194170869187113e-05, "loss": 0.5806, "step": 41930 }, { "epoch": 0.56, "learning_rate": 2.0189007513998927e-05, "loss": 1.0417, "step": 41935 }, { "epoch": 0.56, "learning_rate": 2.0183844371913643e-05, "loss": 0.6865, "step": 41940 }, { "epoch": 0.56, "learning_rate": 2.017868144315997e-05, "loss": 0.7997, "step": 41945 }, { "epoch": 0.56, "learning_rate": 2.0173518727966578e-05, "loss": 1.1317, "step": 41950 }, { "epoch": 0.56, "learning_rate": 2.0168356226562158e-05, "loss": 0.6451, "step": 41955 }, { "epoch": 0.56, "learning_rate": 2.016319393917539e-05, "loss": 1.1127, "step": 41960 }, { "epoch": 0.56, "learning_rate": 2.0158031866034933e-05, "loss": 1.3439, "step": 41965 }, { "epoch": 0.56, "learning_rate": 2.0152870007369433e-05, "loss": 0.796, "step": 41970 }, { "epoch": 0.56, "learning_rate": 2.014770836340756e-05, "loss": 1.2952, "step": 41975 }, { "epoch": 0.56, "learning_rate": 2.014254693437791e-05, "loss": 1.0193, "step": 41980 }, { "epoch": 0.56, "learning_rate": 2.0137385720509136e-05, "loss": 0.5147, "step": 41985 }, { "epoch": 0.56, "learning_rate": 2.013222472202986e-05, "loss": 0.3408, "step": 41990 }, { "epoch": 0.56, "learning_rate": 2.0127063939168666e-05, "loss": 0.4988, "step": 41995 }, { "epoch": 0.56, "learning_rate": 2.0121903372154157e-05, "loss": 0.2387, "step": 42000 }, { "epoch": 0.56, "learning_rate": 2.011674302121493e-05, "loss": 0.8492, "step": 42005 }, { "epoch": 0.56, "learning_rate": 2.0111582886579557e-05, "loss": 0.4562, "step": 42010 }, { "epoch": 0.56, "learning_rate": 2.0106422968476606e-05, "loss": 0.5935, "step": 42015 }, { "epoch": 0.56, "learning_rate": 2.010126326713463e-05, "loss": 1.5233, "step": 42020 }, { "epoch": 0.56, "learning_rate": 2.00961037827822e-05, "loss": 1.205, "step": 42025 }, { "epoch": 0.56, "learning_rate": 2.0090944515647825e-05, "loss": 0.9908, "step": 42030 }, { "epoch": 0.56, "learning_rate": 2.0085785465960047e-05, "loss": 0.5191, "step": 42035 }, { "epoch": 0.56, "learning_rate": 2.0080626633947396e-05, "loss": 0.5635, "step": 42040 }, { "epoch": 0.56, "learning_rate": 2.0075468019838366e-05, "loss": 0.5635, "step": 42045 }, { "epoch": 0.56, "learning_rate": 2.007030962386147e-05, "loss": 0.8756, "step": 42050 }, { "epoch": 0.56, "learning_rate": 2.0065151446245205e-05, "loss": 0.8918, "step": 42055 }, { "epoch": 0.56, "learning_rate": 2.0059993487218032e-05, "loss": 0.9738, "step": 42060 }, { "epoch": 0.56, "learning_rate": 2.005483574700843e-05, "loss": 0.8109, "step": 42065 }, { "epoch": 0.56, "learning_rate": 2.0049678225844874e-05, "loss": 0.3782, "step": 42070 }, { "epoch": 0.56, "learning_rate": 2.00445209239558e-05, "loss": 1.105, "step": 42075 }, { "epoch": 0.56, "learning_rate": 2.0039363841569658e-05, "loss": 1.3889, "step": 42080 }, { "epoch": 0.56, "learning_rate": 2.0034206978914885e-05, "loss": 0.5874, "step": 42085 }, { "epoch": 0.56, "learning_rate": 2.0029050336219897e-05, "loss": 0.7151, "step": 42090 }, { "epoch": 0.56, "learning_rate": 2.0023893913713106e-05, "loss": 0.2781, "step": 42095 }, { "epoch": 0.56, "learning_rate": 2.0018737711622933e-05, "loss": 0.3583, "step": 42100 }, { "epoch": 0.56, "learning_rate": 2.0013581730177748e-05, "loss": 1.1257, "step": 42105 }, { "epoch": 0.56, "learning_rate": 2.0008425969605948e-05, "loss": 0.1746, "step": 42110 }, { "epoch": 0.56, "learning_rate": 2.00032704301359e-05, "loss": 0.8112, "step": 42115 }, { "epoch": 0.56, "learning_rate": 1.9998115111995986e-05, "loss": 0.5179, "step": 42120 }, { "epoch": 0.56, "learning_rate": 1.999296001541454e-05, "loss": 0.4897, "step": 42125 }, { "epoch": 0.56, "learning_rate": 1.9987805140619916e-05, "loss": 0.9143, "step": 42130 }, { "epoch": 0.56, "learning_rate": 1.998368140062418e-05, "loss": 1.2458, "step": 42135 }, { "epoch": 0.56, "learning_rate": 1.9978526925621233e-05, "loss": 0.2042, "step": 42140 }, { "epoch": 0.56, "learning_rate": 1.9973372673044426e-05, "loss": 0.6541, "step": 42145 }, { "epoch": 0.56, "learning_rate": 1.996821864312206e-05, "loss": 0.8426, "step": 42150 }, { "epoch": 0.56, "learning_rate": 1.9963064836082434e-05, "loss": 0.9652, "step": 42155 }, { "epoch": 0.56, "learning_rate": 1.995791125215384e-05, "loss": 0.754, "step": 42160 }, { "epoch": 0.56, "learning_rate": 1.9952757891564555e-05, "loss": 0.6881, "step": 42165 }, { "epoch": 0.57, "learning_rate": 1.994760475454284e-05, "loss": 0.2598, "step": 42170 }, { "epoch": 0.57, "learning_rate": 1.9942451841316956e-05, "loss": 0.9135, "step": 42175 }, { "epoch": 0.57, "learning_rate": 1.993729915211516e-05, "loss": 0.633, "step": 42180 }, { "epoch": 0.57, "learning_rate": 1.9932146687165678e-05, "loss": 0.4259, "step": 42185 }, { "epoch": 0.57, "learning_rate": 1.9926994446696744e-05, "loss": 0.5327, "step": 42190 }, { "epoch": 0.57, "learning_rate": 1.992184243093659e-05, "loss": 0.8701, "step": 42195 }, { "epoch": 0.57, "learning_rate": 1.9916690640113394e-05, "loss": 0.2545, "step": 42200 }, { "epoch": 0.57, "learning_rate": 1.9911539074455372e-05, "loss": 1.1036, "step": 42205 }, { "epoch": 0.57, "learning_rate": 1.9906387734190728e-05, "loss": 0.8405, "step": 42210 }, { "epoch": 0.57, "learning_rate": 1.990123661954761e-05, "loss": 0.8147, "step": 42215 }, { "epoch": 0.57, "learning_rate": 1.9896085730754205e-05, "loss": 0.828, "step": 42220 }, { "epoch": 0.57, "learning_rate": 1.9890935068038672e-05, "loss": 0.4256, "step": 42225 }, { "epoch": 0.57, "learning_rate": 1.988578463162915e-05, "loss": 1.1072, "step": 42230 }, { "epoch": 0.57, "learning_rate": 1.988063442175378e-05, "loss": 0.7577, "step": 42235 }, { "epoch": 0.57, "learning_rate": 1.9875484438640714e-05, "loss": 0.6028, "step": 42240 }, { "epoch": 0.57, "learning_rate": 1.987033468251803e-05, "loss": 0.3679, "step": 42245 }, { "epoch": 0.57, "learning_rate": 1.986518515361386e-05, "loss": 0.8676, "step": 42250 }, { "epoch": 0.57, "learning_rate": 1.9860035852156306e-05, "loss": 0.9695, "step": 42255 }, { "epoch": 0.57, "learning_rate": 1.985488677837344e-05, "loss": 0.4324, "step": 42260 }, { "epoch": 0.57, "learning_rate": 1.9849737932493352e-05, "loss": 0.3607, "step": 42265 }, { "epoch": 0.57, "learning_rate": 1.984458931474411e-05, "loss": 1.0818, "step": 42270 }, { "epoch": 0.57, "learning_rate": 1.983944092535378e-05, "loss": 0.6594, "step": 42275 }, { "epoch": 0.57, "learning_rate": 1.9834292764550385e-05, "loss": 0.4572, "step": 42280 }, { "epoch": 0.57, "learning_rate": 1.982914483256198e-05, "loss": 0.9322, "step": 42285 }, { "epoch": 0.57, "learning_rate": 1.9823997129616594e-05, "loss": 0.8311, "step": 42290 }, { "epoch": 0.57, "learning_rate": 1.9818849655942234e-05, "loss": 0.2301, "step": 42295 }, { "epoch": 0.57, "learning_rate": 1.9813702411766916e-05, "loss": 0.1551, "step": 42300 }, { "epoch": 0.57, "learning_rate": 1.9808555397318645e-05, "loss": 0.3169, "step": 42305 }, { "epoch": 0.57, "learning_rate": 1.9803408612825382e-05, "loss": 0.323, "step": 42310 }, { "epoch": 0.57, "learning_rate": 1.9798262058515126e-05, "loss": 0.6502, "step": 42315 }, { "epoch": 0.57, "learning_rate": 1.9793115734615845e-05, "loss": 0.327, "step": 42320 }, { "epoch": 0.57, "learning_rate": 1.978796964135548e-05, "loss": 1.2357, "step": 42325 }, { "epoch": 0.57, "learning_rate": 1.9782823778961984e-05, "loss": 0.8073, "step": 42330 }, { "epoch": 0.57, "learning_rate": 1.97776781476633e-05, "loss": 1.2687, "step": 42335 }, { "epoch": 0.57, "learning_rate": 1.977253274768734e-05, "loss": 0.7002, "step": 42340 }, { "epoch": 0.57, "learning_rate": 1.9767387579262032e-05, "loss": 0.4566, "step": 42345 }, { "epoch": 0.57, "learning_rate": 1.976224264261528e-05, "loss": 0.1409, "step": 42350 }, { "epoch": 0.57, "learning_rate": 1.9757097937974968e-05, "loss": 0.9291, "step": 42355 }, { "epoch": 0.57, "learning_rate": 1.975195346556899e-05, "loss": 0.4623, "step": 42360 }, { "epoch": 0.57, "learning_rate": 1.974680922562522e-05, "loss": 0.3265, "step": 42365 }, { "epoch": 0.57, "learning_rate": 1.974166521837152e-05, "loss": 0.4597, "step": 42370 }, { "epoch": 0.57, "learning_rate": 1.973652144403574e-05, "loss": 1.16, "step": 42375 }, { "epoch": 0.57, "learning_rate": 1.9731377902845726e-05, "loss": 1.0154, "step": 42380 }, { "epoch": 0.57, "learning_rate": 1.9726234595029326e-05, "loss": 0.3777, "step": 42385 }, { "epoch": 0.57, "learning_rate": 1.972109152081434e-05, "loss": 0.9565, "step": 42390 }, { "epoch": 0.57, "learning_rate": 1.971594868042859e-05, "loss": 0.4193, "step": 42395 }, { "epoch": 0.57, "learning_rate": 1.9710806074099883e-05, "loss": 0.9476, "step": 42400 }, { "epoch": 0.57, "learning_rate": 1.9705663702056e-05, "loss": 1.4016, "step": 42405 }, { "epoch": 0.57, "learning_rate": 1.9700521564524728e-05, "loss": 1.2425, "step": 42410 }, { "epoch": 0.57, "learning_rate": 1.969537966173385e-05, "loss": 0.3065, "step": 42415 }, { "epoch": 0.57, "learning_rate": 1.9690237993911097e-05, "loss": 0.4075, "step": 42420 }, { "epoch": 0.57, "learning_rate": 1.9685096561284243e-05, "loss": 0.7155, "step": 42425 }, { "epoch": 0.57, "learning_rate": 1.9679955364081034e-05, "loss": 0.6481, "step": 42430 }, { "epoch": 0.57, "learning_rate": 1.9674814402529177e-05, "loss": 0.8384, "step": 42435 }, { "epoch": 0.57, "learning_rate": 1.9669673676856397e-05, "loss": 0.4163, "step": 42440 }, { "epoch": 0.57, "learning_rate": 1.9664533187290414e-05, "loss": 0.4356, "step": 42445 }, { "epoch": 0.57, "learning_rate": 1.9659392934058913e-05, "loss": 0.8569, "step": 42450 }, { "epoch": 0.57, "learning_rate": 1.965425291738959e-05, "loss": 0.9721, "step": 42455 }, { "epoch": 0.57, "learning_rate": 1.964911313751012e-05, "loss": 0.7415, "step": 42460 }, { "epoch": 0.57, "learning_rate": 1.9643973594648164e-05, "loss": 1.1856, "step": 42465 }, { "epoch": 0.57, "learning_rate": 1.9638834289031384e-05, "loss": 1.2428, "step": 42470 }, { "epoch": 0.57, "learning_rate": 1.9633695220887427e-05, "loss": 0.6769, "step": 42475 }, { "epoch": 0.57, "learning_rate": 1.962855639044392e-05, "loss": 0.6119, "step": 42480 }, { "epoch": 0.57, "learning_rate": 1.9623417797928495e-05, "loss": 0.7216, "step": 42485 }, { "epoch": 0.57, "learning_rate": 1.961827944356876e-05, "loss": 0.4436, "step": 42490 }, { "epoch": 0.57, "learning_rate": 1.9613141327592333e-05, "loss": 0.7616, "step": 42495 }, { "epoch": 0.57, "learning_rate": 1.9608003450226788e-05, "loss": 0.712, "step": 42500 }, { "epoch": 0.57, "learning_rate": 1.960286581169971e-05, "loss": 0.6199, "step": 42505 }, { "epoch": 0.57, "learning_rate": 1.959772841223868e-05, "loss": 0.7767, "step": 42510 }, { "epoch": 0.57, "learning_rate": 1.9592591252071254e-05, "loss": 0.3662, "step": 42515 }, { "epoch": 0.57, "learning_rate": 1.958745433142498e-05, "loss": 0.5547, "step": 42520 }, { "epoch": 0.57, "learning_rate": 1.958231765052741e-05, "loss": 0.7677, "step": 42525 }, { "epoch": 0.57, "learning_rate": 1.9577181209606056e-05, "loss": 0.7169, "step": 42530 }, { "epoch": 0.57, "learning_rate": 1.9572045008888447e-05, "loss": 0.8935, "step": 42535 }, { "epoch": 0.57, "learning_rate": 1.9566909048602095e-05, "loss": 0.3169, "step": 42540 }, { "epoch": 0.57, "learning_rate": 1.9561773328974484e-05, "loss": 1.1459, "step": 42545 }, { "epoch": 0.57, "learning_rate": 1.955663785023311e-05, "loss": 0.3997, "step": 42550 }, { "epoch": 0.57, "learning_rate": 1.955150261260545e-05, "loss": 0.9728, "step": 42555 }, { "epoch": 0.57, "learning_rate": 1.954636761631896e-05, "loss": 1.1593, "step": 42560 }, { "epoch": 0.57, "learning_rate": 1.95412328616011e-05, "loss": 0.9947, "step": 42565 }, { "epoch": 0.57, "learning_rate": 1.9536098348679326e-05, "loss": 0.6916, "step": 42570 }, { "epoch": 0.57, "learning_rate": 1.953096407778105e-05, "loss": 1.3147, "step": 42575 }, { "epoch": 0.57, "learning_rate": 1.952583004913371e-05, "loss": 0.9854, "step": 42580 }, { "epoch": 0.57, "learning_rate": 1.952069626296471e-05, "loss": 0.5918, "step": 42585 }, { "epoch": 0.57, "learning_rate": 1.951556271950145e-05, "loss": 0.2657, "step": 42590 }, { "epoch": 0.57, "learning_rate": 1.9510429418971327e-05, "loss": 0.7593, "step": 42595 }, { "epoch": 0.57, "learning_rate": 1.9505296361601726e-05, "loss": 0.831, "step": 42600 }, { "epoch": 0.57, "learning_rate": 1.9500163547619996e-05, "loss": 0.8354, "step": 42605 }, { "epoch": 0.57, "learning_rate": 1.9495030977253507e-05, "loss": 0.4531, "step": 42610 }, { "epoch": 0.57, "learning_rate": 1.9489898650729605e-05, "loss": 0.3836, "step": 42615 }, { "epoch": 0.57, "learning_rate": 1.948476656827563e-05, "loss": 0.7506, "step": 42620 }, { "epoch": 0.57, "learning_rate": 1.9479634730118902e-05, "loss": 0.7825, "step": 42625 }, { "epoch": 0.57, "learning_rate": 1.947450313648673e-05, "loss": 0.3642, "step": 42630 }, { "epoch": 0.57, "learning_rate": 1.946937178760644e-05, "loss": 0.5985, "step": 42635 }, { "epoch": 0.57, "learning_rate": 1.9464240683705305e-05, "loss": 0.6654, "step": 42640 }, { "epoch": 0.57, "learning_rate": 1.9459109825010612e-05, "loss": 0.7389, "step": 42645 }, { "epoch": 0.57, "learning_rate": 1.9453979211749644e-05, "loss": 0.6666, "step": 42650 }, { "epoch": 0.57, "learning_rate": 1.9448848844149637e-05, "loss": 0.6905, "step": 42655 }, { "epoch": 0.57, "learning_rate": 1.944371872243786e-05, "loss": 0.5232, "step": 42660 }, { "epoch": 0.57, "learning_rate": 1.943858884684155e-05, "loss": 0.7411, "step": 42665 }, { "epoch": 0.57, "learning_rate": 1.9433459217587925e-05, "loss": 0.6514, "step": 42670 }, { "epoch": 0.57, "learning_rate": 1.942832983490421e-05, "loss": 0.5471, "step": 42675 }, { "epoch": 0.57, "learning_rate": 1.9423200699017613e-05, "loss": 0.7739, "step": 42680 }, { "epoch": 0.57, "learning_rate": 1.941807181015532e-05, "loss": 0.4314, "step": 42685 }, { "epoch": 0.57, "learning_rate": 1.941294316854452e-05, "loss": 0.7922, "step": 42690 }, { "epoch": 0.57, "learning_rate": 1.940781477441239e-05, "loss": 0.7144, "step": 42695 }, { "epoch": 0.57, "learning_rate": 1.9402686627986085e-05, "loss": 1.2372, "step": 42700 }, { "epoch": 0.57, "learning_rate": 1.9397558729492764e-05, "loss": 0.6975, "step": 42705 }, { "epoch": 0.57, "learning_rate": 1.9392431079159568e-05, "loss": 1.478, "step": 42710 }, { "epoch": 0.57, "learning_rate": 1.938730367721361e-05, "loss": 0.3673, "step": 42715 }, { "epoch": 0.57, "learning_rate": 1.9382176523882024e-05, "loss": 0.7066, "step": 42720 }, { "epoch": 0.57, "learning_rate": 1.9377049619391906e-05, "loss": 0.6858, "step": 42725 }, { "epoch": 0.57, "learning_rate": 1.9371922963970372e-05, "loss": 1.3327, "step": 42730 }, { "epoch": 0.57, "learning_rate": 1.936679655784449e-05, "loss": 0.7592, "step": 42735 }, { "epoch": 0.57, "learning_rate": 1.9361670401241333e-05, "loss": 0.395, "step": 42740 }, { "epoch": 0.57, "learning_rate": 1.9356544494387975e-05, "loss": 0.8423, "step": 42745 }, { "epoch": 0.57, "learning_rate": 1.9351418837511462e-05, "loss": 0.5941, "step": 42750 }, { "epoch": 0.57, "learning_rate": 1.9346293430838832e-05, "loss": 0.9128, "step": 42755 }, { "epoch": 0.57, "learning_rate": 1.934116827459713e-05, "loss": 1.2383, "step": 42760 }, { "epoch": 0.57, "learning_rate": 1.9336043369013353e-05, "loss": 0.6487, "step": 42765 }, { "epoch": 0.57, "learning_rate": 1.9330918714314517e-05, "loss": 0.4227, "step": 42770 }, { "epoch": 0.57, "learning_rate": 1.9325794310727627e-05, "loss": 1.3106, "step": 42775 }, { "epoch": 0.57, "learning_rate": 1.9320670158479655e-05, "loss": 1.0686, "step": 42780 }, { "epoch": 0.57, "learning_rate": 1.9315546257797585e-05, "loss": 0.5314, "step": 42785 }, { "epoch": 0.57, "learning_rate": 1.9310422608908385e-05, "loss": 0.6395, "step": 42790 }, { "epoch": 0.57, "learning_rate": 1.930529921203899e-05, "loss": 0.8662, "step": 42795 }, { "epoch": 0.57, "learning_rate": 1.930017606741635e-05, "loss": 0.7173, "step": 42800 }, { "epoch": 0.57, "learning_rate": 1.9295053175267403e-05, "loss": 0.2412, "step": 42805 }, { "epoch": 0.57, "learning_rate": 1.928993053581905e-05, "loss": 0.8588, "step": 42810 }, { "epoch": 0.57, "learning_rate": 1.928480814929821e-05, "loss": 0.3801, "step": 42815 }, { "epoch": 0.57, "learning_rate": 1.9279686015931785e-05, "loss": 0.7658, "step": 42820 }, { "epoch": 0.57, "learning_rate": 1.9274564135946645e-05, "loss": 1.1913, "step": 42825 }, { "epoch": 0.57, "learning_rate": 1.9269442509569668e-05, "loss": 1.0157, "step": 42830 }, { "epoch": 0.57, "learning_rate": 1.9264321137027713e-05, "loss": 0.1342, "step": 42835 }, { "epoch": 0.57, "learning_rate": 1.9259200018547653e-05, "loss": 0.3896, "step": 42840 }, { "epoch": 0.57, "learning_rate": 1.9254079154356303e-05, "loss": 0.547, "step": 42845 }, { "epoch": 0.57, "learning_rate": 1.9248958544680498e-05, "loss": 0.9132, "step": 42850 }, { "epoch": 0.57, "learning_rate": 1.9243838189747067e-05, "loss": 1.3503, "step": 42855 }, { "epoch": 0.57, "learning_rate": 1.9238718089782797e-05, "loss": 0.9886, "step": 42860 }, { "epoch": 0.57, "learning_rate": 1.9233598245014495e-05, "loss": 0.5455, "step": 42865 }, { "epoch": 0.57, "learning_rate": 1.9228478655668954e-05, "loss": 0.6527, "step": 42870 }, { "epoch": 0.57, "learning_rate": 1.922335932197292e-05, "loss": 1.1885, "step": 42875 }, { "epoch": 0.57, "learning_rate": 1.9218240244153172e-05, "loss": 0.9468, "step": 42880 }, { "epoch": 0.57, "learning_rate": 1.921312142243646e-05, "loss": 1.5771, "step": 42885 }, { "epoch": 0.57, "learning_rate": 1.9208002857049517e-05, "loss": 0.5854, "step": 42890 }, { "epoch": 0.57, "learning_rate": 1.9202884548219065e-05, "loss": 0.2832, "step": 42895 }, { "epoch": 0.57, "learning_rate": 1.919776649617184e-05, "loss": 0.8245, "step": 42900 }, { "epoch": 0.57, "learning_rate": 1.919264870113452e-05, "loss": 0.849, "step": 42905 }, { "epoch": 0.57, "learning_rate": 1.9187531163333807e-05, "loss": 0.2179, "step": 42910 }, { "epoch": 0.57, "learning_rate": 1.918241388299639e-05, "loss": 0.3679, "step": 42915 }, { "epoch": 0.58, "learning_rate": 1.917729686034893e-05, "loss": 0.9278, "step": 42920 }, { "epoch": 0.58, "learning_rate": 1.917218009561809e-05, "loss": 0.4782, "step": 42925 }, { "epoch": 0.58, "learning_rate": 1.9167063589030527e-05, "loss": 0.5919, "step": 42930 }, { "epoch": 0.58, "learning_rate": 1.9161947340812853e-05, "loss": 0.7564, "step": 42935 }, { "epoch": 0.58, "learning_rate": 1.9156831351191702e-05, "loss": 1.1448, "step": 42940 }, { "epoch": 0.58, "learning_rate": 1.915171562039369e-05, "loss": 0.4893, "step": 42945 }, { "epoch": 0.58, "learning_rate": 1.9146600148645433e-05, "loss": 1.1701, "step": 42950 }, { "epoch": 0.58, "learning_rate": 1.9141484936173494e-05, "loss": 0.6868, "step": 42955 }, { "epoch": 0.58, "learning_rate": 1.9136369983204465e-05, "loss": 1.0021, "step": 42960 }, { "epoch": 0.58, "learning_rate": 1.9131255289964912e-05, "loss": 1.3454, "step": 42965 }, { "epoch": 0.58, "learning_rate": 1.9126140856681387e-05, "loss": 0.6926, "step": 42970 }, { "epoch": 0.58, "learning_rate": 1.9121026683580433e-05, "loss": 0.3744, "step": 42975 }, { "epoch": 0.58, "learning_rate": 1.91159127708886e-05, "loss": 0.9414, "step": 42980 }, { "epoch": 0.58, "learning_rate": 1.911079911883238e-05, "loss": 0.7973, "step": 42985 }, { "epoch": 0.58, "learning_rate": 1.91056857276383e-05, "loss": 0.3251, "step": 42990 }, { "epoch": 0.58, "learning_rate": 1.9100572597532855e-05, "loss": 1.2887, "step": 42995 }, { "epoch": 0.58, "learning_rate": 1.9095459728742528e-05, "loss": 0.9133, "step": 43000 }, { "epoch": 0.58, "learning_rate": 1.9090347121493796e-05, "loss": 0.6324, "step": 43005 }, { "epoch": 0.58, "learning_rate": 1.9085234776013132e-05, "loss": 0.287, "step": 43010 }, { "epoch": 0.58, "learning_rate": 1.9080122692526962e-05, "loss": 0.3675, "step": 43015 }, { "epoch": 0.58, "learning_rate": 1.9075010871261746e-05, "loss": 0.9715, "step": 43020 }, { "epoch": 0.58, "learning_rate": 1.906989931244391e-05, "loss": 0.5881, "step": 43025 }, { "epoch": 0.58, "learning_rate": 1.906478801629986e-05, "loss": 0.4232, "step": 43030 }, { "epoch": 0.58, "learning_rate": 1.9059676983056007e-05, "loss": 0.4807, "step": 43035 }, { "epoch": 0.58, "learning_rate": 1.905456621293876e-05, "loss": 0.5066, "step": 43040 }, { "epoch": 0.58, "learning_rate": 1.904945570617447e-05, "loss": 0.4675, "step": 43045 }, { "epoch": 0.58, "learning_rate": 1.904434546298952e-05, "loss": 1.0042, "step": 43050 }, { "epoch": 0.58, "learning_rate": 1.9039235483610278e-05, "loss": 0.5142, "step": 43055 }, { "epoch": 0.58, "learning_rate": 1.903412576826309e-05, "loss": 0.8586, "step": 43060 }, { "epoch": 0.58, "learning_rate": 1.902901631717428e-05, "loss": 0.726, "step": 43065 }, { "epoch": 0.58, "learning_rate": 1.9023907130570168e-05, "loss": 0.8667, "step": 43070 }, { "epoch": 0.58, "learning_rate": 1.901879820867708e-05, "loss": 1.2617, "step": 43075 }, { "epoch": 0.58, "learning_rate": 1.9013689551721307e-05, "loss": 0.4996, "step": 43080 }, { "epoch": 0.58, "learning_rate": 1.9008581159929135e-05, "loss": 1.1145, "step": 43085 }, { "epoch": 0.58, "learning_rate": 1.9003473033526853e-05, "loss": 0.5794, "step": 43090 }, { "epoch": 0.58, "learning_rate": 1.8998365172740706e-05, "loss": 1.0668, "step": 43095 }, { "epoch": 0.58, "learning_rate": 1.8993257577796958e-05, "loss": 0.8856, "step": 43100 }, { "epoch": 0.58, "learning_rate": 1.898815024892185e-05, "loss": 0.3413, "step": 43105 }, { "epoch": 0.58, "learning_rate": 1.898304318634161e-05, "loss": 0.9632, "step": 43110 }, { "epoch": 0.58, "learning_rate": 1.8977936390282453e-05, "loss": 1.0954, "step": 43115 }, { "epoch": 0.58, "learning_rate": 1.8972829860970595e-05, "loss": 0.2639, "step": 43120 }, { "epoch": 0.58, "learning_rate": 1.8967723598632212e-05, "loss": 0.732, "step": 43125 }, { "epoch": 0.58, "learning_rate": 1.8962617603493496e-05, "loss": 0.2114, "step": 43130 }, { "epoch": 0.58, "learning_rate": 1.895751187578062e-05, "loss": 0.9393, "step": 43135 }, { "epoch": 0.58, "learning_rate": 1.8952406415719733e-05, "loss": 0.7097, "step": 43140 }, { "epoch": 0.58, "learning_rate": 1.8947301223536986e-05, "loss": 0.553, "step": 43145 }, { "epoch": 0.58, "learning_rate": 1.8942196299458526e-05, "loss": 1.2424, "step": 43150 }, { "epoch": 0.58, "learning_rate": 1.8937091643710448e-05, "loss": 0.8592, "step": 43155 }, { "epoch": 0.58, "learning_rate": 1.8931987256518885e-05, "loss": 1.1918, "step": 43160 }, { "epoch": 0.58, "learning_rate": 1.8926883138109925e-05, "loss": 0.4271, "step": 43165 }, { "epoch": 0.58, "learning_rate": 1.8921779288709674e-05, "loss": 0.641, "step": 43170 }, { "epoch": 0.58, "learning_rate": 1.8916675708544178e-05, "loss": 0.7363, "step": 43175 }, { "epoch": 0.58, "learning_rate": 1.8911572397839517e-05, "loss": 0.6353, "step": 43180 }, { "epoch": 0.58, "learning_rate": 1.8906469356821744e-05, "loss": 0.6732, "step": 43185 }, { "epoch": 0.58, "learning_rate": 1.8901366585716888e-05, "loss": 0.5255, "step": 43190 }, { "epoch": 0.58, "learning_rate": 1.889626408475098e-05, "loss": 0.7116, "step": 43195 }, { "epoch": 0.58, "learning_rate": 1.889116185415005e-05, "loss": 0.6298, "step": 43200 }, { "epoch": 0.58, "learning_rate": 1.8886059894140075e-05, "loss": 0.6939, "step": 43205 }, { "epoch": 0.58, "learning_rate": 1.8880958204947065e-05, "loss": 0.6104, "step": 43210 }, { "epoch": 0.58, "learning_rate": 1.8875856786796995e-05, "loss": 0.6311, "step": 43215 }, { "epoch": 0.58, "learning_rate": 1.8870755639915823e-05, "loss": 0.9268, "step": 43220 }, { "epoch": 0.58, "learning_rate": 1.8865654764529518e-05, "loss": 1.1008, "step": 43225 }, { "epoch": 0.58, "learning_rate": 1.8860554160864026e-05, "loss": 1.1774, "step": 43230 }, { "epoch": 0.58, "learning_rate": 1.885545382914526e-05, "loss": 0.5709, "step": 43235 }, { "epoch": 0.58, "learning_rate": 1.885035376959915e-05, "loss": 0.8292, "step": 43240 }, { "epoch": 0.58, "learning_rate": 1.8845253982451607e-05, "loss": 0.7463, "step": 43245 }, { "epoch": 0.58, "learning_rate": 1.8840154467928516e-05, "loss": 0.8867, "step": 43250 }, { "epoch": 0.58, "learning_rate": 1.8835055226255764e-05, "loss": 0.8874, "step": 43255 }, { "epoch": 0.58, "learning_rate": 1.8829956257659234e-05, "loss": 1.3751, "step": 43260 }, { "epoch": 0.58, "learning_rate": 1.882485756236476e-05, "loss": 0.4818, "step": 43265 }, { "epoch": 0.58, "learning_rate": 1.8819759140598206e-05, "loss": 1.2999, "step": 43270 }, { "epoch": 0.58, "learning_rate": 1.8814660992585414e-05, "loss": 0.4078, "step": 43275 }, { "epoch": 0.58, "learning_rate": 1.8809563118552187e-05, "loss": 1.1057, "step": 43280 }, { "epoch": 0.58, "learning_rate": 1.8804465518724343e-05, "loss": 0.5355, "step": 43285 }, { "epoch": 0.58, "learning_rate": 1.879936819332768e-05, "loss": 0.8123, "step": 43290 }, { "epoch": 0.58, "learning_rate": 1.8794271142587993e-05, "loss": 1.3911, "step": 43295 }, { "epoch": 0.58, "learning_rate": 1.878917436673104e-05, "loss": 0.3603, "step": 43300 }, { "epoch": 0.58, "learning_rate": 1.8784077865982595e-05, "loss": 0.9872, "step": 43305 }, { "epoch": 0.58, "learning_rate": 1.877898164056841e-05, "loss": 1.4411, "step": 43310 }, { "epoch": 0.58, "learning_rate": 1.877388569071421e-05, "loss": 0.7015, "step": 43315 }, { "epoch": 0.58, "learning_rate": 1.8768790016645717e-05, "loss": 0.2298, "step": 43320 }, { "epoch": 0.58, "learning_rate": 1.8763694618588664e-05, "loss": 0.324, "step": 43325 }, { "epoch": 0.58, "learning_rate": 1.8758599496768734e-05, "loss": 1.0715, "step": 43330 }, { "epoch": 0.58, "learning_rate": 1.875350465141162e-05, "loss": 0.9398, "step": 43335 }, { "epoch": 0.58, "learning_rate": 1.8748410082743012e-05, "loss": 0.8108, "step": 43340 }, { "epoch": 0.58, "learning_rate": 1.874331579098855e-05, "loss": 1.0377, "step": 43345 }, { "epoch": 0.58, "learning_rate": 1.87382217763739e-05, "loss": 0.3892, "step": 43350 }, { "epoch": 0.58, "learning_rate": 1.8733128039124698e-05, "loss": 0.5432, "step": 43355 }, { "epoch": 0.58, "learning_rate": 1.8728034579466573e-05, "loss": 0.3732, "step": 43360 }, { "epoch": 0.58, "learning_rate": 1.872294139762513e-05, "loss": 0.9436, "step": 43365 }, { "epoch": 0.58, "learning_rate": 1.8717848493825995e-05, "loss": 0.269, "step": 43370 }, { "epoch": 0.58, "learning_rate": 1.8712755868294733e-05, "loss": 0.8906, "step": 43375 }, { "epoch": 0.58, "learning_rate": 1.8707663521256933e-05, "loss": 0.4282, "step": 43380 }, { "epoch": 0.58, "learning_rate": 1.8702571452938167e-05, "loss": 0.655, "step": 43385 }, { "epoch": 0.58, "learning_rate": 1.8697479663563975e-05, "loss": 0.6002, "step": 43390 }, { "epoch": 0.58, "learning_rate": 1.86923881533599e-05, "loss": 0.9991, "step": 43395 }, { "epoch": 0.58, "learning_rate": 1.8687296922551473e-05, "loss": 0.3356, "step": 43400 }, { "epoch": 0.58, "learning_rate": 1.868220597136422e-05, "loss": 0.3135, "step": 43405 }, { "epoch": 0.58, "learning_rate": 1.867711530002363e-05, "loss": 0.6371, "step": 43410 }, { "epoch": 0.58, "learning_rate": 1.8672024908755194e-05, "loss": 0.3988, "step": 43415 }, { "epoch": 0.58, "learning_rate": 1.8666934797784414e-05, "loss": 1.3217, "step": 43420 }, { "epoch": 0.58, "learning_rate": 1.8661844967336723e-05, "loss": 0.6321, "step": 43425 }, { "epoch": 0.58, "learning_rate": 1.8656755417637595e-05, "loss": 1.022, "step": 43430 }, { "epoch": 0.58, "learning_rate": 1.865166614891247e-05, "loss": 1.2992, "step": 43435 }, { "epoch": 0.58, "learning_rate": 1.8646577161386776e-05, "loss": 0.7483, "step": 43440 }, { "epoch": 0.58, "learning_rate": 1.8641488455285923e-05, "loss": 1.0853, "step": 43445 }, { "epoch": 0.58, "learning_rate": 1.863640003083533e-05, "loss": 0.5315, "step": 43450 }, { "epoch": 0.58, "learning_rate": 1.863131188826037e-05, "loss": 0.5694, "step": 43455 }, { "epoch": 0.58, "learning_rate": 1.8626224027786435e-05, "loss": 0.1459, "step": 43460 }, { "epoch": 0.58, "learning_rate": 1.8621136449638894e-05, "loss": 1.9908, "step": 43465 }, { "epoch": 0.58, "learning_rate": 1.8616049154043086e-05, "loss": 0.7068, "step": 43470 }, { "epoch": 0.58, "learning_rate": 1.8610962141224365e-05, "loss": 0.6381, "step": 43475 }, { "epoch": 0.58, "learning_rate": 1.8605875411408062e-05, "loss": 0.6843, "step": 43480 }, { "epoch": 0.58, "learning_rate": 1.860078896481949e-05, "loss": 0.6854, "step": 43485 }, { "epoch": 0.58, "learning_rate": 1.8595702801683946e-05, "loss": 0.5815, "step": 43490 }, { "epoch": 0.58, "learning_rate": 1.859061692222674e-05, "loss": 0.5702, "step": 43495 }, { "epoch": 0.58, "learning_rate": 1.8585531326673128e-05, "loss": 1.0652, "step": 43500 }, { "epoch": 0.58, "learning_rate": 1.858044601524839e-05, "loss": 0.5811, "step": 43505 }, { "epoch": 0.58, "learning_rate": 1.8575360988177777e-05, "loss": 0.2242, "step": 43510 }, { "epoch": 0.58, "learning_rate": 1.8570276245686536e-05, "loss": 0.4997, "step": 43515 }, { "epoch": 0.58, "learning_rate": 1.8565191787999886e-05, "loss": 0.7108, "step": 43520 }, { "epoch": 0.58, "learning_rate": 1.8560107615343044e-05, "loss": 0.691, "step": 43525 }, { "epoch": 0.58, "learning_rate": 1.855502372794123e-05, "loss": 0.3363, "step": 43530 }, { "epoch": 0.58, "learning_rate": 1.854994012601961e-05, "loss": 0.9711, "step": 43535 }, { "epoch": 0.58, "learning_rate": 1.8544856809803375e-05, "loss": 0.1969, "step": 43540 }, { "epoch": 0.58, "learning_rate": 1.8539773779517694e-05, "loss": 0.8801, "step": 43545 }, { "epoch": 0.58, "learning_rate": 1.853469103538771e-05, "loss": 0.8297, "step": 43550 }, { "epoch": 0.58, "learning_rate": 1.852960857763857e-05, "loss": 0.7876, "step": 43555 }, { "epoch": 0.58, "learning_rate": 1.8524526406495407e-05, "loss": 0.7221, "step": 43560 }, { "epoch": 0.58, "learning_rate": 1.8519444522183318e-05, "loss": 0.3463, "step": 43565 }, { "epoch": 0.58, "learning_rate": 1.851436292492741e-05, "loss": 0.486, "step": 43570 }, { "epoch": 0.58, "learning_rate": 1.8509281614952798e-05, "loss": 1.1416, "step": 43575 }, { "epoch": 0.58, "learning_rate": 1.8504200592484522e-05, "loss": 0.5264, "step": 43580 }, { "epoch": 0.58, "learning_rate": 1.8499119857747666e-05, "loss": 0.9282, "step": 43585 }, { "epoch": 0.58, "learning_rate": 1.8494039410967284e-05, "loss": 0.7796, "step": 43590 }, { "epoch": 0.58, "learning_rate": 1.8488959252368398e-05, "loss": 0.6156, "step": 43595 }, { "epoch": 0.58, "learning_rate": 1.848387938217605e-05, "loss": 0.9528, "step": 43600 }, { "epoch": 0.58, "learning_rate": 1.8478799800615248e-05, "loss": 0.7114, "step": 43605 }, { "epoch": 0.58, "learning_rate": 1.8473720507910985e-05, "loss": 0.658, "step": 43610 }, { "epoch": 0.58, "learning_rate": 1.8468641504288255e-05, "loss": 0.0592, "step": 43615 }, { "epoch": 0.58, "learning_rate": 1.8463562789972027e-05, "loss": 0.6681, "step": 43620 }, { "epoch": 0.58, "learning_rate": 1.8458484365187273e-05, "loss": 0.3929, "step": 43625 }, { "epoch": 0.58, "learning_rate": 1.845340623015893e-05, "loss": 0.2693, "step": 43630 }, { "epoch": 0.58, "learning_rate": 1.844832838511194e-05, "loss": 0.6318, "step": 43635 }, { "epoch": 0.58, "learning_rate": 1.844325083027124e-05, "loss": 0.9516, "step": 43640 }, { "epoch": 0.58, "learning_rate": 1.843817356586171e-05, "loss": 0.2795, "step": 43645 }, { "epoch": 0.58, "learning_rate": 1.8433096592108265e-05, "loss": 0.3941, "step": 43650 }, { "epoch": 0.58, "learning_rate": 1.8428019909235793e-05, "loss": 0.4798, "step": 43655 }, { "epoch": 0.58, "learning_rate": 1.8422943517469155e-05, "loss": 0.4295, "step": 43660 }, { "epoch": 0.59, "learning_rate": 1.8417867417033217e-05, "loss": 0.4864, "step": 43665 }, { "epoch": 0.59, "learning_rate": 1.841279160815283e-05, "loss": 0.5201, "step": 43670 }, { "epoch": 0.59, "learning_rate": 1.8407716091052813e-05, "loss": 0.608, "step": 43675 }, { "epoch": 0.59, "learning_rate": 1.8402640865957986e-05, "loss": 0.6668, "step": 43680 }, { "epoch": 0.59, "learning_rate": 1.839756593309318e-05, "loss": 1.2803, "step": 43685 }, { "epoch": 0.59, "learning_rate": 1.839249129268316e-05, "loss": 0.4004, "step": 43690 }, { "epoch": 0.59, "learning_rate": 1.8387416944952717e-05, "loss": 0.2634, "step": 43695 }, { "epoch": 0.59, "learning_rate": 1.8382342890126633e-05, "loss": 0.9016, "step": 43700 }, { "epoch": 0.59, "learning_rate": 1.8377269128429642e-05, "loss": 1.1477, "step": 43705 }, { "epoch": 0.59, "learning_rate": 1.83721956600865e-05, "loss": 0.9494, "step": 43710 }, { "epoch": 0.59, "learning_rate": 1.8367122485321943e-05, "loss": 0.7766, "step": 43715 }, { "epoch": 0.59, "learning_rate": 1.836204960436066e-05, "loss": 0.2016, "step": 43720 }, { "epoch": 0.59, "learning_rate": 1.8356977017427375e-05, "loss": 0.5537, "step": 43725 }, { "epoch": 0.59, "learning_rate": 1.8351904724746774e-05, "loss": 0.8953, "step": 43730 }, { "epoch": 0.59, "learning_rate": 1.834683272654354e-05, "loss": 1.3381, "step": 43735 }, { "epoch": 0.59, "learning_rate": 1.8341761023042326e-05, "loss": 0.6474, "step": 43740 }, { "epoch": 0.59, "learning_rate": 1.833668961446779e-05, "loss": 0.8156, "step": 43745 }, { "epoch": 0.59, "learning_rate": 1.8331618501044574e-05, "loss": 0.6178, "step": 43750 }, { "epoch": 0.59, "learning_rate": 1.8326547682997292e-05, "loss": 0.6412, "step": 43755 }, { "epoch": 0.59, "learning_rate": 1.832147716055056e-05, "loss": 0.7278, "step": 43760 }, { "epoch": 0.59, "learning_rate": 1.8316406933928983e-05, "loss": 0.3338, "step": 43765 }, { "epoch": 0.59, "learning_rate": 1.8311337003357137e-05, "loss": 0.5929, "step": 43770 }, { "epoch": 0.59, "learning_rate": 1.8306267369059598e-05, "loss": 0.6252, "step": 43775 }, { "epoch": 0.59, "learning_rate": 1.830119803126094e-05, "loss": 1.0059, "step": 43780 }, { "epoch": 0.59, "learning_rate": 1.8296128990185685e-05, "loss": 1.005, "step": 43785 }, { "epoch": 0.59, "learning_rate": 1.829106024605837e-05, "loss": 0.7821, "step": 43790 }, { "epoch": 0.59, "learning_rate": 1.828599179910354e-05, "loss": 0.5734, "step": 43795 }, { "epoch": 0.59, "learning_rate": 1.8280923649545673e-05, "loss": 0.5454, "step": 43800 }, { "epoch": 0.59, "learning_rate": 1.8275855797609272e-05, "loss": 0.9195, "step": 43805 }, { "epoch": 0.59, "learning_rate": 1.8270788243518827e-05, "loss": 1.0677, "step": 43810 }, { "epoch": 0.59, "learning_rate": 1.826572098749879e-05, "loss": 1.0714, "step": 43815 }, { "epoch": 0.59, "learning_rate": 1.826065402977363e-05, "loss": 1.1075, "step": 43820 }, { "epoch": 0.59, "learning_rate": 1.8255587370567783e-05, "loss": 1.0275, "step": 43825 }, { "epoch": 0.59, "learning_rate": 1.8250521010105664e-05, "loss": 0.7148, "step": 43830 }, { "epoch": 0.59, "learning_rate": 1.82454549486117e-05, "loss": 1.1187, "step": 43835 }, { "epoch": 0.59, "learning_rate": 1.8240389186310296e-05, "loss": 0.4981, "step": 43840 }, { "epoch": 0.59, "learning_rate": 1.823532372342583e-05, "loss": 0.4456, "step": 43845 }, { "epoch": 0.59, "learning_rate": 1.8230258560182677e-05, "loss": 0.4691, "step": 43850 }, { "epoch": 0.59, "learning_rate": 1.8225193696805204e-05, "loss": 0.6886, "step": 43855 }, { "epoch": 0.59, "learning_rate": 1.8220129133517767e-05, "loss": 1.1647, "step": 43860 }, { "epoch": 0.59, "learning_rate": 1.821506487054468e-05, "loss": 0.702, "step": 43865 }, { "epoch": 0.59, "learning_rate": 1.8210000908110274e-05, "loss": 0.8141, "step": 43870 }, { "epoch": 0.59, "learning_rate": 1.8204937246438863e-05, "loss": 0.451, "step": 43875 }, { "epoch": 0.59, "learning_rate": 1.8199873885754738e-05, "loss": 0.7606, "step": 43880 }, { "epoch": 0.59, "learning_rate": 1.8194810826282173e-05, "loss": 0.3312, "step": 43885 }, { "epoch": 0.59, "learning_rate": 1.8189748068245456e-05, "loss": 1.0973, "step": 43890 }, { "epoch": 0.59, "learning_rate": 1.8184685611868813e-05, "loss": 0.3396, "step": 43895 }, { "epoch": 0.59, "learning_rate": 1.817962345737651e-05, "loss": 0.9069, "step": 43900 }, { "epoch": 0.59, "learning_rate": 1.8174561604992775e-05, "loss": 0.8457, "step": 43905 }, { "epoch": 0.59, "learning_rate": 1.8169500054941802e-05, "loss": 0.5096, "step": 43910 }, { "epoch": 0.59, "learning_rate": 1.8164438807447803e-05, "loss": 0.5826, "step": 43915 }, { "epoch": 0.59, "learning_rate": 1.8159377862734978e-05, "loss": 1.0711, "step": 43920 }, { "epoch": 0.59, "learning_rate": 1.8154317221027484e-05, "loss": 0.9031, "step": 43925 }, { "epoch": 0.59, "learning_rate": 1.8149256882549488e-05, "loss": 0.3288, "step": 43930 }, { "epoch": 0.59, "learning_rate": 1.814419684752515e-05, "loss": 0.425, "step": 43935 }, { "epoch": 0.59, "learning_rate": 1.8139137116178583e-05, "loss": 1.1297, "step": 43940 }, { "epoch": 0.59, "learning_rate": 1.8134077688733918e-05, "loss": 0.8761, "step": 43945 }, { "epoch": 0.59, "learning_rate": 1.8129018565415266e-05, "loss": 0.5342, "step": 43950 }, { "epoch": 0.59, "learning_rate": 1.812395974644671e-05, "loss": 0.5372, "step": 43955 }, { "epoch": 0.59, "learning_rate": 1.8118901232052343e-05, "loss": 0.7606, "step": 43960 }, { "epoch": 0.59, "learning_rate": 1.8113843022456223e-05, "loss": 0.3228, "step": 43965 }, { "epoch": 0.59, "learning_rate": 1.810878511788242e-05, "loss": 0.2399, "step": 43970 }, { "epoch": 0.59, "learning_rate": 1.8103727518554947e-05, "loss": 0.4177, "step": 43975 }, { "epoch": 0.59, "learning_rate": 1.8098670224697845e-05, "loss": 0.7766, "step": 43980 }, { "epoch": 0.59, "learning_rate": 1.8093613236535134e-05, "loss": 0.2748, "step": 43985 }, { "epoch": 0.59, "learning_rate": 1.8088556554290796e-05, "loss": 0.3846, "step": 43990 }, { "epoch": 0.59, "learning_rate": 1.8083500178188828e-05, "loss": 1.2404, "step": 43995 }, { "epoch": 0.59, "learning_rate": 1.8078444108453207e-05, "loss": 0.6567, "step": 44000 }, { "epoch": 0.59, "learning_rate": 1.8073388345307874e-05, "loss": 0.6983, "step": 44005 }, { "epoch": 0.59, "learning_rate": 1.8068332888976784e-05, "loss": 0.545, "step": 44010 }, { "epoch": 0.59, "learning_rate": 1.8063277739683882e-05, "loss": 0.7991, "step": 44015 }, { "epoch": 0.59, "learning_rate": 1.8058222897653065e-05, "loss": 1.6173, "step": 44020 }, { "epoch": 0.59, "learning_rate": 1.8053168363108243e-05, "loss": 0.556, "step": 44025 }, { "epoch": 0.59, "learning_rate": 1.8048114136273313e-05, "loss": 0.6125, "step": 44030 }, { "epoch": 0.59, "learning_rate": 1.804306021737214e-05, "loss": 0.9125, "step": 44035 }, { "epoch": 0.59, "learning_rate": 1.80380066066286e-05, "loss": 0.7535, "step": 44040 }, { "epoch": 0.59, "learning_rate": 1.8032953304266543e-05, "loss": 0.5101, "step": 44045 }, { "epoch": 0.59, "learning_rate": 1.8027900310509794e-05, "loss": 0.6679, "step": 44050 }, { "epoch": 0.59, "learning_rate": 1.802284762558218e-05, "loss": 0.8695, "step": 44055 }, { "epoch": 0.59, "learning_rate": 1.8017795249707514e-05, "loss": 0.4455, "step": 44060 }, { "epoch": 0.59, "learning_rate": 1.8012743183109582e-05, "loss": 0.6879, "step": 44065 }, { "epoch": 0.59, "learning_rate": 1.8007691426012174e-05, "loss": 0.8892, "step": 44070 }, { "epoch": 0.59, "learning_rate": 1.800263997863905e-05, "loss": 0.9839, "step": 44075 }, { "epoch": 0.59, "learning_rate": 1.799758884121398e-05, "loss": 1.4091, "step": 44080 }, { "epoch": 0.59, "learning_rate": 1.7992538013960687e-05, "loss": 0.861, "step": 44085 }, { "epoch": 0.59, "learning_rate": 1.7987487497102896e-05, "loss": 0.7882, "step": 44090 }, { "epoch": 0.59, "learning_rate": 1.7982437290864335e-05, "loss": 1.4284, "step": 44095 }, { "epoch": 0.59, "learning_rate": 1.7977387395468688e-05, "loss": 1.1169, "step": 44100 }, { "epoch": 0.59, "learning_rate": 1.7972337811139643e-05, "loss": 0.5629, "step": 44105 }, { "epoch": 0.59, "learning_rate": 1.7967288538100885e-05, "loss": 0.5807, "step": 44110 }, { "epoch": 0.59, "learning_rate": 1.7962239576576058e-05, "loss": 0.6784, "step": 44115 }, { "epoch": 0.59, "learning_rate": 1.79571909267888e-05, "loss": 0.7314, "step": 44120 }, { "epoch": 0.59, "learning_rate": 1.795214258896277e-05, "loss": 0.4734, "step": 44125 }, { "epoch": 0.59, "learning_rate": 1.794709456332155e-05, "loss": 0.5542, "step": 44130 }, { "epoch": 0.59, "learning_rate": 1.7942046850088755e-05, "loss": 0.5847, "step": 44135 }, { "epoch": 0.59, "learning_rate": 1.793699944948798e-05, "loss": 0.7762, "step": 44140 }, { "epoch": 0.59, "learning_rate": 1.7931952361742787e-05, "loss": 0.6671, "step": 44145 }, { "epoch": 0.59, "learning_rate": 1.7926905587076747e-05, "loss": 1.0792, "step": 44150 }, { "epoch": 0.59, "learning_rate": 1.7922868392911137e-05, "loss": 0.735, "step": 44155 }, { "epoch": 0.59, "learning_rate": 1.7917822182350896e-05, "loss": 0.9811, "step": 44160 }, { "epoch": 0.59, "learning_rate": 1.7912776285495704e-05, "loss": 0.771, "step": 44165 }, { "epoch": 0.59, "learning_rate": 1.7907730702569066e-05, "loss": 1.0038, "step": 44170 }, { "epoch": 0.59, "learning_rate": 1.7902685433794473e-05, "loss": 0.7205, "step": 44175 }, { "epoch": 0.59, "learning_rate": 1.789764047939541e-05, "loss": 0.089, "step": 44180 }, { "epoch": 0.59, "learning_rate": 1.789259583959535e-05, "loss": 0.7567, "step": 44185 }, { "epoch": 0.59, "learning_rate": 1.7887551514617727e-05, "loss": 1.0158, "step": 44190 }, { "epoch": 0.59, "learning_rate": 1.788250750468599e-05, "loss": 0.4361, "step": 44195 }, { "epoch": 0.59, "learning_rate": 1.787746381002357e-05, "loss": 0.6987, "step": 44200 }, { "epoch": 0.59, "learning_rate": 1.7872420430853866e-05, "loss": 1.2491, "step": 44205 }, { "epoch": 0.59, "learning_rate": 1.7867377367400275e-05, "loss": 0.3625, "step": 44210 }, { "epoch": 0.59, "learning_rate": 1.786233461988619e-05, "loss": 0.3718, "step": 44215 }, { "epoch": 0.59, "learning_rate": 1.785729218853497e-05, "loss": 0.6124, "step": 44220 }, { "epoch": 0.59, "learning_rate": 1.785225007356997e-05, "loss": 0.9636, "step": 44225 }, { "epoch": 0.59, "learning_rate": 1.7847208275214526e-05, "loss": 0.9609, "step": 44230 }, { "epoch": 0.59, "learning_rate": 1.784216679369199e-05, "loss": 1.129, "step": 44235 }, { "epoch": 0.59, "learning_rate": 1.783712562922564e-05, "loss": 0.2644, "step": 44240 }, { "epoch": 0.59, "learning_rate": 1.7832084782038792e-05, "loss": 0.9719, "step": 44245 }, { "epoch": 0.59, "learning_rate": 1.7827044252354735e-05, "loss": 0.5398, "step": 44250 }, { "epoch": 0.59, "learning_rate": 1.7822004040396727e-05, "loss": 0.9433, "step": 44255 }, { "epoch": 0.59, "learning_rate": 1.7816964146388026e-05, "loss": 0.6902, "step": 44260 }, { "epoch": 0.59, "learning_rate": 1.781192457055189e-05, "loss": 0.9005, "step": 44265 }, { "epoch": 0.59, "learning_rate": 1.7806885313111526e-05, "loss": 0.3675, "step": 44270 }, { "epoch": 0.59, "learning_rate": 1.780184637429016e-05, "loss": 0.7356, "step": 44275 }, { "epoch": 0.59, "learning_rate": 1.7796807754310986e-05, "loss": 0.4627, "step": 44280 }, { "epoch": 0.59, "learning_rate": 1.779176945339719e-05, "loss": 0.6707, "step": 44285 }, { "epoch": 0.59, "learning_rate": 1.7786731471771946e-05, "loss": 0.5607, "step": 44290 }, { "epoch": 0.59, "learning_rate": 1.7781693809658422e-05, "loss": 0.5438, "step": 44295 }, { "epoch": 0.59, "learning_rate": 1.777665646727974e-05, "loss": 0.6175, "step": 44300 }, { "epoch": 0.59, "learning_rate": 1.777161944485904e-05, "loss": 0.4099, "step": 44305 }, { "epoch": 0.59, "learning_rate": 1.7766582742619437e-05, "loss": 0.2818, "step": 44310 }, { "epoch": 0.59, "learning_rate": 1.776154636078403e-05, "loss": 0.7422, "step": 44315 }, { "epoch": 0.59, "learning_rate": 1.7756510299575905e-05, "loss": 1.0216, "step": 44320 }, { "epoch": 0.59, "learning_rate": 1.7751474559218145e-05, "loss": 0.6791, "step": 44325 }, { "epoch": 0.59, "learning_rate": 1.774643913993379e-05, "loss": 0.259, "step": 44330 }, { "epoch": 0.59, "learning_rate": 1.7741404041945885e-05, "loss": 0.7395, "step": 44335 }, { "epoch": 0.59, "learning_rate": 1.7736369265477477e-05, "loss": 0.4809, "step": 44340 }, { "epoch": 0.59, "learning_rate": 1.7731334810751576e-05, "loss": 0.7763, "step": 44345 }, { "epoch": 0.59, "learning_rate": 1.772630067799117e-05, "loss": 0.9676, "step": 44350 }, { "epoch": 0.59, "learning_rate": 1.7721266867419258e-05, "loss": 0.5463, "step": 44355 }, { "epoch": 0.59, "learning_rate": 1.7716233379258814e-05, "loss": 0.7177, "step": 44360 }, { "epoch": 0.59, "learning_rate": 1.7711200213732787e-05, "loss": 0.551, "step": 44365 }, { "epoch": 0.59, "learning_rate": 1.7706167371064124e-05, "loss": 1.1097, "step": 44370 }, { "epoch": 0.59, "learning_rate": 1.7701134851475766e-05, "loss": 0.2493, "step": 44375 }, { "epoch": 0.59, "learning_rate": 1.769610265519061e-05, "loss": 1.1203, "step": 44380 }, { "epoch": 0.59, "learning_rate": 1.769107078243157e-05, "loss": 0.5981, "step": 44385 }, { "epoch": 0.59, "learning_rate": 1.7686039233421528e-05, "loss": 1.2708, "step": 44390 }, { "epoch": 0.59, "learning_rate": 1.7681008008383354e-05, "loss": 0.6607, "step": 44395 }, { "epoch": 0.59, "learning_rate": 1.7675977107539908e-05, "loss": 1.0361, "step": 44400 }, { "epoch": 0.59, "learning_rate": 1.7670946531114052e-05, "loss": 0.2639, "step": 44405 }, { "epoch": 0.6, "learning_rate": 1.7665916279328583e-05, "loss": 1.1324, "step": 44410 }, { "epoch": 0.6, "learning_rate": 1.766088635240633e-05, "loss": 0.4586, "step": 44415 }, { "epoch": 0.6, "learning_rate": 1.7655856750570106e-05, "loss": 0.0918, "step": 44420 }, { "epoch": 0.6, "learning_rate": 1.7650827474042674e-05, "loss": 1.3639, "step": 44425 }, { "epoch": 0.6, "learning_rate": 1.7645798523046823e-05, "loss": 1.0994, "step": 44430 }, { "epoch": 0.6, "learning_rate": 1.7640769897805316e-05, "loss": 0.7633, "step": 44435 }, { "epoch": 0.6, "learning_rate": 1.7635741598540874e-05, "loss": 1.0227, "step": 44440 }, { "epoch": 0.6, "learning_rate": 1.763071362547623e-05, "loss": 1.0192, "step": 44445 }, { "epoch": 0.6, "learning_rate": 1.7625685978834122e-05, "loss": 0.3446, "step": 44450 }, { "epoch": 0.6, "learning_rate": 1.7620658658837226e-05, "loss": 0.8624, "step": 44455 }, { "epoch": 0.6, "learning_rate": 1.7615631665708227e-05, "loss": 0.4496, "step": 44460 }, { "epoch": 0.6, "learning_rate": 1.7610604999669804e-05, "loss": 1.0246, "step": 44465 }, { "epoch": 0.6, "learning_rate": 1.7605578660944623e-05, "loss": 0.8319, "step": 44470 }, { "epoch": 0.6, "learning_rate": 1.7600552649755302e-05, "loss": 0.9978, "step": 44475 }, { "epoch": 0.6, "learning_rate": 1.7595526966324482e-05, "loss": 0.364, "step": 44480 }, { "epoch": 0.6, "learning_rate": 1.7590501610874788e-05, "loss": 1.0059, "step": 44485 }, { "epoch": 0.6, "learning_rate": 1.758547658362879e-05, "loss": 0.7856, "step": 44490 }, { "epoch": 0.6, "learning_rate": 1.7580451884809083e-05, "loss": 0.8562, "step": 44495 }, { "epoch": 0.6, "learning_rate": 1.7575427514638247e-05, "loss": 1.6683, "step": 44500 }, { "epoch": 0.6, "learning_rate": 1.7570403473338825e-05, "loss": 0.763, "step": 44505 }, { "epoch": 0.6, "learning_rate": 1.756537976113336e-05, "loss": 1.0331, "step": 44510 }, { "epoch": 0.6, "learning_rate": 1.7560356378244387e-05, "loss": 0.4715, "step": 44515 }, { "epoch": 0.6, "learning_rate": 1.7555333324894393e-05, "loss": 0.67, "step": 44520 }, { "epoch": 0.6, "learning_rate": 1.7550310601305892e-05, "loss": 1.2624, "step": 44525 }, { "epoch": 0.6, "learning_rate": 1.7545288207701366e-05, "loss": 0.8428, "step": 44530 }, { "epoch": 0.6, "learning_rate": 1.7540266144303273e-05, "loss": 0.5949, "step": 44535 }, { "epoch": 0.6, "learning_rate": 1.7535244411334068e-05, "loss": 1.4048, "step": 44540 }, { "epoch": 0.6, "learning_rate": 1.75302230090162e-05, "loss": 0.7239, "step": 44545 }, { "epoch": 0.6, "learning_rate": 1.752520193757207e-05, "loss": 0.2633, "step": 44550 }, { "epoch": 0.6, "learning_rate": 1.7520181197224107e-05, "loss": 0.9713, "step": 44555 }, { "epoch": 0.6, "learning_rate": 1.75151607881947e-05, "loss": 0.6645, "step": 44560 }, { "epoch": 0.6, "learning_rate": 1.751014071070622e-05, "loss": 0.6384, "step": 44565 }, { "epoch": 0.6, "learning_rate": 1.7505120964981032e-05, "loss": 0.1803, "step": 44570 }, { "epoch": 0.6, "learning_rate": 1.750010155124149e-05, "loss": 0.8611, "step": 44575 }, { "epoch": 0.6, "learning_rate": 1.7495082469709936e-05, "loss": 0.2993, "step": 44580 }, { "epoch": 0.6, "learning_rate": 1.7490063720608678e-05, "loss": 0.931, "step": 44585 }, { "epoch": 0.6, "learning_rate": 1.7485045304160023e-05, "loss": 0.9047, "step": 44590 }, { "epoch": 0.6, "learning_rate": 1.7480027220586274e-05, "loss": 0.5962, "step": 44595 }, { "epoch": 0.6, "learning_rate": 1.7475009470109692e-05, "loss": 1.3667, "step": 44600 }, { "epoch": 0.6, "learning_rate": 1.746999205295254e-05, "loss": 0.8744, "step": 44605 }, { "epoch": 0.6, "learning_rate": 1.7464974969337077e-05, "loss": 0.4398, "step": 44610 }, { "epoch": 0.6, "learning_rate": 1.7459958219485523e-05, "loss": 0.1192, "step": 44615 }, { "epoch": 0.6, "learning_rate": 1.7454941803620096e-05, "loss": 0.6377, "step": 44620 }, { "epoch": 0.6, "learning_rate": 1.7449925721963005e-05, "loss": 0.1237, "step": 44625 }, { "epoch": 0.6, "learning_rate": 1.744490997473643e-05, "loss": 0.8387, "step": 44630 }, { "epoch": 0.6, "learning_rate": 1.7439894562162546e-05, "loss": 0.3786, "step": 44635 }, { "epoch": 0.6, "learning_rate": 1.7434879484463514e-05, "loss": 0.4934, "step": 44640 }, { "epoch": 0.6, "learning_rate": 1.7429864741861466e-05, "loss": 0.4772, "step": 44645 }, { "epoch": 0.6, "learning_rate": 1.7424850334578542e-05, "loss": 1.0571, "step": 44650 }, { "epoch": 0.6, "learning_rate": 1.741983626283686e-05, "loss": 0.201, "step": 44655 }, { "epoch": 0.6, "learning_rate": 1.7414822526858486e-05, "loss": 0.3045, "step": 44660 }, { "epoch": 0.6, "learning_rate": 1.740980912686554e-05, "loss": 1.1286, "step": 44665 }, { "epoch": 0.6, "learning_rate": 1.7404796063080087e-05, "loss": 0.5436, "step": 44670 }, { "epoch": 0.6, "learning_rate": 1.7399783335724164e-05, "loss": 0.2209, "step": 44675 }, { "epoch": 0.6, "learning_rate": 1.739477094501981e-05, "loss": 0.7453, "step": 44680 }, { "epoch": 0.6, "learning_rate": 1.7389758891189055e-05, "loss": 0.7466, "step": 44685 }, { "epoch": 0.6, "learning_rate": 1.7384747174453915e-05, "loss": 0.3868, "step": 44690 }, { "epoch": 0.6, "learning_rate": 1.7379735795036374e-05, "loss": 0.5591, "step": 44695 }, { "epoch": 0.6, "learning_rate": 1.7374724753158414e-05, "loss": 0.833, "step": 44700 }, { "epoch": 0.6, "learning_rate": 1.7369714049042007e-05, "loss": 1.1304, "step": 44705 }, { "epoch": 0.6, "learning_rate": 1.736470368290909e-05, "loss": 1.2048, "step": 44710 }, { "epoch": 0.6, "learning_rate": 1.7359693654981596e-05, "loss": 0.5078, "step": 44715 }, { "epoch": 0.6, "learning_rate": 1.7354683965481454e-05, "loss": 1.7584, "step": 44720 }, { "epoch": 0.6, "learning_rate": 1.7349674614630566e-05, "loss": 1.0831, "step": 44725 }, { "epoch": 0.6, "learning_rate": 1.7344665602650814e-05, "loss": 0.5279, "step": 44730 }, { "epoch": 0.6, "learning_rate": 1.7339656929764087e-05, "loss": 0.414, "step": 44735 }, { "epoch": 0.6, "learning_rate": 1.7334648596192227e-05, "loss": 0.6665, "step": 44740 }, { "epoch": 0.6, "learning_rate": 1.7329640602157085e-05, "loss": 0.6082, "step": 44745 }, { "epoch": 0.6, "learning_rate": 1.7324632947880494e-05, "loss": 0.9016, "step": 44750 }, { "epoch": 0.6, "learning_rate": 1.7319625633584264e-05, "loss": 0.4599, "step": 44755 }, { "epoch": 0.6, "learning_rate": 1.731461865949019e-05, "loss": 0.8088, "step": 44760 }, { "epoch": 0.6, "learning_rate": 1.7309612025820065e-05, "loss": 0.6891, "step": 44765 }, { "epoch": 0.6, "learning_rate": 1.7304605732795654e-05, "loss": 0.984, "step": 44770 }, { "epoch": 0.6, "learning_rate": 1.7299599780638707e-05, "loss": 0.7071, "step": 44775 }, { "epoch": 0.6, "learning_rate": 1.7294594169570977e-05, "loss": 0.9406, "step": 44780 }, { "epoch": 0.6, "learning_rate": 1.7289588899814164e-05, "loss": 0.8914, "step": 44785 }, { "epoch": 0.6, "learning_rate": 1.728458397158999e-05, "loss": 0.8356, "step": 44790 }, { "epoch": 0.6, "learning_rate": 1.7279579385120144e-05, "loss": 0.9993, "step": 44795 }, { "epoch": 0.6, "learning_rate": 1.7274575140626318e-05, "loss": 0.5389, "step": 44800 }, { "epoch": 0.6, "learning_rate": 1.7269571238330157e-05, "loss": 0.8235, "step": 44805 }, { "epoch": 0.6, "learning_rate": 1.7264567678453313e-05, "loss": 0.5567, "step": 44810 }, { "epoch": 0.6, "learning_rate": 1.7259564461217437e-05, "loss": 0.4317, "step": 44815 }, { "epoch": 0.6, "learning_rate": 1.7254561586844113e-05, "loss": 0.2542, "step": 44820 }, { "epoch": 0.6, "learning_rate": 1.724955905555497e-05, "loss": 1.2145, "step": 44825 }, { "epoch": 0.6, "learning_rate": 1.7244556867571586e-05, "loss": 0.4041, "step": 44830 }, { "epoch": 0.6, "learning_rate": 1.7239555023115533e-05, "loss": 0.8788, "step": 44835 }, { "epoch": 0.6, "learning_rate": 1.7234553522408364e-05, "loss": 0.6651, "step": 44840 }, { "epoch": 0.6, "learning_rate": 1.722955236567164e-05, "loss": 0.7447, "step": 44845 }, { "epoch": 0.6, "learning_rate": 1.7224551553126857e-05, "loss": 0.5335, "step": 44850 }, { "epoch": 0.6, "learning_rate": 1.7219551084995544e-05, "loss": 0.42, "step": 44855 }, { "epoch": 0.6, "learning_rate": 1.7214550961499197e-05, "loss": 0.8736, "step": 44860 }, { "epoch": 0.6, "learning_rate": 1.7209551182859287e-05, "loss": 0.74, "step": 44865 }, { "epoch": 0.6, "learning_rate": 1.720455174929729e-05, "loss": 0.8286, "step": 44870 }, { "epoch": 0.6, "learning_rate": 1.719955266103465e-05, "loss": 1.1779, "step": 44875 }, { "epoch": 0.6, "learning_rate": 1.71945539182928e-05, "loss": 0.4699, "step": 44880 }, { "epoch": 0.6, "learning_rate": 1.7189555521293162e-05, "loss": 0.6794, "step": 44885 }, { "epoch": 0.6, "learning_rate": 1.7184557470257148e-05, "loss": 0.5998, "step": 44890 }, { "epoch": 0.6, "learning_rate": 1.7179559765406132e-05, "loss": 0.8893, "step": 44895 }, { "epoch": 0.6, "learning_rate": 1.7174562406961492e-05, "loss": 0.9202, "step": 44900 }, { "epoch": 0.6, "learning_rate": 1.7169565395144587e-05, "loss": 0.863, "step": 44905 }, { "epoch": 0.6, "learning_rate": 1.716456873017677e-05, "loss": 0.8055, "step": 44910 }, { "epoch": 0.6, "learning_rate": 1.7159572412279353e-05, "loss": 0.732, "step": 44915 }, { "epoch": 0.6, "learning_rate": 1.715457644167365e-05, "loss": 0.9874, "step": 44920 }, { "epoch": 0.6, "learning_rate": 1.714958081858097e-05, "loss": 0.985, "step": 44925 }, { "epoch": 0.6, "learning_rate": 1.714458554322258e-05, "loss": 0.3704, "step": 44930 }, { "epoch": 0.6, "learning_rate": 1.713959061581975e-05, "loss": 1.3681, "step": 44935 }, { "epoch": 0.6, "learning_rate": 1.7134596036593734e-05, "loss": 0.912, "step": 44940 }, { "epoch": 0.6, "learning_rate": 1.7129601805765762e-05, "loss": 0.3546, "step": 44945 }, { "epoch": 0.6, "learning_rate": 1.7124607923557052e-05, "loss": 0.5013, "step": 44950 }, { "epoch": 0.6, "learning_rate": 1.7119614390188827e-05, "loss": 0.2683, "step": 44955 }, { "epoch": 0.6, "learning_rate": 1.711462120588225e-05, "loss": 0.8018, "step": 44960 }, { "epoch": 0.6, "learning_rate": 1.7109628370858495e-05, "loss": 0.6398, "step": 44965 }, { "epoch": 0.6, "learning_rate": 1.7104635885338743e-05, "loss": 0.5093, "step": 44970 }, { "epoch": 0.6, "learning_rate": 1.7099643749544113e-05, "loss": 1.1952, "step": 44975 }, { "epoch": 0.6, "learning_rate": 1.7094651963695744e-05, "loss": 0.6248, "step": 44980 }, { "epoch": 0.6, "learning_rate": 1.7089660528014746e-05, "loss": 0.2995, "step": 44985 }, { "epoch": 0.6, "learning_rate": 1.7084669442722205e-05, "loss": 1.1478, "step": 44990 }, { "epoch": 0.6, "learning_rate": 1.7079678708039216e-05, "loss": 0.2309, "step": 44995 }, { "epoch": 0.6, "learning_rate": 1.7074688324186843e-05, "loss": 0.6798, "step": 45000 }, { "epoch": 0.6, "learning_rate": 1.7069698291386115e-05, "loss": 0.3557, "step": 45005 }, { "epoch": 0.6, "learning_rate": 1.7064708609858082e-05, "loss": 1.2638, "step": 45010 }, { "epoch": 0.6, "learning_rate": 1.7059719279823755e-05, "loss": 0.6734, "step": 45015 }, { "epoch": 0.6, "learning_rate": 1.705473030150415e-05, "loss": 0.6883, "step": 45020 }, { "epoch": 0.6, "learning_rate": 1.7049741675120234e-05, "loss": 0.7189, "step": 45025 }, { "epoch": 0.6, "learning_rate": 1.7044753400892987e-05, "loss": 1.3089, "step": 45030 }, { "epoch": 0.6, "learning_rate": 1.7039765479043383e-05, "loss": 0.5451, "step": 45035 }, { "epoch": 0.6, "learning_rate": 1.7034777909792327e-05, "loss": 0.7945, "step": 45040 }, { "epoch": 0.6, "learning_rate": 1.7029790693360764e-05, "loss": 0.7249, "step": 45045 }, { "epoch": 0.6, "learning_rate": 1.7024803829969606e-05, "loss": 0.477, "step": 45050 }, { "epoch": 0.6, "learning_rate": 1.701981731983973e-05, "loss": 0.8025, "step": 45055 }, { "epoch": 0.6, "learning_rate": 1.7014831163192027e-05, "loss": 0.6502, "step": 45060 }, { "epoch": 0.6, "learning_rate": 1.7009845360247365e-05, "loss": 0.3991, "step": 45065 }, { "epoch": 0.6, "learning_rate": 1.7004859911226567e-05, "loss": 0.9343, "step": 45070 }, { "epoch": 0.6, "learning_rate": 1.6999874816350475e-05, "loss": 0.9461, "step": 45075 }, { "epoch": 0.6, "learning_rate": 1.699489007583992e-05, "loss": 0.6316, "step": 45080 }, { "epoch": 0.6, "learning_rate": 1.6989905689915676e-05, "loss": 0.9227, "step": 45085 }, { "epoch": 0.6, "learning_rate": 1.6984921658798535e-05, "loss": 0.8178, "step": 45090 }, { "epoch": 0.6, "learning_rate": 1.697993798270927e-05, "loss": 0.2282, "step": 45095 }, { "epoch": 0.6, "learning_rate": 1.6974954661868628e-05, "loss": 0.3435, "step": 45100 }, { "epoch": 0.6, "learning_rate": 1.6969971696497343e-05, "loss": 0.4519, "step": 45105 }, { "epoch": 0.6, "learning_rate": 1.696498908681615e-05, "loss": 0.3679, "step": 45110 }, { "epoch": 0.6, "learning_rate": 1.6960006833045736e-05, "loss": 0.4611, "step": 45115 }, { "epoch": 0.6, "learning_rate": 1.6955024935406793e-05, "loss": 0.5092, "step": 45120 }, { "epoch": 0.6, "learning_rate": 1.6950043394120002e-05, "loss": 1.2841, "step": 45125 }, { "epoch": 0.6, "learning_rate": 1.6945062209406014e-05, "loss": 0.8025, "step": 45130 }, { "epoch": 0.6, "learning_rate": 1.694008138148547e-05, "loss": 0.8255, "step": 45135 }, { "epoch": 0.6, "learning_rate": 1.6935100910579e-05, "loss": 0.5216, "step": 45140 }, { "epoch": 0.6, "learning_rate": 1.6930120796907222e-05, "loss": 0.5679, "step": 45145 }, { "epoch": 0.6, "learning_rate": 1.6925141040690708e-05, "loss": 0.2026, "step": 45150 }, { "epoch": 0.61, "learning_rate": 1.692016164215005e-05, "loss": 0.5234, "step": 45155 }, { "epoch": 0.61, "learning_rate": 1.6915182601505815e-05, "loss": 0.9379, "step": 45160 }, { "epoch": 0.61, "learning_rate": 1.691020391897854e-05, "loss": 0.4436, "step": 45165 }, { "epoch": 0.61, "learning_rate": 1.6905225594788755e-05, "loss": 0.5365, "step": 45170 }, { "epoch": 0.61, "learning_rate": 1.6900247629156994e-05, "loss": 0.995, "step": 45175 }, { "epoch": 0.61, "learning_rate": 1.689527002230372e-05, "loss": 0.6022, "step": 45180 }, { "epoch": 0.61, "learning_rate": 1.6890292774449452e-05, "loss": 0.5123, "step": 45185 }, { "epoch": 0.61, "learning_rate": 1.6885315885814646e-05, "loss": 0.1737, "step": 45190 }, { "epoch": 0.61, "learning_rate": 1.688033935661974e-05, "loss": 0.5216, "step": 45195 }, { "epoch": 0.61, "learning_rate": 1.687536318708518e-05, "loss": 0.8148, "step": 45200 }, { "epoch": 0.61, "learning_rate": 1.687038737743139e-05, "loss": 0.4613, "step": 45205 }, { "epoch": 0.61, "learning_rate": 1.686541192787876e-05, "loss": 0.8493, "step": 45210 }, { "epoch": 0.61, "learning_rate": 1.6860436838647688e-05, "loss": 0.7639, "step": 45215 }, { "epoch": 0.61, "learning_rate": 1.6855462109958552e-05, "loss": 1.624, "step": 45220 }, { "epoch": 0.61, "learning_rate": 1.6850487742031692e-05, "loss": 0.4431, "step": 45225 }, { "epoch": 0.61, "learning_rate": 1.6845513735087452e-05, "loss": 1.0672, "step": 45230 }, { "epoch": 0.61, "learning_rate": 1.6840540089346162e-05, "loss": 0.247, "step": 45235 }, { "epoch": 0.61, "learning_rate": 1.683556680502812e-05, "loss": 0.7153, "step": 45240 }, { "epoch": 0.61, "learning_rate": 1.6830593882353627e-05, "loss": 0.592, "step": 45245 }, { "epoch": 0.61, "learning_rate": 1.682562132154295e-05, "loss": 0.3005, "step": 45250 }, { "epoch": 0.61, "learning_rate": 1.682064912281637e-05, "loss": 0.8558, "step": 45255 }, { "epoch": 0.61, "learning_rate": 1.68156772863941e-05, "loss": 0.4322, "step": 45260 }, { "epoch": 0.61, "learning_rate": 1.681070581249638e-05, "loss": 0.5462, "step": 45265 }, { "epoch": 0.61, "learning_rate": 1.680573470134343e-05, "loss": 0.4555, "step": 45270 }, { "epoch": 0.61, "learning_rate": 1.680076395315543e-05, "loss": 0.8696, "step": 45275 }, { "epoch": 0.61, "learning_rate": 1.6795793568152567e-05, "loss": 1.1613, "step": 45280 }, { "epoch": 0.61, "learning_rate": 1.6790823546555017e-05, "loss": 0.3184, "step": 45285 }, { "epoch": 0.61, "learning_rate": 1.67858538885829e-05, "loss": 0.2757, "step": 45290 }, { "epoch": 0.61, "learning_rate": 1.6780884594456366e-05, "loss": 1.2957, "step": 45295 }, { "epoch": 0.61, "learning_rate": 1.6775915664395535e-05, "loss": 0.7181, "step": 45300 }, { "epoch": 0.61, "learning_rate": 1.6770947098620487e-05, "loss": 0.7088, "step": 45305 }, { "epoch": 0.61, "learning_rate": 1.6765978897351314e-05, "loss": 0.7431, "step": 45310 }, { "epoch": 0.61, "learning_rate": 1.6761011060808086e-05, "loss": 0.6434, "step": 45315 }, { "epoch": 0.61, "learning_rate": 1.6756043589210847e-05, "loss": 0.3931, "step": 45320 }, { "epoch": 0.61, "learning_rate": 1.6751076482779632e-05, "loss": 0.9493, "step": 45325 }, { "epoch": 0.61, "learning_rate": 1.6746109741734473e-05, "loss": 0.402, "step": 45330 }, { "epoch": 0.61, "learning_rate": 1.6741143366295348e-05, "loss": 1.0685, "step": 45335 }, { "epoch": 0.61, "learning_rate": 1.6736177356682255e-05, "loss": 0.1821, "step": 45340 }, { "epoch": 0.61, "learning_rate": 1.6731211713115165e-05, "loss": 0.7207, "step": 45345 }, { "epoch": 0.61, "learning_rate": 1.6726246435814025e-05, "loss": 0.5489, "step": 45350 }, { "epoch": 0.61, "learning_rate": 1.6721281524998776e-05, "loss": 0.7531, "step": 45355 }, { "epoch": 0.61, "learning_rate": 1.6716316980889335e-05, "loss": 0.404, "step": 45360 }, { "epoch": 0.61, "learning_rate": 1.6711352803705622e-05, "loss": 1.1902, "step": 45365 }, { "epoch": 0.61, "learning_rate": 1.6706388993667503e-05, "loss": 0.6808, "step": 45370 }, { "epoch": 0.61, "learning_rate": 1.6701425550994865e-05, "loss": 0.4739, "step": 45375 }, { "epoch": 0.61, "learning_rate": 1.669646247590756e-05, "loss": 0.9715, "step": 45380 }, { "epoch": 0.61, "learning_rate": 1.669149976862542e-05, "loss": 0.387, "step": 45385 }, { "epoch": 0.61, "learning_rate": 1.668653742936827e-05, "loss": 0.8547, "step": 45390 }, { "epoch": 0.61, "learning_rate": 1.6681575458355936e-05, "loss": 1.1294, "step": 45395 }, { "epoch": 0.61, "learning_rate": 1.667661385580818e-05, "loss": 0.4164, "step": 45400 }, { "epoch": 0.61, "learning_rate": 1.667165262194479e-05, "loss": 0.4481, "step": 45405 }, { "epoch": 0.61, "learning_rate": 1.6666691756985535e-05, "loss": 0.6599, "step": 45410 }, { "epoch": 0.61, "learning_rate": 1.666173126115014e-05, "loss": 0.2523, "step": 45415 }, { "epoch": 0.61, "learning_rate": 1.6656771134658327e-05, "loss": 0.8393, "step": 45420 }, { "epoch": 0.61, "learning_rate": 1.6651811377729825e-05, "loss": 1.2027, "step": 45425 }, { "epoch": 0.61, "learning_rate": 1.6646851990584304e-05, "loss": 1.48, "step": 45430 }, { "epoch": 0.61, "learning_rate": 1.6641892973441453e-05, "loss": 0.4405, "step": 45435 }, { "epoch": 0.61, "learning_rate": 1.6636934326520938e-05, "loss": 1.7743, "step": 45440 }, { "epoch": 0.61, "learning_rate": 1.6631976050042385e-05, "loss": 0.6126, "step": 45445 }, { "epoch": 0.61, "learning_rate": 1.6627018144225426e-05, "loss": 0.6668, "step": 45450 }, { "epoch": 0.61, "learning_rate": 1.662206060928968e-05, "loss": 0.6734, "step": 45455 }, { "epoch": 0.61, "learning_rate": 1.6617103445454734e-05, "loss": 0.683, "step": 45460 }, { "epoch": 0.61, "learning_rate": 1.6612146652940164e-05, "loss": 0.4906, "step": 45465 }, { "epoch": 0.61, "learning_rate": 1.6607190231965534e-05, "loss": 0.4974, "step": 45470 }, { "epoch": 0.61, "learning_rate": 1.6602234182750402e-05, "loss": 0.4493, "step": 45475 }, { "epoch": 0.61, "learning_rate": 1.6597278505514268e-05, "loss": 0.7701, "step": 45480 }, { "epoch": 0.61, "learning_rate": 1.6592323200476663e-05, "loss": 0.8784, "step": 45485 }, { "epoch": 0.61, "learning_rate": 1.6587368267857082e-05, "loss": 0.649, "step": 45490 }, { "epoch": 0.61, "learning_rate": 1.6582413707874993e-05, "loss": 1.3285, "step": 45495 }, { "epoch": 0.61, "learning_rate": 1.6577459520749865e-05, "loss": 1.8094, "step": 45500 }, { "epoch": 0.61, "learning_rate": 1.657250570670115e-05, "loss": 0.4325, "step": 45505 }, { "epoch": 0.61, "learning_rate": 1.6567552265948266e-05, "loss": 0.6739, "step": 45510 }, { "epoch": 0.61, "learning_rate": 1.656259919871063e-05, "loss": 0.5777, "step": 45515 }, { "epoch": 0.61, "learning_rate": 1.6557646505207646e-05, "loss": 1.3198, "step": 45520 }, { "epoch": 0.61, "learning_rate": 1.655269418565868e-05, "loss": 1.0025, "step": 45525 }, { "epoch": 0.61, "learning_rate": 1.6547742240283097e-05, "loss": 0.9505, "step": 45530 }, { "epoch": 0.61, "learning_rate": 1.6542790669300257e-05, "loss": 0.6428, "step": 45535 }, { "epoch": 0.61, "learning_rate": 1.653783947292947e-05, "loss": 1.4327, "step": 45540 }, { "epoch": 0.61, "learning_rate": 1.6532888651390067e-05, "loss": 0.4413, "step": 45545 }, { "epoch": 0.61, "learning_rate": 1.6527938204901338e-05, "loss": 1.0113, "step": 45550 }, { "epoch": 0.61, "learning_rate": 1.652298813368256e-05, "loss": 0.5817, "step": 45555 }, { "epoch": 0.61, "learning_rate": 1.6518038437952992e-05, "loss": 1.4488, "step": 45560 }, { "epoch": 0.61, "learning_rate": 1.6513089117931895e-05, "loss": 0.8356, "step": 45565 }, { "epoch": 0.61, "learning_rate": 1.6508140173838488e-05, "loss": 0.7412, "step": 45570 }, { "epoch": 0.61, "learning_rate": 1.6503191605891988e-05, "loss": 1.3252, "step": 45575 }, { "epoch": 0.61, "learning_rate": 1.649824341431159e-05, "loss": 0.6607, "step": 45580 }, { "epoch": 0.61, "learning_rate": 1.6493295599316488e-05, "loss": 0.8287, "step": 45585 }, { "epoch": 0.61, "learning_rate": 1.6488348161125823e-05, "loss": 0.5458, "step": 45590 }, { "epoch": 0.61, "learning_rate": 1.648340109995875e-05, "loss": 0.9823, "step": 45595 }, { "epoch": 0.61, "learning_rate": 1.6478454416034407e-05, "loss": 0.7816, "step": 45600 }, { "epoch": 0.61, "learning_rate": 1.6473508109571893e-05, "loss": 0.2699, "step": 45605 }, { "epoch": 0.61, "learning_rate": 1.6468562180790315e-05, "loss": 0.9054, "step": 45610 }, { "epoch": 0.61, "learning_rate": 1.6463616629908757e-05, "loss": 0.9614, "step": 45615 }, { "epoch": 0.61, "learning_rate": 1.6458671457146273e-05, "loss": 0.7504, "step": 45620 }, { "epoch": 0.61, "learning_rate": 1.6453726662721908e-05, "loss": 1.2148, "step": 45625 }, { "epoch": 0.61, "learning_rate": 1.644878224685471e-05, "loss": 0.4872, "step": 45630 }, { "epoch": 0.61, "learning_rate": 1.6443838209763668e-05, "loss": 0.5822, "step": 45635 }, { "epoch": 0.61, "learning_rate": 1.6438894551667784e-05, "loss": 1.2558, "step": 45640 }, { "epoch": 0.61, "learning_rate": 1.643395127278605e-05, "loss": 0.5199, "step": 45645 }, { "epoch": 0.61, "learning_rate": 1.6429008373337415e-05, "loss": 0.681, "step": 45650 }, { "epoch": 0.61, "learning_rate": 1.642406585354083e-05, "loss": 0.9014, "step": 45655 }, { "epoch": 0.61, "learning_rate": 1.6419123713615232e-05, "loss": 0.459, "step": 45660 }, { "epoch": 0.61, "learning_rate": 1.6414181953779516e-05, "loss": 0.7695, "step": 45665 }, { "epoch": 0.61, "learning_rate": 1.6409240574252588e-05, "loss": 1.3248, "step": 45670 }, { "epoch": 0.61, "learning_rate": 1.6404299575253324e-05, "loss": 1.2282, "step": 45675 }, { "epoch": 0.61, "learning_rate": 1.6399358957000585e-05, "loss": 0.4013, "step": 45680 }, { "epoch": 0.61, "learning_rate": 1.6394418719713215e-05, "loss": 0.9177, "step": 45685 }, { "epoch": 0.61, "learning_rate": 1.6389478863610052e-05, "loss": 0.7148, "step": 45690 }, { "epoch": 0.61, "learning_rate": 1.638453938890989e-05, "loss": 0.7163, "step": 45695 }, { "epoch": 0.61, "learning_rate": 1.6379600295831534e-05, "loss": 0.4786, "step": 45700 }, { "epoch": 0.61, "learning_rate": 1.637466158459375e-05, "loss": 0.3056, "step": 45705 }, { "epoch": 0.61, "learning_rate": 1.636972325541532e-05, "loss": 1.3961, "step": 45710 }, { "epoch": 0.61, "learning_rate": 1.6364785308514968e-05, "loss": 0.815, "step": 45715 }, { "epoch": 0.61, "learning_rate": 1.635984774411142e-05, "loss": 0.4798, "step": 45720 }, { "epoch": 0.61, "learning_rate": 1.6354910562423405e-05, "loss": 0.4065, "step": 45725 }, { "epoch": 0.61, "learning_rate": 1.634997376366959e-05, "loss": 1.3047, "step": 45730 }, { "epoch": 0.61, "learning_rate": 1.634503734806867e-05, "loss": 0.9346, "step": 45735 }, { "epoch": 0.61, "learning_rate": 1.63401013158393e-05, "loss": 1.3339, "step": 45740 }, { "epoch": 0.61, "learning_rate": 1.6335165667200107e-05, "loss": 0.5163, "step": 45745 }, { "epoch": 0.61, "learning_rate": 1.6330230402369727e-05, "loss": 0.7321, "step": 45750 }, { "epoch": 0.61, "learning_rate": 1.6325295521566776e-05, "loss": 0.9128, "step": 45755 }, { "epoch": 0.61, "learning_rate": 1.6320361025009827e-05, "loss": 0.8216, "step": 45760 }, { "epoch": 0.61, "learning_rate": 1.631542691291746e-05, "loss": 1.0855, "step": 45765 }, { "epoch": 0.61, "learning_rate": 1.6310493185508245e-05, "loss": 0.496, "step": 45770 }, { "epoch": 0.61, "learning_rate": 1.63055598430007e-05, "loss": 0.3443, "step": 45775 }, { "epoch": 0.61, "learning_rate": 1.6300626885613355e-05, "loss": 0.8798, "step": 45780 }, { "epoch": 0.61, "learning_rate": 1.6295694313564727e-05, "loss": 0.39, "step": 45785 }, { "epoch": 0.61, "learning_rate": 1.6290762127073288e-05, "loss": 0.5829, "step": 45790 }, { "epoch": 0.61, "learning_rate": 1.6285830326357517e-05, "loss": 0.8434, "step": 45795 }, { "epoch": 0.61, "learning_rate": 1.6280898911635872e-05, "loss": 0.3606, "step": 45800 }, { "epoch": 0.61, "learning_rate": 1.6275967883126774e-05, "loss": 0.7139, "step": 45805 }, { "epoch": 0.61, "learning_rate": 1.6271037241048658e-05, "loss": 1.042, "step": 45810 }, { "epoch": 0.61, "learning_rate": 1.6266106985619917e-05, "loss": 0.2315, "step": 45815 }, { "epoch": 0.61, "learning_rate": 1.626117711705896e-05, "loss": 0.9455, "step": 45820 }, { "epoch": 0.61, "learning_rate": 1.6256247635584125e-05, "loss": 1.6074, "step": 45825 }, { "epoch": 0.61, "learning_rate": 1.6251318541413774e-05, "loss": 0.4233, "step": 45830 }, { "epoch": 0.61, "learning_rate": 1.624638983476625e-05, "loss": 0.2229, "step": 45835 }, { "epoch": 0.61, "learning_rate": 1.624146151585986e-05, "loss": 0.5633, "step": 45840 }, { "epoch": 0.61, "learning_rate": 1.6236533584912906e-05, "loss": 0.816, "step": 45845 }, { "epoch": 0.61, "learning_rate": 1.6231606042143682e-05, "loss": 1.1101, "step": 45850 }, { "epoch": 0.61, "learning_rate": 1.6226678887770433e-05, "loss": 1.0703, "step": 45855 }, { "epoch": 0.61, "learning_rate": 1.622175212201142e-05, "loss": 0.7531, "step": 45860 }, { "epoch": 0.61, "learning_rate": 1.6216825745084874e-05, "loss": 0.3133, "step": 45865 }, { "epoch": 0.61, "learning_rate": 1.6211899757209e-05, "loss": 0.5899, "step": 45870 }, { "epoch": 0.61, "learning_rate": 1.6206974158602008e-05, "loss": 0.5536, "step": 45875 }, { "epoch": 0.61, "learning_rate": 1.6202048949482073e-05, "loss": 1.1448, "step": 45880 }, { "epoch": 0.61, "learning_rate": 1.6197124130067347e-05, "loss": 0.9678, "step": 45885 }, { "epoch": 0.61, "learning_rate": 1.6192199700575985e-05, "loss": 0.801, "step": 45890 }, { "epoch": 0.61, "learning_rate": 1.6187275661226118e-05, "loss": 0.3442, "step": 45895 }, { "epoch": 0.61, "learning_rate": 1.618235201223584e-05, "loss": 0.7112, "step": 45900 }, { "epoch": 0.62, "learning_rate": 1.617742875382326e-05, "loss": 0.5121, "step": 45905 }, { "epoch": 0.62, "learning_rate": 1.6172505886206458e-05, "loss": 0.7557, "step": 45910 }, { "epoch": 0.62, "learning_rate": 1.616758340960347e-05, "loss": 1.4529, "step": 45915 }, { "epoch": 0.62, "learning_rate": 1.6162661324232347e-05, "loss": 0.7039, "step": 45920 }, { "epoch": 0.62, "learning_rate": 1.615773963031112e-05, "loss": 0.5701, "step": 45925 }, { "epoch": 0.62, "learning_rate": 1.61528183280578e-05, "loss": 0.2512, "step": 45930 }, { "epoch": 0.62, "learning_rate": 1.6147897417690354e-05, "loss": 0.4804, "step": 45935 }, { "epoch": 0.62, "learning_rate": 1.6142976899426772e-05, "loss": 0.4802, "step": 45940 }, { "epoch": 0.62, "learning_rate": 1.6138056773485005e-05, "loss": 1.1246, "step": 45945 }, { "epoch": 0.62, "learning_rate": 1.6133137040082986e-05, "loss": 0.5746, "step": 45950 }, { "epoch": 0.62, "learning_rate": 1.6128217699438634e-05, "loss": 0.6338, "step": 45955 }, { "epoch": 0.62, "learning_rate": 1.6123298751769865e-05, "loss": 0.529, "step": 45960 }, { "epoch": 0.62, "learning_rate": 1.6118380197294543e-05, "loss": 0.7506, "step": 45965 }, { "epoch": 0.62, "learning_rate": 1.6113462036230544e-05, "loss": 0.8487, "step": 45970 }, { "epoch": 0.62, "learning_rate": 1.610854426879572e-05, "loss": 0.7315, "step": 45975 }, { "epoch": 0.62, "learning_rate": 1.6103626895207906e-05, "loss": 0.4647, "step": 45980 }, { "epoch": 0.62, "learning_rate": 1.6098709915684907e-05, "loss": 0.5983, "step": 45985 }, { "epoch": 0.62, "learning_rate": 1.609379333044454e-05, "loss": 0.5503, "step": 45990 }, { "epoch": 0.62, "learning_rate": 1.6088877139704557e-05, "loss": 0.3825, "step": 45995 }, { "epoch": 0.62, "learning_rate": 1.608396134368274e-05, "loss": 0.6649, "step": 46000 }, { "epoch": 0.62, "learning_rate": 1.6079045942596837e-05, "loss": 0.9273, "step": 46005 }, { "epoch": 0.62, "learning_rate": 1.6074130936664562e-05, "loss": 0.8262, "step": 46010 }, { "epoch": 0.62, "learning_rate": 1.6069216326103628e-05, "loss": 0.6411, "step": 46015 }, { "epoch": 0.62, "learning_rate": 1.6064302111131746e-05, "loss": 0.3417, "step": 46020 }, { "epoch": 0.62, "learning_rate": 1.6059388291966566e-05, "loss": 0.6061, "step": 46025 }, { "epoch": 0.62, "learning_rate": 1.605447486882575e-05, "loss": 0.4593, "step": 46030 }, { "epoch": 0.62, "learning_rate": 1.6049561841926948e-05, "loss": 0.6825, "step": 46035 }, { "epoch": 0.62, "learning_rate": 1.604464921148779e-05, "loss": 0.5014, "step": 46040 }, { "epoch": 0.62, "learning_rate": 1.603973697772586e-05, "loss": 0.5552, "step": 46045 }, { "epoch": 0.62, "learning_rate": 1.6034825140858753e-05, "loss": 0.9651, "step": 46050 }, { "epoch": 0.62, "learning_rate": 1.602991370110405e-05, "loss": 1.3447, "step": 46055 }, { "epoch": 0.62, "learning_rate": 1.6025002658679283e-05, "loss": 0.6813, "step": 46060 }, { "epoch": 0.62, "learning_rate": 1.6020092013802003e-05, "loss": 0.5741, "step": 46065 }, { "epoch": 0.62, "learning_rate": 1.601518176668973e-05, "loss": 0.6145, "step": 46070 }, { "epoch": 0.62, "learning_rate": 1.6010271917559945e-05, "loss": 0.5249, "step": 46075 }, { "epoch": 0.62, "learning_rate": 1.6005362466630143e-05, "loss": 0.4171, "step": 46080 }, { "epoch": 0.62, "learning_rate": 1.6000453414117784e-05, "loss": 0.7672, "step": 46085 }, { "epoch": 0.62, "learning_rate": 1.5995544760240317e-05, "loss": 1.1324, "step": 46090 }, { "epoch": 0.62, "learning_rate": 1.5990636505215164e-05, "loss": 0.889, "step": 46095 }, { "epoch": 0.62, "learning_rate": 1.5985728649259755e-05, "loss": 1.0377, "step": 46100 }, { "epoch": 0.62, "learning_rate": 1.5980821192591455e-05, "loss": 1.0373, "step": 46105 }, { "epoch": 0.62, "learning_rate": 1.5975914135427662e-05, "loss": 0.7767, "step": 46110 }, { "epoch": 0.62, "learning_rate": 1.5971007477985726e-05, "loss": 0.984, "step": 46115 }, { "epoch": 0.62, "learning_rate": 1.5966101220482983e-05, "loss": 0.7467, "step": 46120 }, { "epoch": 0.62, "learning_rate": 1.5961195363136762e-05, "loss": 0.7526, "step": 46125 }, { "epoch": 0.62, "learning_rate": 1.595628990616438e-05, "loss": 0.387, "step": 46130 }, { "epoch": 0.62, "learning_rate": 1.595138484978309e-05, "loss": 0.7211, "step": 46135 }, { "epoch": 0.62, "learning_rate": 1.594648019421019e-05, "loss": 1.0418, "step": 46140 }, { "epoch": 0.62, "learning_rate": 1.5941575939662927e-05, "loss": 1.0017, "step": 46145 }, { "epoch": 0.62, "learning_rate": 1.593667208635854e-05, "loss": 0.4883, "step": 46150 }, { "epoch": 0.62, "learning_rate": 1.5931768634514225e-05, "loss": 0.4305, "step": 46155 }, { "epoch": 0.62, "learning_rate": 1.5926865584347196e-05, "loss": 0.6959, "step": 46160 }, { "epoch": 0.62, "learning_rate": 1.592196293607463e-05, "loss": 1.2414, "step": 46165 }, { "epoch": 0.62, "learning_rate": 1.5917060689913686e-05, "loss": 0.5103, "step": 46170 }, { "epoch": 0.62, "learning_rate": 1.5912158846081517e-05, "loss": 0.4009, "step": 46175 }, { "epoch": 0.62, "learning_rate": 1.5907257404795255e-05, "loss": 0.9279, "step": 46180 }, { "epoch": 0.62, "learning_rate": 1.5902356366271993e-05, "loss": 0.4011, "step": 46185 }, { "epoch": 0.62, "learning_rate": 1.5897455730728824e-05, "loss": 0.9478, "step": 46190 }, { "epoch": 0.62, "learning_rate": 1.5892555498382834e-05, "loss": 0.6575, "step": 46195 }, { "epoch": 0.62, "learning_rate": 1.5887655669451067e-05, "loss": 0.5042, "step": 46200 }, { "epoch": 0.62, "learning_rate": 1.5882756244150572e-05, "loss": 0.9982, "step": 46205 }, { "epoch": 0.62, "learning_rate": 1.5877857222698367e-05, "loss": 0.3418, "step": 46210 }, { "epoch": 0.62, "learning_rate": 1.5872958605311442e-05, "loss": 0.817, "step": 46215 }, { "epoch": 0.62, "learning_rate": 1.586806039220679e-05, "loss": 0.6716, "step": 46220 }, { "epoch": 0.62, "learning_rate": 1.586316258360138e-05, "loss": 0.7318, "step": 46225 }, { "epoch": 0.62, "learning_rate": 1.5858265179712156e-05, "loss": 1.3619, "step": 46230 }, { "epoch": 0.62, "learning_rate": 1.5853368180756047e-05, "loss": 1.3254, "step": 46235 }, { "epoch": 0.62, "learning_rate": 1.584847158694998e-05, "loss": 0.6015, "step": 46240 }, { "epoch": 0.62, "learning_rate": 1.5843575398510825e-05, "loss": 0.7007, "step": 46245 }, { "epoch": 0.62, "learning_rate": 1.5838679615655473e-05, "loss": 0.9151, "step": 46250 }, { "epoch": 0.62, "learning_rate": 1.583378423860078e-05, "loss": 1.4897, "step": 46255 }, { "epoch": 0.62, "learning_rate": 1.58288892675636e-05, "loss": 0.7531, "step": 46260 }, { "epoch": 0.62, "learning_rate": 1.5823994702760736e-05, "loss": 1.1119, "step": 46265 }, { "epoch": 0.62, "learning_rate": 1.5819100544409e-05, "loss": 0.7492, "step": 46270 }, { "epoch": 0.62, "learning_rate": 1.5814206792725184e-05, "loss": 1.1836, "step": 46275 }, { "epoch": 0.62, "learning_rate": 1.5809313447926046e-05, "loss": 1.119, "step": 46280 }, { "epoch": 0.62, "learning_rate": 1.580442051022834e-05, "loss": 0.6108, "step": 46285 }, { "epoch": 0.62, "learning_rate": 1.5799527979848815e-05, "loss": 1.3461, "step": 46290 }, { "epoch": 0.62, "learning_rate": 1.5794635857004163e-05, "loss": 1.2924, "step": 46295 }, { "epoch": 0.62, "learning_rate": 1.578974414191109e-05, "loss": 0.7566, "step": 46300 }, { "epoch": 0.62, "learning_rate": 1.5784852834786274e-05, "loss": 1.1158, "step": 46305 }, { "epoch": 0.62, "learning_rate": 1.5779961935846376e-05, "loss": 0.7787, "step": 46310 }, { "epoch": 0.62, "learning_rate": 1.5775071445308034e-05, "loss": 0.5188, "step": 46315 }, { "epoch": 0.62, "learning_rate": 1.5770181363387887e-05, "loss": 0.5038, "step": 46320 }, { "epoch": 0.62, "learning_rate": 1.576529169030252e-05, "loss": 0.5, "step": 46325 }, { "epoch": 0.62, "learning_rate": 1.5760402426268532e-05, "loss": 1.231, "step": 46330 }, { "epoch": 0.62, "learning_rate": 1.5755513571502502e-05, "loss": 0.8894, "step": 46335 }, { "epoch": 0.62, "learning_rate": 1.5750625126220956e-05, "loss": 0.5219, "step": 46340 }, { "epoch": 0.62, "learning_rate": 1.5745737090640452e-05, "loss": 0.4621, "step": 46345 }, { "epoch": 0.62, "learning_rate": 1.5740849464977504e-05, "loss": 0.6576, "step": 46350 }, { "epoch": 0.62, "learning_rate": 1.573596224944859e-05, "loss": 0.601, "step": 46355 }, { "epoch": 0.62, "learning_rate": 1.5731075444270208e-05, "loss": 0.6831, "step": 46360 }, { "epoch": 0.62, "learning_rate": 1.572618904965882e-05, "loss": 0.7871, "step": 46365 }, { "epoch": 0.62, "learning_rate": 1.572130306583085e-05, "loss": 0.3989, "step": 46370 }, { "epoch": 0.62, "learning_rate": 1.5716417493002737e-05, "loss": 0.4868, "step": 46375 }, { "epoch": 0.62, "learning_rate": 1.5711532331390888e-05, "loss": 0.6617, "step": 46380 }, { "epoch": 0.62, "learning_rate": 1.5706647581211686e-05, "loss": 0.3344, "step": 46385 }, { "epoch": 0.62, "learning_rate": 1.5701763242681504e-05, "loss": 1.1374, "step": 46390 }, { "epoch": 0.62, "learning_rate": 1.5696879316016688e-05, "loss": 0.8373, "step": 46395 }, { "epoch": 0.62, "learning_rate": 1.569199580143359e-05, "loss": 0.7899, "step": 46400 }, { "epoch": 0.62, "learning_rate": 1.56871126991485e-05, "loss": 0.7027, "step": 46405 }, { "epoch": 0.62, "learning_rate": 1.5682230009377724e-05, "loss": 0.6274, "step": 46410 }, { "epoch": 0.62, "learning_rate": 1.5677347732337553e-05, "loss": 0.8557, "step": 46415 }, { "epoch": 0.62, "learning_rate": 1.5672465868244228e-05, "loss": 0.5785, "step": 46420 }, { "epoch": 0.62, "learning_rate": 1.5667584417314006e-05, "loss": 0.8489, "step": 46425 }, { "epoch": 0.62, "learning_rate": 1.5662703379763112e-05, "loss": 0.6454, "step": 46430 }, { "epoch": 0.62, "learning_rate": 1.5657822755807737e-05, "loss": 0.6304, "step": 46435 }, { "epoch": 0.62, "learning_rate": 1.5652942545664075e-05, "loss": 1.4773, "step": 46440 }, { "epoch": 0.62, "learning_rate": 1.5648062749548304e-05, "loss": 0.7267, "step": 46445 }, { "epoch": 0.62, "learning_rate": 1.5643183367676555e-05, "loss": 1.0498, "step": 46450 }, { "epoch": 0.62, "learning_rate": 1.563830440026498e-05, "loss": 0.4836, "step": 46455 }, { "epoch": 0.62, "learning_rate": 1.5633425847529688e-05, "loss": 1.4828, "step": 46460 }, { "epoch": 0.62, "learning_rate": 1.5628547709686765e-05, "loss": 0.4394, "step": 46465 }, { "epoch": 0.62, "learning_rate": 1.5623669986952293e-05, "loss": 0.7221, "step": 46470 }, { "epoch": 0.62, "learning_rate": 1.5618792679542345e-05, "loss": 1.0354, "step": 46475 }, { "epoch": 0.62, "learning_rate": 1.561391578767294e-05, "loss": 0.3426, "step": 46480 }, { "epoch": 0.62, "learning_rate": 1.5609039311560106e-05, "loss": 2.0265, "step": 46485 }, { "epoch": 0.62, "learning_rate": 1.5604163251419847e-05, "loss": 0.1369, "step": 46490 }, { "epoch": 0.62, "learning_rate": 1.559928760746816e-05, "loss": 0.5197, "step": 46495 }, { "epoch": 0.62, "learning_rate": 1.5594412379920993e-05, "loss": 1.5454, "step": 46500 }, { "epoch": 0.62, "learning_rate": 1.5589537568994306e-05, "loss": 0.9443, "step": 46505 }, { "epoch": 0.62, "learning_rate": 1.5584663174904032e-05, "loss": 1.0099, "step": 46510 }, { "epoch": 0.62, "learning_rate": 1.557978919786607e-05, "loss": 0.3426, "step": 46515 }, { "epoch": 0.62, "learning_rate": 1.5574915638096316e-05, "loss": 0.7861, "step": 46520 }, { "epoch": 0.62, "learning_rate": 1.557004249581065e-05, "loss": 0.2769, "step": 46525 }, { "epoch": 0.62, "learning_rate": 1.5565169771224925e-05, "loss": 0.6329, "step": 46530 }, { "epoch": 0.62, "learning_rate": 1.5560297464554975e-05, "loss": 1.1054, "step": 46535 }, { "epoch": 0.62, "learning_rate": 1.555542557601663e-05, "loss": 0.2477, "step": 46540 }, { "epoch": 0.62, "learning_rate": 1.5550554105825678e-05, "loss": 0.3641, "step": 46545 }, { "epoch": 0.62, "learning_rate": 1.5545683054197894e-05, "loss": 0.7394, "step": 46550 }, { "epoch": 0.62, "learning_rate": 1.554081242134907e-05, "loss": 0.5803, "step": 46555 }, { "epoch": 0.62, "learning_rate": 1.5535942207494923e-05, "loss": 0.2895, "step": 46560 }, { "epoch": 0.62, "learning_rate": 1.5531072412851188e-05, "loss": 0.7893, "step": 46565 }, { "epoch": 0.62, "learning_rate": 1.552620303763358e-05, "loss": 0.3631, "step": 46570 }, { "epoch": 0.62, "learning_rate": 1.5521334082057777e-05, "loss": 0.5272, "step": 46575 }, { "epoch": 0.62, "learning_rate": 1.551646554633945e-05, "loss": 0.9315, "step": 46580 }, { "epoch": 0.62, "learning_rate": 1.551159743069427e-05, "loss": 0.7121, "step": 46585 }, { "epoch": 0.62, "learning_rate": 1.550672973533784e-05, "loss": 0.9508, "step": 46590 }, { "epoch": 0.62, "learning_rate": 1.550186246048579e-05, "loss": 0.3146, "step": 46595 }, { "epoch": 0.62, "learning_rate": 1.549699560635372e-05, "loss": 0.7586, "step": 46600 }, { "epoch": 0.62, "learning_rate": 1.5492129173157204e-05, "loss": 0.744, "step": 46605 }, { "epoch": 0.62, "learning_rate": 1.548726316111179e-05, "loss": 0.4191, "step": 46610 }, { "epoch": 0.62, "learning_rate": 1.5482397570433035e-05, "loss": 0.9248, "step": 46615 }, { "epoch": 0.62, "learning_rate": 1.547753240133646e-05, "loss": 0.7309, "step": 46620 }, { "epoch": 0.62, "learning_rate": 1.5472667654037552e-05, "loss": 0.9047, "step": 46625 }, { "epoch": 0.62, "learning_rate": 1.5467803328751802e-05, "loss": 0.9843, "step": 46630 }, { "epoch": 0.62, "learning_rate": 1.5462939425694677e-05, "loss": 0.436, "step": 46635 }, { "epoch": 0.62, "learning_rate": 1.5458075945081624e-05, "loss": 0.5917, "step": 46640 }, { "epoch": 0.62, "learning_rate": 1.5453212887128064e-05, "loss": 0.4183, "step": 46645 }, { "epoch": 0.63, "learning_rate": 1.5448350252049425e-05, "loss": 0.5684, "step": 46650 }, { "epoch": 0.63, "learning_rate": 1.5443488040061076e-05, "loss": 0.8582, "step": 46655 }, { "epoch": 0.63, "learning_rate": 1.5438626251378392e-05, "loss": 0.357, "step": 46660 }, { "epoch": 0.63, "learning_rate": 1.5433764886216745e-05, "loss": 0.5427, "step": 46665 }, { "epoch": 0.63, "learning_rate": 1.5428903944791444e-05, "loss": 0.7895, "step": 46670 }, { "epoch": 0.63, "learning_rate": 1.542404342731782e-05, "loss": 0.7527, "step": 46675 }, { "epoch": 0.63, "learning_rate": 1.5419183334011163e-05, "loss": 0.9578, "step": 46680 }, { "epoch": 0.63, "learning_rate": 1.5414323665086752e-05, "loss": 0.8561, "step": 46685 }, { "epoch": 0.63, "learning_rate": 1.540946442075985e-05, "loss": 1.0475, "step": 46690 }, { "epoch": 0.63, "learning_rate": 1.54046056012457e-05, "loss": 0.7706, "step": 46695 }, { "epoch": 0.63, "learning_rate": 1.539974720675951e-05, "loss": 0.5802, "step": 46700 }, { "epoch": 0.63, "learning_rate": 1.5394889237516486e-05, "loss": 0.5572, "step": 46705 }, { "epoch": 0.63, "learning_rate": 1.539003169373182e-05, "loss": 0.438, "step": 46710 }, { "epoch": 0.63, "learning_rate": 1.5385174575620676e-05, "loss": 1.3382, "step": 46715 }, { "epoch": 0.63, "learning_rate": 1.538031788339819e-05, "loss": 0.7308, "step": 46720 }, { "epoch": 0.63, "learning_rate": 1.53754616172795e-05, "loss": 0.5802, "step": 46725 }, { "epoch": 0.63, "learning_rate": 1.537060577747972e-05, "loss": 0.722, "step": 46730 }, { "epoch": 0.63, "learning_rate": 1.5365750364213916e-05, "loss": 0.8458, "step": 46735 }, { "epoch": 0.63, "learning_rate": 1.5360895377697175e-05, "loss": 0.8373, "step": 46740 }, { "epoch": 0.63, "learning_rate": 1.5356040818144553e-05, "loss": 0.5245, "step": 46745 }, { "epoch": 0.63, "learning_rate": 1.535118668577107e-05, "loss": 0.7673, "step": 46750 }, { "epoch": 0.63, "learning_rate": 1.534633298079174e-05, "loss": 1.1652, "step": 46755 }, { "epoch": 0.63, "learning_rate": 1.5341479703421575e-05, "loss": 0.3246, "step": 46760 }, { "epoch": 0.63, "learning_rate": 1.5336626853875526e-05, "loss": 0.7859, "step": 46765 }, { "epoch": 0.63, "learning_rate": 1.5331774432368568e-05, "loss": 0.5535, "step": 46770 }, { "epoch": 0.63, "learning_rate": 1.5326922439115643e-05, "loss": 0.7943, "step": 46775 }, { "epoch": 0.63, "learning_rate": 1.5322070874331652e-05, "loss": 1.0904, "step": 46780 }, { "epoch": 0.63, "learning_rate": 1.5317219738231502e-05, "loss": 0.9346, "step": 46785 }, { "epoch": 0.63, "learning_rate": 1.5312369031030084e-05, "loss": 1.1716, "step": 46790 }, { "epoch": 0.63, "learning_rate": 1.530751875294225e-05, "loss": 0.2701, "step": 46795 }, { "epoch": 0.63, "learning_rate": 1.5302668904182837e-05, "loss": 0.3335, "step": 46800 }, { "epoch": 0.63, "learning_rate": 1.5297819484966694e-05, "loss": 0.9013, "step": 46805 }, { "epoch": 0.63, "learning_rate": 1.5292970495508598e-05, "loss": 0.8536, "step": 46810 }, { "epoch": 0.63, "learning_rate": 1.5288121936023344e-05, "loss": 0.9324, "step": 46815 }, { "epoch": 0.63, "learning_rate": 1.5283273806725705e-05, "loss": 1.0592, "step": 46820 }, { "epoch": 0.63, "learning_rate": 1.5278426107830425e-05, "loss": 1.0904, "step": 46825 }, { "epoch": 0.63, "learning_rate": 1.5273578839552232e-05, "loss": 0.5691, "step": 46830 }, { "epoch": 0.63, "learning_rate": 1.5268732002105835e-05, "loss": 1.2327, "step": 46835 }, { "epoch": 0.63, "learning_rate": 1.5263885595705936e-05, "loss": 0.5703, "step": 46840 }, { "epoch": 0.63, "learning_rate": 1.525903962056719e-05, "loss": 0.7976, "step": 46845 }, { "epoch": 0.63, "learning_rate": 1.5254194076904255e-05, "loss": 0.8867, "step": 46850 }, { "epoch": 0.63, "learning_rate": 1.5249348964931768e-05, "loss": 0.2788, "step": 46855 }, { "epoch": 0.63, "learning_rate": 1.5244504284864336e-05, "loss": 0.2934, "step": 46860 }, { "epoch": 0.63, "learning_rate": 1.5239660036916562e-05, "loss": 0.5247, "step": 46865 }, { "epoch": 0.63, "learning_rate": 1.5234816221303028e-05, "loss": 0.6094, "step": 46870 }, { "epoch": 0.63, "learning_rate": 1.5229972838238265e-05, "loss": 0.6215, "step": 46875 }, { "epoch": 0.63, "learning_rate": 1.5225129887936834e-05, "loss": 1.222, "step": 46880 }, { "epoch": 0.63, "learning_rate": 1.5220287370613257e-05, "loss": 0.5123, "step": 46885 }, { "epoch": 0.63, "learning_rate": 1.5215445286482011e-05, "loss": 1.2386, "step": 46890 }, { "epoch": 0.63, "learning_rate": 1.521060363575759e-05, "loss": 0.7789, "step": 46895 }, { "epoch": 0.63, "learning_rate": 1.5205762418654457e-05, "loss": 0.464, "step": 46900 }, { "epoch": 0.63, "learning_rate": 1.5200921635387043e-05, "loss": 1.0625, "step": 46905 }, { "epoch": 0.63, "learning_rate": 1.5196081286169783e-05, "loss": 0.7242, "step": 46910 }, { "epoch": 0.63, "learning_rate": 1.519124137121708e-05, "loss": 0.9929, "step": 46915 }, { "epoch": 0.63, "learning_rate": 1.5186401890743303e-05, "loss": 0.7712, "step": 46920 }, { "epoch": 0.63, "learning_rate": 1.5181562844962829e-05, "loss": 0.7707, "step": 46925 }, { "epoch": 0.63, "learning_rate": 1.5176724234090007e-05, "loss": 0.7062, "step": 46930 }, { "epoch": 0.63, "learning_rate": 1.5171886058339146e-05, "loss": 1.3418, "step": 46935 }, { "epoch": 0.63, "learning_rate": 1.5167048317924567e-05, "loss": 0.4998, "step": 46940 }, { "epoch": 0.63, "learning_rate": 1.5162211013060557e-05, "loss": 0.6008, "step": 46945 }, { "epoch": 0.63, "learning_rate": 1.515737414396139e-05, "loss": 1.1768, "step": 46950 }, { "epoch": 0.63, "learning_rate": 1.5152537710841297e-05, "loss": 0.5972, "step": 46955 }, { "epoch": 0.63, "learning_rate": 1.514770171391452e-05, "loss": 0.3271, "step": 46960 }, { "epoch": 0.63, "learning_rate": 1.5142866153395269e-05, "loss": 1.1338, "step": 46965 }, { "epoch": 0.63, "learning_rate": 1.5138031029497734e-05, "loss": 0.2253, "step": 46970 }, { "epoch": 0.63, "learning_rate": 1.5133196342436081e-05, "loss": 0.5262, "step": 46975 }, { "epoch": 0.63, "learning_rate": 1.5128362092424474e-05, "loss": 0.8639, "step": 46980 }, { "epoch": 0.63, "learning_rate": 1.512352827967704e-05, "loss": 0.4822, "step": 46985 }, { "epoch": 0.63, "learning_rate": 1.5118694904407888e-05, "loss": 0.496, "step": 46990 }, { "epoch": 0.63, "learning_rate": 1.5113861966831127e-05, "loss": 0.3719, "step": 46995 }, { "epoch": 0.63, "learning_rate": 1.5109029467160818e-05, "loss": 0.505, "step": 47000 }, { "epoch": 0.63, "learning_rate": 1.5104197405611014e-05, "loss": 0.7274, "step": 47005 }, { "epoch": 0.63, "learning_rate": 1.5099365782395766e-05, "loss": 0.9203, "step": 47010 }, { "epoch": 0.63, "learning_rate": 1.5094534597729076e-05, "loss": 1.2685, "step": 47015 }, { "epoch": 0.63, "learning_rate": 1.5089703851824948e-05, "loss": 0.6108, "step": 47020 }, { "epoch": 0.63, "learning_rate": 1.508487354489737e-05, "loss": 0.0844, "step": 47025 }, { "epoch": 0.63, "learning_rate": 1.5080043677160282e-05, "loss": 1.1922, "step": 47030 }, { "epoch": 0.63, "learning_rate": 1.507521424882763e-05, "loss": 1.1925, "step": 47035 }, { "epoch": 0.63, "learning_rate": 1.5070385260113336e-05, "loss": 0.4662, "step": 47040 }, { "epoch": 0.63, "learning_rate": 1.5065556711231299e-05, "loss": 0.9226, "step": 47045 }, { "epoch": 0.63, "learning_rate": 1.5060728602395397e-05, "loss": 0.5211, "step": 47050 }, { "epoch": 0.63, "learning_rate": 1.5055900933819492e-05, "loss": 0.4031, "step": 47055 }, { "epoch": 0.63, "learning_rate": 1.5051073705717438e-05, "loss": 0.8512, "step": 47060 }, { "epoch": 0.63, "learning_rate": 1.5046246918303036e-05, "loss": 0.5422, "step": 47065 }, { "epoch": 0.63, "learning_rate": 1.5041420571790099e-05, "loss": 0.4991, "step": 47070 }, { "epoch": 0.63, "learning_rate": 1.5036594666392415e-05, "loss": 1.1721, "step": 47075 }, { "epoch": 0.63, "learning_rate": 1.5031769202323737e-05, "loss": 0.244, "step": 47080 }, { "epoch": 0.63, "learning_rate": 1.502694417979781e-05, "loss": 0.6449, "step": 47085 }, { "epoch": 0.63, "learning_rate": 1.5022119599028373e-05, "loss": 0.7834, "step": 47090 }, { "epoch": 0.63, "learning_rate": 1.5018260252621092e-05, "loss": 0.8737, "step": 47095 }, { "epoch": 0.63, "learning_rate": 1.5013436467551829e-05, "loss": 0.4552, "step": 47100 }, { "epoch": 0.63, "learning_rate": 1.5008613124837384e-05, "loss": 0.2062, "step": 47105 }, { "epoch": 0.63, "learning_rate": 1.5003790224691377e-05, "loss": 0.505, "step": 47110 }, { "epoch": 0.63, "learning_rate": 1.499896776732746e-05, "loss": 0.4686, "step": 47115 }, { "epoch": 0.63, "learning_rate": 1.4994145752959238e-05, "loss": 0.7247, "step": 47120 }, { "epoch": 0.63, "learning_rate": 1.4989324181800299e-05, "loss": 0.8322, "step": 47125 }, { "epoch": 0.63, "learning_rate": 1.4984503054064218e-05, "loss": 0.7791, "step": 47130 }, { "epoch": 0.63, "learning_rate": 1.4979682369964554e-05, "loss": 0.905, "step": 47135 }, { "epoch": 0.63, "learning_rate": 1.497486212971482e-05, "loss": 0.5911, "step": 47140 }, { "epoch": 0.63, "learning_rate": 1.497004233352854e-05, "loss": 0.5918, "step": 47145 }, { "epoch": 0.63, "learning_rate": 1.4965222981619212e-05, "loss": 0.6466, "step": 47150 }, { "epoch": 0.63, "learning_rate": 1.4960404074200295e-05, "loss": 1.1367, "step": 47155 }, { "epoch": 0.63, "learning_rate": 1.4955585611485257e-05, "loss": 0.6029, "step": 47160 }, { "epoch": 0.63, "learning_rate": 1.4950767593687531e-05, "loss": 0.9299, "step": 47165 }, { "epoch": 0.63, "learning_rate": 1.4945950021020522e-05, "loss": 0.6756, "step": 47170 }, { "epoch": 0.63, "learning_rate": 1.4941132893697623e-05, "loss": 0.498, "step": 47175 }, { "epoch": 0.63, "learning_rate": 1.4936316211932219e-05, "loss": 0.7837, "step": 47180 }, { "epoch": 0.63, "learning_rate": 1.4931499975937657e-05, "loss": 0.754, "step": 47185 }, { "epoch": 0.63, "learning_rate": 1.492668418592727e-05, "loss": 0.5188, "step": 47190 }, { "epoch": 0.63, "learning_rate": 1.4921868842114396e-05, "loss": 0.4596, "step": 47195 }, { "epoch": 0.63, "learning_rate": 1.4917053944712297e-05, "loss": 0.4427, "step": 47200 }, { "epoch": 0.63, "learning_rate": 1.4912239493934266e-05, "loss": 0.6492, "step": 47205 }, { "epoch": 0.63, "learning_rate": 1.4907425489993555e-05, "loss": 0.3784, "step": 47210 }, { "epoch": 0.63, "learning_rate": 1.4902611933103416e-05, "loss": 0.5451, "step": 47215 }, { "epoch": 0.63, "learning_rate": 1.4897798823477043e-05, "loss": 1.3255, "step": 47220 }, { "epoch": 0.63, "learning_rate": 1.4892986161327643e-05, "loss": 0.3924, "step": 47225 }, { "epoch": 0.63, "learning_rate": 1.48881739468684e-05, "loss": 0.323, "step": 47230 }, { "epoch": 0.63, "learning_rate": 1.4883362180312455e-05, "loss": 0.2895, "step": 47235 }, { "epoch": 0.63, "learning_rate": 1.4878550861872953e-05, "loss": 0.7898, "step": 47240 }, { "epoch": 0.63, "learning_rate": 1.4873739991763025e-05, "loss": 0.6411, "step": 47245 }, { "epoch": 0.63, "learning_rate": 1.4868929570195741e-05, "loss": 1.4158, "step": 47250 }, { "epoch": 0.63, "learning_rate": 1.4864119597384197e-05, "loss": 0.6901, "step": 47255 }, { "epoch": 0.63, "learning_rate": 1.485931007354145e-05, "loss": 0.6569, "step": 47260 }, { "epoch": 0.63, "learning_rate": 1.4854500998880527e-05, "loss": 1.6439, "step": 47265 }, { "epoch": 0.63, "learning_rate": 1.4849692373614455e-05, "loss": 0.947, "step": 47270 }, { "epoch": 0.63, "learning_rate": 1.4844884197956244e-05, "loss": 0.8831, "step": 47275 }, { "epoch": 0.63, "learning_rate": 1.4840076472118844e-05, "loss": 0.4366, "step": 47280 }, { "epoch": 0.63, "learning_rate": 1.4835269196315229e-05, "loss": 0.842, "step": 47285 }, { "epoch": 0.63, "learning_rate": 1.4830462370758341e-05, "loss": 0.127, "step": 47290 }, { "epoch": 0.63, "learning_rate": 1.4825655995661091e-05, "loss": 0.3016, "step": 47295 }, { "epoch": 0.63, "learning_rate": 1.4820850071236374e-05, "loss": 0.7352, "step": 47300 }, { "epoch": 0.63, "learning_rate": 1.481604459769709e-05, "loss": 1.0496, "step": 47305 }, { "epoch": 0.63, "learning_rate": 1.481123957525607e-05, "loss": 0.8379, "step": 47310 }, { "epoch": 0.63, "learning_rate": 1.4806435004126157e-05, "loss": 1.0228, "step": 47315 }, { "epoch": 0.63, "learning_rate": 1.4801630884520184e-05, "loss": 0.8687, "step": 47320 }, { "epoch": 0.63, "learning_rate": 1.4796827216650949e-05, "loss": 0.5576, "step": 47325 }, { "epoch": 0.63, "learning_rate": 1.4792024000731219e-05, "loss": 0.5417, "step": 47330 }, { "epoch": 0.63, "learning_rate": 1.4787221236973752e-05, "loss": 0.8286, "step": 47335 }, { "epoch": 0.63, "learning_rate": 1.4782418925591296e-05, "loss": 0.6662, "step": 47340 }, { "epoch": 0.63, "learning_rate": 1.4777617066796561e-05, "loss": 0.8354, "step": 47345 }, { "epoch": 0.63, "learning_rate": 1.477281566080225e-05, "loss": 0.6466, "step": 47350 }, { "epoch": 0.63, "learning_rate": 1.4768014707821048e-05, "loss": 0.5345, "step": 47355 }, { "epoch": 0.63, "learning_rate": 1.4763214208065598e-05, "loss": 1.0203, "step": 47360 }, { "epoch": 0.63, "learning_rate": 1.4758414161748547e-05, "loss": 0.5061, "step": 47365 }, { "epoch": 0.63, "learning_rate": 1.4753614569082513e-05, "loss": 1.2171, "step": 47370 }, { "epoch": 0.63, "learning_rate": 1.4748815430280089e-05, "loss": 0.986, "step": 47375 }, { "epoch": 0.63, "learning_rate": 1.4744016745553854e-05, "loss": 0.3383, "step": 47380 }, { "epoch": 0.63, "learning_rate": 1.4739218515116379e-05, "loss": 0.7876, "step": 47385 }, { "epoch": 0.63, "learning_rate": 1.4734420739180183e-05, "loss": 0.7204, "step": 47390 }, { "epoch": 0.64, "learning_rate": 1.472962341795779e-05, "loss": 0.5911, "step": 47395 }, { "epoch": 0.64, "learning_rate": 1.4724826551661702e-05, "loss": 0.6242, "step": 47400 }, { "epoch": 0.64, "learning_rate": 1.472003014050439e-05, "loss": 0.2745, "step": 47405 }, { "epoch": 0.64, "learning_rate": 1.4715234184698311e-05, "loss": 0.8172, "step": 47410 }, { "epoch": 0.64, "learning_rate": 1.4710438684455918e-05, "loss": 0.7541, "step": 47415 }, { "epoch": 0.64, "learning_rate": 1.4705643639989602e-05, "loss": 0.7044, "step": 47420 }, { "epoch": 0.64, "learning_rate": 1.4700849051511767e-05, "loss": 0.7283, "step": 47425 }, { "epoch": 0.64, "learning_rate": 1.4696054919234797e-05, "loss": 0.8209, "step": 47430 }, { "epoch": 0.64, "learning_rate": 1.469126124337106e-05, "loss": 0.5544, "step": 47435 }, { "epoch": 0.64, "learning_rate": 1.4686468024132866e-05, "loss": 1.0529, "step": 47440 }, { "epoch": 0.64, "learning_rate": 1.4681675261732536e-05, "loss": 1.1545, "step": 47445 }, { "epoch": 0.64, "learning_rate": 1.4676882956382382e-05, "loss": 0.7526, "step": 47450 }, { "epoch": 0.64, "learning_rate": 1.4672091108294662e-05, "loss": 0.8708, "step": 47455 }, { "epoch": 0.64, "learning_rate": 1.4667299717681631e-05, "loss": 0.7755, "step": 47460 }, { "epoch": 0.64, "learning_rate": 1.4662508784755547e-05, "loss": 1.0578, "step": 47465 }, { "epoch": 0.64, "learning_rate": 1.4657718309728593e-05, "loss": 0.3532, "step": 47470 }, { "epoch": 0.64, "learning_rate": 1.465292829281298e-05, "loss": 0.7243, "step": 47475 }, { "epoch": 0.64, "learning_rate": 1.4648138734220881e-05, "loss": 1.1016, "step": 47480 }, { "epoch": 0.64, "learning_rate": 1.4643349634164443e-05, "loss": 0.434, "step": 47485 }, { "epoch": 0.64, "learning_rate": 1.4638560992855805e-05, "loss": 0.7327, "step": 47490 }, { "epoch": 0.64, "learning_rate": 1.4633772810507088e-05, "loss": 0.1441, "step": 47495 }, { "epoch": 0.64, "learning_rate": 1.4628985087330366e-05, "loss": 0.6567, "step": 47500 }, { "epoch": 0.64, "learning_rate": 1.4624197823537717e-05, "loss": 1.1289, "step": 47505 }, { "epoch": 0.64, "learning_rate": 1.4619411019341204e-05, "loss": 0.2215, "step": 47510 }, { "epoch": 0.64, "learning_rate": 1.4614624674952842e-05, "loss": 1.6186, "step": 47515 }, { "epoch": 0.64, "learning_rate": 1.4609838790584652e-05, "loss": 1.108, "step": 47520 }, { "epoch": 0.64, "learning_rate": 1.4605053366448635e-05, "loss": 0.3826, "step": 47525 }, { "epoch": 0.64, "learning_rate": 1.4600268402756733e-05, "loss": 0.8496, "step": 47530 }, { "epoch": 0.64, "learning_rate": 1.4595483899720919e-05, "loss": 1.5929, "step": 47535 }, { "epoch": 0.64, "learning_rate": 1.459069985755312e-05, "loss": 1.1618, "step": 47540 }, { "epoch": 0.64, "learning_rate": 1.458591627646524e-05, "loss": 1.1074, "step": 47545 }, { "epoch": 0.64, "learning_rate": 1.4581133156669157e-05, "loss": 0.6245, "step": 47550 }, { "epoch": 0.64, "learning_rate": 1.4576350498376768e-05, "loss": 0.3024, "step": 47555 }, { "epoch": 0.64, "learning_rate": 1.4571568301799898e-05, "loss": 0.6941, "step": 47560 }, { "epoch": 0.64, "learning_rate": 1.456678656715038e-05, "loss": 0.8416, "step": 47565 }, { "epoch": 0.64, "learning_rate": 1.4562005294640015e-05, "loss": 0.8468, "step": 47570 }, { "epoch": 0.64, "learning_rate": 1.4557224484480605e-05, "loss": 0.5544, "step": 47575 }, { "epoch": 0.64, "learning_rate": 1.4552444136883907e-05, "loss": 0.8303, "step": 47580 }, { "epoch": 0.64, "learning_rate": 1.4547664252061655e-05, "loss": 1.215, "step": 47585 }, { "epoch": 0.64, "learning_rate": 1.4542884830225607e-05, "loss": 0.3331, "step": 47590 }, { "epoch": 0.64, "learning_rate": 1.4538105871587427e-05, "loss": 0.7712, "step": 47595 }, { "epoch": 0.64, "learning_rate": 1.4533327376358825e-05, "loss": 1.0795, "step": 47600 }, { "epoch": 0.64, "learning_rate": 1.4528549344751458e-05, "loss": 0.8512, "step": 47605 }, { "epoch": 0.64, "learning_rate": 1.4523771776976955e-05, "loss": 0.6291, "step": 47610 }, { "epoch": 0.64, "learning_rate": 1.4518994673246963e-05, "loss": 0.5613, "step": 47615 }, { "epoch": 0.64, "learning_rate": 1.4514218033773076e-05, "loss": 0.8987, "step": 47620 }, { "epoch": 0.64, "learning_rate": 1.4509441858766865e-05, "loss": 0.5179, "step": 47625 }, { "epoch": 0.64, "learning_rate": 1.450466614843989e-05, "loss": 0.5085, "step": 47630 }, { "epoch": 0.64, "learning_rate": 1.449989090300371e-05, "loss": 0.507, "step": 47635 }, { "epoch": 0.64, "learning_rate": 1.4495116122669832e-05, "loss": 0.5992, "step": 47640 }, { "epoch": 0.64, "learning_rate": 1.4490341807649743e-05, "loss": 1.2164, "step": 47645 }, { "epoch": 0.64, "learning_rate": 1.4485567958154948e-05, "loss": 0.8462, "step": 47650 }, { "epoch": 0.64, "learning_rate": 1.4480794574396886e-05, "loss": 0.6959, "step": 47655 }, { "epoch": 0.64, "learning_rate": 1.4476021656586992e-05, "loss": 1.0746, "step": 47660 }, { "epoch": 0.64, "learning_rate": 1.4471249204936696e-05, "loss": 1.0739, "step": 47665 }, { "epoch": 0.64, "learning_rate": 1.4466477219657386e-05, "loss": 0.3873, "step": 47670 }, { "epoch": 0.64, "learning_rate": 1.446170570096044e-05, "loss": 1.1549, "step": 47675 }, { "epoch": 0.64, "learning_rate": 1.4456934649057199e-05, "loss": 0.5823, "step": 47680 }, { "epoch": 0.64, "learning_rate": 1.4452164064159019e-05, "loss": 0.5628, "step": 47685 }, { "epoch": 0.64, "learning_rate": 1.44473939464772e-05, "loss": 1.951, "step": 47690 }, { "epoch": 0.64, "learning_rate": 1.4442624296223028e-05, "loss": 1.4315, "step": 47695 }, { "epoch": 0.64, "learning_rate": 1.44378551136078e-05, "loss": 0.4031, "step": 47700 }, { "epoch": 0.64, "learning_rate": 1.4433086398842732e-05, "loss": 0.7677, "step": 47705 }, { "epoch": 0.64, "learning_rate": 1.442831815213908e-05, "loss": 0.7159, "step": 47710 }, { "epoch": 0.64, "learning_rate": 1.4423550373708048e-05, "loss": 0.4084, "step": 47715 }, { "epoch": 0.64, "learning_rate": 1.441878306376081e-05, "loss": 0.9237, "step": 47720 }, { "epoch": 0.64, "learning_rate": 1.4414016222508559e-05, "loss": 0.7922, "step": 47725 }, { "epoch": 0.64, "learning_rate": 1.4409249850162426e-05, "loss": 0.6515, "step": 47730 }, { "epoch": 0.64, "learning_rate": 1.4404483946933542e-05, "loss": 0.8271, "step": 47735 }, { "epoch": 0.64, "learning_rate": 1.4399718513033e-05, "loss": 1.7095, "step": 47740 }, { "epoch": 0.64, "learning_rate": 1.4394953548671907e-05, "loss": 0.8525, "step": 47745 }, { "epoch": 0.64, "learning_rate": 1.439018905406132e-05, "loss": 0.2976, "step": 47750 }, { "epoch": 0.64, "learning_rate": 1.4385425029412263e-05, "loss": 0.543, "step": 47755 }, { "epoch": 0.64, "learning_rate": 1.4380661474935791e-05, "loss": 0.229, "step": 47760 }, { "epoch": 0.64, "learning_rate": 1.4375898390842884e-05, "loss": 0.328, "step": 47765 }, { "epoch": 0.64, "learning_rate": 1.4371135777344519e-05, "loss": 0.3472, "step": 47770 }, { "epoch": 0.64, "learning_rate": 1.4366373634651673e-05, "loss": 1.1272, "step": 47775 }, { "epoch": 0.64, "learning_rate": 1.4361611962975278e-05, "loss": 0.1771, "step": 47780 }, { "epoch": 0.64, "learning_rate": 1.435685076252625e-05, "loss": 0.5428, "step": 47785 }, { "epoch": 0.64, "learning_rate": 1.4352090033515478e-05, "loss": 0.7791, "step": 47790 }, { "epoch": 0.64, "learning_rate": 1.4347329776153855e-05, "loss": 0.7101, "step": 47795 }, { "epoch": 0.64, "learning_rate": 1.4342569990652233e-05, "loss": 1.3205, "step": 47800 }, { "epoch": 0.64, "learning_rate": 1.4337810677221431e-05, "loss": 0.4602, "step": 47805 }, { "epoch": 0.64, "learning_rate": 1.4333051836072298e-05, "loss": 0.5081, "step": 47810 }, { "epoch": 0.64, "learning_rate": 1.432829346741558e-05, "loss": 0.4241, "step": 47815 }, { "epoch": 0.64, "learning_rate": 1.4323535571462082e-05, "loss": 0.5316, "step": 47820 }, { "epoch": 0.64, "learning_rate": 1.4318778148422548e-05, "loss": 0.6571, "step": 47825 }, { "epoch": 0.64, "learning_rate": 1.4314021198507693e-05, "loss": 0.3326, "step": 47830 }, { "epoch": 0.64, "learning_rate": 1.4309264721928251e-05, "loss": 0.5295, "step": 47835 }, { "epoch": 0.64, "learning_rate": 1.43045087188949e-05, "loss": 0.6547, "step": 47840 }, { "epoch": 0.64, "learning_rate": 1.429975318961829e-05, "loss": 1.3684, "step": 47845 }, { "epoch": 0.64, "learning_rate": 1.4294998134309096e-05, "loss": 0.8914, "step": 47850 }, { "epoch": 0.64, "learning_rate": 1.4290243553177923e-05, "loss": 0.8402, "step": 47855 }, { "epoch": 0.64, "learning_rate": 1.4285489446435388e-05, "loss": 0.7034, "step": 47860 }, { "epoch": 0.64, "learning_rate": 1.4280735814292054e-05, "loss": 0.52, "step": 47865 }, { "epoch": 0.64, "learning_rate": 1.427598265695851e-05, "loss": 1.171, "step": 47870 }, { "epoch": 0.64, "learning_rate": 1.4271229974645279e-05, "loss": 1.2078, "step": 47875 }, { "epoch": 0.64, "learning_rate": 1.426647776756288e-05, "loss": 1.3094, "step": 47880 }, { "epoch": 0.64, "learning_rate": 1.4261726035921824e-05, "loss": 1.119, "step": 47885 }, { "epoch": 0.64, "learning_rate": 1.4256974779932586e-05, "loss": 0.4007, "step": 47890 }, { "epoch": 0.64, "learning_rate": 1.4252223999805617e-05, "loss": 0.9432, "step": 47895 }, { "epoch": 0.64, "learning_rate": 1.4247473695751345e-05, "loss": 0.4962, "step": 47900 }, { "epoch": 0.64, "learning_rate": 1.4242723867980207e-05, "loss": 0.6116, "step": 47905 }, { "epoch": 0.64, "learning_rate": 1.4237974516702585e-05, "loss": 1.24, "step": 47910 }, { "epoch": 0.64, "learning_rate": 1.4233225642128841e-05, "loss": 0.641, "step": 47915 }, { "epoch": 0.64, "learning_rate": 1.4228477244469356e-05, "loss": 0.2953, "step": 47920 }, { "epoch": 0.64, "learning_rate": 1.422372932393442e-05, "loss": 1.0832, "step": 47925 }, { "epoch": 0.64, "learning_rate": 1.4218981880734374e-05, "loss": 0.5495, "step": 47930 }, { "epoch": 0.64, "learning_rate": 1.4214234915079495e-05, "loss": 0.3809, "step": 47935 }, { "epoch": 0.64, "learning_rate": 1.4209488427180039e-05, "loss": 1.1205, "step": 47940 }, { "epoch": 0.64, "learning_rate": 1.4204742417246275e-05, "loss": 0.8902, "step": 47945 }, { "epoch": 0.64, "learning_rate": 1.4199996885488414e-05, "loss": 0.6746, "step": 47950 }, { "epoch": 0.64, "learning_rate": 1.4195251832116647e-05, "loss": 0.6336, "step": 47955 }, { "epoch": 0.64, "learning_rate": 1.4190507257341183e-05, "loss": 1.107, "step": 47960 }, { "epoch": 0.64, "learning_rate": 1.4185763161372168e-05, "loss": 0.2442, "step": 47965 }, { "epoch": 0.64, "learning_rate": 1.4181019544419743e-05, "loss": 0.4808, "step": 47970 }, { "epoch": 0.64, "learning_rate": 1.4176276406694018e-05, "loss": 0.7785, "step": 47975 }, { "epoch": 0.64, "learning_rate": 1.4171533748405105e-05, "loss": 0.8764, "step": 47980 }, { "epoch": 0.64, "learning_rate": 1.4166791569763077e-05, "loss": 0.4007, "step": 47985 }, { "epoch": 0.64, "learning_rate": 1.4162049870977972e-05, "loss": 0.5974, "step": 47990 }, { "epoch": 0.64, "learning_rate": 1.4157308652259852e-05, "loss": 0.8718, "step": 47995 }, { "epoch": 0.64, "learning_rate": 1.4152567913818712e-05, "loss": 0.3535, "step": 48000 }, { "epoch": 0.64, "learning_rate": 1.4147827655864546e-05, "loss": 0.5588, "step": 48005 }, { "epoch": 0.64, "learning_rate": 1.4143087878607315e-05, "loss": 0.8992, "step": 48010 }, { "epoch": 0.64, "learning_rate": 1.4138348582256983e-05, "loss": 1.1868, "step": 48015 }, { "epoch": 0.64, "learning_rate": 1.413360976702347e-05, "loss": 0.4637, "step": 48020 }, { "epoch": 0.64, "learning_rate": 1.4128871433116669e-05, "loss": 1.2196, "step": 48025 }, { "epoch": 0.64, "learning_rate": 1.4124133580746501e-05, "loss": 1.4004, "step": 48030 }, { "epoch": 0.64, "learning_rate": 1.4119396210122782e-05, "loss": 0.6188, "step": 48035 }, { "epoch": 0.64, "learning_rate": 1.411465932145539e-05, "loss": 0.6561, "step": 48040 }, { "epoch": 0.64, "learning_rate": 1.4109922914954133e-05, "loss": 1.079, "step": 48045 }, { "epoch": 0.64, "learning_rate": 1.4105186990828794e-05, "loss": 0.9145, "step": 48050 }, { "epoch": 0.64, "learning_rate": 1.4100451549289182e-05, "loss": 0.6041, "step": 48055 }, { "epoch": 0.64, "learning_rate": 1.4095716590545033e-05, "loss": 0.3892, "step": 48060 }, { "epoch": 0.64, "learning_rate": 1.4090982114806082e-05, "loss": 0.7939, "step": 48065 }, { "epoch": 0.64, "learning_rate": 1.4086248122282052e-05, "loss": 0.7114, "step": 48070 }, { "epoch": 0.64, "learning_rate": 1.4081514613182633e-05, "loss": 0.317, "step": 48075 }, { "epoch": 0.64, "learning_rate": 1.4076781587717494e-05, "loss": 0.233, "step": 48080 }, { "epoch": 0.64, "learning_rate": 1.4072049046096272e-05, "loss": 0.2805, "step": 48085 }, { "epoch": 0.64, "learning_rate": 1.4067316988528617e-05, "loss": 1.2151, "step": 48090 }, { "epoch": 0.64, "learning_rate": 1.4062585415224125e-05, "loss": 0.0838, "step": 48095 }, { "epoch": 0.64, "learning_rate": 1.4057854326392373e-05, "loss": 0.4438, "step": 48100 }, { "epoch": 0.64, "learning_rate": 1.405312372224294e-05, "loss": 0.7485, "step": 48105 }, { "epoch": 0.64, "learning_rate": 1.404839360298536e-05, "loss": 0.4096, "step": 48110 }, { "epoch": 0.64, "learning_rate": 1.4043663968829151e-05, "loss": 0.6576, "step": 48115 }, { "epoch": 0.64, "learning_rate": 1.4038934819983812e-05, "loss": 0.4413, "step": 48120 }, { "epoch": 0.64, "learning_rate": 1.403420615665883e-05, "loss": 1.083, "step": 48125 }, { "epoch": 0.64, "learning_rate": 1.4029477979063658e-05, "loss": 1.3785, "step": 48130 }, { "epoch": 0.64, "learning_rate": 1.4024750287407718e-05, "loss": 0.3401, "step": 48135 }, { "epoch": 0.65, "learning_rate": 1.4020023081900448e-05, "loss": 0.5714, "step": 48140 }, { "epoch": 0.65, "learning_rate": 1.4015296362751206e-05, "loss": 0.28, "step": 48145 }, { "epoch": 0.65, "learning_rate": 1.4010570130169393e-05, "loss": 0.9687, "step": 48150 }, { "epoch": 0.65, "learning_rate": 1.4005844384364345e-05, "loss": 0.3621, "step": 48155 }, { "epoch": 0.65, "learning_rate": 1.4001119125545376e-05, "loss": 0.7232, "step": 48160 }, { "epoch": 0.65, "learning_rate": 1.3996394353921816e-05, "loss": 0.3725, "step": 48165 }, { "epoch": 0.65, "learning_rate": 1.3991670069702936e-05, "loss": 0.7599, "step": 48170 }, { "epoch": 0.65, "learning_rate": 1.398694627309799e-05, "loss": 0.1529, "step": 48175 }, { "epoch": 0.65, "learning_rate": 1.3982222964316238e-05, "loss": 0.6939, "step": 48180 }, { "epoch": 0.65, "learning_rate": 1.3977500143566885e-05, "loss": 0.6735, "step": 48185 }, { "epoch": 0.65, "learning_rate": 1.3972777811059134e-05, "loss": 0.7558, "step": 48190 }, { "epoch": 0.65, "learning_rate": 1.396805596700215e-05, "loss": 0.8147, "step": 48195 }, { "epoch": 0.65, "learning_rate": 1.3963334611605105e-05, "loss": 0.4543, "step": 48200 }, { "epoch": 0.65, "learning_rate": 1.395861374507712e-05, "loss": 0.865, "step": 48205 }, { "epoch": 0.65, "learning_rate": 1.39538933676273e-05, "loss": 1.076, "step": 48210 }, { "epoch": 0.65, "learning_rate": 1.3949173479464761e-05, "loss": 0.2431, "step": 48215 }, { "epoch": 0.65, "learning_rate": 1.394445408079853e-05, "loss": 0.2349, "step": 48220 }, { "epoch": 0.65, "learning_rate": 1.3939735171837686e-05, "loss": 0.8728, "step": 48225 }, { "epoch": 0.65, "learning_rate": 1.393501675279123e-05, "loss": 0.4904, "step": 48230 }, { "epoch": 0.65, "learning_rate": 1.3930298823868184e-05, "loss": 0.8737, "step": 48235 }, { "epoch": 0.65, "learning_rate": 1.3925581385277523e-05, "loss": 0.574, "step": 48240 }, { "epoch": 0.65, "learning_rate": 1.3920864437228193e-05, "loss": 0.82, "step": 48245 }, { "epoch": 0.65, "learning_rate": 1.391614797992916e-05, "loss": 0.3876, "step": 48250 }, { "epoch": 0.65, "learning_rate": 1.3911432013589298e-05, "loss": 0.596, "step": 48255 }, { "epoch": 0.65, "learning_rate": 1.390671653841753e-05, "loss": 0.4941, "step": 48260 }, { "epoch": 0.65, "learning_rate": 1.3902001554622735e-05, "loss": 0.2665, "step": 48265 }, { "epoch": 0.65, "learning_rate": 1.3897287062413732e-05, "loss": 0.4798, "step": 48270 }, { "epoch": 0.65, "learning_rate": 1.389257306199938e-05, "loss": 0.8739, "step": 48275 }, { "epoch": 0.65, "learning_rate": 1.388785955358847e-05, "loss": 0.4959, "step": 48280 }, { "epoch": 0.65, "learning_rate": 1.3883146537389779e-05, "loss": 0.8883, "step": 48285 }, { "epoch": 0.65, "learning_rate": 1.3878434013612091e-05, "loss": 0.9975, "step": 48290 }, { "epoch": 0.65, "learning_rate": 1.3873721982464139e-05, "loss": 0.4886, "step": 48295 }, { "epoch": 0.65, "learning_rate": 1.3869010444154634e-05, "loss": 0.7087, "step": 48300 }, { "epoch": 0.65, "learning_rate": 1.3864299398892275e-05, "loss": 0.6027, "step": 48305 }, { "epoch": 0.65, "learning_rate": 1.3859588846885752e-05, "loss": 0.8019, "step": 48310 }, { "epoch": 0.65, "learning_rate": 1.3854878788343706e-05, "loss": 0.7916, "step": 48315 }, { "epoch": 0.65, "learning_rate": 1.3850169223474768e-05, "loss": 1.2357, "step": 48320 }, { "epoch": 0.65, "learning_rate": 1.3845460152487566e-05, "loss": 0.6313, "step": 48325 }, { "epoch": 0.65, "learning_rate": 1.384075157559066e-05, "loss": 0.5699, "step": 48330 }, { "epoch": 0.65, "learning_rate": 1.383604349299264e-05, "loss": 0.7792, "step": 48335 }, { "epoch": 0.65, "learning_rate": 1.3831335904902031e-05, "loss": 0.3878, "step": 48340 }, { "epoch": 0.65, "learning_rate": 1.3826628811527375e-05, "loss": 0.5728, "step": 48345 }, { "epoch": 0.65, "learning_rate": 1.3821922213077168e-05, "loss": 0.5819, "step": 48350 }, { "epoch": 0.65, "learning_rate": 1.3817216109759874e-05, "loss": 0.724, "step": 48355 }, { "epoch": 0.65, "learning_rate": 1.3812510501783976e-05, "loss": 0.8216, "step": 48360 }, { "epoch": 0.65, "learning_rate": 1.3807805389357878e-05, "loss": 0.9593, "step": 48365 }, { "epoch": 0.65, "learning_rate": 1.3803100772690009e-05, "loss": 1.0691, "step": 48370 }, { "epoch": 0.65, "learning_rate": 1.3798396651988777e-05, "loss": 0.5589, "step": 48375 }, { "epoch": 0.65, "learning_rate": 1.3793693027462511e-05, "loss": 0.3336, "step": 48380 }, { "epoch": 0.65, "learning_rate": 1.3788989899319593e-05, "loss": 0.9957, "step": 48385 }, { "epoch": 0.65, "learning_rate": 1.3784287267768337e-05, "loss": 0.6479, "step": 48390 }, { "epoch": 0.65, "learning_rate": 1.3779585133017034e-05, "loss": 0.4179, "step": 48395 }, { "epoch": 0.65, "learning_rate": 1.3774883495273985e-05, "loss": 1.0269, "step": 48400 }, { "epoch": 0.65, "learning_rate": 1.377018235474744e-05, "loss": 0.4434, "step": 48405 }, { "epoch": 0.65, "learning_rate": 1.3765481711645634e-05, "loss": 1.4102, "step": 48410 }, { "epoch": 0.65, "learning_rate": 1.3760781566176778e-05, "loss": 1.0272, "step": 48415 }, { "epoch": 0.65, "learning_rate": 1.3756081918549077e-05, "loss": 0.4522, "step": 48420 }, { "epoch": 0.65, "learning_rate": 1.3751382768970695e-05, "loss": 0.6573, "step": 48425 }, { "epoch": 0.65, "learning_rate": 1.3746684117649772e-05, "loss": 0.8188, "step": 48430 }, { "epoch": 0.65, "learning_rate": 1.3741985964794465e-05, "loss": 0.9373, "step": 48435 }, { "epoch": 0.65, "learning_rate": 1.3737288310612838e-05, "loss": 0.6501, "step": 48440 }, { "epoch": 0.65, "learning_rate": 1.3732591155313001e-05, "loss": 0.6798, "step": 48445 }, { "epoch": 0.65, "learning_rate": 1.3727894499103e-05, "loss": 0.6637, "step": 48450 }, { "epoch": 0.65, "learning_rate": 1.3723198342190888e-05, "loss": 1.1569, "step": 48455 }, { "epoch": 0.65, "learning_rate": 1.3718502684784674e-05, "loss": 1.0814, "step": 48460 }, { "epoch": 0.65, "learning_rate": 1.3713807527092343e-05, "loss": 1.2965, "step": 48465 }, { "epoch": 0.65, "learning_rate": 1.3709112869321891e-05, "loss": 1.12, "step": 48470 }, { "epoch": 0.65, "learning_rate": 1.3704418711681236e-05, "loss": 0.7093, "step": 48475 }, { "epoch": 0.65, "learning_rate": 1.3699725054378321e-05, "loss": 0.7866, "step": 48480 }, { "epoch": 0.65, "learning_rate": 1.3695031897621072e-05, "loss": 0.9804, "step": 48485 }, { "epoch": 0.65, "learning_rate": 1.3690339241617334e-05, "loss": 0.8256, "step": 48490 }, { "epoch": 0.65, "learning_rate": 1.3685647086574999e-05, "loss": 0.6738, "step": 48495 }, { "epoch": 0.65, "learning_rate": 1.3680955432701889e-05, "loss": 0.2726, "step": 48500 }, { "epoch": 0.65, "learning_rate": 1.3676264280205819e-05, "loss": 0.8494, "step": 48505 }, { "epoch": 0.65, "learning_rate": 1.3671573629294601e-05, "loss": 1.3464, "step": 48510 }, { "epoch": 0.65, "learning_rate": 1.3666883480175996e-05, "loss": 0.4771, "step": 48515 }, { "epoch": 0.65, "learning_rate": 1.3662193833057758e-05, "loss": 0.6034, "step": 48520 }, { "epoch": 0.65, "learning_rate": 1.3657504688147598e-05, "loss": 0.78, "step": 48525 }, { "epoch": 0.65, "learning_rate": 1.3652816045653244e-05, "loss": 0.4178, "step": 48530 }, { "epoch": 0.65, "learning_rate": 1.3648127905782376e-05, "loss": 0.4227, "step": 48535 }, { "epoch": 0.65, "learning_rate": 1.3643440268742637e-05, "loss": 0.5524, "step": 48540 }, { "epoch": 0.65, "learning_rate": 1.36387531347417e-05, "loss": 0.8265, "step": 48545 }, { "epoch": 0.65, "learning_rate": 1.3634066503987142e-05, "loss": 0.8096, "step": 48550 }, { "epoch": 0.65, "learning_rate": 1.3629380376686584e-05, "loss": 0.2055, "step": 48555 }, { "epoch": 0.65, "learning_rate": 1.362469475304758e-05, "loss": 0.5618, "step": 48560 }, { "epoch": 0.65, "learning_rate": 1.36200096332777e-05, "loss": 0.5421, "step": 48565 }, { "epoch": 0.65, "learning_rate": 1.3615325017584463e-05, "loss": 0.2241, "step": 48570 }, { "epoch": 0.65, "learning_rate": 1.361064090617536e-05, "loss": 0.4281, "step": 48575 }, { "epoch": 0.65, "learning_rate": 1.3605957299257905e-05, "loss": 0.6714, "step": 48580 }, { "epoch": 0.65, "learning_rate": 1.3601274197039518e-05, "loss": 0.7329, "step": 48585 }, { "epoch": 0.65, "learning_rate": 1.359659159972766e-05, "loss": 0.2905, "step": 48590 }, { "epoch": 0.65, "learning_rate": 1.3591909507529766e-05, "loss": 0.6628, "step": 48595 }, { "epoch": 0.65, "learning_rate": 1.3587227920653183e-05, "loss": 0.7959, "step": 48600 }, { "epoch": 0.65, "learning_rate": 1.3582546839305322e-05, "loss": 0.5056, "step": 48605 }, { "epoch": 0.65, "learning_rate": 1.3577866263693514e-05, "loss": 0.3047, "step": 48610 }, { "epoch": 0.65, "learning_rate": 1.3573186194025078e-05, "loss": 0.3963, "step": 48615 }, { "epoch": 0.65, "learning_rate": 1.3568506630507338e-05, "loss": 0.9226, "step": 48620 }, { "epoch": 0.65, "learning_rate": 1.3563827573347562e-05, "loss": 0.7434, "step": 48625 }, { "epoch": 0.65, "learning_rate": 1.3559149022753012e-05, "loss": 0.4019, "step": 48630 }, { "epoch": 0.65, "learning_rate": 1.3554470978930914e-05, "loss": 0.5017, "step": 48635 }, { "epoch": 0.65, "learning_rate": 1.3549793442088502e-05, "loss": 0.6241, "step": 48640 }, { "epoch": 0.65, "learning_rate": 1.3545116412432957e-05, "loss": 0.9755, "step": 48645 }, { "epoch": 0.65, "learning_rate": 1.3540439890171436e-05, "loss": 0.8036, "step": 48650 }, { "epoch": 0.65, "learning_rate": 1.3535763875511117e-05, "loss": 0.5063, "step": 48655 }, { "epoch": 0.65, "learning_rate": 1.3531088368659087e-05, "loss": 0.662, "step": 48660 }, { "epoch": 0.65, "learning_rate": 1.3526413369822474e-05, "loss": 0.5663, "step": 48665 }, { "epoch": 0.65, "learning_rate": 1.352173887920834e-05, "loss": 0.6076, "step": 48670 }, { "epoch": 0.65, "learning_rate": 1.3517064897023757e-05, "loss": 1.365, "step": 48675 }, { "epoch": 0.65, "learning_rate": 1.3512391423475752e-05, "loss": 0.6367, "step": 48680 }, { "epoch": 0.65, "learning_rate": 1.3507718458771329e-05, "loss": 1.2274, "step": 48685 }, { "epoch": 0.65, "learning_rate": 1.3503046003117491e-05, "loss": 0.6091, "step": 48690 }, { "epoch": 0.65, "learning_rate": 1.3498374056721197e-05, "loss": 0.4654, "step": 48695 }, { "epoch": 0.65, "learning_rate": 1.3493702619789384e-05, "loss": 0.9508, "step": 48700 }, { "epoch": 0.65, "learning_rate": 1.3489031692529004e-05, "loss": 0.9632, "step": 48705 }, { "epoch": 0.65, "learning_rate": 1.3484361275146905e-05, "loss": 0.3681, "step": 48710 }, { "epoch": 0.65, "learning_rate": 1.3479691367850006e-05, "loss": 1.2659, "step": 48715 }, { "epoch": 0.65, "learning_rate": 1.3475021970845142e-05, "loss": 0.9171, "step": 48720 }, { "epoch": 0.65, "learning_rate": 1.3470353084339139e-05, "loss": 1.3326, "step": 48725 }, { "epoch": 0.65, "learning_rate": 1.3465684708538822e-05, "loss": 0.4038, "step": 48730 }, { "epoch": 0.65, "learning_rate": 1.3461016843650969e-05, "loss": 0.9216, "step": 48735 }, { "epoch": 0.65, "learning_rate": 1.3456349489882341e-05, "loss": 1.1089, "step": 48740 }, { "epoch": 0.65, "learning_rate": 1.3451682647439673e-05, "loss": 0.2428, "step": 48745 }, { "epoch": 0.65, "learning_rate": 1.3447016316529696e-05, "loss": 1.0185, "step": 48750 }, { "epoch": 0.65, "learning_rate": 1.3442350497359097e-05, "loss": 0.5367, "step": 48755 }, { "epoch": 0.65, "learning_rate": 1.3437685190134542e-05, "loss": 0.4472, "step": 48760 }, { "epoch": 0.65, "learning_rate": 1.3433020395062709e-05, "loss": 0.7359, "step": 48765 }, { "epoch": 0.65, "learning_rate": 1.3428356112350186e-05, "loss": 0.6753, "step": 48770 }, { "epoch": 0.65, "learning_rate": 1.3423692342203602e-05, "loss": 1.3313, "step": 48775 }, { "epoch": 0.65, "learning_rate": 1.3419029084829537e-05, "loss": 1.2361, "step": 48780 }, { "epoch": 0.65, "learning_rate": 1.3414366340434534e-05, "loss": 0.539, "step": 48785 }, { "epoch": 0.65, "learning_rate": 1.3409704109225152e-05, "loss": 0.7699, "step": 48790 }, { "epoch": 0.65, "learning_rate": 1.340504239140788e-05, "loss": 0.2777, "step": 48795 }, { "epoch": 0.65, "learning_rate": 1.3400381187189237e-05, "loss": 0.7484, "step": 48800 }, { "epoch": 0.65, "learning_rate": 1.3395720496775671e-05, "loss": 0.7771, "step": 48805 }, { "epoch": 0.65, "learning_rate": 1.3391060320373628e-05, "loss": 0.6351, "step": 48810 }, { "epoch": 0.65, "learning_rate": 1.3386400658189551e-05, "loss": 0.3577, "step": 48815 }, { "epoch": 0.65, "learning_rate": 1.3381741510429808e-05, "loss": 0.8587, "step": 48820 }, { "epoch": 0.65, "learning_rate": 1.33770828773008e-05, "loss": 0.706, "step": 48825 }, { "epoch": 0.65, "learning_rate": 1.3372424759008873e-05, "loss": 1.1543, "step": 48830 }, { "epoch": 0.65, "learning_rate": 1.3367767155760347e-05, "loss": 1.362, "step": 48835 }, { "epoch": 0.65, "learning_rate": 1.3363110067761553e-05, "loss": 0.518, "step": 48840 }, { "epoch": 0.65, "learning_rate": 1.3358453495218765e-05, "loss": 0.8196, "step": 48845 }, { "epoch": 0.65, "learning_rate": 1.3353797438338245e-05, "loss": 0.2337, "step": 48850 }, { "epoch": 0.65, "learning_rate": 1.3349141897326226e-05, "loss": 0.2403, "step": 48855 }, { "epoch": 0.65, "learning_rate": 1.3344486872388942e-05, "loss": 0.529, "step": 48860 }, { "epoch": 0.65, "learning_rate": 1.333983236373258e-05, "loss": 1.0849, "step": 48865 }, { "epoch": 0.65, "learning_rate": 1.33351783715633e-05, "loss": 0.6067, "step": 48870 }, { "epoch": 0.65, "learning_rate": 1.3330524896087283e-05, "loss": 0.5899, "step": 48875 }, { "epoch": 0.65, "learning_rate": 1.332587193751061e-05, "loss": 0.6924, "step": 48880 }, { "epoch": 0.65, "learning_rate": 1.3321219496039417e-05, "loss": 0.8473, "step": 48885 }, { "epoch": 0.66, "learning_rate": 1.3316567571879773e-05, "loss": 0.9333, "step": 48890 }, { "epoch": 0.66, "learning_rate": 1.3311916165237726e-05, "loss": 0.425, "step": 48895 }, { "epoch": 0.66, "learning_rate": 1.3307265276319328e-05, "loss": 1.2895, "step": 48900 }, { "epoch": 0.66, "learning_rate": 1.3302614905330571e-05, "loss": 0.9261, "step": 48905 }, { "epoch": 0.66, "learning_rate": 1.3297965052477465e-05, "loss": 0.306, "step": 48910 }, { "epoch": 0.66, "learning_rate": 1.3293315717965964e-05, "loss": 0.5321, "step": 48915 }, { "epoch": 0.66, "learning_rate": 1.3288666902002e-05, "loss": 0.6433, "step": 48920 }, { "epoch": 0.66, "learning_rate": 1.328401860479152e-05, "loss": 0.2378, "step": 48925 }, { "epoch": 0.66, "learning_rate": 1.3279370826540383e-05, "loss": 1.421, "step": 48930 }, { "epoch": 0.66, "learning_rate": 1.3274723567454495e-05, "loss": 0.6628, "step": 48935 }, { "epoch": 0.66, "learning_rate": 1.3270076827739691e-05, "loss": 0.4545, "step": 48940 }, { "epoch": 0.66, "learning_rate": 1.3265430607601792e-05, "loss": 0.6484, "step": 48945 }, { "epoch": 0.66, "learning_rate": 1.3260784907246618e-05, "loss": 1.3712, "step": 48950 }, { "epoch": 0.66, "learning_rate": 1.3256139726879946e-05, "loss": 0.5885, "step": 48955 }, { "epoch": 0.66, "learning_rate": 1.325149506670753e-05, "loss": 0.6646, "step": 48960 }, { "epoch": 0.66, "learning_rate": 1.3246850926935095e-05, "loss": 0.7546, "step": 48965 }, { "epoch": 0.66, "learning_rate": 1.3242207307768379e-05, "loss": 1.7534, "step": 48970 }, { "epoch": 0.66, "learning_rate": 1.3237564209413057e-05, "loss": 0.9181, "step": 48975 }, { "epoch": 0.66, "learning_rate": 1.323292163207478e-05, "loss": 0.3382, "step": 48980 }, { "epoch": 0.66, "learning_rate": 1.3228279575959229e-05, "loss": 0.4242, "step": 48985 }, { "epoch": 0.66, "learning_rate": 1.3223638041271979e-05, "loss": 0.6862, "step": 48990 }, { "epoch": 0.66, "learning_rate": 1.321899702821866e-05, "loss": 0.985, "step": 48995 }, { "epoch": 0.66, "learning_rate": 1.3214356537004834e-05, "loss": 0.3192, "step": 49000 }, { "epoch": 0.66, "learning_rate": 1.320971656783604e-05, "loss": 0.5946, "step": 49005 }, { "epoch": 0.66, "learning_rate": 1.320507712091783e-05, "loss": 0.8973, "step": 49010 }, { "epoch": 0.66, "learning_rate": 1.3200438196455684e-05, "loss": 0.7077, "step": 49015 }, { "epoch": 0.66, "learning_rate": 1.3195799794655105e-05, "loss": 0.8494, "step": 49020 }, { "epoch": 0.66, "learning_rate": 1.3191161915721539e-05, "loss": 0.4609, "step": 49025 }, { "epoch": 0.66, "learning_rate": 1.3186524559860413e-05, "loss": 0.665, "step": 49030 }, { "epoch": 0.66, "learning_rate": 1.318188772727717e-05, "loss": 0.9743, "step": 49035 }, { "epoch": 0.66, "learning_rate": 1.3177251418177155e-05, "loss": 0.8193, "step": 49040 }, { "epoch": 0.66, "learning_rate": 1.3172615632765764e-05, "loss": 1.0523, "step": 49045 }, { "epoch": 0.66, "learning_rate": 1.3167980371248329e-05, "loss": 0.368, "step": 49050 }, { "epoch": 0.66, "learning_rate": 1.3163345633830163e-05, "loss": 1.1041, "step": 49055 }, { "epoch": 0.66, "learning_rate": 1.3158711420716577e-05, "loss": 0.7615, "step": 49060 }, { "epoch": 0.66, "learning_rate": 1.3154077732112835e-05, "loss": 1.05, "step": 49065 }, { "epoch": 0.66, "learning_rate": 1.3149444568224184e-05, "loss": 0.542, "step": 49070 }, { "epoch": 0.66, "learning_rate": 1.3144811929255847e-05, "loss": 0.6168, "step": 49075 }, { "epoch": 0.66, "learning_rate": 1.3140179815413039e-05, "loss": 0.5645, "step": 49080 }, { "epoch": 0.66, "learning_rate": 1.3135548226900932e-05, "loss": 0.742, "step": 49085 }, { "epoch": 0.66, "learning_rate": 1.3130917163924672e-05, "loss": 0.6758, "step": 49090 }, { "epoch": 0.66, "learning_rate": 1.3126286626689423e-05, "loss": 1.4696, "step": 49095 }, { "epoch": 0.66, "learning_rate": 1.3121656615400258e-05, "loss": 0.6812, "step": 49100 }, { "epoch": 0.66, "learning_rate": 1.3117027130262277e-05, "loss": 0.6443, "step": 49105 }, { "epoch": 0.66, "learning_rate": 1.3112398171480561e-05, "loss": 0.9772, "step": 49110 }, { "epoch": 0.66, "learning_rate": 1.310776973926012e-05, "loss": 0.9747, "step": 49115 }, { "epoch": 0.66, "learning_rate": 1.3103141833805993e-05, "loss": 0.3529, "step": 49120 }, { "epoch": 0.66, "learning_rate": 1.3098514455323152e-05, "loss": 1.0374, "step": 49125 }, { "epoch": 0.66, "learning_rate": 1.3093887604016592e-05, "loss": 0.7653, "step": 49130 }, { "epoch": 0.66, "learning_rate": 1.3089261280091248e-05, "loss": 0.9269, "step": 49135 }, { "epoch": 0.66, "learning_rate": 1.3084635483752028e-05, "loss": 0.5103, "step": 49140 }, { "epoch": 0.66, "learning_rate": 1.308001021520387e-05, "loss": 0.6424, "step": 49145 }, { "epoch": 0.66, "learning_rate": 1.3075385474651603e-05, "loss": 1.6774, "step": 49150 }, { "epoch": 0.66, "learning_rate": 1.307076126230011e-05, "loss": 0.9316, "step": 49155 }, { "epoch": 0.66, "learning_rate": 1.3066137578354215e-05, "loss": 1.0072, "step": 49160 }, { "epoch": 0.66, "learning_rate": 1.3061514423018715e-05, "loss": 1.2087, "step": 49165 }, { "epoch": 0.66, "learning_rate": 1.3056891796498405e-05, "loss": 0.7017, "step": 49170 }, { "epoch": 0.66, "learning_rate": 1.3052269698998043e-05, "loss": 1.2744, "step": 49175 }, { "epoch": 0.66, "learning_rate": 1.3047648130722356e-05, "loss": 0.8375, "step": 49180 }, { "epoch": 0.66, "learning_rate": 1.3043027091876055e-05, "loss": 0.8174, "step": 49185 }, { "epoch": 0.66, "learning_rate": 1.3038406582663846e-05, "loss": 0.8784, "step": 49190 }, { "epoch": 0.66, "learning_rate": 1.3033786603290383e-05, "loss": 0.4243, "step": 49195 }, { "epoch": 0.66, "learning_rate": 1.3029167153960292e-05, "loss": 0.5641, "step": 49200 }, { "epoch": 0.66, "learning_rate": 1.3024548234878233e-05, "loss": 0.7319, "step": 49205 }, { "epoch": 0.66, "learning_rate": 1.3019929846248757e-05, "loss": 0.3026, "step": 49210 }, { "epoch": 0.66, "learning_rate": 1.3015311988276452e-05, "loss": 0.7896, "step": 49215 }, { "epoch": 0.66, "learning_rate": 1.301069466116589e-05, "loss": 0.2696, "step": 49220 }, { "epoch": 0.66, "learning_rate": 1.3006077865121552e-05, "loss": 1.4414, "step": 49225 }, { "epoch": 0.66, "learning_rate": 1.3001461600347975e-05, "loss": 0.2162, "step": 49230 }, { "epoch": 0.66, "learning_rate": 1.2996845867049607e-05, "loss": 0.2331, "step": 49235 }, { "epoch": 0.66, "learning_rate": 1.2992230665430933e-05, "loss": 0.6641, "step": 49240 }, { "epoch": 0.66, "learning_rate": 1.2987615995696362e-05, "loss": 0.7534, "step": 49245 }, { "epoch": 0.66, "learning_rate": 1.2983001858050298e-05, "loss": 0.8085, "step": 49250 }, { "epoch": 0.66, "learning_rate": 1.2978388252697155e-05, "loss": 0.4987, "step": 49255 }, { "epoch": 0.66, "learning_rate": 1.2973775179841247e-05, "loss": 0.8495, "step": 49260 }, { "epoch": 0.66, "learning_rate": 1.2969162639686943e-05, "loss": 1.2857, "step": 49265 }, { "epoch": 0.66, "learning_rate": 1.2964550632438549e-05, "loss": 0.7455, "step": 49270 }, { "epoch": 0.66, "learning_rate": 1.2959939158300339e-05, "loss": 0.8273, "step": 49275 }, { "epoch": 0.66, "learning_rate": 1.2955328217476598e-05, "loss": 0.6291, "step": 49280 }, { "epoch": 0.66, "learning_rate": 1.2950717810171558e-05, "loss": 0.6975, "step": 49285 }, { "epoch": 0.66, "learning_rate": 1.2946107936589443e-05, "loss": 0.738, "step": 49290 }, { "epoch": 0.66, "learning_rate": 1.294149859693443e-05, "loss": 0.9649, "step": 49295 }, { "epoch": 0.66, "learning_rate": 1.2936889791410714e-05, "loss": 1.2602, "step": 49300 }, { "epoch": 0.66, "learning_rate": 1.2932281520222428e-05, "loss": 0.4151, "step": 49305 }, { "epoch": 0.66, "learning_rate": 1.292767378357369e-05, "loss": 0.9864, "step": 49310 }, { "epoch": 0.66, "learning_rate": 1.2923066581668628e-05, "loss": 0.8003, "step": 49315 }, { "epoch": 0.66, "learning_rate": 1.2918459914711276e-05, "loss": 0.3798, "step": 49320 }, { "epoch": 0.66, "learning_rate": 1.2913853782905707e-05, "loss": 0.1462, "step": 49325 }, { "epoch": 0.66, "learning_rate": 1.2909248186455971e-05, "loss": 0.916, "step": 49330 }, { "epoch": 0.66, "learning_rate": 1.2904643125566035e-05, "loss": 1.6641, "step": 49335 }, { "epoch": 0.66, "learning_rate": 1.29000386004399e-05, "loss": 0.3177, "step": 49340 }, { "epoch": 0.66, "learning_rate": 1.2895434611281521e-05, "loss": 0.3907, "step": 49345 }, { "epoch": 0.66, "learning_rate": 1.2890831158294834e-05, "loss": 0.7002, "step": 49350 }, { "epoch": 0.66, "learning_rate": 1.2886228241683749e-05, "loss": 0.9311, "step": 49355 }, { "epoch": 0.66, "learning_rate": 1.2881625861652138e-05, "loss": 0.7303, "step": 49360 }, { "epoch": 0.66, "learning_rate": 1.2877024018403896e-05, "loss": 0.8312, "step": 49365 }, { "epoch": 0.66, "learning_rate": 1.287242271214282e-05, "loss": 0.7777, "step": 49370 }, { "epoch": 0.66, "learning_rate": 1.2867821943072755e-05, "loss": 0.4558, "step": 49375 }, { "epoch": 0.66, "learning_rate": 1.2863221711397485e-05, "loss": 1.8812, "step": 49380 }, { "epoch": 0.66, "learning_rate": 1.2858622017320764e-05, "loss": 0.4076, "step": 49385 }, { "epoch": 0.66, "learning_rate": 1.2854022861046355e-05, "loss": 0.8587, "step": 49390 }, { "epoch": 0.66, "learning_rate": 1.284942424277797e-05, "loss": 0.6784, "step": 49395 }, { "epoch": 0.66, "learning_rate": 1.2844826162719304e-05, "loss": 0.883, "step": 49400 }, { "epoch": 0.66, "learning_rate": 1.2840228621074018e-05, "loss": 0.4966, "step": 49405 }, { "epoch": 0.66, "learning_rate": 1.2835631618045778e-05, "loss": 0.9195, "step": 49410 }, { "epoch": 0.66, "learning_rate": 1.2831035153838206e-05, "loss": 0.8271, "step": 49415 }, { "epoch": 0.66, "learning_rate": 1.2826439228654885e-05, "loss": 0.4757, "step": 49420 }, { "epoch": 0.66, "learning_rate": 1.282184384269942e-05, "loss": 0.3126, "step": 49425 }, { "epoch": 0.66, "learning_rate": 1.2817248996175335e-05, "loss": 0.365, "step": 49430 }, { "epoch": 0.66, "learning_rate": 1.2812654689286165e-05, "loss": 0.8222, "step": 49435 }, { "epoch": 0.66, "learning_rate": 1.2808060922235444e-05, "loss": 0.658, "step": 49440 }, { "epoch": 0.66, "learning_rate": 1.2803467695226606e-05, "loss": 0.6638, "step": 49445 }, { "epoch": 0.66, "learning_rate": 1.2798875008463145e-05, "loss": 1.4929, "step": 49450 }, { "epoch": 0.66, "learning_rate": 1.2794282862148482e-05, "loss": 0.4821, "step": 49455 }, { "epoch": 0.66, "learning_rate": 1.2789691256486014e-05, "loss": 0.8224, "step": 49460 }, { "epoch": 0.66, "learning_rate": 1.2785100191679145e-05, "loss": 1.423, "step": 49465 }, { "epoch": 0.66, "learning_rate": 1.2780509667931217e-05, "loss": 0.9863, "step": 49470 }, { "epoch": 0.66, "learning_rate": 1.2775919685445603e-05, "loss": 0.8379, "step": 49475 }, { "epoch": 0.66, "learning_rate": 1.277133024442557e-05, "loss": 0.3144, "step": 49480 }, { "epoch": 0.66, "learning_rate": 1.276674134507444e-05, "loss": 0.6167, "step": 49485 }, { "epoch": 0.66, "learning_rate": 1.2762152987595466e-05, "loss": 1.3064, "step": 49490 }, { "epoch": 0.66, "learning_rate": 1.275756517219188e-05, "loss": 0.3017, "step": 49495 }, { "epoch": 0.66, "learning_rate": 1.275297789906692e-05, "loss": 0.477, "step": 49500 }, { "epoch": 0.66, "learning_rate": 1.2748391168423767e-05, "loss": 0.4594, "step": 49505 }, { "epoch": 0.66, "learning_rate": 1.2743804980465596e-05, "loss": 0.8176, "step": 49510 }, { "epoch": 0.66, "learning_rate": 1.2739219335395542e-05, "loss": 1.8143, "step": 49515 }, { "epoch": 0.66, "learning_rate": 1.2734634233416737e-05, "loss": 0.3991, "step": 49520 }, { "epoch": 0.66, "learning_rate": 1.2730049674732276e-05, "loss": 0.3566, "step": 49525 }, { "epoch": 0.66, "learning_rate": 1.2725465659545216e-05, "loss": 0.5851, "step": 49530 }, { "epoch": 0.66, "learning_rate": 1.272088218805864e-05, "loss": 0.9678, "step": 49535 }, { "epoch": 0.66, "learning_rate": 1.271629926047554e-05, "loss": 0.2645, "step": 49540 }, { "epoch": 0.66, "learning_rate": 1.2711716876998924e-05, "loss": 0.5721, "step": 49545 }, { "epoch": 0.66, "learning_rate": 1.2707135037831795e-05, "loss": 0.1628, "step": 49550 }, { "epoch": 0.66, "learning_rate": 1.2702553743177064e-05, "loss": 0.1918, "step": 49555 }, { "epoch": 0.66, "learning_rate": 1.269797299323769e-05, "loss": 0.6136, "step": 49560 }, { "epoch": 0.66, "learning_rate": 1.2693392788216568e-05, "loss": 0.7762, "step": 49565 }, { "epoch": 0.66, "learning_rate": 1.2688813128316566e-05, "loss": 0.163, "step": 49570 }, { "epoch": 0.66, "learning_rate": 1.2684234013740563e-05, "loss": 0.6536, "step": 49575 }, { "epoch": 0.66, "learning_rate": 1.2679655444691369e-05, "loss": 0.1015, "step": 49580 }, { "epoch": 0.66, "learning_rate": 1.267507742137182e-05, "loss": 0.8103, "step": 49585 }, { "epoch": 0.66, "learning_rate": 1.2670499943984664e-05, "loss": 0.6765, "step": 49590 }, { "epoch": 0.66, "learning_rate": 1.2665923012732689e-05, "loss": 0.4927, "step": 49595 }, { "epoch": 0.66, "learning_rate": 1.2661346627818616e-05, "loss": 0.6733, "step": 49600 }, { "epoch": 0.66, "learning_rate": 1.265677078944515e-05, "loss": 0.3957, "step": 49605 }, { "epoch": 0.66, "learning_rate": 1.2652195497814997e-05, "loss": 0.7423, "step": 49610 }, { "epoch": 0.66, "learning_rate": 1.2647620753130809e-05, "loss": 1.0064, "step": 49615 }, { "epoch": 0.66, "learning_rate": 1.2643046555595226e-05, "loss": 0.702, "step": 49620 }, { "epoch": 0.66, "learning_rate": 1.263847290541085e-05, "loss": 0.3186, "step": 49625 }, { "epoch": 0.66, "learning_rate": 1.2633899802780292e-05, "loss": 0.6889, "step": 49630 }, { "epoch": 0.67, "learning_rate": 1.2629327247906106e-05, "loss": 0.5272, "step": 49635 }, { "epoch": 0.67, "learning_rate": 1.2624755240990824e-05, "loss": 0.9553, "step": 49640 }, { "epoch": 0.67, "learning_rate": 1.2620183782236983e-05, "loss": 0.8958, "step": 49645 }, { "epoch": 0.67, "learning_rate": 1.2615612871847068e-05, "loss": 0.6702, "step": 49650 }, { "epoch": 0.67, "learning_rate": 1.2611042510023535e-05, "loss": 0.5305, "step": 49655 }, { "epoch": 0.67, "learning_rate": 1.260647269696886e-05, "loss": 0.5176, "step": 49660 }, { "epoch": 0.67, "learning_rate": 1.260190343288542e-05, "loss": 1.2517, "step": 49665 }, { "epoch": 0.67, "learning_rate": 1.2597334717975645e-05, "loss": 0.7293, "step": 49670 }, { "epoch": 0.67, "learning_rate": 1.259276655244189e-05, "loss": 0.6571, "step": 49675 }, { "epoch": 0.67, "learning_rate": 1.2588198936486495e-05, "loss": 0.7364, "step": 49680 }, { "epoch": 0.67, "learning_rate": 1.2583631870311804e-05, "loss": 0.6104, "step": 49685 }, { "epoch": 0.67, "learning_rate": 1.2579065354120095e-05, "loss": 1.2034, "step": 49690 }, { "epoch": 0.67, "learning_rate": 1.257449938811367e-05, "loss": 0.8566, "step": 49695 }, { "epoch": 0.67, "learning_rate": 1.256993397249474e-05, "loss": 0.6181, "step": 49700 }, { "epoch": 0.67, "learning_rate": 1.2565369107465557e-05, "loss": 1.5006, "step": 49705 }, { "epoch": 0.67, "learning_rate": 1.2560804793228318e-05, "loss": 0.398, "step": 49710 }, { "epoch": 0.67, "learning_rate": 1.2556241029985182e-05, "loss": 0.5585, "step": 49715 }, { "epoch": 0.67, "learning_rate": 1.2551677817938325e-05, "loss": 0.6316, "step": 49720 }, { "epoch": 0.67, "learning_rate": 1.2547115157289863e-05, "loss": 0.367, "step": 49725 }, { "epoch": 0.67, "learning_rate": 1.2542553048241902e-05, "loss": 0.5239, "step": 49730 }, { "epoch": 0.67, "learning_rate": 1.2537991490996508e-05, "loss": 0.8597, "step": 49735 }, { "epoch": 0.67, "learning_rate": 1.2533430485755755e-05, "loss": 0.7092, "step": 49740 }, { "epoch": 0.67, "learning_rate": 1.2528870032721663e-05, "loss": 0.431, "step": 49745 }, { "epoch": 0.67, "learning_rate": 1.2524310132096225e-05, "loss": 0.785, "step": 49750 }, { "epoch": 0.67, "learning_rate": 1.2519750784081447e-05, "loss": 0.7515, "step": 49755 }, { "epoch": 0.67, "learning_rate": 1.2515191988879272e-05, "loss": 0.3224, "step": 49760 }, { "epoch": 0.67, "learning_rate": 1.2510633746691622e-05, "loss": 0.5577, "step": 49765 }, { "epoch": 0.67, "learning_rate": 1.2506076057720433e-05, "loss": 0.5165, "step": 49770 }, { "epoch": 0.67, "learning_rate": 1.2501518922167554e-05, "loss": 0.9994, "step": 49775 }, { "epoch": 0.67, "learning_rate": 1.2496962340234866e-05, "loss": 1.0892, "step": 49780 }, { "epoch": 0.67, "learning_rate": 1.2492406312124195e-05, "loss": 1.3361, "step": 49785 }, { "epoch": 0.67, "learning_rate": 1.2488761888523123e-05, "loss": 1.1704, "step": 49790 }, { "epoch": 0.67, "learning_rate": 1.2484206857800618e-05, "loss": 0.4287, "step": 49795 }, { "epoch": 0.67, "learning_rate": 1.247965238146515e-05, "loss": 0.6166, "step": 49800 }, { "epoch": 0.67, "learning_rate": 1.2475098459718431e-05, "loss": 0.722, "step": 49805 }, { "epoch": 0.67, "learning_rate": 1.2470545092762198e-05, "loss": 1.1018, "step": 49810 }, { "epoch": 0.67, "learning_rate": 1.2465992280798133e-05, "loss": 0.6625, "step": 49815 }, { "epoch": 0.67, "learning_rate": 1.2461440024027895e-05, "loss": 0.8683, "step": 49820 }, { "epoch": 0.67, "learning_rate": 1.2456888322653145e-05, "loss": 0.4454, "step": 49825 }, { "epoch": 0.67, "learning_rate": 1.2452337176875493e-05, "loss": 0.8972, "step": 49830 }, { "epoch": 0.67, "learning_rate": 1.2447786586896528e-05, "loss": 0.9094, "step": 49835 }, { "epoch": 0.67, "learning_rate": 1.2443236552917812e-05, "loss": 0.7368, "step": 49840 }, { "epoch": 0.67, "learning_rate": 1.2438687075140905e-05, "loss": 0.4284, "step": 49845 }, { "epoch": 0.67, "learning_rate": 1.243413815376732e-05, "loss": 0.7294, "step": 49850 }, { "epoch": 0.67, "learning_rate": 1.242958978899854e-05, "loss": 1.0044, "step": 49855 }, { "epoch": 0.67, "learning_rate": 1.2425041981036054e-05, "loss": 0.6565, "step": 49860 }, { "epoch": 0.67, "learning_rate": 1.2420494730081297e-05, "loss": 0.694, "step": 49865 }, { "epoch": 0.67, "learning_rate": 1.2415948036335681e-05, "loss": 0.5421, "step": 49870 }, { "epoch": 0.67, "learning_rate": 1.2411401900000622e-05, "loss": 0.4443, "step": 49875 }, { "epoch": 0.67, "learning_rate": 1.2406856321277477e-05, "loss": 0.9466, "step": 49880 }, { "epoch": 0.67, "learning_rate": 1.2402311300367597e-05, "loss": 0.5723, "step": 49885 }, { "epoch": 0.67, "learning_rate": 1.2397766837472294e-05, "loss": 0.7755, "step": 49890 }, { "epoch": 0.67, "learning_rate": 1.239322293279288e-05, "loss": 0.9179, "step": 49895 }, { "epoch": 0.67, "learning_rate": 1.2388679586530624e-05, "loss": 1.1619, "step": 49900 }, { "epoch": 0.67, "learning_rate": 1.2384136798886758e-05, "loss": 0.9006, "step": 49905 }, { "epoch": 0.67, "learning_rate": 1.2379594570062536e-05, "loss": 0.3286, "step": 49910 }, { "epoch": 0.67, "learning_rate": 1.2375052900259119e-05, "loss": 0.6426, "step": 49915 }, { "epoch": 0.67, "learning_rate": 1.2370511789677702e-05, "loss": 0.618, "step": 49920 }, { "epoch": 0.67, "learning_rate": 1.2365971238519435e-05, "loss": 0.5841, "step": 49925 }, { "epoch": 0.67, "learning_rate": 1.2361431246985425e-05, "loss": 0.639, "step": 49930 }, { "epoch": 0.67, "learning_rate": 1.2356891815276792e-05, "loss": 0.7822, "step": 49935 }, { "epoch": 0.67, "learning_rate": 1.2352352943594597e-05, "loss": 0.4566, "step": 49940 }, { "epoch": 0.67, "learning_rate": 1.2347814632139895e-05, "loss": 0.2955, "step": 49945 }, { "epoch": 0.67, "learning_rate": 1.23432768811137e-05, "loss": 0.5908, "step": 49950 }, { "epoch": 0.67, "learning_rate": 1.2338739690717028e-05, "loss": 1.434, "step": 49955 }, { "epoch": 0.67, "learning_rate": 1.2334203061150842e-05, "loss": 0.3661, "step": 49960 }, { "epoch": 0.67, "learning_rate": 1.232966699261609e-05, "loss": 0.2704, "step": 49965 }, { "epoch": 0.67, "learning_rate": 1.232513148531371e-05, "loss": 1.3789, "step": 49970 }, { "epoch": 0.67, "learning_rate": 1.2320596539444595e-05, "loss": 0.5757, "step": 49975 }, { "epoch": 0.67, "learning_rate": 1.2316062155209612e-05, "loss": 0.7479, "step": 49980 }, { "epoch": 0.67, "learning_rate": 1.231152833280963e-05, "loss": 0.6031, "step": 49985 }, { "epoch": 0.67, "learning_rate": 1.2306995072445463e-05, "loss": 1.0259, "step": 49990 }, { "epoch": 0.67, "learning_rate": 1.230246237431791e-05, "loss": 0.6755, "step": 49995 }, { "epoch": 0.67, "learning_rate": 1.2297930238627745e-05, "loss": 0.6026, "step": 50000 }, { "epoch": 0.67, "learning_rate": 1.2293398665575731e-05, "loss": 0.2694, "step": 50005 }, { "epoch": 0.67, "learning_rate": 1.228886765536259e-05, "loss": 0.2716, "step": 50010 }, { "epoch": 0.67, "learning_rate": 1.228433720818901e-05, "loss": 1.1387, "step": 50015 }, { "epoch": 0.67, "learning_rate": 1.2279807324255693e-05, "loss": 0.2388, "step": 50020 }, { "epoch": 0.67, "learning_rate": 1.2275278003763258e-05, "loss": 0.9551, "step": 50025 }, { "epoch": 0.67, "learning_rate": 1.2270749246912356e-05, "loss": 0.8988, "step": 50030 }, { "epoch": 0.67, "learning_rate": 1.226622105390358e-05, "loss": 0.5022, "step": 50035 }, { "epoch": 0.67, "learning_rate": 1.2261693424937497e-05, "loss": 0.6812, "step": 50040 }, { "epoch": 0.67, "learning_rate": 1.2257166360214678e-05, "loss": 0.632, "step": 50045 }, { "epoch": 0.67, "learning_rate": 1.2252639859935636e-05, "loss": 1.1678, "step": 50050 }, { "epoch": 0.67, "learning_rate": 1.2248113924300878e-05, "loss": 0.7429, "step": 50055 }, { "epoch": 0.67, "learning_rate": 1.2243588553510869e-05, "loss": 0.6884, "step": 50060 }, { "epoch": 0.67, "learning_rate": 1.2239063747766075e-05, "loss": 0.6794, "step": 50065 }, { "epoch": 0.67, "learning_rate": 1.2234539507266918e-05, "loss": 0.501, "step": 50070 }, { "epoch": 0.67, "learning_rate": 1.2230015832213787e-05, "loss": 0.9375, "step": 50075 }, { "epoch": 0.67, "learning_rate": 1.2225492722807078e-05, "loss": 0.393, "step": 50080 }, { "epoch": 0.67, "learning_rate": 1.2220970179247132e-05, "loss": 0.8365, "step": 50085 }, { "epoch": 0.67, "learning_rate": 1.2216448201734264e-05, "loss": 1.5429, "step": 50090 }, { "epoch": 0.67, "learning_rate": 1.22119267904688e-05, "loss": 0.4785, "step": 50095 }, { "epoch": 0.67, "learning_rate": 1.2207405945651e-05, "loss": 0.6316, "step": 50100 }, { "epoch": 0.67, "learning_rate": 1.2202885667481121e-05, "loss": 0.6083, "step": 50105 }, { "epoch": 0.67, "learning_rate": 1.2198365956159372e-05, "loss": 0.3313, "step": 50110 }, { "epoch": 0.67, "learning_rate": 1.2193846811885978e-05, "loss": 0.4547, "step": 50115 }, { "epoch": 0.67, "learning_rate": 1.2189328234861103e-05, "loss": 0.5069, "step": 50120 }, { "epoch": 0.67, "learning_rate": 1.2184810225284885e-05, "loss": 1.0883, "step": 50125 }, { "epoch": 0.67, "learning_rate": 1.2180292783357483e-05, "loss": 0.3726, "step": 50130 }, { "epoch": 0.67, "learning_rate": 1.2175775909278955e-05, "loss": 0.8389, "step": 50135 }, { "epoch": 0.67, "learning_rate": 1.2171259603249407e-05, "loss": 0.5487, "step": 50140 }, { "epoch": 0.67, "learning_rate": 1.216674386546888e-05, "loss": 0.7325, "step": 50145 }, { "epoch": 0.67, "learning_rate": 1.2162228696137387e-05, "loss": 1.5365, "step": 50150 }, { "epoch": 0.67, "learning_rate": 1.2157714095454947e-05, "loss": 0.5509, "step": 50155 }, { "epoch": 0.67, "learning_rate": 1.2153200063621523e-05, "loss": 0.6111, "step": 50160 }, { "epoch": 0.67, "learning_rate": 1.2148686600837068e-05, "loss": 0.4854, "step": 50165 }, { "epoch": 0.67, "learning_rate": 1.214417370730149e-05, "loss": 1.0385, "step": 50170 }, { "epoch": 0.67, "learning_rate": 1.2139661383214715e-05, "loss": 0.4746, "step": 50175 }, { "epoch": 0.67, "learning_rate": 1.2135149628776598e-05, "loss": 0.826, "step": 50180 }, { "epoch": 0.67, "learning_rate": 1.2130638444186987e-05, "loss": 0.581, "step": 50185 }, { "epoch": 0.67, "learning_rate": 1.2126127829645717e-05, "loss": 0.6424, "step": 50190 }, { "epoch": 0.67, "learning_rate": 1.2121617785352576e-05, "loss": 0.2343, "step": 50195 }, { "epoch": 0.67, "learning_rate": 1.2117108311507334e-05, "loss": 0.7269, "step": 50200 }, { "epoch": 0.67, "learning_rate": 1.2112599408309746e-05, "loss": 0.2355, "step": 50205 }, { "epoch": 0.67, "learning_rate": 1.2108091075959535e-05, "loss": 0.4814, "step": 50210 }, { "epoch": 0.67, "learning_rate": 1.2103583314656391e-05, "loss": 0.195, "step": 50215 }, { "epoch": 0.67, "learning_rate": 1.2099076124599982e-05, "loss": 0.4461, "step": 50220 }, { "epoch": 0.67, "learning_rate": 1.2094569505989964e-05, "loss": 0.6069, "step": 50225 }, { "epoch": 0.67, "learning_rate": 1.2090063459025955e-05, "loss": 0.6712, "step": 50230 }, { "epoch": 0.67, "learning_rate": 1.208555798390754e-05, "loss": 1.0351, "step": 50235 }, { "epoch": 0.67, "learning_rate": 1.2081053080834314e-05, "loss": 0.7468, "step": 50240 }, { "epoch": 0.67, "learning_rate": 1.2076548750005787e-05, "loss": 0.7027, "step": 50245 }, { "epoch": 0.67, "learning_rate": 1.2072044991621506e-05, "loss": 0.9275, "step": 50250 }, { "epoch": 0.67, "learning_rate": 1.2067541805880956e-05, "loss": 0.8123, "step": 50255 }, { "epoch": 0.67, "learning_rate": 1.2063039192983594e-05, "loss": 0.4603, "step": 50260 }, { "epoch": 0.67, "learning_rate": 1.2058537153128886e-05, "loss": 1.03, "step": 50265 }, { "epoch": 0.67, "learning_rate": 1.2054035686516235e-05, "loss": 0.9905, "step": 50270 }, { "epoch": 0.67, "learning_rate": 1.2049534793345038e-05, "loss": 0.4469, "step": 50275 }, { "epoch": 0.67, "learning_rate": 1.204503447381465e-05, "loss": 0.1129, "step": 50280 }, { "epoch": 0.67, "learning_rate": 1.2040534728124437e-05, "loss": 0.7152, "step": 50285 }, { "epoch": 0.67, "learning_rate": 1.2036035556473696e-05, "loss": 1.0455, "step": 50290 }, { "epoch": 0.67, "learning_rate": 1.2031536959061715e-05, "loss": 0.9657, "step": 50295 }, { "epoch": 0.67, "learning_rate": 1.2027038936087778e-05, "loss": 0.757, "step": 50300 }, { "epoch": 0.67, "learning_rate": 1.2022541487751115e-05, "loss": 0.1146, "step": 50305 }, { "epoch": 0.67, "learning_rate": 1.2018044614250929e-05, "loss": 1.0271, "step": 50310 }, { "epoch": 0.67, "learning_rate": 1.201354831578643e-05, "loss": 0.6633, "step": 50315 }, { "epoch": 0.67, "learning_rate": 1.200905259255677e-05, "loss": 0.4018, "step": 50320 }, { "epoch": 0.67, "learning_rate": 1.2004557444761091e-05, "loss": 0.9869, "step": 50325 }, { "epoch": 0.67, "learning_rate": 1.2000062872598494e-05, "loss": 1.106, "step": 50330 }, { "epoch": 0.67, "learning_rate": 1.1995568876268081e-05, "loss": 0.9422, "step": 50335 }, { "epoch": 0.67, "learning_rate": 1.199107545596891e-05, "loss": 0.8225, "step": 50340 }, { "epoch": 0.67, "learning_rate": 1.1986582611900007e-05, "loss": 0.7533, "step": 50345 }, { "epoch": 0.67, "learning_rate": 1.1982090344260408e-05, "loss": 0.6673, "step": 50350 }, { "epoch": 0.67, "learning_rate": 1.197759865324906e-05, "loss": 1.2759, "step": 50355 }, { "epoch": 0.67, "learning_rate": 1.197310753906495e-05, "loss": 0.7579, "step": 50360 }, { "epoch": 0.67, "learning_rate": 1.1968617001907009e-05, "loss": 0.8632, "step": 50365 }, { "epoch": 0.67, "learning_rate": 1.196412704197413e-05, "loss": 0.4638, "step": 50370 }, { "epoch": 0.67, "learning_rate": 1.1959637659465214e-05, "loss": 0.9338, "step": 50375 }, { "epoch": 0.68, "learning_rate": 1.1955148854579113e-05, "loss": 0.8915, "step": 50380 }, { "epoch": 0.68, "learning_rate": 1.1950660627514653e-05, "loss": 0.5131, "step": 50385 }, { "epoch": 0.68, "learning_rate": 1.1946172978470637e-05, "loss": 0.9092, "step": 50390 }, { "epoch": 0.68, "learning_rate": 1.1941685907645864e-05, "loss": 0.9488, "step": 50395 }, { "epoch": 0.68, "learning_rate": 1.1937199415239073e-05, "loss": 0.3708, "step": 50400 }, { "epoch": 0.68, "learning_rate": 1.1932713501448986e-05, "loss": 0.547, "step": 50405 }, { "epoch": 0.68, "learning_rate": 1.1928228166474328e-05, "loss": 0.3774, "step": 50410 }, { "epoch": 0.68, "learning_rate": 1.1923743410513769e-05, "loss": 0.4893, "step": 50415 }, { "epoch": 0.68, "learning_rate": 1.1919259233765944e-05, "loss": 0.7968, "step": 50420 }, { "epoch": 0.68, "learning_rate": 1.191477563642951e-05, "loss": 0.8662, "step": 50425 }, { "epoch": 0.68, "learning_rate": 1.1910292618703048e-05, "loss": 1.0936, "step": 50430 }, { "epoch": 0.68, "learning_rate": 1.1905810180785138e-05, "loss": 0.9448, "step": 50435 }, { "epoch": 0.68, "learning_rate": 1.1901328322874317e-05, "loss": 0.5444, "step": 50440 }, { "epoch": 0.68, "learning_rate": 1.1896847045169133e-05, "loss": 0.989, "step": 50445 }, { "epoch": 0.68, "learning_rate": 1.189236634786807e-05, "loss": 0.2083, "step": 50450 }, { "epoch": 0.68, "learning_rate": 1.1887886231169593e-05, "loss": 0.8047, "step": 50455 }, { "epoch": 0.68, "learning_rate": 1.1883406695272179e-05, "loss": 0.5577, "step": 50460 }, { "epoch": 0.68, "learning_rate": 1.1878927740374207e-05, "loss": 0.6222, "step": 50465 }, { "epoch": 0.68, "learning_rate": 1.1874449366674107e-05, "loss": 0.5879, "step": 50470 }, { "epoch": 0.68, "learning_rate": 1.1869971574370232e-05, "loss": 0.458, "step": 50475 }, { "epoch": 0.68, "learning_rate": 1.1865494363660918e-05, "loss": 0.5458, "step": 50480 }, { "epoch": 0.68, "learning_rate": 1.1861017734744504e-05, "loss": 1.0369, "step": 50485 }, { "epoch": 0.68, "learning_rate": 1.1856541687819272e-05, "loss": 1.4772, "step": 50490 }, { "epoch": 0.68, "learning_rate": 1.185206622308349e-05, "loss": 0.4767, "step": 50495 }, { "epoch": 0.68, "learning_rate": 1.1847591340735387e-05, "loss": 0.2313, "step": 50500 }, { "epoch": 0.68, "learning_rate": 1.1843117040973198e-05, "loss": 1.5279, "step": 50505 }, { "epoch": 0.68, "learning_rate": 1.1838643323995103e-05, "loss": 0.7788, "step": 50510 }, { "epoch": 0.68, "learning_rate": 1.1834170189999252e-05, "loss": 0.272, "step": 50515 }, { "epoch": 0.68, "learning_rate": 1.1829697639183806e-05, "loss": 0.4016, "step": 50520 }, { "epoch": 0.68, "learning_rate": 1.1825225671746867e-05, "loss": 1.2629, "step": 50525 }, { "epoch": 0.68, "learning_rate": 1.182075428788651e-05, "loss": 1.1864, "step": 50530 }, { "epoch": 0.68, "learning_rate": 1.1816283487800814e-05, "loss": 0.8807, "step": 50535 }, { "epoch": 0.68, "learning_rate": 1.1811813271687801e-05, "loss": 0.3771, "step": 50540 }, { "epoch": 0.68, "learning_rate": 1.1807343639745483e-05, "loss": 1.3594, "step": 50545 }, { "epoch": 0.68, "learning_rate": 1.180287459217183e-05, "loss": 1.006, "step": 50550 }, { "epoch": 0.68, "learning_rate": 1.1798406129164822e-05, "loss": 0.7577, "step": 50555 }, { "epoch": 0.68, "learning_rate": 1.1793938250922377e-05, "loss": 1.0145, "step": 50560 }, { "epoch": 0.68, "learning_rate": 1.1789470957642388e-05, "loss": 1.0949, "step": 50565 }, { "epoch": 0.68, "learning_rate": 1.1785004249522763e-05, "loss": 1.4668, "step": 50570 }, { "epoch": 0.68, "learning_rate": 1.178053812676132e-05, "loss": 0.7132, "step": 50575 }, { "epoch": 0.68, "learning_rate": 1.1776072589555915e-05, "loss": 0.3513, "step": 50580 }, { "epoch": 0.68, "learning_rate": 1.1771607638104334e-05, "loss": 0.8665, "step": 50585 }, { "epoch": 0.68, "learning_rate": 1.1767143272604344e-05, "loss": 0.5824, "step": 50590 }, { "epoch": 0.68, "learning_rate": 1.176267949325372e-05, "loss": 0.3483, "step": 50595 }, { "epoch": 0.68, "learning_rate": 1.1758216300250167e-05, "loss": 0.3933, "step": 50600 }, { "epoch": 0.68, "learning_rate": 1.1753753693791383e-05, "loss": 0.8829, "step": 50605 }, { "epoch": 0.68, "learning_rate": 1.1749291674075037e-05, "loss": 0.287, "step": 50610 }, { "epoch": 0.68, "learning_rate": 1.1744830241298785e-05, "loss": 0.4059, "step": 50615 }, { "epoch": 0.68, "learning_rate": 1.1740369395660239e-05, "loss": 0.3561, "step": 50620 }, { "epoch": 0.68, "learning_rate": 1.1735909137356984e-05, "loss": 0.2897, "step": 50625 }, { "epoch": 0.68, "learning_rate": 1.1731449466586608e-05, "loss": 0.3042, "step": 50630 }, { "epoch": 0.68, "learning_rate": 1.1726990383546638e-05, "loss": 0.8819, "step": 50635 }, { "epoch": 0.68, "learning_rate": 1.1722531888434583e-05, "loss": 1.0193, "step": 50640 }, { "epoch": 0.68, "learning_rate": 1.171807398144795e-05, "loss": 0.6251, "step": 50645 }, { "epoch": 0.68, "learning_rate": 1.171361666278419e-05, "loss": 0.5882, "step": 50650 }, { "epoch": 0.68, "learning_rate": 1.1709159932640742e-05, "loss": 0.9391, "step": 50655 }, { "epoch": 0.68, "learning_rate": 1.170470379121501e-05, "loss": 0.8331, "step": 50660 }, { "epoch": 0.68, "learning_rate": 1.1700248238704394e-05, "loss": 0.5419, "step": 50665 }, { "epoch": 0.68, "learning_rate": 1.1695793275306247e-05, "loss": 0.5515, "step": 50670 }, { "epoch": 0.68, "learning_rate": 1.1691338901217885e-05, "loss": 1.2007, "step": 50675 }, { "epoch": 0.68, "learning_rate": 1.168688511663665e-05, "loss": 0.5684, "step": 50680 }, { "epoch": 0.68, "learning_rate": 1.1682431921759781e-05, "loss": 0.3202, "step": 50685 }, { "epoch": 0.68, "learning_rate": 1.1677979316784562e-05, "loss": 0.4106, "step": 50690 }, { "epoch": 0.68, "learning_rate": 1.1673527301908212e-05, "loss": 1.5035, "step": 50695 }, { "epoch": 0.68, "learning_rate": 1.1669075877327922e-05, "loss": 0.8007, "step": 50700 }, { "epoch": 0.68, "learning_rate": 1.166462504324089e-05, "loss": 0.7541, "step": 50705 }, { "epoch": 0.68, "learning_rate": 1.166017479984425e-05, "loss": 0.579, "step": 50710 }, { "epoch": 0.68, "learning_rate": 1.1655725147335123e-05, "loss": 0.7537, "step": 50715 }, { "epoch": 0.68, "learning_rate": 1.165127608591062e-05, "loss": 0.8822, "step": 50720 }, { "epoch": 0.68, "learning_rate": 1.1646827615767805e-05, "loss": 1.2097, "step": 50725 }, { "epoch": 0.68, "learning_rate": 1.1642379737103725e-05, "loss": 0.7003, "step": 50730 }, { "epoch": 0.68, "learning_rate": 1.1637932450115385e-05, "loss": 1.2925, "step": 50735 }, { "epoch": 0.68, "learning_rate": 1.1633485754999799e-05, "loss": 1.1139, "step": 50740 }, { "epoch": 0.68, "learning_rate": 1.1629039651953924e-05, "loss": 0.9018, "step": 50745 }, { "epoch": 0.68, "learning_rate": 1.1624594141174689e-05, "loss": 0.1023, "step": 50750 }, { "epoch": 0.68, "learning_rate": 1.1620149222859029e-05, "loss": 0.9271, "step": 50755 }, { "epoch": 0.68, "learning_rate": 1.1615704897203822e-05, "loss": 0.6858, "step": 50760 }, { "epoch": 0.68, "learning_rate": 1.1611261164405926e-05, "loss": 0.6159, "step": 50765 }, { "epoch": 0.68, "learning_rate": 1.1606818024662172e-05, "loss": 0.5451, "step": 50770 }, { "epoch": 0.68, "learning_rate": 1.1602375478169383e-05, "loss": 0.3459, "step": 50775 }, { "epoch": 0.68, "learning_rate": 1.1597933525124335e-05, "loss": 0.5572, "step": 50780 }, { "epoch": 0.68, "learning_rate": 1.1593492165723773e-05, "loss": 0.3284, "step": 50785 }, { "epoch": 0.68, "learning_rate": 1.1589051400164458e-05, "loss": 0.5074, "step": 50790 }, { "epoch": 0.68, "learning_rate": 1.1584611228643052e-05, "loss": 1.2844, "step": 50795 }, { "epoch": 0.68, "learning_rate": 1.1580171651356265e-05, "loss": 0.7052, "step": 50800 }, { "epoch": 0.68, "learning_rate": 1.1575732668500736e-05, "loss": 0.8806, "step": 50805 }, { "epoch": 0.68, "learning_rate": 1.157129428027308e-05, "loss": 1.102, "step": 50810 }, { "epoch": 0.68, "learning_rate": 1.1566856486869914e-05, "loss": 0.6012, "step": 50815 }, { "epoch": 0.68, "learning_rate": 1.1562419288487806e-05, "loss": 0.7889, "step": 50820 }, { "epoch": 0.68, "learning_rate": 1.1557982685323284e-05, "loss": 0.7037, "step": 50825 }, { "epoch": 0.68, "learning_rate": 1.1553546677572891e-05, "loss": 0.8625, "step": 50830 }, { "epoch": 0.68, "learning_rate": 1.154911126543311e-05, "loss": 0.9007, "step": 50835 }, { "epoch": 0.68, "learning_rate": 1.1544676449100408e-05, "loss": 1.2372, "step": 50840 }, { "epoch": 0.68, "learning_rate": 1.1540242228771214e-05, "loss": 1.0581, "step": 50845 }, { "epoch": 0.68, "learning_rate": 1.1535808604641963e-05, "loss": 0.4509, "step": 50850 }, { "epoch": 0.68, "learning_rate": 1.1531375576909029e-05, "loss": 1.2841, "step": 50855 }, { "epoch": 0.68, "learning_rate": 1.1526943145768767e-05, "loss": 0.5675, "step": 50860 }, { "epoch": 0.68, "learning_rate": 1.1522511311417533e-05, "loss": 0.6031, "step": 50865 }, { "epoch": 0.68, "learning_rate": 1.1518080074051618e-05, "loss": 0.7463, "step": 50870 }, { "epoch": 0.68, "learning_rate": 1.151364943386731e-05, "loss": 0.2412, "step": 50875 }, { "epoch": 0.68, "learning_rate": 1.1509219391060851e-05, "loss": 1.1599, "step": 50880 }, { "epoch": 0.68, "learning_rate": 1.1504789945828492e-05, "loss": 0.2252, "step": 50885 }, { "epoch": 0.68, "learning_rate": 1.1500361098366422e-05, "loss": 0.6414, "step": 50890 }, { "epoch": 0.68, "learning_rate": 1.1495932848870811e-05, "loss": 0.5771, "step": 50895 }, { "epoch": 0.68, "learning_rate": 1.1491505197537833e-05, "loss": 0.4017, "step": 50900 }, { "epoch": 0.68, "learning_rate": 1.1487078144563576e-05, "loss": 0.8285, "step": 50905 }, { "epoch": 0.68, "learning_rate": 1.1482651690144163e-05, "loss": 0.9546, "step": 50910 }, { "epoch": 0.68, "learning_rate": 1.1478225834475658e-05, "loss": 1.1332, "step": 50915 }, { "epoch": 0.68, "learning_rate": 1.147380057775409e-05, "loss": 0.8052, "step": 50920 }, { "epoch": 0.68, "learning_rate": 1.1469375920175496e-05, "loss": 0.1526, "step": 50925 }, { "epoch": 0.68, "learning_rate": 1.1464951861935857e-05, "loss": 0.6099, "step": 50930 }, { "epoch": 0.68, "learning_rate": 1.1460528403231127e-05, "loss": 1.3153, "step": 50935 }, { "epoch": 0.68, "learning_rate": 1.1456105544257262e-05, "loss": 0.5746, "step": 50940 }, { "epoch": 0.68, "learning_rate": 1.1451683285210165e-05, "loss": 0.6185, "step": 50945 }, { "epoch": 0.68, "learning_rate": 1.1447261626285719e-05, "loss": 0.2255, "step": 50950 }, { "epoch": 0.68, "learning_rate": 1.144284056767977e-05, "loss": 1.0513, "step": 50955 }, { "epoch": 0.68, "learning_rate": 1.1438420109588166e-05, "loss": 0.2557, "step": 50960 }, { "epoch": 0.68, "learning_rate": 1.1434000252206709e-05, "loss": 0.7496, "step": 50965 }, { "epoch": 0.68, "learning_rate": 1.1429580995731162e-05, "loss": 0.7712, "step": 50970 }, { "epoch": 0.68, "learning_rate": 1.1425162340357293e-05, "loss": 0.7832, "step": 50975 }, { "epoch": 0.68, "learning_rate": 1.1420744286280822e-05, "loss": 1.298, "step": 50980 }, { "epoch": 0.68, "learning_rate": 1.1416326833697444e-05, "loss": 1.0465, "step": 50985 }, { "epoch": 0.68, "learning_rate": 1.1411909982802821e-05, "loss": 0.3632, "step": 50990 }, { "epoch": 0.68, "learning_rate": 1.1407493733792616e-05, "loss": 0.7104, "step": 50995 }, { "epoch": 0.68, "learning_rate": 1.1403078086862437e-05, "loss": 0.7376, "step": 51000 }, { "epoch": 0.68, "learning_rate": 1.1398663042207865e-05, "loss": 1.399, "step": 51005 }, { "epoch": 0.68, "learning_rate": 1.1394248600024496e-05, "loss": 0.5863, "step": 51010 }, { "epoch": 0.68, "learning_rate": 1.1389834760507829e-05, "loss": 0.5435, "step": 51015 }, { "epoch": 0.68, "learning_rate": 1.1385421523853398e-05, "loss": 0.8891, "step": 51020 }, { "epoch": 0.68, "learning_rate": 1.1381008890256683e-05, "loss": 0.4338, "step": 51025 }, { "epoch": 0.68, "learning_rate": 1.1376596859913133e-05, "loss": 1.1297, "step": 51030 }, { "epoch": 0.68, "learning_rate": 1.1372185433018193e-05, "loss": 1.0145, "step": 51035 }, { "epoch": 0.68, "learning_rate": 1.1367774609767262e-05, "loss": 0.8147, "step": 51040 }, { "epoch": 0.68, "learning_rate": 1.1363364390355708e-05, "loss": 0.362, "step": 51045 }, { "epoch": 0.68, "learning_rate": 1.1358954774978897e-05, "loss": 0.4388, "step": 51050 }, { "epoch": 0.68, "learning_rate": 1.1354545763832144e-05, "loss": 0.5143, "step": 51055 }, { "epoch": 0.68, "learning_rate": 1.1350137357110752e-05, "loss": 0.1394, "step": 51060 }, { "epoch": 0.68, "learning_rate": 1.1345729555009973e-05, "loss": 1.1681, "step": 51065 }, { "epoch": 0.68, "learning_rate": 1.1341322357725076e-05, "loss": 0.6848, "step": 51070 }, { "epoch": 0.68, "learning_rate": 1.1336915765451266e-05, "loss": 0.6876, "step": 51075 }, { "epoch": 0.68, "learning_rate": 1.1332509778383727e-05, "loss": 1.1603, "step": 51080 }, { "epoch": 0.68, "learning_rate": 1.1328104396717634e-05, "loss": 0.3242, "step": 51085 }, { "epoch": 0.68, "learning_rate": 1.1323699620648117e-05, "loss": 0.9083, "step": 51090 }, { "epoch": 0.68, "learning_rate": 1.1319295450370291e-05, "loss": 0.5297, "step": 51095 }, { "epoch": 0.68, "learning_rate": 1.131489188607922e-05, "loss": 0.6766, "step": 51100 }, { "epoch": 0.68, "learning_rate": 1.1310488927969986e-05, "loss": 1.3055, "step": 51105 }, { "epoch": 0.68, "learning_rate": 1.1306086576237607e-05, "loss": 0.3226, "step": 51110 }, { "epoch": 0.68, "learning_rate": 1.1301684831077073e-05, "loss": 0.8449, "step": 51115 }, { "epoch": 0.68, "learning_rate": 1.1297283692683391e-05, "loss": 0.7208, "step": 51120 }, { "epoch": 0.69, "learning_rate": 1.129288316125147e-05, "loss": 1.1532, "step": 51125 }, { "epoch": 0.69, "learning_rate": 1.1288483236976255e-05, "loss": 0.3449, "step": 51130 }, { "epoch": 0.69, "learning_rate": 1.128408392005264e-05, "loss": 1.5379, "step": 51135 }, { "epoch": 0.69, "learning_rate": 1.127968521067548e-05, "loss": 0.4172, "step": 51140 }, { "epoch": 0.69, "learning_rate": 1.1275287109039634e-05, "loss": 0.595, "step": 51145 }, { "epoch": 0.69, "learning_rate": 1.1270889615339906e-05, "loss": 1.2126, "step": 51150 }, { "epoch": 0.69, "learning_rate": 1.1266492729771073e-05, "loss": 1.3069, "step": 51155 }, { "epoch": 0.69, "learning_rate": 1.1262096452527915e-05, "loss": 0.556, "step": 51160 }, { "epoch": 0.69, "learning_rate": 1.1257700783805155e-05, "loss": 1.3243, "step": 51165 }, { "epoch": 0.69, "learning_rate": 1.1253305723797502e-05, "loss": 0.7238, "step": 51170 }, { "epoch": 0.69, "learning_rate": 1.1248911272699621e-05, "loss": 0.594, "step": 51175 }, { "epoch": 0.69, "learning_rate": 1.1244517430706186e-05, "loss": 1.3796, "step": 51180 }, { "epoch": 0.69, "learning_rate": 1.1240124198011814e-05, "loss": 0.7343, "step": 51185 }, { "epoch": 0.69, "learning_rate": 1.1235731574811093e-05, "loss": 1.0515, "step": 51190 }, { "epoch": 0.69, "learning_rate": 1.1231339561298609e-05, "loss": 1.0063, "step": 51195 }, { "epoch": 0.69, "learning_rate": 1.12269481576689e-05, "loss": 0.2495, "step": 51200 }, { "epoch": 0.69, "learning_rate": 1.1222557364116486e-05, "loss": 0.4234, "step": 51205 }, { "epoch": 0.69, "learning_rate": 1.1218167180835842e-05, "loss": 0.5314, "step": 51210 }, { "epoch": 0.69, "learning_rate": 1.1213777608021456e-05, "loss": 1.1315, "step": 51215 }, { "epoch": 0.69, "learning_rate": 1.1209388645867749e-05, "loss": 0.711, "step": 51220 }, { "epoch": 0.69, "learning_rate": 1.1205000294569126e-05, "loss": 1.0384, "step": 51225 }, { "epoch": 0.69, "learning_rate": 1.1200612554319993e-05, "loss": 0.5138, "step": 51230 }, { "epoch": 0.69, "learning_rate": 1.1196225425314668e-05, "loss": 0.6563, "step": 51235 }, { "epoch": 0.69, "learning_rate": 1.1191838907747499e-05, "loss": 0.7889, "step": 51240 }, { "epoch": 0.69, "learning_rate": 1.1187453001812805e-05, "loss": 1.4534, "step": 51245 }, { "epoch": 0.69, "learning_rate": 1.1183067707704826e-05, "loss": 0.9043, "step": 51250 }, { "epoch": 0.69, "learning_rate": 1.1178683025617827e-05, "loss": 0.1294, "step": 51255 }, { "epoch": 0.69, "learning_rate": 1.1174298955746026e-05, "loss": 0.5196, "step": 51260 }, { "epoch": 0.69, "learning_rate": 1.1169915498283607e-05, "loss": 0.9679, "step": 51265 }, { "epoch": 0.69, "learning_rate": 1.1165532653424749e-05, "loss": 1.017, "step": 51270 }, { "epoch": 0.69, "learning_rate": 1.1161150421363581e-05, "loss": 0.4535, "step": 51275 }, { "epoch": 0.69, "learning_rate": 1.1156768802294217e-05, "loss": 0.7373, "step": 51280 }, { "epoch": 0.69, "learning_rate": 1.1152387796410733e-05, "loss": 1.2138, "step": 51285 }, { "epoch": 0.69, "learning_rate": 1.1148007403907198e-05, "loss": 0.9052, "step": 51290 }, { "epoch": 0.69, "learning_rate": 1.1143627624977638e-05, "loss": 1.2049, "step": 51295 }, { "epoch": 0.69, "learning_rate": 1.1139248459816043e-05, "loss": 0.1603, "step": 51300 }, { "epoch": 0.69, "learning_rate": 1.1134869908616416e-05, "loss": 0.8992, "step": 51305 }, { "epoch": 0.69, "learning_rate": 1.1130491971572667e-05, "loss": 1.2445, "step": 51310 }, { "epoch": 0.69, "learning_rate": 1.1126114648878749e-05, "loss": 0.999, "step": 51315 }, { "epoch": 0.69, "learning_rate": 1.1121737940728532e-05, "loss": 0.5095, "step": 51320 }, { "epoch": 0.69, "learning_rate": 1.1117361847315905e-05, "loss": 0.4542, "step": 51325 }, { "epoch": 0.69, "learning_rate": 1.1112986368834693e-05, "loss": 0.7084, "step": 51330 }, { "epoch": 0.69, "learning_rate": 1.1108611505478703e-05, "loss": 0.5652, "step": 51335 }, { "epoch": 0.69, "learning_rate": 1.1104237257441743e-05, "loss": 0.6373, "step": 51340 }, { "epoch": 0.69, "learning_rate": 1.1099863624917536e-05, "loss": 0.7648, "step": 51345 }, { "epoch": 0.69, "learning_rate": 1.1095490608099832e-05, "loss": 0.7236, "step": 51350 }, { "epoch": 0.69, "learning_rate": 1.109111820718235e-05, "loss": 0.3931, "step": 51355 }, { "epoch": 0.69, "learning_rate": 1.108674642235873e-05, "loss": 0.7334, "step": 51360 }, { "epoch": 0.69, "learning_rate": 1.1082375253822644e-05, "loss": 0.7275, "step": 51365 }, { "epoch": 0.69, "learning_rate": 1.1078004701767709e-05, "loss": 0.6717, "step": 51370 }, { "epoch": 0.69, "learning_rate": 1.1073634766387506e-05, "loss": 0.3633, "step": 51375 }, { "epoch": 0.69, "learning_rate": 1.1069265447875618e-05, "loss": 1.578, "step": 51380 }, { "epoch": 0.69, "learning_rate": 1.1064896746425583e-05, "loss": 0.8958, "step": 51385 }, { "epoch": 0.69, "learning_rate": 1.10605286622309e-05, "loss": 0.3756, "step": 51390 }, { "epoch": 0.69, "learning_rate": 1.1056161195485058e-05, "loss": 0.9029, "step": 51395 }, { "epoch": 0.69, "learning_rate": 1.1051794346381522e-05, "loss": 0.4551, "step": 51400 }, { "epoch": 0.69, "learning_rate": 1.1047428115113717e-05, "loss": 0.6298, "step": 51405 }, { "epoch": 0.69, "learning_rate": 1.1043062501875035e-05, "loss": 0.5523, "step": 51410 }, { "epoch": 0.69, "learning_rate": 1.1038697506858874e-05, "loss": 1.1113, "step": 51415 }, { "epoch": 0.69, "learning_rate": 1.1034333130258553e-05, "loss": 0.3135, "step": 51420 }, { "epoch": 0.69, "learning_rate": 1.1029969372267416e-05, "loss": 0.6805, "step": 51425 }, { "epoch": 0.69, "learning_rate": 1.1025606233078733e-05, "loss": 0.2202, "step": 51430 }, { "epoch": 0.69, "learning_rate": 1.1021243712885795e-05, "loss": 0.2, "step": 51435 }, { "epoch": 0.69, "learning_rate": 1.1016881811881826e-05, "loss": 1.0838, "step": 51440 }, { "epoch": 0.69, "learning_rate": 1.101252053026003e-05, "loss": 0.6463, "step": 51445 }, { "epoch": 0.69, "learning_rate": 1.1008159868213613e-05, "loss": 0.7877, "step": 51450 }, { "epoch": 0.69, "learning_rate": 1.1003799825935696e-05, "loss": 0.4961, "step": 51455 }, { "epoch": 0.69, "learning_rate": 1.0999440403619427e-05, "loss": 1.0638, "step": 51460 }, { "epoch": 0.69, "learning_rate": 1.0995081601457923e-05, "loss": 0.7268, "step": 51465 }, { "epoch": 0.69, "learning_rate": 1.0990723419644223e-05, "loss": 0.2946, "step": 51470 }, { "epoch": 0.69, "learning_rate": 1.0986365858371398e-05, "loss": 0.6782, "step": 51475 }, { "epoch": 0.69, "learning_rate": 1.0982008917832456e-05, "loss": 0.4071, "step": 51480 }, { "epoch": 0.69, "learning_rate": 1.0977652598220384e-05, "loss": 0.8146, "step": 51485 }, { "epoch": 0.69, "learning_rate": 1.0973296899728156e-05, "loss": 0.4812, "step": 51490 }, { "epoch": 0.69, "learning_rate": 1.09689418225487e-05, "loss": 0.2376, "step": 51495 }, { "epoch": 0.69, "learning_rate": 1.0964587366874931e-05, "loss": 0.4056, "step": 51500 }, { "epoch": 0.69, "learning_rate": 1.0960233532899714e-05, "loss": 0.4824, "step": 51505 }, { "epoch": 0.69, "learning_rate": 1.095588032081592e-05, "loss": 0.4788, "step": 51510 }, { "epoch": 0.69, "learning_rate": 1.0951527730816368e-05, "loss": 0.6819, "step": 51515 }, { "epoch": 0.69, "learning_rate": 1.0947175763093848e-05, "loss": 1.0453, "step": 51520 }, { "epoch": 0.69, "learning_rate": 1.0942824417841152e-05, "loss": 0.2826, "step": 51525 }, { "epoch": 0.69, "learning_rate": 1.0938473695250994e-05, "loss": 0.8097, "step": 51530 }, { "epoch": 0.69, "learning_rate": 1.0934123595516111e-05, "loss": 0.217, "step": 51535 }, { "epoch": 0.69, "learning_rate": 1.0929774118829175e-05, "loss": 0.6492, "step": 51540 }, { "epoch": 0.69, "learning_rate": 1.0925425265382863e-05, "loss": 0.6113, "step": 51545 }, { "epoch": 0.69, "learning_rate": 1.0921077035369797e-05, "loss": 0.4966, "step": 51550 }, { "epoch": 0.69, "learning_rate": 1.0916729428982578e-05, "loss": 0.2393, "step": 51555 }, { "epoch": 0.69, "learning_rate": 1.0912382446413807e-05, "loss": 1.0301, "step": 51560 }, { "epoch": 0.69, "learning_rate": 1.0908036087855993e-05, "loss": 0.3229, "step": 51565 }, { "epoch": 0.69, "learning_rate": 1.0903690353501685e-05, "loss": 0.3686, "step": 51570 }, { "epoch": 0.69, "learning_rate": 1.0899345243543391e-05, "loss": 1.4944, "step": 51575 }, { "epoch": 0.69, "learning_rate": 1.0895000758173538e-05, "loss": 0.6046, "step": 51580 }, { "epoch": 0.69, "learning_rate": 1.0890656897584597e-05, "loss": 0.9064, "step": 51585 }, { "epoch": 0.69, "learning_rate": 1.0886313661968969e-05, "loss": 0.5756, "step": 51590 }, { "epoch": 0.69, "learning_rate": 1.0881971051519027e-05, "loss": 0.624, "step": 51595 }, { "epoch": 0.69, "learning_rate": 1.0877629066427148e-05, "loss": 0.5466, "step": 51600 }, { "epoch": 0.69, "learning_rate": 1.0873287706885648e-05, "loss": 0.3746, "step": 51605 }, { "epoch": 0.69, "learning_rate": 1.086894697308683e-05, "loss": 0.5535, "step": 51610 }, { "epoch": 0.69, "learning_rate": 1.0864606865222953e-05, "loss": 0.2665, "step": 51615 }, { "epoch": 0.69, "learning_rate": 1.086026738348629e-05, "loss": 0.3137, "step": 51620 }, { "epoch": 0.69, "learning_rate": 1.0855928528069037e-05, "loss": 0.69, "step": 51625 }, { "epoch": 0.69, "learning_rate": 1.0851590299163383e-05, "loss": 0.7842, "step": 51630 }, { "epoch": 0.69, "learning_rate": 1.0847252696961515e-05, "loss": 0.8552, "step": 51635 }, { "epoch": 0.69, "learning_rate": 1.084291572165553e-05, "loss": 0.7744, "step": 51640 }, { "epoch": 0.69, "learning_rate": 1.0838579373437562e-05, "loss": 0.5499, "step": 51645 }, { "epoch": 0.69, "learning_rate": 1.0834243652499674e-05, "loss": 0.829, "step": 51650 }, { "epoch": 0.69, "learning_rate": 1.0829908559033927e-05, "loss": 0.542, "step": 51655 }, { "epoch": 0.69, "learning_rate": 1.0825574093232343e-05, "loss": 0.3624, "step": 51660 }, { "epoch": 0.69, "learning_rate": 1.0821240255286904e-05, "loss": 0.731, "step": 51665 }, { "epoch": 0.69, "learning_rate": 1.08169070453896e-05, "loss": 0.5634, "step": 51670 }, { "epoch": 0.69, "learning_rate": 1.0812574463732356e-05, "loss": 0.49, "step": 51675 }, { "epoch": 0.69, "learning_rate": 1.0808242510507075e-05, "loss": 0.5599, "step": 51680 }, { "epoch": 0.69, "learning_rate": 1.0803911185905672e-05, "loss": 0.4772, "step": 51685 }, { "epoch": 0.69, "learning_rate": 1.0799580490119963e-05, "loss": 0.8793, "step": 51690 }, { "epoch": 0.69, "learning_rate": 1.0795250423341805e-05, "loss": 0.2946, "step": 51695 }, { "epoch": 0.69, "learning_rate": 1.079092098576299e-05, "loss": 1.1316, "step": 51700 }, { "epoch": 0.69, "learning_rate": 1.0786592177575281e-05, "loss": 0.9978, "step": 51705 }, { "epoch": 0.69, "learning_rate": 1.0782263998970438e-05, "loss": 0.5342, "step": 51710 }, { "epoch": 0.69, "learning_rate": 1.0777936450140172e-05, "loss": 1.3106, "step": 51715 }, { "epoch": 0.69, "learning_rate": 1.0773609531276172e-05, "loss": 1.2566, "step": 51720 }, { "epoch": 0.69, "learning_rate": 1.0769283242570086e-05, "loss": 0.5218, "step": 51725 }, { "epoch": 0.69, "learning_rate": 1.0764957584213569e-05, "loss": 0.7164, "step": 51730 }, { "epoch": 0.69, "learning_rate": 1.0760632556398215e-05, "loss": 0.5892, "step": 51735 }, { "epoch": 0.69, "learning_rate": 1.0756308159315592e-05, "loss": 0.5381, "step": 51740 }, { "epoch": 0.69, "learning_rate": 1.0751984393157277e-05, "loss": 0.4019, "step": 51745 }, { "epoch": 0.69, "learning_rate": 1.0747661258114753e-05, "loss": 0.9275, "step": 51750 }, { "epoch": 0.69, "learning_rate": 1.0743338754379545e-05, "loss": 0.6437, "step": 51755 }, { "epoch": 0.69, "learning_rate": 1.0739016882143094e-05, "loss": 0.6325, "step": 51760 }, { "epoch": 0.69, "learning_rate": 1.0734695641596861e-05, "loss": 0.6037, "step": 51765 }, { "epoch": 0.69, "learning_rate": 1.0730375032932244e-05, "loss": 0.9136, "step": 51770 }, { "epoch": 0.69, "learning_rate": 1.0726055056340614e-05, "loss": 0.6214, "step": 51775 }, { "epoch": 0.69, "learning_rate": 1.0721735712013344e-05, "loss": 0.6645, "step": 51780 }, { "epoch": 0.69, "learning_rate": 1.0717417000141753e-05, "loss": 0.161, "step": 51785 }, { "epoch": 0.69, "learning_rate": 1.0713098920917123e-05, "loss": 1.2304, "step": 51790 }, { "epoch": 0.69, "learning_rate": 1.0708781474530755e-05, "loss": 0.3883, "step": 51795 }, { "epoch": 0.69, "learning_rate": 1.0704464661173851e-05, "loss": 1.0212, "step": 51800 }, { "epoch": 0.69, "learning_rate": 1.0700148481037655e-05, "loss": 0.8503, "step": 51805 }, { "epoch": 0.69, "learning_rate": 1.0695832934313344e-05, "loss": 1.1209, "step": 51810 }, { "epoch": 0.69, "learning_rate": 1.069151802119206e-05, "loss": 0.9601, "step": 51815 }, { "epoch": 0.69, "learning_rate": 1.0687203741864953e-05, "loss": 0.723, "step": 51820 }, { "epoch": 0.69, "learning_rate": 1.0682890096523118e-05, "loss": 0.1638, "step": 51825 }, { "epoch": 0.69, "learning_rate": 1.0678577085357624e-05, "loss": 1.4323, "step": 51830 }, { "epoch": 0.69, "learning_rate": 1.0674264708559508e-05, "loss": 1.0953, "step": 51835 }, { "epoch": 0.69, "learning_rate": 1.0669952966319808e-05, "loss": 1.4395, "step": 51840 }, { "epoch": 0.69, "learning_rate": 1.0665641858829494e-05, "loss": 0.4651, "step": 51845 }, { "epoch": 0.69, "learning_rate": 1.066133138627953e-05, "loss": 0.3522, "step": 51850 }, { "epoch": 0.69, "learning_rate": 1.0657021548860869e-05, "loss": 1.085, "step": 51855 }, { "epoch": 0.69, "learning_rate": 1.0652712346764379e-05, "loss": 0.7442, "step": 51860 }, { "epoch": 0.69, "learning_rate": 1.0648403780180963e-05, "loss": 0.9568, "step": 51865 }, { "epoch": 0.69, "learning_rate": 1.064409584930146e-05, "loss": 0.5047, "step": 51870 }, { "epoch": 0.7, "learning_rate": 1.0639788554316682e-05, "loss": 1.02, "step": 51875 }, { "epoch": 0.7, "learning_rate": 1.0635481895417441e-05, "loss": 1.0904, "step": 51880 }, { "epoch": 0.7, "learning_rate": 1.0631175872794478e-05, "loss": 0.5884, "step": 51885 }, { "epoch": 0.7, "learning_rate": 1.0626870486638546e-05, "loss": 0.5624, "step": 51890 }, { "epoch": 0.7, "learning_rate": 1.0622565737140348e-05, "loss": 0.5383, "step": 51895 }, { "epoch": 0.7, "learning_rate": 1.0618261624490547e-05, "loss": 0.671, "step": 51900 }, { "epoch": 0.7, "learning_rate": 1.0613958148879827e-05, "loss": 1.1099, "step": 51905 }, { "epoch": 0.7, "learning_rate": 1.0609655310498773e-05, "loss": 0.2169, "step": 51910 }, { "epoch": 0.7, "learning_rate": 1.0605353109538002e-05, "loss": 0.9065, "step": 51915 }, { "epoch": 0.7, "learning_rate": 1.0601051546188076e-05, "loss": 0.3079, "step": 51920 }, { "epoch": 0.7, "learning_rate": 1.059675062063952e-05, "loss": 0.545, "step": 51925 }, { "epoch": 0.7, "learning_rate": 1.0592450333082864e-05, "loss": 1.0964, "step": 51930 }, { "epoch": 0.7, "learning_rate": 1.058815068370858e-05, "loss": 0.676, "step": 51935 }, { "epoch": 0.7, "learning_rate": 1.0583851672707124e-05, "loss": 0.9955, "step": 51940 }, { "epoch": 0.7, "learning_rate": 1.0579553300268905e-05, "loss": 0.5638, "step": 51945 }, { "epoch": 0.7, "learning_rate": 1.0575255566584342e-05, "loss": 0.8386, "step": 51950 }, { "epoch": 0.7, "learning_rate": 1.0570958471843789e-05, "loss": 0.6419, "step": 51955 }, { "epoch": 0.7, "learning_rate": 1.0566662016237584e-05, "loss": 0.6435, "step": 51960 }, { "epoch": 0.7, "learning_rate": 1.0562366199956059e-05, "loss": 1.1404, "step": 51965 }, { "epoch": 0.7, "learning_rate": 1.0558071023189467e-05, "loss": 0.7167, "step": 51970 }, { "epoch": 0.7, "learning_rate": 1.0553776486128087e-05, "loss": 0.5947, "step": 51975 }, { "epoch": 0.7, "learning_rate": 1.0549482588962134e-05, "loss": 0.4823, "step": 51980 }, { "epoch": 0.7, "learning_rate": 1.05451893318818e-05, "loss": 1.0272, "step": 51985 }, { "epoch": 0.7, "learning_rate": 1.0540896715077276e-05, "loss": 0.6224, "step": 51990 }, { "epoch": 0.7, "learning_rate": 1.0536604738738676e-05, "loss": 0.6746, "step": 51995 }, { "epoch": 0.7, "learning_rate": 1.053231340305614e-05, "loss": 1.0118, "step": 52000 }, { "epoch": 0.7, "learning_rate": 1.0528022708219743e-05, "loss": 0.9542, "step": 52005 }, { "epoch": 0.7, "learning_rate": 1.0523732654419527e-05, "loss": 0.7006, "step": 52010 }, { "epoch": 0.7, "learning_rate": 1.051944324184555e-05, "loss": 0.9006, "step": 52015 }, { "epoch": 0.7, "learning_rate": 1.0515154470687777e-05, "loss": 0.9912, "step": 52020 }, { "epoch": 0.7, "learning_rate": 1.0510866341136206e-05, "loss": 0.162, "step": 52025 }, { "epoch": 0.7, "learning_rate": 1.0506578853380766e-05, "loss": 0.9479, "step": 52030 }, { "epoch": 0.7, "learning_rate": 1.0502292007611366e-05, "loss": 2.7782, "step": 52035 }, { "epoch": 0.7, "learning_rate": 1.0498005804017911e-05, "loss": 0.9582, "step": 52040 }, { "epoch": 0.7, "learning_rate": 1.0493720242790245e-05, "loss": 0.362, "step": 52045 }, { "epoch": 0.7, "learning_rate": 1.0489435324118201e-05, "loss": 1.0696, "step": 52050 }, { "epoch": 0.7, "learning_rate": 1.0485151048191569e-05, "loss": 0.6727, "step": 52055 }, { "epoch": 0.7, "learning_rate": 1.0480867415200141e-05, "loss": 0.8135, "step": 52060 }, { "epoch": 0.7, "learning_rate": 1.0476584425333646e-05, "loss": 0.2925, "step": 52065 }, { "epoch": 0.7, "learning_rate": 1.0472302078781796e-05, "loss": 1.1224, "step": 52070 }, { "epoch": 0.7, "learning_rate": 1.0468020375734303e-05, "loss": 0.3578, "step": 52075 }, { "epoch": 0.7, "learning_rate": 1.0463739316380786e-05, "loss": 0.9023, "step": 52080 }, { "epoch": 0.7, "learning_rate": 1.0459458900910896e-05, "loss": 1.1989, "step": 52085 }, { "epoch": 0.7, "learning_rate": 1.045517912951425e-05, "loss": 0.6136, "step": 52090 }, { "epoch": 0.7, "learning_rate": 1.0450900002380385e-05, "loss": 0.5832, "step": 52095 }, { "epoch": 0.7, "learning_rate": 1.044662151969887e-05, "loss": 0.6486, "step": 52100 }, { "epoch": 0.7, "learning_rate": 1.0442343681659208e-05, "loss": 0.3467, "step": 52105 }, { "epoch": 0.7, "learning_rate": 1.0438066488450898e-05, "loss": 1.131, "step": 52110 }, { "epoch": 0.7, "learning_rate": 1.0433789940263394e-05, "loss": 0.7131, "step": 52115 }, { "epoch": 0.7, "learning_rate": 1.0429514037286111e-05, "loss": 0.9087, "step": 52120 }, { "epoch": 0.7, "learning_rate": 1.0425238779708482e-05, "loss": 0.4724, "step": 52125 }, { "epoch": 0.7, "learning_rate": 1.0420964167719842e-05, "loss": 0.4738, "step": 52130 }, { "epoch": 0.7, "learning_rate": 1.0416690201509562e-05, "loss": 0.9065, "step": 52135 }, { "epoch": 0.7, "learning_rate": 1.0412416881266949e-05, "loss": 0.851, "step": 52140 }, { "epoch": 0.7, "learning_rate": 1.0408144207181277e-05, "loss": 0.8807, "step": 52145 }, { "epoch": 0.7, "learning_rate": 1.0403872179441826e-05, "loss": 0.9493, "step": 52150 }, { "epoch": 0.7, "learning_rate": 1.0399600798237816e-05, "loss": 0.7577, "step": 52155 }, { "epoch": 0.7, "learning_rate": 1.0395330063758446e-05, "loss": 0.4492, "step": 52160 }, { "epoch": 0.7, "learning_rate": 1.0391059976192879e-05, "loss": 0.3856, "step": 52165 }, { "epoch": 0.7, "learning_rate": 1.0386790535730282e-05, "loss": 0.4083, "step": 52170 }, { "epoch": 0.7, "learning_rate": 1.0382521742559753e-05, "loss": 0.5191, "step": 52175 }, { "epoch": 0.7, "learning_rate": 1.0378253596870374e-05, "loss": 0.9221, "step": 52180 }, { "epoch": 0.7, "learning_rate": 1.037398609885123e-05, "loss": 1.0208, "step": 52185 }, { "epoch": 0.7, "learning_rate": 1.0369719248691311e-05, "loss": 0.839, "step": 52190 }, { "epoch": 0.7, "learning_rate": 1.0365453046579635e-05, "loss": 1.0367, "step": 52195 }, { "epoch": 0.7, "learning_rate": 1.0361187492705194e-05, "loss": 0.7807, "step": 52200 }, { "epoch": 0.7, "learning_rate": 1.0356922587256893e-05, "loss": 0.6754, "step": 52205 }, { "epoch": 0.7, "learning_rate": 1.0352658330423673e-05, "loss": 0.7253, "step": 52210 }, { "epoch": 0.7, "learning_rate": 1.0348394722394403e-05, "loss": 0.6765, "step": 52215 }, { "epoch": 0.7, "learning_rate": 1.0344131763357955e-05, "loss": 0.8934, "step": 52220 }, { "epoch": 0.7, "learning_rate": 1.033986945350315e-05, "loss": 0.8435, "step": 52225 }, { "epoch": 0.7, "learning_rate": 1.0335607793018775e-05, "loss": 0.6155, "step": 52230 }, { "epoch": 0.7, "learning_rate": 1.0331346782093631e-05, "loss": 0.7164, "step": 52235 }, { "epoch": 0.7, "learning_rate": 1.0327086420916421e-05, "loss": 1.6761, "step": 52240 }, { "epoch": 0.7, "learning_rate": 1.0322826709675884e-05, "loss": 0.3343, "step": 52245 }, { "epoch": 0.7, "learning_rate": 1.0318567648560698e-05, "loss": 0.2596, "step": 52250 }, { "epoch": 0.7, "learning_rate": 1.0314309237759506e-05, "loss": 0.568, "step": 52255 }, { "epoch": 0.7, "learning_rate": 1.0310051477460955e-05, "loss": 0.616, "step": 52260 }, { "epoch": 0.7, "learning_rate": 1.030579436785363e-05, "loss": 0.5811, "step": 52265 }, { "epoch": 0.7, "learning_rate": 1.0301537909126103e-05, "loss": 0.4419, "step": 52270 }, { "epoch": 0.7, "learning_rate": 1.0297282101466905e-05, "loss": 0.553, "step": 52275 }, { "epoch": 0.7, "learning_rate": 1.029302694506456e-05, "loss": 0.5489, "step": 52280 }, { "epoch": 0.7, "learning_rate": 1.0288772440107547e-05, "loss": 1.0148, "step": 52285 }, { "epoch": 0.7, "learning_rate": 1.0284518586784309e-05, "loss": 1.1541, "step": 52290 }, { "epoch": 0.7, "learning_rate": 1.0280265385283295e-05, "loss": 0.1713, "step": 52295 }, { "epoch": 0.7, "learning_rate": 1.0276012835792865e-05, "loss": 0.3265, "step": 52300 }, { "epoch": 0.7, "learning_rate": 1.0271760938501404e-05, "loss": 0.7711, "step": 52305 }, { "epoch": 0.7, "learning_rate": 1.0267509693597268e-05, "loss": 0.5056, "step": 52310 }, { "epoch": 0.7, "learning_rate": 1.0263259101268735e-05, "loss": 0.5879, "step": 52315 }, { "epoch": 0.7, "learning_rate": 1.0259009161704103e-05, "loss": 0.4539, "step": 52320 }, { "epoch": 0.7, "learning_rate": 1.025475987509161e-05, "loss": 0.6998, "step": 52325 }, { "epoch": 0.7, "learning_rate": 1.0250511241619495e-05, "loss": 0.5157, "step": 52330 }, { "epoch": 0.7, "learning_rate": 1.0246263261475945e-05, "loss": 0.5809, "step": 52335 }, { "epoch": 0.7, "learning_rate": 1.024201593484911e-05, "loss": 0.2615, "step": 52340 }, { "epoch": 0.7, "learning_rate": 1.0237769261927157e-05, "loss": 1.2935, "step": 52345 }, { "epoch": 0.7, "learning_rate": 1.0233523242898155e-05, "loss": 0.9691, "step": 52350 }, { "epoch": 0.7, "learning_rate": 1.0229277877950208e-05, "loss": 0.8495, "step": 52355 }, { "epoch": 0.7, "learning_rate": 1.0225033167271353e-05, "loss": 1.347, "step": 52360 }, { "epoch": 0.7, "learning_rate": 1.0220789111049606e-05, "loss": 0.527, "step": 52365 }, { "epoch": 0.7, "learning_rate": 1.021654570947297e-05, "loss": 0.6483, "step": 52370 }, { "epoch": 0.7, "learning_rate": 1.02123029627294e-05, "loss": 0.6079, "step": 52375 }, { "epoch": 0.7, "learning_rate": 1.0208060871006828e-05, "loss": 0.4075, "step": 52380 }, { "epoch": 0.7, "learning_rate": 1.020381943449315e-05, "loss": 0.6783, "step": 52385 }, { "epoch": 0.7, "learning_rate": 1.0199578653376256e-05, "loss": 0.3477, "step": 52390 }, { "epoch": 0.7, "learning_rate": 1.0195338527843985e-05, "loss": 0.3439, "step": 52395 }, { "epoch": 0.7, "learning_rate": 1.0191099058084141e-05, "loss": 0.8262, "step": 52400 }, { "epoch": 0.7, "learning_rate": 1.018686024428454e-05, "loss": 1.0373, "step": 52405 }, { "epoch": 0.7, "learning_rate": 1.0182622086632907e-05, "loss": 0.5856, "step": 52410 }, { "epoch": 0.7, "learning_rate": 1.0178384585316984e-05, "loss": 0.38, "step": 52415 }, { "epoch": 0.7, "learning_rate": 1.0174147740524492e-05, "loss": 0.3944, "step": 52420 }, { "epoch": 0.7, "learning_rate": 1.0169911552443068e-05, "loss": 0.853, "step": 52425 }, { "epoch": 0.7, "learning_rate": 1.0165676021260375e-05, "loss": 1.5068, "step": 52430 }, { "epoch": 0.7, "learning_rate": 1.0161441147164014e-05, "loss": 1.0409, "step": 52435 }, { "epoch": 0.7, "learning_rate": 1.0157206930341583e-05, "loss": 0.7448, "step": 52440 }, { "epoch": 0.7, "learning_rate": 1.015297337098063e-05, "loss": 1.0329, "step": 52445 }, { "epoch": 0.7, "learning_rate": 1.0149586996990151e-05, "loss": 2.2663, "step": 52450 }, { "epoch": 0.7, "learning_rate": 1.014535462153239e-05, "loss": 0.4607, "step": 52455 }, { "epoch": 0.7, "learning_rate": 1.0141122904061115e-05, "loss": 0.602, "step": 52460 }, { "epoch": 0.7, "learning_rate": 1.0136891844763758e-05, "loss": 0.9394, "step": 52465 }, { "epoch": 0.7, "learning_rate": 1.0132661443827726e-05, "loss": 0.3474, "step": 52470 }, { "epoch": 0.7, "learning_rate": 1.0128431701440422e-05, "loss": 1.0254, "step": 52475 }, { "epoch": 0.7, "learning_rate": 1.0124202617789192e-05, "loss": 0.611, "step": 52480 }, { "epoch": 0.7, "learning_rate": 1.0119974193061365e-05, "loss": 0.3808, "step": 52485 }, { "epoch": 0.7, "learning_rate": 1.0115746427444231e-05, "loss": 0.3892, "step": 52490 }, { "epoch": 0.7, "learning_rate": 1.0111519321125076e-05, "loss": 1.1568, "step": 52495 }, { "epoch": 0.7, "learning_rate": 1.010729287429113e-05, "loss": 0.6649, "step": 52500 }, { "epoch": 0.7, "learning_rate": 1.0103067087129591e-05, "loss": 0.7077, "step": 52505 }, { "epoch": 0.7, "learning_rate": 1.0098841959827667e-05, "loss": 0.7796, "step": 52510 }, { "epoch": 0.7, "learning_rate": 1.0094617492572495e-05, "loss": 0.7652, "step": 52515 }, { "epoch": 0.7, "learning_rate": 1.0090393685551196e-05, "loss": 0.6638, "step": 52520 }, { "epoch": 0.7, "learning_rate": 1.0086170538950862e-05, "loss": 0.4895, "step": 52525 }, { "epoch": 0.7, "learning_rate": 1.0081948052958567e-05, "loss": 0.4812, "step": 52530 }, { "epoch": 0.7, "learning_rate": 1.0077726227761342e-05, "loss": 0.9254, "step": 52535 }, { "epoch": 0.7, "learning_rate": 1.0073505063546182e-05, "loss": 0.3231, "step": 52540 }, { "epoch": 0.7, "learning_rate": 1.006928456050008e-05, "loss": 0.9284, "step": 52545 }, { "epoch": 0.7, "learning_rate": 1.006506471880998e-05, "loss": 0.7802, "step": 52550 }, { "epoch": 0.7, "learning_rate": 1.0060845538662783e-05, "loss": 1.144, "step": 52555 }, { "epoch": 0.7, "learning_rate": 1.005662702024541e-05, "loss": 1.0962, "step": 52560 }, { "epoch": 0.7, "learning_rate": 1.0052409163744683e-05, "loss": 0.7448, "step": 52565 }, { "epoch": 0.7, "learning_rate": 1.004819196934746e-05, "loss": 0.4746, "step": 52570 }, { "epoch": 0.7, "learning_rate": 1.0043975437240527e-05, "loss": 1.0299, "step": 52575 }, { "epoch": 0.7, "learning_rate": 1.0039759567610654e-05, "loss": 0.4346, "step": 52580 }, { "epoch": 0.7, "learning_rate": 1.0035544360644594e-05, "loss": 0.6761, "step": 52585 }, { "epoch": 0.7, "learning_rate": 1.0031329816529059e-05, "loss": 1.3309, "step": 52590 }, { "epoch": 0.7, "learning_rate": 1.0027115935450724e-05, "loss": 1.0796, "step": 52595 }, { "epoch": 0.7, "learning_rate": 1.0022902717596236e-05, "loss": 0.7352, "step": 52600 }, { "epoch": 0.7, "learning_rate": 1.0018690163152241e-05, "loss": 0.5119, "step": 52605 }, { "epoch": 0.7, "learning_rate": 1.0014478272305323e-05, "loss": 0.5604, "step": 52610 }, { "epoch": 0.7, "learning_rate": 1.0010267045242037e-05, "loss": 0.5093, "step": 52615 }, { "epoch": 0.71, "learning_rate": 1.0006056482148936e-05, "loss": 0.3642, "step": 52620 }, { "epoch": 0.71, "learning_rate": 1.0001846583212524e-05, "loss": 1.1415, "step": 52625 }, { "epoch": 0.71, "learning_rate": 9.997637348619274e-06, "loss": 0.8876, "step": 52630 }, { "epoch": 0.71, "learning_rate": 9.993428778555627e-06, "loss": 0.5089, "step": 52635 }, { "epoch": 0.71, "learning_rate": 9.98922087320802e-06, "loss": 1.0779, "step": 52640 }, { "epoch": 0.71, "learning_rate": 9.985013632762826e-06, "loss": 1.2908, "step": 52645 }, { "epoch": 0.71, "learning_rate": 9.980807057406405e-06, "loss": 0.9027, "step": 52650 }, { "epoch": 0.71, "learning_rate": 9.976601147325104e-06, "loss": 0.4923, "step": 52655 }, { "epoch": 0.71, "learning_rate": 9.972395902705208e-06, "loss": 0.6757, "step": 52660 }, { "epoch": 0.71, "learning_rate": 9.968191323732986e-06, "loss": 0.8355, "step": 52665 }, { "epoch": 0.71, "learning_rate": 9.963987410594706e-06, "loss": 0.5964, "step": 52670 }, { "epoch": 0.71, "learning_rate": 9.959784163476541e-06, "loss": 1.2956, "step": 52675 }, { "epoch": 0.71, "learning_rate": 9.955581582564702e-06, "loss": 1.0648, "step": 52680 }, { "epoch": 0.71, "learning_rate": 9.951379668045335e-06, "loss": 1.5539, "step": 52685 }, { "epoch": 0.71, "learning_rate": 9.947178420104556e-06, "loss": 0.7754, "step": 52690 }, { "epoch": 0.71, "learning_rate": 9.942977838928472e-06, "loss": 0.1376, "step": 52695 }, { "epoch": 0.71, "learning_rate": 9.938777924703144e-06, "loss": 0.638, "step": 52700 }, { "epoch": 0.71, "learning_rate": 9.934578677614604e-06, "loss": 0.0996, "step": 52705 }, { "epoch": 0.71, "learning_rate": 9.930380097848849e-06, "loss": 0.5536, "step": 52710 }, { "epoch": 0.71, "learning_rate": 9.926182185591874e-06, "loss": 0.5858, "step": 52715 }, { "epoch": 0.71, "learning_rate": 9.921984941029617e-06, "loss": 1.0571, "step": 52720 }, { "epoch": 0.71, "learning_rate": 9.917788364347986e-06, "loss": 0.5825, "step": 52725 }, { "epoch": 0.71, "learning_rate": 9.913592455732881e-06, "loss": 0.7248, "step": 52730 }, { "epoch": 0.71, "learning_rate": 9.909397215370159e-06, "loss": 0.8469, "step": 52735 }, { "epoch": 0.71, "learning_rate": 9.905202643445644e-06, "loss": 0.7622, "step": 52740 }, { "epoch": 0.71, "learning_rate": 9.901008740145127e-06, "loss": 0.5878, "step": 52745 }, { "epoch": 0.71, "learning_rate": 9.896815505654391e-06, "loss": 0.9449, "step": 52750 }, { "epoch": 0.71, "learning_rate": 9.89262294015917e-06, "loss": 1.4389, "step": 52755 }, { "epoch": 0.71, "learning_rate": 9.888431043845168e-06, "loss": 0.7029, "step": 52760 }, { "epoch": 0.71, "learning_rate": 9.884239816898074e-06, "loss": 0.9724, "step": 52765 }, { "epoch": 0.71, "learning_rate": 9.880049259503537e-06, "loss": 0.6592, "step": 52770 }, { "epoch": 0.71, "learning_rate": 9.875859371847165e-06, "loss": 0.9986, "step": 52775 }, { "epoch": 0.71, "learning_rate": 9.871670154114579e-06, "loss": 0.4924, "step": 52780 }, { "epoch": 0.71, "learning_rate": 9.867481606491302e-06, "loss": 1.1027, "step": 52785 }, { "epoch": 0.71, "learning_rate": 9.863293729162892e-06, "loss": 0.5008, "step": 52790 }, { "epoch": 0.71, "learning_rate": 9.859106522314842e-06, "loss": 0.5387, "step": 52795 }, { "epoch": 0.71, "learning_rate": 9.854919986132618e-06, "loss": 0.261, "step": 52800 }, { "epoch": 0.71, "learning_rate": 9.85073412080168e-06, "loss": 0.1915, "step": 52805 }, { "epoch": 0.71, "learning_rate": 9.846548926507429e-06, "loss": 0.6263, "step": 52810 }, { "epoch": 0.71, "learning_rate": 9.842364403435253e-06, "loss": 0.8862, "step": 52815 }, { "epoch": 0.71, "learning_rate": 9.838180551770493e-06, "loss": 0.5156, "step": 52820 }, { "epoch": 0.71, "learning_rate": 9.833997371698489e-06, "loss": 0.6571, "step": 52825 }, { "epoch": 0.71, "learning_rate": 9.829814863404529e-06, "loss": 0.8801, "step": 52830 }, { "epoch": 0.71, "learning_rate": 9.825633027073868e-06, "loss": 1.0958, "step": 52835 }, { "epoch": 0.71, "learning_rate": 9.821451862891759e-06, "loss": 0.6552, "step": 52840 }, { "epoch": 0.71, "learning_rate": 9.817271371043396e-06, "loss": 0.8822, "step": 52845 }, { "epoch": 0.71, "learning_rate": 9.813091551713946e-06, "loss": 0.6768, "step": 52850 }, { "epoch": 0.71, "learning_rate": 9.808912405088572e-06, "loss": 0.5212, "step": 52855 }, { "epoch": 0.71, "learning_rate": 9.804733931352378e-06, "loss": 0.721, "step": 52860 }, { "epoch": 0.71, "learning_rate": 9.800556130690452e-06, "loss": 0.9643, "step": 52865 }, { "epoch": 0.71, "learning_rate": 9.796379003287839e-06, "loss": 0.5028, "step": 52870 }, { "epoch": 0.71, "learning_rate": 9.792202549329585e-06, "loss": 0.7486, "step": 52875 }, { "epoch": 0.71, "learning_rate": 9.788026769000677e-06, "loss": 1.143, "step": 52880 }, { "epoch": 0.71, "learning_rate": 9.783851662486068e-06, "loss": 1.0592, "step": 52885 }, { "epoch": 0.71, "learning_rate": 9.779677229970727e-06, "loss": 1.3658, "step": 52890 }, { "epoch": 0.71, "learning_rate": 9.775503471639522e-06, "loss": 0.6492, "step": 52895 }, { "epoch": 0.71, "learning_rate": 9.771330387677355e-06, "loss": 0.988, "step": 52900 }, { "epoch": 0.71, "learning_rate": 9.767157978269065e-06, "loss": 0.4986, "step": 52905 }, { "epoch": 0.71, "learning_rate": 9.762986243599458e-06, "loss": 0.2193, "step": 52910 }, { "epoch": 0.71, "learning_rate": 9.758815183853346e-06, "loss": 1.393, "step": 52915 }, { "epoch": 0.71, "learning_rate": 9.754644799215471e-06, "loss": 0.1575, "step": 52920 }, { "epoch": 0.71, "learning_rate": 9.750475089870559e-06, "loss": 0.2914, "step": 52925 }, { "epoch": 0.71, "learning_rate": 9.746306056003301e-06, "loss": 0.6092, "step": 52930 }, { "epoch": 0.71, "learning_rate": 9.742137697798382e-06, "loss": 0.51, "step": 52935 }, { "epoch": 0.71, "learning_rate": 9.737970015440432e-06, "loss": 0.8422, "step": 52940 }, { "epoch": 0.71, "learning_rate": 9.733803009114045e-06, "loss": 0.1632, "step": 52945 }, { "epoch": 0.71, "learning_rate": 9.729636679003822e-06, "loss": 1.113, "step": 52950 }, { "epoch": 0.71, "learning_rate": 9.725471025294297e-06, "loss": 0.5674, "step": 52955 }, { "epoch": 0.71, "learning_rate": 9.721306048169982e-06, "loss": 0.2837, "step": 52960 }, { "epoch": 0.71, "learning_rate": 9.717141747815381e-06, "loss": 0.8976, "step": 52965 }, { "epoch": 0.71, "learning_rate": 9.71297812441494e-06, "loss": 0.7207, "step": 52970 }, { "epoch": 0.71, "learning_rate": 9.708815178153091e-06, "loss": 0.9572, "step": 52975 }, { "epoch": 0.71, "learning_rate": 9.704652909214223e-06, "loss": 0.6009, "step": 52980 }, { "epoch": 0.71, "learning_rate": 9.70049131778272e-06, "loss": 0.261, "step": 52985 }, { "epoch": 0.71, "learning_rate": 9.696330404042908e-06, "loss": 0.2904, "step": 52990 }, { "epoch": 0.71, "learning_rate": 9.692170168179091e-06, "loss": 0.3782, "step": 52995 }, { "epoch": 0.71, "learning_rate": 9.688010610375569e-06, "loss": 0.7975, "step": 53000 }, { "epoch": 0.71, "learning_rate": 9.683851730816557e-06, "loss": 1.1034, "step": 53005 }, { "epoch": 0.71, "learning_rate": 9.680525115629203e-06, "loss": 2.2526, "step": 53010 }, { "epoch": 0.71, "learning_rate": 9.676367457374555e-06, "loss": 0.8338, "step": 53015 }, { "epoch": 0.71, "learning_rate": 9.672210477880164e-06, "loss": 0.1971, "step": 53020 }, { "epoch": 0.71, "learning_rate": 9.66805417733016e-06, "loss": 0.9946, "step": 53025 }, { "epoch": 0.71, "learning_rate": 9.66389855590867e-06, "loss": 0.6098, "step": 53030 }, { "epoch": 0.71, "learning_rate": 9.659743613799734e-06, "loss": 0.4111, "step": 53035 }, { "epoch": 0.71, "learning_rate": 9.655589351187418e-06, "loss": 0.8544, "step": 53040 }, { "epoch": 0.71, "learning_rate": 9.651435768255728e-06, "loss": 0.9141, "step": 53045 }, { "epoch": 0.71, "learning_rate": 9.64728286518864e-06, "loss": 0.76, "step": 53050 }, { "epoch": 0.71, "learning_rate": 9.643130642170122e-06, "loss": 0.7332, "step": 53055 }, { "epoch": 0.71, "learning_rate": 9.638979099384088e-06, "loss": 0.5838, "step": 53060 }, { "epoch": 0.71, "learning_rate": 9.634828237014431e-06, "loss": 0.2794, "step": 53065 }, { "epoch": 0.71, "learning_rate": 9.630678055245004e-06, "loss": 0.5223, "step": 53070 }, { "epoch": 0.71, "learning_rate": 9.62652855425966e-06, "loss": 0.7952, "step": 53075 }, { "epoch": 0.71, "learning_rate": 9.622379734242188e-06, "loss": 0.3572, "step": 53080 }, { "epoch": 0.71, "learning_rate": 9.618231595376354e-06, "loss": 0.7174, "step": 53085 }, { "epoch": 0.71, "learning_rate": 9.614084137845916e-06, "loss": 0.3355, "step": 53090 }, { "epoch": 0.71, "learning_rate": 9.609937361834576e-06, "loss": 0.5064, "step": 53095 }, { "epoch": 0.71, "learning_rate": 9.60579126752601e-06, "loss": 0.6728, "step": 53100 }, { "epoch": 0.71, "learning_rate": 9.601645855103885e-06, "loss": 0.901, "step": 53105 }, { "epoch": 0.71, "learning_rate": 9.597501124751812e-06, "loss": 0.6661, "step": 53110 }, { "epoch": 0.71, "learning_rate": 9.593357076653384e-06, "loss": 0.5308, "step": 53115 }, { "epoch": 0.71, "learning_rate": 9.589213710992151e-06, "loss": 0.3182, "step": 53120 }, { "epoch": 0.71, "learning_rate": 9.585071027951662e-06, "loss": 0.7011, "step": 53125 }, { "epoch": 0.71, "learning_rate": 9.580929027715407e-06, "loss": 1.2193, "step": 53130 }, { "epoch": 0.71, "learning_rate": 9.57678771046685e-06, "loss": 0.7428, "step": 53135 }, { "epoch": 0.71, "learning_rate": 9.572647076389454e-06, "loss": 1.3238, "step": 53140 }, { "epoch": 0.71, "learning_rate": 9.568507125666593e-06, "loss": 0.4367, "step": 53145 }, { "epoch": 0.71, "learning_rate": 9.564367858481676e-06, "loss": 0.9718, "step": 53150 }, { "epoch": 0.71, "learning_rate": 9.56022927501804e-06, "loss": 0.4149, "step": 53155 }, { "epoch": 0.71, "learning_rate": 9.556091375458994e-06, "loss": 0.4118, "step": 53160 }, { "epoch": 0.71, "learning_rate": 9.551954159987848e-06, "loss": 0.4224, "step": 53165 }, { "epoch": 0.71, "learning_rate": 9.547817628787848e-06, "loss": 1.0575, "step": 53170 }, { "epoch": 0.71, "learning_rate": 9.543681782042221e-06, "loss": 0.8471, "step": 53175 }, { "epoch": 0.71, "learning_rate": 9.53954661993416e-06, "loss": 1.2796, "step": 53180 }, { "epoch": 0.71, "learning_rate": 9.535412142646841e-06, "loss": 0.9745, "step": 53185 }, { "epoch": 0.71, "learning_rate": 9.531278350363401e-06, "loss": 0.314, "step": 53190 }, { "epoch": 0.71, "learning_rate": 9.527145243266933e-06, "loss": 1.2131, "step": 53195 }, { "epoch": 0.71, "learning_rate": 9.523012821540531e-06, "loss": 1.6109, "step": 53200 }, { "epoch": 0.71, "learning_rate": 9.518881085367232e-06, "loss": 0.6023, "step": 53205 }, { "epoch": 0.71, "learning_rate": 9.51475003493004e-06, "loss": 0.2411, "step": 53210 }, { "epoch": 0.71, "learning_rate": 9.510619670411963e-06, "loss": 0.6376, "step": 53215 }, { "epoch": 0.71, "learning_rate": 9.506489991995942e-06, "loss": 0.9642, "step": 53220 }, { "epoch": 0.71, "learning_rate": 9.502360999864907e-06, "loss": 0.6351, "step": 53225 }, { "epoch": 0.71, "learning_rate": 9.498232694201733e-06, "loss": 0.7345, "step": 53230 }, { "epoch": 0.71, "learning_rate": 9.49410507518931e-06, "loss": 1.1371, "step": 53235 }, { "epoch": 0.71, "learning_rate": 9.489978143010458e-06, "loss": 0.7948, "step": 53240 }, { "epoch": 0.71, "learning_rate": 9.48585189784797e-06, "loss": 0.5016, "step": 53245 }, { "epoch": 0.71, "learning_rate": 9.481726339884647e-06, "loss": 0.2733, "step": 53250 }, { "epoch": 0.71, "learning_rate": 9.477601469303194e-06, "loss": 0.6797, "step": 53255 }, { "epoch": 0.71, "learning_rate": 9.473477286286347e-06, "loss": 0.6599, "step": 53260 }, { "epoch": 0.71, "learning_rate": 9.469353791016782e-06, "loss": 0.5551, "step": 53265 }, { "epoch": 0.71, "learning_rate": 9.465230983677137e-06, "loss": 0.1865, "step": 53270 }, { "epoch": 0.71, "learning_rate": 9.461108864450049e-06, "loss": 0.4256, "step": 53275 }, { "epoch": 0.71, "learning_rate": 9.4569874335181e-06, "loss": 0.8336, "step": 53280 }, { "epoch": 0.71, "learning_rate": 9.45286669106385e-06, "loss": 0.0575, "step": 53285 }, { "epoch": 0.71, "learning_rate": 9.448746637269814e-06, "loss": 0.0949, "step": 53290 }, { "epoch": 0.71, "learning_rate": 9.444627272318512e-06, "loss": 1.1347, "step": 53295 }, { "epoch": 0.71, "learning_rate": 9.440508596392402e-06, "loss": 0.7025, "step": 53300 }, { "epoch": 0.71, "learning_rate": 9.43639060967391e-06, "loss": 0.7471, "step": 53305 }, { "epoch": 0.71, "learning_rate": 9.43227331234546e-06, "loss": 0.6523, "step": 53310 }, { "epoch": 0.71, "learning_rate": 9.42815670458942e-06, "loss": 0.8567, "step": 53315 }, { "epoch": 0.71, "learning_rate": 9.424040786588127e-06, "loss": 0.5281, "step": 53320 }, { "epoch": 0.71, "learning_rate": 9.419925558523906e-06, "loss": 0.8382, "step": 53325 }, { "epoch": 0.71, "learning_rate": 9.415811020579044e-06, "loss": 0.2461, "step": 53330 }, { "epoch": 0.71, "learning_rate": 9.411697172935788e-06, "loss": 0.5413, "step": 53335 }, { "epoch": 0.71, "learning_rate": 9.40758401577635e-06, "loss": 1.0673, "step": 53340 }, { "epoch": 0.71, "learning_rate": 9.403471549282944e-06, "loss": 0.8274, "step": 53345 }, { "epoch": 0.71, "learning_rate": 9.399359773637723e-06, "loss": 0.3229, "step": 53350 }, { "epoch": 0.71, "learning_rate": 9.395248689022804e-06, "loss": 0.4783, "step": 53355 }, { "epoch": 0.71, "learning_rate": 9.391138295620319e-06, "loss": 0.6063, "step": 53360 }, { "epoch": 0.72, "learning_rate": 9.387028593612302e-06, "loss": 0.9406, "step": 53365 }, { "epoch": 0.72, "learning_rate": 9.382919583180819e-06, "loss": 0.3993, "step": 53370 }, { "epoch": 0.72, "learning_rate": 9.378811264507867e-06, "loss": 0.7917, "step": 53375 }, { "epoch": 0.72, "learning_rate": 9.374703637775418e-06, "loss": 0.5877, "step": 53380 }, { "epoch": 0.72, "learning_rate": 9.370596703165432e-06, "loss": 0.685, "step": 53385 }, { "epoch": 0.72, "learning_rate": 9.366490460859825e-06, "loss": 1.0199, "step": 53390 }, { "epoch": 0.72, "learning_rate": 9.362384911040476e-06, "loss": 0.4944, "step": 53395 }, { "epoch": 0.72, "learning_rate": 9.358280053889234e-06, "loss": 0.4503, "step": 53400 }, { "epoch": 0.72, "learning_rate": 9.354175889587943e-06, "loss": 1.2132, "step": 53405 }, { "epoch": 0.72, "learning_rate": 9.350072418318387e-06, "loss": 1.1892, "step": 53410 }, { "epoch": 0.72, "learning_rate": 9.34596964026232e-06, "loss": 0.3607, "step": 53415 }, { "epoch": 0.72, "learning_rate": 9.341867555601488e-06, "loss": 1.0576, "step": 53420 }, { "epoch": 0.72, "learning_rate": 9.337766164517592e-06, "loss": 0.9069, "step": 53425 }, { "epoch": 0.72, "learning_rate": 9.33366546719229e-06, "loss": 0.8981, "step": 53430 }, { "epoch": 0.72, "learning_rate": 9.329565463807241e-06, "loss": 0.113, "step": 53435 }, { "epoch": 0.72, "learning_rate": 9.325466154544044e-06, "loss": 1.5595, "step": 53440 }, { "epoch": 0.72, "learning_rate": 9.321367539584277e-06, "loss": 0.5906, "step": 53445 }, { "epoch": 0.72, "learning_rate": 9.317269619109486e-06, "loss": 0.2815, "step": 53450 }, { "epoch": 0.72, "learning_rate": 9.313172393301198e-06, "loss": 1.0351, "step": 53455 }, { "epoch": 0.72, "learning_rate": 9.309075862340896e-06, "loss": 0.69, "step": 53460 }, { "epoch": 0.72, "learning_rate": 9.304980026410023e-06, "loss": 0.7566, "step": 53465 }, { "epoch": 0.72, "learning_rate": 9.300884885690037e-06, "loss": 0.0935, "step": 53470 }, { "epoch": 0.72, "learning_rate": 9.296790440362288e-06, "loss": 0.8431, "step": 53475 }, { "epoch": 0.72, "learning_rate": 9.292696690608174e-06, "loss": 0.3725, "step": 53480 }, { "epoch": 0.72, "learning_rate": 9.288603636609014e-06, "loss": 1.1029, "step": 53485 }, { "epoch": 0.72, "learning_rate": 9.284511278546101e-06, "loss": 0.6208, "step": 53490 }, { "epoch": 0.72, "learning_rate": 9.280419616600728e-06, "loss": 1.04, "step": 53495 }, { "epoch": 0.72, "learning_rate": 9.276328650954122e-06, "loss": 0.4622, "step": 53500 }, { "epoch": 0.72, "learning_rate": 9.272238381787485e-06, "loss": 0.756, "step": 53505 }, { "epoch": 0.72, "learning_rate": 9.268148809282012e-06, "loss": 1.4141, "step": 53510 }, { "epoch": 0.72, "learning_rate": 9.264059933618847e-06, "loss": 0.4818, "step": 53515 }, { "epoch": 0.72, "learning_rate": 9.259971754979097e-06, "loss": 1.1101, "step": 53520 }, { "epoch": 0.72, "learning_rate": 9.255884273543847e-06, "loss": 0.4867, "step": 53525 }, { "epoch": 0.72, "learning_rate": 9.251797489494169e-06, "loss": 0.9199, "step": 53530 }, { "epoch": 0.72, "learning_rate": 9.247711403011073e-06, "loss": 0.7202, "step": 53535 }, { "epoch": 0.72, "learning_rate": 9.243626014275548e-06, "loss": 1.2319, "step": 53540 }, { "epoch": 0.72, "learning_rate": 9.239541323468573e-06, "loss": 0.5439, "step": 53545 }, { "epoch": 0.72, "learning_rate": 9.23545733077107e-06, "loss": 1.3088, "step": 53550 }, { "epoch": 0.72, "learning_rate": 9.231374036363941e-06, "loss": 0.6498, "step": 53555 }, { "epoch": 0.72, "learning_rate": 9.227291440428043e-06, "loss": 1.1011, "step": 53560 }, { "epoch": 0.72, "learning_rate": 9.223209543144237e-06, "loss": 0.9403, "step": 53565 }, { "epoch": 0.72, "learning_rate": 9.219128344693317e-06, "loss": 0.6274, "step": 53570 }, { "epoch": 0.72, "learning_rate": 9.215047845256056e-06, "loss": 0.7653, "step": 53575 }, { "epoch": 0.72, "learning_rate": 9.210968045013221e-06, "loss": 0.5373, "step": 53580 }, { "epoch": 0.72, "learning_rate": 9.206888944145495e-06, "loss": 0.5604, "step": 53585 }, { "epoch": 0.72, "learning_rate": 9.202810542833587e-06, "loss": 0.6409, "step": 53590 }, { "epoch": 0.72, "learning_rate": 9.198732841258142e-06, "loss": 0.3277, "step": 53595 }, { "epoch": 0.72, "learning_rate": 9.194655839599773e-06, "loss": 0.4493, "step": 53600 }, { "epoch": 0.72, "learning_rate": 9.190579538039084e-06, "loss": 0.5344, "step": 53605 }, { "epoch": 0.72, "learning_rate": 9.186503936756632e-06, "loss": 0.6687, "step": 53610 }, { "epoch": 0.72, "learning_rate": 9.182429035932933e-06, "loss": 1.0469, "step": 53615 }, { "epoch": 0.72, "learning_rate": 9.178354835748504e-06, "loss": 0.9061, "step": 53620 }, { "epoch": 0.72, "learning_rate": 9.174281336383803e-06, "loss": 0.5515, "step": 53625 }, { "epoch": 0.72, "learning_rate": 9.170208538019264e-06, "loss": 0.699, "step": 53630 }, { "epoch": 0.72, "learning_rate": 9.166136440835287e-06, "loss": 0.4497, "step": 53635 }, { "epoch": 0.72, "learning_rate": 9.162065045012258e-06, "loss": 0.3427, "step": 53640 }, { "epoch": 0.72, "learning_rate": 9.157994350730514e-06, "loss": 0.6478, "step": 53645 }, { "epoch": 0.72, "learning_rate": 9.153924358170355e-06, "loss": 0.7611, "step": 53650 }, { "epoch": 0.72, "learning_rate": 9.14985506751208e-06, "loss": 0.9005, "step": 53655 }, { "epoch": 0.72, "learning_rate": 9.14578647893593e-06, "loss": 0.1981, "step": 53660 }, { "epoch": 0.72, "learning_rate": 9.141718592622123e-06, "loss": 0.6748, "step": 53665 }, { "epoch": 0.72, "learning_rate": 9.13765140875084e-06, "loss": 0.546, "step": 53670 }, { "epoch": 0.72, "learning_rate": 9.133584927502248e-06, "loss": 1.0352, "step": 53675 }, { "epoch": 0.72, "learning_rate": 9.129519149056467e-06, "loss": 1.3193, "step": 53680 }, { "epoch": 0.72, "learning_rate": 9.125454073593582e-06, "loss": 0.6861, "step": 53685 }, { "epoch": 0.72, "learning_rate": 9.121389701293682e-06, "loss": 0.2987, "step": 53690 }, { "epoch": 0.72, "learning_rate": 9.117326032336763e-06, "loss": 0.7916, "step": 53695 }, { "epoch": 0.72, "learning_rate": 9.113263066902847e-06, "loss": 0.2488, "step": 53700 }, { "epoch": 0.72, "learning_rate": 9.109200805171902e-06, "loss": 0.9154, "step": 53705 }, { "epoch": 0.72, "learning_rate": 9.105139247323851e-06, "loss": 0.9852, "step": 53710 }, { "epoch": 0.72, "learning_rate": 9.101078393538622e-06, "loss": 0.4949, "step": 53715 }, { "epoch": 0.72, "learning_rate": 9.09701824399608e-06, "loss": 0.1761, "step": 53720 }, { "epoch": 0.72, "learning_rate": 9.09295879887606e-06, "loss": 0.8357, "step": 53725 }, { "epoch": 0.72, "learning_rate": 9.088900058358397e-06, "loss": 1.1845, "step": 53730 }, { "epoch": 0.72, "learning_rate": 9.084842022622859e-06, "loss": 0.4705, "step": 53735 }, { "epoch": 0.72, "learning_rate": 9.080784691849197e-06, "loss": 1.0566, "step": 53740 }, { "epoch": 0.72, "learning_rate": 9.076728066217125e-06, "loss": 0.282, "step": 53745 }, { "epoch": 0.72, "learning_rate": 9.072672145906344e-06, "loss": 0.5711, "step": 53750 }, { "epoch": 0.72, "learning_rate": 9.068616931096507e-06, "loss": 0.62, "step": 53755 }, { "epoch": 0.72, "learning_rate": 9.064562421967229e-06, "loss": 0.6564, "step": 53760 }, { "epoch": 0.72, "learning_rate": 9.06050861869813e-06, "loss": 0.2392, "step": 53765 }, { "epoch": 0.72, "learning_rate": 9.05645552146874e-06, "loss": 0.3176, "step": 53770 }, { "epoch": 0.72, "learning_rate": 9.052403130458615e-06, "loss": 0.8188, "step": 53775 }, { "epoch": 0.72, "learning_rate": 9.048351445847243e-06, "loss": 1.2862, "step": 53780 }, { "epoch": 0.72, "learning_rate": 9.044300467814102e-06, "loss": 0.2718, "step": 53785 }, { "epoch": 0.72, "learning_rate": 9.040250196538627e-06, "loss": 0.5629, "step": 53790 }, { "epoch": 0.72, "learning_rate": 9.036200632200218e-06, "loss": 0.427, "step": 53795 }, { "epoch": 0.72, "learning_rate": 9.032151774978273e-06, "loss": 0.3687, "step": 53800 }, { "epoch": 0.72, "learning_rate": 9.028103625052101e-06, "loss": 1.6102, "step": 53805 }, { "epoch": 0.72, "learning_rate": 9.024056182601042e-06, "loss": 0.1645, "step": 53810 }, { "epoch": 0.72, "learning_rate": 9.020009447804372e-06, "loss": 0.3866, "step": 53815 }, { "epoch": 0.72, "learning_rate": 9.015963420841329e-06, "loss": 0.2379, "step": 53820 }, { "epoch": 0.72, "learning_rate": 9.011918101891149e-06, "loss": 0.9133, "step": 53825 }, { "epoch": 0.72, "learning_rate": 9.007873491133006e-06, "loss": 0.8718, "step": 53830 }, { "epoch": 0.72, "learning_rate": 9.00382958874606e-06, "loss": 0.3761, "step": 53835 }, { "epoch": 0.72, "learning_rate": 8.99978639490944e-06, "loss": 0.3934, "step": 53840 }, { "epoch": 0.72, "learning_rate": 8.99574390980224e-06, "loss": 0.3548, "step": 53845 }, { "epoch": 0.72, "learning_rate": 8.991702133603516e-06, "loss": 0.6728, "step": 53850 }, { "epoch": 0.72, "learning_rate": 8.987661066492292e-06, "loss": 0.6402, "step": 53855 }, { "epoch": 0.72, "learning_rate": 8.983620708647585e-06, "loss": 0.4791, "step": 53860 }, { "epoch": 0.72, "learning_rate": 8.979581060248355e-06, "loss": 0.5856, "step": 53865 }, { "epoch": 0.72, "learning_rate": 8.975542121473524e-06, "loss": 0.1325, "step": 53870 }, { "epoch": 0.72, "learning_rate": 8.971503892502029e-06, "loss": 1.172, "step": 53875 }, { "epoch": 0.72, "learning_rate": 8.967466373512706e-06, "loss": 1.2085, "step": 53880 }, { "epoch": 0.72, "learning_rate": 8.963429564684422e-06, "loss": 0.6751, "step": 53885 }, { "epoch": 0.72, "learning_rate": 8.95939346619597e-06, "loss": 1.1489, "step": 53890 }, { "epoch": 0.72, "learning_rate": 8.95535807822615e-06, "loss": 0.4707, "step": 53895 }, { "epoch": 0.72, "learning_rate": 8.951323400953698e-06, "loss": 0.5739, "step": 53900 }, { "epoch": 0.72, "learning_rate": 8.947289434557321e-06, "loss": 0.6262, "step": 53905 }, { "epoch": 0.72, "learning_rate": 8.943256179215732e-06, "loss": 0.8844, "step": 53910 }, { "epoch": 0.72, "learning_rate": 8.939223635107544e-06, "loss": 0.5099, "step": 53915 }, { "epoch": 0.72, "learning_rate": 8.935191802411401e-06, "loss": 0.9951, "step": 53920 }, { "epoch": 0.72, "learning_rate": 8.931160681305909e-06, "loss": 1.0325, "step": 53925 }, { "epoch": 0.72, "learning_rate": 8.92713027196959e-06, "loss": 0.5324, "step": 53930 }, { "epoch": 0.72, "learning_rate": 8.923100574581003e-06, "loss": 0.6852, "step": 53935 }, { "epoch": 0.72, "learning_rate": 8.919071589318626e-06, "loss": 0.6155, "step": 53940 }, { "epoch": 0.72, "learning_rate": 8.915043316360922e-06, "loss": 0.7878, "step": 53945 }, { "epoch": 0.72, "learning_rate": 8.911015755886335e-06, "loss": 0.6871, "step": 53950 }, { "epoch": 0.72, "learning_rate": 8.90698890807326e-06, "loss": 1.0338, "step": 53955 }, { "epoch": 0.72, "learning_rate": 8.902962773100065e-06, "loss": 1.1979, "step": 53960 }, { "epoch": 0.72, "learning_rate": 8.898937351145079e-06, "loss": 1.5717, "step": 53965 }, { "epoch": 0.72, "learning_rate": 8.894912642386627e-06, "loss": 0.7278, "step": 53970 }, { "epoch": 0.72, "learning_rate": 8.890888647002973e-06, "loss": 0.402, "step": 53975 }, { "epoch": 0.72, "learning_rate": 8.886865365172353e-06, "loss": 1.1594, "step": 53980 }, { "epoch": 0.72, "learning_rate": 8.882842797073002e-06, "loss": 1.2186, "step": 53985 }, { "epoch": 0.72, "learning_rate": 8.878820942883067e-06, "loss": 0.6784, "step": 53990 }, { "epoch": 0.72, "learning_rate": 8.87479980278072e-06, "loss": 0.8472, "step": 53995 }, { "epoch": 0.72, "learning_rate": 8.870779376944064e-06, "loss": 0.667, "step": 54000 }, { "epoch": 0.72, "learning_rate": 8.866759665551197e-06, "loss": 0.5851, "step": 54005 }, { "epoch": 0.72, "learning_rate": 8.862740668780161e-06, "loss": 0.981, "step": 54010 }, { "epoch": 0.72, "learning_rate": 8.858722386808978e-06, "loss": 0.3694, "step": 54015 }, { "epoch": 0.72, "learning_rate": 8.854704819815657e-06, "loss": 0.3074, "step": 54020 }, { "epoch": 0.72, "learning_rate": 8.850687967978121e-06, "loss": 0.6309, "step": 54025 }, { "epoch": 0.72, "learning_rate": 8.846671831474316e-06, "loss": 0.648, "step": 54030 }, { "epoch": 0.72, "learning_rate": 8.842656410482153e-06, "loss": 0.745, "step": 54035 }, { "epoch": 0.72, "learning_rate": 8.838641705179463e-06, "loss": 0.6802, "step": 54040 }, { "epoch": 0.72, "learning_rate": 8.834627715744101e-06, "loss": 0.4598, "step": 54045 }, { "epoch": 0.72, "learning_rate": 8.830614442353858e-06, "loss": 0.2362, "step": 54050 }, { "epoch": 0.72, "learning_rate": 8.826601885186495e-06, "loss": 0.9389, "step": 54055 }, { "epoch": 0.72, "learning_rate": 8.82259004441976e-06, "loss": 0.4868, "step": 54060 }, { "epoch": 0.72, "learning_rate": 8.818578920231358e-06, "loss": 1.6567, "step": 54065 }, { "epoch": 0.72, "learning_rate": 8.814568512798955e-06, "loss": 0.7774, "step": 54070 }, { "epoch": 0.72, "learning_rate": 8.810558822300183e-06, "loss": 0.6523, "step": 54075 }, { "epoch": 0.72, "learning_rate": 8.806549848912671e-06, "loss": 0.7826, "step": 54080 }, { "epoch": 0.72, "learning_rate": 8.80254159281399e-06, "loss": 0.8815, "step": 54085 }, { "epoch": 0.72, "learning_rate": 8.798534054181672e-06, "loss": 0.2935, "step": 54090 }, { "epoch": 0.72, "learning_rate": 8.794527233193262e-06, "loss": 0.951, "step": 54095 }, { "epoch": 0.72, "learning_rate": 8.790521130026202e-06, "loss": 0.927, "step": 54100 }, { "epoch": 0.72, "learning_rate": 8.78651574485797e-06, "loss": 1.214, "step": 54105 }, { "epoch": 0.72, "learning_rate": 8.782511077865973e-06, "loss": 1.1174, "step": 54110 }, { "epoch": 0.73, "learning_rate": 8.778507129227607e-06, "loss": 0.8082, "step": 54115 }, { "epoch": 0.73, "learning_rate": 8.774503899120224e-06, "loss": 0.9065, "step": 54120 }, { "epoch": 0.73, "learning_rate": 8.770501387721134e-06, "loss": 0.4543, "step": 54125 }, { "epoch": 0.73, "learning_rate": 8.766499595207655e-06, "loss": 0.9988, "step": 54130 }, { "epoch": 0.73, "learning_rate": 8.762498521757014e-06, "loss": 0.6266, "step": 54135 }, { "epoch": 0.73, "learning_rate": 8.758498167546458e-06, "loss": 0.5193, "step": 54140 }, { "epoch": 0.73, "learning_rate": 8.754498532753194e-06, "loss": 1.3661, "step": 54145 }, { "epoch": 0.73, "learning_rate": 8.750499617554354e-06, "loss": 0.8838, "step": 54150 }, { "epoch": 0.73, "learning_rate": 8.746501422127095e-06, "loss": 0.5823, "step": 54155 }, { "epoch": 0.73, "learning_rate": 8.74250394664851e-06, "loss": 0.5522, "step": 54160 }, { "epoch": 0.73, "learning_rate": 8.73850719129566e-06, "loss": 0.7591, "step": 54165 }, { "epoch": 0.73, "learning_rate": 8.734511156245596e-06, "loss": 0.5124, "step": 54170 }, { "epoch": 0.73, "learning_rate": 8.73051584167531e-06, "loss": 1.0375, "step": 54175 }, { "epoch": 0.73, "learning_rate": 8.726521247761782e-06, "loss": 0.3357, "step": 54180 }, { "epoch": 0.73, "learning_rate": 8.722527374681941e-06, "loss": 1.2771, "step": 54185 }, { "epoch": 0.73, "learning_rate": 8.71853422261271e-06, "loss": 0.7869, "step": 54190 }, { "epoch": 0.73, "learning_rate": 8.71454179173096e-06, "loss": 1.2381, "step": 54195 }, { "epoch": 0.73, "learning_rate": 8.710550082213529e-06, "loss": 0.8344, "step": 54200 }, { "epoch": 0.73, "learning_rate": 8.706559094237249e-06, "loss": 1.1068, "step": 54205 }, { "epoch": 0.73, "learning_rate": 8.702568827978874e-06, "loss": 0.9696, "step": 54210 }, { "epoch": 0.73, "learning_rate": 8.698579283615172e-06, "loss": 0.5833, "step": 54215 }, { "epoch": 0.73, "learning_rate": 8.694590461322846e-06, "loss": 2.2805, "step": 54220 }, { "epoch": 0.73, "learning_rate": 8.6906023612786e-06, "loss": 0.899, "step": 54225 }, { "epoch": 0.73, "learning_rate": 8.686614983659074e-06, "loss": 0.8607, "step": 54230 }, { "epoch": 0.73, "learning_rate": 8.682628328640885e-06, "loss": 0.1534, "step": 54235 }, { "epoch": 0.73, "learning_rate": 8.67864239640064e-06, "loss": 0.5686, "step": 54240 }, { "epoch": 0.73, "learning_rate": 8.674657187114871e-06, "loss": 0.8188, "step": 54245 }, { "epoch": 0.73, "learning_rate": 8.670672700960115e-06, "loss": 0.147, "step": 54250 }, { "epoch": 0.73, "learning_rate": 8.666688938112882e-06, "loss": 0.608, "step": 54255 }, { "epoch": 0.73, "learning_rate": 8.662705898749599e-06, "loss": 0.4702, "step": 54260 }, { "epoch": 0.73, "learning_rate": 8.658723583046718e-06, "loss": 0.8074, "step": 54265 }, { "epoch": 0.73, "learning_rate": 8.654741991180632e-06, "loss": 0.6581, "step": 54270 }, { "epoch": 0.73, "learning_rate": 8.650761123327694e-06, "loss": 0.5646, "step": 54275 }, { "epoch": 0.73, "learning_rate": 8.646780979664255e-06, "loss": 0.163, "step": 54280 }, { "epoch": 0.73, "learning_rate": 8.642801560366604e-06, "loss": 0.6296, "step": 54285 }, { "epoch": 0.73, "learning_rate": 8.63882286561101e-06, "loss": 0.3875, "step": 54290 }, { "epoch": 0.73, "learning_rate": 8.634844895573705e-06, "loss": 0.5092, "step": 54295 }, { "epoch": 0.73, "learning_rate": 8.630867650430907e-06, "loss": 0.5802, "step": 54300 }, { "epoch": 0.73, "learning_rate": 8.62689113035878e-06, "loss": 0.5238, "step": 54305 }, { "epoch": 0.73, "learning_rate": 8.622915335533455e-06, "loss": 1.0073, "step": 54310 }, { "epoch": 0.73, "learning_rate": 8.618940266131065e-06, "loss": 1.213, "step": 54315 }, { "epoch": 0.73, "learning_rate": 8.614965922327653e-06, "loss": 0.5441, "step": 54320 }, { "epoch": 0.73, "learning_rate": 8.610992304299287e-06, "loss": 0.5013, "step": 54325 }, { "epoch": 0.73, "learning_rate": 8.60701941222197e-06, "loss": 0.6885, "step": 54330 }, { "epoch": 0.73, "learning_rate": 8.603047246271676e-06, "loss": 0.3266, "step": 54335 }, { "epoch": 0.73, "learning_rate": 8.599075806624363e-06, "loss": 0.5531, "step": 54340 }, { "epoch": 0.73, "learning_rate": 8.595105093455932e-06, "loss": 0.6352, "step": 54345 }, { "epoch": 0.73, "learning_rate": 8.591135106942291e-06, "loss": 0.6814, "step": 54350 }, { "epoch": 0.73, "learning_rate": 8.58716584725926e-06, "loss": 1.1841, "step": 54355 }, { "epoch": 0.73, "learning_rate": 8.58319731458267e-06, "loss": 1.01, "step": 54360 }, { "epoch": 0.73, "learning_rate": 8.579229509088321e-06, "loss": 0.8044, "step": 54365 }, { "epoch": 0.73, "learning_rate": 8.57526243095194e-06, "loss": 0.2275, "step": 54370 }, { "epoch": 0.73, "learning_rate": 8.571296080349272e-06, "loss": 1.3316, "step": 54375 }, { "epoch": 0.73, "learning_rate": 8.567330457455998e-06, "loss": 0.9058, "step": 54380 }, { "epoch": 0.73, "learning_rate": 8.563365562447767e-06, "loss": 0.5842, "step": 54385 }, { "epoch": 0.73, "learning_rate": 8.55940139550022e-06, "loss": 0.4286, "step": 54390 }, { "epoch": 0.73, "learning_rate": 8.55543795678894e-06, "loss": 1.1725, "step": 54395 }, { "epoch": 0.73, "learning_rate": 8.551475246489487e-06, "loss": 0.6147, "step": 54400 }, { "epoch": 0.73, "learning_rate": 8.547513264777385e-06, "loss": 1.0198, "step": 54405 }, { "epoch": 0.73, "learning_rate": 8.543552011828144e-06, "loss": 0.8146, "step": 54410 }, { "epoch": 0.73, "learning_rate": 8.539591487817219e-06, "loss": 0.3071, "step": 54415 }, { "epoch": 0.73, "learning_rate": 8.535631692920037e-06, "loss": 0.5957, "step": 54420 }, { "epoch": 0.73, "learning_rate": 8.531672627312018e-06, "loss": 1.0736, "step": 54425 }, { "epoch": 0.73, "learning_rate": 8.527714291168495e-06, "loss": 0.7366, "step": 54430 }, { "epoch": 0.73, "learning_rate": 8.52375668466483e-06, "loss": 0.3421, "step": 54435 }, { "epoch": 0.73, "learning_rate": 8.519799807976314e-06, "loss": 0.7697, "step": 54440 }, { "epoch": 0.73, "learning_rate": 8.515843661278214e-06, "loss": 0.9248, "step": 54445 }, { "epoch": 0.73, "learning_rate": 8.511888244745777e-06, "loss": 0.931, "step": 54450 }, { "epoch": 0.73, "learning_rate": 8.507933558554195e-06, "loss": 0.4567, "step": 54455 }, { "epoch": 0.73, "learning_rate": 8.50397960287866e-06, "loss": 0.6078, "step": 54460 }, { "epoch": 0.73, "learning_rate": 8.5000263778943e-06, "loss": 0.8468, "step": 54465 }, { "epoch": 0.73, "learning_rate": 8.496073883776218e-06, "loss": 0.3712, "step": 54470 }, { "epoch": 0.73, "learning_rate": 8.492122120699511e-06, "loss": 0.2879, "step": 54475 }, { "epoch": 0.73, "learning_rate": 8.488171088839192e-06, "loss": 1.192, "step": 54480 }, { "epoch": 0.73, "learning_rate": 8.484220788370295e-06, "loss": 0.4944, "step": 54485 }, { "epoch": 0.73, "learning_rate": 8.480271219467792e-06, "loss": 1.0935, "step": 54490 }, { "epoch": 0.73, "learning_rate": 8.47632238230662e-06, "loss": 0.8824, "step": 54495 }, { "epoch": 0.73, "learning_rate": 8.47237427706171e-06, "loss": 0.4494, "step": 54500 }, { "epoch": 0.73, "learning_rate": 8.468426903907933e-06, "loss": 1.3857, "step": 54505 }, { "epoch": 0.73, "learning_rate": 8.464480263020141e-06, "loss": 0.8496, "step": 54510 }, { "epoch": 0.73, "learning_rate": 8.460534354573141e-06, "loss": 0.8617, "step": 54515 }, { "epoch": 0.73, "learning_rate": 8.45658917874173e-06, "loss": 0.722, "step": 54520 }, { "epoch": 0.73, "learning_rate": 8.452644735700658e-06, "loss": 0.3939, "step": 54525 }, { "epoch": 0.73, "learning_rate": 8.44870102562463e-06, "loss": 0.7238, "step": 54530 }, { "epoch": 0.73, "learning_rate": 8.44475804868836e-06, "loss": 0.8459, "step": 54535 }, { "epoch": 0.73, "learning_rate": 8.440815805066468e-06, "loss": 0.7093, "step": 54540 }, { "epoch": 0.73, "learning_rate": 8.436874294933602e-06, "loss": 0.4862, "step": 54545 }, { "epoch": 0.73, "learning_rate": 8.432933518464343e-06, "loss": 0.5424, "step": 54550 }, { "epoch": 0.73, "learning_rate": 8.428993475833236e-06, "loss": 1.0985, "step": 54555 }, { "epoch": 0.73, "learning_rate": 8.425054167214825e-06, "loss": 0.9779, "step": 54560 }, { "epoch": 0.73, "learning_rate": 8.421115592783583e-06, "loss": 0.6618, "step": 54565 }, { "epoch": 0.73, "learning_rate": 8.417177752713989e-06, "loss": 0.9297, "step": 54570 }, { "epoch": 0.73, "learning_rate": 8.413240647180459e-06, "loss": 0.4387, "step": 54575 }, { "epoch": 0.73, "learning_rate": 8.409304276357378e-06, "loss": 0.5065, "step": 54580 }, { "epoch": 0.73, "learning_rate": 8.405368640419135e-06, "loss": 0.7327, "step": 54585 }, { "epoch": 0.73, "learning_rate": 8.401433739540024e-06, "loss": 0.6261, "step": 54590 }, { "epoch": 0.73, "learning_rate": 8.397499573894366e-06, "loss": 0.7959, "step": 54595 }, { "epoch": 0.73, "learning_rate": 8.393566143656418e-06, "loss": 0.4822, "step": 54600 }, { "epoch": 0.73, "learning_rate": 8.3896334490004e-06, "loss": 1.0455, "step": 54605 }, { "epoch": 0.73, "learning_rate": 8.38570149010053e-06, "loss": 0.6135, "step": 54610 }, { "epoch": 0.73, "learning_rate": 8.381770267130967e-06, "loss": 0.9595, "step": 54615 }, { "epoch": 0.73, "learning_rate": 8.377839780265843e-06, "loss": 0.2373, "step": 54620 }, { "epoch": 0.73, "learning_rate": 8.373910029679249e-06, "loss": 0.3478, "step": 54625 }, { "epoch": 0.73, "learning_rate": 8.36998101554527e-06, "loss": 0.9161, "step": 54630 }, { "epoch": 0.73, "learning_rate": 8.366052738037938e-06, "loss": 0.3961, "step": 54635 }, { "epoch": 0.73, "learning_rate": 8.362125197331242e-06, "loss": 0.6957, "step": 54640 }, { "epoch": 0.73, "learning_rate": 8.358198393599182e-06, "loss": 0.3803, "step": 54645 }, { "epoch": 0.73, "learning_rate": 8.354272327015657e-06, "loss": 0.576, "step": 54650 }, { "epoch": 0.73, "learning_rate": 8.350346997754601e-06, "loss": 0.4193, "step": 54655 }, { "epoch": 0.73, "learning_rate": 8.346422405989878e-06, "loss": 0.3862, "step": 54660 }, { "epoch": 0.73, "learning_rate": 8.34249855189532e-06, "loss": 0.894, "step": 54665 }, { "epoch": 0.73, "learning_rate": 8.338575435644749e-06, "loss": 0.8227, "step": 54670 }, { "epoch": 0.73, "learning_rate": 8.334653057411923e-06, "loss": 0.1759, "step": 54675 }, { "epoch": 0.73, "learning_rate": 8.330731417370602e-06, "loss": 0.4736, "step": 54680 }, { "epoch": 0.73, "learning_rate": 8.326810515694484e-06, "loss": 0.6905, "step": 54685 }, { "epoch": 0.73, "learning_rate": 8.32289035255724e-06, "loss": 0.7262, "step": 54690 }, { "epoch": 0.73, "learning_rate": 8.318970928132536e-06, "loss": 0.8154, "step": 54695 }, { "epoch": 0.73, "learning_rate": 8.31505224259395e-06, "loss": 0.3513, "step": 54700 }, { "epoch": 0.73, "learning_rate": 8.311134296115087e-06, "loss": 0.8108, "step": 54705 }, { "epoch": 0.73, "learning_rate": 8.307217088869481e-06, "loss": 1.1044, "step": 54710 }, { "epoch": 0.73, "learning_rate": 8.30330062103064e-06, "loss": 0.6419, "step": 54715 }, { "epoch": 0.73, "learning_rate": 8.299384892772057e-06, "loss": 0.8654, "step": 54720 }, { "epoch": 0.73, "learning_rate": 8.295469904267176e-06, "loss": 0.5764, "step": 54725 }, { "epoch": 0.73, "learning_rate": 8.291555655689406e-06, "loss": 0.67, "step": 54730 }, { "epoch": 0.73, "learning_rate": 8.28764214721212e-06, "loss": 0.808, "step": 54735 }, { "epoch": 0.73, "learning_rate": 8.283729379008693e-06, "loss": 0.2526, "step": 54740 }, { "epoch": 0.73, "learning_rate": 8.27981735125242e-06, "loss": 0.5521, "step": 54745 }, { "epoch": 0.73, "learning_rate": 8.275906064116582e-06, "loss": 0.3352, "step": 54750 }, { "epoch": 0.73, "learning_rate": 8.271995517774455e-06, "loss": 0.3349, "step": 54755 }, { "epoch": 0.73, "learning_rate": 8.268085712399224e-06, "loss": 0.5082, "step": 54760 }, { "epoch": 0.73, "learning_rate": 8.264176648164093e-06, "loss": 1.2406, "step": 54765 }, { "epoch": 0.73, "learning_rate": 8.260268325242212e-06, "loss": 0.4351, "step": 54770 }, { "epoch": 0.73, "learning_rate": 8.25636074380669e-06, "loss": 0.3598, "step": 54775 }, { "epoch": 0.73, "learning_rate": 8.25245390403063e-06, "loss": 1.0025, "step": 54780 }, { "epoch": 0.73, "learning_rate": 8.248547806087067e-06, "loss": 0.5099, "step": 54785 }, { "epoch": 0.73, "learning_rate": 8.24464245014904e-06, "loss": 0.3333, "step": 54790 }, { "epoch": 0.73, "learning_rate": 8.240737836389528e-06, "loss": 0.5321, "step": 54795 }, { "epoch": 0.73, "learning_rate": 8.236833964981478e-06, "loss": 1.7393, "step": 54800 }, { "epoch": 0.73, "learning_rate": 8.232930836097837e-06, "loss": 0.644, "step": 54805 }, { "epoch": 0.73, "learning_rate": 8.22902844991146e-06, "loss": 1.337, "step": 54810 }, { "epoch": 0.73, "learning_rate": 8.22512680659523e-06, "loss": 0.634, "step": 54815 }, { "epoch": 0.73, "learning_rate": 8.221225906321955e-06, "loss": 0.851, "step": 54820 }, { "epoch": 0.73, "learning_rate": 8.217325749264429e-06, "loss": 0.6687, "step": 54825 }, { "epoch": 0.73, "learning_rate": 8.213426335595414e-06, "loss": 0.5761, "step": 54830 }, { "epoch": 0.73, "learning_rate": 8.209527665487638e-06, "loss": 0.7449, "step": 54835 }, { "epoch": 0.73, "learning_rate": 8.20562973911378e-06, "loss": 0.461, "step": 54840 }, { "epoch": 0.73, "learning_rate": 8.2017325566465e-06, "loss": 0.6963, "step": 54845 }, { "epoch": 0.73, "learning_rate": 8.197836118258437e-06, "loss": 0.7659, "step": 54850 }, { "epoch": 0.73, "learning_rate": 8.193940424122174e-06, "loss": 1.1922, "step": 54855 }, { "epoch": 0.74, "learning_rate": 8.190045474410263e-06, "loss": 0.9476, "step": 54860 }, { "epoch": 0.74, "learning_rate": 8.18615126929526e-06, "loss": 0.4923, "step": 54865 }, { "epoch": 0.74, "learning_rate": 8.18225780894962e-06, "loss": 1.0204, "step": 54870 }, { "epoch": 0.74, "learning_rate": 8.178365093545823e-06, "loss": 0.5627, "step": 54875 }, { "epoch": 0.74, "learning_rate": 8.174473123256313e-06, "loss": 0.229, "step": 54880 }, { "epoch": 0.74, "learning_rate": 8.170581898253449e-06, "loss": 0.8508, "step": 54885 }, { "epoch": 0.74, "learning_rate": 8.166691418709624e-06, "loss": 0.3411, "step": 54890 }, { "epoch": 0.74, "learning_rate": 8.162801684797144e-06, "loss": 1.2075, "step": 54895 }, { "epoch": 0.74, "learning_rate": 8.158912696688326e-06, "loss": 0.7473, "step": 54900 }, { "epoch": 0.74, "learning_rate": 8.155024454555421e-06, "loss": 0.5403, "step": 54905 }, { "epoch": 0.74, "learning_rate": 8.151136958570651e-06, "loss": 0.5863, "step": 54910 }, { "epoch": 0.74, "learning_rate": 8.147250208906237e-06, "loss": 0.7347, "step": 54915 }, { "epoch": 0.74, "learning_rate": 8.143364205734314e-06, "loss": 1.0777, "step": 54920 }, { "epoch": 0.74, "learning_rate": 8.139478949227034e-06, "loss": 0.4993, "step": 54925 }, { "epoch": 0.74, "learning_rate": 8.135594439556482e-06, "loss": 0.6106, "step": 54930 }, { "epoch": 0.74, "learning_rate": 8.131710676894722e-06, "loss": 0.8138, "step": 54935 }, { "epoch": 0.74, "learning_rate": 8.127827661413796e-06, "loss": 0.4268, "step": 54940 }, { "epoch": 0.74, "learning_rate": 8.123945393285695e-06, "loss": 0.2485, "step": 54945 }, { "epoch": 0.74, "learning_rate": 8.120063872682385e-06, "loss": 0.6687, "step": 54950 }, { "epoch": 0.74, "learning_rate": 8.116183099775789e-06, "loss": 0.9117, "step": 54955 }, { "epoch": 0.74, "learning_rate": 8.112303074737825e-06, "loss": 0.7766, "step": 54960 }, { "epoch": 0.74, "learning_rate": 8.108423797740349e-06, "loss": 1.3518, "step": 54965 }, { "epoch": 0.74, "learning_rate": 8.104545268955183e-06, "loss": 0.7876, "step": 54970 }, { "epoch": 0.74, "learning_rate": 8.100667488554154e-06, "loss": 0.2983, "step": 54975 }, { "epoch": 0.74, "learning_rate": 8.096790456708992e-06, "loss": 0.4611, "step": 54980 }, { "epoch": 0.74, "learning_rate": 8.092914173591449e-06, "loss": 0.7658, "step": 54985 }, { "epoch": 0.74, "learning_rate": 8.089038639373243e-06, "loss": 0.7209, "step": 54990 }, { "epoch": 0.74, "learning_rate": 8.085163854226002e-06, "loss": 0.7428, "step": 54995 }, { "epoch": 0.74, "learning_rate": 8.081289818321392e-06, "loss": 0.4465, "step": 55000 }, { "epoch": 0.74, "learning_rate": 8.077416531831e-06, "loss": 0.2765, "step": 55005 }, { "epoch": 0.74, "learning_rate": 8.073543994926386e-06, "loss": 0.7309, "step": 55010 }, { "epoch": 0.74, "learning_rate": 8.0696722077791e-06, "loss": 1.0742, "step": 55015 }, { "epoch": 0.74, "learning_rate": 8.06580117056063e-06, "loss": 0.8634, "step": 55020 }, { "epoch": 0.74, "learning_rate": 8.061930883442464e-06, "loss": 1.0474, "step": 55025 }, { "epoch": 0.74, "learning_rate": 8.058061346596006e-06, "loss": 0.7972, "step": 55030 }, { "epoch": 0.74, "learning_rate": 8.05419256019268e-06, "loss": 1.1837, "step": 55035 }, { "epoch": 0.74, "learning_rate": 8.050324524403846e-06, "loss": 0.5933, "step": 55040 }, { "epoch": 0.74, "learning_rate": 8.046457239400829e-06, "loss": 0.6425, "step": 55045 }, { "epoch": 0.74, "learning_rate": 8.042590705354953e-06, "loss": 1.0328, "step": 55050 }, { "epoch": 0.74, "learning_rate": 8.038724922437469e-06, "loss": 0.8631, "step": 55055 }, { "epoch": 0.74, "learning_rate": 8.034859890819619e-06, "loss": 1.0449, "step": 55060 }, { "epoch": 0.74, "learning_rate": 8.030995610672592e-06, "loss": 1.2589, "step": 55065 }, { "epoch": 0.74, "learning_rate": 8.027132082167577e-06, "loss": 0.3618, "step": 55070 }, { "epoch": 0.74, "learning_rate": 8.023269305475695e-06, "loss": 1.0279, "step": 55075 }, { "epoch": 0.74, "learning_rate": 8.019407280768046e-06, "loss": 0.8512, "step": 55080 }, { "epoch": 0.74, "learning_rate": 8.015546008215715e-06, "loss": 0.4611, "step": 55085 }, { "epoch": 0.74, "learning_rate": 8.011685487989712e-06, "loss": 0.5754, "step": 55090 }, { "epoch": 0.74, "learning_rate": 8.007825720261053e-06, "loss": 0.9357, "step": 55095 }, { "epoch": 0.74, "learning_rate": 8.003966705200721e-06, "loss": 1.1995, "step": 55100 }, { "epoch": 0.74, "learning_rate": 8.000108442979617e-06, "loss": 0.9855, "step": 55105 }, { "epoch": 0.74, "learning_rate": 7.996250933768674e-06, "loss": 0.422, "step": 55110 }, { "epoch": 0.74, "learning_rate": 7.992394177738743e-06, "loss": 0.7267, "step": 55115 }, { "epoch": 0.74, "learning_rate": 7.988538175060655e-06, "loss": 0.4541, "step": 55120 }, { "epoch": 0.74, "learning_rate": 7.984682925905232e-06, "loss": 0.4149, "step": 55125 }, { "epoch": 0.74, "learning_rate": 7.980828430443221e-06, "loss": 0.1524, "step": 55130 }, { "epoch": 0.74, "learning_rate": 7.976974688845381e-06, "loss": 0.7124, "step": 55135 }, { "epoch": 0.74, "learning_rate": 7.973121701282384e-06, "loss": 0.4305, "step": 55140 }, { "epoch": 0.74, "learning_rate": 7.969269467924922e-06, "loss": 0.501, "step": 55145 }, { "epoch": 0.74, "learning_rate": 7.965417988943619e-06, "loss": 0.8553, "step": 55150 }, { "epoch": 0.74, "learning_rate": 7.96156726450907e-06, "loss": 0.7373, "step": 55155 }, { "epoch": 0.74, "learning_rate": 7.957717294791858e-06, "loss": 0.4467, "step": 55160 }, { "epoch": 0.74, "learning_rate": 7.95386807996251e-06, "loss": 0.6095, "step": 55165 }, { "epoch": 0.74, "learning_rate": 7.950019620191529e-06, "loss": 0.4424, "step": 55170 }, { "epoch": 0.74, "learning_rate": 7.94617191564937e-06, "loss": 0.4645, "step": 55175 }, { "epoch": 0.74, "learning_rate": 7.942324966506486e-06, "loss": 1.5085, "step": 55180 }, { "epoch": 0.74, "learning_rate": 7.93847877293327e-06, "loss": 0.8795, "step": 55185 }, { "epoch": 0.74, "learning_rate": 7.934633335100078e-06, "loss": 0.59, "step": 55190 }, { "epoch": 0.74, "learning_rate": 7.930788653177273e-06, "loss": 0.6026, "step": 55195 }, { "epoch": 0.74, "learning_rate": 7.926944727335117e-06, "loss": 0.6346, "step": 55200 }, { "epoch": 0.74, "learning_rate": 7.923101557743897e-06, "loss": 1.447, "step": 55205 }, { "epoch": 0.74, "learning_rate": 7.919259144573862e-06, "loss": 0.2661, "step": 55210 }, { "epoch": 0.74, "learning_rate": 7.91541748799518e-06, "loss": 0.9068, "step": 55215 }, { "epoch": 0.74, "learning_rate": 7.911576588178039e-06, "loss": 0.5474, "step": 55220 }, { "epoch": 0.74, "learning_rate": 7.907736445292563e-06, "loss": 1.2154, "step": 55225 }, { "epoch": 0.74, "learning_rate": 7.903897059508844e-06, "loss": 0.548, "step": 55230 }, { "epoch": 0.74, "learning_rate": 7.900058430996965e-06, "loss": 0.5783, "step": 55235 }, { "epoch": 0.74, "learning_rate": 7.896220559926939e-06, "loss": 0.4909, "step": 55240 }, { "epoch": 0.74, "learning_rate": 7.892383446468796e-06, "loss": 0.218, "step": 55245 }, { "epoch": 0.74, "learning_rate": 7.888547090792458e-06, "loss": 0.6541, "step": 55250 }, { "epoch": 0.74, "learning_rate": 7.88471149306789e-06, "loss": 0.0758, "step": 55255 }, { "epoch": 0.74, "learning_rate": 7.880876653464975e-06, "loss": 0.363, "step": 55260 }, { "epoch": 0.74, "learning_rate": 7.877042572153572e-06, "loss": 0.8558, "step": 55265 }, { "epoch": 0.74, "learning_rate": 7.873209249303532e-06, "loss": 0.3535, "step": 55270 }, { "epoch": 0.74, "learning_rate": 7.869376685084634e-06, "loss": 0.9786, "step": 55275 }, { "epoch": 0.74, "learning_rate": 7.86554487966665e-06, "loss": 0.7644, "step": 55280 }, { "epoch": 0.74, "learning_rate": 7.8617138332193e-06, "loss": 0.6955, "step": 55285 }, { "epoch": 0.74, "learning_rate": 7.857883545912292e-06, "loss": 0.8454, "step": 55290 }, { "epoch": 0.74, "learning_rate": 7.854054017915286e-06, "loss": 0.8654, "step": 55295 }, { "epoch": 0.74, "learning_rate": 7.850225249397899e-06, "loss": 0.5404, "step": 55300 }, { "epoch": 0.74, "learning_rate": 7.846397240529744e-06, "loss": 0.7455, "step": 55305 }, { "epoch": 0.74, "learning_rate": 7.842569991480375e-06, "loss": 0.4231, "step": 55310 }, { "epoch": 0.74, "learning_rate": 7.83874350241931e-06, "loss": 0.6928, "step": 55315 }, { "epoch": 0.74, "learning_rate": 7.834917773516071e-06, "loss": 1.0014, "step": 55320 }, { "epoch": 0.74, "learning_rate": 7.831092804940082e-06, "loss": 0.3817, "step": 55325 }, { "epoch": 0.74, "learning_rate": 7.827268596860799e-06, "loss": 0.7385, "step": 55330 }, { "epoch": 0.74, "learning_rate": 7.823445149447603e-06, "loss": 0.8444, "step": 55335 }, { "epoch": 0.74, "learning_rate": 7.819622462869849e-06, "loss": 1.3074, "step": 55340 }, { "epoch": 0.74, "learning_rate": 7.815800537296875e-06, "loss": 0.2963, "step": 55345 }, { "epoch": 0.74, "learning_rate": 7.81197937289796e-06, "loss": 0.6291, "step": 55350 }, { "epoch": 0.74, "learning_rate": 7.808158969842388e-06, "loss": 0.468, "step": 55355 }, { "epoch": 0.74, "learning_rate": 7.804339328299346e-06, "loss": 1.4909, "step": 55360 }, { "epoch": 0.74, "learning_rate": 7.800520448438054e-06, "loss": 0.9205, "step": 55365 }, { "epoch": 0.74, "learning_rate": 7.796702330427661e-06, "loss": 0.9896, "step": 55370 }, { "epoch": 0.74, "learning_rate": 7.792884974437281e-06, "loss": 0.1665, "step": 55375 }, { "epoch": 0.74, "learning_rate": 7.789068380636019e-06, "loss": 0.7019, "step": 55380 }, { "epoch": 0.74, "learning_rate": 7.785252549192926e-06, "loss": 1.1796, "step": 55385 }, { "epoch": 0.74, "learning_rate": 7.781437480277021e-06, "loss": 0.9754, "step": 55390 }, { "epoch": 0.74, "learning_rate": 7.777623174057286e-06, "loss": 0.798, "step": 55395 }, { "epoch": 0.74, "learning_rate": 7.773809630702692e-06, "loss": 0.3071, "step": 55400 }, { "epoch": 0.74, "learning_rate": 7.76999685038215e-06, "loss": 0.4405, "step": 55405 }, { "epoch": 0.74, "learning_rate": 7.766184833264542e-06, "loss": 0.2377, "step": 55410 }, { "epoch": 0.74, "learning_rate": 7.762373579518734e-06, "loss": 0.9027, "step": 55415 }, { "epoch": 0.74, "learning_rate": 7.758563089313542e-06, "loss": 0.7772, "step": 55420 }, { "epoch": 0.74, "learning_rate": 7.75475336281774e-06, "loss": 0.6941, "step": 55425 }, { "epoch": 0.74, "learning_rate": 7.750944400200102e-06, "loss": 0.3477, "step": 55430 }, { "epoch": 0.74, "learning_rate": 7.747136201629321e-06, "loss": 0.2188, "step": 55435 }, { "epoch": 0.74, "learning_rate": 7.7433287672741e-06, "loss": 0.9914, "step": 55440 }, { "epoch": 0.74, "learning_rate": 7.739522097303082e-06, "loss": 1.0153, "step": 55445 }, { "epoch": 0.74, "learning_rate": 7.735716191884874e-06, "loss": 0.377, "step": 55450 }, { "epoch": 0.74, "learning_rate": 7.731911051188076e-06, "loss": 0.6346, "step": 55455 }, { "epoch": 0.74, "learning_rate": 7.728106675381222e-06, "loss": 1.2805, "step": 55460 }, { "epoch": 0.74, "learning_rate": 7.724303064632849e-06, "loss": 1.4514, "step": 55465 }, { "epoch": 0.74, "learning_rate": 7.720500219111406e-06, "loss": 1.017, "step": 55470 }, { "epoch": 0.74, "learning_rate": 7.716698138985367e-06, "loss": 1.1729, "step": 55475 }, { "epoch": 0.74, "learning_rate": 7.712896824423135e-06, "loss": 0.5221, "step": 55480 }, { "epoch": 0.74, "learning_rate": 7.70909627559308e-06, "loss": 0.3127, "step": 55485 }, { "epoch": 0.74, "learning_rate": 7.705296492663564e-06, "loss": 0.4969, "step": 55490 }, { "epoch": 0.74, "learning_rate": 7.70149747580289e-06, "loss": 0.1694, "step": 55495 }, { "epoch": 0.74, "learning_rate": 7.697699225179338e-06, "loss": 0.2386, "step": 55500 }, { "epoch": 0.74, "learning_rate": 7.69390174096114e-06, "loss": 1.5387, "step": 55505 }, { "epoch": 0.74, "learning_rate": 7.690105023316525e-06, "loss": 0.1151, "step": 55510 }, { "epoch": 0.74, "learning_rate": 7.686309072413656e-06, "loss": 0.487, "step": 55515 }, { "epoch": 0.74, "learning_rate": 7.682513888420673e-06, "loss": 0.6755, "step": 55520 }, { "epoch": 0.74, "learning_rate": 7.678719471505693e-06, "loss": 1.0329, "step": 55525 }, { "epoch": 0.74, "learning_rate": 7.674925821836787e-06, "loss": 0.7829, "step": 55530 }, { "epoch": 0.74, "learning_rate": 7.671132939581982e-06, "loss": 0.3686, "step": 55535 }, { "epoch": 0.74, "learning_rate": 7.66734082490931e-06, "loss": 0.9657, "step": 55540 }, { "epoch": 0.74, "learning_rate": 7.663549477986714e-06, "loss": 0.7922, "step": 55545 }, { "epoch": 0.74, "learning_rate": 7.65975889898215e-06, "loss": 1.0595, "step": 55550 }, { "epoch": 0.74, "learning_rate": 7.65596908806352e-06, "loss": 0.8782, "step": 55555 }, { "epoch": 0.74, "learning_rate": 7.652180045398677e-06, "loss": 0.6037, "step": 55560 }, { "epoch": 0.74, "learning_rate": 7.64839177115548e-06, "loss": 0.7571, "step": 55565 }, { "epoch": 0.74, "learning_rate": 7.64460426550172e-06, "loss": 0.7267, "step": 55570 }, { "epoch": 0.74, "learning_rate": 7.640817528605166e-06, "loss": 0.7613, "step": 55575 }, { "epoch": 0.74, "learning_rate": 7.63703156063354e-06, "loss": 0.5301, "step": 55580 }, { "epoch": 0.74, "learning_rate": 7.633246361754559e-06, "loss": 0.4705, "step": 55585 }, { "epoch": 0.74, "learning_rate": 7.629461932135884e-06, "loss": 1.012, "step": 55590 }, { "epoch": 0.74, "learning_rate": 7.625678271945133e-06, "loss": 0.759, "step": 55595 }, { "epoch": 0.74, "learning_rate": 7.621895381349922e-06, "loss": 0.9719, "step": 55600 }, { "epoch": 0.75, "learning_rate": 7.618113260517807e-06, "loss": 1.2418, "step": 55605 }, { "epoch": 0.75, "learning_rate": 7.614331909616315e-06, "loss": 0.7985, "step": 55610 }, { "epoch": 0.75, "learning_rate": 7.610551328812934e-06, "loss": 1.8255, "step": 55615 }, { "epoch": 0.75, "learning_rate": 7.606771518275141e-06, "loss": 0.3871, "step": 55620 }, { "epoch": 0.75, "learning_rate": 7.602992478170351e-06, "loss": 0.356, "step": 55625 }, { "epoch": 0.75, "learning_rate": 7.599214208665956e-06, "loss": 1.1048, "step": 55630 }, { "epoch": 0.75, "learning_rate": 7.595436709929321e-06, "loss": 0.2031, "step": 55635 }, { "epoch": 0.75, "learning_rate": 7.591659982127772e-06, "loss": 0.9713, "step": 55640 }, { "epoch": 0.75, "learning_rate": 7.587884025428585e-06, "loss": 0.6241, "step": 55645 }, { "epoch": 0.75, "learning_rate": 7.5841088399990435e-06, "loss": 0.6595, "step": 55650 }, { "epoch": 0.75, "learning_rate": 7.580334426006333e-06, "loss": 0.3766, "step": 55655 }, { "epoch": 0.75, "learning_rate": 7.576560783617668e-06, "loss": 0.9188, "step": 55660 }, { "epoch": 0.75, "learning_rate": 7.5727879130001925e-06, "loss": 0.3726, "step": 55665 }, { "epoch": 0.75, "learning_rate": 7.56901581432102e-06, "loss": 1.0044, "step": 55670 }, { "epoch": 0.75, "learning_rate": 7.56524448774725e-06, "loss": 0.7134, "step": 55675 }, { "epoch": 0.75, "learning_rate": 7.561473933445929e-06, "loss": 0.5139, "step": 55680 }, { "epoch": 0.75, "learning_rate": 7.5577041515840665e-06, "loss": 0.2169, "step": 55685 }, { "epoch": 0.75, "learning_rate": 7.553935142328644e-06, "loss": 0.3983, "step": 55690 }, { "epoch": 0.75, "learning_rate": 7.55016690584662e-06, "loss": 0.8126, "step": 55695 }, { "epoch": 0.75, "learning_rate": 7.546399442304905e-06, "loss": 0.5788, "step": 55700 }, { "epoch": 0.75, "learning_rate": 7.542632751870368e-06, "loss": 0.1676, "step": 55705 }, { "epoch": 0.75, "learning_rate": 7.5388668347098734e-06, "loss": 0.6667, "step": 55710 }, { "epoch": 0.75, "learning_rate": 7.5351016909902205e-06, "loss": 2.0343, "step": 55715 }, { "epoch": 0.75, "learning_rate": 7.531337320878182e-06, "loss": 0.3647, "step": 55720 }, { "epoch": 0.75, "learning_rate": 7.527573724540515e-06, "loss": 0.5486, "step": 55725 }, { "epoch": 0.75, "learning_rate": 7.523810902143918e-06, "loss": 0.5281, "step": 55730 }, { "epoch": 0.75, "learning_rate": 7.520048853855071e-06, "loss": 0.4818, "step": 55735 }, { "epoch": 0.75, "learning_rate": 7.5162875798406e-06, "loss": 0.7044, "step": 55740 }, { "epoch": 0.75, "learning_rate": 7.512527080267132e-06, "loss": 0.8391, "step": 55745 }, { "epoch": 0.75, "learning_rate": 7.508767355301225e-06, "loss": 0.6724, "step": 55750 }, { "epoch": 0.75, "learning_rate": 7.50500840510941e-06, "loss": 0.8577, "step": 55755 }, { "epoch": 0.75, "learning_rate": 7.501250229858214e-06, "loss": 1.0459, "step": 55760 }, { "epoch": 0.75, "learning_rate": 7.497492829714073e-06, "loss": 1.1035, "step": 55765 }, { "epoch": 0.75, "learning_rate": 7.493736204843446e-06, "loss": 0.3473, "step": 55770 }, { "epoch": 0.75, "learning_rate": 7.489980355412724e-06, "loss": 0.7475, "step": 55775 }, { "epoch": 0.75, "learning_rate": 7.486225281588264e-06, "loss": 0.7288, "step": 55780 }, { "epoch": 0.75, "learning_rate": 7.4824709835364135e-06, "loss": 0.2118, "step": 55785 }, { "epoch": 0.75, "learning_rate": 7.478717461423462e-06, "loss": 0.5576, "step": 55790 }, { "epoch": 0.75, "learning_rate": 7.474964715415669e-06, "loss": 0.1185, "step": 55795 }, { "epoch": 0.75, "learning_rate": 7.471212745679257e-06, "loss": 0.3526, "step": 55800 }, { "epoch": 0.75, "learning_rate": 7.467461552380437e-06, "loss": 0.159, "step": 55805 }, { "epoch": 0.75, "learning_rate": 7.463711135685353e-06, "loss": 0.8505, "step": 55810 }, { "epoch": 0.75, "learning_rate": 7.4599614957601286e-06, "loss": 0.5785, "step": 55815 }, { "epoch": 0.75, "learning_rate": 7.45621263277087e-06, "loss": 0.5322, "step": 55820 }, { "epoch": 0.75, "learning_rate": 7.45246454688362e-06, "loss": 0.5179, "step": 55825 }, { "epoch": 0.75, "learning_rate": 7.448717238264397e-06, "loss": 0.5402, "step": 55830 }, { "epoch": 0.75, "learning_rate": 7.444970707079202e-06, "loss": 0.4183, "step": 55835 }, { "epoch": 0.75, "learning_rate": 7.441224953493978e-06, "loss": 0.6326, "step": 55840 }, { "epoch": 0.75, "learning_rate": 7.437479977674644e-06, "loss": 0.3439, "step": 55845 }, { "epoch": 0.75, "learning_rate": 7.4337357797870765e-06, "loss": 0.9833, "step": 55850 }, { "epoch": 0.75, "learning_rate": 7.429992359997142e-06, "loss": 0.5425, "step": 55855 }, { "epoch": 0.75, "learning_rate": 7.426249718470649e-06, "loss": 0.4773, "step": 55860 }, { "epoch": 0.75, "learning_rate": 7.422507855373362e-06, "loss": 0.7357, "step": 55865 }, { "epoch": 0.75, "learning_rate": 7.418766770871058e-06, "loss": 0.9611, "step": 55870 }, { "epoch": 0.75, "learning_rate": 7.415026465129413e-06, "loss": 0.8117, "step": 55875 }, { "epoch": 0.75, "learning_rate": 7.41128693831413e-06, "loss": 0.4702, "step": 55880 }, { "epoch": 0.75, "learning_rate": 7.4075481905908405e-06, "loss": 0.475, "step": 55885 }, { "epoch": 0.75, "learning_rate": 7.403810222125146e-06, "loss": 0.3324, "step": 55890 }, { "epoch": 0.75, "learning_rate": 7.400073033082635e-06, "loss": 0.5216, "step": 55895 }, { "epoch": 0.75, "learning_rate": 7.396336623628841e-06, "loss": 0.571, "step": 55900 }, { "epoch": 0.75, "learning_rate": 7.392600993929266e-06, "loss": 0.4962, "step": 55905 }, { "epoch": 0.75, "learning_rate": 7.38886614414937e-06, "loss": 0.4184, "step": 55910 }, { "epoch": 0.75, "learning_rate": 7.385132074454609e-06, "loss": 0.7022, "step": 55915 }, { "epoch": 0.75, "learning_rate": 7.381398785010371e-06, "loss": 1.0008, "step": 55920 }, { "epoch": 0.75, "learning_rate": 7.377666275982015e-06, "loss": 0.9988, "step": 55925 }, { "epoch": 0.75, "learning_rate": 7.373934547534891e-06, "loss": 0.59, "step": 55930 }, { "epoch": 0.75, "learning_rate": 7.370203599834285e-06, "loss": 1.0855, "step": 55935 }, { "epoch": 0.75, "learning_rate": 7.366473433045454e-06, "loss": 0.7982, "step": 55940 }, { "epoch": 0.75, "learning_rate": 7.362744047333636e-06, "loss": 0.5934, "step": 55945 }, { "epoch": 0.75, "learning_rate": 7.359015442864025e-06, "loss": 0.3399, "step": 55950 }, { "epoch": 0.75, "learning_rate": 7.355287619801773e-06, "loss": 0.9774, "step": 55955 }, { "epoch": 0.75, "learning_rate": 7.351560578311997e-06, "loss": 0.5873, "step": 55960 }, { "epoch": 0.75, "learning_rate": 7.3478343185598045e-06, "loss": 0.5864, "step": 55965 }, { "epoch": 0.75, "learning_rate": 7.34410884071024e-06, "loss": 1.1793, "step": 55970 }, { "epoch": 0.75, "learning_rate": 7.340384144928314e-06, "loss": 0.6417, "step": 55975 }, { "epoch": 0.75, "learning_rate": 7.336660231379042e-06, "loss": 0.6338, "step": 55980 }, { "epoch": 0.75, "learning_rate": 7.332937100227335e-06, "loss": 0.2955, "step": 55985 }, { "epoch": 0.75, "learning_rate": 7.329214751638138e-06, "loss": 0.1578, "step": 55990 }, { "epoch": 0.75, "learning_rate": 7.325493185776325e-06, "loss": 0.536, "step": 55995 }, { "epoch": 0.75, "learning_rate": 7.321772402806734e-06, "loss": 0.834, "step": 56000 }, { "epoch": 0.75, "learning_rate": 7.318052402894191e-06, "loss": 0.954, "step": 56005 }, { "epoch": 0.75, "learning_rate": 7.314333186203464e-06, "loss": 1.6785, "step": 56010 }, { "epoch": 0.75, "learning_rate": 7.3106147528993e-06, "loss": 0.8954, "step": 56015 }, { "epoch": 0.75, "learning_rate": 7.306897103146398e-06, "loss": 0.7163, "step": 56020 }, { "epoch": 0.75, "learning_rate": 7.303180237109447e-06, "loss": 1.1501, "step": 56025 }, { "epoch": 0.75, "learning_rate": 7.299464154953076e-06, "loss": 0.3138, "step": 56030 }, { "epoch": 0.75, "learning_rate": 7.29574885684188e-06, "loss": 1.1296, "step": 56035 }, { "epoch": 0.75, "learning_rate": 7.292034342940449e-06, "loss": 0.3321, "step": 56040 }, { "epoch": 0.75, "learning_rate": 7.288320613413305e-06, "loss": 0.8156, "step": 56045 }, { "epoch": 0.75, "learning_rate": 7.284607668424942e-06, "loss": 1.4733, "step": 56050 }, { "epoch": 0.75, "learning_rate": 7.28089550813984e-06, "loss": 0.5862, "step": 56055 }, { "epoch": 0.75, "learning_rate": 7.27718413272242e-06, "loss": 0.6699, "step": 56060 }, { "epoch": 0.75, "learning_rate": 7.273473542337078e-06, "loss": 0.2355, "step": 56065 }, { "epoch": 0.75, "learning_rate": 7.269763737148169e-06, "loss": 0.6932, "step": 56070 }, { "epoch": 0.75, "learning_rate": 7.266054717320031e-06, "loss": 1.4711, "step": 56075 }, { "epoch": 0.75, "learning_rate": 7.262346483016952e-06, "loss": 0.8044, "step": 56080 }, { "epoch": 0.75, "learning_rate": 7.258639034403175e-06, "loss": 1.2978, "step": 56085 }, { "epoch": 0.75, "learning_rate": 7.2549323716429476e-06, "loss": 0.3933, "step": 56090 }, { "epoch": 0.75, "learning_rate": 7.251226494900423e-06, "loss": 0.5676, "step": 56095 }, { "epoch": 0.75, "learning_rate": 7.24752140433978e-06, "loss": 0.4931, "step": 56100 }, { "epoch": 0.75, "learning_rate": 7.243817100125125e-06, "loss": 0.4765, "step": 56105 }, { "epoch": 0.75, "learning_rate": 7.240113582420535e-06, "loss": 0.7854, "step": 56110 }, { "epoch": 0.75, "learning_rate": 7.236410851390072e-06, "loss": 0.5732, "step": 56115 }, { "epoch": 0.75, "learning_rate": 7.232708907197735e-06, "loss": 0.618, "step": 56120 }, { "epoch": 0.75, "learning_rate": 7.229007750007511e-06, "loss": 0.7388, "step": 56125 }, { "epoch": 0.75, "learning_rate": 7.225307379983329e-06, "loss": 1.1189, "step": 56130 }, { "epoch": 0.75, "learning_rate": 7.221607797289104e-06, "loss": 0.1951, "step": 56135 }, { "epoch": 0.75, "learning_rate": 7.217909002088727e-06, "loss": 1.3206, "step": 56140 }, { "epoch": 0.75, "learning_rate": 7.214210994546009e-06, "loss": 0.9554, "step": 56145 }, { "epoch": 0.75, "learning_rate": 7.210513774824768e-06, "loss": 1.0991, "step": 56150 }, { "epoch": 0.75, "learning_rate": 7.20681734308877e-06, "loss": 0.249, "step": 56155 }, { "epoch": 0.75, "learning_rate": 7.203121699501739e-06, "loss": 1.0818, "step": 56160 }, { "epoch": 0.75, "learning_rate": 7.1994268442273915e-06, "loss": 0.5317, "step": 56165 }, { "epoch": 0.75, "learning_rate": 7.195732777429379e-06, "loss": 1.1633, "step": 56170 }, { "epoch": 0.75, "learning_rate": 7.192039499271333e-06, "loss": 0.8364, "step": 56175 }, { "epoch": 0.75, "learning_rate": 7.18834700991684e-06, "loss": 0.6932, "step": 56180 }, { "epoch": 0.75, "learning_rate": 7.184655309529473e-06, "loss": 0.3818, "step": 56185 }, { "epoch": 0.75, "learning_rate": 7.1809643982727465e-06, "loss": 0.8974, "step": 56190 }, { "epoch": 0.75, "learning_rate": 7.177274276310145e-06, "loss": 0.4998, "step": 56195 }, { "epoch": 0.75, "learning_rate": 7.173584943805145e-06, "loss": 0.3022, "step": 56200 }, { "epoch": 0.75, "learning_rate": 7.169896400921133e-06, "loss": 0.937, "step": 56205 }, { "epoch": 0.75, "learning_rate": 7.166208647821518e-06, "loss": 0.4669, "step": 56210 }, { "epoch": 0.75, "learning_rate": 7.162521684669637e-06, "loss": 0.7318, "step": 56215 }, { "epoch": 0.75, "learning_rate": 7.158835511628803e-06, "loss": 0.6076, "step": 56220 }, { "epoch": 0.75, "learning_rate": 7.155150128862307e-06, "loss": 0.7171, "step": 56225 }, { "epoch": 0.75, "learning_rate": 7.151465536533383e-06, "loss": 0.4827, "step": 56230 }, { "epoch": 0.75, "learning_rate": 7.147781734805245e-06, "loss": 0.6165, "step": 56235 }, { "epoch": 0.75, "learning_rate": 7.144098723841056e-06, "loss": 0.6593, "step": 56240 }, { "epoch": 0.75, "learning_rate": 7.140416503803968e-06, "loss": 1.0422, "step": 56245 }, { "epoch": 0.75, "learning_rate": 7.136735074857082e-06, "loss": 0.5595, "step": 56250 }, { "epoch": 0.75, "learning_rate": 7.133054437163458e-06, "loss": 0.5732, "step": 56255 }, { "epoch": 0.75, "learning_rate": 7.129374590886145e-06, "loss": 0.639, "step": 56260 }, { "epoch": 0.75, "learning_rate": 7.125695536188132e-06, "loss": 0.4567, "step": 56265 }, { "epoch": 0.75, "learning_rate": 7.1220172732323784e-06, "loss": 0.784, "step": 56270 }, { "epoch": 0.75, "learning_rate": 7.118339802181825e-06, "loss": 0.654, "step": 56275 }, { "epoch": 0.75, "learning_rate": 7.114663123199361e-06, "loss": 0.4924, "step": 56280 }, { "epoch": 0.75, "learning_rate": 7.110987236447842e-06, "loss": 0.7634, "step": 56285 }, { "epoch": 0.75, "learning_rate": 7.107312142090086e-06, "loss": 1.008, "step": 56290 }, { "epoch": 0.75, "learning_rate": 7.103637840288893e-06, "loss": 0.5714, "step": 56295 }, { "epoch": 0.75, "learning_rate": 7.099964331207012e-06, "loss": 0.6459, "step": 56300 }, { "epoch": 0.75, "learning_rate": 7.096291615007156e-06, "loss": 0.6968, "step": 56305 }, { "epoch": 0.75, "learning_rate": 7.092619691852023e-06, "loss": 0.5778, "step": 56310 }, { "epoch": 0.75, "learning_rate": 7.088948561904235e-06, "loss": 0.4638, "step": 56315 }, { "epoch": 0.75, "learning_rate": 7.085278225326428e-06, "loss": 0.2893, "step": 56320 }, { "epoch": 0.75, "learning_rate": 7.081608682281171e-06, "loss": 0.7204, "step": 56325 }, { "epoch": 0.75, "learning_rate": 7.077939932930999e-06, "loss": 0.9844, "step": 56330 }, { "epoch": 0.75, "learning_rate": 7.074271977438435e-06, "loss": 0.3434, "step": 56335 }, { "epoch": 0.75, "learning_rate": 7.070604815965942e-06, "loss": 0.7749, "step": 56340 }, { "epoch": 0.75, "learning_rate": 7.066938448675958e-06, "loss": 0.2429, "step": 56345 }, { "epoch": 0.76, "learning_rate": 7.063272875730876e-06, "loss": 1.3392, "step": 56350 }, { "epoch": 0.76, "learning_rate": 7.05960809729308e-06, "loss": 0.8281, "step": 56355 }, { "epoch": 0.76, "learning_rate": 7.05594411352489e-06, "loss": 0.3324, "step": 56360 }, { "epoch": 0.76, "learning_rate": 7.0522809245886e-06, "loss": 0.3385, "step": 56365 }, { "epoch": 0.76, "learning_rate": 7.048618530646481e-06, "loss": 1.5397, "step": 56370 }, { "epoch": 0.76, "learning_rate": 7.044956931860752e-06, "loss": 0.59, "step": 56375 }, { "epoch": 0.76, "learning_rate": 7.041296128393599e-06, "loss": 0.8422, "step": 56380 }, { "epoch": 0.76, "learning_rate": 7.037636120407192e-06, "loss": 1.2274, "step": 56385 }, { "epoch": 0.76, "learning_rate": 7.033976908063639e-06, "loss": 0.7475, "step": 56390 }, { "epoch": 0.76, "learning_rate": 7.030318491525029e-06, "loss": 0.5718, "step": 56395 }, { "epoch": 0.76, "learning_rate": 7.026660870953403e-06, "loss": 0.4108, "step": 56400 }, { "epoch": 0.76, "learning_rate": 7.02300404651079e-06, "loss": 1.0464, "step": 56405 }, { "epoch": 0.76, "learning_rate": 7.019348018359162e-06, "loss": 0.4614, "step": 56410 }, { "epoch": 0.76, "learning_rate": 7.015692786660455e-06, "loss": 1.1438, "step": 56415 }, { "epoch": 0.76, "learning_rate": 7.0120383515766e-06, "loss": 1.0621, "step": 56420 }, { "epoch": 0.76, "learning_rate": 7.0083847132694365e-06, "loss": 0.5841, "step": 56425 }, { "epoch": 0.76, "learning_rate": 7.004731871900832e-06, "loss": 0.6163, "step": 56430 }, { "epoch": 0.76, "learning_rate": 7.001079827632578e-06, "loss": 1.0564, "step": 56435 }, { "epoch": 0.76, "learning_rate": 6.997428580626433e-06, "loss": 0.9153, "step": 56440 }, { "epoch": 0.76, "learning_rate": 6.9937781310441485e-06, "loss": 0.2439, "step": 56445 }, { "epoch": 0.76, "learning_rate": 6.990128479047406e-06, "loss": 0.9062, "step": 56450 }, { "epoch": 0.76, "learning_rate": 6.986479624797873e-06, "loss": 0.9865, "step": 56455 }, { "epoch": 0.76, "learning_rate": 6.982831568457168e-06, "loss": 0.4275, "step": 56460 }, { "epoch": 0.76, "learning_rate": 6.979184310186895e-06, "loss": 0.96, "step": 56465 }, { "epoch": 0.76, "learning_rate": 6.9755378501486e-06, "loss": 1.1198, "step": 56470 }, { "epoch": 0.76, "learning_rate": 6.971892188503798e-06, "loss": 0.7228, "step": 56475 }, { "epoch": 0.76, "learning_rate": 6.9682473254139874e-06, "loss": 1.0292, "step": 56480 }, { "epoch": 0.76, "learning_rate": 6.964603261040611e-06, "loss": 0.2667, "step": 56485 }, { "epoch": 0.76, "learning_rate": 6.960959995545071e-06, "loss": 0.6458, "step": 56490 }, { "epoch": 0.76, "learning_rate": 6.95731752908877e-06, "loss": 0.3942, "step": 56495 }, { "epoch": 0.76, "learning_rate": 6.953675861833034e-06, "loss": 0.8684, "step": 56500 }, { "epoch": 0.76, "learning_rate": 6.9500349939391755e-06, "loss": 1.1284, "step": 56505 }, { "epoch": 0.76, "learning_rate": 6.946394925568456e-06, "loss": 0.7631, "step": 56510 }, { "epoch": 0.76, "learning_rate": 6.94275565688213e-06, "loss": 1.226, "step": 56515 }, { "epoch": 0.76, "learning_rate": 6.939117188041394e-06, "loss": 1.5982, "step": 56520 }, { "epoch": 0.76, "learning_rate": 6.935479519207403e-06, "loss": 1.2025, "step": 56525 }, { "epoch": 0.76, "learning_rate": 6.931842650541306e-06, "loss": 0.9617, "step": 56530 }, { "epoch": 0.76, "learning_rate": 6.928206582204175e-06, "loss": 0.4306, "step": 56535 }, { "epoch": 0.76, "learning_rate": 6.924571314357089e-06, "loss": 0.6565, "step": 56540 }, { "epoch": 0.76, "learning_rate": 6.920936847161069e-06, "loss": 1.3565, "step": 56545 }, { "epoch": 0.76, "learning_rate": 6.9173031807770874e-06, "loss": 0.8124, "step": 56550 }, { "epoch": 0.76, "learning_rate": 6.913670315366119e-06, "loss": 1.36, "step": 56555 }, { "epoch": 0.76, "learning_rate": 6.910038251089074e-06, "loss": 1.1718, "step": 56560 }, { "epoch": 0.76, "learning_rate": 6.906406988106834e-06, "loss": 0.4712, "step": 56565 }, { "epoch": 0.76, "learning_rate": 6.9027765265802345e-06, "loss": 0.7832, "step": 56570 }, { "epoch": 0.76, "learning_rate": 6.899146866670106e-06, "loss": 0.7842, "step": 56575 }, { "epoch": 0.76, "learning_rate": 6.895518008537216e-06, "loss": 0.8528, "step": 56580 }, { "epoch": 0.76, "learning_rate": 6.891889952342298e-06, "loss": 1.1346, "step": 56585 }, { "epoch": 0.76, "learning_rate": 6.888262698246067e-06, "loss": 0.8775, "step": 56590 }, { "epoch": 0.76, "learning_rate": 6.88463624640919e-06, "loss": 0.5805, "step": 56595 }, { "epoch": 0.76, "learning_rate": 6.881010596992293e-06, "loss": 0.559, "step": 56600 }, { "epoch": 0.76, "learning_rate": 6.877385750155988e-06, "loss": 0.4437, "step": 56605 }, { "epoch": 0.76, "learning_rate": 6.873761706060827e-06, "loss": 0.5906, "step": 56610 }, { "epoch": 0.76, "learning_rate": 6.87013846486734e-06, "loss": 0.6242, "step": 56615 }, { "epoch": 0.76, "learning_rate": 6.866516026736011e-06, "loss": 2.3425, "step": 56620 }, { "epoch": 0.76, "learning_rate": 6.862894391827313e-06, "loss": 0.7561, "step": 56625 }, { "epoch": 0.76, "learning_rate": 6.859273560301654e-06, "loss": 0.2554, "step": 56630 }, { "epoch": 0.76, "learning_rate": 6.855653532319414e-06, "loss": 1.1098, "step": 56635 }, { "epoch": 0.76, "learning_rate": 6.8520343080409635e-06, "loss": 1.2593, "step": 56640 }, { "epoch": 0.76, "learning_rate": 6.8484158876265885e-06, "loss": 1.4965, "step": 56645 }, { "epoch": 0.76, "learning_rate": 6.8447982712365884e-06, "loss": 0.6346, "step": 56650 }, { "epoch": 0.76, "learning_rate": 6.841181459031193e-06, "loss": 0.4943, "step": 56655 }, { "epoch": 0.76, "learning_rate": 6.837565451170611e-06, "loss": 1.1892, "step": 56660 }, { "epoch": 0.76, "learning_rate": 6.833950247815018e-06, "loss": 0.652, "step": 56665 }, { "epoch": 0.76, "learning_rate": 6.83033584912455e-06, "loss": 0.4559, "step": 56670 }, { "epoch": 0.76, "learning_rate": 6.8267222552592964e-06, "loss": 0.76, "step": 56675 }, { "epoch": 0.76, "learning_rate": 6.823109466379338e-06, "loss": 1.1157, "step": 56680 }, { "epoch": 0.76, "learning_rate": 6.819497482644691e-06, "loss": 1.222, "step": 56685 }, { "epoch": 0.76, "learning_rate": 6.815886304215352e-06, "loss": 0.7118, "step": 56690 }, { "epoch": 0.76, "learning_rate": 6.812275931251269e-06, "loss": 0.8245, "step": 56695 }, { "epoch": 0.76, "learning_rate": 6.8086663639123805e-06, "loss": 0.3192, "step": 56700 }, { "epoch": 0.76, "learning_rate": 6.805057602358564e-06, "loss": 0.7089, "step": 56705 }, { "epoch": 0.76, "learning_rate": 6.801449646749664e-06, "loss": 0.9496, "step": 56710 }, { "epoch": 0.76, "learning_rate": 6.797842497245505e-06, "loss": 0.9235, "step": 56715 }, { "epoch": 0.76, "learning_rate": 6.794236154005862e-06, "loss": 0.3891, "step": 56720 }, { "epoch": 0.76, "learning_rate": 6.790630617190474e-06, "loss": 0.6804, "step": 56725 }, { "epoch": 0.76, "learning_rate": 6.787025886959048e-06, "loss": 0.8229, "step": 56730 }, { "epoch": 0.76, "learning_rate": 6.783421963471262e-06, "loss": 0.1537, "step": 56735 }, { "epoch": 0.76, "learning_rate": 6.779818846886751e-06, "loss": 0.4782, "step": 56740 }, { "epoch": 0.76, "learning_rate": 6.776216537365104e-06, "loss": 0.6573, "step": 56745 }, { "epoch": 0.76, "learning_rate": 6.772615035065907e-06, "loss": 0.8784, "step": 56750 }, { "epoch": 0.76, "learning_rate": 6.7690143401486634e-06, "loss": 0.623, "step": 56755 }, { "epoch": 0.76, "learning_rate": 6.765414452772884e-06, "loss": 0.825, "step": 56760 }, { "epoch": 0.76, "learning_rate": 6.761815373098019e-06, "loss": 0.8508, "step": 56765 }, { "epoch": 0.76, "learning_rate": 6.758217101283482e-06, "loss": 0.6433, "step": 56770 }, { "epoch": 0.76, "learning_rate": 6.754619637488674e-06, "loss": 0.7646, "step": 56775 }, { "epoch": 0.76, "learning_rate": 6.75102298187294e-06, "loss": 0.762, "step": 56780 }, { "epoch": 0.76, "learning_rate": 6.747427134595582e-06, "loss": 0.9325, "step": 56785 }, { "epoch": 0.76, "learning_rate": 6.743832095815894e-06, "loss": 0.437, "step": 56790 }, { "epoch": 0.76, "learning_rate": 6.740237865693113e-06, "loss": 0.6687, "step": 56795 }, { "epoch": 0.76, "learning_rate": 6.736644444386444e-06, "loss": 0.9291, "step": 56800 }, { "epoch": 0.76, "learning_rate": 6.733051832055048e-06, "loss": 0.4212, "step": 56805 }, { "epoch": 0.76, "learning_rate": 6.729460028858078e-06, "loss": 0.3936, "step": 56810 }, { "epoch": 0.76, "learning_rate": 6.7258690349546235e-06, "loss": 0.9142, "step": 56815 }, { "epoch": 0.76, "learning_rate": 6.722278850503741e-06, "loss": 0.7675, "step": 56820 }, { "epoch": 0.76, "learning_rate": 6.718689475664472e-06, "loss": 0.9597, "step": 56825 }, { "epoch": 0.76, "learning_rate": 6.715100910595801e-06, "loss": 0.3595, "step": 56830 }, { "epoch": 0.76, "learning_rate": 6.711513155456683e-06, "loss": 0.447, "step": 56835 }, { "epoch": 0.76, "learning_rate": 6.707926210406029e-06, "loss": 0.2193, "step": 56840 }, { "epoch": 0.76, "learning_rate": 6.704340075602741e-06, "loss": 0.9194, "step": 56845 }, { "epoch": 0.76, "learning_rate": 6.700754751205656e-06, "loss": 0.5628, "step": 56850 }, { "epoch": 0.76, "learning_rate": 6.697170237373582e-06, "loss": 0.2548, "step": 56855 }, { "epoch": 0.76, "learning_rate": 6.693586534265314e-06, "loss": 1.559, "step": 56860 }, { "epoch": 0.76, "learning_rate": 6.690003642039564e-06, "loss": 1.1896, "step": 56865 }, { "epoch": 0.76, "learning_rate": 6.686421560855058e-06, "loss": 0.88, "step": 56870 }, { "epoch": 0.76, "learning_rate": 6.682840290870454e-06, "loss": 1.178, "step": 56875 }, { "epoch": 0.76, "learning_rate": 6.679259832244383e-06, "loss": 0.7742, "step": 56880 }, { "epoch": 0.76, "learning_rate": 6.675680185135452e-06, "loss": 0.8366, "step": 56885 }, { "epoch": 0.76, "learning_rate": 6.672101349702215e-06, "loss": 0.4943, "step": 56890 }, { "epoch": 0.76, "learning_rate": 6.6685233261031905e-06, "loss": 0.6086, "step": 56895 }, { "epoch": 0.76, "learning_rate": 6.6649461144968785e-06, "loss": 0.2821, "step": 56900 }, { "epoch": 0.76, "learning_rate": 6.661369715041726e-06, "loss": 0.6143, "step": 56905 }, { "epoch": 0.76, "learning_rate": 6.657794127896153e-06, "loss": 0.3984, "step": 56910 }, { "epoch": 0.76, "learning_rate": 6.654219353218527e-06, "loss": 1.5252, "step": 56915 }, { "epoch": 0.76, "learning_rate": 6.65064539116721e-06, "loss": 1.2558, "step": 56920 }, { "epoch": 0.76, "learning_rate": 6.6470722419005034e-06, "loss": 0.8915, "step": 56925 }, { "epoch": 0.76, "learning_rate": 6.643499905576672e-06, "loss": 1.0295, "step": 56930 }, { "epoch": 0.76, "learning_rate": 6.639928382353969e-06, "loss": 0.8814, "step": 56935 }, { "epoch": 0.76, "learning_rate": 6.636357672390587e-06, "loss": 1.3468, "step": 56940 }, { "epoch": 0.76, "learning_rate": 6.632787775844687e-06, "loss": 0.6692, "step": 56945 }, { "epoch": 0.76, "learning_rate": 6.629218692874395e-06, "loss": 1.0486, "step": 56950 }, { "epoch": 0.76, "learning_rate": 6.6256504236378135e-06, "loss": 0.3676, "step": 56955 }, { "epoch": 0.76, "learning_rate": 6.622082968292998e-06, "loss": 0.4147, "step": 56960 }, { "epoch": 0.76, "learning_rate": 6.6185163269979534e-06, "loss": 0.476, "step": 56965 }, { "epoch": 0.76, "learning_rate": 6.614950499910694e-06, "loss": 1.3031, "step": 56970 }, { "epoch": 0.76, "learning_rate": 6.611385487189134e-06, "loss": 1.1136, "step": 56975 }, { "epoch": 0.76, "learning_rate": 6.607821288991209e-06, "loss": 0.4457, "step": 56980 }, { "epoch": 0.76, "learning_rate": 6.604257905474786e-06, "loss": 0.3859, "step": 56985 }, { "epoch": 0.76, "learning_rate": 6.600695336797702e-06, "loss": 0.3729, "step": 56990 }, { "epoch": 0.76, "learning_rate": 6.5971335831177734e-06, "loss": 0.8036, "step": 56995 }, { "epoch": 0.76, "learning_rate": 6.593572644592757e-06, "loss": 0.6977, "step": 57000 }, { "epoch": 0.76, "learning_rate": 6.590012521380384e-06, "loss": 0.5558, "step": 57005 }, { "epoch": 0.76, "learning_rate": 6.58645321363836e-06, "loss": 0.4439, "step": 57010 }, { "epoch": 0.76, "learning_rate": 6.58289472152434e-06, "loss": 0.3138, "step": 57015 }, { "epoch": 0.76, "learning_rate": 6.5793370451959436e-06, "loss": 0.5104, "step": 57020 }, { "epoch": 0.76, "learning_rate": 6.575780184810754e-06, "loss": 0.7613, "step": 57025 }, { "epoch": 0.76, "learning_rate": 6.572224140526337e-06, "loss": 0.6969, "step": 57030 }, { "epoch": 0.76, "learning_rate": 6.5686689125002e-06, "loss": 1.1629, "step": 57035 }, { "epoch": 0.76, "learning_rate": 6.565114500889813e-06, "loss": 1.2283, "step": 57040 }, { "epoch": 0.76, "learning_rate": 6.561560905852632e-06, "loss": 1.2382, "step": 57045 }, { "epoch": 0.76, "learning_rate": 6.5580081275460585e-06, "loss": 0.1993, "step": 57050 }, { "epoch": 0.76, "learning_rate": 6.554456166127465e-06, "loss": 0.8042, "step": 57055 }, { "epoch": 0.76, "learning_rate": 6.550905021754175e-06, "loss": 0.9493, "step": 57060 }, { "epoch": 0.76, "learning_rate": 6.547354694583502e-06, "loss": 0.8007, "step": 57065 }, { "epoch": 0.76, "learning_rate": 6.5438051847727e-06, "loss": 0.7397, "step": 57070 }, { "epoch": 0.76, "learning_rate": 6.540256492478989e-06, "loss": 0.2579, "step": 57075 }, { "epoch": 0.76, "learning_rate": 6.536708617859577e-06, "loss": 0.4371, "step": 57080 }, { "epoch": 0.76, "learning_rate": 6.533161561071588e-06, "loss": 0.5179, "step": 57085 }, { "epoch": 0.76, "learning_rate": 6.529615322272159e-06, "loss": 1.0855, "step": 57090 }, { "epoch": 0.76, "learning_rate": 6.526069901618378e-06, "loss": 0.3491, "step": 57095 }, { "epoch": 0.77, "learning_rate": 6.522525299267265e-06, "loss": 0.6674, "step": 57100 }, { "epoch": 0.77, "learning_rate": 6.518981515375849e-06, "loss": 0.5413, "step": 57105 }, { "epoch": 0.77, "learning_rate": 6.515438550101094e-06, "loss": 0.1101, "step": 57110 }, { "epoch": 0.77, "learning_rate": 6.511896403599929e-06, "loss": 0.58, "step": 57115 }, { "epoch": 0.77, "learning_rate": 6.508355076029269e-06, "loss": 1.0795, "step": 57120 }, { "epoch": 0.77, "learning_rate": 6.504814567545967e-06, "loss": 0.3894, "step": 57125 }, { "epoch": 0.77, "learning_rate": 6.501274878306851e-06, "loss": 0.1068, "step": 57130 }, { "epoch": 0.77, "learning_rate": 6.497736008468702e-06, "loss": 0.5038, "step": 57135 }, { "epoch": 0.77, "learning_rate": 6.494197958188295e-06, "loss": 0.6645, "step": 57140 }, { "epoch": 0.77, "learning_rate": 6.490660727622333e-06, "loss": 1.1999, "step": 57145 }, { "epoch": 0.77, "learning_rate": 6.487124316927498e-06, "loss": 0.3059, "step": 57150 }, { "epoch": 0.77, "learning_rate": 6.483588726260442e-06, "loss": 0.6433, "step": 57155 }, { "epoch": 0.77, "learning_rate": 6.480053955777776e-06, "loss": 0.7245, "step": 57160 }, { "epoch": 0.77, "learning_rate": 6.4765200056360635e-06, "loss": 0.4699, "step": 57165 }, { "epoch": 0.77, "learning_rate": 6.472986875991838e-06, "loss": 1.223, "step": 57170 }, { "epoch": 0.77, "learning_rate": 6.469454567001615e-06, "loss": 0.565, "step": 57175 }, { "epoch": 0.77, "learning_rate": 6.4659230788218476e-06, "loss": 0.8012, "step": 57180 }, { "epoch": 0.77, "learning_rate": 6.462392411608958e-06, "loss": 0.7248, "step": 57185 }, { "epoch": 0.77, "learning_rate": 6.458862565519358e-06, "loss": 0.5401, "step": 57190 }, { "epoch": 0.77, "learning_rate": 6.455333540709374e-06, "loss": 1.1895, "step": 57195 }, { "epoch": 0.77, "learning_rate": 6.451805337335337e-06, "loss": 0.1559, "step": 57200 }, { "epoch": 0.77, "learning_rate": 6.448277955553544e-06, "loss": 0.3212, "step": 57205 }, { "epoch": 0.77, "learning_rate": 6.444751395520215e-06, "loss": 0.4947, "step": 57210 }, { "epoch": 0.77, "learning_rate": 6.441225657391575e-06, "loss": 0.6035, "step": 57215 }, { "epoch": 0.77, "learning_rate": 6.437700741323793e-06, "loss": 0.9244, "step": 57220 }, { "epoch": 0.77, "learning_rate": 6.434176647472995e-06, "loss": 0.6037, "step": 57225 }, { "epoch": 0.77, "learning_rate": 6.430653375995296e-06, "loss": 1.4936, "step": 57230 }, { "epoch": 0.77, "learning_rate": 6.427130927046754e-06, "loss": 0.4868, "step": 57235 }, { "epoch": 0.77, "learning_rate": 6.423609300783398e-06, "loss": 0.6339, "step": 57240 }, { "epoch": 0.77, "learning_rate": 6.420088497361204e-06, "loss": 0.7148, "step": 57245 }, { "epoch": 0.77, "learning_rate": 6.416568516936147e-06, "loss": 1.2772, "step": 57250 }, { "epoch": 0.77, "learning_rate": 6.413049359664133e-06, "loss": 0.6122, "step": 57255 }, { "epoch": 0.77, "learning_rate": 6.409531025701038e-06, "loss": 1.1041, "step": 57260 }, { "epoch": 0.77, "learning_rate": 6.406013515202719e-06, "loss": 0.7298, "step": 57265 }, { "epoch": 0.77, "learning_rate": 6.40249682832498e-06, "loss": 0.8378, "step": 57270 }, { "epoch": 0.77, "learning_rate": 6.398980965223592e-06, "loss": 0.8975, "step": 57275 }, { "epoch": 0.77, "learning_rate": 6.395465926054281e-06, "loss": 1.3667, "step": 57280 }, { "epoch": 0.77, "learning_rate": 6.391951710972763e-06, "loss": 0.6217, "step": 57285 }, { "epoch": 0.77, "learning_rate": 6.388438320134687e-06, "loss": 0.872, "step": 57290 }, { "epoch": 0.77, "learning_rate": 6.384925753695681e-06, "loss": 1.0909, "step": 57295 }, { "epoch": 0.77, "learning_rate": 6.3814140118113454e-06, "loss": 0.5151, "step": 57300 }, { "epoch": 0.77, "learning_rate": 6.377903094637211e-06, "loss": 0.461, "step": 57305 }, { "epoch": 0.77, "learning_rate": 6.374393002328805e-06, "loss": 1.1641, "step": 57310 }, { "epoch": 0.77, "learning_rate": 6.370883735041624e-06, "loss": 0.9039, "step": 57315 }, { "epoch": 0.77, "learning_rate": 6.36737529293108e-06, "loss": 1.1995, "step": 57320 }, { "epoch": 0.77, "learning_rate": 6.363867676152602e-06, "loss": 0.3318, "step": 57325 }, { "epoch": 0.77, "learning_rate": 6.360360884861552e-06, "loss": 0.7811, "step": 57330 }, { "epoch": 0.77, "learning_rate": 6.356854919213254e-06, "loss": 0.338, "step": 57335 }, { "epoch": 0.77, "learning_rate": 6.353349779363024e-06, "loss": 0.3194, "step": 57340 }, { "epoch": 0.77, "learning_rate": 6.349845465466112e-06, "loss": 0.4121, "step": 57345 }, { "epoch": 0.77, "learning_rate": 6.346341977677741e-06, "loss": 0.8721, "step": 57350 }, { "epoch": 0.77, "learning_rate": 6.342839316153093e-06, "loss": 1.1573, "step": 57355 }, { "epoch": 0.77, "learning_rate": 6.339337481047333e-06, "loss": 0.8146, "step": 57360 }, { "epoch": 0.77, "learning_rate": 6.335836472515566e-06, "loss": 0.6658, "step": 57365 }, { "epoch": 0.77, "learning_rate": 6.332336290712862e-06, "loss": 0.5722, "step": 57370 }, { "epoch": 0.77, "learning_rate": 6.328836935794275e-06, "loss": 0.6922, "step": 57375 }, { "epoch": 0.77, "learning_rate": 6.325338407914802e-06, "loss": 0.7557, "step": 57380 }, { "epoch": 0.77, "learning_rate": 6.321840707229412e-06, "loss": 0.3456, "step": 57385 }, { "epoch": 0.77, "learning_rate": 6.318343833893029e-06, "loss": 0.4415, "step": 57390 }, { "epoch": 0.77, "learning_rate": 6.314847788060557e-06, "loss": 0.7413, "step": 57395 }, { "epoch": 0.77, "learning_rate": 6.3113525698868524e-06, "loss": 0.6195, "step": 57400 }, { "epoch": 0.77, "learning_rate": 6.307858179526724e-06, "loss": 0.8847, "step": 57405 }, { "epoch": 0.77, "learning_rate": 6.304364617134978e-06, "loss": 0.8866, "step": 57410 }, { "epoch": 0.77, "learning_rate": 6.3008718828663355e-06, "loss": 0.7092, "step": 57415 }, { "epoch": 0.77, "learning_rate": 6.29737997687552e-06, "loss": 0.6395, "step": 57420 }, { "epoch": 0.77, "learning_rate": 6.293888899317216e-06, "loss": 0.4868, "step": 57425 }, { "epoch": 0.77, "learning_rate": 6.290398650346038e-06, "loss": 0.5599, "step": 57430 }, { "epoch": 0.77, "learning_rate": 6.286909230116606e-06, "loss": 0.6217, "step": 57435 }, { "epoch": 0.77, "learning_rate": 6.283420638783477e-06, "loss": 0.9173, "step": 57440 }, { "epoch": 0.77, "learning_rate": 6.279932876501168e-06, "loss": 0.2735, "step": 57445 }, { "epoch": 0.77, "learning_rate": 6.276445943424189e-06, "loss": 0.2362, "step": 57450 }, { "epoch": 0.77, "learning_rate": 6.2729598397069824e-06, "loss": 0.663, "step": 57455 }, { "epoch": 0.77, "learning_rate": 6.269474565503969e-06, "loss": 0.7434, "step": 57460 }, { "epoch": 0.77, "learning_rate": 6.265990120969514e-06, "loss": 0.5848, "step": 57465 }, { "epoch": 0.77, "learning_rate": 6.2625065062579845e-06, "loss": 0.6105, "step": 57470 }, { "epoch": 0.77, "learning_rate": 6.259023721523677e-06, "loss": 0.2695, "step": 57475 }, { "epoch": 0.77, "learning_rate": 6.25554176692085e-06, "loss": 0.6097, "step": 57480 }, { "epoch": 0.77, "learning_rate": 6.252060642603763e-06, "loss": 0.7415, "step": 57485 }, { "epoch": 0.77, "learning_rate": 6.248580348726582e-06, "loss": 0.5464, "step": 57490 }, { "epoch": 0.77, "learning_rate": 6.245100885443489e-06, "loss": 0.8902, "step": 57495 }, { "epoch": 0.77, "learning_rate": 6.241622252908591e-06, "loss": 0.7024, "step": 57500 }, { "epoch": 0.77, "learning_rate": 6.2381444512759905e-06, "loss": 0.5082, "step": 57505 }, { "epoch": 0.77, "learning_rate": 6.234667480699724e-06, "loss": 0.9663, "step": 57510 }, { "epoch": 0.77, "learning_rate": 6.231191341333806e-06, "loss": 0.6465, "step": 57515 }, { "epoch": 0.77, "learning_rate": 6.227716033332218e-06, "loss": 0.5126, "step": 57520 }, { "epoch": 0.77, "learning_rate": 6.224241556848897e-06, "loss": 0.4832, "step": 57525 }, { "epoch": 0.77, "learning_rate": 6.220767912037734e-06, "loss": 0.6589, "step": 57530 }, { "epoch": 0.77, "learning_rate": 6.217295099052619e-06, "loss": 0.5946, "step": 57535 }, { "epoch": 0.77, "learning_rate": 6.213823118047349e-06, "loss": 0.3687, "step": 57540 }, { "epoch": 0.77, "learning_rate": 6.210351969175737e-06, "loss": 1.2206, "step": 57545 }, { "epoch": 0.77, "learning_rate": 6.206881652591534e-06, "loss": 0.6007, "step": 57550 }, { "epoch": 0.77, "learning_rate": 6.2034121684484445e-06, "loss": 0.1274, "step": 57555 }, { "epoch": 0.77, "learning_rate": 6.1999435169001695e-06, "loss": 1.0964, "step": 57560 }, { "epoch": 0.77, "learning_rate": 6.19647569810034e-06, "loss": 0.703, "step": 57565 }, { "epoch": 0.77, "learning_rate": 6.193008712202566e-06, "loss": 1.3113, "step": 57570 }, { "epoch": 0.77, "learning_rate": 6.189542559360411e-06, "loss": 0.8896, "step": 57575 }, { "epoch": 0.77, "learning_rate": 6.186077239727425e-06, "loss": 0.7514, "step": 57580 }, { "epoch": 0.77, "learning_rate": 6.182612753457093e-06, "loss": 0.8556, "step": 57585 }, { "epoch": 0.77, "learning_rate": 6.179149100702866e-06, "loss": 1.1306, "step": 57590 }, { "epoch": 0.77, "learning_rate": 6.175686281618192e-06, "loss": 0.4987, "step": 57595 }, { "epoch": 0.77, "learning_rate": 6.172224296356424e-06, "loss": 0.6576, "step": 57600 }, { "epoch": 0.77, "learning_rate": 6.168763145070938e-06, "loss": 0.8861, "step": 57605 }, { "epoch": 0.77, "learning_rate": 6.165302827915026e-06, "loss": 0.2463, "step": 57610 }, { "epoch": 0.77, "learning_rate": 6.161843345041979e-06, "loss": 0.4941, "step": 57615 }, { "epoch": 0.77, "learning_rate": 6.1583846966050294e-06, "loss": 0.2429, "step": 57620 }, { "epoch": 0.77, "learning_rate": 6.154926882757367e-06, "loss": 0.7937, "step": 57625 }, { "epoch": 0.77, "learning_rate": 6.151469903652171e-06, "loss": 0.71, "step": 57630 }, { "epoch": 0.77, "learning_rate": 6.1480137594425644e-06, "loss": 1.0302, "step": 57635 }, { "epoch": 0.77, "learning_rate": 6.144558450281626e-06, "loss": 0.5857, "step": 57640 }, { "epoch": 0.77, "learning_rate": 6.141103976322432e-06, "loss": 0.4837, "step": 57645 }, { "epoch": 0.77, "learning_rate": 6.1376503377179674e-06, "loss": 0.7493, "step": 57650 }, { "epoch": 0.77, "learning_rate": 6.134197534621239e-06, "loss": 1.3555, "step": 57655 }, { "epoch": 0.77, "learning_rate": 6.130745567185175e-06, "loss": 0.2792, "step": 57660 }, { "epoch": 0.77, "learning_rate": 6.127294435562675e-06, "loss": 0.7531, "step": 57665 }, { "epoch": 0.77, "learning_rate": 6.123844139906621e-06, "loss": 0.3923, "step": 57670 }, { "epoch": 0.77, "learning_rate": 6.12039468036984e-06, "loss": 0.6186, "step": 57675 }, { "epoch": 0.77, "learning_rate": 6.116946057105119e-06, "loss": 0.8444, "step": 57680 }, { "epoch": 0.77, "learning_rate": 6.1134982702652135e-06, "loss": 0.8608, "step": 57685 }, { "epoch": 0.77, "learning_rate": 6.110051320002855e-06, "loss": 0.1885, "step": 57690 }, { "epoch": 0.77, "learning_rate": 6.106605206470722e-06, "loss": 0.7743, "step": 57695 }, { "epoch": 0.77, "learning_rate": 6.1031599298214476e-06, "loss": 0.8663, "step": 57700 }, { "epoch": 0.77, "learning_rate": 6.0997154902076665e-06, "loss": 0.6169, "step": 57705 }, { "epoch": 0.77, "learning_rate": 6.096271887781918e-06, "loss": 0.8773, "step": 57710 }, { "epoch": 0.77, "learning_rate": 6.092829122696761e-06, "loss": 0.6323, "step": 57715 }, { "epoch": 0.77, "learning_rate": 6.089387195104676e-06, "loss": 0.5581, "step": 57720 }, { "epoch": 0.77, "learning_rate": 6.085946105158141e-06, "loss": 1.3376, "step": 57725 }, { "epoch": 0.77, "learning_rate": 6.082505853009565e-06, "loss": 0.7377, "step": 57730 }, { "epoch": 0.77, "learning_rate": 6.079066438811334e-06, "loss": 0.6256, "step": 57735 }, { "epoch": 0.77, "learning_rate": 6.07562786271581e-06, "loss": 0.8152, "step": 57740 }, { "epoch": 0.77, "learning_rate": 6.072190124875294e-06, "loss": 0.4141, "step": 57745 }, { "epoch": 0.77, "learning_rate": 6.068753225442056e-06, "loss": 0.6704, "step": 57750 }, { "epoch": 0.77, "learning_rate": 6.065317164568354e-06, "loss": 1.3982, "step": 57755 }, { "epoch": 0.77, "learning_rate": 6.061881942406361e-06, "loss": 1.0812, "step": 57760 }, { "epoch": 0.77, "learning_rate": 6.05844755910826e-06, "loss": 0.9711, "step": 57765 }, { "epoch": 0.77, "learning_rate": 6.055014014826171e-06, "loss": 0.9553, "step": 57770 }, { "epoch": 0.77, "learning_rate": 6.051581309712176e-06, "loss": 0.7904, "step": 57775 }, { "epoch": 0.77, "learning_rate": 6.048149443918338e-06, "loss": 0.5736, "step": 57780 }, { "epoch": 0.77, "learning_rate": 6.044718417596668e-06, "loss": 1.0448, "step": 57785 }, { "epoch": 0.77, "learning_rate": 6.041288230899142e-06, "loss": 0.1084, "step": 57790 }, { "epoch": 0.77, "learning_rate": 6.03785888397769e-06, "loss": 0.7263, "step": 57795 }, { "epoch": 0.77, "learning_rate": 6.034430376984235e-06, "loss": 1.3591, "step": 57800 }, { "epoch": 0.77, "learning_rate": 6.031002710070633e-06, "loss": 0.6242, "step": 57805 }, { "epoch": 0.77, "learning_rate": 6.027575883388703e-06, "loss": 0.355, "step": 57810 }, { "epoch": 0.77, "learning_rate": 6.024149897090261e-06, "loss": 0.8734, "step": 57815 }, { "epoch": 0.77, "learning_rate": 6.020724751327028e-06, "loss": 0.8042, "step": 57820 }, { "epoch": 0.77, "learning_rate": 6.017300446250748e-06, "loss": 1.4007, "step": 57825 }, { "epoch": 0.77, "learning_rate": 6.013876982013084e-06, "loss": 0.4124, "step": 57830 }, { "epoch": 0.77, "learning_rate": 6.010454358765691e-06, "loss": 0.5644, "step": 57835 }, { "epoch": 0.77, "learning_rate": 6.007032576660168e-06, "loss": 0.3379, "step": 57840 }, { "epoch": 0.78, "learning_rate": 6.004295756699757e-06, "loss": 1.7152, "step": 57845 }, { "epoch": 0.78, "learning_rate": 6.000875489031518e-06, "loss": 0.7914, "step": 57850 }, { "epoch": 0.78, "learning_rate": 5.9974560629294465e-06, "loss": 0.2553, "step": 57855 }, { "epoch": 0.78, "learning_rate": 5.9940374785450195e-06, "loss": 0.8193, "step": 57860 }, { "epoch": 0.78, "learning_rate": 5.990619736029635e-06, "loss": 0.9695, "step": 57865 }, { "epoch": 0.78, "learning_rate": 5.9872028355347e-06, "loss": 1.1398, "step": 57870 }, { "epoch": 0.78, "learning_rate": 5.983786777211556e-06, "loss": 1.4121, "step": 57875 }, { "epoch": 0.78, "learning_rate": 5.980371561211529e-06, "loss": 0.5342, "step": 57880 }, { "epoch": 0.78, "learning_rate": 5.976957187685891e-06, "loss": 0.942, "step": 57885 }, { "epoch": 0.78, "learning_rate": 5.973543656785871e-06, "loss": 0.9499, "step": 57890 }, { "epoch": 0.78, "learning_rate": 5.970130968662696e-06, "loss": 0.6861, "step": 57895 }, { "epoch": 0.78, "learning_rate": 5.966719123467501e-06, "loss": 0.7317, "step": 57900 }, { "epoch": 0.78, "learning_rate": 5.963308121351438e-06, "loss": 0.8465, "step": 57905 }, { "epoch": 0.78, "learning_rate": 5.9598979624655855e-06, "loss": 0.6623, "step": 57910 }, { "epoch": 0.78, "learning_rate": 5.956488646960992e-06, "loss": 1.1603, "step": 57915 }, { "epoch": 0.78, "learning_rate": 5.953080174988684e-06, "loss": 0.3265, "step": 57920 }, { "epoch": 0.78, "learning_rate": 5.949672546699639e-06, "loss": 1.1444, "step": 57925 }, { "epoch": 0.78, "learning_rate": 5.946265762244793e-06, "loss": 0.8709, "step": 57930 }, { "epoch": 0.78, "learning_rate": 5.9428598217750455e-06, "loss": 0.8922, "step": 57935 }, { "epoch": 0.78, "learning_rate": 5.939454725441273e-06, "loss": 0.5586, "step": 57940 }, { "epoch": 0.78, "learning_rate": 5.9360504733943e-06, "loss": 0.4325, "step": 57945 }, { "epoch": 0.78, "learning_rate": 5.93264706578491e-06, "loss": 0.2814, "step": 57950 }, { "epoch": 0.78, "learning_rate": 5.929244502763878e-06, "loss": 0.173, "step": 57955 }, { "epoch": 0.78, "learning_rate": 5.925842784481892e-06, "loss": 0.9405, "step": 57960 }, { "epoch": 0.78, "learning_rate": 5.922441911089646e-06, "loss": 1.1663, "step": 57965 }, { "epoch": 0.78, "learning_rate": 5.919041882737797e-06, "loss": 0.4368, "step": 57970 }, { "epoch": 0.78, "learning_rate": 5.915642699576917e-06, "loss": 0.5636, "step": 57975 }, { "epoch": 0.78, "learning_rate": 5.912244361757599e-06, "loss": 1.1202, "step": 57980 }, { "epoch": 0.78, "learning_rate": 5.908846869430354e-06, "loss": 0.4485, "step": 57985 }, { "epoch": 0.78, "learning_rate": 5.90545022274569e-06, "loss": 0.9794, "step": 57990 }, { "epoch": 0.78, "learning_rate": 5.902054421854053e-06, "loss": 0.1449, "step": 57995 }, { "epoch": 0.78, "learning_rate": 5.8986594669058535e-06, "loss": 0.5894, "step": 58000 }, { "epoch": 0.78, "learning_rate": 5.895265358051496e-06, "loss": 0.4997, "step": 58005 }, { "epoch": 0.78, "learning_rate": 5.891872095441289e-06, "loss": 0.8009, "step": 58010 }, { "epoch": 0.78, "learning_rate": 5.888479679225562e-06, "loss": 0.6906, "step": 58015 }, { "epoch": 0.78, "learning_rate": 5.885088109554571e-06, "loss": 1.0438, "step": 58020 }, { "epoch": 0.78, "learning_rate": 5.881697386578542e-06, "loss": 0.9367, "step": 58025 }, { "epoch": 0.78, "learning_rate": 5.8783075104476786e-06, "loss": 0.4223, "step": 58030 }, { "epoch": 0.78, "learning_rate": 5.874918481312131e-06, "loss": 0.5586, "step": 58035 }, { "epoch": 0.78, "learning_rate": 5.871530299322014e-06, "loss": 0.8065, "step": 58040 }, { "epoch": 0.78, "learning_rate": 5.868142964627402e-06, "loss": 1.4229, "step": 58045 }, { "epoch": 0.78, "learning_rate": 5.86475647737835e-06, "loss": 0.6052, "step": 58050 }, { "epoch": 0.78, "learning_rate": 5.8613708377248555e-06, "loss": 1.3727, "step": 58055 }, { "epoch": 0.78, "learning_rate": 5.857986045816877e-06, "loss": 0.3939, "step": 58060 }, { "epoch": 0.78, "learning_rate": 5.8546021018043685e-06, "loss": 0.7962, "step": 58065 }, { "epoch": 0.78, "learning_rate": 5.851219005837189e-06, "loss": 0.9182, "step": 58070 }, { "epoch": 0.78, "learning_rate": 5.847836758065209e-06, "loss": 1.0138, "step": 58075 }, { "epoch": 0.78, "learning_rate": 5.844455358638262e-06, "loss": 0.5311, "step": 58080 }, { "epoch": 0.78, "learning_rate": 5.841074807706096e-06, "loss": 0.1025, "step": 58085 }, { "epoch": 0.78, "learning_rate": 5.837695105418473e-06, "loss": 1.0253, "step": 58090 }, { "epoch": 0.78, "learning_rate": 5.8343162519250895e-06, "loss": 0.1849, "step": 58095 }, { "epoch": 0.78, "learning_rate": 5.830938247375608e-06, "loss": 0.4739, "step": 58100 }, { "epoch": 0.78, "learning_rate": 5.827561091919667e-06, "loss": 0.747, "step": 58105 }, { "epoch": 0.78, "learning_rate": 5.824184785706848e-06, "loss": 0.6069, "step": 58110 }, { "epoch": 0.78, "learning_rate": 5.8208093288867226e-06, "loss": 0.6861, "step": 58115 }, { "epoch": 0.78, "learning_rate": 5.817434721608781e-06, "loss": 1.0656, "step": 58120 }, { "epoch": 0.78, "learning_rate": 5.8140609640225194e-06, "loss": 0.5605, "step": 58125 }, { "epoch": 0.78, "learning_rate": 5.8106880562773745e-06, "loss": 0.835, "step": 58130 }, { "epoch": 0.78, "learning_rate": 5.807315998522739e-06, "loss": 0.2238, "step": 58135 }, { "epoch": 0.78, "learning_rate": 5.803944790907994e-06, "loss": 0.4106, "step": 58140 }, { "epoch": 0.78, "learning_rate": 5.800574433582459e-06, "loss": 0.7428, "step": 58145 }, { "epoch": 0.78, "learning_rate": 5.797204926695426e-06, "loss": 0.6909, "step": 58150 }, { "epoch": 0.78, "learning_rate": 5.793836270396139e-06, "loss": 0.5883, "step": 58155 }, { "epoch": 0.78, "learning_rate": 5.790468464833828e-06, "loss": 0.6244, "step": 58160 }, { "epoch": 0.78, "learning_rate": 5.787101510157661e-06, "loss": 0.5523, "step": 58165 }, { "epoch": 0.78, "learning_rate": 5.7837354065167715e-06, "loss": 1.0081, "step": 58170 }, { "epoch": 0.78, "learning_rate": 5.78037015406028e-06, "loss": 1.5569, "step": 58175 }, { "epoch": 0.78, "learning_rate": 5.7770057529372255e-06, "loss": 1.3552, "step": 58180 }, { "epoch": 0.78, "learning_rate": 5.7736422032966445e-06, "loss": 0.7583, "step": 58185 }, { "epoch": 0.78, "learning_rate": 5.770279505287543e-06, "loss": 0.4451, "step": 58190 }, { "epoch": 0.78, "learning_rate": 5.76691765905884e-06, "loss": 1.1744, "step": 58195 }, { "epoch": 0.78, "learning_rate": 5.763556664759473e-06, "loss": 0.9015, "step": 58200 }, { "epoch": 0.78, "learning_rate": 5.760196522538311e-06, "loss": 1.4546, "step": 58205 }, { "epoch": 0.78, "learning_rate": 5.75683723254418e-06, "loss": 0.762, "step": 58210 }, { "epoch": 0.78, "learning_rate": 5.7534787949258985e-06, "loss": 0.4951, "step": 58215 }, { "epoch": 0.78, "learning_rate": 5.75012120983221e-06, "loss": 1.6202, "step": 58220 }, { "epoch": 0.78, "learning_rate": 5.746764477411862e-06, "loss": 0.7279, "step": 58225 }, { "epoch": 0.78, "learning_rate": 5.743408597813513e-06, "loss": 0.7851, "step": 58230 }, { "epoch": 0.78, "learning_rate": 5.74005357118583e-06, "loss": 0.4069, "step": 58235 }, { "epoch": 0.78, "learning_rate": 5.736699397677422e-06, "loss": 1.2678, "step": 58240 }, { "epoch": 0.78, "learning_rate": 5.733346077436852e-06, "loss": 0.8574, "step": 58245 }, { "epoch": 0.78, "learning_rate": 5.729993610612669e-06, "loss": 0.9577, "step": 58250 }, { "epoch": 0.78, "learning_rate": 5.726641997353366e-06, "loss": 0.6344, "step": 58255 }, { "epoch": 0.78, "learning_rate": 5.723291237807399e-06, "loss": 0.6211, "step": 58260 }, { "epoch": 0.78, "learning_rate": 5.719941332123185e-06, "loss": 0.2884, "step": 58265 }, { "epoch": 0.78, "learning_rate": 5.7165922804491235e-06, "loss": 0.9982, "step": 58270 }, { "epoch": 0.78, "learning_rate": 5.71324408293355e-06, "loss": 0.5956, "step": 58275 }, { "epoch": 0.78, "learning_rate": 5.709896739724771e-06, "loss": 0.4649, "step": 58280 }, { "epoch": 0.78, "learning_rate": 5.706550250971066e-06, "loss": 0.4678, "step": 58285 }, { "epoch": 0.78, "learning_rate": 5.703204616820662e-06, "loss": 0.7745, "step": 58290 }, { "epoch": 0.78, "learning_rate": 5.6998598374217506e-06, "loss": 1.3299, "step": 58295 }, { "epoch": 0.78, "learning_rate": 5.696515912922504e-06, "loss": 0.5097, "step": 58300 }, { "epoch": 0.78, "learning_rate": 5.693172843471017e-06, "loss": 0.9237, "step": 58305 }, { "epoch": 0.78, "learning_rate": 5.68983062921539e-06, "loss": 0.9778, "step": 58310 }, { "epoch": 0.78, "learning_rate": 5.686489270303663e-06, "loss": 0.6557, "step": 58315 }, { "epoch": 0.78, "learning_rate": 5.6831487668838305e-06, "loss": 0.6003, "step": 58320 }, { "epoch": 0.78, "learning_rate": 5.679809119103874e-06, "loss": 0.54, "step": 58325 }, { "epoch": 0.78, "learning_rate": 5.676470327111713e-06, "loss": 0.4663, "step": 58330 }, { "epoch": 0.78, "learning_rate": 5.673132391055256e-06, "loss": 0.636, "step": 58335 }, { "epoch": 0.78, "learning_rate": 5.669795311082332e-06, "loss": 0.6142, "step": 58340 }, { "epoch": 0.78, "learning_rate": 5.666459087340775e-06, "loss": 0.1835, "step": 58345 }, { "epoch": 0.78, "learning_rate": 5.663123719978361e-06, "loss": 1.0698, "step": 58350 }, { "epoch": 0.78, "learning_rate": 5.659789209142819e-06, "loss": 0.6713, "step": 58355 }, { "epoch": 0.78, "learning_rate": 5.656455554981862e-06, "loss": 0.8112, "step": 58360 }, { "epoch": 0.78, "learning_rate": 5.653122757643156e-06, "loss": 0.3707, "step": 58365 }, { "epoch": 0.78, "learning_rate": 5.64979081727432e-06, "loss": 0.9645, "step": 58370 }, { "epoch": 0.78, "learning_rate": 5.646459734022938e-06, "loss": 0.4152, "step": 58375 }, { "epoch": 0.78, "learning_rate": 5.643129508036577e-06, "loss": 0.7263, "step": 58380 }, { "epoch": 0.78, "learning_rate": 5.639800139462734e-06, "loss": 0.8275, "step": 58385 }, { "epoch": 0.78, "learning_rate": 5.636471628448886e-06, "loss": 0.3264, "step": 58390 }, { "epoch": 0.78, "learning_rate": 5.633143975142477e-06, "loss": 0.1429, "step": 58395 }, { "epoch": 0.78, "learning_rate": 5.629817179690902e-06, "loss": 0.8451, "step": 58400 }, { "epoch": 0.78, "learning_rate": 5.626491242241513e-06, "loss": 0.6239, "step": 58405 }, { "epoch": 0.78, "learning_rate": 5.623166162941651e-06, "loss": 0.6851, "step": 58410 }, { "epoch": 0.78, "learning_rate": 5.619841941938578e-06, "loss": 0.4513, "step": 58415 }, { "epoch": 0.78, "learning_rate": 5.616518579379556e-06, "loss": 0.9208, "step": 58420 }, { "epoch": 0.78, "learning_rate": 5.6131960754117895e-06, "loss": 0.3303, "step": 58425 }, { "epoch": 0.78, "learning_rate": 5.609874430182441e-06, "loss": 0.8528, "step": 58430 }, { "epoch": 0.78, "learning_rate": 5.606553643838655e-06, "loss": 0.4562, "step": 58435 }, { "epoch": 0.78, "learning_rate": 5.603233716527514e-06, "loss": 0.6347, "step": 58440 }, { "epoch": 0.78, "learning_rate": 5.599914648396093e-06, "loss": 0.3655, "step": 58445 }, { "epoch": 0.78, "learning_rate": 5.596596439591387e-06, "loss": 0.3933, "step": 58450 }, { "epoch": 0.78, "learning_rate": 5.593279090260389e-06, "loss": 0.4167, "step": 58455 }, { "epoch": 0.78, "learning_rate": 5.589962600550042e-06, "loss": 0.1579, "step": 58460 }, { "epoch": 0.78, "learning_rate": 5.586646970607237e-06, "loss": 0.9341, "step": 58465 }, { "epoch": 0.78, "learning_rate": 5.583332200578858e-06, "loss": 0.4465, "step": 58470 }, { "epoch": 0.78, "learning_rate": 5.580018290611725e-06, "loss": 0.5085, "step": 58475 }, { "epoch": 0.78, "learning_rate": 5.576705240852626e-06, "loss": 0.3117, "step": 58480 }, { "epoch": 0.78, "learning_rate": 5.573393051448306e-06, "loss": 0.2342, "step": 58485 }, { "epoch": 0.78, "learning_rate": 5.570081722545489e-06, "loss": 0.474, "step": 58490 }, { "epoch": 0.78, "learning_rate": 5.566771254290851e-06, "loss": 0.7955, "step": 58495 }, { "epoch": 0.78, "learning_rate": 5.563461646831017e-06, "loss": 1.0314, "step": 58500 }, { "epoch": 0.78, "learning_rate": 5.560152900312601e-06, "loss": 0.4916, "step": 58505 }, { "epoch": 0.78, "learning_rate": 5.556845014882156e-06, "loss": 1.0216, "step": 58510 }, { "epoch": 0.78, "learning_rate": 5.5535379906862e-06, "loss": 0.5289, "step": 58515 }, { "epoch": 0.78, "learning_rate": 5.550231827871239e-06, "loss": 0.3611, "step": 58520 }, { "epoch": 0.78, "learning_rate": 5.546926526583687e-06, "loss": 0.6433, "step": 58525 }, { "epoch": 0.78, "learning_rate": 5.543622086969977e-06, "loss": 0.9996, "step": 58530 }, { "epoch": 0.78, "learning_rate": 5.54031850917647e-06, "loss": 0.1805, "step": 58535 }, { "epoch": 0.78, "learning_rate": 5.537015793349496e-06, "loss": 0.6557, "step": 58540 }, { "epoch": 0.78, "learning_rate": 5.533713939635357e-06, "loss": 0.1947, "step": 58545 }, { "epoch": 0.78, "learning_rate": 5.5304129481802965e-06, "loss": 1.2106, "step": 58550 }, { "epoch": 0.78, "learning_rate": 5.527112819130553e-06, "loss": 0.6812, "step": 58555 }, { "epoch": 0.78, "learning_rate": 5.523813552632278e-06, "loss": 0.55, "step": 58560 }, { "epoch": 0.78, "learning_rate": 5.520515148831634e-06, "loss": 1.4284, "step": 58565 }, { "epoch": 0.78, "learning_rate": 5.517217607874714e-06, "loss": 0.7962, "step": 58570 }, { "epoch": 0.78, "learning_rate": 5.513920929907579e-06, "loss": 0.651, "step": 58575 }, { "epoch": 0.78, "learning_rate": 5.51062511507627e-06, "loss": 0.7578, "step": 58580 }, { "epoch": 0.78, "learning_rate": 5.507330163526764e-06, "loss": 0.6582, "step": 58585 }, { "epoch": 0.79, "learning_rate": 5.504036075405014e-06, "loss": 0.8074, "step": 58590 }, { "epoch": 0.79, "learning_rate": 5.500742850856921e-06, "loss": 0.7479, "step": 58595 }, { "epoch": 0.79, "learning_rate": 5.497450490028377e-06, "loss": 0.7542, "step": 58600 }, { "epoch": 0.79, "learning_rate": 5.49415899306521e-06, "loss": 0.7507, "step": 58605 }, { "epoch": 0.79, "learning_rate": 5.490868360113205e-06, "loss": 0.7127, "step": 58610 }, { "epoch": 0.79, "learning_rate": 5.487578591318138e-06, "loss": 0.2351, "step": 58615 }, { "epoch": 0.79, "learning_rate": 5.484289686825725e-06, "loss": 0.651, "step": 58620 }, { "epoch": 0.79, "learning_rate": 5.4810016467816335e-06, "loss": 0.7657, "step": 58625 }, { "epoch": 0.79, "learning_rate": 5.477714471331535e-06, "loss": 0.7125, "step": 58630 }, { "epoch": 0.79, "learning_rate": 5.474428160621003e-06, "loss": 1.2777, "step": 58635 }, { "epoch": 0.79, "learning_rate": 5.47114271479563e-06, "loss": 0.8908, "step": 58640 }, { "epoch": 0.79, "learning_rate": 5.467858134000931e-06, "loss": 0.6402, "step": 58645 }, { "epoch": 0.79, "learning_rate": 5.464574418382396e-06, "loss": 0.488, "step": 58650 }, { "epoch": 0.79, "learning_rate": 5.461291568085489e-06, "loss": 0.6521, "step": 58655 }, { "epoch": 0.79, "learning_rate": 5.458009583255613e-06, "loss": 0.9655, "step": 58660 }, { "epoch": 0.79, "learning_rate": 5.45472846403815e-06, "loss": 0.8918, "step": 58665 }, { "epoch": 0.79, "learning_rate": 5.451448210578428e-06, "loss": 0.7362, "step": 58670 }, { "epoch": 0.79, "learning_rate": 5.448168823021757e-06, "loss": 0.5151, "step": 58675 }, { "epoch": 0.79, "learning_rate": 5.444890301513391e-06, "loss": 0.3837, "step": 58680 }, { "epoch": 0.79, "learning_rate": 5.441612646198549e-06, "loss": 0.8223, "step": 58685 }, { "epoch": 0.79, "learning_rate": 5.438335857222427e-06, "loss": 0.444, "step": 58690 }, { "epoch": 0.79, "learning_rate": 5.435059934730161e-06, "loss": 0.4647, "step": 58695 }, { "epoch": 0.79, "learning_rate": 5.4317848788668525e-06, "loss": 0.2433, "step": 58700 }, { "epoch": 0.79, "learning_rate": 5.428510689777583e-06, "loss": 0.539, "step": 58705 }, { "epoch": 0.79, "learning_rate": 5.42523736760738e-06, "loss": 0.7863, "step": 58710 }, { "epoch": 0.79, "learning_rate": 5.421964912501229e-06, "loss": 1.1696, "step": 58715 }, { "epoch": 0.79, "learning_rate": 5.418693324604082e-06, "loss": 0.1411, "step": 58720 }, { "epoch": 0.79, "learning_rate": 5.415422604060863e-06, "loss": 0.45, "step": 58725 }, { "epoch": 0.79, "learning_rate": 5.4121527510164475e-06, "loss": 0.5735, "step": 58730 }, { "epoch": 0.79, "learning_rate": 5.40888376561566e-06, "loss": 1.4286, "step": 58735 }, { "epoch": 0.79, "learning_rate": 5.405615648003326e-06, "loss": 0.6324, "step": 58740 }, { "epoch": 0.79, "learning_rate": 5.402348398324178e-06, "loss": 0.2228, "step": 58745 }, { "epoch": 0.79, "learning_rate": 5.399082016722956e-06, "loss": 0.4978, "step": 58750 }, { "epoch": 0.79, "learning_rate": 5.395816503344342e-06, "loss": 1.3599, "step": 58755 }, { "epoch": 0.79, "learning_rate": 5.392551858332976e-06, "loss": 0.9187, "step": 58760 }, { "epoch": 0.79, "learning_rate": 5.389288081833472e-06, "loss": 0.5571, "step": 58765 }, { "epoch": 0.79, "learning_rate": 5.386025173990397e-06, "loss": 1.2605, "step": 58770 }, { "epoch": 0.79, "learning_rate": 5.3827631349482846e-06, "loss": 0.8601, "step": 58775 }, { "epoch": 0.79, "learning_rate": 5.379501964851616e-06, "loss": 0.6309, "step": 58780 }, { "epoch": 0.79, "learning_rate": 5.376241663844858e-06, "loss": 0.7757, "step": 58785 }, { "epoch": 0.79, "learning_rate": 5.372982232072418e-06, "loss": 0.7924, "step": 58790 }, { "epoch": 0.79, "learning_rate": 5.36972366967867e-06, "loss": 1.1979, "step": 58795 }, { "epoch": 0.79, "learning_rate": 5.366465976807961e-06, "loss": 0.544, "step": 58800 }, { "epoch": 0.79, "learning_rate": 5.363209153604587e-06, "loss": 0.2252, "step": 58805 }, { "epoch": 0.79, "learning_rate": 5.3599532002128e-06, "loss": 0.4382, "step": 58810 }, { "epoch": 0.79, "learning_rate": 5.356698116776837e-06, "loss": 0.3549, "step": 58815 }, { "epoch": 0.79, "learning_rate": 5.353443903440877e-06, "loss": 0.4072, "step": 58820 }, { "epoch": 0.79, "learning_rate": 5.350190560349061e-06, "loss": 0.7873, "step": 58825 }, { "epoch": 0.79, "learning_rate": 5.346938087645492e-06, "loss": 1.0043, "step": 58830 }, { "epoch": 0.79, "learning_rate": 5.343686485474253e-06, "loss": 0.7123, "step": 58835 }, { "epoch": 0.79, "learning_rate": 5.340435753979364e-06, "loss": 0.7624, "step": 58840 }, { "epoch": 0.79, "learning_rate": 5.337185893304811e-06, "loss": 0.9484, "step": 58845 }, { "epoch": 0.79, "learning_rate": 5.333936903594567e-06, "loss": 1.0781, "step": 58850 }, { "epoch": 0.79, "learning_rate": 5.330688784992519e-06, "loss": 1.0172, "step": 58855 }, { "epoch": 0.79, "learning_rate": 5.327441537642558e-06, "loss": 0.5285, "step": 58860 }, { "epoch": 0.79, "learning_rate": 5.324195161688522e-06, "loss": 1.7024, "step": 58865 }, { "epoch": 0.79, "learning_rate": 5.320949657274199e-06, "loss": 0.7552, "step": 58870 }, { "epoch": 0.79, "learning_rate": 5.317705024543359e-06, "loss": 1.115, "step": 58875 }, { "epoch": 0.79, "learning_rate": 5.314461263639719e-06, "loss": 0.611, "step": 58880 }, { "epoch": 0.79, "learning_rate": 5.311218374706964e-06, "loss": 0.4711, "step": 58885 }, { "epoch": 0.79, "learning_rate": 5.307976357888728e-06, "loss": 0.9686, "step": 58890 }, { "epoch": 0.79, "learning_rate": 5.304735213328629e-06, "loss": 1.0178, "step": 58895 }, { "epoch": 0.79, "learning_rate": 5.301494941170227e-06, "loss": 1.2164, "step": 58900 }, { "epoch": 0.79, "learning_rate": 5.2982555415570454e-06, "loss": 0.4921, "step": 58905 }, { "epoch": 0.79, "learning_rate": 5.295017014632583e-06, "loss": 0.4856, "step": 58910 }, { "epoch": 0.79, "learning_rate": 5.291779360540289e-06, "loss": 0.6993, "step": 58915 }, { "epoch": 0.79, "learning_rate": 5.288542579423564e-06, "loss": 0.22, "step": 58920 }, { "epoch": 0.79, "learning_rate": 5.285306671425797e-06, "loss": 0.3862, "step": 58925 }, { "epoch": 0.79, "learning_rate": 5.282071636690314e-06, "loss": 0.619, "step": 58930 }, { "epoch": 0.79, "learning_rate": 5.27883747536041e-06, "loss": 0.5746, "step": 58935 }, { "epoch": 0.79, "learning_rate": 5.275604187579339e-06, "loss": 0.5351, "step": 58940 }, { "epoch": 0.79, "learning_rate": 5.272371773490331e-06, "loss": 0.8069, "step": 58945 }, { "epoch": 0.79, "learning_rate": 5.269140233236561e-06, "loss": 1.4967, "step": 58950 }, { "epoch": 0.79, "learning_rate": 5.265909566961158e-06, "loss": 0.6224, "step": 58955 }, { "epoch": 0.79, "learning_rate": 5.262679774807252e-06, "loss": 0.9997, "step": 58960 }, { "epoch": 0.79, "learning_rate": 5.259450856917874e-06, "loss": 0.8404, "step": 58965 }, { "epoch": 0.79, "learning_rate": 5.256222813436071e-06, "loss": 0.4523, "step": 58970 }, { "epoch": 0.79, "learning_rate": 5.252995644504821e-06, "loss": 1.3422, "step": 58975 }, { "epoch": 0.79, "learning_rate": 5.249769350267067e-06, "loss": 1.1812, "step": 58980 }, { "epoch": 0.79, "learning_rate": 5.2465439308657325e-06, "loss": 0.8234, "step": 58985 }, { "epoch": 0.79, "learning_rate": 5.243319386443677e-06, "loss": 0.5768, "step": 58990 }, { "epoch": 0.79, "learning_rate": 5.240095717143731e-06, "loss": 0.3671, "step": 58995 }, { "epoch": 0.79, "learning_rate": 5.236872923108685e-06, "loss": 0.5413, "step": 59000 }, { "epoch": 0.79, "learning_rate": 5.233651004481302e-06, "loss": 0.6466, "step": 59005 }, { "epoch": 0.79, "learning_rate": 5.23042996140429e-06, "loss": 0.5294, "step": 59010 }, { "epoch": 0.79, "learning_rate": 5.2272097940203214e-06, "loss": 1.1176, "step": 59015 }, { "epoch": 0.79, "learning_rate": 5.2239905024720455e-06, "loss": 1.3893, "step": 59020 }, { "epoch": 0.79, "learning_rate": 5.220772086902057e-06, "loss": 0.5296, "step": 59025 }, { "epoch": 0.79, "learning_rate": 5.217554547452902e-06, "loss": 0.1989, "step": 59030 }, { "epoch": 0.79, "learning_rate": 5.21433788426712e-06, "loss": 1.2733, "step": 59035 }, { "epoch": 0.79, "learning_rate": 5.211122097487186e-06, "loss": 0.3865, "step": 59040 }, { "epoch": 0.79, "learning_rate": 5.207907187255543e-06, "loss": 0.7094, "step": 59045 }, { "epoch": 0.79, "learning_rate": 5.2046931537145845e-06, "loss": 0.7376, "step": 59050 }, { "epoch": 0.79, "learning_rate": 5.201479997006698e-06, "loss": 0.5101, "step": 59055 }, { "epoch": 0.79, "learning_rate": 5.198267717274194e-06, "loss": 1.2842, "step": 59060 }, { "epoch": 0.79, "learning_rate": 5.19505631465936e-06, "loss": 0.5871, "step": 59065 }, { "epoch": 0.79, "learning_rate": 5.191845789304467e-06, "loss": 0.6117, "step": 59070 }, { "epoch": 0.79, "learning_rate": 5.188636141351691e-06, "loss": 0.8001, "step": 59075 }, { "epoch": 0.79, "learning_rate": 5.18542737094323e-06, "loss": 0.8292, "step": 59080 }, { "epoch": 0.79, "learning_rate": 5.182219478221207e-06, "loss": 0.8131, "step": 59085 }, { "epoch": 0.79, "learning_rate": 5.179012463327709e-06, "loss": 1.2919, "step": 59090 }, { "epoch": 0.79, "learning_rate": 5.175806326404803e-06, "loss": 0.6179, "step": 59095 }, { "epoch": 0.79, "learning_rate": 5.172601067594501e-06, "loss": 0.4437, "step": 59100 }, { "epoch": 0.79, "learning_rate": 5.1693966870387775e-06, "loss": 0.521, "step": 59105 }, { "epoch": 0.79, "learning_rate": 5.1661931848795645e-06, "loss": 1.2514, "step": 59110 }, { "epoch": 0.79, "learning_rate": 5.162990561258768e-06, "loss": 0.9056, "step": 59115 }, { "epoch": 0.79, "learning_rate": 5.159788816318262e-06, "loss": 1.0815, "step": 59120 }, { "epoch": 0.79, "learning_rate": 5.15658795019984e-06, "loss": 0.5163, "step": 59125 }, { "epoch": 0.79, "learning_rate": 5.153387963045305e-06, "loss": 0.8517, "step": 59130 }, { "epoch": 0.79, "learning_rate": 5.150188854996396e-06, "loss": 0.5882, "step": 59135 }, { "epoch": 0.79, "learning_rate": 5.146990626194806e-06, "loss": 1.0564, "step": 59140 }, { "epoch": 0.79, "learning_rate": 5.143793276782216e-06, "loss": 1.0564, "step": 59145 }, { "epoch": 0.79, "learning_rate": 5.140596806900247e-06, "loss": 0.5627, "step": 59150 }, { "epoch": 0.79, "learning_rate": 5.137401216690488e-06, "loss": 0.6967, "step": 59155 }, { "epoch": 0.79, "learning_rate": 5.134206506294478e-06, "loss": 0.4429, "step": 59160 }, { "epoch": 0.79, "learning_rate": 5.131012675853739e-06, "loss": 0.4289, "step": 59165 }, { "epoch": 0.79, "learning_rate": 5.127819725509739e-06, "loss": 0.7368, "step": 59170 }, { "epoch": 0.79, "learning_rate": 5.124627655403902e-06, "loss": 0.6692, "step": 59175 }, { "epoch": 0.79, "learning_rate": 5.121436465677637e-06, "loss": 1.074, "step": 59180 }, { "epoch": 0.79, "learning_rate": 5.118246156472276e-06, "loss": 0.673, "step": 59185 }, { "epoch": 0.79, "learning_rate": 5.115056727929152e-06, "loss": 0.7984, "step": 59190 }, { "epoch": 0.79, "learning_rate": 5.111868180189533e-06, "loss": 0.9882, "step": 59195 }, { "epoch": 0.79, "learning_rate": 5.108680513394648e-06, "loss": 1.2076, "step": 59200 }, { "epoch": 0.79, "learning_rate": 5.105493727685712e-06, "loss": 0.5599, "step": 59205 }, { "epoch": 0.79, "learning_rate": 5.102307823203875e-06, "loss": 0.315, "step": 59210 }, { "epoch": 0.79, "learning_rate": 5.099122800090256e-06, "loss": 1.1234, "step": 59215 }, { "epoch": 0.79, "learning_rate": 5.095938658485927e-06, "loss": 0.6265, "step": 59220 }, { "epoch": 0.79, "learning_rate": 5.09275539853194e-06, "loss": 0.5933, "step": 59225 }, { "epoch": 0.79, "learning_rate": 5.089573020369309e-06, "loss": 0.8318, "step": 59230 }, { "epoch": 0.79, "learning_rate": 5.086391524138973e-06, "loss": 1.0105, "step": 59235 }, { "epoch": 0.79, "learning_rate": 5.0832109099818725e-06, "loss": 0.5497, "step": 59240 }, { "epoch": 0.79, "learning_rate": 5.0800311780388905e-06, "loss": 0.6519, "step": 59245 }, { "epoch": 0.79, "learning_rate": 5.076852328450862e-06, "loss": 0.9276, "step": 59250 }, { "epoch": 0.79, "learning_rate": 5.07367436135861e-06, "loss": 1.1203, "step": 59255 }, { "epoch": 0.79, "learning_rate": 5.070497276902897e-06, "loss": 0.7592, "step": 59260 }, { "epoch": 0.79, "learning_rate": 5.0673210752244486e-06, "loss": 0.7807, "step": 59265 }, { "epoch": 0.79, "learning_rate": 5.06414575646395e-06, "loss": 0.4621, "step": 59270 }, { "epoch": 0.79, "learning_rate": 5.0609713207620676e-06, "loss": 0.5866, "step": 59275 }, { "epoch": 0.79, "learning_rate": 5.057797768259401e-06, "loss": 0.5944, "step": 59280 }, { "epoch": 0.79, "learning_rate": 5.054625099096519e-06, "loss": 0.8169, "step": 59285 }, { "epoch": 0.79, "learning_rate": 5.051453313413976e-06, "loss": 0.3737, "step": 59290 }, { "epoch": 0.79, "learning_rate": 5.04828241135224e-06, "loss": 0.6629, "step": 59295 }, { "epoch": 0.79, "learning_rate": 5.045112393051782e-06, "loss": 0.7445, "step": 59300 }, { "epoch": 0.79, "learning_rate": 5.041943258653015e-06, "loss": 0.5365, "step": 59305 }, { "epoch": 0.79, "learning_rate": 5.0387750082963064e-06, "loss": 0.9823, "step": 59310 }, { "epoch": 0.79, "learning_rate": 5.035607642122009e-06, "loss": 1.1653, "step": 59315 }, { "epoch": 0.79, "learning_rate": 5.032441160270415e-06, "loss": 0.2656, "step": 59320 }, { "epoch": 0.79, "learning_rate": 5.029275562881783e-06, "loss": 0.3977, "step": 59325 }, { "epoch": 0.79, "learning_rate": 5.026110850096327e-06, "loss": 0.7943, "step": 59330 }, { "epoch": 0.8, "learning_rate": 5.022947022054242e-06, "loss": 0.4981, "step": 59335 }, { "epoch": 0.8, "learning_rate": 5.019784078895659e-06, "loss": 0.7412, "step": 59340 }, { "epoch": 0.8, "learning_rate": 5.016622020760678e-06, "loss": 0.6469, "step": 59345 }, { "epoch": 0.8, "learning_rate": 5.013460847789375e-06, "loss": 1.0768, "step": 59350 }, { "epoch": 0.8, "learning_rate": 5.0103005601217665e-06, "loss": 0.9965, "step": 59355 }, { "epoch": 0.8, "learning_rate": 5.007141157897832e-06, "loss": 0.9067, "step": 59360 }, { "epoch": 0.8, "learning_rate": 5.003982641257529e-06, "loss": 0.672, "step": 59365 }, { "epoch": 0.8, "learning_rate": 5.000825010340757e-06, "loss": 0.524, "step": 59370 }, { "epoch": 0.8, "learning_rate": 4.997668265287386e-06, "loss": 0.4312, "step": 59375 }, { "epoch": 0.8, "learning_rate": 4.994512406237234e-06, "loss": 0.7877, "step": 59380 }, { "epoch": 0.8, "learning_rate": 4.991357433330107e-06, "loss": 0.9725, "step": 59385 }, { "epoch": 0.8, "learning_rate": 4.9882033467057445e-06, "loss": 0.842, "step": 59390 }, { "epoch": 0.8, "learning_rate": 4.98505014650385e-06, "loss": 0.4841, "step": 59395 }, { "epoch": 0.8, "learning_rate": 4.981897832864116e-06, "loss": 1.0727, "step": 59400 }, { "epoch": 0.8, "learning_rate": 4.978746405926149e-06, "loss": 1.1367, "step": 59405 }, { "epoch": 0.8, "learning_rate": 4.975595865829558e-06, "loss": 0.7388, "step": 59410 }, { "epoch": 0.8, "learning_rate": 4.972446212713894e-06, "loss": 0.4993, "step": 59415 }, { "epoch": 0.8, "learning_rate": 4.969297446718657e-06, "loss": 0.8217, "step": 59420 }, { "epoch": 0.8, "learning_rate": 4.966149567983341e-06, "loss": 0.4087, "step": 59425 }, { "epoch": 0.8, "learning_rate": 4.963002576647374e-06, "loss": 0.5217, "step": 59430 }, { "epoch": 0.8, "learning_rate": 4.959856472850152e-06, "loss": 0.7327, "step": 59435 }, { "epoch": 0.8, "learning_rate": 4.956711256731022e-06, "loss": 0.4449, "step": 59440 }, { "epoch": 0.8, "learning_rate": 4.953566928429318e-06, "loss": 0.3368, "step": 59445 }, { "epoch": 0.8, "learning_rate": 4.9504234880843075e-06, "loss": 0.4847, "step": 59450 }, { "epoch": 0.8, "learning_rate": 4.947280935835227e-06, "loss": 0.8385, "step": 59455 }, { "epoch": 0.8, "learning_rate": 4.944139271821285e-06, "loss": 0.6697, "step": 59460 }, { "epoch": 0.8, "learning_rate": 4.94099849618164e-06, "loss": 0.5195, "step": 59465 }, { "epoch": 0.8, "learning_rate": 4.937858609055401e-06, "loss": 0.3501, "step": 59470 }, { "epoch": 0.8, "learning_rate": 4.9347196105816644e-06, "loss": 0.8626, "step": 59475 }, { "epoch": 0.8, "learning_rate": 4.931581500899466e-06, "loss": 0.6, "step": 59480 }, { "epoch": 0.8, "learning_rate": 4.92844428014781e-06, "loss": 0.4054, "step": 59485 }, { "epoch": 0.8, "learning_rate": 4.925307948465646e-06, "loss": 0.992, "step": 59490 }, { "epoch": 0.8, "learning_rate": 4.92217250599192e-06, "loss": 0.6937, "step": 59495 }, { "epoch": 0.8, "learning_rate": 4.9190379528655045e-06, "loss": 0.6422, "step": 59500 }, { "epoch": 0.8, "learning_rate": 4.91590428922524e-06, "loss": 0.1831, "step": 59505 }, { "epoch": 0.8, "learning_rate": 4.912771515209949e-06, "loss": 0.3705, "step": 59510 }, { "epoch": 0.8, "learning_rate": 4.909639630958377e-06, "loss": 0.7477, "step": 59515 }, { "epoch": 0.8, "learning_rate": 4.906508636609264e-06, "loss": 0.6554, "step": 59520 }, { "epoch": 0.8, "learning_rate": 4.903378532301295e-06, "loss": 0.1455, "step": 59525 }, { "epoch": 0.8, "learning_rate": 4.900249318173109e-06, "loss": 0.398, "step": 59530 }, { "epoch": 0.8, "learning_rate": 4.89712099436333e-06, "loss": 0.5328, "step": 59535 }, { "epoch": 0.8, "learning_rate": 4.893993561010518e-06, "loss": 0.6901, "step": 59540 }, { "epoch": 0.8, "learning_rate": 4.890867018253201e-06, "loss": 0.3923, "step": 59545 }, { "epoch": 0.8, "learning_rate": 4.8877413662298756e-06, "loss": 0.3723, "step": 59550 }, { "epoch": 0.8, "learning_rate": 4.88461660507899e-06, "loss": 0.4494, "step": 59555 }, { "epoch": 0.8, "learning_rate": 4.881492734938955e-06, "loss": 0.8779, "step": 59560 }, { "epoch": 0.8, "learning_rate": 4.878369755948137e-06, "loss": 0.537, "step": 59565 }, { "epoch": 0.8, "learning_rate": 4.875247668244878e-06, "loss": 0.6709, "step": 59570 }, { "epoch": 0.8, "learning_rate": 4.872126471967467e-06, "loss": 0.7224, "step": 59575 }, { "epoch": 0.8, "learning_rate": 4.8690061672541475e-06, "loss": 0.7504, "step": 59580 }, { "epoch": 0.8, "learning_rate": 4.865886754243154e-06, "loss": 0.2869, "step": 59585 }, { "epoch": 0.8, "learning_rate": 4.8627682330726455e-06, "loss": 0.9466, "step": 59590 }, { "epoch": 0.8, "learning_rate": 4.859650603880763e-06, "loss": 0.4419, "step": 59595 }, { "epoch": 0.8, "learning_rate": 4.856533866805593e-06, "loss": 0.9903, "step": 59600 }, { "epoch": 0.8, "learning_rate": 4.8534180219852035e-06, "loss": 0.2412, "step": 59605 }, { "epoch": 0.8, "learning_rate": 4.850303069557608e-06, "loss": 0.837, "step": 59610 }, { "epoch": 0.8, "learning_rate": 4.8471890096607714e-06, "loss": 0.91, "step": 59615 }, { "epoch": 0.8, "learning_rate": 4.844075842432655e-06, "loss": 0.3156, "step": 59620 }, { "epoch": 0.8, "learning_rate": 4.840963568011128e-06, "loss": 0.2645, "step": 59625 }, { "epoch": 0.8, "learning_rate": 4.837852186534069e-06, "loss": 0.4596, "step": 59630 }, { "epoch": 0.8, "learning_rate": 4.834741698139289e-06, "loss": 0.5941, "step": 59635 }, { "epoch": 0.8, "learning_rate": 4.831632102964564e-06, "loss": 0.9772, "step": 59640 }, { "epoch": 0.8, "learning_rate": 4.828523401147645e-06, "loss": 0.4172, "step": 59645 }, { "epoch": 0.8, "learning_rate": 4.825415592826222e-06, "loss": 0.6673, "step": 59650 }, { "epoch": 0.8, "learning_rate": 4.822308678137952e-06, "loss": 1.0629, "step": 59655 }, { "epoch": 0.8, "learning_rate": 4.819202657220468e-06, "loss": 0.6045, "step": 59660 }, { "epoch": 0.8, "learning_rate": 4.8160975302113445e-06, "loss": 0.7594, "step": 59665 }, { "epoch": 0.8, "learning_rate": 4.812993297248125e-06, "loss": 0.2678, "step": 59670 }, { "epoch": 0.8, "learning_rate": 4.809889958468303e-06, "loss": 0.6953, "step": 59675 }, { "epoch": 0.8, "learning_rate": 4.8067875140093535e-06, "loss": 0.8074, "step": 59680 }, { "epoch": 0.8, "learning_rate": 4.8036859640086945e-06, "loss": 0.5724, "step": 59685 }, { "epoch": 0.8, "learning_rate": 4.800585308603703e-06, "loss": 0.8423, "step": 59690 }, { "epoch": 0.8, "learning_rate": 4.7974855479317324e-06, "loss": 0.7296, "step": 59695 }, { "epoch": 0.8, "learning_rate": 4.794386682130084e-06, "loss": 0.8933, "step": 59700 }, { "epoch": 0.8, "learning_rate": 4.7912887113360175e-06, "loss": 1.026, "step": 59705 }, { "epoch": 0.8, "learning_rate": 4.7881916356867536e-06, "loss": 0.4512, "step": 59710 }, { "epoch": 0.8, "learning_rate": 4.7850954553194935e-06, "loss": 0.7775, "step": 59715 }, { "epoch": 0.8, "learning_rate": 4.78200017037137e-06, "loss": 0.2986, "step": 59720 }, { "epoch": 0.8, "learning_rate": 4.778905780979487e-06, "loss": 0.5934, "step": 59725 }, { "epoch": 0.8, "learning_rate": 4.7758122872809255e-06, "loss": 0.514, "step": 59730 }, { "epoch": 0.8, "learning_rate": 4.772719689412689e-06, "loss": 0.7282, "step": 59735 }, { "epoch": 0.8, "learning_rate": 4.769627987511785e-06, "loss": 0.5538, "step": 59740 }, { "epoch": 0.8, "learning_rate": 4.76653718171515e-06, "loss": 1.3114, "step": 59745 }, { "epoch": 0.8, "learning_rate": 4.763447272159685e-06, "loss": 0.9757, "step": 59750 }, { "epoch": 0.8, "learning_rate": 4.7603582589822755e-06, "loss": 1.1858, "step": 59755 }, { "epoch": 0.8, "learning_rate": 4.757270142319736e-06, "loss": 0.2836, "step": 59760 }, { "epoch": 0.8, "learning_rate": 4.754182922308853e-06, "loss": 0.2857, "step": 59765 }, { "epoch": 0.8, "learning_rate": 4.751096599086386e-06, "loss": 0.9003, "step": 59770 }, { "epoch": 0.8, "learning_rate": 4.748011172789038e-06, "loss": 0.6913, "step": 59775 }, { "epoch": 0.8, "learning_rate": 4.7449266435534796e-06, "loss": 1.5391, "step": 59780 }, { "epoch": 0.8, "learning_rate": 4.741843011516328e-06, "loss": 0.9121, "step": 59785 }, { "epoch": 0.8, "learning_rate": 4.7387602768141915e-06, "loss": 0.7854, "step": 59790 }, { "epoch": 0.8, "learning_rate": 4.7356784395836104e-06, "loss": 0.3926, "step": 59795 }, { "epoch": 0.8, "learning_rate": 4.7325974999610865e-06, "loss": 1.1096, "step": 59800 }, { "epoch": 0.8, "learning_rate": 4.729517458083107e-06, "loss": 0.8804, "step": 59805 }, { "epoch": 0.8, "learning_rate": 4.726438314086096e-06, "loss": 0.4915, "step": 59810 }, { "epoch": 0.8, "learning_rate": 4.723360068106439e-06, "loss": 0.3864, "step": 59815 }, { "epoch": 0.8, "learning_rate": 4.720282720280486e-06, "loss": 0.9218, "step": 59820 }, { "epoch": 0.8, "learning_rate": 4.717206270744556e-06, "loss": 0.2765, "step": 59825 }, { "epoch": 0.8, "learning_rate": 4.714130719634919e-06, "loss": 0.8059, "step": 59830 }, { "epoch": 0.8, "learning_rate": 4.711056067087796e-06, "loss": 0.4707, "step": 59835 }, { "epoch": 0.8, "learning_rate": 4.7079823132394005e-06, "loss": 0.3086, "step": 59840 }, { "epoch": 0.8, "learning_rate": 4.704909458225859e-06, "loss": 0.3727, "step": 59845 }, { "epoch": 0.8, "learning_rate": 4.701837502183301e-06, "loss": 1.5089, "step": 59850 }, { "epoch": 0.8, "learning_rate": 4.698766445247793e-06, "loss": 0.5352, "step": 59855 }, { "epoch": 0.8, "learning_rate": 4.695696287555363e-06, "loss": 0.6083, "step": 59860 }, { "epoch": 0.8, "learning_rate": 4.692627029242011e-06, "loss": 0.7825, "step": 59865 }, { "epoch": 0.8, "learning_rate": 4.689558670443689e-06, "loss": 0.6353, "step": 59870 }, { "epoch": 0.8, "learning_rate": 4.686491211296301e-06, "loss": 0.3298, "step": 59875 }, { "epoch": 0.8, "learning_rate": 4.683424651935733e-06, "loss": 1.1068, "step": 59880 }, { "epoch": 0.8, "learning_rate": 4.680358992497813e-06, "loss": 0.4121, "step": 59885 }, { "epoch": 0.8, "learning_rate": 4.6772942331183346e-06, "loss": 0.8437, "step": 59890 }, { "epoch": 0.8, "learning_rate": 4.674230373933045e-06, "loss": 1.2995, "step": 59895 }, { "epoch": 0.8, "learning_rate": 4.671167415077665e-06, "loss": 0.5501, "step": 59900 }, { "epoch": 0.8, "learning_rate": 4.668105356687871e-06, "loss": 0.3047, "step": 59905 }, { "epoch": 0.8, "learning_rate": 4.6650441988992845e-06, "loss": 0.3366, "step": 59910 }, { "epoch": 0.8, "learning_rate": 4.6619839418475146e-06, "loss": 0.403, "step": 59915 }, { "epoch": 0.8, "learning_rate": 4.658924585668107e-06, "loss": 0.4797, "step": 59920 }, { "epoch": 0.8, "learning_rate": 4.655866130496575e-06, "loss": 0.694, "step": 59925 }, { "epoch": 0.8, "learning_rate": 4.652808576468393e-06, "loss": 0.8158, "step": 59930 }, { "epoch": 0.8, "learning_rate": 4.649751923719001e-06, "loss": 1.3127, "step": 59935 }, { "epoch": 0.8, "learning_rate": 4.646696172383788e-06, "loss": 1.6739, "step": 59940 }, { "epoch": 0.8, "learning_rate": 4.643641322598108e-06, "loss": 0.9703, "step": 59945 }, { "epoch": 0.8, "learning_rate": 4.640587374497287e-06, "loss": 0.4189, "step": 59950 }, { "epoch": 0.8, "learning_rate": 4.6375343282165805e-06, "loss": 0.5406, "step": 59955 }, { "epoch": 0.8, "learning_rate": 4.634482183891231e-06, "loss": 0.9897, "step": 59960 }, { "epoch": 0.8, "learning_rate": 4.631430941656448e-06, "loss": 1.3045, "step": 59965 }, { "epoch": 0.8, "learning_rate": 4.628380601647362e-06, "loss": 0.2447, "step": 59970 }, { "epoch": 0.8, "learning_rate": 4.625331163999105e-06, "loss": 1.1857, "step": 59975 }, { "epoch": 0.8, "learning_rate": 4.6222826288467465e-06, "loss": 0.5531, "step": 59980 }, { "epoch": 0.8, "learning_rate": 4.619234996325314e-06, "loss": 0.1114, "step": 59985 }, { "epoch": 0.8, "learning_rate": 4.6161882665698155e-06, "loss": 0.8695, "step": 59990 }, { "epoch": 0.8, "learning_rate": 4.613142439715201e-06, "loss": 1.2424, "step": 59995 }, { "epoch": 0.8, "learning_rate": 4.610097515896383e-06, "loss": 1.2317, "step": 60000 }, { "epoch": 0.8, "learning_rate": 4.607053495248234e-06, "loss": 0.224, "step": 60005 }, { "epoch": 0.8, "learning_rate": 4.604010377905596e-06, "loss": 1.1834, "step": 60010 }, { "epoch": 0.8, "learning_rate": 4.600968164003261e-06, "loss": 0.5113, "step": 60015 }, { "epoch": 0.8, "learning_rate": 4.597926853675977e-06, "loss": 0.67, "step": 60020 }, { "epoch": 0.8, "learning_rate": 4.594886447058472e-06, "loss": 0.7192, "step": 60025 }, { "epoch": 0.8, "learning_rate": 4.5918469442854135e-06, "loss": 0.552, "step": 60030 }, { "epoch": 0.8, "learning_rate": 4.588808345491435e-06, "loss": 1.2166, "step": 60035 }, { "epoch": 0.8, "learning_rate": 4.5857706508111275e-06, "loss": 0.6166, "step": 60040 }, { "epoch": 0.8, "learning_rate": 4.582733860379057e-06, "loss": 0.4105, "step": 60045 }, { "epoch": 0.8, "learning_rate": 4.579697974329733e-06, "loss": 1.0425, "step": 60050 }, { "epoch": 0.8, "learning_rate": 4.576662992797623e-06, "loss": 0.3378, "step": 60055 }, { "epoch": 0.8, "learning_rate": 4.5736289159171805e-06, "loss": 0.94, "step": 60060 }, { "epoch": 0.8, "learning_rate": 4.5705957438227725e-06, "loss": 0.4007, "step": 60065 }, { "epoch": 0.8, "learning_rate": 4.567563476648767e-06, "loss": 0.4437, "step": 60070 }, { "epoch": 0.8, "learning_rate": 4.564532114529496e-06, "loss": 0.996, "step": 60075 }, { "epoch": 0.8, "learning_rate": 4.561501657599201e-06, "loss": 0.5472, "step": 60080 }, { "epoch": 0.81, "learning_rate": 4.558472105992139e-06, "loss": 0.5489, "step": 60085 }, { "epoch": 0.81, "learning_rate": 4.555443459842499e-06, "loss": 0.3515, "step": 60090 }, { "epoch": 0.81, "learning_rate": 4.552415719284425e-06, "loss": 1.3542, "step": 60095 }, { "epoch": 0.81, "learning_rate": 4.549388884452046e-06, "loss": 0.6595, "step": 60100 }, { "epoch": 0.81, "learning_rate": 4.546362955479427e-06, "loss": 0.7176, "step": 60105 }, { "epoch": 0.81, "learning_rate": 4.543337932500602e-06, "loss": 0.1715, "step": 60110 }, { "epoch": 0.81, "learning_rate": 4.540313815649561e-06, "loss": 1.3306, "step": 60115 }, { "epoch": 0.81, "learning_rate": 4.537290605060265e-06, "loss": 1.0024, "step": 60120 }, { "epoch": 0.81, "learning_rate": 4.534268300866626e-06, "loss": 0.7173, "step": 60125 }, { "epoch": 0.81, "learning_rate": 4.531246903202507e-06, "loss": 0.4692, "step": 60130 }, { "epoch": 0.81, "learning_rate": 4.528226412201755e-06, "loss": 0.5977, "step": 60135 }, { "epoch": 0.81, "learning_rate": 4.525206827998154e-06, "loss": 0.8937, "step": 60140 }, { "epoch": 0.81, "learning_rate": 4.522188150725462e-06, "loss": 1.492, "step": 60145 }, { "epoch": 0.81, "learning_rate": 4.519170380517379e-06, "loss": 0.7226, "step": 60150 }, { "epoch": 0.81, "learning_rate": 4.51615351750759e-06, "loss": 0.5656, "step": 60155 }, { "epoch": 0.81, "learning_rate": 4.513137561829725e-06, "loss": 0.8817, "step": 60160 }, { "epoch": 0.81, "learning_rate": 4.510122513617368e-06, "loss": 0.3579, "step": 60165 }, { "epoch": 0.81, "learning_rate": 4.507108373004087e-06, "loss": 0.483, "step": 60170 }, { "epoch": 0.81, "learning_rate": 4.504095140123371e-06, "loss": 0.853, "step": 60175 }, { "epoch": 0.81, "learning_rate": 4.501082815108704e-06, "loss": 0.5703, "step": 60180 }, { "epoch": 0.81, "learning_rate": 4.498071398093523e-06, "loss": 0.375, "step": 60185 }, { "epoch": 0.81, "learning_rate": 4.495060889211203e-06, "loss": 0.8286, "step": 60190 }, { "epoch": 0.81, "learning_rate": 4.492051288595106e-06, "loss": 1.0477, "step": 60195 }, { "epoch": 0.81, "learning_rate": 4.489042596378543e-06, "loss": 0.9576, "step": 60200 }, { "epoch": 0.81, "learning_rate": 4.48603481269477e-06, "loss": 0.1933, "step": 60205 }, { "epoch": 0.81, "learning_rate": 4.483027937677034e-06, "loss": 0.8243, "step": 60210 }, { "epoch": 0.81, "learning_rate": 4.480021971458517e-06, "loss": 0.4529, "step": 60215 }, { "epoch": 0.81, "learning_rate": 4.477016914172369e-06, "loss": 0.5365, "step": 60220 }, { "epoch": 0.81, "learning_rate": 4.474012765951691e-06, "loss": 0.4882, "step": 60225 }, { "epoch": 0.81, "learning_rate": 4.4710095269295645e-06, "loss": 0.37, "step": 60230 }, { "epoch": 0.81, "learning_rate": 4.468007197239016e-06, "loss": 0.5342, "step": 60235 }, { "epoch": 0.81, "learning_rate": 4.465005777013023e-06, "loss": 0.4326, "step": 60240 }, { "epoch": 0.81, "learning_rate": 4.4620052663845445e-06, "loss": 0.6626, "step": 60245 }, { "epoch": 0.81, "learning_rate": 4.459005665486488e-06, "loss": 0.993, "step": 60250 }, { "epoch": 0.81, "learning_rate": 4.456006974451715e-06, "loss": 0.3503, "step": 60255 }, { "epoch": 0.81, "learning_rate": 4.453009193413049e-06, "loss": 0.6714, "step": 60260 }, { "epoch": 0.81, "learning_rate": 4.4500123225032885e-06, "loss": 0.4951, "step": 60265 }, { "epoch": 0.81, "learning_rate": 4.4470163618551716e-06, "loss": 0.6941, "step": 60270 }, { "epoch": 0.81, "learning_rate": 4.444021311601404e-06, "loss": 0.7744, "step": 60275 }, { "epoch": 0.81, "learning_rate": 4.441027171874665e-06, "loss": 0.8025, "step": 60280 }, { "epoch": 0.81, "learning_rate": 4.438033942807554e-06, "loss": 0.3203, "step": 60285 }, { "epoch": 0.81, "learning_rate": 4.435041624532674e-06, "loss": 1.1995, "step": 60290 }, { "epoch": 0.81, "learning_rate": 4.432050217182579e-06, "loss": 0.7277, "step": 60295 }, { "epoch": 0.81, "learning_rate": 4.429059720889747e-06, "loss": 0.9153, "step": 60300 }, { "epoch": 0.81, "learning_rate": 4.426070135786664e-06, "loss": 0.7751, "step": 60305 }, { "epoch": 0.81, "learning_rate": 4.4236791238498e-06, "loss": 0.4868, "step": 60310 }, { "epoch": 0.81, "learning_rate": 4.4206911792219304e-06, "loss": 0.4455, "step": 60315 }, { "epoch": 0.81, "learning_rate": 4.417704146154481e-06, "loss": 0.6298, "step": 60320 }, { "epoch": 0.81, "learning_rate": 4.414718024779779e-06, "loss": 0.6893, "step": 60325 }, { "epoch": 0.81, "learning_rate": 4.411732815230074e-06, "loss": 0.5218, "step": 60330 }, { "epoch": 0.81, "learning_rate": 4.4087485176376095e-06, "loss": 0.725, "step": 60335 }, { "epoch": 0.81, "learning_rate": 4.405765132134574e-06, "loss": 0.748, "step": 60340 }, { "epoch": 0.81, "learning_rate": 4.402782658853103e-06, "loss": 0.6544, "step": 60345 }, { "epoch": 0.81, "learning_rate": 4.399801097925324e-06, "loss": 0.2437, "step": 60350 }, { "epoch": 0.81, "learning_rate": 4.396820449483297e-06, "loss": 1.0296, "step": 60355 }, { "epoch": 0.81, "learning_rate": 4.3938407136590475e-06, "loss": 0.493, "step": 60360 }, { "epoch": 0.81, "learning_rate": 4.3908618905845605e-06, "loss": 0.966, "step": 60365 }, { "epoch": 0.81, "learning_rate": 4.387883980391794e-06, "loss": 1.5025, "step": 60370 }, { "epoch": 0.81, "learning_rate": 4.38490698321265e-06, "loss": 0.2006, "step": 60375 }, { "epoch": 0.81, "learning_rate": 4.381930899178982e-06, "loss": 0.631, "step": 60380 }, { "epoch": 0.81, "learning_rate": 4.378955728422643e-06, "loss": 0.6347, "step": 60385 }, { "epoch": 0.81, "learning_rate": 4.3759814710753854e-06, "loss": 0.5538, "step": 60390 }, { "epoch": 0.81, "learning_rate": 4.373008127268977e-06, "loss": 0.8426, "step": 60395 }, { "epoch": 0.81, "learning_rate": 4.370035697135108e-06, "loss": 0.7996, "step": 60400 }, { "epoch": 0.81, "learning_rate": 4.367064180805458e-06, "loss": 0.4598, "step": 60405 }, { "epoch": 0.81, "learning_rate": 4.364093578411641e-06, "loss": 1.6398, "step": 60410 }, { "epoch": 0.81, "learning_rate": 4.361123890085231e-06, "loss": 0.4106, "step": 60415 }, { "epoch": 0.81, "learning_rate": 4.3581551159577876e-06, "loss": 1.1244, "step": 60420 }, { "epoch": 0.81, "learning_rate": 4.3551872561608056e-06, "loss": 1.1449, "step": 60425 }, { "epoch": 0.81, "learning_rate": 4.352220310825738e-06, "loss": 0.4008, "step": 60430 }, { "epoch": 0.81, "learning_rate": 4.349254280084025e-06, "loss": 0.412, "step": 60435 }, { "epoch": 0.81, "learning_rate": 4.346289164067024e-06, "loss": 0.7691, "step": 60440 }, { "epoch": 0.81, "learning_rate": 4.3433249629060924e-06, "loss": 1.0684, "step": 60445 }, { "epoch": 0.81, "learning_rate": 4.340361676732521e-06, "loss": 0.3947, "step": 60450 }, { "epoch": 0.81, "learning_rate": 4.337399305677567e-06, "loss": 1.1789, "step": 60455 }, { "epoch": 0.81, "learning_rate": 4.334437849872455e-06, "loss": 0.6045, "step": 60460 }, { "epoch": 0.81, "learning_rate": 4.331477309448362e-06, "loss": 1.1915, "step": 60465 }, { "epoch": 0.81, "learning_rate": 4.32851768453642e-06, "loss": 0.7608, "step": 60470 }, { "epoch": 0.81, "learning_rate": 4.325558975267724e-06, "loss": 0.7024, "step": 60475 }, { "epoch": 0.81, "learning_rate": 4.322601181773342e-06, "loss": 0.7417, "step": 60480 }, { "epoch": 0.81, "learning_rate": 4.319644304184281e-06, "loss": 0.6069, "step": 60485 }, { "epoch": 0.81, "learning_rate": 4.316688342631509e-06, "loss": 1.1746, "step": 60490 }, { "epoch": 0.81, "learning_rate": 4.313733297245981e-06, "loss": 0.6873, "step": 60495 }, { "epoch": 0.81, "learning_rate": 4.3107791681585655e-06, "loss": 0.9915, "step": 60500 }, { "epoch": 0.81, "learning_rate": 4.307825955500136e-06, "loss": 0.1959, "step": 60505 }, { "epoch": 0.81, "learning_rate": 4.304873659401496e-06, "loss": 0.4075, "step": 60510 }, { "epoch": 0.81, "learning_rate": 4.3019222799934115e-06, "loss": 1.275, "step": 60515 }, { "epoch": 0.81, "learning_rate": 4.298971817406627e-06, "loss": 1.0459, "step": 60520 }, { "epoch": 0.81, "learning_rate": 4.2960222717718215e-06, "loss": 0.86, "step": 60525 }, { "epoch": 0.81, "learning_rate": 4.293073643219656e-06, "loss": 0.5813, "step": 60530 }, { "epoch": 0.81, "learning_rate": 4.290125931880734e-06, "loss": 1.0054, "step": 60535 }, { "epoch": 0.81, "learning_rate": 4.287179137885619e-06, "loss": 0.9572, "step": 60540 }, { "epoch": 0.81, "learning_rate": 4.284233261364859e-06, "loss": 1.0099, "step": 60545 }, { "epoch": 0.81, "learning_rate": 4.281288302448916e-06, "loss": 1.1024, "step": 60550 }, { "epoch": 0.81, "learning_rate": 4.2783442612682525e-06, "loss": 0.4048, "step": 60555 }, { "epoch": 0.81, "learning_rate": 4.275401137953272e-06, "loss": 0.6609, "step": 60560 }, { "epoch": 0.81, "learning_rate": 4.272458932634335e-06, "loss": 0.4458, "step": 60565 }, { "epoch": 0.81, "learning_rate": 4.269517645441773e-06, "loss": 1.0595, "step": 60570 }, { "epoch": 0.81, "learning_rate": 4.26657727650587e-06, "loss": 0.7983, "step": 60575 }, { "epoch": 0.81, "learning_rate": 4.263637825956867e-06, "loss": 0.2124, "step": 60580 }, { "epoch": 0.81, "learning_rate": 4.260699293924964e-06, "loss": 0.5526, "step": 60585 }, { "epoch": 0.81, "learning_rate": 4.257761680540332e-06, "loss": 0.9383, "step": 60590 }, { "epoch": 0.81, "learning_rate": 4.2548249859330845e-06, "loss": 0.4673, "step": 60595 }, { "epoch": 0.81, "learning_rate": 4.251889210233301e-06, "loss": 1.1394, "step": 60600 }, { "epoch": 0.81, "learning_rate": 4.2489543535710385e-06, "loss": 0.8336, "step": 60605 }, { "epoch": 0.81, "learning_rate": 4.246020416076271e-06, "loss": 0.4792, "step": 60610 }, { "epoch": 0.81, "learning_rate": 4.243087397878978e-06, "loss": 0.2371, "step": 60615 }, { "epoch": 0.81, "learning_rate": 4.240155299109067e-06, "loss": 0.5505, "step": 60620 }, { "epoch": 0.81, "learning_rate": 4.237224119896416e-06, "loss": 0.7817, "step": 60625 }, { "epoch": 0.81, "learning_rate": 4.234293860370866e-06, "loss": 0.854, "step": 60630 }, { "epoch": 0.81, "learning_rate": 4.2313645206622035e-06, "loss": 0.8658, "step": 60635 }, { "epoch": 0.81, "learning_rate": 4.228436100900199e-06, "loss": 0.3658, "step": 60640 }, { "epoch": 0.81, "learning_rate": 4.225508601214559e-06, "loss": 0.7254, "step": 60645 }, { "epoch": 0.81, "learning_rate": 4.22258202173495e-06, "loss": 0.3695, "step": 60650 }, { "epoch": 0.81, "learning_rate": 4.219656362591021e-06, "loss": 0.6599, "step": 60655 }, { "epoch": 0.81, "learning_rate": 4.216731623912342e-06, "loss": 0.4506, "step": 60660 }, { "epoch": 0.81, "learning_rate": 4.213807805828488e-06, "loss": 0.8301, "step": 60665 }, { "epoch": 0.81, "learning_rate": 4.2108849084689535e-06, "loss": 1.1277, "step": 60670 }, { "epoch": 0.81, "learning_rate": 4.207962931963208e-06, "loss": 1.0812, "step": 60675 }, { "epoch": 0.81, "learning_rate": 4.20504187644069e-06, "loss": 0.1729, "step": 60680 }, { "epoch": 0.81, "learning_rate": 4.202121742030785e-06, "loss": 1.1394, "step": 60685 }, { "epoch": 0.81, "learning_rate": 4.199202528862839e-06, "loss": 0.9157, "step": 60690 }, { "epoch": 0.81, "learning_rate": 4.196284237066148e-06, "loss": 0.35, "step": 60695 }, { "epoch": 0.81, "learning_rate": 4.193366866769999e-06, "loss": 0.5881, "step": 60700 }, { "epoch": 0.81, "learning_rate": 4.1904504181036e-06, "loss": 0.2296, "step": 60705 }, { "epoch": 0.81, "learning_rate": 4.187534891196138e-06, "loss": 1.0107, "step": 60710 }, { "epoch": 0.81, "learning_rate": 4.184620286176769e-06, "loss": 1.2009, "step": 60715 }, { "epoch": 0.81, "learning_rate": 4.181706603174576e-06, "loss": 0.7244, "step": 60720 }, { "epoch": 0.81, "learning_rate": 4.178793842318626e-06, "loss": 0.7711, "step": 60725 }, { "epoch": 0.81, "learning_rate": 4.175882003737961e-06, "loss": 0.1439, "step": 60730 }, { "epoch": 0.81, "learning_rate": 4.172971087561526e-06, "loss": 0.7658, "step": 60735 }, { "epoch": 0.81, "learning_rate": 4.170061093918284e-06, "loss": 0.6266, "step": 60740 }, { "epoch": 0.81, "learning_rate": 4.167152022937124e-06, "loss": 0.9188, "step": 60745 }, { "epoch": 0.81, "learning_rate": 4.164243874746909e-06, "loss": 0.3807, "step": 60750 }, { "epoch": 0.81, "learning_rate": 4.161336649476455e-06, "loss": 0.9517, "step": 60755 }, { "epoch": 0.81, "learning_rate": 4.158430347254527e-06, "loss": 0.8085, "step": 60760 }, { "epoch": 0.81, "learning_rate": 4.155524968209879e-06, "loss": 0.6167, "step": 60765 }, { "epoch": 0.81, "learning_rate": 4.152620512471184e-06, "loss": 0.4361, "step": 60770 }, { "epoch": 0.81, "learning_rate": 4.1497169801671065e-06, "loss": 1.5718, "step": 60775 }, { "epoch": 0.81, "learning_rate": 4.146814371426258e-06, "loss": 0.7135, "step": 60780 }, { "epoch": 0.81, "learning_rate": 4.143912686377202e-06, "loss": 0.8037, "step": 60785 }, { "epoch": 0.81, "learning_rate": 4.14101192514848e-06, "loss": 0.6351, "step": 60790 }, { "epoch": 0.81, "learning_rate": 4.138112087868573e-06, "loss": 0.4667, "step": 60795 }, { "epoch": 0.81, "learning_rate": 4.135213174665936e-06, "loss": 0.5889, "step": 60800 }, { "epoch": 0.81, "learning_rate": 4.132315185668964e-06, "loss": 1.1777, "step": 60805 }, { "epoch": 0.81, "learning_rate": 4.1294181210060374e-06, "loss": 1.0911, "step": 60810 }, { "epoch": 0.81, "learning_rate": 4.126521980805476e-06, "loss": 0.7493, "step": 60815 }, { "epoch": 0.81, "learning_rate": 4.123626765195556e-06, "loss": 0.8073, "step": 60820 }, { "epoch": 0.81, "learning_rate": 4.120732474304545e-06, "loss": 0.5202, "step": 60825 }, { "epoch": 0.82, "learning_rate": 4.117839108260616e-06, "loss": 0.6761, "step": 60830 }, { "epoch": 0.82, "learning_rate": 4.114946667191944e-06, "loss": 0.5923, "step": 60835 }, { "epoch": 0.82, "learning_rate": 4.112055151226662e-06, "loss": 0.5641, "step": 60840 }, { "epoch": 0.82, "learning_rate": 4.1091645604928255e-06, "loss": 0.4819, "step": 60845 }, { "epoch": 0.82, "learning_rate": 4.106274895118495e-06, "loss": 0.7046, "step": 60850 }, { "epoch": 0.82, "learning_rate": 4.103386155231648e-06, "loss": 0.1799, "step": 60855 }, { "epoch": 0.82, "learning_rate": 4.1004983409602595e-06, "loss": 1.0184, "step": 60860 }, { "epoch": 0.82, "learning_rate": 4.0976114524322375e-06, "loss": 1.0044, "step": 60865 }, { "epoch": 0.82, "learning_rate": 4.09472548977545e-06, "loss": 1.0933, "step": 60870 }, { "epoch": 0.82, "learning_rate": 4.091840453117752e-06, "loss": 0.2759, "step": 60875 }, { "epoch": 0.82, "learning_rate": 4.088956342586905e-06, "loss": 1.1073, "step": 60880 }, { "epoch": 0.82, "learning_rate": 4.086073158310688e-06, "loss": 0.2667, "step": 60885 }, { "epoch": 0.82, "learning_rate": 4.0831909004168e-06, "loss": 0.4144, "step": 60890 }, { "epoch": 0.82, "learning_rate": 4.080309569032903e-06, "loss": 0.8241, "step": 60895 }, { "epoch": 0.82, "learning_rate": 4.0774291642866415e-06, "loss": 0.7571, "step": 60900 }, { "epoch": 0.82, "learning_rate": 4.074549686305598e-06, "loss": 1.2386, "step": 60905 }, { "epoch": 0.82, "learning_rate": 4.071671135217314e-06, "loss": 0.5891, "step": 60910 }, { "epoch": 0.82, "learning_rate": 4.0687935111492936e-06, "loss": 0.5092, "step": 60915 }, { "epoch": 0.82, "learning_rate": 4.0659168142290095e-06, "loss": 0.4797, "step": 60920 }, { "epoch": 0.82, "learning_rate": 4.063041044583882e-06, "loss": 0.6264, "step": 60925 }, { "epoch": 0.82, "learning_rate": 4.060166202341284e-06, "loss": 1.0175, "step": 60930 }, { "epoch": 0.82, "learning_rate": 4.057292287628578e-06, "loss": 1.0232, "step": 60935 }, { "epoch": 0.82, "learning_rate": 4.05441930057304e-06, "loss": 0.7969, "step": 60940 }, { "epoch": 0.82, "learning_rate": 4.051547241301937e-06, "loss": 0.3702, "step": 60945 }, { "epoch": 0.82, "learning_rate": 4.048676109942501e-06, "loss": 0.4965, "step": 60950 }, { "epoch": 0.82, "learning_rate": 4.045805906621886e-06, "loss": 1.1834, "step": 60955 }, { "epoch": 0.82, "learning_rate": 4.042936631467245e-06, "loss": 0.6118, "step": 60960 }, { "epoch": 0.82, "learning_rate": 4.040068284605661e-06, "loss": 0.4694, "step": 60965 }, { "epoch": 0.82, "learning_rate": 4.037200866164198e-06, "loss": 0.7669, "step": 60970 }, { "epoch": 0.82, "learning_rate": 4.034334376269863e-06, "loss": 0.5059, "step": 60975 }, { "epoch": 0.82, "learning_rate": 4.031468815049621e-06, "loss": 0.3303, "step": 60980 }, { "epoch": 0.82, "learning_rate": 4.028604182630421e-06, "loss": 0.6971, "step": 60985 }, { "epoch": 0.82, "learning_rate": 4.025740479139125e-06, "loss": 0.2787, "step": 60990 }, { "epoch": 0.82, "learning_rate": 4.022877704702604e-06, "loss": 1.1675, "step": 60995 }, { "epoch": 0.82, "learning_rate": 4.020015859447654e-06, "loss": 0.5759, "step": 61000 }, { "epoch": 0.82, "learning_rate": 4.017154943501036e-06, "loss": 0.9776, "step": 61005 }, { "epoch": 0.82, "learning_rate": 4.014294956989487e-06, "loss": 0.3942, "step": 61010 }, { "epoch": 0.82, "learning_rate": 4.011435900039681e-06, "loss": 0.3975, "step": 61015 }, { "epoch": 0.82, "learning_rate": 4.0085777727782635e-06, "loss": 1.0946, "step": 61020 }, { "epoch": 0.82, "learning_rate": 4.005720575331828e-06, "loss": 1.0702, "step": 61025 }, { "epoch": 0.82, "learning_rate": 4.002864307826945e-06, "loss": 0.6138, "step": 61030 }, { "epoch": 0.82, "learning_rate": 4.000008970390129e-06, "loss": 1.0961, "step": 61035 }, { "epoch": 0.82, "learning_rate": 3.9971545631478505e-06, "loss": 0.6118, "step": 61040 }, { "epoch": 0.82, "learning_rate": 3.994301086226563e-06, "loss": 0.9381, "step": 61045 }, { "epoch": 0.82, "learning_rate": 3.991448539752635e-06, "loss": 0.7752, "step": 61050 }, { "epoch": 0.82, "learning_rate": 3.988596923852434e-06, "loss": 0.5431, "step": 61055 }, { "epoch": 0.82, "learning_rate": 3.985746238652286e-06, "loss": 0.3658, "step": 61060 }, { "epoch": 0.82, "learning_rate": 3.982896484278437e-06, "loss": 0.4476, "step": 61065 }, { "epoch": 0.82, "learning_rate": 3.9800476608571335e-06, "loss": 0.5488, "step": 61070 }, { "epoch": 0.82, "learning_rate": 3.977199768514553e-06, "loss": 1.0017, "step": 61075 }, { "epoch": 0.82, "learning_rate": 3.974352807376855e-06, "loss": 0.3631, "step": 61080 }, { "epoch": 0.82, "learning_rate": 3.971506777570142e-06, "loss": 0.7056, "step": 61085 }, { "epoch": 0.82, "learning_rate": 3.968661679220468e-06, "loss": 0.2546, "step": 61090 }, { "epoch": 0.82, "learning_rate": 3.965817512453879e-06, "loss": 1.1125, "step": 61095 }, { "epoch": 0.82, "learning_rate": 3.962974277396328e-06, "loss": 1.183, "step": 61100 }, { "epoch": 0.82, "learning_rate": 3.96013197417378e-06, "loss": 0.2202, "step": 61105 }, { "epoch": 0.82, "learning_rate": 3.957290602912128e-06, "loss": 1.3119, "step": 61110 }, { "epoch": 0.82, "learning_rate": 3.954450163737219e-06, "loss": 0.3281, "step": 61115 }, { "epoch": 0.82, "learning_rate": 3.95161065677489e-06, "loss": 0.3899, "step": 61120 }, { "epoch": 0.82, "learning_rate": 3.948772082150906e-06, "loss": 0.5574, "step": 61125 }, { "epoch": 0.82, "learning_rate": 3.9459344399910005e-06, "loss": 0.6469, "step": 61130 }, { "epoch": 0.82, "learning_rate": 3.9430977304208665e-06, "loss": 0.1946, "step": 61135 }, { "epoch": 0.82, "learning_rate": 3.9402619535661625e-06, "loss": 0.3869, "step": 61140 }, { "epoch": 0.82, "learning_rate": 3.937994003721915e-06, "loss": 1.0465, "step": 61145 }, { "epoch": 0.82, "learning_rate": 3.93515990607149e-06, "loss": 0.6988, "step": 61150 }, { "epoch": 0.82, "learning_rate": 3.932326741488096e-06, "loss": 0.4614, "step": 61155 }, { "epoch": 0.82, "learning_rate": 3.929494510097231e-06, "loss": 1.0468, "step": 61160 }, { "epoch": 0.82, "learning_rate": 3.9266632120243395e-06, "loss": 0.2721, "step": 61165 }, { "epoch": 0.82, "learning_rate": 3.9238328473948485e-06, "loss": 0.5808, "step": 61170 }, { "epoch": 0.82, "learning_rate": 3.9210034163341205e-06, "loss": 0.7427, "step": 61175 }, { "epoch": 0.82, "learning_rate": 3.918174918967479e-06, "loss": 0.6736, "step": 61180 }, { "epoch": 0.82, "learning_rate": 3.915347355420226e-06, "loss": 0.4633, "step": 61185 }, { "epoch": 0.82, "learning_rate": 3.9125207258176036e-06, "loss": 0.5504, "step": 61190 }, { "epoch": 0.82, "learning_rate": 3.90969503028481e-06, "loss": 0.4863, "step": 61195 }, { "epoch": 0.82, "learning_rate": 3.906870268947024e-06, "loss": 0.6592, "step": 61200 }, { "epoch": 0.82, "learning_rate": 3.9040464419293514e-06, "loss": 0.4711, "step": 61205 }, { "epoch": 0.82, "learning_rate": 3.901223549356886e-06, "loss": 0.4091, "step": 61210 }, { "epoch": 0.82, "learning_rate": 3.898401591354664e-06, "loss": 0.747, "step": 61215 }, { "epoch": 0.82, "learning_rate": 3.895580568047675e-06, "loss": 0.8551, "step": 61220 }, { "epoch": 0.82, "learning_rate": 3.892760479560892e-06, "loss": 1.2081, "step": 61225 }, { "epoch": 0.82, "learning_rate": 3.889941326019225e-06, "loss": 0.5456, "step": 61230 }, { "epoch": 0.82, "learning_rate": 3.887123107547546e-06, "loss": 0.7303, "step": 61235 }, { "epoch": 0.82, "learning_rate": 3.884305824270684e-06, "loss": 0.7814, "step": 61240 }, { "epoch": 0.82, "learning_rate": 3.881489476313441e-06, "loss": 0.3295, "step": 61245 }, { "epoch": 0.82, "learning_rate": 3.878674063800561e-06, "loss": 0.7137, "step": 61250 }, { "epoch": 0.82, "learning_rate": 3.875859586856748e-06, "loss": 0.3941, "step": 61255 }, { "epoch": 0.82, "learning_rate": 3.873046045606679e-06, "loss": 0.3941, "step": 61260 }, { "epoch": 0.82, "learning_rate": 3.870233440174975e-06, "loss": 0.7949, "step": 61265 }, { "epoch": 0.82, "learning_rate": 3.867421770686222e-06, "loss": 1.4335, "step": 61270 }, { "epoch": 0.82, "learning_rate": 3.8646110372649565e-06, "loss": 0.886, "step": 61275 }, { "epoch": 0.82, "learning_rate": 3.861801240035689e-06, "loss": 1.6515, "step": 61280 }, { "epoch": 0.82, "learning_rate": 3.858992379122878e-06, "loss": 0.7936, "step": 61285 }, { "epoch": 0.82, "learning_rate": 3.856184454650932e-06, "loss": 0.3591, "step": 61290 }, { "epoch": 0.82, "learning_rate": 3.85337746674424e-06, "loss": 0.8295, "step": 61295 }, { "epoch": 0.82, "learning_rate": 3.850571415527135e-06, "loss": 0.6072, "step": 61300 }, { "epoch": 0.82, "learning_rate": 3.847766301123903e-06, "loss": 1.2172, "step": 61305 }, { "epoch": 0.82, "learning_rate": 3.844962123658813e-06, "loss": 0.6068, "step": 61310 }, { "epoch": 0.82, "learning_rate": 3.842158883256056e-06, "loss": 0.3034, "step": 61315 }, { "epoch": 0.82, "learning_rate": 3.839356580039815e-06, "loss": 0.5261, "step": 61320 }, { "epoch": 0.82, "learning_rate": 3.836555214134216e-06, "loss": 0.8439, "step": 61325 }, { "epoch": 0.82, "learning_rate": 3.833754785663338e-06, "loss": 0.6797, "step": 61330 }, { "epoch": 0.82, "learning_rate": 3.8309552947512344e-06, "loss": 0.9855, "step": 61335 }, { "epoch": 0.82, "learning_rate": 3.8281567415219075e-06, "loss": 0.9175, "step": 61340 }, { "epoch": 0.82, "learning_rate": 3.825359126099318e-06, "loss": 1.1139, "step": 61345 }, { "epoch": 0.82, "learning_rate": 3.822562448607381e-06, "loss": 0.4037, "step": 61350 }, { "epoch": 0.82, "learning_rate": 3.819766709169983e-06, "loss": 0.7008, "step": 61355 }, { "epoch": 0.82, "learning_rate": 3.81697190791096e-06, "loss": 0.1435, "step": 61360 }, { "epoch": 0.82, "learning_rate": 3.8141780449541003e-06, "loss": 1.0545, "step": 61365 }, { "epoch": 0.82, "learning_rate": 3.8113851204231695e-06, "loss": 0.4452, "step": 61370 }, { "epoch": 0.82, "learning_rate": 3.8085931344418765e-06, "loss": 1.0666, "step": 61375 }, { "epoch": 0.82, "learning_rate": 3.8058020871338804e-06, "loss": 0.1663, "step": 61380 }, { "epoch": 0.82, "learning_rate": 3.803011978622831e-06, "loss": 0.5491, "step": 61385 }, { "epoch": 0.82, "learning_rate": 3.800222809032303e-06, "loss": 0.9911, "step": 61390 }, { "epoch": 0.82, "learning_rate": 3.797434578485845e-06, "loss": 1.036, "step": 61395 }, { "epoch": 0.82, "learning_rate": 3.794647287106959e-06, "loss": 0.7888, "step": 61400 }, { "epoch": 0.82, "learning_rate": 3.791860935019115e-06, "loss": 1.1074, "step": 61405 }, { "epoch": 0.82, "learning_rate": 3.7890755223457307e-06, "loss": 0.774, "step": 61410 }, { "epoch": 0.82, "learning_rate": 3.7862910492101803e-06, "loss": 0.4644, "step": 61415 }, { "epoch": 0.82, "learning_rate": 3.783507515735818e-06, "loss": 0.477, "step": 61420 }, { "epoch": 0.82, "learning_rate": 3.7807249220459194e-06, "loss": 0.3979, "step": 61425 }, { "epoch": 0.82, "learning_rate": 3.777943268263756e-06, "loss": 1.0287, "step": 61430 }, { "epoch": 0.82, "learning_rate": 3.7751625545125348e-06, "loss": 0.3912, "step": 61435 }, { "epoch": 0.82, "learning_rate": 3.772382780915423e-06, "loss": 0.1688, "step": 61440 }, { "epoch": 0.82, "learning_rate": 3.7696039475955598e-06, "loss": 0.3367, "step": 61445 }, { "epoch": 0.82, "learning_rate": 3.7668260546760313e-06, "loss": 0.3885, "step": 61450 }, { "epoch": 0.82, "learning_rate": 3.764049102279882e-06, "loss": 1.0347, "step": 61455 }, { "epoch": 0.82, "learning_rate": 3.7612730905301095e-06, "loss": 0.2371, "step": 61460 }, { "epoch": 0.82, "learning_rate": 3.7584980195496945e-06, "loss": 0.8422, "step": 61465 }, { "epoch": 0.82, "learning_rate": 3.7557238894615458e-06, "loss": 0.8026, "step": 61470 }, { "epoch": 0.82, "learning_rate": 3.752950700388544e-06, "loss": 0.9957, "step": 61475 }, { "epoch": 0.82, "learning_rate": 3.7501784524535343e-06, "loss": 0.6749, "step": 61480 }, { "epoch": 0.82, "learning_rate": 3.747407145779308e-06, "loss": 0.9956, "step": 61485 }, { "epoch": 0.82, "learning_rate": 3.7446367804886196e-06, "loss": 0.6353, "step": 61490 }, { "epoch": 0.82, "learning_rate": 3.74186735670419e-06, "loss": 1.3835, "step": 61495 }, { "epoch": 0.82, "learning_rate": 3.739098874548683e-06, "loss": 0.8173, "step": 61500 }, { "epoch": 0.82, "learning_rate": 3.7363313341447326e-06, "loss": 0.6312, "step": 61505 }, { "epoch": 0.82, "learning_rate": 3.7335647356149195e-06, "loss": 0.7843, "step": 61510 }, { "epoch": 0.82, "learning_rate": 3.730799079081801e-06, "loss": 0.7242, "step": 61515 }, { "epoch": 0.82, "learning_rate": 3.728034364667879e-06, "loss": 0.7523, "step": 61520 }, { "epoch": 0.82, "learning_rate": 3.7252705924956055e-06, "loss": 0.8536, "step": 61525 }, { "epoch": 0.82, "learning_rate": 3.7225077626874243e-06, "loss": 1.0765, "step": 61530 }, { "epoch": 0.82, "learning_rate": 3.7197458753656876e-06, "loss": 0.3824, "step": 61535 }, { "epoch": 0.82, "learning_rate": 3.716984930652756e-06, "loss": 0.0962, "step": 61540 }, { "epoch": 0.82, "learning_rate": 3.7142249286709146e-06, "loss": 0.41, "step": 61545 }, { "epoch": 0.82, "learning_rate": 3.7114658695424133e-06, "loss": 1.1977, "step": 61550 }, { "epoch": 0.82, "learning_rate": 3.708707753389476e-06, "loss": 0.8715, "step": 61555 }, { "epoch": 0.82, "learning_rate": 3.7059505803342693e-06, "loss": 0.4387, "step": 61560 }, { "epoch": 0.82, "learning_rate": 3.70319435049892e-06, "loss": 0.3161, "step": 61565 }, { "epoch": 0.82, "learning_rate": 3.700439064005512e-06, "loss": 0.864, "step": 61570 }, { "epoch": 0.83, "learning_rate": 3.6976847209760994e-06, "loss": 0.3328, "step": 61575 }, { "epoch": 0.83, "learning_rate": 3.6949313215326825e-06, "loss": 0.5056, "step": 61580 }, { "epoch": 0.83, "learning_rate": 3.6921788657972163e-06, "loss": 0.9852, "step": 61585 }, { "epoch": 0.83, "learning_rate": 3.6894273538916337e-06, "loss": 0.3536, "step": 61590 }, { "epoch": 0.83, "learning_rate": 3.6866767859378037e-06, "loss": 0.5872, "step": 61595 }, { "epoch": 0.83, "learning_rate": 3.6839271620575598e-06, "loss": 0.333, "step": 61600 }, { "epoch": 0.83, "learning_rate": 3.6811784823727103e-06, "loss": 0.5115, "step": 61605 }, { "epoch": 0.83, "learning_rate": 3.6784307470049963e-06, "loss": 0.4652, "step": 61610 }, { "epoch": 0.83, "learning_rate": 3.6756839560761314e-06, "loss": 0.531, "step": 61615 }, { "epoch": 0.83, "learning_rate": 3.6729381097077795e-06, "loss": 0.4019, "step": 61620 }, { "epoch": 0.83, "learning_rate": 3.6701932080215802e-06, "loss": 0.6515, "step": 61625 }, { "epoch": 0.83, "learning_rate": 3.6674492511391127e-06, "loss": 0.1926, "step": 61630 }, { "epoch": 0.83, "learning_rate": 3.6647062391819115e-06, "loss": 0.5166, "step": 61635 }, { "epoch": 0.83, "learning_rate": 3.661964172271501e-06, "loss": 0.4243, "step": 61640 }, { "epoch": 0.83, "learning_rate": 3.6592230505293147e-06, "loss": 0.33, "step": 61645 }, { "epoch": 0.83, "learning_rate": 3.6564828740767886e-06, "loss": 0.8021, "step": 61650 }, { "epoch": 0.83, "learning_rate": 3.6537436430352902e-06, "loss": 0.9137, "step": 61655 }, { "epoch": 0.83, "learning_rate": 3.651005357526155e-06, "loss": 0.4439, "step": 61660 }, { "epoch": 0.83, "learning_rate": 3.648268017670678e-06, "loss": 0.7722, "step": 61665 }, { "epoch": 0.83, "learning_rate": 3.6455316235901123e-06, "loss": 0.6479, "step": 61670 }, { "epoch": 0.83, "learning_rate": 3.6427961754056605e-06, "loss": 0.7098, "step": 61675 }, { "epoch": 0.83, "learning_rate": 3.6400616732384875e-06, "loss": 1.0468, "step": 61680 }, { "epoch": 0.83, "learning_rate": 3.6373281172097263e-06, "loss": 1.0155, "step": 61685 }, { "epoch": 0.83, "learning_rate": 3.6345955074404552e-06, "loss": 0.45, "step": 61690 }, { "epoch": 0.83, "learning_rate": 3.631863844051711e-06, "loss": 0.7177, "step": 61695 }, { "epoch": 0.83, "learning_rate": 3.6291331271645024e-06, "loss": 0.9632, "step": 61700 }, { "epoch": 0.83, "learning_rate": 3.62640335689978e-06, "loss": 0.7937, "step": 61705 }, { "epoch": 0.83, "learning_rate": 3.6236745333784543e-06, "loss": 0.5026, "step": 61710 }, { "epoch": 0.83, "learning_rate": 3.6209466567214105e-06, "loss": 0.1977, "step": 61715 }, { "epoch": 0.83, "learning_rate": 3.6182197270494765e-06, "loss": 0.5428, "step": 61720 }, { "epoch": 0.83, "learning_rate": 3.6154937444834366e-06, "loss": 1.0038, "step": 61725 }, { "epoch": 0.83, "learning_rate": 3.612768709144035e-06, "loss": 0.0578, "step": 61730 }, { "epoch": 0.83, "learning_rate": 3.6100446211519866e-06, "loss": 0.5633, "step": 61735 }, { "epoch": 0.83, "learning_rate": 3.6073214806279535e-06, "loss": 0.8613, "step": 61740 }, { "epoch": 0.83, "learning_rate": 3.604599287692548e-06, "loss": 0.3843, "step": 61745 }, { "epoch": 0.83, "learning_rate": 3.6018780424663665e-06, "loss": 1.22, "step": 61750 }, { "epoch": 0.83, "learning_rate": 3.5991577450699252e-06, "loss": 0.7285, "step": 61755 }, { "epoch": 0.83, "learning_rate": 3.5964383956237386e-06, "loss": 1.2054, "step": 61760 }, { "epoch": 0.83, "learning_rate": 3.5937199942482513e-06, "loss": 0.6638, "step": 61765 }, { "epoch": 0.83, "learning_rate": 3.5910025410638678e-06, "loss": 0.9473, "step": 61770 }, { "epoch": 0.83, "learning_rate": 3.5882860361909744e-06, "loss": 0.7874, "step": 61775 }, { "epoch": 0.83, "learning_rate": 3.585570479749889e-06, "loss": 0.6008, "step": 61780 }, { "epoch": 0.83, "learning_rate": 3.582855871860899e-06, "loss": 1.1658, "step": 61785 }, { "epoch": 0.83, "learning_rate": 3.5801422126442415e-06, "loss": 0.903, "step": 61790 }, { "epoch": 0.83, "learning_rate": 3.577429502220131e-06, "loss": 1.2164, "step": 61795 }, { "epoch": 0.83, "learning_rate": 3.574717740708716e-06, "loss": 0.336, "step": 61800 }, { "epoch": 0.83, "learning_rate": 3.572006928230115e-06, "loss": 0.605, "step": 61805 }, { "epoch": 0.83, "learning_rate": 3.5692970649044116e-06, "loss": 0.8332, "step": 61810 }, { "epoch": 0.83, "learning_rate": 3.5665881508516326e-06, "loss": 0.2088, "step": 61815 }, { "epoch": 0.83, "learning_rate": 3.5638801861917647e-06, "loss": 0.3715, "step": 61820 }, { "epoch": 0.83, "learning_rate": 3.561173171044771e-06, "loss": 0.8837, "step": 61825 }, { "epoch": 0.83, "learning_rate": 3.5584671055305496e-06, "loss": 1.1619, "step": 61830 }, { "epoch": 0.83, "learning_rate": 3.5557619897689657e-06, "loss": 0.3292, "step": 61835 }, { "epoch": 0.83, "learning_rate": 3.5530578238798406e-06, "loss": 0.6375, "step": 61840 }, { "epoch": 0.83, "learning_rate": 3.5503546079829615e-06, "loss": 0.4506, "step": 61845 }, { "epoch": 0.83, "learning_rate": 3.547652342198063e-06, "loss": 0.7867, "step": 61850 }, { "epoch": 0.83, "learning_rate": 3.544951026644838e-06, "loss": 1.1618, "step": 61855 }, { "epoch": 0.83, "learning_rate": 3.5422506614429614e-06, "loss": 0.1828, "step": 61860 }, { "epoch": 0.83, "learning_rate": 3.539551246712014e-06, "loss": 0.699, "step": 61865 }, { "epoch": 0.83, "learning_rate": 3.5368527825715927e-06, "loss": 0.5536, "step": 61870 }, { "epoch": 0.83, "learning_rate": 3.534155269141215e-06, "loss": 0.4798, "step": 61875 }, { "epoch": 0.83, "learning_rate": 3.5314587065403637e-06, "loss": 0.4358, "step": 61880 }, { "epoch": 0.83, "learning_rate": 3.5287630948884933e-06, "loss": 0.6675, "step": 61885 }, { "epoch": 0.83, "learning_rate": 3.5260684343049993e-06, "loss": 0.5412, "step": 61890 }, { "epoch": 0.83, "learning_rate": 3.5233747249092427e-06, "loss": 1.0996, "step": 61895 }, { "epoch": 0.83, "learning_rate": 3.5206819668205382e-06, "loss": 0.7295, "step": 61900 }, { "epoch": 0.83, "learning_rate": 3.517990160158169e-06, "loss": 0.5203, "step": 61905 }, { "epoch": 0.83, "learning_rate": 3.515299305041364e-06, "loss": 0.4631, "step": 61910 }, { "epoch": 0.83, "learning_rate": 3.512609401589312e-06, "loss": 0.7838, "step": 61915 }, { "epoch": 0.83, "learning_rate": 3.5099204499211695e-06, "loss": 0.6928, "step": 61920 }, { "epoch": 0.83, "learning_rate": 3.5072324501560394e-06, "loss": 1.173, "step": 61925 }, { "epoch": 0.83, "learning_rate": 3.5045454024129813e-06, "loss": 0.8221, "step": 61930 }, { "epoch": 0.83, "learning_rate": 3.501859306811031e-06, "loss": 0.348, "step": 61935 }, { "epoch": 0.83, "learning_rate": 3.49917416346916e-06, "loss": 0.5753, "step": 61940 }, { "epoch": 0.83, "learning_rate": 3.4964899725063063e-06, "loss": 0.4348, "step": 61945 }, { "epoch": 0.83, "learning_rate": 3.493806734041366e-06, "loss": 0.159, "step": 61950 }, { "epoch": 0.83, "learning_rate": 3.4911244481932003e-06, "loss": 0.399, "step": 61955 }, { "epoch": 0.83, "learning_rate": 3.488443115080614e-06, "loss": 1.0892, "step": 61960 }, { "epoch": 0.83, "learning_rate": 3.485762734822373e-06, "loss": 0.5862, "step": 61965 }, { "epoch": 0.83, "learning_rate": 3.483083307537224e-06, "loss": 1.424, "step": 61970 }, { "epoch": 0.83, "learning_rate": 3.4804048333438253e-06, "loss": 1.2041, "step": 61975 }, { "epoch": 0.83, "learning_rate": 3.477727312360843e-06, "loss": 0.8848, "step": 61980 }, { "epoch": 0.83, "learning_rate": 3.4750507447068647e-06, "loss": 0.1281, "step": 61985 }, { "epoch": 0.83, "learning_rate": 3.4723751305004463e-06, "loss": 0.7471, "step": 61990 }, { "epoch": 0.83, "learning_rate": 3.4697004698601182e-06, "loss": 0.8685, "step": 61995 }, { "epoch": 0.83, "learning_rate": 3.467026762904346e-06, "loss": 0.7882, "step": 62000 }, { "epoch": 0.83, "learning_rate": 3.464354009751561e-06, "loss": 0.7236, "step": 62005 }, { "epoch": 0.83, "learning_rate": 3.461682210520148e-06, "loss": 0.7465, "step": 62010 }, { "epoch": 0.83, "learning_rate": 3.4590113653284682e-06, "loss": 1.1838, "step": 62015 }, { "epoch": 0.83, "learning_rate": 3.4563414742948163e-06, "loss": 0.5474, "step": 62020 }, { "epoch": 0.83, "learning_rate": 3.453672537537453e-06, "loss": 0.7954, "step": 62025 }, { "epoch": 0.83, "learning_rate": 3.4510045551746084e-06, "loss": 0.5593, "step": 62030 }, { "epoch": 0.83, "learning_rate": 3.4483375273244576e-06, "loss": 1.204, "step": 62035 }, { "epoch": 0.83, "learning_rate": 3.445671454105129e-06, "loss": 0.9322, "step": 62040 }, { "epoch": 0.83, "learning_rate": 3.443006335634727e-06, "loss": 0.9591, "step": 62045 }, { "epoch": 0.83, "learning_rate": 3.4403421720312966e-06, "loss": 0.5863, "step": 62050 }, { "epoch": 0.83, "learning_rate": 3.437678963412849e-06, "loss": 0.892, "step": 62055 }, { "epoch": 0.83, "learning_rate": 3.4350167098973455e-06, "loss": 1.0627, "step": 62060 }, { "epoch": 0.83, "learning_rate": 3.4323554116027195e-06, "loss": 0.7612, "step": 62065 }, { "epoch": 0.83, "learning_rate": 3.4296950686468514e-06, "loss": 0.9125, "step": 62070 }, { "epoch": 0.83, "learning_rate": 3.4270356811475723e-06, "loss": 0.1515, "step": 62075 }, { "epoch": 0.83, "learning_rate": 3.4243772492226987e-06, "loss": 0.6709, "step": 62080 }, { "epoch": 0.83, "learning_rate": 3.421719772989962e-06, "loss": 0.7772, "step": 62085 }, { "epoch": 0.83, "learning_rate": 3.4190632525670925e-06, "loss": 0.3331, "step": 62090 }, { "epoch": 0.83, "learning_rate": 3.4164076880717542e-06, "loss": 0.6976, "step": 62095 }, { "epoch": 0.83, "learning_rate": 3.4137530796215705e-06, "loss": 0.7289, "step": 62100 }, { "epoch": 0.83, "learning_rate": 3.4110994273341384e-06, "loss": 1.484, "step": 62105 }, { "epoch": 0.83, "learning_rate": 3.4084467313269946e-06, "loss": 0.9483, "step": 62110 }, { "epoch": 0.83, "learning_rate": 3.4057949917176425e-06, "loss": 0.5191, "step": 62115 }, { "epoch": 0.83, "learning_rate": 3.4031442086235348e-06, "loss": 0.634, "step": 62120 }, { "epoch": 0.83, "learning_rate": 3.4004943821620976e-06, "loss": 0.948, "step": 62125 }, { "epoch": 0.83, "learning_rate": 3.397845512450701e-06, "loss": 0.9477, "step": 62130 }, { "epoch": 0.83, "learning_rate": 3.39519759960667e-06, "loss": 0.7376, "step": 62135 }, { "epoch": 0.83, "learning_rate": 3.3925506437473055e-06, "loss": 0.7289, "step": 62140 }, { "epoch": 0.83, "learning_rate": 3.3899046449898497e-06, "loss": 0.5731, "step": 62145 }, { "epoch": 0.83, "learning_rate": 3.387259603451498e-06, "loss": 1.2387, "step": 62150 }, { "epoch": 0.83, "learning_rate": 3.384615519249429e-06, "loss": 0.3637, "step": 62155 }, { "epoch": 0.83, "learning_rate": 3.3819723925007542e-06, "loss": 0.6807, "step": 62160 }, { "epoch": 0.83, "learning_rate": 3.3793302233225493e-06, "loss": 0.2885, "step": 62165 }, { "epoch": 0.83, "learning_rate": 3.3766890118318463e-06, "loss": 0.5937, "step": 62170 }, { "epoch": 0.83, "learning_rate": 3.3740487581456455e-06, "loss": 0.9689, "step": 62175 }, { "epoch": 0.83, "learning_rate": 3.371409462380895e-06, "loss": 0.5707, "step": 62180 }, { "epoch": 0.83, "learning_rate": 3.368771124654496e-06, "loss": 1.3577, "step": 62185 }, { "epoch": 0.83, "learning_rate": 3.3661337450833304e-06, "loss": 0.3919, "step": 62190 }, { "epoch": 0.83, "learning_rate": 3.3634973237841956e-06, "loss": 0.4648, "step": 62195 }, { "epoch": 0.83, "learning_rate": 3.360861860873893e-06, "loss": 0.5262, "step": 62200 }, { "epoch": 0.83, "learning_rate": 3.3582273564691512e-06, "loss": 1.0055, "step": 62205 }, { "epoch": 0.83, "learning_rate": 3.3555938106866607e-06, "loss": 0.7243, "step": 62210 }, { "epoch": 0.83, "learning_rate": 3.352961223643089e-06, "loss": 0.4595, "step": 62215 }, { "epoch": 0.83, "learning_rate": 3.3503295954550373e-06, "loss": 0.271, "step": 62220 }, { "epoch": 0.83, "learning_rate": 3.3476989262390736e-06, "loss": 0.339, "step": 62225 }, { "epoch": 0.83, "learning_rate": 3.3450692161117208e-06, "loss": 0.6614, "step": 62230 }, { "epoch": 0.83, "learning_rate": 3.34244046518947e-06, "loss": 0.4679, "step": 62235 }, { "epoch": 0.83, "learning_rate": 3.3398126735887547e-06, "loss": 0.3321, "step": 62240 }, { "epoch": 0.83, "learning_rate": 3.3371858414259743e-06, "loss": 0.4302, "step": 62245 }, { "epoch": 0.83, "learning_rate": 3.3345599688174883e-06, "loss": 0.38, "step": 62250 }, { "epoch": 0.83, "learning_rate": 3.331935055879609e-06, "loss": 1.2823, "step": 62255 }, { "epoch": 0.83, "learning_rate": 3.329311102728597e-06, "loss": 0.3473, "step": 62260 }, { "epoch": 0.83, "learning_rate": 3.326688109480694e-06, "loss": 0.7661, "step": 62265 }, { "epoch": 0.83, "learning_rate": 3.3240660762520802e-06, "loss": 0.4852, "step": 62270 }, { "epoch": 0.83, "learning_rate": 3.321445003158899e-06, "loss": 0.607, "step": 62275 }, { "epoch": 0.83, "learning_rate": 3.3188248903172432e-06, "loss": 0.3419, "step": 62280 }, { "epoch": 0.83, "learning_rate": 3.316205737843181e-06, "loss": 1.1691, "step": 62285 }, { "epoch": 0.83, "learning_rate": 3.3135875458527254e-06, "loss": 0.4593, "step": 62290 }, { "epoch": 0.83, "learning_rate": 3.310970314461842e-06, "loss": 0.7362, "step": 62295 }, { "epoch": 0.83, "learning_rate": 3.3083540437864796e-06, "loss": 0.638, "step": 62300 }, { "epoch": 0.83, "learning_rate": 3.305738733942501e-06, "loss": 0.2299, "step": 62305 }, { "epoch": 0.83, "learning_rate": 3.3031243850457695e-06, "loss": 0.5546, "step": 62310 }, { "epoch": 0.83, "learning_rate": 3.3005109972120805e-06, "loss": 0.5924, "step": 62315 }, { "epoch": 0.83, "learning_rate": 3.2978985705571926e-06, "loss": 0.5949, "step": 62320 }, { "epoch": 0.84, "learning_rate": 3.2952871051968286e-06, "loss": 0.7182, "step": 62325 }, { "epoch": 0.84, "learning_rate": 3.292676601246661e-06, "loss": 0.5261, "step": 62330 }, { "epoch": 0.84, "learning_rate": 3.290067058822316e-06, "loss": 1.0334, "step": 62335 }, { "epoch": 0.84, "learning_rate": 3.287458478039393e-06, "loss": 0.6972, "step": 62340 }, { "epoch": 0.84, "learning_rate": 3.2848508590134384e-06, "loss": 1.1719, "step": 62345 }, { "epoch": 0.84, "learning_rate": 3.282244201859952e-06, "loss": 0.7442, "step": 62350 }, { "epoch": 0.84, "learning_rate": 3.279638506694391e-06, "loss": 0.5595, "step": 62355 }, { "epoch": 0.84, "learning_rate": 3.277033773632185e-06, "loss": 1.0489, "step": 62360 }, { "epoch": 0.84, "learning_rate": 3.2744300027887085e-06, "loss": 1.0841, "step": 62365 }, { "epoch": 0.84, "learning_rate": 3.2718271942792866e-06, "loss": 0.7904, "step": 62370 }, { "epoch": 0.84, "learning_rate": 3.269225348219221e-06, "loss": 0.9221, "step": 62375 }, { "epoch": 0.84, "learning_rate": 3.266624464723761e-06, "loss": 0.4651, "step": 62380 }, { "epoch": 0.84, "learning_rate": 3.2640245439081063e-06, "loss": 0.6949, "step": 62385 }, { "epoch": 0.84, "learning_rate": 3.261425585887415e-06, "loss": 0.3542, "step": 62390 }, { "epoch": 0.84, "learning_rate": 3.258827590776825e-06, "loss": 0.6162, "step": 62395 }, { "epoch": 0.84, "learning_rate": 3.2562305586914003e-06, "loss": 0.6714, "step": 62400 }, { "epoch": 0.84, "learning_rate": 3.2536344897461794e-06, "loss": 1.3421, "step": 62405 }, { "epoch": 0.84, "learning_rate": 3.2510393840561676e-06, "loss": 1.4775, "step": 62410 }, { "epoch": 0.84, "learning_rate": 3.248445241736295e-06, "loss": 1.0691, "step": 62415 }, { "epoch": 0.84, "learning_rate": 3.2458520629014803e-06, "loss": 0.4956, "step": 62420 }, { "epoch": 0.84, "learning_rate": 3.2432598476665883e-06, "loss": 0.1464, "step": 62425 }, { "epoch": 0.84, "learning_rate": 3.2406685961464344e-06, "loss": 1.1301, "step": 62430 }, { "epoch": 0.84, "learning_rate": 3.238078308455808e-06, "loss": 0.3406, "step": 62435 }, { "epoch": 0.84, "learning_rate": 3.2354889847094422e-06, "loss": 0.839, "step": 62440 }, { "epoch": 0.84, "learning_rate": 3.232900625022023e-06, "loss": 0.7109, "step": 62445 }, { "epoch": 0.84, "learning_rate": 3.2303132295082166e-06, "loss": 0.7309, "step": 62450 }, { "epoch": 0.84, "learning_rate": 3.227726798282621e-06, "loss": 0.7733, "step": 62455 }, { "epoch": 0.84, "learning_rate": 3.225141331459805e-06, "loss": 0.7287, "step": 62460 }, { "epoch": 0.84, "learning_rate": 3.2225568291542886e-06, "loss": 0.7192, "step": 62465 }, { "epoch": 0.84, "learning_rate": 3.21997329148056e-06, "loss": 1.0041, "step": 62470 }, { "epoch": 0.84, "learning_rate": 3.217390718553054e-06, "loss": 0.4966, "step": 62475 }, { "epoch": 0.84, "learning_rate": 3.2148091104861553e-06, "loss": 0.8997, "step": 62480 }, { "epoch": 0.84, "learning_rate": 3.212228467394232e-06, "loss": 0.2916, "step": 62485 }, { "epoch": 0.84, "learning_rate": 3.2096487893915893e-06, "loss": 0.5155, "step": 62490 }, { "epoch": 0.84, "learning_rate": 3.207070076592489e-06, "loss": 0.6969, "step": 62495 }, { "epoch": 0.84, "learning_rate": 3.2044923291111527e-06, "loss": 0.4038, "step": 62500 }, { "epoch": 0.84, "learning_rate": 3.2019155470617707e-06, "loss": 1.1576, "step": 62505 }, { "epoch": 0.84, "learning_rate": 3.1993397305584818e-06, "loss": 0.7016, "step": 62510 }, { "epoch": 0.84, "learning_rate": 3.1967648797153666e-06, "loss": 0.1894, "step": 62515 }, { "epoch": 0.84, "learning_rate": 3.194190994646504e-06, "loss": 0.5866, "step": 62520 }, { "epoch": 0.84, "learning_rate": 3.191618075465877e-06, "loss": 0.9337, "step": 62525 }, { "epoch": 0.84, "learning_rate": 3.18904612228747e-06, "loss": 0.6147, "step": 62530 }, { "epoch": 0.84, "learning_rate": 3.1864751352252057e-06, "loss": 1.0823, "step": 62535 }, { "epoch": 0.84, "learning_rate": 3.183905114392957e-06, "loss": 0.9445, "step": 62540 }, { "epoch": 0.84, "learning_rate": 3.1813360599045714e-06, "loss": 1.2931, "step": 62545 }, { "epoch": 0.84, "learning_rate": 3.1787679718738474e-06, "loss": 0.4718, "step": 62550 }, { "epoch": 0.84, "learning_rate": 3.176200850414526e-06, "loss": 0.9596, "step": 62555 }, { "epoch": 0.84, "learning_rate": 3.1736346956403317e-06, "loss": 1.3461, "step": 62560 }, { "epoch": 0.84, "learning_rate": 3.171069507664928e-06, "loss": 0.7011, "step": 62565 }, { "epoch": 0.84, "learning_rate": 3.168505286601936e-06, "loss": 1.2673, "step": 62570 }, { "epoch": 0.84, "learning_rate": 3.1659420325649363e-06, "loss": 0.9725, "step": 62575 }, { "epoch": 0.84, "learning_rate": 3.1633797456674774e-06, "loss": 1.5407, "step": 62580 }, { "epoch": 0.84, "learning_rate": 3.1608184260230516e-06, "loss": 0.7147, "step": 62585 }, { "epoch": 0.84, "learning_rate": 3.1582580737451046e-06, "loss": 1.016, "step": 62590 }, { "epoch": 0.84, "learning_rate": 3.155698688947059e-06, "loss": 0.4947, "step": 62595 }, { "epoch": 0.84, "learning_rate": 3.1531402717422804e-06, "loss": 0.6853, "step": 62600 }, { "epoch": 0.84, "learning_rate": 3.1505828222440887e-06, "loss": 1.543, "step": 62605 }, { "epoch": 0.84, "learning_rate": 3.1480263405657655e-06, "loss": 0.337, "step": 62610 }, { "epoch": 0.84, "learning_rate": 3.145470826820557e-06, "loss": 1.3477, "step": 62615 }, { "epoch": 0.84, "learning_rate": 3.1429162811216577e-06, "loss": 0.524, "step": 62620 }, { "epoch": 0.84, "learning_rate": 3.140362703582214e-06, "loss": 0.5558, "step": 62625 }, { "epoch": 0.84, "learning_rate": 3.1378100943153523e-06, "loss": 0.6008, "step": 62630 }, { "epoch": 0.84, "learning_rate": 3.1352584534341173e-06, "loss": 1.0584, "step": 62635 }, { "epoch": 0.84, "learning_rate": 3.1327077810515553e-06, "loss": 0.6834, "step": 62640 }, { "epoch": 0.84, "learning_rate": 3.1301580772806398e-06, "loss": 1.3139, "step": 62645 }, { "epoch": 0.84, "learning_rate": 3.1276093422343055e-06, "loss": 1.0242, "step": 62650 }, { "epoch": 0.84, "learning_rate": 3.1250615760254566e-06, "loss": 0.5502, "step": 62655 }, { "epoch": 0.84, "learning_rate": 3.122514778766944e-06, "loss": 0.8116, "step": 62660 }, { "epoch": 0.84, "learning_rate": 3.1199689505715723e-06, "loss": 0.7748, "step": 62665 }, { "epoch": 0.84, "learning_rate": 3.117424091552118e-06, "loss": 0.9865, "step": 62670 }, { "epoch": 0.84, "learning_rate": 3.114880201821302e-06, "loss": 0.6959, "step": 62675 }, { "epoch": 0.84, "learning_rate": 3.1123372814918033e-06, "loss": 0.3765, "step": 62680 }, { "epoch": 0.84, "learning_rate": 3.10979533067626e-06, "loss": 0.7529, "step": 62685 }, { "epoch": 0.84, "learning_rate": 3.1072543494872737e-06, "loss": 1.335, "step": 62690 }, { "epoch": 0.84, "learning_rate": 3.1047143380373955e-06, "loss": 0.9942, "step": 62695 }, { "epoch": 0.84, "learning_rate": 3.1021752964391276e-06, "loss": 0.7166, "step": 62700 }, { "epoch": 0.84, "learning_rate": 3.0996372248049467e-06, "loss": 1.1891, "step": 62705 }, { "epoch": 0.84, "learning_rate": 3.0971001232472736e-06, "loss": 0.8579, "step": 62710 }, { "epoch": 0.84, "learning_rate": 3.094563991878488e-06, "loss": 0.1979, "step": 62715 }, { "epoch": 0.84, "learning_rate": 3.0920288308109226e-06, "loss": 1.3022, "step": 62720 }, { "epoch": 0.84, "learning_rate": 3.0894946401568843e-06, "loss": 0.781, "step": 62725 }, { "epoch": 0.84, "learning_rate": 3.0869614200286167e-06, "loss": 1.219, "step": 62730 }, { "epoch": 0.84, "learning_rate": 3.0844291705383278e-06, "loss": 0.4883, "step": 62735 }, { "epoch": 0.84, "learning_rate": 3.0818978917981966e-06, "loss": 0.928, "step": 62740 }, { "epoch": 0.84, "learning_rate": 3.079367583920323e-06, "loss": 0.9586, "step": 62745 }, { "epoch": 0.84, "learning_rate": 3.076838247016803e-06, "loss": 0.4389, "step": 62750 }, { "epoch": 0.84, "learning_rate": 3.0743098811996775e-06, "loss": 0.584, "step": 62755 }, { "epoch": 0.84, "learning_rate": 3.0717824865809263e-06, "loss": 0.8378, "step": 62760 }, { "epoch": 0.84, "learning_rate": 3.0692560632725133e-06, "loss": 0.3825, "step": 62765 }, { "epoch": 0.84, "learning_rate": 3.066730611386337e-06, "loss": 0.8702, "step": 62770 }, { "epoch": 0.84, "learning_rate": 3.064206131034264e-06, "loss": 0.7292, "step": 62775 }, { "epoch": 0.84, "learning_rate": 3.0616826223281216e-06, "loss": 0.8292, "step": 62780 }, { "epoch": 0.84, "learning_rate": 3.0591600853796836e-06, "loss": 1.2448, "step": 62785 }, { "epoch": 0.84, "learning_rate": 3.056638520300689e-06, "loss": 0.6532, "step": 62790 }, { "epoch": 0.84, "learning_rate": 3.0541179272028238e-06, "loss": 0.5711, "step": 62795 }, { "epoch": 0.84, "learning_rate": 3.0515983061977476e-06, "loss": 0.6655, "step": 62800 }, { "epoch": 0.84, "learning_rate": 3.0490796573970636e-06, "loss": 0.4694, "step": 62805 }, { "epoch": 0.84, "learning_rate": 3.046561980912327e-06, "loss": 1.0462, "step": 62810 }, { "epoch": 0.84, "learning_rate": 3.0440452768550704e-06, "loss": 0.8374, "step": 62815 }, { "epoch": 0.84, "learning_rate": 3.041529545336766e-06, "loss": 0.8304, "step": 62820 }, { "epoch": 0.84, "learning_rate": 3.039014786468847e-06, "loss": 1.3856, "step": 62825 }, { "epoch": 0.84, "learning_rate": 3.0365010003627015e-06, "loss": 0.5751, "step": 62830 }, { "epoch": 0.84, "learning_rate": 3.0339881871296855e-06, "loss": 1.0317, "step": 62835 }, { "epoch": 0.84, "learning_rate": 3.0314763468811015e-06, "loss": 0.5375, "step": 62840 }, { "epoch": 0.84, "learning_rate": 3.0289654797282048e-06, "loss": 0.7761, "step": 62845 }, { "epoch": 0.84, "learning_rate": 3.0264555857822314e-06, "loss": 1.0256, "step": 62850 }, { "epoch": 0.84, "learning_rate": 3.0239466651543342e-06, "loss": 0.8626, "step": 62855 }, { "epoch": 0.84, "learning_rate": 3.0214387179556574e-06, "loss": 0.5495, "step": 62860 }, { "epoch": 0.84, "learning_rate": 3.018931744297299e-06, "loss": 0.7838, "step": 62865 }, { "epoch": 0.84, "learning_rate": 3.0164257442902856e-06, "loss": 0.9287, "step": 62870 }, { "epoch": 0.84, "learning_rate": 3.0139207180456373e-06, "loss": 0.8523, "step": 62875 }, { "epoch": 0.84, "learning_rate": 3.0114166656743105e-06, "loss": 0.6775, "step": 62880 }, { "epoch": 0.84, "learning_rate": 3.0089135872872127e-06, "loss": 0.5352, "step": 62885 }, { "epoch": 0.84, "learning_rate": 3.0064114829952307e-06, "loss": 1.192, "step": 62890 }, { "epoch": 0.84, "learning_rate": 3.0039103529091895e-06, "loss": 0.3403, "step": 62895 }, { "epoch": 0.84, "learning_rate": 3.0014101971398754e-06, "loss": 1.11, "step": 62900 }, { "epoch": 0.84, "learning_rate": 2.998911015798031e-06, "loss": 0.8637, "step": 62905 }, { "epoch": 0.84, "learning_rate": 2.9964128089943643e-06, "loss": 0.4177, "step": 62910 }, { "epoch": 0.84, "learning_rate": 2.9939155768395316e-06, "loss": 0.5086, "step": 62915 }, { "epoch": 0.84, "learning_rate": 2.9914193194441385e-06, "loss": 0.6564, "step": 62920 }, { "epoch": 0.84, "learning_rate": 2.9889240369187722e-06, "loss": 0.6193, "step": 62925 }, { "epoch": 0.84, "learning_rate": 2.986429729373949e-06, "loss": 0.3712, "step": 62930 }, { "epoch": 0.84, "learning_rate": 2.9839363969201618e-06, "loss": 1.1306, "step": 62935 }, { "epoch": 0.84, "learning_rate": 2.981444039667841e-06, "loss": 0.9176, "step": 62940 }, { "epoch": 0.84, "learning_rate": 2.9789526577274017e-06, "loss": 0.6179, "step": 62945 }, { "epoch": 0.84, "learning_rate": 2.9764622512091915e-06, "loss": 1.0626, "step": 62950 }, { "epoch": 0.84, "learning_rate": 2.9739728202235166e-06, "loss": 0.8651, "step": 62955 }, { "epoch": 0.84, "learning_rate": 2.971484364880667e-06, "loss": 1.3979, "step": 62960 }, { "epoch": 0.84, "learning_rate": 2.9689968852908397e-06, "loss": 0.4968, "step": 62965 }, { "epoch": 0.84, "learning_rate": 2.966510381564236e-06, "loss": 0.8759, "step": 62970 }, { "epoch": 0.84, "learning_rate": 2.964024853811001e-06, "loss": 0.1869, "step": 62975 }, { "epoch": 0.84, "learning_rate": 2.9615403021412138e-06, "loss": 0.7409, "step": 62980 }, { "epoch": 0.84, "learning_rate": 2.9590567266649383e-06, "loss": 0.5801, "step": 62985 }, { "epoch": 0.84, "learning_rate": 2.9565741274921842e-06, "loss": 0.3952, "step": 62990 }, { "epoch": 0.84, "learning_rate": 2.954092504732911e-06, "loss": 1.3062, "step": 62995 }, { "epoch": 0.84, "learning_rate": 2.9516118584970553e-06, "loss": 1.2791, "step": 63000 }, { "epoch": 0.84, "learning_rate": 2.9491321888944877e-06, "loss": 0.9656, "step": 63005 }, { "epoch": 0.84, "learning_rate": 2.9466534960350455e-06, "loss": 1.4787, "step": 63010 }, { "epoch": 0.84, "learning_rate": 2.9441757800285212e-06, "loss": 0.5765, "step": 63015 }, { "epoch": 0.84, "learning_rate": 2.9416990409846716e-06, "loss": 0.7269, "step": 63020 }, { "epoch": 0.84, "learning_rate": 2.9392232790132006e-06, "loss": 1.058, "step": 63025 }, { "epoch": 0.84, "learning_rate": 2.9367484942237676e-06, "loss": 1.0739, "step": 63030 }, { "epoch": 0.84, "learning_rate": 2.9342746867260075e-06, "loss": 0.4557, "step": 63035 }, { "epoch": 0.84, "learning_rate": 2.9318018566294763e-06, "loss": 0.5588, "step": 63040 }, { "epoch": 0.84, "learning_rate": 2.929330004043726e-06, "loss": 0.4609, "step": 63045 }, { "epoch": 0.84, "learning_rate": 2.9268591290782326e-06, "loss": 1.1216, "step": 63050 }, { "epoch": 0.84, "learning_rate": 2.924389231842459e-06, "loss": 1.3109, "step": 63055 }, { "epoch": 0.84, "learning_rate": 2.9219203124458e-06, "loss": 0.6079, "step": 63060 }, { "epoch": 0.84, "learning_rate": 2.9194523709976134e-06, "loss": 0.6963, "step": 63065 }, { "epoch": 0.85, "learning_rate": 2.916985407607231e-06, "loss": 0.4603, "step": 63070 }, { "epoch": 0.85, "learning_rate": 2.9145194223839073e-06, "loss": 0.7473, "step": 63075 }, { "epoch": 0.85, "learning_rate": 2.912054415436882e-06, "loss": 0.9818, "step": 63080 }, { "epoch": 0.85, "learning_rate": 2.909590386875358e-06, "loss": 0.6975, "step": 63085 }, { "epoch": 0.85, "learning_rate": 2.907127336808449e-06, "loss": 0.6686, "step": 63090 }, { "epoch": 0.85, "learning_rate": 2.90466526534528e-06, "loss": 0.5612, "step": 63095 }, { "epoch": 0.85, "learning_rate": 2.9022041725948994e-06, "loss": 1.5458, "step": 63100 }, { "epoch": 0.85, "learning_rate": 2.8997440586663175e-06, "loss": 0.8496, "step": 63105 }, { "epoch": 0.85, "learning_rate": 2.8972849236685168e-06, "loss": 1.0003, "step": 63110 }, { "epoch": 0.85, "learning_rate": 2.894826767710415e-06, "loss": 0.8006, "step": 63115 }, { "epoch": 0.85, "learning_rate": 2.892369590900901e-06, "loss": 0.6709, "step": 63120 }, { "epoch": 0.85, "learning_rate": 2.889913393348806e-06, "loss": 0.7837, "step": 63125 }, { "epoch": 0.85, "learning_rate": 2.887458175162938e-06, "loss": 1.4779, "step": 63130 }, { "epoch": 0.85, "learning_rate": 2.8850039364520494e-06, "loss": 0.7483, "step": 63135 }, { "epoch": 0.85, "learning_rate": 2.8825506773248438e-06, "loss": 0.1855, "step": 63140 }, { "epoch": 0.85, "learning_rate": 2.880098397890002e-06, "loss": 0.8574, "step": 63145 }, { "epoch": 0.85, "learning_rate": 2.877647098256128e-06, "loss": 0.5156, "step": 63150 }, { "epoch": 0.85, "learning_rate": 2.875196778531822e-06, "loss": 0.5134, "step": 63155 }, { "epoch": 0.85, "learning_rate": 2.8727474388256013e-06, "loss": 1.1762, "step": 63160 }, { "epoch": 0.85, "learning_rate": 2.8702990792459775e-06, "loss": 0.3577, "step": 63165 }, { "epoch": 0.85, "learning_rate": 2.867851699901394e-06, "loss": 0.6014, "step": 63170 }, { "epoch": 0.85, "learning_rate": 2.8654053009002506e-06, "loss": 0.6445, "step": 63175 }, { "epoch": 0.85, "learning_rate": 2.8629598823509214e-06, "loss": 0.7287, "step": 63180 }, { "epoch": 0.85, "learning_rate": 2.860515444361722e-06, "loss": 0.8493, "step": 63185 }, { "epoch": 0.85, "learning_rate": 2.858071987040922e-06, "loss": 0.8706, "step": 63190 }, { "epoch": 0.85, "learning_rate": 2.855629510496771e-06, "loss": 0.8765, "step": 63195 }, { "epoch": 0.85, "learning_rate": 2.8531880148374377e-06, "loss": 0.5785, "step": 63200 }, { "epoch": 0.85, "learning_rate": 2.8507475001710833e-06, "loss": 1.3784, "step": 63205 }, { "epoch": 0.85, "learning_rate": 2.8483079666058066e-06, "loss": 0.3205, "step": 63210 }, { "epoch": 0.85, "learning_rate": 2.845869414249658e-06, "loss": 0.5623, "step": 63215 }, { "epoch": 0.85, "learning_rate": 2.843431843210667e-06, "loss": 0.438, "step": 63220 }, { "epoch": 0.85, "learning_rate": 2.840995253596801e-06, "loss": 0.763, "step": 63225 }, { "epoch": 0.85, "learning_rate": 2.838559645515987e-06, "loss": 0.3695, "step": 63230 }, { "epoch": 0.85, "learning_rate": 2.8361250190761026e-06, "loss": 0.6601, "step": 63235 }, { "epoch": 0.85, "learning_rate": 2.8336913743850056e-06, "loss": 0.3364, "step": 63240 }, { "epoch": 0.85, "learning_rate": 2.831258711550483e-06, "loss": 0.3412, "step": 63245 }, { "epoch": 0.85, "learning_rate": 2.8288270306802923e-06, "loss": 0.915, "step": 63250 }, { "epoch": 0.85, "learning_rate": 2.82639633188215e-06, "loss": 1.0365, "step": 63255 }, { "epoch": 0.85, "learning_rate": 2.8239666152637124e-06, "loss": 0.5563, "step": 63260 }, { "epoch": 0.85, "learning_rate": 2.821537880932615e-06, "loss": 0.7036, "step": 63265 }, { "epoch": 0.85, "learning_rate": 2.8191101289964302e-06, "loss": 1.4036, "step": 63270 }, { "epoch": 0.85, "learning_rate": 2.816683359562702e-06, "loss": 0.6914, "step": 63275 }, { "epoch": 0.85, "learning_rate": 2.8142575727389237e-06, "loss": 0.6421, "step": 63280 }, { "epoch": 0.85, "learning_rate": 2.8118327686325356e-06, "loss": 0.5377, "step": 63285 }, { "epoch": 0.85, "learning_rate": 2.8094089473509585e-06, "loss": 0.7539, "step": 63290 }, { "epoch": 0.85, "learning_rate": 2.806986109001547e-06, "loss": 0.2708, "step": 63295 }, { "epoch": 0.85, "learning_rate": 2.8045642536916215e-06, "loss": 0.6385, "step": 63300 }, { "epoch": 0.85, "learning_rate": 2.802143381528466e-06, "loss": 0.7592, "step": 63305 }, { "epoch": 0.85, "learning_rate": 2.799723492619297e-06, "loss": 0.8232, "step": 63310 }, { "epoch": 0.85, "learning_rate": 2.79730458707132e-06, "loss": 0.3576, "step": 63315 }, { "epoch": 0.85, "learning_rate": 2.7948866649916694e-06, "loss": 0.5569, "step": 63320 }, { "epoch": 0.85, "learning_rate": 2.7924697264874484e-06, "loss": 0.7552, "step": 63325 }, { "epoch": 0.85, "learning_rate": 2.7900537716657237e-06, "loss": 0.2136, "step": 63330 }, { "epoch": 0.85, "learning_rate": 2.787638800633502e-06, "loss": 0.2524, "step": 63335 }, { "epoch": 0.85, "learning_rate": 2.7852248134977552e-06, "loss": 0.7531, "step": 63340 }, { "epoch": 0.85, "learning_rate": 2.78281181036541e-06, "loss": 0.7992, "step": 63345 }, { "epoch": 0.85, "learning_rate": 2.780399791343358e-06, "loss": 0.9275, "step": 63350 }, { "epoch": 0.85, "learning_rate": 2.77798875653843e-06, "loss": 0.3334, "step": 63355 }, { "epoch": 0.85, "learning_rate": 2.7755787060574244e-06, "loss": 0.4549, "step": 63360 }, { "epoch": 0.85, "learning_rate": 2.7731696400071087e-06, "loss": 0.7922, "step": 63365 }, { "epoch": 0.85, "learning_rate": 2.770761558494167e-06, "loss": 0.6937, "step": 63370 }, { "epoch": 0.85, "learning_rate": 2.768354461625286e-06, "loss": 0.7798, "step": 63375 }, { "epoch": 0.85, "learning_rate": 2.765948349507075e-06, "loss": 0.5206, "step": 63380 }, { "epoch": 0.85, "learning_rate": 2.763543222246126e-06, "loss": 0.9443, "step": 63385 }, { "epoch": 0.85, "learning_rate": 2.761139079948963e-06, "loss": 0.8925, "step": 63390 }, { "epoch": 0.85, "learning_rate": 2.7587359227220804e-06, "loss": 0.7188, "step": 63395 }, { "epoch": 0.85, "learning_rate": 2.756333750671927e-06, "loss": 0.4289, "step": 63400 }, { "epoch": 0.85, "learning_rate": 2.7539325639049095e-06, "loss": 1.3514, "step": 63405 }, { "epoch": 0.85, "learning_rate": 2.7515323625273815e-06, "loss": 1.0531, "step": 63410 }, { "epoch": 0.85, "learning_rate": 2.7491331466456744e-06, "loss": 0.6467, "step": 63415 }, { "epoch": 0.85, "learning_rate": 2.7467349163660422e-06, "loss": 0.8542, "step": 63420 }, { "epoch": 0.85, "learning_rate": 2.744337671794725e-06, "loss": 1.002, "step": 63425 }, { "epoch": 0.85, "learning_rate": 2.74194141303791e-06, "loss": 0.5048, "step": 63430 }, { "epoch": 0.85, "learning_rate": 2.7395461402017318e-06, "loss": 0.7373, "step": 63435 }, { "epoch": 0.85, "learning_rate": 2.7371518533922973e-06, "loss": 0.4537, "step": 63440 }, { "epoch": 0.85, "learning_rate": 2.7347585527156603e-06, "loss": 1.1664, "step": 63445 }, { "epoch": 0.85, "learning_rate": 2.732366238277828e-06, "loss": 0.8108, "step": 63450 }, { "epoch": 0.85, "learning_rate": 2.7299749101847654e-06, "loss": 0.9096, "step": 63455 }, { "epoch": 0.85, "learning_rate": 2.727584568542407e-06, "loss": 0.9442, "step": 63460 }, { "epoch": 0.85, "learning_rate": 2.725195213456627e-06, "loss": 0.8576, "step": 63465 }, { "epoch": 0.85, "learning_rate": 2.7228068450332543e-06, "loss": 0.6952, "step": 63470 }, { "epoch": 0.85, "learning_rate": 2.7204194633781018e-06, "loss": 0.202, "step": 63475 }, { "epoch": 0.85, "learning_rate": 2.7180330685968924e-06, "loss": 1.5764, "step": 63480 }, { "epoch": 0.85, "learning_rate": 2.7156476607953533e-06, "loss": 0.2613, "step": 63485 }, { "epoch": 0.85, "learning_rate": 2.7132632400791307e-06, "loss": 1.1848, "step": 63490 }, { "epoch": 0.85, "learning_rate": 2.7108798065538566e-06, "loss": 0.784, "step": 63495 }, { "epoch": 0.85, "learning_rate": 2.7084973603250965e-06, "loss": 0.7722, "step": 63500 }, { "epoch": 0.85, "learning_rate": 2.7061159014983766e-06, "loss": 1.0942, "step": 63505 }, { "epoch": 0.85, "learning_rate": 2.7037354301791966e-06, "loss": 0.7644, "step": 63510 }, { "epoch": 0.85, "learning_rate": 2.7013559464729914e-06, "loss": 0.5252, "step": 63515 }, { "epoch": 0.85, "learning_rate": 2.6989774504851572e-06, "loss": 0.4979, "step": 63520 }, { "epoch": 0.85, "learning_rate": 2.6965999423210595e-06, "loss": 1.353, "step": 63525 }, { "epoch": 0.85, "learning_rate": 2.694223422085998e-06, "loss": 0.528, "step": 63530 }, { "epoch": 0.85, "learning_rate": 2.6918478898852517e-06, "loss": 0.8691, "step": 63535 }, { "epoch": 0.85, "learning_rate": 2.689473345824037e-06, "loss": 0.7634, "step": 63540 }, { "epoch": 0.85, "learning_rate": 2.687099790007533e-06, "loss": 1.2308, "step": 63545 }, { "epoch": 0.85, "learning_rate": 2.6847272225408866e-06, "loss": 1.3921, "step": 63550 }, { "epoch": 0.85, "learning_rate": 2.682355643529183e-06, "loss": 0.3819, "step": 63555 }, { "epoch": 0.85, "learning_rate": 2.6799850530774744e-06, "loss": 0.6828, "step": 63560 }, { "epoch": 0.85, "learning_rate": 2.6776154512907574e-06, "loss": 0.7662, "step": 63565 }, { "epoch": 0.85, "learning_rate": 2.6752468382740064e-06, "loss": 0.7383, "step": 63570 }, { "epoch": 0.85, "learning_rate": 2.6728792141321346e-06, "loss": 0.7452, "step": 63575 }, { "epoch": 0.85, "learning_rate": 2.670512578970008e-06, "loss": 0.5414, "step": 63580 }, { "epoch": 0.85, "learning_rate": 2.6681469328924736e-06, "loss": 0.9087, "step": 63585 }, { "epoch": 0.85, "learning_rate": 2.665782276004297e-06, "loss": 0.5686, "step": 63590 }, { "epoch": 0.85, "learning_rate": 2.6634186084102315e-06, "loss": 0.6605, "step": 63595 }, { "epoch": 0.85, "learning_rate": 2.661055930214984e-06, "loss": 1.1939, "step": 63600 }, { "epoch": 0.85, "learning_rate": 2.6586942415231934e-06, "loss": 0.2093, "step": 63605 }, { "epoch": 0.85, "learning_rate": 2.656333542439479e-06, "loss": 1.0308, "step": 63610 }, { "epoch": 0.85, "learning_rate": 2.6539738330684044e-06, "loss": 0.8799, "step": 63615 }, { "epoch": 0.85, "learning_rate": 2.6516151135144995e-06, "loss": 0.6762, "step": 63620 }, { "epoch": 0.85, "learning_rate": 2.6492573838822423e-06, "loss": 0.7072, "step": 63625 }, { "epoch": 0.85, "learning_rate": 2.6469006442760567e-06, "loss": 0.6609, "step": 63630 }, { "epoch": 0.85, "learning_rate": 2.644544894800355e-06, "loss": 1.1464, "step": 63635 }, { "epoch": 0.85, "learning_rate": 2.6421901355594638e-06, "loss": 0.5049, "step": 63640 }, { "epoch": 0.85, "learning_rate": 2.6398363666577026e-06, "loss": 0.3081, "step": 63645 }, { "epoch": 0.85, "learning_rate": 2.637483588199324e-06, "loss": 0.2928, "step": 63650 }, { "epoch": 0.85, "learning_rate": 2.6351318002885428e-06, "loss": 0.6074, "step": 63655 }, { "epoch": 0.85, "learning_rate": 2.6327810030295414e-06, "loss": 0.8885, "step": 63660 }, { "epoch": 0.85, "learning_rate": 2.6304311965264394e-06, "loss": 0.6443, "step": 63665 }, { "epoch": 0.85, "learning_rate": 2.628082380883326e-06, "loss": 0.1889, "step": 63670 }, { "epoch": 0.85, "learning_rate": 2.6257345562042346e-06, "loss": 0.6631, "step": 63675 }, { "epoch": 0.85, "learning_rate": 2.6233877225931707e-06, "loss": 0.5305, "step": 63680 }, { "epoch": 0.85, "learning_rate": 2.621041880154085e-06, "loss": 0.9985, "step": 63685 }, { "epoch": 0.85, "learning_rate": 2.6186970289908797e-06, "loss": 0.5943, "step": 63690 }, { "epoch": 0.85, "learning_rate": 2.616353169207436e-06, "loss": 0.7153, "step": 63695 }, { "epoch": 0.85, "learning_rate": 2.6140103009075572e-06, "loss": 0.3975, "step": 63700 }, { "epoch": 0.85, "learning_rate": 2.611668424195027e-06, "loss": 0.7243, "step": 63705 }, { "epoch": 0.85, "learning_rate": 2.6093275391735894e-06, "loss": 0.8337, "step": 63710 }, { "epoch": 0.85, "learning_rate": 2.606987645946915e-06, "loss": 0.5216, "step": 63715 }, { "epoch": 0.85, "learning_rate": 2.604648744618665e-06, "loss": 0.4691, "step": 63720 }, { "epoch": 0.85, "learning_rate": 2.602310835292432e-06, "loss": 0.0588, "step": 63725 }, { "epoch": 0.85, "learning_rate": 2.59997391807178e-06, "loss": 0.8452, "step": 63730 }, { "epoch": 0.85, "learning_rate": 2.5976379930602202e-06, "loss": 0.2028, "step": 63735 }, { "epoch": 0.85, "learning_rate": 2.595303060361215e-06, "loss": 1.1913, "step": 63740 }, { "epoch": 0.85, "learning_rate": 2.5929691200782093e-06, "loss": 1.0015, "step": 63745 }, { "epoch": 0.85, "learning_rate": 2.5906361723145615e-06, "loss": 0.763, "step": 63750 }, { "epoch": 0.85, "learning_rate": 2.588304217173626e-06, "loss": 0.7306, "step": 63755 }, { "epoch": 0.85, "learning_rate": 2.5859732547586917e-06, "loss": 0.7179, "step": 63760 }, { "epoch": 0.85, "learning_rate": 2.5836432851730013e-06, "loss": 0.4793, "step": 63765 }, { "epoch": 0.85, "learning_rate": 2.581314308519775e-06, "loss": 0.8422, "step": 63770 }, { "epoch": 0.85, "learning_rate": 2.578986324902169e-06, "loss": 0.9064, "step": 63775 }, { "epoch": 0.85, "learning_rate": 2.5766593344232983e-06, "loss": 0.7745, "step": 63780 }, { "epoch": 0.85, "learning_rate": 2.5743333371862327e-06, "loss": 0.7257, "step": 63785 }, { "epoch": 0.85, "learning_rate": 2.5720083332940155e-06, "loss": 0.935, "step": 63790 }, { "epoch": 0.85, "learning_rate": 2.569684322849622e-06, "loss": 0.5778, "step": 63795 }, { "epoch": 0.85, "learning_rate": 2.567361305955995e-06, "loss": 0.6706, "step": 63800 }, { "epoch": 0.85, "learning_rate": 2.565039282716045e-06, "loss": 0.7335, "step": 63805 }, { "epoch": 0.85, "learning_rate": 2.562718253232607e-06, "loss": 0.8352, "step": 63810 }, { "epoch": 0.86, "learning_rate": 2.5603982176084977e-06, "loss": 0.7405, "step": 63815 }, { "epoch": 0.86, "learning_rate": 2.5580791759464984e-06, "loss": 1.2872, "step": 63820 }, { "epoch": 0.86, "learning_rate": 2.5557611283493073e-06, "loss": 0.6471, "step": 63825 }, { "epoch": 0.86, "learning_rate": 2.553444074919617e-06, "loss": 0.504, "step": 63830 }, { "epoch": 0.86, "learning_rate": 2.551128015760054e-06, "loss": 0.7835, "step": 63835 }, { "epoch": 0.86, "learning_rate": 2.5488129509732174e-06, "loss": 1.1682, "step": 63840 }, { "epoch": 0.86, "learning_rate": 2.5464988806616465e-06, "loss": 0.323, "step": 63845 }, { "epoch": 0.86, "learning_rate": 2.5441858049278372e-06, "loss": 0.7793, "step": 63850 }, { "epoch": 0.86, "learning_rate": 2.5418737238742636e-06, "loss": 1.1776, "step": 63855 }, { "epoch": 0.86, "learning_rate": 2.539562637603321e-06, "loss": 1.0178, "step": 63860 }, { "epoch": 0.86, "learning_rate": 2.5372525462173947e-06, "loss": 0.8051, "step": 63865 }, { "epoch": 0.86, "learning_rate": 2.5349434498187997e-06, "loss": 0.4563, "step": 63870 }, { "epoch": 0.86, "learning_rate": 2.532635348509818e-06, "loss": 1.217, "step": 63875 }, { "epoch": 0.86, "learning_rate": 2.5303282423926933e-06, "loss": 0.7121, "step": 63880 }, { "epoch": 0.86, "learning_rate": 2.528022131569616e-06, "loss": 0.3079, "step": 63885 }, { "epoch": 0.86, "learning_rate": 2.525717016142734e-06, "loss": 0.4757, "step": 63890 }, { "epoch": 0.86, "learning_rate": 2.5234128962141473e-06, "loss": 1.1582, "step": 63895 }, { "epoch": 0.86, "learning_rate": 2.5211097718859294e-06, "loss": 1.3846, "step": 63900 }, { "epoch": 0.86, "learning_rate": 2.5188076432600876e-06, "loss": 0.5416, "step": 63905 }, { "epoch": 0.86, "learning_rate": 2.5165065104385933e-06, "loss": 0.2888, "step": 63910 }, { "epoch": 0.86, "learning_rate": 2.5142063735233894e-06, "loss": 0.812, "step": 63915 }, { "epoch": 0.86, "learning_rate": 2.5119072326163423e-06, "loss": 0.5238, "step": 63920 }, { "epoch": 0.86, "learning_rate": 2.509609087819298e-06, "loss": 0.8893, "step": 63925 }, { "epoch": 0.86, "learning_rate": 2.507311939234064e-06, "loss": 0.8192, "step": 63930 }, { "epoch": 0.86, "learning_rate": 2.505015786962378e-06, "loss": 1.2611, "step": 63935 }, { "epoch": 0.86, "learning_rate": 2.502720631105954e-06, "loss": 0.5683, "step": 63940 }, { "epoch": 0.86, "learning_rate": 2.5004264717664537e-06, "loss": 0.3033, "step": 63945 }, { "epoch": 0.86, "learning_rate": 2.498133309045503e-06, "loss": 0.6481, "step": 63950 }, { "epoch": 0.86, "learning_rate": 2.495841143044675e-06, "loss": 0.8978, "step": 63955 }, { "epoch": 0.86, "learning_rate": 2.4935499738654917e-06, "loss": 0.191, "step": 63960 }, { "epoch": 0.86, "learning_rate": 2.491259801609461e-06, "loss": 0.5642, "step": 63965 }, { "epoch": 0.86, "learning_rate": 2.488970626378001e-06, "loss": 0.6096, "step": 63970 }, { "epoch": 0.86, "learning_rate": 2.4866824482725287e-06, "loss": 0.4958, "step": 63975 }, { "epoch": 0.86, "learning_rate": 2.484395267394393e-06, "loss": 0.9534, "step": 63980 }, { "epoch": 0.86, "learning_rate": 2.482109083844902e-06, "loss": 0.7234, "step": 63985 }, { "epoch": 0.86, "learning_rate": 2.4798238977253305e-06, "loss": 0.7812, "step": 63990 }, { "epoch": 0.86, "learning_rate": 2.477539709136892e-06, "loss": 0.9073, "step": 63995 }, { "epoch": 0.86, "learning_rate": 2.4752565181807715e-06, "loss": 0.6695, "step": 64000 }, { "epoch": 0.86, "learning_rate": 2.4729743249580937e-06, "loss": 0.6001, "step": 64005 }, { "epoch": 0.86, "learning_rate": 2.4706931295699565e-06, "loss": 0.894, "step": 64010 }, { "epoch": 0.86, "learning_rate": 2.468412932117406e-06, "loss": 0.486, "step": 64015 }, { "epoch": 0.86, "learning_rate": 2.466133732701434e-06, "loss": 0.9097, "step": 64020 }, { "epoch": 0.86, "learning_rate": 2.463855531423015e-06, "loss": 1.12, "step": 64025 }, { "epoch": 0.86, "learning_rate": 2.4615783283830406e-06, "loss": 1.1403, "step": 64030 }, { "epoch": 0.86, "learning_rate": 2.4593021236823914e-06, "loss": 0.2779, "step": 64035 }, { "epoch": 0.86, "learning_rate": 2.457026917421898e-06, "loss": 0.9941, "step": 64040 }, { "epoch": 0.86, "learning_rate": 2.4547527097023263e-06, "loss": 0.5464, "step": 64045 }, { "epoch": 0.86, "learning_rate": 2.4524795006244217e-06, "loss": 0.8301, "step": 64050 }, { "epoch": 0.86, "learning_rate": 2.4502072902888694e-06, "loss": 0.2072, "step": 64055 }, { "epoch": 0.86, "learning_rate": 2.4479360787963284e-06, "loss": 0.6792, "step": 64060 }, { "epoch": 0.86, "learning_rate": 2.445665866247393e-06, "loss": 0.3628, "step": 64065 }, { "epoch": 0.86, "learning_rate": 2.443396652742616e-06, "loss": 0.7521, "step": 64070 }, { "epoch": 0.86, "learning_rate": 2.441128438382534e-06, "loss": 0.7928, "step": 64075 }, { "epoch": 0.86, "learning_rate": 2.438861223267591e-06, "loss": 0.6664, "step": 64080 }, { "epoch": 0.86, "learning_rate": 2.4365950074982323e-06, "loss": 1.1133, "step": 64085 }, { "epoch": 0.86, "learning_rate": 2.434329791174836e-06, "loss": 0.9491, "step": 64090 }, { "epoch": 0.86, "learning_rate": 2.4320655743977292e-06, "loss": 0.6203, "step": 64095 }, { "epoch": 0.86, "learning_rate": 2.429802357267219e-06, "loss": 0.8266, "step": 64100 }, { "epoch": 0.86, "learning_rate": 2.4275401398835495e-06, "loss": 0.338, "step": 64105 }, { "epoch": 0.86, "learning_rate": 2.4252789223469268e-06, "loss": 0.6221, "step": 64110 }, { "epoch": 0.86, "learning_rate": 2.423018704757504e-06, "loss": 0.1711, "step": 64115 }, { "epoch": 0.86, "learning_rate": 2.420759487215407e-06, "loss": 0.6971, "step": 64120 }, { "epoch": 0.86, "learning_rate": 2.4185012698207055e-06, "loss": 0.7481, "step": 64125 }, { "epoch": 0.86, "learning_rate": 2.416244052673422e-06, "loss": 0.6469, "step": 64130 }, { "epoch": 0.86, "learning_rate": 2.413987835873549e-06, "loss": 1.3151, "step": 64135 }, { "epoch": 0.86, "learning_rate": 2.4117326195210205e-06, "loss": 0.9681, "step": 64140 }, { "epoch": 0.86, "learning_rate": 2.409478403715726e-06, "loss": 1.3921, "step": 64145 }, { "epoch": 0.86, "learning_rate": 2.4072251885575297e-06, "loss": 0.5704, "step": 64150 }, { "epoch": 0.86, "learning_rate": 2.404972974146222e-06, "loss": 0.7668, "step": 64155 }, { "epoch": 0.86, "learning_rate": 2.402721760581575e-06, "loss": 0.6639, "step": 64160 }, { "epoch": 0.86, "learning_rate": 2.4004715479632983e-06, "loss": 1.1054, "step": 64165 }, { "epoch": 0.86, "learning_rate": 2.3982223363910763e-06, "loss": 1.0268, "step": 64170 }, { "epoch": 0.86, "learning_rate": 2.3959741259645313e-06, "loss": 0.5227, "step": 64175 }, { "epoch": 0.86, "learning_rate": 2.3937269167832453e-06, "loss": 0.523, "step": 64180 }, { "epoch": 0.86, "learning_rate": 2.3914807089467696e-06, "loss": 0.3035, "step": 64185 }, { "epoch": 0.86, "learning_rate": 2.3892355025545793e-06, "loss": 0.5868, "step": 64190 }, { "epoch": 0.86, "learning_rate": 2.3869912977061454e-06, "loss": 0.5136, "step": 64195 }, { "epoch": 0.86, "learning_rate": 2.3847480945008688e-06, "loss": 0.4338, "step": 64200 }, { "epoch": 0.86, "learning_rate": 2.3825058930381035e-06, "loss": 0.6687, "step": 64205 }, { "epoch": 0.86, "learning_rate": 2.3802646934171837e-06, "loss": 0.5224, "step": 64210 }, { "epoch": 0.86, "learning_rate": 2.3780244957373714e-06, "loss": 0.507, "step": 64215 }, { "epoch": 0.86, "learning_rate": 2.375785300097902e-06, "loss": 0.9208, "step": 64220 }, { "epoch": 0.86, "learning_rate": 2.373547106597954e-06, "loss": 0.811, "step": 64225 }, { "epoch": 0.86, "learning_rate": 2.3713099153366754e-06, "loss": 0.949, "step": 64230 }, { "epoch": 0.86, "learning_rate": 2.3690737264131595e-06, "loss": 0.2529, "step": 64235 }, { "epoch": 0.86, "learning_rate": 2.3668385399264555e-06, "loss": 0.1362, "step": 64240 }, { "epoch": 0.86, "learning_rate": 2.3646043559755774e-06, "loss": 0.5529, "step": 64245 }, { "epoch": 0.86, "learning_rate": 2.362371174659486e-06, "loss": 0.2961, "step": 64250 }, { "epoch": 0.86, "learning_rate": 2.3601389960770966e-06, "loss": 1.1135, "step": 64255 }, { "epoch": 0.86, "learning_rate": 2.357907820327293e-06, "loss": 0.4399, "step": 64260 }, { "epoch": 0.86, "learning_rate": 2.3556776475088886e-06, "loss": 0.5586, "step": 64265 }, { "epoch": 0.86, "learning_rate": 2.353448477720682e-06, "loss": 0.6163, "step": 64270 }, { "epoch": 0.86, "learning_rate": 2.351220311061414e-06, "loss": 1.2626, "step": 64275 }, { "epoch": 0.86, "learning_rate": 2.3489931476297687e-06, "loss": 0.6063, "step": 64280 }, { "epoch": 0.86, "learning_rate": 2.3467669875244154e-06, "loss": 0.991, "step": 64285 }, { "epoch": 0.86, "learning_rate": 2.3445418308439494e-06, "loss": 0.528, "step": 64290 }, { "epoch": 0.86, "learning_rate": 2.3423176776869476e-06, "loss": 0.7647, "step": 64295 }, { "epoch": 0.86, "learning_rate": 2.3400945281519093e-06, "loss": 0.4268, "step": 64300 }, { "epoch": 0.86, "learning_rate": 2.337872382337325e-06, "loss": 1.2656, "step": 64305 }, { "epoch": 0.86, "learning_rate": 2.3356512403416186e-06, "loss": 0.8282, "step": 64310 }, { "epoch": 0.86, "learning_rate": 2.3334311022631726e-06, "loss": 0.6015, "step": 64315 }, { "epoch": 0.86, "learning_rate": 2.3312119682003364e-06, "loss": 0.6713, "step": 64320 }, { "epoch": 0.86, "learning_rate": 2.3289938382514006e-06, "loss": 0.752, "step": 64325 }, { "epoch": 0.86, "learning_rate": 2.3267767125146167e-06, "loss": 0.553, "step": 64330 }, { "epoch": 0.86, "learning_rate": 2.324560591088193e-06, "loss": 0.472, "step": 64335 }, { "epoch": 0.86, "learning_rate": 2.322345474070295e-06, "loss": 0.9669, "step": 64340 }, { "epoch": 0.86, "learning_rate": 2.3201313615590415e-06, "loss": 0.3399, "step": 64345 }, { "epoch": 0.86, "learning_rate": 2.3179182536524986e-06, "loss": 0.7754, "step": 64350 }, { "epoch": 0.86, "learning_rate": 2.315706150448707e-06, "loss": 0.8405, "step": 64355 }, { "epoch": 0.86, "learning_rate": 2.3134950520456472e-06, "loss": 0.9731, "step": 64360 }, { "epoch": 0.86, "learning_rate": 2.311284958541257e-06, "loss": 0.3981, "step": 64365 }, { "epoch": 0.86, "learning_rate": 2.309075870033442e-06, "loss": 1.5274, "step": 64370 }, { "epoch": 0.86, "learning_rate": 2.306867786620037e-06, "loss": 0.7813, "step": 64375 }, { "epoch": 0.86, "learning_rate": 2.3046607083988673e-06, "loss": 0.6371, "step": 64380 }, { "epoch": 0.86, "learning_rate": 2.3024546354676823e-06, "loss": 0.2655, "step": 64385 }, { "epoch": 0.86, "learning_rate": 2.3002495679242035e-06, "loss": 0.5265, "step": 64390 }, { "epoch": 0.86, "learning_rate": 2.2980455058661086e-06, "loss": 1.0161, "step": 64395 }, { "epoch": 0.86, "learning_rate": 2.2958424493910195e-06, "loss": 0.7689, "step": 64400 }, { "epoch": 0.86, "learning_rate": 2.2936403985965333e-06, "loss": 1.01, "step": 64405 }, { "epoch": 0.86, "learning_rate": 2.2914393535801715e-06, "loss": 2.3841, "step": 64410 }, { "epoch": 0.86, "learning_rate": 2.2892393144394455e-06, "loss": 0.5891, "step": 64415 }, { "epoch": 0.86, "learning_rate": 2.287040281271799e-06, "loss": 0.4651, "step": 64420 }, { "epoch": 0.86, "learning_rate": 2.2848422541746322e-06, "loss": 0.7233, "step": 64425 }, { "epoch": 0.86, "learning_rate": 2.2826452332453203e-06, "loss": 0.9343, "step": 64430 }, { "epoch": 0.86, "learning_rate": 2.280449218581171e-06, "loss": 0.4605, "step": 64435 }, { "epoch": 0.86, "learning_rate": 2.2782542102794594e-06, "loss": 1.3558, "step": 64440 }, { "epoch": 0.86, "learning_rate": 2.2760602084374084e-06, "loss": 0.6268, "step": 64445 }, { "epoch": 0.86, "learning_rate": 2.2738672131522113e-06, "loss": 0.7201, "step": 64450 }, { "epoch": 0.86, "learning_rate": 2.271675224521e-06, "loss": 0.6951, "step": 64455 }, { "epoch": 0.86, "learning_rate": 2.269484242640868e-06, "loss": 0.5336, "step": 64460 }, { "epoch": 0.86, "learning_rate": 2.267294267608869e-06, "loss": 0.9551, "step": 64465 }, { "epoch": 0.86, "learning_rate": 2.265105299522005e-06, "loss": 1.2544, "step": 64470 }, { "epoch": 0.86, "learning_rate": 2.2629173384772357e-06, "loss": 0.4081, "step": 64475 }, { "epoch": 0.86, "learning_rate": 2.2607303845714854e-06, "loss": 0.4762, "step": 64480 }, { "epoch": 0.86, "learning_rate": 2.258544437901611e-06, "loss": 0.4676, "step": 64485 }, { "epoch": 0.86, "learning_rate": 2.2563594985644475e-06, "loss": 0.8977, "step": 64490 }, { "epoch": 0.86, "learning_rate": 2.254175566656777e-06, "loss": 1.1222, "step": 64495 }, { "epoch": 0.86, "learning_rate": 2.25199264227533e-06, "loss": 0.5002, "step": 64500 }, { "epoch": 0.86, "learning_rate": 2.24981072551681e-06, "loss": 1.0495, "step": 64505 }, { "epoch": 0.86, "learning_rate": 2.2476298164778533e-06, "loss": 0.5249, "step": 64510 }, { "epoch": 0.86, "learning_rate": 2.2454499152550794e-06, "loss": 1.3788, "step": 64515 }, { "epoch": 0.86, "learning_rate": 2.2432710219450258e-06, "loss": 0.517, "step": 64520 }, { "epoch": 0.86, "learning_rate": 2.2410931366442233e-06, "loss": 0.7085, "step": 64525 }, { "epoch": 0.86, "learning_rate": 2.2389162594491363e-06, "loss": 0.8488, "step": 64530 }, { "epoch": 0.86, "learning_rate": 2.236740390456185e-06, "loss": 0.3565, "step": 64535 }, { "epoch": 0.86, "learning_rate": 2.234565529761756e-06, "loss": 1.0866, "step": 64540 }, { "epoch": 0.86, "learning_rate": 2.2323916774621837e-06, "loss": 0.7054, "step": 64545 }, { "epoch": 0.86, "learning_rate": 2.230218833653752e-06, "loss": 0.4532, "step": 64550 }, { "epoch": 0.86, "learning_rate": 2.2280469984327175e-06, "loss": 0.9522, "step": 64555 }, { "epoch": 0.87, "learning_rate": 2.2258761718952747e-06, "loss": 0.8254, "step": 64560 }, { "epoch": 0.87, "learning_rate": 2.2237063541375835e-06, "loss": 1.1896, "step": 64565 }, { "epoch": 0.87, "learning_rate": 2.22153754525575e-06, "loss": 0.898, "step": 64570 }, { "epoch": 0.87, "learning_rate": 2.2193697453458505e-06, "loss": 0.4589, "step": 64575 }, { "epoch": 0.87, "learning_rate": 2.2172029545039055e-06, "loss": 1.0702, "step": 64580 }, { "epoch": 0.87, "learning_rate": 2.215037172825882e-06, "loss": 0.3644, "step": 64585 }, { "epoch": 0.87, "learning_rate": 2.212872400407734e-06, "loss": 0.5545, "step": 64590 }, { "epoch": 0.87, "learning_rate": 2.2107086373453296e-06, "loss": 0.6129, "step": 64595 }, { "epoch": 0.87, "learning_rate": 2.208545883734525e-06, "loss": 0.5575, "step": 64600 }, { "epoch": 0.87, "learning_rate": 2.2063841396711164e-06, "loss": 0.6228, "step": 64605 }, { "epoch": 0.87, "learning_rate": 2.204223405250852e-06, "loss": 0.825, "step": 64610 }, { "epoch": 0.87, "learning_rate": 2.2020636805694522e-06, "loss": 0.1861, "step": 64615 }, { "epoch": 0.87, "learning_rate": 2.199904965722571e-06, "loss": 0.51, "step": 64620 }, { "epoch": 0.87, "learning_rate": 2.1977472608058435e-06, "loss": 0.7777, "step": 64625 }, { "epoch": 0.87, "learning_rate": 2.1955905659148292e-06, "loss": 0.9288, "step": 64630 }, { "epoch": 0.87, "learning_rate": 2.1934348811450707e-06, "loss": 0.6243, "step": 64635 }, { "epoch": 0.87, "learning_rate": 2.1912802065920473e-06, "loss": 1.3212, "step": 64640 }, { "epoch": 0.87, "learning_rate": 2.1891265423511996e-06, "loss": 1.5601, "step": 64645 }, { "epoch": 0.87, "learning_rate": 2.186973888517929e-06, "loss": 0.5004, "step": 64650 }, { "epoch": 0.87, "learning_rate": 2.1848222451875872e-06, "loss": 0.4103, "step": 64655 }, { "epoch": 0.87, "learning_rate": 2.1826716124554753e-06, "loss": 0.1241, "step": 64660 }, { "epoch": 0.87, "learning_rate": 2.180521990416862e-06, "loss": 0.2841, "step": 64665 }, { "epoch": 0.87, "learning_rate": 2.178373379166962e-06, "loss": 0.3708, "step": 64670 }, { "epoch": 0.87, "learning_rate": 2.17622577880095e-06, "loss": 0.2627, "step": 64675 }, { "epoch": 0.87, "learning_rate": 2.1740791894139466e-06, "loss": 0.8499, "step": 64680 }, { "epoch": 0.87, "learning_rate": 2.171933611101046e-06, "loss": 0.7305, "step": 64685 }, { "epoch": 0.87, "learning_rate": 2.169789043957282e-06, "loss": 0.8783, "step": 64690 }, { "epoch": 0.87, "learning_rate": 2.167645488077641e-06, "loss": 0.4754, "step": 64695 }, { "epoch": 0.87, "learning_rate": 2.1655029435570877e-06, "loss": 0.1699, "step": 64700 }, { "epoch": 0.87, "learning_rate": 2.163361410490508e-06, "loss": 0.8125, "step": 64705 }, { "epoch": 0.87, "learning_rate": 2.161220888972773e-06, "loss": 0.9768, "step": 64710 }, { "epoch": 0.87, "learning_rate": 2.159081379098696e-06, "loss": 0.1912, "step": 64715 }, { "epoch": 0.87, "learning_rate": 2.1569428809630394e-06, "loss": 0.874, "step": 64720 }, { "epoch": 0.87, "learning_rate": 2.154805394660536e-06, "loss": 0.3483, "step": 64725 }, { "epoch": 0.87, "learning_rate": 2.152668920285858e-06, "loss": 0.7556, "step": 64730 }, { "epoch": 0.87, "learning_rate": 2.1505334579336566e-06, "loss": 0.9671, "step": 64735 }, { "epoch": 0.87, "learning_rate": 2.1483990076984985e-06, "loss": 0.9103, "step": 64740 }, { "epoch": 0.87, "learning_rate": 2.146265569674949e-06, "loss": 0.3638, "step": 64745 }, { "epoch": 0.87, "learning_rate": 2.1441331439574996e-06, "loss": 0.7438, "step": 64750 }, { "epoch": 0.87, "learning_rate": 2.1420017306406027e-06, "loss": 0.1751, "step": 64755 }, { "epoch": 0.87, "learning_rate": 2.1398713298186795e-06, "loss": 0.6076, "step": 64760 }, { "epoch": 0.87, "learning_rate": 2.137741941586091e-06, "loss": 1.3459, "step": 64765 }, { "epoch": 0.87, "learning_rate": 2.1356135660371536e-06, "loss": 0.8937, "step": 64770 }, { "epoch": 0.87, "learning_rate": 2.133486203266152e-06, "loss": 0.8084, "step": 64775 }, { "epoch": 0.87, "learning_rate": 2.131359853367315e-06, "loss": 1.0297, "step": 64780 }, { "epoch": 0.87, "learning_rate": 2.1292345164348275e-06, "loss": 1.0151, "step": 64785 }, { "epoch": 0.87, "learning_rate": 2.1271101925628285e-06, "loss": 0.6516, "step": 64790 }, { "epoch": 0.87, "learning_rate": 2.124986881845423e-06, "loss": 0.7465, "step": 64795 }, { "epoch": 0.87, "learning_rate": 2.1228645843766577e-06, "loss": 0.9273, "step": 64800 }, { "epoch": 0.87, "learning_rate": 2.1207433002505356e-06, "loss": 0.87, "step": 64805 }, { "epoch": 0.87, "learning_rate": 2.1186230295610343e-06, "loss": 0.3642, "step": 64810 }, { "epoch": 0.87, "learning_rate": 2.116503772402051e-06, "loss": 0.7907, "step": 64815 }, { "epoch": 0.87, "learning_rate": 2.1143855288674715e-06, "loss": 0.4248, "step": 64820 }, { "epoch": 0.87, "learning_rate": 2.1122682990511205e-06, "loss": 1.318, "step": 64825 }, { "epoch": 0.87, "learning_rate": 2.110152083046776e-06, "loss": 0.549, "step": 64830 }, { "epoch": 0.87, "learning_rate": 2.108036880948186e-06, "loss": 0.5083, "step": 64835 }, { "epoch": 0.87, "learning_rate": 2.1059226928490355e-06, "loss": 0.8796, "step": 64840 }, { "epoch": 0.87, "learning_rate": 2.1038095188429753e-06, "loss": 0.2169, "step": 64845 }, { "epoch": 0.87, "learning_rate": 2.101697359023602e-06, "loss": 0.4325, "step": 64850 }, { "epoch": 0.87, "learning_rate": 2.0995862134844834e-06, "loss": 1.0453, "step": 64855 }, { "epoch": 0.87, "learning_rate": 2.0974760823191303e-06, "loss": 1.1985, "step": 64860 }, { "epoch": 0.87, "learning_rate": 2.095366965621004e-06, "loss": 0.6512, "step": 64865 }, { "epoch": 0.87, "learning_rate": 2.0932588634835354e-06, "loss": 0.4939, "step": 64870 }, { "epoch": 0.87, "learning_rate": 2.0911517760001025e-06, "loss": 0.4733, "step": 64875 }, { "epoch": 0.87, "learning_rate": 2.089045703264031e-06, "loss": 0.4984, "step": 64880 }, { "epoch": 0.87, "learning_rate": 2.086940645368618e-06, "loss": 0.9887, "step": 64885 }, { "epoch": 0.87, "learning_rate": 2.084836602407106e-06, "loss": 1.2696, "step": 64890 }, { "epoch": 0.87, "learning_rate": 2.0827335744726923e-06, "loss": 0.5406, "step": 64895 }, { "epoch": 0.87, "learning_rate": 2.080631561658522e-06, "loss": 0.3693, "step": 64900 }, { "epoch": 0.87, "learning_rate": 2.078530564057718e-06, "loss": 0.9828, "step": 64905 }, { "epoch": 0.87, "learning_rate": 2.076430581763339e-06, "loss": 0.628, "step": 64910 }, { "epoch": 0.87, "learning_rate": 2.0743316148683967e-06, "loss": 1.0808, "step": 64915 }, { "epoch": 0.87, "learning_rate": 2.072233663465878e-06, "loss": 0.4795, "step": 64920 }, { "epoch": 0.87, "learning_rate": 2.0701367276486945e-06, "loss": 0.4286, "step": 64925 }, { "epoch": 0.87, "learning_rate": 2.068040807509747e-06, "loss": 1.6242, "step": 64930 }, { "epoch": 0.87, "learning_rate": 2.0659459031418638e-06, "loss": 0.7966, "step": 64935 }, { "epoch": 0.87, "learning_rate": 2.0638520146378375e-06, "loss": 0.8278, "step": 64940 }, { "epoch": 0.87, "learning_rate": 2.0617591420904277e-06, "loss": 0.9359, "step": 64945 }, { "epoch": 0.87, "learning_rate": 2.0596672855923286e-06, "loss": 0.3468, "step": 64950 }, { "epoch": 0.87, "learning_rate": 2.057576445236206e-06, "loss": 0.6773, "step": 64955 }, { "epoch": 0.87, "learning_rate": 2.0554866211146604e-06, "loss": 1.0067, "step": 64960 }, { "epoch": 0.87, "learning_rate": 2.0533978133202734e-06, "loss": 0.5766, "step": 64965 }, { "epoch": 0.87, "learning_rate": 2.0513100219455712e-06, "loss": 1.0344, "step": 64970 }, { "epoch": 0.87, "learning_rate": 2.049223247083021e-06, "loss": 0.3535, "step": 64975 }, { "epoch": 0.87, "learning_rate": 2.047137488825063e-06, "loss": 1.0661, "step": 64980 }, { "epoch": 0.87, "learning_rate": 2.045052747264084e-06, "loss": 0.8394, "step": 64985 }, { "epoch": 0.87, "learning_rate": 2.0429690224924275e-06, "loss": 0.6487, "step": 64990 }, { "epoch": 0.87, "learning_rate": 2.0408863146023945e-06, "loss": 0.5655, "step": 64995 }, { "epoch": 0.87, "learning_rate": 2.0388046236862384e-06, "loss": 0.32, "step": 65000 }, { "epoch": 0.87, "learning_rate": 2.036723949836164e-06, "loss": 0.8042, "step": 65005 }, { "epoch": 0.87, "learning_rate": 2.034644293144333e-06, "loss": 0.765, "step": 65010 }, { "epoch": 0.87, "learning_rate": 2.032565653702875e-06, "loss": 0.402, "step": 65015 }, { "epoch": 0.87, "learning_rate": 2.0304880316038525e-06, "loss": 0.9113, "step": 65020 }, { "epoch": 0.87, "learning_rate": 2.0284114269392974e-06, "loss": 0.8413, "step": 65025 }, { "epoch": 0.87, "learning_rate": 2.0263358398011967e-06, "loss": 0.5213, "step": 65030 }, { "epoch": 0.87, "learning_rate": 2.0242612702814802e-06, "loss": 0.5893, "step": 65035 }, { "epoch": 0.87, "learning_rate": 2.022187718472046e-06, "loss": 0.3119, "step": 65040 }, { "epoch": 0.87, "learning_rate": 2.0201151844647436e-06, "loss": 0.8973, "step": 65045 }, { "epoch": 0.87, "learning_rate": 2.0180436683513687e-06, "loss": 0.7726, "step": 65050 }, { "epoch": 0.87, "learning_rate": 2.0159731702236897e-06, "loss": 0.5379, "step": 65055 }, { "epoch": 0.87, "learning_rate": 2.013903690173413e-06, "loss": 0.3572, "step": 65060 }, { "epoch": 0.87, "learning_rate": 2.011835228292208e-06, "loss": 0.7851, "step": 65065 }, { "epoch": 0.87, "learning_rate": 2.00976778467169e-06, "loss": 0.299, "step": 65070 }, { "epoch": 0.87, "learning_rate": 2.0077013594034437e-06, "loss": 0.8152, "step": 65075 }, { "epoch": 0.87, "learning_rate": 2.0056359525790075e-06, "loss": 0.4495, "step": 65080 }, { "epoch": 0.87, "learning_rate": 2.003571564289855e-06, "loss": 0.7289, "step": 65085 }, { "epoch": 0.87, "learning_rate": 2.0015081946274385e-06, "loss": 0.5855, "step": 65090 }, { "epoch": 0.87, "learning_rate": 1.999445843683151e-06, "loss": 1.0811, "step": 65095 }, { "epoch": 0.87, "learning_rate": 1.997384511548339e-06, "loss": 0.6699, "step": 65100 }, { "epoch": 0.87, "learning_rate": 1.9953241983143188e-06, "loss": 0.693, "step": 65105 }, { "epoch": 0.87, "learning_rate": 1.9932649040723504e-06, "loss": 0.6396, "step": 65110 }, { "epoch": 0.87, "learning_rate": 1.9912066289136445e-06, "loss": 0.2457, "step": 65115 }, { "epoch": 0.87, "learning_rate": 1.989149372929375e-06, "loss": 0.5694, "step": 65120 }, { "epoch": 0.87, "learning_rate": 1.9870931362106686e-06, "loss": 0.2501, "step": 65125 }, { "epoch": 0.87, "learning_rate": 1.985037918848609e-06, "loss": 0.7466, "step": 65130 }, { "epoch": 0.87, "learning_rate": 1.9829837209342254e-06, "loss": 1.1055, "step": 65135 }, { "epoch": 0.87, "learning_rate": 1.980930542558521e-06, "loss": 0.4449, "step": 65140 }, { "epoch": 0.87, "learning_rate": 1.9788783838124213e-06, "loss": 0.5222, "step": 65145 }, { "epoch": 0.87, "learning_rate": 1.976827244786847e-06, "loss": 0.9556, "step": 65150 }, { "epoch": 0.87, "learning_rate": 1.974777125572641e-06, "loss": 0.7672, "step": 65155 }, { "epoch": 0.87, "learning_rate": 1.9727280262606147e-06, "loss": 0.5314, "step": 65160 }, { "epoch": 0.87, "learning_rate": 1.9706799469415368e-06, "loss": 0.8535, "step": 65165 }, { "epoch": 0.87, "learning_rate": 1.968632887706126e-06, "loss": 0.6467, "step": 65170 }, { "epoch": 0.87, "learning_rate": 1.966586848645058e-06, "loss": 0.608, "step": 65175 }, { "epoch": 0.87, "learning_rate": 1.9645418298489536e-06, "loss": 0.9437, "step": 65180 }, { "epoch": 0.87, "learning_rate": 1.9624978314084026e-06, "loss": 1.1413, "step": 65185 }, { "epoch": 0.87, "learning_rate": 1.9604548534139566e-06, "loss": 0.6023, "step": 65190 }, { "epoch": 0.87, "learning_rate": 1.9584128959560855e-06, "loss": 0.5694, "step": 65195 }, { "epoch": 0.87, "learning_rate": 1.9563719591252555e-06, "loss": 1.0227, "step": 65200 }, { "epoch": 0.87, "learning_rate": 1.954332043011864e-06, "loss": 0.737, "step": 65205 }, { "epoch": 0.87, "learning_rate": 1.9522931477062634e-06, "loss": 0.4075, "step": 65210 }, { "epoch": 0.87, "learning_rate": 1.950255273298779e-06, "loss": 0.8599, "step": 65215 }, { "epoch": 0.87, "learning_rate": 1.9482184198796715e-06, "loss": 1.3345, "step": 65220 }, { "epoch": 0.87, "learning_rate": 1.9461825875391608e-06, "loss": 0.4409, "step": 65225 }, { "epoch": 0.87, "learning_rate": 1.944147776367425e-06, "loss": 0.2892, "step": 65230 }, { "epoch": 0.87, "learning_rate": 1.9421139864546023e-06, "loss": 0.7566, "step": 65235 }, { "epoch": 0.87, "learning_rate": 1.940081217890774e-06, "loss": 0.8408, "step": 65240 }, { "epoch": 0.87, "learning_rate": 1.938049470765979e-06, "loss": 0.8964, "step": 65245 }, { "epoch": 0.87, "learning_rate": 1.936018745170226e-06, "loss": 0.4593, "step": 65250 }, { "epoch": 0.87, "learning_rate": 1.9339890411934488e-06, "loss": 0.3331, "step": 65255 }, { "epoch": 0.87, "learning_rate": 1.9319603589255638e-06, "loss": 1.0627, "step": 65260 }, { "epoch": 0.87, "learning_rate": 1.92993269845643e-06, "loss": 0.2616, "step": 65265 }, { "epoch": 0.87, "learning_rate": 1.9279060598758586e-06, "loss": 0.6288, "step": 65270 }, { "epoch": 0.87, "learning_rate": 1.9258804432736255e-06, "loss": 0.9797, "step": 65275 }, { "epoch": 0.87, "learning_rate": 1.9238558487394532e-06, "loss": 0.8699, "step": 65280 }, { "epoch": 0.87, "learning_rate": 1.92183227636302e-06, "loss": 0.5119, "step": 65285 }, { "epoch": 0.87, "learning_rate": 1.9198097262339566e-06, "loss": 0.7536, "step": 65290 }, { "epoch": 0.87, "learning_rate": 1.9177881984418554e-06, "loss": 0.8349, "step": 65295 }, { "epoch": 0.87, "learning_rate": 1.91576769307627e-06, "loss": 0.7022, "step": 65300 }, { "epoch": 0.87, "learning_rate": 1.913748210226679e-06, "loss": 0.8255, "step": 65305 }, { "epoch": 0.88, "learning_rate": 1.911729749982552e-06, "loss": 0.5315, "step": 65310 }, { "epoch": 0.88, "learning_rate": 1.9097123124332873e-06, "loss": 0.7899, "step": 65315 }, { "epoch": 0.88, "learning_rate": 1.907695897668246e-06, "loss": 0.4903, "step": 65320 }, { "epoch": 0.88, "learning_rate": 1.9056805057767552e-06, "loss": 0.2736, "step": 65325 }, { "epoch": 0.88, "learning_rate": 1.9036661368480812e-06, "loss": 0.4787, "step": 65330 }, { "epoch": 0.88, "learning_rate": 1.9016527909714477e-06, "loss": 0.4923, "step": 65335 }, { "epoch": 0.88, "learning_rate": 1.8996404682360357e-06, "loss": 0.7857, "step": 65340 }, { "epoch": 0.88, "learning_rate": 1.8976291687309884e-06, "loss": 0.6137, "step": 65345 }, { "epoch": 0.88, "learning_rate": 1.8956188925453893e-06, "loss": 0.1294, "step": 65350 }, { "epoch": 0.88, "learning_rate": 1.8936096397682818e-06, "loss": 0.4831, "step": 65355 }, { "epoch": 0.88, "learning_rate": 1.8916014104886775e-06, "loss": 0.5019, "step": 65360 }, { "epoch": 0.88, "learning_rate": 1.8895942047955166e-06, "loss": 0.3323, "step": 65365 }, { "epoch": 0.88, "learning_rate": 1.88758802277772e-06, "loss": 0.8504, "step": 65370 }, { "epoch": 0.88, "learning_rate": 1.8855828645241437e-06, "loss": 0.8782, "step": 65375 }, { "epoch": 0.88, "learning_rate": 1.883578730123603e-06, "loss": 1.1444, "step": 65380 }, { "epoch": 0.88, "learning_rate": 1.8815756196648854e-06, "loss": 0.22, "step": 65385 }, { "epoch": 0.88, "learning_rate": 1.8795735332367059e-06, "loss": 0.2003, "step": 65390 }, { "epoch": 0.88, "learning_rate": 1.8775724709277492e-06, "loss": 1.0296, "step": 65395 }, { "epoch": 0.88, "learning_rate": 1.8755724328266582e-06, "loss": 1.2078, "step": 65400 }, { "epoch": 0.88, "learning_rate": 1.873573419022015e-06, "loss": 0.8185, "step": 65405 }, { "epoch": 0.88, "learning_rate": 1.871575429602379e-06, "loss": 1.3206, "step": 65410 }, { "epoch": 0.88, "learning_rate": 1.869578464656238e-06, "loss": 0.9707, "step": 65415 }, { "epoch": 0.88, "learning_rate": 1.8675825242720573e-06, "loss": 0.9024, "step": 65420 }, { "epoch": 0.88, "learning_rate": 1.8655876085382413e-06, "loss": 0.5573, "step": 65425 }, { "epoch": 0.88, "learning_rate": 1.8635937175431523e-06, "loss": 0.2503, "step": 65430 }, { "epoch": 0.88, "learning_rate": 1.8616008513751199e-06, "loss": 0.4273, "step": 65435 }, { "epoch": 0.88, "learning_rate": 1.8596090101224094e-06, "loss": 1.0644, "step": 65440 }, { "epoch": 0.88, "learning_rate": 1.8576181938732533e-06, "loss": 0.8616, "step": 65445 }, { "epoch": 0.88, "learning_rate": 1.8556284027158284e-06, "loss": 0.9634, "step": 65450 }, { "epoch": 0.88, "learning_rate": 1.853639636738283e-06, "loss": 1.0538, "step": 65455 }, { "epoch": 0.88, "learning_rate": 1.8516518960287055e-06, "loss": 0.5383, "step": 65460 }, { "epoch": 0.88, "learning_rate": 1.8496651806751337e-06, "loss": 0.983, "step": 65465 }, { "epoch": 0.88, "learning_rate": 1.8476794907655887e-06, "loss": 0.5661, "step": 65470 }, { "epoch": 0.88, "learning_rate": 1.845694826388003e-06, "loss": 0.6519, "step": 65475 }, { "epoch": 0.88, "learning_rate": 1.8437111876303065e-06, "loss": 0.4151, "step": 65480 }, { "epoch": 0.88, "learning_rate": 1.8417285745803565e-06, "loss": 0.5313, "step": 65485 }, { "epoch": 0.88, "learning_rate": 1.8397469873259688e-06, "loss": 1.055, "step": 65490 }, { "epoch": 0.88, "learning_rate": 1.837766425954926e-06, "loss": 1.1667, "step": 65495 }, { "epoch": 0.88, "learning_rate": 1.8357868905549524e-06, "loss": 1.0365, "step": 65500 }, { "epoch": 0.88, "learning_rate": 1.8338083812137307e-06, "loss": 0.6223, "step": 65505 }, { "epoch": 0.88, "learning_rate": 1.8318308980189048e-06, "loss": 0.822, "step": 65510 }, { "epoch": 0.88, "learning_rate": 1.8298544410580627e-06, "loss": 0.6158, "step": 65515 }, { "epoch": 0.88, "learning_rate": 1.8278790104187538e-06, "loss": 0.5412, "step": 65520 }, { "epoch": 0.88, "learning_rate": 1.8259046061884722e-06, "loss": 1.0552, "step": 65525 }, { "epoch": 0.88, "learning_rate": 1.823931228454684e-06, "loss": 0.8794, "step": 65530 }, { "epoch": 0.88, "learning_rate": 1.8219588773047969e-06, "loss": 0.6484, "step": 65535 }, { "epoch": 0.88, "learning_rate": 1.8199875528261717e-06, "loss": 0.9667, "step": 65540 }, { "epoch": 0.88, "learning_rate": 1.8180172551061358e-06, "loss": 0.6354, "step": 65545 }, { "epoch": 0.88, "learning_rate": 1.816047984231961e-06, "loss": 0.3439, "step": 65550 }, { "epoch": 0.88, "learning_rate": 1.814079740290872e-06, "loss": 0.3485, "step": 65555 }, { "epoch": 0.88, "learning_rate": 1.8121125233700547e-06, "loss": 0.2948, "step": 65560 }, { "epoch": 0.88, "learning_rate": 1.8101463335566477e-06, "loss": 0.277, "step": 65565 }, { "epoch": 0.88, "learning_rate": 1.8081811709377449e-06, "loss": 0.8508, "step": 65570 }, { "epoch": 0.88, "learning_rate": 1.8062170356003855e-06, "loss": 0.4357, "step": 65575 }, { "epoch": 0.88, "learning_rate": 1.8042539276315855e-06, "loss": 1.4305, "step": 65580 }, { "epoch": 0.88, "learning_rate": 1.802291847118287e-06, "loss": 0.8404, "step": 65585 }, { "epoch": 0.88, "learning_rate": 1.8003307941474062e-06, "loss": 0.5287, "step": 65590 }, { "epoch": 0.88, "learning_rate": 1.798370768805807e-06, "loss": 0.964, "step": 65595 }, { "epoch": 0.88, "learning_rate": 1.7964117711803036e-06, "loss": 0.2909, "step": 65600 }, { "epoch": 0.88, "learning_rate": 1.7944538013576789e-06, "loss": 0.559, "step": 65605 }, { "epoch": 0.88, "learning_rate": 1.7924968594246582e-06, "loss": 1.0435, "step": 65610 }, { "epoch": 0.88, "learning_rate": 1.7905409454679195e-06, "loss": 0.6158, "step": 65615 }, { "epoch": 0.88, "learning_rate": 1.7885860595741071e-06, "loss": 0.279, "step": 65620 }, { "epoch": 0.88, "learning_rate": 1.7866322018298104e-06, "loss": 1.0699, "step": 65625 }, { "epoch": 0.88, "learning_rate": 1.7846793723215737e-06, "loss": 0.4224, "step": 65630 }, { "epoch": 0.88, "learning_rate": 1.782727571135892e-06, "loss": 1.1024, "step": 65635 }, { "epoch": 0.88, "learning_rate": 1.7807767983592323e-06, "loss": 0.8161, "step": 65640 }, { "epoch": 0.88, "learning_rate": 1.778827054078e-06, "loss": 0.3455, "step": 65645 }, { "epoch": 0.88, "learning_rate": 1.7768783383785514e-06, "loss": 0.2968, "step": 65650 }, { "epoch": 0.88, "learning_rate": 1.7749306513472147e-06, "loss": 1.0527, "step": 65655 }, { "epoch": 0.88, "learning_rate": 1.7729839930702595e-06, "loss": 0.5878, "step": 65660 }, { "epoch": 0.88, "learning_rate": 1.7710383636339118e-06, "loss": 1.2954, "step": 65665 }, { "epoch": 0.88, "learning_rate": 1.7690937631243494e-06, "loss": 0.3842, "step": 65670 }, { "epoch": 0.88, "learning_rate": 1.7671501916277173e-06, "loss": 0.1964, "step": 65675 }, { "epoch": 0.88, "learning_rate": 1.7652076492301024e-06, "loss": 0.8052, "step": 65680 }, { "epoch": 0.88, "learning_rate": 1.763266136017541e-06, "loss": 0.4016, "step": 65685 }, { "epoch": 0.88, "learning_rate": 1.7613256520760513e-06, "loss": 0.5486, "step": 65690 }, { "epoch": 0.88, "learning_rate": 1.7593861974915665e-06, "loss": 0.1226, "step": 65695 }, { "epoch": 0.88, "learning_rate": 1.7574477723500099e-06, "loss": 0.5522, "step": 65700 }, { "epoch": 0.88, "learning_rate": 1.7555103767372377e-06, "loss": 0.4388, "step": 65705 }, { "epoch": 0.88, "learning_rate": 1.7535740107390619e-06, "loss": 0.7918, "step": 65710 }, { "epoch": 0.88, "learning_rate": 1.751638674441264e-06, "loss": 0.1981, "step": 65715 }, { "epoch": 0.88, "learning_rate": 1.7497043679295638e-06, "loss": 0.7566, "step": 65720 }, { "epoch": 0.88, "learning_rate": 1.7477710912896377e-06, "loss": 0.2172, "step": 65725 }, { "epoch": 0.88, "learning_rate": 1.7458388446071312e-06, "loss": 0.9918, "step": 65730 }, { "epoch": 0.88, "learning_rate": 1.7439076279676282e-06, "loss": 0.3393, "step": 65735 }, { "epoch": 0.88, "learning_rate": 1.7419774414566687e-06, "loss": 0.9086, "step": 65740 }, { "epoch": 0.88, "learning_rate": 1.7400482851597483e-06, "loss": 0.652, "step": 65745 }, { "epoch": 0.88, "learning_rate": 1.7381201591623263e-06, "loss": 0.9605, "step": 65750 }, { "epoch": 0.88, "learning_rate": 1.7361930635498069e-06, "loss": 1.0496, "step": 65755 }, { "epoch": 0.88, "learning_rate": 1.7342669984075465e-06, "loss": 0.837, "step": 65760 }, { "epoch": 0.88, "learning_rate": 1.732341963820866e-06, "loss": 0.5105, "step": 65765 }, { "epoch": 0.88, "learning_rate": 1.7304179598750331e-06, "loss": 0.5086, "step": 65770 }, { "epoch": 0.88, "learning_rate": 1.7284949866552686e-06, "loss": 0.2485, "step": 65775 }, { "epoch": 0.88, "learning_rate": 1.7265730442467487e-06, "loss": 0.5476, "step": 65780 }, { "epoch": 0.88, "learning_rate": 1.7246521327346139e-06, "loss": 0.6739, "step": 65785 }, { "epoch": 0.88, "learning_rate": 1.7227322522039485e-06, "loss": 0.495, "step": 65790 }, { "epoch": 0.88, "learning_rate": 1.7208134027397876e-06, "loss": 0.4748, "step": 65795 }, { "epoch": 0.88, "learning_rate": 1.7188955844271382e-06, "loss": 1.1057, "step": 65800 }, { "epoch": 0.88, "learning_rate": 1.7169787973509322e-06, "loss": 0.978, "step": 65805 }, { "epoch": 0.88, "learning_rate": 1.7150630415960905e-06, "loss": 0.8958, "step": 65810 }, { "epoch": 0.88, "learning_rate": 1.713148317247465e-06, "loss": 1.0638, "step": 65815 }, { "epoch": 0.88, "learning_rate": 1.7112346243898652e-06, "loss": 0.1894, "step": 65820 }, { "epoch": 0.88, "learning_rate": 1.7093219631080653e-06, "loss": 0.7032, "step": 65825 }, { "epoch": 0.88, "learning_rate": 1.7074103334867835e-06, "loss": 0.5214, "step": 65830 }, { "epoch": 0.88, "learning_rate": 1.7054997356106883e-06, "loss": 1.1474, "step": 65835 }, { "epoch": 0.88, "learning_rate": 1.703590169564423e-06, "loss": 0.4132, "step": 65840 }, { "epoch": 0.88, "learning_rate": 1.7016816354325644e-06, "loss": 0.8263, "step": 65845 }, { "epoch": 0.88, "learning_rate": 1.6997741332996503e-06, "loss": 0.9525, "step": 65850 }, { "epoch": 0.88, "learning_rate": 1.6978676632501688e-06, "loss": 0.5659, "step": 65855 }, { "epoch": 0.88, "learning_rate": 1.6959622253685803e-06, "loss": 0.6427, "step": 65860 }, { "epoch": 0.88, "learning_rate": 1.694057819739278e-06, "loss": 0.3494, "step": 65865 }, { "epoch": 0.88, "learning_rate": 1.6921544464466144e-06, "loss": 0.4335, "step": 65870 }, { "epoch": 0.88, "learning_rate": 1.690252105574905e-06, "loss": 0.8915, "step": 65875 }, { "epoch": 0.88, "learning_rate": 1.6883507972084156e-06, "loss": 1.0048, "step": 65880 }, { "epoch": 0.88, "learning_rate": 1.6864505214313596e-06, "loss": 1.0793, "step": 65885 }, { "epoch": 0.88, "learning_rate": 1.684551278327909e-06, "loss": 0.7706, "step": 65890 }, { "epoch": 0.88, "learning_rate": 1.6826530679821956e-06, "loss": 0.7276, "step": 65895 }, { "epoch": 0.88, "learning_rate": 1.6807558904782972e-06, "loss": 1.0939, "step": 65900 }, { "epoch": 0.88, "learning_rate": 1.6788597459002492e-06, "loss": 0.9242, "step": 65905 }, { "epoch": 0.88, "learning_rate": 1.6769646343320484e-06, "loss": 0.6824, "step": 65910 }, { "epoch": 0.88, "learning_rate": 1.6750705558576273e-06, "loss": 0.6357, "step": 65915 }, { "epoch": 0.88, "learning_rate": 1.673177510560886e-06, "loss": 0.4574, "step": 65920 }, { "epoch": 0.88, "learning_rate": 1.6712854985256904e-06, "loss": 0.7436, "step": 65925 }, { "epoch": 0.88, "learning_rate": 1.669394519835829e-06, "loss": 0.8416, "step": 65930 }, { "epoch": 0.88, "learning_rate": 1.6675045745750767e-06, "loss": 0.5414, "step": 65935 }, { "epoch": 0.88, "learning_rate": 1.6656156628271413e-06, "loss": 0.6955, "step": 65940 }, { "epoch": 0.88, "learning_rate": 1.6637277846756894e-06, "loss": 0.857, "step": 65945 }, { "epoch": 0.88, "learning_rate": 1.6618409402043539e-06, "loss": 0.4898, "step": 65950 }, { "epoch": 0.88, "learning_rate": 1.6599551294967098e-06, "loss": 0.7964, "step": 65955 }, { "epoch": 0.88, "learning_rate": 1.6580703526362845e-06, "loss": 0.5801, "step": 65960 }, { "epoch": 0.88, "learning_rate": 1.6561866097065616e-06, "loss": 0.8715, "step": 65965 }, { "epoch": 0.88, "learning_rate": 1.6543039007909904e-06, "loss": 0.5571, "step": 65970 }, { "epoch": 0.88, "learning_rate": 1.6524222259729633e-06, "loss": 0.6283, "step": 65975 }, { "epoch": 0.88, "learning_rate": 1.650541585335824e-06, "loss": 0.8277, "step": 65980 }, { "epoch": 0.88, "learning_rate": 1.6486619789628788e-06, "loss": 0.6719, "step": 65985 }, { "epoch": 0.88, "learning_rate": 1.6467834069373883e-06, "loss": 0.4954, "step": 65990 }, { "epoch": 0.88, "learning_rate": 1.6449058693425612e-06, "loss": 0.7239, "step": 65995 }, { "epoch": 0.88, "learning_rate": 1.643029366261556e-06, "loss": 0.1796, "step": 66000 }, { "epoch": 0.88, "learning_rate": 1.6411538977775032e-06, "loss": 1.0827, "step": 66005 }, { "epoch": 0.88, "learning_rate": 1.6392794639734726e-06, "loss": 0.6171, "step": 66010 }, { "epoch": 0.88, "learning_rate": 1.6374060649324869e-06, "loss": 0.3195, "step": 66015 }, { "epoch": 0.88, "learning_rate": 1.6355337007375405e-06, "loss": 0.3628, "step": 66020 }, { "epoch": 0.88, "learning_rate": 1.633662371471556e-06, "loss": 0.6287, "step": 66025 }, { "epoch": 0.88, "learning_rate": 1.6317920772174284e-06, "loss": 0.819, "step": 66030 }, { "epoch": 0.88, "learning_rate": 1.629922818058016e-06, "loss": 0.6584, "step": 66035 }, { "epoch": 0.88, "learning_rate": 1.6280545940760949e-06, "loss": 0.5436, "step": 66040 }, { "epoch": 0.88, "learning_rate": 1.6261874053544345e-06, "loss": 1.0623, "step": 66045 }, { "epoch": 0.88, "learning_rate": 1.6243212519757355e-06, "loss": 1.1188, "step": 66050 }, { "epoch": 0.89, "learning_rate": 1.622456134022657e-06, "loss": 0.538, "step": 66055 }, { "epoch": 0.89, "learning_rate": 1.6205920515778212e-06, "loss": 0.761, "step": 66060 }, { "epoch": 0.89, "learning_rate": 1.6187290047237929e-06, "loss": 1.164, "step": 66065 }, { "epoch": 0.89, "learning_rate": 1.616866993543098e-06, "loss": 0.7573, "step": 66070 }, { "epoch": 0.89, "learning_rate": 1.6150060181182092e-06, "loss": 0.8963, "step": 66075 }, { "epoch": 0.89, "learning_rate": 1.613146078531566e-06, "loss": 0.8449, "step": 66080 }, { "epoch": 0.89, "learning_rate": 1.6112871748655501e-06, "loss": 0.7151, "step": 66085 }, { "epoch": 0.89, "learning_rate": 1.6094293072025007e-06, "loss": 0.8861, "step": 66090 }, { "epoch": 0.89, "learning_rate": 1.6075724756247163e-06, "loss": 0.4715, "step": 66095 }, { "epoch": 0.89, "learning_rate": 1.605716680214442e-06, "loss": 0.5334, "step": 66100 }, { "epoch": 0.89, "learning_rate": 1.6038619210538813e-06, "loss": 0.3643, "step": 66105 }, { "epoch": 0.89, "learning_rate": 1.6020081982251856e-06, "loss": 1.0476, "step": 66110 }, { "epoch": 0.89, "learning_rate": 1.600155511810475e-06, "loss": 0.9071, "step": 66115 }, { "epoch": 0.89, "learning_rate": 1.598303861891809e-06, "loss": 0.486, "step": 66120 }, { "epoch": 0.89, "learning_rate": 1.5964532485512051e-06, "loss": 0.097, "step": 66125 }, { "epoch": 0.89, "learning_rate": 1.5946036718706425e-06, "loss": 0.4798, "step": 66130 }, { "epoch": 0.89, "learning_rate": 1.5927551319320388e-06, "loss": 0.6491, "step": 66135 }, { "epoch": 0.89, "learning_rate": 1.5909076288172786e-06, "loss": 0.7366, "step": 66140 }, { "epoch": 0.89, "learning_rate": 1.5890611626082047e-06, "loss": 0.6332, "step": 66145 }, { "epoch": 0.89, "learning_rate": 1.587215733386596e-06, "loss": 0.4347, "step": 66150 }, { "epoch": 0.89, "learning_rate": 1.5853713412342014e-06, "loss": 0.6123, "step": 66155 }, { "epoch": 0.89, "learning_rate": 1.5835279862327162e-06, "loss": 0.6322, "step": 66160 }, { "epoch": 0.89, "learning_rate": 1.5816856684637892e-06, "loss": 0.9471, "step": 66165 }, { "epoch": 0.89, "learning_rate": 1.579844388009033e-06, "loss": 0.9361, "step": 66170 }, { "epoch": 0.89, "learning_rate": 1.5780041449500016e-06, "loss": 0.3383, "step": 66175 }, { "epoch": 0.89, "learning_rate": 1.5761649393682133e-06, "loss": 1.3028, "step": 66180 }, { "epoch": 0.89, "learning_rate": 1.5743267713451248e-06, "loss": 0.8873, "step": 66185 }, { "epoch": 0.89, "learning_rate": 1.5724896409621715e-06, "loss": 0.7902, "step": 66190 }, { "epoch": 0.89, "learning_rate": 1.5706535483007212e-06, "loss": 1.19, "step": 66195 }, { "epoch": 0.89, "learning_rate": 1.5688184934421035e-06, "loss": 0.3821, "step": 66200 }, { "epoch": 0.89, "learning_rate": 1.5669844764676062e-06, "loss": 0.7825, "step": 66205 }, { "epoch": 0.89, "learning_rate": 1.565151497458467e-06, "loss": 0.7001, "step": 66210 }, { "epoch": 0.89, "learning_rate": 1.5633195564958736e-06, "loss": 0.8107, "step": 66215 }, { "epoch": 0.89, "learning_rate": 1.5614886536609724e-06, "loss": 0.5593, "step": 66220 }, { "epoch": 0.89, "learning_rate": 1.5596587890348651e-06, "loss": 0.4058, "step": 66225 }, { "epoch": 0.89, "learning_rate": 1.5578299626986093e-06, "loss": 0.6955, "step": 66230 }, { "epoch": 0.89, "learning_rate": 1.5560021747332009e-06, "loss": 0.1795, "step": 66235 }, { "epoch": 0.89, "learning_rate": 1.5545406920423029e-06, "loss": 1.3217, "step": 66240 }, { "epoch": 0.89, "learning_rate": 1.552714773348432e-06, "loss": 1.054, "step": 66245 }, { "epoch": 0.89, "learning_rate": 1.5508898932519916e-06, "loss": 0.9317, "step": 66250 }, { "epoch": 0.89, "learning_rate": 1.5490660518338168e-06, "loss": 0.8691, "step": 66255 }, { "epoch": 0.89, "learning_rate": 1.5472432491746985e-06, "loss": 1.0384, "step": 66260 }, { "epoch": 0.89, "learning_rate": 1.5454214853553667e-06, "loss": 0.3958, "step": 66265 }, { "epoch": 0.89, "learning_rate": 1.5436007604565289e-06, "loss": 0.4562, "step": 66270 }, { "epoch": 0.89, "learning_rate": 1.541781074558829e-06, "loss": 0.4473, "step": 66275 }, { "epoch": 0.89, "learning_rate": 1.5399624277428666e-06, "loss": 1.0665, "step": 66280 }, { "epoch": 0.89, "learning_rate": 1.5381448200892073e-06, "loss": 0.8311, "step": 66285 }, { "epoch": 0.89, "learning_rate": 1.5363282516783483e-06, "loss": 0.2394, "step": 66290 }, { "epoch": 0.89, "learning_rate": 1.5345127225907696e-06, "loss": 0.5673, "step": 66295 }, { "epoch": 0.89, "learning_rate": 1.5326982329068816e-06, "loss": 0.4353, "step": 66300 }, { "epoch": 0.89, "learning_rate": 1.5308847827070539e-06, "loss": 0.248, "step": 66305 }, { "epoch": 0.89, "learning_rate": 1.5290723720716243e-06, "loss": 0.9754, "step": 66310 }, { "epoch": 0.89, "learning_rate": 1.5272610010808652e-06, "loss": 0.6769, "step": 66315 }, { "epoch": 0.89, "learning_rate": 1.5254506698150123e-06, "loss": 0.5932, "step": 66320 }, { "epoch": 0.89, "learning_rate": 1.523641378354254e-06, "loss": 0.5375, "step": 66325 }, { "epoch": 0.89, "learning_rate": 1.5218331267787378e-06, "loss": 0.1589, "step": 66330 }, { "epoch": 0.89, "learning_rate": 1.5200259151685548e-06, "loss": 0.9392, "step": 66335 }, { "epoch": 0.89, "learning_rate": 1.5182197436037548e-06, "loss": 0.4067, "step": 66340 }, { "epoch": 0.89, "learning_rate": 1.5164146121643518e-06, "loss": 0.7157, "step": 66345 }, { "epoch": 0.89, "learning_rate": 1.5146105209302875e-06, "loss": 0.7956, "step": 66350 }, { "epoch": 0.89, "learning_rate": 1.5128074699814893e-06, "loss": 0.4328, "step": 66355 }, { "epoch": 0.89, "learning_rate": 1.5110054593978129e-06, "loss": 0.8793, "step": 66360 }, { "epoch": 0.89, "learning_rate": 1.5092044892590862e-06, "loss": 0.5748, "step": 66365 }, { "epoch": 0.89, "learning_rate": 1.5074045596450815e-06, "loss": 0.3518, "step": 66370 }, { "epoch": 0.89, "learning_rate": 1.505605670635518e-06, "loss": 0.9667, "step": 66375 }, { "epoch": 0.89, "learning_rate": 1.503807822310091e-06, "loss": 0.399, "step": 66380 }, { "epoch": 0.89, "learning_rate": 1.5020110147484306e-06, "loss": 1.0493, "step": 66385 }, { "epoch": 0.89, "learning_rate": 1.5002152480301178e-06, "loss": 0.6216, "step": 66390 }, { "epoch": 0.89, "learning_rate": 1.4984205222347141e-06, "loss": 0.6039, "step": 66395 }, { "epoch": 0.89, "learning_rate": 1.4966268374417002e-06, "loss": 0.1112, "step": 66400 }, { "epoch": 0.89, "learning_rate": 1.494834193730535e-06, "loss": 1.5535, "step": 66405 }, { "epoch": 0.89, "learning_rate": 1.493042591180624e-06, "loss": 0.4142, "step": 66410 }, { "epoch": 0.89, "learning_rate": 1.4912520298713205e-06, "loss": 0.8167, "step": 66415 }, { "epoch": 0.89, "learning_rate": 1.4894625098819448e-06, "loss": 0.7701, "step": 66420 }, { "epoch": 0.89, "learning_rate": 1.4876740312917608e-06, "loss": 0.5997, "step": 66425 }, { "epoch": 0.89, "learning_rate": 1.4858865941799887e-06, "loss": 0.3244, "step": 66430 }, { "epoch": 0.89, "learning_rate": 1.4841001986257985e-06, "loss": 0.6351, "step": 66435 }, { "epoch": 0.89, "learning_rate": 1.4823148447083269e-06, "loss": 1.0513, "step": 66440 }, { "epoch": 0.89, "learning_rate": 1.480530532506655e-06, "loss": 0.5939, "step": 66445 }, { "epoch": 0.89, "learning_rate": 1.478747262099811e-06, "loss": 0.7648, "step": 66450 }, { "epoch": 0.89, "learning_rate": 1.4769650335667962e-06, "loss": 1.5181, "step": 66455 }, { "epoch": 0.89, "learning_rate": 1.4751838469865415e-06, "loss": 1.1632, "step": 66460 }, { "epoch": 0.89, "learning_rate": 1.473403702437956e-06, "loss": 1.0103, "step": 66465 }, { "epoch": 0.89, "learning_rate": 1.4716245999998824e-06, "loss": 0.9483, "step": 66470 }, { "epoch": 0.89, "learning_rate": 1.469846539751135e-06, "loss": 0.7046, "step": 66475 }, { "epoch": 0.89, "learning_rate": 1.4680695217704655e-06, "loss": 0.5079, "step": 66480 }, { "epoch": 0.89, "learning_rate": 1.4662935461365878e-06, "loss": 1.056, "step": 66485 }, { "epoch": 0.89, "learning_rate": 1.4645186129281756e-06, "loss": 1.2226, "step": 66490 }, { "epoch": 0.89, "learning_rate": 1.462744722223844e-06, "loss": 1.0067, "step": 66495 }, { "epoch": 0.89, "learning_rate": 1.4609718741021627e-06, "loss": 0.552, "step": 66500 }, { "epoch": 0.89, "learning_rate": 1.4592000686416723e-06, "loss": 0.4224, "step": 66505 }, { "epoch": 0.89, "learning_rate": 1.4574293059208433e-06, "loss": 0.7369, "step": 66510 }, { "epoch": 0.89, "learning_rate": 1.4556595860181183e-06, "loss": 0.3677, "step": 66515 }, { "epoch": 0.89, "learning_rate": 1.4538909090118846e-06, "loss": 1.133, "step": 66520 }, { "epoch": 0.89, "learning_rate": 1.4521232749804825e-06, "loss": 1.1273, "step": 66525 }, { "epoch": 0.89, "learning_rate": 1.4503566840022187e-06, "loss": 0.6547, "step": 66530 }, { "epoch": 0.89, "learning_rate": 1.4485911361553361e-06, "loss": 0.6793, "step": 66535 }, { "epoch": 0.89, "learning_rate": 1.4468266315180445e-06, "loss": 0.6953, "step": 66540 }, { "epoch": 0.89, "learning_rate": 1.4450631701684951e-06, "loss": 0.8136, "step": 66545 }, { "epoch": 0.89, "learning_rate": 1.443300752184809e-06, "loss": 0.6512, "step": 66550 }, { "epoch": 0.89, "learning_rate": 1.4415393776450487e-06, "loss": 1.0251, "step": 66555 }, { "epoch": 0.89, "learning_rate": 1.439779046627232e-06, "loss": 0.3666, "step": 66560 }, { "epoch": 0.89, "learning_rate": 1.4380197592093442e-06, "loss": 0.4597, "step": 66565 }, { "epoch": 0.89, "learning_rate": 1.436261515469295e-06, "loss": 0.4733, "step": 66570 }, { "epoch": 0.89, "learning_rate": 1.4345043154849747e-06, "loss": 0.7522, "step": 66575 }, { "epoch": 0.89, "learning_rate": 1.4327481593342241e-06, "loss": 0.7257, "step": 66580 }, { "epoch": 0.89, "learning_rate": 1.4309930470948251e-06, "loss": 0.7348, "step": 66585 }, { "epoch": 0.89, "learning_rate": 1.4292389788445242e-06, "loss": 0.5339, "step": 66590 }, { "epoch": 0.89, "learning_rate": 1.4274859546610092e-06, "loss": 0.6617, "step": 66595 }, { "epoch": 0.89, "learning_rate": 1.4257339746219428e-06, "loss": 0.9014, "step": 66600 }, { "epoch": 0.89, "learning_rate": 1.4239830388049214e-06, "loss": 0.7164, "step": 66605 }, { "epoch": 0.89, "learning_rate": 1.4222331472875022e-06, "loss": 0.637, "step": 66610 }, { "epoch": 0.89, "learning_rate": 1.420484300147204e-06, "loss": 0.5914, "step": 66615 }, { "epoch": 0.89, "learning_rate": 1.4187364974614813e-06, "loss": 0.9094, "step": 66620 }, { "epoch": 0.89, "learning_rate": 1.4169897393077613e-06, "loss": 0.4181, "step": 66625 }, { "epoch": 0.89, "learning_rate": 1.4152440257634125e-06, "loss": 0.5926, "step": 66630 }, { "epoch": 0.89, "learning_rate": 1.4134993569057619e-06, "loss": 0.2179, "step": 66635 }, { "epoch": 0.89, "learning_rate": 1.4117557328120923e-06, "loss": 1.2283, "step": 66640 }, { "epoch": 0.89, "learning_rate": 1.4100131535596334e-06, "loss": 1.0704, "step": 66645 }, { "epoch": 0.89, "learning_rate": 1.408271619225579e-06, "loss": 0.7186, "step": 66650 }, { "epoch": 0.89, "learning_rate": 1.4065311298870592e-06, "loss": 0.5855, "step": 66655 }, { "epoch": 0.89, "learning_rate": 1.4047916856211791e-06, "loss": 0.5331, "step": 66660 }, { "epoch": 0.89, "learning_rate": 1.4030532865049878e-06, "loss": 0.4687, "step": 66665 }, { "epoch": 0.89, "learning_rate": 1.4013159326154768e-06, "loss": 0.5554, "step": 66670 }, { "epoch": 0.89, "learning_rate": 1.3995796240296204e-06, "loss": 0.1999, "step": 66675 }, { "epoch": 0.89, "learning_rate": 1.3978443608243074e-06, "loss": 0.6079, "step": 66680 }, { "epoch": 0.89, "learning_rate": 1.3961101430764122e-06, "loss": 0.294, "step": 66685 }, { "epoch": 0.89, "learning_rate": 1.3943769708627569e-06, "loss": 1.3402, "step": 66690 }, { "epoch": 0.89, "learning_rate": 1.392644844260102e-06, "loss": 1.0015, "step": 66695 }, { "epoch": 0.89, "learning_rate": 1.390913763345178e-06, "loss": 1.721, "step": 66700 }, { "epoch": 0.89, "learning_rate": 1.3891837281946596e-06, "loss": 0.4633, "step": 66705 }, { "epoch": 0.89, "learning_rate": 1.3874547388851827e-06, "loss": 0.4608, "step": 66710 }, { "epoch": 0.89, "learning_rate": 1.3857267954933334e-06, "loss": 1.1028, "step": 66715 }, { "epoch": 0.89, "learning_rate": 1.383999898095642e-06, "loss": 1.1654, "step": 66720 }, { "epoch": 0.89, "learning_rate": 1.382274046768617e-06, "loss": 0.4904, "step": 66725 }, { "epoch": 0.89, "learning_rate": 1.3805492415886912e-06, "loss": 0.2148, "step": 66730 }, { "epoch": 0.89, "learning_rate": 1.3788254826322704e-06, "loss": 0.5271, "step": 66735 }, { "epoch": 0.89, "learning_rate": 1.3771027699757077e-06, "loss": 0.3769, "step": 66740 }, { "epoch": 0.89, "learning_rate": 1.3753811036953058e-06, "loss": 0.9405, "step": 66745 }, { "epoch": 0.89, "learning_rate": 1.3736604838673367e-06, "loss": 0.6007, "step": 66750 }, { "epoch": 0.89, "learning_rate": 1.3719409105680092e-06, "loss": 0.7083, "step": 66755 }, { "epoch": 0.89, "learning_rate": 1.37022238387349e-06, "loss": 0.3343, "step": 66760 }, { "epoch": 0.89, "learning_rate": 1.368504903859902e-06, "loss": 0.4132, "step": 66765 }, { "epoch": 0.89, "learning_rate": 1.3667884706033224e-06, "loss": 0.5477, "step": 66770 }, { "epoch": 0.89, "learning_rate": 1.3650730841797826e-06, "loss": 0.0981, "step": 66775 }, { "epoch": 0.89, "learning_rate": 1.3633587446652607e-06, "loss": 0.5201, "step": 66780 }, { "epoch": 0.89, "learning_rate": 1.3616454521357014e-06, "loss": 0.7253, "step": 66785 }, { "epoch": 0.89, "learning_rate": 1.3599332066669828e-06, "loss": 0.5286, "step": 66790 }, { "epoch": 0.89, "learning_rate": 1.3582220083349556e-06, "loss": 0.8537, "step": 66795 }, { "epoch": 0.9, "learning_rate": 1.3565118572154257e-06, "loss": 0.4099, "step": 66800 }, { "epoch": 0.9, "learning_rate": 1.3548027533841268e-06, "loss": 0.5264, "step": 66805 }, { "epoch": 0.9, "learning_rate": 1.353094696916779e-06, "loss": 0.4367, "step": 66810 }, { "epoch": 0.9, "learning_rate": 1.3513876878890276e-06, "loss": 1.0109, "step": 66815 }, { "epoch": 0.9, "learning_rate": 1.3496817263764976e-06, "loss": 0.3389, "step": 66820 }, { "epoch": 0.9, "learning_rate": 1.347976812454746e-06, "loss": 1.3161, "step": 66825 }, { "epoch": 0.9, "learning_rate": 1.3462729461992923e-06, "loss": 0.8018, "step": 66830 }, { "epoch": 0.9, "learning_rate": 1.3445701276856183e-06, "loss": 1.1727, "step": 66835 }, { "epoch": 0.9, "learning_rate": 1.3428683569891353e-06, "loss": 0.9352, "step": 66840 }, { "epoch": 0.9, "learning_rate": 1.3411676341852337e-06, "loss": 0.8416, "step": 66845 }, { "epoch": 0.9, "learning_rate": 1.3394679593492471e-06, "loss": 1.3385, "step": 66850 }, { "epoch": 0.9, "learning_rate": 1.3377693325564543e-06, "loss": 0.7622, "step": 66855 }, { "epoch": 0.9, "learning_rate": 1.3360717538821066e-06, "loss": 0.9787, "step": 66860 }, { "epoch": 0.9, "learning_rate": 1.3343752234013933e-06, "loss": 1.1386, "step": 66865 }, { "epoch": 0.9, "learning_rate": 1.3326797411894604e-06, "loss": 0.7863, "step": 66870 }, { "epoch": 0.9, "learning_rate": 1.3309853073214086e-06, "loss": 0.4954, "step": 66875 }, { "epoch": 0.9, "learning_rate": 1.3292919218722999e-06, "loss": 0.3982, "step": 66880 }, { "epoch": 0.9, "learning_rate": 1.3275995849171385e-06, "loss": 1.5217, "step": 66885 }, { "epoch": 0.9, "learning_rate": 1.3259082965308812e-06, "loss": 1.0395, "step": 66890 }, { "epoch": 0.9, "learning_rate": 1.3242180567884566e-06, "loss": 1.1341, "step": 66895 }, { "epoch": 0.9, "learning_rate": 1.3225288657647162e-06, "loss": 0.46, "step": 66900 }, { "epoch": 0.9, "learning_rate": 1.3208407235344945e-06, "loss": 1.483, "step": 66905 }, { "epoch": 0.9, "learning_rate": 1.3191536301725732e-06, "loss": 0.5592, "step": 66910 }, { "epoch": 0.9, "learning_rate": 1.3174675857536678e-06, "loss": 0.2673, "step": 66915 }, { "epoch": 0.9, "learning_rate": 1.3157825903524713e-06, "loss": 0.5443, "step": 66920 }, { "epoch": 0.9, "learning_rate": 1.3140986440436127e-06, "loss": 1.091, "step": 66925 }, { "epoch": 0.9, "learning_rate": 1.3124157469016935e-06, "loss": 1.0137, "step": 66930 }, { "epoch": 0.9, "learning_rate": 1.3107338990012486e-06, "loss": 0.9883, "step": 66935 }, { "epoch": 0.9, "learning_rate": 1.3090531004167766e-06, "loss": 1.0791, "step": 66940 }, { "epoch": 0.9, "learning_rate": 1.3073733512227377e-06, "loss": 0.8846, "step": 66945 }, { "epoch": 0.9, "learning_rate": 1.3056946514935191e-06, "loss": 1.0292, "step": 66950 }, { "epoch": 0.9, "learning_rate": 1.3040170013034952e-06, "loss": 0.7714, "step": 66955 }, { "epoch": 0.9, "learning_rate": 1.3023404007269673e-06, "loss": 0.5616, "step": 66960 }, { "epoch": 0.9, "learning_rate": 1.300664849838204e-06, "loss": 1.2068, "step": 66965 }, { "epoch": 0.9, "learning_rate": 1.2989903487114263e-06, "loss": 0.9901, "step": 66970 }, { "epoch": 0.9, "learning_rate": 1.2973168974208028e-06, "loss": 1.0161, "step": 66975 }, { "epoch": 0.9, "learning_rate": 1.2956444960404602e-06, "loss": 0.3056, "step": 66980 }, { "epoch": 0.9, "learning_rate": 1.2939731446444752e-06, "loss": 0.8209, "step": 66985 }, { "epoch": 0.9, "learning_rate": 1.2923028433068834e-06, "loss": 0.2315, "step": 66990 }, { "epoch": 0.9, "learning_rate": 1.2906335921016726e-06, "loss": 0.5146, "step": 66995 }, { "epoch": 0.9, "learning_rate": 1.2889653911027726e-06, "loss": 0.5436, "step": 67000 }, { "epoch": 0.9, "learning_rate": 1.2872982403840883e-06, "loss": 0.1738, "step": 67005 }, { "epoch": 0.9, "learning_rate": 1.2856321400194633e-06, "loss": 0.5416, "step": 67010 }, { "epoch": 0.9, "learning_rate": 1.2839670900826884e-06, "loss": 0.2996, "step": 67015 }, { "epoch": 0.9, "learning_rate": 1.2823030906475325e-06, "loss": 0.6828, "step": 67020 }, { "epoch": 0.9, "learning_rate": 1.2806401417876867e-06, "loss": 0.6271, "step": 67025 }, { "epoch": 0.9, "learning_rate": 1.2789782435768228e-06, "loss": 0.8603, "step": 67030 }, { "epoch": 0.9, "learning_rate": 1.2773173960885455e-06, "loss": 0.7474, "step": 67035 }, { "epoch": 0.9, "learning_rate": 1.2756575993964292e-06, "loss": 0.64, "step": 67040 }, { "epoch": 0.9, "learning_rate": 1.2739988535739933e-06, "loss": 0.4566, "step": 67045 }, { "epoch": 0.9, "learning_rate": 1.2723411586947064e-06, "loss": 0.8456, "step": 67050 }, { "epoch": 0.9, "learning_rate": 1.2706845148320073e-06, "loss": 0.3741, "step": 67055 }, { "epoch": 0.9, "learning_rate": 1.269028922059265e-06, "loss": 0.5703, "step": 67060 }, { "epoch": 0.9, "learning_rate": 1.2673743804498206e-06, "loss": 0.6525, "step": 67065 }, { "epoch": 0.9, "learning_rate": 1.2657208900769629e-06, "loss": 0.4328, "step": 67070 }, { "epoch": 0.9, "learning_rate": 1.264068451013925e-06, "loss": 0.7238, "step": 67075 }, { "epoch": 0.9, "learning_rate": 1.2624170633339122e-06, "loss": 0.1972, "step": 67080 }, { "epoch": 0.9, "learning_rate": 1.2607667271100687e-06, "loss": 0.465, "step": 67085 }, { "epoch": 0.9, "learning_rate": 1.2591174424154945e-06, "loss": 0.283, "step": 67090 }, { "epoch": 0.9, "learning_rate": 1.257469209323242e-06, "loss": 0.9347, "step": 67095 }, { "epoch": 0.9, "learning_rate": 1.2558220279063283e-06, "loss": 0.5835, "step": 67100 }, { "epoch": 0.9, "learning_rate": 1.2541758982377084e-06, "loss": 0.66, "step": 67105 }, { "epoch": 0.9, "learning_rate": 1.252530820390299e-06, "loss": 0.1379, "step": 67110 }, { "epoch": 0.9, "learning_rate": 1.25088679443697e-06, "loss": 0.9774, "step": 67115 }, { "epoch": 0.9, "learning_rate": 1.2492438204505436e-06, "loss": 0.9887, "step": 67120 }, { "epoch": 0.9, "learning_rate": 1.247601898503792e-06, "loss": 0.4702, "step": 67125 }, { "epoch": 0.9, "learning_rate": 1.245961028669454e-06, "loss": 0.753, "step": 67130 }, { "epoch": 0.9, "learning_rate": 1.244321211020197e-06, "loss": 0.5063, "step": 67135 }, { "epoch": 0.9, "learning_rate": 1.2426824456286678e-06, "loss": 0.5405, "step": 67140 }, { "epoch": 0.9, "learning_rate": 1.2410447325674478e-06, "loss": 0.9083, "step": 67145 }, { "epoch": 0.9, "learning_rate": 1.23940807190909e-06, "loss": 0.9322, "step": 67150 }, { "epoch": 0.9, "learning_rate": 1.2377724637260807e-06, "loss": 0.8699, "step": 67155 }, { "epoch": 0.9, "learning_rate": 1.236137908090873e-06, "loss": 1.0646, "step": 67160 }, { "epoch": 0.9, "learning_rate": 1.234504405075873e-06, "loss": 0.4792, "step": 67165 }, { "epoch": 0.9, "learning_rate": 1.2328719547534256e-06, "loss": 0.8173, "step": 67170 }, { "epoch": 0.9, "learning_rate": 1.2312405571958535e-06, "loss": 0.1726, "step": 67175 }, { "epoch": 0.9, "learning_rate": 1.2296102124754127e-06, "loss": 0.557, "step": 67180 }, { "epoch": 0.9, "learning_rate": 1.227980920664315e-06, "loss": 0.7167, "step": 67185 }, { "epoch": 0.9, "learning_rate": 1.2263526818347387e-06, "loss": 0.1365, "step": 67190 }, { "epoch": 0.9, "learning_rate": 1.2247254960588038e-06, "loss": 1.3194, "step": 67195 }, { "epoch": 0.9, "learning_rate": 1.2230993634085836e-06, "loss": 0.5045, "step": 67200 }, { "epoch": 0.9, "learning_rate": 1.2214742839561088e-06, "loss": 0.4927, "step": 67205 }, { "epoch": 0.9, "learning_rate": 1.219850257773364e-06, "loss": 0.781, "step": 67210 }, { "epoch": 0.9, "learning_rate": 1.2182272849322857e-06, "loss": 0.3616, "step": 67215 }, { "epoch": 0.9, "learning_rate": 1.2166053655047582e-06, "loss": 0.6939, "step": 67220 }, { "epoch": 0.9, "learning_rate": 1.2149844995626325e-06, "loss": 0.6887, "step": 67225 }, { "epoch": 0.9, "learning_rate": 1.2133646871776982e-06, "loss": 1.1741, "step": 67230 }, { "epoch": 0.9, "learning_rate": 1.2117459284217065e-06, "loss": 0.0822, "step": 67235 }, { "epoch": 0.9, "learning_rate": 1.2101282233663691e-06, "loss": 0.8054, "step": 67240 }, { "epoch": 0.9, "learning_rate": 1.2085115720833262e-06, "loss": 0.821, "step": 67245 }, { "epoch": 0.9, "learning_rate": 1.2068959746441983e-06, "loss": 0.6178, "step": 67250 }, { "epoch": 0.9, "learning_rate": 1.2052814311205447e-06, "loss": 1.1502, "step": 67255 }, { "epoch": 0.9, "learning_rate": 1.203667941583883e-06, "loss": 0.6019, "step": 67260 }, { "epoch": 0.9, "learning_rate": 1.2020555061056844e-06, "loss": 0.3865, "step": 67265 }, { "epoch": 0.9, "learning_rate": 1.2004441247573634e-06, "loss": 0.8119, "step": 67270 }, { "epoch": 0.9, "learning_rate": 1.1988337976103103e-06, "loss": 0.8985, "step": 67275 }, { "epoch": 0.9, "learning_rate": 1.1972245247358404e-06, "loss": 0.3676, "step": 67280 }, { "epoch": 0.9, "learning_rate": 1.1956163062052466e-06, "loss": 0.4843, "step": 67285 }, { "epoch": 0.9, "learning_rate": 1.194009142089758e-06, "loss": 0.6678, "step": 67290 }, { "epoch": 0.9, "learning_rate": 1.192403032460565e-06, "loss": 0.9334, "step": 67295 }, { "epoch": 0.9, "learning_rate": 1.1907979773888161e-06, "loss": 1.1414, "step": 67300 }, { "epoch": 0.9, "learning_rate": 1.1891939769456017e-06, "loss": 0.3759, "step": 67305 }, { "epoch": 0.9, "learning_rate": 1.1875910312019734e-06, "loss": 0.7252, "step": 67310 }, { "epoch": 0.9, "learning_rate": 1.1859891402289297e-06, "loss": 0.2622, "step": 67315 }, { "epoch": 0.9, "learning_rate": 1.1843883040974335e-06, "loss": 0.474, "step": 67320 }, { "epoch": 0.9, "learning_rate": 1.1827885228783863e-06, "loss": 1.0692, "step": 67325 }, { "epoch": 0.9, "learning_rate": 1.181189796642654e-06, "loss": 1.0629, "step": 67330 }, { "epoch": 0.9, "learning_rate": 1.1795921254610542e-06, "loss": 1.2687, "step": 67335 }, { "epoch": 0.9, "learning_rate": 1.1779955094043533e-06, "loss": 0.8129, "step": 67340 }, { "epoch": 0.9, "learning_rate": 1.1763999485432692e-06, "loss": 1.1172, "step": 67345 }, { "epoch": 0.9, "learning_rate": 1.1748054429484901e-06, "loss": 0.8145, "step": 67350 }, { "epoch": 0.9, "learning_rate": 1.173211992690626e-06, "loss": 0.4235, "step": 67355 }, { "epoch": 0.9, "learning_rate": 1.1716195978402761e-06, "loss": 0.5533, "step": 67360 }, { "epoch": 0.9, "learning_rate": 1.1700282584679673e-06, "loss": 0.1889, "step": 67365 }, { "epoch": 0.9, "learning_rate": 1.1684379746441849e-06, "loss": 0.2241, "step": 67370 }, { "epoch": 0.9, "learning_rate": 1.166848746439378e-06, "loss": 1.0597, "step": 67375 }, { "epoch": 0.9, "learning_rate": 1.1652605739239348e-06, "loss": 1.0781, "step": 67380 }, { "epoch": 0.9, "learning_rate": 1.1636734571682156e-06, "loss": 0.7489, "step": 67385 }, { "epoch": 0.9, "learning_rate": 1.1620873962425033e-06, "loss": 1.1701, "step": 67390 }, { "epoch": 0.9, "learning_rate": 1.1605023912170664e-06, "loss": 0.6297, "step": 67395 }, { "epoch": 0.9, "learning_rate": 1.1589184421621103e-06, "loss": 0.4713, "step": 67400 }, { "epoch": 0.9, "learning_rate": 1.1573355491477895e-06, "loss": 0.4931, "step": 67405 }, { "epoch": 0.9, "learning_rate": 1.155753712244223e-06, "loss": 0.596, "step": 67410 }, { "epoch": 0.9, "learning_rate": 1.1541729315214827e-06, "loss": 0.6265, "step": 67415 }, { "epoch": 0.9, "learning_rate": 1.1525932070495821e-06, "loss": 0.565, "step": 67420 }, { "epoch": 0.9, "learning_rate": 1.1510145388984956e-06, "loss": 0.8066, "step": 67425 }, { "epoch": 0.9, "learning_rate": 1.1494369271381534e-06, "loss": 0.5091, "step": 67430 }, { "epoch": 0.9, "learning_rate": 1.1478603718384355e-06, "loss": 0.5606, "step": 67435 }, { "epoch": 0.9, "learning_rate": 1.1462848730691727e-06, "loss": 0.1436, "step": 67440 }, { "epoch": 0.9, "learning_rate": 1.144710430900156e-06, "loss": 0.67, "step": 67445 }, { "epoch": 0.9, "learning_rate": 1.1431370454011215e-06, "loss": 0.535, "step": 67450 }, { "epoch": 0.9, "learning_rate": 1.1415647166417631e-06, "loss": 1.3667, "step": 67455 }, { "epoch": 0.9, "learning_rate": 1.1399934446917337e-06, "loss": 0.516, "step": 67460 }, { "epoch": 0.9, "learning_rate": 1.1384232296206194e-06, "loss": 0.2943, "step": 67465 }, { "epoch": 0.9, "learning_rate": 1.1368540714979836e-06, "loss": 0.3559, "step": 67470 }, { "epoch": 0.9, "learning_rate": 1.1352859703933294e-06, "loss": 0.4268, "step": 67475 }, { "epoch": 0.9, "learning_rate": 1.1337189263761122e-06, "loss": 0.7595, "step": 67480 }, { "epoch": 0.9, "learning_rate": 1.1321529395157488e-06, "loss": 1.0594, "step": 67485 }, { "epoch": 0.9, "learning_rate": 1.130588009881603e-06, "loss": 0.4722, "step": 67490 }, { "epoch": 0.9, "learning_rate": 1.1290241375429971e-06, "loss": 0.6271, "step": 67495 }, { "epoch": 0.9, "learning_rate": 1.1274613225691954e-06, "loss": 0.9088, "step": 67500 }, { "epoch": 0.9, "learning_rate": 1.1258995650294258e-06, "loss": 0.5433, "step": 67505 }, { "epoch": 0.9, "learning_rate": 1.1243388649928716e-06, "loss": 0.8233, "step": 67510 }, { "epoch": 0.9, "learning_rate": 1.1227792225286526e-06, "loss": 0.4873, "step": 67515 }, { "epoch": 0.9, "learning_rate": 1.1212206377058664e-06, "loss": 2.079, "step": 67520 }, { "epoch": 0.9, "learning_rate": 1.1196631105935413e-06, "loss": 0.5088, "step": 67525 }, { "epoch": 0.9, "learning_rate": 1.1181066412606689e-06, "loss": 0.7431, "step": 67530 }, { "epoch": 0.9, "learning_rate": 1.1165512297761999e-06, "loss": 0.19, "step": 67535 }, { "epoch": 0.9, "learning_rate": 1.1149968762090234e-06, "loss": 0.9985, "step": 67540 }, { "epoch": 0.91, "learning_rate": 1.113443580627993e-06, "loss": 1.0965, "step": 67545 }, { "epoch": 0.91, "learning_rate": 1.111891343101909e-06, "loss": 1.0253, "step": 67550 }, { "epoch": 0.91, "learning_rate": 1.110340163699533e-06, "loss": 0.3805, "step": 67555 }, { "epoch": 0.91, "learning_rate": 1.1087900424895714e-06, "loss": 0.6007, "step": 67560 }, { "epoch": 0.91, "learning_rate": 1.107240979540683e-06, "loss": 0.6441, "step": 67565 }, { "epoch": 0.91, "learning_rate": 1.1056929749214962e-06, "loss": 0.362, "step": 67570 }, { "epoch": 0.91, "learning_rate": 1.1041460287005617e-06, "loss": 0.535, "step": 67575 }, { "epoch": 0.91, "learning_rate": 1.1026001409464165e-06, "loss": 0.7837, "step": 67580 }, { "epoch": 0.91, "learning_rate": 1.101055311727528e-06, "loss": 0.6089, "step": 67585 }, { "epoch": 0.91, "learning_rate": 1.0995115411123247e-06, "loss": 1.43, "step": 67590 }, { "epoch": 0.91, "learning_rate": 1.0979688291691936e-06, "loss": 1.6851, "step": 67595 }, { "epoch": 0.91, "learning_rate": 1.0964271759664608e-06, "loss": 0.3834, "step": 67600 }, { "epoch": 0.91, "learning_rate": 1.0948865815724268e-06, "loss": 0.7649, "step": 67605 }, { "epoch": 0.91, "learning_rate": 1.0933470460553152e-06, "loss": 0.727, "step": 67610 }, { "epoch": 0.91, "learning_rate": 1.0918085694833324e-06, "loss": 0.9983, "step": 67615 }, { "epoch": 0.91, "learning_rate": 1.0902711519246212e-06, "loss": 0.8769, "step": 67620 }, { "epoch": 0.91, "learning_rate": 1.088734793447277e-06, "loss": 1.0149, "step": 67625 }, { "epoch": 0.91, "learning_rate": 1.0871994941193592e-06, "loss": 0.6665, "step": 67630 }, { "epoch": 0.91, "learning_rate": 1.0856652540088746e-06, "loss": 0.4131, "step": 67635 }, { "epoch": 0.91, "learning_rate": 1.0841320731837745e-06, "loss": 0.809, "step": 67640 }, { "epoch": 0.91, "learning_rate": 1.0825999517119822e-06, "loss": 0.8722, "step": 67645 }, { "epoch": 0.91, "learning_rate": 1.0810688896613547e-06, "loss": 0.4556, "step": 67650 }, { "epoch": 0.91, "learning_rate": 1.0795388870997124e-06, "loss": 0.5288, "step": 67655 }, { "epoch": 0.91, "learning_rate": 1.0780099440948238e-06, "loss": 1.1311, "step": 67660 }, { "epoch": 0.91, "learning_rate": 1.0764820607144205e-06, "loss": 0.9581, "step": 67665 }, { "epoch": 0.91, "learning_rate": 1.074955237026179e-06, "loss": 0.4927, "step": 67670 }, { "epoch": 0.91, "learning_rate": 1.0734294730977201e-06, "loss": 1.3488, "step": 67675 }, { "epoch": 0.91, "learning_rate": 1.0719047689966427e-06, "loss": 0.8026, "step": 67680 }, { "epoch": 0.91, "learning_rate": 1.0703811247904705e-06, "loss": 0.8085, "step": 67685 }, { "epoch": 0.91, "learning_rate": 1.0688585405466994e-06, "loss": 0.7588, "step": 67690 }, { "epoch": 0.91, "learning_rate": 1.067337016332773e-06, "loss": 1.0307, "step": 67695 }, { "epoch": 0.91, "learning_rate": 1.0658165522160785e-06, "loss": 1.2758, "step": 67700 }, { "epoch": 0.91, "learning_rate": 1.064297148263979e-06, "loss": 0.4141, "step": 67705 }, { "epoch": 0.91, "learning_rate": 1.0627788045437653e-06, "loss": 0.4072, "step": 67710 }, { "epoch": 0.91, "learning_rate": 1.0612615211227001e-06, "loss": 0.467, "step": 67715 }, { "epoch": 0.91, "learning_rate": 1.059745298067985e-06, "loss": 0.6658, "step": 67720 }, { "epoch": 0.91, "learning_rate": 1.058230135446786e-06, "loss": 0.5941, "step": 67725 }, { "epoch": 0.91, "learning_rate": 1.0567160333262134e-06, "loss": 1.2007, "step": 67730 }, { "epoch": 0.91, "learning_rate": 1.0552029917733352e-06, "loss": 0.8046, "step": 67735 }, { "epoch": 0.91, "learning_rate": 1.0536910108551733e-06, "loss": 0.7321, "step": 67740 }, { "epoch": 0.91, "learning_rate": 1.0521800906387019e-06, "loss": 0.5121, "step": 67745 }, { "epoch": 0.91, "learning_rate": 1.0506702311908423e-06, "loss": 1.1457, "step": 67750 }, { "epoch": 0.91, "learning_rate": 1.049161432578477e-06, "loss": 0.4168, "step": 67755 }, { "epoch": 0.91, "learning_rate": 1.0476536948684418e-06, "loss": 1.2989, "step": 67760 }, { "epoch": 0.91, "learning_rate": 1.0461470181275163e-06, "loss": 0.956, "step": 67765 }, { "epoch": 0.91, "learning_rate": 1.044641402422436e-06, "loss": 0.487, "step": 67770 }, { "epoch": 0.91, "learning_rate": 1.0431368478199033e-06, "loss": 0.8883, "step": 67775 }, { "epoch": 0.91, "learning_rate": 1.0416333543865536e-06, "loss": 0.2734, "step": 67780 }, { "epoch": 0.91, "learning_rate": 1.040130922188981e-06, "loss": 1.4646, "step": 67785 }, { "epoch": 0.91, "learning_rate": 1.0386295512937517e-06, "loss": 0.7574, "step": 67790 }, { "epoch": 0.91, "learning_rate": 1.0371292417673484e-06, "loss": 1.1625, "step": 67795 }, { "epoch": 0.91, "learning_rate": 1.035629993676243e-06, "loss": 1.2256, "step": 67800 }, { "epoch": 0.91, "learning_rate": 1.0341318070868383e-06, "loss": 0.9217, "step": 67805 }, { "epoch": 0.91, "learning_rate": 1.032634682065492e-06, "loss": 0.3449, "step": 67810 }, { "epoch": 0.91, "learning_rate": 1.0311386186785315e-06, "loss": 0.3283, "step": 67815 }, { "epoch": 0.91, "learning_rate": 1.0296436169922096e-06, "loss": 0.7881, "step": 67820 }, { "epoch": 0.91, "learning_rate": 1.028149677072765e-06, "loss": 0.4931, "step": 67825 }, { "epoch": 0.91, "learning_rate": 1.0266567989863557e-06, "loss": 0.8156, "step": 67830 }, { "epoch": 0.91, "learning_rate": 1.0251649827991177e-06, "loss": 0.0427, "step": 67835 }, { "epoch": 0.91, "learning_rate": 1.023674228577129e-06, "loss": 1.2695, "step": 67840 }, { "epoch": 0.91, "learning_rate": 1.0221845363864196e-06, "loss": 0.406, "step": 67845 }, { "epoch": 0.91, "learning_rate": 1.0206959062929817e-06, "loss": 0.9218, "step": 67850 }, { "epoch": 0.91, "learning_rate": 1.0192083383627483e-06, "loss": 0.9266, "step": 67855 }, { "epoch": 0.91, "learning_rate": 1.017721832661611e-06, "loss": 0.8562, "step": 67860 }, { "epoch": 0.91, "learning_rate": 1.0162363892554205e-06, "loss": 1.2135, "step": 67865 }, { "epoch": 0.91, "learning_rate": 1.014752008209971e-06, "loss": 0.191, "step": 67870 }, { "epoch": 0.91, "learning_rate": 1.0132686895910127e-06, "loss": 0.6042, "step": 67875 }, { "epoch": 0.91, "learning_rate": 1.0117864334642486e-06, "loss": 0.672, "step": 67880 }, { "epoch": 0.91, "learning_rate": 1.0103052398953373e-06, "loss": 1.0415, "step": 67885 }, { "epoch": 0.91, "learning_rate": 1.0088251089498873e-06, "loss": 1.6006, "step": 67890 }, { "epoch": 0.91, "learning_rate": 1.0073460406934576e-06, "loss": 0.9716, "step": 67895 }, { "epoch": 0.91, "learning_rate": 1.0058680351915734e-06, "loss": 0.4599, "step": 67900 }, { "epoch": 0.91, "learning_rate": 1.0043910925096906e-06, "loss": 0.7088, "step": 67905 }, { "epoch": 0.91, "learning_rate": 1.0029152127132374e-06, "loss": 0.4464, "step": 67910 }, { "epoch": 0.91, "learning_rate": 1.0014403958675893e-06, "loss": 0.6201, "step": 67915 }, { "epoch": 0.91, "learning_rate": 9.999666420380666e-07, "loss": 1.1388, "step": 67920 }, { "epoch": 0.91, "learning_rate": 9.984939512899555e-07, "loss": 1.4636, "step": 67925 }, { "epoch": 0.91, "learning_rate": 9.970223236884874e-07, "loss": 0.3795, "step": 67930 }, { "epoch": 0.91, "learning_rate": 9.955517592988462e-07, "loss": 0.5555, "step": 67935 }, { "epoch": 0.91, "learning_rate": 9.940822581861714e-07, "loss": 1.0339, "step": 67940 }, { "epoch": 0.91, "learning_rate": 9.926138204155526e-07, "loss": 1.0063, "step": 67945 }, { "epoch": 0.91, "learning_rate": 9.91146446052041e-07, "loss": 0.6422, "step": 67950 }, { "epoch": 0.91, "learning_rate": 9.896801351606255e-07, "loss": 0.3625, "step": 67955 }, { "epoch": 0.91, "learning_rate": 9.88214887806263e-07, "loss": 1.0118, "step": 67960 }, { "epoch": 0.91, "learning_rate": 9.867507040538515e-07, "loss": 1.0526, "step": 67965 }, { "epoch": 0.91, "learning_rate": 9.852875839682502e-07, "loss": 1.2417, "step": 67970 }, { "epoch": 0.91, "learning_rate": 9.838255276142655e-07, "loss": 0.5743, "step": 67975 }, { "epoch": 0.91, "learning_rate": 9.823645350566651e-07, "loss": 1.0864, "step": 67980 }, { "epoch": 0.91, "learning_rate": 9.809046063601556e-07, "loss": 0.768, "step": 67985 }, { "epoch": 0.91, "learning_rate": 9.794457415894076e-07, "loss": 1.1833, "step": 67990 }, { "epoch": 0.91, "learning_rate": 9.77987940809047e-07, "loss": 1.3434, "step": 67995 }, { "epoch": 0.91, "learning_rate": 9.765312040836388e-07, "loss": 0.5119, "step": 68000 }, { "epoch": 0.91, "learning_rate": 9.750755314777093e-07, "loss": 0.1277, "step": 68005 }, { "epoch": 0.91, "learning_rate": 9.736209230557486e-07, "loss": 0.7755, "step": 68010 }, { "epoch": 0.91, "learning_rate": 9.721673788821745e-07, "loss": 0.8367, "step": 68015 }, { "epoch": 0.91, "learning_rate": 9.707148990213827e-07, "loss": 0.6397, "step": 68020 }, { "epoch": 0.91, "learning_rate": 9.692634835377052e-07, "loss": 0.713, "step": 68025 }, { "epoch": 0.91, "learning_rate": 9.678131324954292e-07, "loss": 0.3992, "step": 68030 }, { "epoch": 0.91, "learning_rate": 9.663638459588066e-07, "loss": 0.8137, "step": 68035 }, { "epoch": 0.91, "learning_rate": 9.64915623992027e-07, "loss": 1.0908, "step": 68040 }, { "epoch": 0.91, "learning_rate": 9.634684666592425e-07, "loss": 0.8764, "step": 68045 }, { "epoch": 0.91, "learning_rate": 9.620223740245516e-07, "loss": 1.1405, "step": 68050 }, { "epoch": 0.91, "learning_rate": 9.605773461520112e-07, "loss": 0.7884, "step": 68055 }, { "epoch": 0.91, "learning_rate": 9.591333831056342e-07, "loss": 0.9039, "step": 68060 }, { "epoch": 0.91, "learning_rate": 9.576904849493695e-07, "loss": 0.5336, "step": 68065 }, { "epoch": 0.91, "learning_rate": 9.56248651747141e-07, "loss": 0.8142, "step": 68070 }, { "epoch": 0.91, "learning_rate": 9.548078835628084e-07, "loss": 0.6272, "step": 68075 }, { "epoch": 0.91, "learning_rate": 9.533681804601902e-07, "loss": 0.3909, "step": 68080 }, { "epoch": 0.91, "learning_rate": 9.519295425030633e-07, "loss": 0.5007, "step": 68085 }, { "epoch": 0.91, "learning_rate": 9.50491969755149e-07, "loss": 1.295, "step": 68090 }, { "epoch": 0.91, "learning_rate": 9.49055462280124e-07, "loss": 0.4431, "step": 68095 }, { "epoch": 0.91, "learning_rate": 9.476200201416153e-07, "loss": 0.7717, "step": 68100 }, { "epoch": 0.91, "learning_rate": 9.461856434032135e-07, "loss": 0.9033, "step": 68105 }, { "epoch": 0.91, "learning_rate": 9.447523321284513e-07, "loss": 0.6809, "step": 68110 }, { "epoch": 0.91, "learning_rate": 9.433200863808111e-07, "loss": 0.2122, "step": 68115 }, { "epoch": 0.91, "learning_rate": 9.418889062237452e-07, "loss": 0.4276, "step": 68120 }, { "epoch": 0.91, "learning_rate": 9.404587917206359e-07, "loss": 0.9922, "step": 68125 }, { "epoch": 0.91, "learning_rate": 9.390297429348411e-07, "loss": 0.8181, "step": 68130 }, { "epoch": 0.91, "learning_rate": 9.376017599296544e-07, "loss": 0.9393, "step": 68135 }, { "epoch": 0.91, "learning_rate": 9.361748427683253e-07, "loss": 0.4296, "step": 68140 }, { "epoch": 0.91, "learning_rate": 9.347489915140672e-07, "loss": 0.5506, "step": 68145 }, { "epoch": 0.91, "learning_rate": 9.333242062300324e-07, "loss": 0.623, "step": 68150 }, { "epoch": 0.91, "learning_rate": 9.319004869793341e-07, "loss": 0.4736, "step": 68155 }, { "epoch": 0.91, "learning_rate": 9.30477833825033e-07, "loss": 0.6749, "step": 68160 }, { "epoch": 0.91, "learning_rate": 9.290562468301483e-07, "loss": 0.3308, "step": 68165 }, { "epoch": 0.91, "learning_rate": 9.276357260576546e-07, "loss": 0.4842, "step": 68170 }, { "epoch": 0.91, "learning_rate": 9.262162715704626e-07, "loss": 0.3213, "step": 68175 }, { "epoch": 0.91, "learning_rate": 9.247978834314525e-07, "loss": 0.8494, "step": 68180 }, { "epoch": 0.91, "learning_rate": 9.233805617034546e-07, "loss": 0.5103, "step": 68185 }, { "epoch": 0.91, "learning_rate": 9.21964306449244e-07, "loss": 0.4766, "step": 68190 }, { "epoch": 0.91, "learning_rate": 9.205491177315562e-07, "loss": 0.211, "step": 68195 }, { "epoch": 0.91, "learning_rate": 9.191349956130774e-07, "loss": 0.7615, "step": 68200 }, { "epoch": 0.91, "learning_rate": 9.177219401564463e-07, "loss": 0.2814, "step": 68205 }, { "epoch": 0.91, "learning_rate": 9.163099514242491e-07, "loss": 0.434, "step": 68210 }, { "epoch": 0.91, "learning_rate": 9.148990294790383e-07, "loss": 1.8496, "step": 68215 }, { "epoch": 0.91, "learning_rate": 9.134891743833085e-07, "loss": 0.6917, "step": 68220 }, { "epoch": 0.91, "learning_rate": 9.120803861995014e-07, "loss": 0.9388, "step": 68225 }, { "epoch": 0.91, "learning_rate": 9.10672664990031e-07, "loss": 0.4499, "step": 68230 }, { "epoch": 0.91, "learning_rate": 9.092660108172418e-07, "loss": 0.9896, "step": 68235 }, { "epoch": 0.91, "learning_rate": 9.078604237434479e-07, "loss": 0.7349, "step": 68240 }, { "epoch": 0.91, "learning_rate": 9.064559038309106e-07, "loss": 0.5947, "step": 68245 }, { "epoch": 0.91, "learning_rate": 9.050524511418357e-07, "loss": 0.3809, "step": 68250 }, { "epoch": 0.91, "learning_rate": 9.036500657383956e-07, "loss": 1.2552, "step": 68255 }, { "epoch": 0.91, "learning_rate": 9.022487476827102e-07, "loss": 0.5529, "step": 68260 }, { "epoch": 0.91, "learning_rate": 9.008484970368463e-07, "loss": 0.5531, "step": 68265 }, { "epoch": 0.91, "learning_rate": 8.994493138628268e-07, "loss": 0.2028, "step": 68270 }, { "epoch": 0.91, "learning_rate": 8.980511982226297e-07, "loss": 0.9274, "step": 68275 }, { "epoch": 0.91, "learning_rate": 8.966541501781944e-07, "loss": 1.1722, "step": 68280 }, { "epoch": 0.91, "learning_rate": 8.952581697913908e-07, "loss": 0.5918, "step": 68285 }, { "epoch": 0.91, "learning_rate": 8.938632571240585e-07, "loss": 0.5751, "step": 68290 }, { "epoch": 0.92, "learning_rate": 8.92469412237984e-07, "loss": 0.5931, "step": 68295 }, { "epoch": 0.92, "learning_rate": 8.910766351949068e-07, "loss": 0.8329, "step": 68300 }, { "epoch": 0.92, "learning_rate": 8.896849260565248e-07, "loss": 0.5307, "step": 68305 }, { "epoch": 0.92, "learning_rate": 8.882942848844805e-07, "loss": 0.684, "step": 68310 }, { "epoch": 0.92, "learning_rate": 8.869047117403717e-07, "loss": 0.6081, "step": 68315 }, { "epoch": 0.92, "learning_rate": 8.855162066857464e-07, "loss": 0.6512, "step": 68320 }, { "epoch": 0.92, "learning_rate": 8.841287697821166e-07, "loss": 0.8484, "step": 68325 }, { "epoch": 0.92, "learning_rate": 8.82742401090933e-07, "loss": 1.0783, "step": 68330 }, { "epoch": 0.92, "learning_rate": 8.813571006736049e-07, "loss": 0.6965, "step": 68335 }, { "epoch": 0.92, "learning_rate": 8.799728685914998e-07, "loss": 0.4915, "step": 68340 }, { "epoch": 0.92, "learning_rate": 8.785897049059244e-07, "loss": 1.2615, "step": 68345 }, { "epoch": 0.92, "learning_rate": 8.77207609678149e-07, "loss": 1.053, "step": 68350 }, { "epoch": 0.92, "learning_rate": 8.758265829693968e-07, "loss": 0.7038, "step": 68355 }, { "epoch": 0.92, "learning_rate": 8.744466248408329e-07, "loss": 0.5223, "step": 68360 }, { "epoch": 0.92, "learning_rate": 8.730677353535916e-07, "loss": 1.0772, "step": 68365 }, { "epoch": 0.92, "learning_rate": 8.716899145687434e-07, "loss": 0.3633, "step": 68370 }, { "epoch": 0.92, "learning_rate": 8.703131625473204e-07, "loss": 0.6488, "step": 68375 }, { "epoch": 0.92, "learning_rate": 8.689374793503125e-07, "loss": 0.5216, "step": 68380 }, { "epoch": 0.92, "learning_rate": 8.675628650386458e-07, "loss": 0.6528, "step": 68385 }, { "epoch": 0.92, "learning_rate": 8.66189319673219e-07, "loss": 0.8158, "step": 68390 }, { "epoch": 0.92, "learning_rate": 8.648168433148613e-07, "loss": 0.8904, "step": 68395 }, { "epoch": 0.92, "learning_rate": 8.634454360243766e-07, "loss": 0.5468, "step": 68400 }, { "epoch": 0.92, "learning_rate": 8.620750978625081e-07, "loss": 0.5739, "step": 68405 }, { "epoch": 0.92, "learning_rate": 8.607058288899516e-07, "loss": 0.857, "step": 68410 }, { "epoch": 0.92, "learning_rate": 8.593376291673644e-07, "loss": 1.339, "step": 68415 }, { "epoch": 0.92, "learning_rate": 8.579704987553478e-07, "loss": 0.5595, "step": 68420 }, { "epoch": 0.92, "learning_rate": 8.566044377144588e-07, "loss": 1.1071, "step": 68425 }, { "epoch": 0.92, "learning_rate": 8.552394461052049e-07, "loss": 0.65, "step": 68430 }, { "epoch": 0.92, "learning_rate": 8.538755239880541e-07, "loss": 0.4618, "step": 68435 }, { "epoch": 0.92, "learning_rate": 8.525126714234194e-07, "loss": 0.39, "step": 68440 }, { "epoch": 0.92, "learning_rate": 8.511508884716635e-07, "loss": 0.4301, "step": 68445 }, { "epoch": 0.92, "learning_rate": 8.497901751931159e-07, "loss": 0.7897, "step": 68450 }, { "epoch": 0.92, "learning_rate": 8.484305316480395e-07, "loss": 1.2622, "step": 68455 }, { "epoch": 0.92, "learning_rate": 8.470719578966668e-07, "loss": 0.2066, "step": 68460 }, { "epoch": 0.92, "learning_rate": 8.457144539991718e-07, "loss": 1.1341, "step": 68465 }, { "epoch": 0.92, "learning_rate": 8.443580200156842e-07, "loss": 0.72, "step": 68470 }, { "epoch": 0.92, "learning_rate": 8.43002656006292e-07, "loss": 0.6571, "step": 68475 }, { "epoch": 0.92, "learning_rate": 8.416483620310278e-07, "loss": 0.606, "step": 68480 }, { "epoch": 0.92, "learning_rate": 8.402951381498797e-07, "loss": 0.356, "step": 68485 }, { "epoch": 0.92, "learning_rate": 8.389429844227914e-07, "loss": 0.8665, "step": 68490 }, { "epoch": 0.92, "learning_rate": 8.375919009096539e-07, "loss": 0.2428, "step": 68495 }, { "epoch": 0.92, "learning_rate": 8.362418876703165e-07, "loss": 0.591, "step": 68500 }, { "epoch": 0.92, "learning_rate": 8.348929447645731e-07, "loss": 0.6937, "step": 68505 }, { "epoch": 0.92, "learning_rate": 8.335450722521787e-07, "loss": 1.0299, "step": 68510 }, { "epoch": 0.92, "learning_rate": 8.321982701928383e-07, "loss": 0.2437, "step": 68515 }, { "epoch": 0.92, "learning_rate": 8.30852538646204e-07, "loss": 1.4289, "step": 68520 }, { "epoch": 0.92, "learning_rate": 8.295078776718896e-07, "loss": 0.8195, "step": 68525 }, { "epoch": 0.92, "learning_rate": 8.281642873294554e-07, "loss": 0.355, "step": 68530 }, { "epoch": 0.92, "learning_rate": 8.268217676784178e-07, "loss": 0.8805, "step": 68535 }, { "epoch": 0.92, "learning_rate": 8.254803187782351e-07, "loss": 1.0535, "step": 68540 }, { "epoch": 0.92, "learning_rate": 8.241399406883371e-07, "loss": 0.3899, "step": 68545 }, { "epoch": 0.92, "learning_rate": 8.228006334680932e-07, "loss": 0.4117, "step": 68550 }, { "epoch": 0.92, "learning_rate": 8.214623971768226e-07, "loss": 0.8334, "step": 68555 }, { "epoch": 0.92, "learning_rate": 8.201252318738112e-07, "loss": 1.3621, "step": 68560 }, { "epoch": 0.92, "learning_rate": 8.187891376182782e-07, "loss": 1.3257, "step": 68565 }, { "epoch": 0.92, "learning_rate": 8.174541144694153e-07, "loss": 0.3616, "step": 68570 }, { "epoch": 0.92, "learning_rate": 8.16120162486353e-07, "loss": 0.2832, "step": 68575 }, { "epoch": 0.92, "learning_rate": 8.147872817281771e-07, "loss": 0.8864, "step": 68580 }, { "epoch": 0.92, "learning_rate": 8.134554722539323e-07, "loss": 1.2549, "step": 68585 }, { "epoch": 0.92, "learning_rate": 8.121247341226073e-07, "loss": 0.8437, "step": 68590 }, { "epoch": 0.92, "learning_rate": 8.107950673931469e-07, "loss": 1.23, "step": 68595 }, { "epoch": 0.92, "learning_rate": 8.094664721244538e-07, "loss": 0.5612, "step": 68600 }, { "epoch": 0.92, "learning_rate": 8.081389483753726e-07, "loss": 0.8164, "step": 68605 }, { "epoch": 0.92, "learning_rate": 8.068124962047091e-07, "loss": 0.7896, "step": 68610 }, { "epoch": 0.92, "learning_rate": 8.054871156712162e-07, "loss": 0.4428, "step": 68615 }, { "epoch": 0.92, "learning_rate": 8.041628068336026e-07, "loss": 1.1131, "step": 68620 }, { "epoch": 0.92, "learning_rate": 8.028395697505298e-07, "loss": 0.7666, "step": 68625 }, { "epoch": 0.92, "learning_rate": 8.015174044806089e-07, "loss": 0.3986, "step": 68630 }, { "epoch": 0.92, "learning_rate": 8.001963110824046e-07, "loss": 1.0351, "step": 68635 }, { "epoch": 0.92, "learning_rate": 7.988762896144391e-07, "loss": 0.8182, "step": 68640 }, { "epoch": 0.92, "learning_rate": 7.975573401351772e-07, "loss": 0.781, "step": 68645 }, { "epoch": 0.92, "learning_rate": 7.962394627030439e-07, "loss": 0.9023, "step": 68650 }, { "epoch": 0.92, "learning_rate": 7.949226573764151e-07, "loss": 1.4228, "step": 68655 }, { "epoch": 0.92, "learning_rate": 7.93606924213619e-07, "loss": 0.7565, "step": 68660 }, { "epoch": 0.92, "learning_rate": 7.92292263272934e-07, "loss": 0.8076, "step": 68665 }, { "epoch": 0.92, "learning_rate": 7.909786746125997e-07, "loss": 0.6778, "step": 68670 }, { "epoch": 0.92, "learning_rate": 7.896661582907888e-07, "loss": 0.8371, "step": 68675 }, { "epoch": 0.92, "learning_rate": 7.883547143656495e-07, "loss": 1.2264, "step": 68680 }, { "epoch": 0.92, "learning_rate": 7.870443428952712e-07, "loss": 0.3778, "step": 68685 }, { "epoch": 0.92, "learning_rate": 7.857350439376909e-07, "loss": 0.1371, "step": 68690 }, { "epoch": 0.92, "learning_rate": 7.844268175509123e-07, "loss": 0.9044, "step": 68695 }, { "epoch": 0.92, "learning_rate": 7.831196637928778e-07, "loss": 0.6056, "step": 68700 }, { "epoch": 0.92, "learning_rate": 7.818135827214856e-07, "loss": 0.6332, "step": 68705 }, { "epoch": 0.92, "learning_rate": 7.80508574394595e-07, "loss": 0.6639, "step": 68710 }, { "epoch": 0.92, "learning_rate": 7.792046388700098e-07, "loss": 0.358, "step": 68715 }, { "epoch": 0.92, "learning_rate": 7.779017762054835e-07, "loss": 0.8147, "step": 68720 }, { "epoch": 0.92, "learning_rate": 7.765999864587286e-07, "loss": 0.8938, "step": 68725 }, { "epoch": 0.92, "learning_rate": 7.7529926968741e-07, "loss": 0.8443, "step": 68730 }, { "epoch": 0.92, "learning_rate": 7.739996259491428e-07, "loss": 0.7188, "step": 68735 }, { "epoch": 0.92, "learning_rate": 7.72701055301489e-07, "loss": 1.1077, "step": 68740 }, { "epoch": 0.92, "learning_rate": 7.714035578019752e-07, "loss": 0.4214, "step": 68745 }, { "epoch": 0.92, "learning_rate": 7.701071335080745e-07, "loss": 1.0898, "step": 68750 }, { "epoch": 0.92, "learning_rate": 7.688117824772079e-07, "loss": 0.7112, "step": 68755 }, { "epoch": 0.92, "learning_rate": 7.675175047667515e-07, "loss": 1.0201, "step": 68760 }, { "epoch": 0.92, "learning_rate": 7.662243004340402e-07, "loss": 1.0147, "step": 68765 }, { "epoch": 0.92, "learning_rate": 7.64932169536356e-07, "loss": 0.3292, "step": 68770 }, { "epoch": 0.92, "learning_rate": 7.636411121309306e-07, "loss": 0.5528, "step": 68775 }, { "epoch": 0.92, "learning_rate": 7.623511282749573e-07, "loss": 0.7416, "step": 68780 }, { "epoch": 0.92, "learning_rate": 7.610622180255683e-07, "loss": 0.3813, "step": 68785 }, { "epoch": 0.92, "learning_rate": 7.597743814398567e-07, "loss": 0.868, "step": 68790 }, { "epoch": 0.92, "learning_rate": 7.584876185748768e-07, "loss": 1.3247, "step": 68795 }, { "epoch": 0.92, "learning_rate": 7.572019294876137e-07, "loss": 1.4306, "step": 68800 }, { "epoch": 0.92, "learning_rate": 7.559173142350245e-07, "loss": 0.9644, "step": 68805 }, { "epoch": 0.92, "learning_rate": 7.546337728740082e-07, "loss": 0.642, "step": 68810 }, { "epoch": 0.92, "learning_rate": 7.533513054614194e-07, "loss": 0.9564, "step": 68815 }, { "epoch": 0.92, "learning_rate": 7.520699120540681e-07, "loss": 1.0453, "step": 68820 }, { "epoch": 0.92, "learning_rate": 7.507895927087089e-07, "loss": 1.2849, "step": 68825 }, { "epoch": 0.92, "learning_rate": 7.495103474820575e-07, "loss": 1.1265, "step": 68830 }, { "epoch": 0.92, "learning_rate": 7.482321764307714e-07, "loss": 0.4806, "step": 68835 }, { "epoch": 0.92, "learning_rate": 7.469550796114777e-07, "loss": 0.9748, "step": 68840 }, { "epoch": 0.92, "learning_rate": 7.456790570807392e-07, "loss": 0.2818, "step": 68845 }, { "epoch": 0.92, "learning_rate": 7.444041088950749e-07, "loss": 0.7063, "step": 68850 }, { "epoch": 0.92, "learning_rate": 7.431302351109643e-07, "loss": 0.4854, "step": 68855 }, { "epoch": 0.92, "learning_rate": 7.41857435784829e-07, "loss": 0.9004, "step": 68860 }, { "epoch": 0.92, "learning_rate": 7.405857109730519e-07, "loss": 0.6577, "step": 68865 }, { "epoch": 0.92, "learning_rate": 7.393150607319599e-07, "loss": 0.2883, "step": 68870 }, { "epoch": 0.92, "learning_rate": 7.380454851178387e-07, "loss": 0.8259, "step": 68875 }, { "epoch": 0.92, "learning_rate": 7.367769841869238e-07, "loss": 1.1515, "step": 68880 }, { "epoch": 0.92, "learning_rate": 7.355095579954008e-07, "loss": 0.8479, "step": 68885 }, { "epoch": 0.92, "learning_rate": 7.342432065994193e-07, "loss": 0.4194, "step": 68890 }, { "epoch": 0.92, "learning_rate": 7.329779300550621e-07, "loss": 0.5206, "step": 68895 }, { "epoch": 0.92, "learning_rate": 7.317137284183762e-07, "loss": 0.2318, "step": 68900 }, { "epoch": 0.92, "learning_rate": 7.304506017453694e-07, "loss": 0.8593, "step": 68905 }, { "epoch": 0.92, "learning_rate": 7.291885500919749e-07, "loss": 0.6661, "step": 68910 }, { "epoch": 0.92, "learning_rate": 7.279275735141116e-07, "loss": 0.8086, "step": 68915 }, { "epoch": 0.92, "learning_rate": 7.26667672067624e-07, "loss": 1.0691, "step": 68920 }, { "epoch": 0.92, "learning_rate": 7.25408845808323e-07, "loss": 0.8858, "step": 68925 }, { "epoch": 0.92, "learning_rate": 7.241510947919694e-07, "loss": 0.9734, "step": 68930 }, { "epoch": 0.92, "learning_rate": 7.228944190742743e-07, "loss": 0.8407, "step": 68935 }, { "epoch": 0.92, "learning_rate": 7.216388187109013e-07, "loss": 0.7906, "step": 68940 }, { "epoch": 0.92, "learning_rate": 7.203842937574645e-07, "loss": 0.7121, "step": 68945 }, { "epoch": 0.92, "learning_rate": 7.191308442695416e-07, "loss": 0.6866, "step": 68950 }, { "epoch": 0.92, "learning_rate": 7.178784703026464e-07, "loss": 0.6123, "step": 68955 }, { "epoch": 0.92, "learning_rate": 7.166271719122541e-07, "loss": 0.6596, "step": 68960 }, { "epoch": 0.92, "learning_rate": 7.153769491537926e-07, "loss": 0.8821, "step": 68965 }, { "epoch": 0.92, "learning_rate": 7.141278020826425e-07, "loss": 1.0584, "step": 68970 }, { "epoch": 0.92, "learning_rate": 7.128797307541318e-07, "loss": 0.7685, "step": 68975 }, { "epoch": 0.92, "learning_rate": 7.116327352235414e-07, "loss": 0.5987, "step": 68980 }, { "epoch": 0.92, "learning_rate": 7.10386815546113e-07, "loss": 1.0473, "step": 68985 }, { "epoch": 0.92, "learning_rate": 7.091419717770331e-07, "loss": 0.6245, "step": 68990 }, { "epoch": 0.92, "learning_rate": 7.078982039714355e-07, "loss": 0.5269, "step": 68995 }, { "epoch": 0.92, "learning_rate": 7.066555121844231e-07, "loss": 0.7197, "step": 69000 }, { "epoch": 0.92, "learning_rate": 7.054138964710328e-07, "loss": 0.3534, "step": 69005 }, { "epoch": 0.92, "learning_rate": 7.041733568862619e-07, "loss": 0.5574, "step": 69010 }, { "epoch": 0.92, "learning_rate": 7.029338934850693e-07, "loss": 1.1039, "step": 69015 }, { "epoch": 0.92, "learning_rate": 7.016955063223474e-07, "loss": 0.7451, "step": 69020 }, { "epoch": 0.92, "learning_rate": 7.004581954529549e-07, "loss": 0.3367, "step": 69025 }, { "epoch": 0.92, "learning_rate": 6.99221960931698e-07, "loss": 0.7088, "step": 69030 }, { "epoch": 0.92, "learning_rate": 6.979868028133329e-07, "loss": 1.2708, "step": 69035 }, { "epoch": 0.93, "learning_rate": 6.967527211525743e-07, "loss": 0.5973, "step": 69040 }, { "epoch": 0.93, "learning_rate": 6.955197160040866e-07, "loss": 0.7396, "step": 69045 }, { "epoch": 0.93, "learning_rate": 6.942877874224846e-07, "loss": 0.7926, "step": 69050 }, { "epoch": 0.93, "learning_rate": 6.930569354623329e-07, "loss": 0.2491, "step": 69055 }, { "epoch": 0.93, "learning_rate": 6.918271601781573e-07, "loss": 1.0487, "step": 69060 }, { "epoch": 0.93, "learning_rate": 6.905984616244282e-07, "loss": 0.5267, "step": 69065 }, { "epoch": 0.93, "learning_rate": 6.893708398555687e-07, "loss": 0.5122, "step": 69070 }, { "epoch": 0.93, "learning_rate": 6.881442949259603e-07, "loss": 0.5035, "step": 69075 }, { "epoch": 0.93, "learning_rate": 6.869188268899318e-07, "loss": 0.6726, "step": 69080 }, { "epoch": 0.93, "learning_rate": 6.856944358017647e-07, "loss": 1.0611, "step": 69085 }, { "epoch": 0.93, "learning_rate": 6.844711217156935e-07, "loss": 0.4646, "step": 69090 }, { "epoch": 0.93, "learning_rate": 6.832488846859053e-07, "loss": 0.6914, "step": 69095 }, { "epoch": 0.93, "learning_rate": 6.820277247665375e-07, "loss": 0.5342, "step": 69100 }, { "epoch": 0.93, "learning_rate": 6.808076420116799e-07, "loss": 1.2433, "step": 69105 }, { "epoch": 0.93, "learning_rate": 6.795886364753867e-07, "loss": 0.4191, "step": 69110 }, { "epoch": 0.93, "learning_rate": 6.78370708211637e-07, "loss": 0.3531, "step": 69115 }, { "epoch": 0.93, "learning_rate": 6.771538572743901e-07, "loss": 0.6433, "step": 69120 }, { "epoch": 0.93, "learning_rate": 6.759380837175506e-07, "loss": 0.5214, "step": 69125 }, { "epoch": 0.93, "learning_rate": 6.747233875949554e-07, "loss": 0.427, "step": 69130 }, { "epoch": 0.93, "learning_rate": 6.735097689604231e-07, "loss": 0.5458, "step": 69135 }, { "epoch": 0.93, "learning_rate": 6.722972278677075e-07, "loss": 0.3776, "step": 69140 }, { "epoch": 0.93, "learning_rate": 6.710857643705132e-07, "loss": 0.2328, "step": 69145 }, { "epoch": 0.93, "learning_rate": 6.698753785225081e-07, "loss": 0.5864, "step": 69150 }, { "epoch": 0.93, "learning_rate": 6.686660703773051e-07, "loss": 0.274, "step": 69155 }, { "epoch": 0.93, "learning_rate": 6.674578399884668e-07, "loss": 0.9121, "step": 69160 }, { "epoch": 0.93, "learning_rate": 6.662506874095142e-07, "loss": 1.1003, "step": 69165 }, { "epoch": 0.93, "learning_rate": 6.650446126939214e-07, "loss": 1.0249, "step": 69170 }, { "epoch": 0.93, "learning_rate": 6.638396158951065e-07, "loss": 0.4112, "step": 69175 }, { "epoch": 0.93, "learning_rate": 6.626356970664438e-07, "loss": 0.6218, "step": 69180 }, { "epoch": 0.93, "learning_rate": 6.614328562612682e-07, "loss": 0.3209, "step": 69185 }, { "epoch": 0.93, "learning_rate": 6.602310935328537e-07, "loss": 0.7953, "step": 69190 }, { "epoch": 0.93, "learning_rate": 6.590304089344329e-07, "loss": 0.3901, "step": 69195 }, { "epoch": 0.93, "learning_rate": 6.57830802519191e-07, "loss": 0.6954, "step": 69200 }, { "epoch": 0.93, "learning_rate": 6.566322743402659e-07, "loss": 0.796, "step": 69205 }, { "epoch": 0.93, "learning_rate": 6.55434824450743e-07, "loss": 0.7055, "step": 69210 }, { "epoch": 0.93, "learning_rate": 6.542384529036633e-07, "loss": 0.3716, "step": 69215 }, { "epoch": 0.93, "learning_rate": 6.530431597520259e-07, "loss": 0.7479, "step": 69220 }, { "epoch": 0.93, "learning_rate": 6.518489450487747e-07, "loss": 0.2329, "step": 69225 }, { "epoch": 0.93, "learning_rate": 6.506558088468006e-07, "loss": 0.3817, "step": 69230 }, { "epoch": 0.93, "learning_rate": 6.494637511989616e-07, "loss": 0.4649, "step": 69235 }, { "epoch": 0.93, "learning_rate": 6.482727721580539e-07, "loss": 0.8109, "step": 69240 }, { "epoch": 0.93, "learning_rate": 6.470828717768357e-07, "loss": 0.7292, "step": 69245 }, { "epoch": 0.93, "learning_rate": 6.458940501080119e-07, "loss": 0.7855, "step": 69250 }, { "epoch": 0.93, "learning_rate": 6.447063072042403e-07, "loss": 0.1862, "step": 69255 }, { "epoch": 0.93, "learning_rate": 6.435196431181372e-07, "loss": 0.8531, "step": 69260 }, { "epoch": 0.93, "learning_rate": 6.423340579022607e-07, "loss": 1.0532, "step": 69265 }, { "epoch": 0.93, "learning_rate": 6.411495516091298e-07, "loss": 1.0482, "step": 69270 }, { "epoch": 0.93, "learning_rate": 6.399661242912053e-07, "loss": 0.5849, "step": 69275 }, { "epoch": 0.93, "learning_rate": 6.387837760009146e-07, "loss": 1.0607, "step": 69280 }, { "epoch": 0.93, "learning_rate": 6.376025067906299e-07, "loss": 0.426, "step": 69285 }, { "epoch": 0.93, "learning_rate": 6.364223167126676e-07, "loss": 1.3662, "step": 69290 }, { "epoch": 0.93, "learning_rate": 6.352432058193136e-07, "loss": 0.6523, "step": 69295 }, { "epoch": 0.93, "learning_rate": 6.340651741627928e-07, "loss": 0.3372, "step": 69300 }, { "epoch": 0.93, "learning_rate": 6.328882217952859e-07, "loss": 0.9607, "step": 69305 }, { "epoch": 0.93, "learning_rate": 6.317123487689231e-07, "loss": 0.744, "step": 69310 }, { "epoch": 0.93, "learning_rate": 6.305375551357934e-07, "loss": 0.6451, "step": 69315 }, { "epoch": 0.93, "learning_rate": 6.293638409479357e-07, "loss": 0.9004, "step": 69320 }, { "epoch": 0.93, "learning_rate": 6.281912062573336e-07, "loss": 0.918, "step": 69325 }, { "epoch": 0.93, "learning_rate": 6.270196511159371e-07, "loss": 0.1303, "step": 69330 }, { "epoch": 0.93, "learning_rate": 6.258491755756323e-07, "loss": 0.6838, "step": 69335 }, { "epoch": 0.93, "learning_rate": 6.246797796882697e-07, "loss": 0.5288, "step": 69340 }, { "epoch": 0.93, "learning_rate": 6.235114635056494e-07, "loss": 0.5502, "step": 69345 }, { "epoch": 0.93, "learning_rate": 6.22344227079516e-07, "loss": 0.577, "step": 69350 }, { "epoch": 0.93, "learning_rate": 6.211780704615783e-07, "loss": 0.4308, "step": 69355 }, { "epoch": 0.93, "learning_rate": 6.200129937034894e-07, "loss": 0.6975, "step": 69360 }, { "epoch": 0.93, "learning_rate": 6.188489968568523e-07, "loss": 0.8672, "step": 69365 }, { "epoch": 0.93, "learning_rate": 6.176860799732315e-07, "loss": 1.1394, "step": 69370 }, { "epoch": 0.93, "learning_rate": 6.165242431041385e-07, "loss": 0.9219, "step": 69375 }, { "epoch": 0.93, "learning_rate": 6.153634863010321e-07, "loss": 0.8631, "step": 69380 }, { "epoch": 0.93, "learning_rate": 6.142038096153297e-07, "loss": 0.4271, "step": 69385 }, { "epoch": 0.93, "learning_rate": 6.130452130984038e-07, "loss": 0.505, "step": 69390 }, { "epoch": 0.93, "learning_rate": 6.11887696801569e-07, "loss": 1.2771, "step": 69395 }, { "epoch": 0.93, "learning_rate": 6.107312607760984e-07, "loss": 1.0266, "step": 69400 }, { "epoch": 0.93, "learning_rate": 6.095759050732175e-07, "loss": 0.8553, "step": 69405 }, { "epoch": 0.93, "learning_rate": 6.084216297441048e-07, "loss": 0.3993, "step": 69410 }, { "epoch": 0.93, "learning_rate": 6.07268434839886e-07, "loss": 1.1902, "step": 69415 }, { "epoch": 0.93, "learning_rate": 6.061163204116399e-07, "loss": 0.4531, "step": 69420 }, { "epoch": 0.93, "learning_rate": 6.049652865104033e-07, "loss": 1.2366, "step": 69425 }, { "epoch": 0.93, "learning_rate": 6.038153331871632e-07, "loss": 0.7418, "step": 69430 }, { "epoch": 0.93, "learning_rate": 6.026664604928484e-07, "loss": 0.5298, "step": 69435 }, { "epoch": 0.93, "learning_rate": 6.015186684783569e-07, "loss": 0.8719, "step": 69440 }, { "epoch": 0.93, "learning_rate": 6.00371957194526e-07, "loss": 0.831, "step": 69445 }, { "epoch": 0.93, "learning_rate": 5.992263266921455e-07, "loss": 0.7081, "step": 69450 }, { "epoch": 0.93, "learning_rate": 5.980817770219749e-07, "loss": 0.4348, "step": 69455 }, { "epoch": 0.93, "learning_rate": 5.96938308234693e-07, "loss": 0.4826, "step": 69460 }, { "epoch": 0.93, "learning_rate": 5.957959203809649e-07, "loss": 0.2672, "step": 69465 }, { "epoch": 0.93, "learning_rate": 5.946546135113862e-07, "loss": 0.6938, "step": 69470 }, { "epoch": 0.93, "learning_rate": 5.935143876765109e-07, "loss": 0.6979, "step": 69475 }, { "epoch": 0.93, "learning_rate": 5.923752429268487e-07, "loss": 0.6362, "step": 69480 }, { "epoch": 0.93, "learning_rate": 5.912371793128534e-07, "loss": 1.1273, "step": 69485 }, { "epoch": 0.93, "learning_rate": 5.901001968849407e-07, "loss": 1.084, "step": 69490 }, { "epoch": 0.93, "learning_rate": 5.889642956934644e-07, "loss": 0.4541, "step": 69495 }, { "epoch": 0.93, "learning_rate": 5.878294757887509e-07, "loss": 0.4277, "step": 69500 }, { "epoch": 0.93, "learning_rate": 5.866957372210602e-07, "loss": 0.5878, "step": 69505 }, { "epoch": 0.93, "learning_rate": 5.855630800406103e-07, "loss": 0.9804, "step": 69510 }, { "epoch": 0.93, "learning_rate": 5.844315042975751e-07, "loss": 0.5175, "step": 69515 }, { "epoch": 0.93, "learning_rate": 5.833010100420782e-07, "loss": 0.7083, "step": 69520 }, { "epoch": 0.93, "learning_rate": 5.821715973241965e-07, "loss": 0.5782, "step": 69525 }, { "epoch": 0.93, "learning_rate": 5.81043266193948e-07, "loss": 0.678, "step": 69530 }, { "epoch": 0.93, "learning_rate": 5.799160167013235e-07, "loss": 0.7292, "step": 69535 }, { "epoch": 0.93, "learning_rate": 5.787898488962467e-07, "loss": 0.5446, "step": 69540 }, { "epoch": 0.93, "learning_rate": 5.776647628286058e-07, "loss": 1.0214, "step": 69545 }, { "epoch": 0.93, "learning_rate": 5.76540758548233e-07, "loss": 0.5848, "step": 69550 }, { "epoch": 0.93, "learning_rate": 5.754178361049217e-07, "loss": 0.6309, "step": 69555 }, { "epoch": 0.93, "learning_rate": 5.742959955484018e-07, "loss": 0.4472, "step": 69560 }, { "epoch": 0.93, "learning_rate": 5.731752369283777e-07, "loss": 0.416, "step": 69565 }, { "epoch": 0.93, "learning_rate": 5.720555602944849e-07, "loss": 0.0861, "step": 69570 }, { "epoch": 0.93, "learning_rate": 5.709369656963198e-07, "loss": 0.4267, "step": 69575 }, { "epoch": 0.93, "learning_rate": 5.698194531834344e-07, "loss": 0.6233, "step": 69580 }, { "epoch": 0.93, "learning_rate": 5.687030228053253e-07, "loss": 1.3552, "step": 69585 }, { "epoch": 0.93, "learning_rate": 5.675876746114472e-07, "loss": 0.3551, "step": 69590 }, { "epoch": 0.93, "learning_rate": 5.664734086512053e-07, "loss": 0.7224, "step": 69595 }, { "epoch": 0.93, "learning_rate": 5.653602249739515e-07, "loss": 0.8694, "step": 69600 }, { "epoch": 0.93, "learning_rate": 5.642481236289965e-07, "loss": 0.4278, "step": 69605 }, { "epoch": 0.93, "learning_rate": 5.631371046656037e-07, "loss": 0.5715, "step": 69610 }, { "epoch": 0.93, "learning_rate": 5.620271681329836e-07, "loss": 0.7959, "step": 69615 }, { "epoch": 0.93, "learning_rate": 5.609183140802998e-07, "loss": 0.7364, "step": 69620 }, { "epoch": 0.93, "learning_rate": 5.598105425566685e-07, "loss": 0.7473, "step": 69625 }, { "epoch": 0.93, "learning_rate": 5.587038536111616e-07, "loss": 0.3855, "step": 69630 }, { "epoch": 0.93, "learning_rate": 5.575982472927982e-07, "loss": 0.97, "step": 69635 }, { "epoch": 0.93, "learning_rate": 5.564937236505502e-07, "loss": 0.5328, "step": 69640 }, { "epoch": 0.93, "learning_rate": 5.553902827333424e-07, "loss": 0.1027, "step": 69645 }, { "epoch": 0.93, "learning_rate": 5.542879245900551e-07, "loss": 0.415, "step": 69650 }, { "epoch": 0.93, "learning_rate": 5.531866492695103e-07, "loss": 0.4936, "step": 69655 }, { "epoch": 0.93, "learning_rate": 5.52086456820497e-07, "loss": 0.1829, "step": 69660 }, { "epoch": 0.93, "learning_rate": 5.509873472917427e-07, "loss": 0.7823, "step": 69665 }, { "epoch": 0.93, "learning_rate": 5.498893207319334e-07, "loss": 0.6553, "step": 69670 }, { "epoch": 0.93, "learning_rate": 5.487923771897136e-07, "loss": 0.7529, "step": 69675 }, { "epoch": 0.93, "learning_rate": 5.476965167136583e-07, "loss": 0.2861, "step": 69680 }, { "epoch": 0.93, "learning_rate": 5.466017393523204e-07, "loss": 0.5667, "step": 69685 }, { "epoch": 0.93, "learning_rate": 5.455080451541889e-07, "loss": 0.7013, "step": 69690 }, { "epoch": 0.93, "learning_rate": 5.444154341677054e-07, "loss": 1.3547, "step": 69695 }, { "epoch": 0.93, "learning_rate": 5.43323906441276e-07, "loss": 0.5471, "step": 69700 }, { "epoch": 0.93, "learning_rate": 5.422334620232422e-07, "loss": 0.5858, "step": 69705 }, { "epoch": 0.93, "learning_rate": 5.411441009619072e-07, "loss": 0.2579, "step": 69710 }, { "epoch": 0.93, "learning_rate": 5.400558233055242e-07, "loss": 0.9664, "step": 69715 }, { "epoch": 0.93, "learning_rate": 5.389686291022989e-07, "loss": 0.4366, "step": 69720 }, { "epoch": 0.93, "learning_rate": 5.378825184003899e-07, "loss": 0.719, "step": 69725 }, { "epoch": 0.93, "learning_rate": 5.367974912479035e-07, "loss": 0.3836, "step": 69730 }, { "epoch": 0.93, "learning_rate": 5.357135476929065e-07, "loss": 1.1332, "step": 69735 }, { "epoch": 0.93, "learning_rate": 5.346306877834051e-07, "loss": 0.9681, "step": 69740 }, { "epoch": 0.93, "learning_rate": 5.335489115673664e-07, "loss": 0.3873, "step": 69745 }, { "epoch": 0.93, "learning_rate": 5.324682190927105e-07, "loss": 1.056, "step": 69750 }, { "epoch": 0.93, "learning_rate": 5.313886104073073e-07, "loss": 0.4044, "step": 69755 }, { "epoch": 0.93, "learning_rate": 5.303100855589771e-07, "loss": 0.4191, "step": 69760 }, { "epoch": 0.93, "learning_rate": 5.29232644595487e-07, "loss": 0.9072, "step": 69765 }, { "epoch": 0.93, "learning_rate": 5.281562875645713e-07, "loss": 1.4011, "step": 69770 }, { "epoch": 0.93, "learning_rate": 5.270810145139027e-07, "loss": 0.9652, "step": 69775 }, { "epoch": 0.93, "learning_rate": 5.260068254911072e-07, "loss": 0.4163, "step": 69780 }, { "epoch": 0.94, "learning_rate": 5.249337205437771e-07, "loss": 0.4508, "step": 69785 }, { "epoch": 0.94, "learning_rate": 5.238616997194329e-07, "loss": 0.5515, "step": 69790 }, { "epoch": 0.94, "learning_rate": 5.227907630655671e-07, "loss": 0.14, "step": 69795 }, { "epoch": 0.94, "learning_rate": 5.217209106296139e-07, "loss": 0.6276, "step": 69800 }, { "epoch": 0.94, "learning_rate": 5.206521424589605e-07, "loss": 0.8483, "step": 69805 }, { "epoch": 0.94, "learning_rate": 5.195844586009552e-07, "loss": 0.9573, "step": 69810 }, { "epoch": 0.94, "learning_rate": 5.185178591028878e-07, "loss": 1.2876, "step": 69815 }, { "epoch": 0.94, "learning_rate": 5.174523440119983e-07, "loss": 1.2957, "step": 69820 }, { "epoch": 0.94, "learning_rate": 5.163879133754878e-07, "loss": 0.8817, "step": 69825 }, { "epoch": 0.94, "learning_rate": 5.153245672405077e-07, "loss": 0.1719, "step": 69830 }, { "epoch": 0.94, "learning_rate": 5.142623056541562e-07, "loss": 0.7303, "step": 69835 }, { "epoch": 0.94, "learning_rate": 5.132011286634847e-07, "loss": 0.2937, "step": 69840 }, { "epoch": 0.94, "learning_rate": 5.121410363155027e-07, "loss": 0.5686, "step": 69845 }, { "epoch": 0.94, "learning_rate": 5.110820286571589e-07, "loss": 0.6546, "step": 69850 }, { "epoch": 0.94, "learning_rate": 5.100241057353682e-07, "loss": 0.4448, "step": 69855 }, { "epoch": 0.94, "learning_rate": 5.089672675969909e-07, "loss": 0.523, "step": 69860 }, { "epoch": 0.94, "learning_rate": 5.079115142888391e-07, "loss": 0.5088, "step": 69865 }, { "epoch": 0.94, "learning_rate": 5.068568458576784e-07, "loss": 0.802, "step": 69870 }, { "epoch": 0.94, "learning_rate": 5.058032623502212e-07, "loss": 0.8615, "step": 69875 }, { "epoch": 0.94, "learning_rate": 5.047507638131416e-07, "loss": 0.4094, "step": 69880 }, { "epoch": 0.94, "learning_rate": 5.036993502930576e-07, "loss": 0.5743, "step": 69885 }, { "epoch": 0.94, "learning_rate": 5.026490218365376e-07, "loss": 1.1848, "step": 69890 }, { "epoch": 0.94, "learning_rate": 5.015997784901166e-07, "loss": 0.7551, "step": 69895 }, { "epoch": 0.94, "learning_rate": 5.005516203002575e-07, "loss": 0.9776, "step": 69900 }, { "epoch": 0.94, "learning_rate": 4.995045473133952e-07, "loss": 0.6085, "step": 69905 }, { "epoch": 0.94, "learning_rate": 4.984585595759123e-07, "loss": 1.2401, "step": 69910 }, { "epoch": 0.94, "learning_rate": 4.974136571341354e-07, "loss": 0.7834, "step": 69915 }, { "epoch": 0.94, "learning_rate": 4.963698400343497e-07, "loss": 0.9445, "step": 69920 }, { "epoch": 0.94, "learning_rate": 4.953271083227961e-07, "loss": 0.5482, "step": 69925 }, { "epoch": 0.94, "learning_rate": 4.942854620456572e-07, "loss": 0.7118, "step": 69930 }, { "epoch": 0.94, "learning_rate": 4.932449012490708e-07, "loss": 0.9882, "step": 69935 }, { "epoch": 0.94, "learning_rate": 4.922054259791364e-07, "loss": 0.1789, "step": 69940 }, { "epoch": 0.94, "learning_rate": 4.913746273733145e-07, "loss": 0.9439, "step": 69945 }, { "epoch": 0.94, "learning_rate": 4.903371061673434e-07, "loss": 1.0816, "step": 69950 }, { "epoch": 0.94, "learning_rate": 4.893006706168185e-07, "loss": 0.2032, "step": 69955 }, { "epoch": 0.94, "learning_rate": 4.882653207676502e-07, "loss": 1.0834, "step": 69960 }, { "epoch": 0.94, "learning_rate": 4.87231056665699e-07, "loss": 1.0897, "step": 69965 }, { "epoch": 0.94, "learning_rate": 4.861978783567784e-07, "loss": 0.5987, "step": 69970 }, { "epoch": 0.94, "learning_rate": 4.851657858866543e-07, "loss": 0.5147, "step": 69975 }, { "epoch": 0.94, "learning_rate": 4.841347793010404e-07, "loss": 0.8348, "step": 69980 }, { "epoch": 0.94, "learning_rate": 4.831048586456111e-07, "loss": 0.8095, "step": 69985 }, { "epoch": 0.94, "learning_rate": 4.820760239659799e-07, "loss": 0.4933, "step": 69990 }, { "epoch": 0.94, "learning_rate": 4.810482753077189e-07, "loss": 0.0952, "step": 69995 }, { "epoch": 0.94, "learning_rate": 4.80021612716361e-07, "loss": 1.1144, "step": 70000 }, { "epoch": 0.94, "learning_rate": 4.789960362373697e-07, "loss": 0.5696, "step": 70005 }, { "epoch": 0.94, "learning_rate": 4.779715459161809e-07, "loss": 0.3091, "step": 70010 }, { "epoch": 0.94, "learning_rate": 4.769481417981725e-07, "loss": 0.641, "step": 70015 }, { "epoch": 0.94, "learning_rate": 4.7592582392867733e-07, "loss": 0.9131, "step": 70020 }, { "epoch": 0.94, "learning_rate": 4.749045923529816e-07, "loss": 0.5182, "step": 70025 }, { "epoch": 0.94, "learning_rate": 4.738844471163101e-07, "loss": 0.5901, "step": 70030 }, { "epoch": 0.94, "learning_rate": 4.728653882638656e-07, "loss": 0.6785, "step": 70035 }, { "epoch": 0.94, "learning_rate": 4.718474158407732e-07, "loss": 0.8926, "step": 70040 }, { "epoch": 0.94, "learning_rate": 4.7083052989213004e-07, "loss": 0.8252, "step": 70045 }, { "epoch": 0.94, "learning_rate": 4.6981473046298075e-07, "loss": 0.5938, "step": 70050 }, { "epoch": 0.94, "learning_rate": 4.6880001759831705e-07, "loss": 1.0875, "step": 70055 }, { "epoch": 0.94, "learning_rate": 4.677863913430863e-07, "loss": 0.3038, "step": 70060 }, { "epoch": 0.94, "learning_rate": 4.667738517421888e-07, "loss": 0.2619, "step": 70065 }, { "epoch": 0.94, "learning_rate": 4.6576239884047466e-07, "loss": 0.2054, "step": 70070 }, { "epoch": 0.94, "learning_rate": 4.647520326827443e-07, "loss": 0.3114, "step": 70075 }, { "epoch": 0.94, "learning_rate": 4.637427533137506e-07, "loss": 1.7242, "step": 70080 }, { "epoch": 0.94, "learning_rate": 4.627345607782052e-07, "loss": 0.9555, "step": 70085 }, { "epoch": 0.94, "learning_rate": 4.617274551207612e-07, "loss": 0.7094, "step": 70090 }, { "epoch": 0.94, "learning_rate": 4.6072143638603016e-07, "loss": 0.8832, "step": 70095 }, { "epoch": 0.94, "learning_rate": 4.597165046185736e-07, "loss": 0.4809, "step": 70100 }, { "epoch": 0.94, "learning_rate": 4.5871265986290324e-07, "loss": 1.7173, "step": 70105 }, { "epoch": 0.94, "learning_rate": 4.5770990216348895e-07, "loss": 0.8144, "step": 70110 }, { "epoch": 0.94, "learning_rate": 4.567082315647425e-07, "loss": 1.1065, "step": 70115 }, { "epoch": 0.94, "learning_rate": 4.5570764811103674e-07, "loss": 0.4374, "step": 70120 }, { "epoch": 0.94, "learning_rate": 4.5470815184668613e-07, "loss": 0.596, "step": 70125 }, { "epoch": 0.94, "learning_rate": 4.5370974281597476e-07, "loss": 0.8177, "step": 70130 }, { "epoch": 0.94, "learning_rate": 4.5271242106311727e-07, "loss": 0.4632, "step": 70135 }, { "epoch": 0.94, "learning_rate": 4.517161866322922e-07, "loss": 0.9783, "step": 70140 }, { "epoch": 0.94, "learning_rate": 4.507210395676337e-07, "loss": 0.4681, "step": 70145 }, { "epoch": 0.94, "learning_rate": 4.49726979913212e-07, "loss": 0.7898, "step": 70150 }, { "epoch": 0.94, "learning_rate": 4.4873400771306415e-07, "loss": 0.4335, "step": 70155 }, { "epoch": 0.94, "learning_rate": 4.477421230111772e-07, "loss": 0.2798, "step": 70160 }, { "epoch": 0.94, "learning_rate": 4.4675132585147716e-07, "loss": 0.8303, "step": 70165 }, { "epoch": 0.94, "learning_rate": 4.4576161627786215e-07, "loss": 0.7966, "step": 70170 }, { "epoch": 0.94, "learning_rate": 4.4477299433416666e-07, "loss": 0.594, "step": 70175 }, { "epoch": 0.94, "learning_rate": 4.4378546006418056e-07, "loss": 1.7349, "step": 70180 }, { "epoch": 0.94, "learning_rate": 4.4279901351164664e-07, "loss": 0.5679, "step": 70185 }, { "epoch": 0.94, "learning_rate": 4.418136547202606e-07, "loss": 0.7358, "step": 70190 }, { "epoch": 0.94, "learning_rate": 4.4082938373367077e-07, "loss": 0.5993, "step": 70195 }, { "epoch": 0.94, "learning_rate": 4.398462005954729e-07, "loss": 0.6016, "step": 70200 }, { "epoch": 0.94, "learning_rate": 4.388641053492154e-07, "loss": 0.9069, "step": 70205 }, { "epoch": 0.94, "learning_rate": 4.3788309803840523e-07, "loss": 0.2422, "step": 70210 }, { "epoch": 0.94, "learning_rate": 4.3690317870649365e-07, "loss": 0.7753, "step": 70215 }, { "epoch": 0.94, "learning_rate": 4.359243473968877e-07, "loss": 0.4075, "step": 70220 }, { "epoch": 0.94, "learning_rate": 4.3494660415293876e-07, "loss": 0.94, "step": 70225 }, { "epoch": 0.94, "learning_rate": 4.3396994901796217e-07, "loss": 0.8421, "step": 70230 }, { "epoch": 0.94, "learning_rate": 4.3299438203521505e-07, "loss": 0.5714, "step": 70235 }, { "epoch": 0.94, "learning_rate": 4.3201990324791277e-07, "loss": 0.2796, "step": 70240 }, { "epoch": 0.94, "learning_rate": 4.310465126992208e-07, "loss": 0.685, "step": 70245 }, { "epoch": 0.94, "learning_rate": 4.300742104322492e-07, "loss": 1.0253, "step": 70250 }, { "epoch": 0.94, "learning_rate": 4.2910299649007724e-07, "loss": 0.2928, "step": 70255 }, { "epoch": 0.94, "learning_rate": 4.2813287091571233e-07, "loss": 0.3667, "step": 70260 }, { "epoch": 0.94, "learning_rate": 4.271638337521366e-07, "loss": 0.1907, "step": 70265 }, { "epoch": 0.94, "learning_rate": 4.2619588504226593e-07, "loss": 1.0314, "step": 70270 }, { "epoch": 0.94, "learning_rate": 4.2522902482897977e-07, "loss": 0.7124, "step": 70275 }, { "epoch": 0.94, "learning_rate": 4.24263253155105e-07, "loss": 0.4608, "step": 70280 }, { "epoch": 0.94, "learning_rate": 4.2329857006341845e-07, "loss": 1.0634, "step": 70285 }, { "epoch": 0.94, "learning_rate": 4.223349755966527e-07, "loss": 0.6342, "step": 70290 }, { "epoch": 0.94, "learning_rate": 4.213724697974875e-07, "loss": 0.1689, "step": 70295 }, { "epoch": 0.94, "learning_rate": 4.2041105270856084e-07, "loss": 0.6319, "step": 70300 }, { "epoch": 0.94, "learning_rate": 4.1945072437245547e-07, "loss": 0.5079, "step": 70305 }, { "epoch": 0.94, "learning_rate": 4.184914848317095e-07, "loss": 1.4149, "step": 70310 }, { "epoch": 0.94, "learning_rate": 4.17533334128814e-07, "loss": 0.5025, "step": 70315 }, { "epoch": 0.94, "learning_rate": 4.1657627230621275e-07, "loss": 0.9314, "step": 70320 }, { "epoch": 0.94, "learning_rate": 4.156202994062913e-07, "loss": 0.3847, "step": 70325 }, { "epoch": 0.94, "learning_rate": 4.1466541547140193e-07, "loss": 0.4126, "step": 70330 }, { "epoch": 0.94, "learning_rate": 4.137116205438357e-07, "loss": 0.7704, "step": 70335 }, { "epoch": 0.94, "learning_rate": 4.1275891466584506e-07, "loss": 1.136, "step": 70340 }, { "epoch": 0.94, "learning_rate": 4.118072978796267e-07, "loss": 0.5497, "step": 70345 }, { "epoch": 0.94, "learning_rate": 4.108567702273358e-07, "loss": 1.1674, "step": 70350 }, { "epoch": 0.94, "learning_rate": 4.0990733175107486e-07, "loss": 1.1934, "step": 70355 }, { "epoch": 0.94, "learning_rate": 4.0895898249289635e-07, "loss": 0.4976, "step": 70360 }, { "epoch": 0.94, "learning_rate": 4.080117224948138e-07, "loss": 0.7156, "step": 70365 }, { "epoch": 0.94, "learning_rate": 4.07065551798777e-07, "loss": 0.5425, "step": 70370 }, { "epoch": 0.94, "learning_rate": 4.061204704467053e-07, "loss": 0.2296, "step": 70375 }, { "epoch": 0.94, "learning_rate": 4.051764784804568e-07, "loss": 0.5789, "step": 70380 }, { "epoch": 0.94, "learning_rate": 4.042335759418453e-07, "loss": 1.0623, "step": 70385 }, { "epoch": 0.94, "learning_rate": 4.0329176287263737e-07, "loss": 0.7101, "step": 70390 }, { "epoch": 0.94, "learning_rate": 4.023510393145524e-07, "loss": 1.3739, "step": 70395 }, { "epoch": 0.94, "learning_rate": 4.0141140530925714e-07, "loss": 0.7288, "step": 70400 }, { "epoch": 0.94, "learning_rate": 4.0047286089837377e-07, "loss": 0.4731, "step": 70405 }, { "epoch": 0.94, "learning_rate": 3.9953540612347464e-07, "loss": 0.4489, "step": 70410 }, { "epoch": 0.94, "learning_rate": 3.985990410260876e-07, "loss": 0.5024, "step": 70415 }, { "epoch": 0.94, "learning_rate": 3.976637656476823e-07, "loss": 0.671, "step": 70420 }, { "epoch": 0.94, "learning_rate": 3.967295800296922e-07, "loss": 0.7698, "step": 70425 }, { "epoch": 0.94, "learning_rate": 3.9579648421349533e-07, "loss": 1.0017, "step": 70430 }, { "epoch": 0.94, "learning_rate": 3.948644782404226e-07, "loss": 0.2289, "step": 70435 }, { "epoch": 0.94, "learning_rate": 3.9393356215176034e-07, "loss": 0.7128, "step": 70440 }, { "epoch": 0.94, "learning_rate": 3.9300373598873953e-07, "loss": 0.2389, "step": 70445 }, { "epoch": 0.94, "learning_rate": 3.9207499979254937e-07, "loss": 0.5632, "step": 70450 }, { "epoch": 0.94, "learning_rate": 3.9114735360432364e-07, "loss": 0.8056, "step": 70455 }, { "epoch": 0.94, "learning_rate": 3.902207974651573e-07, "loss": 0.7387, "step": 70460 }, { "epoch": 0.94, "learning_rate": 3.892953314160924e-07, "loss": 0.2655, "step": 70465 }, { "epoch": 0.94, "learning_rate": 3.8837095549811853e-07, "loss": 0.4344, "step": 70470 }, { "epoch": 0.94, "learning_rate": 3.8744766975218893e-07, "loss": 0.7718, "step": 70475 }, { "epoch": 0.94, "learning_rate": 3.865254742191876e-07, "loss": 0.4918, "step": 70480 }, { "epoch": 0.94, "learning_rate": 3.8560436893997356e-07, "loss": 1.0628, "step": 70485 }, { "epoch": 0.94, "learning_rate": 3.8468435395534463e-07, "loss": 0.6895, "step": 70490 }, { "epoch": 0.94, "learning_rate": 3.8376542930605163e-07, "loss": 0.3278, "step": 70495 }, { "epoch": 0.94, "learning_rate": 3.828475950327981e-07, "loss": 0.5177, "step": 70500 }, { "epoch": 0.94, "learning_rate": 3.8193085117624315e-07, "loss": 1.5329, "step": 70505 }, { "epoch": 0.94, "learning_rate": 3.8101519777698766e-07, "loss": 0.5732, "step": 70510 }, { "epoch": 0.94, "learning_rate": 3.801006348755964e-07, "loss": 0.2061, "step": 70515 }, { "epoch": 0.94, "learning_rate": 3.791871625125759e-07, "loss": 0.4831, "step": 70520 }, { "epoch": 0.94, "learning_rate": 3.7827478072839094e-07, "loss": 0.4962, "step": 70525 }, { "epoch": 0.94, "learning_rate": 3.7736348956345366e-07, "loss": 0.5966, "step": 70530 }, { "epoch": 0.95, "learning_rate": 3.764532890581318e-07, "loss": 0.9226, "step": 70535 }, { "epoch": 0.95, "learning_rate": 3.7554417925274034e-07, "loss": 0.6453, "step": 70540 }, { "epoch": 0.95, "learning_rate": 3.746361601875498e-07, "loss": 1.0276, "step": 70545 }, { "epoch": 0.95, "learning_rate": 3.737292319027835e-07, "loss": 0.4915, "step": 70550 }, { "epoch": 0.95, "learning_rate": 3.728233944386067e-07, "loss": 0.2419, "step": 70555 }, { "epoch": 0.95, "learning_rate": 3.7191864783515106e-07, "loss": 0.8688, "step": 70560 }, { "epoch": 0.95, "learning_rate": 3.710149921324874e-07, "loss": 1.3524, "step": 70565 }, { "epoch": 0.95, "learning_rate": 3.701124273706419e-07, "loss": 0.7366, "step": 70570 }, { "epoch": 0.95, "learning_rate": 3.6921095358959933e-07, "loss": 1.3136, "step": 70575 }, { "epoch": 0.95, "learning_rate": 3.683105708292861e-07, "loss": 0.6025, "step": 70580 }, { "epoch": 0.95, "learning_rate": 3.674112791295897e-07, "loss": 0.3048, "step": 70585 }, { "epoch": 0.95, "learning_rate": 3.6651307853033666e-07, "loss": 0.6144, "step": 70590 }, { "epoch": 0.95, "learning_rate": 3.656159690713201e-07, "loss": 0.172, "step": 70595 }, { "epoch": 0.95, "learning_rate": 3.647199507922722e-07, "loss": 0.793, "step": 70600 }, { "epoch": 0.95, "learning_rate": 3.638250237328833e-07, "loss": 0.7412, "step": 70605 }, { "epoch": 0.95, "learning_rate": 3.6293118793279403e-07, "loss": 0.612, "step": 70610 }, { "epoch": 0.95, "learning_rate": 3.6203844343160044e-07, "loss": 0.4493, "step": 70615 }, { "epoch": 0.95, "learning_rate": 3.6114679026884315e-07, "loss": 0.4675, "step": 70620 }, { "epoch": 0.95, "learning_rate": 3.602562284840183e-07, "loss": 0.3467, "step": 70625 }, { "epoch": 0.95, "learning_rate": 3.5936675811657493e-07, "loss": 0.4879, "step": 70630 }, { "epoch": 0.95, "learning_rate": 3.5847837920590933e-07, "loss": 0.5696, "step": 70635 }, { "epoch": 0.95, "learning_rate": 3.575910917913733e-07, "loss": 0.9588, "step": 70640 }, { "epoch": 0.95, "learning_rate": 3.567048959122715e-07, "loss": 0.8925, "step": 70645 }, { "epoch": 0.95, "learning_rate": 3.5581979160785594e-07, "loss": 0.849, "step": 70650 }, { "epoch": 0.95, "learning_rate": 3.549357789173313e-07, "loss": 0.5359, "step": 70655 }, { "epoch": 0.95, "learning_rate": 3.540528578798608e-07, "loss": 0.6578, "step": 70660 }, { "epoch": 0.95, "learning_rate": 3.5317102853454354e-07, "loss": 0.3561, "step": 70665 }, { "epoch": 0.95, "learning_rate": 3.522902909204484e-07, "loss": 1.0533, "step": 70670 }, { "epoch": 0.95, "learning_rate": 3.514106450765858e-07, "loss": 0.5489, "step": 70675 }, { "epoch": 0.95, "learning_rate": 3.505320910419163e-07, "loss": 0.5278, "step": 70680 }, { "epoch": 0.95, "learning_rate": 3.496546288553587e-07, "loss": 0.6875, "step": 70685 }, { "epoch": 0.95, "learning_rate": 3.487782585557764e-07, "loss": 1.272, "step": 70690 }, { "epoch": 0.95, "learning_rate": 3.479029801819966e-07, "loss": 0.5094, "step": 70695 }, { "epoch": 0.95, "learning_rate": 3.470287937727801e-07, "loss": 0.6313, "step": 70700 }, { "epoch": 0.95, "learning_rate": 3.461556993668541e-07, "loss": 0.1361, "step": 70705 }, { "epoch": 0.95, "learning_rate": 3.4528369700289055e-07, "loss": 0.4498, "step": 70710 }, { "epoch": 0.95, "learning_rate": 3.4441278671951684e-07, "loss": 1.1536, "step": 70715 }, { "epoch": 0.95, "learning_rate": 3.4354296855530764e-07, "loss": 0.468, "step": 70720 }, { "epoch": 0.95, "learning_rate": 3.426742425487933e-07, "loss": 1.1331, "step": 70725 }, { "epoch": 0.95, "learning_rate": 3.4180660873845136e-07, "loss": 0.7545, "step": 70730 }, { "epoch": 0.95, "learning_rate": 3.4094006716271774e-07, "loss": 1.0303, "step": 70735 }, { "epoch": 0.95, "learning_rate": 3.4007461785997563e-07, "loss": 0.6815, "step": 70740 }, { "epoch": 0.95, "learning_rate": 3.3921026086855544e-07, "loss": 1.2291, "step": 70745 }, { "epoch": 0.95, "learning_rate": 3.38346996226746e-07, "loss": 0.6167, "step": 70750 }, { "epoch": 0.95, "learning_rate": 3.3748482397278627e-07, "loss": 0.9157, "step": 70755 }, { "epoch": 0.95, "learning_rate": 3.3662374414486776e-07, "loss": 1.0225, "step": 70760 }, { "epoch": 0.95, "learning_rate": 3.357637567811295e-07, "loss": 0.57, "step": 70765 }, { "epoch": 0.95, "learning_rate": 3.3490486191966874e-07, "loss": 0.4683, "step": 70770 }, { "epoch": 0.95, "learning_rate": 3.3404705959852177e-07, "loss": 0.7868, "step": 70775 }, { "epoch": 0.95, "learning_rate": 3.331903498556943e-07, "loss": 0.1935, "step": 70780 }, { "epoch": 0.95, "learning_rate": 3.323347327291282e-07, "loss": 0.774, "step": 70785 }, { "epoch": 0.95, "learning_rate": 3.3148020825672363e-07, "loss": 0.7358, "step": 70790 }, { "epoch": 0.95, "learning_rate": 3.3062677647633654e-07, "loss": 0.4437, "step": 70795 }, { "epoch": 0.95, "learning_rate": 3.2977443742576166e-07, "loss": 1.7913, "step": 70800 }, { "epoch": 0.95, "learning_rate": 3.2892319114276316e-07, "loss": 0.6358, "step": 70805 }, { "epoch": 0.95, "learning_rate": 3.280730376650387e-07, "loss": 0.6566, "step": 70810 }, { "epoch": 0.95, "learning_rate": 3.272239770302471e-07, "loss": 1.1401, "step": 70815 }, { "epoch": 0.95, "learning_rate": 3.2637600927600544e-07, "loss": 0.8452, "step": 70820 }, { "epoch": 0.95, "learning_rate": 3.255291344398614e-07, "loss": 0.3991, "step": 70825 }, { "epoch": 0.95, "learning_rate": 3.246833525593379e-07, "loss": 0.5251, "step": 70830 }, { "epoch": 0.95, "learning_rate": 3.2383866367189654e-07, "loss": 0.8511, "step": 70835 }, { "epoch": 0.95, "learning_rate": 3.2299506781494905e-07, "loss": 0.6928, "step": 70840 }, { "epoch": 0.95, "learning_rate": 3.221525650258655e-07, "loss": 1.1118, "step": 70845 }, { "epoch": 0.95, "learning_rate": 3.213111553419634e-07, "loss": 0.8497, "step": 70850 }, { "epoch": 0.95, "learning_rate": 3.204708388005156e-07, "loss": 0.6146, "step": 70855 }, { "epoch": 0.95, "learning_rate": 3.1963161543873685e-07, "loss": 1.2698, "step": 70860 }, { "epoch": 0.95, "learning_rate": 3.1879348529381127e-07, "loss": 0.6382, "step": 70865 }, { "epoch": 0.95, "learning_rate": 3.1795644840285353e-07, "loss": 0.1386, "step": 70870 }, { "epoch": 0.95, "learning_rate": 3.1712050480294795e-07, "loss": 0.4098, "step": 70875 }, { "epoch": 0.95, "learning_rate": 3.1628565453112046e-07, "loss": 0.4357, "step": 70880 }, { "epoch": 0.95, "learning_rate": 3.1545189762434426e-07, "loss": 0.5763, "step": 70885 }, { "epoch": 0.95, "learning_rate": 3.1461923411956195e-07, "loss": 0.9174, "step": 70890 }, { "epoch": 0.95, "learning_rate": 3.137876640536469e-07, "loss": 1.0396, "step": 70895 }, { "epoch": 0.95, "learning_rate": 3.1295718746343907e-07, "loss": 0.6811, "step": 70900 }, { "epoch": 0.95, "learning_rate": 3.1212780438572007e-07, "loss": 1.1173, "step": 70905 }, { "epoch": 0.95, "learning_rate": 3.112995148572301e-07, "loss": 0.6439, "step": 70910 }, { "epoch": 0.95, "learning_rate": 3.104723189146619e-07, "loss": 0.5221, "step": 70915 }, { "epoch": 0.95, "learning_rate": 3.096462165946473e-07, "loss": 0.3129, "step": 70920 }, { "epoch": 0.95, "learning_rate": 3.0882120793378486e-07, "loss": 0.8206, "step": 70925 }, { "epoch": 0.95, "learning_rate": 3.079972929686203e-07, "loss": 0.8297, "step": 70930 }, { "epoch": 0.95, "learning_rate": 3.0717447173564116e-07, "loss": 1.6226, "step": 70935 }, { "epoch": 0.95, "learning_rate": 3.0635274427129876e-07, "loss": 0.3681, "step": 70940 }, { "epoch": 0.95, "learning_rate": 3.055321106119946e-07, "loss": 0.5903, "step": 70945 }, { "epoch": 0.95, "learning_rate": 3.047125707940718e-07, "loss": 0.6681, "step": 70950 }, { "epoch": 0.95, "learning_rate": 3.038941248538374e-07, "loss": 1.0117, "step": 70955 }, { "epoch": 0.95, "learning_rate": 3.03076772827543e-07, "loss": 1.4718, "step": 70960 }, { "epoch": 0.95, "learning_rate": 3.0226051475139294e-07, "loss": 0.2752, "step": 70965 }, { "epoch": 0.95, "learning_rate": 3.014453506615417e-07, "loss": 1.24, "step": 70970 }, { "epoch": 0.95, "learning_rate": 3.0063128059409917e-07, "loss": 0.3546, "step": 70975 }, { "epoch": 0.95, "learning_rate": 2.998183045851227e-07, "loss": 1.2846, "step": 70980 }, { "epoch": 0.95, "learning_rate": 2.990064226706252e-07, "loss": 0.6115, "step": 70985 }, { "epoch": 0.95, "learning_rate": 2.9819563488656943e-07, "loss": 1.2841, "step": 70990 }, { "epoch": 0.95, "learning_rate": 2.9738594126886566e-07, "loss": 0.6378, "step": 70995 }, { "epoch": 0.95, "learning_rate": 2.965773418533824e-07, "loss": 0.6057, "step": 71000 }, { "epoch": 0.95, "learning_rate": 2.957698366759354e-07, "loss": 0.3741, "step": 71005 }, { "epoch": 0.95, "learning_rate": 2.949634257722905e-07, "loss": 0.2619, "step": 71010 }, { "epoch": 0.95, "learning_rate": 2.9415810917817476e-07, "loss": 0.8882, "step": 71015 }, { "epoch": 0.95, "learning_rate": 2.9335388692925404e-07, "loss": 0.3538, "step": 71020 }, { "epoch": 0.95, "learning_rate": 2.925507590611526e-07, "loss": 0.351, "step": 71025 }, { "epoch": 0.95, "learning_rate": 2.91748725609442e-07, "loss": 0.7041, "step": 71030 }, { "epoch": 0.95, "learning_rate": 2.909477866096522e-07, "loss": 0.4123, "step": 71035 }, { "epoch": 0.95, "learning_rate": 2.9014794209726584e-07, "loss": 0.2154, "step": 71040 }, { "epoch": 0.95, "learning_rate": 2.893491921076991e-07, "loss": 0.2629, "step": 71045 }, { "epoch": 0.95, "learning_rate": 2.8855153667634304e-07, "loss": 0.2439, "step": 71050 }, { "epoch": 0.95, "learning_rate": 2.8775497583852785e-07, "loss": 1.1865, "step": 71055 }, { "epoch": 0.95, "learning_rate": 2.8695950962953076e-07, "loss": 0.394, "step": 71060 }, { "epoch": 0.95, "learning_rate": 2.861651380845959e-07, "loss": 0.5766, "step": 71065 }, { "epoch": 0.95, "learning_rate": 2.853718612389061e-07, "loss": 0.8664, "step": 71070 }, { "epoch": 0.95, "learning_rate": 2.845796791276001e-07, "loss": 1.3809, "step": 71075 }, { "epoch": 0.95, "learning_rate": 2.8378859178576356e-07, "loss": 0.7706, "step": 71080 }, { "epoch": 0.95, "learning_rate": 2.8299859924844353e-07, "loss": 0.7539, "step": 71085 }, { "epoch": 0.95, "learning_rate": 2.8220970155062865e-07, "loss": 0.5487, "step": 71090 }, { "epoch": 0.95, "learning_rate": 2.8142189872726597e-07, "loss": 0.1226, "step": 71095 }, { "epoch": 0.95, "learning_rate": 2.806351908132526e-07, "loss": 0.4849, "step": 71100 }, { "epoch": 0.95, "learning_rate": 2.7984957784342735e-07, "loss": 0.2069, "step": 71105 }, { "epoch": 0.95, "learning_rate": 2.790650598525985e-07, "loss": 0.8658, "step": 71110 }, { "epoch": 0.95, "learning_rate": 2.7828163687551314e-07, "loss": 0.4596, "step": 71115 }, { "epoch": 0.95, "learning_rate": 2.774993089468686e-07, "loss": 0.3869, "step": 71120 }, { "epoch": 0.95, "learning_rate": 2.7671807610132607e-07, "loss": 0.3186, "step": 71125 }, { "epoch": 0.95, "learning_rate": 2.759379383734856e-07, "loss": 0.1843, "step": 71130 }, { "epoch": 0.95, "learning_rate": 2.7515889579790286e-07, "loss": 0.2584, "step": 71135 }, { "epoch": 0.95, "learning_rate": 2.7438094840908366e-07, "loss": 0.6461, "step": 71140 }, { "epoch": 0.95, "learning_rate": 2.7360409624149205e-07, "loss": 1.3818, "step": 71145 }, { "epoch": 0.95, "learning_rate": 2.7282833932953944e-07, "loss": 1.2369, "step": 71150 }, { "epoch": 0.95, "learning_rate": 2.7205367770758163e-07, "loss": 1.1675, "step": 71155 }, { "epoch": 0.95, "learning_rate": 2.712801114099384e-07, "loss": 0.5706, "step": 71160 }, { "epoch": 0.95, "learning_rate": 2.705076404708712e-07, "loss": 0.3129, "step": 71165 }, { "epoch": 0.95, "learning_rate": 2.6973626492459716e-07, "loss": 1.2417, "step": 71170 }, { "epoch": 0.95, "learning_rate": 2.6896598480528613e-07, "loss": 1.2888, "step": 71175 }, { "epoch": 0.95, "learning_rate": 2.6819680014705807e-07, "loss": 0.5475, "step": 71180 }, { "epoch": 0.95, "learning_rate": 2.6742871098398016e-07, "loss": 0.2083, "step": 71185 }, { "epoch": 0.95, "learning_rate": 2.666617173500752e-07, "loss": 0.7266, "step": 71190 }, { "epoch": 0.95, "learning_rate": 2.658958192793215e-07, "loss": 0.848, "step": 71195 }, { "epoch": 0.95, "learning_rate": 2.6513101680564477e-07, "loss": 1.0721, "step": 71200 }, { "epoch": 0.95, "learning_rate": 2.6436730996291516e-07, "loss": 0.5977, "step": 71205 }, { "epoch": 0.95, "learning_rate": 2.636046987849694e-07, "loss": 0.7973, "step": 71210 }, { "epoch": 0.95, "learning_rate": 2.6284318330557777e-07, "loss": 1.1737, "step": 71215 }, { "epoch": 0.95, "learning_rate": 2.6208276355847994e-07, "loss": 0.7512, "step": 71220 }, { "epoch": 0.95, "learning_rate": 2.613234395773573e-07, "loss": 0.1846, "step": 71225 }, { "epoch": 0.95, "learning_rate": 2.6056521139583846e-07, "loss": 0.5727, "step": 71230 }, { "epoch": 0.95, "learning_rate": 2.5980807904751883e-07, "loss": 0.3851, "step": 71235 }, { "epoch": 0.95, "learning_rate": 2.590520425659271e-07, "loss": 0.5732, "step": 71240 }, { "epoch": 0.95, "learning_rate": 2.5829710198455314e-07, "loss": 0.6353, "step": 71245 }, { "epoch": 0.95, "learning_rate": 2.575432573368397e-07, "loss": 0.8142, "step": 71250 }, { "epoch": 0.95, "learning_rate": 2.5679050865617673e-07, "loss": 0.3934, "step": 71255 }, { "epoch": 0.95, "learning_rate": 2.560388559759125e-07, "loss": 0.2602, "step": 71260 }, { "epoch": 0.95, "learning_rate": 2.552882993293315e-07, "loss": 1.0496, "step": 71265 }, { "epoch": 0.95, "learning_rate": 2.5453883874968776e-07, "loss": 0.9317, "step": 71270 }, { "epoch": 0.95, "learning_rate": 2.537904742701741e-07, "loss": 0.2558, "step": 71275 }, { "epoch": 0.96, "learning_rate": 2.530432059239418e-07, "loss": 0.7239, "step": 71280 }, { "epoch": 0.96, "learning_rate": 2.522970337440894e-07, "loss": 0.6566, "step": 71285 }, { "epoch": 0.96, "learning_rate": 2.5155195776367104e-07, "loss": 0.9461, "step": 71290 }, { "epoch": 0.96, "learning_rate": 2.50807978015688e-07, "loss": 0.3361, "step": 71295 }, { "epoch": 0.96, "learning_rate": 2.500650945330946e-07, "loss": 0.6862, "step": 71300 }, { "epoch": 0.96, "learning_rate": 2.4932330734879773e-07, "loss": 0.8275, "step": 71305 }, { "epoch": 0.96, "learning_rate": 2.485826164956545e-07, "loss": 0.4204, "step": 71310 }, { "epoch": 0.96, "learning_rate": 2.478430220064748e-07, "loss": 0.6797, "step": 71315 }, { "epoch": 0.96, "learning_rate": 2.471045239140185e-07, "loss": 1.2587, "step": 71320 }, { "epoch": 0.96, "learning_rate": 2.4636712225099555e-07, "loss": 1.4455, "step": 71325 }, { "epoch": 0.96, "learning_rate": 2.4563081705006876e-07, "loss": 0.702, "step": 71330 }, { "epoch": 0.96, "learning_rate": 2.4489560834385914e-07, "loss": 0.8935, "step": 71335 }, { "epoch": 0.96, "learning_rate": 2.441614961649241e-07, "loss": 0.7247, "step": 71340 }, { "epoch": 0.96, "learning_rate": 2.434284805457876e-07, "loss": 0.7003, "step": 71345 }, { "epoch": 0.96, "learning_rate": 2.426965615189153e-07, "loss": 0.2709, "step": 71350 }, { "epoch": 0.96, "learning_rate": 2.419657391167257e-07, "loss": 0.6072, "step": 71355 }, { "epoch": 0.96, "learning_rate": 2.412360133715985e-07, "loss": 0.5699, "step": 71360 }, { "epoch": 0.96, "learning_rate": 2.4050738431584674e-07, "loss": 1.0368, "step": 71365 }, { "epoch": 0.96, "learning_rate": 2.397798519817557e-07, "loss": 0.4468, "step": 71370 }, { "epoch": 0.96, "learning_rate": 2.390534164015412e-07, "loss": 1.0158, "step": 71375 }, { "epoch": 0.96, "learning_rate": 2.3832807760738597e-07, "loss": 0.6619, "step": 71380 }, { "epoch": 0.96, "learning_rate": 2.3760383563141976e-07, "loss": 0.7605, "step": 71385 }, { "epoch": 0.96, "learning_rate": 2.368806905057197e-07, "loss": 1.0759, "step": 71390 }, { "epoch": 0.96, "learning_rate": 2.3615864226232133e-07, "loss": 1.0872, "step": 71395 }, { "epoch": 0.96, "learning_rate": 2.3543769093320178e-07, "loss": 0.7184, "step": 71400 }, { "epoch": 0.96, "learning_rate": 2.3471783655030223e-07, "loss": 0.4854, "step": 71405 }, { "epoch": 0.96, "learning_rate": 2.3399907914550546e-07, "loss": 0.948, "step": 71410 }, { "epoch": 0.96, "learning_rate": 2.3328141875064713e-07, "loss": 0.6325, "step": 71415 }, { "epoch": 0.96, "learning_rate": 2.3256485539752127e-07, "loss": 0.152, "step": 71420 }, { "epoch": 0.96, "learning_rate": 2.318493891178608e-07, "loss": 0.7389, "step": 71425 }, { "epoch": 0.96, "learning_rate": 2.311350199433654e-07, "loss": 0.7828, "step": 71430 }, { "epoch": 0.96, "learning_rate": 2.3042174790567085e-07, "loss": 0.4869, "step": 71435 }, { "epoch": 0.96, "learning_rate": 2.2970957303637686e-07, "loss": 0.1896, "step": 71440 }, { "epoch": 0.96, "learning_rate": 2.289984953670249e-07, "loss": 1.1583, "step": 71445 }, { "epoch": 0.96, "learning_rate": 2.2828851492911473e-07, "loss": 0.9954, "step": 71450 }, { "epoch": 0.96, "learning_rate": 2.2757963175409346e-07, "loss": 0.5874, "step": 71455 }, { "epoch": 0.96, "learning_rate": 2.2687184587336375e-07, "loss": 1.0211, "step": 71460 }, { "epoch": 0.96, "learning_rate": 2.261651573182727e-07, "loss": 1.0046, "step": 71465 }, { "epoch": 0.96, "learning_rate": 2.2545956612012864e-07, "loss": 0.7189, "step": 71470 }, { "epoch": 0.96, "learning_rate": 2.2475507231017878e-07, "loss": 1.1019, "step": 71475 }, { "epoch": 0.96, "learning_rate": 2.2405167591963705e-07, "loss": 0.9217, "step": 71480 }, { "epoch": 0.96, "learning_rate": 2.2334937697965352e-07, "loss": 0.8957, "step": 71485 }, { "epoch": 0.96, "learning_rate": 2.2264817552133943e-07, "loss": 0.5082, "step": 71490 }, { "epoch": 0.96, "learning_rate": 2.2194807157575327e-07, "loss": 0.6581, "step": 71495 }, { "epoch": 0.96, "learning_rate": 2.2124906517390632e-07, "loss": 0.5508, "step": 71500 }, { "epoch": 0.96, "learning_rate": 2.205511563467627e-07, "loss": 0.7523, "step": 71505 }, { "epoch": 0.96, "learning_rate": 2.198543451252366e-07, "loss": 0.1345, "step": 71510 }, { "epoch": 0.96, "learning_rate": 2.1915863154019224e-07, "loss": 0.8932, "step": 71515 }, { "epoch": 0.96, "learning_rate": 2.1846401562244101e-07, "loss": 0.683, "step": 71520 }, { "epoch": 0.96, "learning_rate": 2.1777049740276112e-07, "loss": 0.9401, "step": 71525 }, { "epoch": 0.96, "learning_rate": 2.170780769118641e-07, "loss": 1.5053, "step": 71530 }, { "epoch": 0.96, "learning_rate": 2.1638675418042265e-07, "loss": 1.0311, "step": 71535 }, { "epoch": 0.96, "learning_rate": 2.1569652923905947e-07, "loss": 0.6797, "step": 71540 }, { "epoch": 0.96, "learning_rate": 2.1500740211835013e-07, "loss": 0.9153, "step": 71545 }, { "epoch": 0.96, "learning_rate": 2.1431937284881466e-07, "loss": 0.7641, "step": 71550 }, { "epoch": 0.96, "learning_rate": 2.136324414609342e-07, "loss": 0.3242, "step": 71555 }, { "epoch": 0.96, "learning_rate": 2.1294660798513168e-07, "loss": 0.9448, "step": 71560 }, { "epoch": 0.96, "learning_rate": 2.1226187245179108e-07, "loss": 1.0409, "step": 71565 }, { "epoch": 0.96, "learning_rate": 2.1157823489124097e-07, "loss": 0.9786, "step": 71570 }, { "epoch": 0.96, "learning_rate": 2.1089569533375985e-07, "loss": 1.6467, "step": 71575 }, { "epoch": 0.96, "learning_rate": 2.1021425380958747e-07, "loss": 0.3242, "step": 71580 }, { "epoch": 0.96, "learning_rate": 2.0953391034890247e-07, "loss": 0.8377, "step": 71585 }, { "epoch": 0.96, "learning_rate": 2.088546649818418e-07, "loss": 1.069, "step": 71590 }, { "epoch": 0.96, "learning_rate": 2.0817651773849255e-07, "loss": 0.7225, "step": 71595 }, { "epoch": 0.96, "learning_rate": 2.0749946864889458e-07, "loss": 0.4501, "step": 71600 }, { "epoch": 0.96, "learning_rate": 2.0682351774303776e-07, "loss": 0.6686, "step": 71605 }, { "epoch": 0.96, "learning_rate": 2.0614866505085928e-07, "loss": 0.8024, "step": 71610 }, { "epoch": 0.96, "learning_rate": 2.054749106022602e-07, "loss": 0.7351, "step": 71615 }, { "epoch": 0.96, "learning_rate": 2.048022544270778e-07, "loss": 0.2946, "step": 71620 }, { "epoch": 0.96, "learning_rate": 2.0413069655510765e-07, "loss": 0.6504, "step": 71625 }, { "epoch": 0.96, "learning_rate": 2.034602370160982e-07, "loss": 0.8984, "step": 71630 }, { "epoch": 0.96, "learning_rate": 2.0279087583974788e-07, "loss": 0.3561, "step": 71635 }, { "epoch": 0.96, "learning_rate": 2.0212261305570524e-07, "loss": 0.9628, "step": 71640 }, { "epoch": 0.96, "learning_rate": 2.0145544869357158e-07, "loss": 0.9824, "step": 71645 }, { "epoch": 0.96, "learning_rate": 2.0078938278289828e-07, "loss": 1.0204, "step": 71650 }, { "epoch": 0.96, "learning_rate": 2.0012441535318672e-07, "loss": 0.7193, "step": 71655 }, { "epoch": 0.96, "learning_rate": 1.9946054643389666e-07, "loss": 0.8093, "step": 71660 }, { "epoch": 0.96, "learning_rate": 1.987977760544296e-07, "loss": 0.6692, "step": 71665 }, { "epoch": 0.96, "learning_rate": 1.9813610424414264e-07, "loss": 0.5843, "step": 71670 }, { "epoch": 0.96, "learning_rate": 1.9747553103234838e-07, "loss": 1.0313, "step": 71675 }, { "epoch": 0.96, "learning_rate": 1.968160564483068e-07, "loss": 1.0435, "step": 71680 }, { "epoch": 0.96, "learning_rate": 1.9615768052122229e-07, "loss": 0.7723, "step": 71685 }, { "epoch": 0.96, "learning_rate": 1.9550040328026875e-07, "loss": 0.4039, "step": 71690 }, { "epoch": 0.96, "learning_rate": 1.9484422475455067e-07, "loss": 0.9789, "step": 71695 }, { "epoch": 0.96, "learning_rate": 1.9418914497313922e-07, "loss": 0.271, "step": 71700 }, { "epoch": 0.96, "learning_rate": 1.9353516396504735e-07, "loss": 0.7874, "step": 71705 }, { "epoch": 0.96, "learning_rate": 1.9288228175924627e-07, "loss": 1.1754, "step": 71710 }, { "epoch": 0.96, "learning_rate": 1.922304983846518e-07, "loss": 0.8158, "step": 71715 }, { "epoch": 0.96, "learning_rate": 1.91579813870138e-07, "loss": 0.4305, "step": 71720 }, { "epoch": 0.96, "learning_rate": 1.9093022824452632e-07, "loss": 0.4242, "step": 71725 }, { "epoch": 0.96, "learning_rate": 1.9028174153659095e-07, "loss": 0.7553, "step": 71730 }, { "epoch": 0.96, "learning_rate": 1.8963435377505333e-07, "loss": 1.1726, "step": 71735 }, { "epoch": 0.96, "learning_rate": 1.8898806498859057e-07, "loss": 0.7515, "step": 71740 }, { "epoch": 0.96, "learning_rate": 1.883428752058325e-07, "loss": 0.4147, "step": 71745 }, { "epoch": 0.96, "learning_rate": 1.8769878445535626e-07, "loss": 1.2346, "step": 71750 }, { "epoch": 0.96, "learning_rate": 1.8705579276569186e-07, "loss": 0.1522, "step": 71755 }, { "epoch": 0.96, "learning_rate": 1.86413900165322e-07, "loss": 0.7476, "step": 71760 }, { "epoch": 0.96, "learning_rate": 1.85773106682674e-07, "loss": 1.5536, "step": 71765 }, { "epoch": 0.96, "learning_rate": 1.8513341234613901e-07, "loss": 0.7266, "step": 71770 }, { "epoch": 0.96, "learning_rate": 1.8449481718404714e-07, "loss": 0.6959, "step": 71775 }, { "epoch": 0.96, "learning_rate": 1.838573212246869e-07, "loss": 0.8017, "step": 71780 }, { "epoch": 0.96, "learning_rate": 1.8322092449629957e-07, "loss": 0.5939, "step": 71785 }, { "epoch": 0.96, "learning_rate": 1.8258562702706817e-07, "loss": 0.4724, "step": 71790 }, { "epoch": 0.96, "learning_rate": 1.8195142884513406e-07, "loss": 0.7224, "step": 71795 }, { "epoch": 0.96, "learning_rate": 1.8131832997859144e-07, "loss": 0.6169, "step": 71800 }, { "epoch": 0.96, "learning_rate": 1.8068633045548454e-07, "loss": 0.9529, "step": 71805 }, { "epoch": 0.96, "learning_rate": 1.8005543030380767e-07, "loss": 0.7522, "step": 71810 }, { "epoch": 0.96, "learning_rate": 1.7942562955149956e-07, "loss": 0.7535, "step": 71815 }, { "epoch": 0.96, "learning_rate": 1.7879692822646843e-07, "loss": 1.0154, "step": 71820 }, { "epoch": 0.96, "learning_rate": 1.7816932635655315e-07, "loss": 0.3499, "step": 71825 }, { "epoch": 0.96, "learning_rate": 1.7754282396955646e-07, "loss": 0.6737, "step": 71830 }, { "epoch": 0.96, "learning_rate": 1.7691742109323394e-07, "loss": 1.0696, "step": 71835 }, { "epoch": 0.96, "learning_rate": 1.7629311775528012e-07, "loss": 0.2698, "step": 71840 }, { "epoch": 0.96, "learning_rate": 1.756699139833534e-07, "loss": 1.1758, "step": 71845 }, { "epoch": 0.96, "learning_rate": 1.7504780980505676e-07, "loss": 0.363, "step": 71850 }, { "epoch": 0.96, "learning_rate": 1.7442680524794863e-07, "loss": 0.5216, "step": 71855 }, { "epoch": 0.96, "learning_rate": 1.7380690033953207e-07, "loss": 0.5928, "step": 71860 }, { "epoch": 0.96, "learning_rate": 1.7318809510726841e-07, "loss": 0.7502, "step": 71865 }, { "epoch": 0.96, "learning_rate": 1.7257038957856908e-07, "loss": 0.8126, "step": 71870 }, { "epoch": 0.96, "learning_rate": 1.7195378378079273e-07, "loss": 0.5872, "step": 71875 }, { "epoch": 0.96, "learning_rate": 1.7133827774125367e-07, "loss": 0.8253, "step": 71880 }, { "epoch": 0.96, "learning_rate": 1.7072387148721613e-07, "loss": 0.8354, "step": 71885 }, { "epoch": 0.96, "learning_rate": 1.7011056504589173e-07, "loss": 0.3725, "step": 71890 }, { "epoch": 0.96, "learning_rate": 1.694983584444504e-07, "loss": 0.5238, "step": 71895 }, { "epoch": 0.96, "learning_rate": 1.6888725171000653e-07, "loss": 0.7358, "step": 71900 }, { "epoch": 0.96, "learning_rate": 1.6827724486963293e-07, "loss": 0.5352, "step": 71905 }, { "epoch": 0.96, "learning_rate": 1.6766833795034965e-07, "loss": 0.5207, "step": 71910 }, { "epoch": 0.96, "learning_rate": 1.67060530979124e-07, "loss": 0.7185, "step": 71915 }, { "epoch": 0.96, "learning_rate": 1.6645382398288444e-07, "loss": 0.5198, "step": 71920 }, { "epoch": 0.96, "learning_rate": 1.6584821698850117e-07, "loss": 0.2854, "step": 71925 }, { "epoch": 0.96, "learning_rate": 1.6524371002279993e-07, "loss": 0.5816, "step": 71930 }, { "epoch": 0.96, "learning_rate": 1.6464030311255928e-07, "loss": 1.3675, "step": 71935 }, { "epoch": 0.96, "learning_rate": 1.6403799628450234e-07, "loss": 0.5313, "step": 71940 }, { "epoch": 0.96, "learning_rate": 1.6343678956531327e-07, "loss": 0.7468, "step": 71945 }, { "epoch": 0.96, "learning_rate": 1.6283668298162357e-07, "loss": 1.0786, "step": 71950 }, { "epoch": 0.96, "learning_rate": 1.6223767656001198e-07, "loss": 0.63, "step": 71955 }, { "epoch": 0.96, "learning_rate": 1.6163977032700728e-07, "loss": 0.6312, "step": 71960 }, { "epoch": 0.96, "learning_rate": 1.6104296430910214e-07, "loss": 1.1846, "step": 71965 }, { "epoch": 0.96, "learning_rate": 1.6044725853272823e-07, "loss": 0.6644, "step": 71970 }, { "epoch": 0.96, "learning_rate": 1.5985265302427277e-07, "loss": 0.1715, "step": 71975 }, { "epoch": 0.96, "learning_rate": 1.59259147810073e-07, "loss": 0.25, "step": 71980 }, { "epoch": 0.96, "learning_rate": 1.5866674291641627e-07, "loss": 0.5464, "step": 71985 }, { "epoch": 0.96, "learning_rate": 1.5807543836954818e-07, "loss": 0.6607, "step": 71990 }, { "epoch": 0.96, "learning_rate": 1.5748523419565896e-07, "loss": 0.9843, "step": 71995 }, { "epoch": 0.96, "learning_rate": 1.568961304208888e-07, "loss": 0.2987, "step": 72000 }, { "epoch": 0.96, "learning_rate": 1.5630812707133347e-07, "loss": 0.7024, "step": 72005 }, { "epoch": 0.96, "learning_rate": 1.557212241730388e-07, "loss": 0.5641, "step": 72010 }, { "epoch": 0.96, "learning_rate": 1.5513542175200346e-07, "loss": 0.5542, "step": 72015 }, { "epoch": 0.96, "learning_rate": 1.5455071983417335e-07, "loss": 1.1005, "step": 72020 }, { "epoch": 0.97, "learning_rate": 1.539671184454472e-07, "loss": 0.8521, "step": 72025 }, { "epoch": 0.97, "learning_rate": 1.5338461761167932e-07, "loss": 1.1382, "step": 72030 }, { "epoch": 0.97, "learning_rate": 1.5280321735866855e-07, "loss": 0.3472, "step": 72035 }, { "epoch": 0.97, "learning_rate": 1.5222291771216644e-07, "loss": 1.0809, "step": 72040 }, { "epoch": 0.97, "learning_rate": 1.5164371869788309e-07, "loss": 1.1989, "step": 72045 }, { "epoch": 0.97, "learning_rate": 1.510656203414673e-07, "loss": 0.2168, "step": 72050 }, { "epoch": 0.97, "learning_rate": 1.5048862266852925e-07, "loss": 1.3731, "step": 72055 }, { "epoch": 0.97, "learning_rate": 1.49912725704629e-07, "loss": 0.2958, "step": 72060 }, { "epoch": 0.97, "learning_rate": 1.493379294752739e-07, "loss": 1.0725, "step": 72065 }, { "epoch": 0.97, "learning_rate": 1.487642340059242e-07, "loss": 1.108, "step": 72070 }, { "epoch": 0.97, "learning_rate": 1.4819163932199287e-07, "loss": 0.6028, "step": 72075 }, { "epoch": 0.97, "learning_rate": 1.4762014544884018e-07, "loss": 0.6862, "step": 72080 }, { "epoch": 0.97, "learning_rate": 1.4704975241178198e-07, "loss": 0.5814, "step": 72085 }, { "epoch": 0.97, "learning_rate": 1.4648046023608698e-07, "loss": 1.0229, "step": 72090 }, { "epoch": 0.97, "learning_rate": 1.459122689469683e-07, "loss": 0.6687, "step": 72095 }, { "epoch": 0.97, "learning_rate": 1.4534517856959474e-07, "loss": 0.5351, "step": 72100 }, { "epoch": 0.97, "learning_rate": 1.4477918912908782e-07, "loss": 0.5479, "step": 72105 }, { "epoch": 0.97, "learning_rate": 1.4421430065051368e-07, "loss": 0.2532, "step": 72110 }, { "epoch": 0.97, "learning_rate": 1.4365051315889666e-07, "loss": 0.6223, "step": 72115 }, { "epoch": 0.97, "learning_rate": 1.4308782667921128e-07, "loss": 0.573, "step": 72120 }, { "epoch": 0.97, "learning_rate": 1.4252624123637647e-07, "loss": 0.8111, "step": 72125 }, { "epoch": 0.97, "learning_rate": 1.4196575685527514e-07, "loss": 0.7907, "step": 72130 }, { "epoch": 0.97, "learning_rate": 1.4140637356072627e-07, "loss": 0.7456, "step": 72135 }, { "epoch": 0.97, "learning_rate": 1.4084809137751565e-07, "loss": 1.0561, "step": 72140 }, { "epoch": 0.97, "learning_rate": 1.4029091033036234e-07, "loss": 0.6903, "step": 72145 }, { "epoch": 0.97, "learning_rate": 1.3973483044395775e-07, "loss": 0.8325, "step": 72150 }, { "epoch": 0.97, "learning_rate": 1.3917985174292658e-07, "loss": 0.4456, "step": 72155 }, { "epoch": 0.97, "learning_rate": 1.3862597425185198e-07, "loss": 0.9363, "step": 72160 }, { "epoch": 0.97, "learning_rate": 1.3807319799526985e-07, "loss": 0.858, "step": 72165 }, { "epoch": 0.97, "learning_rate": 1.3752152299766618e-07, "loss": 1.0615, "step": 72170 }, { "epoch": 0.97, "learning_rate": 1.369709492834742e-07, "loss": 0.2052, "step": 72175 }, { "epoch": 0.97, "learning_rate": 1.3642147687708275e-07, "loss": 0.3107, "step": 72180 }, { "epoch": 0.97, "learning_rate": 1.3587310580283342e-07, "loss": 1.0086, "step": 72185 }, { "epoch": 0.97, "learning_rate": 1.3532583608501237e-07, "loss": 1.0439, "step": 72190 }, { "epoch": 0.97, "learning_rate": 1.347796677478641e-07, "loss": 0.8328, "step": 72195 }, { "epoch": 0.97, "learning_rate": 1.3423460081558038e-07, "loss": 0.6261, "step": 72200 }, { "epoch": 0.97, "learning_rate": 1.3369063531230298e-07, "loss": 0.1956, "step": 72205 }, { "epoch": 0.97, "learning_rate": 1.331477712621265e-07, "loss": 1.0932, "step": 72210 }, { "epoch": 0.97, "learning_rate": 1.32606008689104e-07, "loss": 0.344, "step": 72215 }, { "epoch": 0.97, "learning_rate": 1.320653476172218e-07, "loss": 0.5335, "step": 72220 }, { "epoch": 0.97, "learning_rate": 1.3152578807043847e-07, "loss": 0.6574, "step": 72225 }, { "epoch": 0.97, "learning_rate": 1.3098733007264884e-07, "loss": 0.7395, "step": 72230 }, { "epoch": 0.97, "learning_rate": 1.304499736477033e-07, "loss": 1.2747, "step": 72235 }, { "epoch": 0.97, "learning_rate": 1.2991371881940495e-07, "loss": 1.0817, "step": 72240 }, { "epoch": 0.97, "learning_rate": 1.2937856561150984e-07, "loss": 0.715, "step": 72245 }, { "epoch": 0.97, "learning_rate": 1.2884451404772125e-07, "loss": 0.3395, "step": 72250 }, { "epoch": 0.97, "learning_rate": 1.2831156415168965e-07, "loss": 0.5323, "step": 72255 }, { "epoch": 0.97, "learning_rate": 1.2777971594702952e-07, "loss": 0.5273, "step": 72260 }, { "epoch": 0.97, "learning_rate": 1.2724896945729702e-07, "loss": 0.8759, "step": 72265 }, { "epoch": 0.97, "learning_rate": 1.267193247060011e-07, "loss": 0.6759, "step": 72270 }, { "epoch": 0.97, "learning_rate": 1.2619078171660083e-07, "loss": 0.9556, "step": 72275 }, { "epoch": 0.97, "learning_rate": 1.2566334051250795e-07, "loss": 1.5536, "step": 72280 }, { "epoch": 0.97, "learning_rate": 1.2513700111708716e-07, "loss": 0.7643, "step": 72285 }, { "epoch": 0.97, "learning_rate": 1.2461176355365313e-07, "loss": 0.4918, "step": 72290 }, { "epoch": 0.97, "learning_rate": 1.2408762784547056e-07, "loss": 0.6426, "step": 72295 }, { "epoch": 0.97, "learning_rate": 1.2356459401575703e-07, "loss": 0.1861, "step": 72300 }, { "epoch": 0.97, "learning_rate": 1.2304266208767457e-07, "loss": 1.3068, "step": 72305 }, { "epoch": 0.97, "learning_rate": 1.225218320843491e-07, "loss": 0.3113, "step": 72310 }, { "epoch": 0.97, "learning_rate": 1.2200210402885104e-07, "loss": 0.418, "step": 72315 }, { "epoch": 0.97, "learning_rate": 1.2148347794419534e-07, "loss": 1.1893, "step": 72320 }, { "epoch": 0.97, "learning_rate": 1.2096595385336085e-07, "loss": 0.4626, "step": 72325 }, { "epoch": 0.97, "learning_rate": 1.204495317792681e-07, "loss": 0.3448, "step": 72330 }, { "epoch": 0.97, "learning_rate": 1.1993421174479048e-07, "loss": 0.6558, "step": 72335 }, { "epoch": 0.97, "learning_rate": 1.194199937727597e-07, "loss": 0.5795, "step": 72340 }, { "epoch": 0.97, "learning_rate": 1.1890687788594646e-07, "loss": 1.1048, "step": 72345 }, { "epoch": 0.97, "learning_rate": 1.1839486410708256e-07, "loss": 1.1968, "step": 72350 }, { "epoch": 0.97, "learning_rate": 1.1788395245884987e-07, "loss": 1.4491, "step": 72355 }, { "epoch": 0.97, "learning_rate": 1.1737414296387473e-07, "loss": 0.2012, "step": 72360 }, { "epoch": 0.97, "learning_rate": 1.1686543564474184e-07, "loss": 0.2142, "step": 72365 }, { "epoch": 0.97, "learning_rate": 1.1635783052398319e-07, "loss": 0.9689, "step": 72370 }, { "epoch": 0.97, "learning_rate": 1.1585132762408357e-07, "loss": 0.4083, "step": 72375 }, { "epoch": 0.97, "learning_rate": 1.1534592696748058e-07, "loss": 0.9649, "step": 72380 }, { "epoch": 0.97, "learning_rate": 1.1484162857655634e-07, "loss": 2.1976, "step": 72385 }, { "epoch": 0.97, "learning_rate": 1.1433843247365405e-07, "loss": 0.7709, "step": 72390 }, { "epoch": 0.97, "learning_rate": 1.1383633868105869e-07, "loss": 0.638, "step": 72395 }, { "epoch": 0.97, "learning_rate": 1.133353472210108e-07, "loss": 0.9513, "step": 72400 }, { "epoch": 0.97, "learning_rate": 1.128354581157065e-07, "loss": 0.3636, "step": 72405 }, { "epoch": 0.97, "learning_rate": 1.1233667138728087e-07, "loss": 1.02, "step": 72410 }, { "epoch": 0.97, "learning_rate": 1.1183898705783291e-07, "loss": 0.7444, "step": 72415 }, { "epoch": 0.97, "learning_rate": 1.1134240514940886e-07, "loss": 0.8818, "step": 72420 }, { "epoch": 0.97, "learning_rate": 1.1084692568399945e-07, "loss": 1.2269, "step": 72425 }, { "epoch": 0.97, "learning_rate": 1.1035254868355383e-07, "loss": 1.0633, "step": 72430 }, { "epoch": 0.97, "learning_rate": 1.0985927416997388e-07, "loss": 1.2023, "step": 72435 }, { "epoch": 0.97, "learning_rate": 1.0936710216510603e-07, "loss": 0.8003, "step": 72440 }, { "epoch": 0.97, "learning_rate": 1.0887603269075231e-07, "loss": 0.7545, "step": 72445 }, { "epoch": 0.97, "learning_rate": 1.0838606576866195e-07, "loss": 0.6147, "step": 72450 }, { "epoch": 0.97, "learning_rate": 1.0789720142053983e-07, "loss": 0.5236, "step": 72455 }, { "epoch": 0.97, "learning_rate": 1.0740943966804362e-07, "loss": 0.4742, "step": 72460 }, { "epoch": 0.97, "learning_rate": 1.0692278053277272e-07, "loss": 0.1829, "step": 72465 }, { "epoch": 0.97, "learning_rate": 1.0643722403628764e-07, "loss": 0.3138, "step": 72470 }, { "epoch": 0.97, "learning_rate": 1.0595277020009342e-07, "loss": 0.4142, "step": 72475 }, { "epoch": 0.97, "learning_rate": 1.0546941904565344e-07, "loss": 0.9356, "step": 72480 }, { "epoch": 0.97, "learning_rate": 1.0498717059437279e-07, "loss": 0.7071, "step": 72485 }, { "epoch": 0.97, "learning_rate": 1.0450602486761219e-07, "loss": 0.8381, "step": 72490 }, { "epoch": 0.97, "learning_rate": 1.0402598188669066e-07, "loss": 0.7137, "step": 72495 }, { "epoch": 0.97, "learning_rate": 1.0354704167286622e-07, "loss": 0.3491, "step": 72500 }, { "epoch": 0.97, "learning_rate": 1.0306920424735523e-07, "loss": 0.7349, "step": 72505 }, { "epoch": 0.97, "learning_rate": 1.025924696313213e-07, "loss": 0.6143, "step": 72510 }, { "epoch": 0.97, "learning_rate": 1.0211683784588366e-07, "loss": 0.9327, "step": 72515 }, { "epoch": 0.97, "learning_rate": 1.0164230891211157e-07, "loss": 0.256, "step": 72520 }, { "epoch": 0.97, "learning_rate": 1.0116888285101877e-07, "loss": 1.3201, "step": 72525 }, { "epoch": 0.97, "learning_rate": 1.0069655968358294e-07, "loss": 0.5029, "step": 72530 }, { "epoch": 0.97, "learning_rate": 1.0022533943072343e-07, "loss": 0.9346, "step": 72535 }, { "epoch": 0.97, "learning_rate": 9.975522211330968e-08, "loss": 1.9227, "step": 72540 }, { "epoch": 0.97, "learning_rate": 9.928620775216668e-08, "loss": 1.0445, "step": 72545 }, { "epoch": 0.97, "learning_rate": 9.881829636807227e-08, "loss": 0.4526, "step": 72550 }, { "epoch": 0.97, "learning_rate": 9.835148798174876e-08, "loss": 0.5947, "step": 72555 }, { "epoch": 0.97, "learning_rate": 9.788578261387682e-08, "loss": 1.1063, "step": 72560 }, { "epoch": 0.97, "learning_rate": 9.742118028508163e-08, "loss": 0.4382, "step": 72565 }, { "epoch": 0.97, "learning_rate": 9.695768101594671e-08, "loss": 0.4664, "step": 72570 }, { "epoch": 0.97, "learning_rate": 9.64952848270001e-08, "loss": 0.8938, "step": 72575 }, { "epoch": 0.97, "learning_rate": 9.603399173872262e-08, "loss": 0.7541, "step": 72580 }, { "epoch": 0.97, "learning_rate": 9.557380177154795e-08, "loss": 0.6969, "step": 72585 }, { "epoch": 0.97, "learning_rate": 9.511471494586255e-08, "loss": 0.3877, "step": 72590 }, { "epoch": 0.97, "learning_rate": 9.465673128200014e-08, "loss": 0.4032, "step": 72595 }, { "epoch": 0.97, "learning_rate": 9.419985080024729e-08, "loss": 0.7201, "step": 72600 }, { "epoch": 0.97, "learning_rate": 9.374407352084058e-08, "loss": 1.1099, "step": 72605 }, { "epoch": 0.97, "learning_rate": 9.328939946396942e-08, "loss": 0.515, "step": 72610 }, { "epoch": 0.97, "learning_rate": 9.283582864977325e-08, "loss": 0.4177, "step": 72615 }, { "epoch": 0.97, "learning_rate": 9.238336109834434e-08, "loss": 0.5484, "step": 72620 }, { "epoch": 0.97, "learning_rate": 9.19319968297222e-08, "loss": 0.4701, "step": 72625 }, { "epoch": 0.97, "learning_rate": 9.148173586390473e-08, "loss": 0.8077, "step": 72630 }, { "epoch": 0.97, "learning_rate": 9.103257822082878e-08, "loss": 0.8653, "step": 72635 }, { "epoch": 0.97, "learning_rate": 9.058452392039507e-08, "loss": 1.1586, "step": 72640 }, { "epoch": 0.97, "learning_rate": 9.013757298245162e-08, "loss": 0.9605, "step": 72645 }, { "epoch": 0.97, "learning_rate": 8.969172542679095e-08, "loss": 0.5977, "step": 72650 }, { "epoch": 0.97, "learning_rate": 8.924698127316389e-08, "loss": 0.8383, "step": 72655 }, { "epoch": 0.97, "learning_rate": 8.880334054127137e-08, "loss": 1.447, "step": 72660 }, { "epoch": 0.97, "learning_rate": 8.836080325076713e-08, "loss": 1.1432, "step": 72665 }, { "epoch": 0.97, "learning_rate": 8.791936942124657e-08, "loss": 0.2876, "step": 72670 }, { "epoch": 0.97, "learning_rate": 8.747903907226907e-08, "loss": 0.474, "step": 72675 }, { "epoch": 0.97, "learning_rate": 8.703981222333568e-08, "loss": 0.4541, "step": 72680 }, { "epoch": 0.97, "learning_rate": 8.660168889390308e-08, "loss": 0.6084, "step": 72685 }, { "epoch": 0.97, "learning_rate": 8.616466910337794e-08, "loss": 0.4041, "step": 72690 }, { "epoch": 0.97, "learning_rate": 8.572875287111703e-08, "loss": 0.8169, "step": 72695 }, { "epoch": 0.97, "learning_rate": 8.529394021643267e-08, "loss": 0.7467, "step": 72700 }, { "epoch": 0.97, "learning_rate": 8.486023115857889e-08, "loss": 0.3626, "step": 72705 }, { "epoch": 0.97, "learning_rate": 8.442762571677365e-08, "loss": 1.1578, "step": 72710 }, { "epoch": 0.97, "learning_rate": 8.399612391017386e-08, "loss": 1.0219, "step": 72715 }, { "epoch": 0.97, "learning_rate": 8.356572575789479e-08, "loss": 0.4004, "step": 72720 }, { "epoch": 0.97, "learning_rate": 8.313643127900172e-08, "loss": 1.0204, "step": 72725 }, { "epoch": 0.97, "learning_rate": 8.270824049251002e-08, "loss": 0.6676, "step": 72730 }, { "epoch": 0.97, "learning_rate": 8.228115341738507e-08, "loss": 0.8616, "step": 72735 }, { "epoch": 0.97, "learning_rate": 8.185517007254784e-08, "loss": 0.511, "step": 72740 }, { "epoch": 0.97, "learning_rate": 8.143029047686379e-08, "loss": 0.4446, "step": 72745 }, { "epoch": 0.97, "learning_rate": 8.100651464915398e-08, "loss": 0.6628, "step": 72750 }, { "epoch": 0.97, "learning_rate": 8.058384260818952e-08, "loss": 0.8242, "step": 72755 }, { "epoch": 0.97, "learning_rate": 8.016227437269152e-08, "loss": 0.6481, "step": 72760 }, { "epoch": 0.97, "learning_rate": 7.974180996133673e-08, "loss": 0.2495, "step": 72765 }, { "epoch": 0.98, "learning_rate": 7.932244939274636e-08, "loss": 1.0019, "step": 72770 }, { "epoch": 0.98, "learning_rate": 7.890419268549998e-08, "loss": 0.2757, "step": 72775 }, { "epoch": 0.98, "learning_rate": 7.848703985811889e-08, "loss": 0.6577, "step": 72780 }, { "epoch": 0.98, "learning_rate": 7.807099092908277e-08, "loss": 0.6968, "step": 72785 }, { "epoch": 0.98, "learning_rate": 7.765604591682408e-08, "loss": 1.0827, "step": 72790 }, { "epoch": 0.98, "learning_rate": 7.7242204839717e-08, "loss": 0.9943, "step": 72795 }, { "epoch": 0.98, "learning_rate": 7.682946771609967e-08, "loss": 0.4209, "step": 72800 }, { "epoch": 0.98, "learning_rate": 7.641783456424634e-08, "loss": 0.4925, "step": 72805 }, { "epoch": 0.98, "learning_rate": 7.60073054023952e-08, "loss": 0.8518, "step": 72810 }, { "epoch": 0.98, "learning_rate": 7.559788024873172e-08, "loss": 1.2587, "step": 72815 }, { "epoch": 0.98, "learning_rate": 7.51895591213858e-08, "loss": 1.2594, "step": 72820 }, { "epoch": 0.98, "learning_rate": 7.478234203845136e-08, "loss": 0.9278, "step": 72825 }, { "epoch": 0.98, "learning_rate": 7.437622901795838e-08, "loss": 0.4611, "step": 72830 }, { "epoch": 0.98, "learning_rate": 7.397122007790081e-08, "loss": 0.7168, "step": 72835 }, { "epoch": 0.98, "learning_rate": 7.356731523621707e-08, "loss": 0.8483, "step": 72840 }, { "epoch": 0.98, "learning_rate": 7.316451451079842e-08, "loss": 0.5728, "step": 72845 }, { "epoch": 0.98, "learning_rate": 7.276281791948891e-08, "loss": 0.5739, "step": 72850 }, { "epoch": 0.98, "learning_rate": 7.236222548007709e-08, "loss": 0.2887, "step": 72855 }, { "epoch": 0.98, "learning_rate": 7.196273721030988e-08, "loss": 0.9927, "step": 72860 }, { "epoch": 0.98, "learning_rate": 7.156435312788423e-08, "loss": 0.7851, "step": 72865 }, { "epoch": 0.98, "learning_rate": 7.116707325044159e-08, "loss": 0.9354, "step": 72870 }, { "epoch": 0.98, "learning_rate": 7.077089759558452e-08, "loss": 0.9149, "step": 72875 }, { "epoch": 0.98, "learning_rate": 7.037582618086014e-08, "loss": 0.4737, "step": 72880 }, { "epoch": 0.98, "learning_rate": 6.998185902376552e-08, "loss": 0.8633, "step": 72885 }, { "epoch": 0.98, "learning_rate": 6.958899614175618e-08, "loss": 0.7302, "step": 72890 }, { "epoch": 0.98, "learning_rate": 6.919723755222929e-08, "loss": 0.9882, "step": 72895 }, { "epoch": 0.98, "learning_rate": 6.880658327254042e-08, "loss": 1.0626, "step": 72900 }, { "epoch": 0.98, "learning_rate": 6.841703331999516e-08, "loss": 0.6684, "step": 72905 }, { "epoch": 0.98, "learning_rate": 6.802858771184362e-08, "loss": 1.4889, "step": 72910 }, { "epoch": 0.98, "learning_rate": 6.764124646529702e-08, "loss": 0.6686, "step": 72915 }, { "epoch": 0.98, "learning_rate": 6.72550095975083e-08, "loss": 1.041, "step": 72920 }, { "epoch": 0.98, "learning_rate": 6.686987712558879e-08, "loss": 0.5385, "step": 72925 }, { "epoch": 0.98, "learning_rate": 6.648584906659705e-08, "loss": 0.636, "step": 72930 }, { "epoch": 0.98, "learning_rate": 6.610292543754726e-08, "loss": 0.493, "step": 72935 }, { "epoch": 0.98, "learning_rate": 6.572110625539251e-08, "loss": 0.4316, "step": 72940 }, { "epoch": 0.98, "learning_rate": 6.534039153705263e-08, "loss": 0.1851, "step": 72945 }, { "epoch": 0.98, "learning_rate": 6.49607812993891e-08, "loss": 1.4758, "step": 72950 }, { "epoch": 0.98, "learning_rate": 6.458227555921903e-08, "loss": 0.9643, "step": 72955 }, { "epoch": 0.98, "learning_rate": 6.420487433330403e-08, "loss": 0.2704, "step": 72960 }, { "epoch": 0.98, "learning_rate": 6.382857763836125e-08, "loss": 0.4675, "step": 72965 }, { "epoch": 0.98, "learning_rate": 6.34533854910635e-08, "loss": 0.5415, "step": 72970 }, { "epoch": 0.98, "learning_rate": 6.307929790802803e-08, "loss": 0.2077, "step": 72975 }, { "epoch": 0.98, "learning_rate": 6.270631490582212e-08, "loss": 0.8254, "step": 72980 }, { "epoch": 0.98, "learning_rate": 6.23344365009687e-08, "loss": 0.1899, "step": 72985 }, { "epoch": 0.98, "learning_rate": 6.19636627099407e-08, "loss": 2.1039, "step": 72990 }, { "epoch": 0.98, "learning_rate": 6.159399354916384e-08, "loss": 0.4079, "step": 72995 }, { "epoch": 0.98, "learning_rate": 6.122542903500839e-08, "loss": 0.5616, "step": 73000 }, { "epoch": 0.98, "learning_rate": 6.085796918380016e-08, "loss": 0.8467, "step": 73005 }, { "epoch": 0.98, "learning_rate": 6.049161401182057e-08, "loss": 0.8673, "step": 73010 }, { "epoch": 0.98, "learning_rate": 6.012636353529278e-08, "loss": 0.8275, "step": 73015 }, { "epoch": 0.98, "learning_rate": 5.976221777039548e-08, "loss": 0.2237, "step": 73020 }, { "epoch": 0.98, "learning_rate": 5.9399176733260234e-08, "loss": 1.1356, "step": 73025 }, { "epoch": 0.98, "learning_rate": 5.903724043996861e-08, "loss": 1.6227, "step": 73030 }, { "epoch": 0.98, "learning_rate": 5.8676408906549466e-08, "loss": 0.9947, "step": 73035 }, { "epoch": 0.98, "learning_rate": 5.831668214899e-08, "loss": 0.7859, "step": 73040 }, { "epoch": 0.98, "learning_rate": 5.7958060183221916e-08, "loss": 0.3726, "step": 73045 }, { "epoch": 0.98, "learning_rate": 5.760054302512974e-08, "loss": 1.7768, "step": 73050 }, { "epoch": 0.98, "learning_rate": 5.724413069055079e-08, "loss": 0.3549, "step": 73055 }, { "epoch": 0.98, "learning_rate": 5.688882319527244e-08, "loss": 0.3401, "step": 73060 }, { "epoch": 0.98, "learning_rate": 5.653462055503489e-08, "loss": 0.6319, "step": 73065 }, { "epoch": 0.98, "learning_rate": 5.61815227855228e-08, "loss": 0.8212, "step": 73070 }, { "epoch": 0.98, "learning_rate": 5.582952990237922e-08, "loss": 0.3088, "step": 73075 }, { "epoch": 0.98, "learning_rate": 5.5478641921197225e-08, "loss": 0.6847, "step": 73080 }, { "epoch": 0.98, "learning_rate": 5.5128858857517175e-08, "loss": 0.3291, "step": 73085 }, { "epoch": 0.98, "learning_rate": 5.478018072683222e-08, "loss": 0.67, "step": 73090 }, { "epoch": 0.98, "learning_rate": 5.4432607544588344e-08, "loss": 1.5504, "step": 73095 }, { "epoch": 0.98, "learning_rate": 5.408613932618156e-08, "loss": 0.4574, "step": 73100 }, { "epoch": 0.98, "learning_rate": 5.374077608696071e-08, "loss": 0.6275, "step": 73105 }, { "epoch": 0.98, "learning_rate": 5.3396517842219107e-08, "loss": 0.1709, "step": 73110 }, { "epoch": 0.98, "learning_rate": 5.305336460720844e-08, "loss": 1.2892, "step": 73115 }, { "epoch": 0.98, "learning_rate": 5.2711316397127674e-08, "loss": 0.3443, "step": 73120 }, { "epoch": 0.98, "learning_rate": 5.2370373227128564e-08, "loss": 0.6299, "step": 73125 }, { "epoch": 0.98, "learning_rate": 5.203053511231293e-08, "loss": 1.1099, "step": 73130 }, { "epoch": 0.98, "learning_rate": 5.1691802067732606e-08, "loss": 1.0912, "step": 73135 }, { "epoch": 0.98, "learning_rate": 5.1354174108395045e-08, "loss": 0.6021, "step": 73140 }, { "epoch": 0.98, "learning_rate": 5.1017651249252175e-08, "loss": 0.6692, "step": 73145 }, { "epoch": 0.98, "learning_rate": 5.0682233505211506e-08, "loss": 0.2715, "step": 73150 }, { "epoch": 0.98, "learning_rate": 5.0347920891130604e-08, "loss": 0.562, "step": 73155 }, { "epoch": 0.98, "learning_rate": 5.0014713421817073e-08, "loss": 1.8389, "step": 73160 }, { "epoch": 0.98, "learning_rate": 4.968261111203132e-08, "loss": 0.7316, "step": 73165 }, { "epoch": 0.98, "learning_rate": 4.9351613976483805e-08, "loss": 0.1045, "step": 73170 }, { "epoch": 0.98, "learning_rate": 4.902172202983501e-08, "loss": 0.8547, "step": 73175 }, { "epoch": 0.98, "learning_rate": 4.869293528669827e-08, "loss": 0.5098, "step": 73180 }, { "epoch": 0.98, "learning_rate": 4.836525376163692e-08, "loss": 0.5902, "step": 73185 }, { "epoch": 0.98, "learning_rate": 4.8038677469164354e-08, "loss": 0.5375, "step": 73190 }, { "epoch": 0.98, "learning_rate": 4.7713206423749545e-08, "loss": 0.6441, "step": 73195 }, { "epoch": 0.98, "learning_rate": 4.7388840639805976e-08, "loss": 0.489, "step": 73200 }, { "epoch": 0.98, "learning_rate": 4.7065580131705475e-08, "loss": 0.5531, "step": 73205 }, { "epoch": 0.98, "learning_rate": 4.67434249137616e-08, "loss": 1.4122, "step": 73210 }, { "epoch": 0.98, "learning_rate": 4.642237500024904e-08, "loss": 0.6061, "step": 73215 }, { "epoch": 0.98, "learning_rate": 4.61024304053842e-08, "loss": 0.767, "step": 73220 }, { "epoch": 0.98, "learning_rate": 4.578359114334185e-08, "loss": 0.1292, "step": 73225 }, { "epoch": 0.98, "learning_rate": 4.5465857228244035e-08, "loss": 1.0154, "step": 73230 }, { "epoch": 0.98, "learning_rate": 4.51492286741656e-08, "loss": 0.8082, "step": 73235 }, { "epoch": 0.98, "learning_rate": 4.483370549513144e-08, "loss": 0.5776, "step": 73240 }, { "epoch": 0.98, "learning_rate": 4.4519287705116487e-08, "loss": 0.1951, "step": 73245 }, { "epoch": 0.98, "learning_rate": 4.4205975318051264e-08, "loss": 0.9097, "step": 73250 }, { "epoch": 0.98, "learning_rate": 4.389376834781078e-08, "loss": 0.9496, "step": 73255 }, { "epoch": 0.98, "learning_rate": 4.358266680822287e-08, "loss": 0.6843, "step": 73260 }, { "epoch": 0.98, "learning_rate": 4.327267071307095e-08, "loss": 0.5345, "step": 73265 }, { "epoch": 0.98, "learning_rate": 4.2963780076082924e-08, "loss": 0.7698, "step": 73270 }, { "epoch": 0.98, "learning_rate": 4.2717463505570484e-08, "loss": 0.6985, "step": 73275 }, { "epoch": 0.98, "learning_rate": 4.2410562727729364e-08, "loss": 1.0455, "step": 73280 }, { "epoch": 0.98, "learning_rate": 4.210476744624381e-08, "loss": 0.8116, "step": 73285 }, { "epoch": 0.98, "learning_rate": 4.180007767465299e-08, "loss": 0.5852, "step": 73290 }, { "epoch": 0.98, "learning_rate": 4.1496493426460004e-08, "loss": 0.5083, "step": 73295 }, { "epoch": 0.98, "learning_rate": 4.119401471510687e-08, "loss": 0.2646, "step": 73300 }, { "epoch": 0.98, "learning_rate": 4.0892641553993974e-08, "loss": 0.3345, "step": 73305 }, { "epoch": 0.98, "learning_rate": 4.0592373956471755e-08, "loss": 0.3338, "step": 73310 }, { "epoch": 0.98, "learning_rate": 4.0293211935837906e-08, "loss": 0.7534, "step": 73315 }, { "epoch": 0.98, "learning_rate": 3.9995155505345714e-08, "loss": 0.5814, "step": 73320 }, { "epoch": 0.98, "learning_rate": 3.9698204678198517e-08, "loss": 0.7578, "step": 73325 }, { "epoch": 0.98, "learning_rate": 3.940235946754689e-08, "loss": 0.89, "step": 73330 }, { "epoch": 0.98, "learning_rate": 3.910761988649703e-08, "loss": 0.3439, "step": 73335 }, { "epoch": 0.98, "learning_rate": 3.8813985948105145e-08, "loss": 0.1725, "step": 73340 }, { "epoch": 0.98, "learning_rate": 3.8521457665374736e-08, "loss": 1.2246, "step": 73345 }, { "epoch": 0.98, "learning_rate": 3.8230035051267655e-08, "loss": 1.0, "step": 73350 }, { "epoch": 0.98, "learning_rate": 3.793971811869024e-08, "loss": 0.9636, "step": 73355 }, { "epoch": 0.98, "learning_rate": 3.765050688049887e-08, "loss": 0.7392, "step": 73360 }, { "epoch": 0.98, "learning_rate": 3.736240134951108e-08, "loss": 0.8454, "step": 73365 }, { "epoch": 0.98, "learning_rate": 3.707540153848332e-08, "loss": 1.0883, "step": 73370 }, { "epoch": 0.98, "learning_rate": 3.678950746013044e-08, "loss": 0.8158, "step": 73375 }, { "epoch": 0.98, "learning_rate": 3.650471912711173e-08, "loss": 0.8461, "step": 73380 }, { "epoch": 0.98, "learning_rate": 3.622103655205045e-08, "loss": 1.0899, "step": 73385 }, { "epoch": 0.98, "learning_rate": 3.593845974750598e-08, "loss": 0.2724, "step": 73390 }, { "epoch": 0.98, "learning_rate": 3.5656988725993325e-08, "loss": 1.3312, "step": 73395 }, { "epoch": 0.98, "learning_rate": 3.537662349998583e-08, "loss": 0.2028, "step": 73400 }, { "epoch": 0.98, "learning_rate": 3.509736408190134e-08, "loss": 0.4412, "step": 73405 }, { "epoch": 0.98, "learning_rate": 3.481921048410775e-08, "loss": 0.4937, "step": 73410 }, { "epoch": 0.98, "learning_rate": 3.4542162718922964e-08, "loss": 0.8067, "step": 73415 }, { "epoch": 0.98, "learning_rate": 3.426622079862607e-08, "loss": 0.6641, "step": 73420 }, { "epoch": 0.98, "learning_rate": 3.3991384735432286e-08, "loss": 0.4969, "step": 73425 }, { "epoch": 0.98, "learning_rate": 3.371765454152076e-08, "loss": 1.1741, "step": 73430 }, { "epoch": 0.98, "learning_rate": 3.3445030229015126e-08, "loss": 0.5509, "step": 73435 }, { "epoch": 0.98, "learning_rate": 3.317351180999184e-08, "loss": 0.4828, "step": 73440 }, { "epoch": 0.98, "learning_rate": 3.2903099296474616e-08, "loss": 0.3797, "step": 73445 }, { "epoch": 0.98, "learning_rate": 3.263379270044553e-08, "loss": 0.9841, "step": 73450 }, { "epoch": 0.98, "learning_rate": 3.236559203383116e-08, "loss": 0.6761, "step": 73455 }, { "epoch": 0.98, "learning_rate": 3.209849730851089e-08, "loss": 0.9424, "step": 73460 }, { "epoch": 0.98, "learning_rate": 3.1832508536319696e-08, "loss": 0.7272, "step": 73465 }, { "epoch": 0.98, "learning_rate": 3.156762572903427e-08, "loss": 0.6681, "step": 73470 }, { "epoch": 0.98, "learning_rate": 3.1303848898389665e-08, "loss": 1.0402, "step": 73475 }, { "epoch": 0.98, "learning_rate": 3.1041178056070984e-08, "loss": 1.5129, "step": 73480 }, { "epoch": 0.98, "learning_rate": 3.077961321371059e-08, "loss": 0.5338, "step": 73485 }, { "epoch": 0.98, "learning_rate": 3.051915438289643e-08, "loss": 0.3069, "step": 73490 }, { "epoch": 0.98, "learning_rate": 3.02598015751665e-08, "loss": 1.058, "step": 73495 }, { "epoch": 0.98, "learning_rate": 3.0001554802008835e-08, "loss": 0.5871, "step": 73500 }, { "epoch": 0.98, "learning_rate": 2.9744414074858728e-08, "loss": 0.7273, "step": 73505 }, { "epoch": 0.98, "learning_rate": 2.9488379405109846e-08, "loss": 1.3714, "step": 73510 }, { "epoch": 0.98, "learning_rate": 2.9233450804103113e-08, "loss": 0.8375, "step": 73515 }, { "epoch": 0.99, "learning_rate": 2.89796282831295e-08, "loss": 0.4742, "step": 73520 }, { "epoch": 0.99, "learning_rate": 2.8726911853432792e-08, "loss": 0.8759, "step": 73525 }, { "epoch": 0.99, "learning_rate": 2.8475301526204033e-08, "loss": 0.7454, "step": 73530 }, { "epoch": 0.99, "learning_rate": 2.8224797312592643e-08, "loss": 1.0816, "step": 73535 }, { "epoch": 0.99, "learning_rate": 2.7975399223692523e-08, "loss": 0.9917, "step": 73540 }, { "epoch": 0.99, "learning_rate": 2.7727107270553164e-08, "loss": 1.0007, "step": 73545 }, { "epoch": 0.99, "learning_rate": 2.747992146416578e-08, "loss": 0.4784, "step": 73550 }, { "epoch": 0.99, "learning_rate": 2.723384181548827e-08, "loss": 0.8588, "step": 73555 }, { "epoch": 0.99, "learning_rate": 2.6988868335414696e-08, "loss": 1.2126, "step": 73560 }, { "epoch": 0.99, "learning_rate": 2.6745001034800265e-08, "loss": 0.7827, "step": 73565 }, { "epoch": 0.99, "learning_rate": 2.6502239924444673e-08, "loss": 0.2716, "step": 73570 }, { "epoch": 0.99, "learning_rate": 2.6260585015100426e-08, "loss": 0.8385, "step": 73575 }, { "epoch": 0.99, "learning_rate": 2.602003631747285e-08, "loss": 0.559, "step": 73580 }, { "epoch": 0.99, "learning_rate": 2.578059384221454e-08, "loss": 0.6641, "step": 73585 }, { "epoch": 0.99, "learning_rate": 2.5542257599936447e-08, "loss": 0.5717, "step": 73590 }, { "epoch": 0.99, "learning_rate": 2.530502760119402e-08, "loss": 0.507, "step": 73595 }, { "epoch": 0.99, "learning_rate": 2.5068903856492743e-08, "loss": 1.0875, "step": 73600 }, { "epoch": 0.99, "learning_rate": 2.483388637629369e-08, "loss": 0.4984, "step": 73605 }, { "epoch": 0.99, "learning_rate": 2.4599975171005206e-08, "loss": 0.4648, "step": 73610 }, { "epoch": 0.99, "learning_rate": 2.4367170250991222e-08, "loss": 0.5983, "step": 73615 }, { "epoch": 0.99, "learning_rate": 2.4135471626562932e-08, "loss": 1.0808, "step": 73620 }, { "epoch": 0.99, "learning_rate": 2.3904879307981576e-08, "loss": 1.1824, "step": 73625 }, { "epoch": 0.99, "learning_rate": 2.3675393305463978e-08, "loss": 1.1731, "step": 73630 }, { "epoch": 0.99, "learning_rate": 2.3447013629171453e-08, "loss": 1.0789, "step": 73635 }, { "epoch": 0.99, "learning_rate": 2.3219740289226466e-08, "loss": 0.3531, "step": 73640 }, { "epoch": 0.99, "learning_rate": 2.299357329568763e-08, "loss": 0.0999, "step": 73645 }, { "epoch": 0.99, "learning_rate": 2.2768512658580266e-08, "loss": 0.1931, "step": 73650 }, { "epoch": 0.99, "learning_rate": 2.2544558387871394e-08, "loss": 0.8665, "step": 73655 }, { "epoch": 0.99, "learning_rate": 2.2321710493478086e-08, "loss": 0.7297, "step": 73660 }, { "epoch": 0.99, "learning_rate": 2.2099968985275778e-08, "loss": 0.4402, "step": 73665 }, { "epoch": 0.99, "learning_rate": 2.187933387308161e-08, "loss": 1.4512, "step": 73670 }, { "epoch": 0.99, "learning_rate": 2.1659805166673873e-08, "loss": 0.7376, "step": 73675 }, { "epoch": 0.99, "learning_rate": 2.1441382875772576e-08, "loss": 0.9126, "step": 73680 }, { "epoch": 0.99, "learning_rate": 2.1224067010053305e-08, "loss": 0.6235, "step": 73685 }, { "epoch": 0.99, "learning_rate": 2.1007857579144473e-08, "loss": 0.246, "step": 73690 }, { "epoch": 0.99, "learning_rate": 2.0792754592621755e-08, "loss": 1.4013, "step": 73695 }, { "epoch": 0.99, "learning_rate": 2.0578758060013635e-08, "loss": 0.4641, "step": 73700 }, { "epoch": 0.99, "learning_rate": 2.036586799079587e-08, "loss": 0.8297, "step": 73705 }, { "epoch": 0.99, "learning_rate": 2.0154084394402585e-08, "loss": 0.9362, "step": 73710 }, { "epoch": 0.99, "learning_rate": 1.994340728021238e-08, "loss": 1.0261, "step": 73715 }, { "epoch": 0.99, "learning_rate": 1.9733836657559456e-08, "loss": 1.28, "step": 73720 }, { "epoch": 0.99, "learning_rate": 1.9525372535725285e-08, "loss": 0.6297, "step": 73725 }, { "epoch": 0.99, "learning_rate": 1.9318014923941364e-08, "loss": 0.3879, "step": 73730 }, { "epoch": 0.99, "learning_rate": 1.9111763831397566e-08, "loss": 0.8506, "step": 73735 }, { "epoch": 0.99, "learning_rate": 1.8906619267225477e-08, "loss": 0.6925, "step": 73740 }, { "epoch": 0.99, "learning_rate": 1.8702581240512273e-08, "loss": 1.279, "step": 73745 }, { "epoch": 0.99, "learning_rate": 1.8499649760300718e-08, "loss": 0.3328, "step": 73750 }, { "epoch": 0.99, "learning_rate": 1.8297824835575294e-08, "loss": 0.2438, "step": 73755 }, { "epoch": 0.99, "learning_rate": 1.809710647527607e-08, "loss": 1.1744, "step": 73760 }, { "epoch": 0.99, "learning_rate": 1.789749468829316e-08, "loss": 1.0578, "step": 73765 }, { "epoch": 0.99, "learning_rate": 1.7698989483469487e-08, "loss": 0.885, "step": 73770 }, { "epoch": 0.99, "learning_rate": 1.7501590869600792e-08, "loss": 1.0926, "step": 73775 }, { "epoch": 0.99, "learning_rate": 1.730529885542731e-08, "loss": 0.5553, "step": 73780 }, { "epoch": 0.99, "learning_rate": 1.711011344964486e-08, "loss": 1.2854, "step": 73785 }, { "epoch": 0.99, "learning_rate": 1.691603466089653e-08, "loss": 0.6085, "step": 73790 }, { "epoch": 0.99, "learning_rate": 1.672306249778377e-08, "loss": 0.7313, "step": 73795 }, { "epoch": 0.99, "learning_rate": 1.653119696884975e-08, "loss": 0.4583, "step": 73800 }, { "epoch": 0.99, "learning_rate": 1.6340438082598775e-08, "loss": 0.7839, "step": 73805 }, { "epoch": 0.99, "learning_rate": 1.6150785847474094e-08, "loss": 0.5297, "step": 73810 }, { "epoch": 0.99, "learning_rate": 1.596224027188009e-08, "loss": 0.5416, "step": 73815 }, { "epoch": 0.99, "learning_rate": 1.5774801364168422e-08, "loss": 0.8042, "step": 73820 }, { "epoch": 0.99, "learning_rate": 1.558846913264078e-08, "loss": 1.1157, "step": 73825 }, { "epoch": 0.99, "learning_rate": 1.5403243585548897e-08, "loss": 1.4392, "step": 73830 }, { "epoch": 0.99, "learning_rate": 1.5219124731102875e-08, "loss": 0.503, "step": 73835 }, { "epoch": 0.99, "learning_rate": 1.5036112577451744e-08, "loss": 1.032, "step": 73840 }, { "epoch": 0.99, "learning_rate": 1.4854207132705689e-08, "loss": 0.9817, "step": 73845 }, { "epoch": 0.99, "learning_rate": 1.4673408404922151e-08, "loss": 0.9921, "step": 73850 }, { "epoch": 0.99, "learning_rate": 1.4493716402108615e-08, "loss": 0.6542, "step": 73855 }, { "epoch": 0.99, "learning_rate": 1.4315131132225378e-08, "loss": 0.1415, "step": 73860 }, { "epoch": 0.99, "learning_rate": 1.4137652603180007e-08, "loss": 0.86, "step": 73865 }, { "epoch": 0.99, "learning_rate": 1.3961280822838429e-08, "loss": 1.0073, "step": 73870 }, { "epoch": 0.99, "learning_rate": 1.3786015799011064e-08, "loss": 0.6099, "step": 73875 }, { "epoch": 0.99, "learning_rate": 1.3611857539461148e-08, "loss": 0.5478, "step": 73880 }, { "epoch": 0.99, "learning_rate": 1.3438806051901954e-08, "loss": 0.7142, "step": 73885 }, { "epoch": 0.99, "learning_rate": 1.3266861343999571e-08, "loss": 0.8623, "step": 73890 }, { "epoch": 0.99, "learning_rate": 1.3096023423372906e-08, "loss": 0.4105, "step": 73895 }, { "epoch": 0.99, "learning_rate": 1.2926292297585352e-08, "loss": 0.5829, "step": 73900 }, { "epoch": 0.99, "learning_rate": 1.2757667974155896e-08, "loss": 0.6826, "step": 73905 }, { "epoch": 0.99, "learning_rate": 1.2590150460556338e-08, "loss": 0.7968, "step": 73910 }, { "epoch": 0.99, "learning_rate": 1.2423739764202969e-08, "loss": 1.5232, "step": 73915 }, { "epoch": 0.99, "learning_rate": 1.2258435892470444e-08, "loss": 0.5394, "step": 73920 }, { "epoch": 0.99, "learning_rate": 1.2094238852677908e-08, "loss": 0.7591, "step": 73925 }, { "epoch": 0.99, "learning_rate": 1.1931148652100099e-08, "loss": 0.4973, "step": 73930 }, { "epoch": 0.99, "learning_rate": 1.1769165297961793e-08, "loss": 0.9486, "step": 73935 }, { "epoch": 0.99, "learning_rate": 1.1608288797437805e-08, "loss": 0.3972, "step": 73940 }, { "epoch": 0.99, "learning_rate": 1.1448519157652993e-08, "loss": 0.8549, "step": 73945 }, { "epoch": 0.99, "learning_rate": 1.1289856385685027e-08, "loss": 0.4564, "step": 73950 }, { "epoch": 0.99, "learning_rate": 1.113230048856162e-08, "loss": 0.5533, "step": 73955 }, { "epoch": 0.99, "learning_rate": 1.0975851473263298e-08, "loss": 0.6728, "step": 73960 }, { "epoch": 0.99, "learning_rate": 1.0820509346717855e-08, "loss": 1.1583, "step": 73965 }, { "epoch": 0.99, "learning_rate": 1.0666274115805897e-08, "loss": 0.2624, "step": 73970 }, { "epoch": 0.99, "learning_rate": 1.0513145787360845e-08, "loss": 0.3781, "step": 73975 }, { "epoch": 0.99, "learning_rate": 1.0361124368166163e-08, "loss": 1.3405, "step": 73980 }, { "epoch": 0.99, "learning_rate": 1.021020986495258e-08, "loss": 0.2292, "step": 73985 }, { "epoch": 0.99, "learning_rate": 1.0060402284409187e-08, "loss": 0.2714, "step": 73990 }, { "epoch": 0.99, "learning_rate": 9.911701633166792e-09, "loss": 0.3937, "step": 73995 }, { "epoch": 0.99, "learning_rate": 9.764107917814569e-09, "loss": 0.5015, "step": 74000 }, { "epoch": 0.99, "learning_rate": 9.617621144891731e-09, "loss": 0.724, "step": 74005 }, { "epoch": 0.99, "learning_rate": 9.472241320884757e-09, "loss": 0.542, "step": 74010 }, { "epoch": 0.99, "learning_rate": 9.327968452232938e-09, "loss": 1.0568, "step": 74015 }, { "epoch": 0.99, "learning_rate": 9.184802545328387e-09, "loss": 0.7496, "step": 74020 }, { "epoch": 0.99, "learning_rate": 9.042743606513248e-09, "loss": 1.0492, "step": 74025 }, { "epoch": 0.99, "learning_rate": 8.90179164207694e-09, "loss": 0.8681, "step": 74030 }, { "epoch": 0.99, "learning_rate": 8.76194665826724e-09, "loss": 1.5363, "step": 74035 }, { "epoch": 0.99, "learning_rate": 8.623208661273641e-09, "loss": 0.4581, "step": 74040 }, { "epoch": 0.99, "learning_rate": 8.485577657244004e-09, "loss": 0.1824, "step": 74045 }, { "epoch": 0.99, "learning_rate": 8.349053652273454e-09, "loss": 0.567, "step": 74050 }, { "epoch": 0.99, "learning_rate": 8.213636652412705e-09, "loss": 0.4742, "step": 74055 }, { "epoch": 0.99, "learning_rate": 8.07932666365696e-09, "loss": 1.2901, "step": 74060 }, { "epoch": 0.99, "learning_rate": 7.946123691957019e-09, "loss": 0.5239, "step": 74065 }, { "epoch": 0.99, "learning_rate": 7.814027743213714e-09, "loss": 0.2164, "step": 74070 }, { "epoch": 0.99, "learning_rate": 7.683038823275146e-09, "loss": 0.6542, "step": 74075 }, { "epoch": 0.99, "learning_rate": 7.553156937945005e-09, "loss": 0.6961, "step": 74080 }, { "epoch": 0.99, "learning_rate": 7.4243820929770226e-09, "loss": 0.2837, "step": 74085 }, { "epoch": 0.99, "learning_rate": 7.296714294077745e-09, "loss": 1.0477, "step": 74090 }, { "epoch": 0.99, "learning_rate": 7.170153546895431e-09, "loss": 0.2997, "step": 74095 }, { "epoch": 0.99, "learning_rate": 7.044699857042258e-09, "loss": 1.1948, "step": 74100 }, { "epoch": 0.99, "learning_rate": 6.920353230072118e-09, "loss": 0.8977, "step": 74105 }, { "epoch": 0.99, "learning_rate": 6.797113671494493e-09, "loss": 0.8375, "step": 74110 }, { "epoch": 0.99, "learning_rate": 6.674981186768903e-09, "loss": 0.9171, "step": 74115 }, { "epoch": 0.99, "learning_rate": 6.553955781302134e-09, "loss": 1.0381, "step": 74120 }, { "epoch": 0.99, "learning_rate": 6.434037460456566e-09, "loss": 0.5913, "step": 74125 }, { "epoch": 0.99, "learning_rate": 6.315226229544613e-09, "loss": 0.6194, "step": 74130 }, { "epoch": 0.99, "learning_rate": 6.197522093828734e-09, "loss": 0.7555, "step": 74135 }, { "epoch": 0.99, "learning_rate": 6.0809250585242005e-09, "loss": 0.6404, "step": 74140 }, { "epoch": 0.99, "learning_rate": 5.9654351287935505e-09, "loss": 0.7858, "step": 74145 }, { "epoch": 0.99, "learning_rate": 5.851052309752137e-09, "loss": 0.9636, "step": 74150 }, { "epoch": 0.99, "learning_rate": 5.73777660646535e-09, "loss": 0.7512, "step": 74155 }, { "epoch": 0.99, "learning_rate": 5.625608023954176e-09, "loss": 1.4769, "step": 74160 }, { "epoch": 0.99, "learning_rate": 5.514546567186862e-09, "loss": 0.5363, "step": 74165 }, { "epoch": 0.99, "learning_rate": 5.404592241081696e-09, "loss": 0.8475, "step": 74170 }, { "epoch": 0.99, "learning_rate": 5.295745050507006e-09, "loss": 0.3128, "step": 74175 }, { "epoch": 0.99, "learning_rate": 5.1880050002894866e-09, "loss": 0.998, "step": 74180 }, { "epoch": 0.99, "learning_rate": 5.081372095194769e-09, "loss": 0.6477, "step": 74185 }, { "epoch": 0.99, "learning_rate": 4.975846339952406e-09, "loss": 0.7823, "step": 74190 }, { "epoch": 0.99, "learning_rate": 4.871427739230883e-09, "loss": 0.7833, "step": 74195 }, { "epoch": 0.99, "learning_rate": 4.768116297659831e-09, "loss": 0.6539, "step": 74200 }, { "epoch": 0.99, "learning_rate": 4.665912019816143e-09, "loss": 0.6037, "step": 74205 }, { "epoch": 0.99, "learning_rate": 4.564814910221205e-09, "loss": 0.3305, "step": 74210 }, { "epoch": 0.99, "learning_rate": 4.464824973360315e-09, "loss": 0.6335, "step": 74215 }, { "epoch": 0.99, "learning_rate": 4.3659422136549385e-09, "loss": 0.4478, "step": 74220 }, { "epoch": 0.99, "learning_rate": 4.2681666354932314e-09, "loss": 1.2464, "step": 74225 }, { "epoch": 0.99, "learning_rate": 4.171498243199512e-09, "loss": 0.6807, "step": 74230 }, { "epoch": 0.99, "learning_rate": 4.0759370410592415e-09, "loss": 0.5822, "step": 74235 }, { "epoch": 0.99, "learning_rate": 3.981483033302369e-09, "loss": 0.6848, "step": 74240 }, { "epoch": 0.99, "learning_rate": 3.888136224117211e-09, "loss": 0.432, "step": 74245 }, { "epoch": 0.99, "learning_rate": 3.795896617633798e-09, "loss": 1.0675, "step": 74250 }, { "epoch": 0.99, "learning_rate": 3.7047642179433016e-09, "loss": 0.5065, "step": 74255 }, { "epoch": 0.99, "learning_rate": 3.614739029075831e-09, "loss": 0.8877, "step": 74260 }, { "epoch": 1.0, "learning_rate": 3.525821055022638e-09, "loss": 0.4267, "step": 74265 }, { "epoch": 1.0, "learning_rate": 3.438010299725014e-09, "loss": 1.4432, "step": 74270 }, { "epoch": 1.0, "learning_rate": 3.3513067670659647e-09, "loss": 0.6094, "step": 74275 }, { "epoch": 1.0, "learning_rate": 3.2657104608924128e-09, "loss": 0.6607, "step": 74280 }, { "epoch": 1.0, "learning_rate": 3.181221384992994e-09, "loss": 1.4114, "step": 74285 }, { "epoch": 1.0, "learning_rate": 3.09783954310916e-09, "loss": 0.5037, "step": 74290 }, { "epoch": 1.0, "learning_rate": 3.0155649389351782e-09, "loss": 0.5201, "step": 74295 }, { "epoch": 1.0, "learning_rate": 2.934397576118131e-09, "loss": 0.5909, "step": 74300 }, { "epoch": 1.0, "learning_rate": 2.8543374582495896e-09, "loss": 0.6924, "step": 74305 }, { "epoch": 1.0, "learning_rate": 2.7753845888767172e-09, "loss": 0.4221, "step": 74310 }, { "epoch": 1.0, "learning_rate": 2.697538971496716e-09, "loss": 0.5336, "step": 74315 }, { "epoch": 1.0, "learning_rate": 2.620800609559604e-09, "loss": 0.9454, "step": 74320 }, { "epoch": 1.0, "learning_rate": 2.545169506459888e-09, "loss": 1.0693, "step": 74325 }, { "epoch": 1.0, "learning_rate": 2.470645665553217e-09, "loss": 0.5296, "step": 74330 }, { "epoch": 1.0, "learning_rate": 2.3972290901397297e-09, "loss": 0.6045, "step": 74335 }, { "epoch": 1.0, "learning_rate": 2.324919783466828e-09, "loss": 0.7893, "step": 74340 }, { "epoch": 1.0, "learning_rate": 2.253717748743056e-09, "loss": 1.31, "step": 74345 }, { "epoch": 1.0, "learning_rate": 2.183622989118672e-09, "loss": 0.8016, "step": 74350 }, { "epoch": 1.0, "learning_rate": 2.1146355076995252e-09, "loss": 1.129, "step": 74355 }, { "epoch": 1.0, "learning_rate": 2.0467553075415035e-09, "loss": 0.3735, "step": 74360 }, { "epoch": 1.0, "learning_rate": 1.979982391650537e-09, "loss": 1.2997, "step": 74365 }, { "epoch": 1.0, "learning_rate": 1.914316762988144e-09, "loss": 1.3051, "step": 74370 }, { "epoch": 1.0, "learning_rate": 1.8497584244575595e-09, "loss": 0.9906, "step": 74375 }, { "epoch": 1.0, "learning_rate": 1.7863073789203822e-09, "loss": 0.8898, "step": 74380 }, { "epoch": 1.0, "learning_rate": 1.7239636291882523e-09, "loss": 0.6683, "step": 74385 }, { "epoch": 1.0, "learning_rate": 1.6627271780228493e-09, "loss": 0.4545, "step": 74390 }, { "epoch": 1.0, "learning_rate": 1.6025980281358932e-09, "loss": 0.5094, "step": 74395 }, { "epoch": 1.0, "learning_rate": 1.5435761821919193e-09, "loss": 0.5993, "step": 74400 }, { "epoch": 1.0, "learning_rate": 1.485661642802727e-09, "loss": 0.2896, "step": 74405 }, { "epoch": 1.0, "learning_rate": 1.4288544125357074e-09, "loss": 0.8433, "step": 74410 }, { "epoch": 1.0, "learning_rate": 1.3731544939055152e-09, "loss": 0.8087, "step": 74415 }, { "epoch": 1.0, "learning_rate": 1.3185618893796214e-09, "loss": 0.3559, "step": 74420 }, { "epoch": 1.0, "learning_rate": 1.2650766013783121e-09, "loss": 0.8583, "step": 74425 }, { "epoch": 1.0, "learning_rate": 1.212698632269138e-09, "loss": 0.5313, "step": 74430 }, { "epoch": 1.0, "learning_rate": 1.1614279843724652e-09, "loss": 0.3742, "step": 74435 }, { "epoch": 1.0, "learning_rate": 1.1112646599586995e-09, "loss": 0.5794, "step": 74440 }, { "epoch": 1.0, "learning_rate": 1.062208661251063e-09, "loss": 0.2679, "step": 74445 }, { "epoch": 1.0, "learning_rate": 1.0142599904228168e-09, "loss": 0.778, "step": 74450 }, { "epoch": 1.0, "learning_rate": 9.67418649594487e-10, "loss": 0.5434, "step": 74455 }, { "epoch": 1.0, "learning_rate": 9.216846408449664e-10, "loss": 1.0334, "step": 74460 }, { "epoch": 1.0, "learning_rate": 8.770579661976363e-10, "loss": 1.0444, "step": 74465 }, { "epoch": 1.0, "learning_rate": 8.335386276314694e-10, "loss": 0.9729, "step": 74470 }, { "epoch": 1.0, "learning_rate": 7.911266270699269e-10, "loss": 0.5291, "step": 74475 }, { "epoch": 1.0, "learning_rate": 7.498219663976125e-10, "loss": 0.8322, "step": 74480 }, { "epoch": 1.0, "learning_rate": 7.096246474380675e-10, "loss": 1.1682, "step": 74485 }, { "epoch": 1.0, "learning_rate": 6.705346719759753e-10, "loss": 0.5619, "step": 74490 }, { "epoch": 1.0, "learning_rate": 6.325520417405084e-10, "loss": 1.4334, "step": 74495 }, { "epoch": 1.0, "learning_rate": 5.956767584164302e-10, "loss": 0.1719, "step": 74500 }, { "epoch": 1.0, "learning_rate": 5.599088236357686e-10, "loss": 0.4298, "step": 74505 }, { "epoch": 1.0, "learning_rate": 5.252482389805912e-10, "loss": 0.6593, "step": 74510 }, { "epoch": 1.0, "learning_rate": 4.916950059913328e-10, "loss": 0.5348, "step": 74515 }, { "epoch": 1.0, "learning_rate": 4.592491261501408e-10, "loss": 1.4703, "step": 74520 }, { "epoch": 1.0, "learning_rate": 4.279106008947542e-10, "loss": 0.3645, "step": 74525 }, { "epoch": 1.0, "learning_rate": 3.976794316157273e-10, "loss": 0.8994, "step": 74530 }, { "epoch": 1.0, "learning_rate": 3.6855561964810325e-10, "loss": 0.4921, "step": 74535 }, { "epoch": 1.0, "learning_rate": 3.405391662880675e-10, "loss": 0.4912, "step": 74540 }, { "epoch": 1.0, "learning_rate": 3.1363007276796753e-10, "loss": 0.296, "step": 74545 }, { "epoch": 1.0, "learning_rate": 2.8782834028684424e-10, "loss": 0.4321, "step": 74550 }, { "epoch": 1.0, "learning_rate": 2.631339699854518e-10, "loss": 0.1979, "step": 74555 }, { "epoch": 1.0, "learning_rate": 2.3954696295735987e-10, "loss": 0.3232, "step": 74560 }, { "epoch": 1.0, "learning_rate": 2.1706732024895372e-10, "loss": 0.4169, "step": 74565 }, { "epoch": 1.0, "learning_rate": 1.9569504285110728e-10, "loss": 0.5872, "step": 74570 }, { "epoch": 1.0, "learning_rate": 1.754301317158369e-10, "loss": 0.4512, "step": 74575 }, { "epoch": 1.0, "learning_rate": 1.5627258773964758e-10, "loss": 0.4954, "step": 74580 }, { "epoch": 1.0, "learning_rate": 1.3822241176908445e-10, "loss": 0.5389, "step": 74585 }, { "epoch": 1.0, "learning_rate": 1.2127960460628363e-10, "loss": 0.8017, "step": 74590 }, { "epoch": 1.0, "learning_rate": 1.0544416699787007e-10, "loss": 0.2518, "step": 74595 }, { "epoch": 1.0, "learning_rate": 9.071609965161099e-11, "loss": 0.6845, "step": 74600 }, { "epoch": 1.0, "learning_rate": 7.709540321143571e-11, "loss": 0.6873, "step": 74605 }, { "epoch": 1.0, "learning_rate": 6.458207828796691e-11, "loss": 1.124, "step": 74610 }, { "epoch": 1.0, "learning_rate": 5.3176125433540555e-11, "loss": 1.0638, "step": 74615 }, { "epoch": 1.0, "learning_rate": 4.287754515053255e-11, "loss": 0.8507, "step": 74620 }, { "epoch": 1.0, "learning_rate": 3.368633789690989e-11, "loss": 0.942, "step": 74625 }, { "epoch": 1.0, "learning_rate": 2.5602504080679544e-11, "loss": 0.5321, "step": 74630 }, { "epoch": 1.0, "learning_rate": 1.8626044059888437e-11, "loss": 1.0746, "step": 74635 }, { "epoch": 1.0, "step": 74635, "total_flos": 2.836071368280244e+18, "train_loss": 0.7439663516841827, "train_runtime": 118446.1149, "train_samples_per_second": 0.63, "train_steps_per_second": 0.63 } ], "logging_steps": 5, "max_steps": 74635, "num_train_epochs": 1, "save_steps": 5000, "total_flos": 2.836071368280244e+18, "trial_name": null, "trial_params": null }