diff --git "a/LORAs/gpt4-tinyllama-lora/checkpoint-52002/trainer_state.json" "b/LORAs/gpt4-tinyllama-lora/checkpoint-52002/trainer_state.json" new file mode 100644--- /dev/null +++ "b/LORAs/gpt4-tinyllama-lora/checkpoint-52002/trainer_state.json" @@ -0,0 +1,31219 @@ +{ + "best_metric": null, + "best_model_checkpoint": null, + "epoch": 1.0, + "eval_steps": 500, + "global_step": 52002, + "is_hyper_param_search": false, + "is_local_process_zero": true, + "is_world_process_zero": true, + "log_history": [ + { + "epoch": 0.0, + "learning_rate": 9.999999771892448e-05, + "loss": 1.875, + "step": 10 + }, + { + "epoch": 0.0, + "learning_rate": 9.999999087569809e-05, + "loss": 2.0139, + "step": 20 + }, + { + "epoch": 0.0, + "learning_rate": 9.999997947032149e-05, + "loss": 1.7626, + "step": 30 + }, + { + "epoch": 0.0, + "learning_rate": 9.99999635027957e-05, + "loss": 1.8976, + "step": 40 + }, + { + "epoch": 0.0, + "learning_rate": 9.999994297312218e-05, + "loss": 1.7202, + "step": 50 + }, + { + "epoch": 0.0, + "learning_rate": 9.999991788130281e-05, + "loss": 1.5012, + "step": 60 + }, + { + "epoch": 0.0, + "learning_rate": 9.999988822733987e-05, + "loss": 1.3992, + "step": 70 + }, + { + "epoch": 0.0, + "learning_rate": 9.999985401123607e-05, + "loss": 1.4993, + "step": 80 + }, + { + "epoch": 0.0, + "learning_rate": 9.999981523299453e-05, + "loss": 1.4088, + "step": 90 + }, + { + "epoch": 0.0, + "learning_rate": 9.99997718926188e-05, + "loss": 1.2877, + "step": 100 + }, + { + "epoch": 0.0, + "learning_rate": 9.999972399011282e-05, + "loss": 1.3944, + "step": 110 + }, + { + "epoch": 0.0, + "learning_rate": 9.999967152548095e-05, + "loss": 1.6015, + "step": 120 + }, + { + "epoch": 0.0, + "learning_rate": 9.999961449872801e-05, + "loss": 1.6425, + "step": 130 + }, + { + "epoch": 0.0, + "learning_rate": 9.999955290985919e-05, + "loss": 1.4663, + "step": 140 + }, + { + "epoch": 0.0, + "learning_rate": 9.999948675888009e-05, + "loss": 1.2942, + "step": 150 + }, + { + "epoch": 0.0, + "learning_rate": 9.999941604579676e-05, + "loss": 1.3777, + "step": 160 + }, + { + "epoch": 0.0, + "learning_rate": 9.999934077061568e-05, + "loss": 1.4109, + "step": 170 + }, + { + "epoch": 0.0, + "learning_rate": 9.999926093334366e-05, + "loss": 1.36, + "step": 180 + }, + { + "epoch": 0.0, + "learning_rate": 9.999917653398803e-05, + "loss": 1.2688, + "step": 190 + }, + { + "epoch": 0.0, + "learning_rate": 9.999908757255648e-05, + "loss": 1.4992, + "step": 200 + }, + { + "epoch": 0.0, + "learning_rate": 9.999899404905713e-05, + "loss": 1.35, + "step": 210 + }, + { + "epoch": 0.0, + "learning_rate": 9.99988959634985e-05, + "loss": 1.477, + "step": 220 + }, + { + "epoch": 0.0, + "learning_rate": 9.999879331588954e-05, + "loss": 1.3487, + "step": 230 + }, + { + "epoch": 0.0, + "learning_rate": 9.999868610623963e-05, + "loss": 1.3792, + "step": 240 + }, + { + "epoch": 0.0, + "learning_rate": 9.999857433455855e-05, + "loss": 1.5009, + "step": 250 + }, + { + "epoch": 0.0, + "learning_rate": 9.999845800085648e-05, + "loss": 1.4627, + "step": 260 + }, + { + "epoch": 0.01, + "learning_rate": 9.999833710514405e-05, + "loss": 1.2347, + "step": 270 + }, + { + "epoch": 0.01, + "learning_rate": 9.99982116474323e-05, + "loss": 1.2666, + "step": 280 + }, + { + "epoch": 0.01, + "learning_rate": 9.999808162773266e-05, + "loss": 1.2938, + "step": 290 + }, + { + "epoch": 0.01, + "learning_rate": 9.999794704605701e-05, + "loss": 1.3973, + "step": 300 + }, + { + "epoch": 0.01, + "learning_rate": 9.999780790241761e-05, + "loss": 1.4668, + "step": 310 + }, + { + "epoch": 0.01, + "learning_rate": 9.999766419682716e-05, + "loss": 1.3756, + "step": 320 + }, + { + "epoch": 0.01, + "learning_rate": 9.999751592929878e-05, + "loss": 1.2096, + "step": 330 + }, + { + "epoch": 0.01, + "learning_rate": 9.999736309984599e-05, + "loss": 1.1644, + "step": 340 + }, + { + "epoch": 0.01, + "learning_rate": 9.999720570848277e-05, + "loss": 1.0741, + "step": 350 + }, + { + "epoch": 0.01, + "learning_rate": 9.999704375522343e-05, + "loss": 1.2642, + "step": 360 + }, + { + "epoch": 0.01, + "learning_rate": 9.999687724008276e-05, + "loss": 1.2261, + "step": 370 + }, + { + "epoch": 0.01, + "learning_rate": 9.999670616307597e-05, + "loss": 1.4182, + "step": 380 + }, + { + "epoch": 0.01, + "learning_rate": 9.999653052421867e-05, + "loss": 1.3194, + "step": 390 + }, + { + "epoch": 0.01, + "learning_rate": 9.999635032352687e-05, + "loss": 1.35, + "step": 400 + }, + { + "epoch": 0.01, + "learning_rate": 9.999616556101701e-05, + "loss": 1.14, + "step": 410 + }, + { + "epoch": 0.01, + "learning_rate": 9.999597623670597e-05, + "loss": 1.4579, + "step": 420 + }, + { + "epoch": 0.01, + "learning_rate": 9.9995782350611e-05, + "loss": 1.3264, + "step": 430 + }, + { + "epoch": 0.01, + "learning_rate": 9.999558390274981e-05, + "loss": 1.528, + "step": 440 + }, + { + "epoch": 0.01, + "learning_rate": 9.999538089314051e-05, + "loss": 1.2982, + "step": 450 + }, + { + "epoch": 0.01, + "learning_rate": 9.99951733218016e-05, + "loss": 1.3311, + "step": 460 + }, + { + "epoch": 0.01, + "learning_rate": 9.999496118875204e-05, + "loss": 1.2632, + "step": 470 + }, + { + "epoch": 0.01, + "learning_rate": 9.999474449401116e-05, + "loss": 1.4559, + "step": 480 + }, + { + "epoch": 0.01, + "learning_rate": 9.999452323759878e-05, + "loss": 1.4609, + "step": 490 + }, + { + "epoch": 0.01, + "learning_rate": 9.999429741953504e-05, + "loss": 1.3248, + "step": 500 + }, + { + "epoch": 0.01, + "learning_rate": 9.999406703984055e-05, + "loss": 1.2921, + "step": 510 + }, + { + "epoch": 0.01, + "learning_rate": 9.999383209853637e-05, + "loss": 1.2958, + "step": 520 + }, + { + "epoch": 0.01, + "learning_rate": 9.999359259564389e-05, + "loss": 1.4268, + "step": 530 + }, + { + "epoch": 0.01, + "learning_rate": 9.999334853118498e-05, + "loss": 1.6085, + "step": 540 + }, + { + "epoch": 0.01, + "learning_rate": 9.999309990518194e-05, + "loss": 1.4809, + "step": 550 + }, + { + "epoch": 0.01, + "learning_rate": 9.999284671765739e-05, + "loss": 1.4938, + "step": 560 + }, + { + "epoch": 0.01, + "learning_rate": 9.999258896863448e-05, + "loss": 1.5519, + "step": 570 + }, + { + "epoch": 0.01, + "learning_rate": 9.999232665813674e-05, + "loss": 1.3456, + "step": 580 + }, + { + "epoch": 0.01, + "learning_rate": 9.999205978618806e-05, + "loss": 1.124, + "step": 590 + }, + { + "epoch": 0.01, + "learning_rate": 9.99917883528128e-05, + "loss": 1.4275, + "step": 600 + }, + { + "epoch": 0.01, + "learning_rate": 9.999151235803576e-05, + "loss": 1.2882, + "step": 610 + }, + { + "epoch": 0.01, + "learning_rate": 9.999123180188208e-05, + "loss": 1.7446, + "step": 620 + }, + { + "epoch": 0.01, + "learning_rate": 9.99909466843774e-05, + "loss": 1.3899, + "step": 630 + }, + { + "epoch": 0.01, + "learning_rate": 9.99906570055477e-05, + "loss": 1.2669, + "step": 640 + }, + { + "epoch": 0.01, + "learning_rate": 9.999036276541943e-05, + "loss": 1.0545, + "step": 650 + }, + { + "epoch": 0.01, + "learning_rate": 9.999006396401942e-05, + "loss": 1.3325, + "step": 660 + }, + { + "epoch": 0.01, + "learning_rate": 9.998976060137495e-05, + "loss": 1.3019, + "step": 670 + }, + { + "epoch": 0.01, + "learning_rate": 9.99894526775137e-05, + "loss": 1.3425, + "step": 680 + }, + { + "epoch": 0.01, + "learning_rate": 9.998914019246377e-05, + "loss": 1.5241, + "step": 690 + }, + { + "epoch": 0.01, + "learning_rate": 9.998882314625365e-05, + "loss": 1.3705, + "step": 700 + }, + { + "epoch": 0.01, + "learning_rate": 9.998850153891228e-05, + "loss": 1.402, + "step": 710 + }, + { + "epoch": 0.01, + "learning_rate": 9.998817537046902e-05, + "loss": 1.5151, + "step": 720 + }, + { + "epoch": 0.01, + "learning_rate": 9.99878446409536e-05, + "loss": 1.1965, + "step": 730 + }, + { + "epoch": 0.01, + "learning_rate": 9.998750935039623e-05, + "loss": 1.5337, + "step": 740 + }, + { + "epoch": 0.01, + "learning_rate": 9.998716949882747e-05, + "loss": 1.3151, + "step": 750 + }, + { + "epoch": 0.01, + "learning_rate": 9.998682508627835e-05, + "loss": 1.3851, + "step": 760 + }, + { + "epoch": 0.01, + "learning_rate": 9.99864761127803e-05, + "loss": 1.4297, + "step": 770 + }, + { + "epoch": 0.01, + "learning_rate": 9.998612257836514e-05, + "loss": 1.5431, + "step": 780 + }, + { + "epoch": 0.02, + "learning_rate": 9.998576448306515e-05, + "loss": 1.5623, + "step": 790 + }, + { + "epoch": 0.02, + "learning_rate": 9.998540182691298e-05, + "loss": 1.4463, + "step": 800 + }, + { + "epoch": 0.02, + "learning_rate": 9.998503460994176e-05, + "loss": 1.685, + "step": 810 + }, + { + "epoch": 0.02, + "learning_rate": 9.998466283218494e-05, + "loss": 1.0598, + "step": 820 + }, + { + "epoch": 0.02, + "learning_rate": 9.998428649367648e-05, + "loss": 1.3097, + "step": 830 + }, + { + "epoch": 0.02, + "learning_rate": 9.998390559445071e-05, + "loss": 1.2586, + "step": 840 + }, + { + "epoch": 0.02, + "learning_rate": 9.998352013454239e-05, + "loss": 1.3021, + "step": 850 + }, + { + "epoch": 0.02, + "learning_rate": 9.998313011398668e-05, + "loss": 1.3545, + "step": 860 + }, + { + "epoch": 0.02, + "learning_rate": 9.998273553281916e-05, + "loss": 1.2164, + "step": 870 + }, + { + "epoch": 0.02, + "learning_rate": 9.998233639107586e-05, + "loss": 1.3504, + "step": 880 + }, + { + "epoch": 0.02, + "learning_rate": 9.998193268879317e-05, + "loss": 1.5319, + "step": 890 + }, + { + "epoch": 0.02, + "learning_rate": 9.998152442600794e-05, + "loss": 1.1939, + "step": 900 + }, + { + "epoch": 0.02, + "learning_rate": 9.998111160275742e-05, + "loss": 1.5217, + "step": 910 + }, + { + "epoch": 0.02, + "learning_rate": 9.998069421907929e-05, + "loss": 1.3646, + "step": 920 + }, + { + "epoch": 0.02, + "learning_rate": 9.998027227501161e-05, + "loss": 1.1651, + "step": 930 + }, + { + "epoch": 0.02, + "learning_rate": 9.997984577059288e-05, + "loss": 1.5059, + "step": 940 + }, + { + "epoch": 0.02, + "learning_rate": 9.997941470586203e-05, + "loss": 1.1902, + "step": 950 + }, + { + "epoch": 0.02, + "learning_rate": 9.997897908085839e-05, + "loss": 1.2637, + "step": 960 + }, + { + "epoch": 0.02, + "learning_rate": 9.99785388956217e-05, + "loss": 1.3935, + "step": 970 + }, + { + "epoch": 0.02, + "learning_rate": 9.997809415019213e-05, + "loss": 1.3405, + "step": 980 + }, + { + "epoch": 0.02, + "learning_rate": 9.997764484461025e-05, + "loss": 1.2142, + "step": 990 + }, + { + "epoch": 0.02, + "learning_rate": 9.997719097891707e-05, + "loss": 1.2017, + "step": 1000 + }, + { + "epoch": 0.02, + "learning_rate": 9.997673255315401e-05, + "loss": 1.5894, + "step": 1010 + }, + { + "epoch": 0.02, + "learning_rate": 9.997626956736286e-05, + "loss": 1.2648, + "step": 1020 + }, + { + "epoch": 0.02, + "learning_rate": 9.99758020215859e-05, + "loss": 1.3068, + "step": 1030 + }, + { + "epoch": 0.02, + "learning_rate": 9.997532991586578e-05, + "loss": 1.3405, + "step": 1040 + }, + { + "epoch": 0.02, + "learning_rate": 9.997485325024555e-05, + "loss": 1.4155, + "step": 1050 + }, + { + "epoch": 0.02, + "learning_rate": 9.997437202476875e-05, + "loss": 1.3779, + "step": 1060 + }, + { + "epoch": 0.02, + "learning_rate": 9.997388623947928e-05, + "loss": 1.3744, + "step": 1070 + }, + { + "epoch": 0.02, + "learning_rate": 9.997339589442143e-05, + "loss": 1.4678, + "step": 1080 + }, + { + "epoch": 0.02, + "learning_rate": 9.997290098963996e-05, + "loss": 1.2851, + "step": 1090 + }, + { + "epoch": 0.02, + "learning_rate": 9.997240152518003e-05, + "loss": 1.4561, + "step": 1100 + }, + { + "epoch": 0.02, + "learning_rate": 9.997189750108721e-05, + "loss": 1.3897, + "step": 1110 + }, + { + "epoch": 0.02, + "learning_rate": 9.997138891740748e-05, + "loss": 1.136, + "step": 1120 + }, + { + "epoch": 0.02, + "learning_rate": 9.997087577418727e-05, + "loss": 1.143, + "step": 1130 + }, + { + "epoch": 0.02, + "learning_rate": 9.997035807147337e-05, + "loss": 1.3829, + "step": 1140 + }, + { + "epoch": 0.02, + "learning_rate": 9.996983580931304e-05, + "loss": 1.5637, + "step": 1150 + }, + { + "epoch": 0.02, + "learning_rate": 9.996930898775391e-05, + "loss": 1.2417, + "step": 1160 + }, + { + "epoch": 0.02, + "learning_rate": 9.996877760684407e-05, + "loss": 1.3978, + "step": 1170 + }, + { + "epoch": 0.02, + "learning_rate": 9.996824166663201e-05, + "loss": 1.1616, + "step": 1180 + }, + { + "epoch": 0.02, + "learning_rate": 9.99677011671666e-05, + "loss": 1.339, + "step": 1190 + }, + { + "epoch": 0.02, + "learning_rate": 9.996715610849718e-05, + "loss": 1.651, + "step": 1200 + }, + { + "epoch": 0.02, + "learning_rate": 9.996660649067349e-05, + "loss": 1.1262, + "step": 1210 + }, + { + "epoch": 0.02, + "learning_rate": 9.996605231374565e-05, + "loss": 1.3203, + "step": 1220 + }, + { + "epoch": 0.02, + "learning_rate": 9.996549357776425e-05, + "loss": 1.3868, + "step": 1230 + }, + { + "epoch": 0.02, + "learning_rate": 9.996493028278026e-05, + "loss": 1.2582, + "step": 1240 + }, + { + "epoch": 0.02, + "learning_rate": 9.996436242884508e-05, + "loss": 1.4204, + "step": 1250 + }, + { + "epoch": 0.02, + "learning_rate": 9.99637900160105e-05, + "loss": 1.2503, + "step": 1260 + }, + { + "epoch": 0.02, + "learning_rate": 9.99632130443288e-05, + "loss": 1.2795, + "step": 1270 + }, + { + "epoch": 0.02, + "learning_rate": 9.99626315138526e-05, + "loss": 1.3889, + "step": 1280 + }, + { + "epoch": 0.02, + "learning_rate": 9.996204542463492e-05, + "loss": 1.6772, + "step": 1290 + }, + { + "epoch": 0.02, + "learning_rate": 9.99614547767293e-05, + "loss": 1.347, + "step": 1300 + }, + { + "epoch": 0.03, + "learning_rate": 9.996085957018959e-05, + "loss": 1.3079, + "step": 1310 + }, + { + "epoch": 0.03, + "learning_rate": 9.996025980507012e-05, + "loss": 1.4347, + "step": 1320 + }, + { + "epoch": 0.03, + "learning_rate": 9.995965548142559e-05, + "loss": 1.2224, + "step": 1330 + }, + { + "epoch": 0.03, + "learning_rate": 9.995904659931118e-05, + "loss": 1.2926, + "step": 1340 + }, + { + "epoch": 0.03, + "learning_rate": 9.995843315878241e-05, + "loss": 1.2501, + "step": 1350 + }, + { + "epoch": 0.03, + "learning_rate": 9.995781515989528e-05, + "loss": 1.3179, + "step": 1360 + }, + { + "epoch": 0.03, + "learning_rate": 9.995719260270616e-05, + "loss": 1.1125, + "step": 1370 + }, + { + "epoch": 0.03, + "learning_rate": 9.995656548727184e-05, + "loss": 1.3954, + "step": 1380 + }, + { + "epoch": 0.03, + "learning_rate": 9.995593381364958e-05, + "loss": 1.3111, + "step": 1390 + }, + { + "epoch": 0.03, + "learning_rate": 9.995529758189696e-05, + "loss": 1.2314, + "step": 1400 + }, + { + "epoch": 0.03, + "learning_rate": 9.99546567920721e-05, + "loss": 1.2019, + "step": 1410 + }, + { + "epoch": 0.03, + "learning_rate": 9.995401144423342e-05, + "loss": 1.3759, + "step": 1420 + }, + { + "epoch": 0.03, + "learning_rate": 9.995336153843982e-05, + "loss": 1.5097, + "step": 1430 + }, + { + "epoch": 0.03, + "learning_rate": 9.995270707475059e-05, + "loss": 1.2159, + "step": 1440 + }, + { + "epoch": 0.03, + "learning_rate": 9.995204805322547e-05, + "loss": 1.5312, + "step": 1450 + }, + { + "epoch": 0.03, + "learning_rate": 9.995138447392455e-05, + "loss": 1.6136, + "step": 1460 + }, + { + "epoch": 0.03, + "learning_rate": 9.99507163369084e-05, + "loss": 1.3264, + "step": 1470 + }, + { + "epoch": 0.03, + "learning_rate": 9.9950043642238e-05, + "loss": 1.409, + "step": 1480 + }, + { + "epoch": 0.03, + "learning_rate": 9.99493663899747e-05, + "loss": 1.2682, + "step": 1490 + }, + { + "epoch": 0.03, + "learning_rate": 9.994868458018029e-05, + "loss": 1.2743, + "step": 1500 + }, + { + "epoch": 0.03, + "learning_rate": 9.994799821291701e-05, + "loss": 1.3114, + "step": 1510 + }, + { + "epoch": 0.03, + "learning_rate": 9.994730728824748e-05, + "loss": 1.5562, + "step": 1520 + }, + { + "epoch": 0.03, + "learning_rate": 9.994661180623472e-05, + "loss": 1.3428, + "step": 1530 + }, + { + "epoch": 0.03, + "learning_rate": 9.994591176694221e-05, + "loss": 1.3074, + "step": 1540 + }, + { + "epoch": 0.03, + "learning_rate": 9.994520717043381e-05, + "loss": 1.1452, + "step": 1550 + }, + { + "epoch": 0.03, + "learning_rate": 9.99444980167738e-05, + "loss": 1.1624, + "step": 1560 + }, + { + "epoch": 0.03, + "learning_rate": 9.994378430602693e-05, + "loss": 1.4339, + "step": 1570 + }, + { + "epoch": 0.03, + "learning_rate": 9.994306603825828e-05, + "loss": 1.2881, + "step": 1580 + }, + { + "epoch": 0.03, + "learning_rate": 9.99423432135334e-05, + "loss": 1.3104, + "step": 1590 + }, + { + "epoch": 0.03, + "learning_rate": 9.994161583191824e-05, + "loss": 1.2123, + "step": 1600 + }, + { + "epoch": 0.03, + "learning_rate": 9.994088389347917e-05, + "loss": 1.3504, + "step": 1610 + }, + { + "epoch": 0.03, + "learning_rate": 9.994014739828297e-05, + "loss": 1.4634, + "step": 1620 + }, + { + "epoch": 0.03, + "learning_rate": 9.993940634639684e-05, + "loss": 1.2906, + "step": 1630 + }, + { + "epoch": 0.03, + "learning_rate": 9.99386607378884e-05, + "loss": 1.285, + "step": 1640 + }, + { + "epoch": 0.03, + "learning_rate": 9.99379105728257e-05, + "loss": 1.4598, + "step": 1650 + }, + { + "epoch": 0.03, + "learning_rate": 9.993715585127714e-05, + "loss": 1.456, + "step": 1660 + }, + { + "epoch": 0.03, + "learning_rate": 9.993639657331162e-05, + "loss": 1.5713, + "step": 1670 + }, + { + "epoch": 0.03, + "learning_rate": 9.993563273899841e-05, + "loss": 1.3016, + "step": 1680 + }, + { + "epoch": 0.03, + "learning_rate": 9.993486434840723e-05, + "loss": 1.1334, + "step": 1690 + }, + { + "epoch": 0.03, + "learning_rate": 9.993409140160815e-05, + "loss": 1.0233, + "step": 1700 + }, + { + "epoch": 0.03, + "learning_rate": 9.993331389867171e-05, + "loss": 1.2469, + "step": 1710 + }, + { + "epoch": 0.03, + "learning_rate": 9.993253183966884e-05, + "loss": 1.1256, + "step": 1720 + }, + { + "epoch": 0.03, + "learning_rate": 9.993174522467093e-05, + "loss": 1.3883, + "step": 1730 + }, + { + "epoch": 0.03, + "learning_rate": 9.993095405374973e-05, + "loss": 1.4294, + "step": 1740 + }, + { + "epoch": 0.03, + "learning_rate": 9.993015832697742e-05, + "loss": 1.33, + "step": 1750 + }, + { + "epoch": 0.03, + "learning_rate": 9.992935804442662e-05, + "loss": 1.2521, + "step": 1760 + }, + { + "epoch": 0.03, + "learning_rate": 9.992855320617035e-05, + "loss": 1.2279, + "step": 1770 + }, + { + "epoch": 0.03, + "learning_rate": 9.992774381228205e-05, + "loss": 1.2524, + "step": 1780 + }, + { + "epoch": 0.03, + "learning_rate": 9.992692986283557e-05, + "loss": 1.4408, + "step": 1790 + }, + { + "epoch": 0.03, + "learning_rate": 9.992611135790515e-05, + "loss": 1.513, + "step": 1800 + }, + { + "epoch": 0.03, + "learning_rate": 9.99252882975655e-05, + "loss": 1.3177, + "step": 1810 + }, + { + "epoch": 0.03, + "learning_rate": 9.992446068189172e-05, + "loss": 1.2595, + "step": 1820 + }, + { + "epoch": 0.04, + "learning_rate": 9.992362851095931e-05, + "loss": 1.3211, + "step": 1830 + }, + { + "epoch": 0.04, + "learning_rate": 9.99227917848442e-05, + "loss": 1.3533, + "step": 1840 + }, + { + "epoch": 0.04, + "learning_rate": 9.992195050362276e-05, + "loss": 1.195, + "step": 1850 + }, + { + "epoch": 0.04, + "learning_rate": 9.992110466737173e-05, + "loss": 1.3458, + "step": 1860 + }, + { + "epoch": 0.04, + "learning_rate": 9.99202542761683e-05, + "loss": 1.3658, + "step": 1870 + }, + { + "epoch": 0.04, + "learning_rate": 9.991939933009002e-05, + "loss": 1.2936, + "step": 1880 + }, + { + "epoch": 0.04, + "learning_rate": 9.991853982921497e-05, + "loss": 1.3322, + "step": 1890 + }, + { + "epoch": 0.04, + "learning_rate": 9.99176757736215e-05, + "loss": 1.2131, + "step": 1900 + }, + { + "epoch": 0.04, + "learning_rate": 9.99168071633885e-05, + "loss": 1.2902, + "step": 1910 + }, + { + "epoch": 0.04, + "learning_rate": 9.99159339985952e-05, + "loss": 1.5979, + "step": 1920 + }, + { + "epoch": 0.04, + "learning_rate": 9.99150562793213e-05, + "loss": 1.3416, + "step": 1930 + }, + { + "epoch": 0.04, + "learning_rate": 9.991417400564684e-05, + "loss": 1.2639, + "step": 1940 + }, + { + "epoch": 0.04, + "learning_rate": 9.991328717765234e-05, + "loss": 1.495, + "step": 1950 + }, + { + "epoch": 0.04, + "learning_rate": 9.991239579541874e-05, + "loss": 1.3425, + "step": 1960 + }, + { + "epoch": 0.04, + "learning_rate": 9.991149985902735e-05, + "loss": 1.1307, + "step": 1970 + }, + { + "epoch": 0.04, + "learning_rate": 9.991059936855991e-05, + "loss": 1.5018, + "step": 1980 + }, + { + "epoch": 0.04, + "learning_rate": 9.99096943240986e-05, + "loss": 1.1457, + "step": 1990 + }, + { + "epoch": 0.04, + "learning_rate": 9.9908784725726e-05, + "loss": 1.3289, + "step": 2000 + }, + { + "epoch": 0.04, + "learning_rate": 9.990787057352508e-05, + "loss": 1.3292, + "step": 2010 + }, + { + "epoch": 0.04, + "learning_rate": 9.990695186757931e-05, + "loss": 1.6662, + "step": 2020 + }, + { + "epoch": 0.04, + "learning_rate": 9.990602860797244e-05, + "loss": 1.0469, + "step": 2030 + }, + { + "epoch": 0.04, + "learning_rate": 9.990510079478875e-05, + "loss": 1.2761, + "step": 2040 + }, + { + "epoch": 0.04, + "learning_rate": 9.99041684281129e-05, + "loss": 1.2587, + "step": 2050 + }, + { + "epoch": 0.04, + "learning_rate": 9.990323150802993e-05, + "loss": 1.1929, + "step": 2060 + }, + { + "epoch": 0.04, + "learning_rate": 9.990229003462539e-05, + "loss": 1.6202, + "step": 2070 + }, + { + "epoch": 0.04, + "learning_rate": 9.990134400798512e-05, + "loss": 1.6077, + "step": 2080 + }, + { + "epoch": 0.04, + "learning_rate": 9.990039342819546e-05, + "loss": 1.3055, + "step": 2090 + }, + { + "epoch": 0.04, + "learning_rate": 9.989943829534316e-05, + "loss": 1.4407, + "step": 2100 + }, + { + "epoch": 0.04, + "learning_rate": 9.989847860951535e-05, + "loss": 1.5117, + "step": 2110 + }, + { + "epoch": 0.04, + "learning_rate": 9.98975143707996e-05, + "loss": 1.4667, + "step": 2120 + }, + { + "epoch": 0.04, + "learning_rate": 9.989654557928388e-05, + "loss": 1.5847, + "step": 2130 + }, + { + "epoch": 0.04, + "learning_rate": 9.989557223505661e-05, + "loss": 1.2733, + "step": 2140 + }, + { + "epoch": 0.04, + "learning_rate": 9.989459433820658e-05, + "loss": 1.321, + "step": 2150 + }, + { + "epoch": 0.04, + "learning_rate": 9.989361188882303e-05, + "loss": 1.2065, + "step": 2160 + }, + { + "epoch": 0.04, + "learning_rate": 9.989262488699558e-05, + "loss": 1.3144, + "step": 2170 + }, + { + "epoch": 0.04, + "learning_rate": 9.98916333328143e-05, + "loss": 1.2705, + "step": 2180 + }, + { + "epoch": 0.04, + "learning_rate": 9.989063722636969e-05, + "loss": 1.4665, + "step": 2190 + }, + { + "epoch": 0.04, + "learning_rate": 9.988963656775259e-05, + "loss": 1.2998, + "step": 2200 + }, + { + "epoch": 0.04, + "learning_rate": 9.988863135705433e-05, + "loss": 1.4893, + "step": 2210 + }, + { + "epoch": 0.04, + "learning_rate": 9.988762159436662e-05, + "loss": 1.2859, + "step": 2220 + }, + { + "epoch": 0.04, + "learning_rate": 9.988660727978158e-05, + "loss": 1.2458, + "step": 2230 + }, + { + "epoch": 0.04, + "learning_rate": 9.98855884133918e-05, + "loss": 1.0838, + "step": 2240 + }, + { + "epoch": 0.04, + "learning_rate": 9.988456499529023e-05, + "loss": 1.328, + "step": 2250 + }, + { + "epoch": 0.04, + "learning_rate": 9.988353702557022e-05, + "loss": 1.3803, + "step": 2260 + }, + { + "epoch": 0.04, + "learning_rate": 9.98825045043256e-05, + "loss": 1.315, + "step": 2270 + }, + { + "epoch": 0.04, + "learning_rate": 9.988146743165054e-05, + "loss": 1.2964, + "step": 2280 + }, + { + "epoch": 0.04, + "learning_rate": 9.988042580763972e-05, + "loss": 1.3524, + "step": 2290 + }, + { + "epoch": 0.04, + "learning_rate": 9.987937963238813e-05, + "loss": 1.3787, + "step": 2300 + }, + { + "epoch": 0.04, + "learning_rate": 9.987832890599126e-05, + "loss": 1.284, + "step": 2310 + }, + { + "epoch": 0.04, + "learning_rate": 9.987727362854496e-05, + "loss": 1.4093, + "step": 2320 + }, + { + "epoch": 0.04, + "learning_rate": 9.987621380014553e-05, + "loss": 1.3782, + "step": 2330 + }, + { + "epoch": 0.04, + "learning_rate": 9.987514942088968e-05, + "loss": 1.1652, + "step": 2340 + }, + { + "epoch": 0.05, + "learning_rate": 9.987408049087452e-05, + "loss": 1.0603, + "step": 2350 + }, + { + "epoch": 0.05, + "learning_rate": 9.987300701019755e-05, + "loss": 1.4174, + "step": 2360 + }, + { + "epoch": 0.05, + "learning_rate": 9.987192897895677e-05, + "loss": 1.4376, + "step": 2370 + }, + { + "epoch": 0.05, + "learning_rate": 9.987084639725051e-05, + "loss": 1.5728, + "step": 2380 + }, + { + "epoch": 0.05, + "learning_rate": 9.986975926517755e-05, + "loss": 1.3401, + "step": 2390 + }, + { + "epoch": 0.05, + "learning_rate": 9.98686675828371e-05, + "loss": 1.2169, + "step": 2400 + }, + { + "epoch": 0.05, + "learning_rate": 9.986757135032875e-05, + "loss": 1.2284, + "step": 2410 + }, + { + "epoch": 0.05, + "learning_rate": 9.986647056775254e-05, + "loss": 1.2892, + "step": 2420 + }, + { + "epoch": 0.05, + "learning_rate": 9.986536523520889e-05, + "loss": 1.2494, + "step": 2430 + }, + { + "epoch": 0.05, + "learning_rate": 9.986425535279868e-05, + "loss": 1.2383, + "step": 2440 + }, + { + "epoch": 0.05, + "learning_rate": 9.986314092062315e-05, + "loss": 1.7485, + "step": 2450 + }, + { + "epoch": 0.05, + "learning_rate": 9.9862021938784e-05, + "loss": 1.162, + "step": 2460 + }, + { + "epoch": 0.05, + "learning_rate": 9.986089840738333e-05, + "loss": 1.3814, + "step": 2470 + }, + { + "epoch": 0.05, + "learning_rate": 9.985977032652365e-05, + "loss": 1.3171, + "step": 2480 + }, + { + "epoch": 0.05, + "learning_rate": 9.98586376963079e-05, + "loss": 1.1927, + "step": 2490 + }, + { + "epoch": 0.05, + "learning_rate": 9.98575005168394e-05, + "loss": 1.5072, + "step": 2500 + }, + { + "epoch": 0.05, + "learning_rate": 9.985635878822193e-05, + "loss": 1.3116, + "step": 2510 + }, + { + "epoch": 0.05, + "learning_rate": 9.985521251055966e-05, + "loss": 1.3766, + "step": 2520 + }, + { + "epoch": 0.05, + "learning_rate": 9.985406168395719e-05, + "loss": 1.36, + "step": 2530 + }, + { + "epoch": 0.05, + "learning_rate": 9.985290630851949e-05, + "loss": 1.1809, + "step": 2540 + }, + { + "epoch": 0.05, + "learning_rate": 9.985174638435202e-05, + "loss": 1.4045, + "step": 2550 + }, + { + "epoch": 0.05, + "learning_rate": 9.98505819115606e-05, + "loss": 1.2913, + "step": 2560 + }, + { + "epoch": 0.05, + "learning_rate": 9.984941289025149e-05, + "loss": 1.3008, + "step": 2570 + }, + { + "epoch": 0.05, + "learning_rate": 9.984823932053133e-05, + "loss": 1.1802, + "step": 2580 + }, + { + "epoch": 0.05, + "learning_rate": 9.984706120250721e-05, + "loss": 1.3826, + "step": 2590 + }, + { + "epoch": 0.05, + "learning_rate": 9.984587853628664e-05, + "loss": 1.3033, + "step": 2600 + }, + { + "epoch": 0.05, + "learning_rate": 9.984469132197752e-05, + "loss": 1.4091, + "step": 2610 + }, + { + "epoch": 0.05, + "learning_rate": 9.984349955968817e-05, + "loss": 1.3903, + "step": 2620 + }, + { + "epoch": 0.05, + "learning_rate": 9.984230324952732e-05, + "loss": 1.3725, + "step": 2630 + }, + { + "epoch": 0.05, + "learning_rate": 9.984110239160416e-05, + "loss": 1.4251, + "step": 2640 + }, + { + "epoch": 0.05, + "learning_rate": 9.983989698602824e-05, + "loss": 1.28, + "step": 2650 + }, + { + "epoch": 0.05, + "learning_rate": 9.983868703290953e-05, + "loss": 1.4113, + "step": 2660 + }, + { + "epoch": 0.05, + "learning_rate": 9.983747253235846e-05, + "loss": 1.3604, + "step": 2670 + }, + { + "epoch": 0.05, + "learning_rate": 9.983625348448581e-05, + "loss": 1.0976, + "step": 2680 + }, + { + "epoch": 0.05, + "learning_rate": 9.983502988940285e-05, + "loss": 1.3496, + "step": 2690 + }, + { + "epoch": 0.05, + "learning_rate": 9.983380174722119e-05, + "loss": 1.2368, + "step": 2700 + }, + { + "epoch": 0.05, + "learning_rate": 9.98325690580529e-05, + "loss": 1.217, + "step": 2710 + }, + { + "epoch": 0.05, + "learning_rate": 9.983133182201046e-05, + "loss": 1.3363, + "step": 2720 + }, + { + "epoch": 0.05, + "learning_rate": 9.983009003920676e-05, + "loss": 1.2462, + "step": 2730 + }, + { + "epoch": 0.05, + "learning_rate": 9.982884370975509e-05, + "loss": 1.1793, + "step": 2740 + }, + { + "epoch": 0.05, + "learning_rate": 9.98275928337692e-05, + "loss": 1.3108, + "step": 2750 + }, + { + "epoch": 0.05, + "learning_rate": 9.982633741136317e-05, + "loss": 1.4057, + "step": 2760 + }, + { + "epoch": 0.05, + "learning_rate": 9.982507744265162e-05, + "loss": 1.2219, + "step": 2770 + }, + { + "epoch": 0.05, + "learning_rate": 9.982381292774945e-05, + "loss": 1.2523, + "step": 2780 + }, + { + "epoch": 0.05, + "learning_rate": 9.982254386677206e-05, + "loss": 1.2229, + "step": 2790 + }, + { + "epoch": 0.05, + "learning_rate": 9.982127025983525e-05, + "loss": 1.2954, + "step": 2800 + }, + { + "epoch": 0.05, + "learning_rate": 9.981999210705523e-05, + "loss": 1.2734, + "step": 2810 + }, + { + "epoch": 0.05, + "learning_rate": 9.98187094085486e-05, + "loss": 1.3261, + "step": 2820 + }, + { + "epoch": 0.05, + "learning_rate": 9.981742216443242e-05, + "loss": 1.3873, + "step": 2830 + }, + { + "epoch": 0.05, + "learning_rate": 9.981613037482414e-05, + "loss": 1.2543, + "step": 2840 + }, + { + "epoch": 0.05, + "learning_rate": 9.981483403984162e-05, + "loss": 1.2404, + "step": 2850 + }, + { + "epoch": 0.05, + "learning_rate": 9.981353315960315e-05, + "loss": 1.2803, + "step": 2860 + }, + { + "epoch": 0.06, + "learning_rate": 9.98122277342274e-05, + "loss": 1.3491, + "step": 2870 + }, + { + "epoch": 0.06, + "learning_rate": 9.981091776383351e-05, + "loss": 1.4603, + "step": 2880 + }, + { + "epoch": 0.06, + "learning_rate": 9.980960324854101e-05, + "loss": 1.2107, + "step": 2890 + }, + { + "epoch": 0.06, + "learning_rate": 9.980828418846981e-05, + "loss": 1.1329, + "step": 2900 + }, + { + "epoch": 0.06, + "learning_rate": 9.980696058374029e-05, + "loss": 1.4284, + "step": 2910 + }, + { + "epoch": 0.06, + "learning_rate": 9.980563243447321e-05, + "loss": 1.1568, + "step": 2920 + }, + { + "epoch": 0.06, + "learning_rate": 9.980429974078975e-05, + "loss": 1.5218, + "step": 2930 + }, + { + "epoch": 0.06, + "learning_rate": 9.980296250281152e-05, + "loss": 1.232, + "step": 2940 + }, + { + "epoch": 0.06, + "learning_rate": 9.980162072066053e-05, + "loss": 1.4554, + "step": 2950 + }, + { + "epoch": 0.06, + "learning_rate": 9.98002743944592e-05, + "loss": 1.3907, + "step": 2960 + }, + { + "epoch": 0.06, + "learning_rate": 9.979892352433038e-05, + "loss": 1.212, + "step": 2970 + }, + { + "epoch": 0.06, + "learning_rate": 9.979756811039733e-05, + "loss": 1.3243, + "step": 2980 + }, + { + "epoch": 0.06, + "learning_rate": 9.97962081527837e-05, + "loss": 1.4059, + "step": 2990 + }, + { + "epoch": 0.06, + "learning_rate": 9.979484365161362e-05, + "loss": 1.5286, + "step": 3000 + }, + { + "epoch": 0.06, + "learning_rate": 9.979347460701157e-05, + "loss": 1.3507, + "step": 3010 + }, + { + "epoch": 0.06, + "learning_rate": 9.979210101910244e-05, + "loss": 1.3491, + "step": 3020 + }, + { + "epoch": 0.06, + "learning_rate": 9.97907228880116e-05, + "loss": 1.2906, + "step": 3030 + }, + { + "epoch": 0.06, + "learning_rate": 9.978934021386477e-05, + "loss": 1.3218, + "step": 3040 + }, + { + "epoch": 0.06, + "learning_rate": 9.978795299678812e-05, + "loss": 1.4068, + "step": 3050 + }, + { + "epoch": 0.06, + "learning_rate": 9.978656123690822e-05, + "loss": 1.14, + "step": 3060 + }, + { + "epoch": 0.06, + "learning_rate": 9.978516493435205e-05, + "loss": 1.5555, + "step": 3070 + }, + { + "epoch": 0.06, + "learning_rate": 9.978376408924704e-05, + "loss": 1.4966, + "step": 3080 + }, + { + "epoch": 0.06, + "learning_rate": 9.978235870172097e-05, + "loss": 1.2175, + "step": 3090 + }, + { + "epoch": 0.06, + "learning_rate": 9.978094877190209e-05, + "loss": 1.4057, + "step": 3100 + }, + { + "epoch": 0.06, + "learning_rate": 9.977953429991907e-05, + "loss": 1.18, + "step": 3110 + }, + { + "epoch": 0.06, + "learning_rate": 9.977811528590094e-05, + "loss": 1.1956, + "step": 3120 + }, + { + "epoch": 0.06, + "learning_rate": 9.977669172997717e-05, + "loss": 1.4967, + "step": 3130 + }, + { + "epoch": 0.06, + "learning_rate": 9.977526363227767e-05, + "loss": 1.159, + "step": 3140 + }, + { + "epoch": 0.06, + "learning_rate": 9.977383099293273e-05, + "loss": 1.5311, + "step": 3150 + }, + { + "epoch": 0.06, + "learning_rate": 9.97723938120731e-05, + "loss": 1.2848, + "step": 3160 + }, + { + "epoch": 0.06, + "learning_rate": 9.977095208982987e-05, + "loss": 1.207, + "step": 3170 + }, + { + "epoch": 0.06, + "learning_rate": 9.976950582633461e-05, + "loss": 1.3055, + "step": 3180 + }, + { + "epoch": 0.06, + "learning_rate": 9.976805502171926e-05, + "loss": 1.325, + "step": 3190 + }, + { + "epoch": 0.06, + "learning_rate": 9.976659967611624e-05, + "loss": 1.3816, + "step": 3200 + }, + { + "epoch": 0.06, + "learning_rate": 9.976513978965829e-05, + "loss": 1.1429, + "step": 3210 + }, + { + "epoch": 0.06, + "learning_rate": 9.976367536247864e-05, + "loss": 1.281, + "step": 3220 + }, + { + "epoch": 0.06, + "learning_rate": 9.976220639471092e-05, + "loss": 1.1709, + "step": 3230 + }, + { + "epoch": 0.06, + "learning_rate": 9.976073288648913e-05, + "loss": 1.5605, + "step": 3240 + }, + { + "epoch": 0.06, + "learning_rate": 9.975925483794775e-05, + "loss": 1.2462, + "step": 3250 + }, + { + "epoch": 0.06, + "learning_rate": 9.975777224922163e-05, + "loss": 1.5913, + "step": 3260 + }, + { + "epoch": 0.06, + "learning_rate": 9.975628512044604e-05, + "loss": 1.5767, + "step": 3270 + }, + { + "epoch": 0.06, + "learning_rate": 9.975479345175667e-05, + "loss": 1.3546, + "step": 3280 + }, + { + "epoch": 0.06, + "learning_rate": 9.975329724328961e-05, + "loss": 1.3576, + "step": 3290 + }, + { + "epoch": 0.06, + "learning_rate": 9.975179649518143e-05, + "loss": 1.2719, + "step": 3300 + }, + { + "epoch": 0.06, + "learning_rate": 9.9750291207569e-05, + "loss": 1.2336, + "step": 3310 + }, + { + "epoch": 0.06, + "learning_rate": 9.974878138058972e-05, + "loss": 1.3509, + "step": 3320 + }, + { + "epoch": 0.06, + "learning_rate": 9.97472670143813e-05, + "loss": 1.2767, + "step": 3330 + }, + { + "epoch": 0.06, + "learning_rate": 9.974574810908197e-05, + "loss": 1.2492, + "step": 3340 + }, + { + "epoch": 0.06, + "learning_rate": 9.974422466483029e-05, + "loss": 1.2595, + "step": 3350 + }, + { + "epoch": 0.06, + "learning_rate": 9.974269668176525e-05, + "loss": 1.4714, + "step": 3360 + }, + { + "epoch": 0.06, + "learning_rate": 9.974116416002629e-05, + "loss": 1.1935, + "step": 3370 + }, + { + "epoch": 0.06, + "learning_rate": 9.973962709975324e-05, + "loss": 1.2193, + "step": 3380 + }, + { + "epoch": 0.07, + "learning_rate": 9.973808550108634e-05, + "loss": 1.4745, + "step": 3390 + }, + { + "epoch": 0.07, + "learning_rate": 9.973653936416625e-05, + "loss": 1.2986, + "step": 3400 + }, + { + "epoch": 0.07, + "learning_rate": 9.973498868913404e-05, + "loss": 1.488, + "step": 3410 + }, + { + "epoch": 0.07, + "learning_rate": 9.973343347613121e-05, + "loss": 1.3544, + "step": 3420 + }, + { + "epoch": 0.07, + "learning_rate": 9.973187372529967e-05, + "loss": 1.3733, + "step": 3430 + }, + { + "epoch": 0.07, + "learning_rate": 9.97303094367817e-05, + "loss": 1.3409, + "step": 3440 + }, + { + "epoch": 0.07, + "learning_rate": 9.972874061072007e-05, + "loss": 1.4664, + "step": 3450 + }, + { + "epoch": 0.07, + "learning_rate": 9.972716724725789e-05, + "loss": 1.4377, + "step": 3460 + }, + { + "epoch": 0.07, + "learning_rate": 9.972558934653875e-05, + "loss": 1.4165, + "step": 3470 + }, + { + "epoch": 0.07, + "learning_rate": 9.972400690870661e-05, + "loss": 1.2062, + "step": 3480 + }, + { + "epoch": 0.07, + "learning_rate": 9.972241993390585e-05, + "loss": 1.2318, + "step": 3490 + }, + { + "epoch": 0.07, + "learning_rate": 9.972082842228128e-05, + "loss": 1.2213, + "step": 3500 + }, + { + "epoch": 0.07, + "learning_rate": 9.97192323739781e-05, + "loss": 1.1936, + "step": 3510 + }, + { + "epoch": 0.07, + "learning_rate": 9.971763178914195e-05, + "loss": 1.3197, + "step": 3520 + }, + { + "epoch": 0.07, + "learning_rate": 9.971602666791888e-05, + "loss": 1.2308, + "step": 3530 + }, + { + "epoch": 0.07, + "learning_rate": 9.971441701045533e-05, + "loss": 1.3912, + "step": 3540 + }, + { + "epoch": 0.07, + "learning_rate": 9.971280281689818e-05, + "loss": 1.2397, + "step": 3550 + }, + { + "epoch": 0.07, + "learning_rate": 9.971118408739471e-05, + "loss": 1.359, + "step": 3560 + }, + { + "epoch": 0.07, + "learning_rate": 9.970956082209261e-05, + "loss": 1.2904, + "step": 3570 + }, + { + "epoch": 0.07, + "learning_rate": 9.970793302114002e-05, + "loss": 1.1786, + "step": 3580 + }, + { + "epoch": 0.07, + "learning_rate": 9.970630068468541e-05, + "loss": 1.1694, + "step": 3590 + }, + { + "epoch": 0.07, + "learning_rate": 9.970466381287779e-05, + "loss": 1.4849, + "step": 3600 + }, + { + "epoch": 0.07, + "learning_rate": 9.970302240586646e-05, + "loss": 1.2668, + "step": 3610 + }, + { + "epoch": 0.07, + "learning_rate": 9.97013764638012e-05, + "loss": 1.6899, + "step": 3620 + }, + { + "epoch": 0.07, + "learning_rate": 9.969972598683221e-05, + "loss": 1.4086, + "step": 3630 + }, + { + "epoch": 0.07, + "learning_rate": 9.969807097511006e-05, + "loss": 1.2225, + "step": 3640 + }, + { + "epoch": 0.07, + "learning_rate": 9.969641142878576e-05, + "loss": 1.2884, + "step": 3650 + }, + { + "epoch": 0.07, + "learning_rate": 9.969474734801076e-05, + "loss": 1.2065, + "step": 3660 + }, + { + "epoch": 0.07, + "learning_rate": 9.969307873293686e-05, + "loss": 1.1839, + "step": 3670 + }, + { + "epoch": 0.07, + "learning_rate": 9.969140558371633e-05, + "loss": 1.4486, + "step": 3680 + }, + { + "epoch": 0.07, + "learning_rate": 9.968972790050184e-05, + "loss": 1.4194, + "step": 3690 + }, + { + "epoch": 0.07, + "learning_rate": 9.968804568344644e-05, + "loss": 1.3068, + "step": 3700 + }, + { + "epoch": 0.07, + "learning_rate": 9.968635893270363e-05, + "loss": 1.2503, + "step": 3710 + }, + { + "epoch": 0.07, + "learning_rate": 9.968466764842734e-05, + "loss": 1.2139, + "step": 3720 + }, + { + "epoch": 0.07, + "learning_rate": 9.968297183077186e-05, + "loss": 1.4462, + "step": 3730 + }, + { + "epoch": 0.07, + "learning_rate": 9.968127147989192e-05, + "loss": 1.0493, + "step": 3740 + }, + { + "epoch": 0.07, + "learning_rate": 9.967956659594268e-05, + "loss": 1.7619, + "step": 3750 + }, + { + "epoch": 0.07, + "learning_rate": 9.967785717907971e-05, + "loss": 1.4466, + "step": 3760 + }, + { + "epoch": 0.07, + "learning_rate": 9.967614322945895e-05, + "loss": 1.4525, + "step": 3770 + }, + { + "epoch": 0.07, + "learning_rate": 9.967442474723681e-05, + "loss": 1.3149, + "step": 3780 + }, + { + "epoch": 0.07, + "learning_rate": 9.967270173257007e-05, + "loss": 1.3513, + "step": 3790 + }, + { + "epoch": 0.07, + "learning_rate": 9.967097418561596e-05, + "loss": 1.1702, + "step": 3800 + }, + { + "epoch": 0.07, + "learning_rate": 9.96692421065321e-05, + "loss": 1.3409, + "step": 3810 + }, + { + "epoch": 0.07, + "learning_rate": 9.966750549547654e-05, + "loss": 1.1612, + "step": 3820 + }, + { + "epoch": 0.07, + "learning_rate": 9.966576435260771e-05, + "loss": 1.1527, + "step": 3830 + }, + { + "epoch": 0.07, + "learning_rate": 9.96640186780845e-05, + "loss": 1.5699, + "step": 3840 + }, + { + "epoch": 0.07, + "learning_rate": 9.966226847206619e-05, + "loss": 1.3352, + "step": 3850 + }, + { + "epoch": 0.07, + "learning_rate": 9.966051373471246e-05, + "loss": 1.5389, + "step": 3860 + }, + { + "epoch": 0.07, + "learning_rate": 9.965875446618342e-05, + "loss": 1.05, + "step": 3870 + }, + { + "epoch": 0.07, + "learning_rate": 9.965699066663959e-05, + "loss": 1.1565, + "step": 3880 + }, + { + "epoch": 0.07, + "learning_rate": 9.965522233624191e-05, + "loss": 1.1598, + "step": 3890 + }, + { + "epoch": 0.07, + "learning_rate": 9.965344947515174e-05, + "loss": 1.5574, + "step": 3900 + }, + { + "epoch": 0.08, + "learning_rate": 9.965167208353082e-05, + "loss": 1.4266, + "step": 3910 + }, + { + "epoch": 0.08, + "learning_rate": 9.964989016154134e-05, + "loss": 1.2152, + "step": 3920 + }, + { + "epoch": 0.08, + "learning_rate": 9.964810370934587e-05, + "loss": 1.3679, + "step": 3930 + }, + { + "epoch": 0.08, + "learning_rate": 9.964631272710742e-05, + "loss": 1.3647, + "step": 3940 + }, + { + "epoch": 0.08, + "learning_rate": 9.964451721498943e-05, + "loss": 1.4123, + "step": 3950 + }, + { + "epoch": 0.08, + "learning_rate": 9.96427171731557e-05, + "loss": 1.2552, + "step": 3960 + }, + { + "epoch": 0.08, + "learning_rate": 9.964091260177047e-05, + "loss": 1.5544, + "step": 3970 + }, + { + "epoch": 0.08, + "learning_rate": 9.96391035009984e-05, + "loss": 1.3068, + "step": 3980 + }, + { + "epoch": 0.08, + "learning_rate": 9.963728987100454e-05, + "loss": 1.3945, + "step": 3990 + }, + { + "epoch": 0.08, + "learning_rate": 9.963547171195441e-05, + "loss": 1.3676, + "step": 4000 + }, + { + "epoch": 0.08, + "learning_rate": 9.963364902401388e-05, + "loss": 1.3087, + "step": 4010 + }, + { + "epoch": 0.08, + "learning_rate": 9.963182180734926e-05, + "loss": 1.3994, + "step": 4020 + }, + { + "epoch": 0.08, + "learning_rate": 9.962999006212727e-05, + "loss": 1.4359, + "step": 4030 + }, + { + "epoch": 0.08, + "learning_rate": 9.962815378851505e-05, + "loss": 1.2962, + "step": 4040 + }, + { + "epoch": 0.08, + "learning_rate": 9.962631298668015e-05, + "loss": 1.3718, + "step": 4050 + }, + { + "epoch": 0.08, + "learning_rate": 9.962446765679051e-05, + "loss": 1.186, + "step": 4060 + }, + { + "epoch": 0.08, + "learning_rate": 9.962261779901452e-05, + "loss": 1.4768, + "step": 4070 + }, + { + "epoch": 0.08, + "learning_rate": 9.962076341352097e-05, + "loss": 1.2492, + "step": 4080 + }, + { + "epoch": 0.08, + "learning_rate": 9.961890450047905e-05, + "loss": 1.2654, + "step": 4090 + }, + { + "epoch": 0.08, + "learning_rate": 9.961704106005838e-05, + "loss": 1.2193, + "step": 4100 + }, + { + "epoch": 0.08, + "learning_rate": 9.961517309242898e-05, + "loss": 1.0234, + "step": 4110 + }, + { + "epoch": 0.08, + "learning_rate": 9.961330059776128e-05, + "loss": 1.466, + "step": 4120 + }, + { + "epoch": 0.08, + "learning_rate": 9.961142357622616e-05, + "loss": 1.3056, + "step": 4130 + }, + { + "epoch": 0.08, + "learning_rate": 9.960954202799486e-05, + "loss": 1.1035, + "step": 4140 + }, + { + "epoch": 0.08, + "learning_rate": 9.960765595323907e-05, + "loss": 1.0571, + "step": 4150 + }, + { + "epoch": 0.08, + "learning_rate": 9.960576535213088e-05, + "loss": 1.6929, + "step": 4160 + }, + { + "epoch": 0.08, + "learning_rate": 9.960387022484279e-05, + "loss": 1.2753, + "step": 4170 + }, + { + "epoch": 0.08, + "learning_rate": 9.960197057154772e-05, + "loss": 1.5613, + "step": 4180 + }, + { + "epoch": 0.08, + "learning_rate": 9.960006639241898e-05, + "loss": 1.4367, + "step": 4190 + }, + { + "epoch": 0.08, + "learning_rate": 9.959815768763037e-05, + "loss": 1.3649, + "step": 4200 + }, + { + "epoch": 0.08, + "learning_rate": 9.959624445735598e-05, + "loss": 1.2436, + "step": 4210 + }, + { + "epoch": 0.08, + "learning_rate": 9.959432670177041e-05, + "loss": 1.3484, + "step": 4220 + }, + { + "epoch": 0.08, + "learning_rate": 9.959240442104864e-05, + "loss": 1.346, + "step": 4230 + }, + { + "epoch": 0.08, + "learning_rate": 9.959047761536607e-05, + "loss": 1.4762, + "step": 4240 + }, + { + "epoch": 0.08, + "learning_rate": 9.958854628489851e-05, + "loss": 1.3351, + "step": 4250 + }, + { + "epoch": 0.08, + "learning_rate": 9.958661042982216e-05, + "loss": 1.3207, + "step": 4260 + }, + { + "epoch": 0.08, + "learning_rate": 9.958467005031366e-05, + "loss": 1.3722, + "step": 4270 + }, + { + "epoch": 0.08, + "learning_rate": 9.958272514655006e-05, + "loss": 1.6121, + "step": 4280 + }, + { + "epoch": 0.08, + "learning_rate": 9.958077571870882e-05, + "loss": 1.5082, + "step": 4290 + }, + { + "epoch": 0.08, + "learning_rate": 9.957882176696783e-05, + "loss": 1.2211, + "step": 4300 + }, + { + "epoch": 0.08, + "learning_rate": 9.957686329150534e-05, + "loss": 1.5882, + "step": 4310 + }, + { + "epoch": 0.08, + "learning_rate": 9.957490029250007e-05, + "loss": 1.3154, + "step": 4320 + }, + { + "epoch": 0.08, + "learning_rate": 9.957293277013111e-05, + "loss": 1.5031, + "step": 4330 + }, + { + "epoch": 0.08, + "learning_rate": 9.957096072457801e-05, + "loss": 1.2494, + "step": 4340 + }, + { + "epoch": 0.08, + "learning_rate": 9.95689841560207e-05, + "loss": 1.2569, + "step": 4350 + }, + { + "epoch": 0.08, + "learning_rate": 9.95670030646395e-05, + "loss": 1.3808, + "step": 4360 + }, + { + "epoch": 0.08, + "learning_rate": 9.95650174506152e-05, + "loss": 1.3327, + "step": 4370 + }, + { + "epoch": 0.08, + "learning_rate": 9.956302731412895e-05, + "loss": 1.3175, + "step": 4380 + }, + { + "epoch": 0.08, + "learning_rate": 9.956103265536236e-05, + "loss": 1.3404, + "step": 4390 + }, + { + "epoch": 0.08, + "learning_rate": 9.955903347449743e-05, + "loss": 1.1529, + "step": 4400 + }, + { + "epoch": 0.08, + "learning_rate": 9.955702977171654e-05, + "loss": 1.4676, + "step": 4410 + }, + { + "epoch": 0.08, + "learning_rate": 9.955502154720253e-05, + "loss": 1.3654, + "step": 4420 + }, + { + "epoch": 0.09, + "learning_rate": 9.955300880113866e-05, + "loss": 1.307, + "step": 4430 + }, + { + "epoch": 0.09, + "learning_rate": 9.955099153370855e-05, + "loss": 1.1598, + "step": 4440 + }, + { + "epoch": 0.09, + "learning_rate": 9.954896974509627e-05, + "loss": 1.1874, + "step": 4450 + }, + { + "epoch": 0.09, + "learning_rate": 9.95469434354863e-05, + "loss": 1.386, + "step": 4460 + }, + { + "epoch": 0.09, + "learning_rate": 9.954491260506351e-05, + "loss": 1.147, + "step": 4470 + }, + { + "epoch": 0.09, + "learning_rate": 9.954287725401322e-05, + "loss": 1.3012, + "step": 4480 + }, + { + "epoch": 0.09, + "learning_rate": 9.954083738252114e-05, + "loss": 1.1995, + "step": 4490 + }, + { + "epoch": 0.09, + "learning_rate": 9.953879299077337e-05, + "loss": 1.1864, + "step": 4500 + }, + { + "epoch": 0.09, + "learning_rate": 9.953674407895647e-05, + "loss": 1.2765, + "step": 4510 + }, + { + "epoch": 0.09, + "learning_rate": 9.953469064725737e-05, + "loss": 1.3308, + "step": 4520 + }, + { + "epoch": 0.09, + "learning_rate": 9.953263269586346e-05, + "loss": 1.4213, + "step": 4530 + }, + { + "epoch": 0.09, + "learning_rate": 9.953057022496248e-05, + "loss": 1.3585, + "step": 4540 + }, + { + "epoch": 0.09, + "learning_rate": 9.952850323474265e-05, + "loss": 1.4576, + "step": 4550 + }, + { + "epoch": 0.09, + "learning_rate": 9.952643172539253e-05, + "loss": 1.4012, + "step": 4560 + }, + { + "epoch": 0.09, + "learning_rate": 9.952435569710117e-05, + "loss": 1.2296, + "step": 4570 + }, + { + "epoch": 0.09, + "learning_rate": 9.952227515005797e-05, + "loss": 1.5211, + "step": 4580 + }, + { + "epoch": 0.09, + "learning_rate": 9.952019008445277e-05, + "loss": 1.4293, + "step": 4590 + }, + { + "epoch": 0.09, + "learning_rate": 9.951810050047581e-05, + "loss": 1.1504, + "step": 4600 + }, + { + "epoch": 0.09, + "learning_rate": 9.951600639831778e-05, + "loss": 1.3165, + "step": 4610 + }, + { + "epoch": 0.09, + "learning_rate": 9.951390777816971e-05, + "loss": 1.3421, + "step": 4620 + }, + { + "epoch": 0.09, + "learning_rate": 9.95118046402231e-05, + "loss": 1.233, + "step": 4630 + }, + { + "epoch": 0.09, + "learning_rate": 9.950969698466986e-05, + "loss": 1.264, + "step": 4640 + }, + { + "epoch": 0.09, + "learning_rate": 9.950758481170229e-05, + "loss": 1.3277, + "step": 4650 + }, + { + "epoch": 0.09, + "learning_rate": 9.950546812151311e-05, + "loss": 1.3612, + "step": 4660 + }, + { + "epoch": 0.09, + "learning_rate": 9.950334691429545e-05, + "loss": 1.2901, + "step": 4670 + }, + { + "epoch": 0.09, + "learning_rate": 9.950122119024287e-05, + "loss": 1.3418, + "step": 4680 + }, + { + "epoch": 0.09, + "learning_rate": 9.949909094954933e-05, + "loss": 1.0178, + "step": 4690 + }, + { + "epoch": 0.09, + "learning_rate": 9.949695619240916e-05, + "loss": 1.2333, + "step": 4700 + }, + { + "epoch": 0.09, + "learning_rate": 9.949481691901718e-05, + "loss": 1.5076, + "step": 4710 + }, + { + "epoch": 0.09, + "learning_rate": 9.949267312956855e-05, + "loss": 1.3271, + "step": 4720 + }, + { + "epoch": 0.09, + "learning_rate": 9.949052482425893e-05, + "loss": 1.448, + "step": 4730 + }, + { + "epoch": 0.09, + "learning_rate": 9.948837200328429e-05, + "loss": 1.3328, + "step": 4740 + }, + { + "epoch": 0.09, + "learning_rate": 9.948621466684108e-05, + "loss": 1.3179, + "step": 4750 + }, + { + "epoch": 0.09, + "learning_rate": 9.948405281512614e-05, + "loss": 1.3409, + "step": 4760 + }, + { + "epoch": 0.09, + "learning_rate": 9.948188644833671e-05, + "loss": 1.3366, + "step": 4770 + }, + { + "epoch": 0.09, + "learning_rate": 9.947971556667048e-05, + "loss": 1.3604, + "step": 4780 + }, + { + "epoch": 0.09, + "learning_rate": 9.947754017032551e-05, + "loss": 1.4013, + "step": 4790 + }, + { + "epoch": 0.09, + "learning_rate": 9.947536025950031e-05, + "loss": 1.5929, + "step": 4800 + }, + { + "epoch": 0.09, + "learning_rate": 9.947317583439375e-05, + "loss": 1.3983, + "step": 4810 + }, + { + "epoch": 0.09, + "learning_rate": 9.947098689520516e-05, + "loss": 1.3858, + "step": 4820 + }, + { + "epoch": 0.09, + "learning_rate": 9.946879344213426e-05, + "loss": 1.3243, + "step": 4830 + }, + { + "epoch": 0.09, + "learning_rate": 9.94665954753812e-05, + "loss": 1.0476, + "step": 4840 + }, + { + "epoch": 0.09, + "learning_rate": 9.946439299514653e-05, + "loss": 1.2685, + "step": 4850 + }, + { + "epoch": 0.09, + "learning_rate": 9.94621860016312e-05, + "loss": 1.4931, + "step": 4860 + }, + { + "epoch": 0.09, + "learning_rate": 9.945997449503657e-05, + "loss": 1.2334, + "step": 4870 + }, + { + "epoch": 0.09, + "learning_rate": 9.945775847556445e-05, + "loss": 1.2166, + "step": 4880 + }, + { + "epoch": 0.09, + "learning_rate": 9.945553794341703e-05, + "loss": 1.2837, + "step": 4890 + }, + { + "epoch": 0.09, + "learning_rate": 9.945331289879692e-05, + "loss": 1.3663, + "step": 4900 + }, + { + "epoch": 0.09, + "learning_rate": 9.945108334190713e-05, + "loss": 1.3059, + "step": 4910 + }, + { + "epoch": 0.09, + "learning_rate": 9.944884927295108e-05, + "loss": 1.3455, + "step": 4920 + }, + { + "epoch": 0.09, + "learning_rate": 9.944661069213264e-05, + "loss": 1.3991, + "step": 4930 + }, + { + "epoch": 0.09, + "learning_rate": 9.944436759965607e-05, + "loss": 1.3451, + "step": 4940 + }, + { + "epoch": 0.1, + "learning_rate": 9.9442119995726e-05, + "loss": 1.4169, + "step": 4950 + }, + { + "epoch": 0.1, + "learning_rate": 9.943986788054753e-05, + "loss": 1.2441, + "step": 4960 + }, + { + "epoch": 0.1, + "learning_rate": 9.943761125432616e-05, + "loss": 1.4679, + "step": 4970 + }, + { + "epoch": 0.1, + "learning_rate": 9.943535011726776e-05, + "loss": 1.2354, + "step": 4980 + }, + { + "epoch": 0.1, + "learning_rate": 9.943308446957868e-05, + "loss": 1.1651, + "step": 4990 + }, + { + "epoch": 0.1, + "learning_rate": 9.943081431146563e-05, + "loss": 1.0765, + "step": 5000 + }, + { + "epoch": 0.1, + "learning_rate": 9.942853964313574e-05, + "loss": 1.2185, + "step": 5010 + }, + { + "epoch": 0.1, + "learning_rate": 9.942626046479655e-05, + "loss": 1.3779, + "step": 5020 + }, + { + "epoch": 0.1, + "learning_rate": 9.942397677665605e-05, + "loss": 1.3761, + "step": 5030 + }, + { + "epoch": 0.1, + "learning_rate": 9.942168857892258e-05, + "loss": 1.1939, + "step": 5040 + }, + { + "epoch": 0.1, + "learning_rate": 9.941939587180492e-05, + "loss": 1.4915, + "step": 5050 + }, + { + "epoch": 0.1, + "learning_rate": 9.94170986555123e-05, + "loss": 1.1359, + "step": 5060 + }, + { + "epoch": 0.1, + "learning_rate": 9.941479693025428e-05, + "loss": 1.3325, + "step": 5070 + }, + { + "epoch": 0.1, + "learning_rate": 9.94124906962409e-05, + "loss": 1.2584, + "step": 5080 + }, + { + "epoch": 0.1, + "learning_rate": 9.94101799536826e-05, + "loss": 1.1938, + "step": 5090 + }, + { + "epoch": 0.1, + "learning_rate": 9.94078647027902e-05, + "loss": 1.1098, + "step": 5100 + }, + { + "epoch": 0.1, + "learning_rate": 9.940554494377495e-05, + "loss": 1.1939, + "step": 5110 + }, + { + "epoch": 0.1, + "learning_rate": 9.940322067684852e-05, + "loss": 1.2726, + "step": 5120 + }, + { + "epoch": 0.1, + "learning_rate": 9.940089190222297e-05, + "loss": 1.2925, + "step": 5130 + }, + { + "epoch": 0.1, + "learning_rate": 9.939855862011081e-05, + "loss": 1.3837, + "step": 5140 + }, + { + "epoch": 0.1, + "learning_rate": 9.93962208307249e-05, + "loss": 1.436, + "step": 5150 + }, + { + "epoch": 0.1, + "learning_rate": 9.93938785342786e-05, + "loss": 1.2485, + "step": 5160 + }, + { + "epoch": 0.1, + "learning_rate": 9.939153173098556e-05, + "loss": 1.3532, + "step": 5170 + }, + { + "epoch": 0.1, + "learning_rate": 9.938918042105996e-05, + "loss": 1.2223, + "step": 5180 + }, + { + "epoch": 0.1, + "learning_rate": 9.938682460471634e-05, + "loss": 1.4696, + "step": 5190 + }, + { + "epoch": 0.1, + "learning_rate": 9.938446428216962e-05, + "loss": 1.443, + "step": 5200 + }, + { + "epoch": 0.1, + "learning_rate": 9.938209945363518e-05, + "loss": 1.2612, + "step": 5210 + }, + { + "epoch": 0.1, + "learning_rate": 9.937973011932879e-05, + "loss": 1.3298, + "step": 5220 + }, + { + "epoch": 0.1, + "learning_rate": 9.937735627946664e-05, + "loss": 1.3296, + "step": 5230 + }, + { + "epoch": 0.1, + "learning_rate": 9.937497793426536e-05, + "loss": 1.2662, + "step": 5240 + }, + { + "epoch": 0.1, + "learning_rate": 9.937259508394189e-05, + "loss": 1.3806, + "step": 5250 + }, + { + "epoch": 0.1, + "learning_rate": 9.937020772871368e-05, + "loss": 1.3534, + "step": 5260 + }, + { + "epoch": 0.1, + "learning_rate": 9.936781586879857e-05, + "loss": 1.1739, + "step": 5270 + }, + { + "epoch": 0.1, + "learning_rate": 9.936541950441479e-05, + "loss": 1.3313, + "step": 5280 + }, + { + "epoch": 0.1, + "learning_rate": 9.936301863578099e-05, + "loss": 1.1424, + "step": 5290 + }, + { + "epoch": 0.1, + "learning_rate": 9.936061326311626e-05, + "loss": 1.4169, + "step": 5300 + }, + { + "epoch": 0.1, + "learning_rate": 9.935820338664002e-05, + "loss": 1.3815, + "step": 5310 + }, + { + "epoch": 0.1, + "learning_rate": 9.935578900657218e-05, + "loss": 1.0693, + "step": 5320 + }, + { + "epoch": 0.1, + "learning_rate": 9.935337012313307e-05, + "loss": 1.2608, + "step": 5330 + }, + { + "epoch": 0.1, + "learning_rate": 9.935094673654333e-05, + "loss": 1.2212, + "step": 5340 + }, + { + "epoch": 0.1, + "learning_rate": 9.934851884702414e-05, + "loss": 1.2499, + "step": 5350 + }, + { + "epoch": 0.1, + "learning_rate": 9.934608645479698e-05, + "loss": 1.1823, + "step": 5360 + }, + { + "epoch": 0.1, + "learning_rate": 9.934364956008382e-05, + "loss": 1.2197, + "step": 5370 + }, + { + "epoch": 0.1, + "learning_rate": 9.934120816310699e-05, + "loss": 1.2803, + "step": 5380 + }, + { + "epoch": 0.1, + "learning_rate": 9.933876226408927e-05, + "loss": 1.0522, + "step": 5390 + }, + { + "epoch": 0.1, + "learning_rate": 9.933631186325382e-05, + "loss": 1.1957, + "step": 5400 + }, + { + "epoch": 0.1, + "learning_rate": 9.933385696082422e-05, + "loss": 1.2611, + "step": 5410 + }, + { + "epoch": 0.1, + "learning_rate": 9.933139755702445e-05, + "loss": 1.3267, + "step": 5420 + }, + { + "epoch": 0.1, + "learning_rate": 9.932893365207896e-05, + "loss": 1.2291, + "step": 5430 + }, + { + "epoch": 0.1, + "learning_rate": 9.93264652462125e-05, + "loss": 1.3878, + "step": 5440 + }, + { + "epoch": 0.1, + "learning_rate": 9.932399233965035e-05, + "loss": 1.3184, + "step": 5450 + }, + { + "epoch": 0.1, + "learning_rate": 9.932151493261812e-05, + "loss": 1.437, + "step": 5460 + }, + { + "epoch": 0.11, + "learning_rate": 9.931903302534185e-05, + "loss": 1.5066, + "step": 5470 + }, + { + "epoch": 0.11, + "learning_rate": 9.931654661804801e-05, + "loss": 1.2534, + "step": 5480 + }, + { + "epoch": 0.11, + "learning_rate": 9.931405571096346e-05, + "loss": 1.1359, + "step": 5490 + }, + { + "epoch": 0.11, + "learning_rate": 9.931156030431548e-05, + "loss": 1.3241, + "step": 5500 + }, + { + "epoch": 0.11, + "learning_rate": 9.930906039833177e-05, + "loss": 1.5322, + "step": 5510 + }, + { + "epoch": 0.11, + "learning_rate": 9.930655599324041e-05, + "loss": 1.3395, + "step": 5520 + }, + { + "epoch": 0.11, + "learning_rate": 9.930404708926991e-05, + "loss": 1.3896, + "step": 5530 + }, + { + "epoch": 0.11, + "learning_rate": 9.930153368664921e-05, + "loss": 1.2139, + "step": 5540 + }, + { + "epoch": 0.11, + "learning_rate": 9.929901578560763e-05, + "loss": 1.2718, + "step": 5550 + }, + { + "epoch": 0.11, + "learning_rate": 9.929649338637491e-05, + "loss": 1.2648, + "step": 5560 + }, + { + "epoch": 0.11, + "learning_rate": 9.92939664891812e-05, + "loss": 1.2574, + "step": 5570 + }, + { + "epoch": 0.11, + "learning_rate": 9.929143509425705e-05, + "loss": 1.3138, + "step": 5580 + }, + { + "epoch": 0.11, + "learning_rate": 9.928889920183344e-05, + "loss": 1.2763, + "step": 5590 + }, + { + "epoch": 0.11, + "learning_rate": 9.928635881214177e-05, + "loss": 1.2074, + "step": 5600 + }, + { + "epoch": 0.11, + "learning_rate": 9.928381392541382e-05, + "loss": 1.414, + "step": 5610 + }, + { + "epoch": 0.11, + "learning_rate": 9.928126454188178e-05, + "loss": 1.3734, + "step": 5620 + }, + { + "epoch": 0.11, + "learning_rate": 9.927871066177829e-05, + "loss": 1.1972, + "step": 5630 + }, + { + "epoch": 0.11, + "learning_rate": 9.927615228533635e-05, + "loss": 1.1967, + "step": 5640 + }, + { + "epoch": 0.11, + "learning_rate": 9.927358941278942e-05, + "loss": 1.6523, + "step": 5650 + }, + { + "epoch": 0.11, + "learning_rate": 9.927102204437133e-05, + "loss": 1.1186, + "step": 5660 + }, + { + "epoch": 0.11, + "learning_rate": 9.926845018031631e-05, + "loss": 1.1298, + "step": 5670 + }, + { + "epoch": 0.11, + "learning_rate": 9.926587382085906e-05, + "loss": 1.2431, + "step": 5680 + }, + { + "epoch": 0.11, + "learning_rate": 9.926329296623465e-05, + "loss": 1.2669, + "step": 5690 + }, + { + "epoch": 0.11, + "learning_rate": 9.926070761667854e-05, + "loss": 1.1762, + "step": 5700 + }, + { + "epoch": 0.11, + "learning_rate": 9.925811777242664e-05, + "loss": 1.4493, + "step": 5710 + }, + { + "epoch": 0.11, + "learning_rate": 9.925552343371527e-05, + "loss": 1.1156, + "step": 5720 + }, + { + "epoch": 0.11, + "learning_rate": 9.925292460078113e-05, + "loss": 1.3443, + "step": 5730 + }, + { + "epoch": 0.11, + "learning_rate": 9.925032127386136e-05, + "loss": 1.2967, + "step": 5740 + }, + { + "epoch": 0.11, + "learning_rate": 9.924771345319346e-05, + "loss": 1.5565, + "step": 5750 + }, + { + "epoch": 0.11, + "learning_rate": 9.924510113901542e-05, + "loss": 1.3646, + "step": 5760 + }, + { + "epoch": 0.11, + "learning_rate": 9.924248433156556e-05, + "loss": 1.0625, + "step": 5770 + }, + { + "epoch": 0.11, + "learning_rate": 9.923986303108266e-05, + "loss": 1.1386, + "step": 5780 + }, + { + "epoch": 0.11, + "learning_rate": 9.92372372378059e-05, + "loss": 1.4176, + "step": 5790 + }, + { + "epoch": 0.11, + "learning_rate": 9.923460695197486e-05, + "loss": 1.4019, + "step": 5800 + }, + { + "epoch": 0.11, + "learning_rate": 9.923197217382953e-05, + "loss": 1.2456, + "step": 5810 + }, + { + "epoch": 0.11, + "learning_rate": 9.922933290361034e-05, + "loss": 1.7389, + "step": 5820 + }, + { + "epoch": 0.11, + "learning_rate": 9.922668914155806e-05, + "loss": 1.2519, + "step": 5830 + }, + { + "epoch": 0.11, + "learning_rate": 9.922404088791396e-05, + "loss": 1.3408, + "step": 5840 + }, + { + "epoch": 0.11, + "learning_rate": 9.922138814291965e-05, + "loss": 1.3465, + "step": 5850 + }, + { + "epoch": 0.11, + "learning_rate": 9.921873090681716e-05, + "loss": 1.2421, + "step": 5860 + }, + { + "epoch": 0.11, + "learning_rate": 9.9216069179849e-05, + "loss": 1.2956, + "step": 5870 + }, + { + "epoch": 0.11, + "learning_rate": 9.921340296225798e-05, + "loss": 1.1981, + "step": 5880 + }, + { + "epoch": 0.11, + "learning_rate": 9.921073225428739e-05, + "loss": 1.2752, + "step": 5890 + }, + { + "epoch": 0.11, + "learning_rate": 9.920805705618091e-05, + "loss": 1.1301, + "step": 5900 + }, + { + "epoch": 0.11, + "learning_rate": 9.920537736818265e-05, + "loss": 1.3806, + "step": 5910 + }, + { + "epoch": 0.11, + "learning_rate": 9.92026931905371e-05, + "loss": 1.3252, + "step": 5920 + }, + { + "epoch": 0.11, + "learning_rate": 9.920000452348917e-05, + "loss": 1.3651, + "step": 5930 + }, + { + "epoch": 0.11, + "learning_rate": 9.919731136728419e-05, + "loss": 1.3466, + "step": 5940 + }, + { + "epoch": 0.11, + "learning_rate": 9.919461372216788e-05, + "loss": 1.1675, + "step": 5950 + }, + { + "epoch": 0.11, + "learning_rate": 9.91919115883864e-05, + "loss": 1.2723, + "step": 5960 + }, + { + "epoch": 0.11, + "learning_rate": 9.918920496618626e-05, + "loss": 1.2592, + "step": 5970 + }, + { + "epoch": 0.11, + "learning_rate": 9.918649385581449e-05, + "loss": 1.2989, + "step": 5980 + }, + { + "epoch": 0.12, + "learning_rate": 9.91837782575184e-05, + "loss": 1.5011, + "step": 5990 + }, + { + "epoch": 0.12, + "learning_rate": 9.91810581715458e-05, + "loss": 1.2073, + "step": 6000 + }, + { + "epoch": 0.12, + "learning_rate": 9.917833359814484e-05, + "loss": 1.3457, + "step": 6010 + }, + { + "epoch": 0.12, + "learning_rate": 9.917560453756419e-05, + "loss": 1.2271, + "step": 6020 + }, + { + "epoch": 0.12, + "learning_rate": 9.917287099005276e-05, + "loss": 1.4907, + "step": 6030 + }, + { + "epoch": 0.12, + "learning_rate": 9.917013295586007e-05, + "loss": 1.4253, + "step": 6040 + }, + { + "epoch": 0.12, + "learning_rate": 9.916739043523588e-05, + "loss": 1.4048, + "step": 6050 + }, + { + "epoch": 0.12, + "learning_rate": 9.916464342843044e-05, + "loss": 1.3438, + "step": 6060 + }, + { + "epoch": 0.12, + "learning_rate": 9.91618919356944e-05, + "loss": 1.3314, + "step": 6070 + }, + { + "epoch": 0.12, + "learning_rate": 9.915913595727882e-05, + "loss": 1.5093, + "step": 6080 + }, + { + "epoch": 0.12, + "learning_rate": 9.915637549343514e-05, + "loss": 1.3973, + "step": 6090 + }, + { + "epoch": 0.12, + "learning_rate": 9.915361054441528e-05, + "loss": 1.253, + "step": 6100 + }, + { + "epoch": 0.12, + "learning_rate": 9.915084111047147e-05, + "loss": 1.4922, + "step": 6110 + }, + { + "epoch": 0.12, + "learning_rate": 9.914806719185643e-05, + "loss": 1.1819, + "step": 6120 + }, + { + "epoch": 0.12, + "learning_rate": 9.914528878882326e-05, + "loss": 1.2614, + "step": 6130 + }, + { + "epoch": 0.12, + "learning_rate": 9.914250590162546e-05, + "loss": 1.3158, + "step": 6140 + }, + { + "epoch": 0.12, + "learning_rate": 9.913971853051696e-05, + "loss": 1.5722, + "step": 6150 + }, + { + "epoch": 0.12, + "learning_rate": 9.913692667575208e-05, + "loss": 1.2991, + "step": 6160 + }, + { + "epoch": 0.12, + "learning_rate": 9.913413033758554e-05, + "loss": 1.2018, + "step": 6170 + }, + { + "epoch": 0.12, + "learning_rate": 9.913132951627251e-05, + "loss": 1.185, + "step": 6180 + }, + { + "epoch": 0.12, + "learning_rate": 9.912852421206856e-05, + "loss": 1.3143, + "step": 6190 + }, + { + "epoch": 0.12, + "learning_rate": 9.912571442522963e-05, + "loss": 1.432, + "step": 6200 + }, + { + "epoch": 0.12, + "learning_rate": 9.912290015601208e-05, + "loss": 1.228, + "step": 6210 + }, + { + "epoch": 0.12, + "learning_rate": 9.912008140467274e-05, + "loss": 1.3895, + "step": 6220 + }, + { + "epoch": 0.12, + "learning_rate": 9.911725817146875e-05, + "loss": 1.2642, + "step": 6230 + }, + { + "epoch": 0.12, + "learning_rate": 9.911443045665776e-05, + "loss": 1.273, + "step": 6240 + }, + { + "epoch": 0.12, + "learning_rate": 9.911159826049774e-05, + "loss": 1.4531, + "step": 6250 + }, + { + "epoch": 0.12, + "learning_rate": 9.91087615832471e-05, + "loss": 1.193, + "step": 6260 + }, + { + "epoch": 0.12, + "learning_rate": 9.910592042516471e-05, + "loss": 1.4373, + "step": 6270 + }, + { + "epoch": 0.12, + "learning_rate": 9.910307478650978e-05, + "loss": 1.4789, + "step": 6280 + }, + { + "epoch": 0.12, + "learning_rate": 9.910022466754195e-05, + "loss": 1.2663, + "step": 6290 + }, + { + "epoch": 0.12, + "learning_rate": 9.909737006852128e-05, + "loss": 1.2694, + "step": 6300 + }, + { + "epoch": 0.12, + "learning_rate": 9.909451098970824e-05, + "loss": 1.4176, + "step": 6310 + }, + { + "epoch": 0.12, + "learning_rate": 9.909164743136369e-05, + "loss": 1.3513, + "step": 6320 + }, + { + "epoch": 0.12, + "learning_rate": 9.908877939374892e-05, + "loss": 1.2542, + "step": 6330 + }, + { + "epoch": 0.12, + "learning_rate": 9.90859068771256e-05, + "loss": 1.3829, + "step": 6340 + }, + { + "epoch": 0.12, + "learning_rate": 9.908302988175586e-05, + "loss": 1.1073, + "step": 6350 + }, + { + "epoch": 0.12, + "learning_rate": 9.908014840790216e-05, + "loss": 1.282, + "step": 6360 + }, + { + "epoch": 0.12, + "learning_rate": 9.907726245582747e-05, + "loss": 1.1775, + "step": 6370 + }, + { + "epoch": 0.12, + "learning_rate": 9.907437202579507e-05, + "loss": 1.5318, + "step": 6380 + }, + { + "epoch": 0.12, + "learning_rate": 9.907147711806869e-05, + "loss": 1.124, + "step": 6390 + }, + { + "epoch": 0.12, + "learning_rate": 9.906857773291249e-05, + "loss": 1.3886, + "step": 6400 + }, + { + "epoch": 0.12, + "learning_rate": 9.906567387059103e-05, + "loss": 1.3465, + "step": 6410 + }, + { + "epoch": 0.12, + "learning_rate": 9.906276553136923e-05, + "loss": 1.3887, + "step": 6420 + }, + { + "epoch": 0.12, + "learning_rate": 9.90598527155125e-05, + "loss": 1.2334, + "step": 6430 + }, + { + "epoch": 0.12, + "learning_rate": 9.905693542328658e-05, + "loss": 1.2251, + "step": 6440 + }, + { + "epoch": 0.12, + "learning_rate": 9.905401365495766e-05, + "loss": 1.3017, + "step": 6450 + }, + { + "epoch": 0.12, + "learning_rate": 9.905108741079232e-05, + "loss": 1.3361, + "step": 6460 + }, + { + "epoch": 0.12, + "learning_rate": 9.90481566910576e-05, + "loss": 1.4113, + "step": 6470 + }, + { + "epoch": 0.12, + "learning_rate": 9.904522149602086e-05, + "loss": 1.2214, + "step": 6480 + }, + { + "epoch": 0.12, + "learning_rate": 9.904228182594995e-05, + "loss": 1.4428, + "step": 6490 + }, + { + "epoch": 0.12, + "learning_rate": 9.903933768111306e-05, + "loss": 1.2321, + "step": 6500 + }, + { + "epoch": 0.13, + "learning_rate": 9.903638906177887e-05, + "loss": 1.1375, + "step": 6510 + }, + { + "epoch": 0.13, + "learning_rate": 9.903343596821637e-05, + "loss": 1.3733, + "step": 6520 + }, + { + "epoch": 0.13, + "learning_rate": 9.903047840069505e-05, + "loss": 1.2392, + "step": 6530 + }, + { + "epoch": 0.13, + "learning_rate": 9.902751635948475e-05, + "loss": 1.7574, + "step": 6540 + }, + { + "epoch": 0.13, + "learning_rate": 9.902454984485574e-05, + "loss": 1.3911, + "step": 6550 + }, + { + "epoch": 0.13, + "learning_rate": 9.902157885707868e-05, + "loss": 0.9818, + "step": 6560 + }, + { + "epoch": 0.13, + "learning_rate": 9.901860339642468e-05, + "loss": 1.4248, + "step": 6570 + }, + { + "epoch": 0.13, + "learning_rate": 9.90156234631652e-05, + "loss": 1.3005, + "step": 6580 + }, + { + "epoch": 0.13, + "learning_rate": 9.901263905757215e-05, + "loss": 1.2265, + "step": 6590 + }, + { + "epoch": 0.13, + "learning_rate": 9.900965017991784e-05, + "loss": 1.2636, + "step": 6600 + }, + { + "epoch": 0.13, + "learning_rate": 9.900665683047499e-05, + "loss": 1.3453, + "step": 6610 + }, + { + "epoch": 0.13, + "learning_rate": 9.900365900951669e-05, + "loss": 1.4115, + "step": 6620 + }, + { + "epoch": 0.13, + "learning_rate": 9.900065671731652e-05, + "loss": 1.2485, + "step": 6630 + }, + { + "epoch": 0.13, + "learning_rate": 9.899764995414838e-05, + "loss": 1.1799, + "step": 6640 + }, + { + "epoch": 0.13, + "learning_rate": 9.899463872028663e-05, + "loss": 1.295, + "step": 6650 + }, + { + "epoch": 0.13, + "learning_rate": 9.899162301600601e-05, + "loss": 1.3853, + "step": 6660 + }, + { + "epoch": 0.13, + "learning_rate": 9.898860284158172e-05, + "loss": 1.2228, + "step": 6670 + }, + { + "epoch": 0.13, + "learning_rate": 9.898557819728928e-05, + "loss": 1.3557, + "step": 6680 + }, + { + "epoch": 0.13, + "learning_rate": 9.89825490834047e-05, + "loss": 1.319, + "step": 6690 + }, + { + "epoch": 0.13, + "learning_rate": 9.897951550020436e-05, + "loss": 1.5404, + "step": 6700 + }, + { + "epoch": 0.13, + "learning_rate": 9.897647744796504e-05, + "loss": 1.2451, + "step": 6710 + }, + { + "epoch": 0.13, + "learning_rate": 9.897343492696395e-05, + "loss": 1.1714, + "step": 6720 + }, + { + "epoch": 0.13, + "learning_rate": 9.897038793747873e-05, + "loss": 1.3124, + "step": 6730 + }, + { + "epoch": 0.13, + "learning_rate": 9.896733647978734e-05, + "loss": 1.3044, + "step": 6740 + }, + { + "epoch": 0.13, + "learning_rate": 9.896428055416825e-05, + "loss": 1.4287, + "step": 6750 + }, + { + "epoch": 0.13, + "learning_rate": 9.896122016090024e-05, + "loss": 1.5254, + "step": 6760 + }, + { + "epoch": 0.13, + "learning_rate": 9.895815530026261e-05, + "loss": 1.4553, + "step": 6770 + }, + { + "epoch": 0.13, + "learning_rate": 9.895508597253498e-05, + "loss": 1.1696, + "step": 6780 + }, + { + "epoch": 0.13, + "learning_rate": 9.895201217799739e-05, + "loss": 1.4748, + "step": 6790 + }, + { + "epoch": 0.13, + "learning_rate": 9.894893391693032e-05, + "loss": 1.5152, + "step": 6800 + }, + { + "epoch": 0.13, + "learning_rate": 9.894585118961464e-05, + "loss": 1.2252, + "step": 6810 + }, + { + "epoch": 0.13, + "learning_rate": 9.894276399633163e-05, + "loss": 1.4116, + "step": 6820 + }, + { + "epoch": 0.13, + "learning_rate": 9.893967233736297e-05, + "loss": 1.2627, + "step": 6830 + }, + { + "epoch": 0.13, + "learning_rate": 9.893657621299072e-05, + "loss": 1.3812, + "step": 6840 + }, + { + "epoch": 0.13, + "learning_rate": 9.893347562349744e-05, + "loss": 1.404, + "step": 6850 + }, + { + "epoch": 0.13, + "learning_rate": 9.893037056916601e-05, + "loss": 1.1933, + "step": 6860 + }, + { + "epoch": 0.13, + "learning_rate": 9.892726105027974e-05, + "loss": 1.5206, + "step": 6870 + }, + { + "epoch": 0.13, + "learning_rate": 9.892414706712235e-05, + "loss": 1.1466, + "step": 6880 + }, + { + "epoch": 0.13, + "learning_rate": 9.892102861997797e-05, + "loss": 1.2785, + "step": 6890 + }, + { + "epoch": 0.13, + "learning_rate": 9.891790570913114e-05, + "loss": 1.2178, + "step": 6900 + }, + { + "epoch": 0.13, + "learning_rate": 9.89147783348668e-05, + "loss": 1.3832, + "step": 6910 + }, + { + "epoch": 0.13, + "learning_rate": 9.89116464974703e-05, + "loss": 1.2707, + "step": 6920 + }, + { + "epoch": 0.13, + "learning_rate": 9.890851019722742e-05, + "loss": 1.5353, + "step": 6930 + }, + { + "epoch": 0.13, + "learning_rate": 9.890536943442431e-05, + "loss": 1.4406, + "step": 6940 + }, + { + "epoch": 0.13, + "learning_rate": 9.890222420934754e-05, + "loss": 1.23, + "step": 6950 + }, + { + "epoch": 0.13, + "learning_rate": 9.889907452228409e-05, + "loss": 1.1093, + "step": 6960 + }, + { + "epoch": 0.13, + "learning_rate": 9.889592037352133e-05, + "loss": 1.3189, + "step": 6970 + }, + { + "epoch": 0.13, + "learning_rate": 9.889276176334709e-05, + "loss": 1.1306, + "step": 6980 + }, + { + "epoch": 0.13, + "learning_rate": 9.888959869204954e-05, + "loss": 1.1474, + "step": 6990 + }, + { + "epoch": 0.13, + "learning_rate": 9.888643115991733e-05, + "loss": 1.2099, + "step": 7000 + }, + { + "epoch": 0.13, + "learning_rate": 9.888325916723942e-05, + "loss": 1.3138, + "step": 7010 + }, + { + "epoch": 0.13, + "learning_rate": 9.888008271430527e-05, + "loss": 1.0532, + "step": 7020 + }, + { + "epoch": 0.14, + "learning_rate": 9.88769018014047e-05, + "loss": 1.4223, + "step": 7030 + }, + { + "epoch": 0.14, + "learning_rate": 9.887371642882794e-05, + "loss": 1.3858, + "step": 7040 + }, + { + "epoch": 0.14, + "learning_rate": 9.887052659686563e-05, + "loss": 1.0461, + "step": 7050 + }, + { + "epoch": 0.14, + "learning_rate": 9.886733230580883e-05, + "loss": 1.6259, + "step": 7060 + }, + { + "epoch": 0.14, + "learning_rate": 9.886413355594901e-05, + "loss": 1.4475, + "step": 7070 + }, + { + "epoch": 0.14, + "learning_rate": 9.8860930347578e-05, + "loss": 1.1167, + "step": 7080 + }, + { + "epoch": 0.14, + "learning_rate": 9.88577226809881e-05, + "loss": 1.1784, + "step": 7090 + }, + { + "epoch": 0.14, + "learning_rate": 9.885451055647196e-05, + "loss": 1.4284, + "step": 7100 + }, + { + "epoch": 0.14, + "learning_rate": 9.885129397432269e-05, + "loss": 1.3067, + "step": 7110 + }, + { + "epoch": 0.14, + "learning_rate": 9.884807293483378e-05, + "loss": 1.3647, + "step": 7120 + }, + { + "epoch": 0.14, + "learning_rate": 9.884484743829909e-05, + "loss": 1.4115, + "step": 7130 + }, + { + "epoch": 0.14, + "learning_rate": 9.884161748501298e-05, + "loss": 1.1733, + "step": 7140 + }, + { + "epoch": 0.14, + "learning_rate": 9.883838307527012e-05, + "loss": 1.3816, + "step": 7150 + }, + { + "epoch": 0.14, + "learning_rate": 9.883514420936564e-05, + "loss": 1.3084, + "step": 7160 + }, + { + "epoch": 0.14, + "learning_rate": 9.883190088759506e-05, + "loss": 1.5996, + "step": 7170 + }, + { + "epoch": 0.14, + "learning_rate": 9.882865311025431e-05, + "loss": 1.3527, + "step": 7180 + }, + { + "epoch": 0.14, + "learning_rate": 9.882540087763973e-05, + "loss": 1.4004, + "step": 7190 + }, + { + "epoch": 0.14, + "learning_rate": 9.882214419004807e-05, + "loss": 1.3129, + "step": 7200 + }, + { + "epoch": 0.14, + "learning_rate": 9.881888304777648e-05, + "loss": 1.3845, + "step": 7210 + }, + { + "epoch": 0.14, + "learning_rate": 9.88156174511225e-05, + "loss": 1.2199, + "step": 7220 + }, + { + "epoch": 0.14, + "learning_rate": 9.881234740038412e-05, + "loss": 1.3709, + "step": 7230 + }, + { + "epoch": 0.14, + "learning_rate": 9.880907289585967e-05, + "loss": 1.1905, + "step": 7240 + }, + { + "epoch": 0.14, + "learning_rate": 9.880579393784797e-05, + "loss": 1.287, + "step": 7250 + }, + { + "epoch": 0.14, + "learning_rate": 9.880251052664816e-05, + "loss": 1.1743, + "step": 7260 + }, + { + "epoch": 0.14, + "learning_rate": 9.879922266255986e-05, + "loss": 1.1883, + "step": 7270 + }, + { + "epoch": 0.14, + "learning_rate": 9.879593034588306e-05, + "loss": 1.4818, + "step": 7280 + }, + { + "epoch": 0.14, + "learning_rate": 9.879263357691814e-05, + "loss": 1.1763, + "step": 7290 + }, + { + "epoch": 0.14, + "learning_rate": 9.878933235596594e-05, + "loss": 1.3497, + "step": 7300 + }, + { + "epoch": 0.14, + "learning_rate": 9.878602668332764e-05, + "loss": 1.3765, + "step": 7310 + }, + { + "epoch": 0.14, + "learning_rate": 9.878271655930488e-05, + "loss": 1.2395, + "step": 7320 + }, + { + "epoch": 0.14, + "learning_rate": 9.877940198419968e-05, + "loss": 1.3532, + "step": 7330 + }, + { + "epoch": 0.14, + "learning_rate": 9.877608295831447e-05, + "loss": 1.2763, + "step": 7340 + }, + { + "epoch": 0.14, + "learning_rate": 9.87727594819521e-05, + "loss": 1.3, + "step": 7350 + }, + { + "epoch": 0.14, + "learning_rate": 9.876943155541578e-05, + "loss": 1.2306, + "step": 7360 + }, + { + "epoch": 0.14, + "learning_rate": 9.876609917900921e-05, + "loss": 1.4453, + "step": 7370 + }, + { + "epoch": 0.14, + "learning_rate": 9.876276235303641e-05, + "loss": 1.2722, + "step": 7380 + }, + { + "epoch": 0.14, + "learning_rate": 9.875942107780185e-05, + "loss": 1.135, + "step": 7390 + }, + { + "epoch": 0.14, + "learning_rate": 9.87560753536104e-05, + "loss": 1.4157, + "step": 7400 + }, + { + "epoch": 0.14, + "learning_rate": 9.875272518076734e-05, + "loss": 1.52, + "step": 7410 + }, + { + "epoch": 0.14, + "learning_rate": 9.874937055957834e-05, + "loss": 1.3416, + "step": 7420 + }, + { + "epoch": 0.14, + "learning_rate": 9.87460114903495e-05, + "loss": 1.2881, + "step": 7430 + }, + { + "epoch": 0.14, + "learning_rate": 9.874264797338729e-05, + "loss": 1.5264, + "step": 7440 + }, + { + "epoch": 0.14, + "learning_rate": 9.873928000899863e-05, + "loss": 1.3366, + "step": 7450 + }, + { + "epoch": 0.14, + "learning_rate": 9.873590759749081e-05, + "loss": 1.3968, + "step": 7460 + }, + { + "epoch": 0.14, + "learning_rate": 9.873253073917153e-05, + "loss": 1.1943, + "step": 7470 + }, + { + "epoch": 0.14, + "learning_rate": 9.872914943434892e-05, + "loss": 1.33, + "step": 7480 + }, + { + "epoch": 0.14, + "learning_rate": 9.872576368333151e-05, + "loss": 1.1105, + "step": 7490 + }, + { + "epoch": 0.14, + "learning_rate": 9.87223734864282e-05, + "loss": 1.2994, + "step": 7500 + }, + { + "epoch": 0.14, + "learning_rate": 9.871897884394833e-05, + "loss": 1.5565, + "step": 7510 + }, + { + "epoch": 0.14, + "learning_rate": 9.871557975620164e-05, + "loss": 1.2055, + "step": 7520 + }, + { + "epoch": 0.14, + "learning_rate": 9.871217622349829e-05, + "loss": 1.4947, + "step": 7530 + }, + { + "epoch": 0.14, + "learning_rate": 9.87087682461488e-05, + "loss": 1.2159, + "step": 7540 + }, + { + "epoch": 0.15, + "learning_rate": 9.870535582446416e-05, + "loss": 1.3459, + "step": 7550 + }, + { + "epoch": 0.15, + "learning_rate": 9.87019389587557e-05, + "loss": 1.3822, + "step": 7560 + }, + { + "epoch": 0.15, + "learning_rate": 9.869851764933518e-05, + "loss": 1.3279, + "step": 7570 + }, + { + "epoch": 0.15, + "learning_rate": 9.869509189651477e-05, + "loss": 1.2908, + "step": 7580 + }, + { + "epoch": 0.15, + "learning_rate": 9.86916617006071e-05, + "loss": 1.2709, + "step": 7590 + }, + { + "epoch": 0.15, + "learning_rate": 9.868822706192509e-05, + "loss": 1.4026, + "step": 7600 + }, + { + "epoch": 0.15, + "learning_rate": 9.868478798078214e-05, + "loss": 1.4043, + "step": 7610 + }, + { + "epoch": 0.15, + "learning_rate": 9.868134445749207e-05, + "loss": 1.3301, + "step": 7620 + }, + { + "epoch": 0.15, + "learning_rate": 9.867789649236903e-05, + "loss": 1.3424, + "step": 7630 + }, + { + "epoch": 0.15, + "learning_rate": 9.867444408572767e-05, + "loss": 1.3771, + "step": 7640 + }, + { + "epoch": 0.15, + "learning_rate": 9.867098723788297e-05, + "loss": 1.3783, + "step": 7650 + }, + { + "epoch": 0.15, + "learning_rate": 9.866752594915036e-05, + "loss": 1.1698, + "step": 7660 + }, + { + "epoch": 0.15, + "learning_rate": 9.866406021984565e-05, + "loss": 1.3314, + "step": 7670 + }, + { + "epoch": 0.15, + "learning_rate": 9.866059005028505e-05, + "loss": 1.2497, + "step": 7680 + }, + { + "epoch": 0.15, + "learning_rate": 9.86571154407852e-05, + "loss": 1.172, + "step": 7690 + }, + { + "epoch": 0.15, + "learning_rate": 9.865363639166314e-05, + "loss": 1.1296, + "step": 7700 + }, + { + "epoch": 0.15, + "learning_rate": 9.865015290323631e-05, + "loss": 1.4019, + "step": 7710 + }, + { + "epoch": 0.15, + "learning_rate": 9.864666497582255e-05, + "loss": 1.3886, + "step": 7720 + }, + { + "epoch": 0.15, + "learning_rate": 9.864317260974011e-05, + "loss": 1.2295, + "step": 7730 + }, + { + "epoch": 0.15, + "learning_rate": 9.863967580530765e-05, + "loss": 1.4068, + "step": 7740 + }, + { + "epoch": 0.15, + "learning_rate": 9.86361745628442e-05, + "loss": 1.3704, + "step": 7750 + }, + { + "epoch": 0.15, + "learning_rate": 9.863266888266924e-05, + "loss": 1.1668, + "step": 7760 + }, + { + "epoch": 0.15, + "learning_rate": 9.862915876510266e-05, + "loss": 1.3474, + "step": 7770 + }, + { + "epoch": 0.15, + "learning_rate": 9.862564421046472e-05, + "loss": 1.1253, + "step": 7780 + }, + { + "epoch": 0.15, + "learning_rate": 9.86221252190761e-05, + "loss": 1.4082, + "step": 7790 + }, + { + "epoch": 0.15, + "learning_rate": 9.861860179125785e-05, + "loss": 1.1985, + "step": 7800 + }, + { + "epoch": 0.15, + "learning_rate": 9.861507392733152e-05, + "loss": 1.2986, + "step": 7810 + }, + { + "epoch": 0.15, + "learning_rate": 9.861154162761896e-05, + "loss": 1.1855, + "step": 7820 + }, + { + "epoch": 0.15, + "learning_rate": 9.860800489244246e-05, + "loss": 1.3365, + "step": 7830 + }, + { + "epoch": 0.15, + "learning_rate": 9.860446372212478e-05, + "loss": 1.3017, + "step": 7840 + }, + { + "epoch": 0.15, + "learning_rate": 9.860091811698895e-05, + "loss": 1.1642, + "step": 7850 + }, + { + "epoch": 0.15, + "learning_rate": 9.859736807735853e-05, + "loss": 1.2197, + "step": 7860 + }, + { + "epoch": 0.15, + "learning_rate": 9.859381360355743e-05, + "loss": 1.3722, + "step": 7870 + }, + { + "epoch": 0.15, + "learning_rate": 9.859025469590997e-05, + "loss": 1.3946, + "step": 7880 + }, + { + "epoch": 0.15, + "learning_rate": 9.858669135474088e-05, + "loss": 1.4931, + "step": 7890 + }, + { + "epoch": 0.15, + "learning_rate": 9.858312358037526e-05, + "loss": 1.5107, + "step": 7900 + }, + { + "epoch": 0.15, + "learning_rate": 9.857955137313868e-05, + "loss": 1.3741, + "step": 7910 + }, + { + "epoch": 0.15, + "learning_rate": 9.857597473335707e-05, + "loss": 1.4331, + "step": 7920 + }, + { + "epoch": 0.15, + "learning_rate": 9.857239366135676e-05, + "loss": 1.2076, + "step": 7930 + }, + { + "epoch": 0.15, + "learning_rate": 9.856880815746452e-05, + "loss": 1.2076, + "step": 7940 + }, + { + "epoch": 0.15, + "learning_rate": 9.856521822200746e-05, + "loss": 1.2114, + "step": 7950 + }, + { + "epoch": 0.15, + "learning_rate": 9.856162385531319e-05, + "loss": 1.1001, + "step": 7960 + }, + { + "epoch": 0.15, + "learning_rate": 9.855802505770964e-05, + "loss": 1.2581, + "step": 7970 + }, + { + "epoch": 0.15, + "learning_rate": 9.855442182952519e-05, + "loss": 1.0122, + "step": 7980 + }, + { + "epoch": 0.15, + "learning_rate": 9.855081417108859e-05, + "loss": 1.0096, + "step": 7990 + }, + { + "epoch": 0.15, + "learning_rate": 9.854720208272903e-05, + "loss": 1.3871, + "step": 8000 + }, + { + "epoch": 0.15, + "learning_rate": 9.854358556477608e-05, + "loss": 1.2386, + "step": 8010 + }, + { + "epoch": 0.15, + "learning_rate": 9.853996461755972e-05, + "loss": 1.2004, + "step": 8020 + }, + { + "epoch": 0.15, + "learning_rate": 9.853633924141036e-05, + "loss": 1.281, + "step": 8030 + }, + { + "epoch": 0.15, + "learning_rate": 9.853270943665875e-05, + "loss": 1.1245, + "step": 8040 + }, + { + "epoch": 0.15, + "learning_rate": 9.852907520363613e-05, + "loss": 1.2192, + "step": 8050 + }, + { + "epoch": 0.15, + "learning_rate": 9.852543654267405e-05, + "loss": 1.4254, + "step": 8060 + }, + { + "epoch": 0.16, + "learning_rate": 9.852179345410454e-05, + "loss": 1.3942, + "step": 8070 + }, + { + "epoch": 0.16, + "learning_rate": 9.851814593826e-05, + "loss": 1.4358, + "step": 8080 + }, + { + "epoch": 0.16, + "learning_rate": 9.851449399547326e-05, + "loss": 1.1081, + "step": 8090 + }, + { + "epoch": 0.16, + "learning_rate": 9.851083762607751e-05, + "loss": 1.4539, + "step": 8100 + }, + { + "epoch": 0.16, + "learning_rate": 9.850717683040638e-05, + "loss": 1.2445, + "step": 8110 + }, + { + "epoch": 0.16, + "learning_rate": 9.850351160879388e-05, + "loss": 1.2617, + "step": 8120 + }, + { + "epoch": 0.16, + "learning_rate": 9.849984196157444e-05, + "loss": 1.2604, + "step": 8130 + }, + { + "epoch": 0.16, + "learning_rate": 9.849616788908289e-05, + "loss": 1.3513, + "step": 8140 + }, + { + "epoch": 0.16, + "learning_rate": 9.849248939165447e-05, + "loss": 1.3139, + "step": 8150 + }, + { + "epoch": 0.16, + "learning_rate": 9.848880646962483e-05, + "loss": 1.2969, + "step": 8160 + }, + { + "epoch": 0.16, + "learning_rate": 9.848511912332998e-05, + "loss": 1.3979, + "step": 8170 + }, + { + "epoch": 0.16, + "learning_rate": 9.848142735310639e-05, + "loss": 1.0536, + "step": 8180 + }, + { + "epoch": 0.16, + "learning_rate": 9.847773115929088e-05, + "loss": 1.5034, + "step": 8190 + }, + { + "epoch": 0.16, + "learning_rate": 9.847403054222074e-05, + "loss": 1.3399, + "step": 8200 + }, + { + "epoch": 0.16, + "learning_rate": 9.847032550223359e-05, + "loss": 1.3307, + "step": 8210 + }, + { + "epoch": 0.16, + "learning_rate": 9.846661603966751e-05, + "loss": 1.3468, + "step": 8220 + }, + { + "epoch": 0.16, + "learning_rate": 9.846290215486095e-05, + "loss": 1.1599, + "step": 8230 + }, + { + "epoch": 0.16, + "learning_rate": 9.845918384815281e-05, + "loss": 1.1876, + "step": 8240 + }, + { + "epoch": 0.16, + "learning_rate": 9.845546111988231e-05, + "loss": 1.3491, + "step": 8250 + }, + { + "epoch": 0.16, + "learning_rate": 9.845173397038914e-05, + "loss": 1.2454, + "step": 8260 + }, + { + "epoch": 0.16, + "learning_rate": 9.844800240001339e-05, + "loss": 1.356, + "step": 8270 + }, + { + "epoch": 0.16, + "learning_rate": 9.844426640909553e-05, + "loss": 1.0493, + "step": 8280 + }, + { + "epoch": 0.16, + "learning_rate": 9.844052599797644e-05, + "loss": 1.3075, + "step": 8290 + }, + { + "epoch": 0.16, + "learning_rate": 9.843678116699741e-05, + "loss": 1.2018, + "step": 8300 + }, + { + "epoch": 0.16, + "learning_rate": 9.843303191650015e-05, + "loss": 1.338, + "step": 8310 + }, + { + "epoch": 0.16, + "learning_rate": 9.842927824682672e-05, + "loss": 1.3271, + "step": 8320 + }, + { + "epoch": 0.16, + "learning_rate": 9.842552015831962e-05, + "loss": 1.2457, + "step": 8330 + }, + { + "epoch": 0.16, + "learning_rate": 9.842175765132178e-05, + "loss": 1.2274, + "step": 8340 + }, + { + "epoch": 0.16, + "learning_rate": 9.841799072617646e-05, + "loss": 1.5004, + "step": 8350 + }, + { + "epoch": 0.16, + "learning_rate": 9.841421938322741e-05, + "loss": 1.3789, + "step": 8360 + }, + { + "epoch": 0.16, + "learning_rate": 9.84104436228187e-05, + "loss": 1.2079, + "step": 8370 + }, + { + "epoch": 0.16, + "learning_rate": 9.840666344529486e-05, + "loss": 1.4544, + "step": 8380 + }, + { + "epoch": 0.16, + "learning_rate": 9.840287885100081e-05, + "loss": 1.5508, + "step": 8390 + }, + { + "epoch": 0.16, + "learning_rate": 9.839908984028185e-05, + "loss": 1.1513, + "step": 8400 + }, + { + "epoch": 0.16, + "learning_rate": 9.839529641348372e-05, + "loss": 1.1086, + "step": 8410 + }, + { + "epoch": 0.16, + "learning_rate": 9.839149857095254e-05, + "loss": 1.2385, + "step": 8420 + }, + { + "epoch": 0.16, + "learning_rate": 9.838769631303481e-05, + "loss": 1.3531, + "step": 8430 + }, + { + "epoch": 0.16, + "learning_rate": 9.83838896400775e-05, + "loss": 1.4215, + "step": 8440 + }, + { + "epoch": 0.16, + "learning_rate": 9.838007855242791e-05, + "loss": 1.2625, + "step": 8450 + }, + { + "epoch": 0.16, + "learning_rate": 9.837626305043379e-05, + "loss": 1.2192, + "step": 8460 + }, + { + "epoch": 0.16, + "learning_rate": 9.83724431344433e-05, + "loss": 1.2347, + "step": 8470 + }, + { + "epoch": 0.16, + "learning_rate": 9.836861880480493e-05, + "loss": 1.4267, + "step": 8480 + }, + { + "epoch": 0.16, + "learning_rate": 9.836479006186765e-05, + "loss": 1.2304, + "step": 8490 + }, + { + "epoch": 0.16, + "learning_rate": 9.836095690598083e-05, + "loss": 1.3287, + "step": 8500 + }, + { + "epoch": 0.16, + "learning_rate": 9.835711933749419e-05, + "loss": 1.2256, + "step": 8510 + }, + { + "epoch": 0.16, + "learning_rate": 9.835327735675787e-05, + "loss": 1.4997, + "step": 8520 + }, + { + "epoch": 0.16, + "learning_rate": 9.834943096412245e-05, + "loss": 1.0479, + "step": 8530 + }, + { + "epoch": 0.16, + "learning_rate": 9.834558015993887e-05, + "loss": 1.2734, + "step": 8540 + }, + { + "epoch": 0.16, + "learning_rate": 9.834172494455851e-05, + "loss": 1.3274, + "step": 8550 + }, + { + "epoch": 0.16, + "learning_rate": 9.83378653183331e-05, + "loss": 1.1544, + "step": 8560 + }, + { + "epoch": 0.16, + "learning_rate": 9.833400128161483e-05, + "loss": 1.2328, + "step": 8570 + }, + { + "epoch": 0.16, + "learning_rate": 9.833013283475627e-05, + "loss": 1.1407, + "step": 8580 + }, + { + "epoch": 0.17, + "learning_rate": 9.832625997811036e-05, + "loss": 1.1987, + "step": 8590 + }, + { + "epoch": 0.17, + "learning_rate": 9.83223827120305e-05, + "loss": 1.3577, + "step": 8600 + }, + { + "epoch": 0.17, + "learning_rate": 9.831850103687044e-05, + "loss": 1.2481, + "step": 8610 + }, + { + "epoch": 0.17, + "learning_rate": 9.831461495298438e-05, + "loss": 1.4829, + "step": 8620 + }, + { + "epoch": 0.17, + "learning_rate": 9.831072446072687e-05, + "loss": 1.1032, + "step": 8630 + }, + { + "epoch": 0.17, + "learning_rate": 9.830682956045291e-05, + "loss": 1.2056, + "step": 8640 + }, + { + "epoch": 0.17, + "learning_rate": 9.830293025251789e-05, + "loss": 0.9819, + "step": 8650 + }, + { + "epoch": 0.17, + "learning_rate": 9.829902653727756e-05, + "loss": 1.6266, + "step": 8660 + }, + { + "epoch": 0.17, + "learning_rate": 9.829511841508815e-05, + "loss": 1.1374, + "step": 8670 + }, + { + "epoch": 0.17, + "learning_rate": 9.829120588630622e-05, + "loss": 1.3165, + "step": 8680 + }, + { + "epoch": 0.17, + "learning_rate": 9.828728895128877e-05, + "loss": 1.2896, + "step": 8690 + }, + { + "epoch": 0.17, + "learning_rate": 9.828336761039318e-05, + "loss": 1.4283, + "step": 8700 + }, + { + "epoch": 0.17, + "learning_rate": 9.827944186397728e-05, + "loss": 1.4235, + "step": 8710 + }, + { + "epoch": 0.17, + "learning_rate": 9.827551171239924e-05, + "loss": 1.3255, + "step": 8720 + }, + { + "epoch": 0.17, + "learning_rate": 9.827157715601765e-05, + "loss": 1.2647, + "step": 8730 + }, + { + "epoch": 0.17, + "learning_rate": 9.826763819519153e-05, + "loss": 1.3183, + "step": 8740 + }, + { + "epoch": 0.17, + "learning_rate": 9.826369483028027e-05, + "loss": 1.325, + "step": 8750 + }, + { + "epoch": 0.17, + "learning_rate": 9.825974706164369e-05, + "loss": 1.6156, + "step": 8760 + }, + { + "epoch": 0.17, + "learning_rate": 9.825579488964198e-05, + "loss": 1.0642, + "step": 8770 + }, + { + "epoch": 0.17, + "learning_rate": 9.825183831463576e-05, + "loss": 1.1888, + "step": 8780 + }, + { + "epoch": 0.17, + "learning_rate": 9.824787733698604e-05, + "loss": 1.4277, + "step": 8790 + }, + { + "epoch": 0.17, + "learning_rate": 9.824391195705423e-05, + "loss": 1.218, + "step": 8800 + }, + { + "epoch": 0.17, + "learning_rate": 9.823994217520212e-05, + "loss": 1.2397, + "step": 8810 + }, + { + "epoch": 0.17, + "learning_rate": 9.823596799179196e-05, + "loss": 1.2788, + "step": 8820 + }, + { + "epoch": 0.17, + "learning_rate": 9.823198940718634e-05, + "loss": 1.4237, + "step": 8830 + }, + { + "epoch": 0.17, + "learning_rate": 9.82280064217483e-05, + "loss": 1.4129, + "step": 8840 + }, + { + "epoch": 0.17, + "learning_rate": 9.822401903584125e-05, + "loss": 1.3467, + "step": 8850 + }, + { + "epoch": 0.17, + "learning_rate": 9.822002724982901e-05, + "loss": 1.4142, + "step": 8860 + }, + { + "epoch": 0.17, + "learning_rate": 9.82160310640758e-05, + "loss": 1.1949, + "step": 8870 + }, + { + "epoch": 0.17, + "learning_rate": 9.821203047894624e-05, + "loss": 1.2524, + "step": 8880 + }, + { + "epoch": 0.17, + "learning_rate": 9.820802549480538e-05, + "loss": 1.2568, + "step": 8890 + }, + { + "epoch": 0.17, + "learning_rate": 9.820401611201862e-05, + "loss": 1.2205, + "step": 8900 + }, + { + "epoch": 0.17, + "learning_rate": 9.820000233095179e-05, + "loss": 1.2848, + "step": 8910 + }, + { + "epoch": 0.17, + "learning_rate": 9.819598415197113e-05, + "loss": 1.2488, + "step": 8920 + }, + { + "epoch": 0.17, + "learning_rate": 9.819196157544328e-05, + "loss": 1.1677, + "step": 8930 + }, + { + "epoch": 0.17, + "learning_rate": 9.818793460173525e-05, + "loss": 1.3149, + "step": 8940 + }, + { + "epoch": 0.17, + "learning_rate": 9.818390323121449e-05, + "loss": 1.4495, + "step": 8950 + }, + { + "epoch": 0.17, + "learning_rate": 9.817986746424881e-05, + "loss": 1.5506, + "step": 8960 + }, + { + "epoch": 0.17, + "learning_rate": 9.817582730120648e-05, + "loss": 1.3322, + "step": 8970 + }, + { + "epoch": 0.17, + "learning_rate": 9.81717827424561e-05, + "loss": 1.402, + "step": 8980 + }, + { + "epoch": 0.17, + "learning_rate": 9.816773378836675e-05, + "loss": 1.3724, + "step": 8990 + }, + { + "epoch": 0.17, + "learning_rate": 9.816368043930785e-05, + "loss": 1.3759, + "step": 9000 + }, + { + "epoch": 0.17, + "learning_rate": 9.815962269564923e-05, + "loss": 1.2096, + "step": 9010 + }, + { + "epoch": 0.17, + "learning_rate": 9.815556055776112e-05, + "loss": 1.2231, + "step": 9020 + }, + { + "epoch": 0.17, + "learning_rate": 9.81514940260142e-05, + "loss": 1.3297, + "step": 9030 + }, + { + "epoch": 0.17, + "learning_rate": 9.814742310077946e-05, + "loss": 1.7098, + "step": 9040 + }, + { + "epoch": 0.17, + "learning_rate": 9.814334778242842e-05, + "loss": 1.3305, + "step": 9050 + }, + { + "epoch": 0.17, + "learning_rate": 9.813926807133285e-05, + "loss": 1.2667, + "step": 9060 + }, + { + "epoch": 0.17, + "learning_rate": 9.813518396786502e-05, + "loss": 1.3842, + "step": 9070 + }, + { + "epoch": 0.17, + "learning_rate": 9.81310954723976e-05, + "loss": 1.5595, + "step": 9080 + }, + { + "epoch": 0.17, + "learning_rate": 9.812700258530361e-05, + "loss": 1.1515, + "step": 9090 + }, + { + "epoch": 0.17, + "learning_rate": 9.81229053069565e-05, + "loss": 1.2127, + "step": 9100 + }, + { + "epoch": 0.18, + "learning_rate": 9.811880363773012e-05, + "loss": 1.2793, + "step": 9110 + }, + { + "epoch": 0.18, + "learning_rate": 9.811469757799873e-05, + "loss": 1.1972, + "step": 9120 + }, + { + "epoch": 0.18, + "learning_rate": 9.811058712813697e-05, + "loss": 1.381, + "step": 9130 + }, + { + "epoch": 0.18, + "learning_rate": 9.810647228851988e-05, + "loss": 1.5509, + "step": 9140 + }, + { + "epoch": 0.18, + "learning_rate": 9.810235305952293e-05, + "loss": 1.317, + "step": 9150 + }, + { + "epoch": 0.18, + "learning_rate": 9.809822944152196e-05, + "loss": 1.4677, + "step": 9160 + }, + { + "epoch": 0.18, + "learning_rate": 9.809410143489321e-05, + "loss": 1.2051, + "step": 9170 + }, + { + "epoch": 0.18, + "learning_rate": 9.808996904001337e-05, + "loss": 1.582, + "step": 9180 + }, + { + "epoch": 0.18, + "learning_rate": 9.808583225725944e-05, + "loss": 1.1585, + "step": 9190 + }, + { + "epoch": 0.18, + "learning_rate": 9.80816910870089e-05, + "loss": 1.2673, + "step": 9200 + }, + { + "epoch": 0.18, + "learning_rate": 9.807754552963964e-05, + "loss": 1.4402, + "step": 9210 + }, + { + "epoch": 0.18, + "learning_rate": 9.807339558552984e-05, + "loss": 1.3071, + "step": 9220 + }, + { + "epoch": 0.18, + "learning_rate": 9.806924125505821e-05, + "loss": 1.2665, + "step": 9230 + }, + { + "epoch": 0.18, + "learning_rate": 9.806508253860376e-05, + "loss": 1.2619, + "step": 9240 + }, + { + "epoch": 0.18, + "learning_rate": 9.806091943654599e-05, + "loss": 1.3016, + "step": 9250 + }, + { + "epoch": 0.18, + "learning_rate": 9.805675194926472e-05, + "loss": 1.17, + "step": 9260 + }, + { + "epoch": 0.18, + "learning_rate": 9.80525800771402e-05, + "loss": 1.2501, + "step": 9270 + }, + { + "epoch": 0.18, + "learning_rate": 9.804840382055311e-05, + "loss": 1.6287, + "step": 9280 + }, + { + "epoch": 0.18, + "learning_rate": 9.804422317988451e-05, + "loss": 1.1335, + "step": 9290 + }, + { + "epoch": 0.18, + "learning_rate": 9.804003815551582e-05, + "loss": 1.2307, + "step": 9300 + }, + { + "epoch": 0.18, + "learning_rate": 9.803584874782891e-05, + "loss": 1.1366, + "step": 9310 + }, + { + "epoch": 0.18, + "learning_rate": 9.803165495720605e-05, + "loss": 1.3496, + "step": 9320 + }, + { + "epoch": 0.18, + "learning_rate": 9.802745678402986e-05, + "loss": 1.3963, + "step": 9330 + }, + { + "epoch": 0.18, + "learning_rate": 9.802325422868343e-05, + "loss": 1.2265, + "step": 9340 + }, + { + "epoch": 0.18, + "learning_rate": 9.801904729155018e-05, + "loss": 1.2618, + "step": 9350 + }, + { + "epoch": 0.18, + "learning_rate": 9.8014835973014e-05, + "loss": 1.2732, + "step": 9360 + }, + { + "epoch": 0.18, + "learning_rate": 9.801062027345912e-05, + "loss": 1.0594, + "step": 9370 + }, + { + "epoch": 0.18, + "learning_rate": 9.80064001932702e-05, + "loss": 1.2305, + "step": 9380 + }, + { + "epoch": 0.18, + "learning_rate": 9.800217573283229e-05, + "loss": 1.149, + "step": 9390 + }, + { + "epoch": 0.18, + "learning_rate": 9.799794689253083e-05, + "loss": 1.2976, + "step": 9400 + }, + { + "epoch": 0.18, + "learning_rate": 9.79937136727517e-05, + "loss": 1.1004, + "step": 9410 + }, + { + "epoch": 0.18, + "learning_rate": 9.798947607388114e-05, + "loss": 1.242, + "step": 9420 + }, + { + "epoch": 0.18, + "learning_rate": 9.79852340963058e-05, + "loss": 1.4456, + "step": 9430 + }, + { + "epoch": 0.18, + "learning_rate": 9.798098774041272e-05, + "loss": 1.3882, + "step": 9440 + }, + { + "epoch": 0.18, + "learning_rate": 9.797673700658936e-05, + "loss": 1.2927, + "step": 9450 + }, + { + "epoch": 0.18, + "learning_rate": 9.797248189522357e-05, + "loss": 1.3206, + "step": 9460 + }, + { + "epoch": 0.18, + "learning_rate": 9.79682224067036e-05, + "loss": 1.3717, + "step": 9470 + }, + { + "epoch": 0.18, + "learning_rate": 9.79639585414181e-05, + "loss": 1.0823, + "step": 9480 + }, + { + "epoch": 0.18, + "learning_rate": 9.79596902997561e-05, + "loss": 1.3667, + "step": 9490 + }, + { + "epoch": 0.18, + "learning_rate": 9.79554176821071e-05, + "loss": 1.1936, + "step": 9500 + }, + { + "epoch": 0.18, + "learning_rate": 9.795114068886088e-05, + "loss": 1.2976, + "step": 9510 + }, + { + "epoch": 0.18, + "learning_rate": 9.794685932040772e-05, + "loss": 1.2484, + "step": 9520 + }, + { + "epoch": 0.18, + "learning_rate": 9.794257357713826e-05, + "loss": 1.0996, + "step": 9530 + }, + { + "epoch": 0.18, + "learning_rate": 9.793828345944356e-05, + "loss": 1.2768, + "step": 9540 + }, + { + "epoch": 0.18, + "learning_rate": 9.793398896771501e-05, + "loss": 1.298, + "step": 9550 + }, + { + "epoch": 0.18, + "learning_rate": 9.792969010234452e-05, + "loss": 1.4902, + "step": 9560 + }, + { + "epoch": 0.18, + "learning_rate": 9.79253868637243e-05, + "loss": 1.2601, + "step": 9570 + }, + { + "epoch": 0.18, + "learning_rate": 9.792107925224698e-05, + "loss": 1.4121, + "step": 9580 + }, + { + "epoch": 0.18, + "learning_rate": 9.791676726830563e-05, + "loss": 1.2839, + "step": 9590 + }, + { + "epoch": 0.18, + "learning_rate": 9.791245091229366e-05, + "loss": 1.0715, + "step": 9600 + }, + { + "epoch": 0.18, + "learning_rate": 9.790813018460492e-05, + "loss": 1.4211, + "step": 9610 + }, + { + "epoch": 0.18, + "learning_rate": 9.790380508563363e-05, + "loss": 1.4622, + "step": 9620 + }, + { + "epoch": 0.19, + "learning_rate": 9.789947561577445e-05, + "loss": 1.2848, + "step": 9630 + }, + { + "epoch": 0.19, + "learning_rate": 9.78951417754224e-05, + "loss": 1.2868, + "step": 9640 + }, + { + "epoch": 0.19, + "learning_rate": 9.789080356497292e-05, + "loss": 1.1533, + "step": 9650 + }, + { + "epoch": 0.19, + "learning_rate": 9.788646098482183e-05, + "loss": 1.4299, + "step": 9660 + }, + { + "epoch": 0.19, + "learning_rate": 9.788211403536536e-05, + "loss": 1.2973, + "step": 9670 + }, + { + "epoch": 0.19, + "learning_rate": 9.787776271700015e-05, + "loss": 1.1985, + "step": 9680 + }, + { + "epoch": 0.19, + "learning_rate": 9.787340703012323e-05, + "loss": 1.5474, + "step": 9690 + }, + { + "epoch": 0.19, + "learning_rate": 9.786904697513202e-05, + "loss": 1.2382, + "step": 9700 + }, + { + "epoch": 0.19, + "learning_rate": 9.786468255242434e-05, + "loss": 1.2455, + "step": 9710 + }, + { + "epoch": 0.19, + "learning_rate": 9.786031376239842e-05, + "loss": 1.2619, + "step": 9720 + }, + { + "epoch": 0.19, + "learning_rate": 9.785594060545286e-05, + "loss": 1.2185, + "step": 9730 + }, + { + "epoch": 0.19, + "learning_rate": 9.785156308198673e-05, + "loss": 1.3427, + "step": 9740 + }, + { + "epoch": 0.19, + "learning_rate": 9.78471811923994e-05, + "loss": 1.2401, + "step": 9750 + }, + { + "epoch": 0.19, + "learning_rate": 9.78427949370907e-05, + "loss": 1.4658, + "step": 9760 + }, + { + "epoch": 0.19, + "learning_rate": 9.783840431646085e-05, + "loss": 1.2106, + "step": 9770 + }, + { + "epoch": 0.19, + "learning_rate": 9.783400933091047e-05, + "loss": 1.3724, + "step": 9780 + }, + { + "epoch": 0.19, + "learning_rate": 9.782960998084055e-05, + "loss": 1.2552, + "step": 9790 + }, + { + "epoch": 0.19, + "learning_rate": 9.782520626665253e-05, + "loss": 1.3759, + "step": 9800 + }, + { + "epoch": 0.19, + "learning_rate": 9.782079818874819e-05, + "loss": 1.2046, + "step": 9810 + }, + { + "epoch": 0.19, + "learning_rate": 9.781638574752976e-05, + "loss": 1.3758, + "step": 9820 + }, + { + "epoch": 0.19, + "learning_rate": 9.781196894339981e-05, + "loss": 1.4048, + "step": 9830 + }, + { + "epoch": 0.19, + "learning_rate": 9.780754777676139e-05, + "loss": 1.1321, + "step": 9840 + }, + { + "epoch": 0.19, + "learning_rate": 9.780312224801786e-05, + "loss": 1.1469, + "step": 9850 + }, + { + "epoch": 0.19, + "learning_rate": 9.779869235757305e-05, + "loss": 1.4011, + "step": 9860 + }, + { + "epoch": 0.19, + "learning_rate": 9.779425810583113e-05, + "loss": 1.2885, + "step": 9870 + }, + { + "epoch": 0.19, + "learning_rate": 9.778981949319673e-05, + "loss": 1.5408, + "step": 9880 + }, + { + "epoch": 0.19, + "learning_rate": 9.778537652007478e-05, + "loss": 1.1568, + "step": 9890 + }, + { + "epoch": 0.19, + "learning_rate": 9.778092918687075e-05, + "loss": 1.2728, + "step": 9900 + }, + { + "epoch": 0.19, + "learning_rate": 9.777647749399035e-05, + "loss": 1.2054, + "step": 9910 + }, + { + "epoch": 0.19, + "learning_rate": 9.777202144183981e-05, + "loss": 1.3918, + "step": 9920 + }, + { + "epoch": 0.19, + "learning_rate": 9.776756103082572e-05, + "loss": 1.2791, + "step": 9930 + }, + { + "epoch": 0.19, + "learning_rate": 9.776309626135504e-05, + "loss": 1.4875, + "step": 9940 + }, + { + "epoch": 0.19, + "learning_rate": 9.775862713383516e-05, + "loss": 1.1692, + "step": 9950 + }, + { + "epoch": 0.19, + "learning_rate": 9.775415364867383e-05, + "loss": 1.3352, + "step": 9960 + }, + { + "epoch": 0.19, + "learning_rate": 9.77496758062793e-05, + "loss": 1.5526, + "step": 9970 + }, + { + "epoch": 0.19, + "learning_rate": 9.774519360706005e-05, + "loss": 1.2732, + "step": 9980 + }, + { + "epoch": 0.19, + "learning_rate": 9.77407070514251e-05, + "loss": 1.285, + "step": 9990 + }, + { + "epoch": 0.19, + "learning_rate": 9.773621613978379e-05, + "loss": 1.178, + "step": 10000 + }, + { + "epoch": 0.19, + "learning_rate": 9.773172087254592e-05, + "loss": 1.3514, + "step": 10010 + }, + { + "epoch": 0.19, + "learning_rate": 9.772722125012163e-05, + "loss": 1.3739, + "step": 10020 + }, + { + "epoch": 0.19, + "learning_rate": 9.772271727292149e-05, + "loss": 1.2852, + "step": 10030 + }, + { + "epoch": 0.19, + "learning_rate": 9.771820894135642e-05, + "loss": 1.2566, + "step": 10040 + }, + { + "epoch": 0.19, + "learning_rate": 9.771369625583782e-05, + "loss": 1.3434, + "step": 10050 + }, + { + "epoch": 0.19, + "learning_rate": 9.770917921677741e-05, + "loss": 1.2456, + "step": 10060 + }, + { + "epoch": 0.19, + "learning_rate": 9.770465782458736e-05, + "loss": 1.2594, + "step": 10070 + }, + { + "epoch": 0.19, + "learning_rate": 9.77001320796802e-05, + "loss": 1.2029, + "step": 10080 + }, + { + "epoch": 0.19, + "learning_rate": 9.76956019824689e-05, + "loss": 1.2304, + "step": 10090 + }, + { + "epoch": 0.19, + "learning_rate": 9.769106753336677e-05, + "loss": 1.4384, + "step": 10100 + }, + { + "epoch": 0.19, + "learning_rate": 9.768652873278755e-05, + "loss": 1.1292, + "step": 10110 + }, + { + "epoch": 0.19, + "learning_rate": 9.768198558114536e-05, + "loss": 1.6068, + "step": 10120 + }, + { + "epoch": 0.19, + "learning_rate": 9.767743807885477e-05, + "loss": 1.2568, + "step": 10130 + }, + { + "epoch": 0.19, + "learning_rate": 9.767288622633069e-05, + "loss": 1.2739, + "step": 10140 + }, + { + "epoch": 0.2, + "learning_rate": 9.766833002398846e-05, + "loss": 1.2381, + "step": 10150 + }, + { + "epoch": 0.2, + "learning_rate": 9.766376947224375e-05, + "loss": 1.3275, + "step": 10160 + }, + { + "epoch": 0.2, + "learning_rate": 9.765920457151272e-05, + "loss": 1.1325, + "step": 10170 + }, + { + "epoch": 0.2, + "learning_rate": 9.765463532221188e-05, + "loss": 1.2064, + "step": 10180 + }, + { + "epoch": 0.2, + "learning_rate": 9.765006172475816e-05, + "loss": 1.2892, + "step": 10190 + }, + { + "epoch": 0.2, + "learning_rate": 9.764548377956883e-05, + "loss": 1.2074, + "step": 10200 + }, + { + "epoch": 0.2, + "learning_rate": 9.764090148706162e-05, + "loss": 1.3337, + "step": 10210 + }, + { + "epoch": 0.2, + "learning_rate": 9.763631484765463e-05, + "loss": 1.2638, + "step": 10220 + }, + { + "epoch": 0.2, + "learning_rate": 9.763172386176636e-05, + "loss": 1.2423, + "step": 10230 + }, + { + "epoch": 0.2, + "learning_rate": 9.76271285298157e-05, + "loss": 1.258, + "step": 10240 + }, + { + "epoch": 0.2, + "learning_rate": 9.762252885222194e-05, + "loss": 1.1784, + "step": 10250 + }, + { + "epoch": 0.2, + "learning_rate": 9.761792482940477e-05, + "loss": 1.3826, + "step": 10260 + }, + { + "epoch": 0.2, + "learning_rate": 9.761331646178427e-05, + "loss": 1.2646, + "step": 10270 + }, + { + "epoch": 0.2, + "learning_rate": 9.760870374978093e-05, + "loss": 1.4281, + "step": 10280 + }, + { + "epoch": 0.2, + "learning_rate": 9.760408669381564e-05, + "loss": 1.1588, + "step": 10290 + }, + { + "epoch": 0.2, + "learning_rate": 9.759946529430966e-05, + "loss": 1.2727, + "step": 10300 + }, + { + "epoch": 0.2, + "learning_rate": 9.759483955168464e-05, + "loss": 1.3762, + "step": 10310 + }, + { + "epoch": 0.2, + "learning_rate": 9.759020946636268e-05, + "loss": 1.3344, + "step": 10320 + }, + { + "epoch": 0.2, + "learning_rate": 9.758557503876625e-05, + "loss": 1.4003, + "step": 10330 + }, + { + "epoch": 0.2, + "learning_rate": 9.758093626931816e-05, + "loss": 1.3842, + "step": 10340 + }, + { + "epoch": 0.2, + "learning_rate": 9.75762931584417e-05, + "loss": 1.3667, + "step": 10350 + }, + { + "epoch": 0.2, + "learning_rate": 9.757164570656052e-05, + "loss": 1.1048, + "step": 10360 + }, + { + "epoch": 0.2, + "learning_rate": 9.756699391409867e-05, + "loss": 1.2294, + "step": 10370 + }, + { + "epoch": 0.2, + "learning_rate": 9.756233778148059e-05, + "loss": 1.3891, + "step": 10380 + }, + { + "epoch": 0.2, + "learning_rate": 9.75576773091311e-05, + "loss": 1.1871, + "step": 10390 + }, + { + "epoch": 0.2, + "learning_rate": 9.755301249747546e-05, + "loss": 1.51, + "step": 10400 + }, + { + "epoch": 0.2, + "learning_rate": 9.75483433469393e-05, + "loss": 1.3794, + "step": 10410 + }, + { + "epoch": 0.2, + "learning_rate": 9.754366985794862e-05, + "loss": 1.1809, + "step": 10420 + }, + { + "epoch": 0.2, + "learning_rate": 9.753899203092988e-05, + "loss": 1.223, + "step": 10430 + }, + { + "epoch": 0.2, + "learning_rate": 9.753430986630989e-05, + "loss": 1.1459, + "step": 10440 + }, + { + "epoch": 0.2, + "learning_rate": 9.752962336451587e-05, + "loss": 1.3384, + "step": 10450 + }, + { + "epoch": 0.2, + "learning_rate": 9.75249325259754e-05, + "loss": 1.3032, + "step": 10460 + }, + { + "epoch": 0.2, + "learning_rate": 9.75202373511165e-05, + "loss": 1.3291, + "step": 10470 + }, + { + "epoch": 0.2, + "learning_rate": 9.75155378403676e-05, + "loss": 1.4394, + "step": 10480 + }, + { + "epoch": 0.2, + "learning_rate": 9.751083399415746e-05, + "loss": 1.3307, + "step": 10490 + }, + { + "epoch": 0.2, + "learning_rate": 9.750612581291529e-05, + "loss": 1.5223, + "step": 10500 + }, + { + "epoch": 0.2, + "learning_rate": 9.750141329707068e-05, + "loss": 1.2802, + "step": 10510 + }, + { + "epoch": 0.2, + "learning_rate": 9.74966964470536e-05, + "loss": 1.2532, + "step": 10520 + }, + { + "epoch": 0.2, + "learning_rate": 9.749197526329446e-05, + "loss": 1.2902, + "step": 10530 + }, + { + "epoch": 0.2, + "learning_rate": 9.748724974622398e-05, + "loss": 1.361, + "step": 10540 + }, + { + "epoch": 0.2, + "learning_rate": 9.74825198962734e-05, + "loss": 1.2787, + "step": 10550 + }, + { + "epoch": 0.2, + "learning_rate": 9.747778571387425e-05, + "loss": 1.3774, + "step": 10560 + }, + { + "epoch": 0.2, + "learning_rate": 9.747304719945847e-05, + "loss": 1.2597, + "step": 10570 + }, + { + "epoch": 0.2, + "learning_rate": 9.746830435345846e-05, + "loss": 1.4426, + "step": 10580 + }, + { + "epoch": 0.2, + "learning_rate": 9.746355717630695e-05, + "loss": 1.411, + "step": 10590 + }, + { + "epoch": 0.2, + "learning_rate": 9.745880566843708e-05, + "loss": 1.2959, + "step": 10600 + }, + { + "epoch": 0.2, + "learning_rate": 9.745404983028242e-05, + "loss": 1.1221, + "step": 10610 + }, + { + "epoch": 0.2, + "learning_rate": 9.744928966227687e-05, + "loss": 1.4815, + "step": 10620 + }, + { + "epoch": 0.2, + "learning_rate": 9.744452516485477e-05, + "loss": 1.1181, + "step": 10630 + }, + { + "epoch": 0.2, + "learning_rate": 9.743975633845087e-05, + "loss": 1.4959, + "step": 10640 + }, + { + "epoch": 0.2, + "learning_rate": 9.743498318350026e-05, + "loss": 1.2657, + "step": 10650 + }, + { + "epoch": 0.2, + "learning_rate": 9.74302057004385e-05, + "loss": 1.1393, + "step": 10660 + }, + { + "epoch": 0.21, + "learning_rate": 9.742542388970147e-05, + "loss": 1.4397, + "step": 10670 + }, + { + "epoch": 0.21, + "learning_rate": 9.742063775172548e-05, + "loss": 1.3163, + "step": 10680 + }, + { + "epoch": 0.21, + "learning_rate": 9.741584728694724e-05, + "loss": 1.2981, + "step": 10690 + }, + { + "epoch": 0.21, + "learning_rate": 9.741105249580383e-05, + "loss": 1.4278, + "step": 10700 + }, + { + "epoch": 0.21, + "learning_rate": 9.740625337873277e-05, + "loss": 1.2684, + "step": 10710 + }, + { + "epoch": 0.21, + "learning_rate": 9.740144993617191e-05, + "loss": 1.5667, + "step": 10720 + }, + { + "epoch": 0.21, + "learning_rate": 9.739664216855957e-05, + "loss": 1.2765, + "step": 10730 + }, + { + "epoch": 0.21, + "learning_rate": 9.739183007633439e-05, + "loss": 1.0858, + "step": 10740 + }, + { + "epoch": 0.21, + "learning_rate": 9.738701365993547e-05, + "loss": 1.2874, + "step": 10750 + }, + { + "epoch": 0.21, + "learning_rate": 9.738219291980224e-05, + "loss": 1.2453, + "step": 10760 + }, + { + "epoch": 0.21, + "learning_rate": 9.737736785637459e-05, + "loss": 1.2517, + "step": 10770 + }, + { + "epoch": 0.21, + "learning_rate": 9.737253847009278e-05, + "loss": 1.4115, + "step": 10780 + }, + { + "epoch": 0.21, + "learning_rate": 9.73677047613974e-05, + "loss": 1.1685, + "step": 10790 + }, + { + "epoch": 0.21, + "learning_rate": 9.736286673072957e-05, + "loss": 1.1497, + "step": 10800 + }, + { + "epoch": 0.21, + "learning_rate": 9.735802437853066e-05, + "loss": 1.3992, + "step": 10810 + }, + { + "epoch": 0.21, + "learning_rate": 9.735317770524254e-05, + "loss": 1.5233, + "step": 10820 + }, + { + "epoch": 0.21, + "learning_rate": 9.734832671130744e-05, + "loss": 1.3203, + "step": 10830 + }, + { + "epoch": 0.21, + "learning_rate": 9.734347139716794e-05, + "loss": 1.1107, + "step": 10840 + }, + { + "epoch": 0.21, + "learning_rate": 9.733861176326709e-05, + "loss": 1.213, + "step": 10850 + }, + { + "epoch": 0.21, + "learning_rate": 9.733374781004829e-05, + "loss": 1.2568, + "step": 10860 + }, + { + "epoch": 0.21, + "learning_rate": 9.732887953795531e-05, + "loss": 1.3048, + "step": 10870 + }, + { + "epoch": 0.21, + "learning_rate": 9.73240069474324e-05, + "loss": 1.2171, + "step": 10880 + }, + { + "epoch": 0.21, + "learning_rate": 9.73191300389241e-05, + "loss": 1.5973, + "step": 10890 + }, + { + "epoch": 0.21, + "learning_rate": 9.731424881287542e-05, + "loss": 1.3277, + "step": 10900 + }, + { + "epoch": 0.21, + "learning_rate": 9.730936326973176e-05, + "loss": 1.2673, + "step": 10910 + }, + { + "epoch": 0.21, + "learning_rate": 9.730447340993884e-05, + "loss": 1.1229, + "step": 10920 + }, + { + "epoch": 0.21, + "learning_rate": 9.729957923394287e-05, + "loss": 1.1801, + "step": 10930 + }, + { + "epoch": 0.21, + "learning_rate": 9.729468074219038e-05, + "loss": 1.0772, + "step": 10940 + }, + { + "epoch": 0.21, + "learning_rate": 9.728977793512833e-05, + "loss": 1.3307, + "step": 10950 + }, + { + "epoch": 0.21, + "learning_rate": 9.728487081320408e-05, + "loss": 1.3974, + "step": 10960 + }, + { + "epoch": 0.21, + "learning_rate": 9.727995937686536e-05, + "loss": 1.1048, + "step": 10970 + }, + { + "epoch": 0.21, + "learning_rate": 9.72750436265603e-05, + "loss": 1.3663, + "step": 10980 + }, + { + "epoch": 0.21, + "learning_rate": 9.727012356273743e-05, + "loss": 1.5067, + "step": 10990 + }, + { + "epoch": 0.21, + "learning_rate": 9.726519918584569e-05, + "loss": 1.3096, + "step": 11000 + }, + { + "epoch": 0.21, + "learning_rate": 9.726027049633437e-05, + "loss": 1.3174, + "step": 11010 + }, + { + "epoch": 0.21, + "learning_rate": 9.725533749465319e-05, + "loss": 1.2514, + "step": 11020 + }, + { + "epoch": 0.21, + "learning_rate": 9.725040018125225e-05, + "loss": 1.1859, + "step": 11030 + }, + { + "epoch": 0.21, + "learning_rate": 9.724545855658205e-05, + "loss": 1.4342, + "step": 11040 + }, + { + "epoch": 0.21, + "learning_rate": 9.724051262109347e-05, + "loss": 1.283, + "step": 11050 + }, + { + "epoch": 0.21, + "learning_rate": 9.723556237523778e-05, + "loss": 1.2706, + "step": 11060 + }, + { + "epoch": 0.21, + "learning_rate": 9.72306078194667e-05, + "loss": 1.3571, + "step": 11070 + }, + { + "epoch": 0.21, + "learning_rate": 9.722564895423226e-05, + "loss": 1.3535, + "step": 11080 + }, + { + "epoch": 0.21, + "learning_rate": 9.722068577998694e-05, + "loss": 1.2717, + "step": 11090 + }, + { + "epoch": 0.21, + "learning_rate": 9.721571829718358e-05, + "loss": 1.4024, + "step": 11100 + }, + { + "epoch": 0.21, + "learning_rate": 9.721074650627544e-05, + "loss": 1.1179, + "step": 11110 + }, + { + "epoch": 0.21, + "learning_rate": 9.720577040771615e-05, + "loss": 1.2735, + "step": 11120 + }, + { + "epoch": 0.21, + "learning_rate": 9.720079000195977e-05, + "loss": 1.1875, + "step": 11130 + }, + { + "epoch": 0.21, + "learning_rate": 9.719580528946068e-05, + "loss": 1.3639, + "step": 11140 + }, + { + "epoch": 0.21, + "learning_rate": 9.719081627067374e-05, + "loss": 1.3208, + "step": 11150 + }, + { + "epoch": 0.21, + "learning_rate": 9.718582294605417e-05, + "loss": 1.58, + "step": 11160 + }, + { + "epoch": 0.21, + "learning_rate": 9.718082531605755e-05, + "loss": 1.2939, + "step": 11170 + }, + { + "epoch": 0.21, + "learning_rate": 9.717582338113987e-05, + "loss": 1.3281, + "step": 11180 + }, + { + "epoch": 0.22, + "learning_rate": 9.717081714175756e-05, + "loss": 1.359, + "step": 11190 + }, + { + "epoch": 0.22, + "learning_rate": 9.716580659836737e-05, + "loss": 1.2993, + "step": 11200 + }, + { + "epoch": 0.22, + "learning_rate": 9.716079175142649e-05, + "loss": 1.3212, + "step": 11210 + }, + { + "epoch": 0.22, + "learning_rate": 9.71557726013925e-05, + "loss": 1.2218, + "step": 11220 + }, + { + "epoch": 0.22, + "learning_rate": 9.715074914872335e-05, + "loss": 1.3414, + "step": 11230 + }, + { + "epoch": 0.22, + "learning_rate": 9.714572139387739e-05, + "loss": 1.229, + "step": 11240 + }, + { + "epoch": 0.22, + "learning_rate": 9.714068933731337e-05, + "loss": 1.2429, + "step": 11250 + }, + { + "epoch": 0.22, + "learning_rate": 9.713565297949045e-05, + "loss": 1.3841, + "step": 11260 + }, + { + "epoch": 0.22, + "learning_rate": 9.713061232086814e-05, + "loss": 1.0936, + "step": 11270 + }, + { + "epoch": 0.22, + "learning_rate": 9.712556736190636e-05, + "loss": 1.4631, + "step": 11280 + }, + { + "epoch": 0.22, + "learning_rate": 9.712051810306546e-05, + "loss": 1.3352, + "step": 11290 + }, + { + "epoch": 0.22, + "learning_rate": 9.711546454480614e-05, + "loss": 1.2983, + "step": 11300 + }, + { + "epoch": 0.22, + "learning_rate": 9.711040668758946e-05, + "loss": 1.1473, + "step": 11310 + }, + { + "epoch": 0.22, + "learning_rate": 9.710534453187696e-05, + "loss": 1.2945, + "step": 11320 + }, + { + "epoch": 0.22, + "learning_rate": 9.710027807813051e-05, + "loss": 1.4571, + "step": 11330 + }, + { + "epoch": 0.22, + "learning_rate": 9.70952073268124e-05, + "loss": 1.419, + "step": 11340 + }, + { + "epoch": 0.22, + "learning_rate": 9.709013227838527e-05, + "loss": 1.3024, + "step": 11350 + }, + { + "epoch": 0.22, + "learning_rate": 9.708505293331222e-05, + "loss": 1.2102, + "step": 11360 + }, + { + "epoch": 0.22, + "learning_rate": 9.707996929205668e-05, + "loss": 1.3852, + "step": 11370 + }, + { + "epoch": 0.22, + "learning_rate": 9.707488135508252e-05, + "loss": 1.2365, + "step": 11380 + }, + { + "epoch": 0.22, + "learning_rate": 9.706978912285394e-05, + "loss": 1.2113, + "step": 11390 + }, + { + "epoch": 0.22, + "learning_rate": 9.706469259583561e-05, + "loss": 1.2776, + "step": 11400 + }, + { + "epoch": 0.22, + "learning_rate": 9.705959177449253e-05, + "loss": 1.3543, + "step": 11410 + }, + { + "epoch": 0.22, + "learning_rate": 9.705448665929013e-05, + "loss": 1.2315, + "step": 11420 + }, + { + "epoch": 0.22, + "learning_rate": 9.704937725069421e-05, + "loss": 1.3477, + "step": 11430 + }, + { + "epoch": 0.22, + "learning_rate": 9.704426354917096e-05, + "loss": 1.332, + "step": 11440 + }, + { + "epoch": 0.22, + "learning_rate": 9.703914555518697e-05, + "loss": 1.0505, + "step": 11450 + }, + { + "epoch": 0.22, + "learning_rate": 9.703402326920922e-05, + "loss": 1.2145, + "step": 11460 + }, + { + "epoch": 0.22, + "learning_rate": 9.702889669170512e-05, + "loss": 1.3894, + "step": 11470 + }, + { + "epoch": 0.22, + "learning_rate": 9.702376582314238e-05, + "loss": 1.3382, + "step": 11480 + }, + { + "epoch": 0.22, + "learning_rate": 9.701863066398917e-05, + "loss": 1.2951, + "step": 11490 + }, + { + "epoch": 0.22, + "learning_rate": 9.701349121471407e-05, + "loss": 1.0731, + "step": 11500 + }, + { + "epoch": 0.22, + "learning_rate": 9.700834747578598e-05, + "loss": 1.3168, + "step": 11510 + }, + { + "epoch": 0.22, + "learning_rate": 9.700319944767427e-05, + "loss": 1.1765, + "step": 11520 + }, + { + "epoch": 0.22, + "learning_rate": 9.699804713084862e-05, + "loss": 1.2865, + "step": 11530 + }, + { + "epoch": 0.22, + "learning_rate": 9.699289052577916e-05, + "loss": 1.261, + "step": 11540 + }, + { + "epoch": 0.22, + "learning_rate": 9.698772963293638e-05, + "loss": 1.8619, + "step": 11550 + }, + { + "epoch": 0.22, + "learning_rate": 9.698256445279122e-05, + "loss": 1.2947, + "step": 11560 + }, + { + "epoch": 0.22, + "learning_rate": 9.697739498581493e-05, + "loss": 1.5425, + "step": 11570 + }, + { + "epoch": 0.22, + "learning_rate": 9.697222123247917e-05, + "loss": 1.3848, + "step": 11580 + }, + { + "epoch": 0.22, + "learning_rate": 9.696704319325607e-05, + "loss": 1.3001, + "step": 11590 + }, + { + "epoch": 0.22, + "learning_rate": 9.696186086861803e-05, + "loss": 1.4272, + "step": 11600 + }, + { + "epoch": 0.22, + "learning_rate": 9.695667425903794e-05, + "loss": 1.361, + "step": 11610 + }, + { + "epoch": 0.22, + "learning_rate": 9.6951483364989e-05, + "loss": 1.2557, + "step": 11620 + }, + { + "epoch": 0.22, + "learning_rate": 9.69462881869449e-05, + "loss": 1.1357, + "step": 11630 + }, + { + "epoch": 0.22, + "learning_rate": 9.694108872537962e-05, + "loss": 1.3093, + "step": 11640 + }, + { + "epoch": 0.22, + "learning_rate": 9.693588498076759e-05, + "loss": 1.5686, + "step": 11650 + }, + { + "epoch": 0.22, + "learning_rate": 9.693067695358361e-05, + "loss": 1.3165, + "step": 11660 + }, + { + "epoch": 0.22, + "learning_rate": 9.692546464430288e-05, + "loss": 1.5016, + "step": 11670 + }, + { + "epoch": 0.22, + "learning_rate": 9.692024805340098e-05, + "loss": 1.445, + "step": 11680 + }, + { + "epoch": 0.22, + "learning_rate": 9.691502718135392e-05, + "loss": 1.1653, + "step": 11690 + }, + { + "epoch": 0.22, + "learning_rate": 9.690980202863802e-05, + "loss": 1.0476, + "step": 11700 + }, + { + "epoch": 0.23, + "learning_rate": 9.690457259573006e-05, + "loss": 1.1743, + "step": 11710 + }, + { + "epoch": 0.23, + "learning_rate": 9.689933888310719e-05, + "loss": 1.432, + "step": 11720 + }, + { + "epoch": 0.23, + "learning_rate": 9.689410089124695e-05, + "loss": 1.1104, + "step": 11730 + }, + { + "epoch": 0.23, + "learning_rate": 9.688885862062727e-05, + "loss": 1.0394, + "step": 11740 + }, + { + "epoch": 0.23, + "learning_rate": 9.688361207172647e-05, + "loss": 1.2931, + "step": 11750 + }, + { + "epoch": 0.23, + "learning_rate": 9.687836124502328e-05, + "loss": 1.3693, + "step": 11760 + }, + { + "epoch": 0.23, + "learning_rate": 9.687310614099675e-05, + "loss": 1.1884, + "step": 11770 + }, + { + "epoch": 0.23, + "learning_rate": 9.686784676012643e-05, + "loss": 1.093, + "step": 11780 + }, + { + "epoch": 0.23, + "learning_rate": 9.686258310289215e-05, + "loss": 1.0592, + "step": 11790 + }, + { + "epoch": 0.23, + "learning_rate": 9.685731516977423e-05, + "loss": 1.335, + "step": 11800 + }, + { + "epoch": 0.23, + "learning_rate": 9.685204296125332e-05, + "loss": 1.6729, + "step": 11810 + }, + { + "epoch": 0.23, + "learning_rate": 9.684676647781043e-05, + "loss": 1.1505, + "step": 11820 + }, + { + "epoch": 0.23, + "learning_rate": 9.684148571992706e-05, + "loss": 1.4953, + "step": 11830 + }, + { + "epoch": 0.23, + "learning_rate": 9.683620068808501e-05, + "loss": 1.0413, + "step": 11840 + }, + { + "epoch": 0.23, + "learning_rate": 9.68309113827665e-05, + "loss": 1.4012, + "step": 11850 + }, + { + "epoch": 0.23, + "learning_rate": 9.682561780445416e-05, + "loss": 1.315, + "step": 11860 + }, + { + "epoch": 0.23, + "learning_rate": 9.682031995363098e-05, + "loss": 1.1989, + "step": 11870 + }, + { + "epoch": 0.23, + "learning_rate": 9.681501783078038e-05, + "loss": 1.3461, + "step": 11880 + }, + { + "epoch": 0.23, + "learning_rate": 9.680971143638608e-05, + "loss": 1.3148, + "step": 11890 + }, + { + "epoch": 0.23, + "learning_rate": 9.680440077093231e-05, + "loss": 1.3559, + "step": 11900 + }, + { + "epoch": 0.23, + "learning_rate": 9.67990858349036e-05, + "loss": 1.2588, + "step": 11910 + }, + { + "epoch": 0.23, + "learning_rate": 9.679376662878492e-05, + "loss": 1.4767, + "step": 11920 + }, + { + "epoch": 0.23, + "learning_rate": 9.678844315306159e-05, + "loss": 1.4732, + "step": 11930 + }, + { + "epoch": 0.23, + "learning_rate": 9.678311540821936e-05, + "loss": 1.5456, + "step": 11940 + }, + { + "epoch": 0.23, + "learning_rate": 9.677778339474432e-05, + "loss": 1.3482, + "step": 11950 + }, + { + "epoch": 0.23, + "learning_rate": 9.677244711312303e-05, + "loss": 1.093, + "step": 11960 + }, + { + "epoch": 0.23, + "learning_rate": 9.676710656384234e-05, + "loss": 1.2155, + "step": 11970 + }, + { + "epoch": 0.23, + "learning_rate": 9.676176174738956e-05, + "loss": 1.2428, + "step": 11980 + }, + { + "epoch": 0.23, + "learning_rate": 9.675641266425237e-05, + "loss": 1.2648, + "step": 11990 + }, + { + "epoch": 0.23, + "learning_rate": 9.675105931491882e-05, + "loss": 1.0336, + "step": 12000 + }, + { + "epoch": 0.23, + "learning_rate": 9.674570169987737e-05, + "loss": 1.3075, + "step": 12010 + }, + { + "epoch": 0.23, + "learning_rate": 9.674033981961688e-05, + "loss": 1.1876, + "step": 12020 + }, + { + "epoch": 0.23, + "learning_rate": 9.673497367462657e-05, + "loss": 1.4412, + "step": 12030 + }, + { + "epoch": 0.23, + "learning_rate": 9.672960326539607e-05, + "loss": 1.404, + "step": 12040 + }, + { + "epoch": 0.23, + "learning_rate": 9.672422859241539e-05, + "loss": 1.3015, + "step": 12050 + }, + { + "epoch": 0.23, + "learning_rate": 9.671884965617493e-05, + "loss": 1.4785, + "step": 12060 + }, + { + "epoch": 0.23, + "learning_rate": 9.671346645716549e-05, + "loss": 1.3855, + "step": 12070 + }, + { + "epoch": 0.23, + "learning_rate": 9.670807899587824e-05, + "loss": 1.328, + "step": 12080 + }, + { + "epoch": 0.23, + "learning_rate": 9.670268727280473e-05, + "loss": 1.3459, + "step": 12090 + }, + { + "epoch": 0.23, + "learning_rate": 9.669729128843696e-05, + "loss": 1.1278, + "step": 12100 + }, + { + "epoch": 0.23, + "learning_rate": 9.669189104326723e-05, + "loss": 1.2781, + "step": 12110 + }, + { + "epoch": 0.23, + "learning_rate": 9.668648653778832e-05, + "loss": 1.3047, + "step": 12120 + }, + { + "epoch": 0.23, + "learning_rate": 9.668107777249332e-05, + "loss": 1.5821, + "step": 12130 + }, + { + "epoch": 0.23, + "learning_rate": 9.667566474787576e-05, + "loss": 1.3916, + "step": 12140 + }, + { + "epoch": 0.23, + "learning_rate": 9.667024746442952e-05, + "loss": 1.1922, + "step": 12150 + }, + { + "epoch": 0.23, + "learning_rate": 9.666482592264891e-05, + "loss": 1.5275, + "step": 12160 + }, + { + "epoch": 0.23, + "learning_rate": 9.66594001230286e-05, + "loss": 1.4539, + "step": 12170 + }, + { + "epoch": 0.23, + "learning_rate": 9.665397006606368e-05, + "loss": 1.2838, + "step": 12180 + }, + { + "epoch": 0.23, + "learning_rate": 9.664853575224954e-05, + "loss": 1.405, + "step": 12190 + }, + { + "epoch": 0.23, + "learning_rate": 9.664309718208209e-05, + "loss": 1.4633, + "step": 12200 + }, + { + "epoch": 0.23, + "learning_rate": 9.663765435605753e-05, + "loss": 1.1995, + "step": 12210 + }, + { + "epoch": 0.23, + "learning_rate": 9.663220727467247e-05, + "loss": 1.4539, + "step": 12220 + }, + { + "epoch": 0.24, + "learning_rate": 9.662675593842396e-05, + "loss": 1.123, + "step": 12230 + }, + { + "epoch": 0.24, + "learning_rate": 9.662130034780936e-05, + "loss": 1.1991, + "step": 12240 + }, + { + "epoch": 0.24, + "learning_rate": 9.661584050332647e-05, + "loss": 1.1451, + "step": 12250 + }, + { + "epoch": 0.24, + "learning_rate": 9.661037640547345e-05, + "loss": 1.2448, + "step": 12260 + }, + { + "epoch": 0.24, + "learning_rate": 9.660490805474889e-05, + "loss": 1.2303, + "step": 12270 + }, + { + "epoch": 0.24, + "learning_rate": 9.65994354516517e-05, + "loss": 1.3741, + "step": 12280 + }, + { + "epoch": 0.24, + "learning_rate": 9.659395859668123e-05, + "loss": 1.2424, + "step": 12290 + }, + { + "epoch": 0.24, + "learning_rate": 9.658847749033722e-05, + "loss": 1.4204, + "step": 12300 + }, + { + "epoch": 0.24, + "learning_rate": 9.658299213311976e-05, + "loss": 1.2381, + "step": 12310 + }, + { + "epoch": 0.24, + "learning_rate": 9.657750252552939e-05, + "loss": 1.3357, + "step": 12320 + }, + { + "epoch": 0.24, + "learning_rate": 9.657200866806695e-05, + "loss": 1.4023, + "step": 12330 + }, + { + "epoch": 0.24, + "learning_rate": 9.656651056123374e-05, + "loss": 1.2667, + "step": 12340 + }, + { + "epoch": 0.24, + "learning_rate": 9.656100820553143e-05, + "loss": 1.259, + "step": 12350 + }, + { + "epoch": 0.24, + "learning_rate": 9.655550160146204e-05, + "loss": 1.1893, + "step": 12360 + }, + { + "epoch": 0.24, + "learning_rate": 9.654999074952805e-05, + "loss": 1.2523, + "step": 12370 + }, + { + "epoch": 0.24, + "learning_rate": 9.654447565023226e-05, + "loss": 1.4266, + "step": 12380 + }, + { + "epoch": 0.24, + "learning_rate": 9.65389563040779e-05, + "loss": 1.4251, + "step": 12390 + }, + { + "epoch": 0.24, + "learning_rate": 9.653343271156857e-05, + "loss": 1.0538, + "step": 12400 + }, + { + "epoch": 0.24, + "learning_rate": 9.652790487320824e-05, + "loss": 1.1824, + "step": 12410 + }, + { + "epoch": 0.24, + "learning_rate": 9.65223727895013e-05, + "loss": 1.4353, + "step": 12420 + }, + { + "epoch": 0.24, + "learning_rate": 9.651683646095253e-05, + "loss": 1.171, + "step": 12430 + }, + { + "epoch": 0.24, + "learning_rate": 9.651129588806706e-05, + "loss": 1.2732, + "step": 12440 + }, + { + "epoch": 0.24, + "learning_rate": 9.650575107135043e-05, + "loss": 1.2488, + "step": 12450 + }, + { + "epoch": 0.24, + "learning_rate": 9.650020201130857e-05, + "loss": 1.3298, + "step": 12460 + }, + { + "epoch": 0.24, + "learning_rate": 9.64946487084478e-05, + "loss": 1.3317, + "step": 12470 + }, + { + "epoch": 0.24, + "learning_rate": 9.648909116327481e-05, + "loss": 1.4012, + "step": 12480 + }, + { + "epoch": 0.24, + "learning_rate": 9.64835293762967e-05, + "loss": 1.4585, + "step": 12490 + }, + { + "epoch": 0.24, + "learning_rate": 9.647796334802092e-05, + "loss": 1.3453, + "step": 12500 + }, + { + "epoch": 0.24, + "learning_rate": 9.647239307895535e-05, + "loss": 1.2789, + "step": 12510 + }, + { + "epoch": 0.24, + "learning_rate": 9.646681856960824e-05, + "loss": 1.1763, + "step": 12520 + }, + { + "epoch": 0.24, + "learning_rate": 9.646123982048823e-05, + "loss": 1.3391, + "step": 12530 + }, + { + "epoch": 0.24, + "learning_rate": 9.645565683210432e-05, + "loss": 1.3108, + "step": 12540 + }, + { + "epoch": 0.24, + "learning_rate": 9.645006960496592e-05, + "loss": 1.2904, + "step": 12550 + }, + { + "epoch": 0.24, + "learning_rate": 9.644447813958285e-05, + "loss": 1.197, + "step": 12560 + }, + { + "epoch": 0.24, + "learning_rate": 9.643888243646526e-05, + "loss": 1.1268, + "step": 12570 + }, + { + "epoch": 0.24, + "learning_rate": 9.643328249612376e-05, + "loss": 1.4279, + "step": 12580 + }, + { + "epoch": 0.24, + "learning_rate": 9.642767831906927e-05, + "loss": 1.427, + "step": 12590 + }, + { + "epoch": 0.24, + "learning_rate": 9.642206990581315e-05, + "loss": 1.3183, + "step": 12600 + }, + { + "epoch": 0.24, + "learning_rate": 9.641645725686712e-05, + "loss": 1.3977, + "step": 12610 + }, + { + "epoch": 0.24, + "learning_rate": 9.641084037274328e-05, + "loss": 1.1507, + "step": 12620 + }, + { + "epoch": 0.24, + "learning_rate": 9.640521925395418e-05, + "loss": 1.2651, + "step": 12630 + }, + { + "epoch": 0.24, + "learning_rate": 9.639959390101266e-05, + "loss": 1.1262, + "step": 12640 + }, + { + "epoch": 0.24, + "learning_rate": 9.639396431443201e-05, + "loss": 1.2044, + "step": 12650 + }, + { + "epoch": 0.24, + "learning_rate": 9.63883304947259e-05, + "loss": 1.3134, + "step": 12660 + }, + { + "epoch": 0.24, + "learning_rate": 9.638269244240837e-05, + "loss": 1.3075, + "step": 12670 + }, + { + "epoch": 0.24, + "learning_rate": 9.637705015799385e-05, + "loss": 1.1927, + "step": 12680 + }, + { + "epoch": 0.24, + "learning_rate": 9.637140364199716e-05, + "loss": 1.1793, + "step": 12690 + }, + { + "epoch": 0.24, + "learning_rate": 9.636575289493351e-05, + "loss": 1.3144, + "step": 12700 + }, + { + "epoch": 0.24, + "learning_rate": 9.636009791731848e-05, + "loss": 1.3483, + "step": 12710 + }, + { + "epoch": 0.24, + "learning_rate": 9.635443870966805e-05, + "loss": 1.5586, + "step": 12720 + }, + { + "epoch": 0.24, + "learning_rate": 9.634877527249859e-05, + "loss": 1.4635, + "step": 12730 + }, + { + "epoch": 0.24, + "learning_rate": 9.634310760632685e-05, + "loss": 1.1159, + "step": 12740 + }, + { + "epoch": 0.25, + "learning_rate": 9.633743571166997e-05, + "loss": 1.1738, + "step": 12750 + }, + { + "epoch": 0.25, + "learning_rate": 9.633175958904545e-05, + "loss": 1.2917, + "step": 12760 + }, + { + "epoch": 0.25, + "learning_rate": 9.632607923897122e-05, + "loss": 1.2186, + "step": 12770 + }, + { + "epoch": 0.25, + "learning_rate": 9.632039466196557e-05, + "loss": 1.2737, + "step": 12780 + }, + { + "epoch": 0.25, + "learning_rate": 9.631470585854714e-05, + "loss": 1.4299, + "step": 12790 + }, + { + "epoch": 0.25, + "learning_rate": 9.630901282923503e-05, + "loss": 1.3434, + "step": 12800 + }, + { + "epoch": 0.25, + "learning_rate": 9.63033155745487e-05, + "loss": 1.3396, + "step": 12810 + }, + { + "epoch": 0.25, + "learning_rate": 9.629761409500795e-05, + "loss": 1.3017, + "step": 12820 + }, + { + "epoch": 0.25, + "learning_rate": 9.629190839113303e-05, + "loss": 1.4041, + "step": 12830 + }, + { + "epoch": 0.25, + "learning_rate": 9.628619846344454e-05, + "loss": 1.5323, + "step": 12840 + }, + { + "epoch": 0.25, + "learning_rate": 9.628048431246343e-05, + "loss": 1.2393, + "step": 12850 + }, + { + "epoch": 0.25, + "learning_rate": 9.627476593871114e-05, + "loss": 1.3642, + "step": 12860 + }, + { + "epoch": 0.25, + "learning_rate": 9.626904334270938e-05, + "loss": 1.2699, + "step": 12870 + }, + { + "epoch": 0.25, + "learning_rate": 9.626331652498034e-05, + "loss": 1.1997, + "step": 12880 + }, + { + "epoch": 0.25, + "learning_rate": 9.625758548604652e-05, + "loss": 1.5095, + "step": 12890 + }, + { + "epoch": 0.25, + "learning_rate": 9.625185022643086e-05, + "loss": 1.4039, + "step": 12900 + }, + { + "epoch": 0.25, + "learning_rate": 9.624611074665664e-05, + "loss": 1.2304, + "step": 12910 + }, + { + "epoch": 0.25, + "learning_rate": 9.624036704724755e-05, + "loss": 1.3279, + "step": 12920 + }, + { + "epoch": 0.25, + "learning_rate": 9.623461912872768e-05, + "loss": 1.1611, + "step": 12930 + }, + { + "epoch": 0.25, + "learning_rate": 9.622886699162148e-05, + "loss": 1.2507, + "step": 12940 + }, + { + "epoch": 0.25, + "learning_rate": 9.622311063645379e-05, + "loss": 1.2207, + "step": 12950 + }, + { + "epoch": 0.25, + "learning_rate": 9.621735006374983e-05, + "loss": 1.3434, + "step": 12960 + }, + { + "epoch": 0.25, + "learning_rate": 9.621158527403524e-05, + "loss": 1.1867, + "step": 12970 + }, + { + "epoch": 0.25, + "learning_rate": 9.620581626783598e-05, + "loss": 1.2722, + "step": 12980 + }, + { + "epoch": 0.25, + "learning_rate": 9.620004304567844e-05, + "loss": 1.1997, + "step": 12990 + }, + { + "epoch": 0.25, + "learning_rate": 9.619426560808942e-05, + "loss": 1.2303, + "step": 13000 + }, + { + "epoch": 0.25, + "learning_rate": 9.618848395559604e-05, + "loss": 1.2767, + "step": 13010 + }, + { + "epoch": 0.25, + "learning_rate": 9.618269808872582e-05, + "loss": 1.2423, + "step": 13020 + }, + { + "epoch": 0.25, + "learning_rate": 9.617690800800671e-05, + "loss": 1.2134, + "step": 13030 + }, + { + "epoch": 0.25, + "learning_rate": 9.6171113713967e-05, + "loss": 1.0973, + "step": 13040 + }, + { + "epoch": 0.25, + "learning_rate": 9.616531520713542e-05, + "loss": 1.2826, + "step": 13050 + }, + { + "epoch": 0.25, + "learning_rate": 9.615951248804096e-05, + "loss": 1.1461, + "step": 13060 + }, + { + "epoch": 0.25, + "learning_rate": 9.615370555721314e-05, + "loss": 1.0808, + "step": 13070 + }, + { + "epoch": 0.25, + "learning_rate": 9.61478944151818e-05, + "loss": 1.2635, + "step": 13080 + }, + { + "epoch": 0.25, + "learning_rate": 9.614207906247715e-05, + "loss": 1.0739, + "step": 13090 + }, + { + "epoch": 0.25, + "learning_rate": 9.61362594996298e-05, + "loss": 1.3752, + "step": 13100 + }, + { + "epoch": 0.25, + "learning_rate": 9.613043572717074e-05, + "loss": 1.2528, + "step": 13110 + }, + { + "epoch": 0.25, + "learning_rate": 9.612460774563136e-05, + "loss": 1.4285, + "step": 13120 + }, + { + "epoch": 0.25, + "learning_rate": 9.611877555554341e-05, + "loss": 1.2699, + "step": 13130 + }, + { + "epoch": 0.25, + "learning_rate": 9.611293915743906e-05, + "loss": 1.3874, + "step": 13140 + }, + { + "epoch": 0.25, + "learning_rate": 9.610709855185082e-05, + "loss": 1.1458, + "step": 13150 + }, + { + "epoch": 0.25, + "learning_rate": 9.610125373931162e-05, + "loss": 1.2177, + "step": 13160 + }, + { + "epoch": 0.25, + "learning_rate": 9.609540472035474e-05, + "loss": 1.2575, + "step": 13170 + }, + { + "epoch": 0.25, + "learning_rate": 9.608955149551388e-05, + "loss": 1.3255, + "step": 13180 + }, + { + "epoch": 0.25, + "learning_rate": 9.60836940653231e-05, + "loss": 1.3443, + "step": 13190 + }, + { + "epoch": 0.25, + "learning_rate": 9.607783243031682e-05, + "loss": 1.4566, + "step": 13200 + }, + { + "epoch": 0.25, + "learning_rate": 9.607196659102992e-05, + "loss": 1.3381, + "step": 13210 + }, + { + "epoch": 0.25, + "learning_rate": 9.606609654799761e-05, + "loss": 1.2155, + "step": 13220 + }, + { + "epoch": 0.25, + "learning_rate": 9.606022230175547e-05, + "loss": 1.1797, + "step": 13230 + }, + { + "epoch": 0.25, + "learning_rate": 9.605434385283947e-05, + "loss": 1.0969, + "step": 13240 + }, + { + "epoch": 0.25, + "learning_rate": 9.604846120178602e-05, + "loss": 1.2215, + "step": 13250 + }, + { + "epoch": 0.25, + "learning_rate": 9.604257434913184e-05, + "loss": 1.1516, + "step": 13260 + }, + { + "epoch": 0.26, + "learning_rate": 9.603668329541408e-05, + "loss": 1.4677, + "step": 13270 + }, + { + "epoch": 0.26, + "learning_rate": 9.603078804117026e-05, + "loss": 1.2844, + "step": 13280 + }, + { + "epoch": 0.26, + "learning_rate": 9.602488858693826e-05, + "loss": 1.1449, + "step": 13290 + }, + { + "epoch": 0.26, + "learning_rate": 9.601898493325636e-05, + "loss": 1.2592, + "step": 13300 + }, + { + "epoch": 0.26, + "learning_rate": 9.601307708066327e-05, + "loss": 1.3818, + "step": 13310 + }, + { + "epoch": 0.26, + "learning_rate": 9.6007165029698e-05, + "loss": 1.3662, + "step": 13320 + }, + { + "epoch": 0.26, + "learning_rate": 9.60012487809e-05, + "loss": 1.2059, + "step": 13330 + }, + { + "epoch": 0.26, + "learning_rate": 9.59953283348091e-05, + "loss": 1.4641, + "step": 13340 + }, + { + "epoch": 0.26, + "learning_rate": 9.598940369196547e-05, + "loss": 1.2971, + "step": 13350 + }, + { + "epoch": 0.26, + "learning_rate": 9.598347485290971e-05, + "loss": 1.2398, + "step": 13360 + }, + { + "epoch": 0.26, + "learning_rate": 9.597754181818277e-05, + "loss": 1.4895, + "step": 13370 + }, + { + "epoch": 0.26, + "learning_rate": 9.597160458832601e-05, + "loss": 1.2297, + "step": 13380 + }, + { + "epoch": 0.26, + "learning_rate": 9.596566316388116e-05, + "loss": 1.0977, + "step": 13390 + }, + { + "epoch": 0.26, + "learning_rate": 9.595971754539035e-05, + "loss": 1.2662, + "step": 13400 + }, + { + "epoch": 0.26, + "learning_rate": 9.595376773339604e-05, + "loss": 1.2493, + "step": 13410 + }, + { + "epoch": 0.26, + "learning_rate": 9.594781372844112e-05, + "loss": 1.3357, + "step": 13420 + }, + { + "epoch": 0.26, + "learning_rate": 9.594185553106889e-05, + "loss": 1.3568, + "step": 13430 + }, + { + "epoch": 0.26, + "learning_rate": 9.593589314182295e-05, + "loss": 1.2074, + "step": 13440 + }, + { + "epoch": 0.26, + "learning_rate": 9.592992656124733e-05, + "loss": 1.3435, + "step": 13450 + }, + { + "epoch": 0.26, + "learning_rate": 9.592395578988646e-05, + "loss": 1.2205, + "step": 13460 + }, + { + "epoch": 0.26, + "learning_rate": 9.591798082828511e-05, + "loss": 1.3639, + "step": 13470 + }, + { + "epoch": 0.26, + "learning_rate": 9.591200167698846e-05, + "loss": 1.2047, + "step": 13480 + }, + { + "epoch": 0.26, + "learning_rate": 9.590601833654208e-05, + "loss": 1.1246, + "step": 13490 + }, + { + "epoch": 0.26, + "learning_rate": 9.59000308074919e-05, + "loss": 1.2006, + "step": 13500 + }, + { + "epoch": 0.26, + "learning_rate": 9.589403909038424e-05, + "loss": 1.2141, + "step": 13510 + }, + { + "epoch": 0.26, + "learning_rate": 9.588804318576578e-05, + "loss": 1.2047, + "step": 13520 + }, + { + "epoch": 0.26, + "learning_rate": 9.588204309418363e-05, + "loss": 1.3082, + "step": 13530 + }, + { + "epoch": 0.26, + "learning_rate": 9.587603881618527e-05, + "loss": 1.0781, + "step": 13540 + }, + { + "epoch": 0.26, + "learning_rate": 9.587003035231852e-05, + "loss": 1.2985, + "step": 13550 + }, + { + "epoch": 0.26, + "learning_rate": 9.58640177031316e-05, + "loss": 1.3457, + "step": 13560 + }, + { + "epoch": 0.26, + "learning_rate": 9.585800086917316e-05, + "loss": 1.0767, + "step": 13570 + }, + { + "epoch": 0.26, + "learning_rate": 9.585197985099217e-05, + "loss": 1.4532, + "step": 13580 + }, + { + "epoch": 0.26, + "learning_rate": 9.584595464913801e-05, + "loss": 1.367, + "step": 13590 + }, + { + "epoch": 0.26, + "learning_rate": 9.583992526416046e-05, + "loss": 1.2669, + "step": 13600 + }, + { + "epoch": 0.26, + "learning_rate": 9.58338916966096e-05, + "loss": 1.3832, + "step": 13610 + }, + { + "epoch": 0.26, + "learning_rate": 9.582785394703604e-05, + "loss": 1.378, + "step": 13620 + }, + { + "epoch": 0.26, + "learning_rate": 9.58218120159906e-05, + "loss": 1.3135, + "step": 13630 + }, + { + "epoch": 0.26, + "learning_rate": 9.58157659040246e-05, + "loss": 1.2424, + "step": 13640 + }, + { + "epoch": 0.26, + "learning_rate": 9.58097156116897e-05, + "loss": 1.2324, + "step": 13650 + }, + { + "epoch": 0.26, + "learning_rate": 9.580366113953796e-05, + "loss": 1.3732, + "step": 13660 + }, + { + "epoch": 0.26, + "learning_rate": 9.579760248812179e-05, + "loss": 1.0931, + "step": 13670 + }, + { + "epoch": 0.26, + "learning_rate": 9.5791539657994e-05, + "loss": 1.4051, + "step": 13680 + }, + { + "epoch": 0.26, + "learning_rate": 9.578547264970779e-05, + "loss": 1.461, + "step": 13690 + }, + { + "epoch": 0.26, + "learning_rate": 9.577940146381675e-05, + "loss": 1.3012, + "step": 13700 + }, + { + "epoch": 0.26, + "learning_rate": 9.577332610087478e-05, + "loss": 1.2116, + "step": 13710 + }, + { + "epoch": 0.26, + "learning_rate": 9.576724656143627e-05, + "loss": 1.3947, + "step": 13720 + }, + { + "epoch": 0.26, + "learning_rate": 9.57611628460559e-05, + "loss": 1.1196, + "step": 13730 + }, + { + "epoch": 0.26, + "learning_rate": 9.57550749552888e-05, + "loss": 1.4405, + "step": 13740 + }, + { + "epoch": 0.26, + "learning_rate": 9.57489828896904e-05, + "loss": 1.3217, + "step": 13750 + }, + { + "epoch": 0.26, + "learning_rate": 9.574288664981662e-05, + "loss": 1.2536, + "step": 13760 + }, + { + "epoch": 0.26, + "learning_rate": 9.573678623622363e-05, + "loss": 1.2568, + "step": 13770 + }, + { + "epoch": 0.26, + "learning_rate": 9.57306816494681e-05, + "loss": 1.0089, + "step": 13780 + }, + { + "epoch": 0.27, + "learning_rate": 9.572457289010702e-05, + "loss": 1.4428, + "step": 13790 + }, + { + "epoch": 0.27, + "learning_rate": 9.571845995869776e-05, + "loss": 1.3519, + "step": 13800 + }, + { + "epoch": 0.27, + "learning_rate": 9.571234285579811e-05, + "loss": 1.2439, + "step": 13810 + }, + { + "epoch": 0.27, + "learning_rate": 9.570622158196618e-05, + "loss": 1.3892, + "step": 13820 + }, + { + "epoch": 0.27, + "learning_rate": 9.57000961377605e-05, + "loss": 1.1095, + "step": 13830 + }, + { + "epoch": 0.27, + "learning_rate": 9.569396652373998e-05, + "loss": 1.1698, + "step": 13840 + }, + { + "epoch": 0.27, + "learning_rate": 9.568783274046391e-05, + "loss": 1.5212, + "step": 13850 + }, + { + "epoch": 0.27, + "learning_rate": 9.568169478849197e-05, + "loss": 1.2814, + "step": 13860 + }, + { + "epoch": 0.27, + "learning_rate": 9.567555266838416e-05, + "loss": 1.2799, + "step": 13870 + }, + { + "epoch": 0.27, + "learning_rate": 9.566940638070094e-05, + "loss": 1.4536, + "step": 13880 + }, + { + "epoch": 0.27, + "learning_rate": 9.56632559260031e-05, + "loss": 1.3424, + "step": 13890 + }, + { + "epoch": 0.27, + "learning_rate": 9.565710130485183e-05, + "loss": 1.1792, + "step": 13900 + }, + { + "epoch": 0.27, + "learning_rate": 9.565094251780871e-05, + "loss": 1.402, + "step": 13910 + }, + { + "epoch": 0.27, + "learning_rate": 9.564477956543568e-05, + "loss": 1.5138, + "step": 13920 + }, + { + "epoch": 0.27, + "learning_rate": 9.563861244829504e-05, + "loss": 1.2251, + "step": 13930 + }, + { + "epoch": 0.27, + "learning_rate": 9.563244116694954e-05, + "loss": 1.2607, + "step": 13940 + }, + { + "epoch": 0.27, + "learning_rate": 9.562626572196224e-05, + "loss": 1.2343, + "step": 13950 + }, + { + "epoch": 0.27, + "learning_rate": 9.56200861138966e-05, + "loss": 1.2829, + "step": 13960 + }, + { + "epoch": 0.27, + "learning_rate": 9.561390234331649e-05, + "loss": 1.2447, + "step": 13970 + }, + { + "epoch": 0.27, + "learning_rate": 9.560771441078613e-05, + "loss": 1.458, + "step": 13980 + }, + { + "epoch": 0.27, + "learning_rate": 9.56015223168701e-05, + "loss": 1.2906, + "step": 13990 + }, + { + "epoch": 0.27, + "learning_rate": 9.559532606213341e-05, + "loss": 1.1875, + "step": 14000 + }, + { + "epoch": 0.27, + "learning_rate": 9.558912564714142e-05, + "loss": 1.2395, + "step": 14010 + }, + { + "epoch": 0.27, + "learning_rate": 9.558292107245986e-05, + "loss": 1.3027, + "step": 14020 + }, + { + "epoch": 0.27, + "learning_rate": 9.557671233865488e-05, + "loss": 1.0481, + "step": 14030 + }, + { + "epoch": 0.27, + "learning_rate": 9.557049944629297e-05, + "loss": 1.2331, + "step": 14040 + }, + { + "epoch": 0.27, + "learning_rate": 9.556428239594103e-05, + "loss": 1.3488, + "step": 14050 + }, + { + "epoch": 0.27, + "learning_rate": 9.555806118816629e-05, + "loss": 1.296, + "step": 14060 + }, + { + "epoch": 0.27, + "learning_rate": 9.555183582353642e-05, + "loss": 1.0644, + "step": 14070 + }, + { + "epoch": 0.27, + "learning_rate": 9.554560630261942e-05, + "loss": 1.3796, + "step": 14080 + }, + { + "epoch": 0.27, + "learning_rate": 9.553937262598369e-05, + "loss": 1.4246, + "step": 14090 + }, + { + "epoch": 0.27, + "learning_rate": 9.553313479419803e-05, + "loss": 1.2945, + "step": 14100 + }, + { + "epoch": 0.27, + "learning_rate": 9.55268928078316e-05, + "loss": 1.3542, + "step": 14110 + }, + { + "epoch": 0.27, + "learning_rate": 9.55206466674539e-05, + "loss": 1.4731, + "step": 14120 + }, + { + "epoch": 0.27, + "learning_rate": 9.55143963736349e-05, + "loss": 1.4023, + "step": 14130 + }, + { + "epoch": 0.27, + "learning_rate": 9.550814192694485e-05, + "loss": 1.3068, + "step": 14140 + }, + { + "epoch": 0.27, + "learning_rate": 9.550188332795446e-05, + "loss": 1.2309, + "step": 14150 + }, + { + "epoch": 0.27, + "learning_rate": 9.549562057723476e-05, + "loss": 1.1666, + "step": 14160 + }, + { + "epoch": 0.27, + "learning_rate": 9.548935367535717e-05, + "loss": 1.1862, + "step": 14170 + }, + { + "epoch": 0.27, + "learning_rate": 9.548308262289353e-05, + "loss": 1.2942, + "step": 14180 + }, + { + "epoch": 0.27, + "learning_rate": 9.547680742041603e-05, + "loss": 1.3143, + "step": 14190 + }, + { + "epoch": 0.27, + "learning_rate": 9.547052806849722e-05, + "loss": 1.1719, + "step": 14200 + }, + { + "epoch": 0.27, + "learning_rate": 9.546424456771006e-05, + "loss": 1.178, + "step": 14210 + }, + { + "epoch": 0.27, + "learning_rate": 9.545795691862786e-05, + "loss": 1.7178, + "step": 14220 + }, + { + "epoch": 0.27, + "learning_rate": 9.545166512182435e-05, + "loss": 1.3496, + "step": 14230 + }, + { + "epoch": 0.27, + "learning_rate": 9.544536917787359e-05, + "loss": 1.2592, + "step": 14240 + }, + { + "epoch": 0.27, + "learning_rate": 9.543906908735004e-05, + "loss": 1.5064, + "step": 14250 + }, + { + "epoch": 0.27, + "learning_rate": 9.543276485082855e-05, + "loss": 1.4023, + "step": 14260 + }, + { + "epoch": 0.27, + "learning_rate": 9.542645646888434e-05, + "loss": 1.2379, + "step": 14270 + }, + { + "epoch": 0.27, + "learning_rate": 9.5420143942093e-05, + "loss": 1.2176, + "step": 14280 + }, + { + "epoch": 0.27, + "learning_rate": 9.54138272710305e-05, + "loss": 1.2369, + "step": 14290 + }, + { + "epoch": 0.27, + "learning_rate": 9.54075064562732e-05, + "loss": 1.3587, + "step": 14300 + }, + { + "epoch": 0.28, + "learning_rate": 9.540118149839783e-05, + "loss": 1.2812, + "step": 14310 + }, + { + "epoch": 0.28, + "learning_rate": 9.539485239798149e-05, + "loss": 1.1354, + "step": 14320 + }, + { + "epoch": 0.28, + "learning_rate": 9.538851915560169e-05, + "loss": 1.1987, + "step": 14330 + }, + { + "epoch": 0.28, + "learning_rate": 9.538218177183626e-05, + "loss": 1.3057, + "step": 14340 + }, + { + "epoch": 0.28, + "learning_rate": 9.537584024726345e-05, + "loss": 1.3382, + "step": 14350 + }, + { + "epoch": 0.28, + "learning_rate": 9.53694945824619e-05, + "loss": 1.4262, + "step": 14360 + }, + { + "epoch": 0.28, + "learning_rate": 9.53631447780106e-05, + "loss": 1.184, + "step": 14370 + }, + { + "epoch": 0.28, + "learning_rate": 9.535679083448892e-05, + "loss": 1.2905, + "step": 14380 + }, + { + "epoch": 0.28, + "learning_rate": 9.53504327524766e-05, + "loss": 1.3353, + "step": 14390 + }, + { + "epoch": 0.28, + "learning_rate": 9.534407053255378e-05, + "loss": 1.412, + "step": 14400 + }, + { + "epoch": 0.28, + "learning_rate": 9.5337704175301e-05, + "loss": 1.3826, + "step": 14410 + }, + { + "epoch": 0.28, + "learning_rate": 9.533133368129909e-05, + "loss": 1.2468, + "step": 14420 + }, + { + "epoch": 0.28, + "learning_rate": 9.532495905112938e-05, + "loss": 1.1994, + "step": 14430 + }, + { + "epoch": 0.28, + "learning_rate": 9.531858028537342e-05, + "loss": 1.3416, + "step": 14440 + }, + { + "epoch": 0.28, + "learning_rate": 9.53121973846133e-05, + "loss": 1.2393, + "step": 14450 + }, + { + "epoch": 0.28, + "learning_rate": 9.53058103494314e-05, + "loss": 1.1162, + "step": 14460 + }, + { + "epoch": 0.28, + "learning_rate": 9.52994191804105e-05, + "loss": 1.1246, + "step": 14470 + }, + { + "epoch": 0.28, + "learning_rate": 9.529302387813372e-05, + "loss": 1.259, + "step": 14480 + }, + { + "epoch": 0.28, + "learning_rate": 9.528662444318461e-05, + "loss": 1.4229, + "step": 14490 + }, + { + "epoch": 0.28, + "learning_rate": 9.528022087614708e-05, + "loss": 1.3106, + "step": 14500 + }, + { + "epoch": 0.28, + "learning_rate": 9.527381317760538e-05, + "loss": 1.3853, + "step": 14510 + }, + { + "epoch": 0.28, + "learning_rate": 9.526740134814418e-05, + "loss": 1.3745, + "step": 14520 + }, + { + "epoch": 0.28, + "learning_rate": 9.526098538834853e-05, + "loss": 1.3033, + "step": 14530 + }, + { + "epoch": 0.28, + "learning_rate": 9.525456529880383e-05, + "loss": 1.2273, + "step": 14540 + }, + { + "epoch": 0.28, + "learning_rate": 9.524814108009588e-05, + "loss": 1.3499, + "step": 14550 + }, + { + "epoch": 0.28, + "learning_rate": 9.524171273281083e-05, + "loss": 1.2546, + "step": 14560 + }, + { + "epoch": 0.28, + "learning_rate": 9.523528025753523e-05, + "loss": 1.2898, + "step": 14570 + }, + { + "epoch": 0.28, + "learning_rate": 9.522884365485598e-05, + "loss": 1.3143, + "step": 14580 + }, + { + "epoch": 0.28, + "learning_rate": 9.522240292536041e-05, + "loss": 1.304, + "step": 14590 + }, + { + "epoch": 0.28, + "learning_rate": 9.521595806963617e-05, + "loss": 1.3761, + "step": 14600 + }, + { + "epoch": 0.28, + "learning_rate": 9.520950908827131e-05, + "loss": 1.3788, + "step": 14610 + }, + { + "epoch": 0.28, + "learning_rate": 9.520305598185423e-05, + "loss": 1.3502, + "step": 14620 + }, + { + "epoch": 0.28, + "learning_rate": 9.519659875097378e-05, + "loss": 1.1854, + "step": 14630 + }, + { + "epoch": 0.28, + "learning_rate": 9.519013739621912e-05, + "loss": 1.3097, + "step": 14640 + }, + { + "epoch": 0.28, + "learning_rate": 9.518367191817979e-05, + "loss": 1.2704, + "step": 14650 + }, + { + "epoch": 0.28, + "learning_rate": 9.517720231744573e-05, + "loss": 1.3759, + "step": 14660 + }, + { + "epoch": 0.28, + "learning_rate": 9.517072859460723e-05, + "loss": 1.2764, + "step": 14670 + }, + { + "epoch": 0.28, + "learning_rate": 9.516425075025499e-05, + "loss": 1.2031, + "step": 14680 + }, + { + "epoch": 0.28, + "learning_rate": 9.515776878498006e-05, + "loss": 1.2731, + "step": 14690 + }, + { + "epoch": 0.28, + "learning_rate": 9.515128269937389e-05, + "loss": 1.0977, + "step": 14700 + }, + { + "epoch": 0.28, + "learning_rate": 9.514479249402827e-05, + "loss": 1.5174, + "step": 14710 + }, + { + "epoch": 0.28, + "learning_rate": 9.513829816953539e-05, + "loss": 1.184, + "step": 14720 + }, + { + "epoch": 0.28, + "learning_rate": 9.513179972648781e-05, + "loss": 1.2613, + "step": 14730 + }, + { + "epoch": 0.28, + "learning_rate": 9.512529716547848e-05, + "loss": 1.2177, + "step": 14740 + }, + { + "epoch": 0.28, + "learning_rate": 9.511879048710071e-05, + "loss": 1.4718, + "step": 14750 + }, + { + "epoch": 0.28, + "learning_rate": 9.511227969194818e-05, + "loss": 1.268, + "step": 14760 + }, + { + "epoch": 0.28, + "learning_rate": 9.510576478061495e-05, + "loss": 1.3361, + "step": 14770 + }, + { + "epoch": 0.28, + "learning_rate": 9.509924575369548e-05, + "loss": 1.1751, + "step": 14780 + }, + { + "epoch": 0.28, + "learning_rate": 9.509272261178457e-05, + "loss": 1.5077, + "step": 14790 + }, + { + "epoch": 0.28, + "learning_rate": 9.508619535547743e-05, + "loss": 1.3486, + "step": 14800 + }, + { + "epoch": 0.28, + "learning_rate": 9.507966398536959e-05, + "loss": 1.4725, + "step": 14810 + }, + { + "epoch": 0.28, + "learning_rate": 9.507312850205703e-05, + "loss": 1.3602, + "step": 14820 + }, + { + "epoch": 0.29, + "learning_rate": 9.506658890613604e-05, + "loss": 1.4216, + "step": 14830 + }, + { + "epoch": 0.29, + "learning_rate": 9.506004519820334e-05, + "loss": 1.54, + "step": 14840 + }, + { + "epoch": 0.29, + "learning_rate": 9.505349737885597e-05, + "loss": 1.0727, + "step": 14850 + }, + { + "epoch": 0.29, + "learning_rate": 9.50469454486914e-05, + "loss": 0.9894, + "step": 14860 + }, + { + "epoch": 0.29, + "learning_rate": 9.504038940830742e-05, + "loss": 1.3033, + "step": 14870 + }, + { + "epoch": 0.29, + "learning_rate": 9.503382925830223e-05, + "loss": 1.4206, + "step": 14880 + }, + { + "epoch": 0.29, + "learning_rate": 9.50272649992744e-05, + "loss": 1.2722, + "step": 14890 + }, + { + "epoch": 0.29, + "learning_rate": 9.502069663182289e-05, + "loss": 1.617, + "step": 14900 + }, + { + "epoch": 0.29, + "learning_rate": 9.501412415654702e-05, + "loss": 1.2825, + "step": 14910 + }, + { + "epoch": 0.29, + "learning_rate": 9.500754757404644e-05, + "loss": 0.9748, + "step": 14920 + }, + { + "epoch": 0.29, + "learning_rate": 9.500096688492127e-05, + "loss": 1.2113, + "step": 14930 + }, + { + "epoch": 0.29, + "learning_rate": 9.49943820897719e-05, + "loss": 1.3671, + "step": 14940 + }, + { + "epoch": 0.29, + "learning_rate": 9.498779318919917e-05, + "loss": 1.2903, + "step": 14950 + }, + { + "epoch": 0.29, + "learning_rate": 9.49812001838043e-05, + "loss": 1.0919, + "step": 14960 + }, + { + "epoch": 0.29, + "learning_rate": 9.49746030741888e-05, + "loss": 1.3182, + "step": 14970 + }, + { + "epoch": 0.29, + "learning_rate": 9.496800186095466e-05, + "loss": 1.2445, + "step": 14980 + }, + { + "epoch": 0.29, + "learning_rate": 9.496139654470418e-05, + "loss": 1.3082, + "step": 14990 + }, + { + "epoch": 0.29, + "learning_rate": 9.495478712604002e-05, + "loss": 1.4041, + "step": 15000 + }, + { + "epoch": 0.29, + "learning_rate": 9.494817360556528e-05, + "loss": 1.2026, + "step": 15010 + }, + { + "epoch": 0.29, + "learning_rate": 9.494155598388339e-05, + "loss": 1.2226, + "step": 15020 + }, + { + "epoch": 0.29, + "learning_rate": 9.493493426159813e-05, + "loss": 1.1804, + "step": 15030 + }, + { + "epoch": 0.29, + "learning_rate": 9.492830843931375e-05, + "loss": 1.2866, + "step": 15040 + }, + { + "epoch": 0.29, + "learning_rate": 9.492167851763475e-05, + "loss": 1.1852, + "step": 15050 + }, + { + "epoch": 0.29, + "learning_rate": 9.491504449716608e-05, + "loss": 1.2098, + "step": 15060 + }, + { + "epoch": 0.29, + "learning_rate": 9.490840637851307e-05, + "loss": 1.4086, + "step": 15070 + }, + { + "epoch": 0.29, + "learning_rate": 9.490176416228138e-05, + "loss": 1.2262, + "step": 15080 + }, + { + "epoch": 0.29, + "learning_rate": 9.489511784907707e-05, + "loss": 1.2831, + "step": 15090 + }, + { + "epoch": 0.29, + "learning_rate": 9.488846743950657e-05, + "loss": 1.2364, + "step": 15100 + }, + { + "epoch": 0.29, + "learning_rate": 9.48818129341767e-05, + "loss": 1.2609, + "step": 15110 + }, + { + "epoch": 0.29, + "learning_rate": 9.48751543336946e-05, + "loss": 1.3107, + "step": 15120 + }, + { + "epoch": 0.29, + "learning_rate": 9.486849163866786e-05, + "loss": 1.4669, + "step": 15130 + }, + { + "epoch": 0.29, + "learning_rate": 9.486182484970438e-05, + "loss": 1.2959, + "step": 15140 + }, + { + "epoch": 0.29, + "learning_rate": 9.485515396741247e-05, + "loss": 1.3684, + "step": 15150 + }, + { + "epoch": 0.29, + "learning_rate": 9.48484789924008e-05, + "loss": 1.3405, + "step": 15160 + }, + { + "epoch": 0.29, + "learning_rate": 9.48417999252784e-05, + "loss": 1.2239, + "step": 15170 + }, + { + "epoch": 0.29, + "learning_rate": 9.48351167666547e-05, + "loss": 1.1562, + "step": 15180 + }, + { + "epoch": 0.29, + "learning_rate": 9.48284295171395e-05, + "loss": 1.1647, + "step": 15190 + }, + { + "epoch": 0.29, + "learning_rate": 9.482173817734296e-05, + "loss": 1.5485, + "step": 15200 + }, + { + "epoch": 0.29, + "learning_rate": 9.48150427478756e-05, + "loss": 1.2677, + "step": 15210 + }, + { + "epoch": 0.29, + "learning_rate": 9.480834322934838e-05, + "loss": 1.0979, + "step": 15220 + }, + { + "epoch": 0.29, + "learning_rate": 9.480163962237251e-05, + "loss": 1.2109, + "step": 15230 + }, + { + "epoch": 0.29, + "learning_rate": 9.47949319275597e-05, + "loss": 1.3806, + "step": 15240 + }, + { + "epoch": 0.29, + "learning_rate": 9.478822014552197e-05, + "loss": 1.1895, + "step": 15250 + }, + { + "epoch": 0.29, + "learning_rate": 9.478150427687174e-05, + "loss": 1.1608, + "step": 15260 + }, + { + "epoch": 0.29, + "learning_rate": 9.477478432222174e-05, + "loss": 1.3987, + "step": 15270 + }, + { + "epoch": 0.29, + "learning_rate": 9.476806028218515e-05, + "loss": 1.3672, + "step": 15280 + }, + { + "epoch": 0.29, + "learning_rate": 9.476133215737551e-05, + "loss": 1.2423, + "step": 15290 + }, + { + "epoch": 0.29, + "learning_rate": 9.475459994840668e-05, + "loss": 1.3597, + "step": 15300 + }, + { + "epoch": 0.29, + "learning_rate": 9.474786365589292e-05, + "loss": 1.3544, + "step": 15310 + }, + { + "epoch": 0.29, + "learning_rate": 9.474112328044891e-05, + "loss": 1.1315, + "step": 15320 + }, + { + "epoch": 0.29, + "learning_rate": 9.473437882268964e-05, + "loss": 1.5525, + "step": 15330 + }, + { + "epoch": 0.29, + "learning_rate": 9.472763028323049e-05, + "loss": 1.3624, + "step": 15340 + }, + { + "epoch": 0.3, + "learning_rate": 9.472087766268722e-05, + "loss": 1.0602, + "step": 15350 + }, + { + "epoch": 0.3, + "learning_rate": 9.471412096167598e-05, + "loss": 1.2712, + "step": 15360 + }, + { + "epoch": 0.3, + "learning_rate": 9.470736018081325e-05, + "loss": 1.3102, + "step": 15370 + }, + { + "epoch": 0.3, + "learning_rate": 9.470059532071589e-05, + "loss": 1.3245, + "step": 15380 + }, + { + "epoch": 0.3, + "learning_rate": 9.469382638200118e-05, + "loss": 1.4467, + "step": 15390 + }, + { + "epoch": 0.3, + "learning_rate": 9.468705336528673e-05, + "loss": 1.2914, + "step": 15400 + }, + { + "epoch": 0.3, + "learning_rate": 9.468027627119052e-05, + "loss": 1.3871, + "step": 15410 + }, + { + "epoch": 0.3, + "learning_rate": 9.46734951003309e-05, + "loss": 1.4056, + "step": 15420 + }, + { + "epoch": 0.3, + "learning_rate": 9.466670985332664e-05, + "loss": 1.3288, + "step": 15430 + }, + { + "epoch": 0.3, + "learning_rate": 9.465992053079681e-05, + "loss": 1.384, + "step": 15440 + }, + { + "epoch": 0.3, + "learning_rate": 9.465312713336092e-05, + "loss": 1.343, + "step": 15450 + }, + { + "epoch": 0.3, + "learning_rate": 9.46463296616388e-05, + "loss": 1.2668, + "step": 15460 + }, + { + "epoch": 0.3, + "learning_rate": 9.463952811625068e-05, + "loss": 1.4113, + "step": 15470 + }, + { + "epoch": 0.3, + "learning_rate": 9.463272249781715e-05, + "loss": 1.255, + "step": 15480 + }, + { + "epoch": 0.3, + "learning_rate": 9.462591280695917e-05, + "loss": 1.4448, + "step": 15490 + }, + { + "epoch": 0.3, + "learning_rate": 9.461909904429808e-05, + "loss": 1.1872, + "step": 15500 + }, + { + "epoch": 0.3, + "learning_rate": 9.46122812104556e-05, + "loss": 1.1688, + "step": 15510 + }, + { + "epoch": 0.3, + "learning_rate": 9.460545930605382e-05, + "loss": 1.3372, + "step": 15520 + }, + { + "epoch": 0.3, + "learning_rate": 9.459863333171515e-05, + "loss": 1.1087, + "step": 15530 + }, + { + "epoch": 0.3, + "learning_rate": 9.459180328806244e-05, + "loss": 1.392, + "step": 15540 + }, + { + "epoch": 0.3, + "learning_rate": 9.458496917571889e-05, + "loss": 1.2342, + "step": 15550 + }, + { + "epoch": 0.3, + "learning_rate": 9.457813099530804e-05, + "loss": 1.3217, + "step": 15560 + }, + { + "epoch": 0.3, + "learning_rate": 9.457128874745382e-05, + "loss": 1.1034, + "step": 15570 + }, + { + "epoch": 0.3, + "learning_rate": 9.456444243278058e-05, + "loss": 1.2555, + "step": 15580 + }, + { + "epoch": 0.3, + "learning_rate": 9.455759205191298e-05, + "loss": 1.2213, + "step": 15590 + }, + { + "epoch": 0.3, + "learning_rate": 9.455073760547605e-05, + "loss": 1.3855, + "step": 15600 + }, + { + "epoch": 0.3, + "learning_rate": 9.454387909409524e-05, + "loss": 1.0471, + "step": 15610 + }, + { + "epoch": 0.3, + "learning_rate": 9.453701651839633e-05, + "loss": 1.1452, + "step": 15620 + }, + { + "epoch": 0.3, + "learning_rate": 9.453014987900547e-05, + "loss": 1.4643, + "step": 15630 + }, + { + "epoch": 0.3, + "learning_rate": 9.452327917654919e-05, + "loss": 1.3044, + "step": 15640 + }, + { + "epoch": 0.3, + "learning_rate": 9.451640441165443e-05, + "loss": 1.4161, + "step": 15650 + }, + { + "epoch": 0.3, + "learning_rate": 9.450952558494843e-05, + "loss": 1.397, + "step": 15660 + }, + { + "epoch": 0.3, + "learning_rate": 9.450264269705885e-05, + "loss": 1.2303, + "step": 15670 + }, + { + "epoch": 0.3, + "learning_rate": 9.44957557486137e-05, + "loss": 1.3004, + "step": 15680 + }, + { + "epoch": 0.3, + "learning_rate": 9.448886474024135e-05, + "loss": 1.2444, + "step": 15690 + }, + { + "epoch": 0.3, + "learning_rate": 9.44819696725706e-05, + "loss": 1.2657, + "step": 15700 + }, + { + "epoch": 0.3, + "learning_rate": 9.447507054623051e-05, + "loss": 1.1836, + "step": 15710 + }, + { + "epoch": 0.3, + "learning_rate": 9.446816736185065e-05, + "loss": 1.3029, + "step": 15720 + }, + { + "epoch": 0.3, + "learning_rate": 9.446126012006084e-05, + "loss": 1.3438, + "step": 15730 + }, + { + "epoch": 0.3, + "learning_rate": 9.445434882149133e-05, + "loss": 1.1912, + "step": 15740 + }, + { + "epoch": 0.3, + "learning_rate": 9.444743346677274e-05, + "loss": 1.1669, + "step": 15750 + }, + { + "epoch": 0.3, + "learning_rate": 9.444051405653604e-05, + "loss": 1.2661, + "step": 15760 + }, + { + "epoch": 0.3, + "learning_rate": 9.443359059141256e-05, + "loss": 1.3515, + "step": 15770 + }, + { + "epoch": 0.3, + "learning_rate": 9.442666307203405e-05, + "loss": 1.2333, + "step": 15780 + }, + { + "epoch": 0.3, + "learning_rate": 9.441973149903256e-05, + "loss": 1.3061, + "step": 15790 + }, + { + "epoch": 0.3, + "learning_rate": 9.441279587304058e-05, + "loss": 1.2485, + "step": 15800 + }, + { + "epoch": 0.3, + "learning_rate": 9.440585619469094e-05, + "loss": 1.2555, + "step": 15810 + }, + { + "epoch": 0.3, + "learning_rate": 9.43989124646168e-05, + "loss": 1.2486, + "step": 15820 + }, + { + "epoch": 0.3, + "learning_rate": 9.439196468345176e-05, + "loss": 1.4019, + "step": 15830 + }, + { + "epoch": 0.3, + "learning_rate": 9.438501285182975e-05, + "loss": 1.4258, + "step": 15840 + }, + { + "epoch": 0.3, + "learning_rate": 9.437805697038507e-05, + "loss": 1.213, + "step": 15850 + }, + { + "epoch": 0.3, + "learning_rate": 9.43710970397524e-05, + "loss": 1.3611, + "step": 15860 + }, + { + "epoch": 0.31, + "learning_rate": 9.436413306056678e-05, + "loss": 1.2525, + "step": 15870 + }, + { + "epoch": 0.31, + "learning_rate": 9.435716503346362e-05, + "loss": 1.2564, + "step": 15880 + }, + { + "epoch": 0.31, + "learning_rate": 9.435019295907872e-05, + "loss": 1.252, + "step": 15890 + }, + { + "epoch": 0.31, + "learning_rate": 9.434321683804824e-05, + "loss": 1.5885, + "step": 15900 + }, + { + "epoch": 0.31, + "learning_rate": 9.433623667100866e-05, + "loss": 1.1777, + "step": 15910 + }, + { + "epoch": 0.31, + "learning_rate": 9.432925245859691e-05, + "loss": 1.0543, + "step": 15920 + }, + { + "epoch": 0.31, + "learning_rate": 9.432226420145025e-05, + "loss": 1.3367, + "step": 15930 + }, + { + "epoch": 0.31, + "learning_rate": 9.431527190020628e-05, + "loss": 1.2429, + "step": 15940 + }, + { + "epoch": 0.31, + "learning_rate": 9.430827555550304e-05, + "loss": 1.2294, + "step": 15950 + }, + { + "epoch": 0.31, + "learning_rate": 9.430127516797886e-05, + "loss": 1.3431, + "step": 15960 + }, + { + "epoch": 0.31, + "learning_rate": 9.42942707382725e-05, + "loss": 1.3269, + "step": 15970 + }, + { + "epoch": 0.31, + "learning_rate": 9.428726226702304e-05, + "loss": 1.2602, + "step": 15980 + }, + { + "epoch": 0.31, + "learning_rate": 9.428024975487e-05, + "loss": 1.3442, + "step": 15990 + }, + { + "epoch": 0.31, + "learning_rate": 9.427323320245318e-05, + "loss": 1.2503, + "step": 16000 + }, + { + "epoch": 0.31, + "learning_rate": 9.426621261041279e-05, + "loss": 1.3511, + "step": 16010 + }, + { + "epoch": 0.31, + "learning_rate": 9.425918797938947e-05, + "loss": 1.1665, + "step": 16020 + }, + { + "epoch": 0.31, + "learning_rate": 9.42521593100241e-05, + "loss": 1.122, + "step": 16030 + }, + { + "epoch": 0.31, + "learning_rate": 9.4245126602958e-05, + "loss": 1.2693, + "step": 16040 + }, + { + "epoch": 0.31, + "learning_rate": 9.423808985883289e-05, + "loss": 1.3612, + "step": 16050 + }, + { + "epoch": 0.31, + "learning_rate": 9.423104907829082e-05, + "loss": 1.3019, + "step": 16060 + }, + { + "epoch": 0.31, + "learning_rate": 9.42240042619742e-05, + "loss": 1.2934, + "step": 16070 + }, + { + "epoch": 0.31, + "learning_rate": 9.421695541052582e-05, + "loss": 1.2136, + "step": 16080 + }, + { + "epoch": 0.31, + "learning_rate": 9.420990252458883e-05, + "loss": 1.2657, + "step": 16090 + }, + { + "epoch": 0.31, + "learning_rate": 9.420284560480679e-05, + "loss": 1.26, + "step": 16100 + }, + { + "epoch": 0.31, + "learning_rate": 9.419578465182357e-05, + "loss": 1.4128, + "step": 16110 + }, + { + "epoch": 0.31, + "learning_rate": 9.418871966628342e-05, + "loss": 1.2646, + "step": 16120 + }, + { + "epoch": 0.31, + "learning_rate": 9.4181650648831e-05, + "loss": 1.2914, + "step": 16130 + }, + { + "epoch": 0.31, + "learning_rate": 9.417457760011128e-05, + "loss": 1.0937, + "step": 16140 + }, + { + "epoch": 0.31, + "learning_rate": 9.416750052076966e-05, + "loss": 1.2951, + "step": 16150 + }, + { + "epoch": 0.31, + "learning_rate": 9.416041941145184e-05, + "loss": 1.2279, + "step": 16160 + }, + { + "epoch": 0.31, + "learning_rate": 9.415333427280394e-05, + "loss": 1.3275, + "step": 16170 + }, + { + "epoch": 0.31, + "learning_rate": 9.414624510547243e-05, + "loss": 1.1433, + "step": 16180 + }, + { + "epoch": 0.31, + "learning_rate": 9.413915191010414e-05, + "loss": 1.4721, + "step": 16190 + }, + { + "epoch": 0.31, + "learning_rate": 9.413205468734627e-05, + "loss": 1.1668, + "step": 16200 + }, + { + "epoch": 0.31, + "learning_rate": 9.412495343784642e-05, + "loss": 1.3639, + "step": 16210 + }, + { + "epoch": 0.31, + "learning_rate": 9.41178481622525e-05, + "loss": 1.2019, + "step": 16220 + }, + { + "epoch": 0.31, + "learning_rate": 9.411073886121282e-05, + "loss": 1.2207, + "step": 16230 + }, + { + "epoch": 0.31, + "learning_rate": 9.410362553537606e-05, + "loss": 1.1989, + "step": 16240 + }, + { + "epoch": 0.31, + "learning_rate": 9.409650818539127e-05, + "loss": 1.2435, + "step": 16250 + }, + { + "epoch": 0.31, + "learning_rate": 9.408938681190785e-05, + "loss": 1.2853, + "step": 16260 + }, + { + "epoch": 0.31, + "learning_rate": 9.408226141557557e-05, + "loss": 1.3813, + "step": 16270 + }, + { + "epoch": 0.31, + "learning_rate": 9.407513199704458e-05, + "loss": 1.4325, + "step": 16280 + }, + { + "epoch": 0.31, + "learning_rate": 9.406799855696539e-05, + "loss": 1.2085, + "step": 16290 + }, + { + "epoch": 0.31, + "learning_rate": 9.406086109598888e-05, + "loss": 1.2851, + "step": 16300 + }, + { + "epoch": 0.31, + "learning_rate": 9.405371961476628e-05, + "loss": 1.3606, + "step": 16310 + }, + { + "epoch": 0.31, + "learning_rate": 9.404657411394921e-05, + "loss": 1.2742, + "step": 16320 + }, + { + "epoch": 0.31, + "learning_rate": 9.403942459418967e-05, + "loss": 1.2141, + "step": 16330 + }, + { + "epoch": 0.31, + "learning_rate": 9.403227105613995e-05, + "loss": 1.3764, + "step": 16340 + }, + { + "epoch": 0.31, + "learning_rate": 9.402511350045279e-05, + "loss": 1.1283, + "step": 16350 + }, + { + "epoch": 0.31, + "learning_rate": 9.401795192778126e-05, + "loss": 1.2786, + "step": 16360 + }, + { + "epoch": 0.31, + "learning_rate": 9.401078633877884e-05, + "loss": 1.1966, + "step": 16370 + }, + { + "epoch": 0.31, + "learning_rate": 9.40036167340993e-05, + "loss": 1.4799, + "step": 16380 + }, + { + "epoch": 0.32, + "learning_rate": 9.399644311439682e-05, + "loss": 1.3863, + "step": 16390 + }, + { + "epoch": 0.32, + "learning_rate": 9.398926548032594e-05, + "loss": 1.2172, + "step": 16400 + }, + { + "epoch": 0.32, + "learning_rate": 9.398208383254159e-05, + "loss": 1.4485, + "step": 16410 + }, + { + "epoch": 0.32, + "learning_rate": 9.397489817169905e-05, + "loss": 1.4933, + "step": 16420 + }, + { + "epoch": 0.32, + "learning_rate": 9.396770849845392e-05, + "loss": 1.3489, + "step": 16430 + }, + { + "epoch": 0.32, + "learning_rate": 9.396051481346225e-05, + "loss": 1.2826, + "step": 16440 + }, + { + "epoch": 0.32, + "learning_rate": 9.395331711738038e-05, + "loss": 1.233, + "step": 16450 + }, + { + "epoch": 0.32, + "learning_rate": 9.394611541086508e-05, + "loss": 1.1535, + "step": 16460 + }, + { + "epoch": 0.32, + "learning_rate": 9.393890969457343e-05, + "loss": 1.0996, + "step": 16470 + }, + { + "epoch": 0.32, + "learning_rate": 9.39316999691629e-05, + "loss": 1.3907, + "step": 16480 + }, + { + "epoch": 0.32, + "learning_rate": 9.392448623529137e-05, + "loss": 1.3211, + "step": 16490 + }, + { + "epoch": 0.32, + "learning_rate": 9.3917268493617e-05, + "loss": 1.3094, + "step": 16500 + }, + { + "epoch": 0.32, + "learning_rate": 9.391004674479838e-05, + "loss": 1.3606, + "step": 16510 + }, + { + "epoch": 0.32, + "learning_rate": 9.390282098949443e-05, + "loss": 1.3413, + "step": 16520 + }, + { + "epoch": 0.32, + "learning_rate": 9.389559122836444e-05, + "loss": 1.3874, + "step": 16530 + }, + { + "epoch": 0.32, + "learning_rate": 9.388835746206812e-05, + "loss": 1.2007, + "step": 16540 + }, + { + "epoch": 0.32, + "learning_rate": 9.388111969126545e-05, + "loss": 1.4112, + "step": 16550 + }, + { + "epoch": 0.32, + "learning_rate": 9.387387791661685e-05, + "loss": 1.4398, + "step": 16560 + }, + { + "epoch": 0.32, + "learning_rate": 9.386663213878308e-05, + "loss": 1.2158, + "step": 16570 + }, + { + "epoch": 0.32, + "learning_rate": 9.385938235842526e-05, + "loss": 1.6013, + "step": 16580 + }, + { + "epoch": 0.32, + "learning_rate": 9.38521285762049e-05, + "loss": 1.2519, + "step": 16590 + }, + { + "epoch": 0.32, + "learning_rate": 9.384487079278383e-05, + "loss": 1.1838, + "step": 16600 + }, + { + "epoch": 0.32, + "learning_rate": 9.383760900882429e-05, + "loss": 1.2601, + "step": 16610 + }, + { + "epoch": 0.32, + "learning_rate": 9.383034322498886e-05, + "loss": 1.297, + "step": 16620 + }, + { + "epoch": 0.32, + "learning_rate": 9.38230734419405e-05, + "loss": 1.2262, + "step": 16630 + }, + { + "epoch": 0.32, + "learning_rate": 9.381579966034252e-05, + "loss": 1.543, + "step": 16640 + }, + { + "epoch": 0.32, + "learning_rate": 9.380852188085862e-05, + "loss": 1.3487, + "step": 16650 + }, + { + "epoch": 0.32, + "learning_rate": 9.38012401041528e-05, + "loss": 1.2489, + "step": 16660 + }, + { + "epoch": 0.32, + "learning_rate": 9.379395433088953e-05, + "loss": 1.2502, + "step": 16670 + }, + { + "epoch": 0.32, + "learning_rate": 9.378666456173355e-05, + "loss": 1.3287, + "step": 16680 + }, + { + "epoch": 0.32, + "learning_rate": 9.377937079735e-05, + "loss": 1.333, + "step": 16690 + }, + { + "epoch": 0.32, + "learning_rate": 9.377207303840441e-05, + "loss": 1.2786, + "step": 16700 + }, + { + "epoch": 0.32, + "learning_rate": 9.376477128556263e-05, + "loss": 1.1994, + "step": 16710 + }, + { + "epoch": 0.32, + "learning_rate": 9.375746553949087e-05, + "loss": 1.1303, + "step": 16720 + }, + { + "epoch": 0.32, + "learning_rate": 9.37501558008558e-05, + "loss": 1.132, + "step": 16730 + }, + { + "epoch": 0.32, + "learning_rate": 9.37428420703243e-05, + "loss": 1.2864, + "step": 16740 + }, + { + "epoch": 0.32, + "learning_rate": 9.373552434856374e-05, + "loss": 1.0516, + "step": 16750 + }, + { + "epoch": 0.32, + "learning_rate": 9.372820263624182e-05, + "loss": 1.2866, + "step": 16760 + }, + { + "epoch": 0.32, + "learning_rate": 9.372087693402658e-05, + "loss": 1.1245, + "step": 16770 + }, + { + "epoch": 0.32, + "learning_rate": 9.371354724258643e-05, + "loss": 1.4265, + "step": 16780 + }, + { + "epoch": 0.32, + "learning_rate": 9.370621356259018e-05, + "loss": 1.1376, + "step": 16790 + }, + { + "epoch": 0.32, + "learning_rate": 9.369887589470694e-05, + "loss": 1.4306, + "step": 16800 + }, + { + "epoch": 0.32, + "learning_rate": 9.369153423960626e-05, + "loss": 1.1678, + "step": 16810 + }, + { + "epoch": 0.32, + "learning_rate": 9.368418859795799e-05, + "loss": 1.2773, + "step": 16820 + }, + { + "epoch": 0.32, + "learning_rate": 9.367683897043238e-05, + "loss": 1.2845, + "step": 16830 + }, + { + "epoch": 0.32, + "learning_rate": 9.366948535770002e-05, + "loss": 1.3584, + "step": 16840 + }, + { + "epoch": 0.32, + "learning_rate": 9.366212776043188e-05, + "loss": 1.3543, + "step": 16850 + }, + { + "epoch": 0.32, + "learning_rate": 9.36547661792993e-05, + "loss": 1.146, + "step": 16860 + }, + { + "epoch": 0.32, + "learning_rate": 9.364740061497397e-05, + "loss": 1.3677, + "step": 16870 + }, + { + "epoch": 0.32, + "learning_rate": 9.364003106812793e-05, + "loss": 1.2294, + "step": 16880 + }, + { + "epoch": 0.32, + "learning_rate": 9.363265753943361e-05, + "loss": 1.2105, + "step": 16890 + }, + { + "epoch": 0.32, + "learning_rate": 9.36252800295638e-05, + "loss": 1.1968, + "step": 16900 + }, + { + "epoch": 0.33, + "learning_rate": 9.361789853919164e-05, + "loss": 1.2331, + "step": 16910 + }, + { + "epoch": 0.33, + "learning_rate": 9.361051306899065e-05, + "loss": 1.1401, + "step": 16920 + }, + { + "epoch": 0.33, + "learning_rate": 9.360312361963468e-05, + "loss": 1.2848, + "step": 16930 + }, + { + "epoch": 0.33, + "learning_rate": 9.359573019179798e-05, + "loss": 1.283, + "step": 16940 + }, + { + "epoch": 0.33, + "learning_rate": 9.358833278615516e-05, + "loss": 1.4469, + "step": 16950 + }, + { + "epoch": 0.33, + "learning_rate": 9.358093140338116e-05, + "loss": 1.2231, + "step": 16960 + }, + { + "epoch": 0.33, + "learning_rate": 9.35735260441513e-05, + "loss": 1.6433, + "step": 16970 + }, + { + "epoch": 0.33, + "learning_rate": 9.35661167091413e-05, + "loss": 1.2125, + "step": 16980 + }, + { + "epoch": 0.33, + "learning_rate": 9.355870339902718e-05, + "loss": 1.2966, + "step": 16990 + }, + { + "epoch": 0.33, + "learning_rate": 9.355128611448536e-05, + "loss": 1.1292, + "step": 17000 + }, + { + "epoch": 0.33, + "learning_rate": 9.354386485619264e-05, + "loss": 1.3132, + "step": 17010 + }, + { + "epoch": 0.33, + "learning_rate": 9.353643962482612e-05, + "loss": 1.6297, + "step": 17020 + }, + { + "epoch": 0.33, + "learning_rate": 9.352901042106332e-05, + "loss": 1.2072, + "step": 17030 + }, + { + "epoch": 0.33, + "learning_rate": 9.35215772455821e-05, + "loss": 1.322, + "step": 17040 + }, + { + "epoch": 0.33, + "learning_rate": 9.35141400990607e-05, + "loss": 1.4751, + "step": 17050 + }, + { + "epoch": 0.33, + "learning_rate": 9.350669898217768e-05, + "loss": 1.6172, + "step": 17060 + }, + { + "epoch": 0.33, + "learning_rate": 9.349925389561201e-05, + "loss": 1.2036, + "step": 17070 + }, + { + "epoch": 0.33, + "learning_rate": 9.349180484004299e-05, + "loss": 1.3299, + "step": 17080 + }, + { + "epoch": 0.33, + "learning_rate": 9.34843518161503e-05, + "loss": 1.2185, + "step": 17090 + }, + { + "epoch": 0.33, + "learning_rate": 9.347689482461398e-05, + "loss": 1.1816, + "step": 17100 + }, + { + "epoch": 0.33, + "learning_rate": 9.346943386611442e-05, + "loss": 1.4984, + "step": 17110 + }, + { + "epoch": 0.33, + "learning_rate": 9.346196894133239e-05, + "loss": 1.2053, + "step": 17120 + }, + { + "epoch": 0.33, + "learning_rate": 9.345450005094902e-05, + "loss": 1.4044, + "step": 17130 + }, + { + "epoch": 0.33, + "learning_rate": 9.344702719564576e-05, + "loss": 1.368, + "step": 17140 + }, + { + "epoch": 0.33, + "learning_rate": 9.34395503761045e-05, + "loss": 1.6843, + "step": 17150 + }, + { + "epoch": 0.33, + "learning_rate": 9.34320695930074e-05, + "loss": 1.2494, + "step": 17160 + }, + { + "epoch": 0.33, + "learning_rate": 9.342458484703708e-05, + "loss": 1.4661, + "step": 17170 + }, + { + "epoch": 0.33, + "learning_rate": 9.341709613887643e-05, + "loss": 1.2289, + "step": 17180 + }, + { + "epoch": 0.33, + "learning_rate": 9.340960346920877e-05, + "loss": 1.3002, + "step": 17190 + }, + { + "epoch": 0.33, + "learning_rate": 9.340210683871773e-05, + "loss": 1.3765, + "step": 17200 + }, + { + "epoch": 0.33, + "learning_rate": 9.339460624808733e-05, + "loss": 1.2281, + "step": 17210 + }, + { + "epoch": 0.33, + "learning_rate": 9.338710169800198e-05, + "loss": 1.1963, + "step": 17220 + }, + { + "epoch": 0.33, + "learning_rate": 9.337959318914638e-05, + "loss": 1.1941, + "step": 17230 + }, + { + "epoch": 0.33, + "learning_rate": 9.337208072220563e-05, + "loss": 1.1274, + "step": 17240 + }, + { + "epoch": 0.33, + "learning_rate": 9.33645642978652e-05, + "loss": 1.2854, + "step": 17250 + }, + { + "epoch": 0.33, + "learning_rate": 9.335704391681092e-05, + "loss": 1.1231, + "step": 17260 + }, + { + "epoch": 0.33, + "learning_rate": 9.334951957972898e-05, + "loss": 1.3419, + "step": 17270 + }, + { + "epoch": 0.33, + "learning_rate": 9.334199128730587e-05, + "loss": 1.2927, + "step": 17280 + }, + { + "epoch": 0.33, + "learning_rate": 9.333445904022856e-05, + "loss": 1.1611, + "step": 17290 + }, + { + "epoch": 0.33, + "learning_rate": 9.332692283918427e-05, + "loss": 1.237, + "step": 17300 + }, + { + "epoch": 0.33, + "learning_rate": 9.331938268486065e-05, + "loss": 1.2885, + "step": 17310 + }, + { + "epoch": 0.33, + "learning_rate": 9.331183857794569e-05, + "loss": 1.1829, + "step": 17320 + }, + { + "epoch": 0.33, + "learning_rate": 9.33042905191277e-05, + "loss": 1.4356, + "step": 17330 + }, + { + "epoch": 0.33, + "learning_rate": 9.329673850909544e-05, + "loss": 1.328, + "step": 17340 + }, + { + "epoch": 0.33, + "learning_rate": 9.328918254853794e-05, + "loss": 1.6546, + "step": 17350 + }, + { + "epoch": 0.33, + "learning_rate": 9.328162263814463e-05, + "loss": 1.2788, + "step": 17360 + }, + { + "epoch": 0.33, + "learning_rate": 9.327405877860533e-05, + "loss": 1.4134, + "step": 17370 + }, + { + "epoch": 0.33, + "learning_rate": 9.326649097061015e-05, + "loss": 1.0333, + "step": 17380 + }, + { + "epoch": 0.33, + "learning_rate": 9.325891921484964e-05, + "loss": 1.4625, + "step": 17390 + }, + { + "epoch": 0.33, + "learning_rate": 9.325134351201463e-05, + "loss": 0.9974, + "step": 17400 + }, + { + "epoch": 0.33, + "learning_rate": 9.324376386279637e-05, + "loss": 1.1835, + "step": 17410 + }, + { + "epoch": 0.33, + "learning_rate": 9.323618026788645e-05, + "loss": 1.1063, + "step": 17420 + }, + { + "epoch": 0.34, + "learning_rate": 9.322859272797684e-05, + "loss": 1.3024, + "step": 17430 + }, + { + "epoch": 0.34, + "learning_rate": 9.322100124375981e-05, + "loss": 1.2947, + "step": 17440 + }, + { + "epoch": 0.34, + "learning_rate": 9.321340581592804e-05, + "loss": 1.2849, + "step": 17450 + }, + { + "epoch": 0.34, + "learning_rate": 9.320580644517458e-05, + "loss": 1.4357, + "step": 17460 + }, + { + "epoch": 0.34, + "learning_rate": 9.319820313219281e-05, + "loss": 1.294, + "step": 17470 + }, + { + "epoch": 0.34, + "learning_rate": 9.319059587767647e-05, + "loss": 1.3898, + "step": 17480 + }, + { + "epoch": 0.34, + "learning_rate": 9.318298468231967e-05, + "loss": 1.2725, + "step": 17490 + }, + { + "epoch": 0.34, + "learning_rate": 9.31753695468169e-05, + "loss": 1.2791, + "step": 17500 + }, + { + "epoch": 0.34, + "learning_rate": 9.316775047186296e-05, + "loss": 1.0679, + "step": 17510 + }, + { + "epoch": 0.34, + "learning_rate": 9.316012745815306e-05, + "loss": 1.2829, + "step": 17520 + }, + { + "epoch": 0.34, + "learning_rate": 9.315250050638274e-05, + "loss": 1.2124, + "step": 17530 + }, + { + "epoch": 0.34, + "learning_rate": 9.314486961724788e-05, + "loss": 1.4354, + "step": 17540 + }, + { + "epoch": 0.34, + "learning_rate": 9.313723479144478e-05, + "loss": 1.0578, + "step": 17550 + }, + { + "epoch": 0.34, + "learning_rate": 9.312959602967006e-05, + "loss": 1.3993, + "step": 17560 + }, + { + "epoch": 0.34, + "learning_rate": 9.31219533326207e-05, + "loss": 1.3431, + "step": 17570 + }, + { + "epoch": 0.34, + "learning_rate": 9.311430670099402e-05, + "loss": 1.5156, + "step": 17580 + }, + { + "epoch": 0.34, + "learning_rate": 9.310665613548775e-05, + "loss": 1.2122, + "step": 17590 + }, + { + "epoch": 0.34, + "learning_rate": 9.309900163679996e-05, + "loss": 1.2211, + "step": 17600 + }, + { + "epoch": 0.34, + "learning_rate": 9.309134320562902e-05, + "loss": 1.3607, + "step": 17610 + }, + { + "epoch": 0.34, + "learning_rate": 9.308368084267376e-05, + "loss": 1.4265, + "step": 17620 + }, + { + "epoch": 0.34, + "learning_rate": 9.307601454863331e-05, + "loss": 1.3635, + "step": 17630 + }, + { + "epoch": 0.34, + "learning_rate": 9.306834432420712e-05, + "loss": 1.2899, + "step": 17640 + }, + { + "epoch": 0.34, + "learning_rate": 9.30606701700951e-05, + "loss": 1.1361, + "step": 17650 + }, + { + "epoch": 0.34, + "learning_rate": 9.305299208699742e-05, + "loss": 1.2038, + "step": 17660 + }, + { + "epoch": 0.34, + "learning_rate": 9.30453100756147e-05, + "loss": 1.2701, + "step": 17670 + }, + { + "epoch": 0.34, + "learning_rate": 9.303762413664781e-05, + "loss": 1.351, + "step": 17680 + }, + { + "epoch": 0.34, + "learning_rate": 9.302993427079809e-05, + "loss": 1.0281, + "step": 17690 + }, + { + "epoch": 0.34, + "learning_rate": 9.302224047876717e-05, + "loss": 1.3172, + "step": 17700 + }, + { + "epoch": 0.34, + "learning_rate": 9.301454276125704e-05, + "loss": 1.431, + "step": 17710 + }, + { + "epoch": 0.34, + "learning_rate": 9.300684111897008e-05, + "loss": 1.5343, + "step": 17720 + }, + { + "epoch": 0.34, + "learning_rate": 9.2999135552609e-05, + "loss": 1.2087, + "step": 17730 + }, + { + "epoch": 0.34, + "learning_rate": 9.299142606287688e-05, + "loss": 1.2349, + "step": 17740 + }, + { + "epoch": 0.34, + "learning_rate": 9.298371265047718e-05, + "loss": 1.4836, + "step": 17750 + }, + { + "epoch": 0.34, + "learning_rate": 9.297599531611366e-05, + "loss": 1.2087, + "step": 17760 + }, + { + "epoch": 0.34, + "learning_rate": 9.29682740604905e-05, + "loss": 1.0398, + "step": 17770 + }, + { + "epoch": 0.34, + "learning_rate": 9.296054888431219e-05, + "loss": 1.3909, + "step": 17780 + }, + { + "epoch": 0.34, + "learning_rate": 9.295281978828362e-05, + "loss": 1.2426, + "step": 17790 + }, + { + "epoch": 0.34, + "learning_rate": 9.294508677311e-05, + "loss": 1.1036, + "step": 17800 + }, + { + "epoch": 0.34, + "learning_rate": 9.293734983949691e-05, + "loss": 1.3398, + "step": 17810 + }, + { + "epoch": 0.34, + "learning_rate": 9.292960898815032e-05, + "loss": 1.3364, + "step": 17820 + }, + { + "epoch": 0.34, + "learning_rate": 9.292186421977648e-05, + "loss": 1.1406, + "step": 17830 + }, + { + "epoch": 0.34, + "learning_rate": 9.29141155350821e-05, + "loss": 0.9932, + "step": 17840 + }, + { + "epoch": 0.34, + "learning_rate": 9.290636293477417e-05, + "loss": 1.2885, + "step": 17850 + }, + { + "epoch": 0.34, + "learning_rate": 9.289860641956004e-05, + "loss": 1.3683, + "step": 17860 + }, + { + "epoch": 0.34, + "learning_rate": 9.289084599014746e-05, + "loss": 1.27, + "step": 17870 + }, + { + "epoch": 0.34, + "learning_rate": 9.288308164724452e-05, + "loss": 1.2984, + "step": 17880 + }, + { + "epoch": 0.34, + "learning_rate": 9.287531339155963e-05, + "loss": 1.4012, + "step": 17890 + }, + { + "epoch": 0.34, + "learning_rate": 9.286754122380165e-05, + "loss": 1.1286, + "step": 17900 + }, + { + "epoch": 0.34, + "learning_rate": 9.285976514467968e-05, + "loss": 1.168, + "step": 17910 + }, + { + "epoch": 0.34, + "learning_rate": 9.285198515490325e-05, + "loss": 1.1317, + "step": 17920 + }, + { + "epoch": 0.34, + "learning_rate": 9.284420125518223e-05, + "loss": 1.3636, + "step": 17930 + }, + { + "epoch": 0.34, + "learning_rate": 9.283641344622684e-05, + "loss": 0.9423, + "step": 17940 + }, + { + "epoch": 0.35, + "learning_rate": 9.28286217287477e-05, + "loss": 1.3026, + "step": 17950 + }, + { + "epoch": 0.35, + "learning_rate": 9.28208261034557e-05, + "loss": 1.2703, + "step": 17960 + }, + { + "epoch": 0.35, + "learning_rate": 9.281302657106217e-05, + "loss": 1.3029, + "step": 17970 + }, + { + "epoch": 0.35, + "learning_rate": 9.280522313227873e-05, + "loss": 1.4293, + "step": 17980 + }, + { + "epoch": 0.35, + "learning_rate": 9.279741578781742e-05, + "loss": 1.1543, + "step": 17990 + }, + { + "epoch": 0.35, + "learning_rate": 9.27896045383906e-05, + "loss": 1.1441, + "step": 18000 + }, + { + "epoch": 0.35, + "learning_rate": 9.278178938471098e-05, + "loss": 1.2155, + "step": 18010 + }, + { + "epoch": 0.35, + "learning_rate": 9.277397032749164e-05, + "loss": 1.3241, + "step": 18020 + }, + { + "epoch": 0.35, + "learning_rate": 9.276614736744604e-05, + "loss": 1.1803, + "step": 18030 + }, + { + "epoch": 0.35, + "learning_rate": 9.275832050528794e-05, + "loss": 1.0748, + "step": 18040 + }, + { + "epoch": 0.35, + "learning_rate": 9.27504897417315e-05, + "loss": 1.4759, + "step": 18050 + }, + { + "epoch": 0.35, + "learning_rate": 9.274265507749121e-05, + "loss": 1.514, + "step": 18060 + }, + { + "epoch": 0.35, + "learning_rate": 9.273481651328194e-05, + "loss": 1.1424, + "step": 18070 + }, + { + "epoch": 0.35, + "learning_rate": 9.272697404981892e-05, + "loss": 1.3387, + "step": 18080 + }, + { + "epoch": 0.35, + "learning_rate": 9.271912768781768e-05, + "loss": 1.3487, + "step": 18090 + }, + { + "epoch": 0.35, + "learning_rate": 9.271127742799417e-05, + "loss": 1.3531, + "step": 18100 + }, + { + "epoch": 0.35, + "learning_rate": 9.270342327106467e-05, + "loss": 1.5283, + "step": 18110 + }, + { + "epoch": 0.35, + "learning_rate": 9.269556521774582e-05, + "loss": 1.429, + "step": 18120 + }, + { + "epoch": 0.35, + "learning_rate": 9.268770326875462e-05, + "loss": 1.4716, + "step": 18130 + }, + { + "epoch": 0.35, + "learning_rate": 9.26798374248084e-05, + "loss": 1.1919, + "step": 18140 + }, + { + "epoch": 0.35, + "learning_rate": 9.267196768662488e-05, + "loss": 1.2246, + "step": 18150 + }, + { + "epoch": 0.35, + "learning_rate": 9.266409405492209e-05, + "loss": 1.0055, + "step": 18160 + }, + { + "epoch": 0.35, + "learning_rate": 9.265621653041848e-05, + "loss": 1.2463, + "step": 18170 + }, + { + "epoch": 0.35, + "learning_rate": 9.264833511383279e-05, + "loss": 1.2515, + "step": 18180 + }, + { + "epoch": 0.35, + "learning_rate": 9.264044980588416e-05, + "loss": 1.299, + "step": 18190 + }, + { + "epoch": 0.35, + "learning_rate": 9.263256060729206e-05, + "loss": 1.3153, + "step": 18200 + }, + { + "epoch": 0.35, + "learning_rate": 9.262466751877634e-05, + "loss": 1.3898, + "step": 18210 + }, + { + "epoch": 0.35, + "learning_rate": 9.261677054105717e-05, + "loss": 1.2996, + "step": 18220 + }, + { + "epoch": 0.35, + "learning_rate": 9.260886967485511e-05, + "loss": 1.3104, + "step": 18230 + }, + { + "epoch": 0.35, + "learning_rate": 9.260096492089105e-05, + "loss": 1.1722, + "step": 18240 + }, + { + "epoch": 0.35, + "learning_rate": 9.259305627988624e-05, + "loss": 1.2576, + "step": 18250 + }, + { + "epoch": 0.35, + "learning_rate": 9.258514375256231e-05, + "loss": 1.0259, + "step": 18260 + }, + { + "epoch": 0.35, + "learning_rate": 9.25772273396412e-05, + "loss": 1.3075, + "step": 18270 + }, + { + "epoch": 0.35, + "learning_rate": 9.256930704184524e-05, + "loss": 1.1774, + "step": 18280 + }, + { + "epoch": 0.35, + "learning_rate": 9.256138285989709e-05, + "loss": 1.2613, + "step": 18290 + }, + { + "epoch": 0.35, + "learning_rate": 9.255345479451977e-05, + "loss": 1.315, + "step": 18300 + }, + { + "epoch": 0.35, + "learning_rate": 9.25455228464367e-05, + "loss": 1.2115, + "step": 18310 + }, + { + "epoch": 0.35, + "learning_rate": 9.253758701637156e-05, + "loss": 1.1275, + "step": 18320 + }, + { + "epoch": 0.35, + "learning_rate": 9.252964730504848e-05, + "loss": 1.2247, + "step": 18330 + }, + { + "epoch": 0.35, + "learning_rate": 9.252170371319189e-05, + "loss": 1.3678, + "step": 18340 + }, + { + "epoch": 0.35, + "learning_rate": 9.25137562415266e-05, + "loss": 1.3899, + "step": 18350 + }, + { + "epoch": 0.35, + "learning_rate": 9.250580489077774e-05, + "loss": 1.1713, + "step": 18360 + }, + { + "epoch": 0.35, + "learning_rate": 9.24978496616708e-05, + "loss": 1.2295, + "step": 18370 + }, + { + "epoch": 0.35, + "learning_rate": 9.248989055493171e-05, + "loss": 1.4002, + "step": 18380 + }, + { + "epoch": 0.35, + "learning_rate": 9.248192757128661e-05, + "loss": 1.5625, + "step": 18390 + }, + { + "epoch": 0.35, + "learning_rate": 9.24739607114621e-05, + "loss": 1.2804, + "step": 18400 + }, + { + "epoch": 0.35, + "learning_rate": 9.24659899761851e-05, + "loss": 1.3862, + "step": 18410 + }, + { + "epoch": 0.35, + "learning_rate": 9.245801536618286e-05, + "loss": 1.2346, + "step": 18420 + }, + { + "epoch": 0.35, + "learning_rate": 9.245003688218303e-05, + "loss": 1.4635, + "step": 18430 + }, + { + "epoch": 0.35, + "learning_rate": 9.244205452491359e-05, + "loss": 1.3998, + "step": 18440 + }, + { + "epoch": 0.35, + "learning_rate": 9.243406829510287e-05, + "loss": 1.1615, + "step": 18450 + }, + { + "epoch": 0.35, + "learning_rate": 9.242607819347958e-05, + "loss": 1.219, + "step": 18460 + }, + { + "epoch": 0.36, + "learning_rate": 9.24180842207727e-05, + "loss": 1.2745, + "step": 18470 + }, + { + "epoch": 0.36, + "learning_rate": 9.24100863777117e-05, + "loss": 1.1178, + "step": 18480 + }, + { + "epoch": 0.36, + "learning_rate": 9.240208466502625e-05, + "loss": 1.0944, + "step": 18490 + }, + { + "epoch": 0.36, + "learning_rate": 9.239407908344652e-05, + "loss": 1.3658, + "step": 18500 + }, + { + "epoch": 0.36, + "learning_rate": 9.238606963370293e-05, + "loss": 1.2966, + "step": 18510 + }, + { + "epoch": 0.36, + "learning_rate": 9.23780563165263e-05, + "loss": 1.2591, + "step": 18520 + }, + { + "epoch": 0.36, + "learning_rate": 9.237003913264776e-05, + "loss": 1.0441, + "step": 18530 + }, + { + "epoch": 0.36, + "learning_rate": 9.236201808279886e-05, + "loss": 1.2045, + "step": 18540 + }, + { + "epoch": 0.36, + "learning_rate": 9.235399316771143e-05, + "loss": 1.3507, + "step": 18550 + }, + { + "epoch": 0.36, + "learning_rate": 9.234596438811771e-05, + "loss": 1.1446, + "step": 18560 + }, + { + "epoch": 0.36, + "learning_rate": 9.233793174475028e-05, + "loss": 1.1164, + "step": 18570 + }, + { + "epoch": 0.36, + "learning_rate": 9.232989523834204e-05, + "loss": 1.2103, + "step": 18580 + }, + { + "epoch": 0.36, + "learning_rate": 9.232185486962627e-05, + "loss": 1.3485, + "step": 18590 + }, + { + "epoch": 0.36, + "learning_rate": 9.231381063933659e-05, + "loss": 1.1548, + "step": 18600 + }, + { + "epoch": 0.36, + "learning_rate": 9.230576254820702e-05, + "loss": 1.2474, + "step": 18610 + }, + { + "epoch": 0.36, + "learning_rate": 9.229771059697184e-05, + "loss": 1.2301, + "step": 18620 + }, + { + "epoch": 0.36, + "learning_rate": 9.228965478636575e-05, + "loss": 1.3635, + "step": 18630 + }, + { + "epoch": 0.36, + "learning_rate": 9.228159511712381e-05, + "loss": 1.4085, + "step": 18640 + }, + { + "epoch": 0.36, + "learning_rate": 9.227353158998139e-05, + "loss": 1.2616, + "step": 18650 + }, + { + "epoch": 0.36, + "learning_rate": 9.226546420567422e-05, + "loss": 1.1465, + "step": 18660 + }, + { + "epoch": 0.36, + "learning_rate": 9.22573929649384e-05, + "loss": 1.249, + "step": 18670 + }, + { + "epoch": 0.36, + "learning_rate": 9.224931786851041e-05, + "loss": 1.1245, + "step": 18680 + }, + { + "epoch": 0.36, + "learning_rate": 9.2241238917127e-05, + "loss": 1.3263, + "step": 18690 + }, + { + "epoch": 0.36, + "learning_rate": 9.223315611152531e-05, + "loss": 1.2855, + "step": 18700 + }, + { + "epoch": 0.36, + "learning_rate": 9.22250694524429e-05, + "loss": 1.2554, + "step": 18710 + }, + { + "epoch": 0.36, + "learning_rate": 9.221697894061756e-05, + "loss": 1.4284, + "step": 18720 + }, + { + "epoch": 0.36, + "learning_rate": 9.220888457678752e-05, + "loss": 1.4104, + "step": 18730 + }, + { + "epoch": 0.36, + "learning_rate": 9.220078636169134e-05, + "loss": 1.3955, + "step": 18740 + }, + { + "epoch": 0.36, + "learning_rate": 9.21926842960679e-05, + "loss": 1.1677, + "step": 18750 + }, + { + "epoch": 0.36, + "learning_rate": 9.21845783806565e-05, + "loss": 1.0718, + "step": 18760 + }, + { + "epoch": 0.36, + "learning_rate": 9.21764686161967e-05, + "loss": 1.2162, + "step": 18770 + }, + { + "epoch": 0.36, + "learning_rate": 9.21683550034285e-05, + "loss": 1.2101, + "step": 18780 + }, + { + "epoch": 0.36, + "learning_rate": 9.216023754309218e-05, + "loss": 1.1701, + "step": 18790 + }, + { + "epoch": 0.36, + "learning_rate": 9.215211623592842e-05, + "loss": 1.2087, + "step": 18800 + }, + { + "epoch": 0.36, + "learning_rate": 9.214399108267822e-05, + "loss": 1.2124, + "step": 18810 + }, + { + "epoch": 0.36, + "learning_rate": 9.213586208408294e-05, + "loss": 1.1733, + "step": 18820 + }, + { + "epoch": 0.36, + "learning_rate": 9.21277292408843e-05, + "loss": 1.1636, + "step": 18830 + }, + { + "epoch": 0.36, + "learning_rate": 9.21195925538244e-05, + "loss": 1.3481, + "step": 18840 + }, + { + "epoch": 0.36, + "learning_rate": 9.21114520236456e-05, + "loss": 1.4059, + "step": 18850 + }, + { + "epoch": 0.36, + "learning_rate": 9.21033076510907e-05, + "loss": 1.2956, + "step": 18860 + }, + { + "epoch": 0.36, + "learning_rate": 9.209515943690281e-05, + "loss": 1.3075, + "step": 18870 + }, + { + "epoch": 0.36, + "learning_rate": 9.208700738182539e-05, + "loss": 1.2157, + "step": 18880 + }, + { + "epoch": 0.36, + "learning_rate": 9.207885148660226e-05, + "loss": 1.2487, + "step": 18890 + }, + { + "epoch": 0.36, + "learning_rate": 9.207069175197762e-05, + "loss": 1.4118, + "step": 18900 + }, + { + "epoch": 0.36, + "learning_rate": 9.206252817869594e-05, + "loss": 1.3536, + "step": 18910 + }, + { + "epoch": 0.36, + "learning_rate": 9.205436076750212e-05, + "loss": 1.3249, + "step": 18920 + }, + { + "epoch": 0.36, + "learning_rate": 9.204618951914137e-05, + "loss": 1.4284, + "step": 18930 + }, + { + "epoch": 0.36, + "learning_rate": 9.203801443435924e-05, + "loss": 1.4646, + "step": 18940 + }, + { + "epoch": 0.36, + "learning_rate": 9.20298355139017e-05, + "loss": 1.2792, + "step": 18950 + }, + { + "epoch": 0.36, + "learning_rate": 9.202165275851497e-05, + "loss": 1.1213, + "step": 18960 + }, + { + "epoch": 0.36, + "learning_rate": 9.201346616894568e-05, + "loss": 1.1528, + "step": 18970 + }, + { + "epoch": 0.36, + "learning_rate": 9.200527574594082e-05, + "loss": 1.2696, + "step": 18980 + }, + { + "epoch": 0.37, + "learning_rate": 9.199708149024769e-05, + "loss": 1.2345, + "step": 18990 + }, + { + "epoch": 0.37, + "learning_rate": 9.198888340261397e-05, + "loss": 1.5037, + "step": 19000 + }, + { + "epoch": 0.37, + "learning_rate": 9.198068148378767e-05, + "loss": 1.1251, + "step": 19010 + }, + { + "epoch": 0.37, + "learning_rate": 9.197247573451718e-05, + "loss": 1.1563, + "step": 19020 + }, + { + "epoch": 0.37, + "learning_rate": 9.196426615555116e-05, + "loss": 1.1353, + "step": 19030 + }, + { + "epoch": 0.37, + "learning_rate": 9.195605274763875e-05, + "loss": 1.2654, + "step": 19040 + }, + { + "epoch": 0.37, + "learning_rate": 9.19478355115293e-05, + "loss": 1.3081, + "step": 19050 + }, + { + "epoch": 0.37, + "learning_rate": 9.193961444797263e-05, + "loss": 1.3418, + "step": 19060 + }, + { + "epoch": 0.37, + "learning_rate": 9.193138955771883e-05, + "loss": 1.3319, + "step": 19070 + }, + { + "epoch": 0.37, + "learning_rate": 9.192316084151835e-05, + "loss": 1.2861, + "step": 19080 + }, + { + "epoch": 0.37, + "learning_rate": 9.191492830012202e-05, + "loss": 1.4887, + "step": 19090 + }, + { + "epoch": 0.37, + "learning_rate": 9.190669193428101e-05, + "loss": 1.1558, + "step": 19100 + }, + { + "epoch": 0.37, + "learning_rate": 9.189845174474681e-05, + "loss": 1.2116, + "step": 19110 + }, + { + "epoch": 0.37, + "learning_rate": 9.18902077322713e-05, + "loss": 1.0554, + "step": 19120 + }, + { + "epoch": 0.37, + "learning_rate": 9.188195989760668e-05, + "loss": 1.2884, + "step": 19130 + }, + { + "epoch": 0.37, + "learning_rate": 9.18737082415055e-05, + "loss": 1.2485, + "step": 19140 + }, + { + "epoch": 0.37, + "learning_rate": 9.186545276472067e-05, + "loss": 1.0407, + "step": 19150 + }, + { + "epoch": 0.37, + "learning_rate": 9.185719346800546e-05, + "loss": 1.2874, + "step": 19160 + }, + { + "epoch": 0.37, + "learning_rate": 9.184893035211346e-05, + "loss": 1.2883, + "step": 19170 + }, + { + "epoch": 0.37, + "learning_rate": 9.184066341779862e-05, + "loss": 1.1917, + "step": 19180 + }, + { + "epoch": 0.37, + "learning_rate": 9.183239266581523e-05, + "loss": 1.1768, + "step": 19190 + }, + { + "epoch": 0.37, + "learning_rate": 9.182411809691795e-05, + "loss": 1.2362, + "step": 19200 + }, + { + "epoch": 0.37, + "learning_rate": 9.181583971186179e-05, + "loss": 1.2328, + "step": 19210 + }, + { + "epoch": 0.37, + "learning_rate": 9.180755751140207e-05, + "loss": 1.217, + "step": 19220 + }, + { + "epoch": 0.37, + "learning_rate": 9.17992714962945e-05, + "loss": 1.2306, + "step": 19230 + }, + { + "epoch": 0.37, + "learning_rate": 9.179098166729513e-05, + "loss": 1.0566, + "step": 19240 + }, + { + "epoch": 0.37, + "learning_rate": 9.178268802516032e-05, + "loss": 1.3224, + "step": 19250 + }, + { + "epoch": 0.37, + "learning_rate": 9.177439057064683e-05, + "loss": 1.0436, + "step": 19260 + }, + { + "epoch": 0.37, + "learning_rate": 9.176608930451173e-05, + "loss": 1.0848, + "step": 19270 + }, + { + "epoch": 0.37, + "learning_rate": 9.175778422751246e-05, + "loss": 1.2881, + "step": 19280 + }, + { + "epoch": 0.37, + "learning_rate": 9.174947534040681e-05, + "loss": 1.337, + "step": 19290 + }, + { + "epoch": 0.37, + "learning_rate": 9.174116264395289e-05, + "loss": 1.0918, + "step": 19300 + }, + { + "epoch": 0.37, + "learning_rate": 9.173284613890918e-05, + "loss": 1.1272, + "step": 19310 + }, + { + "epoch": 0.37, + "learning_rate": 9.17245258260345e-05, + "loss": 1.2602, + "step": 19320 + }, + { + "epoch": 0.37, + "learning_rate": 9.171620170608803e-05, + "loss": 1.4133, + "step": 19330 + }, + { + "epoch": 0.37, + "learning_rate": 9.17078737798293e-05, + "loss": 1.2353, + "step": 19340 + }, + { + "epoch": 0.37, + "learning_rate": 9.169954204801816e-05, + "loss": 1.4011, + "step": 19350 + }, + { + "epoch": 0.37, + "learning_rate": 9.169120651141481e-05, + "loss": 1.2604, + "step": 19360 + }, + { + "epoch": 0.37, + "learning_rate": 9.168286717077981e-05, + "loss": 1.0883, + "step": 19370 + }, + { + "epoch": 0.37, + "learning_rate": 9.16745240268741e-05, + "loss": 1.3261, + "step": 19380 + }, + { + "epoch": 0.37, + "learning_rate": 9.16661770804589e-05, + "loss": 1.2684, + "step": 19390 + }, + { + "epoch": 0.37, + "learning_rate": 9.165782633229582e-05, + "loss": 1.2597, + "step": 19400 + }, + { + "epoch": 0.37, + "learning_rate": 9.164947178314683e-05, + "loss": 1.1418, + "step": 19410 + }, + { + "epoch": 0.37, + "learning_rate": 9.16411134337742e-05, + "loss": 1.2888, + "step": 19420 + }, + { + "epoch": 0.37, + "learning_rate": 9.163275128494056e-05, + "loss": 0.9184, + "step": 19430 + }, + { + "epoch": 0.37, + "learning_rate": 9.162438533740892e-05, + "loss": 1.2341, + "step": 19440 + }, + { + "epoch": 0.37, + "learning_rate": 9.161601559194261e-05, + "loss": 1.4176, + "step": 19450 + }, + { + "epoch": 0.37, + "learning_rate": 9.16076420493053e-05, + "loss": 1.1862, + "step": 19460 + }, + { + "epoch": 0.37, + "learning_rate": 9.159926471026104e-05, + "loss": 1.4162, + "step": 19470 + }, + { + "epoch": 0.37, + "learning_rate": 9.159088357557417e-05, + "loss": 1.5603, + "step": 19480 + }, + { + "epoch": 0.37, + "learning_rate": 9.158249864600946e-05, + "loss": 1.4133, + "step": 19490 + }, + { + "epoch": 0.37, + "learning_rate": 9.157410992233191e-05, + "loss": 1.3486, + "step": 19500 + }, + { + "epoch": 0.38, + "learning_rate": 9.156571740530699e-05, + "loss": 1.2212, + "step": 19510 + }, + { + "epoch": 0.38, + "learning_rate": 9.155732109570043e-05, + "loss": 1.2289, + "step": 19520 + }, + { + "epoch": 0.38, + "learning_rate": 9.154892099427834e-05, + "loss": 1.0904, + "step": 19530 + }, + { + "epoch": 0.38, + "learning_rate": 9.154051710180718e-05, + "loss": 1.1836, + "step": 19540 + }, + { + "epoch": 0.38, + "learning_rate": 9.153210941905374e-05, + "loss": 1.2065, + "step": 19550 + }, + { + "epoch": 0.38, + "learning_rate": 9.152369794678515e-05, + "loss": 1.3365, + "step": 19560 + }, + { + "epoch": 0.38, + "learning_rate": 9.151528268576892e-05, + "loss": 1.0631, + "step": 19570 + }, + { + "epoch": 0.38, + "learning_rate": 9.150686363677287e-05, + "loss": 1.3591, + "step": 19580 + }, + { + "epoch": 0.38, + "learning_rate": 9.149844080056518e-05, + "loss": 1.4261, + "step": 19590 + }, + { + "epoch": 0.38, + "learning_rate": 9.149001417791438e-05, + "loss": 1.3315, + "step": 19600 + }, + { + "epoch": 0.38, + "learning_rate": 9.148158376958932e-05, + "loss": 1.2509, + "step": 19610 + }, + { + "epoch": 0.38, + "learning_rate": 9.147314957635926e-05, + "loss": 1.366, + "step": 19620 + }, + { + "epoch": 0.38, + "learning_rate": 9.146471159899372e-05, + "loss": 1.2429, + "step": 19630 + }, + { + "epoch": 0.38, + "learning_rate": 9.145626983826264e-05, + "loss": 1.1623, + "step": 19640 + }, + { + "epoch": 0.38, + "learning_rate": 9.144782429493623e-05, + "loss": 1.2967, + "step": 19650 + }, + { + "epoch": 0.38, + "learning_rate": 9.143937496978512e-05, + "loss": 1.0439, + "step": 19660 + }, + { + "epoch": 0.38, + "learning_rate": 9.143092186358026e-05, + "loss": 1.0677, + "step": 19670 + }, + { + "epoch": 0.38, + "learning_rate": 9.14224649770929e-05, + "loss": 1.3888, + "step": 19680 + }, + { + "epoch": 0.38, + "learning_rate": 9.14140043110947e-05, + "loss": 1.2772, + "step": 19690 + }, + { + "epoch": 0.38, + "learning_rate": 9.140553986635763e-05, + "loss": 1.3543, + "step": 19700 + }, + { + "epoch": 0.38, + "learning_rate": 9.139707164365399e-05, + "loss": 1.1133, + "step": 19710 + }, + { + "epoch": 0.38, + "learning_rate": 9.138859964375648e-05, + "loss": 1.37, + "step": 19720 + }, + { + "epoch": 0.38, + "learning_rate": 9.13801238674381e-05, + "loss": 1.1923, + "step": 19730 + }, + { + "epoch": 0.38, + "learning_rate": 9.137164431547221e-05, + "loss": 1.3854, + "step": 19740 + }, + { + "epoch": 0.38, + "learning_rate": 9.136316098863247e-05, + "loss": 1.4615, + "step": 19750 + }, + { + "epoch": 0.38, + "learning_rate": 9.135467388769298e-05, + "loss": 1.2193, + "step": 19760 + }, + { + "epoch": 0.38, + "learning_rate": 9.13461830134281e-05, + "loss": 1.2675, + "step": 19770 + }, + { + "epoch": 0.38, + "learning_rate": 9.133768836661257e-05, + "loss": 1.246, + "step": 19780 + }, + { + "epoch": 0.38, + "learning_rate": 9.132918994802147e-05, + "loss": 1.2972, + "step": 19790 + }, + { + "epoch": 0.38, + "learning_rate": 9.132068775843022e-05, + "loss": 1.2293, + "step": 19800 + }, + { + "epoch": 0.38, + "learning_rate": 9.131218179861456e-05, + "loss": 1.2536, + "step": 19810 + }, + { + "epoch": 0.38, + "learning_rate": 9.130367206935063e-05, + "loss": 1.2778, + "step": 19820 + }, + { + "epoch": 0.38, + "learning_rate": 9.129515857141488e-05, + "loss": 1.2956, + "step": 19830 + }, + { + "epoch": 0.38, + "learning_rate": 9.128664130558411e-05, + "loss": 1.3419, + "step": 19840 + }, + { + "epoch": 0.38, + "learning_rate": 9.127812027263545e-05, + "loss": 1.352, + "step": 19850 + }, + { + "epoch": 0.38, + "learning_rate": 9.126959547334637e-05, + "loss": 1.1594, + "step": 19860 + }, + { + "epoch": 0.38, + "learning_rate": 9.126106690849474e-05, + "loss": 1.3724, + "step": 19870 + }, + { + "epoch": 0.38, + "learning_rate": 9.125253457885869e-05, + "loss": 1.2078, + "step": 19880 + }, + { + "epoch": 0.38, + "learning_rate": 9.124399848521677e-05, + "loss": 1.4347, + "step": 19890 + }, + { + "epoch": 0.38, + "learning_rate": 9.123545862834781e-05, + "loss": 1.2864, + "step": 19900 + }, + { + "epoch": 0.38, + "learning_rate": 9.122691500903104e-05, + "loss": 1.2206, + "step": 19910 + }, + { + "epoch": 0.38, + "learning_rate": 9.121836762804597e-05, + "loss": 1.3752, + "step": 19920 + }, + { + "epoch": 0.38, + "learning_rate": 9.120981648617252e-05, + "loss": 1.108, + "step": 19930 + }, + { + "epoch": 0.38, + "learning_rate": 9.120126158419092e-05, + "loss": 1.266, + "step": 19940 + }, + { + "epoch": 0.38, + "learning_rate": 9.119270292288173e-05, + "loss": 1.3314, + "step": 19950 + }, + { + "epoch": 0.38, + "learning_rate": 9.118414050302588e-05, + "loss": 1.1617, + "step": 19960 + }, + { + "epoch": 0.38, + "learning_rate": 9.117557432540462e-05, + "loss": 1.3017, + "step": 19970 + }, + { + "epoch": 0.38, + "learning_rate": 9.116700439079958e-05, + "loss": 1.2081, + "step": 19980 + }, + { + "epoch": 0.38, + "learning_rate": 9.115843069999266e-05, + "loss": 1.2585, + "step": 19990 + }, + { + "epoch": 0.38, + "learning_rate": 9.114985325376619e-05, + "loss": 1.4547, + "step": 20000 + }, + { + "epoch": 0.38, + "learning_rate": 9.114127205290279e-05, + "loss": 1.3955, + "step": 20010 + }, + { + "epoch": 0.38, + "learning_rate": 9.113268709818543e-05, + "loss": 1.318, + "step": 20020 + }, + { + "epoch": 0.39, + "learning_rate": 9.112409839039742e-05, + "loss": 1.4196, + "step": 20030 + }, + { + "epoch": 0.39, + "learning_rate": 9.111550593032244e-05, + "loss": 1.1473, + "step": 20040 + }, + { + "epoch": 0.39, + "learning_rate": 9.110690971874449e-05, + "loss": 1.3523, + "step": 20050 + }, + { + "epoch": 0.39, + "learning_rate": 9.109830975644788e-05, + "loss": 1.324, + "step": 20060 + }, + { + "epoch": 0.39, + "learning_rate": 9.108970604421736e-05, + "loss": 1.0995, + "step": 20070 + }, + { + "epoch": 0.39, + "learning_rate": 9.10810985828379e-05, + "loss": 1.2547, + "step": 20080 + }, + { + "epoch": 0.39, + "learning_rate": 9.107248737309488e-05, + "loss": 1.3314, + "step": 20090 + }, + { + "epoch": 0.39, + "learning_rate": 9.106387241577405e-05, + "loss": 1.5519, + "step": 20100 + }, + { + "epoch": 0.39, + "learning_rate": 9.105525371166144e-05, + "loss": 1.204, + "step": 20110 + }, + { + "epoch": 0.39, + "learning_rate": 9.104663126154343e-05, + "loss": 1.47, + "step": 20120 + }, + { + "epoch": 0.39, + "learning_rate": 9.103800506620678e-05, + "loss": 1.2855, + "step": 20130 + }, + { + "epoch": 0.39, + "learning_rate": 9.102937512643856e-05, + "loss": 1.0478, + "step": 20140 + }, + { + "epoch": 0.39, + "learning_rate": 9.102074144302622e-05, + "loss": 1.3733, + "step": 20150 + }, + { + "epoch": 0.39, + "learning_rate": 9.101210401675748e-05, + "loss": 1.4146, + "step": 20160 + }, + { + "epoch": 0.39, + "learning_rate": 9.100346284842048e-05, + "loss": 1.2943, + "step": 20170 + }, + { + "epoch": 0.39, + "learning_rate": 9.099481793880362e-05, + "loss": 1.2103, + "step": 20180 + }, + { + "epoch": 0.39, + "learning_rate": 9.098616928869575e-05, + "loss": 1.2752, + "step": 20190 + }, + { + "epoch": 0.39, + "learning_rate": 9.097751689888595e-05, + "loss": 1.1991, + "step": 20200 + }, + { + "epoch": 0.39, + "learning_rate": 9.096886077016371e-05, + "loss": 1.3585, + "step": 20210 + }, + { + "epoch": 0.39, + "learning_rate": 9.096020090331885e-05, + "loss": 1.401, + "step": 20220 + }, + { + "epoch": 0.39, + "learning_rate": 9.09515372991415e-05, + "loss": 1.2516, + "step": 20230 + }, + { + "epoch": 0.39, + "learning_rate": 9.094286995842218e-05, + "loss": 1.2289, + "step": 20240 + }, + { + "epoch": 0.39, + "learning_rate": 9.09341988819517e-05, + "loss": 1.3863, + "step": 20250 + }, + { + "epoch": 0.39, + "learning_rate": 9.092552407052123e-05, + "loss": 1.2974, + "step": 20260 + }, + { + "epoch": 0.39, + "learning_rate": 9.091684552492233e-05, + "loss": 1.3099, + "step": 20270 + }, + { + "epoch": 0.39, + "learning_rate": 9.090816324594682e-05, + "loss": 1.3949, + "step": 20280 + }, + { + "epoch": 0.39, + "learning_rate": 9.08994772343869e-05, + "loss": 1.283, + "step": 20290 + }, + { + "epoch": 0.39, + "learning_rate": 9.089078749103511e-05, + "loss": 1.2604, + "step": 20300 + }, + { + "epoch": 0.39, + "learning_rate": 9.088209401668433e-05, + "loss": 1.3067, + "step": 20310 + }, + { + "epoch": 0.39, + "learning_rate": 9.087339681212779e-05, + "loss": 1.299, + "step": 20320 + }, + { + "epoch": 0.39, + "learning_rate": 9.086469587815904e-05, + "loss": 1.4764, + "step": 20330 + }, + { + "epoch": 0.39, + "learning_rate": 9.085599121557197e-05, + "loss": 1.4707, + "step": 20340 + }, + { + "epoch": 0.39, + "learning_rate": 9.084728282516084e-05, + "loss": 1.0965, + "step": 20350 + }, + { + "epoch": 0.39, + "learning_rate": 9.083857070772019e-05, + "loss": 1.3065, + "step": 20360 + }, + { + "epoch": 0.39, + "learning_rate": 9.082985486404501e-05, + "loss": 1.2415, + "step": 20370 + }, + { + "epoch": 0.39, + "learning_rate": 9.082113529493048e-05, + "loss": 1.1175, + "step": 20380 + }, + { + "epoch": 0.39, + "learning_rate": 9.081241200117227e-05, + "loss": 1.244, + "step": 20390 + }, + { + "epoch": 0.39, + "learning_rate": 9.080368498356628e-05, + "loss": 1.2925, + "step": 20400 + }, + { + "epoch": 0.39, + "learning_rate": 9.079495424290878e-05, + "loss": 1.3885, + "step": 20410 + }, + { + "epoch": 0.39, + "learning_rate": 9.078621977999642e-05, + "loss": 1.1691, + "step": 20420 + }, + { + "epoch": 0.39, + "learning_rate": 9.077748159562613e-05, + "loss": 1.4151, + "step": 20430 + }, + { + "epoch": 0.39, + "learning_rate": 9.076873969059526e-05, + "loss": 1.4083, + "step": 20440 + }, + { + "epoch": 0.39, + "learning_rate": 9.075999406570137e-05, + "loss": 1.2528, + "step": 20450 + }, + { + "epoch": 0.39, + "learning_rate": 9.07512447217425e-05, + "loss": 1.2137, + "step": 20460 + }, + { + "epoch": 0.39, + "learning_rate": 9.074249165951694e-05, + "loss": 1.3431, + "step": 20470 + }, + { + "epoch": 0.39, + "learning_rate": 9.073373487982335e-05, + "loss": 1.4769, + "step": 20480 + }, + { + "epoch": 0.39, + "learning_rate": 9.072497438346072e-05, + "loss": 1.2392, + "step": 20490 + }, + { + "epoch": 0.39, + "learning_rate": 9.07162101712284e-05, + "loss": 1.2963, + "step": 20500 + }, + { + "epoch": 0.39, + "learning_rate": 9.070744224392606e-05, + "loss": 1.1272, + "step": 20510 + }, + { + "epoch": 0.39, + "learning_rate": 9.06986706023537e-05, + "loss": 1.3848, + "step": 20520 + }, + { + "epoch": 0.39, + "learning_rate": 9.068989524731168e-05, + "loss": 1.4085, + "step": 20530 + }, + { + "epoch": 0.39, + "learning_rate": 9.068111617960067e-05, + "loss": 1.2047, + "step": 20540 + }, + { + "epoch": 0.4, + "learning_rate": 9.067233340002173e-05, + "loss": 1.3008, + "step": 20550 + }, + { + "epoch": 0.4, + "learning_rate": 9.066354690937622e-05, + "loss": 1.3661, + "step": 20560 + }, + { + "epoch": 0.4, + "learning_rate": 9.065475670846582e-05, + "loss": 1.2619, + "step": 20570 + }, + { + "epoch": 0.4, + "learning_rate": 9.06459627980926e-05, + "loss": 1.1163, + "step": 20580 + }, + { + "epoch": 0.4, + "learning_rate": 9.063716517905894e-05, + "loss": 0.9725, + "step": 20590 + }, + { + "epoch": 0.4, + "learning_rate": 9.062836385216755e-05, + "loss": 1.2133, + "step": 20600 + }, + { + "epoch": 0.4, + "learning_rate": 9.061955881822151e-05, + "loss": 0.9211, + "step": 20610 + }, + { + "epoch": 0.4, + "learning_rate": 9.061075007802419e-05, + "loss": 1.4721, + "step": 20620 + }, + { + "epoch": 0.4, + "learning_rate": 9.060193763237934e-05, + "loss": 1.3133, + "step": 20630 + }, + { + "epoch": 0.4, + "learning_rate": 9.059312148209105e-05, + "loss": 1.5812, + "step": 20640 + }, + { + "epoch": 0.4, + "learning_rate": 9.058430162796371e-05, + "loss": 1.28, + "step": 20650 + }, + { + "epoch": 0.4, + "learning_rate": 9.057547807080208e-05, + "loss": 1.4741, + "step": 20660 + }, + { + "epoch": 0.4, + "learning_rate": 9.056665081141125e-05, + "loss": 1.2443, + "step": 20670 + }, + { + "epoch": 0.4, + "learning_rate": 9.055781985059663e-05, + "loss": 1.0663, + "step": 20680 + }, + { + "epoch": 0.4, + "learning_rate": 9.054898518916399e-05, + "loss": 1.298, + "step": 20690 + }, + { + "epoch": 0.4, + "learning_rate": 9.054014682791945e-05, + "loss": 1.2759, + "step": 20700 + }, + { + "epoch": 0.4, + "learning_rate": 9.053130476766943e-05, + "loss": 1.3189, + "step": 20710 + }, + { + "epoch": 0.4, + "learning_rate": 9.05224590092207e-05, + "loss": 1.3413, + "step": 20720 + }, + { + "epoch": 0.4, + "learning_rate": 9.05136095533804e-05, + "loss": 1.2042, + "step": 20730 + }, + { + "epoch": 0.4, + "learning_rate": 9.050475640095598e-05, + "loss": 1.4885, + "step": 20740 + }, + { + "epoch": 0.4, + "learning_rate": 9.049589955275518e-05, + "loss": 1.6309, + "step": 20750 + }, + { + "epoch": 0.4, + "learning_rate": 9.048703900958617e-05, + "loss": 1.4646, + "step": 20760 + }, + { + "epoch": 0.4, + "learning_rate": 9.047817477225741e-05, + "loss": 1.3543, + "step": 20770 + }, + { + "epoch": 0.4, + "learning_rate": 9.04693068415777e-05, + "loss": 1.3609, + "step": 20780 + }, + { + "epoch": 0.4, + "learning_rate": 9.046043521835617e-05, + "loss": 1.3234, + "step": 20790 + }, + { + "epoch": 0.4, + "learning_rate": 9.045155990340227e-05, + "loss": 1.4644, + "step": 20800 + }, + { + "epoch": 0.4, + "learning_rate": 9.044268089752586e-05, + "loss": 1.2933, + "step": 20810 + }, + { + "epoch": 0.4, + "learning_rate": 9.043379820153703e-05, + "loss": 1.5008, + "step": 20820 + }, + { + "epoch": 0.4, + "learning_rate": 9.042491181624633e-05, + "loss": 1.3722, + "step": 20830 + }, + { + "epoch": 0.4, + "learning_rate": 9.04160217424645e-05, + "loss": 1.1812, + "step": 20840 + }, + { + "epoch": 0.4, + "learning_rate": 9.040712798100279e-05, + "loss": 1.3886, + "step": 20850 + }, + { + "epoch": 0.4, + "learning_rate": 9.039823053267262e-05, + "loss": 1.3184, + "step": 20860 + }, + { + "epoch": 0.4, + "learning_rate": 9.038932939828586e-05, + "loss": 1.2823, + "step": 20870 + }, + { + "epoch": 0.4, + "learning_rate": 9.038042457865465e-05, + "loss": 1.1431, + "step": 20880 + }, + { + "epoch": 0.4, + "learning_rate": 9.037151607459151e-05, + "loss": 1.3602, + "step": 20890 + }, + { + "epoch": 0.4, + "learning_rate": 9.036260388690927e-05, + "loss": 1.2437, + "step": 20900 + }, + { + "epoch": 0.4, + "learning_rate": 9.035368801642112e-05, + "loss": 1.359, + "step": 20910 + }, + { + "epoch": 0.4, + "learning_rate": 9.034476846394055e-05, + "loss": 1.2629, + "step": 20920 + }, + { + "epoch": 0.4, + "learning_rate": 9.033584523028142e-05, + "loss": 1.394, + "step": 20930 + }, + { + "epoch": 0.4, + "learning_rate": 9.032691831625792e-05, + "loss": 1.2364, + "step": 20940 + }, + { + "epoch": 0.4, + "learning_rate": 9.031798772268455e-05, + "loss": 1.2808, + "step": 20950 + }, + { + "epoch": 0.4, + "learning_rate": 9.030905345037617e-05, + "loss": 1.1947, + "step": 20960 + }, + { + "epoch": 0.4, + "learning_rate": 9.030011550014798e-05, + "loss": 1.4801, + "step": 20970 + }, + { + "epoch": 0.4, + "learning_rate": 9.02911738728155e-05, + "loss": 1.2582, + "step": 20980 + }, + { + "epoch": 0.4, + "learning_rate": 9.028222856919458e-05, + "loss": 1.2728, + "step": 20990 + }, + { + "epoch": 0.4, + "learning_rate": 9.027327959010142e-05, + "loss": 1.3302, + "step": 21000 + }, + { + "epoch": 0.4, + "learning_rate": 9.026432693635257e-05, + "loss": 1.2725, + "step": 21010 + }, + { + "epoch": 0.4, + "learning_rate": 9.025537060876488e-05, + "loss": 1.1886, + "step": 21020 + }, + { + "epoch": 0.4, + "learning_rate": 9.024641060815557e-05, + "loss": 1.4478, + "step": 21030 + }, + { + "epoch": 0.4, + "learning_rate": 9.023744693534215e-05, + "loss": 1.2868, + "step": 21040 + }, + { + "epoch": 0.4, + "learning_rate": 9.02284795911425e-05, + "loss": 1.2076, + "step": 21050 + }, + { + "epoch": 0.4, + "learning_rate": 9.021950857637486e-05, + "loss": 1.3483, + "step": 21060 + }, + { + "epoch": 0.41, + "learning_rate": 9.021053389185773e-05, + "loss": 1.4153, + "step": 21070 + }, + { + "epoch": 0.41, + "learning_rate": 9.020155553841e-05, + "loss": 1.1559, + "step": 21080 + }, + { + "epoch": 0.41, + "learning_rate": 9.01925735168509e-05, + "loss": 1.4696, + "step": 21090 + }, + { + "epoch": 0.41, + "learning_rate": 9.018358782799995e-05, + "loss": 1.3476, + "step": 21100 + }, + { + "epoch": 0.41, + "learning_rate": 9.017459847267708e-05, + "loss": 1.3061, + "step": 21110 + }, + { + "epoch": 0.41, + "learning_rate": 9.016560545170243e-05, + "loss": 1.2134, + "step": 21120 + }, + { + "epoch": 0.41, + "learning_rate": 9.015660876589662e-05, + "loss": 1.3707, + "step": 21130 + }, + { + "epoch": 0.41, + "learning_rate": 9.01476084160805e-05, + "loss": 1.4401, + "step": 21140 + }, + { + "epoch": 0.41, + "learning_rate": 9.013860440307529e-05, + "loss": 1.3131, + "step": 21150 + }, + { + "epoch": 0.41, + "learning_rate": 9.012959672770255e-05, + "loss": 1.4556, + "step": 21160 + }, + { + "epoch": 0.41, + "learning_rate": 9.012058539078416e-05, + "loss": 1.3812, + "step": 21170 + }, + { + "epoch": 0.41, + "learning_rate": 9.011157039314235e-05, + "loss": 1.5042, + "step": 21180 + }, + { + "epoch": 0.41, + "learning_rate": 9.010255173559967e-05, + "loss": 1.4034, + "step": 21190 + }, + { + "epoch": 0.41, + "learning_rate": 9.009352941897903e-05, + "loss": 1.077, + "step": 21200 + }, + { + "epoch": 0.41, + "learning_rate": 9.008450344410361e-05, + "loss": 1.3458, + "step": 21210 + }, + { + "epoch": 0.41, + "learning_rate": 9.007547381179703e-05, + "loss": 1.3218, + "step": 21220 + }, + { + "epoch": 0.41, + "learning_rate": 9.006644052288312e-05, + "loss": 1.5008, + "step": 21230 + }, + { + "epoch": 0.41, + "learning_rate": 9.005740357818612e-05, + "loss": 1.3053, + "step": 21240 + }, + { + "epoch": 0.41, + "learning_rate": 9.004836297853063e-05, + "loss": 1.3624, + "step": 21250 + }, + { + "epoch": 0.41, + "learning_rate": 9.003931872474149e-05, + "loss": 1.4755, + "step": 21260 + }, + { + "epoch": 0.41, + "learning_rate": 9.003027081764395e-05, + "loss": 1.3678, + "step": 21270 + }, + { + "epoch": 0.41, + "learning_rate": 9.002121925806355e-05, + "loss": 1.3631, + "step": 21280 + }, + { + "epoch": 0.41, + "learning_rate": 9.00121640468262e-05, + "loss": 1.1419, + "step": 21290 + }, + { + "epoch": 0.41, + "learning_rate": 9.000310518475812e-05, + "loss": 1.1803, + "step": 21300 + }, + { + "epoch": 0.41, + "learning_rate": 8.999404267268588e-05, + "loss": 1.3218, + "step": 21310 + }, + { + "epoch": 0.41, + "learning_rate": 8.998497651143634e-05, + "loss": 1.3041, + "step": 21320 + }, + { + "epoch": 0.41, + "learning_rate": 8.997590670183673e-05, + "loss": 1.3191, + "step": 21330 + }, + { + "epoch": 0.41, + "learning_rate": 8.996683324471464e-05, + "loss": 1.1343, + "step": 21340 + }, + { + "epoch": 0.41, + "learning_rate": 8.995775614089795e-05, + "loss": 1.3106, + "step": 21350 + }, + { + "epoch": 0.41, + "learning_rate": 8.994867539121484e-05, + "loss": 1.2002, + "step": 21360 + }, + { + "epoch": 0.41, + "learning_rate": 8.993959099649391e-05, + "loss": 1.4418, + "step": 21370 + }, + { + "epoch": 0.41, + "learning_rate": 8.993050295756404e-05, + "loss": 1.3346, + "step": 21380 + }, + { + "epoch": 0.41, + "learning_rate": 8.992141127525443e-05, + "loss": 1.3023, + "step": 21390 + }, + { + "epoch": 0.41, + "learning_rate": 8.991231595039465e-05, + "loss": 1.2754, + "step": 21400 + }, + { + "epoch": 0.41, + "learning_rate": 8.990321698381459e-05, + "loss": 1.4973, + "step": 21410 + }, + { + "epoch": 0.41, + "learning_rate": 8.989411437634445e-05, + "loss": 1.3964, + "step": 21420 + }, + { + "epoch": 0.41, + "learning_rate": 8.988500812881478e-05, + "loss": 1.2517, + "step": 21430 + }, + { + "epoch": 0.41, + "learning_rate": 8.987589824205649e-05, + "loss": 1.1416, + "step": 21440 + }, + { + "epoch": 0.41, + "learning_rate": 8.986678471690075e-05, + "loss": 1.3243, + "step": 21450 + }, + { + "epoch": 0.41, + "learning_rate": 8.985766755417915e-05, + "loss": 1.2148, + "step": 21460 + }, + { + "epoch": 0.41, + "learning_rate": 8.984854675472351e-05, + "loss": 1.3652, + "step": 21470 + }, + { + "epoch": 0.41, + "learning_rate": 8.98394223193661e-05, + "loss": 1.3323, + "step": 21480 + }, + { + "epoch": 0.41, + "learning_rate": 8.983029424893945e-05, + "loss": 1.2251, + "step": 21490 + }, + { + "epoch": 0.41, + "learning_rate": 8.98211625442764e-05, + "loss": 1.1773, + "step": 21500 + }, + { + "epoch": 0.41, + "learning_rate": 8.981202720621019e-05, + "loss": 1.1245, + "step": 21510 + }, + { + "epoch": 0.41, + "learning_rate": 8.980288823557432e-05, + "loss": 1.2081, + "step": 21520 + }, + { + "epoch": 0.41, + "learning_rate": 8.979374563320267e-05, + "loss": 1.1515, + "step": 21530 + }, + { + "epoch": 0.41, + "learning_rate": 8.978459939992946e-05, + "loss": 1.2431, + "step": 21540 + }, + { + "epoch": 0.41, + "learning_rate": 8.97754495365892e-05, + "loss": 1.1934, + "step": 21550 + }, + { + "epoch": 0.41, + "learning_rate": 8.976629604401677e-05, + "loss": 1.1427, + "step": 21560 + }, + { + "epoch": 0.41, + "learning_rate": 8.975713892304733e-05, + "loss": 1.3095, + "step": 21570 + }, + { + "epoch": 0.41, + "learning_rate": 8.974797817451642e-05, + "loss": 1.2245, + "step": 21580 + }, + { + "epoch": 0.42, + "learning_rate": 8.97388137992599e-05, + "loss": 1.0905, + "step": 21590 + }, + { + "epoch": 0.42, + "learning_rate": 8.972964579811395e-05, + "loss": 1.473, + "step": 21600 + }, + { + "epoch": 0.42, + "learning_rate": 8.972047417191511e-05, + "loss": 1.2342, + "step": 21610 + }, + { + "epoch": 0.42, + "learning_rate": 8.971129892150019e-05, + "loss": 1.2303, + "step": 21620 + }, + { + "epoch": 0.42, + "learning_rate": 8.970212004770637e-05, + "loss": 1.4936, + "step": 21630 + }, + { + "epoch": 0.42, + "learning_rate": 8.969293755137118e-05, + "loss": 1.146, + "step": 21640 + }, + { + "epoch": 0.42, + "learning_rate": 8.968375143333246e-05, + "loss": 1.4262, + "step": 21650 + }, + { + "epoch": 0.42, + "learning_rate": 8.967456169442835e-05, + "loss": 1.3256, + "step": 21660 + }, + { + "epoch": 0.42, + "learning_rate": 8.966536833549737e-05, + "loss": 1.5495, + "step": 21670 + }, + { + "epoch": 0.42, + "learning_rate": 8.965617135737834e-05, + "loss": 1.3995, + "step": 21680 + }, + { + "epoch": 0.42, + "learning_rate": 8.964697076091045e-05, + "loss": 1.2397, + "step": 21690 + }, + { + "epoch": 0.42, + "learning_rate": 8.963776654693314e-05, + "loss": 1.2213, + "step": 21700 + }, + { + "epoch": 0.42, + "learning_rate": 8.962855871628628e-05, + "loss": 1.3756, + "step": 21710 + }, + { + "epoch": 0.42, + "learning_rate": 8.961934726980999e-05, + "loss": 1.042, + "step": 21720 + }, + { + "epoch": 0.42, + "learning_rate": 8.961013220834477e-05, + "loss": 1.3547, + "step": 21730 + }, + { + "epoch": 0.42, + "learning_rate": 8.960091353273142e-05, + "loss": 1.0708, + "step": 21740 + }, + { + "epoch": 0.42, + "learning_rate": 8.959169124381105e-05, + "loss": 1.0841, + "step": 21750 + }, + { + "epoch": 0.42, + "learning_rate": 8.958246534242518e-05, + "loss": 1.2466, + "step": 21760 + }, + { + "epoch": 0.42, + "learning_rate": 8.957323582941557e-05, + "loss": 1.3134, + "step": 21770 + }, + { + "epoch": 0.42, + "learning_rate": 8.956400270562438e-05, + "loss": 1.3125, + "step": 21780 + }, + { + "epoch": 0.42, + "learning_rate": 8.955476597189406e-05, + "loss": 1.2383, + "step": 21790 + }, + { + "epoch": 0.42, + "learning_rate": 8.954552562906737e-05, + "loss": 1.2097, + "step": 21800 + }, + { + "epoch": 0.42, + "learning_rate": 8.953628167798747e-05, + "loss": 1.2633, + "step": 21810 + }, + { + "epoch": 0.42, + "learning_rate": 8.952703411949777e-05, + "loss": 1.3761, + "step": 21820 + }, + { + "epoch": 0.42, + "learning_rate": 8.951778295444206e-05, + "loss": 1.3495, + "step": 21830 + }, + { + "epoch": 0.42, + "learning_rate": 8.950852818366445e-05, + "loss": 1.1768, + "step": 21840 + }, + { + "epoch": 0.42, + "learning_rate": 8.949926980800935e-05, + "loss": 1.2767, + "step": 21850 + }, + { + "epoch": 0.42, + "learning_rate": 8.949000782832155e-05, + "loss": 1.0537, + "step": 21860 + }, + { + "epoch": 0.42, + "learning_rate": 8.948074224544614e-05, + "loss": 1.2656, + "step": 21870 + }, + { + "epoch": 0.42, + "learning_rate": 8.947147306022852e-05, + "loss": 1.2311, + "step": 21880 + }, + { + "epoch": 0.42, + "learning_rate": 8.946220027351445e-05, + "loss": 1.3701, + "step": 21890 + }, + { + "epoch": 0.42, + "learning_rate": 8.945292388615001e-05, + "loss": 1.3113, + "step": 21900 + }, + { + "epoch": 0.42, + "learning_rate": 8.944364389898158e-05, + "loss": 1.548, + "step": 21910 + }, + { + "epoch": 0.42, + "learning_rate": 8.943436031285594e-05, + "loss": 1.1314, + "step": 21920 + }, + { + "epoch": 0.42, + "learning_rate": 8.942507312862012e-05, + "loss": 1.1341, + "step": 21930 + }, + { + "epoch": 0.42, + "learning_rate": 8.941578234712152e-05, + "loss": 1.3171, + "step": 21940 + }, + { + "epoch": 0.42, + "learning_rate": 8.940648796920784e-05, + "loss": 1.1372, + "step": 21950 + }, + { + "epoch": 0.42, + "learning_rate": 8.939718999572714e-05, + "loss": 1.2167, + "step": 21960 + }, + { + "epoch": 0.42, + "learning_rate": 8.938788842752784e-05, + "loss": 1.3607, + "step": 21970 + }, + { + "epoch": 0.42, + "learning_rate": 8.937858326545857e-05, + "loss": 1.2811, + "step": 21980 + }, + { + "epoch": 0.42, + "learning_rate": 8.936927451036841e-05, + "loss": 1.2619, + "step": 21990 + }, + { + "epoch": 0.42, + "learning_rate": 8.93599621631067e-05, + "loss": 1.3984, + "step": 22000 + }, + { + "epoch": 0.42, + "learning_rate": 8.93506462245231e-05, + "loss": 1.1479, + "step": 22010 + }, + { + "epoch": 0.42, + "learning_rate": 8.934132669546769e-05, + "loss": 1.1322, + "step": 22020 + }, + { + "epoch": 0.42, + "learning_rate": 8.933200357679075e-05, + "loss": 1.0771, + "step": 22030 + }, + { + "epoch": 0.42, + "learning_rate": 8.932267686934299e-05, + "loss": 1.2705, + "step": 22040 + }, + { + "epoch": 0.42, + "learning_rate": 8.931334657397539e-05, + "loss": 1.0712, + "step": 22050 + }, + { + "epoch": 0.42, + "learning_rate": 8.930401269153928e-05, + "loss": 1.3846, + "step": 22060 + }, + { + "epoch": 0.42, + "learning_rate": 8.92946752228863e-05, + "loss": 1.0875, + "step": 22070 + }, + { + "epoch": 0.42, + "learning_rate": 8.928533416886844e-05, + "loss": 1.2723, + "step": 22080 + }, + { + "epoch": 0.42, + "learning_rate": 8.9275989530338e-05, + "loss": 1.334, + "step": 22090 + }, + { + "epoch": 0.42, + "learning_rate": 8.926664130814761e-05, + "loss": 1.1721, + "step": 22100 + }, + { + "epoch": 0.43, + "learning_rate": 8.925728950315026e-05, + "loss": 1.2566, + "step": 22110 + }, + { + "epoch": 0.43, + "learning_rate": 8.92479341161992e-05, + "loss": 1.3477, + "step": 22120 + }, + { + "epoch": 0.43, + "learning_rate": 8.923857514814804e-05, + "loss": 1.332, + "step": 22130 + }, + { + "epoch": 0.43, + "learning_rate": 8.922921259985075e-05, + "loss": 1.2383, + "step": 22140 + }, + { + "epoch": 0.43, + "learning_rate": 8.92198464721616e-05, + "loss": 1.1081, + "step": 22150 + }, + { + "epoch": 0.43, + "learning_rate": 8.921047676593514e-05, + "loss": 1.1657, + "step": 22160 + }, + { + "epoch": 0.43, + "learning_rate": 8.920110348202635e-05, + "loss": 1.1711, + "step": 22170 + }, + { + "epoch": 0.43, + "learning_rate": 8.919172662129042e-05, + "loss": 1.2467, + "step": 22180 + }, + { + "epoch": 0.43, + "learning_rate": 8.918234618458294e-05, + "loss": 1.1162, + "step": 22190 + }, + { + "epoch": 0.43, + "learning_rate": 8.917296217275985e-05, + "loss": 1.2301, + "step": 22200 + }, + { + "epoch": 0.43, + "learning_rate": 8.916357458667732e-05, + "loss": 1.3358, + "step": 22210 + }, + { + "epoch": 0.43, + "learning_rate": 8.915418342719193e-05, + "loss": 1.1441, + "step": 22220 + }, + { + "epoch": 0.43, + "learning_rate": 8.914478869516056e-05, + "loss": 1.1867, + "step": 22230 + }, + { + "epoch": 0.43, + "learning_rate": 8.91353903914404e-05, + "loss": 1.2155, + "step": 22240 + }, + { + "epoch": 0.43, + "learning_rate": 8.912598851688898e-05, + "loss": 1.3128, + "step": 22250 + }, + { + "epoch": 0.43, + "learning_rate": 8.911658307236417e-05, + "loss": 1.2874, + "step": 22260 + }, + { + "epoch": 0.43, + "learning_rate": 8.910717405872415e-05, + "loss": 1.336, + "step": 22270 + }, + { + "epoch": 0.43, + "learning_rate": 8.90977614768274e-05, + "loss": 1.1446, + "step": 22280 + }, + { + "epoch": 0.43, + "learning_rate": 8.908834532753279e-05, + "loss": 1.0065, + "step": 22290 + }, + { + "epoch": 0.43, + "learning_rate": 8.907892561169946e-05, + "loss": 1.0934, + "step": 22300 + }, + { + "epoch": 0.43, + "learning_rate": 8.906950233018687e-05, + "loss": 1.2727, + "step": 22310 + }, + { + "epoch": 0.43, + "learning_rate": 8.906007548385488e-05, + "loss": 1.0686, + "step": 22320 + }, + { + "epoch": 0.43, + "learning_rate": 8.905064507356357e-05, + "loss": 1.3194, + "step": 22330 + }, + { + "epoch": 0.43, + "learning_rate": 8.904121110017345e-05, + "loss": 1.2063, + "step": 22340 + }, + { + "epoch": 0.43, + "learning_rate": 8.903177356454526e-05, + "loss": 1.2497, + "step": 22350 + }, + { + "epoch": 0.43, + "learning_rate": 8.902233246754015e-05, + "loss": 1.1947, + "step": 22360 + }, + { + "epoch": 0.43, + "learning_rate": 8.90128878100195e-05, + "loss": 1.3794, + "step": 22370 + }, + { + "epoch": 0.43, + "learning_rate": 8.900343959284515e-05, + "loss": 1.3253, + "step": 22380 + }, + { + "epoch": 0.43, + "learning_rate": 8.899398781687908e-05, + "loss": 1.4376, + "step": 22390 + }, + { + "epoch": 0.43, + "learning_rate": 8.89845324829838e-05, + "loss": 1.2154, + "step": 22400 + }, + { + "epoch": 0.43, + "learning_rate": 8.897507359202197e-05, + "loss": 1.2786, + "step": 22410 + }, + { + "epoch": 0.43, + "learning_rate": 8.896561114485669e-05, + "loss": 1.3624, + "step": 22420 + }, + { + "epoch": 0.43, + "learning_rate": 8.895614514235131e-05, + "loss": 1.3831, + "step": 22430 + }, + { + "epoch": 0.43, + "learning_rate": 8.894667558536956e-05, + "loss": 1.253, + "step": 22440 + }, + { + "epoch": 0.43, + "learning_rate": 8.893720247477548e-05, + "loss": 1.2499, + "step": 22450 + }, + { + "epoch": 0.43, + "learning_rate": 8.89277258114334e-05, + "loss": 1.3783, + "step": 22460 + }, + { + "epoch": 0.43, + "learning_rate": 8.891824559620801e-05, + "loss": 1.3984, + "step": 22470 + }, + { + "epoch": 0.43, + "learning_rate": 8.89087618299643e-05, + "loss": 1.3286, + "step": 22480 + }, + { + "epoch": 0.43, + "learning_rate": 8.889927451356763e-05, + "loss": 1.3391, + "step": 22490 + }, + { + "epoch": 0.43, + "learning_rate": 8.888978364788363e-05, + "loss": 1.1588, + "step": 22500 + }, + { + "epoch": 0.43, + "learning_rate": 8.888028923377827e-05, + "loss": 1.4793, + "step": 22510 + }, + { + "epoch": 0.43, + "learning_rate": 8.887079127211786e-05, + "loss": 1.1875, + "step": 22520 + }, + { + "epoch": 0.43, + "learning_rate": 8.886128976376901e-05, + "loss": 1.3139, + "step": 22530 + }, + { + "epoch": 0.43, + "learning_rate": 8.88517847095987e-05, + "loss": 1.1123, + "step": 22540 + }, + { + "epoch": 0.43, + "learning_rate": 8.884227611047415e-05, + "loss": 1.2371, + "step": 22550 + }, + { + "epoch": 0.43, + "learning_rate": 8.883276396726299e-05, + "loss": 1.2583, + "step": 22560 + }, + { + "epoch": 0.43, + "learning_rate": 8.882324828083312e-05, + "loss": 1.4052, + "step": 22570 + }, + { + "epoch": 0.43, + "learning_rate": 8.88137290520528e-05, + "loss": 1.224, + "step": 22580 + }, + { + "epoch": 0.43, + "learning_rate": 8.880420628179056e-05, + "loss": 1.216, + "step": 22590 + }, + { + "epoch": 0.43, + "learning_rate": 8.879467997091531e-05, + "loss": 1.0818, + "step": 22600 + }, + { + "epoch": 0.43, + "learning_rate": 8.878515012029626e-05, + "loss": 1.4376, + "step": 22610 + }, + { + "epoch": 0.43, + "learning_rate": 8.877561673080293e-05, + "loss": 1.259, + "step": 22620 + }, + { + "epoch": 0.44, + "learning_rate": 8.87660798033052e-05, + "loss": 1.328, + "step": 22630 + }, + { + "epoch": 0.44, + "learning_rate": 8.875653933867321e-05, + "loss": 1.2694, + "step": 22640 + }, + { + "epoch": 0.44, + "learning_rate": 8.874699533777748e-05, + "loss": 1.2843, + "step": 22650 + }, + { + "epoch": 0.44, + "learning_rate": 8.873744780148884e-05, + "loss": 1.3297, + "step": 22660 + }, + { + "epoch": 0.44, + "learning_rate": 8.872789673067843e-05, + "loss": 1.2643, + "step": 22670 + }, + { + "epoch": 0.44, + "learning_rate": 8.871834212621772e-05, + "loss": 1.3479, + "step": 22680 + }, + { + "epoch": 0.44, + "learning_rate": 8.87087839889785e-05, + "loss": 1.1739, + "step": 22690 + }, + { + "epoch": 0.44, + "learning_rate": 8.869922231983287e-05, + "loss": 1.247, + "step": 22700 + }, + { + "epoch": 0.44, + "learning_rate": 8.868965711965332e-05, + "loss": 1.1796, + "step": 22710 + }, + { + "epoch": 0.44, + "learning_rate": 8.868008838931252e-05, + "loss": 1.6035, + "step": 22720 + }, + { + "epoch": 0.44, + "learning_rate": 8.867051612968362e-05, + "loss": 1.4405, + "step": 22730 + }, + { + "epoch": 0.44, + "learning_rate": 8.866094034163998e-05, + "loss": 1.3115, + "step": 22740 + }, + { + "epoch": 0.44, + "learning_rate": 8.865136102605535e-05, + "loss": 1.1976, + "step": 22750 + }, + { + "epoch": 0.44, + "learning_rate": 8.864177818380378e-05, + "loss": 1.3366, + "step": 22760 + }, + { + "epoch": 0.44, + "learning_rate": 8.863219181575961e-05, + "loss": 1.2898, + "step": 22770 + }, + { + "epoch": 0.44, + "learning_rate": 8.862260192279757e-05, + "loss": 1.4552, + "step": 22780 + }, + { + "epoch": 0.44, + "learning_rate": 8.861300850579261e-05, + "loss": 1.2881, + "step": 22790 + }, + { + "epoch": 0.44, + "learning_rate": 8.860341156562012e-05, + "loss": 1.4083, + "step": 22800 + }, + { + "epoch": 0.44, + "learning_rate": 8.859381110315572e-05, + "loss": 1.2931, + "step": 22810 + }, + { + "epoch": 0.44, + "learning_rate": 8.85842071192754e-05, + "loss": 1.2471, + "step": 22820 + }, + { + "epoch": 0.44, + "learning_rate": 8.857459961485546e-05, + "loss": 1.3725, + "step": 22830 + }, + { + "epoch": 0.44, + "learning_rate": 8.856498859077252e-05, + "loss": 1.2849, + "step": 22840 + }, + { + "epoch": 0.44, + "learning_rate": 8.855537404790349e-05, + "loss": 1.3101, + "step": 22850 + }, + { + "epoch": 0.44, + "learning_rate": 8.854575598712564e-05, + "loss": 1.2674, + "step": 22860 + }, + { + "epoch": 0.44, + "learning_rate": 8.853613440931658e-05, + "loss": 1.3122, + "step": 22870 + }, + { + "epoch": 0.44, + "learning_rate": 8.85265093153542e-05, + "loss": 1.3803, + "step": 22880 + }, + { + "epoch": 0.44, + "learning_rate": 8.85168807061167e-05, + "loss": 1.2958, + "step": 22890 + }, + { + "epoch": 0.44, + "learning_rate": 8.850724858248264e-05, + "loss": 1.3293, + "step": 22900 + }, + { + "epoch": 0.44, + "learning_rate": 8.849761294533087e-05, + "loss": 1.3776, + "step": 22910 + }, + { + "epoch": 0.44, + "learning_rate": 8.848797379554062e-05, + "loss": 1.1595, + "step": 22920 + }, + { + "epoch": 0.44, + "learning_rate": 8.847833113399134e-05, + "loss": 1.1645, + "step": 22930 + }, + { + "epoch": 0.44, + "learning_rate": 8.846868496156287e-05, + "loss": 1.3574, + "step": 22940 + }, + { + "epoch": 0.44, + "learning_rate": 8.845903527913537e-05, + "loss": 1.3097, + "step": 22950 + }, + { + "epoch": 0.44, + "learning_rate": 8.84493820875893e-05, + "loss": 1.1649, + "step": 22960 + }, + { + "epoch": 0.44, + "learning_rate": 8.843972538780546e-05, + "loss": 1.2799, + "step": 22970 + }, + { + "epoch": 0.44, + "learning_rate": 8.843006518066493e-05, + "loss": 1.2892, + "step": 22980 + }, + { + "epoch": 0.44, + "learning_rate": 8.842040146704915e-05, + "loss": 1.6626, + "step": 22990 + }, + { + "epoch": 0.44, + "learning_rate": 8.841073424783987e-05, + "loss": 1.1009, + "step": 23000 + }, + { + "epoch": 0.44, + "learning_rate": 8.840106352391915e-05, + "loss": 1.2724, + "step": 23010 + }, + { + "epoch": 0.44, + "learning_rate": 8.839138929616939e-05, + "loss": 1.5149, + "step": 23020 + }, + { + "epoch": 0.44, + "learning_rate": 8.838171156547327e-05, + "loss": 1.3218, + "step": 23030 + }, + { + "epoch": 0.44, + "learning_rate": 8.837203033271384e-05, + "loss": 1.235, + "step": 23040 + }, + { + "epoch": 0.44, + "learning_rate": 8.836234559877442e-05, + "loss": 1.3536, + "step": 23050 + }, + { + "epoch": 0.44, + "learning_rate": 8.83526573645387e-05, + "loss": 1.4914, + "step": 23060 + }, + { + "epoch": 0.44, + "learning_rate": 8.834296563089064e-05, + "loss": 1.1581, + "step": 23070 + }, + { + "epoch": 0.44, + "learning_rate": 8.833327039871455e-05, + "loss": 1.2058, + "step": 23080 + }, + { + "epoch": 0.44, + "learning_rate": 8.832357166889507e-05, + "loss": 1.4767, + "step": 23090 + }, + { + "epoch": 0.44, + "learning_rate": 8.831386944231714e-05, + "loss": 1.4766, + "step": 23100 + }, + { + "epoch": 0.44, + "learning_rate": 8.830416371986599e-05, + "loss": 1.1972, + "step": 23110 + }, + { + "epoch": 0.44, + "learning_rate": 8.829445450242722e-05, + "loss": 1.4058, + "step": 23120 + }, + { + "epoch": 0.44, + "learning_rate": 8.828474179088676e-05, + "loss": 1.2726, + "step": 23130 + }, + { + "epoch": 0.44, + "learning_rate": 8.827502558613074e-05, + "loss": 1.3691, + "step": 23140 + }, + { + "epoch": 0.45, + "learning_rate": 8.826530588904579e-05, + "loss": 1.321, + "step": 23150 + }, + { + "epoch": 0.45, + "learning_rate": 8.825558270051871e-05, + "loss": 1.2878, + "step": 23160 + }, + { + "epoch": 0.45, + "learning_rate": 8.824585602143668e-05, + "loss": 1.4032, + "step": 23170 + }, + { + "epoch": 0.45, + "learning_rate": 8.823612585268723e-05, + "loss": 1.2364, + "step": 23180 + }, + { + "epoch": 0.45, + "learning_rate": 8.822639219515811e-05, + "loss": 1.3157, + "step": 23190 + }, + { + "epoch": 0.45, + "learning_rate": 8.82166550497375e-05, + "loss": 1.2563, + "step": 23200 + }, + { + "epoch": 0.45, + "learning_rate": 8.820691441731382e-05, + "loss": 1.5744, + "step": 23210 + }, + { + "epoch": 0.45, + "learning_rate": 8.819717029877581e-05, + "loss": 1.3628, + "step": 23220 + }, + { + "epoch": 0.45, + "learning_rate": 8.81874226950126e-05, + "loss": 1.2474, + "step": 23230 + }, + { + "epoch": 0.45, + "learning_rate": 8.817767160691358e-05, + "loss": 1.4045, + "step": 23240 + }, + { + "epoch": 0.45, + "learning_rate": 8.816791703536847e-05, + "loss": 1.3834, + "step": 23250 + }, + { + "epoch": 0.45, + "learning_rate": 8.815815898126728e-05, + "loss": 1.2779, + "step": 23260 + }, + { + "epoch": 0.45, + "learning_rate": 8.814839744550039e-05, + "loss": 1.2073, + "step": 23270 + }, + { + "epoch": 0.45, + "learning_rate": 8.813863242895846e-05, + "loss": 0.9973, + "step": 23280 + }, + { + "epoch": 0.45, + "learning_rate": 8.812886393253248e-05, + "loss": 1.2626, + "step": 23290 + }, + { + "epoch": 0.45, + "learning_rate": 8.811909195711376e-05, + "loss": 1.4005, + "step": 23300 + }, + { + "epoch": 0.45, + "learning_rate": 8.810931650359394e-05, + "loss": 1.2073, + "step": 23310 + }, + { + "epoch": 0.45, + "learning_rate": 8.809953757286494e-05, + "loss": 1.2985, + "step": 23320 + }, + { + "epoch": 0.45, + "learning_rate": 8.808975516581903e-05, + "loss": 1.3684, + "step": 23330 + }, + { + "epoch": 0.45, + "learning_rate": 8.807996928334878e-05, + "loss": 1.2892, + "step": 23340 + }, + { + "epoch": 0.45, + "learning_rate": 8.807017992634708e-05, + "loss": 1.2638, + "step": 23350 + }, + { + "epoch": 0.45, + "learning_rate": 8.806038709570717e-05, + "loss": 1.2908, + "step": 23360 + }, + { + "epoch": 0.45, + "learning_rate": 8.805059079232253e-05, + "loss": 1.2028, + "step": 23370 + }, + { + "epoch": 0.45, + "learning_rate": 8.804079101708704e-05, + "loss": 1.2889, + "step": 23380 + }, + { + "epoch": 0.45, + "learning_rate": 8.803098777089485e-05, + "loss": 1.2676, + "step": 23390 + }, + { + "epoch": 0.45, + "learning_rate": 8.802118105464044e-05, + "loss": 1.3761, + "step": 23400 + }, + { + "epoch": 0.45, + "learning_rate": 8.801137086921858e-05, + "loss": 1.1783, + "step": 23410 + }, + { + "epoch": 0.45, + "learning_rate": 8.800155721552443e-05, + "loss": 1.4158, + "step": 23420 + }, + { + "epoch": 0.45, + "learning_rate": 8.799174009445338e-05, + "loss": 1.2277, + "step": 23430 + }, + { + "epoch": 0.45, + "learning_rate": 8.798191950690117e-05, + "loss": 1.2096, + "step": 23440 + }, + { + "epoch": 0.45, + "learning_rate": 8.79720954537639e-05, + "loss": 1.2766, + "step": 23450 + }, + { + "epoch": 0.45, + "learning_rate": 8.796226793593792e-05, + "loss": 1.3304, + "step": 23460 + }, + { + "epoch": 0.45, + "learning_rate": 8.795243695431991e-05, + "loss": 1.2767, + "step": 23470 + }, + { + "epoch": 0.45, + "learning_rate": 8.794260250980688e-05, + "loss": 1.1089, + "step": 23480 + }, + { + "epoch": 0.45, + "learning_rate": 8.793276460329619e-05, + "loss": 1.2314, + "step": 23490 + }, + { + "epoch": 0.45, + "learning_rate": 8.792292323568545e-05, + "loss": 1.2272, + "step": 23500 + }, + { + "epoch": 0.45, + "learning_rate": 8.791307840787261e-05, + "loss": 1.2688, + "step": 23510 + }, + { + "epoch": 0.45, + "learning_rate": 8.790323012075596e-05, + "loss": 1.2017, + "step": 23520 + }, + { + "epoch": 0.45, + "learning_rate": 8.78933783752341e-05, + "loss": 1.2572, + "step": 23530 + }, + { + "epoch": 0.45, + "learning_rate": 8.78835231722059e-05, + "loss": 1.5967, + "step": 23540 + }, + { + "epoch": 0.45, + "learning_rate": 8.78736645125706e-05, + "loss": 1.2391, + "step": 23550 + }, + { + "epoch": 0.45, + "learning_rate": 8.786380239722772e-05, + "loss": 1.3014, + "step": 23560 + }, + { + "epoch": 0.45, + "learning_rate": 8.785393682707711e-05, + "loss": 1.2119, + "step": 23570 + }, + { + "epoch": 0.45, + "learning_rate": 8.784406780301894e-05, + "loss": 1.3249, + "step": 23580 + }, + { + "epoch": 0.45, + "learning_rate": 8.783419532595372e-05, + "loss": 1.2792, + "step": 23590 + }, + { + "epoch": 0.45, + "learning_rate": 8.782431939678218e-05, + "loss": 1.2616, + "step": 23600 + }, + { + "epoch": 0.45, + "learning_rate": 8.781444001640548e-05, + "loss": 1.2989, + "step": 23610 + }, + { + "epoch": 0.45, + "learning_rate": 8.780455718572502e-05, + "loss": 1.1899, + "step": 23620 + }, + { + "epoch": 0.45, + "learning_rate": 8.779467090564256e-05, + "loss": 1.3393, + "step": 23630 + }, + { + "epoch": 0.45, + "learning_rate": 8.778478117706014e-05, + "loss": 1.2664, + "step": 23640 + }, + { + "epoch": 0.45, + "learning_rate": 8.777488800088013e-05, + "loss": 1.1082, + "step": 23650 + }, + { + "epoch": 0.45, + "learning_rate": 8.776499137800522e-05, + "loss": 1.456, + "step": 23660 + }, + { + "epoch": 0.46, + "learning_rate": 8.775509130933839e-05, + "loss": 1.1701, + "step": 23670 + }, + { + "epoch": 0.46, + "learning_rate": 8.774518779578297e-05, + "loss": 1.2321, + "step": 23680 + }, + { + "epoch": 0.46, + "learning_rate": 8.773528083824258e-05, + "loss": 1.1775, + "step": 23690 + }, + { + "epoch": 0.46, + "learning_rate": 8.772537043762117e-05, + "loss": 1.2802, + "step": 23700 + }, + { + "epoch": 0.46, + "learning_rate": 8.771545659482298e-05, + "loss": 1.2145, + "step": 23710 + }, + { + "epoch": 0.46, + "learning_rate": 8.770553931075259e-05, + "loss": 1.3986, + "step": 23720 + }, + { + "epoch": 0.46, + "learning_rate": 8.769561858631488e-05, + "loss": 1.108, + "step": 23730 + }, + { + "epoch": 0.46, + "learning_rate": 8.768569442241504e-05, + "loss": 1.3167, + "step": 23740 + }, + { + "epoch": 0.46, + "learning_rate": 8.767576681995858e-05, + "loss": 1.3237, + "step": 23750 + }, + { + "epoch": 0.46, + "learning_rate": 8.766583577985134e-05, + "loss": 1.1841, + "step": 23760 + }, + { + "epoch": 0.46, + "learning_rate": 8.765590130299944e-05, + "loss": 1.2273, + "step": 23770 + }, + { + "epoch": 0.46, + "learning_rate": 8.764596339030935e-05, + "loss": 1.3044, + "step": 23780 + }, + { + "epoch": 0.46, + "learning_rate": 8.763602204268781e-05, + "loss": 1.4951, + "step": 23790 + }, + { + "epoch": 0.46, + "learning_rate": 8.762607726104193e-05, + "loss": 1.3126, + "step": 23800 + }, + { + "epoch": 0.46, + "learning_rate": 8.76161290462791e-05, + "loss": 1.2374, + "step": 23810 + }, + { + "epoch": 0.46, + "learning_rate": 8.760617739930698e-05, + "loss": 1.0595, + "step": 23820 + }, + { + "epoch": 0.46, + "learning_rate": 8.759622232103363e-05, + "loss": 1.517, + "step": 23830 + }, + { + "epoch": 0.46, + "learning_rate": 8.758626381236738e-05, + "loss": 1.3972, + "step": 23840 + }, + { + "epoch": 0.46, + "learning_rate": 8.757630187421686e-05, + "loss": 1.4081, + "step": 23850 + }, + { + "epoch": 0.46, + "learning_rate": 8.756633650749102e-05, + "loss": 1.3255, + "step": 23860 + }, + { + "epoch": 0.46, + "learning_rate": 8.755636771309916e-05, + "loss": 1.2636, + "step": 23870 + }, + { + "epoch": 0.46, + "learning_rate": 8.754639549195083e-05, + "loss": 1.2255, + "step": 23880 + }, + { + "epoch": 0.46, + "learning_rate": 8.753641984495596e-05, + "loss": 1.2831, + "step": 23890 + }, + { + "epoch": 0.46, + "learning_rate": 8.752644077302472e-05, + "loss": 1.1728, + "step": 23900 + }, + { + "epoch": 0.46, + "learning_rate": 8.751645827706767e-05, + "loss": 1.1858, + "step": 23910 + }, + { + "epoch": 0.46, + "learning_rate": 8.750647235799561e-05, + "loss": 1.4628, + "step": 23920 + }, + { + "epoch": 0.46, + "learning_rate": 8.749648301671971e-05, + "loss": 1.3749, + "step": 23930 + }, + { + "epoch": 0.46, + "learning_rate": 8.748649025415141e-05, + "loss": 1.3737, + "step": 23940 + }, + { + "epoch": 0.46, + "learning_rate": 8.747649407120248e-05, + "loss": 1.1647, + "step": 23950 + }, + { + "epoch": 0.46, + "learning_rate": 8.746649446878501e-05, + "loss": 1.234, + "step": 23960 + }, + { + "epoch": 0.46, + "learning_rate": 8.74564914478114e-05, + "loss": 1.2896, + "step": 23970 + }, + { + "epoch": 0.46, + "learning_rate": 8.744648500919435e-05, + "loss": 1.1208, + "step": 23980 + }, + { + "epoch": 0.46, + "learning_rate": 8.743647515384686e-05, + "loss": 1.3439, + "step": 23990 + }, + { + "epoch": 0.46, + "learning_rate": 8.742646188268229e-05, + "loss": 1.2527, + "step": 24000 + }, + { + "epoch": 0.46, + "learning_rate": 8.741644519661425e-05, + "loss": 1.0824, + "step": 24010 + }, + { + "epoch": 0.46, + "learning_rate": 8.740642509655672e-05, + "loss": 1.2831, + "step": 24020 + }, + { + "epoch": 0.46, + "learning_rate": 8.739640158342395e-05, + "loss": 1.339, + "step": 24030 + }, + { + "epoch": 0.46, + "learning_rate": 8.738637465813054e-05, + "loss": 1.1319, + "step": 24040 + }, + { + "epoch": 0.46, + "learning_rate": 8.737634432159132e-05, + "loss": 1.1888, + "step": 24050 + }, + { + "epoch": 0.46, + "learning_rate": 8.736631057472153e-05, + "loss": 1.2445, + "step": 24060 + }, + { + "epoch": 0.46, + "learning_rate": 8.735627341843669e-05, + "loss": 1.3269, + "step": 24070 + }, + { + "epoch": 0.46, + "learning_rate": 8.734623285365259e-05, + "loss": 1.3556, + "step": 24080 + }, + { + "epoch": 0.46, + "learning_rate": 8.73361888812854e-05, + "loss": 1.2679, + "step": 24090 + }, + { + "epoch": 0.46, + "learning_rate": 8.732614150225151e-05, + "loss": 1.333, + "step": 24100 + }, + { + "epoch": 0.46, + "learning_rate": 8.731609071746772e-05, + "loss": 1.1531, + "step": 24110 + }, + { + "epoch": 0.46, + "learning_rate": 8.730603652785105e-05, + "loss": 1.3322, + "step": 24120 + }, + { + "epoch": 0.46, + "learning_rate": 8.729597893431894e-05, + "loss": 1.4441, + "step": 24130 + }, + { + "epoch": 0.46, + "learning_rate": 8.7285917937789e-05, + "loss": 1.4038, + "step": 24140 + }, + { + "epoch": 0.46, + "learning_rate": 8.727585353917927e-05, + "loss": 1.2727, + "step": 24150 + }, + { + "epoch": 0.46, + "learning_rate": 8.726578573940804e-05, + "loss": 1.2898, + "step": 24160 + }, + { + "epoch": 0.46, + "learning_rate": 8.725571453939394e-05, + "loss": 1.484, + "step": 24170 + }, + { + "epoch": 0.46, + "learning_rate": 8.724563994005588e-05, + "loss": 1.4288, + "step": 24180 + }, + { + "epoch": 0.47, + "learning_rate": 8.723556194231313e-05, + "loss": 1.1676, + "step": 24190 + }, + { + "epoch": 0.47, + "learning_rate": 8.72254805470852e-05, + "loss": 1.3025, + "step": 24200 + }, + { + "epoch": 0.47, + "learning_rate": 8.721539575529197e-05, + "loss": 1.2361, + "step": 24210 + }, + { + "epoch": 0.47, + "learning_rate": 8.720530756785358e-05, + "loss": 1.225, + "step": 24220 + }, + { + "epoch": 0.47, + "learning_rate": 8.719521598569052e-05, + "loss": 1.2299, + "step": 24230 + }, + { + "epoch": 0.47, + "learning_rate": 8.71851210097236e-05, + "loss": 1.3079, + "step": 24240 + }, + { + "epoch": 0.47, + "learning_rate": 8.71750226408739e-05, + "loss": 1.1053, + "step": 24250 + }, + { + "epoch": 0.47, + "learning_rate": 8.716492088006279e-05, + "loss": 0.978, + "step": 24260 + }, + { + "epoch": 0.47, + "learning_rate": 8.715481572821204e-05, + "loss": 1.6357, + "step": 24270 + }, + { + "epoch": 0.47, + "learning_rate": 8.714470718624365e-05, + "loss": 1.3841, + "step": 24280 + }, + { + "epoch": 0.47, + "learning_rate": 8.713459525507996e-05, + "loss": 1.1877, + "step": 24290 + }, + { + "epoch": 0.47, + "learning_rate": 8.712447993564361e-05, + "loss": 1.2383, + "step": 24300 + }, + { + "epoch": 0.47, + "learning_rate": 8.711436122885754e-05, + "loss": 1.1688, + "step": 24310 + }, + { + "epoch": 0.47, + "learning_rate": 8.710423913564503e-05, + "loss": 1.3272, + "step": 24320 + }, + { + "epoch": 0.47, + "learning_rate": 8.709411365692964e-05, + "loss": 1.2633, + "step": 24330 + }, + { + "epoch": 0.47, + "learning_rate": 8.708398479363526e-05, + "loss": 1.2994, + "step": 24340 + }, + { + "epoch": 0.47, + "learning_rate": 8.707385254668606e-05, + "loss": 1.1254, + "step": 24350 + }, + { + "epoch": 0.47, + "learning_rate": 8.706371691700657e-05, + "loss": 1.2881, + "step": 24360 + }, + { + "epoch": 0.47, + "learning_rate": 8.705357790552154e-05, + "loss": 1.2455, + "step": 24370 + }, + { + "epoch": 0.47, + "learning_rate": 8.704343551315614e-05, + "loss": 1.3218, + "step": 24380 + }, + { + "epoch": 0.47, + "learning_rate": 8.703328974083575e-05, + "loss": 1.27, + "step": 24390 + }, + { + "epoch": 0.47, + "learning_rate": 8.702314058948614e-05, + "loss": 1.2219, + "step": 24400 + }, + { + "epoch": 0.47, + "learning_rate": 8.701298806003331e-05, + "loss": 1.2305, + "step": 24410 + }, + { + "epoch": 0.47, + "learning_rate": 8.700283215340366e-05, + "loss": 1.2769, + "step": 24420 + }, + { + "epoch": 0.47, + "learning_rate": 8.699267287052377e-05, + "loss": 1.363, + "step": 24430 + }, + { + "epoch": 0.47, + "learning_rate": 8.698251021232066e-05, + "loss": 1.1918, + "step": 24440 + }, + { + "epoch": 0.47, + "learning_rate": 8.697234417972161e-05, + "loss": 1.1066, + "step": 24450 + }, + { + "epoch": 0.47, + "learning_rate": 8.696217477365417e-05, + "loss": 1.2102, + "step": 24460 + }, + { + "epoch": 0.47, + "learning_rate": 8.695200199504622e-05, + "loss": 1.2908, + "step": 24470 + }, + { + "epoch": 0.47, + "learning_rate": 8.694182584482598e-05, + "loss": 1.3019, + "step": 24480 + }, + { + "epoch": 0.47, + "learning_rate": 8.693164632392194e-05, + "loss": 1.3206, + "step": 24490 + }, + { + "epoch": 0.47, + "learning_rate": 8.69214634332629e-05, + "loss": 1.2205, + "step": 24500 + }, + { + "epoch": 0.47, + "learning_rate": 8.691127717377801e-05, + "loss": 1.1099, + "step": 24510 + }, + { + "epoch": 0.47, + "learning_rate": 8.690108754639666e-05, + "loss": 1.2325, + "step": 24520 + }, + { + "epoch": 0.47, + "learning_rate": 8.689089455204862e-05, + "loss": 1.4773, + "step": 24530 + }, + { + "epoch": 0.47, + "learning_rate": 8.688069819166389e-05, + "loss": 1.3784, + "step": 24540 + }, + { + "epoch": 0.47, + "learning_rate": 8.687049846617284e-05, + "loss": 1.2263, + "step": 24550 + }, + { + "epoch": 0.47, + "learning_rate": 8.686029537650611e-05, + "loss": 1.2377, + "step": 24560 + }, + { + "epoch": 0.47, + "learning_rate": 8.685008892359468e-05, + "loss": 1.246, + "step": 24570 + }, + { + "epoch": 0.47, + "learning_rate": 8.683987910836979e-05, + "loss": 1.4302, + "step": 24580 + }, + { + "epoch": 0.47, + "learning_rate": 8.682966593176305e-05, + "loss": 1.4223, + "step": 24590 + }, + { + "epoch": 0.47, + "learning_rate": 8.681944939470631e-05, + "loss": 1.3111, + "step": 24600 + }, + { + "epoch": 0.47, + "learning_rate": 8.680922949813178e-05, + "loss": 1.3293, + "step": 24610 + }, + { + "epoch": 0.47, + "learning_rate": 8.679900624297193e-05, + "loss": 1.2571, + "step": 24620 + }, + { + "epoch": 0.47, + "learning_rate": 8.678877963015957e-05, + "loss": 1.3261, + "step": 24630 + }, + { + "epoch": 0.47, + "learning_rate": 8.677854966062783e-05, + "loss": 1.2469, + "step": 24640 + }, + { + "epoch": 0.47, + "learning_rate": 8.67683163353101e-05, + "loss": 1.0586, + "step": 24650 + }, + { + "epoch": 0.47, + "learning_rate": 8.67580796551401e-05, + "loss": 1.1861, + "step": 24660 + }, + { + "epoch": 0.47, + "learning_rate": 8.674783962105186e-05, + "loss": 1.4956, + "step": 24670 + }, + { + "epoch": 0.47, + "learning_rate": 8.67375962339797e-05, + "loss": 1.302, + "step": 24680 + }, + { + "epoch": 0.47, + "learning_rate": 8.672734949485829e-05, + "loss": 1.4479, + "step": 24690 + }, + { + "epoch": 0.47, + "learning_rate": 8.671709940462253e-05, + "loss": 1.1814, + "step": 24700 + }, + { + "epoch": 0.48, + "learning_rate": 8.670684596420772e-05, + "loss": 1.1177, + "step": 24710 + }, + { + "epoch": 0.48, + "learning_rate": 8.669658917454937e-05, + "loss": 1.3226, + "step": 24720 + }, + { + "epoch": 0.48, + "learning_rate": 8.668632903658336e-05, + "loss": 1.2454, + "step": 24730 + }, + { + "epoch": 0.48, + "learning_rate": 8.667606555124585e-05, + "loss": 1.2153, + "step": 24740 + }, + { + "epoch": 0.48, + "learning_rate": 8.666579871947333e-05, + "loss": 1.0666, + "step": 24750 + }, + { + "epoch": 0.48, + "learning_rate": 8.665552854220253e-05, + "loss": 1.4203, + "step": 24760 + }, + { + "epoch": 0.48, + "learning_rate": 8.664525502037059e-05, + "loss": 1.2008, + "step": 24770 + }, + { + "epoch": 0.48, + "learning_rate": 8.663497815491486e-05, + "loss": 1.303, + "step": 24780 + }, + { + "epoch": 0.48, + "learning_rate": 8.662469794677306e-05, + "loss": 1.2779, + "step": 24790 + }, + { + "epoch": 0.48, + "learning_rate": 8.661441439688315e-05, + "loss": 1.0151, + "step": 24800 + }, + { + "epoch": 0.48, + "learning_rate": 8.660412750618345e-05, + "loss": 1.3339, + "step": 24810 + }, + { + "epoch": 0.48, + "learning_rate": 8.659383727561259e-05, + "loss": 1.2459, + "step": 24820 + }, + { + "epoch": 0.48, + "learning_rate": 8.658354370610944e-05, + "loss": 1.0281, + "step": 24830 + }, + { + "epoch": 0.48, + "learning_rate": 8.657324679861326e-05, + "loss": 1.3584, + "step": 24840 + }, + { + "epoch": 0.48, + "learning_rate": 8.656294655406351e-05, + "loss": 1.3592, + "step": 24850 + }, + { + "epoch": 0.48, + "learning_rate": 8.655264297340009e-05, + "loss": 1.3096, + "step": 24860 + }, + { + "epoch": 0.48, + "learning_rate": 8.654233605756308e-05, + "loss": 1.1819, + "step": 24870 + }, + { + "epoch": 0.48, + "learning_rate": 8.653202580749292e-05, + "loss": 1.2104, + "step": 24880 + }, + { + "epoch": 0.48, + "learning_rate": 8.652171222413037e-05, + "loss": 1.2947, + "step": 24890 + }, + { + "epoch": 0.48, + "learning_rate": 8.651139530841645e-05, + "loss": 1.1817, + "step": 24900 + }, + { + "epoch": 0.48, + "learning_rate": 8.650107506129253e-05, + "loss": 1.2528, + "step": 24910 + }, + { + "epoch": 0.48, + "learning_rate": 8.649075148370021e-05, + "loss": 1.1333, + "step": 24920 + }, + { + "epoch": 0.48, + "learning_rate": 8.648042457658152e-05, + "loss": 1.2834, + "step": 24930 + }, + { + "epoch": 0.48, + "learning_rate": 8.647009434087865e-05, + "loss": 1.3249, + "step": 24940 + }, + { + "epoch": 0.48, + "learning_rate": 8.64597607775342e-05, + "loss": 1.4387, + "step": 24950 + }, + { + "epoch": 0.48, + "learning_rate": 8.644942388749102e-05, + "loss": 1.2659, + "step": 24960 + }, + { + "epoch": 0.48, + "learning_rate": 8.64390836716923e-05, + "loss": 1.1693, + "step": 24970 + }, + { + "epoch": 0.48, + "learning_rate": 8.642874013108148e-05, + "loss": 1.2862, + "step": 24980 + }, + { + "epoch": 0.48, + "learning_rate": 8.641839326660237e-05, + "loss": 1.2829, + "step": 24990 + }, + { + "epoch": 0.48, + "learning_rate": 8.640804307919902e-05, + "loss": 1.2455, + "step": 25000 + }, + { + "epoch": 0.48, + "learning_rate": 8.639768956981583e-05, + "loss": 1.1734, + "step": 25010 + }, + { + "epoch": 0.48, + "learning_rate": 8.638733273939748e-05, + "loss": 1.3274, + "step": 25020 + }, + { + "epoch": 0.48, + "learning_rate": 8.637697258888896e-05, + "loss": 1.2912, + "step": 25030 + }, + { + "epoch": 0.48, + "learning_rate": 8.636660911923555e-05, + "loss": 1.2205, + "step": 25040 + }, + { + "epoch": 0.48, + "learning_rate": 8.635624233138286e-05, + "loss": 1.3405, + "step": 25050 + }, + { + "epoch": 0.48, + "learning_rate": 8.634587222627679e-05, + "loss": 1.263, + "step": 25060 + }, + { + "epoch": 0.48, + "learning_rate": 8.633549880486351e-05, + "loss": 1.3308, + "step": 25070 + }, + { + "epoch": 0.48, + "learning_rate": 8.632512206808958e-05, + "loss": 1.3356, + "step": 25080 + }, + { + "epoch": 0.48, + "learning_rate": 8.631474201690173e-05, + "loss": 1.2657, + "step": 25090 + }, + { + "epoch": 0.48, + "learning_rate": 8.630435865224713e-05, + "loss": 1.2769, + "step": 25100 + }, + { + "epoch": 0.48, + "learning_rate": 8.629397197507315e-05, + "loss": 1.2632, + "step": 25110 + }, + { + "epoch": 0.48, + "learning_rate": 8.628358198632753e-05, + "loss": 1.2584, + "step": 25120 + }, + { + "epoch": 0.48, + "learning_rate": 8.627318868695826e-05, + "loss": 1.2567, + "step": 25130 + }, + { + "epoch": 0.48, + "learning_rate": 8.626279207791367e-05, + "loss": 1.2489, + "step": 25140 + }, + { + "epoch": 0.48, + "learning_rate": 8.625239216014239e-05, + "loss": 1.2256, + "step": 25150 + }, + { + "epoch": 0.48, + "learning_rate": 8.62419889345933e-05, + "loss": 1.6258, + "step": 25160 + }, + { + "epoch": 0.48, + "learning_rate": 8.623158240221566e-05, + "loss": 1.2184, + "step": 25170 + }, + { + "epoch": 0.48, + "learning_rate": 8.622117256395896e-05, + "loss": 1.2458, + "step": 25180 + }, + { + "epoch": 0.48, + "learning_rate": 8.621075942077307e-05, + "loss": 1.1242, + "step": 25190 + }, + { + "epoch": 0.48, + "learning_rate": 8.620034297360809e-05, + "loss": 1.3397, + "step": 25200 + }, + { + "epoch": 0.48, + "learning_rate": 8.618992322341444e-05, + "loss": 1.0229, + "step": 25210 + }, + { + "epoch": 0.48, + "learning_rate": 8.617950017114284e-05, + "loss": 1.3809, + "step": 25220 + }, + { + "epoch": 0.49, + "learning_rate": 8.616907381774438e-05, + "loss": 1.336, + "step": 25230 + }, + { + "epoch": 0.49, + "learning_rate": 8.615864416417033e-05, + "loss": 1.2924, + "step": 25240 + }, + { + "epoch": 0.49, + "learning_rate": 8.614821121137236e-05, + "loss": 1.3836, + "step": 25250 + }, + { + "epoch": 0.49, + "learning_rate": 8.613777496030237e-05, + "loss": 1.3497, + "step": 25260 + }, + { + "epoch": 0.49, + "learning_rate": 8.612733541191262e-05, + "loss": 1.3889, + "step": 25270 + }, + { + "epoch": 0.49, + "learning_rate": 8.611689256715564e-05, + "loss": 1.2354, + "step": 25280 + }, + { + "epoch": 0.49, + "learning_rate": 8.610644642698427e-05, + "loss": 1.0807, + "step": 25290 + }, + { + "epoch": 0.49, + "learning_rate": 8.609599699235164e-05, + "loss": 1.2515, + "step": 25300 + }, + { + "epoch": 0.49, + "learning_rate": 8.60855442642112e-05, + "loss": 1.2451, + "step": 25310 + }, + { + "epoch": 0.49, + "learning_rate": 8.607508824351669e-05, + "loss": 1.2102, + "step": 25320 + }, + { + "epoch": 0.49, + "learning_rate": 8.606462893122212e-05, + "loss": 1.0768, + "step": 25330 + }, + { + "epoch": 0.49, + "learning_rate": 8.605416632828185e-05, + "loss": 1.2183, + "step": 25340 + }, + { + "epoch": 0.49, + "learning_rate": 8.604370043565054e-05, + "loss": 1.2816, + "step": 25350 + }, + { + "epoch": 0.49, + "learning_rate": 8.603323125428309e-05, + "loss": 1.3463, + "step": 25360 + }, + { + "epoch": 0.49, + "learning_rate": 8.602275878513475e-05, + "loss": 1.2908, + "step": 25370 + }, + { + "epoch": 0.49, + "learning_rate": 8.601228302916109e-05, + "loss": 1.2678, + "step": 25380 + }, + { + "epoch": 0.49, + "learning_rate": 8.60018039873179e-05, + "loss": 1.3399, + "step": 25390 + }, + { + "epoch": 0.49, + "learning_rate": 8.599132166056137e-05, + "loss": 1.327, + "step": 25400 + }, + { + "epoch": 0.49, + "learning_rate": 8.598083604984791e-05, + "loss": 1.2336, + "step": 25410 + }, + { + "epoch": 0.49, + "learning_rate": 8.597034715613426e-05, + "loss": 1.2365, + "step": 25420 + }, + { + "epoch": 0.49, + "learning_rate": 8.595985498037748e-05, + "loss": 1.6296, + "step": 25430 + }, + { + "epoch": 0.49, + "learning_rate": 8.594935952353487e-05, + "loss": 1.2119, + "step": 25440 + }, + { + "epoch": 0.49, + "learning_rate": 8.593886078656409e-05, + "loss": 1.3625, + "step": 25450 + }, + { + "epoch": 0.49, + "learning_rate": 8.592835877042309e-05, + "loss": 1.1275, + "step": 25460 + }, + { + "epoch": 0.49, + "learning_rate": 8.591785347607007e-05, + "loss": 1.368, + "step": 25470 + }, + { + "epoch": 0.49, + "learning_rate": 8.59073449044636e-05, + "loss": 1.1099, + "step": 25480 + }, + { + "epoch": 0.49, + "learning_rate": 8.589683305656249e-05, + "loss": 1.4078, + "step": 25490 + }, + { + "epoch": 0.49, + "learning_rate": 8.588631793332589e-05, + "loss": 1.3117, + "step": 25500 + }, + { + "epoch": 0.49, + "learning_rate": 8.58757995357132e-05, + "loss": 1.4631, + "step": 25510 + }, + { + "epoch": 0.49, + "learning_rate": 8.586527786468422e-05, + "loss": 1.3648, + "step": 25520 + }, + { + "epoch": 0.49, + "learning_rate": 8.58547529211989e-05, + "loss": 1.4038, + "step": 25530 + }, + { + "epoch": 0.49, + "learning_rate": 8.58442247062176e-05, + "loss": 1.2978, + "step": 25540 + }, + { + "epoch": 0.49, + "learning_rate": 8.583369322070094e-05, + "loss": 1.2655, + "step": 25550 + }, + { + "epoch": 0.49, + "learning_rate": 8.582315846560986e-05, + "loss": 1.2609, + "step": 25560 + }, + { + "epoch": 0.49, + "learning_rate": 8.581262044190559e-05, + "loss": 1.2292, + "step": 25570 + }, + { + "epoch": 0.49, + "learning_rate": 8.580207915054962e-05, + "loss": 1.2096, + "step": 25580 + }, + { + "epoch": 0.49, + "learning_rate": 8.579153459250377e-05, + "loss": 1.2939, + "step": 25590 + }, + { + "epoch": 0.49, + "learning_rate": 8.578098676873019e-05, + "loss": 1.4657, + "step": 25600 + }, + { + "epoch": 0.49, + "learning_rate": 8.577043568019128e-05, + "loss": 1.1646, + "step": 25610 + }, + { + "epoch": 0.49, + "learning_rate": 8.575988132784975e-05, + "loss": 1.2445, + "step": 25620 + }, + { + "epoch": 0.49, + "learning_rate": 8.574932371266859e-05, + "loss": 1.1337, + "step": 25630 + }, + { + "epoch": 0.49, + "learning_rate": 8.573876283561115e-05, + "loss": 1.0884, + "step": 25640 + }, + { + "epoch": 0.49, + "learning_rate": 8.572819869764101e-05, + "loss": 1.3262, + "step": 25650 + }, + { + "epoch": 0.49, + "learning_rate": 8.571763129972209e-05, + "loss": 1.2143, + "step": 25660 + }, + { + "epoch": 0.49, + "learning_rate": 8.570706064281856e-05, + "loss": 1.3505, + "step": 25670 + }, + { + "epoch": 0.49, + "learning_rate": 8.569648672789497e-05, + "loss": 1.145, + "step": 25680 + }, + { + "epoch": 0.49, + "learning_rate": 8.568590955591606e-05, + "loss": 1.2317, + "step": 25690 + }, + { + "epoch": 0.49, + "learning_rate": 8.567532912784695e-05, + "loss": 1.3809, + "step": 25700 + }, + { + "epoch": 0.49, + "learning_rate": 8.566474544465304e-05, + "loss": 1.251, + "step": 25710 + }, + { + "epoch": 0.49, + "learning_rate": 8.56541585073e-05, + "loss": 1.501, + "step": 25720 + }, + { + "epoch": 0.49, + "learning_rate": 8.564356831675383e-05, + "loss": 1.189, + "step": 25730 + }, + { + "epoch": 0.49, + "learning_rate": 8.563297487398079e-05, + "loss": 1.3831, + "step": 25740 + }, + { + "epoch": 0.5, + "learning_rate": 8.562237817994747e-05, + "loss": 1.366, + "step": 25750 + }, + { + "epoch": 0.5, + "learning_rate": 8.561177823562074e-05, + "loss": 1.3184, + "step": 25760 + }, + { + "epoch": 0.5, + "learning_rate": 8.560117504196779e-05, + "loss": 1.3487, + "step": 25770 + }, + { + "epoch": 0.5, + "learning_rate": 8.559056859995607e-05, + "loss": 1.2711, + "step": 25780 + }, + { + "epoch": 0.5, + "learning_rate": 8.557995891055333e-05, + "loss": 1.163, + "step": 25790 + }, + { + "epoch": 0.5, + "learning_rate": 8.556934597472766e-05, + "loss": 1.1446, + "step": 25800 + }, + { + "epoch": 0.5, + "learning_rate": 8.555872979344739e-05, + "loss": 1.3401, + "step": 25810 + }, + { + "epoch": 0.5, + "learning_rate": 8.55481103676812e-05, + "loss": 1.3432, + "step": 25820 + }, + { + "epoch": 0.5, + "learning_rate": 8.553748769839801e-05, + "loss": 1.39, + "step": 25830 + }, + { + "epoch": 0.5, + "learning_rate": 8.552686178656708e-05, + "loss": 1.3649, + "step": 25840 + }, + { + "epoch": 0.5, + "learning_rate": 8.551623263315796e-05, + "loss": 1.2359, + "step": 25850 + }, + { + "epoch": 0.5, + "learning_rate": 8.550560023914047e-05, + "loss": 1.3131, + "step": 25860 + }, + { + "epoch": 0.5, + "learning_rate": 8.549496460548474e-05, + "loss": 1.3377, + "step": 25870 + }, + { + "epoch": 0.5, + "learning_rate": 8.54843257331612e-05, + "loss": 1.2271, + "step": 25880 + }, + { + "epoch": 0.5, + "learning_rate": 8.547368362314059e-05, + "loss": 1.3565, + "step": 25890 + }, + { + "epoch": 0.5, + "learning_rate": 8.54630382763939e-05, + "loss": 1.4663, + "step": 25900 + }, + { + "epoch": 0.5, + "learning_rate": 8.545238969389247e-05, + "loss": 1.5225, + "step": 25910 + }, + { + "epoch": 0.5, + "learning_rate": 8.544173787660788e-05, + "loss": 1.1, + "step": 25920 + }, + { + "epoch": 0.5, + "learning_rate": 8.543108282551205e-05, + "loss": 1.2345, + "step": 25930 + }, + { + "epoch": 0.5, + "learning_rate": 8.542042454157719e-05, + "loss": 1.3981, + "step": 25940 + }, + { + "epoch": 0.5, + "learning_rate": 8.540976302577579e-05, + "loss": 1.2563, + "step": 25950 + }, + { + "epoch": 0.5, + "learning_rate": 8.539909827908063e-05, + "loss": 1.3372, + "step": 25960 + }, + { + "epoch": 0.5, + "learning_rate": 8.538843030246479e-05, + "loss": 1.2642, + "step": 25970 + }, + { + "epoch": 0.5, + "learning_rate": 8.537775909690166e-05, + "loss": 1.3084, + "step": 25980 + }, + { + "epoch": 0.5, + "learning_rate": 8.53670846633649e-05, + "loss": 1.3232, + "step": 25990 + }, + { + "epoch": 0.5, + "learning_rate": 8.53564070028285e-05, + "loss": 1.3055, + "step": 26000 + }, + { + "epoch": 0.5, + "learning_rate": 8.53457261162667e-05, + "loss": 1.1639, + "step": 26010 + }, + { + "epoch": 0.5, + "learning_rate": 8.533504200465405e-05, + "loss": 1.248, + "step": 26020 + }, + { + "epoch": 0.5, + "learning_rate": 8.532435466896545e-05, + "loss": 1.1644, + "step": 26030 + }, + { + "epoch": 0.5, + "learning_rate": 8.531366411017598e-05, + "loss": 1.3173, + "step": 26040 + }, + { + "epoch": 0.5, + "learning_rate": 8.53029703292611e-05, + "loss": 1.341, + "step": 26050 + }, + { + "epoch": 0.5, + "learning_rate": 8.529227332719657e-05, + "loss": 1.3811, + "step": 26060 + }, + { + "epoch": 0.5, + "learning_rate": 8.528157310495839e-05, + "loss": 1.2061, + "step": 26070 + }, + { + "epoch": 0.5, + "learning_rate": 8.527086966352289e-05, + "loss": 1.3943, + "step": 26080 + }, + { + "epoch": 0.5, + "learning_rate": 8.526016300386669e-05, + "loss": 1.3149, + "step": 26090 + }, + { + "epoch": 0.5, + "learning_rate": 8.524945312696668e-05, + "loss": 1.3332, + "step": 26100 + }, + { + "epoch": 0.5, + "learning_rate": 8.523874003380008e-05, + "loss": 1.2111, + "step": 26110 + }, + { + "epoch": 0.5, + "learning_rate": 8.522802372534438e-05, + "loss": 1.2866, + "step": 26120 + }, + { + "epoch": 0.5, + "learning_rate": 8.521730420257735e-05, + "loss": 1.2371, + "step": 26130 + }, + { + "epoch": 0.5, + "learning_rate": 8.52065814664771e-05, + "loss": 1.2803, + "step": 26140 + }, + { + "epoch": 0.5, + "learning_rate": 8.519585551802198e-05, + "loss": 1.2091, + "step": 26150 + }, + { + "epoch": 0.5, + "learning_rate": 8.518512635819068e-05, + "loss": 1.2132, + "step": 26160 + }, + { + "epoch": 0.5, + "learning_rate": 8.517439398796214e-05, + "loss": 1.2747, + "step": 26170 + }, + { + "epoch": 0.5, + "learning_rate": 8.516365840831565e-05, + "loss": 1.1185, + "step": 26180 + }, + { + "epoch": 0.5, + "learning_rate": 8.515291962023072e-05, + "loss": 1.3429, + "step": 26190 + }, + { + "epoch": 0.5, + "learning_rate": 8.51421776246872e-05, + "loss": 1.163, + "step": 26200 + }, + { + "epoch": 0.5, + "learning_rate": 8.51314324226652e-05, + "loss": 1.3672, + "step": 26210 + }, + { + "epoch": 0.5, + "learning_rate": 8.51206840151452e-05, + "loss": 1.1565, + "step": 26220 + }, + { + "epoch": 0.5, + "learning_rate": 8.510993240310788e-05, + "loss": 1.3848, + "step": 26230 + }, + { + "epoch": 0.5, + "learning_rate": 8.509917758753423e-05, + "loss": 1.383, + "step": 26240 + }, + { + "epoch": 0.5, + "learning_rate": 8.50884195694056e-05, + "loss": 1.3075, + "step": 26250 + }, + { + "epoch": 0.5, + "learning_rate": 8.507765834970355e-05, + "loss": 1.1299, + "step": 26260 + }, + { + "epoch": 0.51, + "learning_rate": 8.506689392940998e-05, + "loss": 1.4614, + "step": 26270 + }, + { + "epoch": 0.51, + "learning_rate": 8.505612630950706e-05, + "loss": 1.2264, + "step": 26280 + }, + { + "epoch": 0.51, + "learning_rate": 8.504535549097727e-05, + "loss": 1.2389, + "step": 26290 + }, + { + "epoch": 0.51, + "learning_rate": 8.503458147480338e-05, + "loss": 1.416, + "step": 26300 + }, + { + "epoch": 0.51, + "learning_rate": 8.502380426196841e-05, + "loss": 1.373, + "step": 26310 + }, + { + "epoch": 0.51, + "learning_rate": 8.501302385345573e-05, + "loss": 1.3067, + "step": 26320 + }, + { + "epoch": 0.51, + "learning_rate": 8.500224025024899e-05, + "loss": 1.3258, + "step": 26330 + }, + { + "epoch": 0.51, + "learning_rate": 8.499145345333208e-05, + "loss": 1.2853, + "step": 26340 + }, + { + "epoch": 0.51, + "learning_rate": 8.498066346368926e-05, + "loss": 1.2557, + "step": 26350 + }, + { + "epoch": 0.51, + "learning_rate": 8.496987028230501e-05, + "loss": 1.1936, + "step": 26360 + }, + { + "epoch": 0.51, + "learning_rate": 8.495907391016416e-05, + "loss": 1.3147, + "step": 26370 + }, + { + "epoch": 0.51, + "learning_rate": 8.494827434825177e-05, + "loss": 1.3184, + "step": 26380 + }, + { + "epoch": 0.51, + "learning_rate": 8.493747159755325e-05, + "loss": 1.2931, + "step": 26390 + }, + { + "epoch": 0.51, + "learning_rate": 8.492666565905428e-05, + "loss": 1.3665, + "step": 26400 + }, + { + "epoch": 0.51, + "learning_rate": 8.491585653374081e-05, + "loss": 1.3053, + "step": 26410 + }, + { + "epoch": 0.51, + "learning_rate": 8.49050442225991e-05, + "loss": 1.4516, + "step": 26420 + }, + { + "epoch": 0.51, + "learning_rate": 8.489422872661571e-05, + "loss": 1.0048, + "step": 26430 + }, + { + "epoch": 0.51, + "learning_rate": 8.488341004677745e-05, + "loss": 1.2913, + "step": 26440 + }, + { + "epoch": 0.51, + "learning_rate": 8.487258818407149e-05, + "loss": 1.494, + "step": 26450 + }, + { + "epoch": 0.51, + "learning_rate": 8.486176313948521e-05, + "loss": 1.3213, + "step": 26460 + }, + { + "epoch": 0.51, + "learning_rate": 8.485093491400635e-05, + "loss": 1.1013, + "step": 26470 + }, + { + "epoch": 0.51, + "learning_rate": 8.48401035086229e-05, + "loss": 1.3415, + "step": 26480 + }, + { + "epoch": 0.51, + "learning_rate": 8.482926892432314e-05, + "loss": 1.3253, + "step": 26490 + }, + { + "epoch": 0.51, + "learning_rate": 8.481843116209566e-05, + "loss": 1.2684, + "step": 26500 + }, + { + "epoch": 0.51, + "learning_rate": 8.480759022292934e-05, + "loss": 1.1928, + "step": 26510 + }, + { + "epoch": 0.51, + "learning_rate": 8.479674610781331e-05, + "loss": 1.3124, + "step": 26520 + }, + { + "epoch": 0.51, + "learning_rate": 8.478589881773706e-05, + "loss": 1.275, + "step": 26530 + }, + { + "epoch": 0.51, + "learning_rate": 8.47750483536903e-05, + "loss": 1.4937, + "step": 26540 + }, + { + "epoch": 0.51, + "learning_rate": 8.476419471666306e-05, + "loss": 1.2804, + "step": 26550 + }, + { + "epoch": 0.51, + "learning_rate": 8.475333790764566e-05, + "loss": 1.2967, + "step": 26560 + }, + { + "epoch": 0.51, + "learning_rate": 8.474247792762873e-05, + "loss": 1.1503, + "step": 26570 + }, + { + "epoch": 0.51, + "learning_rate": 8.473161477760315e-05, + "loss": 1.2519, + "step": 26580 + }, + { + "epoch": 0.51, + "learning_rate": 8.472074845856008e-05, + "loss": 1.2036, + "step": 26590 + }, + { + "epoch": 0.51, + "learning_rate": 8.470987897149106e-05, + "loss": 1.4442, + "step": 26600 + }, + { + "epoch": 0.51, + "learning_rate": 8.469900631738779e-05, + "loss": 1.0919, + "step": 26610 + }, + { + "epoch": 0.51, + "learning_rate": 8.468813049724235e-05, + "loss": 1.1629, + "step": 26620 + }, + { + "epoch": 0.51, + "learning_rate": 8.467725151204711e-05, + "loss": 1.3146, + "step": 26630 + }, + { + "epoch": 0.51, + "learning_rate": 8.466636936279467e-05, + "loss": 1.1448, + "step": 26640 + }, + { + "epoch": 0.51, + "learning_rate": 8.465548405047794e-05, + "loss": 1.3973, + "step": 26650 + }, + { + "epoch": 0.51, + "learning_rate": 8.464459557609017e-05, + "loss": 1.2155, + "step": 26660 + }, + { + "epoch": 0.51, + "learning_rate": 8.463370394062481e-05, + "loss": 1.3208, + "step": 26670 + }, + { + "epoch": 0.51, + "learning_rate": 8.462280914507568e-05, + "loss": 1.163, + "step": 26680 + }, + { + "epoch": 0.51, + "learning_rate": 8.461191119043684e-05, + "loss": 1.3457, + "step": 26690 + }, + { + "epoch": 0.51, + "learning_rate": 8.460101007770265e-05, + "loss": 1.2833, + "step": 26700 + }, + { + "epoch": 0.51, + "learning_rate": 8.459010580786777e-05, + "loss": 1.1441, + "step": 26710 + }, + { + "epoch": 0.51, + "learning_rate": 8.457919838192714e-05, + "loss": 1.3319, + "step": 26720 + }, + { + "epoch": 0.51, + "learning_rate": 8.456828780087598e-05, + "loss": 1.3963, + "step": 26730 + }, + { + "epoch": 0.51, + "learning_rate": 8.455737406570979e-05, + "loss": 1.5014, + "step": 26740 + }, + { + "epoch": 0.51, + "learning_rate": 8.45464571774244e-05, + "loss": 1.1003, + "step": 26750 + }, + { + "epoch": 0.51, + "learning_rate": 8.453553713701587e-05, + "loss": 1.2513, + "step": 26760 + }, + { + "epoch": 0.51, + "learning_rate": 8.45246139454806e-05, + "loss": 1.1898, + "step": 26770 + }, + { + "epoch": 0.51, + "learning_rate": 8.451368760381526e-05, + "loss": 1.232, + "step": 26780 + }, + { + "epoch": 0.52, + "learning_rate": 8.450275811301678e-05, + "loss": 1.171, + "step": 26790 + }, + { + "epoch": 0.52, + "learning_rate": 8.449182547408243e-05, + "loss": 1.2793, + "step": 26800 + }, + { + "epoch": 0.52, + "learning_rate": 8.448088968800968e-05, + "loss": 1.4364, + "step": 26810 + }, + { + "epoch": 0.52, + "learning_rate": 8.446995075579642e-05, + "loss": 1.5247, + "step": 26820 + }, + { + "epoch": 0.52, + "learning_rate": 8.44590086784407e-05, + "loss": 1.2296, + "step": 26830 + }, + { + "epoch": 0.52, + "learning_rate": 8.444806345694092e-05, + "loss": 1.2471, + "step": 26840 + }, + { + "epoch": 0.52, + "learning_rate": 8.443711509229577e-05, + "loss": 1.2505, + "step": 26850 + }, + { + "epoch": 0.52, + "learning_rate": 8.442616358550419e-05, + "loss": 1.4087, + "step": 26860 + }, + { + "epoch": 0.52, + "learning_rate": 8.441520893756542e-05, + "loss": 1.151, + "step": 26870 + }, + { + "epoch": 0.52, + "learning_rate": 8.440425114947904e-05, + "loss": 1.1604, + "step": 26880 + }, + { + "epoch": 0.52, + "learning_rate": 8.439329022224483e-05, + "loss": 1.0405, + "step": 26890 + }, + { + "epoch": 0.52, + "learning_rate": 8.43823261568629e-05, + "loss": 1.2368, + "step": 26900 + }, + { + "epoch": 0.52, + "learning_rate": 8.437135895433367e-05, + "loss": 1.2347, + "step": 26910 + }, + { + "epoch": 0.52, + "learning_rate": 8.43603886156578e-05, + "loss": 1.2692, + "step": 26920 + }, + { + "epoch": 0.52, + "learning_rate": 8.434941514183627e-05, + "loss": 1.1797, + "step": 26930 + }, + { + "epoch": 0.52, + "learning_rate": 8.433843853387034e-05, + "loss": 1.2293, + "step": 26940 + }, + { + "epoch": 0.52, + "learning_rate": 8.432745879276152e-05, + "loss": 1.2469, + "step": 26950 + }, + { + "epoch": 0.52, + "learning_rate": 8.431647591951166e-05, + "loss": 1.4054, + "step": 26960 + }, + { + "epoch": 0.52, + "learning_rate": 8.430548991512286e-05, + "loss": 1.3398, + "step": 26970 + }, + { + "epoch": 0.52, + "learning_rate": 8.429450078059751e-05, + "loss": 1.2314, + "step": 26980 + }, + { + "epoch": 0.52, + "learning_rate": 8.428350851693831e-05, + "loss": 1.4495, + "step": 26990 + }, + { + "epoch": 0.52, + "learning_rate": 8.427251312514822e-05, + "loss": 1.3226, + "step": 27000 + }, + { + "epoch": 0.52, + "learning_rate": 8.426151460623046e-05, + "loss": 1.4091, + "step": 27010 + }, + { + "epoch": 0.52, + "learning_rate": 8.425051296118862e-05, + "loss": 1.2245, + "step": 27020 + }, + { + "epoch": 0.52, + "learning_rate": 8.42395081910265e-05, + "loss": 1.4106, + "step": 27030 + }, + { + "epoch": 0.52, + "learning_rate": 8.42285002967482e-05, + "loss": 1.1378, + "step": 27040 + }, + { + "epoch": 0.52, + "learning_rate": 8.421748927935813e-05, + "loss": 1.1341, + "step": 27050 + }, + { + "epoch": 0.52, + "learning_rate": 8.420647513986097e-05, + "loss": 1.1649, + "step": 27060 + }, + { + "epoch": 0.52, + "learning_rate": 8.419545787926166e-05, + "loss": 1.2055, + "step": 27070 + }, + { + "epoch": 0.52, + "learning_rate": 8.418443749856547e-05, + "loss": 1.295, + "step": 27080 + }, + { + "epoch": 0.52, + "learning_rate": 8.417341399877792e-05, + "loss": 1.1502, + "step": 27090 + }, + { + "epoch": 0.52, + "learning_rate": 8.416238738090484e-05, + "loss": 1.2067, + "step": 27100 + }, + { + "epoch": 0.52, + "learning_rate": 8.415135764595232e-05, + "loss": 1.1214, + "step": 27110 + }, + { + "epoch": 0.52, + "learning_rate": 8.414032479492676e-05, + "loss": 1.1568, + "step": 27120 + }, + { + "epoch": 0.52, + "learning_rate": 8.412928882883481e-05, + "loss": 1.471, + "step": 27130 + }, + { + "epoch": 0.52, + "learning_rate": 8.411824974868345e-05, + "loss": 1.1852, + "step": 27140 + }, + { + "epoch": 0.52, + "learning_rate": 8.41072075554799e-05, + "loss": 1.5221, + "step": 27150 + }, + { + "epoch": 0.52, + "learning_rate": 8.409616225023169e-05, + "loss": 1.1691, + "step": 27160 + }, + { + "epoch": 0.52, + "learning_rate": 8.408511383394663e-05, + "loss": 1.2235, + "step": 27170 + }, + { + "epoch": 0.52, + "learning_rate": 8.407406230763279e-05, + "loss": 1.4331, + "step": 27180 + }, + { + "epoch": 0.52, + "learning_rate": 8.406300767229857e-05, + "loss": 1.0593, + "step": 27190 + }, + { + "epoch": 0.52, + "learning_rate": 8.405194992895264e-05, + "loss": 1.3323, + "step": 27200 + }, + { + "epoch": 0.52, + "learning_rate": 8.40408890786039e-05, + "loss": 1.192, + "step": 27210 + }, + { + "epoch": 0.52, + "learning_rate": 8.402982512226159e-05, + "loss": 1.3016, + "step": 27220 + }, + { + "epoch": 0.52, + "learning_rate": 8.401875806093524e-05, + "loss": 1.1356, + "step": 27230 + }, + { + "epoch": 0.52, + "learning_rate": 8.400768789563463e-05, + "loss": 1.3031, + "step": 27240 + }, + { + "epoch": 0.52, + "learning_rate": 8.399661462736983e-05, + "loss": 1.2102, + "step": 27250 + }, + { + "epoch": 0.52, + "learning_rate": 8.398553825715122e-05, + "loss": 1.5091, + "step": 27260 + }, + { + "epoch": 0.52, + "learning_rate": 8.397445878598939e-05, + "loss": 1.3252, + "step": 27270 + }, + { + "epoch": 0.52, + "learning_rate": 8.396337621489532e-05, + "loss": 1.2352, + "step": 27280 + }, + { + "epoch": 0.52, + "learning_rate": 8.395229054488019e-05, + "loss": 1.2655, + "step": 27290 + }, + { + "epoch": 0.52, + "learning_rate": 8.394120177695548e-05, + "loss": 1.285, + "step": 27300 + }, + { + "epoch": 0.53, + "learning_rate": 8.393010991213299e-05, + "loss": 1.5301, + "step": 27310 + }, + { + "epoch": 0.53, + "learning_rate": 8.391901495142476e-05, + "loss": 1.4222, + "step": 27320 + }, + { + "epoch": 0.53, + "learning_rate": 8.390791689584314e-05, + "loss": 1.5654, + "step": 27330 + }, + { + "epoch": 0.53, + "learning_rate": 8.389681574640074e-05, + "loss": 1.4082, + "step": 27340 + }, + { + "epoch": 0.53, + "learning_rate": 8.388571150411046e-05, + "loss": 1.1596, + "step": 27350 + }, + { + "epoch": 0.53, + "learning_rate": 8.387460416998549e-05, + "loss": 1.4219, + "step": 27360 + }, + { + "epoch": 0.53, + "learning_rate": 8.386349374503927e-05, + "loss": 1.1008, + "step": 27370 + }, + { + "epoch": 0.53, + "learning_rate": 8.385238023028561e-05, + "loss": 1.335, + "step": 27380 + }, + { + "epoch": 0.53, + "learning_rate": 8.384126362673848e-05, + "loss": 1.3131, + "step": 27390 + }, + { + "epoch": 0.53, + "learning_rate": 8.383014393541224e-05, + "loss": 1.4491, + "step": 27400 + }, + { + "epoch": 0.53, + "learning_rate": 8.381902115732144e-05, + "loss": 1.4997, + "step": 27410 + }, + { + "epoch": 0.53, + "learning_rate": 8.380789529348099e-05, + "loss": 1.3243, + "step": 27420 + }, + { + "epoch": 0.53, + "learning_rate": 8.379676634490601e-05, + "loss": 1.2531, + "step": 27430 + }, + { + "epoch": 0.53, + "learning_rate": 8.3785634312612e-05, + "loss": 1.274, + "step": 27440 + }, + { + "epoch": 0.53, + "learning_rate": 8.37744991976146e-05, + "loss": 1.2635, + "step": 27450 + }, + { + "epoch": 0.53, + "learning_rate": 8.376336100092989e-05, + "loss": 1.3091, + "step": 27460 + }, + { + "epoch": 0.53, + "learning_rate": 8.37522197235741e-05, + "loss": 1.1116, + "step": 27470 + }, + { + "epoch": 0.53, + "learning_rate": 8.374107536656382e-05, + "loss": 1.2216, + "step": 27480 + }, + { + "epoch": 0.53, + "learning_rate": 8.372992793091589e-05, + "loss": 1.4895, + "step": 27490 + }, + { + "epoch": 0.53, + "learning_rate": 8.371877741764742e-05, + "loss": 1.0963, + "step": 27500 + }, + { + "epoch": 0.53, + "learning_rate": 8.370762382777584e-05, + "loss": 1.2577, + "step": 27510 + }, + { + "epoch": 0.53, + "learning_rate": 8.369646716231882e-05, + "loss": 1.1947, + "step": 27520 + }, + { + "epoch": 0.53, + "learning_rate": 8.368530742229432e-05, + "loss": 1.1473, + "step": 27530 + }, + { + "epoch": 0.53, + "learning_rate": 8.367414460872063e-05, + "loss": 1.2354, + "step": 27540 + }, + { + "epoch": 0.53, + "learning_rate": 8.366297872261623e-05, + "loss": 1.3187, + "step": 27550 + }, + { + "epoch": 0.53, + "learning_rate": 8.365180976499996e-05, + "loss": 1.1235, + "step": 27560 + }, + { + "epoch": 0.53, + "learning_rate": 8.364063773689088e-05, + "loss": 1.2695, + "step": 27570 + }, + { + "epoch": 0.53, + "learning_rate": 8.36294626393084e-05, + "loss": 1.3021, + "step": 27580 + }, + { + "epoch": 0.53, + "learning_rate": 8.361828447327214e-05, + "loss": 1.1396, + "step": 27590 + }, + { + "epoch": 0.53, + "learning_rate": 8.360710323980203e-05, + "loss": 1.452, + "step": 27600 + }, + { + "epoch": 0.53, + "learning_rate": 8.359591893991829e-05, + "loss": 1.3063, + "step": 27610 + }, + { + "epoch": 0.53, + "learning_rate": 8.358473157464143e-05, + "loss": 1.2269, + "step": 27620 + }, + { + "epoch": 0.53, + "learning_rate": 8.357354114499217e-05, + "loss": 1.1113, + "step": 27630 + }, + { + "epoch": 0.53, + "learning_rate": 8.35623476519916e-05, + "loss": 1.1943, + "step": 27640 + }, + { + "epoch": 0.53, + "learning_rate": 8.355115109666103e-05, + "loss": 1.2983, + "step": 27650 + }, + { + "epoch": 0.53, + "learning_rate": 8.353995148002208e-05, + "loss": 1.1644, + "step": 27660 + }, + { + "epoch": 0.53, + "learning_rate": 8.35287488030966e-05, + "loss": 1.4893, + "step": 27670 + }, + { + "epoch": 0.53, + "learning_rate": 8.35175430669068e-05, + "loss": 1.3958, + "step": 27680 + }, + { + "epoch": 0.53, + "learning_rate": 8.35063342724751e-05, + "loss": 1.2689, + "step": 27690 + }, + { + "epoch": 0.53, + "learning_rate": 8.349512242082425e-05, + "loss": 1.1521, + "step": 27700 + }, + { + "epoch": 0.53, + "learning_rate": 8.348390751297723e-05, + "loss": 1.2783, + "step": 27710 + }, + { + "epoch": 0.53, + "learning_rate": 8.347268954995731e-05, + "loss": 1.461, + "step": 27720 + }, + { + "epoch": 0.53, + "learning_rate": 8.34614685327881e-05, + "loss": 1.2763, + "step": 27730 + }, + { + "epoch": 0.53, + "learning_rate": 8.345024446249336e-05, + "loss": 1.1519, + "step": 27740 + }, + { + "epoch": 0.53, + "learning_rate": 8.34390173400973e-05, + "loss": 1.1179, + "step": 27750 + }, + { + "epoch": 0.53, + "learning_rate": 8.342778716662425e-05, + "loss": 1.285, + "step": 27760 + }, + { + "epoch": 0.53, + "learning_rate": 8.341655394309893e-05, + "loss": 1.206, + "step": 27770 + }, + { + "epoch": 0.53, + "learning_rate": 8.340531767054626e-05, + "loss": 1.3797, + "step": 27780 + }, + { + "epoch": 0.53, + "learning_rate": 8.339407834999147e-05, + "loss": 1.1791, + "step": 27790 + }, + { + "epoch": 0.53, + "learning_rate": 8.33828359824601e-05, + "loss": 1.1542, + "step": 27800 + }, + { + "epoch": 0.53, + "learning_rate": 8.337159056897792e-05, + "loss": 1.2696, + "step": 27810 + }, + { + "epoch": 0.53, + "learning_rate": 8.336034211057098e-05, + "loss": 1.2738, + "step": 27820 + }, + { + "epoch": 0.54, + "learning_rate": 8.334909060826566e-05, + "loss": 1.3142, + "step": 27830 + }, + { + "epoch": 0.54, + "learning_rate": 8.333783606308853e-05, + "loss": 1.3002, + "step": 27840 + }, + { + "epoch": 0.54, + "learning_rate": 8.332657847606655e-05, + "loss": 1.1613, + "step": 27850 + }, + { + "epoch": 0.54, + "learning_rate": 8.331531784822685e-05, + "loss": 1.2752, + "step": 27860 + }, + { + "epoch": 0.54, + "learning_rate": 8.33040541805969e-05, + "loss": 1.0929, + "step": 27870 + }, + { + "epoch": 0.54, + "learning_rate": 8.329278747420442e-05, + "loss": 1.2864, + "step": 27880 + }, + { + "epoch": 0.54, + "learning_rate": 8.328151773007744e-05, + "loss": 1.3144, + "step": 27890 + }, + { + "epoch": 0.54, + "learning_rate": 8.327024494924423e-05, + "loss": 1.2344, + "step": 27900 + }, + { + "epoch": 0.54, + "learning_rate": 8.325896913273335e-05, + "loss": 1.2351, + "step": 27910 + }, + { + "epoch": 0.54, + "learning_rate": 8.324769028157365e-05, + "loss": 1.3708, + "step": 27920 + }, + { + "epoch": 0.54, + "learning_rate": 8.323640839679425e-05, + "loss": 1.1846, + "step": 27930 + }, + { + "epoch": 0.54, + "learning_rate": 8.322512347942452e-05, + "loss": 1.4174, + "step": 27940 + }, + { + "epoch": 0.54, + "learning_rate": 8.321383553049416e-05, + "loss": 1.3728, + "step": 27950 + }, + { + "epoch": 0.54, + "learning_rate": 8.320254455103308e-05, + "loss": 1.1595, + "step": 27960 + }, + { + "epoch": 0.54, + "learning_rate": 8.319125054207156e-05, + "loss": 1.2334, + "step": 27970 + }, + { + "epoch": 0.54, + "learning_rate": 8.317995350464003e-05, + "loss": 1.0628, + "step": 27980 + }, + { + "epoch": 0.54, + "learning_rate": 8.316865343976932e-05, + "loss": 1.1752, + "step": 27990 + }, + { + "epoch": 0.54, + "learning_rate": 8.315735034849046e-05, + "loss": 1.088, + "step": 28000 + }, + { + "epoch": 0.54, + "learning_rate": 8.314604423183477e-05, + "loss": 1.4587, + "step": 28010 + }, + { + "epoch": 0.54, + "learning_rate": 8.313473509083387e-05, + "loss": 1.3223, + "step": 28020 + }, + { + "epoch": 0.54, + "learning_rate": 8.312342292651962e-05, + "loss": 1.1431, + "step": 28030 + }, + { + "epoch": 0.54, + "learning_rate": 8.311210773992421e-05, + "loss": 1.3173, + "step": 28040 + }, + { + "epoch": 0.54, + "learning_rate": 8.310078953208006e-05, + "loss": 1.0717, + "step": 28050 + }, + { + "epoch": 0.54, + "learning_rate": 8.308946830401986e-05, + "loss": 1.5137, + "step": 28060 + }, + { + "epoch": 0.54, + "learning_rate": 8.307814405677659e-05, + "loss": 1.4088, + "step": 28070 + }, + { + "epoch": 0.54, + "learning_rate": 8.306681679138355e-05, + "loss": 1.1914, + "step": 28080 + }, + { + "epoch": 0.54, + "learning_rate": 8.305548650887421e-05, + "loss": 1.2922, + "step": 28090 + }, + { + "epoch": 0.54, + "learning_rate": 8.304415321028245e-05, + "loss": 1.3544, + "step": 28100 + }, + { + "epoch": 0.54, + "learning_rate": 8.303281689664229e-05, + "loss": 1.1383, + "step": 28110 + }, + { + "epoch": 0.54, + "learning_rate": 8.302147756898814e-05, + "loss": 1.1972, + "step": 28120 + }, + { + "epoch": 0.54, + "learning_rate": 8.301013522835459e-05, + "loss": 1.0615, + "step": 28130 + }, + { + "epoch": 0.54, + "learning_rate": 8.299878987577658e-05, + "loss": 1.2076, + "step": 28140 + }, + { + "epoch": 0.54, + "learning_rate": 8.29874415122893e-05, + "loss": 1.6751, + "step": 28150 + }, + { + "epoch": 0.54, + "learning_rate": 8.29760901389282e-05, + "loss": 1.2135, + "step": 28160 + }, + { + "epoch": 0.54, + "learning_rate": 8.2964735756729e-05, + "loss": 1.3364, + "step": 28170 + }, + { + "epoch": 0.54, + "learning_rate": 8.295337836672772e-05, + "loss": 1.5556, + "step": 28180 + }, + { + "epoch": 0.54, + "learning_rate": 8.294201796996062e-05, + "loss": 1.2284, + "step": 28190 + }, + { + "epoch": 0.54, + "learning_rate": 8.293065456746431e-05, + "loss": 1.2007, + "step": 28200 + }, + { + "epoch": 0.54, + "learning_rate": 8.291928816027557e-05, + "loss": 1.2953, + "step": 28210 + }, + { + "epoch": 0.54, + "learning_rate": 8.290791874943152e-05, + "loss": 1.0888, + "step": 28220 + }, + { + "epoch": 0.54, + "learning_rate": 8.289654633596955e-05, + "loss": 1.244, + "step": 28230 + }, + { + "epoch": 0.54, + "learning_rate": 8.28851709209273e-05, + "loss": 1.1921, + "step": 28240 + }, + { + "epoch": 0.54, + "learning_rate": 8.287379250534271e-05, + "loss": 1.2461, + "step": 28250 + }, + { + "epoch": 0.54, + "learning_rate": 8.286241109025398e-05, + "loss": 1.3144, + "step": 28260 + }, + { + "epoch": 0.54, + "learning_rate": 8.285102667669957e-05, + "loss": 1.1797, + "step": 28270 + }, + { + "epoch": 0.54, + "learning_rate": 8.283963926571824e-05, + "loss": 1.3801, + "step": 28280 + }, + { + "epoch": 0.54, + "learning_rate": 8.2828248858349e-05, + "loss": 1.0576, + "step": 28290 + }, + { + "epoch": 0.54, + "learning_rate": 8.281685545563117e-05, + "loss": 1.4676, + "step": 28300 + }, + { + "epoch": 0.54, + "learning_rate": 8.28054590586043e-05, + "loss": 1.2034, + "step": 28310 + }, + { + "epoch": 0.54, + "learning_rate": 8.279405966830822e-05, + "loss": 1.1842, + "step": 28320 + }, + { + "epoch": 0.54, + "learning_rate": 8.278265728578307e-05, + "loss": 1.3048, + "step": 28330 + }, + { + "epoch": 0.54, + "learning_rate": 8.277125191206923e-05, + "loss": 1.4345, + "step": 28340 + }, + { + "epoch": 0.55, + "learning_rate": 8.275984354820736e-05, + "loss": 1.4033, + "step": 28350 + }, + { + "epoch": 0.55, + "learning_rate": 8.27484321952384e-05, + "loss": 1.2447, + "step": 28360 + }, + { + "epoch": 0.55, + "learning_rate": 8.273701785420353e-05, + "loss": 1.3716, + "step": 28370 + }, + { + "epoch": 0.55, + "learning_rate": 8.272560052614424e-05, + "loss": 1.3972, + "step": 28380 + }, + { + "epoch": 0.55, + "learning_rate": 8.271418021210232e-05, + "loss": 1.146, + "step": 28390 + }, + { + "epoch": 0.55, + "learning_rate": 8.270275691311974e-05, + "loss": 1.2948, + "step": 28400 + }, + { + "epoch": 0.55, + "learning_rate": 8.269133063023882e-05, + "loss": 1.3138, + "step": 28410 + }, + { + "epoch": 0.55, + "learning_rate": 8.267990136450212e-05, + "loss": 1.29, + "step": 28420 + }, + { + "epoch": 0.55, + "learning_rate": 8.26684691169525e-05, + "loss": 1.0941, + "step": 28430 + }, + { + "epoch": 0.55, + "learning_rate": 8.265703388863306e-05, + "loss": 1.1417, + "step": 28440 + }, + { + "epoch": 0.55, + "learning_rate": 8.264559568058718e-05, + "loss": 1.2778, + "step": 28450 + }, + { + "epoch": 0.55, + "learning_rate": 8.263415449385854e-05, + "loss": 1.191, + "step": 28460 + }, + { + "epoch": 0.55, + "learning_rate": 8.262271032949102e-05, + "loss": 1.1773, + "step": 28470 + }, + { + "epoch": 0.55, + "learning_rate": 8.261126318852887e-05, + "loss": 1.2815, + "step": 28480 + }, + { + "epoch": 0.55, + "learning_rate": 8.259981307201655e-05, + "loss": 1.3834, + "step": 28490 + }, + { + "epoch": 0.55, + "learning_rate": 8.258835998099879e-05, + "loss": 1.2724, + "step": 28500 + }, + { + "epoch": 0.55, + "learning_rate": 8.25769039165206e-05, + "loss": 1.3202, + "step": 28510 + }, + { + "epoch": 0.55, + "learning_rate": 8.256544487962728e-05, + "loss": 1.4193, + "step": 28520 + }, + { + "epoch": 0.55, + "learning_rate": 8.255398287136438e-05, + "loss": 0.9349, + "step": 28530 + }, + { + "epoch": 0.55, + "learning_rate": 8.254251789277773e-05, + "loss": 1.3385, + "step": 28540 + }, + { + "epoch": 0.55, + "learning_rate": 8.253104994491345e-05, + "loss": 1.2945, + "step": 28550 + }, + { + "epoch": 0.55, + "learning_rate": 8.25195790288179e-05, + "loss": 1.4197, + "step": 28560 + }, + { + "epoch": 0.55, + "learning_rate": 8.250810514553768e-05, + "loss": 1.3701, + "step": 28570 + }, + { + "epoch": 0.55, + "learning_rate": 8.249662829611975e-05, + "loss": 1.2065, + "step": 28580 + }, + { + "epoch": 0.55, + "learning_rate": 8.248514848161126e-05, + "loss": 1.3788, + "step": 28590 + }, + { + "epoch": 0.55, + "learning_rate": 8.24736657030597e-05, + "loss": 1.4662, + "step": 28600 + }, + { + "epoch": 0.55, + "learning_rate": 8.246217996151277e-05, + "loss": 1.117, + "step": 28610 + }, + { + "epoch": 0.55, + "learning_rate": 8.245069125801846e-05, + "loss": 1.2402, + "step": 28620 + }, + { + "epoch": 0.55, + "learning_rate": 8.243919959362505e-05, + "loss": 1.2305, + "step": 28630 + }, + { + "epoch": 0.55, + "learning_rate": 8.242770496938106e-05, + "loss": 1.6373, + "step": 28640 + }, + { + "epoch": 0.55, + "learning_rate": 8.241620738633528e-05, + "loss": 1.1744, + "step": 28650 + }, + { + "epoch": 0.55, + "learning_rate": 8.240470684553683e-05, + "loss": 1.4429, + "step": 28660 + }, + { + "epoch": 0.55, + "learning_rate": 8.239320334803502e-05, + "loss": 1.5479, + "step": 28670 + }, + { + "epoch": 0.55, + "learning_rate": 8.238169689487947e-05, + "loss": 1.3326, + "step": 28680 + }, + { + "epoch": 0.55, + "learning_rate": 8.237018748712007e-05, + "loss": 1.2314, + "step": 28690 + }, + { + "epoch": 0.55, + "learning_rate": 8.235867512580694e-05, + "loss": 1.2692, + "step": 28700 + }, + { + "epoch": 0.55, + "learning_rate": 8.234715981199058e-05, + "loss": 1.287, + "step": 28710 + }, + { + "epoch": 0.55, + "learning_rate": 8.23356415467216e-05, + "loss": 1.2947, + "step": 28720 + }, + { + "epoch": 0.55, + "learning_rate": 8.2324120331051e-05, + "loss": 1.5016, + "step": 28730 + }, + { + "epoch": 0.55, + "learning_rate": 8.231259616603e-05, + "loss": 1.2771, + "step": 28740 + }, + { + "epoch": 0.55, + "learning_rate": 8.23010690527101e-05, + "loss": 1.3657, + "step": 28750 + }, + { + "epoch": 0.55, + "learning_rate": 8.228953899214308e-05, + "loss": 1.4173, + "step": 28760 + }, + { + "epoch": 0.55, + "learning_rate": 8.227800598538097e-05, + "loss": 1.2384, + "step": 28770 + }, + { + "epoch": 0.55, + "learning_rate": 8.226647003347608e-05, + "loss": 1.1372, + "step": 28780 + }, + { + "epoch": 0.55, + "learning_rate": 8.225493113748098e-05, + "loss": 1.2316, + "step": 28790 + }, + { + "epoch": 0.55, + "learning_rate": 8.22433892984485e-05, + "loss": 1.2086, + "step": 28800 + }, + { + "epoch": 0.55, + "learning_rate": 8.22318445174318e-05, + "loss": 1.2879, + "step": 28810 + }, + { + "epoch": 0.55, + "learning_rate": 8.22202967954842e-05, + "loss": 1.1584, + "step": 28820 + }, + { + "epoch": 0.55, + "learning_rate": 8.220874613365938e-05, + "loss": 1.2797, + "step": 28830 + }, + { + "epoch": 0.55, + "learning_rate": 8.219719253301128e-05, + "loss": 1.3394, + "step": 28840 + }, + { + "epoch": 0.55, + "learning_rate": 8.218563599459404e-05, + "loss": 1.2505, + "step": 28850 + }, + { + "epoch": 0.55, + "learning_rate": 8.217407651946213e-05, + "loss": 1.1877, + "step": 28860 + }, + { + "epoch": 0.56, + "learning_rate": 8.216251410867028e-05, + "loss": 1.3494, + "step": 28870 + }, + { + "epoch": 0.56, + "learning_rate": 8.215094876327348e-05, + "loss": 1.2865, + "step": 28880 + }, + { + "epoch": 0.56, + "learning_rate": 8.213938048432697e-05, + "loss": 1.253, + "step": 28890 + }, + { + "epoch": 0.56, + "learning_rate": 8.212780927288629e-05, + "loss": 1.0997, + "step": 28900 + }, + { + "epoch": 0.56, + "learning_rate": 8.211623513000723e-05, + "loss": 1.2415, + "step": 28910 + }, + { + "epoch": 0.56, + "learning_rate": 8.210465805674585e-05, + "loss": 1.3405, + "step": 28920 + }, + { + "epoch": 0.56, + "learning_rate": 8.209307805415848e-05, + "loss": 1.2628, + "step": 28930 + }, + { + "epoch": 0.56, + "learning_rate": 8.20814951233017e-05, + "loss": 1.4601, + "step": 28940 + }, + { + "epoch": 0.56, + "learning_rate": 8.206990926523239e-05, + "loss": 1.3528, + "step": 28950 + }, + { + "epoch": 0.56, + "learning_rate": 8.205832048100768e-05, + "loss": 1.0674, + "step": 28960 + }, + { + "epoch": 0.56, + "learning_rate": 8.204672877168493e-05, + "loss": 1.3054, + "step": 28970 + }, + { + "epoch": 0.56, + "learning_rate": 8.203513413832184e-05, + "loss": 1.3358, + "step": 28980 + }, + { + "epoch": 0.56, + "learning_rate": 8.202353658197632e-05, + "loss": 1.8508, + "step": 28990 + }, + { + "epoch": 0.56, + "learning_rate": 8.201193610370659e-05, + "loss": 1.3068, + "step": 29000 + }, + { + "epoch": 0.56, + "learning_rate": 8.200033270457109e-05, + "loss": 1.2477, + "step": 29010 + }, + { + "epoch": 0.56, + "learning_rate": 8.198872638562856e-05, + "loss": 1.1866, + "step": 29020 + }, + { + "epoch": 0.56, + "learning_rate": 8.197711714793797e-05, + "loss": 1.3735, + "step": 29030 + }, + { + "epoch": 0.56, + "learning_rate": 8.196550499255861e-05, + "loss": 1.2985, + "step": 29040 + }, + { + "epoch": 0.56, + "learning_rate": 8.195388992055002e-05, + "loss": 1.1644, + "step": 29050 + }, + { + "epoch": 0.56, + "learning_rate": 8.194227193297197e-05, + "loss": 1.1818, + "step": 29060 + }, + { + "epoch": 0.56, + "learning_rate": 8.193065103088453e-05, + "loss": 1.2622, + "step": 29070 + }, + { + "epoch": 0.56, + "learning_rate": 8.1919027215348e-05, + "loss": 1.2003, + "step": 29080 + }, + { + "epoch": 0.56, + "learning_rate": 8.1907400487423e-05, + "loss": 1.3377, + "step": 29090 + }, + { + "epoch": 0.56, + "learning_rate": 8.18957708481704e-05, + "loss": 1.2792, + "step": 29100 + }, + { + "epoch": 0.56, + "learning_rate": 8.188413829865129e-05, + "loss": 1.4133, + "step": 29110 + }, + { + "epoch": 0.56, + "learning_rate": 8.187250283992709e-05, + "loss": 1.224, + "step": 29120 + }, + { + "epoch": 0.56, + "learning_rate": 8.186086447305943e-05, + "loss": 1.4087, + "step": 29130 + }, + { + "epoch": 0.56, + "learning_rate": 8.184922319911023e-05, + "loss": 1.277, + "step": 29140 + }, + { + "epoch": 0.56, + "learning_rate": 8.183757901914168e-05, + "loss": 1.2031, + "step": 29150 + }, + { + "epoch": 0.56, + "learning_rate": 8.182593193421625e-05, + "loss": 1.2813, + "step": 29160 + }, + { + "epoch": 0.56, + "learning_rate": 8.181428194539664e-05, + "loss": 1.1518, + "step": 29170 + }, + { + "epoch": 0.56, + "learning_rate": 8.180262905374581e-05, + "loss": 1.4077, + "step": 29180 + }, + { + "epoch": 0.56, + "learning_rate": 8.179097326032703e-05, + "loss": 1.2569, + "step": 29190 + }, + { + "epoch": 0.56, + "learning_rate": 8.177931456620382e-05, + "loss": 1.3568, + "step": 29200 + }, + { + "epoch": 0.56, + "learning_rate": 8.176765297243992e-05, + "loss": 1.308, + "step": 29210 + }, + { + "epoch": 0.56, + "learning_rate": 8.17559884800994e-05, + "loss": 1.2244, + "step": 29220 + }, + { + "epoch": 0.56, + "learning_rate": 8.174432109024655e-05, + "loss": 1.4062, + "step": 29230 + }, + { + "epoch": 0.56, + "learning_rate": 8.173265080394593e-05, + "loss": 1.1777, + "step": 29240 + }, + { + "epoch": 0.56, + "learning_rate": 8.172097762226238e-05, + "loss": 1.2748, + "step": 29250 + }, + { + "epoch": 0.56, + "learning_rate": 8.170930154626101e-05, + "loss": 1.2154, + "step": 29260 + }, + { + "epoch": 0.56, + "learning_rate": 8.169762257700715e-05, + "loss": 1.233, + "step": 29270 + }, + { + "epoch": 0.56, + "learning_rate": 8.168594071556645e-05, + "loss": 1.181, + "step": 29280 + }, + { + "epoch": 0.56, + "learning_rate": 8.16742559630048e-05, + "loss": 1.2714, + "step": 29290 + }, + { + "epoch": 0.56, + "learning_rate": 8.166256832038833e-05, + "loss": 1.2402, + "step": 29300 + }, + { + "epoch": 0.56, + "learning_rate": 8.165087778878349e-05, + "loss": 1.2843, + "step": 29310 + }, + { + "epoch": 0.56, + "learning_rate": 8.163918436925692e-05, + "loss": 1.1469, + "step": 29320 + }, + { + "epoch": 0.56, + "learning_rate": 8.162748806287558e-05, + "loss": 1.1818, + "step": 29330 + }, + { + "epoch": 0.56, + "learning_rate": 8.161578887070668e-05, + "loss": 1.2172, + "step": 29340 + }, + { + "epoch": 0.56, + "learning_rate": 8.160408679381768e-05, + "loss": 1.2522, + "step": 29350 + }, + { + "epoch": 0.56, + "learning_rate": 8.159238183327633e-05, + "loss": 1.2492, + "step": 29360 + }, + { + "epoch": 0.56, + "learning_rate": 8.158067399015061e-05, + "loss": 1.306, + "step": 29370 + }, + { + "epoch": 0.56, + "learning_rate": 8.15689632655088e-05, + "loss": 1.2349, + "step": 29380 + }, + { + "epoch": 0.57, + "learning_rate": 8.155724966041939e-05, + "loss": 1.4653, + "step": 29390 + }, + { + "epoch": 0.57, + "learning_rate": 8.154553317595118e-05, + "loss": 1.1166, + "step": 29400 + }, + { + "epoch": 0.57, + "learning_rate": 8.153381381317322e-05, + "loss": 1.3382, + "step": 29410 + }, + { + "epoch": 0.57, + "learning_rate": 8.152209157315483e-05, + "loss": 1.2821, + "step": 29420 + }, + { + "epoch": 0.57, + "learning_rate": 8.151036645696556e-05, + "loss": 1.3065, + "step": 29430 + }, + { + "epoch": 0.57, + "learning_rate": 8.149863846567527e-05, + "loss": 1.415, + "step": 29440 + }, + { + "epoch": 0.57, + "learning_rate": 8.148690760035403e-05, + "loss": 1.1433, + "step": 29450 + }, + { + "epoch": 0.57, + "learning_rate": 8.14751738620722e-05, + "loss": 1.2578, + "step": 29460 + }, + { + "epoch": 0.57, + "learning_rate": 8.146343725190045e-05, + "loss": 1.2699, + "step": 29470 + }, + { + "epoch": 0.57, + "learning_rate": 8.145169777090959e-05, + "loss": 1.1895, + "step": 29480 + }, + { + "epoch": 0.57, + "learning_rate": 8.143995542017084e-05, + "loss": 1.3623, + "step": 29490 + }, + { + "epoch": 0.57, + "learning_rate": 8.142821020075554e-05, + "loss": 1.4797, + "step": 29500 + }, + { + "epoch": 0.57, + "learning_rate": 8.141646211373541e-05, + "loss": 1.1159, + "step": 29510 + }, + { + "epoch": 0.57, + "learning_rate": 8.140471116018237e-05, + "loss": 1.3417, + "step": 29520 + }, + { + "epoch": 0.57, + "learning_rate": 8.13929573411686e-05, + "loss": 1.3552, + "step": 29530 + }, + { + "epoch": 0.57, + "learning_rate": 8.138120065776655e-05, + "loss": 1.1364, + "step": 29540 + }, + { + "epoch": 0.57, + "learning_rate": 8.136944111104896e-05, + "loss": 1.0759, + "step": 29550 + }, + { + "epoch": 0.57, + "learning_rate": 8.135767870208877e-05, + "loss": 1.1594, + "step": 29560 + }, + { + "epoch": 0.57, + "learning_rate": 8.134591343195925e-05, + "loss": 1.1217, + "step": 29570 + }, + { + "epoch": 0.57, + "learning_rate": 8.133414530173389e-05, + "loss": 1.2963, + "step": 29580 + }, + { + "epoch": 0.57, + "learning_rate": 8.132237431248643e-05, + "loss": 1.5932, + "step": 29590 + }, + { + "epoch": 0.57, + "learning_rate": 8.131060046529093e-05, + "loss": 1.1978, + "step": 29600 + }, + { + "epoch": 0.57, + "learning_rate": 8.129882376122164e-05, + "loss": 1.1566, + "step": 29610 + }, + { + "epoch": 0.57, + "learning_rate": 8.128704420135312e-05, + "loss": 1.2011, + "step": 29620 + }, + { + "epoch": 0.57, + "learning_rate": 8.127526178676015e-05, + "loss": 1.057, + "step": 29630 + }, + { + "epoch": 0.57, + "learning_rate": 8.12634765185178e-05, + "loss": 1.4486, + "step": 29640 + }, + { + "epoch": 0.57, + "learning_rate": 8.125168839770142e-05, + "loss": 1.2399, + "step": 29650 + }, + { + "epoch": 0.57, + "learning_rate": 8.123989742538655e-05, + "loss": 1.1102, + "step": 29660 + }, + { + "epoch": 0.57, + "learning_rate": 8.122810360264909e-05, + "loss": 1.2983, + "step": 29670 + }, + { + "epoch": 0.57, + "learning_rate": 8.121630693056509e-05, + "loss": 1.276, + "step": 29680 + }, + { + "epoch": 0.57, + "learning_rate": 8.120450741021094e-05, + "loss": 1.1742, + "step": 29690 + }, + { + "epoch": 0.57, + "learning_rate": 8.119270504266325e-05, + "loss": 1.3373, + "step": 29700 + }, + { + "epoch": 0.57, + "learning_rate": 8.118089982899893e-05, + "loss": 1.4534, + "step": 29710 + }, + { + "epoch": 0.57, + "learning_rate": 8.116909177029511e-05, + "loss": 1.3018, + "step": 29720 + }, + { + "epoch": 0.57, + "learning_rate": 8.115728086762917e-05, + "loss": 1.1947, + "step": 29730 + }, + { + "epoch": 0.57, + "learning_rate": 8.11454671220788e-05, + "loss": 1.1674, + "step": 29740 + }, + { + "epoch": 0.57, + "learning_rate": 8.113365053472193e-05, + "loss": 1.1703, + "step": 29750 + }, + { + "epoch": 0.57, + "learning_rate": 8.11218311066367e-05, + "loss": 1.3395, + "step": 29760 + }, + { + "epoch": 0.57, + "learning_rate": 8.111000883890159e-05, + "loss": 1.1125, + "step": 29770 + }, + { + "epoch": 0.57, + "learning_rate": 8.109818373259529e-05, + "loss": 1.3501, + "step": 29780 + }, + { + "epoch": 0.57, + "learning_rate": 8.108635578879674e-05, + "loss": 1.2262, + "step": 29790 + }, + { + "epoch": 0.57, + "learning_rate": 8.107452500858517e-05, + "loss": 1.233, + "step": 29800 + }, + { + "epoch": 0.57, + "learning_rate": 8.106269139304007e-05, + "loss": 1.2201, + "step": 29810 + }, + { + "epoch": 0.57, + "learning_rate": 8.105085494324117e-05, + "loss": 1.3223, + "step": 29820 + }, + { + "epoch": 0.57, + "learning_rate": 8.103901566026843e-05, + "loss": 1.3127, + "step": 29830 + }, + { + "epoch": 0.57, + "learning_rate": 8.102717354520213e-05, + "loss": 0.8995, + "step": 29840 + }, + { + "epoch": 0.57, + "learning_rate": 8.101532859912279e-05, + "loss": 1.3091, + "step": 29850 + }, + { + "epoch": 0.57, + "learning_rate": 8.100348082311115e-05, + "loss": 1.537, + "step": 29860 + }, + { + "epoch": 0.57, + "learning_rate": 8.099163021824827e-05, + "loss": 1.3161, + "step": 29870 + }, + { + "epoch": 0.57, + "learning_rate": 8.097977678561542e-05, + "loss": 1.3172, + "step": 29880 + }, + { + "epoch": 0.57, + "learning_rate": 8.096792052629413e-05, + "loss": 1.1917, + "step": 29890 + }, + { + "epoch": 0.57, + "learning_rate": 8.09560614413662e-05, + "loss": 1.2352, + "step": 29900 + }, + { + "epoch": 0.58, + "learning_rate": 8.094419953191373e-05, + "loss": 1.2005, + "step": 29910 + }, + { + "epoch": 0.58, + "learning_rate": 8.0932334799019e-05, + "loss": 1.215, + "step": 29920 + }, + { + "epoch": 0.58, + "learning_rate": 8.092046724376457e-05, + "loss": 1.3485, + "step": 29930 + }, + { + "epoch": 0.58, + "learning_rate": 8.090859686723331e-05, + "loss": 1.3266, + "step": 29940 + }, + { + "epoch": 0.58, + "learning_rate": 8.089672367050829e-05, + "loss": 1.3012, + "step": 29950 + }, + { + "epoch": 0.58, + "learning_rate": 8.088484765467286e-05, + "loss": 1.1656, + "step": 29960 + }, + { + "epoch": 0.58, + "learning_rate": 8.087296882081061e-05, + "loss": 1.3282, + "step": 29970 + }, + { + "epoch": 0.58, + "learning_rate": 8.086108717000542e-05, + "loss": 1.2474, + "step": 29980 + }, + { + "epoch": 0.58, + "learning_rate": 8.084920270334141e-05, + "loss": 1.3896, + "step": 29990 + }, + { + "epoch": 0.58, + "learning_rate": 8.083731542190294e-05, + "loss": 1.2215, + "step": 30000 + }, + { + "epoch": 0.58, + "learning_rate": 8.082542532677463e-05, + "loss": 1.2579, + "step": 30010 + }, + { + "epoch": 0.58, + "learning_rate": 8.08135324190414e-05, + "loss": 1.3407, + "step": 30020 + }, + { + "epoch": 0.58, + "learning_rate": 8.080163669978838e-05, + "loss": 1.26, + "step": 30030 + }, + { + "epoch": 0.58, + "learning_rate": 8.078973817010096e-05, + "loss": 1.169, + "step": 30040 + }, + { + "epoch": 0.58, + "learning_rate": 8.077783683106481e-05, + "loss": 1.4966, + "step": 30050 + }, + { + "epoch": 0.58, + "learning_rate": 8.076593268376585e-05, + "loss": 1.3155, + "step": 30060 + }, + { + "epoch": 0.58, + "learning_rate": 8.075402572929025e-05, + "loss": 1.2524, + "step": 30070 + }, + { + "epoch": 0.58, + "learning_rate": 8.07421159687244e-05, + "loss": 1.4385, + "step": 30080 + }, + { + "epoch": 0.58, + "learning_rate": 8.073020340315503e-05, + "loss": 1.2795, + "step": 30090 + }, + { + "epoch": 0.58, + "learning_rate": 8.071828803366908e-05, + "loss": 1.3565, + "step": 30100 + }, + { + "epoch": 0.58, + "learning_rate": 8.07063698613537e-05, + "loss": 1.5225, + "step": 30110 + }, + { + "epoch": 0.58, + "learning_rate": 8.069444888729638e-05, + "loss": 1.3163, + "step": 30120 + }, + { + "epoch": 0.58, + "learning_rate": 8.068252511258479e-05, + "loss": 1.2209, + "step": 30130 + }, + { + "epoch": 0.58, + "learning_rate": 8.067059853830691e-05, + "loss": 1.2795, + "step": 30140 + }, + { + "epoch": 0.58, + "learning_rate": 8.065866916555099e-05, + "loss": 1.4623, + "step": 30150 + }, + { + "epoch": 0.58, + "learning_rate": 8.064673699540543e-05, + "loss": 1.0715, + "step": 30160 + }, + { + "epoch": 0.58, + "learning_rate": 8.063480202895903e-05, + "loss": 1.2935, + "step": 30170 + }, + { + "epoch": 0.58, + "learning_rate": 8.062286426730074e-05, + "loss": 1.2512, + "step": 30180 + }, + { + "epoch": 0.58, + "learning_rate": 8.061092371151977e-05, + "loss": 1.0615, + "step": 30190 + }, + { + "epoch": 0.58, + "learning_rate": 8.059898036270565e-05, + "loss": 1.3225, + "step": 30200 + }, + { + "epoch": 0.58, + "learning_rate": 8.058703422194813e-05, + "loss": 1.2801, + "step": 30210 + }, + { + "epoch": 0.58, + "learning_rate": 8.05750852903372e-05, + "loss": 1.22, + "step": 30220 + }, + { + "epoch": 0.58, + "learning_rate": 8.056313356896311e-05, + "loss": 1.2293, + "step": 30230 + }, + { + "epoch": 0.58, + "learning_rate": 8.055117905891637e-05, + "loss": 1.1926, + "step": 30240 + }, + { + "epoch": 0.58, + "learning_rate": 8.053922176128777e-05, + "loss": 1.4466, + "step": 30250 + }, + { + "epoch": 0.58, + "learning_rate": 8.052726167716829e-05, + "loss": 1.365, + "step": 30260 + }, + { + "epoch": 0.58, + "learning_rate": 8.051529880764923e-05, + "loss": 1.313, + "step": 30270 + }, + { + "epoch": 0.58, + "learning_rate": 8.050333315382213e-05, + "loss": 1.2731, + "step": 30280 + }, + { + "epoch": 0.58, + "learning_rate": 8.049136471677874e-05, + "loss": 1.1884, + "step": 30290 + }, + { + "epoch": 0.58, + "learning_rate": 8.047939349761114e-05, + "loss": 1.3017, + "step": 30300 + }, + { + "epoch": 0.58, + "learning_rate": 8.046741949741157e-05, + "loss": 1.1294, + "step": 30310 + }, + { + "epoch": 0.58, + "learning_rate": 8.045544271727259e-05, + "loss": 1.3334, + "step": 30320 + }, + { + "epoch": 0.58, + "learning_rate": 8.044346315828703e-05, + "loss": 1.3379, + "step": 30330 + }, + { + "epoch": 0.58, + "learning_rate": 8.04314808215479e-05, + "loss": 1.2214, + "step": 30340 + }, + { + "epoch": 0.58, + "learning_rate": 8.041949570814852e-05, + "loss": 1.2562, + "step": 30350 + }, + { + "epoch": 0.58, + "learning_rate": 8.040750781918247e-05, + "loss": 1.0802, + "step": 30360 + }, + { + "epoch": 0.58, + "learning_rate": 8.039551715574351e-05, + "loss": 0.9623, + "step": 30370 + }, + { + "epoch": 0.58, + "learning_rate": 8.038352371892576e-05, + "loss": 1.1255, + "step": 30380 + }, + { + "epoch": 0.58, + "learning_rate": 8.037152750982351e-05, + "loss": 1.2509, + "step": 30390 + }, + { + "epoch": 0.58, + "learning_rate": 8.035952852953132e-05, + "loss": 1.2069, + "step": 30400 + }, + { + "epoch": 0.58, + "learning_rate": 8.034752677914404e-05, + "loss": 1.1465, + "step": 30410 + }, + { + "epoch": 0.58, + "learning_rate": 8.033552225975672e-05, + "loss": 1.3333, + "step": 30420 + }, + { + "epoch": 0.59, + "learning_rate": 8.03235149724647e-05, + "loss": 1.2588, + "step": 30430 + }, + { + "epoch": 0.59, + "learning_rate": 8.031150491836357e-05, + "loss": 1.2525, + "step": 30440 + }, + { + "epoch": 0.59, + "learning_rate": 8.029949209854915e-05, + "loss": 1.1298, + "step": 30450 + }, + { + "epoch": 0.59, + "learning_rate": 8.028747651411754e-05, + "loss": 1.4997, + "step": 30460 + }, + { + "epoch": 0.59, + "learning_rate": 8.027545816616507e-05, + "loss": 1.3049, + "step": 30470 + }, + { + "epoch": 0.59, + "learning_rate": 8.026343705578832e-05, + "loss": 1.1496, + "step": 30480 + }, + { + "epoch": 0.59, + "learning_rate": 8.025141318408413e-05, + "loss": 1.1987, + "step": 30490 + }, + { + "epoch": 0.59, + "learning_rate": 8.023938655214963e-05, + "loss": 1.3914, + "step": 30500 + }, + { + "epoch": 0.59, + "learning_rate": 8.022735716108211e-05, + "loss": 1.3865, + "step": 30510 + }, + { + "epoch": 0.59, + "learning_rate": 8.021532501197923e-05, + "loss": 1.1831, + "step": 30520 + }, + { + "epoch": 0.59, + "learning_rate": 8.020329010593881e-05, + "loss": 1.4677, + "step": 30530 + }, + { + "epoch": 0.59, + "learning_rate": 8.019125244405893e-05, + "loss": 1.3643, + "step": 30540 + }, + { + "epoch": 0.59, + "learning_rate": 8.017921202743798e-05, + "loss": 1.1504, + "step": 30550 + }, + { + "epoch": 0.59, + "learning_rate": 8.016716885717456e-05, + "loss": 1.2218, + "step": 30560 + }, + { + "epoch": 0.59, + "learning_rate": 8.015512293436749e-05, + "loss": 1.2422, + "step": 30570 + }, + { + "epoch": 0.59, + "learning_rate": 8.014307426011591e-05, + "loss": 1.2782, + "step": 30580 + }, + { + "epoch": 0.59, + "learning_rate": 8.013102283551917e-05, + "loss": 1.2293, + "step": 30590 + }, + { + "epoch": 0.59, + "learning_rate": 8.011896866167688e-05, + "loss": 1.3277, + "step": 30600 + }, + { + "epoch": 0.59, + "learning_rate": 8.01069117396889e-05, + "loss": 1.0918, + "step": 30610 + }, + { + "epoch": 0.59, + "learning_rate": 8.009485207065531e-05, + "loss": 1.3868, + "step": 30620 + }, + { + "epoch": 0.59, + "learning_rate": 8.008278965567651e-05, + "loss": 1.422, + "step": 30630 + }, + { + "epoch": 0.59, + "learning_rate": 8.007072449585309e-05, + "loss": 1.3878, + "step": 30640 + }, + { + "epoch": 0.59, + "learning_rate": 8.005865659228592e-05, + "loss": 1.1369, + "step": 30650 + }, + { + "epoch": 0.59, + "learning_rate": 8.004658594607612e-05, + "loss": 1.3, + "step": 30660 + }, + { + "epoch": 0.59, + "learning_rate": 8.003451255832503e-05, + "loss": 1.1346, + "step": 30670 + }, + { + "epoch": 0.59, + "learning_rate": 8.00224364301343e-05, + "loss": 1.1894, + "step": 30680 + }, + { + "epoch": 0.59, + "learning_rate": 8.001035756260573e-05, + "loss": 1.4919, + "step": 30690 + }, + { + "epoch": 0.59, + "learning_rate": 7.999827595684149e-05, + "loss": 1.5689, + "step": 30700 + }, + { + "epoch": 0.59, + "learning_rate": 7.998619161394391e-05, + "loss": 1.2959, + "step": 30710 + }, + { + "epoch": 0.59, + "learning_rate": 7.997410453501564e-05, + "loss": 1.0812, + "step": 30720 + }, + { + "epoch": 0.59, + "learning_rate": 7.996201472115949e-05, + "loss": 1.3914, + "step": 30730 + }, + { + "epoch": 0.59, + "learning_rate": 7.994992217347861e-05, + "loss": 1.0835, + "step": 30740 + }, + { + "epoch": 0.59, + "learning_rate": 7.993782689307634e-05, + "loss": 1.2736, + "step": 30750 + }, + { + "epoch": 0.59, + "learning_rate": 7.99257288810563e-05, + "loss": 1.3569, + "step": 30760 + }, + { + "epoch": 0.59, + "learning_rate": 7.991362813852235e-05, + "loss": 1.3787, + "step": 30770 + }, + { + "epoch": 0.59, + "learning_rate": 7.990152466657858e-05, + "loss": 1.1633, + "step": 30780 + }, + { + "epoch": 0.59, + "learning_rate": 7.988941846632939e-05, + "loss": 1.2479, + "step": 30790 + }, + { + "epoch": 0.59, + "learning_rate": 7.987730953887933e-05, + "loss": 1.1677, + "step": 30800 + }, + { + "epoch": 0.59, + "learning_rate": 7.98651978853333e-05, + "loss": 1.3026, + "step": 30810 + }, + { + "epoch": 0.59, + "learning_rate": 7.985308350679638e-05, + "loss": 1.1655, + "step": 30820 + }, + { + "epoch": 0.59, + "learning_rate": 7.984096640437393e-05, + "loss": 1.4358, + "step": 30830 + }, + { + "epoch": 0.59, + "learning_rate": 7.982884657917156e-05, + "loss": 1.3939, + "step": 30840 + }, + { + "epoch": 0.59, + "learning_rate": 7.981672403229509e-05, + "loss": 1.1359, + "step": 30850 + }, + { + "epoch": 0.59, + "learning_rate": 7.980459876485065e-05, + "loss": 1.4047, + "step": 30860 + }, + { + "epoch": 0.59, + "learning_rate": 7.979247077794457e-05, + "loss": 1.4101, + "step": 30870 + }, + { + "epoch": 0.59, + "learning_rate": 7.978034007268347e-05, + "loss": 1.2853, + "step": 30880 + }, + { + "epoch": 0.59, + "learning_rate": 7.976820665017413e-05, + "loss": 1.3256, + "step": 30890 + }, + { + "epoch": 0.59, + "learning_rate": 7.975607051152372e-05, + "loss": 1.3236, + "step": 30900 + }, + { + "epoch": 0.59, + "learning_rate": 7.974393165783951e-05, + "loss": 1.3947, + "step": 30910 + }, + { + "epoch": 0.59, + "learning_rate": 7.973179009022913e-05, + "loss": 1.3211, + "step": 30920 + }, + { + "epoch": 0.59, + "learning_rate": 7.971964580980039e-05, + "loss": 1.2352, + "step": 30930 + }, + { + "epoch": 0.59, + "learning_rate": 7.970749881766137e-05, + "loss": 1.3411, + "step": 30940 + }, + { + "epoch": 0.6, + "learning_rate": 7.969534911492042e-05, + "loss": 1.1491, + "step": 30950 + }, + { + "epoch": 0.6, + "learning_rate": 7.96831967026861e-05, + "loss": 1.4631, + "step": 30960 + }, + { + "epoch": 0.6, + "learning_rate": 7.967104158206725e-05, + "loss": 1.3809, + "step": 30970 + }, + { + "epoch": 0.6, + "learning_rate": 7.96588837541729e-05, + "loss": 1.1897, + "step": 30980 + }, + { + "epoch": 0.6, + "learning_rate": 7.964672322011241e-05, + "loss": 1.3747, + "step": 30990 + }, + { + "epoch": 0.6, + "learning_rate": 7.963455998099532e-05, + "loss": 1.414, + "step": 31000 + }, + { + "epoch": 0.6, + "learning_rate": 7.962239403793144e-05, + "loss": 1.3563, + "step": 31010 + }, + { + "epoch": 0.6, + "learning_rate": 7.961022539203082e-05, + "loss": 1.1784, + "step": 31020 + }, + { + "epoch": 0.6, + "learning_rate": 7.95980540444038e-05, + "loss": 1.2734, + "step": 31030 + }, + { + "epoch": 0.6, + "learning_rate": 7.958587999616092e-05, + "loss": 1.3385, + "step": 31040 + }, + { + "epoch": 0.6, + "learning_rate": 7.957370324841293e-05, + "loss": 1.3774, + "step": 31050 + }, + { + "epoch": 0.6, + "learning_rate": 7.956152380227093e-05, + "loss": 1.1256, + "step": 31060 + }, + { + "epoch": 0.6, + "learning_rate": 7.954934165884617e-05, + "loss": 1.3006, + "step": 31070 + }, + { + "epoch": 0.6, + "learning_rate": 7.953715681925023e-05, + "loss": 1.1921, + "step": 31080 + }, + { + "epoch": 0.6, + "learning_rate": 7.952496928459485e-05, + "loss": 1.3989, + "step": 31090 + }, + { + "epoch": 0.6, + "learning_rate": 7.951277905599209e-05, + "loss": 1.4106, + "step": 31100 + }, + { + "epoch": 0.6, + "learning_rate": 7.950058613455418e-05, + "loss": 1.3119, + "step": 31110 + }, + { + "epoch": 0.6, + "learning_rate": 7.948839052139367e-05, + "loss": 1.2639, + "step": 31120 + }, + { + "epoch": 0.6, + "learning_rate": 7.947619221762335e-05, + "loss": 1.2607, + "step": 31130 + }, + { + "epoch": 0.6, + "learning_rate": 7.946399122435616e-05, + "loss": 1.1748, + "step": 31140 + }, + { + "epoch": 0.6, + "learning_rate": 7.945178754270542e-05, + "loss": 1.2188, + "step": 31150 + }, + { + "epoch": 0.6, + "learning_rate": 7.943958117378458e-05, + "loss": 1.1876, + "step": 31160 + }, + { + "epoch": 0.6, + "learning_rate": 7.942737211870743e-05, + "loss": 1.2138, + "step": 31170 + }, + { + "epoch": 0.6, + "learning_rate": 7.941516037858796e-05, + "loss": 1.1043, + "step": 31180 + }, + { + "epoch": 0.6, + "learning_rate": 7.940294595454036e-05, + "loss": 1.3516, + "step": 31190 + }, + { + "epoch": 0.6, + "learning_rate": 7.939072884767915e-05, + "loss": 1.1847, + "step": 31200 + }, + { + "epoch": 0.6, + "learning_rate": 7.937850905911905e-05, + "loss": 1.6446, + "step": 31210 + }, + { + "epoch": 0.6, + "learning_rate": 7.936628658997502e-05, + "loss": 1.1596, + "step": 31220 + }, + { + "epoch": 0.6, + "learning_rate": 7.935406144136226e-05, + "loss": 1.4597, + "step": 31230 + }, + { + "epoch": 0.6, + "learning_rate": 7.934183361439629e-05, + "loss": 1.2567, + "step": 31240 + }, + { + "epoch": 0.6, + "learning_rate": 7.932960311019275e-05, + "loss": 1.1242, + "step": 31250 + }, + { + "epoch": 0.6, + "learning_rate": 7.931736992986762e-05, + "loss": 1.3772, + "step": 31260 + }, + { + "epoch": 0.6, + "learning_rate": 7.930513407453709e-05, + "loss": 1.3123, + "step": 31270 + }, + { + "epoch": 0.6, + "learning_rate": 7.929289554531758e-05, + "loss": 1.2481, + "step": 31280 + }, + { + "epoch": 0.6, + "learning_rate": 7.92806543433258e-05, + "loss": 1.2453, + "step": 31290 + }, + { + "epoch": 0.6, + "learning_rate": 7.926841046967865e-05, + "loss": 1.4209, + "step": 31300 + }, + { + "epoch": 0.6, + "learning_rate": 7.925616392549328e-05, + "loss": 1.1744, + "step": 31310 + }, + { + "epoch": 0.6, + "learning_rate": 7.924391471188714e-05, + "loss": 1.2668, + "step": 31320 + }, + { + "epoch": 0.6, + "learning_rate": 7.923166282997788e-05, + "loss": 1.3251, + "step": 31330 + }, + { + "epoch": 0.6, + "learning_rate": 7.921940828088339e-05, + "loss": 1.2625, + "step": 31340 + }, + { + "epoch": 0.6, + "learning_rate": 7.920715106572181e-05, + "loss": 1.3701, + "step": 31350 + }, + { + "epoch": 0.6, + "learning_rate": 7.919489118561151e-05, + "loss": 1.0377, + "step": 31360 + }, + { + "epoch": 0.6, + "learning_rate": 7.918262864167116e-05, + "loss": 1.0791, + "step": 31370 + }, + { + "epoch": 0.6, + "learning_rate": 7.917036343501959e-05, + "loss": 1.3158, + "step": 31380 + }, + { + "epoch": 0.6, + "learning_rate": 7.915809556677595e-05, + "loss": 0.9222, + "step": 31390 + }, + { + "epoch": 0.6, + "learning_rate": 7.914582503805956e-05, + "loss": 1.1447, + "step": 31400 + }, + { + "epoch": 0.6, + "learning_rate": 7.913355184999004e-05, + "loss": 1.3185, + "step": 31410 + }, + { + "epoch": 0.6, + "learning_rate": 7.912127600368723e-05, + "loss": 1.2184, + "step": 31420 + }, + { + "epoch": 0.6, + "learning_rate": 7.910899750027123e-05, + "loss": 1.4154, + "step": 31430 + }, + { + "epoch": 0.6, + "learning_rate": 7.909671634086235e-05, + "loss": 1.2962, + "step": 31440 + }, + { + "epoch": 0.6, + "learning_rate": 7.908443252658118e-05, + "loss": 1.2536, + "step": 31450 + }, + { + "epoch": 0.6, + "learning_rate": 7.90721460585485e-05, + "loss": 1.4812, + "step": 31460 + }, + { + "epoch": 0.61, + "learning_rate": 7.905985693788537e-05, + "loss": 1.2097, + "step": 31470 + }, + { + "epoch": 0.61, + "learning_rate": 7.904756516571312e-05, + "loss": 1.162, + "step": 31480 + }, + { + "epoch": 0.61, + "learning_rate": 7.903527074315326e-05, + "loss": 1.2438, + "step": 31490 + }, + { + "epoch": 0.61, + "learning_rate": 7.902297367132757e-05, + "loss": 1.2634, + "step": 31500 + }, + { + "epoch": 0.61, + "learning_rate": 7.901067395135808e-05, + "loss": 1.3383, + "step": 31510 + }, + { + "epoch": 0.61, + "learning_rate": 7.899837158436705e-05, + "loss": 1.2777, + "step": 31520 + }, + { + "epoch": 0.61, + "learning_rate": 7.8986066571477e-05, + "loss": 1.4775, + "step": 31530 + }, + { + "epoch": 0.61, + "learning_rate": 7.897375891381066e-05, + "loss": 1.3543, + "step": 31540 + }, + { + "epoch": 0.61, + "learning_rate": 7.896144861249103e-05, + "loss": 1.1671, + "step": 31550 + }, + { + "epoch": 0.61, + "learning_rate": 7.894913566864131e-05, + "loss": 1.4008, + "step": 31560 + }, + { + "epoch": 0.61, + "learning_rate": 7.893682008338501e-05, + "loss": 1.3362, + "step": 31570 + }, + { + "epoch": 0.61, + "learning_rate": 7.892450185784581e-05, + "loss": 1.3773, + "step": 31580 + }, + { + "epoch": 0.61, + "learning_rate": 7.89121809931477e-05, + "loss": 1.2376, + "step": 31590 + }, + { + "epoch": 0.61, + "learning_rate": 7.889985749041482e-05, + "loss": 1.0669, + "step": 31600 + }, + { + "epoch": 0.61, + "learning_rate": 7.888753135077164e-05, + "loss": 1.3547, + "step": 31610 + }, + { + "epoch": 0.61, + "learning_rate": 7.887520257534282e-05, + "loss": 1.3871, + "step": 31620 + }, + { + "epoch": 0.61, + "learning_rate": 7.886287116525328e-05, + "loss": 1.3832, + "step": 31630 + }, + { + "epoch": 0.61, + "learning_rate": 7.885053712162819e-05, + "loss": 1.4147, + "step": 31640 + }, + { + "epoch": 0.61, + "learning_rate": 7.883820044559291e-05, + "loss": 1.4529, + "step": 31650 + }, + { + "epoch": 0.61, + "learning_rate": 7.882586113827312e-05, + "loss": 1.3178, + "step": 31660 + }, + { + "epoch": 0.61, + "learning_rate": 7.881351920079465e-05, + "loss": 1.4368, + "step": 31670 + }, + { + "epoch": 0.61, + "learning_rate": 7.880117463428364e-05, + "loss": 1.3981, + "step": 31680 + }, + { + "epoch": 0.61, + "learning_rate": 7.878882743986647e-05, + "loss": 1.1767, + "step": 31690 + }, + { + "epoch": 0.61, + "learning_rate": 7.877647761866969e-05, + "loss": 1.2676, + "step": 31700 + }, + { + "epoch": 0.61, + "learning_rate": 7.876412517182014e-05, + "loss": 1.1743, + "step": 31710 + }, + { + "epoch": 0.61, + "learning_rate": 7.875177010044493e-05, + "loss": 1.3237, + "step": 31720 + }, + { + "epoch": 0.61, + "learning_rate": 7.873941240567133e-05, + "loss": 1.4447, + "step": 31730 + }, + { + "epoch": 0.61, + "learning_rate": 7.872705208862694e-05, + "loss": 1.5072, + "step": 31740 + }, + { + "epoch": 0.61, + "learning_rate": 7.871468915043952e-05, + "loss": 1.3557, + "step": 31750 + }, + { + "epoch": 0.61, + "learning_rate": 7.87023235922371e-05, + "loss": 1.4993, + "step": 31760 + }, + { + "epoch": 0.61, + "learning_rate": 7.868995541514796e-05, + "loss": 1.3452, + "step": 31770 + }, + { + "epoch": 0.61, + "learning_rate": 7.867758462030062e-05, + "loss": 1.1674, + "step": 31780 + }, + { + "epoch": 0.61, + "learning_rate": 7.866521120882382e-05, + "loss": 1.2627, + "step": 31790 + }, + { + "epoch": 0.61, + "learning_rate": 7.865283518184654e-05, + "loss": 1.219, + "step": 31800 + }, + { + "epoch": 0.61, + "learning_rate": 7.864045654049803e-05, + "loss": 1.364, + "step": 31810 + }, + { + "epoch": 0.61, + "learning_rate": 7.862807528590772e-05, + "loss": 1.215, + "step": 31820 + }, + { + "epoch": 0.61, + "learning_rate": 7.861569141920533e-05, + "loss": 1.3557, + "step": 31830 + }, + { + "epoch": 0.61, + "learning_rate": 7.860330494152081e-05, + "loss": 1.4345, + "step": 31840 + }, + { + "epoch": 0.61, + "learning_rate": 7.859091585398433e-05, + "loss": 1.3383, + "step": 31850 + }, + { + "epoch": 0.61, + "learning_rate": 7.85785241577263e-05, + "loss": 1.078, + "step": 31860 + }, + { + "epoch": 0.61, + "learning_rate": 7.856612985387741e-05, + "loss": 1.296, + "step": 31870 + }, + { + "epoch": 0.61, + "learning_rate": 7.85537329435685e-05, + "loss": 1.3709, + "step": 31880 + }, + { + "epoch": 0.61, + "learning_rate": 7.854133342793075e-05, + "loss": 1.1628, + "step": 31890 + }, + { + "epoch": 0.61, + "learning_rate": 7.85289313080955e-05, + "loss": 1.2544, + "step": 31900 + }, + { + "epoch": 0.61, + "learning_rate": 7.851652658519437e-05, + "loss": 1.2134, + "step": 31910 + }, + { + "epoch": 0.61, + "learning_rate": 7.850411926035922e-05, + "loss": 1.1733, + "step": 31920 + }, + { + "epoch": 0.61, + "learning_rate": 7.849170933472207e-05, + "loss": 1.3353, + "step": 31930 + }, + { + "epoch": 0.61, + "learning_rate": 7.847929680941532e-05, + "loss": 1.1677, + "step": 31940 + }, + { + "epoch": 0.61, + "learning_rate": 7.846688168557148e-05, + "loss": 1.2535, + "step": 31950 + }, + { + "epoch": 0.61, + "learning_rate": 7.845446396432335e-05, + "loss": 1.2486, + "step": 31960 + }, + { + "epoch": 0.61, + "learning_rate": 7.844204364680395e-05, + "loss": 1.3036, + "step": 31970 + }, + { + "epoch": 0.61, + "learning_rate": 7.842962073414657e-05, + "loss": 1.2812, + "step": 31980 + }, + { + "epoch": 0.62, + "learning_rate": 7.841719522748471e-05, + "loss": 1.2309, + "step": 31990 + }, + { + "epoch": 0.62, + "learning_rate": 7.84047671279521e-05, + "loss": 1.2043, + "step": 32000 + }, + { + "epoch": 0.62, + "learning_rate": 7.839233643668272e-05, + "loss": 1.4122, + "step": 32010 + }, + { + "epoch": 0.62, + "learning_rate": 7.837990315481076e-05, + "loss": 1.4687, + "step": 32020 + }, + { + "epoch": 0.62, + "learning_rate": 7.836746728347072e-05, + "loss": 1.2183, + "step": 32030 + }, + { + "epoch": 0.62, + "learning_rate": 7.835502882379729e-05, + "loss": 1.1445, + "step": 32040 + }, + { + "epoch": 0.62, + "learning_rate": 7.834258777692532e-05, + "loss": 1.24, + "step": 32050 + }, + { + "epoch": 0.62, + "learning_rate": 7.833014414399003e-05, + "loss": 1.5049, + "step": 32060 + }, + { + "epoch": 0.62, + "learning_rate": 7.831769792612679e-05, + "loss": 1.232, + "step": 32070 + }, + { + "epoch": 0.62, + "learning_rate": 7.830524912447126e-05, + "loss": 1.2991, + "step": 32080 + }, + { + "epoch": 0.62, + "learning_rate": 7.829279774015927e-05, + "loss": 1.3614, + "step": 32090 + }, + { + "epoch": 0.62, + "learning_rate": 7.828034377432693e-05, + "loss": 1.2771, + "step": 32100 + }, + { + "epoch": 0.62, + "learning_rate": 7.82678872281106e-05, + "loss": 1.2044, + "step": 32110 + }, + { + "epoch": 0.62, + "learning_rate": 7.825542810264683e-05, + "loss": 1.2124, + "step": 32120 + }, + { + "epoch": 0.62, + "learning_rate": 7.824296639907243e-05, + "loss": 1.2771, + "step": 32130 + }, + { + "epoch": 0.62, + "learning_rate": 7.823050211852445e-05, + "loss": 1.2584, + "step": 32140 + }, + { + "epoch": 0.62, + "learning_rate": 7.821803526214019e-05, + "loss": 1.4263, + "step": 32150 + }, + { + "epoch": 0.62, + "learning_rate": 7.820556583105711e-05, + "loss": 1.2793, + "step": 32160 + }, + { + "epoch": 0.62, + "learning_rate": 7.819309382641302e-05, + "loss": 1.1144, + "step": 32170 + }, + { + "epoch": 0.62, + "learning_rate": 7.818061924934584e-05, + "loss": 1.3202, + "step": 32180 + }, + { + "epoch": 0.62, + "learning_rate": 7.816814210099384e-05, + "loss": 1.2168, + "step": 32190 + }, + { + "epoch": 0.62, + "learning_rate": 7.815566238249546e-05, + "loss": 1.478, + "step": 32200 + }, + { + "epoch": 0.62, + "learning_rate": 7.814318009498938e-05, + "loss": 1.448, + "step": 32210 + }, + { + "epoch": 0.62, + "learning_rate": 7.813069523961451e-05, + "loss": 1.2886, + "step": 32220 + }, + { + "epoch": 0.62, + "learning_rate": 7.811820781751003e-05, + "loss": 1.3078, + "step": 32230 + }, + { + "epoch": 0.62, + "learning_rate": 7.810571782981531e-05, + "loss": 1.3631, + "step": 32240 + }, + { + "epoch": 0.62, + "learning_rate": 7.809322527766999e-05, + "loss": 1.2765, + "step": 32250 + }, + { + "epoch": 0.62, + "learning_rate": 7.80807301622139e-05, + "loss": 1.0878, + "step": 32260 + }, + { + "epoch": 0.62, + "learning_rate": 7.806823248458719e-05, + "loss": 1.3806, + "step": 32270 + }, + { + "epoch": 0.62, + "learning_rate": 7.805573224593012e-05, + "loss": 1.2058, + "step": 32280 + }, + { + "epoch": 0.62, + "learning_rate": 7.804322944738329e-05, + "loss": 1.293, + "step": 32290 + }, + { + "epoch": 0.62, + "learning_rate": 7.803072409008749e-05, + "loss": 1.1969, + "step": 32300 + }, + { + "epoch": 0.62, + "learning_rate": 7.801821617518372e-05, + "loss": 1.3988, + "step": 32310 + }, + { + "epoch": 0.62, + "learning_rate": 7.800570570381327e-05, + "loss": 1.2118, + "step": 32320 + }, + { + "epoch": 0.62, + "learning_rate": 7.799319267711763e-05, + "loss": 1.1554, + "step": 32330 + }, + { + "epoch": 0.62, + "learning_rate": 7.79806770962385e-05, + "loss": 1.1899, + "step": 32340 + }, + { + "epoch": 0.62, + "learning_rate": 7.796815896231787e-05, + "loss": 1.1534, + "step": 32350 + }, + { + "epoch": 0.62, + "learning_rate": 7.795563827649792e-05, + "loss": 1.4639, + "step": 32360 + }, + { + "epoch": 0.62, + "learning_rate": 7.794311503992107e-05, + "loss": 1.2374, + "step": 32370 + }, + { + "epoch": 0.62, + "learning_rate": 7.793058925372998e-05, + "loss": 1.2222, + "step": 32380 + }, + { + "epoch": 0.62, + "learning_rate": 7.791806091906754e-05, + "loss": 1.1837, + "step": 32390 + }, + { + "epoch": 0.62, + "learning_rate": 7.790553003707689e-05, + "loss": 1.2761, + "step": 32400 + }, + { + "epoch": 0.62, + "learning_rate": 7.789299660890137e-05, + "loss": 1.2179, + "step": 32410 + }, + { + "epoch": 0.62, + "learning_rate": 7.788046063568458e-05, + "loss": 1.4358, + "step": 32420 + }, + { + "epoch": 0.62, + "learning_rate": 7.786792211857031e-05, + "loss": 1.4125, + "step": 32430 + }, + { + "epoch": 0.62, + "learning_rate": 7.785538105870262e-05, + "loss": 1.3298, + "step": 32440 + }, + { + "epoch": 0.62, + "learning_rate": 7.784283745722583e-05, + "loss": 1.2219, + "step": 32450 + }, + { + "epoch": 0.62, + "learning_rate": 7.783029131528443e-05, + "loss": 1.0797, + "step": 32460 + }, + { + "epoch": 0.62, + "learning_rate": 7.781774263402317e-05, + "loss": 1.2882, + "step": 32470 + }, + { + "epoch": 0.62, + "learning_rate": 7.780519141458703e-05, + "loss": 1.1884, + "step": 32480 + }, + { + "epoch": 0.62, + "learning_rate": 7.779263765812121e-05, + "loss": 1.0929, + "step": 32490 + }, + { + "epoch": 0.62, + "learning_rate": 7.778008136577117e-05, + "loss": 1.1277, + "step": 32500 + }, + { + "epoch": 0.63, + "learning_rate": 7.776752253868257e-05, + "loss": 1.3553, + "step": 32510 + }, + { + "epoch": 0.63, + "learning_rate": 7.775496117800134e-05, + "loss": 1.3348, + "step": 32520 + }, + { + "epoch": 0.63, + "learning_rate": 7.774239728487361e-05, + "loss": 1.3471, + "step": 32530 + }, + { + "epoch": 0.63, + "learning_rate": 7.772983086044571e-05, + "loss": 1.232, + "step": 32540 + }, + { + "epoch": 0.63, + "learning_rate": 7.771726190586428e-05, + "loss": 1.14, + "step": 32550 + }, + { + "epoch": 0.63, + "learning_rate": 7.770469042227613e-05, + "loss": 1.4092, + "step": 32560 + }, + { + "epoch": 0.63, + "learning_rate": 7.769211641082832e-05, + "loss": 1.2098, + "step": 32570 + }, + { + "epoch": 0.63, + "learning_rate": 7.767953987266816e-05, + "loss": 1.3986, + "step": 32580 + }, + { + "epoch": 0.63, + "learning_rate": 7.766696080894315e-05, + "loss": 1.5044, + "step": 32590 + }, + { + "epoch": 0.63, + "learning_rate": 7.765437922080105e-05, + "loss": 1.456, + "step": 32600 + }, + { + "epoch": 0.63, + "learning_rate": 7.764179510938985e-05, + "loss": 1.3229, + "step": 32610 + }, + { + "epoch": 0.63, + "learning_rate": 7.762920847585772e-05, + "loss": 1.2522, + "step": 32620 + }, + { + "epoch": 0.63, + "learning_rate": 7.761661932135318e-05, + "loss": 1.1673, + "step": 32630 + }, + { + "epoch": 0.63, + "learning_rate": 7.760402764702483e-05, + "loss": 1.4183, + "step": 32640 + }, + { + "epoch": 0.63, + "learning_rate": 7.759143345402163e-05, + "loss": 1.1912, + "step": 32650 + }, + { + "epoch": 0.63, + "learning_rate": 7.757883674349266e-05, + "loss": 1.4115, + "step": 32660 + }, + { + "epoch": 0.63, + "learning_rate": 7.756623751658729e-05, + "loss": 1.4258, + "step": 32670 + }, + { + "epoch": 0.63, + "learning_rate": 7.755363577445516e-05, + "loss": 1.1299, + "step": 32680 + }, + { + "epoch": 0.63, + "learning_rate": 7.754103151824603e-05, + "loss": 1.1065, + "step": 32690 + }, + { + "epoch": 0.63, + "learning_rate": 7.752842474911001e-05, + "loss": 1.1116, + "step": 32700 + }, + { + "epoch": 0.63, + "learning_rate": 7.751581546819733e-05, + "loss": 1.2559, + "step": 32710 + }, + { + "epoch": 0.63, + "learning_rate": 7.750320367665851e-05, + "loss": 1.243, + "step": 32720 + }, + { + "epoch": 0.63, + "learning_rate": 7.74905893756443e-05, + "loss": 1.1619, + "step": 32730 + }, + { + "epoch": 0.63, + "learning_rate": 7.747797256630567e-05, + "loss": 1.3613, + "step": 32740 + }, + { + "epoch": 0.63, + "learning_rate": 7.74653532497938e-05, + "loss": 1.1512, + "step": 32750 + }, + { + "epoch": 0.63, + "learning_rate": 7.745273142726012e-05, + "loss": 1.2168, + "step": 32760 + }, + { + "epoch": 0.63, + "learning_rate": 7.744010709985629e-05, + "loss": 1.2785, + "step": 32770 + }, + { + "epoch": 0.63, + "learning_rate": 7.742748026873418e-05, + "loss": 1.3567, + "step": 32780 + }, + { + "epoch": 0.63, + "learning_rate": 7.741485093504591e-05, + "loss": 1.2556, + "step": 32790 + }, + { + "epoch": 0.63, + "learning_rate": 7.740221909994382e-05, + "loss": 1.239, + "step": 32800 + }, + { + "epoch": 0.63, + "learning_rate": 7.738958476458047e-05, + "loss": 1.357, + "step": 32810 + }, + { + "epoch": 0.63, + "learning_rate": 7.737694793010866e-05, + "loss": 1.2633, + "step": 32820 + }, + { + "epoch": 0.63, + "learning_rate": 7.73643085976814e-05, + "loss": 1.1337, + "step": 32830 + }, + { + "epoch": 0.63, + "learning_rate": 7.735166676845196e-05, + "loss": 1.3935, + "step": 32840 + }, + { + "epoch": 0.63, + "learning_rate": 7.733902244357383e-05, + "loss": 1.0734, + "step": 32850 + }, + { + "epoch": 0.63, + "learning_rate": 7.732637562420066e-05, + "loss": 1.3726, + "step": 32860 + }, + { + "epoch": 0.63, + "learning_rate": 7.731372631148644e-05, + "loss": 1.3189, + "step": 32870 + }, + { + "epoch": 0.63, + "learning_rate": 7.730107450658532e-05, + "loss": 1.3462, + "step": 32880 + }, + { + "epoch": 0.63, + "learning_rate": 7.728842021065166e-05, + "loss": 1.4169, + "step": 32890 + }, + { + "epoch": 0.63, + "learning_rate": 7.72757634248401e-05, + "loss": 1.0966, + "step": 32900 + }, + { + "epoch": 0.63, + "learning_rate": 7.72631041503055e-05, + "loss": 1.2818, + "step": 32910 + }, + { + "epoch": 0.63, + "learning_rate": 7.725044238820289e-05, + "loss": 1.2736, + "step": 32920 + }, + { + "epoch": 0.63, + "learning_rate": 7.72377781396876e-05, + "loss": 1.3515, + "step": 32930 + }, + { + "epoch": 0.63, + "learning_rate": 7.722511140591514e-05, + "loss": 1.3008, + "step": 32940 + }, + { + "epoch": 0.63, + "learning_rate": 7.721244218804126e-05, + "loss": 1.1625, + "step": 32950 + }, + { + "epoch": 0.63, + "learning_rate": 7.719977048722196e-05, + "loss": 1.2885, + "step": 32960 + }, + { + "epoch": 0.63, + "learning_rate": 7.71870963046134e-05, + "loss": 1.199, + "step": 32970 + }, + { + "epoch": 0.63, + "learning_rate": 7.717441964137204e-05, + "loss": 1.2953, + "step": 32980 + }, + { + "epoch": 0.63, + "learning_rate": 7.716174049865454e-05, + "loss": 1.367, + "step": 32990 + }, + { + "epoch": 0.63, + "learning_rate": 7.714905887761779e-05, + "loss": 1.2351, + "step": 33000 + }, + { + "epoch": 0.63, + "learning_rate": 7.713637477941886e-05, + "loss": 1.2883, + "step": 33010 + }, + { + "epoch": 0.63, + "learning_rate": 7.712368820521513e-05, + "loss": 1.254, + "step": 33020 + }, + { + "epoch": 0.64, + "learning_rate": 7.711099915616415e-05, + "loss": 1.1531, + "step": 33030 + }, + { + "epoch": 0.64, + "learning_rate": 7.709830763342367e-05, + "loss": 1.2354, + "step": 33040 + }, + { + "epoch": 0.64, + "learning_rate": 7.708561363815175e-05, + "loss": 1.1545, + "step": 33050 + }, + { + "epoch": 0.64, + "learning_rate": 7.707291717150663e-05, + "loss": 1.4253, + "step": 33060 + }, + { + "epoch": 0.64, + "learning_rate": 7.706021823464673e-05, + "loss": 1.281, + "step": 33070 + }, + { + "epoch": 0.64, + "learning_rate": 7.704751682873077e-05, + "loss": 1.1426, + "step": 33080 + }, + { + "epoch": 0.64, + "learning_rate": 7.703481295491765e-05, + "loss": 1.2292, + "step": 33090 + }, + { + "epoch": 0.64, + "learning_rate": 7.702210661436654e-05, + "loss": 1.1432, + "step": 33100 + }, + { + "epoch": 0.64, + "learning_rate": 7.70093978082368e-05, + "loss": 1.2121, + "step": 33110 + }, + { + "epoch": 0.64, + "learning_rate": 7.699668653768795e-05, + "loss": 1.0782, + "step": 33120 + }, + { + "epoch": 0.64, + "learning_rate": 7.69839728038799e-05, + "loss": 1.2624, + "step": 33130 + }, + { + "epoch": 0.64, + "learning_rate": 7.697125660797262e-05, + "loss": 1.2758, + "step": 33140 + }, + { + "epoch": 0.64, + "learning_rate": 7.695853795112643e-05, + "loss": 1.3233, + "step": 33150 + }, + { + "epoch": 0.64, + "learning_rate": 7.694581683450179e-05, + "loss": 1.2187, + "step": 33160 + }, + { + "epoch": 0.64, + "learning_rate": 7.69330932592594e-05, + "loss": 1.0823, + "step": 33170 + }, + { + "epoch": 0.64, + "learning_rate": 7.692036722656023e-05, + "loss": 1.5059, + "step": 33180 + }, + { + "epoch": 0.64, + "learning_rate": 7.690763873756539e-05, + "loss": 1.2895, + "step": 33190 + }, + { + "epoch": 0.64, + "learning_rate": 7.689490779343631e-05, + "loss": 1.3533, + "step": 33200 + }, + { + "epoch": 0.64, + "learning_rate": 7.68821743953346e-05, + "loss": 1.3315, + "step": 33210 + }, + { + "epoch": 0.64, + "learning_rate": 7.686943854442208e-05, + "loss": 1.2424, + "step": 33220 + }, + { + "epoch": 0.64, + "learning_rate": 7.685670024186082e-05, + "loss": 1.6076, + "step": 33230 + }, + { + "epoch": 0.64, + "learning_rate": 7.684395948881306e-05, + "loss": 1.2685, + "step": 33240 + }, + { + "epoch": 0.64, + "learning_rate": 7.683121628644136e-05, + "loss": 1.084, + "step": 33250 + }, + { + "epoch": 0.64, + "learning_rate": 7.681847063590844e-05, + "loss": 1.3628, + "step": 33260 + }, + { + "epoch": 0.64, + "learning_rate": 7.680572253837721e-05, + "loss": 1.1774, + "step": 33270 + }, + { + "epoch": 0.64, + "learning_rate": 7.679297199501089e-05, + "loss": 1.4887, + "step": 33280 + }, + { + "epoch": 0.64, + "learning_rate": 7.678021900697283e-05, + "loss": 1.3775, + "step": 33290 + }, + { + "epoch": 0.64, + "learning_rate": 7.67674635754267e-05, + "loss": 1.1925, + "step": 33300 + }, + { + "epoch": 0.64, + "learning_rate": 7.675470570153633e-05, + "loss": 1.1798, + "step": 33310 + }, + { + "epoch": 0.64, + "learning_rate": 7.674194538646577e-05, + "loss": 1.2486, + "step": 33320 + }, + { + "epoch": 0.64, + "learning_rate": 7.672918263137934e-05, + "loss": 1.1049, + "step": 33330 + }, + { + "epoch": 0.64, + "learning_rate": 7.67164174374415e-05, + "loss": 1.2164, + "step": 33340 + }, + { + "epoch": 0.64, + "learning_rate": 7.670364980581704e-05, + "loss": 1.2386, + "step": 33350 + }, + { + "epoch": 0.64, + "learning_rate": 7.66908797376709e-05, + "loss": 1.1891, + "step": 33360 + }, + { + "epoch": 0.64, + "learning_rate": 7.667810723416824e-05, + "loss": 1.14, + "step": 33370 + }, + { + "epoch": 0.64, + "learning_rate": 7.666533229647449e-05, + "loss": 1.2207, + "step": 33380 + }, + { + "epoch": 0.64, + "learning_rate": 7.665255492575525e-05, + "loss": 1.2142, + "step": 33390 + }, + { + "epoch": 0.64, + "learning_rate": 7.663977512317639e-05, + "loss": 1.232, + "step": 33400 + }, + { + "epoch": 0.64, + "learning_rate": 7.662699288990394e-05, + "loss": 1.2781, + "step": 33410 + }, + { + "epoch": 0.64, + "learning_rate": 7.661420822710423e-05, + "loss": 1.2841, + "step": 33420 + }, + { + "epoch": 0.64, + "learning_rate": 7.660142113594377e-05, + "loss": 1.2639, + "step": 33430 + }, + { + "epoch": 0.64, + "learning_rate": 7.658863161758925e-05, + "loss": 1.1885, + "step": 33440 + }, + { + "epoch": 0.64, + "learning_rate": 7.657583967320768e-05, + "loss": 1.2975, + "step": 33450 + }, + { + "epoch": 0.64, + "learning_rate": 7.656304530396619e-05, + "loss": 1.2814, + "step": 33460 + }, + { + "epoch": 0.64, + "learning_rate": 7.65502485110322e-05, + "loss": 0.9301, + "step": 33470 + }, + { + "epoch": 0.64, + "learning_rate": 7.653744929557331e-05, + "loss": 1.555, + "step": 33480 + }, + { + "epoch": 0.64, + "learning_rate": 7.65246476587574e-05, + "loss": 1.1058, + "step": 33490 + }, + { + "epoch": 0.64, + "learning_rate": 7.651184360175247e-05, + "loss": 1.3931, + "step": 33500 + }, + { + "epoch": 0.64, + "learning_rate": 7.649903712572686e-05, + "loss": 1.3049, + "step": 33510 + }, + { + "epoch": 0.64, + "learning_rate": 7.648622823184903e-05, + "loss": 1.4389, + "step": 33520 + }, + { + "epoch": 0.64, + "learning_rate": 7.647341692128773e-05, + "loss": 1.4891, + "step": 33530 + }, + { + "epoch": 0.64, + "learning_rate": 7.646060319521187e-05, + "loss": 1.1877, + "step": 33540 + }, + { + "epoch": 0.65, + "learning_rate": 7.644778705479065e-05, + "loss": 1.037, + "step": 33550 + }, + { + "epoch": 0.65, + "learning_rate": 7.643496850119342e-05, + "loss": 1.2066, + "step": 33560 + }, + { + "epoch": 0.65, + "learning_rate": 7.642214753558983e-05, + "loss": 1.2275, + "step": 33570 + }, + { + "epoch": 0.65, + "learning_rate": 7.640932415914964e-05, + "loss": 1.3623, + "step": 33580 + }, + { + "epoch": 0.65, + "learning_rate": 7.639649837304294e-05, + "loss": 1.3331, + "step": 33590 + }, + { + "epoch": 0.65, + "learning_rate": 7.638367017843998e-05, + "loss": 1.364, + "step": 33600 + }, + { + "epoch": 0.65, + "learning_rate": 7.637083957651125e-05, + "loss": 1.4006, + "step": 33610 + }, + { + "epoch": 0.65, + "learning_rate": 7.635800656842745e-05, + "loss": 1.1238, + "step": 33620 + }, + { + "epoch": 0.65, + "learning_rate": 7.634517115535946e-05, + "loss": 1.2952, + "step": 33630 + }, + { + "epoch": 0.65, + "learning_rate": 7.633233333847848e-05, + "loss": 1.4126, + "step": 33640 + }, + { + "epoch": 0.65, + "learning_rate": 7.631949311895588e-05, + "loss": 1.1871, + "step": 33650 + }, + { + "epoch": 0.65, + "learning_rate": 7.630665049796319e-05, + "loss": 1.1875, + "step": 33660 + }, + { + "epoch": 0.65, + "learning_rate": 7.629380547667224e-05, + "loss": 1.3736, + "step": 33670 + }, + { + "epoch": 0.65, + "learning_rate": 7.628095805625502e-05, + "loss": 1.2475, + "step": 33680 + }, + { + "epoch": 0.65, + "learning_rate": 7.626810823788381e-05, + "loss": 1.334, + "step": 33690 + }, + { + "epoch": 0.65, + "learning_rate": 7.625525602273103e-05, + "loss": 1.1109, + "step": 33700 + }, + { + "epoch": 0.65, + "learning_rate": 7.624240141196938e-05, + "loss": 1.4416, + "step": 33710 + }, + { + "epoch": 0.65, + "learning_rate": 7.622954440677174e-05, + "loss": 1.159, + "step": 33720 + }, + { + "epoch": 0.65, + "learning_rate": 7.621668500831121e-05, + "loss": 1.2166, + "step": 33730 + }, + { + "epoch": 0.65, + "learning_rate": 7.620382321776115e-05, + "loss": 1.2802, + "step": 33740 + }, + { + "epoch": 0.65, + "learning_rate": 7.619095903629508e-05, + "loss": 1.1555, + "step": 33750 + }, + { + "epoch": 0.65, + "learning_rate": 7.61780924650868e-05, + "loss": 1.349, + "step": 33760 + }, + { + "epoch": 0.65, + "learning_rate": 7.616522350531026e-05, + "loss": 1.3891, + "step": 33770 + }, + { + "epoch": 0.65, + "learning_rate": 7.61523521581397e-05, + "loss": 1.3187, + "step": 33780 + }, + { + "epoch": 0.65, + "learning_rate": 7.61394784247495e-05, + "loss": 1.3633, + "step": 33790 + }, + { + "epoch": 0.65, + "learning_rate": 7.61266023063143e-05, + "loss": 1.2676, + "step": 33800 + }, + { + "epoch": 0.65, + "learning_rate": 7.6113723804009e-05, + "loss": 1.2281, + "step": 33810 + }, + { + "epoch": 0.65, + "learning_rate": 7.610084291900863e-05, + "loss": 1.1839, + "step": 33820 + }, + { + "epoch": 0.65, + "learning_rate": 7.608795965248852e-05, + "loss": 1.4485, + "step": 33830 + }, + { + "epoch": 0.65, + "learning_rate": 7.607507400562413e-05, + "loss": 1.2172, + "step": 33840 + }, + { + "epoch": 0.65, + "learning_rate": 7.606218597959122e-05, + "loss": 1.3025, + "step": 33850 + }, + { + "epoch": 0.65, + "learning_rate": 7.604929557556572e-05, + "loss": 1.1577, + "step": 33860 + }, + { + "epoch": 0.65, + "learning_rate": 7.603640279472379e-05, + "loss": 1.4266, + "step": 33870 + }, + { + "epoch": 0.65, + "learning_rate": 7.602350763824181e-05, + "loss": 1.3145, + "step": 33880 + }, + { + "epoch": 0.65, + "learning_rate": 7.60106101072964e-05, + "loss": 1.2152, + "step": 33890 + }, + { + "epoch": 0.65, + "learning_rate": 7.59977102030643e-05, + "loss": 1.2002, + "step": 33900 + }, + { + "epoch": 0.65, + "learning_rate": 7.59848079267226e-05, + "loss": 1.5019, + "step": 33910 + }, + { + "epoch": 0.65, + "learning_rate": 7.597190327944852e-05, + "loss": 1.2517, + "step": 33920 + }, + { + "epoch": 0.65, + "learning_rate": 7.595899626241952e-05, + "loss": 1.2598, + "step": 33930 + }, + { + "epoch": 0.65, + "learning_rate": 7.594608687681326e-05, + "loss": 1.3104, + "step": 33940 + }, + { + "epoch": 0.65, + "learning_rate": 7.593317512380766e-05, + "loss": 1.246, + "step": 33950 + }, + { + "epoch": 0.65, + "learning_rate": 7.59202610045808e-05, + "loss": 1.3581, + "step": 33960 + }, + { + "epoch": 0.65, + "learning_rate": 7.590734452031103e-05, + "loss": 1.2522, + "step": 33970 + }, + { + "epoch": 0.65, + "learning_rate": 7.589442567217687e-05, + "loss": 1.3645, + "step": 33980 + }, + { + "epoch": 0.65, + "learning_rate": 7.588150446135709e-05, + "loss": 1.1933, + "step": 33990 + }, + { + "epoch": 0.65, + "learning_rate": 7.586858088903063e-05, + "loss": 1.2719, + "step": 34000 + }, + { + "epoch": 0.65, + "learning_rate": 7.58556549563767e-05, + "loss": 1.2717, + "step": 34010 + }, + { + "epoch": 0.65, + "learning_rate": 7.58427266645747e-05, + "loss": 1.189, + "step": 34020 + }, + { + "epoch": 0.65, + "learning_rate": 7.582979601480427e-05, + "loss": 1.223, + "step": 34030 + }, + { + "epoch": 0.65, + "learning_rate": 7.581686300824518e-05, + "loss": 1.4804, + "step": 34040 + }, + { + "epoch": 0.65, + "learning_rate": 7.580392764607753e-05, + "loss": 1.2457, + "step": 34050 + }, + { + "epoch": 0.65, + "learning_rate": 7.579098992948156e-05, + "loss": 1.3047, + "step": 34060 + }, + { + "epoch": 0.66, + "learning_rate": 7.577804985963775e-05, + "loss": 1.2986, + "step": 34070 + }, + { + "epoch": 0.66, + "learning_rate": 7.57651074377268e-05, + "loss": 1.3243, + "step": 34080 + }, + { + "epoch": 0.66, + "learning_rate": 7.575216266492958e-05, + "loss": 1.224, + "step": 34090 + }, + { + "epoch": 0.66, + "learning_rate": 7.573921554242726e-05, + "loss": 1.2771, + "step": 34100 + }, + { + "epoch": 0.66, + "learning_rate": 7.572626607140114e-05, + "loss": 1.2465, + "step": 34110 + }, + { + "epoch": 0.66, + "learning_rate": 7.57133142530328e-05, + "loss": 1.4554, + "step": 34120 + }, + { + "epoch": 0.66, + "learning_rate": 7.570036008850396e-05, + "loss": 1.3207, + "step": 34130 + }, + { + "epoch": 0.66, + "learning_rate": 7.568740357899663e-05, + "loss": 1.2288, + "step": 34140 + }, + { + "epoch": 0.66, + "learning_rate": 7.567444472569298e-05, + "loss": 1.3859, + "step": 34150 + }, + { + "epoch": 0.66, + "learning_rate": 7.566148352977544e-05, + "loss": 1.2249, + "step": 34160 + }, + { + "epoch": 0.66, + "learning_rate": 7.564851999242663e-05, + "loss": 1.5065, + "step": 34170 + }, + { + "epoch": 0.66, + "learning_rate": 7.563555411482934e-05, + "loss": 1.1996, + "step": 34180 + }, + { + "epoch": 0.66, + "learning_rate": 7.562258589816665e-05, + "loss": 1.2967, + "step": 34190 + }, + { + "epoch": 0.66, + "learning_rate": 7.560961534362182e-05, + "loss": 1.2754, + "step": 34200 + }, + { + "epoch": 0.66, + "learning_rate": 7.559664245237832e-05, + "loss": 1.1849, + "step": 34210 + }, + { + "epoch": 0.66, + "learning_rate": 7.558366722561983e-05, + "loss": 1.4332, + "step": 34220 + }, + { + "epoch": 0.66, + "learning_rate": 7.557068966453022e-05, + "loss": 1.2562, + "step": 34230 + }, + { + "epoch": 0.66, + "learning_rate": 7.555770977029367e-05, + "loss": 1.1644, + "step": 34240 + }, + { + "epoch": 0.66, + "learning_rate": 7.554472754409444e-05, + "loss": 1.1976, + "step": 34250 + }, + { + "epoch": 0.66, + "learning_rate": 7.553174298711711e-05, + "loss": 1.1114, + "step": 34260 + }, + { + "epoch": 0.66, + "learning_rate": 7.551875610054641e-05, + "loss": 1.4584, + "step": 34270 + }, + { + "epoch": 0.66, + "learning_rate": 7.55057668855673e-05, + "loss": 1.3919, + "step": 34280 + }, + { + "epoch": 0.66, + "learning_rate": 7.549277534336497e-05, + "loss": 1.4206, + "step": 34290 + }, + { + "epoch": 0.66, + "learning_rate": 7.547978147512479e-05, + "loss": 1.2289, + "step": 34300 + }, + { + "epoch": 0.66, + "learning_rate": 7.546678528203237e-05, + "loss": 1.2138, + "step": 34310 + }, + { + "epoch": 0.66, + "learning_rate": 7.545378676527353e-05, + "loss": 1.2962, + "step": 34320 + }, + { + "epoch": 0.66, + "learning_rate": 7.544078592603429e-05, + "loss": 1.2363, + "step": 34330 + }, + { + "epoch": 0.66, + "learning_rate": 7.542778276550086e-05, + "loss": 1.249, + "step": 34340 + }, + { + "epoch": 0.66, + "learning_rate": 7.541477728485973e-05, + "loss": 1.3437, + "step": 34350 + }, + { + "epoch": 0.66, + "learning_rate": 7.540176948529753e-05, + "loss": 1.2118, + "step": 34360 + }, + { + "epoch": 0.66, + "learning_rate": 7.538875936800116e-05, + "loss": 1.4572, + "step": 34370 + }, + { + "epoch": 0.66, + "learning_rate": 7.537574693415765e-05, + "loss": 1.3596, + "step": 34380 + }, + { + "epoch": 0.66, + "learning_rate": 7.536273218495434e-05, + "loss": 1.2226, + "step": 34390 + }, + { + "epoch": 0.66, + "learning_rate": 7.534971512157871e-05, + "loss": 1.3725, + "step": 34400 + }, + { + "epoch": 0.66, + "learning_rate": 7.533669574521849e-05, + "loss": 1.2912, + "step": 34410 + }, + { + "epoch": 0.66, + "learning_rate": 7.532367405706162e-05, + "loss": 1.3452, + "step": 34420 + }, + { + "epoch": 0.66, + "learning_rate": 7.531065005829621e-05, + "loss": 1.2263, + "step": 34430 + }, + { + "epoch": 0.66, + "learning_rate": 7.529762375011061e-05, + "loss": 1.3199, + "step": 34440 + }, + { + "epoch": 0.66, + "learning_rate": 7.528459513369342e-05, + "loss": 1.3155, + "step": 34450 + }, + { + "epoch": 0.66, + "learning_rate": 7.527156421023333e-05, + "loss": 1.2495, + "step": 34460 + }, + { + "epoch": 0.66, + "learning_rate": 7.525853098091943e-05, + "loss": 1.2566, + "step": 34470 + }, + { + "epoch": 0.66, + "learning_rate": 7.524549544694081e-05, + "loss": 1.1455, + "step": 34480 + }, + { + "epoch": 0.66, + "learning_rate": 7.523245760948694e-05, + "loss": 1.2725, + "step": 34490 + }, + { + "epoch": 0.66, + "learning_rate": 7.521941746974741e-05, + "loss": 1.4364, + "step": 34500 + }, + { + "epoch": 0.66, + "learning_rate": 7.520637502891202e-05, + "loss": 1.1361, + "step": 34510 + }, + { + "epoch": 0.66, + "learning_rate": 7.519333028817083e-05, + "loss": 1.2371, + "step": 34520 + }, + { + "epoch": 0.66, + "learning_rate": 7.518028324871407e-05, + "loss": 1.3555, + "step": 34530 + }, + { + "epoch": 0.66, + "learning_rate": 7.516723391173218e-05, + "loss": 1.3577, + "step": 34540 + }, + { + "epoch": 0.66, + "learning_rate": 7.515418227841584e-05, + "loss": 1.2978, + "step": 34550 + }, + { + "epoch": 0.66, + "learning_rate": 7.514112834995593e-05, + "loss": 1.1839, + "step": 34560 + }, + { + "epoch": 0.66, + "learning_rate": 7.51280721275435e-05, + "loss": 1.4009, + "step": 34570 + }, + { + "epoch": 0.66, + "learning_rate": 7.511501361236985e-05, + "loss": 1.0374, + "step": 34580 + }, + { + "epoch": 0.67, + "learning_rate": 7.510195280562648e-05, + "loss": 1.2915, + "step": 34590 + }, + { + "epoch": 0.67, + "learning_rate": 7.508888970850512e-05, + "loss": 1.425, + "step": 34600 + }, + { + "epoch": 0.67, + "learning_rate": 7.507582432219763e-05, + "loss": 1.2595, + "step": 34610 + }, + { + "epoch": 0.67, + "learning_rate": 7.50627566478962e-05, + "loss": 1.2773, + "step": 34620 + }, + { + "epoch": 0.67, + "learning_rate": 7.504968668679311e-05, + "loss": 1.2683, + "step": 34630 + }, + { + "epoch": 0.67, + "learning_rate": 7.503661444008096e-05, + "loss": 1.4671, + "step": 34640 + }, + { + "epoch": 0.67, + "learning_rate": 7.502353990895244e-05, + "loss": 1.3415, + "step": 34650 + }, + { + "epoch": 0.67, + "learning_rate": 7.501046309460055e-05, + "loss": 1.3181, + "step": 34660 + }, + { + "epoch": 0.67, + "learning_rate": 7.499738399821845e-05, + "loss": 1.3761, + "step": 34670 + }, + { + "epoch": 0.67, + "learning_rate": 7.49843026209995e-05, + "loss": 1.412, + "step": 34680 + }, + { + "epoch": 0.67, + "learning_rate": 7.497121896413732e-05, + "loss": 1.3649, + "step": 34690 + }, + { + "epoch": 0.67, + "learning_rate": 7.495813302882566e-05, + "loss": 1.2426, + "step": 34700 + }, + { + "epoch": 0.67, + "learning_rate": 7.494504481625854e-05, + "loss": 1.3072, + "step": 34710 + }, + { + "epoch": 0.67, + "learning_rate": 7.493195432763018e-05, + "loss": 1.343, + "step": 34720 + }, + { + "epoch": 0.67, + "learning_rate": 7.491886156413497e-05, + "loss": 1.0702, + "step": 34730 + }, + { + "epoch": 0.67, + "learning_rate": 7.490576652696755e-05, + "loss": 1.1581, + "step": 34740 + }, + { + "epoch": 0.67, + "learning_rate": 7.489266921732274e-05, + "loss": 1.3473, + "step": 34750 + }, + { + "epoch": 0.67, + "learning_rate": 7.48795696363956e-05, + "loss": 1.2574, + "step": 34760 + }, + { + "epoch": 0.67, + "learning_rate": 7.486646778538135e-05, + "loss": 1.288, + "step": 34770 + }, + { + "epoch": 0.67, + "learning_rate": 7.485336366547547e-05, + "loss": 1.2667, + "step": 34780 + }, + { + "epoch": 0.67, + "learning_rate": 7.48402572778736e-05, + "loss": 1.1552, + "step": 34790 + }, + { + "epoch": 0.67, + "learning_rate": 7.48271486237716e-05, + "loss": 1.239, + "step": 34800 + }, + { + "epoch": 0.67, + "learning_rate": 7.481403770436554e-05, + "loss": 1.2492, + "step": 34810 + }, + { + "epoch": 0.67, + "learning_rate": 7.480092452085175e-05, + "loss": 1.3376, + "step": 34820 + }, + { + "epoch": 0.67, + "learning_rate": 7.478780907442665e-05, + "loss": 1.3622, + "step": 34830 + }, + { + "epoch": 0.67, + "learning_rate": 7.477469136628696e-05, + "loss": 1.379, + "step": 34840 + }, + { + "epoch": 0.67, + "learning_rate": 7.47615713976296e-05, + "loss": 1.2066, + "step": 34850 + }, + { + "epoch": 0.67, + "learning_rate": 7.474844916965165e-05, + "loss": 1.3111, + "step": 34860 + }, + { + "epoch": 0.67, + "learning_rate": 7.473532468355043e-05, + "loss": 1.1847, + "step": 34870 + }, + { + "epoch": 0.67, + "learning_rate": 7.472219794052344e-05, + "loss": 1.3582, + "step": 34880 + }, + { + "epoch": 0.67, + "learning_rate": 7.470906894176844e-05, + "loss": 1.0988, + "step": 34890 + }, + { + "epoch": 0.67, + "learning_rate": 7.469593768848331e-05, + "loss": 1.1431, + "step": 34900 + }, + { + "epoch": 0.67, + "learning_rate": 7.468280418186624e-05, + "loss": 1.333, + "step": 34910 + }, + { + "epoch": 0.67, + "learning_rate": 7.466966842311555e-05, + "loss": 1.2121, + "step": 34920 + }, + { + "epoch": 0.67, + "learning_rate": 7.465653041342977e-05, + "loss": 1.2633, + "step": 34930 + }, + { + "epoch": 0.67, + "learning_rate": 7.464339015400768e-05, + "loss": 1.4368, + "step": 34940 + }, + { + "epoch": 0.67, + "learning_rate": 7.46302476460482e-05, + "loss": 1.3346, + "step": 34950 + }, + { + "epoch": 0.67, + "learning_rate": 7.46171028907505e-05, + "loss": 1.147, + "step": 34960 + }, + { + "epoch": 0.67, + "learning_rate": 7.4603955889314e-05, + "loss": 1.2308, + "step": 34970 + }, + { + "epoch": 0.67, + "learning_rate": 7.459080664293821e-05, + "loss": 1.3684, + "step": 34980 + }, + { + "epoch": 0.67, + "learning_rate": 7.457765515282293e-05, + "loss": 1.4716, + "step": 34990 + }, + { + "epoch": 0.67, + "learning_rate": 7.456450142016814e-05, + "loss": 1.3971, + "step": 35000 + }, + { + "epoch": 0.67, + "learning_rate": 7.455134544617402e-05, + "loss": 1.2953, + "step": 35010 + }, + { + "epoch": 0.67, + "learning_rate": 7.453818723204098e-05, + "loss": 1.3975, + "step": 35020 + }, + { + "epoch": 0.67, + "learning_rate": 7.452502677896961e-05, + "loss": 1.1598, + "step": 35030 + }, + { + "epoch": 0.67, + "learning_rate": 7.451186408816069e-05, + "loss": 1.3326, + "step": 35040 + }, + { + "epoch": 0.67, + "learning_rate": 7.449869916081524e-05, + "loss": 1.155, + "step": 35050 + }, + { + "epoch": 0.67, + "learning_rate": 7.448553199813445e-05, + "loss": 1.3561, + "step": 35060 + }, + { + "epoch": 0.67, + "learning_rate": 7.447236260131975e-05, + "loss": 1.1837, + "step": 35070 + }, + { + "epoch": 0.67, + "learning_rate": 7.445919097157277e-05, + "loss": 1.2882, + "step": 35080 + }, + { + "epoch": 0.67, + "learning_rate": 7.44460171100953e-05, + "loss": 1.1631, + "step": 35090 + }, + { + "epoch": 0.67, + "learning_rate": 7.443284101808937e-05, + "loss": 1.2922, + "step": 35100 + }, + { + "epoch": 0.68, + "learning_rate": 7.44196626967572e-05, + "loss": 1.4103, + "step": 35110 + }, + { + "epoch": 0.68, + "learning_rate": 7.440648214730124e-05, + "loss": 1.4262, + "step": 35120 + }, + { + "epoch": 0.68, + "learning_rate": 7.439329937092413e-05, + "loss": 1.2043, + "step": 35130 + }, + { + "epoch": 0.68, + "learning_rate": 7.438011436882867e-05, + "loss": 1.3484, + "step": 35140 + }, + { + "epoch": 0.68, + "learning_rate": 7.436692714221792e-05, + "loss": 1.4364, + "step": 35150 + }, + { + "epoch": 0.68, + "learning_rate": 7.435373769229512e-05, + "loss": 1.2773, + "step": 35160 + }, + { + "epoch": 0.68, + "learning_rate": 7.434054602026371e-05, + "loss": 1.1325, + "step": 35170 + }, + { + "epoch": 0.68, + "learning_rate": 7.432735212732737e-05, + "loss": 1.0857, + "step": 35180 + }, + { + "epoch": 0.68, + "learning_rate": 7.43141560146899e-05, + "loss": 1.3902, + "step": 35190 + }, + { + "epoch": 0.68, + "learning_rate": 7.43009576835554e-05, + "loss": 1.1651, + "step": 35200 + }, + { + "epoch": 0.68, + "learning_rate": 7.428775713512807e-05, + "loss": 1.4953, + "step": 35210 + }, + { + "epoch": 0.68, + "learning_rate": 7.427455437061243e-05, + "loss": 1.1083, + "step": 35220 + }, + { + "epoch": 0.68, + "learning_rate": 7.42613493912131e-05, + "loss": 1.0344, + "step": 35230 + }, + { + "epoch": 0.68, + "learning_rate": 7.424814219813497e-05, + "loss": 1.2533, + "step": 35240 + }, + { + "epoch": 0.68, + "learning_rate": 7.423493279258306e-05, + "loss": 1.3005, + "step": 35250 + }, + { + "epoch": 0.68, + "learning_rate": 7.42217211757627e-05, + "loss": 1.3189, + "step": 35260 + }, + { + "epoch": 0.68, + "learning_rate": 7.420850734887929e-05, + "loss": 1.4458, + "step": 35270 + }, + { + "epoch": 0.68, + "learning_rate": 7.419529131313855e-05, + "loss": 1.2736, + "step": 35280 + }, + { + "epoch": 0.68, + "learning_rate": 7.418207306974631e-05, + "loss": 1.6326, + "step": 35290 + }, + { + "epoch": 0.68, + "learning_rate": 7.416885261990869e-05, + "loss": 1.4359, + "step": 35300 + }, + { + "epoch": 0.68, + "learning_rate": 7.415562996483192e-05, + "loss": 1.5167, + "step": 35310 + }, + { + "epoch": 0.68, + "learning_rate": 7.414240510572251e-05, + "loss": 1.1607, + "step": 35320 + }, + { + "epoch": 0.68, + "learning_rate": 7.412917804378712e-05, + "loss": 1.0971, + "step": 35330 + }, + { + "epoch": 0.68, + "learning_rate": 7.411594878023262e-05, + "loss": 1.2977, + "step": 35340 + }, + { + "epoch": 0.68, + "learning_rate": 7.41027173162661e-05, + "loss": 1.2427, + "step": 35350 + }, + { + "epoch": 0.68, + "learning_rate": 7.408948365309483e-05, + "loss": 1.2354, + "step": 35360 + }, + { + "epoch": 0.68, + "learning_rate": 7.407624779192627e-05, + "loss": 1.4373, + "step": 35370 + }, + { + "epoch": 0.68, + "learning_rate": 7.406300973396816e-05, + "loss": 1.4373, + "step": 35380 + }, + { + "epoch": 0.68, + "learning_rate": 7.404976948042832e-05, + "loss": 1.1593, + "step": 35390 + }, + { + "epoch": 0.68, + "learning_rate": 7.403652703251487e-05, + "loss": 1.2892, + "step": 35400 + }, + { + "epoch": 0.68, + "learning_rate": 7.402328239143606e-05, + "loss": 1.0377, + "step": 35410 + }, + { + "epoch": 0.68, + "learning_rate": 7.40100355584004e-05, + "loss": 1.1029, + "step": 35420 + }, + { + "epoch": 0.68, + "learning_rate": 7.399678653461656e-05, + "loss": 1.3885, + "step": 35430 + }, + { + "epoch": 0.68, + "learning_rate": 7.398353532129341e-05, + "loss": 1.2575, + "step": 35440 + }, + { + "epoch": 0.68, + "learning_rate": 7.397028191964004e-05, + "loss": 1.071, + "step": 35450 + }, + { + "epoch": 0.68, + "learning_rate": 7.395702633086572e-05, + "loss": 1.3516, + "step": 35460 + }, + { + "epoch": 0.68, + "learning_rate": 7.394376855617995e-05, + "loss": 1.4154, + "step": 35470 + }, + { + "epoch": 0.68, + "learning_rate": 7.393050859679239e-05, + "loss": 1.1707, + "step": 35480 + }, + { + "epoch": 0.68, + "learning_rate": 7.391724645391293e-05, + "loss": 1.238, + "step": 35490 + }, + { + "epoch": 0.68, + "learning_rate": 7.390398212875166e-05, + "loss": 1.3833, + "step": 35500 + }, + { + "epoch": 0.68, + "learning_rate": 7.389071562251883e-05, + "loss": 1.3467, + "step": 35510 + }, + { + "epoch": 0.68, + "learning_rate": 7.387744693642493e-05, + "loss": 1.137, + "step": 35520 + }, + { + "epoch": 0.68, + "learning_rate": 7.386417607168064e-05, + "loss": 1.2642, + "step": 35530 + }, + { + "epoch": 0.68, + "learning_rate": 7.385090302949682e-05, + "loss": 1.4112, + "step": 35540 + }, + { + "epoch": 0.68, + "learning_rate": 7.383762781108455e-05, + "loss": 1.3657, + "step": 35550 + }, + { + "epoch": 0.68, + "learning_rate": 7.38243504176551e-05, + "loss": 1.1587, + "step": 35560 + }, + { + "epoch": 0.68, + "learning_rate": 7.381107085041993e-05, + "loss": 1.3146, + "step": 35570 + }, + { + "epoch": 0.68, + "learning_rate": 7.379778911059074e-05, + "loss": 1.1741, + "step": 35580 + }, + { + "epoch": 0.68, + "learning_rate": 7.378450519937938e-05, + "loss": 1.1403, + "step": 35590 + }, + { + "epoch": 0.68, + "learning_rate": 7.37712191179979e-05, + "loss": 1.3594, + "step": 35600 + }, + { + "epoch": 0.68, + "learning_rate": 7.375793086765855e-05, + "loss": 1.6164, + "step": 35610 + }, + { + "epoch": 0.68, + "learning_rate": 7.374464044957383e-05, + "loss": 1.1541, + "step": 35620 + }, + { + "epoch": 0.69, + "learning_rate": 7.373134786495638e-05, + "loss": 1.1719, + "step": 35630 + }, + { + "epoch": 0.69, + "learning_rate": 7.371805311501904e-05, + "loss": 1.4099, + "step": 35640 + }, + { + "epoch": 0.69, + "learning_rate": 7.37047562009749e-05, + "loss": 1.4676, + "step": 35650 + }, + { + "epoch": 0.69, + "learning_rate": 7.369145712403716e-05, + "loss": 1.4472, + "step": 35660 + }, + { + "epoch": 0.69, + "learning_rate": 7.367815588541931e-05, + "loss": 1.3282, + "step": 35670 + }, + { + "epoch": 0.69, + "learning_rate": 7.366485248633499e-05, + "loss": 1.3898, + "step": 35680 + }, + { + "epoch": 0.69, + "learning_rate": 7.365154692799804e-05, + "loss": 1.2438, + "step": 35690 + }, + { + "epoch": 0.69, + "learning_rate": 7.363823921162248e-05, + "loss": 1.3301, + "step": 35700 + }, + { + "epoch": 0.69, + "learning_rate": 7.362492933842255e-05, + "loss": 1.174, + "step": 35710 + }, + { + "epoch": 0.69, + "learning_rate": 7.36116173096127e-05, + "loss": 1.2322, + "step": 35720 + }, + { + "epoch": 0.69, + "learning_rate": 7.359830312640756e-05, + "loss": 1.2753, + "step": 35730 + }, + { + "epoch": 0.69, + "learning_rate": 7.358498679002195e-05, + "loss": 1.3126, + "step": 35740 + }, + { + "epoch": 0.69, + "learning_rate": 7.357166830167087e-05, + "loss": 1.1424, + "step": 35750 + }, + { + "epoch": 0.69, + "learning_rate": 7.355834766256957e-05, + "loss": 1.2487, + "step": 35760 + }, + { + "epoch": 0.69, + "learning_rate": 7.354502487393347e-05, + "loss": 1.2732, + "step": 35770 + }, + { + "epoch": 0.69, + "learning_rate": 7.353169993697815e-05, + "loss": 1.1733, + "step": 35780 + }, + { + "epoch": 0.69, + "learning_rate": 7.351837285291945e-05, + "loss": 1.2748, + "step": 35790 + }, + { + "epoch": 0.69, + "learning_rate": 7.350504362297334e-05, + "loss": 1.3946, + "step": 35800 + }, + { + "epoch": 0.69, + "learning_rate": 7.349171224835604e-05, + "loss": 1.121, + "step": 35810 + }, + { + "epoch": 0.69, + "learning_rate": 7.347837873028395e-05, + "loss": 1.2899, + "step": 35820 + }, + { + "epoch": 0.69, + "learning_rate": 7.346504306997366e-05, + "loss": 1.4403, + "step": 35830 + }, + { + "epoch": 0.69, + "learning_rate": 7.345170526864193e-05, + "loss": 1.3106, + "step": 35840 + }, + { + "epoch": 0.69, + "learning_rate": 7.343836532750577e-05, + "loss": 1.2838, + "step": 35850 + }, + { + "epoch": 0.69, + "learning_rate": 7.342502324778234e-05, + "loss": 1.3668, + "step": 35860 + }, + { + "epoch": 0.69, + "learning_rate": 7.341167903068902e-05, + "loss": 1.1647, + "step": 35870 + }, + { + "epoch": 0.69, + "learning_rate": 7.339833267744338e-05, + "loss": 1.1176, + "step": 35880 + }, + { + "epoch": 0.69, + "learning_rate": 7.338498418926318e-05, + "loss": 1.1755, + "step": 35890 + }, + { + "epoch": 0.69, + "learning_rate": 7.337163356736636e-05, + "loss": 1.1986, + "step": 35900 + }, + { + "epoch": 0.69, + "learning_rate": 7.335828081297109e-05, + "loss": 1.1371, + "step": 35910 + }, + { + "epoch": 0.69, + "learning_rate": 7.334492592729571e-05, + "loss": 1.4632, + "step": 35920 + }, + { + "epoch": 0.69, + "learning_rate": 7.333156891155875e-05, + "loss": 1.426, + "step": 35930 + }, + { + "epoch": 0.69, + "learning_rate": 7.331820976697898e-05, + "loss": 1.2938, + "step": 35940 + }, + { + "epoch": 0.69, + "learning_rate": 7.330484849477528e-05, + "loss": 1.1865, + "step": 35950 + }, + { + "epoch": 0.69, + "learning_rate": 7.32914850961668e-05, + "loss": 1.231, + "step": 35960 + }, + { + "epoch": 0.69, + "learning_rate": 7.327811957237285e-05, + "loss": 1.2905, + "step": 35970 + }, + { + "epoch": 0.69, + "learning_rate": 7.326475192461294e-05, + "loss": 1.555, + "step": 35980 + }, + { + "epoch": 0.69, + "learning_rate": 7.32513821541068e-05, + "loss": 1.1432, + "step": 35990 + }, + { + "epoch": 0.69, + "learning_rate": 7.323801026207428e-05, + "loss": 1.244, + "step": 36000 + }, + { + "epoch": 0.69, + "learning_rate": 7.32246362497355e-05, + "loss": 1.4017, + "step": 36010 + }, + { + "epoch": 0.69, + "learning_rate": 7.321126011831075e-05, + "loss": 1.2672, + "step": 36020 + }, + { + "epoch": 0.69, + "learning_rate": 7.31978818690205e-05, + "loss": 1.2751, + "step": 36030 + }, + { + "epoch": 0.69, + "learning_rate": 7.318450150308545e-05, + "loss": 1.1557, + "step": 36040 + }, + { + "epoch": 0.69, + "learning_rate": 7.31711190217264e-05, + "loss": 1.1871, + "step": 36050 + }, + { + "epoch": 0.69, + "learning_rate": 7.315773442616446e-05, + "loss": 1.1532, + "step": 36060 + }, + { + "epoch": 0.69, + "learning_rate": 7.314434771762087e-05, + "loss": 1.3019, + "step": 36070 + }, + { + "epoch": 0.69, + "learning_rate": 7.313095889731706e-05, + "loss": 1.4045, + "step": 36080 + }, + { + "epoch": 0.69, + "learning_rate": 7.311756796647469e-05, + "loss": 1.2496, + "step": 36090 + }, + { + "epoch": 0.69, + "learning_rate": 7.310417492631559e-05, + "loss": 1.2231, + "step": 36100 + }, + { + "epoch": 0.69, + "learning_rate": 7.309077977806174e-05, + "loss": 1.0855, + "step": 36110 + }, + { + "epoch": 0.69, + "learning_rate": 7.307738252293538e-05, + "loss": 1.3741, + "step": 36120 + }, + { + "epoch": 0.69, + "learning_rate": 7.306398316215895e-05, + "loss": 1.3343, + "step": 36130 + }, + { + "epoch": 0.69, + "learning_rate": 7.3050581696955e-05, + "loss": 1.2559, + "step": 36140 + }, + { + "epoch": 0.7, + "learning_rate": 7.303717812854632e-05, + "loss": 1.2406, + "step": 36150 + }, + { + "epoch": 0.7, + "learning_rate": 7.302377245815592e-05, + "loss": 1.3662, + "step": 36160 + }, + { + "epoch": 0.7, + "learning_rate": 7.301036468700697e-05, + "loss": 1.3779, + "step": 36170 + }, + { + "epoch": 0.7, + "learning_rate": 7.299695481632283e-05, + "loss": 1.3917, + "step": 36180 + }, + { + "epoch": 0.7, + "learning_rate": 7.298354284732704e-05, + "loss": 1.188, + "step": 36190 + }, + { + "epoch": 0.7, + "learning_rate": 7.297012878124337e-05, + "loss": 1.3136, + "step": 36200 + }, + { + "epoch": 0.7, + "learning_rate": 7.295671261929576e-05, + "loss": 1.4019, + "step": 36210 + }, + { + "epoch": 0.7, + "learning_rate": 7.294329436270833e-05, + "loss": 1.0086, + "step": 36220 + }, + { + "epoch": 0.7, + "learning_rate": 7.29298740127054e-05, + "loss": 1.1557, + "step": 36230 + }, + { + "epoch": 0.7, + "learning_rate": 7.29164515705115e-05, + "loss": 1.1072, + "step": 36240 + }, + { + "epoch": 0.7, + "learning_rate": 7.290302703735132e-05, + "loss": 1.4596, + "step": 36250 + }, + { + "epoch": 0.7, + "learning_rate": 7.288960041444977e-05, + "loss": 1.2498, + "step": 36260 + }, + { + "epoch": 0.7, + "learning_rate": 7.28761717030319e-05, + "loss": 1.2593, + "step": 36270 + }, + { + "epoch": 0.7, + "learning_rate": 7.286274090432304e-05, + "loss": 1.3283, + "step": 36280 + }, + { + "epoch": 0.7, + "learning_rate": 7.28493080195486e-05, + "loss": 1.3535, + "step": 36290 + }, + { + "epoch": 0.7, + "learning_rate": 7.283587304993428e-05, + "loss": 1.317, + "step": 36300 + }, + { + "epoch": 0.7, + "learning_rate": 7.282243599670592e-05, + "loss": 1.2573, + "step": 36310 + }, + { + "epoch": 0.7, + "learning_rate": 7.280899686108952e-05, + "loss": 1.1539, + "step": 36320 + }, + { + "epoch": 0.7, + "learning_rate": 7.279555564431136e-05, + "loss": 1.2985, + "step": 36330 + }, + { + "epoch": 0.7, + "learning_rate": 7.278211234759784e-05, + "loss": 1.281, + "step": 36340 + }, + { + "epoch": 0.7, + "learning_rate": 7.276866697217555e-05, + "loss": 1.1453, + "step": 36350 + }, + { + "epoch": 0.7, + "learning_rate": 7.27552195192713e-05, + "loss": 1.4054, + "step": 36360 + }, + { + "epoch": 0.7, + "learning_rate": 7.274176999011206e-05, + "loss": 1.3218, + "step": 36370 + }, + { + "epoch": 0.7, + "learning_rate": 7.272831838592503e-05, + "loss": 1.2729, + "step": 36380 + }, + { + "epoch": 0.7, + "learning_rate": 7.271486470793757e-05, + "loss": 1.3934, + "step": 36390 + }, + { + "epoch": 0.7, + "learning_rate": 7.270140895737722e-05, + "loss": 1.4525, + "step": 36400 + }, + { + "epoch": 0.7, + "learning_rate": 7.268795113547174e-05, + "loss": 1.3551, + "step": 36410 + }, + { + "epoch": 0.7, + "learning_rate": 7.267449124344905e-05, + "loss": 1.1976, + "step": 36420 + }, + { + "epoch": 0.7, + "learning_rate": 7.266102928253728e-05, + "loss": 1.2997, + "step": 36430 + }, + { + "epoch": 0.7, + "learning_rate": 7.264756525396473e-05, + "loss": 1.3487, + "step": 36440 + }, + { + "epoch": 0.7, + "learning_rate": 7.263409915895992e-05, + "loss": 1.2133, + "step": 36450 + }, + { + "epoch": 0.7, + "learning_rate": 7.262063099875148e-05, + "loss": 1.1276, + "step": 36460 + }, + { + "epoch": 0.7, + "learning_rate": 7.260716077456836e-05, + "loss": 1.1639, + "step": 36470 + }, + { + "epoch": 0.7, + "learning_rate": 7.25936884876396e-05, + "loss": 1.2263, + "step": 36480 + }, + { + "epoch": 0.7, + "learning_rate": 7.25802141391944e-05, + "loss": 1.2567, + "step": 36490 + }, + { + "epoch": 0.7, + "learning_rate": 7.256673773046229e-05, + "loss": 1.2929, + "step": 36500 + }, + { + "epoch": 0.7, + "learning_rate": 7.255325926267282e-05, + "loss": 1.5596, + "step": 36510 + }, + { + "epoch": 0.7, + "learning_rate": 7.253977873705586e-05, + "loss": 1.3165, + "step": 36520 + }, + { + "epoch": 0.7, + "learning_rate": 7.252629615484138e-05, + "loss": 1.4751, + "step": 36530 + }, + { + "epoch": 0.7, + "learning_rate": 7.251281151725957e-05, + "loss": 1.1511, + "step": 36540 + }, + { + "epoch": 0.7, + "learning_rate": 7.249932482554085e-05, + "loss": 1.1302, + "step": 36550 + }, + { + "epoch": 0.7, + "learning_rate": 7.248583608091574e-05, + "loss": 1.1903, + "step": 36560 + }, + { + "epoch": 0.7, + "learning_rate": 7.247234528461502e-05, + "loss": 1.3213, + "step": 36570 + }, + { + "epoch": 0.7, + "learning_rate": 7.245885243786963e-05, + "loss": 1.0815, + "step": 36580 + }, + { + "epoch": 0.7, + "learning_rate": 7.244535754191067e-05, + "loss": 1.2147, + "step": 36590 + }, + { + "epoch": 0.7, + "learning_rate": 7.24318605979695e-05, + "loss": 1.0584, + "step": 36600 + }, + { + "epoch": 0.7, + "learning_rate": 7.241836160727758e-05, + "loss": 1.0879, + "step": 36610 + }, + { + "epoch": 0.7, + "learning_rate": 7.240486057106663e-05, + "loss": 1.3493, + "step": 36620 + }, + { + "epoch": 0.7, + "learning_rate": 7.239135749056851e-05, + "loss": 1.1648, + "step": 36630 + }, + { + "epoch": 0.7, + "learning_rate": 7.237785236701527e-05, + "loss": 1.1193, + "step": 36640 + }, + { + "epoch": 0.7, + "learning_rate": 7.23643452016392e-05, + "loss": 1.4995, + "step": 36650 + }, + { + "epoch": 0.7, + "learning_rate": 7.23508359956727e-05, + "loss": 1.1098, + "step": 36660 + }, + { + "epoch": 0.71, + "learning_rate": 7.233732475034838e-05, + "loss": 1.0503, + "step": 36670 + }, + { + "epoch": 0.71, + "learning_rate": 7.232381146689907e-05, + "loss": 1.2744, + "step": 36680 + }, + { + "epoch": 0.71, + "learning_rate": 7.231029614655776e-05, + "loss": 1.1492, + "step": 36690 + }, + { + "epoch": 0.71, + "learning_rate": 7.229677879055765e-05, + "loss": 1.3286, + "step": 36700 + }, + { + "epoch": 0.71, + "learning_rate": 7.228325940013206e-05, + "loss": 1.1044, + "step": 36710 + }, + { + "epoch": 0.71, + "learning_rate": 7.226973797651456e-05, + "loss": 1.1734, + "step": 36720 + }, + { + "epoch": 0.71, + "learning_rate": 7.225621452093888e-05, + "loss": 1.0754, + "step": 36730 + }, + { + "epoch": 0.71, + "learning_rate": 7.224268903463896e-05, + "loss": 1.2066, + "step": 36740 + }, + { + "epoch": 0.71, + "learning_rate": 7.222916151884889e-05, + "loss": 1.2909, + "step": 36750 + }, + { + "epoch": 0.71, + "learning_rate": 7.221563197480296e-05, + "loss": 1.1018, + "step": 36760 + }, + { + "epoch": 0.71, + "learning_rate": 7.220210040373566e-05, + "loss": 1.1874, + "step": 36770 + }, + { + "epoch": 0.71, + "learning_rate": 7.218856680688164e-05, + "loss": 1.1103, + "step": 36780 + }, + { + "epoch": 0.71, + "learning_rate": 7.217503118547574e-05, + "loss": 1.423, + "step": 36790 + }, + { + "epoch": 0.71, + "learning_rate": 7.216149354075301e-05, + "loss": 1.4922, + "step": 36800 + }, + { + "epoch": 0.71, + "learning_rate": 7.214795387394866e-05, + "loss": 1.4544, + "step": 36810 + }, + { + "epoch": 0.71, + "learning_rate": 7.213441218629808e-05, + "loss": 1.087, + "step": 36820 + }, + { + "epoch": 0.71, + "learning_rate": 7.212086847903685e-05, + "loss": 1.2778, + "step": 36830 + }, + { + "epoch": 0.71, + "learning_rate": 7.210732275340078e-05, + "loss": 1.2039, + "step": 36840 + }, + { + "epoch": 0.71, + "learning_rate": 7.209377501062576e-05, + "loss": 1.3447, + "step": 36850 + }, + { + "epoch": 0.71, + "learning_rate": 7.208022525194798e-05, + "loss": 1.2708, + "step": 36860 + }, + { + "epoch": 0.71, + "learning_rate": 7.206667347860372e-05, + "loss": 1.2575, + "step": 36870 + }, + { + "epoch": 0.71, + "learning_rate": 7.205311969182951e-05, + "loss": 1.4718, + "step": 36880 + }, + { + "epoch": 0.71, + "learning_rate": 7.203956389286204e-05, + "loss": 1.384, + "step": 36890 + }, + { + "epoch": 0.71, + "learning_rate": 7.202600608293818e-05, + "loss": 1.1135, + "step": 36900 + }, + { + "epoch": 0.71, + "learning_rate": 7.201244626329497e-05, + "loss": 1.4001, + "step": 36910 + }, + { + "epoch": 0.71, + "learning_rate": 7.199888443516967e-05, + "loss": 1.1688, + "step": 36920 + }, + { + "epoch": 0.71, + "learning_rate": 7.198532059979967e-05, + "loss": 1.1732, + "step": 36930 + }, + { + "epoch": 0.71, + "learning_rate": 7.197175475842261e-05, + "loss": 1.3144, + "step": 36940 + }, + { + "epoch": 0.71, + "learning_rate": 7.195818691227628e-05, + "loss": 1.2133, + "step": 36950 + }, + { + "epoch": 0.71, + "learning_rate": 7.194461706259862e-05, + "loss": 1.3347, + "step": 36960 + }, + { + "epoch": 0.71, + "learning_rate": 7.193104521062782e-05, + "loss": 1.2667, + "step": 36970 + }, + { + "epoch": 0.71, + "learning_rate": 7.191747135760217e-05, + "loss": 1.3224, + "step": 36980 + }, + { + "epoch": 0.71, + "learning_rate": 7.190389550476024e-05, + "loss": 1.1556, + "step": 36990 + }, + { + "epoch": 0.71, + "learning_rate": 7.18903176533407e-05, + "loss": 1.2832, + "step": 37000 + }, + { + "epoch": 0.71, + "learning_rate": 7.187673780458244e-05, + "loss": 1.233, + "step": 37010 + }, + { + "epoch": 0.71, + "learning_rate": 7.186315595972453e-05, + "loss": 1.0699, + "step": 37020 + }, + { + "epoch": 0.71, + "learning_rate": 7.184957212000622e-05, + "loss": 1.324, + "step": 37030 + }, + { + "epoch": 0.71, + "learning_rate": 7.183598628666694e-05, + "loss": 1.1498, + "step": 37040 + }, + { + "epoch": 0.71, + "learning_rate": 7.182239846094629e-05, + "loss": 1.2845, + "step": 37050 + }, + { + "epoch": 0.71, + "learning_rate": 7.18088086440841e-05, + "loss": 1.2213, + "step": 37060 + }, + { + "epoch": 0.71, + "learning_rate": 7.179521683732029e-05, + "loss": 1.3878, + "step": 37070 + }, + { + "epoch": 0.71, + "learning_rate": 7.178162304189506e-05, + "loss": 1.3064, + "step": 37080 + }, + { + "epoch": 0.71, + "learning_rate": 7.176802725904876e-05, + "loss": 1.2849, + "step": 37090 + }, + { + "epoch": 0.71, + "learning_rate": 7.175442949002187e-05, + "loss": 1.1505, + "step": 37100 + }, + { + "epoch": 0.71, + "learning_rate": 7.17408297360551e-05, + "loss": 1.325, + "step": 37110 + }, + { + "epoch": 0.71, + "learning_rate": 7.172722799838935e-05, + "loss": 1.2663, + "step": 37120 + }, + { + "epoch": 0.71, + "learning_rate": 7.171362427826567e-05, + "loss": 1.5372, + "step": 37130 + }, + { + "epoch": 0.71, + "learning_rate": 7.170001857692533e-05, + "loss": 1.2545, + "step": 37140 + }, + { + "epoch": 0.71, + "learning_rate": 7.168641089560972e-05, + "loss": 1.2594, + "step": 37150 + }, + { + "epoch": 0.71, + "learning_rate": 7.167280123556047e-05, + "loss": 1.1489, + "step": 37160 + }, + { + "epoch": 0.71, + "learning_rate": 7.165918959801935e-05, + "loss": 1.3339, + "step": 37170 + }, + { + "epoch": 0.71, + "learning_rate": 7.164557598422834e-05, + "loss": 1.12, + "step": 37180 + }, + { + "epoch": 0.72, + "learning_rate": 7.163196039542958e-05, + "loss": 1.1718, + "step": 37190 + }, + { + "epoch": 0.72, + "learning_rate": 7.16183428328654e-05, + "loss": 1.4046, + "step": 37200 + }, + { + "epoch": 0.72, + "learning_rate": 7.160472329777832e-05, + "loss": 1.2872, + "step": 37210 + }, + { + "epoch": 0.72, + "learning_rate": 7.159110179141098e-05, + "loss": 1.2491, + "step": 37220 + }, + { + "epoch": 0.72, + "learning_rate": 7.157747831500632e-05, + "loss": 1.0425, + "step": 37230 + }, + { + "epoch": 0.72, + "learning_rate": 7.156385286980734e-05, + "loss": 1.195, + "step": 37240 + }, + { + "epoch": 0.72, + "learning_rate": 7.155022545705726e-05, + "loss": 1.2482, + "step": 37250 + }, + { + "epoch": 0.72, + "learning_rate": 7.153659607799951e-05, + "loss": 1.1739, + "step": 37260 + }, + { + "epoch": 0.72, + "learning_rate": 7.152296473387767e-05, + "loss": 1.1204, + "step": 37270 + }, + { + "epoch": 0.72, + "learning_rate": 7.15093314259355e-05, + "loss": 1.3818, + "step": 37280 + }, + { + "epoch": 0.72, + "learning_rate": 7.149569615541696e-05, + "loss": 1.3263, + "step": 37290 + }, + { + "epoch": 0.72, + "learning_rate": 7.148205892356616e-05, + "loss": 1.1836, + "step": 37300 + }, + { + "epoch": 0.72, + "learning_rate": 7.146841973162739e-05, + "loss": 1.3659, + "step": 37310 + }, + { + "epoch": 0.72, + "learning_rate": 7.145477858084514e-05, + "loss": 1.2263, + "step": 37320 + }, + { + "epoch": 0.72, + "learning_rate": 7.14411354724641e-05, + "loss": 1.2881, + "step": 37330 + }, + { + "epoch": 0.72, + "learning_rate": 7.142749040772905e-05, + "loss": 1.3868, + "step": 37340 + }, + { + "epoch": 0.72, + "learning_rate": 7.141384338788504e-05, + "loss": 1.0782, + "step": 37350 + }, + { + "epoch": 0.72, + "learning_rate": 7.14001944141773e-05, + "loss": 1.1946, + "step": 37360 + }, + { + "epoch": 0.72, + "learning_rate": 7.138654348785114e-05, + "loss": 1.1812, + "step": 37370 + }, + { + "epoch": 0.72, + "learning_rate": 7.137289061015215e-05, + "loss": 1.384, + "step": 37380 + }, + { + "epoch": 0.72, + "learning_rate": 7.135923578232604e-05, + "loss": 1.1335, + "step": 37390 + }, + { + "epoch": 0.72, + "learning_rate": 7.134557900561873e-05, + "loss": 1.4056, + "step": 37400 + }, + { + "epoch": 0.72, + "learning_rate": 7.133192028127631e-05, + "loss": 1.1561, + "step": 37410 + }, + { + "epoch": 0.72, + "learning_rate": 7.131825961054504e-05, + "loss": 1.4686, + "step": 37420 + }, + { + "epoch": 0.72, + "learning_rate": 7.130459699467134e-05, + "loss": 1.2232, + "step": 37430 + }, + { + "epoch": 0.72, + "learning_rate": 7.129093243490186e-05, + "loss": 1.4046, + "step": 37440 + }, + { + "epoch": 0.72, + "learning_rate": 7.127726593248337e-05, + "loss": 1.0989, + "step": 37450 + }, + { + "epoch": 0.72, + "learning_rate": 7.126359748866287e-05, + "loss": 1.3128, + "step": 37460 + }, + { + "epoch": 0.72, + "learning_rate": 7.124992710468749e-05, + "loss": 1.2046, + "step": 37470 + }, + { + "epoch": 0.72, + "learning_rate": 7.123625478180456e-05, + "loss": 1.4009, + "step": 37480 + }, + { + "epoch": 0.72, + "learning_rate": 7.122258052126156e-05, + "loss": 1.3694, + "step": 37490 + }, + { + "epoch": 0.72, + "learning_rate": 7.120890432430622e-05, + "loss": 1.1301, + "step": 37500 + }, + { + "epoch": 0.72, + "learning_rate": 7.119522619218639e-05, + "loss": 1.2419, + "step": 37510 + }, + { + "epoch": 0.72, + "learning_rate": 7.118154612615006e-05, + "loss": 1.3203, + "step": 37520 + }, + { + "epoch": 0.72, + "learning_rate": 7.116786412744548e-05, + "loss": 1.2458, + "step": 37530 + }, + { + "epoch": 0.72, + "learning_rate": 7.115418019732102e-05, + "loss": 1.107, + "step": 37540 + }, + { + "epoch": 0.72, + "learning_rate": 7.114049433702525e-05, + "loss": 1.2188, + "step": 37550 + }, + { + "epoch": 0.72, + "learning_rate": 7.112680654780692e-05, + "loss": 1.302, + "step": 37560 + }, + { + "epoch": 0.72, + "learning_rate": 7.111311683091492e-05, + "loss": 1.1232, + "step": 37570 + }, + { + "epoch": 0.72, + "learning_rate": 7.109942518759835e-05, + "loss": 1.2322, + "step": 37580 + }, + { + "epoch": 0.72, + "learning_rate": 7.108573161910649e-05, + "loss": 1.3502, + "step": 37590 + }, + { + "epoch": 0.72, + "learning_rate": 7.107203612668877e-05, + "loss": 1.1995, + "step": 37600 + }, + { + "epoch": 0.72, + "learning_rate": 7.105833871159482e-05, + "loss": 1.3416, + "step": 37610 + }, + { + "epoch": 0.72, + "learning_rate": 7.104463937507442e-05, + "loss": 1.338, + "step": 37620 + }, + { + "epoch": 0.72, + "learning_rate": 7.103093811837754e-05, + "loss": 1.6498, + "step": 37630 + }, + { + "epoch": 0.72, + "learning_rate": 7.101723494275431e-05, + "loss": 1.438, + "step": 37640 + }, + { + "epoch": 0.72, + "learning_rate": 7.10035298494551e-05, + "loss": 1.4754, + "step": 37650 + }, + { + "epoch": 0.72, + "learning_rate": 7.098982283973036e-05, + "loss": 1.31, + "step": 37660 + }, + { + "epoch": 0.72, + "learning_rate": 7.097611391483077e-05, + "loss": 1.4978, + "step": 37670 + }, + { + "epoch": 0.72, + "learning_rate": 7.096240307600717e-05, + "loss": 1.2826, + "step": 37680 + }, + { + "epoch": 0.72, + "learning_rate": 7.094869032451058e-05, + "loss": 1.6213, + "step": 37690 + }, + { + "epoch": 0.72, + "learning_rate": 7.09349756615922e-05, + "loss": 1.3583, + "step": 37700 + }, + { + "epoch": 0.73, + "learning_rate": 7.09212590885034e-05, + "loss": 1.3246, + "step": 37710 + }, + { + "epoch": 0.73, + "learning_rate": 7.090754060649572e-05, + "loss": 1.1309, + "step": 37720 + }, + { + "epoch": 0.73, + "learning_rate": 7.089382021682084e-05, + "loss": 1.2324, + "step": 37730 + }, + { + "epoch": 0.73, + "learning_rate": 7.088009792073069e-05, + "loss": 1.2048, + "step": 37740 + }, + { + "epoch": 0.73, + "learning_rate": 7.086637371947734e-05, + "loss": 1.2455, + "step": 37750 + }, + { + "epoch": 0.73, + "learning_rate": 7.085264761431301e-05, + "loss": 1.1813, + "step": 37760 + }, + { + "epoch": 0.73, + "learning_rate": 7.08389196064901e-05, + "loss": 1.0894, + "step": 37770 + }, + { + "epoch": 0.73, + "learning_rate": 7.08251896972612e-05, + "loss": 1.2165, + "step": 37780 + }, + { + "epoch": 0.73, + "learning_rate": 7.081145788787909e-05, + "loss": 1.2214, + "step": 37790 + }, + { + "epoch": 0.73, + "learning_rate": 7.07977241795967e-05, + "loss": 1.187, + "step": 37800 + }, + { + "epoch": 0.73, + "learning_rate": 7.078398857366709e-05, + "loss": 1.3102, + "step": 37810 + }, + { + "epoch": 0.73, + "learning_rate": 7.07702510713436e-05, + "loss": 1.2209, + "step": 37820 + }, + { + "epoch": 0.73, + "learning_rate": 7.075651167387962e-05, + "loss": 0.9734, + "step": 37830 + }, + { + "epoch": 0.73, + "learning_rate": 7.074277038252883e-05, + "loss": 1.2992, + "step": 37840 + }, + { + "epoch": 0.73, + "learning_rate": 7.072902719854499e-05, + "loss": 1.4796, + "step": 37850 + }, + { + "epoch": 0.73, + "learning_rate": 7.07152821231821e-05, + "loss": 1.4592, + "step": 37860 + }, + { + "epoch": 0.73, + "learning_rate": 7.070153515769428e-05, + "loss": 1.0596, + "step": 37870 + }, + { + "epoch": 0.73, + "learning_rate": 7.068778630333583e-05, + "loss": 1.4112, + "step": 37880 + }, + { + "epoch": 0.73, + "learning_rate": 7.067403556136128e-05, + "loss": 1.2487, + "step": 37890 + }, + { + "epoch": 0.73, + "learning_rate": 7.066028293302525e-05, + "loss": 1.3506, + "step": 37900 + }, + { + "epoch": 0.73, + "learning_rate": 7.06465284195826e-05, + "loss": 1.1637, + "step": 37910 + }, + { + "epoch": 0.73, + "learning_rate": 7.063277202228831e-05, + "loss": 1.5547, + "step": 37920 + }, + { + "epoch": 0.73, + "learning_rate": 7.061901374239757e-05, + "loss": 1.4841, + "step": 37930 + }, + { + "epoch": 0.73, + "learning_rate": 7.060525358116572e-05, + "loss": 1.2703, + "step": 37940 + }, + { + "epoch": 0.73, + "learning_rate": 7.059149153984828e-05, + "loss": 1.4132, + "step": 37950 + }, + { + "epoch": 0.73, + "learning_rate": 7.057772761970097e-05, + "loss": 1.3561, + "step": 37960 + }, + { + "epoch": 0.73, + "learning_rate": 7.056396182197959e-05, + "loss": 1.2494, + "step": 37970 + }, + { + "epoch": 0.73, + "learning_rate": 7.05501941479402e-05, + "loss": 1.1008, + "step": 37980 + }, + { + "epoch": 0.73, + "learning_rate": 7.053642459883903e-05, + "loss": 1.0237, + "step": 37990 + }, + { + "epoch": 0.73, + "learning_rate": 7.052265317593244e-05, + "loss": 1.3784, + "step": 38000 + }, + { + "epoch": 0.73, + "learning_rate": 7.050887988047696e-05, + "loss": 1.4226, + "step": 38010 + }, + { + "epoch": 0.73, + "learning_rate": 7.049510471372933e-05, + "loss": 1.0991, + "step": 38020 + }, + { + "epoch": 0.73, + "learning_rate": 7.04813276769464e-05, + "loss": 1.2785, + "step": 38030 + }, + { + "epoch": 0.73, + "learning_rate": 7.046754877138528e-05, + "loss": 1.0058, + "step": 38040 + }, + { + "epoch": 0.73, + "learning_rate": 7.045376799830316e-05, + "loss": 1.2636, + "step": 38050 + }, + { + "epoch": 0.73, + "learning_rate": 7.043998535895747e-05, + "loss": 1.2941, + "step": 38060 + }, + { + "epoch": 0.73, + "learning_rate": 7.042620085460574e-05, + "loss": 1.202, + "step": 38070 + }, + { + "epoch": 0.73, + "learning_rate": 7.041241448650575e-05, + "loss": 1.3678, + "step": 38080 + }, + { + "epoch": 0.73, + "learning_rate": 7.03986262559154e-05, + "loss": 1.383, + "step": 38090 + }, + { + "epoch": 0.73, + "learning_rate": 7.038483616409274e-05, + "loss": 0.9835, + "step": 38100 + }, + { + "epoch": 0.73, + "learning_rate": 7.037104421229606e-05, + "loss": 1.0909, + "step": 38110 + }, + { + "epoch": 0.73, + "learning_rate": 7.035725040178376e-05, + "loss": 1.2183, + "step": 38120 + }, + { + "epoch": 0.73, + "learning_rate": 7.034345473381443e-05, + "loss": 1.1683, + "step": 38130 + }, + { + "epoch": 0.73, + "learning_rate": 7.032965720964682e-05, + "loss": 1.2521, + "step": 38140 + }, + { + "epoch": 0.73, + "learning_rate": 7.031585783053987e-05, + "loss": 1.2334, + "step": 38150 + }, + { + "epoch": 0.73, + "learning_rate": 7.030205659775268e-05, + "loss": 1.1959, + "step": 38160 + }, + { + "epoch": 0.73, + "learning_rate": 7.028825351254451e-05, + "loss": 1.312, + "step": 38170 + }, + { + "epoch": 0.73, + "learning_rate": 7.02744485761748e-05, + "loss": 1.2183, + "step": 38180 + }, + { + "epoch": 0.73, + "learning_rate": 7.026064178990313e-05, + "loss": 1.3987, + "step": 38190 + }, + { + "epoch": 0.73, + "learning_rate": 7.02468331549893e-05, + "loss": 1.2339, + "step": 38200 + }, + { + "epoch": 0.73, + "learning_rate": 7.023302267269328e-05, + "loss": 1.2404, + "step": 38210 + }, + { + "epoch": 0.73, + "learning_rate": 7.021921034427509e-05, + "loss": 1.2197, + "step": 38220 + }, + { + "epoch": 0.74, + "learning_rate": 7.020539617099508e-05, + "loss": 1.3971, + "step": 38230 + }, + { + "epoch": 0.74, + "learning_rate": 7.01915801541137e-05, + "loss": 1.1385, + "step": 38240 + }, + { + "epoch": 0.74, + "learning_rate": 7.017776229489152e-05, + "loss": 1.1747, + "step": 38250 + }, + { + "epoch": 0.74, + "learning_rate": 7.016394259458936e-05, + "loss": 1.3953, + "step": 38260 + }, + { + "epoch": 0.74, + "learning_rate": 7.015012105446815e-05, + "loss": 1.208, + "step": 38270 + }, + { + "epoch": 0.74, + "learning_rate": 7.013629767578903e-05, + "loss": 1.2004, + "step": 38280 + }, + { + "epoch": 0.74, + "learning_rate": 7.012247245981327e-05, + "loss": 1.2513, + "step": 38290 + }, + { + "epoch": 0.74, + "learning_rate": 7.010864540780232e-05, + "loss": 1.2834, + "step": 38300 + }, + { + "epoch": 0.74, + "learning_rate": 7.009481652101783e-05, + "loss": 1.3833, + "step": 38310 + }, + { + "epoch": 0.74, + "learning_rate": 7.008098580072155e-05, + "loss": 1.3211, + "step": 38320 + }, + { + "epoch": 0.74, + "learning_rate": 7.006715324817548e-05, + "loss": 1.4195, + "step": 38330 + }, + { + "epoch": 0.74, + "learning_rate": 7.00533188646417e-05, + "loss": 1.2599, + "step": 38340 + }, + { + "epoch": 0.74, + "learning_rate": 7.003948265138252e-05, + "loss": 1.3718, + "step": 38350 + }, + { + "epoch": 0.74, + "learning_rate": 7.002564460966043e-05, + "loss": 1.1053, + "step": 38360 + }, + { + "epoch": 0.74, + "learning_rate": 7.001180474073801e-05, + "loss": 1.4744, + "step": 38370 + }, + { + "epoch": 0.74, + "learning_rate": 6.999796304587806e-05, + "loss": 1.2511, + "step": 38380 + }, + { + "epoch": 0.74, + "learning_rate": 6.998411952634353e-05, + "loss": 1.3381, + "step": 38390 + }, + { + "epoch": 0.74, + "learning_rate": 6.99702741833976e-05, + "loss": 1.2348, + "step": 38400 + }, + { + "epoch": 0.74, + "learning_rate": 6.995642701830348e-05, + "loss": 1.2599, + "step": 38410 + }, + { + "epoch": 0.74, + "learning_rate": 6.994257803232468e-05, + "loss": 1.4099, + "step": 38420 + }, + { + "epoch": 0.74, + "learning_rate": 6.992872722672483e-05, + "loss": 1.3039, + "step": 38430 + }, + { + "epoch": 0.74, + "learning_rate": 6.991487460276767e-05, + "loss": 1.2128, + "step": 38440 + }, + { + "epoch": 0.74, + "learning_rate": 6.99010201617172e-05, + "loss": 1.4061, + "step": 38450 + }, + { + "epoch": 0.74, + "learning_rate": 6.988716390483754e-05, + "loss": 1.4134, + "step": 38460 + }, + { + "epoch": 0.74, + "learning_rate": 6.987330583339294e-05, + "loss": 1.3917, + "step": 38470 + }, + { + "epoch": 0.74, + "learning_rate": 6.985944594864789e-05, + "loss": 1.3662, + "step": 38480 + }, + { + "epoch": 0.74, + "learning_rate": 6.984558425186699e-05, + "loss": 1.3866, + "step": 38490 + }, + { + "epoch": 0.74, + "learning_rate": 6.983172074431501e-05, + "loss": 1.2795, + "step": 38500 + }, + { + "epoch": 0.74, + "learning_rate": 6.981785542725693e-05, + "loss": 1.2584, + "step": 38510 + }, + { + "epoch": 0.74, + "learning_rate": 6.980398830195785e-05, + "loss": 1.2054, + "step": 38520 + }, + { + "epoch": 0.74, + "learning_rate": 6.979011936968305e-05, + "loss": 1.1822, + "step": 38530 + }, + { + "epoch": 0.74, + "learning_rate": 6.977624863169794e-05, + "loss": 1.0685, + "step": 38540 + }, + { + "epoch": 0.74, + "learning_rate": 6.97623760892682e-05, + "loss": 1.2506, + "step": 38550 + }, + { + "epoch": 0.74, + "learning_rate": 6.974850174365952e-05, + "loss": 1.3055, + "step": 38560 + }, + { + "epoch": 0.74, + "learning_rate": 6.97346255961379e-05, + "loss": 1.4225, + "step": 38570 + }, + { + "epoch": 0.74, + "learning_rate": 6.972074764796942e-05, + "loss": 1.4897, + "step": 38580 + }, + { + "epoch": 0.74, + "learning_rate": 6.970686790042033e-05, + "loss": 1.1962, + "step": 38590 + }, + { + "epoch": 0.74, + "learning_rate": 6.969298635475709e-05, + "loss": 1.2045, + "step": 38600 + }, + { + "epoch": 0.74, + "learning_rate": 6.967910301224627e-05, + "loss": 1.144, + "step": 38610 + }, + { + "epoch": 0.74, + "learning_rate": 6.966521787415465e-05, + "loss": 1.2091, + "step": 38620 + }, + { + "epoch": 0.74, + "learning_rate": 6.965133094174913e-05, + "loss": 1.2127, + "step": 38630 + }, + { + "epoch": 0.74, + "learning_rate": 6.96374422162968e-05, + "loss": 1.2075, + "step": 38640 + }, + { + "epoch": 0.74, + "learning_rate": 6.962355169906491e-05, + "loss": 1.2523, + "step": 38650 + }, + { + "epoch": 0.74, + "learning_rate": 6.960965939132089e-05, + "loss": 1.3342, + "step": 38660 + }, + { + "epoch": 0.74, + "learning_rate": 6.95957652943323e-05, + "loss": 1.1508, + "step": 38670 + }, + { + "epoch": 0.74, + "learning_rate": 6.958186940936688e-05, + "loss": 1.4154, + "step": 38680 + }, + { + "epoch": 0.74, + "learning_rate": 6.956797173769254e-05, + "loss": 1.0091, + "step": 38690 + }, + { + "epoch": 0.74, + "learning_rate": 6.955407228057733e-05, + "loss": 1.1065, + "step": 38700 + }, + { + "epoch": 0.74, + "learning_rate": 6.954017103928949e-05, + "loss": 1.1108, + "step": 38710 + }, + { + "epoch": 0.74, + "learning_rate": 6.952626801509743e-05, + "loss": 1.2405, + "step": 38720 + }, + { + "epoch": 0.74, + "learning_rate": 6.951236320926966e-05, + "loss": 1.1415, + "step": 38730 + }, + { + "epoch": 0.74, + "learning_rate": 6.949845662307493e-05, + "loss": 1.0715, + "step": 38740 + }, + { + "epoch": 0.75, + "learning_rate": 6.948454825778211e-05, + "loss": 1.1263, + "step": 38750 + }, + { + "epoch": 0.75, + "learning_rate": 6.947063811466023e-05, + "loss": 1.267, + "step": 38760 + }, + { + "epoch": 0.75, + "learning_rate": 6.945672619497853e-05, + "loss": 1.2791, + "step": 38770 + }, + { + "epoch": 0.75, + "learning_rate": 6.944281250000634e-05, + "loss": 1.359, + "step": 38780 + }, + { + "epoch": 0.75, + "learning_rate": 6.942889703101319e-05, + "loss": 1.1779, + "step": 38790 + }, + { + "epoch": 0.75, + "learning_rate": 6.941497978926878e-05, + "loss": 1.2239, + "step": 38800 + }, + { + "epoch": 0.75, + "learning_rate": 6.940106077604295e-05, + "loss": 1.3325, + "step": 38810 + }, + { + "epoch": 0.75, + "learning_rate": 6.938713999260574e-05, + "loss": 1.1363, + "step": 38820 + }, + { + "epoch": 0.75, + "learning_rate": 6.937321744022728e-05, + "loss": 1.2763, + "step": 38830 + }, + { + "epoch": 0.75, + "learning_rate": 6.935929312017796e-05, + "loss": 1.3162, + "step": 38840 + }, + { + "epoch": 0.75, + "learning_rate": 6.934536703372822e-05, + "loss": 1.4165, + "step": 38850 + }, + { + "epoch": 0.75, + "learning_rate": 6.933143918214876e-05, + "loss": 1.4522, + "step": 38860 + }, + { + "epoch": 0.75, + "learning_rate": 6.93175095667104e-05, + "loss": 1.2063, + "step": 38870 + }, + { + "epoch": 0.75, + "learning_rate": 6.930357818868409e-05, + "loss": 1.2706, + "step": 38880 + }, + { + "epoch": 0.75, + "learning_rate": 6.928964504934099e-05, + "loss": 1.4134, + "step": 38890 + }, + { + "epoch": 0.75, + "learning_rate": 6.927571014995238e-05, + "loss": 1.4629, + "step": 38900 + }, + { + "epoch": 0.75, + "learning_rate": 6.926177349178976e-05, + "loss": 1.1394, + "step": 38910 + }, + { + "epoch": 0.75, + "learning_rate": 6.924783507612474e-05, + "loss": 1.2628, + "step": 38920 + }, + { + "epoch": 0.75, + "learning_rate": 6.923389490422908e-05, + "loss": 1.3117, + "step": 38930 + }, + { + "epoch": 0.75, + "learning_rate": 6.921995297737476e-05, + "loss": 1.3508, + "step": 38940 + }, + { + "epoch": 0.75, + "learning_rate": 6.920600929683385e-05, + "loss": 1.3851, + "step": 38950 + }, + { + "epoch": 0.75, + "learning_rate": 6.919206386387862e-05, + "loss": 1.2411, + "step": 38960 + }, + { + "epoch": 0.75, + "learning_rate": 6.917811667978151e-05, + "loss": 1.2847, + "step": 38970 + }, + { + "epoch": 0.75, + "learning_rate": 6.916416774581509e-05, + "loss": 1.2791, + "step": 38980 + }, + { + "epoch": 0.75, + "learning_rate": 6.915021706325211e-05, + "loss": 1.4112, + "step": 38990 + }, + { + "epoch": 0.75, + "learning_rate": 6.913626463336547e-05, + "loss": 1.437, + "step": 39000 + }, + { + "epoch": 0.75, + "learning_rate": 6.912231045742822e-05, + "loss": 1.0508, + "step": 39010 + }, + { + "epoch": 0.75, + "learning_rate": 6.910835453671362e-05, + "loss": 1.1755, + "step": 39020 + }, + { + "epoch": 0.75, + "learning_rate": 6.909439687249499e-05, + "loss": 1.1998, + "step": 39030 + }, + { + "epoch": 0.75, + "learning_rate": 6.908043746604593e-05, + "loss": 1.227, + "step": 39040 + }, + { + "epoch": 0.75, + "learning_rate": 6.906647631864007e-05, + "loss": 1.2545, + "step": 39050 + }, + { + "epoch": 0.75, + "learning_rate": 6.905251343155135e-05, + "loss": 1.3315, + "step": 39060 + }, + { + "epoch": 0.75, + "learning_rate": 6.903854880605373e-05, + "loss": 1.3104, + "step": 39070 + }, + { + "epoch": 0.75, + "learning_rate": 6.90245824434214e-05, + "loss": 1.2865, + "step": 39080 + }, + { + "epoch": 0.75, + "learning_rate": 6.901061434492868e-05, + "loss": 0.994, + "step": 39090 + }, + { + "epoch": 0.75, + "learning_rate": 6.899664451185007e-05, + "loss": 1.1979, + "step": 39100 + }, + { + "epoch": 0.75, + "learning_rate": 6.898267294546023e-05, + "loss": 1.2603, + "step": 39110 + }, + { + "epoch": 0.75, + "learning_rate": 6.896869964703397e-05, + "loss": 1.5188, + "step": 39120 + }, + { + "epoch": 0.75, + "learning_rate": 6.895472461784624e-05, + "loss": 1.4215, + "step": 39130 + }, + { + "epoch": 0.75, + "learning_rate": 6.894074785917219e-05, + "loss": 1.3187, + "step": 39140 + }, + { + "epoch": 0.75, + "learning_rate": 6.892676937228705e-05, + "loss": 1.0928, + "step": 39150 + }, + { + "epoch": 0.75, + "learning_rate": 6.891278915846631e-05, + "loss": 1.0739, + "step": 39160 + }, + { + "epoch": 0.75, + "learning_rate": 6.889880721898553e-05, + "loss": 1.3793, + "step": 39170 + }, + { + "epoch": 0.75, + "learning_rate": 6.88848235551205e-05, + "loss": 1.3913, + "step": 39180 + }, + { + "epoch": 0.75, + "learning_rate": 6.887083816814711e-05, + "loss": 1.2382, + "step": 39190 + }, + { + "epoch": 0.75, + "learning_rate": 6.885685105934143e-05, + "loss": 1.1174, + "step": 39200 + }, + { + "epoch": 0.75, + "learning_rate": 6.88428622299797e-05, + "loss": 1.3559, + "step": 39210 + }, + { + "epoch": 0.75, + "learning_rate": 6.882887168133829e-05, + "loss": 1.3627, + "step": 39220 + }, + { + "epoch": 0.75, + "learning_rate": 6.881487941469373e-05, + "loss": 1.1626, + "step": 39230 + }, + { + "epoch": 0.75, + "learning_rate": 6.880088543132275e-05, + "loss": 1.1884, + "step": 39240 + }, + { + "epoch": 0.75, + "learning_rate": 6.878688973250215e-05, + "loss": 1.2352, + "step": 39250 + }, + { + "epoch": 0.75, + "learning_rate": 6.877289231950901e-05, + "loss": 1.2119, + "step": 39260 + }, + { + "epoch": 0.76, + "learning_rate": 6.875889319362043e-05, + "loss": 1.3129, + "step": 39270 + }, + { + "epoch": 0.76, + "learning_rate": 6.874489235611378e-05, + "loss": 1.4021, + "step": 39280 + }, + { + "epoch": 0.76, + "learning_rate": 6.873088980826651e-05, + "loss": 1.1961, + "step": 39290 + }, + { + "epoch": 0.76, + "learning_rate": 6.871688555135627e-05, + "loss": 1.2347, + "step": 39300 + }, + { + "epoch": 0.76, + "learning_rate": 6.870287958666084e-05, + "loss": 1.2311, + "step": 39310 + }, + { + "epoch": 0.76, + "learning_rate": 6.868887191545816e-05, + "loss": 1.1066, + "step": 39320 + }, + { + "epoch": 0.76, + "learning_rate": 6.867486253902638e-05, + "loss": 1.3057, + "step": 39330 + }, + { + "epoch": 0.76, + "learning_rate": 6.86608514586437e-05, + "loss": 1.2619, + "step": 39340 + }, + { + "epoch": 0.76, + "learning_rate": 6.864683867558855e-05, + "loss": 1.1515, + "step": 39350 + }, + { + "epoch": 0.76, + "learning_rate": 6.863282419113952e-05, + "loss": 1.3945, + "step": 39360 + }, + { + "epoch": 0.76, + "learning_rate": 6.86188080065753e-05, + "loss": 1.293, + "step": 39370 + }, + { + "epoch": 0.76, + "learning_rate": 6.86047901231748e-05, + "loss": 1.3497, + "step": 39380 + }, + { + "epoch": 0.76, + "learning_rate": 6.859077054221703e-05, + "loss": 1.3709, + "step": 39390 + }, + { + "epoch": 0.76, + "learning_rate": 6.85767492649812e-05, + "loss": 1.1923, + "step": 39400 + }, + { + "epoch": 0.76, + "learning_rate": 6.856272629274665e-05, + "loss": 1.2464, + "step": 39410 + }, + { + "epoch": 0.76, + "learning_rate": 6.854870162679286e-05, + "loss": 1.212, + "step": 39420 + }, + { + "epoch": 0.76, + "learning_rate": 6.85346752683995e-05, + "loss": 1.3247, + "step": 39430 + }, + { + "epoch": 0.76, + "learning_rate": 6.852064721884636e-05, + "loss": 1.2687, + "step": 39440 + }, + { + "epoch": 0.76, + "learning_rate": 6.850661747941342e-05, + "loss": 1.1797, + "step": 39450 + }, + { + "epoch": 0.76, + "learning_rate": 6.84925860513808e-05, + "loss": 1.4658, + "step": 39460 + }, + { + "epoch": 0.76, + "learning_rate": 6.847855293602874e-05, + "loss": 1.2345, + "step": 39470 + }, + { + "epoch": 0.76, + "learning_rate": 6.846451813463771e-05, + "loss": 1.3541, + "step": 39480 + }, + { + "epoch": 0.76, + "learning_rate": 6.845048164848823e-05, + "loss": 1.2558, + "step": 39490 + }, + { + "epoch": 0.76, + "learning_rate": 6.843644347886109e-05, + "loss": 1.2234, + "step": 39500 + }, + { + "epoch": 0.76, + "learning_rate": 6.842240362703714e-05, + "loss": 1.1507, + "step": 39510 + }, + { + "epoch": 0.76, + "learning_rate": 6.84083620942974e-05, + "loss": 1.3053, + "step": 39520 + }, + { + "epoch": 0.76, + "learning_rate": 6.839431888192314e-05, + "loss": 1.0501, + "step": 39530 + }, + { + "epoch": 0.76, + "learning_rate": 6.838027399119561e-05, + "loss": 1.2126, + "step": 39540 + }, + { + "epoch": 0.76, + "learning_rate": 6.836622742339636e-05, + "loss": 1.1734, + "step": 39550 + }, + { + "epoch": 0.76, + "learning_rate": 6.835217917980704e-05, + "loss": 1.113, + "step": 39560 + }, + { + "epoch": 0.76, + "learning_rate": 6.833812926170943e-05, + "loss": 1.2672, + "step": 39570 + }, + { + "epoch": 0.76, + "learning_rate": 6.832407767038554e-05, + "loss": 0.9944, + "step": 39580 + }, + { + "epoch": 0.76, + "learning_rate": 6.83100244071174e-05, + "loss": 1.3661, + "step": 39590 + }, + { + "epoch": 0.76, + "learning_rate": 6.829596947318734e-05, + "loss": 1.3116, + "step": 39600 + }, + { + "epoch": 0.76, + "learning_rate": 6.828191286987774e-05, + "loss": 1.3279, + "step": 39610 + }, + { + "epoch": 0.76, + "learning_rate": 6.826785459847119e-05, + "loss": 1.1673, + "step": 39620 + }, + { + "epoch": 0.76, + "learning_rate": 6.825379466025039e-05, + "loss": 1.4262, + "step": 39630 + }, + { + "epoch": 0.76, + "learning_rate": 6.823973305649822e-05, + "loss": 1.3877, + "step": 39640 + }, + { + "epoch": 0.76, + "learning_rate": 6.822566978849769e-05, + "loss": 1.2213, + "step": 39650 + }, + { + "epoch": 0.76, + "learning_rate": 6.821160485753198e-05, + "loss": 1.1957, + "step": 39660 + }, + { + "epoch": 0.76, + "learning_rate": 6.819753826488444e-05, + "loss": 1.3698, + "step": 39670 + }, + { + "epoch": 0.76, + "learning_rate": 6.818347001183854e-05, + "loss": 1.2701, + "step": 39680 + }, + { + "epoch": 0.76, + "learning_rate": 6.816940009967787e-05, + "loss": 1.3569, + "step": 39690 + }, + { + "epoch": 0.76, + "learning_rate": 6.815532852968627e-05, + "loss": 1.2205, + "step": 39700 + }, + { + "epoch": 0.76, + "learning_rate": 6.814125530314762e-05, + "loss": 1.2081, + "step": 39710 + }, + { + "epoch": 0.76, + "learning_rate": 6.812718042134604e-05, + "loss": 1.2491, + "step": 39720 + }, + { + "epoch": 0.76, + "learning_rate": 6.811310388556575e-05, + "loss": 1.1939, + "step": 39730 + }, + { + "epoch": 0.76, + "learning_rate": 6.809902569709116e-05, + "loss": 1.0998, + "step": 39740 + }, + { + "epoch": 0.76, + "learning_rate": 6.808494585720677e-05, + "loss": 1.4934, + "step": 39750 + }, + { + "epoch": 0.76, + "learning_rate": 6.807086436719727e-05, + "loss": 1.5166, + "step": 39760 + }, + { + "epoch": 0.76, + "learning_rate": 6.805678122834752e-05, + "loss": 1.2678, + "step": 39770 + }, + { + "epoch": 0.76, + "learning_rate": 6.80426964419425e-05, + "loss": 1.1983, + "step": 39780 + }, + { + "epoch": 0.77, + "learning_rate": 6.802861000926735e-05, + "loss": 1.3412, + "step": 39790 + }, + { + "epoch": 0.77, + "learning_rate": 6.801452193160735e-05, + "loss": 1.2861, + "step": 39800 + }, + { + "epoch": 0.77, + "learning_rate": 6.800043221024794e-05, + "loss": 1.3857, + "step": 39810 + }, + { + "epoch": 0.77, + "learning_rate": 6.798634084647471e-05, + "loss": 1.1595, + "step": 39820 + }, + { + "epoch": 0.77, + "learning_rate": 6.797224784157343e-05, + "loss": 1.358, + "step": 39830 + }, + { + "epoch": 0.77, + "learning_rate": 6.795815319682993e-05, + "loss": 1.3683, + "step": 39840 + }, + { + "epoch": 0.77, + "learning_rate": 6.79440569135303e-05, + "loss": 1.2679, + "step": 39850 + }, + { + "epoch": 0.77, + "learning_rate": 6.792995899296068e-05, + "loss": 1.2655, + "step": 39860 + }, + { + "epoch": 0.77, + "learning_rate": 6.791585943640743e-05, + "loss": 1.197, + "step": 39870 + }, + { + "epoch": 0.77, + "learning_rate": 6.790175824515706e-05, + "loss": 1.4707, + "step": 39880 + }, + { + "epoch": 0.77, + "learning_rate": 6.788765542049618e-05, + "loss": 1.0409, + "step": 39890 + }, + { + "epoch": 0.77, + "learning_rate": 6.787355096371158e-05, + "loss": 1.4909, + "step": 39900 + }, + { + "epoch": 0.77, + "learning_rate": 6.785944487609018e-05, + "loss": 1.4464, + "step": 39910 + }, + { + "epoch": 0.77, + "learning_rate": 6.784533715891908e-05, + "loss": 1.3778, + "step": 39920 + }, + { + "epoch": 0.77, + "learning_rate": 6.783122781348549e-05, + "loss": 1.1798, + "step": 39930 + }, + { + "epoch": 0.77, + "learning_rate": 6.781711684107682e-05, + "loss": 1.3959, + "step": 39940 + }, + { + "epoch": 0.77, + "learning_rate": 6.780300424298059e-05, + "loss": 1.4152, + "step": 39950 + }, + { + "epoch": 0.77, + "learning_rate": 6.778889002048443e-05, + "loss": 1.2672, + "step": 39960 + }, + { + "epoch": 0.77, + "learning_rate": 6.777477417487623e-05, + "loss": 1.204, + "step": 39970 + }, + { + "epoch": 0.77, + "learning_rate": 6.776065670744392e-05, + "loss": 1.2221, + "step": 39980 + }, + { + "epoch": 0.77, + "learning_rate": 6.774653761947566e-05, + "loss": 1.3792, + "step": 39990 + }, + { + "epoch": 0.77, + "learning_rate": 6.773241691225966e-05, + "loss": 1.2647, + "step": 40000 + }, + { + "epoch": 0.77, + "learning_rate": 6.771829458708439e-05, + "loss": 1.3701, + "step": 40010 + }, + { + "epoch": 0.77, + "learning_rate": 6.770417064523838e-05, + "loss": 1.3269, + "step": 40020 + }, + { + "epoch": 0.77, + "learning_rate": 6.769004508801036e-05, + "loss": 1.4423, + "step": 40030 + }, + { + "epoch": 0.77, + "learning_rate": 6.767591791668918e-05, + "loss": 1.3957, + "step": 40040 + }, + { + "epoch": 0.77, + "learning_rate": 6.766178913256383e-05, + "loss": 1.169, + "step": 40050 + }, + { + "epoch": 0.77, + "learning_rate": 6.764765873692351e-05, + "loss": 1.135, + "step": 40060 + }, + { + "epoch": 0.77, + "learning_rate": 6.763352673105747e-05, + "loss": 1.2183, + "step": 40070 + }, + { + "epoch": 0.77, + "learning_rate": 6.761939311625518e-05, + "loss": 1.2422, + "step": 40080 + }, + { + "epoch": 0.77, + "learning_rate": 6.760525789380625e-05, + "loss": 1.2527, + "step": 40090 + }, + { + "epoch": 0.77, + "learning_rate": 6.759112106500039e-05, + "loss": 1.276, + "step": 40100 + }, + { + "epoch": 0.77, + "learning_rate": 6.757698263112749e-05, + "loss": 1.0917, + "step": 40110 + }, + { + "epoch": 0.77, + "learning_rate": 6.756284259347759e-05, + "loss": 1.3492, + "step": 40120 + }, + { + "epoch": 0.77, + "learning_rate": 6.754870095334087e-05, + "loss": 1.4433, + "step": 40130 + }, + { + "epoch": 0.77, + "learning_rate": 6.753455771200769e-05, + "loss": 1.3454, + "step": 40140 + }, + { + "epoch": 0.77, + "learning_rate": 6.752041287076845e-05, + "loss": 1.1753, + "step": 40150 + }, + { + "epoch": 0.77, + "learning_rate": 6.750626643091382e-05, + "loss": 1.2438, + "step": 40160 + }, + { + "epoch": 0.77, + "learning_rate": 6.749211839373456e-05, + "loss": 1.2434, + "step": 40170 + }, + { + "epoch": 0.77, + "learning_rate": 6.747796876052155e-05, + "loss": 1.3341, + "step": 40180 + }, + { + "epoch": 0.77, + "learning_rate": 6.74638175325659e-05, + "loss": 1.1336, + "step": 40190 + }, + { + "epoch": 0.77, + "learning_rate": 6.744966471115874e-05, + "loss": 1.4933, + "step": 40200 + }, + { + "epoch": 0.77, + "learning_rate": 6.743551029759149e-05, + "loss": 1.1898, + "step": 40210 + }, + { + "epoch": 0.77, + "learning_rate": 6.742135429315558e-05, + "loss": 1.3852, + "step": 40220 + }, + { + "epoch": 0.77, + "learning_rate": 6.740719669914268e-05, + "loss": 1.208, + "step": 40230 + }, + { + "epoch": 0.77, + "learning_rate": 6.739303751684455e-05, + "loss": 1.2554, + "step": 40240 + }, + { + "epoch": 0.77, + "learning_rate": 6.737887674755314e-05, + "loss": 1.2452, + "step": 40250 + }, + { + "epoch": 0.77, + "learning_rate": 6.736471439256053e-05, + "loss": 1.2203, + "step": 40260 + }, + { + "epoch": 0.77, + "learning_rate": 6.73505504531589e-05, + "loss": 1.144, + "step": 40270 + }, + { + "epoch": 0.77, + "learning_rate": 6.73363849306406e-05, + "loss": 1.3685, + "step": 40280 + }, + { + "epoch": 0.77, + "learning_rate": 6.732221782629822e-05, + "loss": 1.1862, + "step": 40290 + }, + { + "epoch": 0.77, + "learning_rate": 6.730804914142431e-05, + "loss": 1.3339, + "step": 40300 + }, + { + "epoch": 0.78, + "learning_rate": 6.729387887731171e-05, + "loss": 1.2099, + "step": 40310 + }, + { + "epoch": 0.78, + "learning_rate": 6.727970703525336e-05, + "loss": 1.2817, + "step": 40320 + }, + { + "epoch": 0.78, + "learning_rate": 6.726553361654234e-05, + "loss": 1.2084, + "step": 40330 + }, + { + "epoch": 0.78, + "learning_rate": 6.725135862247189e-05, + "loss": 1.2536, + "step": 40340 + }, + { + "epoch": 0.78, + "learning_rate": 6.723718205433532e-05, + "loss": 1.2808, + "step": 40350 + }, + { + "epoch": 0.78, + "learning_rate": 6.72230039134262e-05, + "loss": 1.3546, + "step": 40360 + }, + { + "epoch": 0.78, + "learning_rate": 6.720882420103816e-05, + "loss": 1.2609, + "step": 40370 + }, + { + "epoch": 0.78, + "learning_rate": 6.719464291846503e-05, + "loss": 1.0784, + "step": 40380 + }, + { + "epoch": 0.78, + "learning_rate": 6.718046006700072e-05, + "loss": 1.2334, + "step": 40390 + }, + { + "epoch": 0.78, + "learning_rate": 6.716627564793933e-05, + "loss": 1.1831, + "step": 40400 + }, + { + "epoch": 0.78, + "learning_rate": 6.715208966257509e-05, + "loss": 1.4768, + "step": 40410 + }, + { + "epoch": 0.78, + "learning_rate": 6.713790211220235e-05, + "loss": 1.1456, + "step": 40420 + }, + { + "epoch": 0.78, + "learning_rate": 6.712371299811567e-05, + "loss": 1.3119, + "step": 40430 + }, + { + "epoch": 0.78, + "learning_rate": 6.710952232160968e-05, + "loss": 1.2658, + "step": 40440 + }, + { + "epoch": 0.78, + "learning_rate": 6.709533008397917e-05, + "loss": 1.2845, + "step": 40450 + }, + { + "epoch": 0.78, + "learning_rate": 6.70811362865191e-05, + "loss": 1.1218, + "step": 40460 + }, + { + "epoch": 0.78, + "learning_rate": 6.706694093052455e-05, + "loss": 1.1409, + "step": 40470 + }, + { + "epoch": 0.78, + "learning_rate": 6.705274401729076e-05, + "loss": 1.3249, + "step": 40480 + }, + { + "epoch": 0.78, + "learning_rate": 6.703854554811308e-05, + "loss": 0.9968, + "step": 40490 + }, + { + "epoch": 0.78, + "learning_rate": 6.702434552428703e-05, + "loss": 1.2545, + "step": 40500 + }, + { + "epoch": 0.78, + "learning_rate": 6.701014394710825e-05, + "loss": 1.366, + "step": 40510 + }, + { + "epoch": 0.78, + "learning_rate": 6.699594081787253e-05, + "loss": 1.2327, + "step": 40520 + }, + { + "epoch": 0.78, + "learning_rate": 6.698173613787586e-05, + "loss": 1.2537, + "step": 40530 + }, + { + "epoch": 0.78, + "learning_rate": 6.696752990841427e-05, + "loss": 1.2219, + "step": 40540 + }, + { + "epoch": 0.78, + "learning_rate": 6.695332213078398e-05, + "loss": 1.3962, + "step": 40550 + }, + { + "epoch": 0.78, + "learning_rate": 6.693911280628136e-05, + "loss": 1.0257, + "step": 40560 + }, + { + "epoch": 0.78, + "learning_rate": 6.692490193620291e-05, + "loss": 1.4341, + "step": 40570 + }, + { + "epoch": 0.78, + "learning_rate": 6.691068952184527e-05, + "loss": 1.3693, + "step": 40580 + }, + { + "epoch": 0.78, + "learning_rate": 6.689647556450525e-05, + "loss": 1.2385, + "step": 40590 + }, + { + "epoch": 0.78, + "learning_rate": 6.688226006547973e-05, + "loss": 1.2903, + "step": 40600 + }, + { + "epoch": 0.78, + "learning_rate": 6.686804302606582e-05, + "loss": 1.2775, + "step": 40610 + }, + { + "epoch": 0.78, + "learning_rate": 6.685382444756068e-05, + "loss": 1.2731, + "step": 40620 + }, + { + "epoch": 0.78, + "learning_rate": 6.683960433126168e-05, + "loss": 1.1435, + "step": 40630 + }, + { + "epoch": 0.78, + "learning_rate": 6.682538267846632e-05, + "loss": 1.2533, + "step": 40640 + }, + { + "epoch": 0.78, + "learning_rate": 6.68111594904722e-05, + "loss": 1.2658, + "step": 40650 + }, + { + "epoch": 0.78, + "learning_rate": 6.679693476857711e-05, + "loss": 1.2501, + "step": 40660 + }, + { + "epoch": 0.78, + "learning_rate": 6.678270851407893e-05, + "loss": 1.3579, + "step": 40670 + }, + { + "epoch": 0.78, + "learning_rate": 6.676848072827574e-05, + "loss": 1.1907, + "step": 40680 + }, + { + "epoch": 0.78, + "learning_rate": 6.675425141246571e-05, + "loss": 1.1671, + "step": 40690 + }, + { + "epoch": 0.78, + "learning_rate": 6.674002056794715e-05, + "loss": 1.1534, + "step": 40700 + }, + { + "epoch": 0.78, + "learning_rate": 6.672578819601854e-05, + "loss": 1.0911, + "step": 40710 + }, + { + "epoch": 0.78, + "learning_rate": 6.671155429797848e-05, + "loss": 1.4156, + "step": 40720 + }, + { + "epoch": 0.78, + "learning_rate": 6.669731887512574e-05, + "loss": 1.2791, + "step": 40730 + }, + { + "epoch": 0.78, + "learning_rate": 6.668308192875916e-05, + "loss": 1.1994, + "step": 40740 + }, + { + "epoch": 0.78, + "learning_rate": 6.666884346017779e-05, + "loss": 1.3724, + "step": 40750 + }, + { + "epoch": 0.78, + "learning_rate": 6.665460347068078e-05, + "loss": 1.192, + "step": 40760 + }, + { + "epoch": 0.78, + "learning_rate": 6.664036196156742e-05, + "loss": 1.2747, + "step": 40770 + }, + { + "epoch": 0.78, + "learning_rate": 6.662611893413718e-05, + "loss": 1.2047, + "step": 40780 + }, + { + "epoch": 0.78, + "learning_rate": 6.661187438968962e-05, + "loss": 1.2685, + "step": 40790 + }, + { + "epoch": 0.78, + "learning_rate": 6.659762832952445e-05, + "loss": 1.3452, + "step": 40800 + }, + { + "epoch": 0.78, + "learning_rate": 6.658338075494151e-05, + "loss": 1.2788, + "step": 40810 + }, + { + "epoch": 0.78, + "learning_rate": 6.656913166724082e-05, + "loss": 1.0796, + "step": 40820 + }, + { + "epoch": 0.79, + "learning_rate": 6.655488106772251e-05, + "loss": 1.2695, + "step": 40830 + }, + { + "epoch": 0.79, + "learning_rate": 6.654062895768682e-05, + "loss": 1.3074, + "step": 40840 + }, + { + "epoch": 0.79, + "learning_rate": 6.65263753384342e-05, + "loss": 1.2268, + "step": 40850 + }, + { + "epoch": 0.79, + "learning_rate": 6.651212021126513e-05, + "loss": 1.4, + "step": 40860 + }, + { + "epoch": 0.79, + "learning_rate": 6.649786357748033e-05, + "loss": 1.2685, + "step": 40870 + }, + { + "epoch": 0.79, + "learning_rate": 6.648360543838063e-05, + "loss": 1.3608, + "step": 40880 + }, + { + "epoch": 0.79, + "learning_rate": 6.646934579526696e-05, + "loss": 1.1392, + "step": 40890 + }, + { + "epoch": 0.79, + "learning_rate": 6.645508464944044e-05, + "loss": 1.1834, + "step": 40900 + }, + { + "epoch": 0.79, + "learning_rate": 6.644082200220226e-05, + "loss": 1.3361, + "step": 40910 + }, + { + "epoch": 0.79, + "learning_rate": 6.642655785485383e-05, + "loss": 1.2986, + "step": 40920 + }, + { + "epoch": 0.79, + "learning_rate": 6.641229220869663e-05, + "loss": 1.2302, + "step": 40930 + }, + { + "epoch": 0.79, + "learning_rate": 6.639802506503228e-05, + "loss": 1.2555, + "step": 40940 + }, + { + "epoch": 0.79, + "learning_rate": 6.638375642516261e-05, + "loss": 1.1616, + "step": 40950 + }, + { + "epoch": 0.79, + "learning_rate": 6.63694862903895e-05, + "loss": 1.6905, + "step": 40960 + }, + { + "epoch": 0.79, + "learning_rate": 6.6355214662015e-05, + "loss": 1.2973, + "step": 40970 + }, + { + "epoch": 0.79, + "learning_rate": 6.634094154134129e-05, + "loss": 1.3576, + "step": 40980 + }, + { + "epoch": 0.79, + "learning_rate": 6.632666692967073e-05, + "loss": 1.3233, + "step": 40990 + }, + { + "epoch": 0.79, + "learning_rate": 6.631239082830575e-05, + "loss": 1.2005, + "step": 41000 + }, + { + "epoch": 0.79, + "learning_rate": 6.629811323854893e-05, + "loss": 1.0917, + "step": 41010 + }, + { + "epoch": 0.79, + "learning_rate": 6.628383416170302e-05, + "loss": 1.1465, + "step": 41020 + }, + { + "epoch": 0.79, + "learning_rate": 6.62695535990709e-05, + "loss": 1.2488, + "step": 41030 + }, + { + "epoch": 0.79, + "learning_rate": 6.625527155195556e-05, + "loss": 1.2618, + "step": 41040 + }, + { + "epoch": 0.79, + "learning_rate": 6.624098802166012e-05, + "loss": 1.2121, + "step": 41050 + }, + { + "epoch": 0.79, + "learning_rate": 6.622670300948788e-05, + "loss": 1.2653, + "step": 41060 + }, + { + "epoch": 0.79, + "learning_rate": 6.621241651674222e-05, + "loss": 1.3095, + "step": 41070 + }, + { + "epoch": 0.79, + "learning_rate": 6.61981285447267e-05, + "loss": 1.1277, + "step": 41080 + }, + { + "epoch": 0.79, + "learning_rate": 6.6183839094745e-05, + "loss": 1.413, + "step": 41090 + }, + { + "epoch": 0.79, + "learning_rate": 6.616954816810093e-05, + "loss": 1.2168, + "step": 41100 + }, + { + "epoch": 0.79, + "learning_rate": 6.615525576609842e-05, + "loss": 1.1659, + "step": 41110 + }, + { + "epoch": 0.79, + "learning_rate": 6.614096189004158e-05, + "loss": 1.157, + "step": 41120 + }, + { + "epoch": 0.79, + "learning_rate": 6.61266665412346e-05, + "loss": 1.5425, + "step": 41130 + }, + { + "epoch": 0.79, + "learning_rate": 6.611236972098185e-05, + "loss": 1.375, + "step": 41140 + }, + { + "epoch": 0.79, + "learning_rate": 6.609807143058782e-05, + "loss": 1.1938, + "step": 41150 + }, + { + "epoch": 0.79, + "learning_rate": 6.60837716713571e-05, + "loss": 1.1169, + "step": 41160 + }, + { + "epoch": 0.79, + "learning_rate": 6.606947044459446e-05, + "loss": 1.3525, + "step": 41170 + }, + { + "epoch": 0.79, + "learning_rate": 6.605516775160479e-05, + "loss": 1.3685, + "step": 41180 + }, + { + "epoch": 0.79, + "learning_rate": 6.604086359369312e-05, + "loss": 1.1121, + "step": 41190 + }, + { + "epoch": 0.79, + "learning_rate": 6.602655797216459e-05, + "loss": 1.2515, + "step": 41200 + }, + { + "epoch": 0.79, + "learning_rate": 6.601225088832448e-05, + "loss": 1.3406, + "step": 41210 + }, + { + "epoch": 0.79, + "learning_rate": 6.599794234347825e-05, + "loss": 1.3324, + "step": 41220 + }, + { + "epoch": 0.79, + "learning_rate": 6.59836323389314e-05, + "loss": 1.322, + "step": 41230 + }, + { + "epoch": 0.79, + "learning_rate": 6.596932087598966e-05, + "loss": 1.3533, + "step": 41240 + }, + { + "epoch": 0.79, + "learning_rate": 6.595500795595884e-05, + "loss": 1.2722, + "step": 41250 + }, + { + "epoch": 0.79, + "learning_rate": 6.594069358014489e-05, + "loss": 1.5871, + "step": 41260 + }, + { + "epoch": 0.79, + "learning_rate": 6.592637774985389e-05, + "loss": 1.2411, + "step": 41270 + }, + { + "epoch": 0.79, + "learning_rate": 6.591206046639207e-05, + "loss": 1.405, + "step": 41280 + }, + { + "epoch": 0.79, + "learning_rate": 6.589774173106578e-05, + "loss": 1.101, + "step": 41290 + }, + { + "epoch": 0.79, + "learning_rate": 6.58834215451815e-05, + "loss": 1.0542, + "step": 41300 + }, + { + "epoch": 0.79, + "learning_rate": 6.586909991004586e-05, + "loss": 1.3303, + "step": 41310 + }, + { + "epoch": 0.79, + "learning_rate": 6.58547768269656e-05, + "loss": 1.5177, + "step": 41320 + }, + { + "epoch": 0.79, + "learning_rate": 6.58404522972476e-05, + "loss": 1.4671, + "step": 41330 + }, + { + "epoch": 0.79, + "learning_rate": 6.582612632219888e-05, + "loss": 1.2435, + "step": 41340 + }, + { + "epoch": 0.8, + "learning_rate": 6.581179890312658e-05, + "loss": 1.3567, + "step": 41350 + }, + { + "epoch": 0.8, + "learning_rate": 6.579747004133797e-05, + "loss": 1.2182, + "step": 41360 + }, + { + "epoch": 0.8, + "learning_rate": 6.578313973814048e-05, + "loss": 1.4492, + "step": 41370 + }, + { + "epoch": 0.8, + "learning_rate": 6.576880799484162e-05, + "loss": 1.2936, + "step": 41380 + }, + { + "epoch": 0.8, + "learning_rate": 6.575447481274909e-05, + "loss": 1.2785, + "step": 41390 + }, + { + "epoch": 0.8, + "learning_rate": 6.574014019317069e-05, + "loss": 1.3432, + "step": 41400 + }, + { + "epoch": 0.8, + "learning_rate": 6.572580413741433e-05, + "loss": 1.3113, + "step": 41410 + }, + { + "epoch": 0.8, + "learning_rate": 6.571146664678809e-05, + "loss": 1.2227, + "step": 41420 + }, + { + "epoch": 0.8, + "learning_rate": 6.569712772260017e-05, + "loss": 1.2008, + "step": 41430 + }, + { + "epoch": 0.8, + "learning_rate": 6.56827873661589e-05, + "loss": 1.3844, + "step": 41440 + }, + { + "epoch": 0.8, + "learning_rate": 6.566844557877271e-05, + "loss": 1.2153, + "step": 41450 + }, + { + "epoch": 0.8, + "learning_rate": 6.565410236175024e-05, + "loss": 1.2094, + "step": 41460 + }, + { + "epoch": 0.8, + "learning_rate": 6.563975771640013e-05, + "loss": 1.3363, + "step": 41470 + }, + { + "epoch": 0.8, + "learning_rate": 6.562541164403132e-05, + "loss": 1.1893, + "step": 41480 + }, + { + "epoch": 0.8, + "learning_rate": 6.561106414595273e-05, + "loss": 1.3546, + "step": 41490 + }, + { + "epoch": 0.8, + "learning_rate": 6.559671522347348e-05, + "loss": 1.2487, + "step": 41500 + }, + { + "epoch": 0.8, + "learning_rate": 6.558236487790282e-05, + "loss": 1.2374, + "step": 41510 + }, + { + "epoch": 0.8, + "learning_rate": 6.556801311055011e-05, + "loss": 1.2347, + "step": 41520 + }, + { + "epoch": 0.8, + "learning_rate": 6.555365992272484e-05, + "loss": 1.2922, + "step": 41530 + }, + { + "epoch": 0.8, + "learning_rate": 6.553930531573667e-05, + "loss": 1.3913, + "step": 41540 + }, + { + "epoch": 0.8, + "learning_rate": 6.552494929089533e-05, + "loss": 1.2582, + "step": 41550 + }, + { + "epoch": 0.8, + "learning_rate": 6.55105918495107e-05, + "loss": 1.35, + "step": 41560 + }, + { + "epoch": 0.8, + "learning_rate": 6.54962329928928e-05, + "loss": 1.2943, + "step": 41570 + }, + { + "epoch": 0.8, + "learning_rate": 6.54818727223518e-05, + "loss": 1.2681, + "step": 41580 + }, + { + "epoch": 0.8, + "learning_rate": 6.546751103919797e-05, + "loss": 1.2389, + "step": 41590 + }, + { + "epoch": 0.8, + "learning_rate": 6.545314794474169e-05, + "loss": 1.1527, + "step": 41600 + }, + { + "epoch": 0.8, + "learning_rate": 6.543878344029351e-05, + "loss": 1.3653, + "step": 41610 + }, + { + "epoch": 0.8, + "learning_rate": 6.542441752716408e-05, + "loss": 1.065, + "step": 41620 + }, + { + "epoch": 0.8, + "learning_rate": 6.54100502066642e-05, + "loss": 1.3513, + "step": 41630 + }, + { + "epoch": 0.8, + "learning_rate": 6.539568148010476e-05, + "loss": 1.3165, + "step": 41640 + }, + { + "epoch": 0.8, + "learning_rate": 6.538131134879687e-05, + "loss": 1.2392, + "step": 41650 + }, + { + "epoch": 0.8, + "learning_rate": 6.536693981405164e-05, + "loss": 1.6127, + "step": 41660 + }, + { + "epoch": 0.8, + "learning_rate": 6.535256687718039e-05, + "loss": 1.0471, + "step": 41670 + }, + { + "epoch": 0.8, + "learning_rate": 6.533819253949456e-05, + "loss": 1.1159, + "step": 41680 + }, + { + "epoch": 0.8, + "learning_rate": 6.532381680230571e-05, + "loss": 1.388, + "step": 41690 + }, + { + "epoch": 0.8, + "learning_rate": 6.530943966692553e-05, + "loss": 1.4454, + "step": 41700 + }, + { + "epoch": 0.8, + "learning_rate": 6.529506113466579e-05, + "loss": 1.1383, + "step": 41710 + }, + { + "epoch": 0.8, + "learning_rate": 6.52806812068385e-05, + "loss": 1.6383, + "step": 41720 + }, + { + "epoch": 0.8, + "learning_rate": 6.526629988475567e-05, + "loss": 1.4252, + "step": 41730 + }, + { + "epoch": 0.8, + "learning_rate": 6.52519171697295e-05, + "loss": 1.2667, + "step": 41740 + }, + { + "epoch": 0.8, + "learning_rate": 6.523753306307235e-05, + "loss": 1.3625, + "step": 41750 + }, + { + "epoch": 0.8, + "learning_rate": 6.522314756609665e-05, + "loss": 1.242, + "step": 41760 + }, + { + "epoch": 0.8, + "learning_rate": 6.520876068011498e-05, + "loss": 1.2406, + "step": 41770 + }, + { + "epoch": 0.8, + "learning_rate": 6.519437240644002e-05, + "loss": 1.1479, + "step": 41780 + }, + { + "epoch": 0.8, + "learning_rate": 6.517998274638462e-05, + "loss": 1.1082, + "step": 41790 + }, + { + "epoch": 0.8, + "learning_rate": 6.516559170126174e-05, + "loss": 1.5322, + "step": 41800 + }, + { + "epoch": 0.8, + "learning_rate": 6.515119927238446e-05, + "loss": 1.3253, + "step": 41810 + }, + { + "epoch": 0.8, + "learning_rate": 6.513680546106598e-05, + "loss": 1.3413, + "step": 41820 + }, + { + "epoch": 0.8, + "learning_rate": 6.512241026861963e-05, + "loss": 1.3393, + "step": 41830 + }, + { + "epoch": 0.8, + "learning_rate": 6.510801369635888e-05, + "loss": 1.1759, + "step": 41840 + }, + { + "epoch": 0.8, + "learning_rate": 6.509361574559733e-05, + "loss": 1.2599, + "step": 41850 + }, + { + "epoch": 0.8, + "learning_rate": 6.507921641764867e-05, + "loss": 1.2834, + "step": 41860 + }, + { + "epoch": 0.81, + "learning_rate": 6.506481571382674e-05, + "loss": 1.2137, + "step": 41870 + }, + { + "epoch": 0.81, + "learning_rate": 6.505041363544553e-05, + "loss": 1.2684, + "step": 41880 + }, + { + "epoch": 0.81, + "learning_rate": 6.50360101838191e-05, + "loss": 1.2873, + "step": 41890 + }, + { + "epoch": 0.81, + "learning_rate": 6.502160536026167e-05, + "loss": 1.3106, + "step": 41900 + }, + { + "epoch": 0.81, + "learning_rate": 6.500719916608759e-05, + "loss": 1.3021, + "step": 41910 + }, + { + "epoch": 0.81, + "learning_rate": 6.499279160261132e-05, + "loss": 1.3459, + "step": 41920 + }, + { + "epoch": 0.81, + "learning_rate": 6.497838267114744e-05, + "loss": 1.1842, + "step": 41930 + }, + { + "epoch": 0.81, + "learning_rate": 6.496397237301068e-05, + "loss": 1.2094, + "step": 41940 + }, + { + "epoch": 0.81, + "learning_rate": 6.494956070951586e-05, + "loss": 1.2897, + "step": 41950 + }, + { + "epoch": 0.81, + "learning_rate": 6.493514768197798e-05, + "loss": 1.4416, + "step": 41960 + }, + { + "epoch": 0.81, + "learning_rate": 6.492073329171208e-05, + "loss": 1.1711, + "step": 41970 + }, + { + "epoch": 0.81, + "learning_rate": 6.49063175400334e-05, + "loss": 1.144, + "step": 41980 + }, + { + "epoch": 0.81, + "learning_rate": 6.489190042825729e-05, + "loss": 1.2351, + "step": 41990 + }, + { + "epoch": 0.81, + "learning_rate": 6.487748195769918e-05, + "loss": 1.2817, + "step": 42000 + }, + { + "epoch": 0.81, + "learning_rate": 6.486306212967467e-05, + "loss": 1.178, + "step": 42010 + }, + { + "epoch": 0.81, + "learning_rate": 6.484864094549949e-05, + "loss": 1.2329, + "step": 42020 + }, + { + "epoch": 0.81, + "learning_rate": 6.483421840648941e-05, + "loss": 1.2751, + "step": 42030 + }, + { + "epoch": 0.81, + "learning_rate": 6.481979451396046e-05, + "loss": 1.064, + "step": 42040 + }, + { + "epoch": 0.81, + "learning_rate": 6.480536926922867e-05, + "loss": 1.4848, + "step": 42050 + }, + { + "epoch": 0.81, + "learning_rate": 6.479094267361025e-05, + "loss": 1.0586, + "step": 42060 + }, + { + "epoch": 0.81, + "learning_rate": 6.477651472842154e-05, + "loss": 1.2421, + "step": 42070 + }, + { + "epoch": 0.81, + "learning_rate": 6.4762085434979e-05, + "loss": 1.2807, + "step": 42080 + }, + { + "epoch": 0.81, + "learning_rate": 6.474765479459917e-05, + "loss": 1.4826, + "step": 42090 + }, + { + "epoch": 0.81, + "learning_rate": 6.473322280859877e-05, + "loss": 1.2489, + "step": 42100 + }, + { + "epoch": 0.81, + "learning_rate": 6.47187894782946e-05, + "loss": 1.3564, + "step": 42110 + }, + { + "epoch": 0.81, + "learning_rate": 6.470435480500362e-05, + "loss": 1.2247, + "step": 42120 + }, + { + "epoch": 0.81, + "learning_rate": 6.468991879004287e-05, + "loss": 1.2853, + "step": 42130 + }, + { + "epoch": 0.81, + "learning_rate": 6.467548143472955e-05, + "loss": 1.2756, + "step": 42140 + }, + { + "epoch": 0.81, + "learning_rate": 6.466104274038099e-05, + "loss": 1.4013, + "step": 42150 + }, + { + "epoch": 0.81, + "learning_rate": 6.464660270831458e-05, + "loss": 1.2552, + "step": 42160 + }, + { + "epoch": 0.81, + "learning_rate": 6.463216133984788e-05, + "loss": 1.2458, + "step": 42170 + }, + { + "epoch": 0.81, + "learning_rate": 6.461771863629859e-05, + "loss": 1.1625, + "step": 42180 + }, + { + "epoch": 0.81, + "learning_rate": 6.460327459898448e-05, + "loss": 1.3145, + "step": 42190 + }, + { + "epoch": 0.81, + "learning_rate": 6.458882922922348e-05, + "loss": 1.1647, + "step": 42200 + }, + { + "epoch": 0.81, + "learning_rate": 6.457438252833362e-05, + "loss": 1.2926, + "step": 42210 + }, + { + "epoch": 0.81, + "learning_rate": 6.455993449763307e-05, + "loss": 1.3975, + "step": 42220 + }, + { + "epoch": 0.81, + "learning_rate": 6.454548513844011e-05, + "loss": 1.56, + "step": 42230 + }, + { + "epoch": 0.81, + "learning_rate": 6.453103445207313e-05, + "loss": 1.3542, + "step": 42240 + }, + { + "epoch": 0.81, + "learning_rate": 6.451658243985068e-05, + "loss": 1.2432, + "step": 42250 + }, + { + "epoch": 0.81, + "learning_rate": 6.45021291030914e-05, + "loss": 1.3524, + "step": 42260 + }, + { + "epoch": 0.81, + "learning_rate": 6.448767444311404e-05, + "loss": 1.3627, + "step": 42270 + }, + { + "epoch": 0.81, + "learning_rate": 6.447321846123748e-05, + "loss": 1.2118, + "step": 42280 + }, + { + "epoch": 0.81, + "learning_rate": 6.445876115878075e-05, + "loss": 1.2069, + "step": 42290 + }, + { + "epoch": 0.81, + "learning_rate": 6.444430253706296e-05, + "loss": 1.1955, + "step": 42300 + }, + { + "epoch": 0.81, + "learning_rate": 6.442984259740339e-05, + "loss": 1.5169, + "step": 42310 + }, + { + "epoch": 0.81, + "learning_rate": 6.441538134112139e-05, + "loss": 1.1561, + "step": 42320 + }, + { + "epoch": 0.81, + "learning_rate": 6.440091876953641e-05, + "loss": 1.2089, + "step": 42330 + }, + { + "epoch": 0.81, + "learning_rate": 6.438645488396812e-05, + "loss": 1.2732, + "step": 42340 + }, + { + "epoch": 0.81, + "learning_rate": 6.43719896857362e-05, + "loss": 1.1662, + "step": 42350 + }, + { + "epoch": 0.81, + "learning_rate": 6.435752317616056e-05, + "loss": 1.306, + "step": 42360 + }, + { + "epoch": 0.81, + "learning_rate": 6.43430553565611e-05, + "loss": 1.2564, + "step": 42370 + }, + { + "epoch": 0.81, + "learning_rate": 6.432858622825794e-05, + "loss": 1.3372, + "step": 42380 + }, + { + "epoch": 0.82, + "learning_rate": 6.43141157925713e-05, + "loss": 1.4228, + "step": 42390 + }, + { + "epoch": 0.82, + "learning_rate": 6.429964405082145e-05, + "loss": 1.3389, + "step": 42400 + }, + { + "epoch": 0.82, + "learning_rate": 6.428517100432891e-05, + "loss": 1.2351, + "step": 42410 + }, + { + "epoch": 0.82, + "learning_rate": 6.42706966544142e-05, + "loss": 1.489, + "step": 42420 + }, + { + "epoch": 0.82, + "learning_rate": 6.425622100239803e-05, + "loss": 1.2079, + "step": 42430 + }, + { + "epoch": 0.82, + "learning_rate": 6.424174404960116e-05, + "loss": 1.4864, + "step": 42440 + }, + { + "epoch": 0.82, + "learning_rate": 6.422726579734454e-05, + "loss": 1.3409, + "step": 42450 + }, + { + "epoch": 0.82, + "learning_rate": 6.421278624694922e-05, + "loss": 1.3894, + "step": 42460 + }, + { + "epoch": 0.82, + "learning_rate": 6.419830539973633e-05, + "loss": 1.1874, + "step": 42470 + }, + { + "epoch": 0.82, + "learning_rate": 6.418382325702717e-05, + "loss": 1.3227, + "step": 42480 + }, + { + "epoch": 0.82, + "learning_rate": 6.416933982014311e-05, + "loss": 1.2721, + "step": 42490 + }, + { + "epoch": 0.82, + "learning_rate": 6.415485509040569e-05, + "loss": 1.1866, + "step": 42500 + }, + { + "epoch": 0.82, + "learning_rate": 6.414036906913653e-05, + "loss": 1.186, + "step": 42510 + }, + { + "epoch": 0.82, + "learning_rate": 6.412588175765735e-05, + "loss": 1.3188, + "step": 42520 + }, + { + "epoch": 0.82, + "learning_rate": 6.411139315729007e-05, + "loss": 1.0726, + "step": 42530 + }, + { + "epoch": 0.82, + "learning_rate": 6.409690326935663e-05, + "loss": 1.3239, + "step": 42540 + }, + { + "epoch": 0.82, + "learning_rate": 6.408241209517916e-05, + "loss": 1.1542, + "step": 42550 + }, + { + "epoch": 0.82, + "learning_rate": 6.406791963607986e-05, + "loss": 1.2571, + "step": 42560 + }, + { + "epoch": 0.82, + "learning_rate": 6.405342589338106e-05, + "loss": 1.2236, + "step": 42570 + }, + { + "epoch": 0.82, + "learning_rate": 6.403893086840524e-05, + "loss": 1.2927, + "step": 42580 + }, + { + "epoch": 0.82, + "learning_rate": 6.402443456247495e-05, + "loss": 1.2065, + "step": 42590 + }, + { + "epoch": 0.82, + "learning_rate": 6.400993697691286e-05, + "loss": 1.3056, + "step": 42600 + }, + { + "epoch": 0.82, + "learning_rate": 6.399543811304182e-05, + "loss": 1.3691, + "step": 42610 + }, + { + "epoch": 0.82, + "learning_rate": 6.398093797218471e-05, + "loss": 1.3675, + "step": 42620 + }, + { + "epoch": 0.82, + "learning_rate": 6.396643655566459e-05, + "loss": 1.4081, + "step": 42630 + }, + { + "epoch": 0.82, + "learning_rate": 6.395193386480458e-05, + "loss": 1.4473, + "step": 42640 + }, + { + "epoch": 0.82, + "learning_rate": 6.3937429900928e-05, + "loss": 1.3952, + "step": 42650 + }, + { + "epoch": 0.82, + "learning_rate": 6.392292466535821e-05, + "loss": 1.1626, + "step": 42660 + }, + { + "epoch": 0.82, + "learning_rate": 6.39084181594187e-05, + "loss": 1.1766, + "step": 42670 + }, + { + "epoch": 0.82, + "learning_rate": 6.38939103844331e-05, + "loss": 1.1239, + "step": 42680 + }, + { + "epoch": 0.82, + "learning_rate": 6.387940134172512e-05, + "loss": 1.141, + "step": 42690 + }, + { + "epoch": 0.82, + "learning_rate": 6.386489103261866e-05, + "loss": 1.2631, + "step": 42700 + }, + { + "epoch": 0.82, + "learning_rate": 6.385037945843763e-05, + "loss": 1.2475, + "step": 42710 + }, + { + "epoch": 0.82, + "learning_rate": 6.383586662050615e-05, + "loss": 1.1423, + "step": 42720 + }, + { + "epoch": 0.82, + "learning_rate": 6.38213525201484e-05, + "loss": 1.1956, + "step": 42730 + }, + { + "epoch": 0.82, + "learning_rate": 6.380683715868868e-05, + "loss": 1.4148, + "step": 42740 + }, + { + "epoch": 0.82, + "learning_rate": 6.379232053745143e-05, + "loss": 1.3062, + "step": 42750 + }, + { + "epoch": 0.82, + "learning_rate": 6.377780265776119e-05, + "loss": 1.181, + "step": 42760 + }, + { + "epoch": 0.82, + "learning_rate": 6.376328352094261e-05, + "loss": 1.3373, + "step": 42770 + }, + { + "epoch": 0.82, + "learning_rate": 6.374876312832045e-05, + "loss": 1.0841, + "step": 42780 + }, + { + "epoch": 0.82, + "learning_rate": 6.37342414812196e-05, + "loss": 1.2136, + "step": 42790 + }, + { + "epoch": 0.82, + "learning_rate": 6.371971858096508e-05, + "loss": 1.321, + "step": 42800 + }, + { + "epoch": 0.82, + "learning_rate": 6.370519442888198e-05, + "loss": 1.0532, + "step": 42810 + }, + { + "epoch": 0.82, + "learning_rate": 6.369066902629554e-05, + "loss": 1.4423, + "step": 42820 + }, + { + "epoch": 0.82, + "learning_rate": 6.367614237453109e-05, + "loss": 1.0898, + "step": 42830 + }, + { + "epoch": 0.82, + "learning_rate": 6.366161447491409e-05, + "loss": 1.2214, + "step": 42840 + }, + { + "epoch": 0.82, + "learning_rate": 6.364708532877011e-05, + "loss": 1.4078, + "step": 42850 + }, + { + "epoch": 0.82, + "learning_rate": 6.363255493742485e-05, + "loss": 1.2411, + "step": 42860 + }, + { + "epoch": 0.82, + "learning_rate": 6.361802330220408e-05, + "loss": 1.5121, + "step": 42870 + }, + { + "epoch": 0.82, + "learning_rate": 6.360349042443372e-05, + "loss": 1.274, + "step": 42880 + }, + { + "epoch": 0.82, + "learning_rate": 6.35889563054398e-05, + "loss": 0.9965, + "step": 42890 + }, + { + "epoch": 0.82, + "learning_rate": 6.357442094654844e-05, + "loss": 1.4703, + "step": 42900 + }, + { + "epoch": 0.83, + "learning_rate": 6.355988434908591e-05, + "loss": 1.2478, + "step": 42910 + }, + { + "epoch": 0.83, + "learning_rate": 6.354534651437858e-05, + "loss": 1.2753, + "step": 42920 + }, + { + "epoch": 0.83, + "learning_rate": 6.353080744375289e-05, + "loss": 1.2868, + "step": 42930 + }, + { + "epoch": 0.83, + "learning_rate": 6.351626713853546e-05, + "loss": 1.5025, + "step": 42940 + }, + { + "epoch": 0.83, + "learning_rate": 6.350172560005297e-05, + "loss": 1.1236, + "step": 42950 + }, + { + "epoch": 0.83, + "learning_rate": 6.348718282963225e-05, + "loss": 1.2961, + "step": 42960 + }, + { + "epoch": 0.83, + "learning_rate": 6.347263882860024e-05, + "loss": 1.2968, + "step": 42970 + }, + { + "epoch": 0.83, + "learning_rate": 6.345809359828394e-05, + "loss": 1.2247, + "step": 42980 + }, + { + "epoch": 0.83, + "learning_rate": 6.344354714001053e-05, + "loss": 1.3518, + "step": 42990 + }, + { + "epoch": 0.83, + "learning_rate": 6.342899945510726e-05, + "loss": 1.218, + "step": 43000 + }, + { + "epoch": 0.83, + "learning_rate": 6.34144505449015e-05, + "loss": 1.4158, + "step": 43010 + }, + { + "epoch": 0.83, + "learning_rate": 6.339990041072076e-05, + "loss": 1.2148, + "step": 43020 + }, + { + "epoch": 0.83, + "learning_rate": 6.338534905389263e-05, + "loss": 1.2138, + "step": 43030 + }, + { + "epoch": 0.83, + "learning_rate": 6.33707964757448e-05, + "loss": 1.4384, + "step": 43040 + }, + { + "epoch": 0.83, + "learning_rate": 6.335624267760511e-05, + "loss": 1.2074, + "step": 43050 + }, + { + "epoch": 0.83, + "learning_rate": 6.334168766080146e-05, + "loss": 1.1725, + "step": 43060 + }, + { + "epoch": 0.83, + "learning_rate": 6.332713142666196e-05, + "loss": 1.6475, + "step": 43070 + }, + { + "epoch": 0.83, + "learning_rate": 6.33125739765147e-05, + "loss": 1.2646, + "step": 43080 + }, + { + "epoch": 0.83, + "learning_rate": 6.329801531168798e-05, + "loss": 1.3386, + "step": 43090 + }, + { + "epoch": 0.83, + "learning_rate": 6.328345543351017e-05, + "loss": 1.2757, + "step": 43100 + }, + { + "epoch": 0.83, + "learning_rate": 6.326889434330974e-05, + "loss": 1.1713, + "step": 43110 + }, + { + "epoch": 0.83, + "learning_rate": 6.325433204241533e-05, + "loss": 1.0476, + "step": 43120 + }, + { + "epoch": 0.83, + "learning_rate": 6.323976853215558e-05, + "loss": 1.2316, + "step": 43130 + }, + { + "epoch": 0.83, + "learning_rate": 6.322520381385939e-05, + "loss": 1.1872, + "step": 43140 + }, + { + "epoch": 0.83, + "learning_rate": 6.321063788885563e-05, + "loss": 1.2907, + "step": 43150 + }, + { + "epoch": 0.83, + "learning_rate": 6.319607075847336e-05, + "loss": 1.2398, + "step": 43160 + }, + { + "epoch": 0.83, + "learning_rate": 6.318150242404173e-05, + "loss": 1.3694, + "step": 43170 + }, + { + "epoch": 0.83, + "learning_rate": 6.316693288688998e-05, + "loss": 1.4406, + "step": 43180 + }, + { + "epoch": 0.83, + "learning_rate": 6.31523621483475e-05, + "loss": 1.3017, + "step": 43190 + }, + { + "epoch": 0.83, + "learning_rate": 6.313779020974378e-05, + "loss": 1.1724, + "step": 43200 + }, + { + "epoch": 0.83, + "learning_rate": 6.312321707240837e-05, + "loss": 1.2338, + "step": 43210 + }, + { + "epoch": 0.83, + "learning_rate": 6.310864273767101e-05, + "loss": 1.313, + "step": 43220 + }, + { + "epoch": 0.83, + "learning_rate": 6.309406720686146e-05, + "loss": 1.2621, + "step": 43230 + }, + { + "epoch": 0.83, + "learning_rate": 6.307949048130966e-05, + "loss": 1.3434, + "step": 43240 + }, + { + "epoch": 0.83, + "learning_rate": 6.306491256234564e-05, + "loss": 1.24, + "step": 43250 + }, + { + "epoch": 0.83, + "learning_rate": 6.305033345129952e-05, + "loss": 1.3646, + "step": 43260 + }, + { + "epoch": 0.83, + "learning_rate": 6.303575314950157e-05, + "loss": 1.3708, + "step": 43270 + }, + { + "epoch": 0.83, + "learning_rate": 6.302117165828209e-05, + "loss": 1.3543, + "step": 43280 + }, + { + "epoch": 0.83, + "learning_rate": 6.300658897897158e-05, + "loss": 1.0116, + "step": 43290 + }, + { + "epoch": 0.83, + "learning_rate": 6.29920051129006e-05, + "loss": 1.4362, + "step": 43300 + }, + { + "epoch": 0.83, + "learning_rate": 6.297742006139981e-05, + "loss": 1.4389, + "step": 43310 + }, + { + "epoch": 0.83, + "learning_rate": 6.296283382580004e-05, + "loss": 1.3645, + "step": 43320 + }, + { + "epoch": 0.83, + "learning_rate": 6.29482464074321e-05, + "loss": 1.1605, + "step": 43330 + }, + { + "epoch": 0.83, + "learning_rate": 6.293365780762708e-05, + "loss": 1.1094, + "step": 43340 + }, + { + "epoch": 0.83, + "learning_rate": 6.291906802771603e-05, + "loss": 1.3623, + "step": 43350 + }, + { + "epoch": 0.83, + "learning_rate": 6.290447706903017e-05, + "loss": 1.0782, + "step": 43360 + }, + { + "epoch": 0.83, + "learning_rate": 6.288988493290087e-05, + "loss": 1.3556, + "step": 43370 + }, + { + "epoch": 0.83, + "learning_rate": 6.28752916206595e-05, + "loss": 1.2664, + "step": 43380 + }, + { + "epoch": 0.83, + "learning_rate": 6.286069713363763e-05, + "loss": 1.2094, + "step": 43390 + }, + { + "epoch": 0.83, + "learning_rate": 6.284610147316689e-05, + "loss": 1.1874, + "step": 43400 + }, + { + "epoch": 0.83, + "learning_rate": 6.283150464057905e-05, + "loss": 1.4138, + "step": 43410 + }, + { + "epoch": 0.83, + "learning_rate": 6.281690663720597e-05, + "loss": 1.4448, + "step": 43420 + }, + { + "epoch": 0.84, + "learning_rate": 6.280230746437961e-05, + "loss": 1.4742, + "step": 43430 + }, + { + "epoch": 0.84, + "learning_rate": 6.278770712343203e-05, + "loss": 1.4536, + "step": 43440 + }, + { + "epoch": 0.84, + "learning_rate": 6.27731056156954e-05, + "loss": 1.299, + "step": 43450 + }, + { + "epoch": 0.84, + "learning_rate": 6.275850294250204e-05, + "loss": 1.2921, + "step": 43460 + }, + { + "epoch": 0.84, + "learning_rate": 6.274389910518433e-05, + "loss": 1.2291, + "step": 43470 + }, + { + "epoch": 0.84, + "learning_rate": 6.272929410507476e-05, + "loss": 1.4033, + "step": 43480 + }, + { + "epoch": 0.84, + "learning_rate": 6.271468794350595e-05, + "loss": 1.4159, + "step": 43490 + }, + { + "epoch": 0.84, + "learning_rate": 6.270008062181056e-05, + "loss": 1.2164, + "step": 43500 + }, + { + "epoch": 0.84, + "learning_rate": 6.268547214132148e-05, + "loss": 1.0954, + "step": 43510 + }, + { + "epoch": 0.84, + "learning_rate": 6.26708625033716e-05, + "loss": 1.4972, + "step": 43520 + }, + { + "epoch": 0.84, + "learning_rate": 6.265625170929393e-05, + "loss": 1.3133, + "step": 43530 + }, + { + "epoch": 0.84, + "learning_rate": 6.264163976042163e-05, + "loss": 1.3053, + "step": 43540 + }, + { + "epoch": 0.84, + "learning_rate": 6.26270266580879e-05, + "loss": 1.2617, + "step": 43550 + }, + { + "epoch": 0.84, + "learning_rate": 6.261241240362612e-05, + "loss": 1.2006, + "step": 43560 + }, + { + "epoch": 0.84, + "learning_rate": 6.259779699836972e-05, + "loss": 1.2123, + "step": 43570 + }, + { + "epoch": 0.84, + "learning_rate": 6.25831804436523e-05, + "loss": 1.316, + "step": 43580 + }, + { + "epoch": 0.84, + "learning_rate": 6.256856274080746e-05, + "loss": 1.228, + "step": 43590 + }, + { + "epoch": 0.84, + "learning_rate": 6.255394389116897e-05, + "loss": 1.1667, + "step": 43600 + }, + { + "epoch": 0.84, + "learning_rate": 6.253932389607072e-05, + "loss": 1.4566, + "step": 43610 + }, + { + "epoch": 0.84, + "learning_rate": 6.252470275684668e-05, + "loss": 1.3635, + "step": 43620 + }, + { + "epoch": 0.84, + "learning_rate": 6.251008047483092e-05, + "loss": 1.2669, + "step": 43630 + }, + { + "epoch": 0.84, + "learning_rate": 6.249545705135761e-05, + "loss": 1.2264, + "step": 43640 + }, + { + "epoch": 0.84, + "learning_rate": 6.248083248776107e-05, + "loss": 1.5117, + "step": 43650 + }, + { + "epoch": 0.84, + "learning_rate": 6.246620678537564e-05, + "loss": 1.1437, + "step": 43660 + }, + { + "epoch": 0.84, + "learning_rate": 6.245157994553585e-05, + "loss": 1.2719, + "step": 43670 + }, + { + "epoch": 0.84, + "learning_rate": 6.243695196957631e-05, + "loss": 1.2965, + "step": 43680 + }, + { + "epoch": 0.84, + "learning_rate": 6.242232285883168e-05, + "loss": 1.1071, + "step": 43690 + }, + { + "epoch": 0.84, + "learning_rate": 6.240769261463677e-05, + "loss": 1.2552, + "step": 43700 + }, + { + "epoch": 0.84, + "learning_rate": 6.239306123832653e-05, + "loss": 1.103, + "step": 43710 + }, + { + "epoch": 0.84, + "learning_rate": 6.23784287312359e-05, + "loss": 1.4342, + "step": 43720 + }, + { + "epoch": 0.84, + "learning_rate": 6.236379509470007e-05, + "loss": 1.1748, + "step": 43730 + }, + { + "epoch": 0.84, + "learning_rate": 6.234916033005421e-05, + "loss": 1.3993, + "step": 43740 + }, + { + "epoch": 0.84, + "learning_rate": 6.233452443863365e-05, + "loss": 1.2131, + "step": 43750 + }, + { + "epoch": 0.84, + "learning_rate": 6.231988742177383e-05, + "loss": 1.2789, + "step": 43760 + }, + { + "epoch": 0.84, + "learning_rate": 6.230524928081023e-05, + "loss": 1.3823, + "step": 43770 + }, + { + "epoch": 0.84, + "learning_rate": 6.229061001707856e-05, + "loss": 1.2152, + "step": 43780 + }, + { + "epoch": 0.84, + "learning_rate": 6.227596963191446e-05, + "loss": 1.3213, + "step": 43790 + }, + { + "epoch": 0.84, + "learning_rate": 6.226132812665381e-05, + "loss": 1.251, + "step": 43800 + }, + { + "epoch": 0.84, + "learning_rate": 6.224668550263254e-05, + "loss": 1.1005, + "step": 43810 + }, + { + "epoch": 0.84, + "learning_rate": 6.223204176118668e-05, + "loss": 1.0784, + "step": 43820 + }, + { + "epoch": 0.84, + "learning_rate": 6.22173969036524e-05, + "loss": 1.2598, + "step": 43830 + }, + { + "epoch": 0.84, + "learning_rate": 6.220275093136589e-05, + "loss": 1.3252, + "step": 43840 + }, + { + "epoch": 0.84, + "learning_rate": 6.218810384566352e-05, + "loss": 1.4837, + "step": 43850 + }, + { + "epoch": 0.84, + "learning_rate": 6.217345564788175e-05, + "loss": 1.1643, + "step": 43860 + }, + { + "epoch": 0.84, + "learning_rate": 6.215880633935708e-05, + "loss": 1.5224, + "step": 43870 + }, + { + "epoch": 0.84, + "learning_rate": 6.214415592142622e-05, + "loss": 1.1262, + "step": 43880 + }, + { + "epoch": 0.84, + "learning_rate": 6.212950439542586e-05, + "loss": 1.2885, + "step": 43890 + }, + { + "epoch": 0.84, + "learning_rate": 6.211485176269288e-05, + "loss": 1.2138, + "step": 43900 + }, + { + "epoch": 0.84, + "learning_rate": 6.210019802456423e-05, + "loss": 1.2473, + "step": 43910 + }, + { + "epoch": 0.84, + "learning_rate": 6.208554318237694e-05, + "loss": 1.138, + "step": 43920 + }, + { + "epoch": 0.84, + "learning_rate": 6.20708872374682e-05, + "loss": 1.2687, + "step": 43930 + }, + { + "epoch": 0.84, + "learning_rate": 6.205623019117522e-05, + "loss": 1.2513, + "step": 43940 + }, + { + "epoch": 0.85, + "learning_rate": 6.204157204483538e-05, + "loss": 1.382, + "step": 43950 + }, + { + "epoch": 0.85, + "learning_rate": 6.202691279978613e-05, + "loss": 1.4971, + "step": 43960 + }, + { + "epoch": 0.85, + "learning_rate": 6.201225245736502e-05, + "loss": 1.4358, + "step": 43970 + }, + { + "epoch": 0.85, + "learning_rate": 6.199759101890971e-05, + "loss": 1.4085, + "step": 43980 + }, + { + "epoch": 0.85, + "learning_rate": 6.198292848575794e-05, + "loss": 1.2412, + "step": 43990 + }, + { + "epoch": 0.85, + "learning_rate": 6.196826485924758e-05, + "loss": 1.3564, + "step": 44000 + }, + { + "epoch": 0.85, + "learning_rate": 6.195360014071656e-05, + "loss": 1.1461, + "step": 44010 + }, + { + "epoch": 0.85, + "learning_rate": 6.193893433150297e-05, + "loss": 1.3831, + "step": 44020 + }, + { + "epoch": 0.85, + "learning_rate": 6.192426743294494e-05, + "loss": 1.3223, + "step": 44030 + }, + { + "epoch": 0.85, + "learning_rate": 6.190959944638072e-05, + "loss": 1.2222, + "step": 44040 + }, + { + "epoch": 0.85, + "learning_rate": 6.189493037314867e-05, + "loss": 1.2465, + "step": 44050 + }, + { + "epoch": 0.85, + "learning_rate": 6.188026021458722e-05, + "loss": 1.2473, + "step": 44060 + }, + { + "epoch": 0.85, + "learning_rate": 6.186558897203494e-05, + "loss": 1.3676, + "step": 44070 + }, + { + "epoch": 0.85, + "learning_rate": 6.185091664683049e-05, + "loss": 1.2396, + "step": 44080 + }, + { + "epoch": 0.85, + "learning_rate": 6.183624324031259e-05, + "loss": 1.2457, + "step": 44090 + }, + { + "epoch": 0.85, + "learning_rate": 6.182156875382009e-05, + "loss": 1.0893, + "step": 44100 + }, + { + "epoch": 0.85, + "learning_rate": 6.180689318869195e-05, + "loss": 1.1623, + "step": 44110 + }, + { + "epoch": 0.85, + "learning_rate": 6.17922165462672e-05, + "loss": 1.3069, + "step": 44120 + }, + { + "epoch": 0.85, + "learning_rate": 6.1777538827885e-05, + "loss": 1.2221, + "step": 44130 + }, + { + "epoch": 0.85, + "learning_rate": 6.176286003488456e-05, + "loss": 1.1399, + "step": 44140 + }, + { + "epoch": 0.85, + "learning_rate": 6.174818016860525e-05, + "loss": 1.1009, + "step": 44150 + }, + { + "epoch": 0.85, + "learning_rate": 6.173349923038647e-05, + "loss": 1.3744, + "step": 44160 + }, + { + "epoch": 0.85, + "learning_rate": 6.171881722156778e-05, + "loss": 1.168, + "step": 44170 + }, + { + "epoch": 0.85, + "learning_rate": 6.17041341434888e-05, + "loss": 1.3851, + "step": 44180 + }, + { + "epoch": 0.85, + "learning_rate": 6.168944999748926e-05, + "loss": 1.1353, + "step": 44190 + }, + { + "epoch": 0.85, + "learning_rate": 6.167476478490899e-05, + "loss": 1.0066, + "step": 44200 + }, + { + "epoch": 0.85, + "learning_rate": 6.16600785070879e-05, + "loss": 1.293, + "step": 44210 + }, + { + "epoch": 0.85, + "learning_rate": 6.164539116536603e-05, + "loss": 1.2638, + "step": 44220 + }, + { + "epoch": 0.85, + "learning_rate": 6.163070276108349e-05, + "loss": 1.2328, + "step": 44230 + }, + { + "epoch": 0.85, + "learning_rate": 6.161601329558048e-05, + "loss": 1.3789, + "step": 44240 + }, + { + "epoch": 0.85, + "learning_rate": 6.160132277019735e-05, + "loss": 1.4871, + "step": 44250 + }, + { + "epoch": 0.85, + "learning_rate": 6.158663118627445e-05, + "loss": 1.1888, + "step": 44260 + }, + { + "epoch": 0.85, + "learning_rate": 6.157193854515233e-05, + "loss": 1.358, + "step": 44270 + }, + { + "epoch": 0.85, + "learning_rate": 6.155724484817157e-05, + "loss": 1.2292, + "step": 44280 + }, + { + "epoch": 0.85, + "learning_rate": 6.154255009667289e-05, + "loss": 1.3027, + "step": 44290 + }, + { + "epoch": 0.85, + "learning_rate": 6.152785429199703e-05, + "loss": 1.4257, + "step": 44300 + }, + { + "epoch": 0.85, + "learning_rate": 6.151315743548494e-05, + "loss": 1.2583, + "step": 44310 + }, + { + "epoch": 0.85, + "learning_rate": 6.14984595284776e-05, + "loss": 1.4678, + "step": 44320 + }, + { + "epoch": 0.85, + "learning_rate": 6.148376057231605e-05, + "loss": 1.253, + "step": 44330 + }, + { + "epoch": 0.85, + "learning_rate": 6.14690605683415e-05, + "loss": 1.2914, + "step": 44340 + }, + { + "epoch": 0.85, + "learning_rate": 6.14543595178952e-05, + "loss": 1.3877, + "step": 44350 + }, + { + "epoch": 0.85, + "learning_rate": 6.143965742231855e-05, + "loss": 1.3844, + "step": 44360 + }, + { + "epoch": 0.85, + "learning_rate": 6.142495428295298e-05, + "loss": 1.2758, + "step": 44370 + }, + { + "epoch": 0.85, + "learning_rate": 6.141025010114007e-05, + "loss": 1.2928, + "step": 44380 + }, + { + "epoch": 0.85, + "learning_rate": 6.139554487822149e-05, + "loss": 1.365, + "step": 44390 + }, + { + "epoch": 0.85, + "learning_rate": 6.138083861553894e-05, + "loss": 1.2985, + "step": 44400 + }, + { + "epoch": 0.85, + "learning_rate": 6.136613131443431e-05, + "loss": 1.6401, + "step": 44410 + }, + { + "epoch": 0.85, + "learning_rate": 6.13514229762495e-05, + "loss": 1.274, + "step": 44420 + }, + { + "epoch": 0.85, + "learning_rate": 6.133671360232657e-05, + "loss": 1.2728, + "step": 44430 + }, + { + "epoch": 0.85, + "learning_rate": 6.132200319400766e-05, + "loss": 1.3959, + "step": 44440 + }, + { + "epoch": 0.85, + "learning_rate": 6.130729175263494e-05, + "loss": 1.1998, + "step": 44450 + }, + { + "epoch": 0.85, + "learning_rate": 6.129257927955078e-05, + "loss": 1.0954, + "step": 44460 + }, + { + "epoch": 0.86, + "learning_rate": 6.127786577609757e-05, + "loss": 1.3108, + "step": 44470 + }, + { + "epoch": 0.86, + "learning_rate": 6.126315124361781e-05, + "loss": 1.1588, + "step": 44480 + }, + { + "epoch": 0.86, + "learning_rate": 6.124843568345412e-05, + "loss": 1.3148, + "step": 44490 + }, + { + "epoch": 0.86, + "learning_rate": 6.123371909694914e-05, + "loss": 1.5334, + "step": 44500 + }, + { + "epoch": 0.86, + "learning_rate": 6.121900148544572e-05, + "loss": 1.4102, + "step": 44510 + }, + { + "epoch": 0.86, + "learning_rate": 6.12042828502867e-05, + "loss": 1.3504, + "step": 44520 + }, + { + "epoch": 0.86, + "learning_rate": 6.118956319281504e-05, + "loss": 1.2352, + "step": 44530 + }, + { + "epoch": 0.86, + "learning_rate": 6.117484251437388e-05, + "loss": 1.3443, + "step": 44540 + }, + { + "epoch": 0.86, + "learning_rate": 6.116012081630629e-05, + "loss": 1.3207, + "step": 44550 + }, + { + "epoch": 0.86, + "learning_rate": 6.114539809995556e-05, + "loss": 1.2148, + "step": 44560 + }, + { + "epoch": 0.86, + "learning_rate": 6.113067436666504e-05, + "loss": 1.3666, + "step": 44570 + }, + { + "epoch": 0.86, + "learning_rate": 6.111594961777817e-05, + "loss": 1.0812, + "step": 44580 + }, + { + "epoch": 0.86, + "learning_rate": 6.110122385463848e-05, + "loss": 1.2021, + "step": 44590 + }, + { + "epoch": 0.86, + "learning_rate": 6.108649707858957e-05, + "loss": 1.185, + "step": 44600 + }, + { + "epoch": 0.86, + "learning_rate": 6.107176929097517e-05, + "loss": 1.2596, + "step": 44610 + }, + { + "epoch": 0.86, + "learning_rate": 6.105704049313911e-05, + "loss": 1.1397, + "step": 44620 + }, + { + "epoch": 0.86, + "learning_rate": 6.104231068642525e-05, + "loss": 1.2869, + "step": 44630 + }, + { + "epoch": 0.86, + "learning_rate": 6.102757987217762e-05, + "loss": 1.2228, + "step": 44640 + }, + { + "epoch": 0.86, + "learning_rate": 6.101284805174028e-05, + "loss": 1.3499, + "step": 44650 + }, + { + "epoch": 0.86, + "learning_rate": 6.099811522645742e-05, + "loss": 1.2121, + "step": 44660 + }, + { + "epoch": 0.86, + "learning_rate": 6.098338139767328e-05, + "loss": 1.4148, + "step": 44670 + }, + { + "epoch": 0.86, + "learning_rate": 6.0968646566732245e-05, + "loss": 1.3671, + "step": 44680 + }, + { + "epoch": 0.86, + "learning_rate": 6.095391073497877e-05, + "loss": 1.3327, + "step": 44690 + }, + { + "epoch": 0.86, + "learning_rate": 6.093917390375738e-05, + "loss": 1.1579, + "step": 44700 + }, + { + "epoch": 0.86, + "learning_rate": 6.092443607441272e-05, + "loss": 1.1987, + "step": 44710 + }, + { + "epoch": 0.86, + "learning_rate": 6.090969724828949e-05, + "loss": 1.523, + "step": 44720 + }, + { + "epoch": 0.86, + "learning_rate": 6.089495742673254e-05, + "loss": 1.0621, + "step": 44730 + }, + { + "epoch": 0.86, + "learning_rate": 6.088021661108675e-05, + "loss": 1.2743, + "step": 44740 + }, + { + "epoch": 0.86, + "learning_rate": 6.086547480269713e-05, + "loss": 1.377, + "step": 44750 + }, + { + "epoch": 0.86, + "learning_rate": 6.085073200290876e-05, + "loss": 1.4048, + "step": 44760 + }, + { + "epoch": 0.86, + "learning_rate": 6.083598821306682e-05, + "loss": 1.2827, + "step": 44770 + }, + { + "epoch": 0.86, + "learning_rate": 6.082124343451658e-05, + "loss": 1.2124, + "step": 44780 + }, + { + "epoch": 0.86, + "learning_rate": 6.0806497668603403e-05, + "loss": 1.3011, + "step": 44790 + }, + { + "epoch": 0.86, + "learning_rate": 6.0791750916672716e-05, + "loss": 1.4225, + "step": 44800 + }, + { + "epoch": 0.86, + "learning_rate": 6.077700318007009e-05, + "loss": 1.2, + "step": 44810 + }, + { + "epoch": 0.86, + "learning_rate": 6.076225446014111e-05, + "loss": 1.1264, + "step": 44820 + }, + { + "epoch": 0.86, + "learning_rate": 6.0747504758231536e-05, + "loss": 1.1907, + "step": 44830 + }, + { + "epoch": 0.86, + "learning_rate": 6.073275407568716e-05, + "loss": 1.1106, + "step": 44840 + }, + { + "epoch": 0.86, + "learning_rate": 6.071800241385387e-05, + "loss": 1.2078, + "step": 44850 + }, + { + "epoch": 0.86, + "learning_rate": 6.070324977407767e-05, + "loss": 1.1648, + "step": 44860 + }, + { + "epoch": 0.86, + "learning_rate": 6.06884961577046e-05, + "loss": 1.2619, + "step": 44870 + }, + { + "epoch": 0.86, + "learning_rate": 6.0673741566080854e-05, + "loss": 1.131, + "step": 44880 + }, + { + "epoch": 0.86, + "learning_rate": 6.06589860005527e-05, + "loss": 1.3873, + "step": 44890 + }, + { + "epoch": 0.86, + "learning_rate": 6.0644229462466454e-05, + "loss": 1.3012, + "step": 44900 + }, + { + "epoch": 0.86, + "learning_rate": 6.062947195316855e-05, + "loss": 1.4414, + "step": 44910 + }, + { + "epoch": 0.86, + "learning_rate": 6.06147134740055e-05, + "loss": 1.1923, + "step": 44920 + }, + { + "epoch": 0.86, + "learning_rate": 6.059995402632394e-05, + "loss": 1.1917, + "step": 44930 + }, + { + "epoch": 0.86, + "learning_rate": 6.058519361147055e-05, + "loss": 1.3279, + "step": 44940 + }, + { + "epoch": 0.86, + "learning_rate": 6.057043223079211e-05, + "loss": 1.3363, + "step": 44950 + }, + { + "epoch": 0.86, + "learning_rate": 6.0555669885635493e-05, + "loss": 1.1519, + "step": 44960 + }, + { + "epoch": 0.86, + "learning_rate": 6.054090657734767e-05, + "loss": 1.4093, + "step": 44970 + }, + { + "epoch": 0.86, + "learning_rate": 6.052614230727569e-05, + "loss": 1.29, + "step": 44980 + }, + { + "epoch": 0.87, + "learning_rate": 6.0511377076766686e-05, + "loss": 1.0764, + "step": 44990 + }, + { + "epoch": 0.87, + "learning_rate": 6.049661088716787e-05, + "loss": 1.2517, + "step": 45000 + }, + { + "epoch": 0.87, + "learning_rate": 6.048184373982656e-05, + "loss": 1.2806, + "step": 45010 + }, + { + "epoch": 0.87, + "learning_rate": 6.0467075636090174e-05, + "loss": 1.2712, + "step": 45020 + }, + { + "epoch": 0.87, + "learning_rate": 6.045230657730618e-05, + "loss": 1.3277, + "step": 45030 + }, + { + "epoch": 0.87, + "learning_rate": 6.043753656482216e-05, + "loss": 1.2622, + "step": 45040 + }, + { + "epoch": 0.87, + "learning_rate": 6.0422765599985764e-05, + "loss": 1.1962, + "step": 45050 + }, + { + "epoch": 0.87, + "learning_rate": 6.040799368414474e-05, + "loss": 1.2458, + "step": 45060 + }, + { + "epoch": 0.87, + "learning_rate": 6.0393220818646946e-05, + "loss": 1.2178, + "step": 45070 + }, + { + "epoch": 0.87, + "learning_rate": 6.037844700484028e-05, + "loss": 1.3134, + "step": 45080 + }, + { + "epoch": 0.87, + "learning_rate": 6.036367224407274e-05, + "loss": 1.226, + "step": 45090 + }, + { + "epoch": 0.87, + "learning_rate": 6.0348896537692446e-05, + "loss": 1.1045, + "step": 45100 + }, + { + "epoch": 0.87, + "learning_rate": 6.033411988704756e-05, + "loss": 1.0974, + "step": 45110 + }, + { + "epoch": 0.87, + "learning_rate": 6.031934229348636e-05, + "loss": 1.3956, + "step": 45120 + }, + { + "epoch": 0.87, + "learning_rate": 6.0304563758357194e-05, + "loss": 1.2923, + "step": 45130 + }, + { + "epoch": 0.87, + "learning_rate": 6.028978428300849e-05, + "loss": 1.0647, + "step": 45140 + }, + { + "epoch": 0.87, + "learning_rate": 6.0275003868788795e-05, + "loss": 1.3697, + "step": 45150 + }, + { + "epoch": 0.87, + "learning_rate": 6.026022251704668e-05, + "loss": 1.0517, + "step": 45160 + }, + { + "epoch": 0.87, + "learning_rate": 6.0245440229130876e-05, + "loss": 1.217, + "step": 45170 + }, + { + "epoch": 0.87, + "learning_rate": 6.023065700639017e-05, + "loss": 1.3212, + "step": 45180 + }, + { + "epoch": 0.87, + "learning_rate": 6.02158728501734e-05, + "loss": 1.2887, + "step": 45190 + }, + { + "epoch": 0.87, + "learning_rate": 6.020108776182952e-05, + "loss": 1.1666, + "step": 45200 + }, + { + "epoch": 0.87, + "learning_rate": 6.018630174270757e-05, + "loss": 1.2987, + "step": 45210 + }, + { + "epoch": 0.87, + "learning_rate": 6.017151479415668e-05, + "loss": 1.4526, + "step": 45220 + }, + { + "epoch": 0.87, + "learning_rate": 6.015672691752605e-05, + "loss": 1.288, + "step": 45230 + }, + { + "epoch": 0.87, + "learning_rate": 6.0141938114164976e-05, + "loss": 1.1831, + "step": 45240 + }, + { + "epoch": 0.87, + "learning_rate": 6.012714838542284e-05, + "loss": 1.1942, + "step": 45250 + }, + { + "epoch": 0.87, + "learning_rate": 6.011235773264906e-05, + "loss": 1.3256, + "step": 45260 + }, + { + "epoch": 0.87, + "learning_rate": 6.009756615719323e-05, + "loss": 1.3161, + "step": 45270 + }, + { + "epoch": 0.87, + "learning_rate": 6.008277366040493e-05, + "loss": 1.2851, + "step": 45280 + }, + { + "epoch": 0.87, + "learning_rate": 6.006798024363394e-05, + "loss": 1.4009, + "step": 45290 + }, + { + "epoch": 0.87, + "learning_rate": 6.005318590822999e-05, + "loss": 1.3426, + "step": 45300 + }, + { + "epoch": 0.87, + "learning_rate": 6.0038390655543e-05, + "loss": 1.1841, + "step": 45310 + }, + { + "epoch": 0.87, + "learning_rate": 6.002359448692291e-05, + "loss": 1.132, + "step": 45320 + }, + { + "epoch": 0.87, + "learning_rate": 6.000879740371976e-05, + "loss": 1.4012, + "step": 45330 + }, + { + "epoch": 0.87, + "learning_rate": 5.9993999407283717e-05, + "loss": 1.4221, + "step": 45340 + }, + { + "epoch": 0.87, + "learning_rate": 5.9979200498964975e-05, + "loss": 1.2859, + "step": 45350 + }, + { + "epoch": 0.87, + "learning_rate": 5.996440068011383e-05, + "loss": 1.2323, + "step": 45360 + }, + { + "epoch": 0.87, + "learning_rate": 5.994959995208066e-05, + "loss": 1.3655, + "step": 45370 + }, + { + "epoch": 0.87, + "learning_rate": 5.993479831621592e-05, + "loss": 1.1984, + "step": 45380 + }, + { + "epoch": 0.87, + "learning_rate": 5.9919995773870173e-05, + "loss": 1.3473, + "step": 45390 + }, + { + "epoch": 0.87, + "learning_rate": 5.990519232639406e-05, + "loss": 1.4132, + "step": 45400 + }, + { + "epoch": 0.87, + "learning_rate": 5.9890387975138254e-05, + "loss": 1.1861, + "step": 45410 + }, + { + "epoch": 0.87, + "learning_rate": 5.987558272145358e-05, + "loss": 1.468, + "step": 45420 + }, + { + "epoch": 0.87, + "learning_rate": 5.986077656669089e-05, + "loss": 1.2724, + "step": 45430 + }, + { + "epoch": 0.87, + "learning_rate": 5.984596951220116e-05, + "loss": 1.3259, + "step": 45440 + }, + { + "epoch": 0.87, + "learning_rate": 5.983116155933543e-05, + "loss": 1.2835, + "step": 45450 + }, + { + "epoch": 0.87, + "learning_rate": 5.981635270944481e-05, + "loss": 1.4084, + "step": 45460 + }, + { + "epoch": 0.87, + "learning_rate": 5.980154296388053e-05, + "loss": 1.2773, + "step": 45470 + }, + { + "epoch": 0.87, + "learning_rate": 5.978673232399383e-05, + "loss": 1.3504, + "step": 45480 + }, + { + "epoch": 0.87, + "learning_rate": 5.977192079113613e-05, + "loss": 1.27, + "step": 45490 + }, + { + "epoch": 0.87, + "learning_rate": 5.9757108366658844e-05, + "loss": 1.1241, + "step": 45500 + }, + { + "epoch": 0.88, + "learning_rate": 5.974229505191351e-05, + "loss": 1.2899, + "step": 45510 + }, + { + "epoch": 0.88, + "learning_rate": 5.972748084825175e-05, + "loss": 1.4009, + "step": 45520 + }, + { + "epoch": 0.88, + "learning_rate": 5.971266575702523e-05, + "loss": 1.3871, + "step": 45530 + }, + { + "epoch": 0.88, + "learning_rate": 5.969784977958577e-05, + "loss": 1.226, + "step": 45540 + }, + { + "epoch": 0.88, + "learning_rate": 5.968303291728519e-05, + "loss": 1.238, + "step": 45550 + }, + { + "epoch": 0.88, + "learning_rate": 5.966821517147543e-05, + "loss": 1.0819, + "step": 45560 + }, + { + "epoch": 0.88, + "learning_rate": 5.96533965435085e-05, + "loss": 1.1433, + "step": 45570 + }, + { + "epoch": 0.88, + "learning_rate": 5.9638577034736495e-05, + "loss": 1.3714, + "step": 45580 + }, + { + "epoch": 0.88, + "learning_rate": 5.962375664651163e-05, + "loss": 1.2654, + "step": 45590 + }, + { + "epoch": 0.88, + "learning_rate": 5.960893538018612e-05, + "loss": 1.2269, + "step": 45600 + }, + { + "epoch": 0.88, + "learning_rate": 5.959411323711231e-05, + "loss": 1.0243, + "step": 45610 + }, + { + "epoch": 0.88, + "learning_rate": 5.957929021864262e-05, + "loss": 1.5088, + "step": 45620 + }, + { + "epoch": 0.88, + "learning_rate": 5.9564466326129574e-05, + "loss": 1.2709, + "step": 45630 + }, + { + "epoch": 0.88, + "learning_rate": 5.9549641560925704e-05, + "loss": 1.2747, + "step": 45640 + }, + { + "epoch": 0.88, + "learning_rate": 5.9534815924383704e-05, + "loss": 1.2387, + "step": 45650 + }, + { + "epoch": 0.88, + "learning_rate": 5.9519989417856284e-05, + "loss": 1.4057, + "step": 45660 + }, + { + "epoch": 0.88, + "learning_rate": 5.950516204269625e-05, + "loss": 1.2609, + "step": 45670 + }, + { + "epoch": 0.88, + "learning_rate": 5.9490333800256534e-05, + "loss": 1.3847, + "step": 45680 + }, + { + "epoch": 0.88, + "learning_rate": 5.947550469189008e-05, + "loss": 1.4188, + "step": 45690 + }, + { + "epoch": 0.88, + "learning_rate": 5.946067471894996e-05, + "loss": 1.4945, + "step": 45700 + }, + { + "epoch": 0.88, + "learning_rate": 5.94458438827893e-05, + "loss": 1.366, + "step": 45710 + }, + { + "epoch": 0.88, + "learning_rate": 5.943101218476129e-05, + "loss": 1.3879, + "step": 45720 + }, + { + "epoch": 0.88, + "learning_rate": 5.941617962621925e-05, + "loss": 1.0624, + "step": 45730 + }, + { + "epoch": 0.88, + "learning_rate": 5.940134620851653e-05, + "loss": 1.1251, + "step": 45740 + }, + { + "epoch": 0.88, + "learning_rate": 5.938651193300658e-05, + "loss": 1.2618, + "step": 45750 + }, + { + "epoch": 0.88, + "learning_rate": 5.937167680104292e-05, + "loss": 1.1823, + "step": 45760 + }, + { + "epoch": 0.88, + "learning_rate": 5.935684081397915e-05, + "loss": 1.3304, + "step": 45770 + }, + { + "epoch": 0.88, + "learning_rate": 5.934200397316896e-05, + "loss": 1.1374, + "step": 45780 + }, + { + "epoch": 0.88, + "learning_rate": 5.9327166279966104e-05, + "loss": 1.2547, + "step": 45790 + }, + { + "epoch": 0.88, + "learning_rate": 5.931232773572443e-05, + "loss": 1.229, + "step": 45800 + }, + { + "epoch": 0.88, + "learning_rate": 5.9297488341797825e-05, + "loss": 1.1247, + "step": 45810 + }, + { + "epoch": 0.88, + "learning_rate": 5.9282648099540295e-05, + "loss": 1.3211, + "step": 45820 + }, + { + "epoch": 0.88, + "learning_rate": 5.926780701030591e-05, + "loss": 1.1822, + "step": 45830 + }, + { + "epoch": 0.88, + "learning_rate": 5.925296507544882e-05, + "loss": 1.4273, + "step": 45840 + }, + { + "epoch": 0.88, + "learning_rate": 5.9238122296323226e-05, + "loss": 1.2723, + "step": 45850 + }, + { + "epoch": 0.88, + "learning_rate": 5.9223278674283463e-05, + "loss": 1.3384, + "step": 45860 + }, + { + "epoch": 0.88, + "learning_rate": 5.9208434210683874e-05, + "loss": 1.1264, + "step": 45870 + }, + { + "epoch": 0.88, + "learning_rate": 5.9193588906878924e-05, + "loss": 1.2568, + "step": 45880 + }, + { + "epoch": 0.88, + "learning_rate": 5.917874276422315e-05, + "loss": 1.2978, + "step": 45890 + }, + { + "epoch": 0.88, + "learning_rate": 5.9163895784071176e-05, + "loss": 1.1092, + "step": 45900 + }, + { + "epoch": 0.88, + "learning_rate": 5.914904796777765e-05, + "loss": 1.432, + "step": 45910 + }, + { + "epoch": 0.88, + "learning_rate": 5.913419931669735e-05, + "loss": 1.2197, + "step": 45920 + }, + { + "epoch": 0.88, + "learning_rate": 5.91193498321851e-05, + "loss": 1.2969, + "step": 45930 + }, + { + "epoch": 0.88, + "learning_rate": 5.910449951559581e-05, + "loss": 1.2116, + "step": 45940 + }, + { + "epoch": 0.88, + "learning_rate": 5.9089648368284513e-05, + "loss": 1.3858, + "step": 45950 + }, + { + "epoch": 0.88, + "learning_rate": 5.9074796391606216e-05, + "loss": 1.1823, + "step": 45960 + }, + { + "epoch": 0.88, + "learning_rate": 5.905994358691608e-05, + "loss": 1.4225, + "step": 45970 + }, + { + "epoch": 0.88, + "learning_rate": 5.904508995556932e-05, + "loss": 1.3216, + "step": 45980 + }, + { + "epoch": 0.88, + "learning_rate": 5.9030235498921215e-05, + "loss": 1.4712, + "step": 45990 + }, + { + "epoch": 0.88, + "learning_rate": 5.901538021832716e-05, + "loss": 1.5056, + "step": 46000 + }, + { + "epoch": 0.88, + "learning_rate": 5.900052411514257e-05, + "loss": 1.457, + "step": 46010 + }, + { + "epoch": 0.88, + "learning_rate": 5.898566719072297e-05, + "loss": 1.2062, + "step": 46020 + }, + { + "epoch": 0.89, + "learning_rate": 5.8970809446423944e-05, + "loss": 1.4465, + "step": 46030 + }, + { + "epoch": 0.89, + "learning_rate": 5.895595088360116e-05, + "loss": 1.2134, + "step": 46040 + }, + { + "epoch": 0.89, + "learning_rate": 5.894109150361038e-05, + "loss": 1.2719, + "step": 46050 + }, + { + "epoch": 0.89, + "learning_rate": 5.8926231307807365e-05, + "loss": 1.3344, + "step": 46060 + }, + { + "epoch": 0.89, + "learning_rate": 5.891137029754806e-05, + "loss": 1.4586, + "step": 46070 + }, + { + "epoch": 0.89, + "learning_rate": 5.8896508474188407e-05, + "loss": 1.4692, + "step": 46080 + }, + { + "epoch": 0.89, + "learning_rate": 5.888164583908443e-05, + "loss": 1.2117, + "step": 46090 + }, + { + "epoch": 0.89, + "learning_rate": 5.886678239359227e-05, + "loss": 1.3408, + "step": 46100 + }, + { + "epoch": 0.89, + "learning_rate": 5.8851918139068086e-05, + "loss": 1.2608, + "step": 46110 + }, + { + "epoch": 0.89, + "learning_rate": 5.883705307686814e-05, + "loss": 1.1391, + "step": 46120 + }, + { + "epoch": 0.89, + "learning_rate": 5.882218720834879e-05, + "loss": 1.2741, + "step": 46130 + }, + { + "epoch": 0.89, + "learning_rate": 5.8807320534866405e-05, + "loss": 1.1477, + "step": 46140 + }, + { + "epoch": 0.89, + "learning_rate": 5.879245305777751e-05, + "loss": 1.1418, + "step": 46150 + }, + { + "epoch": 0.89, + "learning_rate": 5.877758477843862e-05, + "loss": 1.1826, + "step": 46160 + }, + { + "epoch": 0.89, + "learning_rate": 5.8762715698206385e-05, + "loss": 1.2785, + "step": 46170 + }, + { + "epoch": 0.89, + "learning_rate": 5.87478458184375e-05, + "loss": 1.1505, + "step": 46180 + }, + { + "epoch": 0.89, + "learning_rate": 5.873297514048871e-05, + "loss": 1.2996, + "step": 46190 + }, + { + "epoch": 0.89, + "learning_rate": 5.87181036657169e-05, + "loss": 1.0374, + "step": 46200 + }, + { + "epoch": 0.89, + "learning_rate": 5.8703231395478974e-05, + "loss": 1.2424, + "step": 46210 + }, + { + "epoch": 0.89, + "learning_rate": 5.868835833113192e-05, + "loss": 1.3822, + "step": 46220 + }, + { + "epoch": 0.89, + "learning_rate": 5.86734844740328e-05, + "loss": 1.1697, + "step": 46230 + }, + { + "epoch": 0.89, + "learning_rate": 5.865860982553876e-05, + "loss": 1.4085, + "step": 46240 + }, + { + "epoch": 0.89, + "learning_rate": 5.864373438700699e-05, + "loss": 1.2021, + "step": 46250 + }, + { + "epoch": 0.89, + "learning_rate": 5.862885815979479e-05, + "loss": 1.332, + "step": 46260 + }, + { + "epoch": 0.89, + "learning_rate": 5.86139811452595e-05, + "loss": 1.275, + "step": 46270 + }, + { + "epoch": 0.89, + "learning_rate": 5.859910334475853e-05, + "loss": 1.296, + "step": 46280 + }, + { + "epoch": 0.89, + "learning_rate": 5.858422475964941e-05, + "loss": 1.2308, + "step": 46290 + }, + { + "epoch": 0.89, + "learning_rate": 5.856934539128969e-05, + "loss": 1.2633, + "step": 46300 + }, + { + "epoch": 0.89, + "learning_rate": 5.8554465241037e-05, + "loss": 1.3655, + "step": 46310 + }, + { + "epoch": 0.89, + "learning_rate": 5.853958431024906e-05, + "loss": 1.1736, + "step": 46320 + }, + { + "epoch": 0.89, + "learning_rate": 5.852470260028364e-05, + "loss": 1.3742, + "step": 46330 + }, + { + "epoch": 0.89, + "learning_rate": 5.85098201124986e-05, + "loss": 1.2078, + "step": 46340 + }, + { + "epoch": 0.89, + "learning_rate": 5.849493684825188e-05, + "loss": 0.969, + "step": 46350 + }, + { + "epoch": 0.89, + "learning_rate": 5.848005280890145e-05, + "loss": 1.4297, + "step": 46360 + }, + { + "epoch": 0.89, + "learning_rate": 5.846516799580538e-05, + "loss": 1.2545, + "step": 46370 + }, + { + "epoch": 0.89, + "learning_rate": 5.84502824103218e-05, + "loss": 1.3457, + "step": 46380 + }, + { + "epoch": 0.89, + "learning_rate": 5.8435396053808936e-05, + "loss": 1.1778, + "step": 46390 + }, + { + "epoch": 0.89, + "learning_rate": 5.842050892762504e-05, + "loss": 1.2627, + "step": 46400 + }, + { + "epoch": 0.89, + "learning_rate": 5.8405621033128474e-05, + "loss": 1.2545, + "step": 46410 + }, + { + "epoch": 0.89, + "learning_rate": 5.839073237167766e-05, + "loss": 1.2288, + "step": 46420 + }, + { + "epoch": 0.89, + "learning_rate": 5.837584294463105e-05, + "loss": 1.4969, + "step": 46430 + }, + { + "epoch": 0.89, + "learning_rate": 5.836095275334724e-05, + "loss": 1.2948, + "step": 46440 + }, + { + "epoch": 0.89, + "learning_rate": 5.834606179918485e-05, + "loss": 1.1889, + "step": 46450 + }, + { + "epoch": 0.89, + "learning_rate": 5.833117008350256e-05, + "loss": 1.2606, + "step": 46460 + }, + { + "epoch": 0.89, + "learning_rate": 5.831627760765914e-05, + "loss": 1.3676, + "step": 46470 + }, + { + "epoch": 0.89, + "learning_rate": 5.8301384373013415e-05, + "loss": 1.1777, + "step": 46480 + }, + { + "epoch": 0.89, + "learning_rate": 5.828649038092431e-05, + "loss": 1.4203, + "step": 46490 + }, + { + "epoch": 0.89, + "learning_rate": 5.8271595632750795e-05, + "loss": 1.2019, + "step": 46500 + }, + { + "epoch": 0.89, + "learning_rate": 5.825670012985189e-05, + "loss": 1.2948, + "step": 46510 + }, + { + "epoch": 0.89, + "learning_rate": 5.824180387358674e-05, + "loss": 1.2322, + "step": 46520 + }, + { + "epoch": 0.89, + "learning_rate": 5.822690686531449e-05, + "loss": 1.2143, + "step": 46530 + }, + { + "epoch": 0.89, + "learning_rate": 5.821200910639441e-05, + "loss": 1.3434, + "step": 46540 + }, + { + "epoch": 0.9, + "learning_rate": 5.819711059818579e-05, + "loss": 1.1232, + "step": 46550 + }, + { + "epoch": 0.9, + "learning_rate": 5.818221134204806e-05, + "loss": 1.3862, + "step": 46560 + }, + { + "epoch": 0.9, + "learning_rate": 5.8167311339340634e-05, + "loss": 1.3379, + "step": 46570 + }, + { + "epoch": 0.9, + "learning_rate": 5.8152410591423045e-05, + "loss": 1.2829, + "step": 46580 + }, + { + "epoch": 0.9, + "learning_rate": 5.8137509099654885e-05, + "loss": 1.0943, + "step": 46590 + }, + { + "epoch": 0.9, + "learning_rate": 5.812260686539581e-05, + "loss": 1.3873, + "step": 46600 + }, + { + "epoch": 0.9, + "learning_rate": 5.810770389000556e-05, + "loss": 1.2307, + "step": 46610 + }, + { + "epoch": 0.9, + "learning_rate": 5.8092800174843884e-05, + "loss": 1.3081, + "step": 46620 + }, + { + "epoch": 0.9, + "learning_rate": 5.8077895721270694e-05, + "loss": 1.2491, + "step": 46630 + }, + { + "epoch": 0.9, + "learning_rate": 5.806299053064589e-05, + "loss": 1.2393, + "step": 46640 + }, + { + "epoch": 0.9, + "learning_rate": 5.804808460432945e-05, + "loss": 1.2828, + "step": 46650 + }, + { + "epoch": 0.9, + "learning_rate": 5.8033177943681496e-05, + "loss": 1.1027, + "step": 46660 + }, + { + "epoch": 0.9, + "learning_rate": 5.801827055006208e-05, + "loss": 1.4728, + "step": 46670 + }, + { + "epoch": 0.9, + "learning_rate": 5.800336242483145e-05, + "loss": 1.1929, + "step": 46680 + }, + { + "epoch": 0.9, + "learning_rate": 5.798845356934985e-05, + "loss": 1.283, + "step": 46690 + }, + { + "epoch": 0.9, + "learning_rate": 5.797354398497761e-05, + "loss": 1.5657, + "step": 46700 + }, + { + "epoch": 0.9, + "learning_rate": 5.795863367307515e-05, + "loss": 1.2292, + "step": 46710 + }, + { + "epoch": 0.9, + "learning_rate": 5.794372263500287e-05, + "loss": 1.2504, + "step": 46720 + }, + { + "epoch": 0.9, + "learning_rate": 5.7928810872121366e-05, + "loss": 1.3442, + "step": 46730 + }, + { + "epoch": 0.9, + "learning_rate": 5.791389838579119e-05, + "loss": 1.2235, + "step": 46740 + }, + { + "epoch": 0.9, + "learning_rate": 5.789898517737301e-05, + "loss": 1.2179, + "step": 46750 + }, + { + "epoch": 0.9, + "learning_rate": 5.788407124822759e-05, + "loss": 1.1723, + "step": 46760 + }, + { + "epoch": 0.9, + "learning_rate": 5.7869156599715655e-05, + "loss": 1.4367, + "step": 46770 + }, + { + "epoch": 0.9, + "learning_rate": 5.7854241233198116e-05, + "loss": 1.4473, + "step": 46780 + }, + { + "epoch": 0.9, + "learning_rate": 5.783932515003587e-05, + "loss": 1.3816, + "step": 46790 + }, + { + "epoch": 0.9, + "learning_rate": 5.782440835158991e-05, + "loss": 1.2566, + "step": 46800 + }, + { + "epoch": 0.9, + "learning_rate": 5.780949083922131e-05, + "loss": 1.132, + "step": 46810 + }, + { + "epoch": 0.9, + "learning_rate": 5.779457261429115e-05, + "loss": 1.2748, + "step": 46820 + }, + { + "epoch": 0.9, + "learning_rate": 5.777965367816066e-05, + "loss": 1.3042, + "step": 46830 + }, + { + "epoch": 0.9, + "learning_rate": 5.7764734032191046e-05, + "loss": 1.3043, + "step": 46840 + }, + { + "epoch": 0.9, + "learning_rate": 5.7749813677743644e-05, + "loss": 1.1063, + "step": 46850 + }, + { + "epoch": 0.9, + "learning_rate": 5.773489261617985e-05, + "loss": 1.296, + "step": 46860 + }, + { + "epoch": 0.9, + "learning_rate": 5.771997084886105e-05, + "loss": 1.3258, + "step": 46870 + }, + { + "epoch": 0.9, + "learning_rate": 5.770504837714881e-05, + "loss": 1.3864, + "step": 46880 + }, + { + "epoch": 0.9, + "learning_rate": 5.769012520240467e-05, + "loss": 1.3008, + "step": 46890 + }, + { + "epoch": 0.9, + "learning_rate": 5.767520132599027e-05, + "loss": 1.1481, + "step": 46900 + }, + { + "epoch": 0.9, + "learning_rate": 5.766027674926733e-05, + "loss": 1.3018, + "step": 46910 + }, + { + "epoch": 0.9, + "learning_rate": 5.7645351473597576e-05, + "loss": 1.2343, + "step": 46920 + }, + { + "epoch": 0.9, + "learning_rate": 5.763042550034287e-05, + "loss": 1.1662, + "step": 46930 + }, + { + "epoch": 0.9, + "learning_rate": 5.7615498830865066e-05, + "loss": 1.4862, + "step": 46940 + }, + { + "epoch": 0.9, + "learning_rate": 5.760057146652616e-05, + "loss": 1.172, + "step": 46950 + }, + { + "epoch": 0.9, + "learning_rate": 5.758564340868815e-05, + "loss": 1.1812, + "step": 46960 + }, + { + "epoch": 0.9, + "learning_rate": 5.757071465871312e-05, + "loss": 1.1832, + "step": 46970 + }, + { + "epoch": 0.9, + "learning_rate": 5.755578521796321e-05, + "loss": 1.3304, + "step": 46980 + }, + { + "epoch": 0.9, + "learning_rate": 5.754085508780063e-05, + "loss": 1.3528, + "step": 46990 + }, + { + "epoch": 0.9, + "learning_rate": 5.752592426958764e-05, + "loss": 1.1995, + "step": 47000 + }, + { + "epoch": 0.9, + "learning_rate": 5.751099276468659e-05, + "loss": 1.3179, + "step": 47010 + }, + { + "epoch": 0.9, + "learning_rate": 5.7496060574459877e-05, + "loss": 1.2798, + "step": 47020 + }, + { + "epoch": 0.9, + "learning_rate": 5.748112770026994e-05, + "loss": 1.2668, + "step": 47030 + }, + { + "epoch": 0.9, + "learning_rate": 5.74661941434793e-05, + "loss": 1.1862, + "step": 47040 + }, + { + "epoch": 0.9, + "learning_rate": 5.745125990545056e-05, + "loss": 1.3306, + "step": 47050 + }, + { + "epoch": 0.9, + "learning_rate": 5.7436324987546365e-05, + "loss": 1.3527, + "step": 47060 + }, + { + "epoch": 0.91, + "learning_rate": 5.74213893911294e-05, + "loss": 1.2552, + "step": 47070 + }, + { + "epoch": 0.91, + "learning_rate": 5.740645311756245e-05, + "loss": 1.3138, + "step": 47080 + }, + { + "epoch": 0.91, + "learning_rate": 5.739151616820833e-05, + "loss": 1.1528, + "step": 47090 + }, + { + "epoch": 0.91, + "learning_rate": 5.737657854442996e-05, + "loss": 1.3394, + "step": 47100 + }, + { + "epoch": 0.91, + "learning_rate": 5.736164024759028e-05, + "loss": 1.3675, + "step": 47110 + }, + { + "epoch": 0.91, + "learning_rate": 5.734670127905228e-05, + "loss": 1.1041, + "step": 47120 + }, + { + "epoch": 0.91, + "learning_rate": 5.7331761640179084e-05, + "loss": 1.2755, + "step": 47130 + }, + { + "epoch": 0.91, + "learning_rate": 5.731682133233378e-05, + "loss": 1.1449, + "step": 47140 + }, + { + "epoch": 0.91, + "learning_rate": 5.730188035687961e-05, + "loss": 1.2011, + "step": 47150 + }, + { + "epoch": 0.91, + "learning_rate": 5.7286938715179814e-05, + "loss": 1.314, + "step": 47160 + }, + { + "epoch": 0.91, + "learning_rate": 5.727199640859773e-05, + "loss": 1.3122, + "step": 47170 + }, + { + "epoch": 0.91, + "learning_rate": 5.72570534384967e-05, + "loss": 1.308, + "step": 47180 + }, + { + "epoch": 0.91, + "learning_rate": 5.724210980624018e-05, + "loss": 1.3599, + "step": 47190 + }, + { + "epoch": 0.91, + "learning_rate": 5.7227165513191714e-05, + "loss": 1.058, + "step": 47200 + }, + { + "epoch": 0.91, + "learning_rate": 5.72122205607148e-05, + "loss": 1.2585, + "step": 47210 + }, + { + "epoch": 0.91, + "learning_rate": 5.719727495017313e-05, + "loss": 1.2368, + "step": 47220 + }, + { + "epoch": 0.91, + "learning_rate": 5.718232868293033e-05, + "loss": 1.1802, + "step": 47230 + }, + { + "epoch": 0.91, + "learning_rate": 5.716738176035015e-05, + "loss": 0.9619, + "step": 47240 + }, + { + "epoch": 0.91, + "learning_rate": 5.7152434183796424e-05, + "loss": 1.2784, + "step": 47250 + }, + { + "epoch": 0.91, + "learning_rate": 5.713748595463298e-05, + "loss": 1.3124, + "step": 47260 + }, + { + "epoch": 0.91, + "learning_rate": 5.712253707422377e-05, + "loss": 1.3039, + "step": 47270 + }, + { + "epoch": 0.91, + "learning_rate": 5.710758754393274e-05, + "loss": 1.5125, + "step": 47280 + }, + { + "epoch": 0.91, + "learning_rate": 5.709263736512396e-05, + "loss": 1.0233, + "step": 47290 + }, + { + "epoch": 0.91, + "learning_rate": 5.7077686539161515e-05, + "loss": 1.0014, + "step": 47300 + }, + { + "epoch": 0.91, + "learning_rate": 5.706273506740956e-05, + "loss": 1.1457, + "step": 47310 + }, + { + "epoch": 0.91, + "learning_rate": 5.704778295123234e-05, + "loss": 1.4484, + "step": 47320 + }, + { + "epoch": 0.91, + "learning_rate": 5.7032830191994094e-05, + "loss": 1.2449, + "step": 47330 + }, + { + "epoch": 0.91, + "learning_rate": 5.7017876791059176e-05, + "loss": 1.2105, + "step": 47340 + }, + { + "epoch": 0.91, + "learning_rate": 5.700292274979199e-05, + "loss": 1.4322, + "step": 47350 + }, + { + "epoch": 0.91, + "learning_rate": 5.698796806955695e-05, + "loss": 1.2236, + "step": 47360 + }, + { + "epoch": 0.91, + "learning_rate": 5.6973012751718624e-05, + "loss": 1.1892, + "step": 47370 + }, + { + "epoch": 0.91, + "learning_rate": 5.695805679764153e-05, + "loss": 1.5505, + "step": 47380 + }, + { + "epoch": 0.91, + "learning_rate": 5.694310020869031e-05, + "loss": 1.1827, + "step": 47390 + }, + { + "epoch": 0.91, + "learning_rate": 5.692814298622966e-05, + "loss": 1.1189, + "step": 47400 + }, + { + "epoch": 0.91, + "learning_rate": 5.691318513162429e-05, + "loss": 1.2189, + "step": 47410 + }, + { + "epoch": 0.91, + "learning_rate": 5.689822664623906e-05, + "loss": 1.2616, + "step": 47420 + }, + { + "epoch": 0.91, + "learning_rate": 5.6883267531438765e-05, + "loss": 1.2732, + "step": 47430 + }, + { + "epoch": 0.91, + "learning_rate": 5.686830778858835e-05, + "loss": 1.2872, + "step": 47440 + }, + { + "epoch": 0.91, + "learning_rate": 5.685334741905278e-05, + "loss": 1.278, + "step": 47450 + }, + { + "epoch": 0.91, + "learning_rate": 5.6838386424197084e-05, + "loss": 1.3536, + "step": 47460 + }, + { + "epoch": 0.91, + "learning_rate": 5.682342480538637e-05, + "loss": 1.2619, + "step": 47470 + }, + { + "epoch": 0.91, + "learning_rate": 5.680846256398574e-05, + "loss": 1.2299, + "step": 47480 + }, + { + "epoch": 0.91, + "learning_rate": 5.679349970136042e-05, + "loss": 1.3944, + "step": 47490 + }, + { + "epoch": 0.91, + "learning_rate": 5.6778536218875676e-05, + "loss": 1.2899, + "step": 47500 + }, + { + "epoch": 0.91, + "learning_rate": 5.676357211789679e-05, + "loss": 1.2917, + "step": 47510 + }, + { + "epoch": 0.91, + "learning_rate": 5.674860739978917e-05, + "loss": 1.061, + "step": 47520 + }, + { + "epoch": 0.91, + "learning_rate": 5.67336420659182e-05, + "loss": 1.1928, + "step": 47530 + }, + { + "epoch": 0.91, + "learning_rate": 5.6718676117649404e-05, + "loss": 1.3854, + "step": 47540 + }, + { + "epoch": 0.91, + "learning_rate": 5.6703709556348284e-05, + "loss": 0.9909, + "step": 47550 + }, + { + "epoch": 0.91, + "learning_rate": 5.6688742383380454e-05, + "loss": 1.3523, + "step": 47560 + }, + { + "epoch": 0.91, + "learning_rate": 5.667377460011158e-05, + "loss": 1.2299, + "step": 47570 + }, + { + "epoch": 0.91, + "learning_rate": 5.665880620790733e-05, + "loss": 1.2417, + "step": 47580 + }, + { + "epoch": 0.92, + "learning_rate": 5.664383720813349e-05, + "loss": 1.3399, + "step": 47590 + }, + { + "epoch": 0.92, + "learning_rate": 5.6628867602155863e-05, + "loss": 1.0172, + "step": 47600 + }, + { + "epoch": 0.92, + "learning_rate": 5.6613897391340343e-05, + "loss": 1.3082, + "step": 47610 + }, + { + "epoch": 0.92, + "learning_rate": 5.659892657705283e-05, + "loss": 1.3448, + "step": 47620 + }, + { + "epoch": 0.92, + "learning_rate": 5.658395516065933e-05, + "loss": 1.2026, + "step": 47630 + }, + { + "epoch": 0.92, + "learning_rate": 5.656898314352588e-05, + "loss": 1.2983, + "step": 47640 + }, + { + "epoch": 0.92, + "learning_rate": 5.655401052701853e-05, + "loss": 1.2483, + "step": 47650 + }, + { + "epoch": 0.92, + "learning_rate": 5.6539037312503485e-05, + "loss": 1.2147, + "step": 47660 + }, + { + "epoch": 0.92, + "learning_rate": 5.652406350134691e-05, + "loss": 1.1359, + "step": 47670 + }, + { + "epoch": 0.92, + "learning_rate": 5.650908909491508e-05, + "loss": 1.2807, + "step": 47680 + }, + { + "epoch": 0.92, + "learning_rate": 5.649411409457429e-05, + "loss": 1.4558, + "step": 47690 + }, + { + "epoch": 0.92, + "learning_rate": 5.6479138501690896e-05, + "loss": 1.4579, + "step": 47700 + }, + { + "epoch": 0.92, + "learning_rate": 5.6464162317631355e-05, + "loss": 1.2372, + "step": 47710 + }, + { + "epoch": 0.92, + "learning_rate": 5.6449185543762105e-05, + "loss": 0.9895, + "step": 47720 + }, + { + "epoch": 0.92, + "learning_rate": 5.6434208181449674e-05, + "loss": 1.2814, + "step": 47730 + }, + { + "epoch": 0.92, + "learning_rate": 5.641923023206066e-05, + "loss": 1.2588, + "step": 47740 + }, + { + "epoch": 0.92, + "learning_rate": 5.640425169696167e-05, + "loss": 1.2651, + "step": 47750 + }, + { + "epoch": 0.92, + "learning_rate": 5.6389272577519426e-05, + "loss": 1.1983, + "step": 47760 + }, + { + "epoch": 0.92, + "learning_rate": 5.637429287510064e-05, + "loss": 1.2406, + "step": 47770 + }, + { + "epoch": 0.92, + "learning_rate": 5.635931259107212e-05, + "loss": 1.1165, + "step": 47780 + }, + { + "epoch": 0.92, + "learning_rate": 5.634433172680071e-05, + "loss": 1.5445, + "step": 47790 + }, + { + "epoch": 0.92, + "learning_rate": 5.6329350283653295e-05, + "loss": 1.3053, + "step": 47800 + }, + { + "epoch": 0.92, + "learning_rate": 5.631436826299684e-05, + "loss": 1.1891, + "step": 47810 + }, + { + "epoch": 0.92, + "learning_rate": 5.6299385666198356e-05, + "loss": 1.1232, + "step": 47820 + }, + { + "epoch": 0.92, + "learning_rate": 5.628440249462489e-05, + "loss": 1.15, + "step": 47830 + }, + { + "epoch": 0.92, + "learning_rate": 5.626941874964354e-05, + "loss": 1.2495, + "step": 47840 + }, + { + "epoch": 0.92, + "learning_rate": 5.6254434432621496e-05, + "loss": 1.4001, + "step": 47850 + }, + { + "epoch": 0.92, + "learning_rate": 5.623944954492595e-05, + "loss": 1.321, + "step": 47860 + }, + { + "epoch": 0.92, + "learning_rate": 5.622446408792419e-05, + "loss": 1.0874, + "step": 47870 + }, + { + "epoch": 0.92, + "learning_rate": 5.620947806298351e-05, + "loss": 1.2628, + "step": 47880 + }, + { + "epoch": 0.92, + "learning_rate": 5.61944914714713e-05, + "loss": 1.2606, + "step": 47890 + }, + { + "epoch": 0.92, + "learning_rate": 5.617950431475496e-05, + "loss": 1.3286, + "step": 47900 + }, + { + "epoch": 0.92, + "learning_rate": 5.6164516594201986e-05, + "loss": 1.2909, + "step": 47910 + }, + { + "epoch": 0.92, + "learning_rate": 5.6149528311179886e-05, + "loss": 1.2387, + "step": 47920 + }, + { + "epoch": 0.92, + "learning_rate": 5.613453946705627e-05, + "loss": 1.3549, + "step": 47930 + }, + { + "epoch": 0.92, + "learning_rate": 5.6119550063198714e-05, + "loss": 1.2433, + "step": 47940 + }, + { + "epoch": 0.92, + "learning_rate": 5.6104560100974935e-05, + "loss": 1.2987, + "step": 47950 + }, + { + "epoch": 0.92, + "learning_rate": 5.6089569581752644e-05, + "loss": 1.4034, + "step": 47960 + }, + { + "epoch": 0.92, + "learning_rate": 5.607457850689962e-05, + "loss": 1.2956, + "step": 47970 + }, + { + "epoch": 0.92, + "learning_rate": 5.605958687778372e-05, + "loss": 1.5, + "step": 47980 + }, + { + "epoch": 0.92, + "learning_rate": 5.604459469577279e-05, + "loss": 1.1507, + "step": 47990 + }, + { + "epoch": 0.92, + "learning_rate": 5.602960196223478e-05, + "loss": 1.3989, + "step": 48000 + }, + { + "epoch": 0.92, + "learning_rate": 5.601460867853767e-05, + "loss": 1.3516, + "step": 48010 + }, + { + "epoch": 0.92, + "learning_rate": 5.59996148460495e-05, + "loss": 1.2525, + "step": 48020 + }, + { + "epoch": 0.92, + "learning_rate": 5.5984620466138346e-05, + "loss": 1.3429, + "step": 48030 + }, + { + "epoch": 0.92, + "learning_rate": 5.596962554017233e-05, + "loss": 1.3668, + "step": 48040 + }, + { + "epoch": 0.92, + "learning_rate": 5.5954630069519657e-05, + "loss": 1.2796, + "step": 48050 + }, + { + "epoch": 0.92, + "learning_rate": 5.593963405554854e-05, + "loss": 1.2219, + "step": 48060 + }, + { + "epoch": 0.92, + "learning_rate": 5.5924637499627254e-05, + "loss": 1.2098, + "step": 48070 + }, + { + "epoch": 0.92, + "learning_rate": 5.590964040312416e-05, + "loss": 1.2002, + "step": 48080 + }, + { + "epoch": 0.92, + "learning_rate": 5.5894642767407615e-05, + "loss": 1.2234, + "step": 48090 + }, + { + "epoch": 0.92, + "learning_rate": 5.587964459384606e-05, + "loss": 1.1679, + "step": 48100 + }, + { + "epoch": 0.93, + "learning_rate": 5.586464588380798e-05, + "loss": 1.1805, + "step": 48110 + }, + { + "epoch": 0.93, + "learning_rate": 5.5849646638661853e-05, + "loss": 1.3435, + "step": 48120 + }, + { + "epoch": 0.93, + "learning_rate": 5.583464685977634e-05, + "loss": 1.2777, + "step": 48130 + }, + { + "epoch": 0.93, + "learning_rate": 5.5819646548519986e-05, + "loss": 1.3938, + "step": 48140 + }, + { + "epoch": 0.93, + "learning_rate": 5.5804645706261514e-05, + "loss": 1.1454, + "step": 48150 + }, + { + "epoch": 0.93, + "learning_rate": 5.5789644334369636e-05, + "loss": 1.6416, + "step": 48160 + }, + { + "epoch": 0.93, + "learning_rate": 5.57746424342131e-05, + "loss": 1.3286, + "step": 48170 + }, + { + "epoch": 0.93, + "learning_rate": 5.5759640007160766e-05, + "loss": 1.3975, + "step": 48180 + }, + { + "epoch": 0.93, + "learning_rate": 5.574463705458145e-05, + "loss": 1.4875, + "step": 48190 + }, + { + "epoch": 0.93, + "learning_rate": 5.572963357784411e-05, + "loss": 1.5109, + "step": 48200 + }, + { + "epoch": 0.93, + "learning_rate": 5.571462957831768e-05, + "loss": 1.1065, + "step": 48210 + }, + { + "epoch": 0.93, + "learning_rate": 5.5699625057371194e-05, + "loss": 1.2431, + "step": 48220 + }, + { + "epoch": 0.93, + "learning_rate": 5.568462001637371e-05, + "loss": 1.1877, + "step": 48230 + }, + { + "epoch": 0.93, + "learning_rate": 5.56696144566943e-05, + "loss": 1.2013, + "step": 48240 + }, + { + "epoch": 0.93, + "learning_rate": 5.5654608379702145e-05, + "loss": 1.2246, + "step": 48250 + }, + { + "epoch": 0.93, + "learning_rate": 5.5639601786766436e-05, + "loss": 0.999, + "step": 48260 + }, + { + "epoch": 0.93, + "learning_rate": 5.562459467925643e-05, + "loss": 1.3148, + "step": 48270 + }, + { + "epoch": 0.93, + "learning_rate": 5.56095870585414e-05, + "loss": 1.366, + "step": 48280 + }, + { + "epoch": 0.93, + "learning_rate": 5.5594578925990714e-05, + "loss": 1.018, + "step": 48290 + }, + { + "epoch": 0.93, + "learning_rate": 5.5579570282973735e-05, + "loss": 1.1258, + "step": 48300 + }, + { + "epoch": 0.93, + "learning_rate": 5.55645611308599e-05, + "loss": 1.2357, + "step": 48310 + }, + { + "epoch": 0.93, + "learning_rate": 5.554955147101871e-05, + "loss": 1.1582, + "step": 48320 + }, + { + "epoch": 0.93, + "learning_rate": 5.5534541304819674e-05, + "loss": 1.3045, + "step": 48330 + }, + { + "epoch": 0.93, + "learning_rate": 5.5519530633632366e-05, + "loss": 1.266, + "step": 48340 + }, + { + "epoch": 0.93, + "learning_rate": 5.5504519458826406e-05, + "loss": 1.296, + "step": 48350 + }, + { + "epoch": 0.93, + "learning_rate": 5.5489507781771454e-05, + "loss": 1.3603, + "step": 48360 + }, + { + "epoch": 0.93, + "learning_rate": 5.547449560383724e-05, + "loss": 1.2973, + "step": 48370 + }, + { + "epoch": 0.93, + "learning_rate": 5.5459482926393515e-05, + "loss": 1.3142, + "step": 48380 + }, + { + "epoch": 0.93, + "learning_rate": 5.5444469750810055e-05, + "loss": 1.3363, + "step": 48390 + }, + { + "epoch": 0.93, + "learning_rate": 5.542945607845674e-05, + "loss": 1.1919, + "step": 48400 + }, + { + "epoch": 0.93, + "learning_rate": 5.541444191070343e-05, + "loss": 1.3416, + "step": 48410 + }, + { + "epoch": 0.93, + "learning_rate": 5.53994272489201e-05, + "loss": 1.1561, + "step": 48420 + }, + { + "epoch": 0.93, + "learning_rate": 5.538441209447671e-05, + "loss": 1.2199, + "step": 48430 + }, + { + "epoch": 0.93, + "learning_rate": 5.536939644874329e-05, + "loss": 1.3491, + "step": 48440 + }, + { + "epoch": 0.93, + "learning_rate": 5.5354380313089925e-05, + "loss": 1.2251, + "step": 48450 + }, + { + "epoch": 0.93, + "learning_rate": 5.533936368888671e-05, + "loss": 1.1191, + "step": 48460 + }, + { + "epoch": 0.93, + "learning_rate": 5.532434657750384e-05, + "loss": 1.2545, + "step": 48470 + }, + { + "epoch": 0.93, + "learning_rate": 5.5309328980311493e-05, + "loss": 1.303, + "step": 48480 + }, + { + "epoch": 0.93, + "learning_rate": 5.5294310898679925e-05, + "loss": 1.1856, + "step": 48490 + }, + { + "epoch": 0.93, + "learning_rate": 5.5279292333979436e-05, + "loss": 1.2177, + "step": 48500 + }, + { + "epoch": 0.93, + "learning_rate": 5.526427328758036e-05, + "loss": 1.336, + "step": 48510 + }, + { + "epoch": 0.93, + "learning_rate": 5.52492537608531e-05, + "loss": 1.6078, + "step": 48520 + }, + { + "epoch": 0.93, + "learning_rate": 5.523423375516806e-05, + "loss": 1.2114, + "step": 48530 + }, + { + "epoch": 0.93, + "learning_rate": 5.521921327189572e-05, + "loss": 1.2961, + "step": 48540 + }, + { + "epoch": 0.93, + "learning_rate": 5.52041923124066e-05, + "loss": 1.3463, + "step": 48550 + }, + { + "epoch": 0.93, + "learning_rate": 5.518917087807123e-05, + "loss": 1.5425, + "step": 48560 + }, + { + "epoch": 0.93, + "learning_rate": 5.517414897026025e-05, + "loss": 1.0238, + "step": 48570 + }, + { + "epoch": 0.93, + "learning_rate": 5.515912659034428e-05, + "loss": 1.1294, + "step": 48580 + }, + { + "epoch": 0.93, + "learning_rate": 5.514410373969402e-05, + "loss": 1.2454, + "step": 48590 + }, + { + "epoch": 0.93, + "learning_rate": 5.512908041968018e-05, + "loss": 1.2068, + "step": 48600 + }, + { + "epoch": 0.93, + "learning_rate": 5.511405663167355e-05, + "loss": 1.3181, + "step": 48610 + }, + { + "epoch": 0.93, + "learning_rate": 5.509903237704494e-05, + "loss": 1.3094, + "step": 48620 + }, + { + "epoch": 0.94, + "learning_rate": 5.508400765716523e-05, + "loss": 1.208, + "step": 48630 + }, + { + "epoch": 0.94, + "learning_rate": 5.506898247340529e-05, + "loss": 1.288, + "step": 48640 + }, + { + "epoch": 0.94, + "learning_rate": 5.505395682713607e-05, + "loss": 1.4243, + "step": 48650 + }, + { + "epoch": 0.94, + "learning_rate": 5.5038930719728565e-05, + "loss": 1.3259, + "step": 48660 + }, + { + "epoch": 0.94, + "learning_rate": 5.5023904152553796e-05, + "loss": 1.2286, + "step": 48670 + }, + { + "epoch": 0.94, + "learning_rate": 5.500887712698284e-05, + "loss": 1.3015, + "step": 48680 + }, + { + "epoch": 0.94, + "learning_rate": 5.4993849644386795e-05, + "loss": 1.3733, + "step": 48690 + }, + { + "epoch": 0.94, + "learning_rate": 5.4978821706136816e-05, + "loss": 1.2165, + "step": 48700 + }, + { + "epoch": 0.94, + "learning_rate": 5.4963793313604114e-05, + "loss": 1.4424, + "step": 48710 + }, + { + "epoch": 0.94, + "learning_rate": 5.494876446815992e-05, + "loss": 1.1533, + "step": 48720 + }, + { + "epoch": 0.94, + "learning_rate": 5.4933735171175494e-05, + "loss": 1.1578, + "step": 48730 + }, + { + "epoch": 0.94, + "learning_rate": 5.4918705424022166e-05, + "loss": 1.1721, + "step": 48740 + }, + { + "epoch": 0.94, + "learning_rate": 5.4903675228071284e-05, + "loss": 1.4644, + "step": 48750 + }, + { + "epoch": 0.94, + "learning_rate": 5.488864458469427e-05, + "loss": 1.4237, + "step": 48760 + }, + { + "epoch": 0.94, + "learning_rate": 5.487361349526257e-05, + "loss": 1.2883, + "step": 48770 + }, + { + "epoch": 0.94, + "learning_rate": 5.4858581961147616e-05, + "loss": 1.1601, + "step": 48780 + }, + { + "epoch": 0.94, + "learning_rate": 5.4843549983721e-05, + "loss": 1.1388, + "step": 48790 + }, + { + "epoch": 0.94, + "learning_rate": 5.482851756435423e-05, + "loss": 1.3727, + "step": 48800 + }, + { + "epoch": 0.94, + "learning_rate": 5.481348470441894e-05, + "loss": 1.1535, + "step": 48810 + }, + { + "epoch": 0.94, + "learning_rate": 5.479845140528675e-05, + "loss": 0.9777, + "step": 48820 + }, + { + "epoch": 0.94, + "learning_rate": 5.478341766832936e-05, + "loss": 1.2298, + "step": 48830 + }, + { + "epoch": 0.94, + "learning_rate": 5.476838349491851e-05, + "loss": 1.3673, + "step": 48840 + }, + { + "epoch": 0.94, + "learning_rate": 5.4753348886425916e-05, + "loss": 1.2185, + "step": 48850 + }, + { + "epoch": 0.94, + "learning_rate": 5.4738313844223433e-05, + "loss": 1.3933, + "step": 48860 + }, + { + "epoch": 0.94, + "learning_rate": 5.472327836968285e-05, + "loss": 1.0845, + "step": 48870 + }, + { + "epoch": 0.94, + "learning_rate": 5.470824246417611e-05, + "loss": 1.2873, + "step": 48880 + }, + { + "epoch": 0.94, + "learning_rate": 5.4693206129075105e-05, + "loss": 1.4896, + "step": 48890 + }, + { + "epoch": 0.94, + "learning_rate": 5.4678169365751764e-05, + "loss": 1.3495, + "step": 48900 + }, + { + "epoch": 0.94, + "learning_rate": 5.4663132175578135e-05, + "loss": 1.2707, + "step": 48910 + }, + { + "epoch": 0.94, + "learning_rate": 5.4648094559926223e-05, + "loss": 1.26, + "step": 48920 + }, + { + "epoch": 0.94, + "learning_rate": 5.4633056520168134e-05, + "loss": 1.3458, + "step": 48930 + }, + { + "epoch": 0.94, + "learning_rate": 5.461801805767598e-05, + "loss": 1.3453, + "step": 48940 + }, + { + "epoch": 0.94, + "learning_rate": 5.46029791738219e-05, + "loss": 1.1922, + "step": 48950 + }, + { + "epoch": 0.94, + "learning_rate": 5.458793986997809e-05, + "loss": 1.4255, + "step": 48960 + }, + { + "epoch": 0.94, + "learning_rate": 5.457290014751677e-05, + "loss": 1.3661, + "step": 48970 + }, + { + "epoch": 0.94, + "learning_rate": 5.4557860007810246e-05, + "loss": 1.2956, + "step": 48980 + }, + { + "epoch": 0.94, + "learning_rate": 5.454281945223081e-05, + "loss": 1.1534, + "step": 48990 + }, + { + "epoch": 0.94, + "learning_rate": 5.452777848215078e-05, + "loss": 1.1886, + "step": 49000 + }, + { + "epoch": 0.94, + "learning_rate": 5.451273709894258e-05, + "loss": 1.2293, + "step": 49010 + }, + { + "epoch": 0.94, + "learning_rate": 5.44976953039786e-05, + "loss": 1.1047, + "step": 49020 + }, + { + "epoch": 0.94, + "learning_rate": 5.448265309863132e-05, + "loss": 1.3792, + "step": 49030 + }, + { + "epoch": 0.94, + "learning_rate": 5.446761048427323e-05, + "loss": 1.3, + "step": 49040 + }, + { + "epoch": 0.94, + "learning_rate": 5.445256746227687e-05, + "loss": 1.1171, + "step": 49050 + }, + { + "epoch": 0.94, + "learning_rate": 5.4437524034014784e-05, + "loss": 1.1444, + "step": 49060 + }, + { + "epoch": 0.94, + "learning_rate": 5.442248020085961e-05, + "loss": 1.362, + "step": 49070 + }, + { + "epoch": 0.94, + "learning_rate": 5.4407435964183986e-05, + "loss": 1.282, + "step": 49080 + }, + { + "epoch": 0.94, + "learning_rate": 5.439239132536058e-05, + "loss": 1.2146, + "step": 49090 + }, + { + "epoch": 0.94, + "learning_rate": 5.437734628576212e-05, + "loss": 1.5993, + "step": 49100 + }, + { + "epoch": 0.94, + "learning_rate": 5.436230084676136e-05, + "loss": 1.1151, + "step": 49110 + }, + { + "epoch": 0.94, + "learning_rate": 5.434725500973109e-05, + "loss": 1.3419, + "step": 49120 + }, + { + "epoch": 0.94, + "learning_rate": 5.433220877604415e-05, + "loss": 1.5298, + "step": 49130 + }, + { + "epoch": 0.94, + "learning_rate": 5.431716214707338e-05, + "loss": 1.1774, + "step": 49140 + }, + { + "epoch": 0.95, + "learning_rate": 5.43021151241917e-05, + "loss": 1.4273, + "step": 49150 + }, + { + "epoch": 0.95, + "learning_rate": 5.428706770877203e-05, + "loss": 1.2264, + "step": 49160 + }, + { + "epoch": 0.95, + "learning_rate": 5.427201990218735e-05, + "loss": 1.0585, + "step": 49170 + }, + { + "epoch": 0.95, + "learning_rate": 5.4256971705810674e-05, + "loss": 1.4064, + "step": 49180 + }, + { + "epoch": 0.95, + "learning_rate": 5.424192312101505e-05, + "loss": 1.3312, + "step": 49190 + }, + { + "epoch": 0.95, + "learning_rate": 5.422687414917354e-05, + "loss": 1.1178, + "step": 49200 + }, + { + "epoch": 0.95, + "learning_rate": 5.4211824791659246e-05, + "loss": 1.181, + "step": 49210 + }, + { + "epoch": 0.95, + "learning_rate": 5.419677504984534e-05, + "loss": 1.5156, + "step": 49220 + }, + { + "epoch": 0.95, + "learning_rate": 5.4181724925105006e-05, + "loss": 1.4541, + "step": 49230 + }, + { + "epoch": 0.95, + "learning_rate": 5.4166674418811456e-05, + "loss": 1.3231, + "step": 49240 + }, + { + "epoch": 0.95, + "learning_rate": 5.415162353233795e-05, + "loss": 1.2137, + "step": 49250 + }, + { + "epoch": 0.95, + "learning_rate": 5.413657226705775e-05, + "loss": 1.1452, + "step": 49260 + }, + { + "epoch": 0.95, + "learning_rate": 5.412152062434421e-05, + "loss": 1.3388, + "step": 49270 + }, + { + "epoch": 0.95, + "learning_rate": 5.410646860557068e-05, + "loss": 1.2464, + "step": 49280 + }, + { + "epoch": 0.95, + "learning_rate": 5.409141621211055e-05, + "loss": 1.2869, + "step": 49290 + }, + { + "epoch": 0.95, + "learning_rate": 5.407636344533724e-05, + "loss": 1.2331, + "step": 49300 + }, + { + "epoch": 0.95, + "learning_rate": 5.40613103066242e-05, + "loss": 1.287, + "step": 49310 + }, + { + "epoch": 0.95, + "learning_rate": 5.404625679734495e-05, + "loss": 1.1255, + "step": 49320 + }, + { + "epoch": 0.95, + "learning_rate": 5.4031202918873014e-05, + "loss": 1.2168, + "step": 49330 + }, + { + "epoch": 0.95, + "learning_rate": 5.4016148672581935e-05, + "loss": 1.1822, + "step": 49340 + }, + { + "epoch": 0.95, + "learning_rate": 5.400109405984533e-05, + "loss": 1.0959, + "step": 49350 + }, + { + "epoch": 0.95, + "learning_rate": 5.398603908203679e-05, + "loss": 1.1623, + "step": 49360 + }, + { + "epoch": 0.95, + "learning_rate": 5.3970983740530015e-05, + "loss": 1.2668, + "step": 49370 + }, + { + "epoch": 0.95, + "learning_rate": 5.395592803669869e-05, + "loss": 1.2985, + "step": 49380 + }, + { + "epoch": 0.95, + "learning_rate": 5.394087197191654e-05, + "loss": 1.3535, + "step": 49390 + }, + { + "epoch": 0.95, + "learning_rate": 5.3925815547557326e-05, + "loss": 1.4672, + "step": 49400 + }, + { + "epoch": 0.95, + "learning_rate": 5.391075876499483e-05, + "loss": 1.1933, + "step": 49410 + }, + { + "epoch": 0.95, + "learning_rate": 5.389570162560289e-05, + "loss": 1.1542, + "step": 49420 + }, + { + "epoch": 0.95, + "learning_rate": 5.388064413075537e-05, + "loss": 1.3368, + "step": 49430 + }, + { + "epoch": 0.95, + "learning_rate": 5.386558628182616e-05, + "loss": 1.3574, + "step": 49440 + }, + { + "epoch": 0.95, + "learning_rate": 5.385052808018918e-05, + "loss": 1.5783, + "step": 49450 + }, + { + "epoch": 0.95, + "learning_rate": 5.383546952721838e-05, + "loss": 1.2639, + "step": 49460 + }, + { + "epoch": 0.95, + "learning_rate": 5.382041062428774e-05, + "loss": 1.2551, + "step": 49470 + }, + { + "epoch": 0.95, + "learning_rate": 5.380535137277132e-05, + "loss": 1.2416, + "step": 49480 + }, + { + "epoch": 0.95, + "learning_rate": 5.379029177404312e-05, + "loss": 1.3656, + "step": 49490 + }, + { + "epoch": 0.95, + "learning_rate": 5.377523182947726e-05, + "loss": 1.4326, + "step": 49500 + }, + { + "epoch": 0.95, + "learning_rate": 5.3760171540447835e-05, + "loss": 1.0762, + "step": 49510 + }, + { + "epoch": 0.95, + "learning_rate": 5.3745110908329e-05, + "loss": 1.2656, + "step": 49520 + }, + { + "epoch": 0.95, + "learning_rate": 5.373004993449493e-05, + "loss": 1.2891, + "step": 49530 + }, + { + "epoch": 0.95, + "learning_rate": 5.371498862031985e-05, + "loss": 1.15, + "step": 49540 + }, + { + "epoch": 0.95, + "learning_rate": 5.369992696717797e-05, + "loss": 1.3196, + "step": 49550 + }, + { + "epoch": 0.95, + "learning_rate": 5.368486497644357e-05, + "loss": 1.2544, + "step": 49560 + }, + { + "epoch": 0.95, + "learning_rate": 5.366980264949098e-05, + "loss": 1.1986, + "step": 49570 + }, + { + "epoch": 0.95, + "learning_rate": 5.365473998769448e-05, + "loss": 1.3477, + "step": 49580 + }, + { + "epoch": 0.95, + "learning_rate": 5.363967699242849e-05, + "loss": 1.2976, + "step": 49590 + }, + { + "epoch": 0.95, + "learning_rate": 5.362461366506735e-05, + "loss": 1.1523, + "step": 49600 + }, + { + "epoch": 0.95, + "learning_rate": 5.360955000698552e-05, + "loss": 1.3105, + "step": 49610 + }, + { + "epoch": 0.95, + "learning_rate": 5.359448601955745e-05, + "loss": 1.2679, + "step": 49620 + }, + { + "epoch": 0.95, + "learning_rate": 5.357942170415759e-05, + "loss": 1.2758, + "step": 49630 + }, + { + "epoch": 0.95, + "learning_rate": 5.356435706216051e-05, + "loss": 1.2136, + "step": 49640 + }, + { + "epoch": 0.95, + "learning_rate": 5.354929209494071e-05, + "loss": 1.1862, + "step": 49650 + }, + { + "epoch": 0.95, + "learning_rate": 5.353422680387278e-05, + "loss": 1.2517, + "step": 49660 + }, + { + "epoch": 0.96, + "learning_rate": 5.351916119033131e-05, + "loss": 1.5123, + "step": 49670 + }, + { + "epoch": 0.96, + "learning_rate": 5.3504095255690944e-05, + "loss": 1.1377, + "step": 49680 + }, + { + "epoch": 0.96, + "learning_rate": 5.3489029001326354e-05, + "loss": 1.3096, + "step": 49690 + }, + { + "epoch": 0.96, + "learning_rate": 5.34739624286122e-05, + "loss": 1.301, + "step": 49700 + }, + { + "epoch": 0.96, + "learning_rate": 5.3458895538923226e-05, + "loss": 1.2684, + "step": 49710 + }, + { + "epoch": 0.96, + "learning_rate": 5.3443828333634184e-05, + "loss": 1.175, + "step": 49720 + }, + { + "epoch": 0.96, + "learning_rate": 5.342876081411982e-05, + "loss": 1.2661, + "step": 49730 + }, + { + "epoch": 0.96, + "learning_rate": 5.341369298175497e-05, + "loss": 1.3877, + "step": 49740 + }, + { + "epoch": 0.96, + "learning_rate": 5.3398624837914454e-05, + "loss": 1.0107, + "step": 49750 + }, + { + "epoch": 0.96, + "learning_rate": 5.3383556383973155e-05, + "loss": 1.2434, + "step": 49760 + }, + { + "epoch": 0.96, + "learning_rate": 5.336848762130594e-05, + "loss": 1.3279, + "step": 49770 + }, + { + "epoch": 0.96, + "learning_rate": 5.335341855128773e-05, + "loss": 1.4296, + "step": 49780 + }, + { + "epoch": 0.96, + "learning_rate": 5.333834917529348e-05, + "loss": 1.2114, + "step": 49790 + }, + { + "epoch": 0.96, + "learning_rate": 5.3323279494698176e-05, + "loss": 1.2811, + "step": 49800 + }, + { + "epoch": 0.96, + "learning_rate": 5.3308209510876806e-05, + "loss": 1.2556, + "step": 49810 + }, + { + "epoch": 0.96, + "learning_rate": 5.329313922520442e-05, + "loss": 1.1493, + "step": 49820 + }, + { + "epoch": 0.96, + "learning_rate": 5.3278068639056035e-05, + "loss": 1.1834, + "step": 49830 + }, + { + "epoch": 0.96, + "learning_rate": 5.326299775380677e-05, + "loss": 1.1801, + "step": 49840 + }, + { + "epoch": 0.96, + "learning_rate": 5.324792657083175e-05, + "loss": 1.1585, + "step": 49850 + }, + { + "epoch": 0.96, + "learning_rate": 5.323285509150609e-05, + "loss": 1.2594, + "step": 49860 + }, + { + "epoch": 0.96, + "learning_rate": 5.321778331720495e-05, + "loss": 1.3213, + "step": 49870 + }, + { + "epoch": 0.96, + "learning_rate": 5.320271124930355e-05, + "loss": 1.2639, + "step": 49880 + }, + { + "epoch": 0.96, + "learning_rate": 5.318763888917711e-05, + "loss": 1.181, + "step": 49890 + }, + { + "epoch": 0.96, + "learning_rate": 5.317256623820085e-05, + "loss": 1.0944, + "step": 49900 + }, + { + "epoch": 0.96, + "learning_rate": 5.315749329775007e-05, + "loss": 1.0444, + "step": 49910 + }, + { + "epoch": 0.96, + "learning_rate": 5.314242006920005e-05, + "loss": 1.3899, + "step": 49920 + }, + { + "epoch": 0.96, + "learning_rate": 5.3127346553926135e-05, + "loss": 1.4084, + "step": 49930 + }, + { + "epoch": 0.96, + "learning_rate": 5.311227275330368e-05, + "loss": 1.3878, + "step": 49940 + }, + { + "epoch": 0.96, + "learning_rate": 5.309719866870806e-05, + "loss": 1.3662, + "step": 49950 + }, + { + "epoch": 0.96, + "learning_rate": 5.308212430151467e-05, + "loss": 1.1183, + "step": 49960 + }, + { + "epoch": 0.96, + "learning_rate": 5.306704965309893e-05, + "loss": 1.2649, + "step": 49970 + }, + { + "epoch": 0.96, + "learning_rate": 5.305197472483634e-05, + "loss": 1.2816, + "step": 49980 + }, + { + "epoch": 0.96, + "learning_rate": 5.303689951810234e-05, + "loss": 1.306, + "step": 49990 + }, + { + "epoch": 0.96, + "learning_rate": 5.302182403427247e-05, + "loss": 1.1412, + "step": 50000 + }, + { + "epoch": 0.96, + "learning_rate": 5.300674827472223e-05, + "loss": 1.4391, + "step": 50010 + }, + { + "epoch": 0.96, + "learning_rate": 5.2991672240827194e-05, + "loss": 1.1872, + "step": 50020 + }, + { + "epoch": 0.96, + "learning_rate": 5.2976595933962946e-05, + "loss": 1.1904, + "step": 50030 + }, + { + "epoch": 0.96, + "learning_rate": 5.29615193555051e-05, + "loss": 1.3628, + "step": 50040 + }, + { + "epoch": 0.96, + "learning_rate": 5.294644250682927e-05, + "loss": 1.0709, + "step": 50050 + }, + { + "epoch": 0.96, + "learning_rate": 5.293136538931114e-05, + "loss": 1.4487, + "step": 50060 + }, + { + "epoch": 0.96, + "learning_rate": 5.2916288004326354e-05, + "loss": 1.4438, + "step": 50070 + }, + { + "epoch": 0.96, + "learning_rate": 5.2901210353250654e-05, + "loss": 1.4214, + "step": 50080 + }, + { + "epoch": 0.96, + "learning_rate": 5.288613243745974e-05, + "loss": 1.2682, + "step": 50090 + }, + { + "epoch": 0.96, + "learning_rate": 5.287105425832941e-05, + "loss": 1.4497, + "step": 50100 + }, + { + "epoch": 0.96, + "learning_rate": 5.28559758172354e-05, + "loss": 1.2125, + "step": 50110 + }, + { + "epoch": 0.96, + "learning_rate": 5.2840897115553525e-05, + "loss": 1.2984, + "step": 50120 + }, + { + "epoch": 0.96, + "learning_rate": 5.282581815465961e-05, + "loss": 1.2022, + "step": 50130 + }, + { + "epoch": 0.96, + "learning_rate": 5.2810738935929526e-05, + "loss": 1.163, + "step": 50140 + }, + { + "epoch": 0.96, + "learning_rate": 5.279565946073912e-05, + "loss": 1.2733, + "step": 50150 + }, + { + "epoch": 0.96, + "learning_rate": 5.278057973046431e-05, + "loss": 1.1092, + "step": 50160 + }, + { + "epoch": 0.96, + "learning_rate": 5.276549974648099e-05, + "loss": 1.2164, + "step": 50170 + }, + { + "epoch": 0.96, + "learning_rate": 5.275041951016512e-05, + "loss": 1.4442, + "step": 50180 + }, + { + "epoch": 0.97, + "learning_rate": 5.273533902289266e-05, + "loss": 1.274, + "step": 50190 + }, + { + "epoch": 0.97, + "learning_rate": 5.272025828603963e-05, + "loss": 1.2361, + "step": 50200 + }, + { + "epoch": 0.97, + "learning_rate": 5.270517730098199e-05, + "loss": 1.3723, + "step": 50210 + }, + { + "epoch": 0.97, + "learning_rate": 5.269009606909579e-05, + "loss": 1.0709, + "step": 50220 + }, + { + "epoch": 0.97, + "learning_rate": 5.2675014591757124e-05, + "loss": 1.2967, + "step": 50230 + }, + { + "epoch": 0.97, + "learning_rate": 5.2659932870342035e-05, + "loss": 1.3665, + "step": 50240 + }, + { + "epoch": 0.97, + "learning_rate": 5.2644850906226637e-05, + "loss": 1.2112, + "step": 50250 + }, + { + "epoch": 0.97, + "learning_rate": 5.262976870078704e-05, + "loss": 1.4384, + "step": 50260 + }, + { + "epoch": 0.97, + "learning_rate": 5.2614686255399425e-05, + "loss": 1.3267, + "step": 50270 + }, + { + "epoch": 0.97, + "learning_rate": 5.259960357143993e-05, + "loss": 1.5372, + "step": 50280 + }, + { + "epoch": 0.97, + "learning_rate": 5.258452065028473e-05, + "loss": 1.4847, + "step": 50290 + }, + { + "epoch": 0.97, + "learning_rate": 5.2569437493310084e-05, + "loss": 1.2418, + "step": 50300 + }, + { + "epoch": 0.97, + "learning_rate": 5.2554354101892175e-05, + "loss": 1.3173, + "step": 50310 + }, + { + "epoch": 0.97, + "learning_rate": 5.2539270477407296e-05, + "loss": 1.2097, + "step": 50320 + }, + { + "epoch": 0.97, + "learning_rate": 5.2524186621231707e-05, + "loss": 1.2524, + "step": 50330 + }, + { + "epoch": 0.97, + "learning_rate": 5.250910253474169e-05, + "loss": 1.1287, + "step": 50340 + }, + { + "epoch": 0.97, + "learning_rate": 5.24940182193136e-05, + "loss": 1.3282, + "step": 50350 + }, + { + "epoch": 0.97, + "learning_rate": 5.2478933676323737e-05, + "loss": 1.2453, + "step": 50360 + }, + { + "epoch": 0.97, + "learning_rate": 5.2463848907148484e-05, + "loss": 1.2691, + "step": 50370 + }, + { + "epoch": 0.97, + "learning_rate": 5.2448763913164215e-05, + "loss": 1.3254, + "step": 50380 + }, + { + "epoch": 0.97, + "learning_rate": 5.243367869574731e-05, + "loss": 1.3074, + "step": 50390 + }, + { + "epoch": 0.97, + "learning_rate": 5.241859325627423e-05, + "loss": 1.2026, + "step": 50400 + }, + { + "epoch": 0.97, + "learning_rate": 5.2403507596121385e-05, + "loss": 1.3197, + "step": 50410 + }, + { + "epoch": 0.97, + "learning_rate": 5.238842171666524e-05, + "loss": 1.2421, + "step": 50420 + }, + { + "epoch": 0.97, + "learning_rate": 5.237333561928229e-05, + "loss": 1.4447, + "step": 50430 + }, + { + "epoch": 0.97, + "learning_rate": 5.235824930534902e-05, + "loss": 1.0364, + "step": 50440 + }, + { + "epoch": 0.97, + "learning_rate": 5.234316277624197e-05, + "loss": 1.3153, + "step": 50450 + }, + { + "epoch": 0.97, + "learning_rate": 5.232807603333766e-05, + "loss": 1.1723, + "step": 50460 + }, + { + "epoch": 0.97, + "learning_rate": 5.2312989078012665e-05, + "loss": 1.2589, + "step": 50470 + }, + { + "epoch": 0.97, + "learning_rate": 5.229790191164355e-05, + "loss": 1.4622, + "step": 50480 + }, + { + "epoch": 0.97, + "learning_rate": 5.228281453560693e-05, + "loss": 1.3886, + "step": 50490 + }, + { + "epoch": 0.97, + "learning_rate": 5.2267726951279425e-05, + "loss": 1.1611, + "step": 50500 + }, + { + "epoch": 0.97, + "learning_rate": 5.225263916003764e-05, + "loss": 1.3335, + "step": 50510 + }, + { + "epoch": 0.97, + "learning_rate": 5.223755116325827e-05, + "loss": 1.1589, + "step": 50520 + }, + { + "epoch": 0.97, + "learning_rate": 5.222246296231795e-05, + "loss": 1.1977, + "step": 50530 + }, + { + "epoch": 0.97, + "learning_rate": 5.2207374558593414e-05, + "loss": 1.3142, + "step": 50540 + }, + { + "epoch": 0.97, + "learning_rate": 5.2192285953461354e-05, + "loss": 1.2057, + "step": 50550 + }, + { + "epoch": 0.97, + "learning_rate": 5.21771971482985e-05, + "loss": 1.3651, + "step": 50560 + }, + { + "epoch": 0.97, + "learning_rate": 5.216210814448159e-05, + "loss": 1.4046, + "step": 50570 + }, + { + "epoch": 0.97, + "learning_rate": 5.214701894338741e-05, + "loss": 1.3616, + "step": 50580 + }, + { + "epoch": 0.97, + "learning_rate": 5.213192954639273e-05, + "loss": 1.3452, + "step": 50590 + }, + { + "epoch": 0.97, + "learning_rate": 5.2116839954874365e-05, + "loss": 1.3, + "step": 50600 + }, + { + "epoch": 0.97, + "learning_rate": 5.2101750170209116e-05, + "loss": 1.4873, + "step": 50610 + }, + { + "epoch": 0.97, + "learning_rate": 5.208666019377384e-05, + "loss": 1.1537, + "step": 50620 + }, + { + "epoch": 0.97, + "learning_rate": 5.2071570026945374e-05, + "loss": 1.3788, + "step": 50630 + }, + { + "epoch": 0.97, + "learning_rate": 5.2056479671100614e-05, + "loss": 1.3261, + "step": 50640 + }, + { + "epoch": 0.97, + "learning_rate": 5.2041389127616426e-05, + "loss": 1.4346, + "step": 50650 + }, + { + "epoch": 0.97, + "learning_rate": 5.2026298397869734e-05, + "loss": 1.3263, + "step": 50660 + }, + { + "epoch": 0.97, + "learning_rate": 5.201120748323745e-05, + "loss": 1.4491, + "step": 50670 + }, + { + "epoch": 0.97, + "learning_rate": 5.1996116385096515e-05, + "loss": 1.2181, + "step": 50680 + }, + { + "epoch": 0.97, + "learning_rate": 5.19810251048239e-05, + "loss": 1.152, + "step": 50690 + }, + { + "epoch": 0.97, + "learning_rate": 5.196593364379656e-05, + "loss": 1.3625, + "step": 50700 + }, + { + "epoch": 0.98, + "learning_rate": 5.195084200339151e-05, + "loss": 1.2004, + "step": 50710 + }, + { + "epoch": 0.98, + "learning_rate": 5.193575018498573e-05, + "loss": 1.3543, + "step": 50720 + }, + { + "epoch": 0.98, + "learning_rate": 5.192065818995625e-05, + "loss": 1.6968, + "step": 50730 + }, + { + "epoch": 0.98, + "learning_rate": 5.190556601968012e-05, + "loss": 1.3563, + "step": 50740 + }, + { + "epoch": 0.98, + "learning_rate": 5.189047367553439e-05, + "loss": 1.2273, + "step": 50750 + }, + { + "epoch": 0.98, + "learning_rate": 5.187538115889613e-05, + "loss": 1.2597, + "step": 50760 + }, + { + "epoch": 0.98, + "learning_rate": 5.1860288471142435e-05, + "loss": 1.2388, + "step": 50770 + }, + { + "epoch": 0.98, + "learning_rate": 5.1845195613650375e-05, + "loss": 1.2576, + "step": 50780 + }, + { + "epoch": 0.98, + "learning_rate": 5.1830102587797114e-05, + "loss": 1.1169, + "step": 50790 + }, + { + "epoch": 0.98, + "learning_rate": 5.1815009394959756e-05, + "loss": 1.2102, + "step": 50800 + }, + { + "epoch": 0.98, + "learning_rate": 5.179991603651547e-05, + "loss": 1.3828, + "step": 50810 + }, + { + "epoch": 0.98, + "learning_rate": 5.1784822513841404e-05, + "loss": 1.2758, + "step": 50820 + }, + { + "epoch": 0.98, + "learning_rate": 5.176972882831472e-05, + "loss": 1.1581, + "step": 50830 + }, + { + "epoch": 0.98, + "learning_rate": 5.175463498131265e-05, + "loss": 1.3271, + "step": 50840 + }, + { + "epoch": 0.98, + "learning_rate": 5.173954097421237e-05, + "loss": 1.4305, + "step": 50850 + }, + { + "epoch": 0.98, + "learning_rate": 5.1724446808391136e-05, + "loss": 1.4932, + "step": 50860 + }, + { + "epoch": 0.98, + "learning_rate": 5.170935248522615e-05, + "loss": 1.2778, + "step": 50870 + }, + { + "epoch": 0.98, + "learning_rate": 5.1694258006094676e-05, + "loss": 1.1861, + "step": 50880 + }, + { + "epoch": 0.98, + "learning_rate": 5.1679163372374e-05, + "loss": 1.4853, + "step": 50890 + }, + { + "epoch": 0.98, + "learning_rate": 5.166406858544135e-05, + "loss": 1.3197, + "step": 50900 + }, + { + "epoch": 0.98, + "learning_rate": 5.164897364667409e-05, + "loss": 1.1906, + "step": 50910 + }, + { + "epoch": 0.98, + "learning_rate": 5.163387855744948e-05, + "loss": 1.3196, + "step": 50920 + }, + { + "epoch": 0.98, + "learning_rate": 5.161878331914486e-05, + "loss": 1.2306, + "step": 50930 + }, + { + "epoch": 0.98, + "learning_rate": 5.160368793313756e-05, + "loss": 1.2837, + "step": 50940 + }, + { + "epoch": 0.98, + "learning_rate": 5.1588592400804905e-05, + "loss": 1.3014, + "step": 50950 + }, + { + "epoch": 0.98, + "learning_rate": 5.1573496723524314e-05, + "loss": 1.1992, + "step": 50960 + }, + { + "epoch": 0.98, + "learning_rate": 5.1558400902673096e-05, + "loss": 1.1938, + "step": 50970 + }, + { + "epoch": 0.98, + "learning_rate": 5.15433049396287e-05, + "loss": 1.2387, + "step": 50980 + }, + { + "epoch": 0.98, + "learning_rate": 5.152820883576849e-05, + "loss": 1.1937, + "step": 50990 + }, + { + "epoch": 0.98, + "learning_rate": 5.151311259246987e-05, + "loss": 1.1036, + "step": 51000 + }, + { + "epoch": 0.98, + "learning_rate": 5.149801621111031e-05, + "loss": 1.1642, + "step": 51010 + }, + { + "epoch": 0.98, + "learning_rate": 5.148291969306721e-05, + "loss": 1.2889, + "step": 51020 + }, + { + "epoch": 0.98, + "learning_rate": 5.1467823039718044e-05, + "loss": 1.2455, + "step": 51030 + }, + { + "epoch": 0.98, + "learning_rate": 5.1452726252440274e-05, + "loss": 1.3417, + "step": 51040 + }, + { + "epoch": 0.98, + "learning_rate": 5.1437629332611356e-05, + "loss": 1.425, + "step": 51050 + }, + { + "epoch": 0.98, + "learning_rate": 5.1422532281608814e-05, + "loss": 1.2619, + "step": 51060 + }, + { + "epoch": 0.98, + "learning_rate": 5.140743510081011e-05, + "loss": 1.1612, + "step": 51070 + }, + { + "epoch": 0.98, + "learning_rate": 5.139233779159279e-05, + "loss": 1.1906, + "step": 51080 + }, + { + "epoch": 0.98, + "learning_rate": 5.1377240355334356e-05, + "loss": 1.2625, + "step": 51090 + }, + { + "epoch": 0.98, + "learning_rate": 5.136214279341235e-05, + "loss": 1.1298, + "step": 51100 + }, + { + "epoch": 0.98, + "learning_rate": 5.134704510720433e-05, + "loss": 1.2264, + "step": 51110 + }, + { + "epoch": 0.98, + "learning_rate": 5.133194729808783e-05, + "loss": 1.2326, + "step": 51120 + }, + { + "epoch": 0.98, + "learning_rate": 5.131684936744044e-05, + "loss": 1.2895, + "step": 51130 + }, + { + "epoch": 0.98, + "learning_rate": 5.1301751316639743e-05, + "loss": 1.2394, + "step": 51140 + }, + { + "epoch": 0.98, + "learning_rate": 5.128665314706331e-05, + "loss": 1.335, + "step": 51150 + }, + { + "epoch": 0.98, + "learning_rate": 5.127155486008878e-05, + "loss": 1.2355, + "step": 51160 + }, + { + "epoch": 0.98, + "learning_rate": 5.125645645709371e-05, + "loss": 1.1116, + "step": 51170 + }, + { + "epoch": 0.98, + "learning_rate": 5.124135793945578e-05, + "loss": 1.2612, + "step": 51180 + }, + { + "epoch": 0.98, + "learning_rate": 5.122625930855259e-05, + "loss": 1.1132, + "step": 51190 + }, + { + "epoch": 0.98, + "learning_rate": 5.1211160565761806e-05, + "loss": 1.3731, + "step": 51200 + }, + { + "epoch": 0.98, + "learning_rate": 5.1196061712461085e-05, + "loss": 1.4521, + "step": 51210 + }, + { + "epoch": 0.98, + "learning_rate": 5.118096275002805e-05, + "loss": 1.4079, + "step": 51220 + }, + { + "epoch": 0.99, + "learning_rate": 5.116586367984042e-05, + "loss": 1.2368, + "step": 51230 + }, + { + "epoch": 0.99, + "learning_rate": 5.115076450327586e-05, + "loss": 1.2638, + "step": 51240 + }, + { + "epoch": 0.99, + "learning_rate": 5.113566522171207e-05, + "loss": 1.1036, + "step": 51250 + }, + { + "epoch": 0.99, + "learning_rate": 5.112056583652677e-05, + "loss": 1.1808, + "step": 51260 + }, + { + "epoch": 0.99, + "learning_rate": 5.1105466349097644e-05, + "loss": 1.2167, + "step": 51270 + }, + { + "epoch": 0.99, + "learning_rate": 5.1090366760802433e-05, + "loss": 1.2339, + "step": 51280 + }, + { + "epoch": 0.99, + "learning_rate": 5.107526707301885e-05, + "loss": 1.4341, + "step": 51290 + }, + { + "epoch": 0.99, + "learning_rate": 5.106016728712467e-05, + "loss": 1.3669, + "step": 51300 + }, + { + "epoch": 0.99, + "learning_rate": 5.1045067404497616e-05, + "loss": 1.4424, + "step": 51310 + }, + { + "epoch": 0.99, + "learning_rate": 5.102996742651546e-05, + "loss": 1.1136, + "step": 51320 + }, + { + "epoch": 0.99, + "learning_rate": 5.101486735455596e-05, + "loss": 1.1393, + "step": 51330 + }, + { + "epoch": 0.99, + "learning_rate": 5.099976718999689e-05, + "loss": 1.54, + "step": 51340 + }, + { + "epoch": 0.99, + "learning_rate": 5.098466693421605e-05, + "loss": 1.3059, + "step": 51350 + }, + { + "epoch": 0.99, + "learning_rate": 5.096956658859122e-05, + "loss": 1.0878, + "step": 51360 + }, + { + "epoch": 0.99, + "learning_rate": 5.0954466154500214e-05, + "loss": 1.3417, + "step": 51370 + }, + { + "epoch": 0.99, + "learning_rate": 5.093936563332082e-05, + "loss": 1.3559, + "step": 51380 + }, + { + "epoch": 0.99, + "learning_rate": 5.092426502643087e-05, + "loss": 1.2429, + "step": 51390 + }, + { + "epoch": 0.99, + "learning_rate": 5.090916433520819e-05, + "loss": 1.2171, + "step": 51400 + }, + { + "epoch": 0.99, + "learning_rate": 5.0894063561030616e-05, + "loss": 1.2403, + "step": 51410 + }, + { + "epoch": 0.99, + "learning_rate": 5.087896270527598e-05, + "loss": 1.3424, + "step": 51420 + }, + { + "epoch": 0.99, + "learning_rate": 5.086386176932212e-05, + "loss": 1.2661, + "step": 51430 + }, + { + "epoch": 0.99, + "learning_rate": 5.08487607545469e-05, + "loss": 1.3462, + "step": 51440 + }, + { + "epoch": 0.99, + "learning_rate": 5.083365966232819e-05, + "loss": 1.143, + "step": 51450 + }, + { + "epoch": 0.99, + "learning_rate": 5.081855849404385e-05, + "loss": 1.1827, + "step": 51460 + }, + { + "epoch": 0.99, + "learning_rate": 5.0803457251071785e-05, + "loss": 1.2999, + "step": 51470 + }, + { + "epoch": 0.99, + "learning_rate": 5.078835593478983e-05, + "loss": 1.0715, + "step": 51480 + }, + { + "epoch": 0.99, + "learning_rate": 5.07732545465759e-05, + "loss": 1.409, + "step": 51490 + }, + { + "epoch": 0.99, + "learning_rate": 5.075815308780789e-05, + "loss": 1.0834, + "step": 51500 + }, + { + "epoch": 0.99, + "learning_rate": 5.07430515598637e-05, + "loss": 1.3987, + "step": 51510 + }, + { + "epoch": 0.99, + "learning_rate": 5.072794996412126e-05, + "loss": 1.3186, + "step": 51520 + }, + { + "epoch": 0.99, + "learning_rate": 5.0712848301958435e-05, + "loss": 1.1885, + "step": 51530 + }, + { + "epoch": 0.99, + "learning_rate": 5.069774657475319e-05, + "loss": 1.2342, + "step": 51540 + }, + { + "epoch": 0.99, + "learning_rate": 5.068264478388345e-05, + "loss": 1.4019, + "step": 51550 + }, + { + "epoch": 0.99, + "learning_rate": 5.066754293072712e-05, + "loss": 1.3622, + "step": 51560 + }, + { + "epoch": 0.99, + "learning_rate": 5.065244101666218e-05, + "loss": 1.3211, + "step": 51570 + }, + { + "epoch": 0.99, + "learning_rate": 5.063733904306652e-05, + "loss": 1.3383, + "step": 51580 + }, + { + "epoch": 0.99, + "learning_rate": 5.062223701131814e-05, + "loss": 1.1558, + "step": 51590 + }, + { + "epoch": 0.99, + "learning_rate": 5.0607134922794974e-05, + "loss": 1.3788, + "step": 51600 + }, + { + "epoch": 0.99, + "learning_rate": 5.059203277887498e-05, + "loss": 1.1399, + "step": 51610 + }, + { + "epoch": 0.99, + "learning_rate": 5.057693058093613e-05, + "loss": 1.1176, + "step": 51620 + }, + { + "epoch": 0.99, + "learning_rate": 5.0561828330356386e-05, + "loss": 1.1965, + "step": 51630 + }, + { + "epoch": 0.99, + "learning_rate": 5.0546726028513724e-05, + "loss": 1.3427, + "step": 51640 + }, + { + "epoch": 0.99, + "learning_rate": 5.053162367678615e-05, + "loss": 1.3388, + "step": 51650 + }, + { + "epoch": 0.99, + "learning_rate": 5.051652127655159e-05, + "loss": 1.2379, + "step": 51660 + }, + { + "epoch": 0.99, + "learning_rate": 5.05014188291881e-05, + "loss": 1.3619, + "step": 51670 + }, + { + "epoch": 0.99, + "learning_rate": 5.0486316336073626e-05, + "loss": 1.1364, + "step": 51680 + }, + { + "epoch": 0.99, + "learning_rate": 5.047121379858618e-05, + "loss": 1.2849, + "step": 51690 + }, + { + "epoch": 0.99, + "learning_rate": 5.0456111218103764e-05, + "loss": 1.2234, + "step": 51700 + }, + { + "epoch": 0.99, + "learning_rate": 5.044100859600438e-05, + "loss": 1.3065, + "step": 51710 + }, + { + "epoch": 0.99, + "learning_rate": 5.042590593366605e-05, + "loss": 1.1896, + "step": 51720 + }, + { + "epoch": 0.99, + "learning_rate": 5.0410803232466766e-05, + "loss": 1.3563, + "step": 51730 + }, + { + "epoch": 0.99, + "learning_rate": 5.039570049378456e-05, + "loss": 1.3118, + "step": 51740 + }, + { + "epoch": 1.0, + "learning_rate": 5.038059771899745e-05, + "loss": 1.1589, + "step": 51750 + }, + { + "epoch": 1.0, + "learning_rate": 5.0365494909483434e-05, + "loss": 1.321, + "step": 51760 + }, + { + "epoch": 1.0, + "learning_rate": 5.035039206662059e-05, + "loss": 1.181, + "step": 51770 + }, + { + "epoch": 1.0, + "learning_rate": 5.033528919178688e-05, + "loss": 1.1617, + "step": 51780 + }, + { + "epoch": 1.0, + "learning_rate": 5.0320186286360394e-05, + "loss": 1.3233, + "step": 51790 + }, + { + "epoch": 1.0, + "learning_rate": 5.030508335171914e-05, + "loss": 1.1979, + "step": 51800 + }, + { + "epoch": 1.0, + "learning_rate": 5.028998038924114e-05, + "loss": 1.4353, + "step": 51810 + }, + { + "epoch": 1.0, + "learning_rate": 5.027487740030449e-05, + "loss": 1.3359, + "step": 51820 + }, + { + "epoch": 1.0, + "learning_rate": 5.025977438628717e-05, + "loss": 1.0127, + "step": 51830 + }, + { + "epoch": 1.0, + "learning_rate": 5.024467134856725e-05, + "loss": 1.2917, + "step": 51840 + }, + { + "epoch": 1.0, + "learning_rate": 5.0229568288522776e-05, + "loss": 1.1555, + "step": 51850 + }, + { + "epoch": 1.0, + "learning_rate": 5.0214465207531816e-05, + "loss": 1.2205, + "step": 51860 + }, + { + "epoch": 1.0, + "learning_rate": 5.01993621069724e-05, + "loss": 1.4418, + "step": 51870 + }, + { + "epoch": 1.0, + "learning_rate": 5.0184258988222564e-05, + "loss": 1.1585, + "step": 51880 + }, + { + "epoch": 1.0, + "learning_rate": 5.01691558526604e-05, + "loss": 1.1614, + "step": 51890 + }, + { + "epoch": 1.0, + "learning_rate": 5.015405270166392e-05, + "loss": 1.0997, + "step": 51900 + }, + { + "epoch": 1.0, + "learning_rate": 5.0138949536611225e-05, + "loss": 1.5178, + "step": 51910 + }, + { + "epoch": 1.0, + "learning_rate": 5.0123846358880354e-05, + "loss": 1.1863, + "step": 51920 + }, + { + "epoch": 1.0, + "learning_rate": 5.010874316984937e-05, + "loss": 1.3089, + "step": 51930 + }, + { + "epoch": 1.0, + "learning_rate": 5.0093639970896335e-05, + "loss": 1.2836, + "step": 51940 + }, + { + "epoch": 1.0, + "learning_rate": 5.007853676339929e-05, + "loss": 1.3021, + "step": 51950 + }, + { + "epoch": 1.0, + "learning_rate": 5.006343354873632e-05, + "loss": 1.4353, + "step": 51960 + }, + { + "epoch": 1.0, + "learning_rate": 5.0048330328285476e-05, + "loss": 1.1568, + "step": 51970 + }, + { + "epoch": 1.0, + "learning_rate": 5.003322710342484e-05, + "loss": 1.3908, + "step": 51980 + }, + { + "epoch": 1.0, + "learning_rate": 5.001812387553245e-05, + "loss": 1.2602, + "step": 51990 + }, + { + "epoch": 1.0, + "learning_rate": 5.000302064598639e-05, + "loss": 1.0821, + "step": 52000 + } + ], + "logging_steps": 10, + "max_steps": 104004, + "num_train_epochs": 2, + "save_steps": 500, + "total_flos": 6.124293860268442e+16, + "trial_name": null, + "trial_params": null +}